diff --git "a/trainer_state.json" "b/trainer_state.json" deleted file mode 100644--- "a/trainer_state.json" +++ /dev/null @@ -1,510019 +0,0 @@ -{ - "best_metric": null, - "best_model_checkpoint": null, - "epoch": 2.17859339758048, - "eval_steps": 500, - "global_step": 85000, - "is_hyper_param_search": false, - "is_local_process_zero": true, - "is_world_process_zero": true, - "log_history": [ - { - "epoch": 0.0, - "learning_rate": 1.7079419299743807e-09, - "loss": 2.8359, - "step": 1 - }, - { - "epoch": 0.0, - "learning_rate": 3.4158838599487614e-09, - "loss": 2.4531, - "step": 2 - }, - { - "epoch": 0.0, - "learning_rate": 5.123825789923143e-09, - "loss": 2.2266, - "step": 3 - }, - { - "epoch": 0.0, - "learning_rate": 6.831767719897523e-09, - "loss": 2.5566, - "step": 4 - }, - { - "epoch": 0.0, - "learning_rate": 8.539709649871904e-09, - "loss": 2.7461, - "step": 5 - }, - { - "epoch": 0.0, - "learning_rate": 1.0247651579846285e-08, - "loss": 2.5, - "step": 6 - }, - { - "epoch": 0.0, - "learning_rate": 1.1955593509820665e-08, - "loss": 2.4414, - "step": 7 - }, - { - "epoch": 0.0, - "learning_rate": 1.3663535439795045e-08, - "loss": 2.5781, - "step": 8 - }, - { - "epoch": 0.0, - "learning_rate": 1.5371477369769426e-08, - "loss": 2.8516, - "step": 9 - }, - { - "epoch": 0.0, - "learning_rate": 1.707941929974381e-08, - "loss": 2.3164, - "step": 10 - }, - { - "epoch": 0.0, - "learning_rate": 1.8787361229718188e-08, - "loss": 2.6289, - "step": 11 - }, - { - "epoch": 0.0, - "learning_rate": 2.049530315969257e-08, - "loss": 2.1953, - "step": 12 - }, - { - "epoch": 0.0, - "learning_rate": 2.220324508966695e-08, - "loss": 2.8398, - "step": 13 - }, - { - "epoch": 0.0, - "learning_rate": 2.391118701964133e-08, - "loss": 2.748, - "step": 14 - }, - { - "epoch": 0.0, - "learning_rate": 2.561912894961571e-08, - "loss": 2.5137, - "step": 15 - }, - { - "epoch": 0.0, - "learning_rate": 2.732707087959009e-08, - "loss": 2.5234, - "step": 16 - }, - { - "epoch": 0.0, - "learning_rate": 2.9035012809564473e-08, - "loss": 3.0508, - "step": 17 - }, - { - "epoch": 0.0, - "learning_rate": 3.074295473953885e-08, - "loss": 2.9062, - "step": 18 - }, - { - "epoch": 0.0, - "learning_rate": 3.2450896669513235e-08, - "loss": 2.25, - "step": 19 - }, - { - "epoch": 0.0, - "learning_rate": 3.415883859948762e-08, - "loss": 2.2539, - "step": 20 - }, - { - "epoch": 0.0, - "learning_rate": 3.5866780529461994e-08, - "loss": 2.1191, - "step": 21 - }, - { - "epoch": 0.0, - "learning_rate": 3.7574722459436376e-08, - "loss": 2.3359, - "step": 22 - }, - { - "epoch": 0.0, - "learning_rate": 3.928266438941076e-08, - "loss": 2.041, - "step": 23 - }, - { - "epoch": 0.0, - "learning_rate": 4.099060631938514e-08, - "loss": 2.2305, - "step": 24 - }, - { - "epoch": 0.0, - "learning_rate": 4.269854824935952e-08, - "loss": 2.4023, - "step": 25 - }, - { - "epoch": 0.0, - "learning_rate": 4.44064901793339e-08, - "loss": 3.2969, - "step": 26 - }, - { - "epoch": 0.0, - "learning_rate": 4.611443210930828e-08, - "loss": 2.0156, - "step": 27 - }, - { - "epoch": 0.0, - "learning_rate": 4.782237403928266e-08, - "loss": 2.4844, - "step": 28 - }, - { - "epoch": 0.0, - "learning_rate": 4.953031596925705e-08, - "loss": 2.8926, - "step": 29 - }, - { - "epoch": 0.0, - "learning_rate": 5.123825789923142e-08, - "loss": 2.2285, - "step": 30 - }, - { - "epoch": 0.0, - "learning_rate": 5.2946199829205806e-08, - "loss": 2.832, - "step": 31 - }, - { - "epoch": 0.0, - "learning_rate": 5.465414175918018e-08, - "loss": 2.7812, - "step": 32 - }, - { - "epoch": 0.0, - "learning_rate": 5.6362083689154564e-08, - "loss": 1.9473, - "step": 33 - }, - { - "epoch": 0.0, - "learning_rate": 5.807002561912895e-08, - "loss": 2.3086, - "step": 34 - }, - { - "epoch": 0.0, - "learning_rate": 5.977796754910333e-08, - "loss": 2.4219, - "step": 35 - }, - { - "epoch": 0.0, - "learning_rate": 6.14859094790777e-08, - "loss": 2.8789, - "step": 36 - }, - { - "epoch": 0.0, - "learning_rate": 6.31938514090521e-08, - "loss": 2.0215, - "step": 37 - }, - { - "epoch": 0.0, - "learning_rate": 6.490179333902647e-08, - "loss": 2.2305, - "step": 38 - }, - { - "epoch": 0.0, - "learning_rate": 6.660973526900085e-08, - "loss": 2.3164, - "step": 39 - }, - { - "epoch": 0.0, - "learning_rate": 6.831767719897524e-08, - "loss": 2.2891, - "step": 40 - }, - { - "epoch": 0.0, - "learning_rate": 7.002561912894961e-08, - "loss": 2.0488, - "step": 41 - }, - { - "epoch": 0.0, - "learning_rate": 7.173356105892399e-08, - "loss": 2.1172, - "step": 42 - }, - { - "epoch": 0.0, - "learning_rate": 7.344150298889836e-08, - "loss": 2.4062, - "step": 43 - }, - { - "epoch": 0.0, - "learning_rate": 7.514944491887275e-08, - "loss": 2.1133, - "step": 44 - }, - { - "epoch": 0.0, - "learning_rate": 7.685738684884714e-08, - "loss": 2.084, - "step": 45 - }, - { - "epoch": 0.0, - "learning_rate": 7.856532877882152e-08, - "loss": 2.0781, - "step": 46 - }, - { - "epoch": 0.0, - "learning_rate": 8.02732707087959e-08, - "loss": 1.7383, - "step": 47 - }, - { - "epoch": 0.0, - "learning_rate": 8.198121263877028e-08, - "loss": 1.9531, - "step": 48 - }, - { - "epoch": 0.0, - "learning_rate": 8.368915456874466e-08, - "loss": 1.916, - "step": 49 - }, - { - "epoch": 0.0, - "learning_rate": 8.539709649871903e-08, - "loss": 1.9609, - "step": 50 - }, - { - "epoch": 0.0, - "learning_rate": 8.710503842869342e-08, - "loss": 2.1758, - "step": 51 - }, - { - "epoch": 0.0, - "learning_rate": 8.88129803586678e-08, - "loss": 2.0781, - "step": 52 - }, - { - "epoch": 0.0, - "learning_rate": 9.052092228864218e-08, - "loss": 2.0742, - "step": 53 - }, - { - "epoch": 0.0, - "learning_rate": 9.222886421861656e-08, - "loss": 1.9629, - "step": 54 - }, - { - "epoch": 0.0, - "learning_rate": 9.393680614859094e-08, - "loss": 1.9492, - "step": 55 - }, - { - "epoch": 0.0, - "learning_rate": 9.564474807856532e-08, - "loss": 1.75, - "step": 56 - }, - { - "epoch": 0.0, - "learning_rate": 9.73526900085397e-08, - "loss": 1.7578, - "step": 57 - }, - { - "epoch": 0.0, - "learning_rate": 9.90606319385141e-08, - "loss": 1.707, - "step": 58 - }, - { - "epoch": 0.0, - "learning_rate": 1.0076857386848847e-07, - "loss": 1.9395, - "step": 59 - }, - { - "epoch": 0.0, - "learning_rate": 1.0247651579846285e-07, - "loss": 1.6738, - "step": 60 - }, - { - "epoch": 0.0, - "learning_rate": 1.0418445772843724e-07, - "loss": 1.8789, - "step": 61 - }, - { - "epoch": 0.0, - "learning_rate": 1.0589239965841161e-07, - "loss": 1.7871, - "step": 62 - }, - { - "epoch": 0.0, - "learning_rate": 1.0760034158838599e-07, - "loss": 1.6641, - "step": 63 - }, - { - "epoch": 0.0, - "learning_rate": 1.0930828351836036e-07, - "loss": 1.6641, - "step": 64 - }, - { - "epoch": 0.0, - "learning_rate": 1.1101622544833475e-07, - "loss": 1.7539, - "step": 65 - }, - { - "epoch": 0.0, - "learning_rate": 1.1272416737830913e-07, - "loss": 1.6777, - "step": 66 - }, - { - "epoch": 0.0, - "learning_rate": 1.144321093082835e-07, - "loss": 1.4297, - "step": 67 - }, - { - "epoch": 0.0, - "learning_rate": 1.161400512382579e-07, - "loss": 1.5352, - "step": 68 - }, - { - "epoch": 0.0, - "learning_rate": 1.1784799316823227e-07, - "loss": 1.6836, - "step": 69 - }, - { - "epoch": 0.0, - "learning_rate": 1.1955593509820666e-07, - "loss": 1.373, - "step": 70 - }, - { - "epoch": 0.0, - "learning_rate": 1.2126387702818105e-07, - "loss": 1.4453, - "step": 71 - }, - { - "epoch": 0.0, - "learning_rate": 1.229718189581554e-07, - "loss": 1.5762, - "step": 72 - }, - { - "epoch": 0.0, - "learning_rate": 1.246797608881298e-07, - "loss": 1.7363, - "step": 73 - }, - { - "epoch": 0.0, - "learning_rate": 1.263877028181042e-07, - "loss": 1.54, - "step": 74 - }, - { - "epoch": 0.0, - "learning_rate": 1.2809564474807855e-07, - "loss": 1.4727, - "step": 75 - }, - { - "epoch": 0.0, - "learning_rate": 1.2980358667805294e-07, - "loss": 1.5723, - "step": 76 - }, - { - "epoch": 0.0, - "learning_rate": 1.3151152860802733e-07, - "loss": 1.5781, - "step": 77 - }, - { - "epoch": 0.0, - "learning_rate": 1.332194705380017e-07, - "loss": 1.8008, - "step": 78 - }, - { - "epoch": 0.0, - "learning_rate": 1.3492741246797608e-07, - "loss": 1.4004, - "step": 79 - }, - { - "epoch": 0.0, - "learning_rate": 1.3663535439795047e-07, - "loss": 1.6807, - "step": 80 - }, - { - "epoch": 0.0, - "learning_rate": 1.3834329632792486e-07, - "loss": 1.4199, - "step": 81 - }, - { - "epoch": 0.0, - "learning_rate": 1.4005123825789922e-07, - "loss": 1.2354, - "step": 82 - }, - { - "epoch": 0.0, - "learning_rate": 1.417591801878736e-07, - "loss": 1.2344, - "step": 83 - }, - { - "epoch": 0.0, - "learning_rate": 1.4346712211784797e-07, - "loss": 1.6914, - "step": 84 - }, - { - "epoch": 0.0, - "learning_rate": 1.4517506404782236e-07, - "loss": 1.5156, - "step": 85 - }, - { - "epoch": 0.0, - "learning_rate": 1.4688300597779673e-07, - "loss": 1.3789, - "step": 86 - }, - { - "epoch": 0.0, - "learning_rate": 1.4859094790777114e-07, - "loss": 1.6191, - "step": 87 - }, - { - "epoch": 0.0, - "learning_rate": 1.502988898377455e-07, - "loss": 1.4922, - "step": 88 - }, - { - "epoch": 0.0, - "learning_rate": 1.520068317677199e-07, - "loss": 1.4766, - "step": 89 - }, - { - "epoch": 0.0, - "learning_rate": 1.5371477369769428e-07, - "loss": 1.165, - "step": 90 - }, - { - "epoch": 0.0, - "learning_rate": 1.5542271562766865e-07, - "loss": 1.3555, - "step": 91 - }, - { - "epoch": 0.0, - "learning_rate": 1.5713065755764303e-07, - "loss": 1.3516, - "step": 92 - }, - { - "epoch": 0.0, - "learning_rate": 1.588385994876174e-07, - "loss": 1.543, - "step": 93 - }, - { - "epoch": 0.0, - "learning_rate": 1.605465414175918e-07, - "loss": 1.416, - "step": 94 - }, - { - "epoch": 0.0, - "learning_rate": 1.6225448334756618e-07, - "loss": 1.4863, - "step": 95 - }, - { - "epoch": 0.0, - "learning_rate": 1.6396242527754057e-07, - "loss": 1.4414, - "step": 96 - }, - { - "epoch": 0.0, - "learning_rate": 1.6567036720751493e-07, - "loss": 1.3887, - "step": 97 - }, - { - "epoch": 0.0, - "learning_rate": 1.6737830913748932e-07, - "loss": 1.4336, - "step": 98 - }, - { - "epoch": 0.0, - "learning_rate": 1.6908625106746368e-07, - "loss": 1.3652, - "step": 99 - }, - { - "epoch": 0.0, - "learning_rate": 1.7079419299743807e-07, - "loss": 1.4316, - "step": 100 - }, - { - "epoch": 0.0, - "learning_rate": 1.7250213492741248e-07, - "loss": 1.0703, - "step": 101 - }, - { - "epoch": 0.0, - "learning_rate": 1.7421007685738685e-07, - "loss": 1.4082, - "step": 102 - }, - { - "epoch": 0.0, - "learning_rate": 1.7591801878736124e-07, - "loss": 1.1934, - "step": 103 - }, - { - "epoch": 0.0, - "learning_rate": 1.776259607173356e-07, - "loss": 1.4219, - "step": 104 - }, - { - "epoch": 0.0, - "learning_rate": 1.7933390264731e-07, - "loss": 1.3633, - "step": 105 - }, - { - "epoch": 0.0, - "learning_rate": 1.8104184457728435e-07, - "loss": 1.4551, - "step": 106 - }, - { - "epoch": 0.0, - "learning_rate": 1.8274978650725874e-07, - "loss": 1.0342, - "step": 107 - }, - { - "epoch": 0.0, - "learning_rate": 1.8445772843723313e-07, - "loss": 1.0078, - "step": 108 - }, - { - "epoch": 0.0, - "learning_rate": 1.8616567036720752e-07, - "loss": 1.3086, - "step": 109 - }, - { - "epoch": 0.0, - "learning_rate": 1.8787361229718188e-07, - "loss": 1.3477, - "step": 110 - }, - { - "epoch": 0.0, - "learning_rate": 1.8958155422715627e-07, - "loss": 1.2305, - "step": 111 - }, - { - "epoch": 0.0, - "learning_rate": 1.9128949615713063e-07, - "loss": 1.3457, - "step": 112 - }, - { - "epoch": 0.0, - "learning_rate": 1.9299743808710502e-07, - "loss": 1.2266, - "step": 113 - }, - { - "epoch": 0.0, - "learning_rate": 1.947053800170794e-07, - "loss": 0.9448, - "step": 114 - }, - { - "epoch": 0.0, - "learning_rate": 1.964133219470538e-07, - "loss": 1.0908, - "step": 115 - }, - { - "epoch": 0.0, - "learning_rate": 1.981212638770282e-07, - "loss": 1.1914, - "step": 116 - }, - { - "epoch": 0.0, - "learning_rate": 1.9982920580700255e-07, - "loss": 1.2041, - "step": 117 - }, - { - "epoch": 0.0, - "learning_rate": 2.0153714773697694e-07, - "loss": 1.498, - "step": 118 - }, - { - "epoch": 0.0, - "learning_rate": 2.032450896669513e-07, - "loss": 1.5176, - "step": 119 - }, - { - "epoch": 0.0, - "learning_rate": 2.049530315969257e-07, - "loss": 1.4189, - "step": 120 - }, - { - "epoch": 0.0, - "learning_rate": 2.0666097352690006e-07, - "loss": 1.3984, - "step": 121 - }, - { - "epoch": 0.0, - "learning_rate": 2.0836891545687447e-07, - "loss": 1.3066, - "step": 122 - }, - { - "epoch": 0.0, - "learning_rate": 2.1007685738684883e-07, - "loss": 1.1553, - "step": 123 - }, - { - "epoch": 0.0, - "learning_rate": 2.1178479931682322e-07, - "loss": 1.3281, - "step": 124 - }, - { - "epoch": 0.0, - "learning_rate": 2.1349274124679759e-07, - "loss": 1.1719, - "step": 125 - }, - { - "epoch": 0.0, - "learning_rate": 2.1520068317677198e-07, - "loss": 1.0166, - "step": 126 - }, - { - "epoch": 0.0, - "learning_rate": 2.1690862510674636e-07, - "loss": 1.0801, - "step": 127 - }, - { - "epoch": 0.0, - "learning_rate": 2.1861656703672073e-07, - "loss": 1.2656, - "step": 128 - }, - { - "epoch": 0.0, - "learning_rate": 2.2032450896669514e-07, - "loss": 1.1465, - "step": 129 - }, - { - "epoch": 0.0, - "learning_rate": 2.220324508966695e-07, - "loss": 1.0635, - "step": 130 - }, - { - "epoch": 0.0, - "learning_rate": 2.237403928266439e-07, - "loss": 1.2129, - "step": 131 - }, - { - "epoch": 0.0, - "learning_rate": 2.2544833475661826e-07, - "loss": 1.126, - "step": 132 - }, - { - "epoch": 0.0, - "learning_rate": 2.2715627668659265e-07, - "loss": 1.2422, - "step": 133 - }, - { - "epoch": 0.0, - "learning_rate": 2.28864218616567e-07, - "loss": 1.1582, - "step": 134 - }, - { - "epoch": 0.0, - "learning_rate": 2.305721605465414e-07, - "loss": 1.0537, - "step": 135 - }, - { - "epoch": 0.0, - "learning_rate": 2.322801024765158e-07, - "loss": 1.2129, - "step": 136 - }, - { - "epoch": 0.0, - "learning_rate": 2.3398804440649018e-07, - "loss": 1.1875, - "step": 137 - }, - { - "epoch": 0.0, - "learning_rate": 2.3569598633646454e-07, - "loss": 0.9678, - "step": 138 - }, - { - "epoch": 0.0, - "learning_rate": 2.3740392826643893e-07, - "loss": 1.2578, - "step": 139 - }, - { - "epoch": 0.0, - "learning_rate": 2.391118701964133e-07, - "loss": 1.1621, - "step": 140 - }, - { - "epoch": 0.0, - "learning_rate": 2.408198121263877e-07, - "loss": 1.2871, - "step": 141 - }, - { - "epoch": 0.0, - "learning_rate": 2.425277540563621e-07, - "loss": 1.0742, - "step": 142 - }, - { - "epoch": 0.0, - "learning_rate": 2.4423569598633643e-07, - "loss": 1.0781, - "step": 143 - }, - { - "epoch": 0.0, - "learning_rate": 2.459436379163108e-07, - "loss": 1.1885, - "step": 144 - }, - { - "epoch": 0.0, - "learning_rate": 2.476515798462852e-07, - "loss": 1.1855, - "step": 145 - }, - { - "epoch": 0.0, - "learning_rate": 2.493595217762596e-07, - "loss": 1.2354, - "step": 146 - }, - { - "epoch": 0.0, - "learning_rate": 2.51067463706234e-07, - "loss": 1.0176, - "step": 147 - }, - { - "epoch": 0.0, - "learning_rate": 2.527754056362084e-07, - "loss": 1.0557, - "step": 148 - }, - { - "epoch": 0.0, - "learning_rate": 2.544833475661827e-07, - "loss": 1.1113, - "step": 149 - }, - { - "epoch": 0.0, - "learning_rate": 2.561912894961571e-07, - "loss": 1.4492, - "step": 150 - }, - { - "epoch": 0.0, - "learning_rate": 2.578992314261315e-07, - "loss": 1.1611, - "step": 151 - }, - { - "epoch": 0.0, - "learning_rate": 2.596071733561059e-07, - "loss": 1.1807, - "step": 152 - }, - { - "epoch": 0.0, - "learning_rate": 2.6131511528608027e-07, - "loss": 1.25, - "step": 153 - }, - { - "epoch": 0.0, - "learning_rate": 2.6302305721605466e-07, - "loss": 1.1367, - "step": 154 - }, - { - "epoch": 0.0, - "learning_rate": 2.6473099914602905e-07, - "loss": 1.2207, - "step": 155 - }, - { - "epoch": 0.0, - "learning_rate": 2.664389410760034e-07, - "loss": 1.2891, - "step": 156 - }, - { - "epoch": 0.0, - "learning_rate": 2.681468830059778e-07, - "loss": 1.2412, - "step": 157 - }, - { - "epoch": 0.0, - "learning_rate": 2.6985482493595216e-07, - "loss": 0.9463, - "step": 158 - }, - { - "epoch": 0.0, - "learning_rate": 2.7156276686592655e-07, - "loss": 1.2891, - "step": 159 - }, - { - "epoch": 0.0, - "learning_rate": 2.7327070879590094e-07, - "loss": 1.2041, - "step": 160 - }, - { - "epoch": 0.0, - "learning_rate": 2.749786507258753e-07, - "loss": 1.0771, - "step": 161 - }, - { - "epoch": 0.0, - "learning_rate": 2.766865926558497e-07, - "loss": 1.2969, - "step": 162 - }, - { - "epoch": 0.0, - "learning_rate": 2.7839453458582406e-07, - "loss": 1.4609, - "step": 163 - }, - { - "epoch": 0.0, - "learning_rate": 2.8010247651579845e-07, - "loss": 0.9658, - "step": 164 - }, - { - "epoch": 0.0, - "learning_rate": 2.8181041844577283e-07, - "loss": 1.0439, - "step": 165 - }, - { - "epoch": 0.0, - "learning_rate": 2.835183603757472e-07, - "loss": 1.1113, - "step": 166 - }, - { - "epoch": 0.0, - "learning_rate": 2.852263023057216e-07, - "loss": 1.3906, - "step": 167 - }, - { - "epoch": 0.0, - "learning_rate": 2.8693424423569595e-07, - "loss": 1.0508, - "step": 168 - }, - { - "epoch": 0.0, - "learning_rate": 2.886421861656704e-07, - "loss": 1.1279, - "step": 169 - }, - { - "epoch": 0.0, - "learning_rate": 2.9035012809564473e-07, - "loss": 1.2852, - "step": 170 - }, - { - "epoch": 0.0, - "learning_rate": 2.920580700256191e-07, - "loss": 0.8525, - "step": 171 - }, - { - "epoch": 0.0, - "learning_rate": 2.9376601195559345e-07, - "loss": 1.25, - "step": 172 - }, - { - "epoch": 0.0, - "learning_rate": 2.954739538855679e-07, - "loss": 1.0869, - "step": 173 - }, - { - "epoch": 0.0, - "learning_rate": 2.971818958155423e-07, - "loss": 1.2266, - "step": 174 - }, - { - "epoch": 0.0, - "learning_rate": 2.988898377455166e-07, - "loss": 1.4424, - "step": 175 - }, - { - "epoch": 0.0, - "learning_rate": 3.00597779675491e-07, - "loss": 0.9077, - "step": 176 - }, - { - "epoch": 0.0, - "learning_rate": 3.023057216054654e-07, - "loss": 1.1211, - "step": 177 - }, - { - "epoch": 0.0, - "learning_rate": 3.040136635354398e-07, - "loss": 1.252, - "step": 178 - }, - { - "epoch": 0.0, - "learning_rate": 3.057216054654141e-07, - "loss": 1.0664, - "step": 179 - }, - { - "epoch": 0.0, - "learning_rate": 3.0742954739538857e-07, - "loss": 1.0996, - "step": 180 - }, - { - "epoch": 0.0, - "learning_rate": 3.0913748932536296e-07, - "loss": 1.1709, - "step": 181 - }, - { - "epoch": 0.0, - "learning_rate": 3.108454312553373e-07, - "loss": 0.8936, - "step": 182 - }, - { - "epoch": 0.0, - "learning_rate": 3.125533731853117e-07, - "loss": 1.2891, - "step": 183 - }, - { - "epoch": 0.0, - "learning_rate": 3.1426131511528607e-07, - "loss": 1.0977, - "step": 184 - }, - { - "epoch": 0.0, - "learning_rate": 3.1596925704526046e-07, - "loss": 1.4473, - "step": 185 - }, - { - "epoch": 0.0, - "learning_rate": 3.176771989752348e-07, - "loss": 1.3115, - "step": 186 - }, - { - "epoch": 0.0, - "learning_rate": 3.193851409052092e-07, - "loss": 1.0586, - "step": 187 - }, - { - "epoch": 0.0, - "learning_rate": 3.210930828351836e-07, - "loss": 1.3301, - "step": 188 - }, - { - "epoch": 0.0, - "learning_rate": 3.2280102476515796e-07, - "loss": 1.126, - "step": 189 - }, - { - "epoch": 0.0, - "learning_rate": 3.2450896669513235e-07, - "loss": 0.9668, - "step": 190 - }, - { - "epoch": 0.0, - "learning_rate": 3.2621690862510674e-07, - "loss": 1.1221, - "step": 191 - }, - { - "epoch": 0.0, - "learning_rate": 3.2792485055508113e-07, - "loss": 1.291, - "step": 192 - }, - { - "epoch": 0.0, - "learning_rate": 3.2963279248505547e-07, - "loss": 1.1934, - "step": 193 - }, - { - "epoch": 0.0, - "learning_rate": 3.3134073441502986e-07, - "loss": 1.1357, - "step": 194 - }, - { - "epoch": 0.0, - "learning_rate": 3.330486763450043e-07, - "loss": 1.1934, - "step": 195 - }, - { - "epoch": 0.01, - "learning_rate": 3.3475661827497863e-07, - "loss": 1.2578, - "step": 196 - }, - { - "epoch": 0.01, - "learning_rate": 3.36464560204953e-07, - "loss": 1.1631, - "step": 197 - }, - { - "epoch": 0.01, - "learning_rate": 3.3817250213492736e-07, - "loss": 1.1602, - "step": 198 - }, - { - "epoch": 0.01, - "learning_rate": 3.398804440649018e-07, - "loss": 1.248, - "step": 199 - }, - { - "epoch": 0.01, - "learning_rate": 3.4158838599487614e-07, - "loss": 1.1162, - "step": 200 - }, - { - "epoch": 0.01, - "learning_rate": 3.4329632792485053e-07, - "loss": 1.1123, - "step": 201 - }, - { - "epoch": 0.01, - "learning_rate": 3.4500426985482497e-07, - "loss": 1.1084, - "step": 202 - }, - { - "epoch": 0.01, - "learning_rate": 3.467122117847993e-07, - "loss": 1.2285, - "step": 203 - }, - { - "epoch": 0.01, - "learning_rate": 3.484201537147737e-07, - "loss": 1.1211, - "step": 204 - }, - { - "epoch": 0.01, - "learning_rate": 3.5012809564474803e-07, - "loss": 1.0586, - "step": 205 - }, - { - "epoch": 0.01, - "learning_rate": 3.5183603757472247e-07, - "loss": 1.1143, - "step": 206 - }, - { - "epoch": 0.01, - "learning_rate": 3.535439795046968e-07, - "loss": 1.2773, - "step": 207 - }, - { - "epoch": 0.01, - "learning_rate": 3.552519214346712e-07, - "loss": 1.0332, - "step": 208 - }, - { - "epoch": 0.01, - "learning_rate": 3.569598633646456e-07, - "loss": 1.0371, - "step": 209 - }, - { - "epoch": 0.01, - "learning_rate": 3.5866780529462e-07, - "loss": 0.8853, - "step": 210 - }, - { - "epoch": 0.01, - "learning_rate": 3.6037574722459437e-07, - "loss": 1.1816, - "step": 211 - }, - { - "epoch": 0.01, - "learning_rate": 3.620836891545687e-07, - "loss": 1.1865, - "step": 212 - }, - { - "epoch": 0.01, - "learning_rate": 3.637916310845431e-07, - "loss": 1.2402, - "step": 213 - }, - { - "epoch": 0.01, - "learning_rate": 3.654995730145175e-07, - "loss": 1.1846, - "step": 214 - }, - { - "epoch": 0.01, - "learning_rate": 3.6720751494449187e-07, - "loss": 1.2129, - "step": 215 - }, - { - "epoch": 0.01, - "learning_rate": 3.6891545687446626e-07, - "loss": 1.1211, - "step": 216 - }, - { - "epoch": 0.01, - "learning_rate": 3.7062339880444065e-07, - "loss": 1.002, - "step": 217 - }, - { - "epoch": 0.01, - "learning_rate": 3.7233134073441504e-07, - "loss": 0.915, - "step": 218 - }, - { - "epoch": 0.01, - "learning_rate": 3.7403928266438937e-07, - "loss": 1.1201, - "step": 219 - }, - { - "epoch": 0.01, - "learning_rate": 3.7574722459436376e-07, - "loss": 1.0869, - "step": 220 - }, - { - "epoch": 0.01, - "learning_rate": 3.7745516652433815e-07, - "loss": 1.0088, - "step": 221 - }, - { - "epoch": 0.01, - "learning_rate": 3.7916310845431254e-07, - "loss": 0.9395, - "step": 222 - }, - { - "epoch": 0.01, - "learning_rate": 3.8087105038428693e-07, - "loss": 1.1514, - "step": 223 - }, - { - "epoch": 0.01, - "learning_rate": 3.8257899231426127e-07, - "loss": 0.9434, - "step": 224 - }, - { - "epoch": 0.01, - "learning_rate": 3.842869342442357e-07, - "loss": 0.9873, - "step": 225 - }, - { - "epoch": 0.01, - "learning_rate": 3.8599487617421004e-07, - "loss": 1.1006, - "step": 226 - }, - { - "epoch": 0.01, - "learning_rate": 3.8770281810418443e-07, - "loss": 1.0166, - "step": 227 - }, - { - "epoch": 0.01, - "learning_rate": 3.894107600341588e-07, - "loss": 1.2129, - "step": 228 - }, - { - "epoch": 0.01, - "learning_rate": 3.911187019641332e-07, - "loss": 1.1572, - "step": 229 - }, - { - "epoch": 0.01, - "learning_rate": 3.928266438941076e-07, - "loss": 0.9033, - "step": 230 - }, - { - "epoch": 0.01, - "learning_rate": 3.9453458582408194e-07, - "loss": 0.959, - "step": 231 - }, - { - "epoch": 0.01, - "learning_rate": 3.962425277540564e-07, - "loss": 1.1064, - "step": 232 - }, - { - "epoch": 0.01, - "learning_rate": 3.979504696840307e-07, - "loss": 1.1416, - "step": 233 - }, - { - "epoch": 0.01, - "learning_rate": 3.996584116140051e-07, - "loss": 1.3711, - "step": 234 - }, - { - "epoch": 0.01, - "learning_rate": 4.0136635354397944e-07, - "loss": 1.043, - "step": 235 - }, - { - "epoch": 0.01, - "learning_rate": 4.030742954739539e-07, - "loss": 1.0303, - "step": 236 - }, - { - "epoch": 0.01, - "learning_rate": 4.0478223740392827e-07, - "loss": 0.8579, - "step": 237 - }, - { - "epoch": 0.01, - "learning_rate": 4.064901793339026e-07, - "loss": 1.1992, - "step": 238 - }, - { - "epoch": 0.01, - "learning_rate": 4.08198121263877e-07, - "loss": 0.8105, - "step": 239 - }, - { - "epoch": 0.01, - "learning_rate": 4.099060631938514e-07, - "loss": 1.0303, - "step": 240 - }, - { - "epoch": 0.01, - "learning_rate": 4.116140051238258e-07, - "loss": 1.0039, - "step": 241 - }, - { - "epoch": 0.01, - "learning_rate": 4.133219470538001e-07, - "loss": 1.3086, - "step": 242 - }, - { - "epoch": 0.01, - "learning_rate": 4.1502988898377455e-07, - "loss": 1.1338, - "step": 243 - }, - { - "epoch": 0.01, - "learning_rate": 4.1673783091374894e-07, - "loss": 1.0273, - "step": 244 - }, - { - "epoch": 0.01, - "learning_rate": 4.184457728437233e-07, - "loss": 0.9795, - "step": 245 - }, - { - "epoch": 0.01, - "learning_rate": 4.2015371477369767e-07, - "loss": 0.9775, - "step": 246 - }, - { - "epoch": 0.01, - "learning_rate": 4.2186165670367206e-07, - "loss": 1.1836, - "step": 247 - }, - { - "epoch": 0.01, - "learning_rate": 4.2356959863364645e-07, - "loss": 1.1309, - "step": 248 - }, - { - "epoch": 0.01, - "learning_rate": 4.252775405636208e-07, - "loss": 1.1484, - "step": 249 - }, - { - "epoch": 0.01, - "learning_rate": 4.2698548249359517e-07, - "loss": 0.7554, - "step": 250 - }, - { - "epoch": 0.01, - "learning_rate": 4.286934244235696e-07, - "loss": 0.9375, - "step": 251 - }, - { - "epoch": 0.01, - "learning_rate": 4.3040136635354395e-07, - "loss": 1.1152, - "step": 252 - }, - { - "epoch": 0.01, - "learning_rate": 4.3210930828351834e-07, - "loss": 0.9209, - "step": 253 - }, - { - "epoch": 0.01, - "learning_rate": 4.3381725021349273e-07, - "loss": 0.9922, - "step": 254 - }, - { - "epoch": 0.01, - "learning_rate": 4.355251921434671e-07, - "loss": 1.0566, - "step": 255 - }, - { - "epoch": 0.01, - "learning_rate": 4.3723313407344145e-07, - "loss": 1.0693, - "step": 256 - }, - { - "epoch": 0.01, - "learning_rate": 4.3894107600341584e-07, - "loss": 1.0098, - "step": 257 - }, - { - "epoch": 0.01, - "learning_rate": 4.406490179333903e-07, - "loss": 1.2002, - "step": 258 - }, - { - "epoch": 0.01, - "learning_rate": 4.423569598633646e-07, - "loss": 1.0488, - "step": 259 - }, - { - "epoch": 0.01, - "learning_rate": 4.44064901793339e-07, - "loss": 1.1133, - "step": 260 - }, - { - "epoch": 0.01, - "learning_rate": 4.4577284372331335e-07, - "loss": 1.0498, - "step": 261 - }, - { - "epoch": 0.01, - "learning_rate": 4.474807856532878e-07, - "loss": 0.9395, - "step": 262 - }, - { - "epoch": 0.01, - "learning_rate": 4.491887275832621e-07, - "loss": 1.0898, - "step": 263 - }, - { - "epoch": 0.01, - "learning_rate": 4.508966695132365e-07, - "loss": 1.3242, - "step": 264 - }, - { - "epoch": 0.01, - "learning_rate": 4.5260461144321096e-07, - "loss": 0.8994, - "step": 265 - }, - { - "epoch": 0.01, - "learning_rate": 4.543125533731853e-07, - "loss": 1.0664, - "step": 266 - }, - { - "epoch": 0.01, - "learning_rate": 4.560204953031597e-07, - "loss": 0.8447, - "step": 267 - }, - { - "epoch": 0.01, - "learning_rate": 4.57728437233134e-07, - "loss": 0.9893, - "step": 268 - }, - { - "epoch": 0.01, - "learning_rate": 4.5943637916310846e-07, - "loss": 1.0898, - "step": 269 - }, - { - "epoch": 0.01, - "learning_rate": 4.611443210930828e-07, - "loss": 1.2002, - "step": 270 - }, - { - "epoch": 0.01, - "learning_rate": 4.628522630230572e-07, - "loss": 0.9106, - "step": 271 - }, - { - "epoch": 0.01, - "learning_rate": 4.645602049530316e-07, - "loss": 1.2363, - "step": 272 - }, - { - "epoch": 0.01, - "learning_rate": 4.6626814688300596e-07, - "loss": 1.3057, - "step": 273 - }, - { - "epoch": 0.01, - "learning_rate": 4.6797608881298035e-07, - "loss": 0.9131, - "step": 274 - }, - { - "epoch": 0.01, - "learning_rate": 4.696840307429547e-07, - "loss": 1.0869, - "step": 275 - }, - { - "epoch": 0.01, - "learning_rate": 4.713919726729291e-07, - "loss": 1.0244, - "step": 276 - }, - { - "epoch": 0.01, - "learning_rate": 4.730999146029035e-07, - "loss": 1.0195, - "step": 277 - }, - { - "epoch": 0.01, - "learning_rate": 4.7480785653287786e-07, - "loss": 1.0977, - "step": 278 - }, - { - "epoch": 0.01, - "learning_rate": 4.7651579846285225e-07, - "loss": 0.9365, - "step": 279 - }, - { - "epoch": 0.01, - "learning_rate": 4.782237403928266e-07, - "loss": 1.2754, - "step": 280 - }, - { - "epoch": 0.01, - "learning_rate": 4.79931682322801e-07, - "loss": 1.0928, - "step": 281 - }, - { - "epoch": 0.01, - "learning_rate": 4.816396242527754e-07, - "loss": 1.1465, - "step": 282 - }, - { - "epoch": 0.01, - "learning_rate": 4.833475661827497e-07, - "loss": 0.856, - "step": 283 - }, - { - "epoch": 0.01, - "learning_rate": 4.850555081127242e-07, - "loss": 1.1621, - "step": 284 - }, - { - "epoch": 0.01, - "learning_rate": 4.867634500426985e-07, - "loss": 1.0645, - "step": 285 - }, - { - "epoch": 0.01, - "learning_rate": 4.884713919726729e-07, - "loss": 1.0635, - "step": 286 - }, - { - "epoch": 0.01, - "learning_rate": 4.901793339026473e-07, - "loss": 1.1826, - "step": 287 - }, - { - "epoch": 0.01, - "learning_rate": 4.918872758326216e-07, - "loss": 0.9922, - "step": 288 - }, - { - "epoch": 0.01, - "learning_rate": 4.935952177625961e-07, - "loss": 1.2051, - "step": 289 - }, - { - "epoch": 0.01, - "learning_rate": 4.953031596925704e-07, - "loss": 1.0996, - "step": 290 - }, - { - "epoch": 0.01, - "learning_rate": 4.970111016225449e-07, - "loss": 1.1465, - "step": 291 - }, - { - "epoch": 0.01, - "learning_rate": 4.987190435525192e-07, - "loss": 0.959, - "step": 292 - }, - { - "epoch": 0.01, - "learning_rate": 5.004269854824936e-07, - "loss": 1.0752, - "step": 293 - }, - { - "epoch": 0.01, - "learning_rate": 5.02134927412468e-07, - "loss": 1.0166, - "step": 294 - }, - { - "epoch": 0.01, - "learning_rate": 5.038428693424423e-07, - "loss": 1.1826, - "step": 295 - }, - { - "epoch": 0.01, - "learning_rate": 5.055508112724168e-07, - "loss": 1.1201, - "step": 296 - }, - { - "epoch": 0.01, - "learning_rate": 5.072587532023911e-07, - "loss": 1.1641, - "step": 297 - }, - { - "epoch": 0.01, - "learning_rate": 5.089666951323654e-07, - "loss": 0.9453, - "step": 298 - }, - { - "epoch": 0.01, - "learning_rate": 5.106746370623399e-07, - "loss": 1.1025, - "step": 299 - }, - { - "epoch": 0.01, - "learning_rate": 5.123825789923142e-07, - "loss": 1.1543, - "step": 300 - }, - { - "epoch": 0.01, - "learning_rate": 5.140905209222886e-07, - "loss": 1.0498, - "step": 301 - }, - { - "epoch": 0.01, - "learning_rate": 5.15798462852263e-07, - "loss": 0.9502, - "step": 302 - }, - { - "epoch": 0.01, - "learning_rate": 5.175064047822374e-07, - "loss": 1.1162, - "step": 303 - }, - { - "epoch": 0.01, - "learning_rate": 5.192143467122118e-07, - "loss": 0.8975, - "step": 304 - }, - { - "epoch": 0.01, - "learning_rate": 5.209222886421861e-07, - "loss": 1.4521, - "step": 305 - }, - { - "epoch": 0.01, - "learning_rate": 5.226302305721605e-07, - "loss": 1.1406, - "step": 306 - }, - { - "epoch": 0.01, - "learning_rate": 5.243381725021349e-07, - "loss": 1.1289, - "step": 307 - }, - { - "epoch": 0.01, - "learning_rate": 5.260461144321093e-07, - "loss": 1.064, - "step": 308 - }, - { - "epoch": 0.01, - "learning_rate": 5.277540563620837e-07, - "loss": 0.9507, - "step": 309 - }, - { - "epoch": 0.01, - "learning_rate": 5.294619982920581e-07, - "loss": 1.1094, - "step": 310 - }, - { - "epoch": 0.01, - "learning_rate": 5.311699402220324e-07, - "loss": 0.9355, - "step": 311 - }, - { - "epoch": 0.01, - "learning_rate": 5.328778821520068e-07, - "loss": 1.1289, - "step": 312 - }, - { - "epoch": 0.01, - "learning_rate": 5.345858240819812e-07, - "loss": 1.2461, - "step": 313 - }, - { - "epoch": 0.01, - "learning_rate": 5.362937660119555e-07, - "loss": 1.1348, - "step": 314 - }, - { - "epoch": 0.01, - "learning_rate": 5.3800170794193e-07, - "loss": 0.9053, - "step": 315 - }, - { - "epoch": 0.01, - "learning_rate": 5.397096498719043e-07, - "loss": 1.1006, - "step": 316 - }, - { - "epoch": 0.01, - "learning_rate": 5.414175918018788e-07, - "loss": 1.0391, - "step": 317 - }, - { - "epoch": 0.01, - "learning_rate": 5.431255337318531e-07, - "loss": 0.9883, - "step": 318 - }, - { - "epoch": 0.01, - "learning_rate": 5.448334756618274e-07, - "loss": 1.1436, - "step": 319 - }, - { - "epoch": 0.01, - "learning_rate": 5.465414175918019e-07, - "loss": 1.0342, - "step": 320 - }, - { - "epoch": 0.01, - "learning_rate": 5.482493595217762e-07, - "loss": 0.8926, - "step": 321 - }, - { - "epoch": 0.01, - "learning_rate": 5.499573014517506e-07, - "loss": 0.9258, - "step": 322 - }, - { - "epoch": 0.01, - "learning_rate": 5.51665243381725e-07, - "loss": 0.9902, - "step": 323 - }, - { - "epoch": 0.01, - "learning_rate": 5.533731853116994e-07, - "loss": 0.9766, - "step": 324 - }, - { - "epoch": 0.01, - "learning_rate": 5.550811272416738e-07, - "loss": 1.0791, - "step": 325 - }, - { - "epoch": 0.01, - "learning_rate": 5.567890691716481e-07, - "loss": 0.8574, - "step": 326 - }, - { - "epoch": 0.01, - "learning_rate": 5.584970111016226e-07, - "loss": 1.1416, - "step": 327 - }, - { - "epoch": 0.01, - "learning_rate": 5.602049530315969e-07, - "loss": 1.0605, - "step": 328 - }, - { - "epoch": 0.01, - "learning_rate": 5.619128949615712e-07, - "loss": 0.9629, - "step": 329 - }, - { - "epoch": 0.01, - "learning_rate": 5.636208368915457e-07, - "loss": 1.3828, - "step": 330 - }, - { - "epoch": 0.01, - "learning_rate": 5.653287788215201e-07, - "loss": 1.0889, - "step": 331 - }, - { - "epoch": 0.01, - "learning_rate": 5.670367207514944e-07, - "loss": 1.0586, - "step": 332 - }, - { - "epoch": 0.01, - "learning_rate": 5.687446626814688e-07, - "loss": 1.0518, - "step": 333 - }, - { - "epoch": 0.01, - "learning_rate": 5.704526046114432e-07, - "loss": 0.9277, - "step": 334 - }, - { - "epoch": 0.01, - "learning_rate": 5.721605465414176e-07, - "loss": 1.1211, - "step": 335 - }, - { - "epoch": 0.01, - "learning_rate": 5.738684884713919e-07, - "loss": 1.084, - "step": 336 - }, - { - "epoch": 0.01, - "learning_rate": 5.755764304013662e-07, - "loss": 0.9268, - "step": 337 - }, - { - "epoch": 0.01, - "learning_rate": 5.772843723313408e-07, - "loss": 1.1348, - "step": 338 - }, - { - "epoch": 0.01, - "learning_rate": 5.789923142613151e-07, - "loss": 1.0332, - "step": 339 - }, - { - "epoch": 0.01, - "learning_rate": 5.807002561912895e-07, - "loss": 0.8828, - "step": 340 - }, - { - "epoch": 0.01, - "learning_rate": 5.824081981212639e-07, - "loss": 0.8628, - "step": 341 - }, - { - "epoch": 0.01, - "learning_rate": 5.841161400512382e-07, - "loss": 1.0225, - "step": 342 - }, - { - "epoch": 0.01, - "learning_rate": 5.858240819812126e-07, - "loss": 0.6987, - "step": 343 - }, - { - "epoch": 0.01, - "learning_rate": 5.875320239111869e-07, - "loss": 0.9922, - "step": 344 - }, - { - "epoch": 0.01, - "learning_rate": 5.892399658411615e-07, - "loss": 0.9609, - "step": 345 - }, - { - "epoch": 0.01, - "learning_rate": 5.909479077711358e-07, - "loss": 1.0303, - "step": 346 - }, - { - "epoch": 0.01, - "learning_rate": 5.926558497011101e-07, - "loss": 1.0186, - "step": 347 - }, - { - "epoch": 0.01, - "learning_rate": 5.943637916310846e-07, - "loss": 0.9668, - "step": 348 - }, - { - "epoch": 0.01, - "learning_rate": 5.960717335610589e-07, - "loss": 1.0811, - "step": 349 - }, - { - "epoch": 0.01, - "learning_rate": 5.977796754910332e-07, - "loss": 1.0498, - "step": 350 - }, - { - "epoch": 0.01, - "learning_rate": 5.994876174210076e-07, - "loss": 1.2266, - "step": 351 - }, - { - "epoch": 0.01, - "learning_rate": 6.01195559350982e-07, - "loss": 1.1455, - "step": 352 - }, - { - "epoch": 0.01, - "learning_rate": 6.029035012809565e-07, - "loss": 0.8936, - "step": 353 - }, - { - "epoch": 0.01, - "learning_rate": 6.046114432109308e-07, - "loss": 0.9014, - "step": 354 - }, - { - "epoch": 0.01, - "learning_rate": 6.063193851409052e-07, - "loss": 0.9902, - "step": 355 - }, - { - "epoch": 0.01, - "learning_rate": 6.080273270708796e-07, - "loss": 1.1016, - "step": 356 - }, - { - "epoch": 0.01, - "learning_rate": 6.097352690008539e-07, - "loss": 0.9785, - "step": 357 - }, - { - "epoch": 0.01, - "learning_rate": 6.114432109308282e-07, - "loss": 0.9844, - "step": 358 - }, - { - "epoch": 0.01, - "learning_rate": 6.131511528608027e-07, - "loss": 1.0771, - "step": 359 - }, - { - "epoch": 0.01, - "learning_rate": 6.148590947907771e-07, - "loss": 0.9385, - "step": 360 - }, - { - "epoch": 0.01, - "learning_rate": 6.165670367207515e-07, - "loss": 0.9951, - "step": 361 - }, - { - "epoch": 0.01, - "learning_rate": 6.182749786507259e-07, - "loss": 1.0596, - "step": 362 - }, - { - "epoch": 0.01, - "learning_rate": 6.199829205807002e-07, - "loss": 0.8716, - "step": 363 - }, - { - "epoch": 0.01, - "learning_rate": 6.216908625106746e-07, - "loss": 0.9834, - "step": 364 - }, - { - "epoch": 0.01, - "learning_rate": 6.233988044406489e-07, - "loss": 1.1426, - "step": 365 - }, - { - "epoch": 0.01, - "learning_rate": 6.251067463706234e-07, - "loss": 1.0342, - "step": 366 - }, - { - "epoch": 0.01, - "learning_rate": 6.268146883005978e-07, - "loss": 1.1494, - "step": 367 - }, - { - "epoch": 0.01, - "learning_rate": 6.285226302305721e-07, - "loss": 1.1699, - "step": 368 - }, - { - "epoch": 0.01, - "learning_rate": 6.302305721605466e-07, - "loss": 1.1826, - "step": 369 - }, - { - "epoch": 0.01, - "learning_rate": 6.319385140905209e-07, - "loss": 0.9854, - "step": 370 - }, - { - "epoch": 0.01, - "learning_rate": 6.336464560204953e-07, - "loss": 0.8887, - "step": 371 - }, - { - "epoch": 0.01, - "learning_rate": 6.353543979504696e-07, - "loss": 0.7451, - "step": 372 - }, - { - "epoch": 0.01, - "learning_rate": 6.37062339880444e-07, - "loss": 0.9766, - "step": 373 - }, - { - "epoch": 0.01, - "learning_rate": 6.387702818104184e-07, - "loss": 1.3242, - "step": 374 - }, - { - "epoch": 0.01, - "learning_rate": 6.404782237403928e-07, - "loss": 1.0547, - "step": 375 - }, - { - "epoch": 0.01, - "learning_rate": 6.421861656703673e-07, - "loss": 0.9727, - "step": 376 - }, - { - "epoch": 0.01, - "learning_rate": 6.438941076003416e-07, - "loss": 0.6865, - "step": 377 - }, - { - "epoch": 0.01, - "learning_rate": 6.456020495303159e-07, - "loss": 0.9463, - "step": 378 - }, - { - "epoch": 0.01, - "learning_rate": 6.473099914602903e-07, - "loss": 0.9258, - "step": 379 - }, - { - "epoch": 0.01, - "learning_rate": 6.490179333902647e-07, - "loss": 1.1016, - "step": 380 - }, - { - "epoch": 0.01, - "learning_rate": 6.50725875320239e-07, - "loss": 0.9629, - "step": 381 - }, - { - "epoch": 0.01, - "learning_rate": 6.524338172502135e-07, - "loss": 0.9453, - "step": 382 - }, - { - "epoch": 0.01, - "learning_rate": 6.541417591801879e-07, - "loss": 0.8516, - "step": 383 - }, - { - "epoch": 0.01, - "learning_rate": 6.558497011101623e-07, - "loss": 0.9092, - "step": 384 - }, - { - "epoch": 0.01, - "learning_rate": 6.575576430401366e-07, - "loss": 1.1934, - "step": 385 - }, - { - "epoch": 0.01, - "learning_rate": 6.592655849701109e-07, - "loss": 1.0176, - "step": 386 - }, - { - "epoch": 0.01, - "learning_rate": 6.609735269000854e-07, - "loss": 0.9209, - "step": 387 - }, - { - "epoch": 0.01, - "learning_rate": 6.626814688300597e-07, - "loss": 0.8428, - "step": 388 - }, - { - "epoch": 0.01, - "learning_rate": 6.64389410760034e-07, - "loss": 1.083, - "step": 389 - }, - { - "epoch": 0.01, - "learning_rate": 6.660973526900086e-07, - "loss": 1.0059, - "step": 390 - }, - { - "epoch": 0.01, - "learning_rate": 6.678052946199829e-07, - "loss": 0.9551, - "step": 391 - }, - { - "epoch": 0.01, - "learning_rate": 6.695132365499573e-07, - "loss": 1.2363, - "step": 392 - }, - { - "epoch": 0.01, - "learning_rate": 6.712211784799316e-07, - "loss": 0.8877, - "step": 393 - }, - { - "epoch": 0.01, - "learning_rate": 6.72929120409906e-07, - "loss": 1.2549, - "step": 394 - }, - { - "epoch": 0.01, - "learning_rate": 6.746370623398804e-07, - "loss": 1.0254, - "step": 395 - }, - { - "epoch": 0.01, - "learning_rate": 6.763450042698547e-07, - "loss": 0.9619, - "step": 396 - }, - { - "epoch": 0.01, - "learning_rate": 6.780529461998293e-07, - "loss": 0.8408, - "step": 397 - }, - { - "epoch": 0.01, - "learning_rate": 6.797608881298036e-07, - "loss": 0.8213, - "step": 398 - }, - { - "epoch": 0.01, - "learning_rate": 6.814688300597779e-07, - "loss": 0.9805, - "step": 399 - }, - { - "epoch": 0.01, - "learning_rate": 6.831767719897523e-07, - "loss": 1.1094, - "step": 400 - }, - { - "epoch": 0.01, - "learning_rate": 6.848847139197267e-07, - "loss": 0.9609, - "step": 401 - }, - { - "epoch": 0.01, - "learning_rate": 6.865926558497011e-07, - "loss": 1.1543, - "step": 402 - }, - { - "epoch": 0.01, - "learning_rate": 6.883005977796754e-07, - "loss": 0.8228, - "step": 403 - }, - { - "epoch": 0.01, - "learning_rate": 6.900085397096499e-07, - "loss": 0.957, - "step": 404 - }, - { - "epoch": 0.01, - "learning_rate": 6.917164816396243e-07, - "loss": 0.9033, - "step": 405 - }, - { - "epoch": 0.01, - "learning_rate": 6.934244235695986e-07, - "loss": 1.1436, - "step": 406 - }, - { - "epoch": 0.01, - "learning_rate": 6.951323654995729e-07, - "loss": 1.1338, - "step": 407 - }, - { - "epoch": 0.01, - "learning_rate": 6.968403074295474e-07, - "loss": 0.9258, - "step": 408 - }, - { - "epoch": 0.01, - "learning_rate": 6.985482493595217e-07, - "loss": 1.0791, - "step": 409 - }, - { - "epoch": 0.01, - "learning_rate": 7.002561912894961e-07, - "loss": 1.166, - "step": 410 - }, - { - "epoch": 0.01, - "learning_rate": 7.019641332194705e-07, - "loss": 1.021, - "step": 411 - }, - { - "epoch": 0.01, - "learning_rate": 7.036720751494449e-07, - "loss": 1.0732, - "step": 412 - }, - { - "epoch": 0.01, - "learning_rate": 7.053800170794193e-07, - "loss": 1.0522, - "step": 413 - }, - { - "epoch": 0.01, - "learning_rate": 7.070879590093936e-07, - "loss": 1.0146, - "step": 414 - }, - { - "epoch": 0.01, - "learning_rate": 7.087959009393681e-07, - "loss": 0.9131, - "step": 415 - }, - { - "epoch": 0.01, - "learning_rate": 7.105038428693424e-07, - "loss": 1.0723, - "step": 416 - }, - { - "epoch": 0.01, - "learning_rate": 7.122117847993167e-07, - "loss": 0.814, - "step": 417 - }, - { - "epoch": 0.01, - "learning_rate": 7.139197267292912e-07, - "loss": 1.2051, - "step": 418 - }, - { - "epoch": 0.01, - "learning_rate": 7.156276686592656e-07, - "loss": 0.9053, - "step": 419 - }, - { - "epoch": 0.01, - "learning_rate": 7.1733561058924e-07, - "loss": 0.8457, - "step": 420 - }, - { - "epoch": 0.01, - "learning_rate": 7.190435525192143e-07, - "loss": 1.0205, - "step": 421 - }, - { - "epoch": 0.01, - "learning_rate": 7.207514944491887e-07, - "loss": 1.1445, - "step": 422 - }, - { - "epoch": 0.01, - "learning_rate": 7.224594363791631e-07, - "loss": 0.9727, - "step": 423 - }, - { - "epoch": 0.01, - "learning_rate": 7.241673783091374e-07, - "loss": 1.2812, - "step": 424 - }, - { - "epoch": 0.01, - "learning_rate": 7.258753202391118e-07, - "loss": 1.1436, - "step": 425 - }, - { - "epoch": 0.01, - "learning_rate": 7.275832621690862e-07, - "loss": 1.0098, - "step": 426 - }, - { - "epoch": 0.01, - "learning_rate": 7.292912040990606e-07, - "loss": 0.9795, - "step": 427 - }, - { - "epoch": 0.01, - "learning_rate": 7.30999146029035e-07, - "loss": 1.0107, - "step": 428 - }, - { - "epoch": 0.01, - "learning_rate": 7.327070879590094e-07, - "loss": 0.9326, - "step": 429 - }, - { - "epoch": 0.01, - "learning_rate": 7.344150298889837e-07, - "loss": 0.811, - "step": 430 - }, - { - "epoch": 0.01, - "learning_rate": 7.361229718189581e-07, - "loss": 1.0801, - "step": 431 - }, - { - "epoch": 0.01, - "learning_rate": 7.378309137489325e-07, - "loss": 1.0322, - "step": 432 - }, - { - "epoch": 0.01, - "learning_rate": 7.395388556789069e-07, - "loss": 0.8447, - "step": 433 - }, - { - "epoch": 0.01, - "learning_rate": 7.412467976088813e-07, - "loss": 0.916, - "step": 434 - }, - { - "epoch": 0.01, - "learning_rate": 7.429547395388556e-07, - "loss": 1.0225, - "step": 435 - }, - { - "epoch": 0.01, - "learning_rate": 7.446626814688301e-07, - "loss": 0.8467, - "step": 436 - }, - { - "epoch": 0.01, - "learning_rate": 7.463706233988044e-07, - "loss": 1.0645, - "step": 437 - }, - { - "epoch": 0.01, - "learning_rate": 7.480785653287787e-07, - "loss": 1.2012, - "step": 438 - }, - { - "epoch": 0.01, - "learning_rate": 7.497865072587532e-07, - "loss": 1.2334, - "step": 439 - }, - { - "epoch": 0.01, - "learning_rate": 7.514944491887275e-07, - "loss": 0.9316, - "step": 440 - }, - { - "epoch": 0.01, - "learning_rate": 7.53202391118702e-07, - "loss": 0.9658, - "step": 441 - }, - { - "epoch": 0.01, - "learning_rate": 7.549103330486763e-07, - "loss": 0.9922, - "step": 442 - }, - { - "epoch": 0.01, - "learning_rate": 7.566182749786507e-07, - "loss": 1.0156, - "step": 443 - }, - { - "epoch": 0.01, - "learning_rate": 7.583262169086251e-07, - "loss": 1.0127, - "step": 444 - }, - { - "epoch": 0.01, - "learning_rate": 7.600341588385994e-07, - "loss": 0.918, - "step": 445 - }, - { - "epoch": 0.01, - "learning_rate": 7.617421007685739e-07, - "loss": 1.0498, - "step": 446 - }, - { - "epoch": 0.01, - "learning_rate": 7.634500426985482e-07, - "loss": 0.959, - "step": 447 - }, - { - "epoch": 0.01, - "learning_rate": 7.651579846285225e-07, - "loss": 0.9277, - "step": 448 - }, - { - "epoch": 0.01, - "learning_rate": 7.66865926558497e-07, - "loss": 0.9609, - "step": 449 - }, - { - "epoch": 0.01, - "learning_rate": 7.685738684884714e-07, - "loss": 0.7563, - "step": 450 - }, - { - "epoch": 0.01, - "learning_rate": 7.702818104184458e-07, - "loss": 1.3008, - "step": 451 - }, - { - "epoch": 0.01, - "learning_rate": 7.719897523484201e-07, - "loss": 1.2383, - "step": 452 - }, - { - "epoch": 0.01, - "learning_rate": 7.736976942783945e-07, - "loss": 0.9932, - "step": 453 - }, - { - "epoch": 0.01, - "learning_rate": 7.754056362083689e-07, - "loss": 1.0752, - "step": 454 - }, - { - "epoch": 0.01, - "learning_rate": 7.771135781383432e-07, - "loss": 0.9736, - "step": 455 - }, - { - "epoch": 0.01, - "learning_rate": 7.788215200683176e-07, - "loss": 1.2686, - "step": 456 - }, - { - "epoch": 0.01, - "learning_rate": 7.805294619982921e-07, - "loss": 1.0439, - "step": 457 - }, - { - "epoch": 0.01, - "learning_rate": 7.822374039282664e-07, - "loss": 1.0811, - "step": 458 - }, - { - "epoch": 0.01, - "learning_rate": 7.839453458582408e-07, - "loss": 1.1406, - "step": 459 - }, - { - "epoch": 0.01, - "learning_rate": 7.856532877882152e-07, - "loss": 1.0122, - "step": 460 - }, - { - "epoch": 0.01, - "learning_rate": 7.873612297181895e-07, - "loss": 1.1104, - "step": 461 - }, - { - "epoch": 0.01, - "learning_rate": 7.890691716481639e-07, - "loss": 1.0459, - "step": 462 - }, - { - "epoch": 0.01, - "learning_rate": 7.907771135781382e-07, - "loss": 0.9883, - "step": 463 - }, - { - "epoch": 0.01, - "learning_rate": 7.924850555081128e-07, - "loss": 1.207, - "step": 464 - }, - { - "epoch": 0.01, - "learning_rate": 7.941929974380871e-07, - "loss": 0.9541, - "step": 465 - }, - { - "epoch": 0.01, - "learning_rate": 7.959009393680614e-07, - "loss": 1.0352, - "step": 466 - }, - { - "epoch": 0.01, - "learning_rate": 7.976088812980359e-07, - "loss": 0.9136, - "step": 467 - }, - { - "epoch": 0.01, - "learning_rate": 7.993168232280102e-07, - "loss": 1.0059, - "step": 468 - }, - { - "epoch": 0.01, - "learning_rate": 8.010247651579845e-07, - "loss": 0.8223, - "step": 469 - }, - { - "epoch": 0.01, - "learning_rate": 8.027327070879589e-07, - "loss": 0.8262, - "step": 470 - }, - { - "epoch": 0.01, - "learning_rate": 8.044406490179334e-07, - "loss": 1.0186, - "step": 471 - }, - { - "epoch": 0.01, - "learning_rate": 8.061485909479078e-07, - "loss": 0.7524, - "step": 472 - }, - { - "epoch": 0.01, - "learning_rate": 8.078565328778821e-07, - "loss": 0.8809, - "step": 473 - }, - { - "epoch": 0.01, - "learning_rate": 8.095644748078565e-07, - "loss": 0.8242, - "step": 474 - }, - { - "epoch": 0.01, - "learning_rate": 8.112724167378309e-07, - "loss": 1.0674, - "step": 475 - }, - { - "epoch": 0.01, - "learning_rate": 8.129803586678052e-07, - "loss": 1.0117, - "step": 476 - }, - { - "epoch": 0.01, - "learning_rate": 8.146883005977796e-07, - "loss": 1.0762, - "step": 477 - }, - { - "epoch": 0.01, - "learning_rate": 8.16396242527754e-07, - "loss": 0.9668, - "step": 478 - }, - { - "epoch": 0.01, - "learning_rate": 8.181041844577284e-07, - "loss": 1.0527, - "step": 479 - }, - { - "epoch": 0.01, - "learning_rate": 8.198121263877028e-07, - "loss": 1.0928, - "step": 480 - }, - { - "epoch": 0.01, - "learning_rate": 8.215200683176772e-07, - "loss": 1.1113, - "step": 481 - }, - { - "epoch": 0.01, - "learning_rate": 8.232280102476516e-07, - "loss": 0.8477, - "step": 482 - }, - { - "epoch": 0.01, - "learning_rate": 8.249359521776259e-07, - "loss": 0.9634, - "step": 483 - }, - { - "epoch": 0.01, - "learning_rate": 8.266438941076002e-07, - "loss": 0.9795, - "step": 484 - }, - { - "epoch": 0.01, - "learning_rate": 8.283518360375747e-07, - "loss": 1.0674, - "step": 485 - }, - { - "epoch": 0.01, - "learning_rate": 8.300597779675491e-07, - "loss": 1.0791, - "step": 486 - }, - { - "epoch": 0.01, - "learning_rate": 8.317677198975234e-07, - "loss": 1.0176, - "step": 487 - }, - { - "epoch": 0.01, - "learning_rate": 8.334756618274979e-07, - "loss": 0.9053, - "step": 488 - }, - { - "epoch": 0.01, - "learning_rate": 8.351836037574722e-07, - "loss": 0.9131, - "step": 489 - }, - { - "epoch": 0.01, - "learning_rate": 8.368915456874466e-07, - "loss": 1.2344, - "step": 490 - }, - { - "epoch": 0.01, - "learning_rate": 8.385994876174209e-07, - "loss": 1.0029, - "step": 491 - }, - { - "epoch": 0.01, - "learning_rate": 8.403074295473953e-07, - "loss": 1.0283, - "step": 492 - }, - { - "epoch": 0.01, - "learning_rate": 8.420153714773698e-07, - "loss": 0.9668, - "step": 493 - }, - { - "epoch": 0.01, - "learning_rate": 8.437233134073441e-07, - "loss": 1.2949, - "step": 494 - }, - { - "epoch": 0.01, - "learning_rate": 8.454312553373186e-07, - "loss": 1.0537, - "step": 495 - }, - { - "epoch": 0.01, - "learning_rate": 8.471391972672929e-07, - "loss": 1.0264, - "step": 496 - }, - { - "epoch": 0.01, - "learning_rate": 8.488471391972672e-07, - "loss": 0.9355, - "step": 497 - }, - { - "epoch": 0.01, - "learning_rate": 8.505550811272416e-07, - "loss": 1.123, - "step": 498 - }, - { - "epoch": 0.01, - "learning_rate": 8.52263023057216e-07, - "loss": 0.9248, - "step": 499 - }, - { - "epoch": 0.01, - "learning_rate": 8.539709649871903e-07, - "loss": 1.0684, - "step": 500 - }, - { - "epoch": 0.01, - "learning_rate": 8.556789069171648e-07, - "loss": 0.9834, - "step": 501 - }, - { - "epoch": 0.01, - "learning_rate": 8.573868488471392e-07, - "loss": 0.9893, - "step": 502 - }, - { - "epoch": 0.01, - "learning_rate": 8.590947907771136e-07, - "loss": 1.1426, - "step": 503 - }, - { - "epoch": 0.01, - "learning_rate": 8.608027327070879e-07, - "loss": 0.8242, - "step": 504 - }, - { - "epoch": 0.01, - "learning_rate": 8.625106746370622e-07, - "loss": 1.1387, - "step": 505 - }, - { - "epoch": 0.01, - "learning_rate": 8.642186165670367e-07, - "loss": 0.833, - "step": 506 - }, - { - "epoch": 0.01, - "learning_rate": 8.65926558497011e-07, - "loss": 1.1562, - "step": 507 - }, - { - "epoch": 0.01, - "learning_rate": 8.676345004269855e-07, - "loss": 0.9736, - "step": 508 - }, - { - "epoch": 0.01, - "learning_rate": 8.693424423569599e-07, - "loss": 1.168, - "step": 509 - }, - { - "epoch": 0.01, - "learning_rate": 8.710503842869342e-07, - "loss": 1.0205, - "step": 510 - }, - { - "epoch": 0.01, - "learning_rate": 8.727583262169086e-07, - "loss": 0.9839, - "step": 511 - }, - { - "epoch": 0.01, - "learning_rate": 8.744662681468829e-07, - "loss": 0.9004, - "step": 512 - }, - { - "epoch": 0.01, - "learning_rate": 8.761742100768573e-07, - "loss": 1.1885, - "step": 513 - }, - { - "epoch": 0.01, - "learning_rate": 8.778821520068317e-07, - "loss": 1.1719, - "step": 514 - }, - { - "epoch": 0.01, - "learning_rate": 8.79590093936806e-07, - "loss": 1.1523, - "step": 515 - }, - { - "epoch": 0.01, - "learning_rate": 8.812980358667806e-07, - "loss": 1.084, - "step": 516 - }, - { - "epoch": 0.01, - "learning_rate": 8.830059777967549e-07, - "loss": 1.209, - "step": 517 - }, - { - "epoch": 0.01, - "learning_rate": 8.847139197267292e-07, - "loss": 0.8115, - "step": 518 - }, - { - "epoch": 0.01, - "learning_rate": 8.864218616567036e-07, - "loss": 1.0215, - "step": 519 - }, - { - "epoch": 0.01, - "learning_rate": 8.88129803586678e-07, - "loss": 1.042, - "step": 520 - }, - { - "epoch": 0.01, - "learning_rate": 8.898377455166524e-07, - "loss": 1.0703, - "step": 521 - }, - { - "epoch": 0.01, - "learning_rate": 8.915456874466267e-07, - "loss": 0.9746, - "step": 522 - }, - { - "epoch": 0.01, - "learning_rate": 8.932536293766012e-07, - "loss": 0.9473, - "step": 523 - }, - { - "epoch": 0.01, - "learning_rate": 8.949615713065756e-07, - "loss": 0.9346, - "step": 524 - }, - { - "epoch": 0.01, - "learning_rate": 8.966695132365499e-07, - "loss": 0.9453, - "step": 525 - }, - { - "epoch": 0.01, - "learning_rate": 8.983774551665242e-07, - "loss": 1.0654, - "step": 526 - }, - { - "epoch": 0.01, - "learning_rate": 9.000853970964987e-07, - "loss": 1.0488, - "step": 527 - }, - { - "epoch": 0.01, - "learning_rate": 9.01793339026473e-07, - "loss": 0.9424, - "step": 528 - }, - { - "epoch": 0.01, - "learning_rate": 9.035012809564474e-07, - "loss": 0.8389, - "step": 529 - }, - { - "epoch": 0.01, - "learning_rate": 9.052092228864219e-07, - "loss": 1.1895, - "step": 530 - }, - { - "epoch": 0.01, - "learning_rate": 9.069171648163962e-07, - "loss": 1.0527, - "step": 531 - }, - { - "epoch": 0.01, - "learning_rate": 9.086251067463706e-07, - "loss": 0.9111, - "step": 532 - }, - { - "epoch": 0.01, - "learning_rate": 9.103330486763449e-07, - "loss": 0.9941, - "step": 533 - }, - { - "epoch": 0.01, - "learning_rate": 9.120409906063194e-07, - "loss": 1.0127, - "step": 534 - }, - { - "epoch": 0.01, - "learning_rate": 9.137489325362937e-07, - "loss": 1.0547, - "step": 535 - }, - { - "epoch": 0.01, - "learning_rate": 9.15456874466268e-07, - "loss": 0.9854, - "step": 536 - }, - { - "epoch": 0.01, - "learning_rate": 9.171648163962425e-07, - "loss": 0.9316, - "step": 537 - }, - { - "epoch": 0.01, - "learning_rate": 9.188727583262169e-07, - "loss": 0.9326, - "step": 538 - }, - { - "epoch": 0.01, - "learning_rate": 9.205807002561913e-07, - "loss": 1.0537, - "step": 539 - }, - { - "epoch": 0.01, - "learning_rate": 9.222886421861656e-07, - "loss": 0.917, - "step": 540 - }, - { - "epoch": 0.01, - "learning_rate": 9.2399658411614e-07, - "loss": 0.9658, - "step": 541 - }, - { - "epoch": 0.01, - "learning_rate": 9.257045260461144e-07, - "loss": 1.0029, - "step": 542 - }, - { - "epoch": 0.01, - "learning_rate": 9.274124679760887e-07, - "loss": 0.9424, - "step": 543 - }, - { - "epoch": 0.01, - "learning_rate": 9.291204099060631e-07, - "loss": 0.8638, - "step": 544 - }, - { - "epoch": 0.01, - "learning_rate": 9.308283518360376e-07, - "loss": 1.0195, - "step": 545 - }, - { - "epoch": 0.01, - "learning_rate": 9.325362937660119e-07, - "loss": 1.0195, - "step": 546 - }, - { - "epoch": 0.01, - "learning_rate": 9.342442356959863e-07, - "loss": 0.9619, - "step": 547 - }, - { - "epoch": 0.01, - "learning_rate": 9.359521776259607e-07, - "loss": 1.2627, - "step": 548 - }, - { - "epoch": 0.01, - "learning_rate": 9.37660119555935e-07, - "loss": 1.0508, - "step": 549 - }, - { - "epoch": 0.01, - "learning_rate": 9.393680614859094e-07, - "loss": 0.7354, - "step": 550 - }, - { - "epoch": 0.01, - "learning_rate": 9.410760034158838e-07, - "loss": 1.0186, - "step": 551 - }, - { - "epoch": 0.01, - "learning_rate": 9.427839453458582e-07, - "loss": 1.0352, - "step": 552 - }, - { - "epoch": 0.01, - "learning_rate": 9.444918872758326e-07, - "loss": 0.9785, - "step": 553 - }, - { - "epoch": 0.01, - "learning_rate": 9.46199829205807e-07, - "loss": 0.9395, - "step": 554 - }, - { - "epoch": 0.01, - "learning_rate": 9.479077711357814e-07, - "loss": 0.959, - "step": 555 - }, - { - "epoch": 0.01, - "learning_rate": 9.496157130657557e-07, - "loss": 0.9268, - "step": 556 - }, - { - "epoch": 0.01, - "learning_rate": 9.5132365499573e-07, - "loss": 0.9746, - "step": 557 - }, - { - "epoch": 0.01, - "learning_rate": 9.530315969257045e-07, - "loss": 0.7124, - "step": 558 - }, - { - "epoch": 0.01, - "learning_rate": 9.547395388556788e-07, - "loss": 0.8438, - "step": 559 - }, - { - "epoch": 0.01, - "learning_rate": 9.564474807856533e-07, - "loss": 1.1055, - "step": 560 - }, - { - "epoch": 0.01, - "learning_rate": 9.581554227156277e-07, - "loss": 0.8066, - "step": 561 - }, - { - "epoch": 0.01, - "learning_rate": 9.59863364645602e-07, - "loss": 0.8984, - "step": 562 - }, - { - "epoch": 0.01, - "learning_rate": 9.615713065755764e-07, - "loss": 0.9697, - "step": 563 - }, - { - "epoch": 0.01, - "learning_rate": 9.632792485055508e-07, - "loss": 0.9766, - "step": 564 - }, - { - "epoch": 0.01, - "learning_rate": 9.64987190435525e-07, - "loss": 1.0391, - "step": 565 - }, - { - "epoch": 0.01, - "learning_rate": 9.666951323654995e-07, - "loss": 0.8633, - "step": 566 - }, - { - "epoch": 0.01, - "learning_rate": 9.68403074295474e-07, - "loss": 1.002, - "step": 567 - }, - { - "epoch": 0.01, - "learning_rate": 9.701110162254484e-07, - "loss": 0.9912, - "step": 568 - }, - { - "epoch": 0.01, - "learning_rate": 9.718189581554226e-07, - "loss": 1.0107, - "step": 569 - }, - { - "epoch": 0.01, - "learning_rate": 9.73526900085397e-07, - "loss": 0.9365, - "step": 570 - }, - { - "epoch": 0.01, - "learning_rate": 9.752348420153715e-07, - "loss": 0.9604, - "step": 571 - }, - { - "epoch": 0.01, - "learning_rate": 9.769427839453457e-07, - "loss": 0.709, - "step": 572 - }, - { - "epoch": 0.01, - "learning_rate": 9.786507258753202e-07, - "loss": 0.8633, - "step": 573 - }, - { - "epoch": 0.01, - "learning_rate": 9.803586678052946e-07, - "loss": 1.0596, - "step": 574 - }, - { - "epoch": 0.01, - "learning_rate": 9.82066609735269e-07, - "loss": 1.1348, - "step": 575 - }, - { - "epoch": 0.01, - "learning_rate": 9.837745516652433e-07, - "loss": 1.0977, - "step": 576 - }, - { - "epoch": 0.01, - "learning_rate": 9.854824935952177e-07, - "loss": 0.7944, - "step": 577 - }, - { - "epoch": 0.01, - "learning_rate": 9.871904355251922e-07, - "loss": 0.9824, - "step": 578 - }, - { - "epoch": 0.01, - "learning_rate": 9.888983774551664e-07, - "loss": 1.0898, - "step": 579 - }, - { - "epoch": 0.01, - "learning_rate": 9.906063193851408e-07, - "loss": 0.8818, - "step": 580 - }, - { - "epoch": 0.01, - "learning_rate": 9.923142613151153e-07, - "loss": 1.1143, - "step": 581 - }, - { - "epoch": 0.01, - "learning_rate": 9.940222032450897e-07, - "loss": 0.8672, - "step": 582 - }, - { - "epoch": 0.01, - "learning_rate": 9.95730145175064e-07, - "loss": 1.0283, - "step": 583 - }, - { - "epoch": 0.01, - "learning_rate": 9.974380871050384e-07, - "loss": 0.8799, - "step": 584 - }, - { - "epoch": 0.01, - "learning_rate": 9.991460290350128e-07, - "loss": 1.1914, - "step": 585 - }, - { - "epoch": 0.02, - "learning_rate": 1.0008539709649873e-06, - "loss": 0.8599, - "step": 586 - }, - { - "epoch": 0.02, - "learning_rate": 1.0025619128949615e-06, - "loss": 1.0684, - "step": 587 - }, - { - "epoch": 0.02, - "learning_rate": 1.004269854824936e-06, - "loss": 1.001, - "step": 588 - }, - { - "epoch": 0.02, - "learning_rate": 1.0059777967549104e-06, - "loss": 0.9033, - "step": 589 - }, - { - "epoch": 0.02, - "learning_rate": 1.0076857386848846e-06, - "loss": 1.1318, - "step": 590 - }, - { - "epoch": 0.02, - "learning_rate": 1.009393680614859e-06, - "loss": 0.8853, - "step": 591 - }, - { - "epoch": 0.02, - "learning_rate": 1.0111016225448335e-06, - "loss": 0.9932, - "step": 592 - }, - { - "epoch": 0.02, - "learning_rate": 1.0128095644748077e-06, - "loss": 0.873, - "step": 593 - }, - { - "epoch": 0.02, - "learning_rate": 1.0145175064047822e-06, - "loss": 1.0547, - "step": 594 - }, - { - "epoch": 0.02, - "learning_rate": 1.0162254483347566e-06, - "loss": 0.9053, - "step": 595 - }, - { - "epoch": 0.02, - "learning_rate": 1.0179333902647309e-06, - "loss": 0.9551, - "step": 596 - }, - { - "epoch": 0.02, - "learning_rate": 1.0196413321947053e-06, - "loss": 1.0186, - "step": 597 - }, - { - "epoch": 0.02, - "learning_rate": 1.0213492741246797e-06, - "loss": 0.9121, - "step": 598 - }, - { - "epoch": 0.02, - "learning_rate": 1.023057216054654e-06, - "loss": 1.0146, - "step": 599 - }, - { - "epoch": 0.02, - "learning_rate": 1.0247651579846284e-06, - "loss": 1.1279, - "step": 600 - }, - { - "epoch": 0.02, - "learning_rate": 1.0264730999146029e-06, - "loss": 0.9238, - "step": 601 - }, - { - "epoch": 0.02, - "learning_rate": 1.0281810418445773e-06, - "loss": 1.0566, - "step": 602 - }, - { - "epoch": 0.02, - "learning_rate": 1.0298889837745517e-06, - "loss": 0.897, - "step": 603 - }, - { - "epoch": 0.02, - "learning_rate": 1.031596925704526e-06, - "loss": 0.9668, - "step": 604 - }, - { - "epoch": 0.02, - "learning_rate": 1.0333048676345004e-06, - "loss": 0.8691, - "step": 605 - }, - { - "epoch": 0.02, - "learning_rate": 1.0350128095644749e-06, - "loss": 0.8613, - "step": 606 - }, - { - "epoch": 0.02, - "learning_rate": 1.036720751494449e-06, - "loss": 1.1328, - "step": 607 - }, - { - "epoch": 0.02, - "learning_rate": 1.0384286934244235e-06, - "loss": 1.043, - "step": 608 - }, - { - "epoch": 0.02, - "learning_rate": 1.040136635354398e-06, - "loss": 0.7407, - "step": 609 - }, - { - "epoch": 0.02, - "learning_rate": 1.0418445772843722e-06, - "loss": 1.1055, - "step": 610 - }, - { - "epoch": 0.02, - "learning_rate": 1.0435525192143466e-06, - "loss": 1.042, - "step": 611 - }, - { - "epoch": 0.02, - "learning_rate": 1.045260461144321e-06, - "loss": 1.0234, - "step": 612 - }, - { - "epoch": 0.02, - "learning_rate": 1.0469684030742953e-06, - "loss": 1.0381, - "step": 613 - }, - { - "epoch": 0.02, - "learning_rate": 1.0486763450042698e-06, - "loss": 0.9014, - "step": 614 - }, - { - "epoch": 0.02, - "learning_rate": 1.050384286934244e-06, - "loss": 0.9463, - "step": 615 - }, - { - "epoch": 0.02, - "learning_rate": 1.0520922288642186e-06, - "loss": 1.1914, - "step": 616 - }, - { - "epoch": 0.02, - "learning_rate": 1.053800170794193e-06, - "loss": 0.9873, - "step": 617 - }, - { - "epoch": 0.02, - "learning_rate": 1.0555081127241673e-06, - "loss": 0.9131, - "step": 618 - }, - { - "epoch": 0.02, - "learning_rate": 1.0572160546541418e-06, - "loss": 1.1064, - "step": 619 - }, - { - "epoch": 0.02, - "learning_rate": 1.0589239965841162e-06, - "loss": 1.1885, - "step": 620 - }, - { - "epoch": 0.02, - "learning_rate": 1.0606319385140904e-06, - "loss": 0.9678, - "step": 621 - }, - { - "epoch": 0.02, - "learning_rate": 1.0623398804440649e-06, - "loss": 0.9121, - "step": 622 - }, - { - "epoch": 0.02, - "learning_rate": 1.0640478223740393e-06, - "loss": 0.9619, - "step": 623 - }, - { - "epoch": 0.02, - "learning_rate": 1.0657557643040135e-06, - "loss": 1.1855, - "step": 624 - }, - { - "epoch": 0.02, - "learning_rate": 1.067463706233988e-06, - "loss": 1.0947, - "step": 625 - }, - { - "epoch": 0.02, - "learning_rate": 1.0691716481639624e-06, - "loss": 1.0938, - "step": 626 - }, - { - "epoch": 0.02, - "learning_rate": 1.0708795900939367e-06, - "loss": 0.6758, - "step": 627 - }, - { - "epoch": 0.02, - "learning_rate": 1.072587532023911e-06, - "loss": 0.9932, - "step": 628 - }, - { - "epoch": 0.02, - "learning_rate": 1.0742954739538853e-06, - "loss": 0.9453, - "step": 629 - }, - { - "epoch": 0.02, - "learning_rate": 1.07600341588386e-06, - "loss": 0.9561, - "step": 630 - }, - { - "epoch": 0.02, - "learning_rate": 1.0777113578138344e-06, - "loss": 0.7319, - "step": 631 - }, - { - "epoch": 0.02, - "learning_rate": 1.0794192997438087e-06, - "loss": 0.9922, - "step": 632 - }, - { - "epoch": 0.02, - "learning_rate": 1.081127241673783e-06, - "loss": 1.0449, - "step": 633 - }, - { - "epoch": 0.02, - "learning_rate": 1.0828351836037575e-06, - "loss": 1.0742, - "step": 634 - }, - { - "epoch": 0.02, - "learning_rate": 1.0845431255337318e-06, - "loss": 1.1143, - "step": 635 - }, - { - "epoch": 0.02, - "learning_rate": 1.0862510674637062e-06, - "loss": 1.1494, - "step": 636 - }, - { - "epoch": 0.02, - "learning_rate": 1.0879590093936807e-06, - "loss": 0.8838, - "step": 637 - }, - { - "epoch": 0.02, - "learning_rate": 1.0896669513236549e-06, - "loss": 0.9619, - "step": 638 - }, - { - "epoch": 0.02, - "learning_rate": 1.0913748932536293e-06, - "loss": 0.915, - "step": 639 - }, - { - "epoch": 0.02, - "learning_rate": 1.0930828351836038e-06, - "loss": 0.9707, - "step": 640 - }, - { - "epoch": 0.02, - "learning_rate": 1.094790777113578e-06, - "loss": 1.0088, - "step": 641 - }, - { - "epoch": 0.02, - "learning_rate": 1.0964987190435524e-06, - "loss": 1.1182, - "step": 642 - }, - { - "epoch": 0.02, - "learning_rate": 1.0982066609735267e-06, - "loss": 1.1133, - "step": 643 - }, - { - "epoch": 0.02, - "learning_rate": 1.0999146029035011e-06, - "loss": 1.0312, - "step": 644 - }, - { - "epoch": 0.02, - "learning_rate": 1.1016225448334758e-06, - "loss": 0.9873, - "step": 645 - }, - { - "epoch": 0.02, - "learning_rate": 1.10333048676345e-06, - "loss": 1.1318, - "step": 646 - }, - { - "epoch": 0.02, - "learning_rate": 1.1050384286934244e-06, - "loss": 0.9844, - "step": 647 - }, - { - "epoch": 0.02, - "learning_rate": 1.1067463706233989e-06, - "loss": 0.9072, - "step": 648 - }, - { - "epoch": 0.02, - "learning_rate": 1.1084543125533731e-06, - "loss": 1.0332, - "step": 649 - }, - { - "epoch": 0.02, - "learning_rate": 1.1101622544833476e-06, - "loss": 0.8164, - "step": 650 - }, - { - "epoch": 0.02, - "learning_rate": 1.111870196413322e-06, - "loss": 0.9629, - "step": 651 - }, - { - "epoch": 0.02, - "learning_rate": 1.1135781383432962e-06, - "loss": 0.6284, - "step": 652 - }, - { - "epoch": 0.02, - "learning_rate": 1.1152860802732707e-06, - "loss": 0.8906, - "step": 653 - }, - { - "epoch": 0.02, - "learning_rate": 1.1169940222032451e-06, - "loss": 1.0557, - "step": 654 - }, - { - "epoch": 0.02, - "learning_rate": 1.1187019641332193e-06, - "loss": 1.0605, - "step": 655 - }, - { - "epoch": 0.02, - "learning_rate": 1.1204099060631938e-06, - "loss": 1.2363, - "step": 656 - }, - { - "epoch": 0.02, - "learning_rate": 1.122117847993168e-06, - "loss": 1.0537, - "step": 657 - }, - { - "epoch": 0.02, - "learning_rate": 1.1238257899231425e-06, - "loss": 0.9785, - "step": 658 - }, - { - "epoch": 0.02, - "learning_rate": 1.125533731853117e-06, - "loss": 0.9521, - "step": 659 - }, - { - "epoch": 0.02, - "learning_rate": 1.1272416737830913e-06, - "loss": 1.0654, - "step": 660 - }, - { - "epoch": 0.02, - "learning_rate": 1.1289496157130658e-06, - "loss": 0.6738, - "step": 661 - }, - { - "epoch": 0.02, - "learning_rate": 1.1306575576430402e-06, - "loss": 0.7402, - "step": 662 - }, - { - "epoch": 0.02, - "learning_rate": 1.1323654995730145e-06, - "loss": 1.084, - "step": 663 - }, - { - "epoch": 0.02, - "learning_rate": 1.134073441502989e-06, - "loss": 0.9072, - "step": 664 - }, - { - "epoch": 0.02, - "learning_rate": 1.1357813834329633e-06, - "loss": 1.0918, - "step": 665 - }, - { - "epoch": 0.02, - "learning_rate": 1.1374893253629376e-06, - "loss": 0.8584, - "step": 666 - }, - { - "epoch": 0.02, - "learning_rate": 1.139197267292912e-06, - "loss": 1.1641, - "step": 667 - }, - { - "epoch": 0.02, - "learning_rate": 1.1409052092228865e-06, - "loss": 0.8535, - "step": 668 - }, - { - "epoch": 0.02, - "learning_rate": 1.1426131511528607e-06, - "loss": 0.9209, - "step": 669 - }, - { - "epoch": 0.02, - "learning_rate": 1.1443210930828351e-06, - "loss": 0.9756, - "step": 670 - }, - { - "epoch": 0.02, - "learning_rate": 1.1460290350128094e-06, - "loss": 1.1562, - "step": 671 - }, - { - "epoch": 0.02, - "learning_rate": 1.1477369769427838e-06, - "loss": 0.9678, - "step": 672 - }, - { - "epoch": 0.02, - "learning_rate": 1.1494449188727582e-06, - "loss": 0.8994, - "step": 673 - }, - { - "epoch": 0.02, - "learning_rate": 1.1511528608027325e-06, - "loss": 0.9141, - "step": 674 - }, - { - "epoch": 0.02, - "learning_rate": 1.1528608027327071e-06, - "loss": 0.8994, - "step": 675 - }, - { - "epoch": 0.02, - "learning_rate": 1.1545687446626816e-06, - "loss": 1.166, - "step": 676 - }, - { - "epoch": 0.02, - "learning_rate": 1.1562766865926558e-06, - "loss": 0.9707, - "step": 677 - }, - { - "epoch": 0.02, - "learning_rate": 1.1579846285226302e-06, - "loss": 1.1758, - "step": 678 - }, - { - "epoch": 0.02, - "learning_rate": 1.1596925704526047e-06, - "loss": 0.9434, - "step": 679 - }, - { - "epoch": 0.02, - "learning_rate": 1.161400512382579e-06, - "loss": 1.0176, - "step": 680 - }, - { - "epoch": 0.02, - "learning_rate": 1.1631084543125534e-06, - "loss": 1.2666, - "step": 681 - }, - { - "epoch": 0.02, - "learning_rate": 1.1648163962425278e-06, - "loss": 1.0596, - "step": 682 - }, - { - "epoch": 0.02, - "learning_rate": 1.166524338172502e-06, - "loss": 0.9473, - "step": 683 - }, - { - "epoch": 0.02, - "learning_rate": 1.1682322801024765e-06, - "loss": 1.0088, - "step": 684 - }, - { - "epoch": 0.02, - "learning_rate": 1.1699402220324507e-06, - "loss": 0.9141, - "step": 685 - }, - { - "epoch": 0.02, - "learning_rate": 1.1716481639624251e-06, - "loss": 1.0713, - "step": 686 - }, - { - "epoch": 0.02, - "learning_rate": 1.1733561058923996e-06, - "loss": 0.9824, - "step": 687 - }, - { - "epoch": 0.02, - "learning_rate": 1.1750640478223738e-06, - "loss": 0.9385, - "step": 688 - }, - { - "epoch": 0.02, - "learning_rate": 1.1767719897523483e-06, - "loss": 1.0166, - "step": 689 - }, - { - "epoch": 0.02, - "learning_rate": 1.178479931682323e-06, - "loss": 0.8662, - "step": 690 - }, - { - "epoch": 0.02, - "learning_rate": 1.1801878736122971e-06, - "loss": 0.9346, - "step": 691 - }, - { - "epoch": 0.02, - "learning_rate": 1.1818958155422716e-06, - "loss": 0.7891, - "step": 692 - }, - { - "epoch": 0.02, - "learning_rate": 1.183603757472246e-06, - "loss": 1.0342, - "step": 693 - }, - { - "epoch": 0.02, - "learning_rate": 1.1853116994022203e-06, - "loss": 0.8042, - "step": 694 - }, - { - "epoch": 0.02, - "learning_rate": 1.1870196413321947e-06, - "loss": 1.0547, - "step": 695 - }, - { - "epoch": 0.02, - "learning_rate": 1.1887275832621691e-06, - "loss": 1.0205, - "step": 696 - }, - { - "epoch": 0.02, - "learning_rate": 1.1904355251921434e-06, - "loss": 0.9878, - "step": 697 - }, - { - "epoch": 0.02, - "learning_rate": 1.1921434671221178e-06, - "loss": 0.9795, - "step": 698 - }, - { - "epoch": 0.02, - "learning_rate": 1.193851409052092e-06, - "loss": 0.9092, - "step": 699 - }, - { - "epoch": 0.02, - "learning_rate": 1.1955593509820665e-06, - "loss": 0.8379, - "step": 700 - }, - { - "epoch": 0.02, - "learning_rate": 1.197267292912041e-06, - "loss": 0.9785, - "step": 701 - }, - { - "epoch": 0.02, - "learning_rate": 1.1989752348420152e-06, - "loss": 1.0195, - "step": 702 - }, - { - "epoch": 0.02, - "learning_rate": 1.2006831767719896e-06, - "loss": 0.8945, - "step": 703 - }, - { - "epoch": 0.02, - "learning_rate": 1.202391118701964e-06, - "loss": 1.0625, - "step": 704 - }, - { - "epoch": 0.02, - "learning_rate": 1.2040990606319385e-06, - "loss": 0.8818, - "step": 705 - }, - { - "epoch": 0.02, - "learning_rate": 1.205807002561913e-06, - "loss": 0.7749, - "step": 706 - }, - { - "epoch": 0.02, - "learning_rate": 1.2075149444918874e-06, - "loss": 1.0859, - "step": 707 - }, - { - "epoch": 0.02, - "learning_rate": 1.2092228864218616e-06, - "loss": 1.1035, - "step": 708 - }, - { - "epoch": 0.02, - "learning_rate": 1.210930828351836e-06, - "loss": 1.083, - "step": 709 - }, - { - "epoch": 0.02, - "learning_rate": 1.2126387702818105e-06, - "loss": 1.1172, - "step": 710 - }, - { - "epoch": 0.02, - "learning_rate": 1.2143467122117847e-06, - "loss": 0.8496, - "step": 711 - }, - { - "epoch": 0.02, - "learning_rate": 1.2160546541417592e-06, - "loss": 0.8213, - "step": 712 - }, - { - "epoch": 0.02, - "learning_rate": 1.2177625960717334e-06, - "loss": 1.0283, - "step": 713 - }, - { - "epoch": 0.02, - "learning_rate": 1.2194705380017078e-06, - "loss": 1.0127, - "step": 714 - }, - { - "epoch": 0.02, - "learning_rate": 1.2211784799316823e-06, - "loss": 0.998, - "step": 715 - }, - { - "epoch": 0.02, - "learning_rate": 1.2228864218616565e-06, - "loss": 1.0264, - "step": 716 - }, - { - "epoch": 0.02, - "learning_rate": 1.224594363791631e-06, - "loss": 0.9131, - "step": 717 - }, - { - "epoch": 0.02, - "learning_rate": 1.2263023057216054e-06, - "loss": 0.9854, - "step": 718 - }, - { - "epoch": 0.02, - "learning_rate": 1.2280102476515798e-06, - "loss": 0.9233, - "step": 719 - }, - { - "epoch": 0.02, - "learning_rate": 1.2297181895815543e-06, - "loss": 1.0811, - "step": 720 - }, - { - "epoch": 0.02, - "learning_rate": 1.2314261315115287e-06, - "loss": 0.8799, - "step": 721 - }, - { - "epoch": 0.02, - "learning_rate": 1.233134073441503e-06, - "loss": 1.0508, - "step": 722 - }, - { - "epoch": 0.02, - "learning_rate": 1.2348420153714774e-06, - "loss": 1.0869, - "step": 723 - }, - { - "epoch": 0.02, - "learning_rate": 1.2365499573014518e-06, - "loss": 1.002, - "step": 724 - }, - { - "epoch": 0.02, - "learning_rate": 1.238257899231426e-06, - "loss": 1.0117, - "step": 725 - }, - { - "epoch": 0.02, - "learning_rate": 1.2399658411614005e-06, - "loss": 0.8574, - "step": 726 - }, - { - "epoch": 0.02, - "learning_rate": 1.2416737830913747e-06, - "loss": 1.3379, - "step": 727 - }, - { - "epoch": 0.02, - "learning_rate": 1.2433817250213492e-06, - "loss": 0.9717, - "step": 728 - }, - { - "epoch": 0.02, - "learning_rate": 1.2450896669513236e-06, - "loss": 0.8809, - "step": 729 - }, - { - "epoch": 0.02, - "learning_rate": 1.2467976088812978e-06, - "loss": 0.8301, - "step": 730 - }, - { - "epoch": 0.02, - "learning_rate": 1.2485055508112723e-06, - "loss": 0.7637, - "step": 731 - }, - { - "epoch": 0.02, - "learning_rate": 1.2502134927412467e-06, - "loss": 0.6958, - "step": 732 - }, - { - "epoch": 0.02, - "learning_rate": 1.251921434671221e-06, - "loss": 1.1045, - "step": 733 - }, - { - "epoch": 0.02, - "learning_rate": 1.2536293766011956e-06, - "loss": 0.8911, - "step": 734 - }, - { - "epoch": 0.02, - "learning_rate": 1.25533731853117e-06, - "loss": 0.8438, - "step": 735 - }, - { - "epoch": 0.02, - "learning_rate": 1.2570452604611443e-06, - "loss": 1.1592, - "step": 736 - }, - { - "epoch": 0.02, - "learning_rate": 1.2587532023911187e-06, - "loss": 0.8154, - "step": 737 - }, - { - "epoch": 0.02, - "learning_rate": 1.2604611443210932e-06, - "loss": 0.9756, - "step": 738 - }, - { - "epoch": 0.02, - "learning_rate": 1.2621690862510674e-06, - "loss": 1.0635, - "step": 739 - }, - { - "epoch": 0.02, - "learning_rate": 1.2638770281810418e-06, - "loss": 0.9199, - "step": 740 - }, - { - "epoch": 0.02, - "learning_rate": 1.265584970111016e-06, - "loss": 0.7734, - "step": 741 - }, - { - "epoch": 0.02, - "learning_rate": 1.2672929120409905e-06, - "loss": 1.0293, - "step": 742 - }, - { - "epoch": 0.02, - "learning_rate": 1.269000853970965e-06, - "loss": 0.9814, - "step": 743 - }, - { - "epoch": 0.02, - "learning_rate": 1.2707087959009392e-06, - "loss": 0.9409, - "step": 744 - }, - { - "epoch": 0.02, - "learning_rate": 1.2724167378309136e-06, - "loss": 0.998, - "step": 745 - }, - { - "epoch": 0.02, - "learning_rate": 1.274124679760888e-06, - "loss": 1.0283, - "step": 746 - }, - { - "epoch": 0.02, - "learning_rate": 1.2758326216908623e-06, - "loss": 1.1074, - "step": 747 - }, - { - "epoch": 0.02, - "learning_rate": 1.2775405636208367e-06, - "loss": 0.6064, - "step": 748 - }, - { - "epoch": 0.02, - "learning_rate": 1.2792485055508114e-06, - "loss": 0.8022, - "step": 749 - }, - { - "epoch": 0.02, - "learning_rate": 1.2809564474807856e-06, - "loss": 1.0547, - "step": 750 - }, - { - "epoch": 0.02, - "learning_rate": 1.28266438941076e-06, - "loss": 0.9316, - "step": 751 - }, - { - "epoch": 0.02, - "learning_rate": 1.2843723313407345e-06, - "loss": 1.085, - "step": 752 - }, - { - "epoch": 0.02, - "learning_rate": 1.2860802732707087e-06, - "loss": 0.8472, - "step": 753 - }, - { - "epoch": 0.02, - "learning_rate": 1.2877882152006832e-06, - "loss": 1.0645, - "step": 754 - }, - { - "epoch": 0.02, - "learning_rate": 1.2894961571306574e-06, - "loss": 1.0449, - "step": 755 - }, - { - "epoch": 0.02, - "learning_rate": 1.2912040990606319e-06, - "loss": 1.0264, - "step": 756 - }, - { - "epoch": 0.02, - "learning_rate": 1.2929120409906063e-06, - "loss": 1.0244, - "step": 757 - }, - { - "epoch": 0.02, - "learning_rate": 1.2946199829205805e-06, - "loss": 0.8545, - "step": 758 - }, - { - "epoch": 0.02, - "learning_rate": 1.296327924850555e-06, - "loss": 1.1943, - "step": 759 - }, - { - "epoch": 0.02, - "learning_rate": 1.2980358667805294e-06, - "loss": 0.998, - "step": 760 - }, - { - "epoch": 0.02, - "learning_rate": 1.2997438087105036e-06, - "loss": 0.9805, - "step": 761 - }, - { - "epoch": 0.02, - "learning_rate": 1.301451750640478e-06, - "loss": 1.1426, - "step": 762 - }, - { - "epoch": 0.02, - "learning_rate": 1.3031596925704525e-06, - "loss": 1.1133, - "step": 763 - }, - { - "epoch": 0.02, - "learning_rate": 1.304867634500427e-06, - "loss": 1.1699, - "step": 764 - }, - { - "epoch": 0.02, - "learning_rate": 1.3065755764304014e-06, - "loss": 0.9077, - "step": 765 - }, - { - "epoch": 0.02, - "learning_rate": 1.3082835183603758e-06, - "loss": 0.8193, - "step": 766 - }, - { - "epoch": 0.02, - "learning_rate": 1.30999146029035e-06, - "loss": 0.7754, - "step": 767 - }, - { - "epoch": 0.02, - "learning_rate": 1.3116994022203245e-06, - "loss": 1.376, - "step": 768 - }, - { - "epoch": 0.02, - "learning_rate": 1.313407344150299e-06, - "loss": 1.0488, - "step": 769 - }, - { - "epoch": 0.02, - "learning_rate": 1.3151152860802732e-06, - "loss": 1.043, - "step": 770 - }, - { - "epoch": 0.02, - "learning_rate": 1.3168232280102476e-06, - "loss": 0.9512, - "step": 771 - }, - { - "epoch": 0.02, - "learning_rate": 1.3185311699402219e-06, - "loss": 0.9775, - "step": 772 - }, - { - "epoch": 0.02, - "learning_rate": 1.3202391118701963e-06, - "loss": 1.0596, - "step": 773 - }, - { - "epoch": 0.02, - "learning_rate": 1.3219470538001707e-06, - "loss": 1.1182, - "step": 774 - }, - { - "epoch": 0.02, - "learning_rate": 1.323654995730145e-06, - "loss": 0.9014, - "step": 775 - }, - { - "epoch": 0.02, - "learning_rate": 1.3253629376601194e-06, - "loss": 1.0137, - "step": 776 - }, - { - "epoch": 0.02, - "learning_rate": 1.3270708795900939e-06, - "loss": 1.1074, - "step": 777 - }, - { - "epoch": 0.02, - "learning_rate": 1.328778821520068e-06, - "loss": 0.8018, - "step": 778 - }, - { - "epoch": 0.02, - "learning_rate": 1.3304867634500427e-06, - "loss": 1.0273, - "step": 779 - }, - { - "epoch": 0.02, - "learning_rate": 1.3321947053800172e-06, - "loss": 1.123, - "step": 780 - }, - { - "epoch": 0.02, - "learning_rate": 1.3339026473099914e-06, - "loss": 1.1133, - "step": 781 - }, - { - "epoch": 0.02, - "learning_rate": 1.3356105892399659e-06, - "loss": 1.0449, - "step": 782 - }, - { - "epoch": 0.02, - "learning_rate": 1.3373185311699403e-06, - "loss": 1.001, - "step": 783 - }, - { - "epoch": 0.02, - "learning_rate": 1.3390264730999145e-06, - "loss": 0.8457, - "step": 784 - }, - { - "epoch": 0.02, - "learning_rate": 1.340734415029889e-06, - "loss": 1.0039, - "step": 785 - }, - { - "epoch": 0.02, - "learning_rate": 1.3424423569598632e-06, - "loss": 0.959, - "step": 786 - }, - { - "epoch": 0.02, - "learning_rate": 1.3441502988898376e-06, - "loss": 1.0107, - "step": 787 - }, - { - "epoch": 0.02, - "learning_rate": 1.345858240819812e-06, - "loss": 0.8447, - "step": 788 - }, - { - "epoch": 0.02, - "learning_rate": 1.3475661827497863e-06, - "loss": 1.0781, - "step": 789 - }, - { - "epoch": 0.02, - "learning_rate": 1.3492741246797608e-06, - "loss": 0.9902, - "step": 790 - }, - { - "epoch": 0.02, - "learning_rate": 1.3509820666097352e-06, - "loss": 1.0771, - "step": 791 - }, - { - "epoch": 0.02, - "learning_rate": 1.3526900085397094e-06, - "loss": 1.0342, - "step": 792 - }, - { - "epoch": 0.02, - "learning_rate": 1.3543979504696839e-06, - "loss": 1.0869, - "step": 793 - }, - { - "epoch": 0.02, - "learning_rate": 1.3561058923996585e-06, - "loss": 0.9365, - "step": 794 - }, - { - "epoch": 0.02, - "learning_rate": 1.3578138343296328e-06, - "loss": 1.0195, - "step": 795 - }, - { - "epoch": 0.02, - "learning_rate": 1.3595217762596072e-06, - "loss": 1.04, - "step": 796 - }, - { - "epoch": 0.02, - "learning_rate": 1.3612297181895816e-06, - "loss": 0.9233, - "step": 797 - }, - { - "epoch": 0.02, - "learning_rate": 1.3629376601195559e-06, - "loss": 1.1133, - "step": 798 - }, - { - "epoch": 0.02, - "learning_rate": 1.3646456020495303e-06, - "loss": 0.9268, - "step": 799 - }, - { - "epoch": 0.02, - "learning_rate": 1.3663535439795045e-06, - "loss": 1.1152, - "step": 800 - }, - { - "epoch": 0.02, - "learning_rate": 1.368061485909479e-06, - "loss": 0.9072, - "step": 801 - }, - { - "epoch": 0.02, - "learning_rate": 1.3697694278394534e-06, - "loss": 0.9512, - "step": 802 - }, - { - "epoch": 0.02, - "learning_rate": 1.3714773697694277e-06, - "loss": 1.0371, - "step": 803 - }, - { - "epoch": 0.02, - "learning_rate": 1.3731853116994021e-06, - "loss": 0.8809, - "step": 804 - }, - { - "epoch": 0.02, - "learning_rate": 1.3748932536293765e-06, - "loss": 0.7393, - "step": 805 - }, - { - "epoch": 0.02, - "learning_rate": 1.3766011955593508e-06, - "loss": 1.1621, - "step": 806 - }, - { - "epoch": 0.02, - "learning_rate": 1.3783091374893252e-06, - "loss": 0.9854, - "step": 807 - }, - { - "epoch": 0.02, - "learning_rate": 1.3800170794192999e-06, - "loss": 0.728, - "step": 808 - }, - { - "epoch": 0.02, - "learning_rate": 1.381725021349274e-06, - "loss": 0.8242, - "step": 809 - }, - { - "epoch": 0.02, - "learning_rate": 1.3834329632792485e-06, - "loss": 0.8809, - "step": 810 - }, - { - "epoch": 0.02, - "learning_rate": 1.385140905209223e-06, - "loss": 0.834, - "step": 811 - }, - { - "epoch": 0.02, - "learning_rate": 1.3868488471391972e-06, - "loss": 0.8906, - "step": 812 - }, - { - "epoch": 0.02, - "learning_rate": 1.3885567890691717e-06, - "loss": 0.9229, - "step": 813 - }, - { - "epoch": 0.02, - "learning_rate": 1.3902647309991459e-06, - "loss": 0.9111, - "step": 814 - }, - { - "epoch": 0.02, - "learning_rate": 1.3919726729291203e-06, - "loss": 0.9824, - "step": 815 - }, - { - "epoch": 0.02, - "learning_rate": 1.3936806148590948e-06, - "loss": 1.04, - "step": 816 - }, - { - "epoch": 0.02, - "learning_rate": 1.395388556789069e-06, - "loss": 0.8945, - "step": 817 - }, - { - "epoch": 0.02, - "learning_rate": 1.3970964987190434e-06, - "loss": 1.0371, - "step": 818 - }, - { - "epoch": 0.02, - "learning_rate": 1.3988044406490179e-06, - "loss": 1.0391, - "step": 819 - }, - { - "epoch": 0.02, - "learning_rate": 1.4005123825789921e-06, - "loss": 0.9834, - "step": 820 - }, - { - "epoch": 0.02, - "learning_rate": 1.4022203245089666e-06, - "loss": 1.0117, - "step": 821 - }, - { - "epoch": 0.02, - "learning_rate": 1.403928266438941e-06, - "loss": 1.1016, - "step": 822 - }, - { - "epoch": 0.02, - "learning_rate": 1.4056362083689154e-06, - "loss": 0.9141, - "step": 823 - }, - { - "epoch": 0.02, - "learning_rate": 1.4073441502988899e-06, - "loss": 0.8418, - "step": 824 - }, - { - "epoch": 0.02, - "learning_rate": 1.4090520922288643e-06, - "loss": 0.8779, - "step": 825 - }, - { - "epoch": 0.02, - "learning_rate": 1.4107600341588386e-06, - "loss": 0.9258, - "step": 826 - }, - { - "epoch": 0.02, - "learning_rate": 1.412467976088813e-06, - "loss": 1.0723, - "step": 827 - }, - { - "epoch": 0.02, - "learning_rate": 1.4141759180187872e-06, - "loss": 1.0674, - "step": 828 - }, - { - "epoch": 0.02, - "learning_rate": 1.4158838599487617e-06, - "loss": 1.2344, - "step": 829 - }, - { - "epoch": 0.02, - "learning_rate": 1.4175918018787361e-06, - "loss": 0.8555, - "step": 830 - }, - { - "epoch": 0.02, - "learning_rate": 1.4192997438087103e-06, - "loss": 1.168, - "step": 831 - }, - { - "epoch": 0.02, - "learning_rate": 1.4210076857386848e-06, - "loss": 0.8145, - "step": 832 - }, - { - "epoch": 0.02, - "learning_rate": 1.4227156276686592e-06, - "loss": 1.208, - "step": 833 - }, - { - "epoch": 0.02, - "learning_rate": 1.4244235695986335e-06, - "loss": 0.9678, - "step": 834 - }, - { - "epoch": 0.02, - "learning_rate": 1.426131511528608e-06, - "loss": 1.0273, - "step": 835 - }, - { - "epoch": 0.02, - "learning_rate": 1.4278394534585823e-06, - "loss": 1.0703, - "step": 836 - }, - { - "epoch": 0.02, - "learning_rate": 1.4295473953885566e-06, - "loss": 1.1152, - "step": 837 - }, - { - "epoch": 0.02, - "learning_rate": 1.4312553373185312e-06, - "loss": 1.001, - "step": 838 - }, - { - "epoch": 0.02, - "learning_rate": 1.4329632792485057e-06, - "loss": 1.0566, - "step": 839 - }, - { - "epoch": 0.02, - "learning_rate": 1.43467122117848e-06, - "loss": 0.8623, - "step": 840 - }, - { - "epoch": 0.02, - "learning_rate": 1.4363791631084543e-06, - "loss": 0.9131, - "step": 841 - }, - { - "epoch": 0.02, - "learning_rate": 1.4380871050384286e-06, - "loss": 1.0273, - "step": 842 - }, - { - "epoch": 0.02, - "learning_rate": 1.439795046968403e-06, - "loss": 0.9912, - "step": 843 - }, - { - "epoch": 0.02, - "learning_rate": 1.4415029888983775e-06, - "loss": 1.0156, - "step": 844 - }, - { - "epoch": 0.02, - "learning_rate": 1.4432109308283517e-06, - "loss": 0.7725, - "step": 845 - }, - { - "epoch": 0.02, - "learning_rate": 1.4449188727583261e-06, - "loss": 0.9414, - "step": 846 - }, - { - "epoch": 0.02, - "learning_rate": 1.4466268146883006e-06, - "loss": 0.8857, - "step": 847 - }, - { - "epoch": 0.02, - "learning_rate": 1.4483347566182748e-06, - "loss": 0.7764, - "step": 848 - }, - { - "epoch": 0.02, - "learning_rate": 1.4500426985482492e-06, - "loss": 1.0166, - "step": 849 - }, - { - "epoch": 0.02, - "learning_rate": 1.4517506404782237e-06, - "loss": 0.8965, - "step": 850 - }, - { - "epoch": 0.02, - "learning_rate": 1.453458582408198e-06, - "loss": 0.9111, - "step": 851 - }, - { - "epoch": 0.02, - "learning_rate": 1.4551665243381724e-06, - "loss": 0.9004, - "step": 852 - }, - { - "epoch": 0.02, - "learning_rate": 1.456874466268147e-06, - "loss": 1.082, - "step": 853 - }, - { - "epoch": 0.02, - "learning_rate": 1.4585824081981212e-06, - "loss": 0.8086, - "step": 854 - }, - { - "epoch": 0.02, - "learning_rate": 1.4602903501280957e-06, - "loss": 0.9932, - "step": 855 - }, - { - "epoch": 0.02, - "learning_rate": 1.46199829205807e-06, - "loss": 0.9355, - "step": 856 - }, - { - "epoch": 0.02, - "learning_rate": 1.4637062339880444e-06, - "loss": 1.0879, - "step": 857 - }, - { - "epoch": 0.02, - "learning_rate": 1.4654141759180188e-06, - "loss": 1.082, - "step": 858 - }, - { - "epoch": 0.02, - "learning_rate": 1.467122117847993e-06, - "loss": 0.834, - "step": 859 - }, - { - "epoch": 0.02, - "learning_rate": 1.4688300597779675e-06, - "loss": 0.8706, - "step": 860 - }, - { - "epoch": 0.02, - "learning_rate": 1.470538001707942e-06, - "loss": 1.0312, - "step": 861 - }, - { - "epoch": 0.02, - "learning_rate": 1.4722459436379161e-06, - "loss": 0.9141, - "step": 862 - }, - { - "epoch": 0.02, - "learning_rate": 1.4739538855678906e-06, - "loss": 1.3086, - "step": 863 - }, - { - "epoch": 0.02, - "learning_rate": 1.475661827497865e-06, - "loss": 0.9463, - "step": 864 - }, - { - "epoch": 0.02, - "learning_rate": 1.4773697694278393e-06, - "loss": 1.0088, - "step": 865 - }, - { - "epoch": 0.02, - "learning_rate": 1.4790777113578137e-06, - "loss": 1.1201, - "step": 866 - }, - { - "epoch": 0.02, - "learning_rate": 1.480785653287788e-06, - "loss": 1.0791, - "step": 867 - }, - { - "epoch": 0.02, - "learning_rate": 1.4824935952177626e-06, - "loss": 0.8369, - "step": 868 - }, - { - "epoch": 0.02, - "learning_rate": 1.484201537147737e-06, - "loss": 0.9839, - "step": 869 - }, - { - "epoch": 0.02, - "learning_rate": 1.4859094790777113e-06, - "loss": 0.9873, - "step": 870 - }, - { - "epoch": 0.02, - "learning_rate": 1.4876174210076857e-06, - "loss": 0.9912, - "step": 871 - }, - { - "epoch": 0.02, - "learning_rate": 1.4893253629376601e-06, - "loss": 1.0078, - "step": 872 - }, - { - "epoch": 0.02, - "learning_rate": 1.4910333048676344e-06, - "loss": 0.9521, - "step": 873 - }, - { - "epoch": 0.02, - "learning_rate": 1.4927412467976088e-06, - "loss": 1.0254, - "step": 874 - }, - { - "epoch": 0.02, - "learning_rate": 1.4944491887275833e-06, - "loss": 1.04, - "step": 875 - }, - { - "epoch": 0.02, - "learning_rate": 1.4961571306575575e-06, - "loss": 0.8369, - "step": 876 - }, - { - "epoch": 0.02, - "learning_rate": 1.497865072587532e-06, - "loss": 1.1191, - "step": 877 - }, - { - "epoch": 0.02, - "learning_rate": 1.4995730145175064e-06, - "loss": 0.9336, - "step": 878 - }, - { - "epoch": 0.02, - "learning_rate": 1.5012809564474806e-06, - "loss": 0.957, - "step": 879 - }, - { - "epoch": 0.02, - "learning_rate": 1.502988898377455e-06, - "loss": 0.8203, - "step": 880 - }, - { - "epoch": 0.02, - "learning_rate": 1.5046968403074293e-06, - "loss": 0.9077, - "step": 881 - }, - { - "epoch": 0.02, - "learning_rate": 1.506404782237404e-06, - "loss": 1.0049, - "step": 882 - }, - { - "epoch": 0.02, - "learning_rate": 1.5081127241673784e-06, - "loss": 1.0254, - "step": 883 - }, - { - "epoch": 0.02, - "learning_rate": 1.5098206660973526e-06, - "loss": 1.085, - "step": 884 - }, - { - "epoch": 0.02, - "learning_rate": 1.511528608027327e-06, - "loss": 0.8916, - "step": 885 - }, - { - "epoch": 0.02, - "learning_rate": 1.5132365499573015e-06, - "loss": 1.1279, - "step": 886 - }, - { - "epoch": 0.02, - "learning_rate": 1.5149444918872757e-06, - "loss": 1.1855, - "step": 887 - }, - { - "epoch": 0.02, - "learning_rate": 1.5166524338172502e-06, - "loss": 1.0742, - "step": 888 - }, - { - "epoch": 0.02, - "learning_rate": 1.5183603757472246e-06, - "loss": 1.0605, - "step": 889 - }, - { - "epoch": 0.02, - "learning_rate": 1.5200683176771988e-06, - "loss": 0.9053, - "step": 890 - }, - { - "epoch": 0.02, - "learning_rate": 1.5217762596071733e-06, - "loss": 1.0137, - "step": 891 - }, - { - "epoch": 0.02, - "learning_rate": 1.5234842015371477e-06, - "loss": 0.8271, - "step": 892 - }, - { - "epoch": 0.02, - "learning_rate": 1.525192143467122e-06, - "loss": 0.9521, - "step": 893 - }, - { - "epoch": 0.02, - "learning_rate": 1.5269000853970964e-06, - "loss": 1.1836, - "step": 894 - }, - { - "epoch": 0.02, - "learning_rate": 1.5286080273270708e-06, - "loss": 1.1328, - "step": 895 - }, - { - "epoch": 0.02, - "learning_rate": 1.530315969257045e-06, - "loss": 1.1211, - "step": 896 - }, - { - "epoch": 0.02, - "learning_rate": 1.5320239111870197e-06, - "loss": 0.8066, - "step": 897 - }, - { - "epoch": 0.02, - "learning_rate": 1.533731853116994e-06, - "loss": 1.124, - "step": 898 - }, - { - "epoch": 0.02, - "learning_rate": 1.5354397950469684e-06, - "loss": 0.9336, - "step": 899 - }, - { - "epoch": 0.02, - "learning_rate": 1.5371477369769428e-06, - "loss": 1.0684, - "step": 900 - }, - { - "epoch": 0.02, - "learning_rate": 1.538855678906917e-06, - "loss": 0.8394, - "step": 901 - }, - { - "epoch": 0.02, - "learning_rate": 1.5405636208368915e-06, - "loss": 0.7148, - "step": 902 - }, - { - "epoch": 0.02, - "learning_rate": 1.542271562766866e-06, - "loss": 0.8916, - "step": 903 - }, - { - "epoch": 0.02, - "learning_rate": 1.5439795046968402e-06, - "loss": 0.8721, - "step": 904 - }, - { - "epoch": 0.02, - "learning_rate": 1.5456874466268146e-06, - "loss": 1.0615, - "step": 905 - }, - { - "epoch": 0.02, - "learning_rate": 1.547395388556789e-06, - "loss": 1.0742, - "step": 906 - }, - { - "epoch": 0.02, - "learning_rate": 1.5491033304867633e-06, - "loss": 1.106, - "step": 907 - }, - { - "epoch": 0.02, - "learning_rate": 1.5508112724167377e-06, - "loss": 0.6533, - "step": 908 - }, - { - "epoch": 0.02, - "learning_rate": 1.5525192143467122e-06, - "loss": 0.8271, - "step": 909 - }, - { - "epoch": 0.02, - "learning_rate": 1.5542271562766864e-06, - "loss": 0.957, - "step": 910 - }, - { - "epoch": 0.02, - "learning_rate": 1.5559350982066608e-06, - "loss": 0.939, - "step": 911 - }, - { - "epoch": 0.02, - "learning_rate": 1.5576430401366353e-06, - "loss": 1.1309, - "step": 912 - }, - { - "epoch": 0.02, - "learning_rate": 1.5593509820666097e-06, - "loss": 0.9258, - "step": 913 - }, - { - "epoch": 0.02, - "learning_rate": 1.5610589239965842e-06, - "loss": 0.8096, - "step": 914 - }, - { - "epoch": 0.02, - "learning_rate": 1.5627668659265584e-06, - "loss": 0.9619, - "step": 915 - }, - { - "epoch": 0.02, - "learning_rate": 1.5644748078565328e-06, - "loss": 0.9287, - "step": 916 - }, - { - "epoch": 0.02, - "learning_rate": 1.5661827497865073e-06, - "loss": 0.8394, - "step": 917 - }, - { - "epoch": 0.02, - "learning_rate": 1.5678906917164815e-06, - "loss": 1.0352, - "step": 918 - }, - { - "epoch": 0.02, - "learning_rate": 1.569598633646456e-06, - "loss": 0.7988, - "step": 919 - }, - { - "epoch": 0.02, - "learning_rate": 1.5713065755764304e-06, - "loss": 1.0566, - "step": 920 - }, - { - "epoch": 0.02, - "learning_rate": 1.5730145175064046e-06, - "loss": 0.9941, - "step": 921 - }, - { - "epoch": 0.02, - "learning_rate": 1.574722459436379e-06, - "loss": 0.9443, - "step": 922 - }, - { - "epoch": 0.02, - "learning_rate": 1.5764304013663535e-06, - "loss": 1.1211, - "step": 923 - }, - { - "epoch": 0.02, - "learning_rate": 1.5781383432963277e-06, - "loss": 0.8564, - "step": 924 - }, - { - "epoch": 0.02, - "learning_rate": 1.5798462852263022e-06, - "loss": 1.1045, - "step": 925 - }, - { - "epoch": 0.02, - "learning_rate": 1.5815542271562764e-06, - "loss": 0.8726, - "step": 926 - }, - { - "epoch": 0.02, - "learning_rate": 1.583262169086251e-06, - "loss": 1.0859, - "step": 927 - }, - { - "epoch": 0.02, - "learning_rate": 1.5849701110162255e-06, - "loss": 1.3301, - "step": 928 - }, - { - "epoch": 0.02, - "learning_rate": 1.5866780529461997e-06, - "loss": 1.2305, - "step": 929 - }, - { - "epoch": 0.02, - "learning_rate": 1.5883859948761742e-06, - "loss": 0.9453, - "step": 930 - }, - { - "epoch": 0.02, - "learning_rate": 1.5900939368061486e-06, - "loss": 1.1299, - "step": 931 - }, - { - "epoch": 0.02, - "learning_rate": 1.5918018787361229e-06, - "loss": 0.8857, - "step": 932 - }, - { - "epoch": 0.02, - "learning_rate": 1.5935098206660973e-06, - "loss": 0.9326, - "step": 933 - }, - { - "epoch": 0.02, - "learning_rate": 1.5952177625960717e-06, - "loss": 0.8394, - "step": 934 - }, - { - "epoch": 0.02, - "learning_rate": 1.596925704526046e-06, - "loss": 1.1836, - "step": 935 - }, - { - "epoch": 0.02, - "learning_rate": 1.5986336464560204e-06, - "loss": 1.0166, - "step": 936 - }, - { - "epoch": 0.02, - "learning_rate": 1.6003415883859949e-06, - "loss": 1.0518, - "step": 937 - }, - { - "epoch": 0.02, - "learning_rate": 1.602049530315969e-06, - "loss": 0.9209, - "step": 938 - }, - { - "epoch": 0.02, - "learning_rate": 1.6037574722459435e-06, - "loss": 0.8721, - "step": 939 - }, - { - "epoch": 0.02, - "learning_rate": 1.6054654141759178e-06, - "loss": 1.1602, - "step": 940 - }, - { - "epoch": 0.02, - "learning_rate": 1.6071733561058922e-06, - "loss": 1.0078, - "step": 941 - }, - { - "epoch": 0.02, - "learning_rate": 1.6088812980358669e-06, - "loss": 0.8848, - "step": 942 - }, - { - "epoch": 0.02, - "learning_rate": 1.610589239965841e-06, - "loss": 0.833, - "step": 943 - }, - { - "epoch": 0.02, - "learning_rate": 1.6122971818958155e-06, - "loss": 0.8809, - "step": 944 - }, - { - "epoch": 0.02, - "learning_rate": 1.61400512382579e-06, - "loss": 0.9521, - "step": 945 - }, - { - "epoch": 0.02, - "learning_rate": 1.6157130657557642e-06, - "loss": 0.8433, - "step": 946 - }, - { - "epoch": 0.02, - "learning_rate": 1.6174210076857386e-06, - "loss": 0.6768, - "step": 947 - }, - { - "epoch": 0.02, - "learning_rate": 1.619128949615713e-06, - "loss": 0.9404, - "step": 948 - }, - { - "epoch": 0.02, - "learning_rate": 1.6208368915456873e-06, - "loss": 0.8823, - "step": 949 - }, - { - "epoch": 0.02, - "learning_rate": 1.6225448334756618e-06, - "loss": 0.9521, - "step": 950 - }, - { - "epoch": 0.02, - "learning_rate": 1.6242527754056362e-06, - "loss": 1.1934, - "step": 951 - }, - { - "epoch": 0.02, - "learning_rate": 1.6259607173356104e-06, - "loss": 1.041, - "step": 952 - }, - { - "epoch": 0.02, - "learning_rate": 1.6276686592655849e-06, - "loss": 1.0215, - "step": 953 - }, - { - "epoch": 0.02, - "learning_rate": 1.629376601195559e-06, - "loss": 0.8281, - "step": 954 - }, - { - "epoch": 0.02, - "learning_rate": 1.6310845431255335e-06, - "loss": 1.0557, - "step": 955 - }, - { - "epoch": 0.02, - "learning_rate": 1.632792485055508e-06, - "loss": 1.2266, - "step": 956 - }, - { - "epoch": 0.02, - "learning_rate": 1.6345004269854824e-06, - "loss": 1.0703, - "step": 957 - }, - { - "epoch": 0.02, - "learning_rate": 1.6362083689154569e-06, - "loss": 0.8506, - "step": 958 - }, - { - "epoch": 0.02, - "learning_rate": 1.6379163108454313e-06, - "loss": 1.1279, - "step": 959 - }, - { - "epoch": 0.02, - "learning_rate": 1.6396242527754055e-06, - "loss": 0.9316, - "step": 960 - }, - { - "epoch": 0.02, - "learning_rate": 1.64133219470538e-06, - "loss": 1.0254, - "step": 961 - }, - { - "epoch": 0.02, - "learning_rate": 1.6430401366353544e-06, - "loss": 0.8682, - "step": 962 - }, - { - "epoch": 0.02, - "learning_rate": 1.6447480785653287e-06, - "loss": 1.1543, - "step": 963 - }, - { - "epoch": 0.02, - "learning_rate": 1.646456020495303e-06, - "loss": 0.8853, - "step": 964 - }, - { - "epoch": 0.02, - "learning_rate": 1.6481639624252775e-06, - "loss": 0.9795, - "step": 965 - }, - { - "epoch": 0.02, - "learning_rate": 1.6498719043552518e-06, - "loss": 1.0537, - "step": 966 - }, - { - "epoch": 0.02, - "learning_rate": 1.6515798462852262e-06, - "loss": 1.0938, - "step": 967 - }, - { - "epoch": 0.02, - "learning_rate": 1.6532877882152004e-06, - "loss": 1.0791, - "step": 968 - }, - { - "epoch": 0.02, - "learning_rate": 1.6549957301451749e-06, - "loss": 0.7156, - "step": 969 - }, - { - "epoch": 0.02, - "learning_rate": 1.6567036720751493e-06, - "loss": 1.0244, - "step": 970 - }, - { - "epoch": 0.02, - "learning_rate": 1.6584116140051238e-06, - "loss": 1.0127, - "step": 971 - }, - { - "epoch": 0.02, - "learning_rate": 1.6601195559350982e-06, - "loss": 0.958, - "step": 972 - }, - { - "epoch": 0.02, - "learning_rate": 1.6618274978650727e-06, - "loss": 1.126, - "step": 973 - }, - { - "epoch": 0.02, - "learning_rate": 1.6635354397950469e-06, - "loss": 1.1924, - "step": 974 - }, - { - "epoch": 0.02, - "learning_rate": 1.6652433817250213e-06, - "loss": 1.1172, - "step": 975 - }, - { - "epoch": 0.03, - "learning_rate": 1.6669513236549958e-06, - "loss": 0.9131, - "step": 976 - }, - { - "epoch": 0.03, - "learning_rate": 1.66865926558497e-06, - "loss": 0.9766, - "step": 977 - }, - { - "epoch": 0.03, - "learning_rate": 1.6703672075149444e-06, - "loss": 0.7871, - "step": 978 - }, - { - "epoch": 0.03, - "learning_rate": 1.6720751494449189e-06, - "loss": 1.085, - "step": 979 - }, - { - "epoch": 0.03, - "learning_rate": 1.6737830913748931e-06, - "loss": 0.9561, - "step": 980 - }, - { - "epoch": 0.03, - "learning_rate": 1.6754910333048676e-06, - "loss": 0.7715, - "step": 981 - }, - { - "epoch": 0.03, - "learning_rate": 1.6771989752348418e-06, - "loss": 0.8154, - "step": 982 - }, - { - "epoch": 0.03, - "learning_rate": 1.6789069171648162e-06, - "loss": 1.0205, - "step": 983 - }, - { - "epoch": 0.03, - "learning_rate": 1.6806148590947907e-06, - "loss": 1.1289, - "step": 984 - }, - { - "epoch": 0.03, - "learning_rate": 1.682322801024765e-06, - "loss": 1.0391, - "step": 985 - }, - { - "epoch": 0.03, - "learning_rate": 1.6840307429547396e-06, - "loss": 1.0186, - "step": 986 - }, - { - "epoch": 0.03, - "learning_rate": 1.685738684884714e-06, - "loss": 0.959, - "step": 987 - }, - { - "epoch": 0.03, - "learning_rate": 1.6874466268146882e-06, - "loss": 1.0381, - "step": 988 - }, - { - "epoch": 0.03, - "learning_rate": 1.6891545687446627e-06, - "loss": 0.9844, - "step": 989 - }, - { - "epoch": 0.03, - "learning_rate": 1.6908625106746371e-06, - "loss": 1.123, - "step": 990 - }, - { - "epoch": 0.03, - "learning_rate": 1.6925704526046113e-06, - "loss": 1.1426, - "step": 991 - }, - { - "epoch": 0.03, - "learning_rate": 1.6942783945345858e-06, - "loss": 0.9521, - "step": 992 - }, - { - "epoch": 0.03, - "learning_rate": 1.6959863364645602e-06, - "loss": 0.7764, - "step": 993 - }, - { - "epoch": 0.03, - "learning_rate": 1.6976942783945345e-06, - "loss": 1.0537, - "step": 994 - }, - { - "epoch": 0.03, - "learning_rate": 1.699402220324509e-06, - "loss": 1.1094, - "step": 995 - }, - { - "epoch": 0.03, - "learning_rate": 1.7011101622544831e-06, - "loss": 0.9736, - "step": 996 - }, - { - "epoch": 0.03, - "learning_rate": 1.7028181041844576e-06, - "loss": 0.9883, - "step": 997 - }, - { - "epoch": 0.03, - "learning_rate": 1.704526046114432e-06, - "loss": 0.999, - "step": 998 - }, - { - "epoch": 0.03, - "learning_rate": 1.7062339880444062e-06, - "loss": 0.9941, - "step": 999 - }, - { - "epoch": 0.03, - "learning_rate": 1.7079419299743807e-06, - "loss": 0.9629, - "step": 1000 - }, - { - "epoch": 0.03, - "learning_rate": 1.7096498719043553e-06, - "loss": 0.9141, - "step": 1001 - }, - { - "epoch": 0.03, - "learning_rate": 1.7113578138343296e-06, - "loss": 0.759, - "step": 1002 - }, - { - "epoch": 0.03, - "learning_rate": 1.713065755764304e-06, - "loss": 1.0723, - "step": 1003 - }, - { - "epoch": 0.03, - "learning_rate": 1.7147736976942785e-06, - "loss": 0.8672, - "step": 1004 - }, - { - "epoch": 0.03, - "learning_rate": 1.7164816396242527e-06, - "loss": 1.1592, - "step": 1005 - }, - { - "epoch": 0.03, - "learning_rate": 1.7181895815542271e-06, - "loss": 1.0557, - "step": 1006 - }, - { - "epoch": 0.03, - "learning_rate": 1.7198975234842016e-06, - "loss": 0.8232, - "step": 1007 - }, - { - "epoch": 0.03, - "learning_rate": 1.7216054654141758e-06, - "loss": 0.8516, - "step": 1008 - }, - { - "epoch": 0.03, - "learning_rate": 1.7233134073441502e-06, - "loss": 0.8926, - "step": 1009 - }, - { - "epoch": 0.03, - "learning_rate": 1.7250213492741245e-06, - "loss": 0.8789, - "step": 1010 - }, - { - "epoch": 0.03, - "learning_rate": 1.726729291204099e-06, - "loss": 1.1182, - "step": 1011 - }, - { - "epoch": 0.03, - "learning_rate": 1.7284372331340734e-06, - "loss": 0.8672, - "step": 1012 - }, - { - "epoch": 0.03, - "learning_rate": 1.7301451750640476e-06, - "loss": 1.0625, - "step": 1013 - }, - { - "epoch": 0.03, - "learning_rate": 1.731853116994022e-06, - "loss": 1.0449, - "step": 1014 - }, - { - "epoch": 0.03, - "learning_rate": 1.7335610589239965e-06, - "loss": 0.8184, - "step": 1015 - }, - { - "epoch": 0.03, - "learning_rate": 1.735269000853971e-06, - "loss": 1.082, - "step": 1016 - }, - { - "epoch": 0.03, - "learning_rate": 1.7369769427839454e-06, - "loss": 1.1465, - "step": 1017 - }, - { - "epoch": 0.03, - "learning_rate": 1.7386848847139198e-06, - "loss": 0.6377, - "step": 1018 - }, - { - "epoch": 0.03, - "learning_rate": 1.740392826643894e-06, - "loss": 0.915, - "step": 1019 - }, - { - "epoch": 0.03, - "learning_rate": 1.7421007685738685e-06, - "loss": 1.0547, - "step": 1020 - }, - { - "epoch": 0.03, - "learning_rate": 1.743808710503843e-06, - "loss": 1.2793, - "step": 1021 - }, - { - "epoch": 0.03, - "learning_rate": 1.7455166524338171e-06, - "loss": 0.8604, - "step": 1022 - }, - { - "epoch": 0.03, - "learning_rate": 1.7472245943637916e-06, - "loss": 0.9111, - "step": 1023 - }, - { - "epoch": 0.03, - "learning_rate": 1.7489325362937658e-06, - "loss": 0.9062, - "step": 1024 - }, - { - "epoch": 0.03, - "learning_rate": 1.7506404782237403e-06, - "loss": 1.0752, - "step": 1025 - }, - { - "epoch": 0.03, - "learning_rate": 1.7523484201537147e-06, - "loss": 1.123, - "step": 1026 - }, - { - "epoch": 0.03, - "learning_rate": 1.754056362083689e-06, - "loss": 1.0762, - "step": 1027 - }, - { - "epoch": 0.03, - "learning_rate": 1.7557643040136634e-06, - "loss": 0.8467, - "step": 1028 - }, - { - "epoch": 0.03, - "learning_rate": 1.7574722459436378e-06, - "loss": 1.0283, - "step": 1029 - }, - { - "epoch": 0.03, - "learning_rate": 1.759180187873612e-06, - "loss": 0.9092, - "step": 1030 - }, - { - "epoch": 0.03, - "learning_rate": 1.7608881298035867e-06, - "loss": 0.8926, - "step": 1031 - }, - { - "epoch": 0.03, - "learning_rate": 1.7625960717335611e-06, - "loss": 0.9033, - "step": 1032 - }, - { - "epoch": 0.03, - "learning_rate": 1.7643040136635354e-06, - "loss": 0.8647, - "step": 1033 - }, - { - "epoch": 0.03, - "learning_rate": 1.7660119555935098e-06, - "loss": 1.1143, - "step": 1034 - }, - { - "epoch": 0.03, - "learning_rate": 1.7677198975234843e-06, - "loss": 0.9775, - "step": 1035 - }, - { - "epoch": 0.03, - "learning_rate": 1.7694278394534585e-06, - "loss": 0.9717, - "step": 1036 - }, - { - "epoch": 0.03, - "learning_rate": 1.771135781383433e-06, - "loss": 0.9805, - "step": 1037 - }, - { - "epoch": 0.03, - "learning_rate": 1.7728437233134072e-06, - "loss": 0.8062, - "step": 1038 - }, - { - "epoch": 0.03, - "learning_rate": 1.7745516652433816e-06, - "loss": 0.7954, - "step": 1039 - }, - { - "epoch": 0.03, - "learning_rate": 1.776259607173356e-06, - "loss": 0.9238, - "step": 1040 - }, - { - "epoch": 0.03, - "learning_rate": 1.7779675491033303e-06, - "loss": 0.9883, - "step": 1041 - }, - { - "epoch": 0.03, - "learning_rate": 1.7796754910333047e-06, - "loss": 1.0879, - "step": 1042 - }, - { - "epoch": 0.03, - "learning_rate": 1.7813834329632792e-06, - "loss": 1.127, - "step": 1043 - }, - { - "epoch": 0.03, - "learning_rate": 1.7830913748932534e-06, - "loss": 0.8008, - "step": 1044 - }, - { - "epoch": 0.03, - "learning_rate": 1.7847993168232278e-06, - "loss": 0.9463, - "step": 1045 - }, - { - "epoch": 0.03, - "learning_rate": 1.7865072587532025e-06, - "loss": 0.96, - "step": 1046 - }, - { - "epoch": 0.03, - "learning_rate": 1.7882152006831767e-06, - "loss": 1.0117, - "step": 1047 - }, - { - "epoch": 0.03, - "learning_rate": 1.7899231426131512e-06, - "loss": 0.8945, - "step": 1048 - }, - { - "epoch": 0.03, - "learning_rate": 1.7916310845431256e-06, - "loss": 0.7495, - "step": 1049 - }, - { - "epoch": 0.03, - "learning_rate": 1.7933390264730998e-06, - "loss": 1.0996, - "step": 1050 - }, - { - "epoch": 0.03, - "learning_rate": 1.7950469684030743e-06, - "loss": 1.1709, - "step": 1051 - }, - { - "epoch": 0.03, - "learning_rate": 1.7967549103330485e-06, - "loss": 1.0645, - "step": 1052 - }, - { - "epoch": 0.03, - "learning_rate": 1.798462852263023e-06, - "loss": 0.9971, - "step": 1053 - }, - { - "epoch": 0.03, - "learning_rate": 1.8001707941929974e-06, - "loss": 1.0469, - "step": 1054 - }, - { - "epoch": 0.03, - "learning_rate": 1.8018787361229716e-06, - "loss": 0.937, - "step": 1055 - }, - { - "epoch": 0.03, - "learning_rate": 1.803586678052946e-06, - "loss": 0.8828, - "step": 1056 - }, - { - "epoch": 0.03, - "learning_rate": 1.8052946199829205e-06, - "loss": 0.9277, - "step": 1057 - }, - { - "epoch": 0.03, - "learning_rate": 1.8070025619128947e-06, - "loss": 0.9805, - "step": 1058 - }, - { - "epoch": 0.03, - "learning_rate": 1.8087105038428692e-06, - "loss": 0.9165, - "step": 1059 - }, - { - "epoch": 0.03, - "learning_rate": 1.8104184457728438e-06, - "loss": 0.9912, - "step": 1060 - }, - { - "epoch": 0.03, - "learning_rate": 1.812126387702818e-06, - "loss": 0.7705, - "step": 1061 - }, - { - "epoch": 0.03, - "learning_rate": 1.8138343296327925e-06, - "loss": 0.8242, - "step": 1062 - }, - { - "epoch": 0.03, - "learning_rate": 1.815542271562767e-06, - "loss": 0.8877, - "step": 1063 - }, - { - "epoch": 0.03, - "learning_rate": 1.8172502134927412e-06, - "loss": 0.7451, - "step": 1064 - }, - { - "epoch": 0.03, - "learning_rate": 1.8189581554227156e-06, - "loss": 0.8818, - "step": 1065 - }, - { - "epoch": 0.03, - "learning_rate": 1.8206660973526898e-06, - "loss": 0.8135, - "step": 1066 - }, - { - "epoch": 0.03, - "learning_rate": 1.8223740392826643e-06, - "loss": 1.0557, - "step": 1067 - }, - { - "epoch": 0.03, - "learning_rate": 1.8240819812126387e-06, - "loss": 0.9028, - "step": 1068 - }, - { - "epoch": 0.03, - "learning_rate": 1.825789923142613e-06, - "loss": 0.6206, - "step": 1069 - }, - { - "epoch": 0.03, - "learning_rate": 1.8274978650725874e-06, - "loss": 1.1514, - "step": 1070 - }, - { - "epoch": 0.03, - "learning_rate": 1.8292058070025618e-06, - "loss": 0.9014, - "step": 1071 - }, - { - "epoch": 0.03, - "learning_rate": 1.830913748932536e-06, - "loss": 1.042, - "step": 1072 - }, - { - "epoch": 0.03, - "learning_rate": 1.8326216908625105e-06, - "loss": 0.9893, - "step": 1073 - }, - { - "epoch": 0.03, - "learning_rate": 1.834329632792485e-06, - "loss": 0.8906, - "step": 1074 - }, - { - "epoch": 0.03, - "learning_rate": 1.8360375747224594e-06, - "loss": 0.9561, - "step": 1075 - }, - { - "epoch": 0.03, - "learning_rate": 1.8377455166524338e-06, - "loss": 0.9414, - "step": 1076 - }, - { - "epoch": 0.03, - "learning_rate": 1.8394534585824083e-06, - "loss": 1.0771, - "step": 1077 - }, - { - "epoch": 0.03, - "learning_rate": 1.8411614005123825e-06, - "loss": 1.0557, - "step": 1078 - }, - { - "epoch": 0.03, - "learning_rate": 1.842869342442357e-06, - "loss": 1.0293, - "step": 1079 - }, - { - "epoch": 0.03, - "learning_rate": 1.8445772843723312e-06, - "loss": 0.9072, - "step": 1080 - }, - { - "epoch": 0.03, - "learning_rate": 1.8462852263023056e-06, - "loss": 1.0332, - "step": 1081 - }, - { - "epoch": 0.03, - "learning_rate": 1.84799316823228e-06, - "loss": 0.9111, - "step": 1082 - }, - { - "epoch": 0.03, - "learning_rate": 1.8497011101622543e-06, - "loss": 0.9839, - "step": 1083 - }, - { - "epoch": 0.03, - "learning_rate": 1.8514090520922287e-06, - "loss": 1.0654, - "step": 1084 - }, - { - "epoch": 0.03, - "learning_rate": 1.8531169940222032e-06, - "loss": 0.8013, - "step": 1085 - }, - { - "epoch": 0.03, - "learning_rate": 1.8548249359521774e-06, - "loss": 1.0381, - "step": 1086 - }, - { - "epoch": 0.03, - "learning_rate": 1.8565328778821519e-06, - "loss": 1.082, - "step": 1087 - }, - { - "epoch": 0.03, - "learning_rate": 1.8582408198121263e-06, - "loss": 0.9414, - "step": 1088 - }, - { - "epoch": 0.03, - "learning_rate": 1.8599487617421005e-06, - "loss": 1.0918, - "step": 1089 - }, - { - "epoch": 0.03, - "learning_rate": 1.8616567036720752e-06, - "loss": 0.8799, - "step": 1090 - }, - { - "epoch": 0.03, - "learning_rate": 1.8633646456020496e-06, - "loss": 0.9521, - "step": 1091 - }, - { - "epoch": 0.03, - "learning_rate": 1.8650725875320239e-06, - "loss": 1.0879, - "step": 1092 - }, - { - "epoch": 0.03, - "learning_rate": 1.8667805294619983e-06, - "loss": 1.041, - "step": 1093 - }, - { - "epoch": 0.03, - "learning_rate": 1.8684884713919725e-06, - "loss": 0.7607, - "step": 1094 - }, - { - "epoch": 0.03, - "learning_rate": 1.870196413321947e-06, - "loss": 0.9458, - "step": 1095 - }, - { - "epoch": 0.03, - "learning_rate": 1.8719043552519214e-06, - "loss": 1.0664, - "step": 1096 - }, - { - "epoch": 0.03, - "learning_rate": 1.8736122971818956e-06, - "loss": 1.0898, - "step": 1097 - }, - { - "epoch": 0.03, - "learning_rate": 1.87532023911187e-06, - "loss": 0.8857, - "step": 1098 - }, - { - "epoch": 0.03, - "learning_rate": 1.8770281810418445e-06, - "loss": 1.0527, - "step": 1099 - }, - { - "epoch": 0.03, - "learning_rate": 1.8787361229718188e-06, - "loss": 0.876, - "step": 1100 - }, - { - "epoch": 0.03, - "learning_rate": 1.8804440649017932e-06, - "loss": 1.0801, - "step": 1101 - }, - { - "epoch": 0.03, - "learning_rate": 1.8821520068317676e-06, - "loss": 0.8174, - "step": 1102 - }, - { - "epoch": 0.03, - "learning_rate": 1.8838599487617419e-06, - "loss": 0.9844, - "step": 1103 - }, - { - "epoch": 0.03, - "learning_rate": 1.8855678906917163e-06, - "loss": 1.2305, - "step": 1104 - }, - { - "epoch": 0.03, - "learning_rate": 1.887275832621691e-06, - "loss": 1.0312, - "step": 1105 - }, - { - "epoch": 0.03, - "learning_rate": 1.8889837745516652e-06, - "loss": 0.8306, - "step": 1106 - }, - { - "epoch": 0.03, - "learning_rate": 1.8906917164816396e-06, - "loss": 0.7549, - "step": 1107 - }, - { - "epoch": 0.03, - "learning_rate": 1.892399658411614e-06, - "loss": 0.9272, - "step": 1108 - }, - { - "epoch": 0.03, - "learning_rate": 1.8941076003415883e-06, - "loss": 0.8765, - "step": 1109 - }, - { - "epoch": 0.03, - "learning_rate": 1.8958155422715628e-06, - "loss": 1.0986, - "step": 1110 - }, - { - "epoch": 0.03, - "learning_rate": 1.897523484201537e-06, - "loss": 1.1367, - "step": 1111 - }, - { - "epoch": 0.03, - "learning_rate": 1.8992314261315114e-06, - "loss": 0.9619, - "step": 1112 - }, - { - "epoch": 0.03, - "learning_rate": 1.9009393680614859e-06, - "loss": 1.0088, - "step": 1113 - }, - { - "epoch": 0.03, - "learning_rate": 1.90264730999146e-06, - "loss": 1.0298, - "step": 1114 - }, - { - "epoch": 0.03, - "learning_rate": 1.9043552519214345e-06, - "loss": 0.9512, - "step": 1115 - }, - { - "epoch": 0.03, - "learning_rate": 1.906063193851409e-06, - "loss": 1.0615, - "step": 1116 - }, - { - "epoch": 0.03, - "learning_rate": 1.9077711357813834e-06, - "loss": 0.9092, - "step": 1117 - }, - { - "epoch": 0.03, - "learning_rate": 1.9094790777113577e-06, - "loss": 1.209, - "step": 1118 - }, - { - "epoch": 0.03, - "learning_rate": 1.911187019641332e-06, - "loss": 1.1641, - "step": 1119 - }, - { - "epoch": 0.03, - "learning_rate": 1.9128949615713065e-06, - "loss": 1.0791, - "step": 1120 - }, - { - "epoch": 0.03, - "learning_rate": 1.9146029035012808e-06, - "loss": 0.7524, - "step": 1121 - }, - { - "epoch": 0.03, - "learning_rate": 1.9163108454312554e-06, - "loss": 0.8574, - "step": 1122 - }, - { - "epoch": 0.03, - "learning_rate": 1.9180187873612297e-06, - "loss": 0.9902, - "step": 1123 - }, - { - "epoch": 0.03, - "learning_rate": 1.919726729291204e-06, - "loss": 1.2393, - "step": 1124 - }, - { - "epoch": 0.03, - "learning_rate": 1.9214346712211785e-06, - "loss": 0.958, - "step": 1125 - }, - { - "epoch": 0.03, - "learning_rate": 1.9231426131511528e-06, - "loss": 1.1992, - "step": 1126 - }, - { - "epoch": 0.03, - "learning_rate": 1.924850555081127e-06, - "loss": 0.9814, - "step": 1127 - }, - { - "epoch": 0.03, - "learning_rate": 1.9265584970111017e-06, - "loss": 1.0049, - "step": 1128 - }, - { - "epoch": 0.03, - "learning_rate": 1.928266438941076e-06, - "loss": 1.1299, - "step": 1129 - }, - { - "epoch": 0.03, - "learning_rate": 1.92997438087105e-06, - "loss": 0.8892, - "step": 1130 - }, - { - "epoch": 0.03, - "learning_rate": 1.9316823228010248e-06, - "loss": 0.9189, - "step": 1131 - }, - { - "epoch": 0.03, - "learning_rate": 1.933390264730999e-06, - "loss": 0.7764, - "step": 1132 - }, - { - "epoch": 0.03, - "learning_rate": 1.9350982066609732e-06, - "loss": 0.9619, - "step": 1133 - }, - { - "epoch": 0.03, - "learning_rate": 1.936806148590948e-06, - "loss": 0.9346, - "step": 1134 - }, - { - "epoch": 0.03, - "learning_rate": 1.938514090520922e-06, - "loss": 1.084, - "step": 1135 - }, - { - "epoch": 0.03, - "learning_rate": 1.9402220324508968e-06, - "loss": 0.9355, - "step": 1136 - }, - { - "epoch": 0.03, - "learning_rate": 1.941929974380871e-06, - "loss": 1.1738, - "step": 1137 - }, - { - "epoch": 0.03, - "learning_rate": 1.9436379163108452e-06, - "loss": 1.1045, - "step": 1138 - }, - { - "epoch": 0.03, - "learning_rate": 1.94534585824082e-06, - "loss": 0.9688, - "step": 1139 - }, - { - "epoch": 0.03, - "learning_rate": 1.947053800170794e-06, - "loss": 0.9932, - "step": 1140 - }, - { - "epoch": 0.03, - "learning_rate": 1.9487617421007683e-06, - "loss": 0.9414, - "step": 1141 - }, - { - "epoch": 0.03, - "learning_rate": 1.950469684030743e-06, - "loss": 1.0459, - "step": 1142 - }, - { - "epoch": 0.03, - "learning_rate": 1.9521776259607172e-06, - "loss": 1.126, - "step": 1143 - }, - { - "epoch": 0.03, - "learning_rate": 1.9538855678906915e-06, - "loss": 0.7808, - "step": 1144 - }, - { - "epoch": 0.03, - "learning_rate": 1.955593509820666e-06, - "loss": 0.916, - "step": 1145 - }, - { - "epoch": 0.03, - "learning_rate": 1.9573014517506403e-06, - "loss": 1.1494, - "step": 1146 - }, - { - "epoch": 0.03, - "learning_rate": 1.9590093936806146e-06, - "loss": 0.9453, - "step": 1147 - }, - { - "epoch": 0.03, - "learning_rate": 1.9607173356105892e-06, - "loss": 1.0137, - "step": 1148 - }, - { - "epoch": 0.03, - "learning_rate": 1.9624252775405635e-06, - "loss": 0.9766, - "step": 1149 - }, - { - "epoch": 0.03, - "learning_rate": 1.964133219470538e-06, - "loss": 1.1035, - "step": 1150 - }, - { - "epoch": 0.03, - "learning_rate": 1.9658411614005123e-06, - "loss": 1.1084, - "step": 1151 - }, - { - "epoch": 0.03, - "learning_rate": 1.9675491033304866e-06, - "loss": 0.9346, - "step": 1152 - }, - { - "epoch": 0.03, - "learning_rate": 1.9692570452604612e-06, - "loss": 1.0039, - "step": 1153 - }, - { - "epoch": 0.03, - "learning_rate": 1.9709649871904355e-06, - "loss": 1.1416, - "step": 1154 - }, - { - "epoch": 0.03, - "learning_rate": 1.9726729291204097e-06, - "loss": 0.957, - "step": 1155 - }, - { - "epoch": 0.03, - "learning_rate": 1.9743808710503843e-06, - "loss": 0.9189, - "step": 1156 - }, - { - "epoch": 0.03, - "learning_rate": 1.9760888129803586e-06, - "loss": 0.7988, - "step": 1157 - }, - { - "epoch": 0.03, - "learning_rate": 1.977796754910333e-06, - "loss": 0.9365, - "step": 1158 - }, - { - "epoch": 0.03, - "learning_rate": 1.9795046968403075e-06, - "loss": 0.6909, - "step": 1159 - }, - { - "epoch": 0.03, - "learning_rate": 1.9812126387702817e-06, - "loss": 1.2227, - "step": 1160 - }, - { - "epoch": 0.03, - "learning_rate": 1.982920580700256e-06, - "loss": 1.0127, - "step": 1161 - }, - { - "epoch": 0.03, - "learning_rate": 1.9846285226302306e-06, - "loss": 1.0625, - "step": 1162 - }, - { - "epoch": 0.03, - "learning_rate": 1.986336464560205e-06, - "loss": 1.0898, - "step": 1163 - }, - { - "epoch": 0.03, - "learning_rate": 1.9880444064901795e-06, - "loss": 0.9346, - "step": 1164 - }, - { - "epoch": 0.03, - "learning_rate": 1.9897523484201537e-06, - "loss": 0.9248, - "step": 1165 - }, - { - "epoch": 0.03, - "learning_rate": 1.991460290350128e-06, - "loss": 0.9502, - "step": 1166 - }, - { - "epoch": 0.03, - "learning_rate": 1.9931682322801026e-06, - "loss": 0.7476, - "step": 1167 - }, - { - "epoch": 0.03, - "learning_rate": 1.994876174210077e-06, - "loss": 1.0654, - "step": 1168 - }, - { - "epoch": 0.03, - "learning_rate": 1.996584116140051e-06, - "loss": 0.998, - "step": 1169 - }, - { - "epoch": 0.03, - "learning_rate": 1.9982920580700257e-06, - "loss": 1.2603, - "step": 1170 - }, - { - "epoch": 0.03, - "learning_rate": 2e-06, - "loss": 0.9443, - "step": 1171 - }, - { - "epoch": 0.03, - "learning_rate": 1.999999996554496e-06, - "loss": 0.918, - "step": 1172 - }, - { - "epoch": 0.03, - "learning_rate": 1.999999986217985e-06, - "loss": 0.9023, - "step": 1173 - }, - { - "epoch": 0.03, - "learning_rate": 1.999999968990466e-06, - "loss": 1.0205, - "step": 1174 - }, - { - "epoch": 0.03, - "learning_rate": 1.99999994487194e-06, - "loss": 0.7886, - "step": 1175 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999999138624065e-06, - "loss": 1.0078, - "step": 1176 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999998759618665e-06, - "loss": 0.9609, - "step": 1177 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999998311703195e-06, - "loss": 0.959, - "step": 1178 - }, - { - "epoch": 0.03, - "learning_rate": 1.999999779487766e-06, - "loss": 0.8906, - "step": 1179 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999997209142066e-06, - "loss": 1.1406, - "step": 1180 - }, - { - "epoch": 0.03, - "learning_rate": 1.999999655449642e-06, - "loss": 1.041, - "step": 1181 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999995830940713e-06, - "loss": 0.9463, - "step": 1182 - }, - { - "epoch": 0.03, - "learning_rate": 1.999999503847497e-06, - "loss": 0.8613, - "step": 1183 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999994177099176e-06, - "loss": 1.0049, - "step": 1184 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999993246813355e-06, - "loss": 0.9443, - "step": 1185 - }, - { - "epoch": 0.03, - "learning_rate": 1.99999922476175e-06, - "loss": 1.1504, - "step": 1186 - }, - { - "epoch": 0.03, - "learning_rate": 1.999999117951162e-06, - "loss": 0.9932, - "step": 1187 - }, - { - "epoch": 0.03, - "learning_rate": 1.999999004249573e-06, - "loss": 1.0068, - "step": 1188 - }, - { - "epoch": 0.03, - "learning_rate": 1.999998883656983e-06, - "loss": 1.0723, - "step": 1189 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999987561733936e-06, - "loss": 0.9795, - "step": 1190 - }, - { - "epoch": 0.03, - "learning_rate": 1.999998621798805e-06, - "loss": 1.0098, - "step": 1191 - }, - { - "epoch": 0.03, - "learning_rate": 1.999998480533218e-06, - "loss": 1.0654, - "step": 1192 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999983323766343e-06, - "loss": 0.7603, - "step": 1193 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999981773290545e-06, - "loss": 1.1143, - "step": 1194 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999980153904797e-06, - "loss": 0.8125, - "step": 1195 - }, - { - "epoch": 0.03, - "learning_rate": 1.999997846560911e-06, - "loss": 0.999, - "step": 1196 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999976708403496e-06, - "loss": 0.9111, - "step": 1197 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999974882287964e-06, - "loss": 1.0264, - "step": 1198 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999972987262533e-06, - "loss": 1.1074, - "step": 1199 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999971023327215e-06, - "loss": 1.0342, - "step": 1200 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999968990482015e-06, - "loss": 0.7637, - "step": 1201 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999966888726957e-06, - "loss": 1.0762, - "step": 1202 - }, - { - "epoch": 0.03, - "learning_rate": 1.999996471806205e-06, - "loss": 1.0103, - "step": 1203 - }, - { - "epoch": 0.03, - "learning_rate": 1.999996247848731e-06, - "loss": 0.9541, - "step": 1204 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999960170002755e-06, - "loss": 1.1533, - "step": 1205 - }, - { - "epoch": 0.03, - "learning_rate": 1.99999577926084e-06, - "loss": 0.6733, - "step": 1206 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999955346304255e-06, - "loss": 0.9844, - "step": 1207 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999952831090346e-06, - "loss": 0.7695, - "step": 1208 - }, - { - "epoch": 0.03, - "learning_rate": 1.999995024696669e-06, - "loss": 0.916, - "step": 1209 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999947593933296e-06, - "loss": 0.9863, - "step": 1210 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999944871990188e-06, - "loss": 0.9697, - "step": 1211 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999942081137384e-06, - "loss": 0.7896, - "step": 1212 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999939221374905e-06, - "loss": 1.0518, - "step": 1213 - }, - { - "epoch": 0.03, - "learning_rate": 1.999993629270277e-06, - "loss": 0.8398, - "step": 1214 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999933295120998e-06, - "loss": 0.894, - "step": 1215 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999930228629608e-06, - "loss": 0.6821, - "step": 1216 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999927093228627e-06, - "loss": 1.0898, - "step": 1217 - }, - { - "epoch": 0.03, - "learning_rate": 1.999992388891807e-06, - "loss": 1.0723, - "step": 1218 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999920615697963e-06, - "loss": 0.8779, - "step": 1219 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999917273568326e-06, - "loss": 0.877, - "step": 1220 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999913862529183e-06, - "loss": 1.0771, - "step": 1221 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999910382580564e-06, - "loss": 0.8574, - "step": 1222 - }, - { - "epoch": 0.03, - "learning_rate": 1.999990683372248e-06, - "loss": 0.9736, - "step": 1223 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999903215954966e-06, - "loss": 0.9453, - "step": 1224 - }, - { - "epoch": 0.03, - "learning_rate": 1.999989952927804e-06, - "loss": 0.8955, - "step": 1225 - }, - { - "epoch": 0.03, - "learning_rate": 1.999989577369174e-06, - "loss": 1.0928, - "step": 1226 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999891949196075e-06, - "loss": 0.9648, - "step": 1227 - }, - { - "epoch": 0.03, - "learning_rate": 1.999988805579108e-06, - "loss": 0.833, - "step": 1228 - }, - { - "epoch": 0.03, - "learning_rate": 1.999988409347678e-06, - "loss": 1.0234, - "step": 1229 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999880062253203e-06, - "loss": 0.8438, - "step": 1230 - }, - { - "epoch": 0.03, - "learning_rate": 1.999987596212038e-06, - "loss": 1.0664, - "step": 1231 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999871793078335e-06, - "loss": 0.8477, - "step": 1232 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999867555127097e-06, - "loss": 0.8809, - "step": 1233 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999863248266697e-06, - "loss": 1.1553, - "step": 1234 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999858872497164e-06, - "loss": 1.0635, - "step": 1235 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999854427818527e-06, - "loss": 0.8882, - "step": 1236 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999849914230817e-06, - "loss": 0.9727, - "step": 1237 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999845331734067e-06, - "loss": 1.084, - "step": 1238 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999840680328307e-06, - "loss": 1.1387, - "step": 1239 - }, - { - "epoch": 0.03, - "learning_rate": 1.999983596001357e-06, - "loss": 1.0928, - "step": 1240 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999831170789888e-06, - "loss": 1.1201, - "step": 1241 - }, - { - "epoch": 0.03, - "learning_rate": 1.999982631265729e-06, - "loss": 1.0059, - "step": 1242 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999821385615817e-06, - "loss": 0.7881, - "step": 1243 - }, - { - "epoch": 0.03, - "learning_rate": 1.99998163896655e-06, - "loss": 1.0986, - "step": 1244 - }, - { - "epoch": 0.03, - "learning_rate": 1.999981132480637e-06, - "loss": 0.9883, - "step": 1245 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999806191038467e-06, - "loss": 0.8926, - "step": 1246 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999800988361824e-06, - "loss": 1.0127, - "step": 1247 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999795716776476e-06, - "loss": 1.0391, - "step": 1248 - }, - { - "epoch": 0.03, - "learning_rate": 1.999979037628246e-06, - "loss": 0.9375, - "step": 1249 - }, - { - "epoch": 0.03, - "learning_rate": 1.999978496687981e-06, - "loss": 0.8613, - "step": 1250 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999779488568572e-06, - "loss": 0.7905, - "step": 1251 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999773941348776e-06, - "loss": 1.0049, - "step": 1252 - }, - { - "epoch": 0.03, - "learning_rate": 1.999976832522046e-06, - "loss": 1.0547, - "step": 1253 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999762640183664e-06, - "loss": 0.9321, - "step": 1254 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999756886238434e-06, - "loss": 1.0684, - "step": 1255 - }, - { - "epoch": 0.03, - "learning_rate": 1.99997510633848e-06, - "loss": 1.0352, - "step": 1256 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999745171622806e-06, - "loss": 1.0361, - "step": 1257 - }, - { - "epoch": 0.03, - "learning_rate": 1.999973921095249e-06, - "loss": 0.9629, - "step": 1258 - }, - { - "epoch": 0.03, - "learning_rate": 1.99997331813739e-06, - "loss": 0.96, - "step": 1259 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999727082887074e-06, - "loss": 0.9287, - "step": 1260 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999720915492047e-06, - "loss": 0.9653, - "step": 1261 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999714679188874e-06, - "loss": 0.8271, - "step": 1262 - }, - { - "epoch": 0.03, - "learning_rate": 1.999970837397759e-06, - "loss": 0.8311, - "step": 1263 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999701999858234e-06, - "loss": 1.1191, - "step": 1264 - }, - { - "epoch": 0.03, - "learning_rate": 1.999969555683086e-06, - "loss": 1.1191, - "step": 1265 - }, - { - "epoch": 0.03, - "learning_rate": 1.999968904489551e-06, - "loss": 1.0583, - "step": 1266 - }, - { - "epoch": 0.03, - "learning_rate": 1.999968246405223e-06, - "loss": 1.0273, - "step": 1267 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999675814301055e-06, - "loss": 0.769, - "step": 1268 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999669095642045e-06, - "loss": 0.7451, - "step": 1269 - }, - { - "epoch": 0.03, - "learning_rate": 1.999966230807524e-06, - "loss": 0.9219, - "step": 1270 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999655451600682e-06, - "loss": 1.041, - "step": 1271 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999648526218424e-06, - "loss": 1.1357, - "step": 1272 - }, - { - "epoch": 0.03, - "learning_rate": 1.999964153192851e-06, - "loss": 1.0693, - "step": 1273 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999634468730996e-06, - "loss": 0.6895, - "step": 1274 - }, - { - "epoch": 0.03, - "learning_rate": 1.999962733662592e-06, - "loss": 1.1719, - "step": 1275 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999620135613343e-06, - "loss": 1.0264, - "step": 1276 - }, - { - "epoch": 0.03, - "learning_rate": 1.99996128656933e-06, - "loss": 0.9707, - "step": 1277 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999605526865854e-06, - "loss": 1.2891, - "step": 1278 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999598119131052e-06, - "loss": 0.9844, - "step": 1279 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999590642488943e-06, - "loss": 0.8994, - "step": 1280 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999583096939578e-06, - "loss": 1.1836, - "step": 1281 - }, - { - "epoch": 0.03, - "learning_rate": 1.999957548248301e-06, - "loss": 0.9238, - "step": 1282 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999567799119296e-06, - "loss": 1.0645, - "step": 1283 - }, - { - "epoch": 0.03, - "learning_rate": 1.999956004684848e-06, - "loss": 0.9746, - "step": 1284 - }, - { - "epoch": 0.03, - "learning_rate": 1.999955222567062e-06, - "loss": 0.9033, - "step": 1285 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999544335585773e-06, - "loss": 0.9121, - "step": 1286 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999536376593992e-06, - "loss": 1.125, - "step": 1287 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999528348695324e-06, - "loss": 0.793, - "step": 1288 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999520251889835e-06, - "loss": 0.9561, - "step": 1289 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999512086177576e-06, - "loss": 0.9316, - "step": 1290 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999503851558602e-06, - "loss": 0.9229, - "step": 1291 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999495548032973e-06, - "loss": 0.9355, - "step": 1292 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999487175600744e-06, - "loss": 1.207, - "step": 1293 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999478734261974e-06, - "loss": 0.9131, - "step": 1294 - }, - { - "epoch": 0.03, - "learning_rate": 1.999947022401672e-06, - "loss": 0.7646, - "step": 1295 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999461644865042e-06, - "loss": 0.7559, - "step": 1296 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999452996806996e-06, - "loss": 1.0391, - "step": 1297 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999444279842646e-06, - "loss": 0.8662, - "step": 1298 - }, - { - "epoch": 0.03, - "learning_rate": 1.999943549397205e-06, - "loss": 0.9121, - "step": 1299 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999426639195267e-06, - "loss": 1.0693, - "step": 1300 - }, - { - "epoch": 0.03, - "learning_rate": 1.999941771551236e-06, - "loss": 0.8398, - "step": 1301 - }, - { - "epoch": 0.03, - "learning_rate": 1.999940872292339e-06, - "loss": 0.9824, - "step": 1302 - }, - { - "epoch": 0.03, - "learning_rate": 1.999939966142842e-06, - "loss": 1.1318, - "step": 1303 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999390531027512e-06, - "loss": 0.8726, - "step": 1304 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999381331720725e-06, - "loss": 1.002, - "step": 1305 - }, - { - "epoch": 0.03, - "learning_rate": 1.999937206350813e-06, - "loss": 0.8428, - "step": 1306 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999362726389783e-06, - "loss": 1.001, - "step": 1307 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999353320365753e-06, - "loss": 0.7402, - "step": 1308 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999343845436104e-06, - "loss": 0.9736, - "step": 1309 - }, - { - "epoch": 0.03, - "learning_rate": 1.99993343016009e-06, - "loss": 0.8823, - "step": 1310 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999324688860208e-06, - "loss": 0.9863, - "step": 1311 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999315007214095e-06, - "loss": 0.9883, - "step": 1312 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999305256662628e-06, - "loss": 1.1133, - "step": 1313 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999295437205873e-06, - "loss": 0.916, - "step": 1314 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999285548843898e-06, - "loss": 0.998, - "step": 1315 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999275591576767e-06, - "loss": 0.7402, - "step": 1316 - }, - { - "epoch": 0.03, - "learning_rate": 1.999926556540455e-06, - "loss": 1.0215, - "step": 1317 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999255470327325e-06, - "loss": 1.0527, - "step": 1318 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999245306345153e-06, - "loss": 0.7427, - "step": 1319 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999235073458105e-06, - "loss": 1.0127, - "step": 1320 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999224771666256e-06, - "loss": 1.1123, - "step": 1321 - }, - { - "epoch": 0.03, - "learning_rate": 1.999921440096967e-06, - "loss": 0.728, - "step": 1322 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999203961368424e-06, - "loss": 0.9824, - "step": 1323 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999193452862585e-06, - "loss": 0.6914, - "step": 1324 - }, - { - "epoch": 0.03, - "learning_rate": 1.999918287545223e-06, - "loss": 0.8369, - "step": 1325 - }, - { - "epoch": 0.03, - "learning_rate": 1.999917222913743e-06, - "loss": 1.0996, - "step": 1326 - }, - { - "epoch": 0.03, - "learning_rate": 1.999916151391826e-06, - "loss": 0.8389, - "step": 1327 - }, - { - "epoch": 0.03, - "learning_rate": 1.999915072979479e-06, - "loss": 0.9609, - "step": 1328 - }, - { - "epoch": 0.03, - "learning_rate": 1.99991398767671e-06, - "loss": 0.7471, - "step": 1329 - }, - { - "epoch": 0.03, - "learning_rate": 1.999912895483526e-06, - "loss": 1.0107, - "step": 1330 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999117963999348e-06, - "loss": 0.9326, - "step": 1331 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999106904259434e-06, - "loss": 0.876, - "step": 1332 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999095775615604e-06, - "loss": 1.207, - "step": 1333 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999084578067927e-06, - "loss": 0.9746, - "step": 1334 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999073311616483e-06, - "loss": 1.1729, - "step": 1335 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999061976261353e-06, - "loss": 1.0996, - "step": 1336 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999050572002603e-06, - "loss": 0.9258, - "step": 1337 - }, - { - "epoch": 0.03, - "learning_rate": 1.999903909884033e-06, - "loss": 0.9727, - "step": 1338 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999027556774595e-06, - "loss": 1.0723, - "step": 1339 - }, - { - "epoch": 0.03, - "learning_rate": 1.999901594580549e-06, - "loss": 0.7607, - "step": 1340 - }, - { - "epoch": 0.03, - "learning_rate": 1.9999004265933086e-06, - "loss": 0.9971, - "step": 1341 - }, - { - "epoch": 0.03, - "learning_rate": 1.9998992517157475e-06, - "loss": 0.916, - "step": 1342 - }, - { - "epoch": 0.03, - "learning_rate": 1.9998980699478724e-06, - "loss": 1.124, - "step": 1343 - }, - { - "epoch": 0.03, - "learning_rate": 1.9998968812896926e-06, - "loss": 0.6675, - "step": 1344 - }, - { - "epoch": 0.03, - "learning_rate": 1.9998956857412157e-06, - "loss": 0.9834, - "step": 1345 - }, - { - "epoch": 0.03, - "learning_rate": 1.99989448330245e-06, - "loss": 0.7178, - "step": 1346 - }, - { - "epoch": 0.03, - "learning_rate": 1.999893273973404e-06, - "loss": 0.8975, - "step": 1347 - }, - { - "epoch": 0.03, - "learning_rate": 1.999892057754086e-06, - "loss": 0.916, - "step": 1348 - }, - { - "epoch": 0.03, - "learning_rate": 1.999890834644504e-06, - "loss": 0.9346, - "step": 1349 - }, - { - "epoch": 0.03, - "learning_rate": 1.9998896046446667e-06, - "loss": 1.1758, - "step": 1350 - }, - { - "epoch": 0.03, - "learning_rate": 1.9998883677545826e-06, - "loss": 0.9658, - "step": 1351 - }, - { - "epoch": 0.03, - "learning_rate": 1.9998871239742604e-06, - "loss": 0.8965, - "step": 1352 - }, - { - "epoch": 0.03, - "learning_rate": 1.9998858733037083e-06, - "loss": 0.8799, - "step": 1353 - }, - { - "epoch": 0.03, - "learning_rate": 1.9998846157429355e-06, - "loss": 1.085, - "step": 1354 - }, - { - "epoch": 0.03, - "learning_rate": 1.9998833512919498e-06, - "loss": 0.9307, - "step": 1355 - }, - { - "epoch": 0.03, - "learning_rate": 1.9998820799507606e-06, - "loss": 0.8916, - "step": 1356 - }, - { - "epoch": 0.03, - "learning_rate": 1.9998808017193764e-06, - "loss": 1.0518, - "step": 1357 - }, - { - "epoch": 0.03, - "learning_rate": 1.9998795165978057e-06, - "loss": 1.1328, - "step": 1358 - }, - { - "epoch": 0.03, - "learning_rate": 1.999878224586058e-06, - "loss": 0.9863, - "step": 1359 - }, - { - "epoch": 0.03, - "learning_rate": 1.9998769256841423e-06, - "loss": 0.8193, - "step": 1360 - }, - { - "epoch": 0.03, - "learning_rate": 1.9998756198920666e-06, - "loss": 0.7339, - "step": 1361 - }, - { - "epoch": 0.03, - "learning_rate": 1.9998743072098403e-06, - "loss": 1.0117, - "step": 1362 - }, - { - "epoch": 0.03, - "learning_rate": 1.999872987637473e-06, - "loss": 0.7773, - "step": 1363 - }, - { - "epoch": 0.03, - "learning_rate": 1.9998716611749734e-06, - "loss": 1.0908, - "step": 1364 - }, - { - "epoch": 0.03, - "learning_rate": 1.9998703278223506e-06, - "loss": 1.0107, - "step": 1365 - }, - { - "epoch": 0.04, - "learning_rate": 1.9998689875796136e-06, - "loss": 0.8828, - "step": 1366 - }, - { - "epoch": 0.04, - "learning_rate": 1.9998676404467722e-06, - "loss": 0.8174, - "step": 1367 - }, - { - "epoch": 0.04, - "learning_rate": 1.9998662864238345e-06, - "loss": 1.1143, - "step": 1368 - }, - { - "epoch": 0.04, - "learning_rate": 1.9998649255108115e-06, - "loss": 0.9473, - "step": 1369 - }, - { - "epoch": 0.04, - "learning_rate": 1.9998635577077116e-06, - "loss": 0.9541, - "step": 1370 - }, - { - "epoch": 0.04, - "learning_rate": 1.9998621830145442e-06, - "loss": 1.043, - "step": 1371 - }, - { - "epoch": 0.04, - "learning_rate": 1.999860801431319e-06, - "loss": 1.0986, - "step": 1372 - }, - { - "epoch": 0.04, - "learning_rate": 1.9998594129580458e-06, - "loss": 1.0469, - "step": 1373 - }, - { - "epoch": 0.04, - "learning_rate": 1.9998580175947334e-06, - "loss": 1.0, - "step": 1374 - }, - { - "epoch": 0.04, - "learning_rate": 1.999856615341392e-06, - "loss": 1.0068, - "step": 1375 - }, - { - "epoch": 0.04, - "learning_rate": 1.9998552061980313e-06, - "loss": 0.8867, - "step": 1376 - }, - { - "epoch": 0.04, - "learning_rate": 1.9998537901646607e-06, - "loss": 0.9561, - "step": 1377 - }, - { - "epoch": 0.04, - "learning_rate": 1.99985236724129e-06, - "loss": 0.8076, - "step": 1378 - }, - { - "epoch": 0.04, - "learning_rate": 1.999850937427929e-06, - "loss": 0.8545, - "step": 1379 - }, - { - "epoch": 0.04, - "learning_rate": 1.999849500724588e-06, - "loss": 0.9077, - "step": 1380 - }, - { - "epoch": 0.04, - "learning_rate": 1.9998480571312758e-06, - "loss": 0.8906, - "step": 1381 - }, - { - "epoch": 0.04, - "learning_rate": 1.9998466066480037e-06, - "loss": 0.9248, - "step": 1382 - }, - { - "epoch": 0.04, - "learning_rate": 1.999845149274781e-06, - "loss": 0.9844, - "step": 1383 - }, - { - "epoch": 0.04, - "learning_rate": 1.9998436850116173e-06, - "loss": 0.7305, - "step": 1384 - }, - { - "epoch": 0.04, - "learning_rate": 1.999842213858524e-06, - "loss": 1.2217, - "step": 1385 - }, - { - "epoch": 0.04, - "learning_rate": 1.99984073581551e-06, - "loss": 0.5537, - "step": 1386 - }, - { - "epoch": 0.04, - "learning_rate": 1.999839250882586e-06, - "loss": 0.9404, - "step": 1387 - }, - { - "epoch": 0.04, - "learning_rate": 1.9998377590597626e-06, - "loss": 0.8486, - "step": 1388 - }, - { - "epoch": 0.04, - "learning_rate": 1.999836260347049e-06, - "loss": 0.833, - "step": 1389 - }, - { - "epoch": 0.04, - "learning_rate": 1.9998347547444564e-06, - "loss": 1.1914, - "step": 1390 - }, - { - "epoch": 0.04, - "learning_rate": 1.999833242251995e-06, - "loss": 0.9512, - "step": 1391 - }, - { - "epoch": 0.04, - "learning_rate": 1.999831722869675e-06, - "loss": 1.084, - "step": 1392 - }, - { - "epoch": 0.04, - "learning_rate": 1.9998301965975074e-06, - "loss": 0.9863, - "step": 1393 - }, - { - "epoch": 0.04, - "learning_rate": 1.999828663435502e-06, - "loss": 1.0908, - "step": 1394 - }, - { - "epoch": 0.04, - "learning_rate": 1.99982712338367e-06, - "loss": 1.0332, - "step": 1395 - }, - { - "epoch": 0.04, - "learning_rate": 1.9998255764420215e-06, - "loss": 0.877, - "step": 1396 - }, - { - "epoch": 0.04, - "learning_rate": 1.9998240226105676e-06, - "loss": 0.8955, - "step": 1397 - }, - { - "epoch": 0.04, - "learning_rate": 1.999822461889319e-06, - "loss": 1.0156, - "step": 1398 - }, - { - "epoch": 0.04, - "learning_rate": 1.999820894278286e-06, - "loss": 0.8506, - "step": 1399 - }, - { - "epoch": 0.04, - "learning_rate": 1.9998193197774795e-06, - "loss": 0.873, - "step": 1400 - }, - { - "epoch": 0.04, - "learning_rate": 1.9998177383869108e-06, - "loss": 0.9932, - "step": 1401 - }, - { - "epoch": 0.04, - "learning_rate": 1.9998161501065904e-06, - "loss": 1.0742, - "step": 1402 - }, - { - "epoch": 0.04, - "learning_rate": 1.999814554936529e-06, - "loss": 0.9756, - "step": 1403 - }, - { - "epoch": 0.04, - "learning_rate": 1.9998129528767387e-06, - "loss": 0.9453, - "step": 1404 - }, - { - "epoch": 0.04, - "learning_rate": 1.9998113439272297e-06, - "loss": 0.9238, - "step": 1405 - }, - { - "epoch": 0.04, - "learning_rate": 1.9998097280880123e-06, - "loss": 1.0498, - "step": 1406 - }, - { - "epoch": 0.04, - "learning_rate": 1.9998081053590996e-06, - "loss": 1.04, - "step": 1407 - }, - { - "epoch": 0.04, - "learning_rate": 1.999806475740501e-06, - "loss": 1.165, - "step": 1408 - }, - { - "epoch": 0.04, - "learning_rate": 1.9998048392322287e-06, - "loss": 0.9717, - "step": 1409 - }, - { - "epoch": 0.04, - "learning_rate": 1.9998031958342937e-06, - "loss": 0.9297, - "step": 1410 - }, - { - "epoch": 0.04, - "learning_rate": 1.999801545546707e-06, - "loss": 0.9258, - "step": 1411 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997998883694803e-06, - "loss": 1.0537, - "step": 1412 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997982243026256e-06, - "loss": 1.0371, - "step": 1413 - }, - { - "epoch": 0.04, - "learning_rate": 1.999796553346153e-06, - "loss": 1.0371, - "step": 1414 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997948755000756e-06, - "loss": 1.0049, - "step": 1415 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997931907644036e-06, - "loss": 0.9893, - "step": 1416 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997914991391494e-06, - "loss": 0.9556, - "step": 1417 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997898006243244e-06, - "loss": 1.1875, - "step": 1418 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997880952199406e-06, - "loss": 0.6499, - "step": 1419 - }, - { - "epoch": 0.04, - "learning_rate": 1.999786382926009e-06, - "loss": 0.7822, - "step": 1420 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997846637425424e-06, - "loss": 1.0264, - "step": 1421 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997829376695513e-06, - "loss": 0.8823, - "step": 1422 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997812047070492e-06, - "loss": 1.0352, - "step": 1423 - }, - { - "epoch": 0.04, - "learning_rate": 1.999779464855047e-06, - "loss": 0.7891, - "step": 1424 - }, - { - "epoch": 0.04, - "learning_rate": 1.999777718113557e-06, - "loss": 1.0459, - "step": 1425 - }, - { - "epoch": 0.04, - "learning_rate": 1.999775964482591e-06, - "loss": 0.8213, - "step": 1426 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997742039621613e-06, - "loss": 1.0518, - "step": 1427 - }, - { - "epoch": 0.04, - "learning_rate": 1.99977243655228e-06, - "loss": 1.042, - "step": 1428 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997706622529596e-06, - "loss": 0.6528, - "step": 1429 - }, - { - "epoch": 0.04, - "learning_rate": 1.999768881064212e-06, - "loss": 1.2793, - "step": 1430 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997670929860492e-06, - "loss": 1.0957, - "step": 1431 - }, - { - "epoch": 0.04, - "learning_rate": 1.999765298018484e-06, - "loss": 0.8369, - "step": 1432 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997634961615284e-06, - "loss": 1.1738, - "step": 1433 - }, - { - "epoch": 0.04, - "learning_rate": 1.999761687415195e-06, - "loss": 1.0186, - "step": 1434 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997598717794966e-06, - "loss": 1.1865, - "step": 1435 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997580492544454e-06, - "loss": 0.9385, - "step": 1436 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997562198400534e-06, - "loss": 1.0156, - "step": 1437 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997543835363338e-06, - "loss": 1.127, - "step": 1438 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997525403432996e-06, - "loss": 0.9453, - "step": 1439 - }, - { - "epoch": 0.04, - "learning_rate": 1.999750690260963e-06, - "loss": 1.0527, - "step": 1440 - }, - { - "epoch": 0.04, - "learning_rate": 1.999748833289337e-06, - "loss": 1.0205, - "step": 1441 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997469694284336e-06, - "loss": 1.3848, - "step": 1442 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997450986782667e-06, - "loss": 0.9551, - "step": 1443 - }, - { - "epoch": 0.04, - "learning_rate": 1.999743221038849e-06, - "loss": 1.127, - "step": 1444 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997413365101926e-06, - "loss": 0.9561, - "step": 1445 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997394450923117e-06, - "loss": 1.1621, - "step": 1446 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997375467852183e-06, - "loss": 0.9551, - "step": 1447 - }, - { - "epoch": 0.04, - "learning_rate": 1.999735641588926e-06, - "loss": 1.041, - "step": 1448 - }, - { - "epoch": 0.04, - "learning_rate": 1.999733729503448e-06, - "loss": 1.04, - "step": 1449 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997318105287972e-06, - "loss": 0.9551, - "step": 1450 - }, - { - "epoch": 0.04, - "learning_rate": 1.999729884664987e-06, - "loss": 0.7969, - "step": 1451 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997279519120304e-06, - "loss": 0.7788, - "step": 1452 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997260122699414e-06, - "loss": 1.0234, - "step": 1453 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997240657387326e-06, - "loss": 1.0186, - "step": 1454 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997221123184177e-06, - "loss": 0.9375, - "step": 1455 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997201520090102e-06, - "loss": 1.1514, - "step": 1456 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997181848105237e-06, - "loss": 0.9395, - "step": 1457 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997162107229717e-06, - "loss": 0.8613, - "step": 1458 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997142297463673e-06, - "loss": 0.9316, - "step": 1459 - }, - { - "epoch": 0.04, - "learning_rate": 1.999712241880725e-06, - "loss": 0.8242, - "step": 1460 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997102471260577e-06, - "loss": 1.0547, - "step": 1461 - }, - { - "epoch": 0.04, - "learning_rate": 1.99970824548238e-06, - "loss": 0.8408, - "step": 1462 - }, - { - "epoch": 0.04, - "learning_rate": 1.999706236949705e-06, - "loss": 0.8994, - "step": 1463 - }, - { - "epoch": 0.04, - "learning_rate": 1.9997042215280467e-06, - "loss": 0.7217, - "step": 1464 - }, - { - "epoch": 0.04, - "learning_rate": 1.999702199217419e-06, - "loss": 0.7227, - "step": 1465 - }, - { - "epoch": 0.04, - "learning_rate": 1.999700170017836e-06, - "loss": 0.7627, - "step": 1466 - }, - { - "epoch": 0.04, - "learning_rate": 1.9996981339293116e-06, - "loss": 0.9014, - "step": 1467 - }, - { - "epoch": 0.04, - "learning_rate": 1.9996960909518597e-06, - "loss": 1.0273, - "step": 1468 - }, - { - "epoch": 0.04, - "learning_rate": 1.999694041085495e-06, - "loss": 0.8245, - "step": 1469 - }, - { - "epoch": 0.04, - "learning_rate": 1.9996919843302304e-06, - "loss": 0.9795, - "step": 1470 - }, - { - "epoch": 0.04, - "learning_rate": 1.9996899206860814e-06, - "loss": 0.9043, - "step": 1471 - }, - { - "epoch": 0.04, - "learning_rate": 1.9996878501530613e-06, - "loss": 0.8486, - "step": 1472 - }, - { - "epoch": 0.04, - "learning_rate": 1.999685772731185e-06, - "loss": 0.8555, - "step": 1473 - }, - { - "epoch": 0.04, - "learning_rate": 1.9996836884204657e-06, - "loss": 0.8545, - "step": 1474 - }, - { - "epoch": 0.04, - "learning_rate": 1.999681597220919e-06, - "loss": 0.9551, - "step": 1475 - }, - { - "epoch": 0.04, - "learning_rate": 1.999679499132559e-06, - "loss": 0.8506, - "step": 1476 - }, - { - "epoch": 0.04, - "learning_rate": 1.9996773941554e-06, - "loss": 0.8989, - "step": 1477 - }, - { - "epoch": 0.04, - "learning_rate": 1.999675282289456e-06, - "loss": 0.8877, - "step": 1478 - }, - { - "epoch": 0.04, - "learning_rate": 1.9996731635347427e-06, - "loss": 0.6934, - "step": 1479 - }, - { - "epoch": 0.04, - "learning_rate": 1.999671037891274e-06, - "loss": 1.0088, - "step": 1480 - }, - { - "epoch": 0.04, - "learning_rate": 1.9996689053590643e-06, - "loss": 0.8633, - "step": 1481 - }, - { - "epoch": 0.04, - "learning_rate": 1.999666765938129e-06, - "loss": 0.8779, - "step": 1482 - }, - { - "epoch": 0.04, - "learning_rate": 1.999664619628482e-06, - "loss": 1.0723, - "step": 1483 - }, - { - "epoch": 0.04, - "learning_rate": 1.999662466430139e-06, - "loss": 1.0791, - "step": 1484 - }, - { - "epoch": 0.04, - "learning_rate": 1.9996603063431143e-06, - "loss": 1.0684, - "step": 1485 - }, - { - "epoch": 0.04, - "learning_rate": 1.999658139367423e-06, - "loss": 0.8223, - "step": 1486 - }, - { - "epoch": 0.04, - "learning_rate": 1.9996559655030795e-06, - "loss": 1.0176, - "step": 1487 - }, - { - "epoch": 0.04, - "learning_rate": 1.9996537847500995e-06, - "loss": 1.0225, - "step": 1488 - }, - { - "epoch": 0.04, - "learning_rate": 1.999651597108498e-06, - "loss": 0.9043, - "step": 1489 - }, - { - "epoch": 0.04, - "learning_rate": 1.999649402578289e-06, - "loss": 0.8159, - "step": 1490 - }, - { - "epoch": 0.04, - "learning_rate": 1.999647201159489e-06, - "loss": 1.0518, - "step": 1491 - }, - { - "epoch": 0.04, - "learning_rate": 1.9996449928521122e-06, - "loss": 1.0391, - "step": 1492 - }, - { - "epoch": 0.04, - "learning_rate": 1.9996427776561748e-06, - "loss": 1.0928, - "step": 1493 - }, - { - "epoch": 0.04, - "learning_rate": 1.999640555571691e-06, - "loss": 0.8594, - "step": 1494 - }, - { - "epoch": 0.04, - "learning_rate": 1.9996383265986763e-06, - "loss": 1.124, - "step": 1495 - }, - { - "epoch": 0.04, - "learning_rate": 1.9996360907371467e-06, - "loss": 1.0605, - "step": 1496 - }, - { - "epoch": 0.04, - "learning_rate": 1.9996338479871177e-06, - "loss": 0.8867, - "step": 1497 - }, - { - "epoch": 0.04, - "learning_rate": 1.999631598348604e-06, - "loss": 1.0967, - "step": 1498 - }, - { - "epoch": 0.04, - "learning_rate": 1.9996293418216206e-06, - "loss": 0.7886, - "step": 1499 - }, - { - "epoch": 0.04, - "learning_rate": 1.999627078406185e-06, - "loss": 1.166, - "step": 1500 - }, - { - "epoch": 0.04, - "learning_rate": 1.999624808102311e-06, - "loss": 1.1758, - "step": 1501 - }, - { - "epoch": 0.04, - "learning_rate": 1.999622530910015e-06, - "loss": 0.9106, - "step": 1502 - }, - { - "epoch": 0.04, - "learning_rate": 1.999620246829313e-06, - "loss": 0.8818, - "step": 1503 - }, - { - "epoch": 0.04, - "learning_rate": 1.99961795586022e-06, - "loss": 1.0947, - "step": 1504 - }, - { - "epoch": 0.04, - "learning_rate": 1.9996156580027517e-06, - "loss": 0.8105, - "step": 1505 - }, - { - "epoch": 0.04, - "learning_rate": 1.999613353256925e-06, - "loss": 1.0605, - "step": 1506 - }, - { - "epoch": 0.04, - "learning_rate": 1.9996110416227547e-06, - "loss": 0.8506, - "step": 1507 - }, - { - "epoch": 0.04, - "learning_rate": 1.9996087231002576e-06, - "loss": 0.877, - "step": 1508 - }, - { - "epoch": 0.04, - "learning_rate": 1.999606397689449e-06, - "loss": 0.958, - "step": 1509 - }, - { - "epoch": 0.04, - "learning_rate": 1.999604065390345e-06, - "loss": 0.959, - "step": 1510 - }, - { - "epoch": 0.04, - "learning_rate": 1.999601726202962e-06, - "loss": 0.9902, - "step": 1511 - }, - { - "epoch": 0.04, - "learning_rate": 1.999599380127316e-06, - "loss": 1.1445, - "step": 1512 - }, - { - "epoch": 0.04, - "learning_rate": 1.999597027163423e-06, - "loss": 0.915, - "step": 1513 - }, - { - "epoch": 0.04, - "learning_rate": 1.9995946673112996e-06, - "loss": 1.0547, - "step": 1514 - }, - { - "epoch": 0.04, - "learning_rate": 1.9995923005709615e-06, - "loss": 0.8569, - "step": 1515 - }, - { - "epoch": 0.04, - "learning_rate": 1.9995899269424253e-06, - "loss": 0.9375, - "step": 1516 - }, - { - "epoch": 0.04, - "learning_rate": 1.9995875464257076e-06, - "loss": 1.0537, - "step": 1517 - }, - { - "epoch": 0.04, - "learning_rate": 1.9995851590208242e-06, - "loss": 0.9463, - "step": 1518 - }, - { - "epoch": 0.04, - "learning_rate": 1.9995827647277923e-06, - "loss": 1.0273, - "step": 1519 - }, - { - "epoch": 0.04, - "learning_rate": 1.9995803635466275e-06, - "loss": 0.835, - "step": 1520 - }, - { - "epoch": 0.04, - "learning_rate": 1.9995779554773476e-06, - "loss": 1.1064, - "step": 1521 - }, - { - "epoch": 0.04, - "learning_rate": 1.9995755405199678e-06, - "loss": 0.9014, - "step": 1522 - }, - { - "epoch": 0.04, - "learning_rate": 1.999573118674506e-06, - "loss": 0.8662, - "step": 1523 - }, - { - "epoch": 0.04, - "learning_rate": 1.999570689940978e-06, - "loss": 1.1318, - "step": 1524 - }, - { - "epoch": 0.04, - "learning_rate": 1.9995682543194006e-06, - "loss": 0.8418, - "step": 1525 - }, - { - "epoch": 0.04, - "learning_rate": 1.999565811809791e-06, - "loss": 1.0977, - "step": 1526 - }, - { - "epoch": 0.04, - "learning_rate": 1.999563362412166e-06, - "loss": 0.9766, - "step": 1527 - }, - { - "epoch": 0.04, - "learning_rate": 1.999560906126542e-06, - "loss": 1.0645, - "step": 1528 - }, - { - "epoch": 0.04, - "learning_rate": 1.9995584429529363e-06, - "loss": 0.9307, - "step": 1529 - }, - { - "epoch": 0.04, - "learning_rate": 1.999555972891366e-06, - "loss": 0.9482, - "step": 1530 - }, - { - "epoch": 0.04, - "learning_rate": 1.999553495941848e-06, - "loss": 0.8428, - "step": 1531 - }, - { - "epoch": 0.04, - "learning_rate": 1.999551012104399e-06, - "loss": 1.1367, - "step": 1532 - }, - { - "epoch": 0.04, - "learning_rate": 1.9995485213790365e-06, - "loss": 0.9805, - "step": 1533 - }, - { - "epoch": 0.04, - "learning_rate": 1.9995460237657778e-06, - "loss": 0.9844, - "step": 1534 - }, - { - "epoch": 0.04, - "learning_rate": 1.99954351926464e-06, - "loss": 1.0449, - "step": 1535 - }, - { - "epoch": 0.04, - "learning_rate": 1.9995410078756397e-06, - "loss": 0.7256, - "step": 1536 - }, - { - "epoch": 0.04, - "learning_rate": 1.9995384895987954e-06, - "loss": 1.0244, - "step": 1537 - }, - { - "epoch": 0.04, - "learning_rate": 1.9995359644341235e-06, - "loss": 1.1416, - "step": 1538 - }, - { - "epoch": 0.04, - "learning_rate": 1.999533432381642e-06, - "loss": 0.9023, - "step": 1539 - }, - { - "epoch": 0.04, - "learning_rate": 1.9995308934413675e-06, - "loss": 0.9844, - "step": 1540 - }, - { - "epoch": 0.04, - "learning_rate": 1.9995283476133184e-06, - "loss": 0.9971, - "step": 1541 - }, - { - "epoch": 0.04, - "learning_rate": 1.999525794897512e-06, - "loss": 0.9946, - "step": 1542 - }, - { - "epoch": 0.04, - "learning_rate": 1.9995232352939655e-06, - "loss": 0.8398, - "step": 1543 - }, - { - "epoch": 0.04, - "learning_rate": 1.9995206688026972e-06, - "loss": 0.7612, - "step": 1544 - }, - { - "epoch": 0.04, - "learning_rate": 1.999518095423724e-06, - "loss": 1.0303, - "step": 1545 - }, - { - "epoch": 0.04, - "learning_rate": 1.9995155151570646e-06, - "loss": 1.043, - "step": 1546 - }, - { - "epoch": 0.04, - "learning_rate": 1.999512928002736e-06, - "loss": 0.7935, - "step": 1547 - }, - { - "epoch": 0.04, - "learning_rate": 1.9995103339607558e-06, - "loss": 0.9727, - "step": 1548 - }, - { - "epoch": 0.04, - "learning_rate": 1.999507733031143e-06, - "loss": 1.0918, - "step": 1549 - }, - { - "epoch": 0.04, - "learning_rate": 1.9995051252139147e-06, - "loss": 0.9775, - "step": 1550 - }, - { - "epoch": 0.04, - "learning_rate": 1.999502510509089e-06, - "loss": 1.0801, - "step": 1551 - }, - { - "epoch": 0.04, - "learning_rate": 1.9994998889166837e-06, - "loss": 0.9668, - "step": 1552 - }, - { - "epoch": 0.04, - "learning_rate": 1.9994972604367174e-06, - "loss": 0.8999, - "step": 1553 - }, - { - "epoch": 0.04, - "learning_rate": 1.9994946250692076e-06, - "loss": 1.0742, - "step": 1554 - }, - { - "epoch": 0.04, - "learning_rate": 1.999491982814173e-06, - "loss": 1.0664, - "step": 1555 - }, - { - "epoch": 0.04, - "learning_rate": 1.9994893336716317e-06, - "loss": 0.9912, - "step": 1556 - }, - { - "epoch": 0.04, - "learning_rate": 1.9994866776416016e-06, - "loss": 1.0098, - "step": 1557 - }, - { - "epoch": 0.04, - "learning_rate": 1.9994840147241013e-06, - "loss": 1.0605, - "step": 1558 - }, - { - "epoch": 0.04, - "learning_rate": 1.9994813449191495e-06, - "loss": 0.9033, - "step": 1559 - }, - { - "epoch": 0.04, - "learning_rate": 1.999478668226764e-06, - "loss": 1.2324, - "step": 1560 - }, - { - "epoch": 0.04, - "learning_rate": 1.999475984646963e-06, - "loss": 1.1172, - "step": 1561 - }, - { - "epoch": 0.04, - "learning_rate": 1.9994732941797658e-06, - "loss": 0.918, - "step": 1562 - }, - { - "epoch": 0.04, - "learning_rate": 1.9994705968251907e-06, - "loss": 0.7783, - "step": 1563 - }, - { - "epoch": 0.04, - "learning_rate": 1.9994678925832564e-06, - "loss": 1.1055, - "step": 1564 - }, - { - "epoch": 0.04, - "learning_rate": 1.9994651814539803e-06, - "loss": 0.8374, - "step": 1565 - }, - { - "epoch": 0.04, - "learning_rate": 1.999462463437383e-06, - "loss": 1.0898, - "step": 1566 - }, - { - "epoch": 0.04, - "learning_rate": 1.999459738533482e-06, - "loss": 1.1279, - "step": 1567 - }, - { - "epoch": 0.04, - "learning_rate": 1.9994570067422962e-06, - "loss": 1.1543, - "step": 1568 - }, - { - "epoch": 0.04, - "learning_rate": 1.9994542680638453e-06, - "loss": 0.8213, - "step": 1569 - }, - { - "epoch": 0.04, - "learning_rate": 1.999451522498147e-06, - "loss": 1.0059, - "step": 1570 - }, - { - "epoch": 0.04, - "learning_rate": 1.999448770045221e-06, - "loss": 1.1279, - "step": 1571 - }, - { - "epoch": 0.04, - "learning_rate": 1.9994460107050856e-06, - "loss": 0.8525, - "step": 1572 - }, - { - "epoch": 0.04, - "learning_rate": 1.99944324447776e-06, - "loss": 1.1152, - "step": 1573 - }, - { - "epoch": 0.04, - "learning_rate": 1.999440471363264e-06, - "loss": 0.8008, - "step": 1574 - }, - { - "epoch": 0.04, - "learning_rate": 1.9994376913616156e-06, - "loss": 0.9697, - "step": 1575 - }, - { - "epoch": 0.04, - "learning_rate": 1.9994349044728352e-06, - "loss": 0.7773, - "step": 1576 - }, - { - "epoch": 0.04, - "learning_rate": 1.999432110696941e-06, - "loss": 0.9307, - "step": 1577 - }, - { - "epoch": 0.04, - "learning_rate": 1.999429310033952e-06, - "loss": 1.0098, - "step": 1578 - }, - { - "epoch": 0.04, - "learning_rate": 1.9994265024838892e-06, - "loss": 1.125, - "step": 1579 - }, - { - "epoch": 0.04, - "learning_rate": 1.99942368804677e-06, - "loss": 1.125, - "step": 1580 - }, - { - "epoch": 0.04, - "learning_rate": 1.999420866722615e-06, - "loss": 1.1309, - "step": 1581 - }, - { - "epoch": 0.04, - "learning_rate": 1.999418038511443e-06, - "loss": 0.8936, - "step": 1582 - }, - { - "epoch": 0.04, - "learning_rate": 1.9994152034132742e-06, - "loss": 0.7495, - "step": 1583 - }, - { - "epoch": 0.04, - "learning_rate": 1.999412361428127e-06, - "loss": 0.6406, - "step": 1584 - }, - { - "epoch": 0.04, - "learning_rate": 1.999409512556022e-06, - "loss": 1.0166, - "step": 1585 - }, - { - "epoch": 0.04, - "learning_rate": 1.9994066567969787e-06, - "loss": 0.8389, - "step": 1586 - }, - { - "epoch": 0.04, - "learning_rate": 1.9994037941510165e-06, - "loss": 0.8076, - "step": 1587 - }, - { - "epoch": 0.04, - "learning_rate": 1.9994009246181547e-06, - "loss": 0.7783, - "step": 1588 - }, - { - "epoch": 0.04, - "learning_rate": 1.9993980481984145e-06, - "loss": 0.9165, - "step": 1589 - }, - { - "epoch": 0.04, - "learning_rate": 1.999395164891814e-06, - "loss": 1.1572, - "step": 1590 - }, - { - "epoch": 0.04, - "learning_rate": 1.9993922746983744e-06, - "loss": 0.7473, - "step": 1591 - }, - { - "epoch": 0.04, - "learning_rate": 1.999389377618115e-06, - "loss": 0.7969, - "step": 1592 - }, - { - "epoch": 0.04, - "learning_rate": 1.999386473651055e-06, - "loss": 0.9785, - "step": 1593 - }, - { - "epoch": 0.04, - "learning_rate": 1.999383562797216e-06, - "loss": 1.0273, - "step": 1594 - }, - { - "epoch": 0.04, - "learning_rate": 1.9993806450566177e-06, - "loss": 0.7676, - "step": 1595 - }, - { - "epoch": 0.04, - "learning_rate": 1.999377720429279e-06, - "loss": 0.8628, - "step": 1596 - }, - { - "epoch": 0.04, - "learning_rate": 1.9993747889152215e-06, - "loss": 1.1709, - "step": 1597 - }, - { - "epoch": 0.04, - "learning_rate": 1.9993718505144645e-06, - "loss": 0.9492, - "step": 1598 - }, - { - "epoch": 0.04, - "learning_rate": 1.9993689052270286e-06, - "loss": 1.0029, - "step": 1599 - }, - { - "epoch": 0.04, - "learning_rate": 1.999365953052934e-06, - "loss": 0.8291, - "step": 1600 - }, - { - "epoch": 0.04, - "learning_rate": 1.999362993992201e-06, - "loss": 1.042, - "step": 1601 - }, - { - "epoch": 0.04, - "learning_rate": 1.99936002804485e-06, - "loss": 1.0566, - "step": 1602 - }, - { - "epoch": 0.04, - "learning_rate": 1.999357055210902e-06, - "loss": 0.8452, - "step": 1603 - }, - { - "epoch": 0.04, - "learning_rate": 1.9993540754903764e-06, - "loss": 1.0996, - "step": 1604 - }, - { - "epoch": 0.04, - "learning_rate": 1.9993510888832947e-06, - "loss": 1.166, - "step": 1605 - }, - { - "epoch": 0.04, - "learning_rate": 1.999348095389677e-06, - "loss": 0.9253, - "step": 1606 - }, - { - "epoch": 0.04, - "learning_rate": 1.999345095009544e-06, - "loss": 0.8589, - "step": 1607 - }, - { - "epoch": 0.04, - "learning_rate": 1.9993420877429165e-06, - "loss": 1.2207, - "step": 1608 - }, - { - "epoch": 0.04, - "learning_rate": 1.9993390735898147e-06, - "loss": 0.8809, - "step": 1609 - }, - { - "epoch": 0.04, - "learning_rate": 1.99933605255026e-06, - "loss": 1.0078, - "step": 1610 - }, - { - "epoch": 0.04, - "learning_rate": 1.999333024624273e-06, - "loss": 0.9238, - "step": 1611 - }, - { - "epoch": 0.04, - "learning_rate": 1.999329989811875e-06, - "loss": 0.8311, - "step": 1612 - }, - { - "epoch": 0.04, - "learning_rate": 1.999326948113086e-06, - "loss": 0.9629, - "step": 1613 - }, - { - "epoch": 0.04, - "learning_rate": 1.9993238995279277e-06, - "loss": 1.1055, - "step": 1614 - }, - { - "epoch": 0.04, - "learning_rate": 1.9993208440564207e-06, - "loss": 0.8184, - "step": 1615 - }, - { - "epoch": 0.04, - "learning_rate": 1.9993177816985863e-06, - "loss": 1.0654, - "step": 1616 - }, - { - "epoch": 0.04, - "learning_rate": 1.9993147124544455e-06, - "loss": 0.8213, - "step": 1617 - }, - { - "epoch": 0.04, - "learning_rate": 1.9993116363240193e-06, - "loss": 0.9639, - "step": 1618 - }, - { - "epoch": 0.04, - "learning_rate": 1.9993085533073295e-06, - "loss": 0.9814, - "step": 1619 - }, - { - "epoch": 0.04, - "learning_rate": 1.9993054634043965e-06, - "loss": 1.0938, - "step": 1620 - }, - { - "epoch": 0.04, - "learning_rate": 1.9993023666152424e-06, - "loss": 0.8604, - "step": 1621 - }, - { - "epoch": 0.04, - "learning_rate": 1.999299262939888e-06, - "loss": 0.8472, - "step": 1622 - }, - { - "epoch": 0.04, - "learning_rate": 1.9992961523783545e-06, - "loss": 0.9385, - "step": 1623 - }, - { - "epoch": 0.04, - "learning_rate": 1.999293034930664e-06, - "loss": 0.9717, - "step": 1624 - }, - { - "epoch": 0.04, - "learning_rate": 1.9992899105968373e-06, - "loss": 0.7954, - "step": 1625 - }, - { - "epoch": 0.04, - "learning_rate": 1.9992867793768963e-06, - "loss": 0.9414, - "step": 1626 - }, - { - "epoch": 0.04, - "learning_rate": 1.999283641270863e-06, - "loss": 0.938, - "step": 1627 - }, - { - "epoch": 0.04, - "learning_rate": 1.999280496278758e-06, - "loss": 0.896, - "step": 1628 - }, - { - "epoch": 0.04, - "learning_rate": 1.9992773444006043e-06, - "loss": 1.1504, - "step": 1629 - }, - { - "epoch": 0.04, - "learning_rate": 1.9992741856364224e-06, - "loss": 1.0752, - "step": 1630 - }, - { - "epoch": 0.04, - "learning_rate": 1.9992710199862344e-06, - "loss": 1.1104, - "step": 1631 - }, - { - "epoch": 0.04, - "learning_rate": 1.9992678474500625e-06, - "loss": 1.1387, - "step": 1632 - }, - { - "epoch": 0.04, - "learning_rate": 1.999264668027928e-06, - "loss": 0.9512, - "step": 1633 - }, - { - "epoch": 0.04, - "learning_rate": 1.999261481719854e-06, - "loss": 0.9375, - "step": 1634 - }, - { - "epoch": 0.04, - "learning_rate": 1.9992582885258605e-06, - "loss": 1.1729, - "step": 1635 - }, - { - "epoch": 0.04, - "learning_rate": 1.9992550884459715e-06, - "loss": 0.9688, - "step": 1636 - }, - { - "epoch": 0.04, - "learning_rate": 1.9992518814802074e-06, - "loss": 0.8936, - "step": 1637 - }, - { - "epoch": 0.04, - "learning_rate": 1.9992486676285915e-06, - "loss": 1.1064, - "step": 1638 - }, - { - "epoch": 0.04, - "learning_rate": 1.9992454468911453e-06, - "loss": 0.9648, - "step": 1639 - }, - { - "epoch": 0.04, - "learning_rate": 1.9992422192678913e-06, - "loss": 1.1211, - "step": 1640 - }, - { - "epoch": 0.04, - "learning_rate": 1.999238984758851e-06, - "loss": 0.8062, - "step": 1641 - }, - { - "epoch": 0.04, - "learning_rate": 1.9992357433640484e-06, - "loss": 0.9414, - "step": 1642 - }, - { - "epoch": 0.04, - "learning_rate": 1.999232495083504e-06, - "loss": 1.1533, - "step": 1643 - }, - { - "epoch": 0.04, - "learning_rate": 1.999229239917241e-06, - "loss": 0.9775, - "step": 1644 - }, - { - "epoch": 0.04, - "learning_rate": 1.9992259778652822e-06, - "loss": 1.0303, - "step": 1645 - }, - { - "epoch": 0.04, - "learning_rate": 1.999222708927649e-06, - "loss": 1.043, - "step": 1646 - }, - { - "epoch": 0.04, - "learning_rate": 1.999219433104365e-06, - "loss": 1.0879, - "step": 1647 - }, - { - "epoch": 0.04, - "learning_rate": 1.999216150395452e-06, - "loss": 0.9023, - "step": 1648 - }, - { - "epoch": 0.04, - "learning_rate": 1.9992128608009335e-06, - "loss": 1.0557, - "step": 1649 - }, - { - "epoch": 0.04, - "learning_rate": 1.999209564320831e-06, - "loss": 1.1309, - "step": 1650 - }, - { - "epoch": 0.04, - "learning_rate": 1.9992062609551682e-06, - "loss": 0.8105, - "step": 1651 - }, - { - "epoch": 0.04, - "learning_rate": 1.9992029507039676e-06, - "loss": 1.1309, - "step": 1652 - }, - { - "epoch": 0.04, - "learning_rate": 1.9991996335672517e-06, - "loss": 0.8496, - "step": 1653 - }, - { - "epoch": 0.04, - "learning_rate": 1.9991963095450436e-06, - "loss": 0.9219, - "step": 1654 - }, - { - "epoch": 0.04, - "learning_rate": 1.999192978637366e-06, - "loss": 0.9717, - "step": 1655 - }, - { - "epoch": 0.04, - "learning_rate": 1.9991896408442424e-06, - "loss": 0.9385, - "step": 1656 - }, - { - "epoch": 0.04, - "learning_rate": 1.9991862961656954e-06, - "loss": 0.7324, - "step": 1657 - }, - { - "epoch": 0.04, - "learning_rate": 1.999182944601748e-06, - "loss": 1.084, - "step": 1658 - }, - { - "epoch": 0.04, - "learning_rate": 1.9991795861524233e-06, - "loss": 0.8599, - "step": 1659 - }, - { - "epoch": 0.04, - "learning_rate": 1.9991762208177447e-06, - "loss": 0.8389, - "step": 1660 - }, - { - "epoch": 0.04, - "learning_rate": 1.9991728485977347e-06, - "loss": 0.9453, - "step": 1661 - }, - { - "epoch": 0.04, - "learning_rate": 1.999169469492418e-06, - "loss": 0.9941, - "step": 1662 - }, - { - "epoch": 0.04, - "learning_rate": 1.999166083501816e-06, - "loss": 1.2207, - "step": 1663 - }, - { - "epoch": 0.04, - "learning_rate": 1.9991626906259534e-06, - "loss": 1.0576, - "step": 1664 - }, - { - "epoch": 0.04, - "learning_rate": 1.999159290864853e-06, - "loss": 0.958, - "step": 1665 - }, - { - "epoch": 0.04, - "learning_rate": 1.9991558842185386e-06, - "loss": 0.8574, - "step": 1666 - }, - { - "epoch": 0.04, - "learning_rate": 1.999152470687033e-06, - "loss": 1.2197, - "step": 1667 - }, - { - "epoch": 0.04, - "learning_rate": 1.999149050270361e-06, - "loss": 0.9854, - "step": 1668 - }, - { - "epoch": 0.04, - "learning_rate": 1.9991456229685446e-06, - "loss": 1.0791, - "step": 1669 - }, - { - "epoch": 0.04, - "learning_rate": 1.9991421887816083e-06, - "loss": 1.1025, - "step": 1670 - }, - { - "epoch": 0.04, - "learning_rate": 1.999138747709576e-06, - "loss": 1.0205, - "step": 1671 - }, - { - "epoch": 0.04, - "learning_rate": 1.999135299752471e-06, - "loss": 0.8145, - "step": 1672 - }, - { - "epoch": 0.04, - "learning_rate": 1.999131844910317e-06, - "loss": 1.0859, - "step": 1673 - }, - { - "epoch": 0.04, - "learning_rate": 1.9991283831831376e-06, - "loss": 1.1084, - "step": 1674 - }, - { - "epoch": 0.04, - "learning_rate": 1.9991249145709574e-06, - "loss": 0.9141, - "step": 1675 - }, - { - "epoch": 0.04, - "learning_rate": 1.9991214390737994e-06, - "loss": 0.6851, - "step": 1676 - }, - { - "epoch": 0.04, - "learning_rate": 1.9991179566916883e-06, - "loss": 1.0488, - "step": 1677 - }, - { - "epoch": 0.04, - "learning_rate": 1.999114467424648e-06, - "loss": 0.8306, - "step": 1678 - }, - { - "epoch": 0.04, - "learning_rate": 1.999110971272702e-06, - "loss": 1.0273, - "step": 1679 - }, - { - "epoch": 0.04, - "learning_rate": 1.999107468235875e-06, - "loss": 0.915, - "step": 1680 - }, - { - "epoch": 0.04, - "learning_rate": 1.9991039583141906e-06, - "loss": 0.8135, - "step": 1681 - }, - { - "epoch": 0.04, - "learning_rate": 1.9991004415076733e-06, - "loss": 0.8157, - "step": 1682 - }, - { - "epoch": 0.04, - "learning_rate": 1.9990969178163477e-06, - "loss": 0.9941, - "step": 1683 - }, - { - "epoch": 0.04, - "learning_rate": 1.9990933872402375e-06, - "loss": 0.8926, - "step": 1684 - }, - { - "epoch": 0.04, - "learning_rate": 1.999089849779367e-06, - "loss": 0.9482, - "step": 1685 - }, - { - "epoch": 0.04, - "learning_rate": 1.999086305433761e-06, - "loss": 0.8691, - "step": 1686 - }, - { - "epoch": 0.04, - "learning_rate": 1.9990827542034437e-06, - "loss": 1.2578, - "step": 1687 - }, - { - "epoch": 0.04, - "learning_rate": 1.9990791960884395e-06, - "loss": 0.9639, - "step": 1688 - }, - { - "epoch": 0.04, - "learning_rate": 1.999075631088773e-06, - "loss": 1.1738, - "step": 1689 - }, - { - "epoch": 0.04, - "learning_rate": 1.999072059204469e-06, - "loss": 0.8311, - "step": 1690 - }, - { - "epoch": 0.04, - "learning_rate": 1.9990684804355516e-06, - "loss": 1.0938, - "step": 1691 - }, - { - "epoch": 0.04, - "learning_rate": 1.999064894782046e-06, - "loss": 1.1533, - "step": 1692 - }, - { - "epoch": 0.04, - "learning_rate": 1.9990613022439765e-06, - "loss": 0.9297, - "step": 1693 - }, - { - "epoch": 0.04, - "learning_rate": 1.9990577028213684e-06, - "loss": 0.8062, - "step": 1694 - }, - { - "epoch": 0.04, - "learning_rate": 1.9990540965142455e-06, - "loss": 0.6846, - "step": 1695 - }, - { - "epoch": 0.04, - "learning_rate": 1.9990504833226337e-06, - "loss": 0.9062, - "step": 1696 - }, - { - "epoch": 0.04, - "learning_rate": 1.9990468632465574e-06, - "loss": 0.9473, - "step": 1697 - }, - { - "epoch": 0.04, - "learning_rate": 1.9990432362860417e-06, - "loss": 0.9629, - "step": 1698 - }, - { - "epoch": 0.04, - "learning_rate": 1.999039602441111e-06, - "loss": 1.1035, - "step": 1699 - }, - { - "epoch": 0.04, - "learning_rate": 1.9990359617117916e-06, - "loss": 1.0391, - "step": 1700 - }, - { - "epoch": 0.04, - "learning_rate": 1.9990323140981075e-06, - "loss": 1.0166, - "step": 1701 - }, - { - "epoch": 0.04, - "learning_rate": 1.9990286596000844e-06, - "loss": 1.0264, - "step": 1702 - }, - { - "epoch": 0.04, - "learning_rate": 1.999024998217747e-06, - "loss": 1.0117, - "step": 1703 - }, - { - "epoch": 0.04, - "learning_rate": 1.9990213299511206e-06, - "loss": 0.9824, - "step": 1704 - }, - { - "epoch": 0.04, - "learning_rate": 1.999017654800231e-06, - "loss": 0.687, - "step": 1705 - }, - { - "epoch": 0.04, - "learning_rate": 1.9990139727651034e-06, - "loss": 0.873, - "step": 1706 - }, - { - "epoch": 0.04, - "learning_rate": 1.9990102838457624e-06, - "loss": 1.0879, - "step": 1707 - }, - { - "epoch": 0.04, - "learning_rate": 1.999006588042234e-06, - "loss": 0.8877, - "step": 1708 - }, - { - "epoch": 0.04, - "learning_rate": 1.9990028853545443e-06, - "loss": 1.0547, - "step": 1709 - }, - { - "epoch": 0.04, - "learning_rate": 1.9989991757827176e-06, - "loss": 0.8799, - "step": 1710 - }, - { - "epoch": 0.04, - "learning_rate": 1.9989954593267802e-06, - "loss": 0.9863, - "step": 1711 - }, - { - "epoch": 0.04, - "learning_rate": 1.9989917359867574e-06, - "loss": 0.7686, - "step": 1712 - }, - { - "epoch": 0.04, - "learning_rate": 1.9989880057626755e-06, - "loss": 0.6729, - "step": 1713 - }, - { - "epoch": 0.04, - "learning_rate": 1.998984268654559e-06, - "loss": 0.8477, - "step": 1714 - }, - { - "epoch": 0.04, - "learning_rate": 1.9989805246624347e-06, - "loss": 0.8809, - "step": 1715 - }, - { - "epoch": 0.04, - "learning_rate": 1.998976773786328e-06, - "loss": 0.6428, - "step": 1716 - }, - { - "epoch": 0.04, - "learning_rate": 1.998973016026265e-06, - "loss": 0.9922, - "step": 1717 - }, - { - "epoch": 0.04, - "learning_rate": 1.9989692513822713e-06, - "loss": 1.0752, - "step": 1718 - }, - { - "epoch": 0.04, - "learning_rate": 1.998965479854373e-06, - "loss": 1.0547, - "step": 1719 - }, - { - "epoch": 0.04, - "learning_rate": 1.998961701442596e-06, - "loss": 0.8896, - "step": 1720 - }, - { - "epoch": 0.04, - "learning_rate": 1.998957916146966e-06, - "loss": 1.1797, - "step": 1721 - }, - { - "epoch": 0.04, - "learning_rate": 1.99895412396751e-06, - "loss": 0.9365, - "step": 1722 - }, - { - "epoch": 0.04, - "learning_rate": 1.9989503249042535e-06, - "loss": 1.0645, - "step": 1723 - }, - { - "epoch": 0.04, - "learning_rate": 1.9989465189572226e-06, - "loss": 1.0713, - "step": 1724 - }, - { - "epoch": 0.04, - "learning_rate": 1.9989427061264435e-06, - "loss": 1.0586, - "step": 1725 - }, - { - "epoch": 0.04, - "learning_rate": 1.998938886411943e-06, - "loss": 0.8027, - "step": 1726 - }, - { - "epoch": 0.04, - "learning_rate": 1.998935059813747e-06, - "loss": 1.1504, - "step": 1727 - }, - { - "epoch": 0.04, - "learning_rate": 1.998931226331882e-06, - "loss": 1.1152, - "step": 1728 - }, - { - "epoch": 0.04, - "learning_rate": 1.998927385966374e-06, - "loss": 1.1221, - "step": 1729 - }, - { - "epoch": 0.04, - "learning_rate": 1.9989235387172502e-06, - "loss": 0.9307, - "step": 1730 - }, - { - "epoch": 0.04, - "learning_rate": 1.998919684584537e-06, - "loss": 0.7588, - "step": 1731 - }, - { - "epoch": 0.04, - "learning_rate": 1.9989158235682604e-06, - "loss": 0.8721, - "step": 1732 - }, - { - "epoch": 0.04, - "learning_rate": 1.998911955668447e-06, - "loss": 0.79, - "step": 1733 - }, - { - "epoch": 0.04, - "learning_rate": 1.998908080885124e-06, - "loss": 0.8198, - "step": 1734 - }, - { - "epoch": 0.04, - "learning_rate": 1.9989041992183182e-06, - "loss": 1.0439, - "step": 1735 - }, - { - "epoch": 0.04, - "learning_rate": 1.9989003106680554e-06, - "loss": 1.0967, - "step": 1736 - }, - { - "epoch": 0.04, - "learning_rate": 1.9988964152343637e-06, - "loss": 0.9146, - "step": 1737 - }, - { - "epoch": 0.04, - "learning_rate": 1.998892512917269e-06, - "loss": 0.9922, - "step": 1738 - }, - { - "epoch": 0.04, - "learning_rate": 1.998888603716798e-06, - "loss": 0.9307, - "step": 1739 - }, - { - "epoch": 0.04, - "learning_rate": 1.998884687632979e-06, - "loss": 1.0156, - "step": 1740 - }, - { - "epoch": 0.04, - "learning_rate": 1.9988807646658375e-06, - "loss": 1.0254, - "step": 1741 - }, - { - "epoch": 0.04, - "learning_rate": 1.998876834815401e-06, - "loss": 0.9307, - "step": 1742 - }, - { - "epoch": 0.04, - "learning_rate": 1.998872898081697e-06, - "loss": 0.9395, - "step": 1743 - }, - { - "epoch": 0.04, - "learning_rate": 1.998868954464752e-06, - "loss": 0.9395, - "step": 1744 - }, - { - "epoch": 0.04, - "learning_rate": 1.9988650039645937e-06, - "loss": 1.0781, - "step": 1745 - }, - { - "epoch": 0.04, - "learning_rate": 1.998861046581249e-06, - "loss": 0.9092, - "step": 1746 - }, - { - "epoch": 0.04, - "learning_rate": 1.998857082314745e-06, - "loss": 0.9619, - "step": 1747 - }, - { - "epoch": 0.04, - "learning_rate": 1.99885311116511e-06, - "loss": 0.8418, - "step": 1748 - }, - { - "epoch": 0.04, - "learning_rate": 1.99884913313237e-06, - "loss": 1.0107, - "step": 1749 - }, - { - "epoch": 0.04, - "learning_rate": 1.9988451482165534e-06, - "loss": 1.0693, - "step": 1750 - }, - { - "epoch": 0.04, - "learning_rate": 1.9988411564176877e-06, - "loss": 0.585, - "step": 1751 - }, - { - "epoch": 0.04, - "learning_rate": 1.9988371577357996e-06, - "loss": 1.1025, - "step": 1752 - }, - { - "epoch": 0.04, - "learning_rate": 1.998833152170917e-06, - "loss": 1.0127, - "step": 1753 - }, - { - "epoch": 0.04, - "learning_rate": 1.9988291397230677e-06, - "loss": 1.0195, - "step": 1754 - }, - { - "epoch": 0.04, - "learning_rate": 1.998825120392279e-06, - "loss": 1.0059, - "step": 1755 - }, - { - "epoch": 0.05, - "learning_rate": 1.9988210941785794e-06, - "loss": 0.813, - "step": 1756 - }, - { - "epoch": 0.05, - "learning_rate": 1.998817061081996e-06, - "loss": 0.9575, - "step": 1757 - }, - { - "epoch": 0.05, - "learning_rate": 1.9988130211025566e-06, - "loss": 0.874, - "step": 1758 - }, - { - "epoch": 0.05, - "learning_rate": 1.998808974240289e-06, - "loss": 0.9082, - "step": 1759 - }, - { - "epoch": 0.05, - "learning_rate": 1.9988049204952215e-06, - "loss": 0.9834, - "step": 1760 - }, - { - "epoch": 0.05, - "learning_rate": 1.9988008598673813e-06, - "loss": 0.9121, - "step": 1761 - }, - { - "epoch": 0.05, - "learning_rate": 1.998796792356797e-06, - "loss": 0.9648, - "step": 1762 - }, - { - "epoch": 0.05, - "learning_rate": 1.9987927179634966e-06, - "loss": 0.916, - "step": 1763 - }, - { - "epoch": 0.05, - "learning_rate": 1.998788636687508e-06, - "loss": 1.0762, - "step": 1764 - }, - { - "epoch": 0.05, - "learning_rate": 1.998784548528859e-06, - "loss": 0.7773, - "step": 1765 - }, - { - "epoch": 0.05, - "learning_rate": 1.998780453487579e-06, - "loss": 0.8271, - "step": 1766 - }, - { - "epoch": 0.05, - "learning_rate": 1.998776351563694e-06, - "loss": 0.9336, - "step": 1767 - }, - { - "epoch": 0.05, - "learning_rate": 1.998772242757235e-06, - "loss": 1.0684, - "step": 1768 - }, - { - "epoch": 0.05, - "learning_rate": 1.9987681270682284e-06, - "loss": 0.8691, - "step": 1769 - }, - { - "epoch": 0.05, - "learning_rate": 1.9987640044967028e-06, - "loss": 1.0322, - "step": 1770 - }, - { - "epoch": 0.05, - "learning_rate": 1.998759875042687e-06, - "loss": 1.0107, - "step": 1771 - }, - { - "epoch": 0.05, - "learning_rate": 1.99875573870621e-06, - "loss": 0.9771, - "step": 1772 - }, - { - "epoch": 0.05, - "learning_rate": 1.998751595487299e-06, - "loss": 1.0117, - "step": 1773 - }, - { - "epoch": 0.05, - "learning_rate": 1.9987474453859832e-06, - "loss": 1.1914, - "step": 1774 - }, - { - "epoch": 0.05, - "learning_rate": 1.9987432884022914e-06, - "loss": 0.7246, - "step": 1775 - }, - { - "epoch": 0.05, - "learning_rate": 1.998739124536252e-06, - "loss": 0.8457, - "step": 1776 - }, - { - "epoch": 0.05, - "learning_rate": 1.998734953787894e-06, - "loss": 0.998, - "step": 1777 - }, - { - "epoch": 0.05, - "learning_rate": 1.9987307761572456e-06, - "loss": 0.9697, - "step": 1778 - }, - { - "epoch": 0.05, - "learning_rate": 1.998726591644336e-06, - "loss": 1.0547, - "step": 1779 - }, - { - "epoch": 0.05, - "learning_rate": 1.9987224002491937e-06, - "loss": 0.8652, - "step": 1780 - }, - { - "epoch": 0.05, - "learning_rate": 1.998718201971848e-06, - "loss": 0.9814, - "step": 1781 - }, - { - "epoch": 0.05, - "learning_rate": 1.998713996812328e-06, - "loss": 0.999, - "step": 1782 - }, - { - "epoch": 0.05, - "learning_rate": 1.9987097847706614e-06, - "loss": 0.9629, - "step": 1783 - }, - { - "epoch": 0.05, - "learning_rate": 1.9987055658468786e-06, - "loss": 1.1191, - "step": 1784 - }, - { - "epoch": 0.05, - "learning_rate": 1.998701340041008e-06, - "loss": 1.0957, - "step": 1785 - }, - { - "epoch": 0.05, - "learning_rate": 1.9986971073530796e-06, - "loss": 1.041, - "step": 1786 - }, - { - "epoch": 0.05, - "learning_rate": 1.9986928677831214e-06, - "loss": 0.9502, - "step": 1787 - }, - { - "epoch": 0.05, - "learning_rate": 1.998688621331163e-06, - "loss": 1.0273, - "step": 1788 - }, - { - "epoch": 0.05, - "learning_rate": 1.9986843679972337e-06, - "loss": 0.9521, - "step": 1789 - }, - { - "epoch": 0.05, - "learning_rate": 1.9986801077813633e-06, - "loss": 1.0566, - "step": 1790 - }, - { - "epoch": 0.05, - "learning_rate": 1.9986758406835806e-06, - "loss": 0.7463, - "step": 1791 - }, - { - "epoch": 0.05, - "learning_rate": 1.998671566703915e-06, - "loss": 0.9502, - "step": 1792 - }, - { - "epoch": 0.05, - "learning_rate": 1.998667285842396e-06, - "loss": 0.915, - "step": 1793 - }, - { - "epoch": 0.05, - "learning_rate": 1.9986629980990536e-06, - "loss": 1.0508, - "step": 1794 - }, - { - "epoch": 0.05, - "learning_rate": 1.9986587034739165e-06, - "loss": 1.0264, - "step": 1795 - }, - { - "epoch": 0.05, - "learning_rate": 1.998654401967015e-06, - "loss": 0.8252, - "step": 1796 - }, - { - "epoch": 0.05, - "learning_rate": 1.9986500935783784e-06, - "loss": 0.9834, - "step": 1797 - }, - { - "epoch": 0.05, - "learning_rate": 1.9986457783080363e-06, - "loss": 0.8604, - "step": 1798 - }, - { - "epoch": 0.05, - "learning_rate": 1.9986414561560186e-06, - "loss": 0.7881, - "step": 1799 - }, - { - "epoch": 0.05, - "learning_rate": 1.998637127122355e-06, - "loss": 1.0645, - "step": 1800 - }, - { - "epoch": 0.05, - "learning_rate": 1.998632791207076e-06, - "loss": 0.8447, - "step": 1801 - }, - { - "epoch": 0.05, - "learning_rate": 1.99862844841021e-06, - "loss": 1.1025, - "step": 1802 - }, - { - "epoch": 0.05, - "learning_rate": 1.998624098731789e-06, - "loss": 1.124, - "step": 1803 - }, - { - "epoch": 0.05, - "learning_rate": 1.998619742171841e-06, - "loss": 0.9131, - "step": 1804 - }, - { - "epoch": 0.05, - "learning_rate": 1.998615378730397e-06, - "loss": 1.0791, - "step": 1805 - }, - { - "epoch": 0.05, - "learning_rate": 1.9986110084074867e-06, - "loss": 0.9512, - "step": 1806 - }, - { - "epoch": 0.05, - "learning_rate": 1.9986066312031403e-06, - "loss": 0.9814, - "step": 1807 - }, - { - "epoch": 0.05, - "learning_rate": 1.998602247117388e-06, - "loss": 1.0273, - "step": 1808 - }, - { - "epoch": 0.05, - "learning_rate": 1.9985978561502608e-06, - "loss": 0.9604, - "step": 1809 - }, - { - "epoch": 0.05, - "learning_rate": 1.9985934583017877e-06, - "loss": 0.7681, - "step": 1810 - }, - { - "epoch": 0.05, - "learning_rate": 1.9985890535719995e-06, - "loss": 0.8281, - "step": 1811 - }, - { - "epoch": 0.05, - "learning_rate": 1.9985846419609266e-06, - "loss": 1.3066, - "step": 1812 - }, - { - "epoch": 0.05, - "learning_rate": 1.9985802234685995e-06, - "loss": 1.0215, - "step": 1813 - }, - { - "epoch": 0.05, - "learning_rate": 1.9985757980950484e-06, - "loss": 0.5566, - "step": 1814 - }, - { - "epoch": 0.05, - "learning_rate": 1.998571365840304e-06, - "loss": 1.0391, - "step": 1815 - }, - { - "epoch": 0.05, - "learning_rate": 1.998566926704397e-06, - "loss": 0.8662, - "step": 1816 - }, - { - "epoch": 0.05, - "learning_rate": 1.9985624806873576e-06, - "loss": 0.8203, - "step": 1817 - }, - { - "epoch": 0.05, - "learning_rate": 1.9985580277892167e-06, - "loss": 0.9795, - "step": 1818 - }, - { - "epoch": 0.05, - "learning_rate": 1.998553568010005e-06, - "loss": 1.1699, - "step": 1819 - }, - { - "epoch": 0.05, - "learning_rate": 1.9985491013497527e-06, - "loss": 1.043, - "step": 1820 - }, - { - "epoch": 0.05, - "learning_rate": 1.998544627808491e-06, - "loss": 1.208, - "step": 1821 - }, - { - "epoch": 0.05, - "learning_rate": 1.998540147386251e-06, - "loss": 0.9775, - "step": 1822 - }, - { - "epoch": 0.05, - "learning_rate": 1.998535660083063e-06, - "loss": 1.1777, - "step": 1823 - }, - { - "epoch": 0.05, - "learning_rate": 1.998531165898959e-06, - "loss": 0.8574, - "step": 1824 - }, - { - "epoch": 0.05, - "learning_rate": 1.9985266648339685e-06, - "loss": 0.8652, - "step": 1825 - }, - { - "epoch": 0.05, - "learning_rate": 1.9985221568881233e-06, - "loss": 1.126, - "step": 1826 - }, - { - "epoch": 0.05, - "learning_rate": 1.9985176420614546e-06, - "loss": 0.9805, - "step": 1827 - }, - { - "epoch": 0.05, - "learning_rate": 1.998513120353993e-06, - "loss": 0.7686, - "step": 1828 - }, - { - "epoch": 0.05, - "learning_rate": 1.99850859176577e-06, - "loss": 0.918, - "step": 1829 - }, - { - "epoch": 0.05, - "learning_rate": 1.9985040562968168e-06, - "loss": 0.8945, - "step": 1830 - }, - { - "epoch": 0.05, - "learning_rate": 1.9984995139471644e-06, - "loss": 1.0869, - "step": 1831 - }, - { - "epoch": 0.05, - "learning_rate": 1.9984949647168448e-06, - "loss": 0.8994, - "step": 1832 - }, - { - "epoch": 0.05, - "learning_rate": 1.9984904086058885e-06, - "loss": 1.0, - "step": 1833 - }, - { - "epoch": 0.05, - "learning_rate": 1.9984858456143274e-06, - "loss": 1.1719, - "step": 1834 - }, - { - "epoch": 0.05, - "learning_rate": 1.9984812757421927e-06, - "loss": 0.9268, - "step": 1835 - }, - { - "epoch": 0.05, - "learning_rate": 1.998476698989516e-06, - "loss": 0.8589, - "step": 1836 - }, - { - "epoch": 0.05, - "learning_rate": 1.9984721153563287e-06, - "loss": 1.1191, - "step": 1837 - }, - { - "epoch": 0.05, - "learning_rate": 1.9984675248426626e-06, - "loss": 0.9199, - "step": 1838 - }, - { - "epoch": 0.05, - "learning_rate": 1.9984629274485496e-06, - "loss": 1.0771, - "step": 1839 - }, - { - "epoch": 0.05, - "learning_rate": 1.9984583231740205e-06, - "loss": 0.8047, - "step": 1840 - }, - { - "epoch": 0.05, - "learning_rate": 1.998453712019108e-06, - "loss": 1.0674, - "step": 1841 - }, - { - "epoch": 0.05, - "learning_rate": 1.998449093983843e-06, - "loss": 0.9473, - "step": 1842 - }, - { - "epoch": 0.05, - "learning_rate": 1.998444469068258e-06, - "loss": 0.9941, - "step": 1843 - }, - { - "epoch": 0.05, - "learning_rate": 1.9984398372723844e-06, - "loss": 0.835, - "step": 1844 - }, - { - "epoch": 0.05, - "learning_rate": 1.9984351985962546e-06, - "loss": 1.0693, - "step": 1845 - }, - { - "epoch": 0.05, - "learning_rate": 1.9984305530399003e-06, - "loss": 0.874, - "step": 1846 - }, - { - "epoch": 0.05, - "learning_rate": 1.9984259006033536e-06, - "loss": 0.9849, - "step": 1847 - }, - { - "epoch": 0.05, - "learning_rate": 1.998421241286646e-06, - "loss": 1.0693, - "step": 1848 - }, - { - "epoch": 0.05, - "learning_rate": 1.9984165750898104e-06, - "loss": 1.1006, - "step": 1849 - }, - { - "epoch": 0.05, - "learning_rate": 1.998411902012879e-06, - "loss": 1.0557, - "step": 1850 - }, - { - "epoch": 0.05, - "learning_rate": 1.9984072220558834e-06, - "loss": 1.084, - "step": 1851 - }, - { - "epoch": 0.05, - "learning_rate": 1.9984025352188557e-06, - "loss": 1.0947, - "step": 1852 - }, - { - "epoch": 0.05, - "learning_rate": 1.998397841501829e-06, - "loss": 1.3066, - "step": 1853 - }, - { - "epoch": 0.05, - "learning_rate": 1.998393140904835e-06, - "loss": 1.2227, - "step": 1854 - }, - { - "epoch": 0.05, - "learning_rate": 1.9983884334279063e-06, - "loss": 1.0918, - "step": 1855 - }, - { - "epoch": 0.05, - "learning_rate": 1.9983837190710755e-06, - "loss": 0.9248, - "step": 1856 - }, - { - "epoch": 0.05, - "learning_rate": 1.9983789978343746e-06, - "loss": 1.0264, - "step": 1857 - }, - { - "epoch": 0.05, - "learning_rate": 1.998374269717837e-06, - "loss": 1.168, - "step": 1858 - }, - { - "epoch": 0.05, - "learning_rate": 1.9983695347214946e-06, - "loss": 0.8779, - "step": 1859 - }, - { - "epoch": 0.05, - "learning_rate": 1.9983647928453804e-06, - "loss": 0.9697, - "step": 1860 - }, - { - "epoch": 0.05, - "learning_rate": 1.9983600440895264e-06, - "loss": 1.0752, - "step": 1861 - }, - { - "epoch": 0.05, - "learning_rate": 1.9983552884539663e-06, - "loss": 0.7705, - "step": 1862 - }, - { - "epoch": 0.05, - "learning_rate": 1.9983505259387317e-06, - "loss": 1.3057, - "step": 1863 - }, - { - "epoch": 0.05, - "learning_rate": 1.998345756543857e-06, - "loss": 1.0225, - "step": 1864 - }, - { - "epoch": 0.05, - "learning_rate": 1.9983409802693734e-06, - "loss": 1.0498, - "step": 1865 - }, - { - "epoch": 0.05, - "learning_rate": 1.998336197115315e-06, - "loss": 0.9961, - "step": 1866 - }, - { - "epoch": 0.05, - "learning_rate": 1.998331407081714e-06, - "loss": 0.8359, - "step": 1867 - }, - { - "epoch": 0.05, - "learning_rate": 1.9983266101686038e-06, - "loss": 0.9185, - "step": 1868 - }, - { - "epoch": 0.05, - "learning_rate": 1.9983218063760175e-06, - "loss": 0.9854, - "step": 1869 - }, - { - "epoch": 0.05, - "learning_rate": 1.998316995703988e-06, - "loss": 0.9443, - "step": 1870 - }, - { - "epoch": 0.05, - "learning_rate": 1.9983121781525484e-06, - "loss": 1.0449, - "step": 1871 - }, - { - "epoch": 0.05, - "learning_rate": 1.9983073537217325e-06, - "loss": 1.1328, - "step": 1872 - }, - { - "epoch": 0.05, - "learning_rate": 1.9983025224115725e-06, - "loss": 1.0195, - "step": 1873 - }, - { - "epoch": 0.05, - "learning_rate": 1.9982976842221027e-06, - "loss": 0.7285, - "step": 1874 - }, - { - "epoch": 0.05, - "learning_rate": 1.9982928391533557e-06, - "loss": 0.8398, - "step": 1875 - }, - { - "epoch": 0.05, - "learning_rate": 1.998287987205366e-06, - "loss": 1.1318, - "step": 1876 - }, - { - "epoch": 0.05, - "learning_rate": 1.9982831283781653e-06, - "loss": 1.1074, - "step": 1877 - }, - { - "epoch": 0.05, - "learning_rate": 1.9982782626717883e-06, - "loss": 1.0146, - "step": 1878 - }, - { - "epoch": 0.05, - "learning_rate": 1.9982733900862684e-06, - "loss": 1.0439, - "step": 1879 - }, - { - "epoch": 0.05, - "learning_rate": 1.9982685106216387e-06, - "loss": 0.9531, - "step": 1880 - }, - { - "epoch": 0.05, - "learning_rate": 1.9982636242779333e-06, - "loss": 0.876, - "step": 1881 - }, - { - "epoch": 0.05, - "learning_rate": 1.998258731055186e-06, - "loss": 0.959, - "step": 1882 - }, - { - "epoch": 0.05, - "learning_rate": 1.99825383095343e-06, - "loss": 0.9707, - "step": 1883 - }, - { - "epoch": 0.05, - "learning_rate": 1.9982489239726995e-06, - "loss": 0.6416, - "step": 1884 - }, - { - "epoch": 0.05, - "learning_rate": 1.9982440101130276e-06, - "loss": 0.9312, - "step": 1885 - }, - { - "epoch": 0.05, - "learning_rate": 1.9982390893744496e-06, - "loss": 1.0459, - "step": 1886 - }, - { - "epoch": 0.05, - "learning_rate": 1.998234161756998e-06, - "loss": 0.8423, - "step": 1887 - }, - { - "epoch": 0.05, - "learning_rate": 1.998229227260707e-06, - "loss": 0.9473, - "step": 1888 - }, - { - "epoch": 0.05, - "learning_rate": 1.998224285885611e-06, - "loss": 0.8452, - "step": 1889 - }, - { - "epoch": 0.05, - "learning_rate": 1.9982193376317438e-06, - "loss": 0.96, - "step": 1890 - }, - { - "epoch": 0.05, - "learning_rate": 1.99821438249914e-06, - "loss": 0.9814, - "step": 1891 - }, - { - "epoch": 0.05, - "learning_rate": 1.998209420487833e-06, - "loss": 0.9297, - "step": 1892 - }, - { - "epoch": 0.05, - "learning_rate": 1.9982044515978574e-06, - "loss": 1.084, - "step": 1893 - }, - { - "epoch": 0.05, - "learning_rate": 1.998199475829248e-06, - "loss": 0.9932, - "step": 1894 - }, - { - "epoch": 0.05, - "learning_rate": 1.9981944931820376e-06, - "loss": 0.8604, - "step": 1895 - }, - { - "epoch": 0.05, - "learning_rate": 1.998189503656262e-06, - "loss": 0.8037, - "step": 1896 - }, - { - "epoch": 0.05, - "learning_rate": 1.9981845072519546e-06, - "loss": 0.8389, - "step": 1897 - }, - { - "epoch": 0.05, - "learning_rate": 1.99817950396915e-06, - "loss": 0.9941, - "step": 1898 - }, - { - "epoch": 0.05, - "learning_rate": 1.9981744938078834e-06, - "loss": 0.916, - "step": 1899 - }, - { - "epoch": 0.05, - "learning_rate": 1.9981694767681886e-06, - "loss": 0.9014, - "step": 1900 - }, - { - "epoch": 0.05, - "learning_rate": 1.9981644528501005e-06, - "loss": 1.002, - "step": 1901 - }, - { - "epoch": 0.05, - "learning_rate": 1.9981594220536538e-06, - "loss": 0.9463, - "step": 1902 - }, - { - "epoch": 0.05, - "learning_rate": 1.998154384378883e-06, - "loss": 0.9277, - "step": 1903 - }, - { - "epoch": 0.05, - "learning_rate": 1.9981493398258223e-06, - "loss": 0.9814, - "step": 1904 - }, - { - "epoch": 0.05, - "learning_rate": 1.9981442883945074e-06, - "loss": 0.8418, - "step": 1905 - }, - { - "epoch": 0.05, - "learning_rate": 1.998139230084972e-06, - "loss": 1.0977, - "step": 1906 - }, - { - "epoch": 0.05, - "learning_rate": 1.9981341648972525e-06, - "loss": 1.1152, - "step": 1907 - }, - { - "epoch": 0.05, - "learning_rate": 1.9981290928313824e-06, - "loss": 0.7014, - "step": 1908 - }, - { - "epoch": 0.05, - "learning_rate": 1.998124013887397e-06, - "loss": 0.8828, - "step": 1909 - }, - { - "epoch": 0.05, - "learning_rate": 1.998118928065332e-06, - "loss": 1.0664, - "step": 1910 - }, - { - "epoch": 0.05, - "learning_rate": 1.998113835365222e-06, - "loss": 0.9639, - "step": 1911 - }, - { - "epoch": 0.05, - "learning_rate": 1.9981087357871016e-06, - "loss": 1.0498, - "step": 1912 - }, - { - "epoch": 0.05, - "learning_rate": 1.9981036293310064e-06, - "loss": 1.082, - "step": 1913 - }, - { - "epoch": 0.05, - "learning_rate": 1.998098515996972e-06, - "loss": 0.7969, - "step": 1914 - }, - { - "epoch": 0.05, - "learning_rate": 1.9980933957850325e-06, - "loss": 1.0264, - "step": 1915 - }, - { - "epoch": 0.05, - "learning_rate": 1.998088268695224e-06, - "loss": 1.0986, - "step": 1916 - }, - { - "epoch": 0.05, - "learning_rate": 1.9980831347275822e-06, - "loss": 0.8838, - "step": 1917 - }, - { - "epoch": 0.05, - "learning_rate": 1.9980779938821417e-06, - "loss": 0.9014, - "step": 1918 - }, - { - "epoch": 0.05, - "learning_rate": 1.9980728461589385e-06, - "loss": 0.8623, - "step": 1919 - }, - { - "epoch": 0.05, - "learning_rate": 1.9980676915580073e-06, - "loss": 1.084, - "step": 1920 - }, - { - "epoch": 0.05, - "learning_rate": 1.998062530079384e-06, - "loss": 1.1387, - "step": 1921 - }, - { - "epoch": 0.05, - "learning_rate": 1.998057361723105e-06, - "loss": 1.0322, - "step": 1922 - }, - { - "epoch": 0.05, - "learning_rate": 1.9980521864892047e-06, - "loss": 1.1797, - "step": 1923 - }, - { - "epoch": 0.05, - "learning_rate": 1.998047004377719e-06, - "loss": 0.9424, - "step": 1924 - }, - { - "epoch": 0.05, - "learning_rate": 1.9980418153886843e-06, - "loss": 0.8262, - "step": 1925 - }, - { - "epoch": 0.05, - "learning_rate": 1.998036619522136e-06, - "loss": 1.0312, - "step": 1926 - }, - { - "epoch": 0.05, - "learning_rate": 1.9980314167781092e-06, - "loss": 1.0205, - "step": 1927 - }, - { - "epoch": 0.05, - "learning_rate": 1.9980262071566406e-06, - "loss": 0.8232, - "step": 1928 - }, - { - "epoch": 0.05, - "learning_rate": 1.9980209906577663e-06, - "loss": 0.9893, - "step": 1929 - }, - { - "epoch": 0.05, - "learning_rate": 1.9980157672815214e-06, - "loss": 1.0996, - "step": 1930 - }, - { - "epoch": 0.05, - "learning_rate": 1.998010537027942e-06, - "loss": 1.0566, - "step": 1931 - }, - { - "epoch": 0.05, - "learning_rate": 1.9980052998970655e-06, - "loss": 1.0439, - "step": 1932 - }, - { - "epoch": 0.05, - "learning_rate": 1.998000055888926e-06, - "loss": 1.0957, - "step": 1933 - }, - { - "epoch": 0.05, - "learning_rate": 1.997994805003561e-06, - "loss": 0.9131, - "step": 1934 - }, - { - "epoch": 0.05, - "learning_rate": 1.997989547241006e-06, - "loss": 1.0869, - "step": 1935 - }, - { - "epoch": 0.05, - "learning_rate": 1.9979842826012974e-06, - "loss": 0.9053, - "step": 1936 - }, - { - "epoch": 0.05, - "learning_rate": 1.997979011084472e-06, - "loss": 1.0254, - "step": 1937 - }, - { - "epoch": 0.05, - "learning_rate": 1.9979737326905654e-06, - "loss": 1.207, - "step": 1938 - }, - { - "epoch": 0.05, - "learning_rate": 1.9979684474196144e-06, - "loss": 0.9668, - "step": 1939 - }, - { - "epoch": 0.05, - "learning_rate": 1.9979631552716554e-06, - "loss": 0.8672, - "step": 1940 - }, - { - "epoch": 0.05, - "learning_rate": 1.9979578562467244e-06, - "loss": 1.041, - "step": 1941 - }, - { - "epoch": 0.05, - "learning_rate": 1.9979525503448587e-06, - "loss": 0.7715, - "step": 1942 - }, - { - "epoch": 0.05, - "learning_rate": 1.9979472375660943e-06, - "loss": 0.7002, - "step": 1943 - }, - { - "epoch": 0.05, - "learning_rate": 1.9979419179104675e-06, - "loss": 1.0566, - "step": 1944 - }, - { - "epoch": 0.05, - "learning_rate": 1.997936591378016e-06, - "loss": 1.0781, - "step": 1945 - }, - { - "epoch": 0.05, - "learning_rate": 1.997931257968776e-06, - "loss": 1.0645, - "step": 1946 - }, - { - "epoch": 0.05, - "learning_rate": 1.997925917682784e-06, - "loss": 1.0869, - "step": 1947 - }, - { - "epoch": 0.05, - "learning_rate": 1.9979205705200764e-06, - "loss": 0.9365, - "step": 1948 - }, - { - "epoch": 0.05, - "learning_rate": 1.997915216480691e-06, - "loss": 0.9248, - "step": 1949 - }, - { - "epoch": 0.05, - "learning_rate": 1.997909855564664e-06, - "loss": 0.7549, - "step": 1950 - }, - { - "epoch": 0.05, - "learning_rate": 1.9979044877720335e-06, - "loss": 1.0068, - "step": 1951 - }, - { - "epoch": 0.05, - "learning_rate": 1.997899113102835e-06, - "loss": 1.0469, - "step": 1952 - }, - { - "epoch": 0.05, - "learning_rate": 1.9978937315571065e-06, - "loss": 1.0752, - "step": 1953 - }, - { - "epoch": 0.05, - "learning_rate": 1.997888343134884e-06, - "loss": 0.9922, - "step": 1954 - }, - { - "epoch": 0.05, - "learning_rate": 1.9978829478362062e-06, - "loss": 1.0, - "step": 1955 - }, - { - "epoch": 0.05, - "learning_rate": 1.9978775456611094e-06, - "loss": 0.8057, - "step": 1956 - }, - { - "epoch": 0.05, - "learning_rate": 1.9978721366096305e-06, - "loss": 0.5181, - "step": 1957 - }, - { - "epoch": 0.05, - "learning_rate": 1.9978667206818073e-06, - "loss": 0.8486, - "step": 1958 - }, - { - "epoch": 0.05, - "learning_rate": 1.997861297877677e-06, - "loss": 0.9355, - "step": 1959 - }, - { - "epoch": 0.05, - "learning_rate": 1.997855868197277e-06, - "loss": 0.9873, - "step": 1960 - }, - { - "epoch": 0.05, - "learning_rate": 1.9978504316406447e-06, - "loss": 0.9863, - "step": 1961 - }, - { - "epoch": 0.05, - "learning_rate": 1.9978449882078177e-06, - "loss": 0.9854, - "step": 1962 - }, - { - "epoch": 0.05, - "learning_rate": 1.997839537898833e-06, - "loss": 0.957, - "step": 1963 - }, - { - "epoch": 0.05, - "learning_rate": 1.9978340807137287e-06, - "loss": 0.6782, - "step": 1964 - }, - { - "epoch": 0.05, - "learning_rate": 1.9978286166525425e-06, - "loss": 0.915, - "step": 1965 - }, - { - "epoch": 0.05, - "learning_rate": 1.997823145715311e-06, - "loss": 0.9185, - "step": 1966 - }, - { - "epoch": 0.05, - "learning_rate": 1.9978176679020736e-06, - "loss": 1.3047, - "step": 1967 - }, - { - "epoch": 0.05, - "learning_rate": 1.997812183212866e-06, - "loss": 1.0977, - "step": 1968 - }, - { - "epoch": 0.05, - "learning_rate": 1.997806691647728e-06, - "loss": 1.0107, - "step": 1969 - }, - { - "epoch": 0.05, - "learning_rate": 1.9978011932066965e-06, - "loss": 0.8652, - "step": 1970 - }, - { - "epoch": 0.05, - "learning_rate": 1.997795687889809e-06, - "loss": 0.9199, - "step": 1971 - }, - { - "epoch": 0.05, - "learning_rate": 1.997790175697104e-06, - "loss": 0.998, - "step": 1972 - }, - { - "epoch": 0.05, - "learning_rate": 1.9977846566286196e-06, - "loss": 0.8711, - "step": 1973 - }, - { - "epoch": 0.05, - "learning_rate": 1.9977791306843938e-06, - "loss": 1.1494, - "step": 1974 - }, - { - "epoch": 0.05, - "learning_rate": 1.997773597864464e-06, - "loss": 0.9609, - "step": 1975 - }, - { - "epoch": 0.05, - "learning_rate": 1.997768058168869e-06, - "loss": 1.125, - "step": 1976 - }, - { - "epoch": 0.05, - "learning_rate": 1.9977625115976468e-06, - "loss": 1.1738, - "step": 1977 - }, - { - "epoch": 0.05, - "learning_rate": 1.9977569581508355e-06, - "loss": 0.9297, - "step": 1978 - }, - { - "epoch": 0.05, - "learning_rate": 1.997751397828473e-06, - "loss": 1.1328, - "step": 1979 - }, - { - "epoch": 0.05, - "learning_rate": 1.997745830630599e-06, - "loss": 1.0459, - "step": 1980 - }, - { - "epoch": 0.05, - "learning_rate": 1.99774025655725e-06, - "loss": 1.0352, - "step": 1981 - }, - { - "epoch": 0.05, - "learning_rate": 1.997734675608466e-06, - "loss": 0.9395, - "step": 1982 - }, - { - "epoch": 0.05, - "learning_rate": 1.997729087784285e-06, - "loss": 0.834, - "step": 1983 - }, - { - "epoch": 0.05, - "learning_rate": 1.9977234930847447e-06, - "loss": 1.0449, - "step": 1984 - }, - { - "epoch": 0.05, - "learning_rate": 1.9977178915098848e-06, - "loss": 0.9941, - "step": 1985 - }, - { - "epoch": 0.05, - "learning_rate": 1.997712283059743e-06, - "loss": 0.6355, - "step": 1986 - }, - { - "epoch": 0.05, - "learning_rate": 1.997706667734358e-06, - "loss": 0.7588, - "step": 1987 - }, - { - "epoch": 0.05, - "learning_rate": 1.99770104553377e-06, - "loss": 1.0859, - "step": 1988 - }, - { - "epoch": 0.05, - "learning_rate": 1.997695416458016e-06, - "loss": 1.1895, - "step": 1989 - }, - { - "epoch": 0.05, - "learning_rate": 1.997689780507135e-06, - "loss": 0.9248, - "step": 1990 - }, - { - "epoch": 0.05, - "learning_rate": 1.997684137681166e-06, - "loss": 0.7959, - "step": 1991 - }, - { - "epoch": 0.05, - "learning_rate": 1.9976784879801488e-06, - "loss": 0.7959, - "step": 1992 - }, - { - "epoch": 0.05, - "learning_rate": 1.9976728314041213e-06, - "loss": 1.1064, - "step": 1993 - }, - { - "epoch": 0.05, - "learning_rate": 1.997667167953122e-06, - "loss": 0.8691, - "step": 1994 - }, - { - "epoch": 0.05, - "learning_rate": 1.997661497627192e-06, - "loss": 0.7659, - "step": 1995 - }, - { - "epoch": 0.05, - "learning_rate": 1.9976558204263686e-06, - "loss": 1.1172, - "step": 1996 - }, - { - "epoch": 0.05, - "learning_rate": 1.997650136350691e-06, - "loss": 0.8516, - "step": 1997 - }, - { - "epoch": 0.05, - "learning_rate": 1.9976444454001993e-06, - "loss": 0.9766, - "step": 1998 - }, - { - "epoch": 0.05, - "learning_rate": 1.997638747574932e-06, - "loss": 1.0088, - "step": 1999 - }, - { - "epoch": 0.05, - "learning_rate": 1.9976330428749282e-06, - "loss": 1.0693, - "step": 2000 - }, - { - "epoch": 0.05, - "learning_rate": 1.997627331300228e-06, - "loss": 1.0771, - "step": 2001 - }, - { - "epoch": 0.05, - "learning_rate": 1.9976216128508706e-06, - "loss": 0.9688, - "step": 2002 - }, - { - "epoch": 0.05, - "learning_rate": 1.9976158875268946e-06, - "loss": 0.9004, - "step": 2003 - }, - { - "epoch": 0.05, - "learning_rate": 1.99761015532834e-06, - "loss": 0.9932, - "step": 2004 - }, - { - "epoch": 0.05, - "learning_rate": 1.9976044162552467e-06, - "loss": 0.7998, - "step": 2005 - }, - { - "epoch": 0.05, - "learning_rate": 1.997598670307653e-06, - "loss": 0.9551, - "step": 2006 - }, - { - "epoch": 0.05, - "learning_rate": 1.9975929174856004e-06, - "loss": 0.9941, - "step": 2007 - }, - { - "epoch": 0.05, - "learning_rate": 1.997587157789127e-06, - "loss": 0.8818, - "step": 2008 - }, - { - "epoch": 0.05, - "learning_rate": 1.9975813912182724e-06, - "loss": 0.9062, - "step": 2009 - }, - { - "epoch": 0.05, - "learning_rate": 1.9975756177730778e-06, - "loss": 0.9902, - "step": 2010 - }, - { - "epoch": 0.05, - "learning_rate": 1.9975698374535814e-06, - "loss": 0.8374, - "step": 2011 - }, - { - "epoch": 0.05, - "learning_rate": 1.997564050259824e-06, - "loss": 0.96, - "step": 2012 - }, - { - "epoch": 0.05, - "learning_rate": 1.9975582561918453e-06, - "loss": 1.0664, - "step": 2013 - }, - { - "epoch": 0.05, - "learning_rate": 1.997552455249685e-06, - "loss": 0.7451, - "step": 2014 - }, - { - "epoch": 0.05, - "learning_rate": 1.9975466474333834e-06, - "loss": 0.8682, - "step": 2015 - }, - { - "epoch": 0.05, - "learning_rate": 1.9975408327429803e-06, - "loss": 0.9102, - "step": 2016 - }, - { - "epoch": 0.05, - "learning_rate": 1.9975350111785156e-06, - "loss": 0.8188, - "step": 2017 - }, - { - "epoch": 0.05, - "learning_rate": 1.9975291827400295e-06, - "loss": 0.9688, - "step": 2018 - }, - { - "epoch": 0.05, - "learning_rate": 1.9975233474275624e-06, - "loss": 0.9639, - "step": 2019 - }, - { - "epoch": 0.05, - "learning_rate": 1.9975175052411543e-06, - "loss": 0.9707, - "step": 2020 - }, - { - "epoch": 0.05, - "learning_rate": 1.997511656180845e-06, - "loss": 0.9756, - "step": 2021 - }, - { - "epoch": 0.05, - "learning_rate": 1.9975058002466765e-06, - "loss": 1.0352, - "step": 2022 - }, - { - "epoch": 0.05, - "learning_rate": 1.9974999374386873e-06, - "loss": 0.7651, - "step": 2023 - }, - { - "epoch": 0.05, - "learning_rate": 1.997494067756919e-06, - "loss": 0.9248, - "step": 2024 - }, - { - "epoch": 0.05, - "learning_rate": 1.997488191201411e-06, - "loss": 1.1104, - "step": 2025 - }, - { - "epoch": 0.05, - "learning_rate": 1.997482307772204e-06, - "loss": 1.0605, - "step": 2026 - }, - { - "epoch": 0.05, - "learning_rate": 1.9974764174693395e-06, - "loss": 1.0762, - "step": 2027 - }, - { - "epoch": 0.05, - "learning_rate": 1.9974705202928576e-06, - "loss": 0.9766, - "step": 2028 - }, - { - "epoch": 0.05, - "learning_rate": 1.997464616242799e-06, - "loss": 0.9561, - "step": 2029 - }, - { - "epoch": 0.05, - "learning_rate": 1.9974587053192035e-06, - "loss": 1.0439, - "step": 2030 - }, - { - "epoch": 0.05, - "learning_rate": 1.9974527875221127e-06, - "loss": 0.8906, - "step": 2031 - }, - { - "epoch": 0.05, - "learning_rate": 1.9974468628515676e-06, - "loss": 1.1406, - "step": 2032 - }, - { - "epoch": 0.05, - "learning_rate": 1.997440931307608e-06, - "loss": 1.1562, - "step": 2033 - }, - { - "epoch": 0.05, - "learning_rate": 1.9974349928902757e-06, - "loss": 1.0664, - "step": 2034 - }, - { - "epoch": 0.05, - "learning_rate": 1.997429047599612e-06, - "loss": 0.8252, - "step": 2035 - }, - { - "epoch": 0.05, - "learning_rate": 1.9974230954356563e-06, - "loss": 0.9199, - "step": 2036 - }, - { - "epoch": 0.05, - "learning_rate": 1.9974171363984507e-06, - "loss": 0.9434, - "step": 2037 - }, - { - "epoch": 0.05, - "learning_rate": 1.997411170488036e-06, - "loss": 0.9541, - "step": 2038 - }, - { - "epoch": 0.05, - "learning_rate": 1.997405197704454e-06, - "loss": 0.8125, - "step": 2039 - }, - { - "epoch": 0.05, - "learning_rate": 1.9973992180477443e-06, - "loss": 0.8369, - "step": 2040 - }, - { - "epoch": 0.05, - "learning_rate": 1.99739323151795e-06, - "loss": 0.9072, - "step": 2041 - }, - { - "epoch": 0.05, - "learning_rate": 1.9973872381151107e-06, - "loss": 1.2539, - "step": 2042 - }, - { - "epoch": 0.05, - "learning_rate": 1.9973812378392688e-06, - "loss": 0.9834, - "step": 2043 - }, - { - "epoch": 0.05, - "learning_rate": 1.997375230690465e-06, - "loss": 1.0635, - "step": 2044 - }, - { - "epoch": 0.05, - "learning_rate": 1.997369216668741e-06, - "loss": 1.2051, - "step": 2045 - }, - { - "epoch": 0.05, - "learning_rate": 1.9973631957741383e-06, - "loss": 1.2891, - "step": 2046 - }, - { - "epoch": 0.05, - "learning_rate": 1.997357168006698e-06, - "loss": 1.1719, - "step": 2047 - }, - { - "epoch": 0.05, - "learning_rate": 1.9973511333664627e-06, - "loss": 0.959, - "step": 2048 - }, - { - "epoch": 0.05, - "learning_rate": 1.9973450918534726e-06, - "loss": 0.897, - "step": 2049 - }, - { - "epoch": 0.05, - "learning_rate": 1.99733904346777e-06, - "loss": 0.8496, - "step": 2050 - }, - { - "epoch": 0.05, - "learning_rate": 1.9973329882093964e-06, - "loss": 0.8789, - "step": 2051 - }, - { - "epoch": 0.05, - "learning_rate": 1.997326926078394e-06, - "loss": 0.7881, - "step": 2052 - }, - { - "epoch": 0.05, - "learning_rate": 1.997320857074804e-06, - "loss": 0.9092, - "step": 2053 - }, - { - "epoch": 0.05, - "learning_rate": 1.9973147811986683e-06, - "loss": 1.0195, - "step": 2054 - }, - { - "epoch": 0.05, - "learning_rate": 1.997308698450029e-06, - "loss": 0.9492, - "step": 2055 - }, - { - "epoch": 0.05, - "learning_rate": 1.997302608828928e-06, - "loss": 0.958, - "step": 2056 - }, - { - "epoch": 0.05, - "learning_rate": 1.9972965123354072e-06, - "loss": 0.9248, - "step": 2057 - }, - { - "epoch": 0.05, - "learning_rate": 1.9972904089695087e-06, - "loss": 0.9355, - "step": 2058 - }, - { - "epoch": 0.05, - "learning_rate": 1.9972842987312744e-06, - "loss": 0.9629, - "step": 2059 - }, - { - "epoch": 0.05, - "learning_rate": 1.9972781816207463e-06, - "loss": 0.7534, - "step": 2060 - }, - { - "epoch": 0.05, - "learning_rate": 1.997272057637967e-06, - "loss": 0.9316, - "step": 2061 - }, - { - "epoch": 0.05, - "learning_rate": 1.997265926782978e-06, - "loss": 0.9932, - "step": 2062 - }, - { - "epoch": 0.05, - "learning_rate": 1.997259789055822e-06, - "loss": 1.1631, - "step": 2063 - }, - { - "epoch": 0.05, - "learning_rate": 1.9972536444565413e-06, - "loss": 0.9307, - "step": 2064 - }, - { - "epoch": 0.05, - "learning_rate": 1.9972474929851785e-06, - "loss": 1.1758, - "step": 2065 - }, - { - "epoch": 0.05, - "learning_rate": 1.9972413346417756e-06, - "loss": 0.8535, - "step": 2066 - }, - { - "epoch": 0.05, - "learning_rate": 1.9972351694263753e-06, - "loss": 0.8877, - "step": 2067 - }, - { - "epoch": 0.05, - "learning_rate": 1.9972289973390196e-06, - "loss": 0.9014, - "step": 2068 - }, - { - "epoch": 0.05, - "learning_rate": 1.9972228183797516e-06, - "loss": 0.9512, - "step": 2069 - }, - { - "epoch": 0.05, - "learning_rate": 1.9972166325486134e-06, - "loss": 1.0146, - "step": 2070 - }, - { - "epoch": 0.05, - "learning_rate": 1.9972104398456476e-06, - "loss": 1.0098, - "step": 2071 - }, - { - "epoch": 0.05, - "learning_rate": 1.997204240270898e-06, - "loss": 0.9961, - "step": 2072 - }, - { - "epoch": 0.05, - "learning_rate": 1.997198033824406e-06, - "loss": 1.0635, - "step": 2073 - }, - { - "epoch": 0.05, - "learning_rate": 1.9971918205062145e-06, - "loss": 0.6246, - "step": 2074 - }, - { - "epoch": 0.05, - "learning_rate": 1.9971856003163668e-06, - "loss": 0.9639, - "step": 2075 - }, - { - "epoch": 0.05, - "learning_rate": 1.9971793732549054e-06, - "loss": 0.9502, - "step": 2076 - }, - { - "epoch": 0.05, - "learning_rate": 1.997173139321874e-06, - "loss": 0.9287, - "step": 2077 - }, - { - "epoch": 0.05, - "learning_rate": 1.997166898517314e-06, - "loss": 1.1602, - "step": 2078 - }, - { - "epoch": 0.05, - "learning_rate": 1.9971606508412705e-06, - "loss": 0.6318, - "step": 2079 - }, - { - "epoch": 0.05, - "learning_rate": 1.9971543962937848e-06, - "loss": 0.9038, - "step": 2080 - }, - { - "epoch": 0.05, - "learning_rate": 1.9971481348749006e-06, - "loss": 1.1377, - "step": 2081 - }, - { - "epoch": 0.05, - "learning_rate": 1.9971418665846615e-06, - "loss": 0.8838, - "step": 2082 - }, - { - "epoch": 0.05, - "learning_rate": 1.9971355914231094e-06, - "loss": 1.0156, - "step": 2083 - }, - { - "epoch": 0.05, - "learning_rate": 1.9971293093902893e-06, - "loss": 1.1309, - "step": 2084 - }, - { - "epoch": 0.05, - "learning_rate": 1.997123020486243e-06, - "loss": 0.9854, - "step": 2085 - }, - { - "epoch": 0.05, - "learning_rate": 1.997116724711015e-06, - "loss": 1.0801, - "step": 2086 - }, - { - "epoch": 0.05, - "learning_rate": 1.997110422064648e-06, - "loss": 0.9336, - "step": 2087 - }, - { - "epoch": 0.05, - "learning_rate": 1.997104112547185e-06, - "loss": 0.6624, - "step": 2088 - }, - { - "epoch": 0.05, - "learning_rate": 1.9970977961586704e-06, - "loss": 1.0576, - "step": 2089 - }, - { - "epoch": 0.05, - "learning_rate": 1.9970914728991474e-06, - "loss": 0.9463, - "step": 2090 - }, - { - "epoch": 0.05, - "learning_rate": 1.9970851427686595e-06, - "loss": 0.9414, - "step": 2091 - }, - { - "epoch": 0.05, - "learning_rate": 1.9970788057672505e-06, - "loss": 0.79, - "step": 2092 - }, - { - "epoch": 0.05, - "learning_rate": 1.997072461894964e-06, - "loss": 0.7668, - "step": 2093 - }, - { - "epoch": 0.05, - "learning_rate": 1.997066111151843e-06, - "loss": 1.0605, - "step": 2094 - }, - { - "epoch": 0.05, - "learning_rate": 1.997059753537932e-06, - "loss": 1.0146, - "step": 2095 - }, - { - "epoch": 0.05, - "learning_rate": 1.997053389053275e-06, - "loss": 0.7148, - "step": 2096 - }, - { - "epoch": 0.05, - "learning_rate": 1.9970470176979156e-06, - "loss": 0.9971, - "step": 2097 - }, - { - "epoch": 0.05, - "learning_rate": 1.9970406394718975e-06, - "loss": 0.9053, - "step": 2098 - }, - { - "epoch": 0.05, - "learning_rate": 1.9970342543752653e-06, - "loss": 0.9482, - "step": 2099 - }, - { - "epoch": 0.05, - "learning_rate": 1.997027862408062e-06, - "loss": 1.0898, - "step": 2100 - }, - { - "epoch": 0.05, - "learning_rate": 1.9970214635703324e-06, - "loss": 0.9189, - "step": 2101 - }, - { - "epoch": 0.05, - "learning_rate": 1.9970150578621203e-06, - "loss": 1.1445, - "step": 2102 - }, - { - "epoch": 0.05, - "learning_rate": 1.9970086452834698e-06, - "loss": 0.9629, - "step": 2103 - }, - { - "epoch": 0.05, - "learning_rate": 1.9970022258344253e-06, - "loss": 0.8818, - "step": 2104 - }, - { - "epoch": 0.05, - "learning_rate": 1.996995799515031e-06, - "loss": 1.1348, - "step": 2105 - }, - { - "epoch": 0.05, - "learning_rate": 1.996989366325331e-06, - "loss": 0.958, - "step": 2106 - }, - { - "epoch": 0.05, - "learning_rate": 1.9969829262653697e-06, - "loss": 1.0303, - "step": 2107 - }, - { - "epoch": 0.05, - "learning_rate": 1.9969764793351917e-06, - "loss": 1.0791, - "step": 2108 - }, - { - "epoch": 0.05, - "learning_rate": 1.996970025534841e-06, - "loss": 0.9785, - "step": 2109 - }, - { - "epoch": 0.05, - "learning_rate": 1.9969635648643625e-06, - "loss": 0.8955, - "step": 2110 - }, - { - "epoch": 0.05, - "learning_rate": 1.9969570973238006e-06, - "loss": 1.1738, - "step": 2111 - }, - { - "epoch": 0.05, - "learning_rate": 1.9969506229131997e-06, - "loss": 1.1318, - "step": 2112 - }, - { - "epoch": 0.05, - "learning_rate": 1.9969441416326047e-06, - "loss": 0.9668, - "step": 2113 - }, - { - "epoch": 0.05, - "learning_rate": 1.99693765348206e-06, - "loss": 1.0234, - "step": 2114 - }, - { - "epoch": 0.05, - "learning_rate": 1.99693115846161e-06, - "loss": 0.9521, - "step": 2115 - }, - { - "epoch": 0.05, - "learning_rate": 1.9969246565713004e-06, - "loss": 1.1494, - "step": 2116 - }, - { - "epoch": 0.05, - "learning_rate": 1.9969181478111753e-06, - "loss": 0.6646, - "step": 2117 - }, - { - "epoch": 0.05, - "learning_rate": 1.9969116321812796e-06, - "loss": 1.0762, - "step": 2118 - }, - { - "epoch": 0.05, - "learning_rate": 1.9969051096816583e-06, - "loss": 0.7627, - "step": 2119 - }, - { - "epoch": 0.05, - "learning_rate": 1.9968985803123568e-06, - "loss": 1.0381, - "step": 2120 - }, - { - "epoch": 0.05, - "learning_rate": 1.996892044073419e-06, - "loss": 0.8838, - "step": 2121 - }, - { - "epoch": 0.05, - "learning_rate": 1.996885500964891e-06, - "loss": 1.2061, - "step": 2122 - }, - { - "epoch": 0.05, - "learning_rate": 1.9968789509868175e-06, - "loss": 0.9219, - "step": 2123 - }, - { - "epoch": 0.05, - "learning_rate": 1.9968723941392432e-06, - "loss": 1.1582, - "step": 2124 - }, - { - "epoch": 0.05, - "learning_rate": 1.996865830422214e-06, - "loss": 1.0596, - "step": 2125 - }, - { - "epoch": 0.05, - "learning_rate": 1.9968592598357746e-06, - "loss": 1.1299, - "step": 2126 - }, - { - "epoch": 0.05, - "learning_rate": 1.996852682379971e-06, - "loss": 0.8682, - "step": 2127 - }, - { - "epoch": 0.05, - "learning_rate": 1.9968460980548477e-06, - "loss": 1.1045, - "step": 2128 - }, - { - "epoch": 0.05, - "learning_rate": 1.9968395068604504e-06, - "loss": 0.957, - "step": 2129 - }, - { - "epoch": 0.05, - "learning_rate": 1.9968329087968247e-06, - "loss": 1.1406, - "step": 2130 - }, - { - "epoch": 0.05, - "learning_rate": 1.996826303864016e-06, - "loss": 1.0205, - "step": 2131 - }, - { - "epoch": 0.05, - "learning_rate": 1.9968196920620693e-06, - "loss": 0.707, - "step": 2132 - }, - { - "epoch": 0.05, - "learning_rate": 1.996813073391031e-06, - "loss": 0.7773, - "step": 2133 - }, - { - "epoch": 0.05, - "learning_rate": 1.9968064478509457e-06, - "loss": 0.9658, - "step": 2134 - }, - { - "epoch": 0.05, - "learning_rate": 1.99679981544186e-06, - "loss": 0.9121, - "step": 2135 - }, - { - "epoch": 0.05, - "learning_rate": 1.9967931761638195e-06, - "loss": 1.0078, - "step": 2136 - }, - { - "epoch": 0.05, - "learning_rate": 1.9967865300168692e-06, - "loss": 1.0527, - "step": 2137 - }, - { - "epoch": 0.05, - "learning_rate": 1.9967798770010557e-06, - "loss": 0.9834, - "step": 2138 - }, - { - "epoch": 0.05, - "learning_rate": 1.9967732171164245e-06, - "loss": 0.877, - "step": 2139 - }, - { - "epoch": 0.05, - "learning_rate": 1.9967665503630215e-06, - "loss": 1.1191, - "step": 2140 - }, - { - "epoch": 0.05, - "learning_rate": 1.9967598767408928e-06, - "loss": 1.21, - "step": 2141 - }, - { - "epoch": 0.05, - "learning_rate": 1.996753196250084e-06, - "loss": 1.082, - "step": 2142 - }, - { - "epoch": 0.05, - "learning_rate": 1.9967465088906416e-06, - "loss": 0.8076, - "step": 2143 - }, - { - "epoch": 0.05, - "learning_rate": 1.9967398146626115e-06, - "loss": 0.8706, - "step": 2144 - }, - { - "epoch": 0.05, - "learning_rate": 1.9967331135660395e-06, - "loss": 1.1289, - "step": 2145 - }, - { - "epoch": 0.06, - "learning_rate": 1.9967264056009727e-06, - "loss": 0.7769, - "step": 2146 - }, - { - "epoch": 0.06, - "learning_rate": 1.996719690767456e-06, - "loss": 0.9902, - "step": 2147 - }, - { - "epoch": 0.06, - "learning_rate": 1.996712969065537e-06, - "loss": 0.8926, - "step": 2148 - }, - { - "epoch": 0.06, - "learning_rate": 1.9967062404952607e-06, - "loss": 0.7456, - "step": 2149 - }, - { - "epoch": 0.06, - "learning_rate": 1.9966995050566746e-06, - "loss": 1.042, - "step": 2150 - }, - { - "epoch": 0.06, - "learning_rate": 1.9966927627498246e-06, - "loss": 0.8359, - "step": 2151 - }, - { - "epoch": 0.06, - "learning_rate": 1.996686013574757e-06, - "loss": 0.9746, - "step": 2152 - }, - { - "epoch": 0.06, - "learning_rate": 1.996679257531519e-06, - "loss": 0.8081, - "step": 2153 - }, - { - "epoch": 0.06, - "learning_rate": 1.9966724946201567e-06, - "loss": 1.1191, - "step": 2154 - }, - { - "epoch": 0.06, - "learning_rate": 1.9966657248407163e-06, - "loss": 0.8574, - "step": 2155 - }, - { - "epoch": 0.06, - "learning_rate": 1.996658948193245e-06, - "loss": 0.8428, - "step": 2156 - }, - { - "epoch": 0.06, - "learning_rate": 1.99665216467779e-06, - "loss": 0.9443, - "step": 2157 - }, - { - "epoch": 0.06, - "learning_rate": 1.9966453742943966e-06, - "loss": 0.6816, - "step": 2158 - }, - { - "epoch": 0.06, - "learning_rate": 1.996638577043113e-06, - "loss": 1.002, - "step": 2159 - }, - { - "epoch": 0.06, - "learning_rate": 1.996631772923985e-06, - "loss": 1.0254, - "step": 2160 - }, - { - "epoch": 0.06, - "learning_rate": 1.9966249619370597e-06, - "loss": 0.8799, - "step": 2161 - }, - { - "epoch": 0.06, - "learning_rate": 1.996618144082385e-06, - "loss": 0.7119, - "step": 2162 - }, - { - "epoch": 0.06, - "learning_rate": 1.9966113193600065e-06, - "loss": 0.9795, - "step": 2163 - }, - { - "epoch": 0.06, - "learning_rate": 1.996604487769972e-06, - "loss": 0.9365, - "step": 2164 - }, - { - "epoch": 0.06, - "learning_rate": 1.9965976493123285e-06, - "loss": 0.9502, - "step": 2165 - }, - { - "epoch": 0.06, - "learning_rate": 1.996590803987123e-06, - "loss": 0.8838, - "step": 2166 - }, - { - "epoch": 0.06, - "learning_rate": 1.996583951794403e-06, - "loss": 0.9932, - "step": 2167 - }, - { - "epoch": 0.06, - "learning_rate": 1.9965770927342158e-06, - "loss": 1.1201, - "step": 2168 - }, - { - "epoch": 0.06, - "learning_rate": 1.9965702268066073e-06, - "loss": 1.1016, - "step": 2169 - }, - { - "epoch": 0.06, - "learning_rate": 1.9965633540116267e-06, - "loss": 0.9053, - "step": 2170 - }, - { - "epoch": 0.06, - "learning_rate": 1.99655647434932e-06, - "loss": 1.0352, - "step": 2171 - }, - { - "epoch": 0.06, - "learning_rate": 1.9965495878197355e-06, - "loss": 1.1172, - "step": 2172 - }, - { - "epoch": 0.06, - "learning_rate": 1.9965426944229197e-06, - "loss": 1.1748, - "step": 2173 - }, - { - "epoch": 0.06, - "learning_rate": 1.9965357941589215e-06, - "loss": 0.729, - "step": 2174 - }, - { - "epoch": 0.06, - "learning_rate": 1.9965288870277866e-06, - "loss": 0.8936, - "step": 2175 - }, - { - "epoch": 0.06, - "learning_rate": 1.9965219730295643e-06, - "loss": 0.8086, - "step": 2176 - }, - { - "epoch": 0.06, - "learning_rate": 1.9965150521643013e-06, - "loss": 1.0576, - "step": 2177 - }, - { - "epoch": 0.06, - "learning_rate": 1.9965081244320458e-06, - "loss": 1.0488, - "step": 2178 - }, - { - "epoch": 0.06, - "learning_rate": 1.9965011898328454e-06, - "loss": 1.0312, - "step": 2179 - }, - { - "epoch": 0.06, - "learning_rate": 1.9964942483667472e-06, - "loss": 0.7231, - "step": 2180 - }, - { - "epoch": 0.06, - "learning_rate": 1.9964873000338e-06, - "loss": 0.8984, - "step": 2181 - }, - { - "epoch": 0.06, - "learning_rate": 1.9964803448340515e-06, - "loss": 0.8037, - "step": 2182 - }, - { - "epoch": 0.06, - "learning_rate": 1.9964733827675487e-06, - "loss": 1.1738, - "step": 2183 - }, - { - "epoch": 0.06, - "learning_rate": 1.996466413834341e-06, - "loss": 0.9873, - "step": 2184 - }, - { - "epoch": 0.06, - "learning_rate": 1.9964594380344754e-06, - "loss": 0.9072, - "step": 2185 - }, - { - "epoch": 0.06, - "learning_rate": 1.996452455368e-06, - "loss": 1.1377, - "step": 2186 - }, - { - "epoch": 0.06, - "learning_rate": 1.9964454658349637e-06, - "loss": 1.0645, - "step": 2187 - }, - { - "epoch": 0.06, - "learning_rate": 1.996438469435414e-06, - "loss": 0.7314, - "step": 2188 - }, - { - "epoch": 0.06, - "learning_rate": 1.9964314661693995e-06, - "loss": 0.9355, - "step": 2189 - }, - { - "epoch": 0.06, - "learning_rate": 1.9964244560369677e-06, - "loss": 0.9932, - "step": 2190 - }, - { - "epoch": 0.06, - "learning_rate": 1.9964174390381676e-06, - "loss": 1.0088, - "step": 2191 - }, - { - "epoch": 0.06, - "learning_rate": 1.996410415173048e-06, - "loss": 1.0576, - "step": 2192 - }, - { - "epoch": 0.06, - "learning_rate": 1.996403384441656e-06, - "loss": 0.9736, - "step": 2193 - }, - { - "epoch": 0.06, - "learning_rate": 1.996396346844041e-06, - "loss": 1.0098, - "step": 2194 - }, - { - "epoch": 0.06, - "learning_rate": 1.9963893023802513e-06, - "loss": 0.7744, - "step": 2195 - }, - { - "epoch": 0.06, - "learning_rate": 1.996382251050335e-06, - "loss": 0.8379, - "step": 2196 - }, - { - "epoch": 0.06, - "learning_rate": 1.996375192854342e-06, - "loss": 1.0088, - "step": 2197 - }, - { - "epoch": 0.06, - "learning_rate": 1.996368127792319e-06, - "loss": 0.7959, - "step": 2198 - }, - { - "epoch": 0.06, - "learning_rate": 1.9963610558643166e-06, - "loss": 0.8691, - "step": 2199 - }, - { - "epoch": 0.06, - "learning_rate": 1.996353977070382e-06, - "loss": 0.877, - "step": 2200 - }, - { - "epoch": 0.06, - "learning_rate": 1.9963468914105647e-06, - "loss": 0.7087, - "step": 2201 - }, - { - "epoch": 0.06, - "learning_rate": 1.9963397988849135e-06, - "loss": 0.999, - "step": 2202 - }, - { - "epoch": 0.06, - "learning_rate": 1.996332699493477e-06, - "loss": 0.9541, - "step": 2203 - }, - { - "epoch": 0.06, - "learning_rate": 1.996325593236305e-06, - "loss": 0.8262, - "step": 2204 - }, - { - "epoch": 0.06, - "learning_rate": 1.996318480113445e-06, - "loss": 1.1494, - "step": 2205 - }, - { - "epoch": 0.06, - "learning_rate": 1.9963113601249475e-06, - "loss": 1.0771, - "step": 2206 - }, - { - "epoch": 0.06, - "learning_rate": 1.9963042332708607e-06, - "loss": 0.9941, - "step": 2207 - }, - { - "epoch": 0.06, - "learning_rate": 1.996297099551234e-06, - "loss": 0.8926, - "step": 2208 - }, - { - "epoch": 0.06, - "learning_rate": 1.996289958966116e-06, - "loss": 0.9375, - "step": 2209 - }, - { - "epoch": 0.06, - "learning_rate": 1.9962828115155566e-06, - "loss": 0.8057, - "step": 2210 - }, - { - "epoch": 0.06, - "learning_rate": 1.996275657199605e-06, - "loss": 0.9219, - "step": 2211 - }, - { - "epoch": 0.06, - "learning_rate": 1.9962684960183102e-06, - "loss": 1.1777, - "step": 2212 - }, - { - "epoch": 0.06, - "learning_rate": 1.9962613279717215e-06, - "loss": 0.876, - "step": 2213 - }, - { - "epoch": 0.06, - "learning_rate": 1.996254153059889e-06, - "loss": 0.957, - "step": 2214 - }, - { - "epoch": 0.06, - "learning_rate": 1.996246971282861e-06, - "loss": 0.9863, - "step": 2215 - }, - { - "epoch": 0.06, - "learning_rate": 1.9962397826406882e-06, - "loss": 0.7559, - "step": 2216 - }, - { - "epoch": 0.06, - "learning_rate": 1.9962325871334193e-06, - "loss": 0.999, - "step": 2217 - }, - { - "epoch": 0.06, - "learning_rate": 1.996225384761104e-06, - "loss": 0.8477, - "step": 2218 - }, - { - "epoch": 0.06, - "learning_rate": 1.9962181755237916e-06, - "loss": 0.9551, - "step": 2219 - }, - { - "epoch": 0.06, - "learning_rate": 1.996210959421533e-06, - "loss": 0.79, - "step": 2220 - }, - { - "epoch": 0.06, - "learning_rate": 1.9962037364543765e-06, - "loss": 0.4814, - "step": 2221 - }, - { - "epoch": 0.06, - "learning_rate": 1.996196506622373e-06, - "loss": 1.0068, - "step": 2222 - }, - { - "epoch": 0.06, - "learning_rate": 1.9961892699255715e-06, - "loss": 0.9521, - "step": 2223 - }, - { - "epoch": 0.06, - "learning_rate": 1.9961820263640224e-06, - "loss": 1.0527, - "step": 2224 - }, - { - "epoch": 0.06, - "learning_rate": 1.9961747759377757e-06, - "loss": 0.9619, - "step": 2225 - }, - { - "epoch": 0.06, - "learning_rate": 1.9961675186468805e-06, - "loss": 1.0781, - "step": 2226 - }, - { - "epoch": 0.06, - "learning_rate": 1.996160254491388e-06, - "loss": 1.0156, - "step": 2227 - }, - { - "epoch": 0.06, - "learning_rate": 1.9961529834713474e-06, - "loss": 1.1602, - "step": 2228 - }, - { - "epoch": 0.06, - "learning_rate": 1.996145705586809e-06, - "loss": 0.9424, - "step": 2229 - }, - { - "epoch": 0.06, - "learning_rate": 1.996138420837823e-06, - "loss": 1.041, - "step": 2230 - }, - { - "epoch": 0.06, - "learning_rate": 1.99613112922444e-06, - "loss": 0.8896, - "step": 2231 - }, - { - "epoch": 0.06, - "learning_rate": 1.9961238307467096e-06, - "loss": 1.0098, - "step": 2232 - }, - { - "epoch": 0.06, - "learning_rate": 1.9961165254046822e-06, - "loss": 0.9756, - "step": 2233 - }, - { - "epoch": 0.06, - "learning_rate": 1.9961092131984083e-06, - "loss": 1.25, - "step": 2234 - }, - { - "epoch": 0.06, - "learning_rate": 1.9961018941279385e-06, - "loss": 0.8525, - "step": 2235 - }, - { - "epoch": 0.06, - "learning_rate": 1.9960945681933226e-06, - "loss": 0.6929, - "step": 2236 - }, - { - "epoch": 0.06, - "learning_rate": 1.996087235394612e-06, - "loss": 1.0459, - "step": 2237 - }, - { - "epoch": 0.06, - "learning_rate": 1.9960798957318566e-06, - "loss": 1.1016, - "step": 2238 - }, - { - "epoch": 0.06, - "learning_rate": 1.996072549205107e-06, - "loss": 0.9277, - "step": 2239 - }, - { - "epoch": 0.06, - "learning_rate": 1.996065195814414e-06, - "loss": 1.0322, - "step": 2240 - }, - { - "epoch": 0.06, - "learning_rate": 1.9960578355598285e-06, - "loss": 0.8436, - "step": 2241 - }, - { - "epoch": 0.06, - "learning_rate": 1.9960504684414004e-06, - "loss": 0.8682, - "step": 2242 - }, - { - "epoch": 0.06, - "learning_rate": 1.9960430944591815e-06, - "loss": 0.9482, - "step": 2243 - }, - { - "epoch": 0.06, - "learning_rate": 1.9960357136132217e-06, - "loss": 1.0342, - "step": 2244 - }, - { - "epoch": 0.06, - "learning_rate": 1.9960283259035726e-06, - "loss": 0.8721, - "step": 2245 - }, - { - "epoch": 0.06, - "learning_rate": 1.9960209313302847e-06, - "loss": 1.1348, - "step": 2246 - }, - { - "epoch": 0.06, - "learning_rate": 1.9960135298934087e-06, - "loss": 0.8447, - "step": 2247 - }, - { - "epoch": 0.06, - "learning_rate": 1.9960061215929964e-06, - "loss": 0.8643, - "step": 2248 - }, - { - "epoch": 0.06, - "learning_rate": 1.995998706429098e-06, - "loss": 0.9453, - "step": 2249 - }, - { - "epoch": 0.06, - "learning_rate": 1.9959912844017653e-06, - "loss": 1.2715, - "step": 2250 - }, - { - "epoch": 0.06, - "learning_rate": 1.995983855511049e-06, - "loss": 0.8945, - "step": 2251 - }, - { - "epoch": 0.06, - "learning_rate": 1.9959764197570007e-06, - "loss": 0.8193, - "step": 2252 - }, - { - "epoch": 0.06, - "learning_rate": 1.9959689771396707e-06, - "loss": 0.9775, - "step": 2253 - }, - { - "epoch": 0.06, - "learning_rate": 1.995961527659112e-06, - "loss": 0.9116, - "step": 2254 - }, - { - "epoch": 0.06, - "learning_rate": 1.995954071315374e-06, - "loss": 0.8623, - "step": 2255 - }, - { - "epoch": 0.06, - "learning_rate": 1.995946608108509e-06, - "loss": 0.9756, - "step": 2256 - }, - { - "epoch": 0.06, - "learning_rate": 1.995939138038569e-06, - "loss": 1.0811, - "step": 2257 - }, - { - "epoch": 0.06, - "learning_rate": 1.9959316611056045e-06, - "loss": 0.8818, - "step": 2258 - }, - { - "epoch": 0.06, - "learning_rate": 1.9959241773096674e-06, - "loss": 1.0742, - "step": 2259 - }, - { - "epoch": 0.06, - "learning_rate": 1.9959166866508093e-06, - "loss": 1.0498, - "step": 2260 - }, - { - "epoch": 0.06, - "learning_rate": 1.9959091891290815e-06, - "loss": 1.0469, - "step": 2261 - }, - { - "epoch": 0.06, - "learning_rate": 1.9959016847445364e-06, - "loss": 0.8135, - "step": 2262 - }, - { - "epoch": 0.06, - "learning_rate": 1.995894173497225e-06, - "loss": 0.8057, - "step": 2263 - }, - { - "epoch": 0.06, - "learning_rate": 1.9958866553871997e-06, - "loss": 1.0635, - "step": 2264 - }, - { - "epoch": 0.06, - "learning_rate": 1.9958791304145114e-06, - "loss": 1.0615, - "step": 2265 - }, - { - "epoch": 0.06, - "learning_rate": 1.995871598579213e-06, - "loss": 0.8926, - "step": 2266 - }, - { - "epoch": 0.06, - "learning_rate": 1.9958640598813556e-06, - "loss": 1.0391, - "step": 2267 - }, - { - "epoch": 0.06, - "learning_rate": 1.9958565143209914e-06, - "loss": 0.9883, - "step": 2268 - }, - { - "epoch": 0.06, - "learning_rate": 1.9958489618981726e-06, - "loss": 0.8838, - "step": 2269 - }, - { - "epoch": 0.06, - "learning_rate": 1.995841402612951e-06, - "loss": 0.9658, - "step": 2270 - }, - { - "epoch": 0.06, - "learning_rate": 1.9958338364653785e-06, - "loss": 1.1045, - "step": 2271 - }, - { - "epoch": 0.06, - "learning_rate": 1.9958262634555077e-06, - "loss": 0.8887, - "step": 2272 - }, - { - "epoch": 0.06, - "learning_rate": 1.995818683583391e-06, - "loss": 1.0703, - "step": 2273 - }, - { - "epoch": 0.06, - "learning_rate": 1.99581109684908e-06, - "loss": 0.8525, - "step": 2274 - }, - { - "epoch": 0.06, - "learning_rate": 1.995803503252627e-06, - "loss": 0.9668, - "step": 2275 - }, - { - "epoch": 0.06, - "learning_rate": 1.9957959027940847e-06, - "loss": 1.1445, - "step": 2276 - }, - { - "epoch": 0.06, - "learning_rate": 1.9957882954735054e-06, - "loss": 0.7466, - "step": 2277 - }, - { - "epoch": 0.06, - "learning_rate": 1.995780681290941e-06, - "loss": 1.0049, - "step": 2278 - }, - { - "epoch": 0.06, - "learning_rate": 1.9957730602464448e-06, - "loss": 0.9854, - "step": 2279 - }, - { - "epoch": 0.06, - "learning_rate": 1.995765432340069e-06, - "loss": 1.1113, - "step": 2280 - }, - { - "epoch": 0.06, - "learning_rate": 1.9957577975718655e-06, - "loss": 0.9307, - "step": 2281 - }, - { - "epoch": 0.06, - "learning_rate": 1.995750155941888e-06, - "loss": 0.8398, - "step": 2282 - }, - { - "epoch": 0.06, - "learning_rate": 1.9957425074501886e-06, - "loss": 0.9756, - "step": 2283 - }, - { - "epoch": 0.06, - "learning_rate": 1.99573485209682e-06, - "loss": 0.7549, - "step": 2284 - }, - { - "epoch": 0.06, - "learning_rate": 1.995727189881835e-06, - "loss": 0.8184, - "step": 2285 - }, - { - "epoch": 0.06, - "learning_rate": 1.995719520805287e-06, - "loss": 1.0244, - "step": 2286 - }, - { - "epoch": 0.06, - "learning_rate": 1.995711844867227e-06, - "loss": 1.0615, - "step": 2287 - }, - { - "epoch": 0.06, - "learning_rate": 1.9957041620677104e-06, - "loss": 0.7686, - "step": 2288 - }, - { - "epoch": 0.06, - "learning_rate": 1.995696472406788e-06, - "loss": 1.1123, - "step": 2289 - }, - { - "epoch": 0.06, - "learning_rate": 1.9956887758845144e-06, - "loss": 1.1699, - "step": 2290 - }, - { - "epoch": 0.06, - "learning_rate": 1.9956810725009414e-06, - "loss": 0.698, - "step": 2291 - }, - { - "epoch": 0.06, - "learning_rate": 1.995673362256123e-06, - "loss": 0.9854, - "step": 2292 - }, - { - "epoch": 0.06, - "learning_rate": 1.995665645150111e-06, - "loss": 1.0225, - "step": 2293 - }, - { - "epoch": 0.06, - "learning_rate": 1.9956579211829603e-06, - "loss": 0.9326, - "step": 2294 - }, - { - "epoch": 0.06, - "learning_rate": 1.9956501903547236e-06, - "loss": 0.9395, - "step": 2295 - }, - { - "epoch": 0.06, - "learning_rate": 1.9956424526654535e-06, - "loss": 1.002, - "step": 2296 - }, - { - "epoch": 0.06, - "learning_rate": 1.995634708115204e-06, - "loss": 0.9814, - "step": 2297 - }, - { - "epoch": 0.06, - "learning_rate": 1.995626956704028e-06, - "loss": 0.8896, - "step": 2298 - }, - { - "epoch": 0.06, - "learning_rate": 1.995619198431979e-06, - "loss": 0.9082, - "step": 2299 - }, - { - "epoch": 0.06, - "learning_rate": 1.995611433299111e-06, - "loss": 0.8267, - "step": 2300 - }, - { - "epoch": 0.06, - "learning_rate": 1.9956036613054766e-06, - "loss": 1.1543, - "step": 2301 - }, - { - "epoch": 0.06, - "learning_rate": 1.9955958824511303e-06, - "loss": 1.0537, - "step": 2302 - }, - { - "epoch": 0.06, - "learning_rate": 1.995588096736125e-06, - "loss": 1.0791, - "step": 2303 - }, - { - "epoch": 0.06, - "learning_rate": 1.9955803041605146e-06, - "loss": 0.9893, - "step": 2304 - }, - { - "epoch": 0.06, - "learning_rate": 1.9955725047243527e-06, - "loss": 0.9727, - "step": 2305 - }, - { - "epoch": 0.06, - "learning_rate": 1.9955646984276933e-06, - "loss": 1.0098, - "step": 2306 - }, - { - "epoch": 0.06, - "learning_rate": 1.9955568852705904e-06, - "loss": 0.8047, - "step": 2307 - }, - { - "epoch": 0.06, - "learning_rate": 1.9955490652530966e-06, - "loss": 0.8506, - "step": 2308 - }, - { - "epoch": 0.06, - "learning_rate": 1.995541238375267e-06, - "loss": 0.835, - "step": 2309 - }, - { - "epoch": 0.06, - "learning_rate": 1.995533404637156e-06, - "loss": 1.0127, - "step": 2310 - }, - { - "epoch": 0.06, - "learning_rate": 1.995525564038816e-06, - "loss": 1.0547, - "step": 2311 - }, - { - "epoch": 0.06, - "learning_rate": 1.995517716580302e-06, - "loss": 1.1191, - "step": 2312 - }, - { - "epoch": 0.06, - "learning_rate": 1.995509862261668e-06, - "loss": 1.001, - "step": 2313 - }, - { - "epoch": 0.06, - "learning_rate": 1.995502001082968e-06, - "loss": 0.9307, - "step": 2314 - }, - { - "epoch": 0.06, - "learning_rate": 1.9954941330442558e-06, - "loss": 1.0215, - "step": 2315 - }, - { - "epoch": 0.06, - "learning_rate": 1.9954862581455864e-06, - "loss": 0.9375, - "step": 2316 - }, - { - "epoch": 0.06, - "learning_rate": 1.9954783763870137e-06, - "loss": 0.9443, - "step": 2317 - }, - { - "epoch": 0.06, - "learning_rate": 1.9954704877685917e-06, - "loss": 0.6733, - "step": 2318 - }, - { - "epoch": 0.06, - "learning_rate": 1.995462592290375e-06, - "loss": 0.8398, - "step": 2319 - }, - { - "epoch": 0.06, - "learning_rate": 1.9954546899524187e-06, - "loss": 0.8809, - "step": 2320 - }, - { - "epoch": 0.06, - "learning_rate": 1.995446780754776e-06, - "loss": 0.8125, - "step": 2321 - }, - { - "epoch": 0.06, - "learning_rate": 1.9954388646975023e-06, - "loss": 0.9102, - "step": 2322 - }, - { - "epoch": 0.06, - "learning_rate": 1.9954309417806517e-06, - "loss": 1.0957, - "step": 2323 - }, - { - "epoch": 0.06, - "learning_rate": 1.995423012004279e-06, - "loss": 1.0527, - "step": 2324 - }, - { - "epoch": 0.06, - "learning_rate": 1.9954150753684387e-06, - "loss": 0.8975, - "step": 2325 - }, - { - "epoch": 0.06, - "learning_rate": 1.995407131873186e-06, - "loss": 0.9062, - "step": 2326 - }, - { - "epoch": 0.06, - "learning_rate": 1.995399181518575e-06, - "loss": 0.957, - "step": 2327 - }, - { - "epoch": 0.06, - "learning_rate": 1.9953912243046607e-06, - "loss": 1.1621, - "step": 2328 - }, - { - "epoch": 0.06, - "learning_rate": 1.9953832602314977e-06, - "loss": 0.9873, - "step": 2329 - }, - { - "epoch": 0.06, - "learning_rate": 1.9953752892991416e-06, - "loss": 0.8926, - "step": 2330 - }, - { - "epoch": 0.06, - "learning_rate": 1.9953673115076464e-06, - "loss": 1.1045, - "step": 2331 - }, - { - "epoch": 0.06, - "learning_rate": 1.995359326857068e-06, - "loss": 0.833, - "step": 2332 - }, - { - "epoch": 0.06, - "learning_rate": 1.9953513353474607e-06, - "loss": 1.248, - "step": 2333 - }, - { - "epoch": 0.06, - "learning_rate": 1.99534333697888e-06, - "loss": 0.9287, - "step": 2334 - }, - { - "epoch": 0.06, - "learning_rate": 1.9953353317513806e-06, - "loss": 0.9062, - "step": 2335 - }, - { - "epoch": 0.06, - "learning_rate": 1.995327319665018e-06, - "loss": 0.9199, - "step": 2336 - }, - { - "epoch": 0.06, - "learning_rate": 1.9953193007198475e-06, - "loss": 1.2217, - "step": 2337 - }, - { - "epoch": 0.06, - "learning_rate": 1.9953112749159236e-06, - "loss": 0.999, - "step": 2338 - }, - { - "epoch": 0.06, - "learning_rate": 1.995303242253303e-06, - "loss": 0.8936, - "step": 2339 - }, - { - "epoch": 0.06, - "learning_rate": 1.9952952027320397e-06, - "loss": 1.0186, - "step": 2340 - }, - { - "epoch": 0.06, - "learning_rate": 1.9952871563521897e-06, - "loss": 1.043, - "step": 2341 - }, - { - "epoch": 0.06, - "learning_rate": 1.9952791031138085e-06, - "loss": 0.8491, - "step": 2342 - }, - { - "epoch": 0.06, - "learning_rate": 1.9952710430169515e-06, - "loss": 1.1406, - "step": 2343 - }, - { - "epoch": 0.06, - "learning_rate": 1.9952629760616743e-06, - "loss": 1.1162, - "step": 2344 - }, - { - "epoch": 0.06, - "learning_rate": 1.9952549022480323e-06, - "loss": 0.917, - "step": 2345 - }, - { - "epoch": 0.06, - "learning_rate": 1.995246821576081e-06, - "loss": 1.0137, - "step": 2346 - }, - { - "epoch": 0.06, - "learning_rate": 1.995238734045877e-06, - "loss": 0.8096, - "step": 2347 - }, - { - "epoch": 0.06, - "learning_rate": 1.995230639657475e-06, - "loss": 0.7749, - "step": 2348 - }, - { - "epoch": 0.06, - "learning_rate": 1.995222538410931e-06, - "loss": 1.0176, - "step": 2349 - }, - { - "epoch": 0.06, - "learning_rate": 1.995214430306301e-06, - "loss": 0.8799, - "step": 2350 - }, - { - "epoch": 0.06, - "learning_rate": 1.995206315343641e-06, - "loss": 0.9961, - "step": 2351 - }, - { - "epoch": 0.06, - "learning_rate": 1.9951981935230065e-06, - "loss": 0.791, - "step": 2352 - }, - { - "epoch": 0.06, - "learning_rate": 1.9951900648444537e-06, - "loss": 1.0195, - "step": 2353 - }, - { - "epoch": 0.06, - "learning_rate": 1.995181929308039e-06, - "loss": 0.6948, - "step": 2354 - }, - { - "epoch": 0.06, - "learning_rate": 1.995173786913818e-06, - "loss": 1.0361, - "step": 2355 - }, - { - "epoch": 0.06, - "learning_rate": 1.9951656376618467e-06, - "loss": 0.8799, - "step": 2356 - }, - { - "epoch": 0.06, - "learning_rate": 1.995157481552182e-06, - "loss": 0.6646, - "step": 2357 - }, - { - "epoch": 0.06, - "learning_rate": 1.995149318584879e-06, - "loss": 0.9277, - "step": 2358 - }, - { - "epoch": 0.06, - "learning_rate": 1.9951411487599947e-06, - "loss": 0.96, - "step": 2359 - }, - { - "epoch": 0.06, - "learning_rate": 1.995132972077585e-06, - "loss": 0.9971, - "step": 2360 - }, - { - "epoch": 0.06, - "learning_rate": 1.995124788537707e-06, - "loss": 0.9961, - "step": 2361 - }, - { - "epoch": 0.06, - "learning_rate": 1.9951165981404165e-06, - "loss": 1.1084, - "step": 2362 - }, - { - "epoch": 0.06, - "learning_rate": 1.9951084008857696e-06, - "loss": 0.7422, - "step": 2363 - }, - { - "epoch": 0.06, - "learning_rate": 1.9951001967738235e-06, - "loss": 1.248, - "step": 2364 - }, - { - "epoch": 0.06, - "learning_rate": 1.995091985804634e-06, - "loss": 0.9854, - "step": 2365 - }, - { - "epoch": 0.06, - "learning_rate": 1.995083767978259e-06, - "loss": 1.085, - "step": 2366 - }, - { - "epoch": 0.06, - "learning_rate": 1.9950755432947536e-06, - "loss": 1.1084, - "step": 2367 - }, - { - "epoch": 0.06, - "learning_rate": 1.995067311754175e-06, - "loss": 0.9932, - "step": 2368 - }, - { - "epoch": 0.06, - "learning_rate": 1.9950590733565804e-06, - "loss": 1.1162, - "step": 2369 - }, - { - "epoch": 0.06, - "learning_rate": 1.995050828102026e-06, - "loss": 1.0127, - "step": 2370 - }, - { - "epoch": 0.06, - "learning_rate": 1.995042575990569e-06, - "loss": 0.7891, - "step": 2371 - }, - { - "epoch": 0.06, - "learning_rate": 1.9950343170222658e-06, - "loss": 0.9844, - "step": 2372 - }, - { - "epoch": 0.06, - "learning_rate": 1.9950260511971737e-06, - "loss": 1.1143, - "step": 2373 - }, - { - "epoch": 0.06, - "learning_rate": 1.9950177785153495e-06, - "loss": 1.0068, - "step": 2374 - }, - { - "epoch": 0.06, - "learning_rate": 1.995009498976851e-06, - "loss": 1.1152, - "step": 2375 - }, - { - "epoch": 0.06, - "learning_rate": 1.995001212581734e-06, - "loss": 0.9595, - "step": 2376 - }, - { - "epoch": 0.06, - "learning_rate": 1.9949929193300555e-06, - "loss": 0.9932, - "step": 2377 - }, - { - "epoch": 0.06, - "learning_rate": 1.994984619221874e-06, - "loss": 0.9434, - "step": 2378 - }, - { - "epoch": 0.06, - "learning_rate": 1.994976312257246e-06, - "loss": 1.0889, - "step": 2379 - }, - { - "epoch": 0.06, - "learning_rate": 1.994967998436228e-06, - "loss": 0.9785, - "step": 2380 - }, - { - "epoch": 0.06, - "learning_rate": 1.994959677758879e-06, - "loss": 1.1016, - "step": 2381 - }, - { - "epoch": 0.06, - "learning_rate": 1.9949513502252547e-06, - "loss": 0.9922, - "step": 2382 - }, - { - "epoch": 0.06, - "learning_rate": 1.9949430158354134e-06, - "loss": 0.8086, - "step": 2383 - }, - { - "epoch": 0.06, - "learning_rate": 1.994934674589412e-06, - "loss": 1.002, - "step": 2384 - }, - { - "epoch": 0.06, - "learning_rate": 1.994926326487309e-06, - "loss": 0.894, - "step": 2385 - }, - { - "epoch": 0.06, - "learning_rate": 1.9949179715291604e-06, - "loss": 0.8369, - "step": 2386 - }, - { - "epoch": 0.06, - "learning_rate": 1.9949096097150243e-06, - "loss": 1.0791, - "step": 2387 - }, - { - "epoch": 0.06, - "learning_rate": 1.994901241044959e-06, - "loss": 0.998, - "step": 2388 - }, - { - "epoch": 0.06, - "learning_rate": 1.994892865519022e-06, - "loss": 0.8984, - "step": 2389 - }, - { - "epoch": 0.06, - "learning_rate": 1.9948844831372705e-06, - "loss": 0.9697, - "step": 2390 - }, - { - "epoch": 0.06, - "learning_rate": 1.994876093899762e-06, - "loss": 0.9067, - "step": 2391 - }, - { - "epoch": 0.06, - "learning_rate": 1.9948676978065556e-06, - "loss": 1.0605, - "step": 2392 - }, - { - "epoch": 0.06, - "learning_rate": 1.994859294857708e-06, - "loss": 1.002, - "step": 2393 - }, - { - "epoch": 0.06, - "learning_rate": 1.9948508850532777e-06, - "loss": 1.1035, - "step": 2394 - }, - { - "epoch": 0.06, - "learning_rate": 1.994842468393322e-06, - "loss": 0.8354, - "step": 2395 - }, - { - "epoch": 0.06, - "learning_rate": 1.9948340448779e-06, - "loss": 0.9199, - "step": 2396 - }, - { - "epoch": 0.06, - "learning_rate": 1.9948256145070685e-06, - "loss": 0.9971, - "step": 2397 - }, - { - "epoch": 0.06, - "learning_rate": 1.9948171772808866e-06, - "loss": 1.1768, - "step": 2398 - }, - { - "epoch": 0.06, - "learning_rate": 1.9948087331994116e-06, - "loss": 1.1006, - "step": 2399 - }, - { - "epoch": 0.06, - "learning_rate": 1.9948002822627025e-06, - "loss": 1.0352, - "step": 2400 - }, - { - "epoch": 0.06, - "learning_rate": 1.994791824470817e-06, - "loss": 0.9961, - "step": 2401 - }, - { - "epoch": 0.06, - "learning_rate": 1.9947833598238135e-06, - "loss": 0.9492, - "step": 2402 - }, - { - "epoch": 0.06, - "learning_rate": 1.99477488832175e-06, - "loss": 0.6167, - "step": 2403 - }, - { - "epoch": 0.06, - "learning_rate": 1.9947664099646858e-06, - "loss": 0.9932, - "step": 2404 - }, - { - "epoch": 0.06, - "learning_rate": 1.9947579247526783e-06, - "loss": 0.9785, - "step": 2405 - }, - { - "epoch": 0.06, - "learning_rate": 1.9947494326857866e-06, - "loss": 1.0459, - "step": 2406 - }, - { - "epoch": 0.06, - "learning_rate": 1.9947409337640693e-06, - "loss": 0.9824, - "step": 2407 - }, - { - "epoch": 0.06, - "learning_rate": 1.9947324279875842e-06, - "loss": 0.957, - "step": 2408 - }, - { - "epoch": 0.06, - "learning_rate": 1.994723915356391e-06, - "loss": 0.9336, - "step": 2409 - }, - { - "epoch": 0.06, - "learning_rate": 1.9947153958705476e-06, - "loss": 1.2168, - "step": 2410 - }, - { - "epoch": 0.06, - "learning_rate": 1.9947068695301126e-06, - "loss": 1.0107, - "step": 2411 - }, - { - "epoch": 0.06, - "learning_rate": 1.994698336335145e-06, - "loss": 0.9209, - "step": 2412 - }, - { - "epoch": 0.06, - "learning_rate": 1.994689796285704e-06, - "loss": 1.1143, - "step": 2413 - }, - { - "epoch": 0.06, - "learning_rate": 1.994681249381848e-06, - "loss": 1.2363, - "step": 2414 - }, - { - "epoch": 0.06, - "learning_rate": 1.9946726956236364e-06, - "loss": 0.7778, - "step": 2415 - }, - { - "epoch": 0.06, - "learning_rate": 1.9946641350111272e-06, - "loss": 1.0508, - "step": 2416 - }, - { - "epoch": 0.06, - "learning_rate": 1.99465556754438e-06, - "loss": 0.9121, - "step": 2417 - }, - { - "epoch": 0.06, - "learning_rate": 1.994646993223454e-06, - "loss": 0.876, - "step": 2418 - }, - { - "epoch": 0.06, - "learning_rate": 1.994638412048408e-06, - "loss": 1.0195, - "step": 2419 - }, - { - "epoch": 0.06, - "learning_rate": 1.994629824019301e-06, - "loss": 1.0898, - "step": 2420 - }, - { - "epoch": 0.06, - "learning_rate": 1.994621229136192e-06, - "loss": 1.0039, - "step": 2421 - }, - { - "epoch": 0.06, - "learning_rate": 1.9946126273991415e-06, - "loss": 0.5532, - "step": 2422 - }, - { - "epoch": 0.06, - "learning_rate": 1.994604018808207e-06, - "loss": 1.0195, - "step": 2423 - }, - { - "epoch": 0.06, - "learning_rate": 1.9945954033634494e-06, - "loss": 0.9448, - "step": 2424 - }, - { - "epoch": 0.06, - "learning_rate": 1.994586781064927e-06, - "loss": 0.707, - "step": 2425 - }, - { - "epoch": 0.06, - "learning_rate": 1.9945781519127e-06, - "loss": 0.9785, - "step": 2426 - }, - { - "epoch": 0.06, - "learning_rate": 1.9945695159068267e-06, - "loss": 1.0322, - "step": 2427 - }, - { - "epoch": 0.06, - "learning_rate": 1.994560873047368e-06, - "loss": 0.9736, - "step": 2428 - }, - { - "epoch": 0.06, - "learning_rate": 1.9945522233343827e-06, - "loss": 1.0117, - "step": 2429 - }, - { - "epoch": 0.06, - "learning_rate": 1.9945435667679302e-06, - "loss": 0.9004, - "step": 2430 - }, - { - "epoch": 0.06, - "learning_rate": 1.9945349033480706e-06, - "loss": 1.043, - "step": 2431 - }, - { - "epoch": 0.06, - "learning_rate": 1.994526233074863e-06, - "loss": 0.9102, - "step": 2432 - }, - { - "epoch": 0.06, - "learning_rate": 1.9945175559483685e-06, - "loss": 0.9858, - "step": 2433 - }, - { - "epoch": 0.06, - "learning_rate": 1.994508871968646e-06, - "loss": 1.1143, - "step": 2434 - }, - { - "epoch": 0.06, - "learning_rate": 1.9945001811357547e-06, - "loss": 1.0098, - "step": 2435 - }, - { - "epoch": 0.06, - "learning_rate": 1.9944914834497557e-06, - "loss": 0.8867, - "step": 2436 - }, - { - "epoch": 0.06, - "learning_rate": 1.994482778910708e-06, - "loss": 1.0176, - "step": 2437 - }, - { - "epoch": 0.06, - "learning_rate": 1.994474067518672e-06, - "loss": 1.0547, - "step": 2438 - }, - { - "epoch": 0.06, - "learning_rate": 1.9944653492737074e-06, - "loss": 1.25, - "step": 2439 - }, - { - "epoch": 0.06, - "learning_rate": 1.9944566241758753e-06, - "loss": 0.915, - "step": 2440 - }, - { - "epoch": 0.06, - "learning_rate": 1.9944478922252345e-06, - "loss": 0.8887, - "step": 2441 - }, - { - "epoch": 0.06, - "learning_rate": 1.994439153421846e-06, - "loss": 1.0244, - "step": 2442 - }, - { - "epoch": 0.06, - "learning_rate": 1.99443040776577e-06, - "loss": 0.8955, - "step": 2443 - }, - { - "epoch": 0.06, - "learning_rate": 1.9944216552570663e-06, - "loss": 0.9277, - "step": 2444 - }, - { - "epoch": 0.06, - "learning_rate": 1.994412895895795e-06, - "loss": 0.874, - "step": 2445 - }, - { - "epoch": 0.06, - "learning_rate": 1.9944041296820178e-06, - "loss": 1.0215, - "step": 2446 - }, - { - "epoch": 0.06, - "learning_rate": 1.994395356615794e-06, - "loss": 1.0742, - "step": 2447 - }, - { - "epoch": 0.06, - "learning_rate": 1.994386576697184e-06, - "loss": 0.8887, - "step": 2448 - }, - { - "epoch": 0.06, - "learning_rate": 1.9943777899262484e-06, - "loss": 0.8193, - "step": 2449 - }, - { - "epoch": 0.06, - "learning_rate": 1.994368996303048e-06, - "loss": 0.9482, - "step": 2450 - }, - { - "epoch": 0.06, - "learning_rate": 1.9943601958276436e-06, - "loss": 0.7939, - "step": 2451 - }, - { - "epoch": 0.06, - "learning_rate": 1.9943513885000956e-06, - "loss": 0.9443, - "step": 2452 - }, - { - "epoch": 0.06, - "learning_rate": 1.994342574320465e-06, - "loss": 0.8525, - "step": 2453 - }, - { - "epoch": 0.06, - "learning_rate": 1.9943337532888116e-06, - "loss": 1.1572, - "step": 2454 - }, - { - "epoch": 0.06, - "learning_rate": 1.994324925405197e-06, - "loss": 1.085, - "step": 2455 - }, - { - "epoch": 0.06, - "learning_rate": 1.994316090669682e-06, - "loss": 0.8604, - "step": 2456 - }, - { - "epoch": 0.06, - "learning_rate": 1.994307249082327e-06, - "loss": 0.8896, - "step": 2457 - }, - { - "epoch": 0.06, - "learning_rate": 1.9942984006431934e-06, - "loss": 0.7378, - "step": 2458 - }, - { - "epoch": 0.06, - "learning_rate": 1.994289545352342e-06, - "loss": 1.0439, - "step": 2459 - }, - { - "epoch": 0.06, - "learning_rate": 1.994280683209834e-06, - "loss": 0.9248, - "step": 2460 - }, - { - "epoch": 0.06, - "learning_rate": 1.99427181421573e-06, - "loss": 0.8896, - "step": 2461 - }, - { - "epoch": 0.06, - "learning_rate": 1.9942629383700917e-06, - "loss": 1.2637, - "step": 2462 - }, - { - "epoch": 0.06, - "learning_rate": 1.9942540556729795e-06, - "loss": 1.0723, - "step": 2463 - }, - { - "epoch": 0.06, - "learning_rate": 1.994245166124456e-06, - "loss": 1.0732, - "step": 2464 - }, - { - "epoch": 0.06, - "learning_rate": 1.9942362697245804e-06, - "loss": 0.7988, - "step": 2465 - }, - { - "epoch": 0.06, - "learning_rate": 1.994227366473416e-06, - "loss": 0.9678, - "step": 2466 - }, - { - "epoch": 0.06, - "learning_rate": 1.994218456371023e-06, - "loss": 0.895, - "step": 2467 - }, - { - "epoch": 0.06, - "learning_rate": 1.994209539417463e-06, - "loss": 0.9727, - "step": 2468 - }, - { - "epoch": 0.06, - "learning_rate": 1.9942006156127975e-06, - "loss": 0.998, - "step": 2469 - }, - { - "epoch": 0.06, - "learning_rate": 1.9941916849570886e-06, - "loss": 1.1523, - "step": 2470 - }, - { - "epoch": 0.06, - "learning_rate": 1.9941827474503967e-06, - "loss": 0.9863, - "step": 2471 - }, - { - "epoch": 0.06, - "learning_rate": 1.9941738030927843e-06, - "loss": 1.0078, - "step": 2472 - }, - { - "epoch": 0.06, - "learning_rate": 1.9941648518843125e-06, - "loss": 1.1377, - "step": 2473 - }, - { - "epoch": 0.06, - "learning_rate": 1.9941558938250434e-06, - "loss": 1.0957, - "step": 2474 - }, - { - "epoch": 0.06, - "learning_rate": 1.9941469289150383e-06, - "loss": 1.0459, - "step": 2475 - }, - { - "epoch": 0.06, - "learning_rate": 1.9941379571543595e-06, - "loss": 0.9922, - "step": 2476 - }, - { - "epoch": 0.06, - "learning_rate": 1.9941289785430684e-06, - "loss": 1.0039, - "step": 2477 - }, - { - "epoch": 0.06, - "learning_rate": 1.9941199930812267e-06, - "loss": 0.9248, - "step": 2478 - }, - { - "epoch": 0.06, - "learning_rate": 1.994111000768897e-06, - "loss": 1.1348, - "step": 2479 - }, - { - "epoch": 0.06, - "learning_rate": 1.994102001606141e-06, - "loss": 0.9609, - "step": 2480 - }, - { - "epoch": 0.06, - "learning_rate": 1.9940929955930203e-06, - "loss": 0.8936, - "step": 2481 - }, - { - "epoch": 0.06, - "learning_rate": 1.9940839827295976e-06, - "loss": 0.8867, - "step": 2482 - }, - { - "epoch": 0.06, - "learning_rate": 1.994074963015934e-06, - "loss": 0.9521, - "step": 2483 - }, - { - "epoch": 0.06, - "learning_rate": 1.994065936452093e-06, - "loss": 1.0039, - "step": 2484 - }, - { - "epoch": 0.06, - "learning_rate": 1.9940569030381357e-06, - "loss": 0.8413, - "step": 2485 - }, - { - "epoch": 0.06, - "learning_rate": 1.9940478627741247e-06, - "loss": 0.8691, - "step": 2486 - }, - { - "epoch": 0.06, - "learning_rate": 1.9940388156601226e-06, - "loss": 0.9961, - "step": 2487 - }, - { - "epoch": 0.06, - "learning_rate": 1.9940297616961918e-06, - "loss": 0.9375, - "step": 2488 - }, - { - "epoch": 0.06, - "learning_rate": 1.994020700882394e-06, - "loss": 1.0498, - "step": 2489 - }, - { - "epoch": 0.06, - "learning_rate": 1.994011633218792e-06, - "loss": 1.123, - "step": 2490 - }, - { - "epoch": 0.06, - "learning_rate": 1.9940025587054485e-06, - "loss": 0.8787, - "step": 2491 - }, - { - "epoch": 0.06, - "learning_rate": 1.993993477342426e-06, - "loss": 0.6821, - "step": 2492 - }, - { - "epoch": 0.06, - "learning_rate": 1.9939843891297865e-06, - "loss": 0.8354, - "step": 2493 - }, - { - "epoch": 0.06, - "learning_rate": 1.9939752940675935e-06, - "loss": 0.918, - "step": 2494 - }, - { - "epoch": 0.06, - "learning_rate": 1.993966192155909e-06, - "loss": 0.9932, - "step": 2495 - }, - { - "epoch": 0.06, - "learning_rate": 1.993957083394796e-06, - "loss": 0.8574, - "step": 2496 - }, - { - "epoch": 0.06, - "learning_rate": 1.9939479677843175e-06, - "loss": 0.833, - "step": 2497 - }, - { - "epoch": 0.06, - "learning_rate": 1.9939388453245355e-06, - "loss": 0.9707, - "step": 2498 - }, - { - "epoch": 0.06, - "learning_rate": 1.993929716015514e-06, - "loss": 1.0742, - "step": 2499 - }, - { - "epoch": 0.06, - "learning_rate": 1.993920579857315e-06, - "loss": 0.854, - "step": 2500 - }, - { - "epoch": 0.06, - "learning_rate": 1.9939114368500014e-06, - "loss": 0.8633, - "step": 2501 - }, - { - "epoch": 0.06, - "learning_rate": 1.993902286993637e-06, - "loss": 1.1475, - "step": 2502 - }, - { - "epoch": 0.06, - "learning_rate": 1.9938931302882846e-06, - "loss": 0.9365, - "step": 2503 - }, - { - "epoch": 0.06, - "learning_rate": 1.993883966734007e-06, - "loss": 1.1084, - "step": 2504 - }, - { - "epoch": 0.06, - "learning_rate": 1.9938747963308677e-06, - "loss": 1.1514, - "step": 2505 - }, - { - "epoch": 0.06, - "learning_rate": 1.993865619078929e-06, - "loss": 0.8496, - "step": 2506 - }, - { - "epoch": 0.06, - "learning_rate": 1.9938564349782555e-06, - "loss": 0.9902, - "step": 2507 - }, - { - "epoch": 0.06, - "learning_rate": 1.9938472440289094e-06, - "loss": 1.0654, - "step": 2508 - }, - { - "epoch": 0.06, - "learning_rate": 1.9938380462309546e-06, - "loss": 0.9268, - "step": 2509 - }, - { - "epoch": 0.06, - "learning_rate": 1.993828841584454e-06, - "loss": 0.7979, - "step": 2510 - }, - { - "epoch": 0.06, - "learning_rate": 1.993819630089472e-06, - "loss": 0.9834, - "step": 2511 - }, - { - "epoch": 0.06, - "learning_rate": 1.993810411746071e-06, - "loss": 0.8584, - "step": 2512 - }, - { - "epoch": 0.06, - "learning_rate": 1.993801186554315e-06, - "loss": 0.917, - "step": 2513 - }, - { - "epoch": 0.06, - "learning_rate": 1.9937919545142673e-06, - "loss": 1.0713, - "step": 2514 - }, - { - "epoch": 0.06, - "learning_rate": 1.993782715625992e-06, - "loss": 0.9795, - "step": 2515 - }, - { - "epoch": 0.06, - "learning_rate": 1.9937734698895524e-06, - "loss": 1.0176, - "step": 2516 - }, - { - "epoch": 0.06, - "learning_rate": 1.9937642173050123e-06, - "loss": 1.0273, - "step": 2517 - }, - { - "epoch": 0.06, - "learning_rate": 1.9937549578724357e-06, - "loss": 0.8877, - "step": 2518 - }, - { - "epoch": 0.06, - "learning_rate": 1.9937456915918858e-06, - "loss": 0.9473, - "step": 2519 - }, - { - "epoch": 0.06, - "learning_rate": 1.9937364184634272e-06, - "loss": 0.79, - "step": 2520 - }, - { - "epoch": 0.06, - "learning_rate": 1.993727138487123e-06, - "loss": 1.0098, - "step": 2521 - }, - { - "epoch": 0.06, - "learning_rate": 1.993717851663038e-06, - "loss": 0.8105, - "step": 2522 - }, - { - "epoch": 0.06, - "learning_rate": 1.9937085579912357e-06, - "loss": 1.1084, - "step": 2523 - }, - { - "epoch": 0.06, - "learning_rate": 1.99369925747178e-06, - "loss": 1.0166, - "step": 2524 - }, - { - "epoch": 0.06, - "learning_rate": 1.9936899501047354e-06, - "loss": 0.9844, - "step": 2525 - }, - { - "epoch": 0.06, - "learning_rate": 1.993680635890166e-06, - "loss": 0.9639, - "step": 2526 - }, - { - "epoch": 0.06, - "learning_rate": 1.9936713148281356e-06, - "loss": 1.0537, - "step": 2527 - }, - { - "epoch": 0.06, - "learning_rate": 1.9936619869187085e-06, - "loss": 0.9824, - "step": 2528 - }, - { - "epoch": 0.06, - "learning_rate": 1.993652652161949e-06, - "loss": 0.9834, - "step": 2529 - }, - { - "epoch": 0.06, - "learning_rate": 1.993643310557922e-06, - "loss": 0.8809, - "step": 2530 - }, - { - "epoch": 0.06, - "learning_rate": 1.9936339621066914e-06, - "loss": 0.9199, - "step": 2531 - }, - { - "epoch": 0.06, - "learning_rate": 1.993624606808322e-06, - "loss": 0.9561, - "step": 2532 - }, - { - "epoch": 0.06, - "learning_rate": 1.993615244662877e-06, - "loss": 0.9805, - "step": 2533 - }, - { - "epoch": 0.06, - "learning_rate": 1.9936058756704224e-06, - "loss": 0.9199, - "step": 2534 - }, - { - "epoch": 0.06, - "learning_rate": 1.9935964998310223e-06, - "loss": 1.0049, - "step": 2535 - }, - { - "epoch": 0.06, - "learning_rate": 1.993587117144741e-06, - "loss": 0.6753, - "step": 2536 - }, - { - "epoch": 0.07, - "learning_rate": 1.9935777276116434e-06, - "loss": 1.0479, - "step": 2537 - }, - { - "epoch": 0.07, - "learning_rate": 1.9935683312317942e-06, - "loss": 1.125, - "step": 2538 - }, - { - "epoch": 0.07, - "learning_rate": 1.9935589280052583e-06, - "loss": 0.874, - "step": 2539 - }, - { - "epoch": 0.07, - "learning_rate": 1.9935495179321e-06, - "loss": 1.0654, - "step": 2540 - }, - { - "epoch": 0.07, - "learning_rate": 1.993540101012385e-06, - "loss": 0.874, - "step": 2541 - }, - { - "epoch": 0.07, - "learning_rate": 1.9935306772461773e-06, - "loss": 0.9121, - "step": 2542 - }, - { - "epoch": 0.07, - "learning_rate": 1.993521246633542e-06, - "loss": 0.8154, - "step": 2543 - }, - { - "epoch": 0.07, - "learning_rate": 1.9935118091745443e-06, - "loss": 0.9971, - "step": 2544 - }, - { - "epoch": 0.07, - "learning_rate": 1.9935023648692495e-06, - "loss": 0.7935, - "step": 2545 - }, - { - "epoch": 0.07, - "learning_rate": 1.9934929137177224e-06, - "loss": 1.001, - "step": 2546 - }, - { - "epoch": 0.07, - "learning_rate": 1.9934834557200283e-06, - "loss": 0.9414, - "step": 2547 - }, - { - "epoch": 0.07, - "learning_rate": 1.993473990876232e-06, - "loss": 0.959, - "step": 2548 - }, - { - "epoch": 0.07, - "learning_rate": 1.9934645191863987e-06, - "loss": 0.8457, - "step": 2549 - }, - { - "epoch": 0.07, - "learning_rate": 1.9934550406505937e-06, - "loss": 0.9072, - "step": 2550 - }, - { - "epoch": 0.07, - "learning_rate": 1.993445555268883e-06, - "loss": 1.0381, - "step": 2551 - }, - { - "epoch": 0.07, - "learning_rate": 1.9934360630413313e-06, - "loss": 0.9355, - "step": 2552 - }, - { - "epoch": 0.07, - "learning_rate": 1.9934265639680042e-06, - "loss": 1.0068, - "step": 2553 - }, - { - "epoch": 0.07, - "learning_rate": 1.9934170580489675e-06, - "loss": 1.0029, - "step": 2554 - }, - { - "epoch": 0.07, - "learning_rate": 1.993407545284286e-06, - "loss": 0.9121, - "step": 2555 - }, - { - "epoch": 0.07, - "learning_rate": 1.9933980256740254e-06, - "loss": 0.8259, - "step": 2556 - }, - { - "epoch": 0.07, - "learning_rate": 1.9933884992182517e-06, - "loss": 0.917, - "step": 2557 - }, - { - "epoch": 0.07, - "learning_rate": 1.9933789659170306e-06, - "loss": 1.0059, - "step": 2558 - }, - { - "epoch": 0.07, - "learning_rate": 1.993369425770427e-06, - "loss": 1.2354, - "step": 2559 - }, - { - "epoch": 0.07, - "learning_rate": 1.9933598787785073e-06, - "loss": 0.9912, - "step": 2560 - }, - { - "epoch": 0.07, - "learning_rate": 1.993350324941338e-06, - "loss": 0.8223, - "step": 2561 - }, - { - "epoch": 0.07, - "learning_rate": 1.993340764258983e-06, - "loss": 0.9639, - "step": 2562 - }, - { - "epoch": 0.07, - "learning_rate": 1.9933311967315096e-06, - "loss": 0.9717, - "step": 2563 - }, - { - "epoch": 0.07, - "learning_rate": 1.993321622358984e-06, - "loss": 0.9365, - "step": 2564 - }, - { - "epoch": 0.07, - "learning_rate": 1.993312041141471e-06, - "loss": 0.77, - "step": 2565 - }, - { - "epoch": 0.07, - "learning_rate": 1.9933024530790374e-06, - "loss": 1.1982, - "step": 2566 - }, - { - "epoch": 0.07, - "learning_rate": 1.993292858171749e-06, - "loss": 0.9932, - "step": 2567 - }, - { - "epoch": 0.07, - "learning_rate": 1.993283256419672e-06, - "loss": 0.998, - "step": 2568 - }, - { - "epoch": 0.07, - "learning_rate": 1.993273647822873e-06, - "loss": 1.0049, - "step": 2569 - }, - { - "epoch": 0.07, - "learning_rate": 1.9932640323814173e-06, - "loss": 1.1357, - "step": 2570 - }, - { - "epoch": 0.07, - "learning_rate": 1.9932544100953717e-06, - "loss": 1.0, - "step": 2571 - }, - { - "epoch": 0.07, - "learning_rate": 1.9932447809648028e-06, - "loss": 1.1094, - "step": 2572 - }, - { - "epoch": 0.07, - "learning_rate": 1.9932351449897765e-06, - "loss": 1.1562, - "step": 2573 - }, - { - "epoch": 0.07, - "learning_rate": 1.993225502170359e-06, - "loss": 0.6772, - "step": 2574 - }, - { - "epoch": 0.07, - "learning_rate": 1.9932158525066173e-06, - "loss": 1.085, - "step": 2575 - }, - { - "epoch": 0.07, - "learning_rate": 1.9932061959986175e-06, - "loss": 1.2236, - "step": 2576 - }, - { - "epoch": 0.07, - "learning_rate": 1.9931965326464263e-06, - "loss": 0.8228, - "step": 2577 - }, - { - "epoch": 0.07, - "learning_rate": 1.9931868624501106e-06, - "loss": 1.0332, - "step": 2578 - }, - { - "epoch": 0.07, - "learning_rate": 1.9931771854097365e-06, - "loss": 1.0264, - "step": 2579 - }, - { - "epoch": 0.07, - "learning_rate": 1.993167501525371e-06, - "loss": 0.9141, - "step": 2580 - }, - { - "epoch": 0.07, - "learning_rate": 1.9931578107970808e-06, - "loss": 1.0713, - "step": 2581 - }, - { - "epoch": 0.07, - "learning_rate": 1.9931481132249325e-06, - "loss": 0.999, - "step": 2582 - }, - { - "epoch": 0.07, - "learning_rate": 1.9931384088089927e-06, - "loss": 0.9131, - "step": 2583 - }, - { - "epoch": 0.07, - "learning_rate": 1.9931286975493295e-06, - "loss": 1.0488, - "step": 2584 - }, - { - "epoch": 0.07, - "learning_rate": 1.993118979446008e-06, - "loss": 1.0127, - "step": 2585 - }, - { - "epoch": 0.07, - "learning_rate": 1.9931092544990967e-06, - "loss": 0.9746, - "step": 2586 - }, - { - "epoch": 0.07, - "learning_rate": 1.993099522708662e-06, - "loss": 0.9346, - "step": 2587 - }, - { - "epoch": 0.07, - "learning_rate": 1.993089784074771e-06, - "loss": 1.0518, - "step": 2588 - }, - { - "epoch": 0.07, - "learning_rate": 1.9930800385974905e-06, - "loss": 0.9082, - "step": 2589 - }, - { - "epoch": 0.07, - "learning_rate": 1.993070286276888e-06, - "loss": 0.874, - "step": 2590 - }, - { - "epoch": 0.07, - "learning_rate": 1.9930605271130307e-06, - "loss": 0.791, - "step": 2591 - }, - { - "epoch": 0.07, - "learning_rate": 1.993050761105986e-06, - "loss": 0.8486, - "step": 2592 - }, - { - "epoch": 0.07, - "learning_rate": 1.9930409882558207e-06, - "loss": 1.2598, - "step": 2593 - }, - { - "epoch": 0.07, - "learning_rate": 1.9930312085626026e-06, - "loss": 0.9111, - "step": 2594 - }, - { - "epoch": 0.07, - "learning_rate": 1.993021422026399e-06, - "loss": 0.6909, - "step": 2595 - }, - { - "epoch": 0.07, - "learning_rate": 1.9930116286472772e-06, - "loss": 0.9863, - "step": 2596 - }, - { - "epoch": 0.07, - "learning_rate": 1.9930018284253046e-06, - "loss": 0.9404, - "step": 2597 - }, - { - "epoch": 0.07, - "learning_rate": 1.9929920213605493e-06, - "loss": 0.9746, - "step": 2598 - }, - { - "epoch": 0.07, - "learning_rate": 1.992982207453078e-06, - "loss": 1.0322, - "step": 2599 - }, - { - "epoch": 0.07, - "learning_rate": 1.9929723867029592e-06, - "loss": 1.0596, - "step": 2600 - }, - { - "epoch": 0.07, - "learning_rate": 1.99296255911026e-06, - "loss": 1.0146, - "step": 2601 - }, - { - "epoch": 0.07, - "learning_rate": 1.9929527246750487e-06, - "loss": 0.9619, - "step": 2602 - }, - { - "epoch": 0.07, - "learning_rate": 1.992942883397392e-06, - "loss": 1.0068, - "step": 2603 - }, - { - "epoch": 0.07, - "learning_rate": 1.992933035277359e-06, - "loss": 1.0747, - "step": 2604 - }, - { - "epoch": 0.07, - "learning_rate": 1.992923180315017e-06, - "loss": 1.0303, - "step": 2605 - }, - { - "epoch": 0.07, - "learning_rate": 1.9929133185104333e-06, - "loss": 0.8574, - "step": 2606 - }, - { - "epoch": 0.07, - "learning_rate": 1.9929034498636764e-06, - "loss": 1.0771, - "step": 2607 - }, - { - "epoch": 0.07, - "learning_rate": 1.992893574374815e-06, - "loss": 1.0488, - "step": 2608 - }, - { - "epoch": 0.07, - "learning_rate": 1.992883692043916e-06, - "loss": 0.8262, - "step": 2609 - }, - { - "epoch": 0.07, - "learning_rate": 1.992873802871048e-06, - "loss": 0.8408, - "step": 2610 - }, - { - "epoch": 0.07, - "learning_rate": 1.9928639068562793e-06, - "loss": 0.9258, - "step": 2611 - }, - { - "epoch": 0.07, - "learning_rate": 1.9928540039996777e-06, - "loss": 0.6797, - "step": 2612 - }, - { - "epoch": 0.07, - "learning_rate": 1.992844094301312e-06, - "loss": 0.7793, - "step": 2613 - }, - { - "epoch": 0.07, - "learning_rate": 1.9928341777612497e-06, - "loss": 1.0381, - "step": 2614 - }, - { - "epoch": 0.07, - "learning_rate": 1.9928242543795596e-06, - "loss": 1.0342, - "step": 2615 - }, - { - "epoch": 0.07, - "learning_rate": 1.9928143241563103e-06, - "loss": 1.0, - "step": 2616 - }, - { - "epoch": 0.07, - "learning_rate": 1.99280438709157e-06, - "loss": 0.9092, - "step": 2617 - }, - { - "epoch": 0.07, - "learning_rate": 1.992794443185407e-06, - "loss": 0.9019, - "step": 2618 - }, - { - "epoch": 0.07, - "learning_rate": 1.99278449243789e-06, - "loss": 0.8799, - "step": 2619 - }, - { - "epoch": 0.07, - "learning_rate": 1.992774534849088e-06, - "loss": 0.998, - "step": 2620 - }, - { - "epoch": 0.07, - "learning_rate": 1.992764570419069e-06, - "loss": 1.001, - "step": 2621 - }, - { - "epoch": 0.07, - "learning_rate": 1.9927545991479016e-06, - "loss": 0.9893, - "step": 2622 - }, - { - "epoch": 0.07, - "learning_rate": 1.9927446210356546e-06, - "loss": 1.0596, - "step": 2623 - }, - { - "epoch": 0.07, - "learning_rate": 1.9927346360823975e-06, - "loss": 0.9316, - "step": 2624 - }, - { - "epoch": 0.07, - "learning_rate": 1.992724644288198e-06, - "loss": 1.0391, - "step": 2625 - }, - { - "epoch": 0.07, - "learning_rate": 1.9927146456531256e-06, - "loss": 0.752, - "step": 2626 - }, - { - "epoch": 0.07, - "learning_rate": 1.992704640177249e-06, - "loss": 0.9053, - "step": 2627 - }, - { - "epoch": 0.07, - "learning_rate": 1.9926946278606372e-06, - "loss": 0.8521, - "step": 2628 - }, - { - "epoch": 0.07, - "learning_rate": 1.9926846087033597e-06, - "loss": 0.5986, - "step": 2629 - }, - { - "epoch": 0.07, - "learning_rate": 1.9926745827054848e-06, - "loss": 0.8047, - "step": 2630 - }, - { - "epoch": 0.07, - "learning_rate": 1.992664549867082e-06, - "loss": 0.5306, - "step": 2631 - }, - { - "epoch": 0.07, - "learning_rate": 1.99265451018822e-06, - "loss": 0.918, - "step": 2632 - }, - { - "epoch": 0.07, - "learning_rate": 1.9926444636689682e-06, - "loss": 0.9893, - "step": 2633 - }, - { - "epoch": 0.07, - "learning_rate": 1.992634410309396e-06, - "loss": 1.1016, - "step": 2634 - }, - { - "epoch": 0.07, - "learning_rate": 1.992624350109573e-06, - "loss": 0.8965, - "step": 2635 - }, - { - "epoch": 0.07, - "learning_rate": 1.9926142830695677e-06, - "loss": 1.0635, - "step": 2636 - }, - { - "epoch": 0.07, - "learning_rate": 1.9926042091894496e-06, - "loss": 0.9795, - "step": 2637 - }, - { - "epoch": 0.07, - "learning_rate": 1.992594128469289e-06, - "loss": 0.9688, - "step": 2638 - }, - { - "epoch": 0.07, - "learning_rate": 1.9925840409091542e-06, - "loss": 0.9688, - "step": 2639 - }, - { - "epoch": 0.07, - "learning_rate": 1.9925739465091154e-06, - "loss": 0.5957, - "step": 2640 - }, - { - "epoch": 0.07, - "learning_rate": 1.9925638452692428e-06, - "loss": 1.0, - "step": 2641 - }, - { - "epoch": 0.07, - "learning_rate": 1.9925537371896045e-06, - "loss": 1.0049, - "step": 2642 - }, - { - "epoch": 0.07, - "learning_rate": 1.992543622270271e-06, - "loss": 0.9336, - "step": 2643 - }, - { - "epoch": 0.07, - "learning_rate": 1.992533500511312e-06, - "loss": 1.0234, - "step": 2644 - }, - { - "epoch": 0.07, - "learning_rate": 1.9925233719127967e-06, - "loss": 1.1602, - "step": 2645 - }, - { - "epoch": 0.07, - "learning_rate": 1.992513236474796e-06, - "loss": 1.0117, - "step": 2646 - }, - { - "epoch": 0.07, - "learning_rate": 1.992503094197379e-06, - "loss": 0.8652, - "step": 2647 - }, - { - "epoch": 0.07, - "learning_rate": 1.992492945080615e-06, - "loss": 0.8965, - "step": 2648 - }, - { - "epoch": 0.07, - "learning_rate": 1.992482789124576e-06, - "loss": 1.082, - "step": 2649 - }, - { - "epoch": 0.07, - "learning_rate": 1.9924726263293294e-06, - "loss": 0.8281, - "step": 2650 - }, - { - "epoch": 0.07, - "learning_rate": 1.9924624566949467e-06, - "loss": 1.0605, - "step": 2651 - }, - { - "epoch": 0.07, - "learning_rate": 1.992452280221498e-06, - "loss": 1.0293, - "step": 2652 - }, - { - "epoch": 0.07, - "learning_rate": 1.9924420969090527e-06, - "loss": 0.8633, - "step": 2653 - }, - { - "epoch": 0.07, - "learning_rate": 1.9924319067576817e-06, - "loss": 0.7598, - "step": 2654 - }, - { - "epoch": 0.07, - "learning_rate": 1.9924217097674547e-06, - "loss": 0.7446, - "step": 2655 - }, - { - "epoch": 0.07, - "learning_rate": 1.9924115059384425e-06, - "loss": 1.1201, - "step": 2656 - }, - { - "epoch": 0.07, - "learning_rate": 1.992401295270715e-06, - "loss": 0.8218, - "step": 2657 - }, - { - "epoch": 0.07, - "learning_rate": 1.9923910777643425e-06, - "loss": 0.7305, - "step": 2658 - }, - { - "epoch": 0.07, - "learning_rate": 1.9923808534193957e-06, - "loss": 0.8691, - "step": 2659 - }, - { - "epoch": 0.07, - "learning_rate": 1.992370622235945e-06, - "loss": 0.7676, - "step": 2660 - }, - { - "epoch": 0.07, - "learning_rate": 1.992360384214061e-06, - "loss": 1.0156, - "step": 2661 - }, - { - "epoch": 0.07, - "learning_rate": 1.992350139353814e-06, - "loss": 0.8999, - "step": 2662 - }, - { - "epoch": 0.07, - "learning_rate": 1.9923398876552748e-06, - "loss": 0.8232, - "step": 2663 - }, - { - "epoch": 0.07, - "learning_rate": 1.9923296291185132e-06, - "loss": 0.9248, - "step": 2664 - }, - { - "epoch": 0.07, - "learning_rate": 1.9923193637436013e-06, - "loss": 0.6572, - "step": 2665 - }, - { - "epoch": 0.07, - "learning_rate": 1.9923090915306094e-06, - "loss": 1.1377, - "step": 2666 - }, - { - "epoch": 0.07, - "learning_rate": 1.9922988124796077e-06, - "loss": 1.0811, - "step": 2667 - }, - { - "epoch": 0.07, - "learning_rate": 1.992288526590667e-06, - "loss": 0.8804, - "step": 2668 - }, - { - "epoch": 0.07, - "learning_rate": 1.9922782338638594e-06, - "loss": 0.9697, - "step": 2669 - }, - { - "epoch": 0.07, - "learning_rate": 1.9922679342992545e-06, - "loss": 1.001, - "step": 2670 - }, - { - "epoch": 0.07, - "learning_rate": 1.9922576278969237e-06, - "loss": 0.9785, - "step": 2671 - }, - { - "epoch": 0.07, - "learning_rate": 1.9922473146569385e-06, - "loss": 0.9932, - "step": 2672 - }, - { - "epoch": 0.07, - "learning_rate": 1.992236994579369e-06, - "loss": 1.1768, - "step": 2673 - }, - { - "epoch": 0.07, - "learning_rate": 1.9922266676642873e-06, - "loss": 0.7588, - "step": 2674 - }, - { - "epoch": 0.07, - "learning_rate": 1.992216333911764e-06, - "loss": 1.083, - "step": 2675 - }, - { - "epoch": 0.07, - "learning_rate": 1.9922059933218706e-06, - "loss": 0.6689, - "step": 2676 - }, - { - "epoch": 0.07, - "learning_rate": 1.992195645894678e-06, - "loss": 0.8896, - "step": 2677 - }, - { - "epoch": 0.07, - "learning_rate": 1.9921852916302576e-06, - "loss": 1.1504, - "step": 2678 - }, - { - "epoch": 0.07, - "learning_rate": 1.992174930528681e-06, - "loss": 0.9834, - "step": 2679 - }, - { - "epoch": 0.07, - "learning_rate": 1.9921645625900196e-06, - "loss": 0.8516, - "step": 2680 - }, - { - "epoch": 0.07, - "learning_rate": 1.9921541878143448e-06, - "loss": 0.6638, - "step": 2681 - }, - { - "epoch": 0.07, - "learning_rate": 1.992143806201728e-06, - "loss": 0.8564, - "step": 2682 - }, - { - "epoch": 0.07, - "learning_rate": 1.99213341775224e-06, - "loss": 0.8521, - "step": 2683 - }, - { - "epoch": 0.07, - "learning_rate": 1.992123022465954e-06, - "loss": 1.1074, - "step": 2684 - }, - { - "epoch": 0.07, - "learning_rate": 1.9921126203429403e-06, - "loss": 1.1094, - "step": 2685 - }, - { - "epoch": 0.07, - "learning_rate": 1.9921022113832714e-06, - "loss": 0.8513, - "step": 2686 - }, - { - "epoch": 0.07, - "learning_rate": 1.9920917955870183e-06, - "loss": 1.1465, - "step": 2687 - }, - { - "epoch": 0.07, - "learning_rate": 1.992081372954253e-06, - "loss": 0.8242, - "step": 2688 - }, - { - "epoch": 0.07, - "learning_rate": 1.9920709434850476e-06, - "loss": 1.1416, - "step": 2689 - }, - { - "epoch": 0.07, - "learning_rate": 1.9920605071794744e-06, - "loss": 1.2217, - "step": 2690 - }, - { - "epoch": 0.07, - "learning_rate": 1.992050064037604e-06, - "loss": 0.9141, - "step": 2691 - }, - { - "epoch": 0.07, - "learning_rate": 1.9920396140595096e-06, - "loss": 0.9512, - "step": 2692 - }, - { - "epoch": 0.07, - "learning_rate": 1.9920291572452626e-06, - "loss": 0.9072, - "step": 2693 - }, - { - "epoch": 0.07, - "learning_rate": 1.992018693594935e-06, - "loss": 1.0381, - "step": 2694 - }, - { - "epoch": 0.07, - "learning_rate": 1.9920082231085994e-06, - "loss": 0.8955, - "step": 2695 - }, - { - "epoch": 0.07, - "learning_rate": 1.9919977457863273e-06, - "loss": 0.8379, - "step": 2696 - }, - { - "epoch": 0.07, - "learning_rate": 1.9919872616281914e-06, - "loss": 0.7734, - "step": 2697 - }, - { - "epoch": 0.07, - "learning_rate": 1.9919767706342637e-06, - "loss": 0.7817, - "step": 2698 - }, - { - "epoch": 0.07, - "learning_rate": 1.9919662728046167e-06, - "loss": 0.8916, - "step": 2699 - }, - { - "epoch": 0.07, - "learning_rate": 1.9919557681393227e-06, - "loss": 1.1318, - "step": 2700 - }, - { - "epoch": 0.07, - "learning_rate": 1.991945256638454e-06, - "loss": 0.9844, - "step": 2701 - }, - { - "epoch": 0.07, - "learning_rate": 1.9919347383020824e-06, - "loss": 0.7778, - "step": 2702 - }, - { - "epoch": 0.07, - "learning_rate": 1.9919242131302817e-06, - "loss": 1.0879, - "step": 2703 - }, - { - "epoch": 0.07, - "learning_rate": 1.9919136811231238e-06, - "loss": 0.78, - "step": 2704 - }, - { - "epoch": 0.07, - "learning_rate": 1.991903142280681e-06, - "loss": 1.041, - "step": 2705 - }, - { - "epoch": 0.07, - "learning_rate": 1.9918925966030262e-06, - "loss": 0.8848, - "step": 2706 - }, - { - "epoch": 0.07, - "learning_rate": 1.9918820440902323e-06, - "loss": 0.9443, - "step": 2707 - }, - { - "epoch": 0.07, - "learning_rate": 1.9918714847423713e-06, - "loss": 0.9316, - "step": 2708 - }, - { - "epoch": 0.07, - "learning_rate": 1.9918609185595163e-06, - "loss": 1.0205, - "step": 2709 - }, - { - "epoch": 0.07, - "learning_rate": 1.991850345541741e-06, - "loss": 0.9854, - "step": 2710 - }, - { - "epoch": 0.07, - "learning_rate": 1.9918397656891166e-06, - "loss": 0.9766, - "step": 2711 - }, - { - "epoch": 0.07, - "learning_rate": 1.9918291790017176e-06, - "loss": 0.8838, - "step": 2712 - }, - { - "epoch": 0.07, - "learning_rate": 1.9918185854796156e-06, - "loss": 1.0967, - "step": 2713 - }, - { - "epoch": 0.07, - "learning_rate": 1.9918079851228848e-06, - "loss": 1.0889, - "step": 2714 - }, - { - "epoch": 0.07, - "learning_rate": 1.991797377931597e-06, - "loss": 1.0898, - "step": 2715 - }, - { - "epoch": 0.07, - "learning_rate": 1.9917867639058264e-06, - "loss": 0.9473, - "step": 2716 - }, - { - "epoch": 0.07, - "learning_rate": 1.991776143045646e-06, - "loss": 0.9785, - "step": 2717 - }, - { - "epoch": 0.07, - "learning_rate": 1.9917655153511283e-06, - "loss": 0.7195, - "step": 2718 - }, - { - "epoch": 0.07, - "learning_rate": 1.991754880822347e-06, - "loss": 0.9473, - "step": 2719 - }, - { - "epoch": 0.07, - "learning_rate": 1.9917442394593756e-06, - "loss": 1.1348, - "step": 2720 - }, - { - "epoch": 0.07, - "learning_rate": 1.9917335912622866e-06, - "loss": 1.1631, - "step": 2721 - }, - { - "epoch": 0.07, - "learning_rate": 1.9917229362311546e-06, - "loss": 0.8623, - "step": 2722 - }, - { - "epoch": 0.07, - "learning_rate": 1.991712274366052e-06, - "loss": 0.7261, - "step": 2723 - }, - { - "epoch": 0.07, - "learning_rate": 1.9917016056670526e-06, - "loss": 0.959, - "step": 2724 - }, - { - "epoch": 0.07, - "learning_rate": 1.9916909301342296e-06, - "loss": 0.8516, - "step": 2725 - }, - { - "epoch": 0.07, - "learning_rate": 1.9916802477676574e-06, - "loss": 0.9932, - "step": 2726 - }, - { - "epoch": 0.07, - "learning_rate": 1.991669558567409e-06, - "loss": 1.0205, - "step": 2727 - }, - { - "epoch": 0.07, - "learning_rate": 1.9916588625335583e-06, - "loss": 1.0449, - "step": 2728 - }, - { - "epoch": 0.07, - "learning_rate": 1.991648159666179e-06, - "loss": 1.0859, - "step": 2729 - }, - { - "epoch": 0.07, - "learning_rate": 1.9916374499653443e-06, - "loss": 0.8633, - "step": 2730 - }, - { - "epoch": 0.07, - "learning_rate": 1.9916267334311288e-06, - "loss": 1.0225, - "step": 2731 - }, - { - "epoch": 0.07, - "learning_rate": 1.991616010063606e-06, - "loss": 0.9414, - "step": 2732 - }, - { - "epoch": 0.07, - "learning_rate": 1.9916052798628495e-06, - "loss": 0.9434, - "step": 2733 - }, - { - "epoch": 0.07, - "learning_rate": 1.9915945428289336e-06, - "loss": 0.8975, - "step": 2734 - }, - { - "epoch": 0.07, - "learning_rate": 1.991583798961932e-06, - "loss": 1.0264, - "step": 2735 - }, - { - "epoch": 0.07, - "learning_rate": 1.9915730482619197e-06, - "loss": 0.8662, - "step": 2736 - }, - { - "epoch": 0.07, - "learning_rate": 1.991562290728969e-06, - "loss": 0.9883, - "step": 2737 - }, - { - "epoch": 0.07, - "learning_rate": 1.991551526363156e-06, - "loss": 0.9414, - "step": 2738 - }, - { - "epoch": 0.07, - "learning_rate": 1.9915407551645536e-06, - "loss": 1.0029, - "step": 2739 - }, - { - "epoch": 0.07, - "learning_rate": 1.9915299771332363e-06, - "loss": 0.9795, - "step": 2740 - }, - { - "epoch": 0.07, - "learning_rate": 1.9915191922692786e-06, - "loss": 0.8477, - "step": 2741 - }, - { - "epoch": 0.07, - "learning_rate": 1.9915084005727547e-06, - "loss": 0.96, - "step": 2742 - }, - { - "epoch": 0.07, - "learning_rate": 1.9914976020437386e-06, - "loss": 0.7598, - "step": 2743 - }, - { - "epoch": 0.07, - "learning_rate": 1.991486796682305e-06, - "loss": 0.9414, - "step": 2744 - }, - { - "epoch": 0.07, - "learning_rate": 1.991475984488529e-06, - "loss": 0.915, - "step": 2745 - }, - { - "epoch": 0.07, - "learning_rate": 1.991465165462484e-06, - "loss": 0.8906, - "step": 2746 - }, - { - "epoch": 0.07, - "learning_rate": 1.991454339604245e-06, - "loss": 1.1064, - "step": 2747 - }, - { - "epoch": 0.07, - "learning_rate": 1.9914435069138865e-06, - "loss": 1.04, - "step": 2748 - }, - { - "epoch": 0.07, - "learning_rate": 1.9914326673914835e-06, - "loss": 0.5889, - "step": 2749 - }, - { - "epoch": 0.07, - "learning_rate": 1.9914218210371106e-06, - "loss": 0.9678, - "step": 2750 - }, - { - "epoch": 0.07, - "learning_rate": 1.9914109678508427e-06, - "loss": 0.9775, - "step": 2751 - }, - { - "epoch": 0.07, - "learning_rate": 1.991400107832754e-06, - "loss": 0.8169, - "step": 2752 - }, - { - "epoch": 0.07, - "learning_rate": 1.9913892409829195e-06, - "loss": 1.0615, - "step": 2753 - }, - { - "epoch": 0.07, - "learning_rate": 1.9913783673014146e-06, - "loss": 1.1777, - "step": 2754 - }, - { - "epoch": 0.07, - "learning_rate": 1.9913674867883138e-06, - "loss": 0.9404, - "step": 2755 - }, - { - "epoch": 0.07, - "learning_rate": 1.991356599443692e-06, - "loss": 1.2021, - "step": 2756 - }, - { - "epoch": 0.07, - "learning_rate": 1.9913457052676247e-06, - "loss": 0.9014, - "step": 2757 - }, - { - "epoch": 0.07, - "learning_rate": 1.9913348042601864e-06, - "loss": 1.0156, - "step": 2758 - }, - { - "epoch": 0.07, - "learning_rate": 1.9913238964214524e-06, - "loss": 0.6641, - "step": 2759 - }, - { - "epoch": 0.07, - "learning_rate": 1.9913129817514985e-06, - "loss": 0.8047, - "step": 2760 - }, - { - "epoch": 0.07, - "learning_rate": 1.9913020602503988e-06, - "loss": 0.896, - "step": 2761 - }, - { - "epoch": 0.07, - "learning_rate": 1.9912911319182295e-06, - "loss": 0.9785, - "step": 2762 - }, - { - "epoch": 0.07, - "learning_rate": 1.991280196755065e-06, - "loss": 0.6899, - "step": 2763 - }, - { - "epoch": 0.07, - "learning_rate": 1.9912692547609816e-06, - "loss": 0.9307, - "step": 2764 - }, - { - "epoch": 0.07, - "learning_rate": 1.9912583059360537e-06, - "loss": 0.9072, - "step": 2765 - }, - { - "epoch": 0.07, - "learning_rate": 1.991247350280358e-06, - "loss": 1.1201, - "step": 2766 - }, - { - "epoch": 0.07, - "learning_rate": 1.991236387793969e-06, - "loss": 1.0303, - "step": 2767 - }, - { - "epoch": 0.07, - "learning_rate": 1.9912254184769627e-06, - "loss": 0.7358, - "step": 2768 - }, - { - "epoch": 0.07, - "learning_rate": 1.9912144423294147e-06, - "loss": 0.8237, - "step": 2769 - }, - { - "epoch": 0.07, - "learning_rate": 1.9912034593514e-06, - "loss": 0.9199, - "step": 2770 - }, - { - "epoch": 0.07, - "learning_rate": 1.9911924695429953e-06, - "loss": 0.7891, - "step": 2771 - }, - { - "epoch": 0.07, - "learning_rate": 1.9911814729042757e-06, - "loss": 1.0371, - "step": 2772 - }, - { - "epoch": 0.07, - "learning_rate": 1.9911704694353165e-06, - "loss": 0.709, - "step": 2773 - }, - { - "epoch": 0.07, - "learning_rate": 1.991159459136195e-06, - "loss": 1.1152, - "step": 2774 - }, - { - "epoch": 0.07, - "learning_rate": 1.9911484420069855e-06, - "loss": 0.8335, - "step": 2775 - }, - { - "epoch": 0.07, - "learning_rate": 1.991137418047765e-06, - "loss": 0.8057, - "step": 2776 - }, - { - "epoch": 0.07, - "learning_rate": 1.991126387258609e-06, - "loss": 0.9956, - "step": 2777 - }, - { - "epoch": 0.07, - "learning_rate": 1.9911153496395933e-06, - "loss": 0.8457, - "step": 2778 - }, - { - "epoch": 0.07, - "learning_rate": 1.9911043051907943e-06, - "loss": 0.7085, - "step": 2779 - }, - { - "epoch": 0.07, - "learning_rate": 1.9910932539122882e-06, - "loss": 1.1826, - "step": 2780 - }, - { - "epoch": 0.07, - "learning_rate": 1.9910821958041512e-06, - "loss": 1.2158, - "step": 2781 - }, - { - "epoch": 0.07, - "learning_rate": 1.9910711308664588e-06, - "loss": 0.8164, - "step": 2782 - }, - { - "epoch": 0.07, - "learning_rate": 1.9910600590992883e-06, - "loss": 0.9238, - "step": 2783 - }, - { - "epoch": 0.07, - "learning_rate": 1.991048980502715e-06, - "loss": 0.4988, - "step": 2784 - }, - { - "epoch": 0.07, - "learning_rate": 1.9910378950768157e-06, - "loss": 0.6453, - "step": 2785 - }, - { - "epoch": 0.07, - "learning_rate": 1.991026802821667e-06, - "loss": 1.002, - "step": 2786 - }, - { - "epoch": 0.07, - "learning_rate": 1.991015703737345e-06, - "loss": 1.0254, - "step": 2787 - }, - { - "epoch": 0.07, - "learning_rate": 1.9910045978239264e-06, - "loss": 0.8467, - "step": 2788 - }, - { - "epoch": 0.07, - "learning_rate": 1.9909934850814876e-06, - "loss": 0.7847, - "step": 2789 - }, - { - "epoch": 0.07, - "learning_rate": 1.9909823655101052e-06, - "loss": 0.9619, - "step": 2790 - }, - { - "epoch": 0.07, - "learning_rate": 1.990971239109856e-06, - "loss": 1.1201, - "step": 2791 - }, - { - "epoch": 0.07, - "learning_rate": 1.990960105880816e-06, - "loss": 1.1172, - "step": 2792 - }, - { - "epoch": 0.07, - "learning_rate": 1.990948965823063e-06, - "loss": 0.9219, - "step": 2793 - }, - { - "epoch": 0.07, - "learning_rate": 1.9909378189366728e-06, - "loss": 1.1133, - "step": 2794 - }, - { - "epoch": 0.07, - "learning_rate": 1.990926665221723e-06, - "loss": 0.7793, - "step": 2795 - }, - { - "epoch": 0.07, - "learning_rate": 1.9909155046782894e-06, - "loss": 0.9932, - "step": 2796 - }, - { - "epoch": 0.07, - "learning_rate": 1.9909043373064504e-06, - "loss": 0.8877, - "step": 2797 - }, - { - "epoch": 0.07, - "learning_rate": 1.9908931631062816e-06, - "loss": 0.9014, - "step": 2798 - }, - { - "epoch": 0.07, - "learning_rate": 1.9908819820778605e-06, - "loss": 0.9912, - "step": 2799 - }, - { - "epoch": 0.07, - "learning_rate": 1.9908707942212645e-06, - "loss": 1.1729, - "step": 2800 - }, - { - "epoch": 0.07, - "learning_rate": 1.99085959953657e-06, - "loss": 0.854, - "step": 2801 - }, - { - "epoch": 0.07, - "learning_rate": 1.9908483980238546e-06, - "loss": 1.1289, - "step": 2802 - }, - { - "epoch": 0.07, - "learning_rate": 1.9908371896831958e-06, - "loss": 1.0498, - "step": 2803 - }, - { - "epoch": 0.07, - "learning_rate": 1.99082597451467e-06, - "loss": 0.9443, - "step": 2804 - }, - { - "epoch": 0.07, - "learning_rate": 1.990814752518355e-06, - "loss": 0.9658, - "step": 2805 - }, - { - "epoch": 0.07, - "learning_rate": 1.990803523694328e-06, - "loss": 1.1309, - "step": 2806 - }, - { - "epoch": 0.07, - "learning_rate": 1.9907922880426668e-06, - "loss": 1.0303, - "step": 2807 - }, - { - "epoch": 0.07, - "learning_rate": 1.9907810455634482e-06, - "loss": 0.9609, - "step": 2808 - }, - { - "epoch": 0.07, - "learning_rate": 1.99076979625675e-06, - "loss": 1.0527, - "step": 2809 - }, - { - "epoch": 0.07, - "learning_rate": 1.9907585401226495e-06, - "loss": 0.8833, - "step": 2810 - }, - { - "epoch": 0.07, - "learning_rate": 1.9907472771612244e-06, - "loss": 0.8955, - "step": 2811 - }, - { - "epoch": 0.07, - "learning_rate": 1.9907360073725527e-06, - "loss": 1.0625, - "step": 2812 - }, - { - "epoch": 0.07, - "learning_rate": 1.9907247307567113e-06, - "loss": 1.1543, - "step": 2813 - }, - { - "epoch": 0.07, - "learning_rate": 1.9907134473137783e-06, - "loss": 1.0146, - "step": 2814 - }, - { - "epoch": 0.07, - "learning_rate": 1.9907021570438318e-06, - "loss": 0.8799, - "step": 2815 - }, - { - "epoch": 0.07, - "learning_rate": 1.9906908599469488e-06, - "loss": 1.0352, - "step": 2816 - }, - { - "epoch": 0.07, - "learning_rate": 1.990679556023208e-06, - "loss": 0.9443, - "step": 2817 - }, - { - "epoch": 0.07, - "learning_rate": 1.9906682452726868e-06, - "loss": 1.0381, - "step": 2818 - }, - { - "epoch": 0.07, - "learning_rate": 1.990656927695463e-06, - "loss": 0.9854, - "step": 2819 - }, - { - "epoch": 0.07, - "learning_rate": 1.9906456032916152e-06, - "loss": 0.9873, - "step": 2820 - }, - { - "epoch": 0.07, - "learning_rate": 1.9906342720612204e-06, - "loss": 0.958, - "step": 2821 - }, - { - "epoch": 0.07, - "learning_rate": 1.990622934004358e-06, - "loss": 1.0127, - "step": 2822 - }, - { - "epoch": 0.07, - "learning_rate": 1.9906115891211054e-06, - "loss": 1.1191, - "step": 2823 - }, - { - "epoch": 0.07, - "learning_rate": 1.9906002374115407e-06, - "loss": 0.9043, - "step": 2824 - }, - { - "epoch": 0.07, - "learning_rate": 1.9905888788757424e-06, - "loss": 0.9941, - "step": 2825 - }, - { - "epoch": 0.07, - "learning_rate": 1.9905775135137887e-06, - "loss": 1.0859, - "step": 2826 - }, - { - "epoch": 0.07, - "learning_rate": 1.9905661413257574e-06, - "loss": 0.6499, - "step": 2827 - }, - { - "epoch": 0.07, - "learning_rate": 1.9905547623117277e-06, - "loss": 1.0049, - "step": 2828 - }, - { - "epoch": 0.07, - "learning_rate": 1.990543376471778e-06, - "loss": 1.1191, - "step": 2829 - }, - { - "epoch": 0.07, - "learning_rate": 1.9905319838059856e-06, - "loss": 1.0547, - "step": 2830 - }, - { - "epoch": 0.07, - "learning_rate": 1.9905205843144304e-06, - "loss": 1.2803, - "step": 2831 - }, - { - "epoch": 0.07, - "learning_rate": 1.9905091779971903e-06, - "loss": 0.9375, - "step": 2832 - }, - { - "epoch": 0.07, - "learning_rate": 1.990497764854344e-06, - "loss": 0.8008, - "step": 2833 - }, - { - "epoch": 0.07, - "learning_rate": 1.99048634488597e-06, - "loss": 1.1465, - "step": 2834 - }, - { - "epoch": 0.07, - "learning_rate": 1.990474918092147e-06, - "loss": 1.0498, - "step": 2835 - }, - { - "epoch": 0.07, - "learning_rate": 1.9904634844729543e-06, - "loss": 0.7744, - "step": 2836 - }, - { - "epoch": 0.07, - "learning_rate": 1.99045204402847e-06, - "loss": 0.8257, - "step": 2837 - }, - { - "epoch": 0.07, - "learning_rate": 1.990440596758773e-06, - "loss": 1.0859, - "step": 2838 - }, - { - "epoch": 0.07, - "learning_rate": 1.990429142663942e-06, - "loss": 0.895, - "step": 2839 - }, - { - "epoch": 0.07, - "learning_rate": 1.990417681744057e-06, - "loss": 0.9785, - "step": 2840 - }, - { - "epoch": 0.07, - "learning_rate": 1.990406213999196e-06, - "loss": 1.0342, - "step": 2841 - }, - { - "epoch": 0.07, - "learning_rate": 1.9903947394294386e-06, - "loss": 0.9424, - "step": 2842 - }, - { - "epoch": 0.07, - "learning_rate": 1.990383258034863e-06, - "loss": 0.917, - "step": 2843 - }, - { - "epoch": 0.07, - "learning_rate": 1.9903717698155496e-06, - "loss": 0.8408, - "step": 2844 - }, - { - "epoch": 0.07, - "learning_rate": 1.9903602747715764e-06, - "loss": 1.0234, - "step": 2845 - }, - { - "epoch": 0.07, - "learning_rate": 1.9903487729030232e-06, - "loss": 0.9824, - "step": 2846 - }, - { - "epoch": 0.07, - "learning_rate": 1.9903372642099688e-06, - "loss": 1.1123, - "step": 2847 - }, - { - "epoch": 0.07, - "learning_rate": 1.990325748692493e-06, - "loss": 0.8975, - "step": 2848 - }, - { - "epoch": 0.07, - "learning_rate": 1.9903142263506754e-06, - "loss": 0.9746, - "step": 2849 - }, - { - "epoch": 0.07, - "learning_rate": 1.9903026971845945e-06, - "loss": 0.7715, - "step": 2850 - }, - { - "epoch": 0.07, - "learning_rate": 1.9902911611943304e-06, - "loss": 1.1191, - "step": 2851 - }, - { - "epoch": 0.07, - "learning_rate": 1.9902796183799622e-06, - "loss": 0.6689, - "step": 2852 - }, - { - "epoch": 0.07, - "learning_rate": 1.99026806874157e-06, - "loss": 0.9463, - "step": 2853 - }, - { - "epoch": 0.07, - "learning_rate": 1.9902565122792333e-06, - "loss": 0.9277, - "step": 2854 - }, - { - "epoch": 0.07, - "learning_rate": 1.990244948993031e-06, - "loss": 0.9512, - "step": 2855 - }, - { - "epoch": 0.07, - "learning_rate": 1.9902333788830435e-06, - "loss": 1.0078, - "step": 2856 - }, - { - "epoch": 0.07, - "learning_rate": 1.99022180194935e-06, - "loss": 1.0889, - "step": 2857 - }, - { - "epoch": 0.07, - "learning_rate": 1.990210218192031e-06, - "loss": 0.9307, - "step": 2858 - }, - { - "epoch": 0.07, - "learning_rate": 1.9901986276111654e-06, - "loss": 1.0117, - "step": 2859 - }, - { - "epoch": 0.07, - "learning_rate": 1.990187030206834e-06, - "loss": 1.0576, - "step": 2860 - }, - { - "epoch": 0.07, - "learning_rate": 1.9901754259791164e-06, - "loss": 0.8926, - "step": 2861 - }, - { - "epoch": 0.07, - "learning_rate": 1.990163814928092e-06, - "loss": 1.0303, - "step": 2862 - }, - { - "epoch": 0.07, - "learning_rate": 1.990152197053842e-06, - "loss": 0.8892, - "step": 2863 - }, - { - "epoch": 0.07, - "learning_rate": 1.990140572356445e-06, - "loss": 0.9297, - "step": 2864 - }, - { - "epoch": 0.07, - "learning_rate": 1.990128940835982e-06, - "loss": 1.0732, - "step": 2865 - }, - { - "epoch": 0.07, - "learning_rate": 1.9901173024925332e-06, - "loss": 0.8799, - "step": 2866 - }, - { - "epoch": 0.07, - "learning_rate": 1.9901056573261787e-06, - "loss": 1.0234, - "step": 2867 - }, - { - "epoch": 0.07, - "learning_rate": 1.990094005336998e-06, - "loss": 1.0488, - "step": 2868 - }, - { - "epoch": 0.07, - "learning_rate": 1.9900823465250727e-06, - "loss": 0.9658, - "step": 2869 - }, - { - "epoch": 0.07, - "learning_rate": 1.990070680890482e-06, - "loss": 0.8081, - "step": 2870 - }, - { - "epoch": 0.07, - "learning_rate": 1.990059008433307e-06, - "loss": 0.8076, - "step": 2871 - }, - { - "epoch": 0.07, - "learning_rate": 1.990047329153628e-06, - "loss": 0.8071, - "step": 2872 - }, - { - "epoch": 0.07, - "learning_rate": 1.9900356430515252e-06, - "loss": 0.9336, - "step": 2873 - }, - { - "epoch": 0.07, - "learning_rate": 1.9900239501270794e-06, - "loss": 1.0605, - "step": 2874 - }, - { - "epoch": 0.07, - "learning_rate": 1.9900122503803705e-06, - "loss": 0.9482, - "step": 2875 - }, - { - "epoch": 0.07, - "learning_rate": 1.9900005438114804e-06, - "loss": 0.9102, - "step": 2876 - }, - { - "epoch": 0.07, - "learning_rate": 1.989988830420489e-06, - "loss": 0.8223, - "step": 2877 - }, - { - "epoch": 0.07, - "learning_rate": 1.989977110207477e-06, - "loss": 1.0254, - "step": 2878 - }, - { - "epoch": 0.07, - "learning_rate": 1.9899653831725253e-06, - "loss": 0.7896, - "step": 2879 - }, - { - "epoch": 0.07, - "learning_rate": 1.9899536493157145e-06, - "loss": 1.1357, - "step": 2880 - }, - { - "epoch": 0.07, - "learning_rate": 1.9899419086371257e-06, - "loss": 1.0254, - "step": 2881 - }, - { - "epoch": 0.07, - "learning_rate": 1.98993016113684e-06, - "loss": 1.0957, - "step": 2882 - }, - { - "epoch": 0.07, - "learning_rate": 1.989918406814938e-06, - "loss": 0.7412, - "step": 2883 - }, - { - "epoch": 0.07, - "learning_rate": 1.9899066456715003e-06, - "loss": 1.082, - "step": 2884 - }, - { - "epoch": 0.07, - "learning_rate": 1.9898948777066086e-06, - "loss": 0.8096, - "step": 2885 - }, - { - "epoch": 0.07, - "learning_rate": 1.989883102920344e-06, - "loss": 0.832, - "step": 2886 - }, - { - "epoch": 0.07, - "learning_rate": 1.9898713213127875e-06, - "loss": 0.9775, - "step": 2887 - }, - { - "epoch": 0.07, - "learning_rate": 1.9898595328840203e-06, - "loss": 1.0264, - "step": 2888 - }, - { - "epoch": 0.07, - "learning_rate": 1.9898477376341234e-06, - "loss": 0.9502, - "step": 2889 - }, - { - "epoch": 0.07, - "learning_rate": 1.9898359355631782e-06, - "loss": 0.9912, - "step": 2890 - }, - { - "epoch": 0.07, - "learning_rate": 1.9898241266712665e-06, - "loss": 1.0322, - "step": 2891 - }, - { - "epoch": 0.07, - "learning_rate": 1.989812310958469e-06, - "loss": 1.0068, - "step": 2892 - }, - { - "epoch": 0.07, - "learning_rate": 1.989800488424867e-06, - "loss": 0.875, - "step": 2893 - }, - { - "epoch": 0.07, - "learning_rate": 1.9897886590705426e-06, - "loss": 0.7861, - "step": 2894 - }, - { - "epoch": 0.07, - "learning_rate": 1.9897768228955772e-06, - "loss": 0.9414, - "step": 2895 - }, - { - "epoch": 0.07, - "learning_rate": 1.9897649799000527e-06, - "loss": 1.3027, - "step": 2896 - }, - { - "epoch": 0.07, - "learning_rate": 1.9897531300840494e-06, - "loss": 1.0273, - "step": 2897 - }, - { - "epoch": 0.07, - "learning_rate": 1.9897412734476504e-06, - "loss": 0.9131, - "step": 2898 - }, - { - "epoch": 0.07, - "learning_rate": 1.9897294099909367e-06, - "loss": 0.9678, - "step": 2899 - }, - { - "epoch": 0.07, - "learning_rate": 1.98971753971399e-06, - "loss": 1.0059, - "step": 2900 - }, - { - "epoch": 0.07, - "learning_rate": 1.989705662616892e-06, - "loss": 0.998, - "step": 2901 - }, - { - "epoch": 0.07, - "learning_rate": 1.9896937786997253e-06, - "loss": 0.9189, - "step": 2902 - }, - { - "epoch": 0.07, - "learning_rate": 1.989681887962571e-06, - "loss": 0.7532, - "step": 2903 - }, - { - "epoch": 0.07, - "learning_rate": 1.9896699904055115e-06, - "loss": 1.0059, - "step": 2904 - }, - { - "epoch": 0.07, - "learning_rate": 1.989658086028629e-06, - "loss": 0.9658, - "step": 2905 - }, - { - "epoch": 0.07, - "learning_rate": 1.9896461748320044e-06, - "loss": 0.71, - "step": 2906 - }, - { - "epoch": 0.07, - "learning_rate": 1.989634256815721e-06, - "loss": 0.9922, - "step": 2907 - }, - { - "epoch": 0.07, - "learning_rate": 1.98962233197986e-06, - "loss": 0.9512, - "step": 2908 - }, - { - "epoch": 0.07, - "learning_rate": 1.9896104003245043e-06, - "loss": 1.0264, - "step": 2909 - }, - { - "epoch": 0.07, - "learning_rate": 1.989598461849736e-06, - "loss": 1.1621, - "step": 2910 - }, - { - "epoch": 0.07, - "learning_rate": 1.9895865165556373e-06, - "loss": 1.0566, - "step": 2911 - }, - { - "epoch": 0.07, - "learning_rate": 1.98957456444229e-06, - "loss": 1.0469, - "step": 2912 - }, - { - "epoch": 0.07, - "learning_rate": 1.989562605509777e-06, - "loss": 0.875, - "step": 2913 - }, - { - "epoch": 0.07, - "learning_rate": 1.989550639758181e-06, - "loss": 0.96, - "step": 2914 - }, - { - "epoch": 0.07, - "learning_rate": 1.989538667187584e-06, - "loss": 0.9727, - "step": 2915 - }, - { - "epoch": 0.07, - "learning_rate": 1.989526687798068e-06, - "loss": 1.0088, - "step": 2916 - }, - { - "epoch": 0.07, - "learning_rate": 1.989514701589717e-06, - "loss": 0.8945, - "step": 2917 - }, - { - "epoch": 0.07, - "learning_rate": 1.9895027085626123e-06, - "loss": 1.0049, - "step": 2918 - }, - { - "epoch": 0.07, - "learning_rate": 1.9894907087168367e-06, - "loss": 1.0801, - "step": 2919 - }, - { - "epoch": 0.07, - "learning_rate": 1.9894787020524735e-06, - "loss": 1.1777, - "step": 2920 - }, - { - "epoch": 0.07, - "learning_rate": 1.989466688569605e-06, - "loss": 0.957, - "step": 2921 - }, - { - "epoch": 0.07, - "learning_rate": 1.989454668268314e-06, - "loss": 1.0713, - "step": 2922 - }, - { - "epoch": 0.07, - "learning_rate": 1.9894426411486835e-06, - "loss": 0.8789, - "step": 2923 - }, - { - "epoch": 0.07, - "learning_rate": 1.989430607210796e-06, - "loss": 1.0752, - "step": 2924 - }, - { - "epoch": 0.07, - "learning_rate": 1.989418566454735e-06, - "loss": 0.7412, - "step": 2925 - }, - { - "epoch": 0.07, - "learning_rate": 1.989406518880583e-06, - "loss": 1.0684, - "step": 2926 - }, - { - "epoch": 0.08, - "learning_rate": 1.9893944644884235e-06, - "loss": 0.9238, - "step": 2927 - }, - { - "epoch": 0.08, - "learning_rate": 1.989382403278339e-06, - "loss": 0.8013, - "step": 2928 - }, - { - "epoch": 0.08, - "learning_rate": 1.989370335250413e-06, - "loss": 0.9658, - "step": 2929 - }, - { - "epoch": 0.08, - "learning_rate": 1.9893582604047286e-06, - "loss": 0.8472, - "step": 2930 - }, - { - "epoch": 0.08, - "learning_rate": 1.9893461787413687e-06, - "loss": 0.7554, - "step": 2931 - }, - { - "epoch": 0.08, - "learning_rate": 1.989334090260417e-06, - "loss": 1.1611, - "step": 2932 - }, - { - "epoch": 0.08, - "learning_rate": 1.989321994961957e-06, - "loss": 0.8945, - "step": 2933 - }, - { - "epoch": 0.08, - "learning_rate": 1.9893098928460708e-06, - "loss": 1.0947, - "step": 2934 - }, - { - "epoch": 0.08, - "learning_rate": 1.989297783912843e-06, - "loss": 1.2236, - "step": 2935 - }, - { - "epoch": 0.08, - "learning_rate": 1.989285668162357e-06, - "loss": 0.9844, - "step": 2936 - }, - { - "epoch": 0.08, - "learning_rate": 1.9892735455946957e-06, - "loss": 1.002, - "step": 2937 - }, - { - "epoch": 0.08, - "learning_rate": 1.989261416209943e-06, - "loss": 0.8232, - "step": 2938 - }, - { - "epoch": 0.08, - "learning_rate": 1.9892492800081823e-06, - "loss": 0.9883, - "step": 2939 - }, - { - "epoch": 0.08, - "learning_rate": 1.9892371369894975e-06, - "loss": 1.0098, - "step": 2940 - }, - { - "epoch": 0.08, - "learning_rate": 1.9892249871539724e-06, - "loss": 0.8428, - "step": 2941 - }, - { - "epoch": 0.08, - "learning_rate": 1.98921283050169e-06, - "loss": 0.9111, - "step": 2942 - }, - { - "epoch": 0.08, - "learning_rate": 1.989200667032735e-06, - "loss": 0.9883, - "step": 2943 - }, - { - "epoch": 0.08, - "learning_rate": 1.98918849674719e-06, - "loss": 1.127, - "step": 2944 - }, - { - "epoch": 0.08, - "learning_rate": 1.98917631964514e-06, - "loss": 1.0273, - "step": 2945 - }, - { - "epoch": 0.08, - "learning_rate": 1.9891641357266683e-06, - "loss": 0.8584, - "step": 2946 - }, - { - "epoch": 0.08, - "learning_rate": 1.9891519449918596e-06, - "loss": 1.292, - "step": 2947 - }, - { - "epoch": 0.08, - "learning_rate": 1.989139747440797e-06, - "loss": 0.8364, - "step": 2948 - }, - { - "epoch": 0.08, - "learning_rate": 1.9891275430735646e-06, - "loss": 0.959, - "step": 2949 - }, - { - "epoch": 0.08, - "learning_rate": 1.9891153318902473e-06, - "loss": 1.0781, - "step": 2950 - }, - { - "epoch": 0.08, - "learning_rate": 1.9891031138909286e-06, - "loss": 1.0342, - "step": 2951 - }, - { - "epoch": 0.08, - "learning_rate": 1.989090889075693e-06, - "loss": 0.9619, - "step": 2952 - }, - { - "epoch": 0.08, - "learning_rate": 1.9890786574446247e-06, - "loss": 0.9316, - "step": 2953 - }, - { - "epoch": 0.08, - "learning_rate": 1.9890664189978074e-06, - "loss": 1.0361, - "step": 2954 - }, - { - "epoch": 0.08, - "learning_rate": 1.9890541737353265e-06, - "loss": 0.8838, - "step": 2955 - }, - { - "epoch": 0.08, - "learning_rate": 1.9890419216572652e-06, - "loss": 0.8984, - "step": 2956 - }, - { - "epoch": 0.08, - "learning_rate": 1.9890296627637092e-06, - "loss": 1.1406, - "step": 2957 - }, - { - "epoch": 0.08, - "learning_rate": 1.989017397054742e-06, - "loss": 0.8945, - "step": 2958 - }, - { - "epoch": 0.08, - "learning_rate": 1.9890051245304488e-06, - "loss": 0.7891, - "step": 2959 - }, - { - "epoch": 0.08, - "learning_rate": 1.9889928451909133e-06, - "loss": 0.9941, - "step": 2960 - }, - { - "epoch": 0.08, - "learning_rate": 1.9889805590362206e-06, - "loss": 0.9668, - "step": 2961 - }, - { - "epoch": 0.08, - "learning_rate": 1.988968266066456e-06, - "loss": 0.7515, - "step": 2962 - }, - { - "epoch": 0.08, - "learning_rate": 1.988955966281703e-06, - "loss": 0.9365, - "step": 2963 - }, - { - "epoch": 0.08, - "learning_rate": 1.9889436596820472e-06, - "loss": 0.8535, - "step": 2964 - }, - { - "epoch": 0.08, - "learning_rate": 1.988931346267573e-06, - "loss": 0.9922, - "step": 2965 - }, - { - "epoch": 0.08, - "learning_rate": 1.988919026038366e-06, - "loss": 0.96, - "step": 2966 - }, - { - "epoch": 0.08, - "learning_rate": 1.98890669899451e-06, - "loss": 0.7402, - "step": 2967 - }, - { - "epoch": 0.08, - "learning_rate": 1.9888943651360906e-06, - "loss": 0.8906, - "step": 2968 - }, - { - "epoch": 0.08, - "learning_rate": 1.9888820244631925e-06, - "loss": 0.8296, - "step": 2969 - }, - { - "epoch": 0.08, - "learning_rate": 1.9888696769759012e-06, - "loss": 0.6973, - "step": 2970 - }, - { - "epoch": 0.08, - "learning_rate": 1.9888573226743014e-06, - "loss": 1.0098, - "step": 2971 - }, - { - "epoch": 0.08, - "learning_rate": 1.9888449615584783e-06, - "loss": 0.7231, - "step": 2972 - }, - { - "epoch": 0.08, - "learning_rate": 1.988832593628517e-06, - "loss": 0.9717, - "step": 2973 - }, - { - "epoch": 0.08, - "learning_rate": 1.988820218884503e-06, - "loss": 0.875, - "step": 2974 - }, - { - "epoch": 0.08, - "learning_rate": 1.9888078373265213e-06, - "loss": 1.04, - "step": 2975 - }, - { - "epoch": 0.08, - "learning_rate": 1.9887954489546573e-06, - "loss": 0.9883, - "step": 2976 - }, - { - "epoch": 0.08, - "learning_rate": 1.9887830537689964e-06, - "loss": 0.8262, - "step": 2977 - }, - { - "epoch": 0.08, - "learning_rate": 1.9887706517696237e-06, - "loss": 0.9004, - "step": 2978 - }, - { - "epoch": 0.08, - "learning_rate": 1.9887582429566257e-06, - "loss": 0.9844, - "step": 2979 - }, - { - "epoch": 0.08, - "learning_rate": 1.9887458273300866e-06, - "loss": 0.8457, - "step": 2980 - }, - { - "epoch": 0.08, - "learning_rate": 1.988733404890093e-06, - "loss": 0.8315, - "step": 2981 - }, - { - "epoch": 0.08, - "learning_rate": 1.9887209756367296e-06, - "loss": 0.7615, - "step": 2982 - }, - { - "epoch": 0.08, - "learning_rate": 1.9887085395700823e-06, - "loss": 0.9316, - "step": 2983 - }, - { - "epoch": 0.08, - "learning_rate": 1.9886960966902373e-06, - "loss": 0.7651, - "step": 2984 - }, - { - "epoch": 0.08, - "learning_rate": 1.98868364699728e-06, - "loss": 0.75, - "step": 2985 - }, - { - "epoch": 0.08, - "learning_rate": 1.9886711904912965e-06, - "loss": 1.1426, - "step": 2986 - }, - { - "epoch": 0.08, - "learning_rate": 1.988658727172372e-06, - "loss": 0.9058, - "step": 2987 - }, - { - "epoch": 0.08, - "learning_rate": 1.9886462570405927e-06, - "loss": 1.042, - "step": 2988 - }, - { - "epoch": 0.08, - "learning_rate": 1.9886337800960447e-06, - "loss": 0.9932, - "step": 2989 - }, - { - "epoch": 0.08, - "learning_rate": 1.988621296338814e-06, - "loss": 1.1201, - "step": 2990 - }, - { - "epoch": 0.08, - "learning_rate": 1.9886088057689865e-06, - "loss": 0.9629, - "step": 2991 - }, - { - "epoch": 0.08, - "learning_rate": 1.9885963083866477e-06, - "loss": 0.9619, - "step": 2992 - }, - { - "epoch": 0.08, - "learning_rate": 1.988583804191885e-06, - "loss": 1.0273, - "step": 2993 - }, - { - "epoch": 0.08, - "learning_rate": 1.988571293184784e-06, - "loss": 1.0088, - "step": 2994 - }, - { - "epoch": 0.08, - "learning_rate": 1.98855877536543e-06, - "loss": 0.8584, - "step": 2995 - }, - { - "epoch": 0.08, - "learning_rate": 1.98854625073391e-06, - "loss": 1.0186, - "step": 2996 - }, - { - "epoch": 0.08, - "learning_rate": 1.9885337192903105e-06, - "loss": 0.9092, - "step": 2997 - }, - { - "epoch": 0.08, - "learning_rate": 1.9885211810347184e-06, - "loss": 0.9131, - "step": 2998 - }, - { - "epoch": 0.08, - "learning_rate": 1.9885086359672182e-06, - "loss": 0.9131, - "step": 2999 - }, - { - "epoch": 0.08, - "learning_rate": 1.988496084087898e-06, - "loss": 0.918, - "step": 3000 - }, - { - "epoch": 0.08, - "learning_rate": 1.988483525396844e-06, - "loss": 0.7183, - "step": 3001 - }, - { - "epoch": 0.08, - "learning_rate": 1.9884709598941427e-06, - "loss": 1.1016, - "step": 3002 - }, - { - "epoch": 0.08, - "learning_rate": 1.98845838757988e-06, - "loss": 0.9834, - "step": 3003 - }, - { - "epoch": 0.08, - "learning_rate": 1.9884458084541435e-06, - "loss": 1.0723, - "step": 3004 - }, - { - "epoch": 0.08, - "learning_rate": 1.9884332225170195e-06, - "loss": 0.832, - "step": 3005 - }, - { - "epoch": 0.08, - "learning_rate": 1.988420629768595e-06, - "loss": 1.1221, - "step": 3006 - }, - { - "epoch": 0.08, - "learning_rate": 1.9884080302089554e-06, - "loss": 1.0078, - "step": 3007 - }, - { - "epoch": 0.08, - "learning_rate": 1.9883954238381894e-06, - "loss": 1.084, - "step": 3008 - }, - { - "epoch": 0.08, - "learning_rate": 1.9883828106563828e-06, - "loss": 0.9556, - "step": 3009 - }, - { - "epoch": 0.08, - "learning_rate": 1.988370190663623e-06, - "loss": 1.2598, - "step": 3010 - }, - { - "epoch": 0.08, - "learning_rate": 1.9883575638599966e-06, - "loss": 0.8438, - "step": 3011 - }, - { - "epoch": 0.08, - "learning_rate": 1.9883449302455907e-06, - "loss": 1.0752, - "step": 3012 - }, - { - "epoch": 0.08, - "learning_rate": 1.9883322898204927e-06, - "loss": 1.0166, - "step": 3013 - }, - { - "epoch": 0.08, - "learning_rate": 1.988319642584789e-06, - "loss": 0.7588, - "step": 3014 - }, - { - "epoch": 0.08, - "learning_rate": 1.9883069885385673e-06, - "loss": 1.0791, - "step": 3015 - }, - { - "epoch": 0.08, - "learning_rate": 1.9882943276819153e-06, - "loss": 0.7661, - "step": 3016 - }, - { - "epoch": 0.08, - "learning_rate": 1.988281660014919e-06, - "loss": 1.168, - "step": 3017 - }, - { - "epoch": 0.08, - "learning_rate": 1.988268985537666e-06, - "loss": 0.9922, - "step": 3018 - }, - { - "epoch": 0.08, - "learning_rate": 1.988256304250245e-06, - "loss": 0.7769, - "step": 3019 - }, - { - "epoch": 0.08, - "learning_rate": 1.9882436161527413e-06, - "loss": 1.0811, - "step": 3020 - }, - { - "epoch": 0.08, - "learning_rate": 1.9882309212452437e-06, - "loss": 1.0225, - "step": 3021 - }, - { - "epoch": 0.08, - "learning_rate": 1.9882182195278396e-06, - "loss": 0.8896, - "step": 3022 - }, - { - "epoch": 0.08, - "learning_rate": 1.9882055110006163e-06, - "loss": 1.1553, - "step": 3023 - }, - { - "epoch": 0.08, - "learning_rate": 1.988192795663661e-06, - "loss": 0.8662, - "step": 3024 - }, - { - "epoch": 0.08, - "learning_rate": 1.988180073517062e-06, - "loss": 0.9863, - "step": 3025 - }, - { - "epoch": 0.08, - "learning_rate": 1.9881673445609065e-06, - "loss": 0.9277, - "step": 3026 - }, - { - "epoch": 0.08, - "learning_rate": 1.988154608795282e-06, - "loss": 0.9092, - "step": 3027 - }, - { - "epoch": 0.08, - "learning_rate": 1.9881418662202774e-06, - "loss": 0.9365, - "step": 3028 - }, - { - "epoch": 0.08, - "learning_rate": 1.9881291168359794e-06, - "loss": 1.1035, - "step": 3029 - }, - { - "epoch": 0.08, - "learning_rate": 1.988116360642476e-06, - "loss": 1.2432, - "step": 3030 - }, - { - "epoch": 0.08, - "learning_rate": 1.9881035976398554e-06, - "loss": 1.0527, - "step": 3031 - }, - { - "epoch": 0.08, - "learning_rate": 1.9880908278282055e-06, - "loss": 1.0098, - "step": 3032 - }, - { - "epoch": 0.08, - "learning_rate": 1.9880780512076143e-06, - "loss": 0.9434, - "step": 3033 - }, - { - "epoch": 0.08, - "learning_rate": 1.9880652677781696e-06, - "loss": 0.9805, - "step": 3034 - }, - { - "epoch": 0.08, - "learning_rate": 1.9880524775399597e-06, - "loss": 1.0381, - "step": 3035 - }, - { - "epoch": 0.08, - "learning_rate": 1.988039680493073e-06, - "loss": 1.0117, - "step": 3036 - }, - { - "epoch": 0.08, - "learning_rate": 1.9880268766375972e-06, - "loss": 1.0732, - "step": 3037 - }, - { - "epoch": 0.08, - "learning_rate": 1.9880140659736207e-06, - "loss": 0.9932, - "step": 3038 - }, - { - "epoch": 0.08, - "learning_rate": 1.988001248501232e-06, - "loss": 0.5859, - "step": 3039 - }, - { - "epoch": 0.08, - "learning_rate": 1.987988424220519e-06, - "loss": 0.9404, - "step": 3040 - }, - { - "epoch": 0.08, - "learning_rate": 1.98797559313157e-06, - "loss": 0.8506, - "step": 3041 - }, - { - "epoch": 0.08, - "learning_rate": 1.9879627552344743e-06, - "loss": 0.9756, - "step": 3042 - }, - { - "epoch": 0.08, - "learning_rate": 1.9879499105293194e-06, - "loss": 1.0381, - "step": 3043 - }, - { - "epoch": 0.08, - "learning_rate": 1.9879370590161948e-06, - "loss": 0.8311, - "step": 3044 - }, - { - "epoch": 0.08, - "learning_rate": 1.987924200695188e-06, - "loss": 0.958, - "step": 3045 - }, - { - "epoch": 0.08, - "learning_rate": 1.987911335566388e-06, - "loss": 0.7563, - "step": 3046 - }, - { - "epoch": 0.08, - "learning_rate": 1.987898463629884e-06, - "loss": 1.0742, - "step": 3047 - }, - { - "epoch": 0.08, - "learning_rate": 1.987885584885764e-06, - "loss": 0.7568, - "step": 3048 - }, - { - "epoch": 0.08, - "learning_rate": 1.987872699334116e-06, - "loss": 0.8818, - "step": 3049 - }, - { - "epoch": 0.08, - "learning_rate": 1.987859806975031e-06, - "loss": 0.917, - "step": 3050 - }, - { - "epoch": 0.08, - "learning_rate": 1.987846907808596e-06, - "loss": 0.8032, - "step": 3051 - }, - { - "epoch": 0.08, - "learning_rate": 1.9878340018349007e-06, - "loss": 1.2471, - "step": 3052 - }, - { - "epoch": 0.08, - "learning_rate": 1.987821089054034e-06, - "loss": 0.8525, - "step": 3053 - }, - { - "epoch": 0.08, - "learning_rate": 1.9878081694660847e-06, - "loss": 0.8027, - "step": 3054 - }, - { - "epoch": 0.08, - "learning_rate": 1.9877952430711415e-06, - "loss": 0.9883, - "step": 3055 - }, - { - "epoch": 0.08, - "learning_rate": 1.987782309869294e-06, - "loss": 0.873, - "step": 3056 - }, - { - "epoch": 0.08, - "learning_rate": 1.9877693698606316e-06, - "loss": 0.9307, - "step": 3057 - }, - { - "epoch": 0.08, - "learning_rate": 1.9877564230452424e-06, - "loss": 0.9541, - "step": 3058 - }, - { - "epoch": 0.08, - "learning_rate": 1.9877434694232163e-06, - "loss": 1.0898, - "step": 3059 - }, - { - "epoch": 0.08, - "learning_rate": 1.9877305089946426e-06, - "loss": 0.959, - "step": 3060 - }, - { - "epoch": 0.08, - "learning_rate": 1.9877175417596103e-06, - "loss": 1.0078, - "step": 3061 - }, - { - "epoch": 0.08, - "learning_rate": 1.987704567718209e-06, - "loss": 0.8857, - "step": 3062 - }, - { - "epoch": 0.08, - "learning_rate": 1.9876915868705286e-06, - "loss": 0.8984, - "step": 3063 - }, - { - "epoch": 0.08, - "learning_rate": 1.9876785992166575e-06, - "loss": 0.6851, - "step": 3064 - }, - { - "epoch": 0.08, - "learning_rate": 1.9876656047566857e-06, - "loss": 0.9609, - "step": 3065 - }, - { - "epoch": 0.08, - "learning_rate": 1.987652603490703e-06, - "loss": 1.0332, - "step": 3066 - }, - { - "epoch": 0.08, - "learning_rate": 1.987639595418799e-06, - "loss": 0.96, - "step": 3067 - }, - { - "epoch": 0.08, - "learning_rate": 1.9876265805410623e-06, - "loss": 1.0068, - "step": 3068 - }, - { - "epoch": 0.08, - "learning_rate": 1.987613558857584e-06, - "loss": 0.8779, - "step": 3069 - }, - { - "epoch": 0.08, - "learning_rate": 1.9876005303684532e-06, - "loss": 1.0859, - "step": 3070 - }, - { - "epoch": 0.08, - "learning_rate": 1.987587495073759e-06, - "loss": 0.8457, - "step": 3071 - }, - { - "epoch": 0.08, - "learning_rate": 1.9875744529735927e-06, - "loss": 1.1035, - "step": 3072 - }, - { - "epoch": 0.08, - "learning_rate": 1.987561404068043e-06, - "loss": 0.8066, - "step": 3073 - }, - { - "epoch": 0.08, - "learning_rate": 1.9875483483572002e-06, - "loss": 0.9883, - "step": 3074 - }, - { - "epoch": 0.08, - "learning_rate": 1.9875352858411546e-06, - "loss": 0.9014, - "step": 3075 - }, - { - "epoch": 0.08, - "learning_rate": 1.987522216519996e-06, - "loss": 0.9658, - "step": 3076 - }, - { - "epoch": 0.08, - "learning_rate": 1.9875091403938137e-06, - "loss": 1.0205, - "step": 3077 - }, - { - "epoch": 0.08, - "learning_rate": 1.9874960574626985e-06, - "loss": 0.7451, - "step": 3078 - }, - { - "epoch": 0.08, - "learning_rate": 1.987482967726741e-06, - "loss": 1.0986, - "step": 3079 - }, - { - "epoch": 0.08, - "learning_rate": 1.9874698711860306e-06, - "loss": 0.9277, - "step": 3080 - }, - { - "epoch": 0.08, - "learning_rate": 1.9874567678406578e-06, - "loss": 0.959, - "step": 3081 - }, - { - "epoch": 0.08, - "learning_rate": 1.987443657690713e-06, - "loss": 0.8799, - "step": 3082 - }, - { - "epoch": 0.08, - "learning_rate": 1.987430540736287e-06, - "loss": 0.8818, - "step": 3083 - }, - { - "epoch": 0.08, - "learning_rate": 1.987417416977469e-06, - "loss": 1.0889, - "step": 3084 - }, - { - "epoch": 0.08, - "learning_rate": 1.9874042864143506e-06, - "loss": 1.002, - "step": 3085 - }, - { - "epoch": 0.08, - "learning_rate": 1.9873911490470215e-06, - "loss": 0.812, - "step": 3086 - }, - { - "epoch": 0.08, - "learning_rate": 1.9873780048755725e-06, - "loss": 0.7695, - "step": 3087 - }, - { - "epoch": 0.08, - "learning_rate": 1.9873648539000946e-06, - "loss": 1.0557, - "step": 3088 - }, - { - "epoch": 0.08, - "learning_rate": 1.9873516961206776e-06, - "loss": 0.772, - "step": 3089 - }, - { - "epoch": 0.08, - "learning_rate": 1.987338531537413e-06, - "loss": 0.8403, - "step": 3090 - }, - { - "epoch": 0.08, - "learning_rate": 1.9873253601503904e-06, - "loss": 0.8594, - "step": 3091 - }, - { - "epoch": 0.08, - "learning_rate": 1.987312181959702e-06, - "loss": 0.7607, - "step": 3092 - }, - { - "epoch": 0.08, - "learning_rate": 1.9872989969654377e-06, - "loss": 1.0889, - "step": 3093 - }, - { - "epoch": 0.08, - "learning_rate": 1.9872858051676885e-06, - "loss": 0.9922, - "step": 3094 - }, - { - "epoch": 0.08, - "learning_rate": 1.987272606566545e-06, - "loss": 1.0107, - "step": 3095 - }, - { - "epoch": 0.08, - "learning_rate": 1.9872594011620993e-06, - "loss": 0.8613, - "step": 3096 - }, - { - "epoch": 0.08, - "learning_rate": 1.987246188954441e-06, - "loss": 1.0117, - "step": 3097 - }, - { - "epoch": 0.08, - "learning_rate": 1.987232969943662e-06, - "loss": 0.9609, - "step": 3098 - }, - { - "epoch": 0.08, - "learning_rate": 1.9872197441298534e-06, - "loss": 0.9365, - "step": 3099 - }, - { - "epoch": 0.08, - "learning_rate": 1.9872065115131057e-06, - "loss": 0.8657, - "step": 3100 - }, - { - "epoch": 0.08, - "learning_rate": 1.9871932720935103e-06, - "loss": 0.9648, - "step": 3101 - }, - { - "epoch": 0.08, - "learning_rate": 1.9871800258711586e-06, - "loss": 0.8789, - "step": 3102 - }, - { - "epoch": 0.08, - "learning_rate": 1.9871667728461427e-06, - "loss": 0.8555, - "step": 3103 - }, - { - "epoch": 0.08, - "learning_rate": 1.987153513018552e-06, - "loss": 0.9023, - "step": 3104 - }, - { - "epoch": 0.08, - "learning_rate": 1.98714024638848e-06, - "loss": 1.0361, - "step": 3105 - }, - { - "epoch": 0.08, - "learning_rate": 1.9871269729560164e-06, - "loss": 0.6875, - "step": 3106 - }, - { - "epoch": 0.08, - "learning_rate": 1.9871136927212538e-06, - "loss": 0.9385, - "step": 3107 - }, - { - "epoch": 0.08, - "learning_rate": 1.9871004056842833e-06, - "loss": 0.9941, - "step": 3108 - }, - { - "epoch": 0.08, - "learning_rate": 1.987087111845196e-06, - "loss": 0.604, - "step": 3109 - }, - { - "epoch": 0.08, - "learning_rate": 1.9870738112040845e-06, - "loss": 1.0596, - "step": 3110 - }, - { - "epoch": 0.08, - "learning_rate": 1.9870605037610396e-06, - "loss": 0.8696, - "step": 3111 - }, - { - "epoch": 0.08, - "learning_rate": 1.9870471895161533e-06, - "loss": 0.9336, - "step": 3112 - }, - { - "epoch": 0.08, - "learning_rate": 1.9870338684695174e-06, - "loss": 0.9424, - "step": 3113 - }, - { - "epoch": 0.08, - "learning_rate": 1.9870205406212235e-06, - "loss": 1.085, - "step": 3114 - }, - { - "epoch": 0.08, - "learning_rate": 1.987007205971364e-06, - "loss": 0.9434, - "step": 3115 - }, - { - "epoch": 0.08, - "learning_rate": 1.98699386452003e-06, - "loss": 1.0039, - "step": 3116 - }, - { - "epoch": 0.08, - "learning_rate": 1.9869805162673137e-06, - "loss": 0.8975, - "step": 3117 - }, - { - "epoch": 0.08, - "learning_rate": 1.9869671612133074e-06, - "loss": 0.9746, - "step": 3118 - }, - { - "epoch": 0.08, - "learning_rate": 1.9869537993581035e-06, - "loss": 1.0059, - "step": 3119 - }, - { - "epoch": 0.08, - "learning_rate": 1.9869404307017925e-06, - "loss": 1.1191, - "step": 3120 - }, - { - "epoch": 0.08, - "learning_rate": 1.9869270552444685e-06, - "loss": 1.0371, - "step": 3121 - }, - { - "epoch": 0.08, - "learning_rate": 1.986913672986222e-06, - "loss": 1.1426, - "step": 3122 - }, - { - "epoch": 0.08, - "learning_rate": 1.9869002839271464e-06, - "loss": 1.0234, - "step": 3123 - }, - { - "epoch": 0.08, - "learning_rate": 1.986886888067333e-06, - "loss": 0.9551, - "step": 3124 - }, - { - "epoch": 0.08, - "learning_rate": 1.986873485406875e-06, - "loss": 1.0537, - "step": 3125 - }, - { - "epoch": 0.08, - "learning_rate": 1.9868600759458644e-06, - "loss": 0.8486, - "step": 3126 - }, - { - "epoch": 0.08, - "learning_rate": 1.986846659684393e-06, - "loss": 0.8633, - "step": 3127 - }, - { - "epoch": 0.08, - "learning_rate": 1.9868332366225544e-06, - "loss": 0.8975, - "step": 3128 - }, - { - "epoch": 0.08, - "learning_rate": 1.98681980676044e-06, - "loss": 0.8994, - "step": 3129 - }, - { - "epoch": 0.08, - "learning_rate": 1.986806370098144e-06, - "loss": 0.7173, - "step": 3130 - }, - { - "epoch": 0.08, - "learning_rate": 1.9867929266357564e-06, - "loss": 0.9727, - "step": 3131 - }, - { - "epoch": 0.08, - "learning_rate": 1.986779476373372e-06, - "loss": 1.0381, - "step": 3132 - }, - { - "epoch": 0.08, - "learning_rate": 1.986766019311083e-06, - "loss": 1.0117, - "step": 3133 - }, - { - "epoch": 0.08, - "learning_rate": 1.9867525554489814e-06, - "loss": 0.8042, - "step": 3134 - }, - { - "epoch": 0.08, - "learning_rate": 1.9867390847871607e-06, - "loss": 0.957, - "step": 3135 - }, - { - "epoch": 0.08, - "learning_rate": 1.9867256073257136e-06, - "loss": 0.875, - "step": 3136 - }, - { - "epoch": 0.08, - "learning_rate": 1.986712123064733e-06, - "loss": 1.0723, - "step": 3137 - }, - { - "epoch": 0.08, - "learning_rate": 1.986698632004311e-06, - "loss": 1.0518, - "step": 3138 - }, - { - "epoch": 0.08, - "learning_rate": 1.986685134144542e-06, - "loss": 1.0625, - "step": 3139 - }, - { - "epoch": 0.08, - "learning_rate": 1.986671629485518e-06, - "loss": 0.6519, - "step": 3140 - }, - { - "epoch": 0.08, - "learning_rate": 1.9866581180273324e-06, - "loss": 0.7412, - "step": 3141 - }, - { - "epoch": 0.08, - "learning_rate": 1.986644599770078e-06, - "loss": 0.8452, - "step": 3142 - }, - { - "epoch": 0.08, - "learning_rate": 1.986631074713849e-06, - "loss": 0.8408, - "step": 3143 - }, - { - "epoch": 0.08, - "learning_rate": 1.986617542858737e-06, - "loss": 1.1816, - "step": 3144 - }, - { - "epoch": 0.08, - "learning_rate": 1.986604004204836e-06, - "loss": 1.04, - "step": 3145 - }, - { - "epoch": 0.08, - "learning_rate": 1.98659045875224e-06, - "loss": 0.9365, - "step": 3146 - }, - { - "epoch": 0.08, - "learning_rate": 1.986576906501041e-06, - "loss": 0.917, - "step": 3147 - }, - { - "epoch": 0.08, - "learning_rate": 1.9865633474513338e-06, - "loss": 1.0195, - "step": 3148 - }, - { - "epoch": 0.08, - "learning_rate": 1.9865497816032107e-06, - "loss": 1.0205, - "step": 3149 - }, - { - "epoch": 0.08, - "learning_rate": 1.9865362089567657e-06, - "loss": 0.9844, - "step": 3150 - }, - { - "epoch": 0.08, - "learning_rate": 1.9865226295120926e-06, - "loss": 0.8721, - "step": 3151 - }, - { - "epoch": 0.08, - "learning_rate": 1.986509043269284e-06, - "loss": 0.958, - "step": 3152 - }, - { - "epoch": 0.08, - "learning_rate": 1.9864954502284344e-06, - "loss": 1.1016, - "step": 3153 - }, - { - "epoch": 0.08, - "learning_rate": 1.9864818503896372e-06, - "loss": 0.9072, - "step": 3154 - }, - { - "epoch": 0.08, - "learning_rate": 1.986468243752986e-06, - "loss": 1.0371, - "step": 3155 - }, - { - "epoch": 0.08, - "learning_rate": 1.986454630318575e-06, - "loss": 0.9043, - "step": 3156 - }, - { - "epoch": 0.08, - "learning_rate": 1.9864410100864974e-06, - "loss": 1.0107, - "step": 3157 - }, - { - "epoch": 0.08, - "learning_rate": 1.9864273830568474e-06, - "loss": 0.9404, - "step": 3158 - }, - { - "epoch": 0.08, - "learning_rate": 1.9864137492297187e-06, - "loss": 0.7251, - "step": 3159 - }, - { - "epoch": 0.08, - "learning_rate": 1.986400108605205e-06, - "loss": 1.1445, - "step": 3160 - }, - { - "epoch": 0.08, - "learning_rate": 1.9863864611834018e-06, - "loss": 0.9609, - "step": 3161 - }, - { - "epoch": 0.08, - "learning_rate": 1.9863728069644016e-06, - "loss": 0.7861, - "step": 3162 - }, - { - "epoch": 0.08, - "learning_rate": 1.9863591459482988e-06, - "loss": 0.8867, - "step": 3163 - }, - { - "epoch": 0.08, - "learning_rate": 1.9863454781351877e-06, - "loss": 1.2627, - "step": 3164 - }, - { - "epoch": 0.08, - "learning_rate": 1.9863318035251623e-06, - "loss": 0.8125, - "step": 3165 - }, - { - "epoch": 0.08, - "learning_rate": 1.986318122118317e-06, - "loss": 0.9907, - "step": 3166 - }, - { - "epoch": 0.08, - "learning_rate": 1.9863044339147463e-06, - "loss": 1.0605, - "step": 3167 - }, - { - "epoch": 0.08, - "learning_rate": 1.9862907389145444e-06, - "loss": 0.8779, - "step": 3168 - }, - { - "epoch": 0.08, - "learning_rate": 1.9862770371178053e-06, - "loss": 0.8242, - "step": 3169 - }, - { - "epoch": 0.08, - "learning_rate": 1.986263328524624e-06, - "loss": 0.835, - "step": 3170 - }, - { - "epoch": 0.08, - "learning_rate": 1.986249613135094e-06, - "loss": 1.1562, - "step": 3171 - }, - { - "epoch": 0.08, - "learning_rate": 1.986235890949311e-06, - "loss": 0.8447, - "step": 3172 - }, - { - "epoch": 0.08, - "learning_rate": 1.9862221619673688e-06, - "loss": 0.8057, - "step": 3173 - }, - { - "epoch": 0.08, - "learning_rate": 1.9862084261893627e-06, - "loss": 0.8965, - "step": 3174 - }, - { - "epoch": 0.08, - "learning_rate": 1.9861946836153864e-06, - "loss": 1.126, - "step": 3175 - }, - { - "epoch": 0.08, - "learning_rate": 1.986180934245535e-06, - "loss": 1.1123, - "step": 3176 - }, - { - "epoch": 0.08, - "learning_rate": 1.986167178079904e-06, - "loss": 0.9248, - "step": 3177 - }, - { - "epoch": 0.08, - "learning_rate": 1.986153415118587e-06, - "loss": 0.9414, - "step": 3178 - }, - { - "epoch": 0.08, - "learning_rate": 1.9861396453616793e-06, - "loss": 1.0205, - "step": 3179 - }, - { - "epoch": 0.08, - "learning_rate": 1.986125868809276e-06, - "loss": 0.9067, - "step": 3180 - }, - { - "epoch": 0.08, - "learning_rate": 1.986112085461472e-06, - "loss": 0.9961, - "step": 3181 - }, - { - "epoch": 0.08, - "learning_rate": 1.986098295318362e-06, - "loss": 0.7607, - "step": 3182 - }, - { - "epoch": 0.08, - "learning_rate": 1.9860844983800415e-06, - "loss": 1.1641, - "step": 3183 - }, - { - "epoch": 0.08, - "learning_rate": 1.9860706946466048e-06, - "loss": 0.9355, - "step": 3184 - }, - { - "epoch": 0.08, - "learning_rate": 1.9860568841181478e-06, - "loss": 0.8818, - "step": 3185 - }, - { - "epoch": 0.08, - "learning_rate": 1.9860430667947654e-06, - "loss": 0.7275, - "step": 3186 - }, - { - "epoch": 0.08, - "learning_rate": 1.9860292426765524e-06, - "loss": 1.0098, - "step": 3187 - }, - { - "epoch": 0.08, - "learning_rate": 1.986015411763605e-06, - "loss": 0.8857, - "step": 3188 - }, - { - "epoch": 0.08, - "learning_rate": 1.986001574056018e-06, - "loss": 0.7896, - "step": 3189 - }, - { - "epoch": 0.08, - "learning_rate": 1.985987729553886e-06, - "loss": 0.7422, - "step": 3190 - }, - { - "epoch": 0.08, - "learning_rate": 1.9859738782573053e-06, - "loss": 0.9219, - "step": 3191 - }, - { - "epoch": 0.08, - "learning_rate": 1.9859600201663716e-06, - "loss": 0.9688, - "step": 3192 - }, - { - "epoch": 0.08, - "learning_rate": 1.9859461552811795e-06, - "loss": 0.666, - "step": 3193 - }, - { - "epoch": 0.08, - "learning_rate": 1.985932283601825e-06, - "loss": 0.8091, - "step": 3194 - }, - { - "epoch": 0.08, - "learning_rate": 1.985918405128404e-06, - "loss": 0.8887, - "step": 3195 - }, - { - "epoch": 0.08, - "learning_rate": 1.9859045198610114e-06, - "loss": 0.9834, - "step": 3196 - }, - { - "epoch": 0.08, - "learning_rate": 1.985890627799744e-06, - "loss": 1.0039, - "step": 3197 - }, - { - "epoch": 0.08, - "learning_rate": 1.9858767289446965e-06, - "loss": 0.9893, - "step": 3198 - }, - { - "epoch": 0.08, - "learning_rate": 1.9858628232959646e-06, - "loss": 0.9639, - "step": 3199 - }, - { - "epoch": 0.08, - "learning_rate": 1.985848910853645e-06, - "loss": 0.9043, - "step": 3200 - }, - { - "epoch": 0.08, - "learning_rate": 1.985834991617833e-06, - "loss": 0.7871, - "step": 3201 - }, - { - "epoch": 0.08, - "learning_rate": 1.9858210655886246e-06, - "loss": 0.7026, - "step": 3202 - }, - { - "epoch": 0.08, - "learning_rate": 1.985807132766116e-06, - "loss": 1.1328, - "step": 3203 - }, - { - "epoch": 0.08, - "learning_rate": 1.985793193150403e-06, - "loss": 0.8682, - "step": 3204 - }, - { - "epoch": 0.08, - "learning_rate": 1.985779246741581e-06, - "loss": 0.916, - "step": 3205 - }, - { - "epoch": 0.08, - "learning_rate": 1.9857652935397475e-06, - "loss": 0.6958, - "step": 3206 - }, - { - "epoch": 0.08, - "learning_rate": 1.9857513335449976e-06, - "loss": 0.7896, - "step": 3207 - }, - { - "epoch": 0.08, - "learning_rate": 1.9857373667574276e-06, - "loss": 1.0303, - "step": 3208 - }, - { - "epoch": 0.08, - "learning_rate": 1.9857233931771344e-06, - "loss": 0.9863, - "step": 3209 - }, - { - "epoch": 0.08, - "learning_rate": 1.985709412804214e-06, - "loss": 0.7676, - "step": 3210 - }, - { - "epoch": 0.08, - "learning_rate": 1.985695425638762e-06, - "loss": 0.8838, - "step": 3211 - }, - { - "epoch": 0.08, - "learning_rate": 1.9856814316808756e-06, - "loss": 1.0674, - "step": 3212 - }, - { - "epoch": 0.08, - "learning_rate": 1.985667430930651e-06, - "loss": 0.8101, - "step": 3213 - }, - { - "epoch": 0.08, - "learning_rate": 1.9856534233881846e-06, - "loss": 0.6655, - "step": 3214 - }, - { - "epoch": 0.08, - "learning_rate": 1.9856394090535734e-06, - "loss": 0.9443, - "step": 3215 - }, - { - "epoch": 0.08, - "learning_rate": 1.985625387926913e-06, - "loss": 0.8696, - "step": 3216 - }, - { - "epoch": 0.08, - "learning_rate": 1.985611360008301e-06, - "loss": 0.9023, - "step": 3217 - }, - { - "epoch": 0.08, - "learning_rate": 1.9855973252978338e-06, - "loss": 0.9639, - "step": 3218 - }, - { - "epoch": 0.08, - "learning_rate": 1.985583283795608e-06, - "loss": 0.8926, - "step": 3219 - }, - { - "epoch": 0.08, - "learning_rate": 1.98556923550172e-06, - "loss": 0.7139, - "step": 3220 - }, - { - "epoch": 0.08, - "learning_rate": 1.985555180416267e-06, - "loss": 0.8086, - "step": 3221 - }, - { - "epoch": 0.08, - "learning_rate": 1.985541118539346e-06, - "loss": 0.7598, - "step": 3222 - }, - { - "epoch": 0.08, - "learning_rate": 1.9855270498710536e-06, - "loss": 0.9248, - "step": 3223 - }, - { - "epoch": 0.08, - "learning_rate": 1.985512974411487e-06, - "loss": 0.6973, - "step": 3224 - }, - { - "epoch": 0.08, - "learning_rate": 1.985498892160743e-06, - "loss": 0.7969, - "step": 3225 - }, - { - "epoch": 0.08, - "learning_rate": 1.9854848031189183e-06, - "loss": 0.8638, - "step": 3226 - }, - { - "epoch": 0.08, - "learning_rate": 1.985470707286111e-06, - "loss": 1.0127, - "step": 3227 - }, - { - "epoch": 0.08, - "learning_rate": 1.985456604662417e-06, - "loss": 1.1738, - "step": 3228 - }, - { - "epoch": 0.08, - "learning_rate": 1.9854424952479343e-06, - "loss": 0.8657, - "step": 3229 - }, - { - "epoch": 0.08, - "learning_rate": 1.98542837904276e-06, - "loss": 0.7275, - "step": 3230 - }, - { - "epoch": 0.08, - "learning_rate": 1.9854142560469914e-06, - "loss": 0.8442, - "step": 3231 - }, - { - "epoch": 0.08, - "learning_rate": 1.9854001262607255e-06, - "loss": 0.9961, - "step": 3232 - }, - { - "epoch": 0.08, - "learning_rate": 1.98538598968406e-06, - "loss": 1.125, - "step": 3233 - }, - { - "epoch": 0.08, - "learning_rate": 1.9853718463170925e-06, - "loss": 1.0234, - "step": 3234 - }, - { - "epoch": 0.08, - "learning_rate": 1.9853576961599198e-06, - "loss": 1.0391, - "step": 3235 - }, - { - "epoch": 0.08, - "learning_rate": 1.9853435392126395e-06, - "loss": 1.0684, - "step": 3236 - }, - { - "epoch": 0.08, - "learning_rate": 1.98532937547535e-06, - "loss": 0.8672, - "step": 3237 - }, - { - "epoch": 0.08, - "learning_rate": 1.985315204948148e-06, - "loss": 1.0742, - "step": 3238 - }, - { - "epoch": 0.08, - "learning_rate": 1.9853010276311318e-06, - "loss": 0.9111, - "step": 3239 - }, - { - "epoch": 0.08, - "learning_rate": 1.9852868435243986e-06, - "loss": 0.8818, - "step": 3240 - }, - { - "epoch": 0.08, - "learning_rate": 1.9852726526280463e-06, - "loss": 1.0518, - "step": 3241 - }, - { - "epoch": 0.08, - "learning_rate": 1.9852584549421727e-06, - "loss": 0.8701, - "step": 3242 - }, - { - "epoch": 0.08, - "learning_rate": 1.9852442504668755e-06, - "loss": 0.9092, - "step": 3243 - }, - { - "epoch": 0.08, - "learning_rate": 1.985230039202253e-06, - "loss": 0.9404, - "step": 3244 - }, - { - "epoch": 0.08, - "learning_rate": 1.985215821148403e-06, - "loss": 0.8145, - "step": 3245 - }, - { - "epoch": 0.08, - "learning_rate": 1.9852015963054226e-06, - "loss": 0.8525, - "step": 3246 - }, - { - "epoch": 0.08, - "learning_rate": 1.985187364673411e-06, - "loss": 0.8701, - "step": 3247 - }, - { - "epoch": 0.08, - "learning_rate": 1.985173126252466e-06, - "loss": 0.9111, - "step": 3248 - }, - { - "epoch": 0.08, - "learning_rate": 1.9851588810426853e-06, - "loss": 1.0, - "step": 3249 - }, - { - "epoch": 0.08, - "learning_rate": 1.9851446290441675e-06, - "loss": 1.0293, - "step": 3250 - }, - { - "epoch": 0.08, - "learning_rate": 1.9851303702570102e-06, - "loss": 0.8877, - "step": 3251 - }, - { - "epoch": 0.08, - "learning_rate": 1.9851161046813125e-06, - "loss": 0.9023, - "step": 3252 - }, - { - "epoch": 0.08, - "learning_rate": 1.985101832317172e-06, - "loss": 0.8955, - "step": 3253 - }, - { - "epoch": 0.08, - "learning_rate": 1.9850875531646877e-06, - "loss": 0.6221, - "step": 3254 - }, - { - "epoch": 0.08, - "learning_rate": 1.9850732672239576e-06, - "loss": 0.8716, - "step": 3255 - }, - { - "epoch": 0.08, - "learning_rate": 1.98505897449508e-06, - "loss": 0.9668, - "step": 3256 - }, - { - "epoch": 0.08, - "learning_rate": 1.9850446749781533e-06, - "loss": 0.8262, - "step": 3257 - }, - { - "epoch": 0.08, - "learning_rate": 1.985030368673277e-06, - "loss": 0.8501, - "step": 3258 - }, - { - "epoch": 0.08, - "learning_rate": 1.9850160555805483e-06, - "loss": 0.9023, - "step": 3259 - }, - { - "epoch": 0.08, - "learning_rate": 1.985001735700067e-06, - "loss": 1.0498, - "step": 3260 - }, - { - "epoch": 0.08, - "learning_rate": 1.9849874090319306e-06, - "loss": 0.9395, - "step": 3261 - }, - { - "epoch": 0.08, - "learning_rate": 1.9849730755762394e-06, - "loss": 1.0752, - "step": 3262 - }, - { - "epoch": 0.08, - "learning_rate": 1.9849587353330906e-06, - "loss": 0.8926, - "step": 3263 - }, - { - "epoch": 0.08, - "learning_rate": 1.9849443883025842e-06, - "loss": 1.0176, - "step": 3264 - }, - { - "epoch": 0.08, - "learning_rate": 1.9849300344848185e-06, - "loss": 0.9248, - "step": 3265 - }, - { - "epoch": 0.08, - "learning_rate": 1.984915673879892e-06, - "loss": 0.7703, - "step": 3266 - }, - { - "epoch": 0.08, - "learning_rate": 1.9849013064879047e-06, - "loss": 0.9951, - "step": 3267 - }, - { - "epoch": 0.08, - "learning_rate": 1.984886932308955e-06, - "loss": 1.0205, - "step": 3268 - }, - { - "epoch": 0.08, - "learning_rate": 1.984872551343142e-06, - "loss": 1.1758, - "step": 3269 - }, - { - "epoch": 0.08, - "learning_rate": 1.9848581635905647e-06, - "loss": 1.0186, - "step": 3270 - }, - { - "epoch": 0.08, - "learning_rate": 1.984843769051322e-06, - "loss": 0.7812, - "step": 3271 - }, - { - "epoch": 0.08, - "learning_rate": 1.984829367725514e-06, - "loss": 0.8828, - "step": 3272 - }, - { - "epoch": 0.08, - "learning_rate": 1.9848149596132393e-06, - "loss": 0.8276, - "step": 3273 - }, - { - "epoch": 0.08, - "learning_rate": 1.984800544714597e-06, - "loss": 0.8643, - "step": 3274 - }, - { - "epoch": 0.08, - "learning_rate": 1.984786123029687e-06, - "loss": 1.0312, - "step": 3275 - }, - { - "epoch": 0.08, - "learning_rate": 1.9847716945586085e-06, - "loss": 0.998, - "step": 3276 - }, - { - "epoch": 0.08, - "learning_rate": 1.9847572593014604e-06, - "loss": 0.9189, - "step": 3277 - }, - { - "epoch": 0.08, - "learning_rate": 1.984742817258343e-06, - "loss": 1.2344, - "step": 3278 - }, - { - "epoch": 0.08, - "learning_rate": 1.984728368429355e-06, - "loss": 1.0449, - "step": 3279 - }, - { - "epoch": 0.08, - "learning_rate": 1.9847139128145966e-06, - "loss": 0.8521, - "step": 3280 - }, - { - "epoch": 0.08, - "learning_rate": 1.984699450414167e-06, - "loss": 1.0049, - "step": 3281 - }, - { - "epoch": 0.08, - "learning_rate": 1.9846849812281664e-06, - "loss": 0.8672, - "step": 3282 - }, - { - "epoch": 0.08, - "learning_rate": 1.984670505256694e-06, - "loss": 0.8438, - "step": 3283 - }, - { - "epoch": 0.08, - "learning_rate": 1.9846560224998496e-06, - "loss": 1.0605, - "step": 3284 - }, - { - "epoch": 0.08, - "learning_rate": 1.984641532957733e-06, - "loss": 1.0947, - "step": 3285 - }, - { - "epoch": 0.08, - "learning_rate": 1.9846270366304443e-06, - "loss": 0.5449, - "step": 3286 - }, - { - "epoch": 0.08, - "learning_rate": 1.9846125335180835e-06, - "loss": 1.2373, - "step": 3287 - }, - { - "epoch": 0.08, - "learning_rate": 1.98459802362075e-06, - "loss": 1.0996, - "step": 3288 - }, - { - "epoch": 0.08, - "learning_rate": 1.984583506938544e-06, - "loss": 0.9277, - "step": 3289 - }, - { - "epoch": 0.08, - "learning_rate": 1.984568983471566e-06, - "loss": 0.917, - "step": 3290 - }, - { - "epoch": 0.08, - "learning_rate": 1.9845544532199155e-06, - "loss": 0.9365, - "step": 3291 - }, - { - "epoch": 0.08, - "learning_rate": 1.984539916183693e-06, - "loss": 1.1699, - "step": 3292 - }, - { - "epoch": 0.08, - "learning_rate": 1.984525372362998e-06, - "loss": 0.8091, - "step": 3293 - }, - { - "epoch": 0.08, - "learning_rate": 1.9845108217579314e-06, - "loss": 0.8423, - "step": 3294 - }, - { - "epoch": 0.08, - "learning_rate": 1.984496264368594e-06, - "loss": 0.7661, - "step": 3295 - }, - { - "epoch": 0.08, - "learning_rate": 1.9844817001950843e-06, - "loss": 0.8066, - "step": 3296 - }, - { - "epoch": 0.08, - "learning_rate": 1.984467129237504e-06, - "loss": 0.8682, - "step": 3297 - }, - { - "epoch": 0.08, - "learning_rate": 1.9844525514959536e-06, - "loss": 0.8389, - "step": 3298 - }, - { - "epoch": 0.08, - "learning_rate": 1.9844379669705336e-06, - "loss": 0.8477, - "step": 3299 - }, - { - "epoch": 0.08, - "learning_rate": 1.9844233756613436e-06, - "loss": 1.127, - "step": 3300 - }, - { - "epoch": 0.08, - "learning_rate": 1.984408777568485e-06, - "loss": 0.9746, - "step": 3301 - }, - { - "epoch": 0.08, - "learning_rate": 1.9843941726920577e-06, - "loss": 1.208, - "step": 3302 - }, - { - "epoch": 0.08, - "learning_rate": 1.984379561032163e-06, - "loss": 1.166, - "step": 3303 - }, - { - "epoch": 0.08, - "learning_rate": 1.984364942588901e-06, - "loss": 0.8877, - "step": 3304 - }, - { - "epoch": 0.08, - "learning_rate": 1.984350317362373e-06, - "loss": 1.1562, - "step": 3305 - }, - { - "epoch": 0.08, - "learning_rate": 1.9843356853526795e-06, - "loss": 0.9668, - "step": 3306 - }, - { - "epoch": 0.08, - "learning_rate": 1.9843210465599215e-06, - "loss": 0.8662, - "step": 3307 - }, - { - "epoch": 0.08, - "learning_rate": 1.9843064009841995e-06, - "loss": 0.9365, - "step": 3308 - }, - { - "epoch": 0.08, - "learning_rate": 1.9842917486256146e-06, - "loss": 0.9268, - "step": 3309 - }, - { - "epoch": 0.08, - "learning_rate": 1.984277089484268e-06, - "loss": 0.9473, - "step": 3310 - }, - { - "epoch": 0.08, - "learning_rate": 1.9842624235602606e-06, - "loss": 0.8711, - "step": 3311 - }, - { - "epoch": 0.08, - "learning_rate": 1.9842477508536934e-06, - "loss": 1.1396, - "step": 3312 - }, - { - "epoch": 0.08, - "learning_rate": 1.984233071364667e-06, - "loss": 0.9805, - "step": 3313 - }, - { - "epoch": 0.08, - "learning_rate": 1.984218385093284e-06, - "loss": 0.8716, - "step": 3314 - }, - { - "epoch": 0.08, - "learning_rate": 1.984203692039644e-06, - "loss": 0.8896, - "step": 3315 - }, - { - "epoch": 0.08, - "learning_rate": 1.984188992203849e-06, - "loss": 0.8955, - "step": 3316 - }, - { - "epoch": 0.09, - "learning_rate": 1.984174285586e-06, - "loss": 0.9785, - "step": 3317 - }, - { - "epoch": 0.09, - "learning_rate": 1.9841595721861993e-06, - "loss": 0.8145, - "step": 3318 - }, - { - "epoch": 0.09, - "learning_rate": 1.984144852004547e-06, - "loss": 0.8926, - "step": 3319 - }, - { - "epoch": 0.09, - "learning_rate": 1.984130125041145e-06, - "loss": 0.9863, - "step": 3320 - }, - { - "epoch": 0.09, - "learning_rate": 1.984115391296095e-06, - "loss": 0.9766, - "step": 3321 - }, - { - "epoch": 0.09, - "learning_rate": 1.9841006507694987e-06, - "loss": 0.9287, - "step": 3322 - }, - { - "epoch": 0.09, - "learning_rate": 1.984085903461457e-06, - "loss": 1.1035, - "step": 3323 - }, - { - "epoch": 0.09, - "learning_rate": 1.984071149372072e-06, - "loss": 1.0615, - "step": 3324 - }, - { - "epoch": 0.09, - "learning_rate": 1.9840563885014456e-06, - "loss": 0.9932, - "step": 3325 - }, - { - "epoch": 0.09, - "learning_rate": 1.984041620849679e-06, - "loss": 0.8818, - "step": 3326 - }, - { - "epoch": 0.09, - "learning_rate": 1.9840268464168738e-06, - "loss": 0.9248, - "step": 3327 - }, - { - "epoch": 0.09, - "learning_rate": 1.9840120652031325e-06, - "loss": 0.9883, - "step": 3328 - }, - { - "epoch": 0.09, - "learning_rate": 1.9839972772085566e-06, - "loss": 0.9463, - "step": 3329 - }, - { - "epoch": 0.09, - "learning_rate": 1.983982482433248e-06, - "loss": 1.0312, - "step": 3330 - }, - { - "epoch": 0.09, - "learning_rate": 1.983967680877309e-06, - "loss": 0.8433, - "step": 3331 - }, - { - "epoch": 0.09, - "learning_rate": 1.983952872540841e-06, - "loss": 0.8613, - "step": 3332 - }, - { - "epoch": 0.09, - "learning_rate": 1.983938057423946e-06, - "loss": 1.041, - "step": 3333 - }, - { - "epoch": 0.09, - "learning_rate": 1.983923235526727e-06, - "loss": 0.874, - "step": 3334 - }, - { - "epoch": 0.09, - "learning_rate": 1.983908406849285e-06, - "loss": 0.8486, - "step": 3335 - }, - { - "epoch": 0.09, - "learning_rate": 1.9838935713917234e-06, - "loss": 0.7642, - "step": 3336 - }, - { - "epoch": 0.09, - "learning_rate": 1.983878729154143e-06, - "loss": 0.9082, - "step": 3337 - }, - { - "epoch": 0.09, - "learning_rate": 1.9838638801366476e-06, - "loss": 0.8296, - "step": 3338 - }, - { - "epoch": 0.09, - "learning_rate": 1.9838490243393383e-06, - "loss": 1.1025, - "step": 3339 - }, - { - "epoch": 0.09, - "learning_rate": 1.983834161762318e-06, - "loss": 0.9434, - "step": 3340 - }, - { - "epoch": 0.09, - "learning_rate": 1.983819292405689e-06, - "loss": 0.9658, - "step": 3341 - }, - { - "epoch": 0.09, - "learning_rate": 1.983804416269554e-06, - "loss": 0.7695, - "step": 3342 - }, - { - "epoch": 0.09, - "learning_rate": 1.9837895333540153e-06, - "loss": 0.8457, - "step": 3343 - }, - { - "epoch": 0.09, - "learning_rate": 1.983774643659175e-06, - "loss": 0.9414, - "step": 3344 - }, - { - "epoch": 0.09, - "learning_rate": 1.983759747185137e-06, - "loss": 1.1035, - "step": 3345 - }, - { - "epoch": 0.09, - "learning_rate": 1.9837448439320025e-06, - "loss": 1.0527, - "step": 3346 - }, - { - "epoch": 0.09, - "learning_rate": 1.9837299338998753e-06, - "loss": 0.9824, - "step": 3347 - }, - { - "epoch": 0.09, - "learning_rate": 1.9837150170888575e-06, - "loss": 0.9062, - "step": 3348 - }, - { - "epoch": 0.09, - "learning_rate": 1.9837000934990523e-06, - "loss": 0.9463, - "step": 3349 - }, - { - "epoch": 0.09, - "learning_rate": 1.983685163130562e-06, - "loss": 0.9443, - "step": 3350 - }, - { - "epoch": 0.09, - "learning_rate": 1.98367022598349e-06, - "loss": 1.0566, - "step": 3351 - }, - { - "epoch": 0.09, - "learning_rate": 1.9836552820579387e-06, - "loss": 0.8633, - "step": 3352 - }, - { - "epoch": 0.09, - "learning_rate": 1.983640331354012e-06, - "loss": 1.0088, - "step": 3353 - }, - { - "epoch": 0.09, - "learning_rate": 1.983625373871812e-06, - "loss": 1.1172, - "step": 3354 - }, - { - "epoch": 0.09, - "learning_rate": 1.983610409611442e-06, - "loss": 0.9316, - "step": 3355 - }, - { - "epoch": 0.09, - "learning_rate": 1.9835954385730056e-06, - "loss": 0.8877, - "step": 3356 - }, - { - "epoch": 0.09, - "learning_rate": 1.9835804607566056e-06, - "loss": 0.8691, - "step": 3357 - }, - { - "epoch": 0.09, - "learning_rate": 1.983565476162345e-06, - "loss": 0.9854, - "step": 3358 - }, - { - "epoch": 0.09, - "learning_rate": 1.9835504847903274e-06, - "loss": 0.8721, - "step": 3359 - }, - { - "epoch": 0.09, - "learning_rate": 1.983535486640656e-06, - "loss": 0.8423, - "step": 3360 - }, - { - "epoch": 0.09, - "learning_rate": 1.983520481713434e-06, - "loss": 1.0791, - "step": 3361 - }, - { - "epoch": 0.09, - "learning_rate": 1.983505470008765e-06, - "loss": 0.8301, - "step": 3362 - }, - { - "epoch": 0.09, - "learning_rate": 1.983490451526752e-06, - "loss": 1.0576, - "step": 3363 - }, - { - "epoch": 0.09, - "learning_rate": 1.9834754262674995e-06, - "loss": 1.0068, - "step": 3364 - }, - { - "epoch": 0.09, - "learning_rate": 1.98346039423111e-06, - "loss": 0.9512, - "step": 3365 - }, - { - "epoch": 0.09, - "learning_rate": 1.9834453554176874e-06, - "loss": 0.998, - "step": 3366 - }, - { - "epoch": 0.09, - "learning_rate": 1.9834303098273357e-06, - "loss": 0.9092, - "step": 3367 - }, - { - "epoch": 0.09, - "learning_rate": 1.9834152574601584e-06, - "loss": 0.8926, - "step": 3368 - }, - { - "epoch": 0.09, - "learning_rate": 1.983400198316259e-06, - "loss": 0.9404, - "step": 3369 - }, - { - "epoch": 0.09, - "learning_rate": 1.983385132395741e-06, - "loss": 0.8965, - "step": 3370 - }, - { - "epoch": 0.09, - "learning_rate": 1.9833700596987093e-06, - "loss": 0.9102, - "step": 3371 - }, - { - "epoch": 0.09, - "learning_rate": 1.983354980225267e-06, - "loss": 1.0439, - "step": 3372 - }, - { - "epoch": 0.09, - "learning_rate": 1.9833398939755176e-06, - "loss": 0.9551, - "step": 3373 - }, - { - "epoch": 0.09, - "learning_rate": 1.9833248009495658e-06, - "loss": 0.9688, - "step": 3374 - }, - { - "epoch": 0.09, - "learning_rate": 1.9833097011475155e-06, - "loss": 0.7656, - "step": 3375 - }, - { - "epoch": 0.09, - "learning_rate": 1.98329459456947e-06, - "loss": 0.8447, - "step": 3376 - }, - { - "epoch": 0.09, - "learning_rate": 1.9832794812155353e-06, - "loss": 1.0879, - "step": 3377 - }, - { - "epoch": 0.09, - "learning_rate": 1.9832643610858133e-06, - "loss": 1.123, - "step": 3378 - }, - { - "epoch": 0.09, - "learning_rate": 1.9832492341804095e-06, - "loss": 0.9346, - "step": 3379 - }, - { - "epoch": 0.09, - "learning_rate": 1.983234100499428e-06, - "loss": 0.9829, - "step": 3380 - }, - { - "epoch": 0.09, - "learning_rate": 1.983218960042972e-06, - "loss": 0.8594, - "step": 3381 - }, - { - "epoch": 0.09, - "learning_rate": 1.9832038128111473e-06, - "loss": 0.8994, - "step": 3382 - }, - { - "epoch": 0.09, - "learning_rate": 1.983188658804058e-06, - "loss": 1.0859, - "step": 3383 - }, - { - "epoch": 0.09, - "learning_rate": 1.983173498021808e-06, - "loss": 1.0703, - "step": 3384 - }, - { - "epoch": 0.09, - "learning_rate": 1.983158330464502e-06, - "loss": 1.0625, - "step": 3385 - }, - { - "epoch": 0.09, - "learning_rate": 1.983143156132244e-06, - "loss": 1.0137, - "step": 3386 - }, - { - "epoch": 0.09, - "learning_rate": 1.9831279750251396e-06, - "loss": 0.9873, - "step": 3387 - }, - { - "epoch": 0.09, - "learning_rate": 1.983112787143293e-06, - "loss": 0.9355, - "step": 3388 - }, - { - "epoch": 0.09, - "learning_rate": 1.9830975924868083e-06, - "loss": 0.7539, - "step": 3389 - }, - { - "epoch": 0.09, - "learning_rate": 1.9830823910557914e-06, - "loss": 0.8418, - "step": 3390 - }, - { - "epoch": 0.09, - "learning_rate": 1.9830671828503456e-06, - "loss": 0.7686, - "step": 3391 - }, - { - "epoch": 0.09, - "learning_rate": 1.9830519678705767e-06, - "loss": 0.9814, - "step": 3392 - }, - { - "epoch": 0.09, - "learning_rate": 1.983036746116589e-06, - "loss": 0.8325, - "step": 3393 - }, - { - "epoch": 0.09, - "learning_rate": 1.983021517588488e-06, - "loss": 0.7979, - "step": 3394 - }, - { - "epoch": 0.09, - "learning_rate": 1.983006282286378e-06, - "loss": 1.0898, - "step": 3395 - }, - { - "epoch": 0.09, - "learning_rate": 1.982991040210365e-06, - "loss": 0.9238, - "step": 3396 - }, - { - "epoch": 0.09, - "learning_rate": 1.9829757913605526e-06, - "loss": 0.9756, - "step": 3397 - }, - { - "epoch": 0.09, - "learning_rate": 1.9829605357370466e-06, - "loss": 0.9873, - "step": 3398 - }, - { - "epoch": 0.09, - "learning_rate": 1.9829452733399523e-06, - "loss": 0.6626, - "step": 3399 - }, - { - "epoch": 0.09, - "learning_rate": 1.982930004169375e-06, - "loss": 0.9766, - "step": 3400 - }, - { - "epoch": 0.09, - "learning_rate": 1.982914728225419e-06, - "loss": 0.6255, - "step": 3401 - }, - { - "epoch": 0.09, - "learning_rate": 1.9828994455081907e-06, - "loss": 0.9238, - "step": 3402 - }, - { - "epoch": 0.09, - "learning_rate": 1.9828841560177947e-06, - "loss": 1.0459, - "step": 3403 - }, - { - "epoch": 0.09, - "learning_rate": 1.9828688597543365e-06, - "loss": 1.1904, - "step": 3404 - }, - { - "epoch": 0.09, - "learning_rate": 1.9828535567179216e-06, - "loss": 0.897, - "step": 3405 - }, - { - "epoch": 0.09, - "learning_rate": 1.9828382469086554e-06, - "loss": 1.0635, - "step": 3406 - }, - { - "epoch": 0.09, - "learning_rate": 1.9828229303266437e-06, - "loss": 0.9521, - "step": 3407 - }, - { - "epoch": 0.09, - "learning_rate": 1.9828076069719916e-06, - "loss": 0.9014, - "step": 3408 - }, - { - "epoch": 0.09, - "learning_rate": 1.9827922768448046e-06, - "loss": 0.9609, - "step": 3409 - }, - { - "epoch": 0.09, - "learning_rate": 1.9827769399451886e-06, - "loss": 0.9697, - "step": 3410 - }, - { - "epoch": 0.09, - "learning_rate": 1.9827615962732498e-06, - "loss": 0.8291, - "step": 3411 - }, - { - "epoch": 0.09, - "learning_rate": 1.982746245829093e-06, - "loss": 0.8745, - "step": 3412 - }, - { - "epoch": 0.09, - "learning_rate": 1.9827308886128244e-06, - "loss": 1.0225, - "step": 3413 - }, - { - "epoch": 0.09, - "learning_rate": 1.9827155246245497e-06, - "loss": 0.7676, - "step": 3414 - }, - { - "epoch": 0.09, - "learning_rate": 1.9827001538643752e-06, - "loss": 0.9854, - "step": 3415 - }, - { - "epoch": 0.09, - "learning_rate": 1.9826847763324066e-06, - "loss": 1.0684, - "step": 3416 - }, - { - "epoch": 0.09, - "learning_rate": 1.9826693920287496e-06, - "loss": 0.8672, - "step": 3417 - }, - { - "epoch": 0.09, - "learning_rate": 1.98265400095351e-06, - "loss": 0.9668, - "step": 3418 - }, - { - "epoch": 0.09, - "learning_rate": 1.9826386031067946e-06, - "loss": 0.8311, - "step": 3419 - }, - { - "epoch": 0.09, - "learning_rate": 1.9826231984887096e-06, - "loss": 1.0596, - "step": 3420 - }, - { - "epoch": 0.09, - "learning_rate": 1.98260778709936e-06, - "loss": 0.8618, - "step": 3421 - }, - { - "epoch": 0.09, - "learning_rate": 1.982592368938853e-06, - "loss": 0.8994, - "step": 3422 - }, - { - "epoch": 0.09, - "learning_rate": 1.9825769440072947e-06, - "loss": 0.998, - "step": 3423 - }, - { - "epoch": 0.09, - "learning_rate": 1.9825615123047913e-06, - "loss": 0.8701, - "step": 3424 - }, - { - "epoch": 0.09, - "learning_rate": 1.9825460738314486e-06, - "loss": 1.0703, - "step": 3425 - }, - { - "epoch": 0.09, - "learning_rate": 1.9825306285873744e-06, - "loss": 0.9551, - "step": 3426 - }, - { - "epoch": 0.09, - "learning_rate": 1.982515176572673e-06, - "loss": 1.0049, - "step": 3427 - }, - { - "epoch": 0.09, - "learning_rate": 1.9824997177874533e-06, - "loss": 0.9814, - "step": 3428 - }, - { - "epoch": 0.09, - "learning_rate": 1.9824842522318195e-06, - "loss": 0.9756, - "step": 3429 - }, - { - "epoch": 0.09, - "learning_rate": 1.98246877990588e-06, - "loss": 0.9854, - "step": 3430 - }, - { - "epoch": 0.09, - "learning_rate": 1.9824533008097407e-06, - "loss": 0.8311, - "step": 3431 - }, - { - "epoch": 0.09, - "learning_rate": 1.9824378149435083e-06, - "loss": 0.7773, - "step": 3432 - }, - { - "epoch": 0.09, - "learning_rate": 1.9824223223072893e-06, - "loss": 1.0459, - "step": 3433 - }, - { - "epoch": 0.09, - "learning_rate": 1.982406822901191e-06, - "loss": 1.1885, - "step": 3434 - }, - { - "epoch": 0.09, - "learning_rate": 1.9823913167253195e-06, - "loss": 0.8291, - "step": 3435 - }, - { - "epoch": 0.09, - "learning_rate": 1.9823758037797818e-06, - "loss": 0.7935, - "step": 3436 - }, - { - "epoch": 0.09, - "learning_rate": 1.9823602840646856e-06, - "loss": 0.668, - "step": 3437 - }, - { - "epoch": 0.09, - "learning_rate": 1.9823447575801368e-06, - "loss": 0.8765, - "step": 3438 - }, - { - "epoch": 0.09, - "learning_rate": 1.982329224326243e-06, - "loss": 1.0137, - "step": 3439 - }, - { - "epoch": 0.09, - "learning_rate": 1.982313684303111e-06, - "loss": 1.083, - "step": 3440 - }, - { - "epoch": 0.09, - "learning_rate": 1.982298137510848e-06, - "loss": 0.9062, - "step": 3441 - }, - { - "epoch": 0.09, - "learning_rate": 1.9822825839495613e-06, - "loss": 0.9541, - "step": 3442 - }, - { - "epoch": 0.09, - "learning_rate": 1.982267023619358e-06, - "loss": 0.9253, - "step": 3443 - }, - { - "epoch": 0.09, - "learning_rate": 1.9822514565203448e-06, - "loss": 0.9795, - "step": 3444 - }, - { - "epoch": 0.09, - "learning_rate": 1.9822358826526298e-06, - "loss": 1.0156, - "step": 3445 - }, - { - "epoch": 0.09, - "learning_rate": 1.98222030201632e-06, - "loss": 0.8994, - "step": 3446 - }, - { - "epoch": 0.09, - "learning_rate": 1.982204714611522e-06, - "loss": 0.854, - "step": 3447 - }, - { - "epoch": 0.09, - "learning_rate": 1.9821891204383444e-06, - "loss": 1.0479, - "step": 3448 - }, - { - "epoch": 0.09, - "learning_rate": 1.982173519496894e-06, - "loss": 1.0957, - "step": 3449 - }, - { - "epoch": 0.09, - "learning_rate": 1.9821579117872787e-06, - "loss": 1.2402, - "step": 3450 - }, - { - "epoch": 0.09, - "learning_rate": 1.9821422973096054e-06, - "loss": 0.9775, - "step": 3451 - }, - { - "epoch": 0.09, - "learning_rate": 1.9821266760639826e-06, - "loss": 0.9121, - "step": 3452 - }, - { - "epoch": 0.09, - "learning_rate": 1.982111048050517e-06, - "loss": 1.1973, - "step": 3453 - }, - { - "epoch": 0.09, - "learning_rate": 1.982095413269317e-06, - "loss": 0.9146, - "step": 3454 - }, - { - "epoch": 0.09, - "learning_rate": 1.98207977172049e-06, - "loss": 0.7881, - "step": 3455 - }, - { - "epoch": 0.09, - "learning_rate": 1.982064123404144e-06, - "loss": 0.8799, - "step": 3456 - }, - { - "epoch": 0.09, - "learning_rate": 1.9820484683203867e-06, - "loss": 0.9336, - "step": 3457 - }, - { - "epoch": 0.09, - "learning_rate": 1.9820328064693257e-06, - "loss": 0.8975, - "step": 3458 - }, - { - "epoch": 0.09, - "learning_rate": 1.9820171378510695e-06, - "loss": 0.8398, - "step": 3459 - }, - { - "epoch": 0.09, - "learning_rate": 1.9820014624657257e-06, - "loss": 0.8477, - "step": 3460 - }, - { - "epoch": 0.09, - "learning_rate": 1.9819857803134025e-06, - "loss": 0.9717, - "step": 3461 - }, - { - "epoch": 0.09, - "learning_rate": 1.9819700913942077e-06, - "loss": 1.125, - "step": 3462 - }, - { - "epoch": 0.09, - "learning_rate": 1.9819543957082497e-06, - "loss": 0.9927, - "step": 3463 - }, - { - "epoch": 0.09, - "learning_rate": 1.9819386932556363e-06, - "loss": 0.9736, - "step": 3464 - }, - { - "epoch": 0.09, - "learning_rate": 1.981922984036476e-06, - "loss": 0.8535, - "step": 3465 - }, - { - "epoch": 0.09, - "learning_rate": 1.9819072680508776e-06, - "loss": 0.8262, - "step": 3466 - }, - { - "epoch": 0.09, - "learning_rate": 1.981891545298948e-06, - "loss": 1.2754, - "step": 3467 - }, - { - "epoch": 0.09, - "learning_rate": 1.9818758157807967e-06, - "loss": 0.6885, - "step": 3468 - }, - { - "epoch": 0.09, - "learning_rate": 1.9818600794965317e-06, - "loss": 0.8311, - "step": 3469 - }, - { - "epoch": 0.09, - "learning_rate": 1.9818443364462616e-06, - "loss": 0.7017, - "step": 3470 - }, - { - "epoch": 0.09, - "learning_rate": 1.9818285866300946e-06, - "loss": 1.0674, - "step": 3471 - }, - { - "epoch": 0.09, - "learning_rate": 1.9818128300481394e-06, - "loss": 1.0508, - "step": 3472 - }, - { - "epoch": 0.09, - "learning_rate": 1.9817970667005047e-06, - "loss": 1.0576, - "step": 3473 - }, - { - "epoch": 0.09, - "learning_rate": 1.981781296587299e-06, - "loss": 0.8584, - "step": 3474 - }, - { - "epoch": 0.09, - "learning_rate": 1.981765519708631e-06, - "loss": 1.0112, - "step": 3475 - }, - { - "epoch": 0.09, - "learning_rate": 1.9817497360646087e-06, - "loss": 0.9346, - "step": 3476 - }, - { - "epoch": 0.09, - "learning_rate": 1.9817339456553424e-06, - "loss": 0.9209, - "step": 3477 - }, - { - "epoch": 0.09, - "learning_rate": 1.9817181484809396e-06, - "loss": 0.8174, - "step": 3478 - }, - { - "epoch": 0.09, - "learning_rate": 1.9817023445415103e-06, - "loss": 0.9424, - "step": 3479 - }, - { - "epoch": 0.09, - "learning_rate": 1.9816865338371622e-06, - "loss": 0.9639, - "step": 3480 - }, - { - "epoch": 0.09, - "learning_rate": 1.9816707163680046e-06, - "loss": 0.9839, - "step": 3481 - }, - { - "epoch": 0.09, - "learning_rate": 1.981654892134147e-06, - "loss": 1.0654, - "step": 3482 - }, - { - "epoch": 0.09, - "learning_rate": 1.981639061135698e-06, - "loss": 0.9609, - "step": 3483 - }, - { - "epoch": 0.09, - "learning_rate": 1.9816232233727668e-06, - "loss": 0.9932, - "step": 3484 - }, - { - "epoch": 0.09, - "learning_rate": 1.9816073788454626e-06, - "loss": 0.853, - "step": 3485 - }, - { - "epoch": 0.09, - "learning_rate": 1.9815915275538944e-06, - "loss": 0.8066, - "step": 3486 - }, - { - "epoch": 0.09, - "learning_rate": 1.9815756694981718e-06, - "loss": 1.3145, - "step": 3487 - }, - { - "epoch": 0.09, - "learning_rate": 1.9815598046784036e-06, - "loss": 0.8789, - "step": 3488 - }, - { - "epoch": 0.09, - "learning_rate": 1.9815439330946996e-06, - "loss": 0.9424, - "step": 3489 - }, - { - "epoch": 0.09, - "learning_rate": 1.981528054747169e-06, - "loss": 1.0273, - "step": 3490 - }, - { - "epoch": 0.09, - "learning_rate": 1.981512169635921e-06, - "loss": 1.2324, - "step": 3491 - }, - { - "epoch": 0.09, - "learning_rate": 1.981496277761065e-06, - "loss": 0.9609, - "step": 3492 - }, - { - "epoch": 0.09, - "learning_rate": 1.9814803791227114e-06, - "loss": 0.8066, - "step": 3493 - }, - { - "epoch": 0.09, - "learning_rate": 1.9814644737209684e-06, - "loss": 0.9458, - "step": 3494 - }, - { - "epoch": 0.09, - "learning_rate": 1.9814485615559468e-06, - "loss": 1.0811, - "step": 3495 - }, - { - "epoch": 0.09, - "learning_rate": 1.9814326426277554e-06, - "loss": 0.9805, - "step": 3496 - }, - { - "epoch": 0.09, - "learning_rate": 1.981416716936504e-06, - "loss": 1.1035, - "step": 3497 - }, - { - "epoch": 0.09, - "learning_rate": 1.981400784482303e-06, - "loss": 0.9629, - "step": 3498 - }, - { - "epoch": 0.09, - "learning_rate": 1.981384845265262e-06, - "loss": 0.7427, - "step": 3499 - }, - { - "epoch": 0.09, - "learning_rate": 1.98136889928549e-06, - "loss": 1.1133, - "step": 3500 - }, - { - "epoch": 0.09, - "learning_rate": 1.9813529465430985e-06, - "loss": 1.1309, - "step": 3501 - }, - { - "epoch": 0.09, - "learning_rate": 1.9813369870381957e-06, - "loss": 0.9766, - "step": 3502 - }, - { - "epoch": 0.09, - "learning_rate": 1.9813210207708923e-06, - "loss": 1.0459, - "step": 3503 - }, - { - "epoch": 0.09, - "learning_rate": 1.9813050477412984e-06, - "loss": 0.9219, - "step": 3504 - }, - { - "epoch": 0.09, - "learning_rate": 1.981289067949524e-06, - "loss": 0.8691, - "step": 3505 - }, - { - "epoch": 0.09, - "learning_rate": 1.9812730813956792e-06, - "loss": 0.9092, - "step": 3506 - }, - { - "epoch": 0.09, - "learning_rate": 1.981257088079874e-06, - "loss": 1.0566, - "step": 3507 - }, - { - "epoch": 0.09, - "learning_rate": 1.9812410880022194e-06, - "loss": 0.9473, - "step": 3508 - }, - { - "epoch": 0.09, - "learning_rate": 1.9812250811628247e-06, - "loss": 0.7129, - "step": 3509 - }, - { - "epoch": 0.09, - "learning_rate": 1.9812090675618003e-06, - "loss": 0.7993, - "step": 3510 - }, - { - "epoch": 0.09, - "learning_rate": 1.981193047199257e-06, - "loss": 1.1602, - "step": 3511 - }, - { - "epoch": 0.09, - "learning_rate": 1.981177020075305e-06, - "loss": 1.0273, - "step": 3512 - }, - { - "epoch": 0.09, - "learning_rate": 1.981160986190055e-06, - "loss": 0.9531, - "step": 3513 - }, - { - "epoch": 0.09, - "learning_rate": 1.9811449455436167e-06, - "loss": 0.8975, - "step": 3514 - }, - { - "epoch": 0.09, - "learning_rate": 1.9811288981361017e-06, - "loss": 1.0117, - "step": 3515 - }, - { - "epoch": 0.09, - "learning_rate": 1.9811128439676196e-06, - "loss": 0.5906, - "step": 3516 - }, - { - "epoch": 0.09, - "learning_rate": 1.981096783038282e-06, - "loss": 1.0488, - "step": 3517 - }, - { - "epoch": 0.09, - "learning_rate": 1.9810807153481987e-06, - "loss": 0.6719, - "step": 3518 - }, - { - "epoch": 0.09, - "learning_rate": 1.9810646408974806e-06, - "loss": 0.9736, - "step": 3519 - }, - { - "epoch": 0.09, - "learning_rate": 1.981048559686239e-06, - "loss": 0.9824, - "step": 3520 - }, - { - "epoch": 0.09, - "learning_rate": 1.9810324717145844e-06, - "loss": 1.1797, - "step": 3521 - }, - { - "epoch": 0.09, - "learning_rate": 1.9810163769826275e-06, - "loss": 1.0225, - "step": 3522 - }, - { - "epoch": 0.09, - "learning_rate": 1.9810002754904795e-06, - "loss": 0.9707, - "step": 3523 - }, - { - "epoch": 0.09, - "learning_rate": 1.980984167238251e-06, - "loss": 1.0215, - "step": 3524 - }, - { - "epoch": 0.09, - "learning_rate": 1.980968052226053e-06, - "loss": 0.7119, - "step": 3525 - }, - { - "epoch": 0.09, - "learning_rate": 1.980951930453997e-06, - "loss": 0.8613, - "step": 3526 - }, - { - "epoch": 0.09, - "learning_rate": 1.9809358019221937e-06, - "loss": 0.6729, - "step": 3527 - }, - { - "epoch": 0.09, - "learning_rate": 1.9809196666307545e-06, - "loss": 0.9814, - "step": 3528 - }, - { - "epoch": 0.09, - "learning_rate": 1.9809035245797903e-06, - "loss": 0.8408, - "step": 3529 - }, - { - "epoch": 0.09, - "learning_rate": 1.980887375769413e-06, - "loss": 0.9688, - "step": 3530 - }, - { - "epoch": 0.09, - "learning_rate": 1.9808712201997327e-06, - "loss": 1.0371, - "step": 3531 - }, - { - "epoch": 0.09, - "learning_rate": 1.980855057870862e-06, - "loss": 0.8848, - "step": 3532 - }, - { - "epoch": 0.09, - "learning_rate": 1.9808388887829115e-06, - "loss": 0.9922, - "step": 3533 - }, - { - "epoch": 0.09, - "learning_rate": 1.9808227129359925e-06, - "loss": 1.127, - "step": 3534 - }, - { - "epoch": 0.09, - "learning_rate": 1.980806530330217e-06, - "loss": 0.8213, - "step": 3535 - }, - { - "epoch": 0.09, - "learning_rate": 1.980790340965696e-06, - "loss": 0.8018, - "step": 3536 - }, - { - "epoch": 0.09, - "learning_rate": 1.980774144842542e-06, - "loss": 0.9824, - "step": 3537 - }, - { - "epoch": 0.09, - "learning_rate": 1.9807579419608657e-06, - "loss": 0.8525, - "step": 3538 - }, - { - "epoch": 0.09, - "learning_rate": 1.9807417323207787e-06, - "loss": 0.6411, - "step": 3539 - }, - { - "epoch": 0.09, - "learning_rate": 1.9807255159223933e-06, - "loss": 0.8428, - "step": 3540 - }, - { - "epoch": 0.09, - "learning_rate": 1.980709292765821e-06, - "loss": 0.9795, - "step": 3541 - }, - { - "epoch": 0.09, - "learning_rate": 1.9806930628511732e-06, - "loss": 0.957, - "step": 3542 - }, - { - "epoch": 0.09, - "learning_rate": 1.9806768261785625e-06, - "loss": 0.8936, - "step": 3543 - }, - { - "epoch": 0.09, - "learning_rate": 1.9806605827481002e-06, - "loss": 1.041, - "step": 3544 - }, - { - "epoch": 0.09, - "learning_rate": 1.9806443325598985e-06, - "loss": 1.0479, - "step": 3545 - }, - { - "epoch": 0.09, - "learning_rate": 1.980628075614069e-06, - "loss": 1.0342, - "step": 3546 - }, - { - "epoch": 0.09, - "learning_rate": 1.9806118119107246e-06, - "loss": 1.1104, - "step": 3547 - }, - { - "epoch": 0.09, - "learning_rate": 1.980595541449976e-06, - "loss": 0.9688, - "step": 3548 - }, - { - "epoch": 0.09, - "learning_rate": 1.9805792642319366e-06, - "loss": 0.9521, - "step": 3549 - }, - { - "epoch": 0.09, - "learning_rate": 1.9805629802567184e-06, - "loss": 0.9111, - "step": 3550 - }, - { - "epoch": 0.09, - "learning_rate": 1.980546689524433e-06, - "loss": 0.8965, - "step": 3551 - }, - { - "epoch": 0.09, - "learning_rate": 1.9805303920351926e-06, - "loss": 0.9395, - "step": 3552 - }, - { - "epoch": 0.09, - "learning_rate": 1.9805140877891106e-06, - "loss": 1.0391, - "step": 3553 - }, - { - "epoch": 0.09, - "learning_rate": 1.980497776786298e-06, - "loss": 0.8467, - "step": 3554 - }, - { - "epoch": 0.09, - "learning_rate": 1.980481459026868e-06, - "loss": 0.9619, - "step": 3555 - }, - { - "epoch": 0.09, - "learning_rate": 1.9804651345109327e-06, - "loss": 1.1328, - "step": 3556 - }, - { - "epoch": 0.09, - "learning_rate": 1.9804488032386048e-06, - "loss": 0.8101, - "step": 3557 - }, - { - "epoch": 0.09, - "learning_rate": 1.980432465209997e-06, - "loss": 1.0, - "step": 3558 - }, - { - "epoch": 0.09, - "learning_rate": 1.9804161204252217e-06, - "loss": 0.8623, - "step": 3559 - }, - { - "epoch": 0.09, - "learning_rate": 1.9803997688843915e-06, - "loss": 0.8398, - "step": 3560 - }, - { - "epoch": 0.09, - "learning_rate": 1.980383410587619e-06, - "loss": 1.0117, - "step": 3561 - }, - { - "epoch": 0.09, - "learning_rate": 1.980367045535017e-06, - "loss": 0.7671, - "step": 3562 - }, - { - "epoch": 0.09, - "learning_rate": 1.9803506737266978e-06, - "loss": 0.9961, - "step": 3563 - }, - { - "epoch": 0.09, - "learning_rate": 1.9803342951627755e-06, - "loss": 1.1045, - "step": 3564 - }, - { - "epoch": 0.09, - "learning_rate": 1.980317909843362e-06, - "loss": 1.0381, - "step": 3565 - }, - { - "epoch": 0.09, - "learning_rate": 1.98030151776857e-06, - "loss": 0.9795, - "step": 3566 - }, - { - "epoch": 0.09, - "learning_rate": 1.980285118938513e-06, - "loss": 0.9883, - "step": 3567 - }, - { - "epoch": 0.09, - "learning_rate": 1.980268713353304e-06, - "loss": 0.998, - "step": 3568 - }, - { - "epoch": 0.09, - "learning_rate": 1.9802523010130557e-06, - "loss": 0.832, - "step": 3569 - }, - { - "epoch": 0.09, - "learning_rate": 1.9802358819178815e-06, - "loss": 1.1631, - "step": 3570 - }, - { - "epoch": 0.09, - "learning_rate": 1.9802194560678943e-06, - "loss": 0.8584, - "step": 3571 - }, - { - "epoch": 0.09, - "learning_rate": 1.9802030234632078e-06, - "loss": 1.1465, - "step": 3572 - }, - { - "epoch": 0.09, - "learning_rate": 1.980186584103934e-06, - "loss": 1.0527, - "step": 3573 - }, - { - "epoch": 0.09, - "learning_rate": 1.980170137990188e-06, - "loss": 1.1035, - "step": 3574 - }, - { - "epoch": 0.09, - "learning_rate": 1.9801536851220817e-06, - "loss": 0.7163, - "step": 3575 - }, - { - "epoch": 0.09, - "learning_rate": 1.9801372254997293e-06, - "loss": 0.9834, - "step": 3576 - }, - { - "epoch": 0.09, - "learning_rate": 1.9801207591232436e-06, - "loss": 0.9434, - "step": 3577 - }, - { - "epoch": 0.09, - "learning_rate": 1.980104285992738e-06, - "loss": 0.9004, - "step": 3578 - }, - { - "epoch": 0.09, - "learning_rate": 1.980087806108327e-06, - "loss": 0.9707, - "step": 3579 - }, - { - "epoch": 0.09, - "learning_rate": 1.9800713194701233e-06, - "loss": 0.916, - "step": 3580 - }, - { - "epoch": 0.09, - "learning_rate": 1.9800548260782406e-06, - "loss": 0.9883, - "step": 3581 - }, - { - "epoch": 0.09, - "learning_rate": 1.980038325932793e-06, - "loss": 1.0332, - "step": 3582 - }, - { - "epoch": 0.09, - "learning_rate": 1.9800218190338933e-06, - "loss": 0.8501, - "step": 3583 - }, - { - "epoch": 0.09, - "learning_rate": 1.9800053053816567e-06, - "loss": 0.769, - "step": 3584 - }, - { - "epoch": 0.09, - "learning_rate": 1.9799887849761954e-06, - "loss": 0.9287, - "step": 3585 - }, - { - "epoch": 0.09, - "learning_rate": 1.979972257817624e-06, - "loss": 1.1221, - "step": 3586 - }, - { - "epoch": 0.09, - "learning_rate": 1.979955723906057e-06, - "loss": 0.9307, - "step": 3587 - }, - { - "epoch": 0.09, - "learning_rate": 1.979939183241607e-06, - "loss": 0.9766, - "step": 3588 - }, - { - "epoch": 0.09, - "learning_rate": 1.979922635824389e-06, - "loss": 0.7964, - "step": 3589 - }, - { - "epoch": 0.09, - "learning_rate": 1.979906081654517e-06, - "loss": 0.9414, - "step": 3590 - }, - { - "epoch": 0.09, - "learning_rate": 1.9798895207321045e-06, - "loss": 0.7886, - "step": 3591 - }, - { - "epoch": 0.09, - "learning_rate": 1.9798729530572657e-06, - "loss": 0.8467, - "step": 3592 - }, - { - "epoch": 0.09, - "learning_rate": 1.9798563786301153e-06, - "loss": 0.9126, - "step": 3593 - }, - { - "epoch": 0.09, - "learning_rate": 1.979839797450767e-06, - "loss": 0.8506, - "step": 3594 - }, - { - "epoch": 0.09, - "learning_rate": 1.9798232095193353e-06, - "loss": 0.9785, - "step": 3595 - }, - { - "epoch": 0.09, - "learning_rate": 1.9798066148359344e-06, - "loss": 1.0801, - "step": 3596 - }, - { - "epoch": 0.09, - "learning_rate": 1.979790013400679e-06, - "loss": 1.1357, - "step": 3597 - }, - { - "epoch": 0.09, - "learning_rate": 1.979773405213683e-06, - "loss": 0.9746, - "step": 3598 - }, - { - "epoch": 0.09, - "learning_rate": 1.979756790275061e-06, - "loss": 1.0059, - "step": 3599 - }, - { - "epoch": 0.09, - "learning_rate": 1.979740168584928e-06, - "loss": 0.7754, - "step": 3600 - }, - { - "epoch": 0.09, - "learning_rate": 1.9797235401433973e-06, - "loss": 0.8628, - "step": 3601 - }, - { - "epoch": 0.09, - "learning_rate": 1.979706904950585e-06, - "loss": 0.9824, - "step": 3602 - }, - { - "epoch": 0.09, - "learning_rate": 1.9796902630066045e-06, - "loss": 0.8779, - "step": 3603 - }, - { - "epoch": 0.09, - "learning_rate": 1.9796736143115714e-06, - "loss": 0.9307, - "step": 3604 - }, - { - "epoch": 0.09, - "learning_rate": 1.9796569588656e-06, - "loss": 0.8379, - "step": 3605 - }, - { - "epoch": 0.09, - "learning_rate": 1.9796402966688046e-06, - "loss": 0.8311, - "step": 3606 - }, - { - "epoch": 0.09, - "learning_rate": 1.9796236277213014e-06, - "loss": 0.7515, - "step": 3607 - }, - { - "epoch": 0.09, - "learning_rate": 1.979606952023204e-06, - "loss": 0.9229, - "step": 3608 - }, - { - "epoch": 0.09, - "learning_rate": 1.9795902695746274e-06, - "loss": 0.6699, - "step": 3609 - }, - { - "epoch": 0.09, - "learning_rate": 1.9795735803756866e-06, - "loss": 1.2305, - "step": 3610 - }, - { - "epoch": 0.09, - "learning_rate": 1.9795568844264976e-06, - "loss": 0.8516, - "step": 3611 - }, - { - "epoch": 0.09, - "learning_rate": 1.979540181727174e-06, - "loss": 0.9365, - "step": 3612 - }, - { - "epoch": 0.09, - "learning_rate": 1.979523472277832e-06, - "loss": 0.9209, - "step": 3613 - }, - { - "epoch": 0.09, - "learning_rate": 1.9795067560785867e-06, - "loss": 1.0586, - "step": 3614 - }, - { - "epoch": 0.09, - "learning_rate": 1.9794900331295524e-06, - "loss": 1.0186, - "step": 3615 - }, - { - "epoch": 0.09, - "learning_rate": 1.979473303430845e-06, - "loss": 1.168, - "step": 3616 - }, - { - "epoch": 0.09, - "learning_rate": 1.97945656698258e-06, - "loss": 1.0156, - "step": 3617 - }, - { - "epoch": 0.09, - "learning_rate": 1.979439823784872e-06, - "loss": 1.0459, - "step": 3618 - }, - { - "epoch": 0.09, - "learning_rate": 1.979423073837837e-06, - "loss": 0.9873, - "step": 3619 - }, - { - "epoch": 0.09, - "learning_rate": 1.97940631714159e-06, - "loss": 1.1172, - "step": 3620 - }, - { - "epoch": 0.09, - "learning_rate": 1.979389553696247e-06, - "loss": 1.1152, - "step": 3621 - }, - { - "epoch": 0.09, - "learning_rate": 1.979372783501923e-06, - "loss": 1.1348, - "step": 3622 - }, - { - "epoch": 0.09, - "learning_rate": 1.9793560065587338e-06, - "loss": 1.0254, - "step": 3623 - }, - { - "epoch": 0.09, - "learning_rate": 1.9793392228667947e-06, - "loss": 0.9062, - "step": 3624 - }, - { - "epoch": 0.09, - "learning_rate": 1.979322432426222e-06, - "loss": 0.8447, - "step": 3625 - }, - { - "epoch": 0.09, - "learning_rate": 1.9793056352371303e-06, - "loss": 0.6501, - "step": 3626 - }, - { - "epoch": 0.09, - "learning_rate": 1.9792888312996367e-06, - "loss": 0.7432, - "step": 3627 - }, - { - "epoch": 0.09, - "learning_rate": 1.979272020613856e-06, - "loss": 0.8154, - "step": 3628 - }, - { - "epoch": 0.09, - "learning_rate": 1.979255203179905e-06, - "loss": 0.8408, - "step": 3629 - }, - { - "epoch": 0.09, - "learning_rate": 1.979238378997899e-06, - "loss": 1.1689, - "step": 3630 - }, - { - "epoch": 0.09, - "learning_rate": 1.979221548067953e-06, - "loss": 1.0488, - "step": 3631 - }, - { - "epoch": 0.09, - "learning_rate": 1.979204710390185e-06, - "loss": 1.3066, - "step": 3632 - }, - { - "epoch": 0.09, - "learning_rate": 1.979187865964709e-06, - "loss": 0.8789, - "step": 3633 - }, - { - "epoch": 0.09, - "learning_rate": 1.9791710147916426e-06, - "loss": 0.8496, - "step": 3634 - }, - { - "epoch": 0.09, - "learning_rate": 1.979154156871101e-06, - "loss": 0.9893, - "step": 3635 - }, - { - "epoch": 0.09, - "learning_rate": 1.979137292203201e-06, - "loss": 1.083, - "step": 3636 - }, - { - "epoch": 0.09, - "learning_rate": 1.9791204207880585e-06, - "loss": 0.7617, - "step": 3637 - }, - { - "epoch": 0.09, - "learning_rate": 1.97910354262579e-06, - "loss": 1.0557, - "step": 3638 - }, - { - "epoch": 0.09, - "learning_rate": 1.979086657716511e-06, - "loss": 1.0049, - "step": 3639 - }, - { - "epoch": 0.09, - "learning_rate": 1.979069766060339e-06, - "loss": 1.1094, - "step": 3640 - }, - { - "epoch": 0.09, - "learning_rate": 1.9790528676573895e-06, - "loss": 0.8398, - "step": 3641 - }, - { - "epoch": 0.09, - "learning_rate": 1.979035962507779e-06, - "loss": 0.8857, - "step": 3642 - }, - { - "epoch": 0.09, - "learning_rate": 1.979019050611625e-06, - "loss": 0.7837, - "step": 3643 - }, - { - "epoch": 0.09, - "learning_rate": 1.979002131969043e-06, - "loss": 0.7483, - "step": 3644 - }, - { - "epoch": 0.09, - "learning_rate": 1.97898520658015e-06, - "loss": 0.9727, - "step": 3645 - }, - { - "epoch": 0.09, - "learning_rate": 1.978968274445063e-06, - "loss": 1.0391, - "step": 3646 - }, - { - "epoch": 0.09, - "learning_rate": 1.9789513355638976e-06, - "loss": 0.8623, - "step": 3647 - }, - { - "epoch": 0.09, - "learning_rate": 1.978934389936771e-06, - "loss": 1.0908, - "step": 3648 - }, - { - "epoch": 0.09, - "learning_rate": 1.9789174375638002e-06, - "loss": 0.8848, - "step": 3649 - }, - { - "epoch": 0.09, - "learning_rate": 1.9789004784451023e-06, - "loss": 0.9619, - "step": 3650 - }, - { - "epoch": 0.09, - "learning_rate": 1.9788835125807933e-06, - "loss": 0.9473, - "step": 3651 - }, - { - "epoch": 0.09, - "learning_rate": 1.9788665399709912e-06, - "loss": 0.9629, - "step": 3652 - }, - { - "epoch": 0.09, - "learning_rate": 1.9788495606158122e-06, - "loss": 0.9316, - "step": 3653 - }, - { - "epoch": 0.09, - "learning_rate": 1.978832574515373e-06, - "loss": 0.9873, - "step": 3654 - }, - { - "epoch": 0.09, - "learning_rate": 1.978815581669792e-06, - "loss": 0.8789, - "step": 3655 - }, - { - "epoch": 0.09, - "learning_rate": 1.9787985820791846e-06, - "loss": 0.9248, - "step": 3656 - }, - { - "epoch": 0.09, - "learning_rate": 1.9787815757436693e-06, - "loss": 1.127, - "step": 3657 - }, - { - "epoch": 0.09, - "learning_rate": 1.9787645626633627e-06, - "loss": 0.8652, - "step": 3658 - }, - { - "epoch": 0.09, - "learning_rate": 1.978747542838382e-06, - "loss": 0.998, - "step": 3659 - }, - { - "epoch": 0.09, - "learning_rate": 1.9787305162688444e-06, - "loss": 0.96, - "step": 3660 - }, - { - "epoch": 0.09, - "learning_rate": 1.978713482954868e-06, - "loss": 1.165, - "step": 3661 - }, - { - "epoch": 0.09, - "learning_rate": 1.978696442896569e-06, - "loss": 0.9854, - "step": 3662 - }, - { - "epoch": 0.09, - "learning_rate": 1.9786793960940656e-06, - "loss": 1.0596, - "step": 3663 - }, - { - "epoch": 0.09, - "learning_rate": 1.9786623425474753e-06, - "loss": 1.0039, - "step": 3664 - }, - { - "epoch": 0.09, - "learning_rate": 1.9786452822569154e-06, - "loss": 0.9346, - "step": 3665 - }, - { - "epoch": 0.09, - "learning_rate": 1.9786282152225032e-06, - "loss": 0.9014, - "step": 3666 - }, - { - "epoch": 0.09, - "learning_rate": 1.9786111414443565e-06, - "loss": 1.0381, - "step": 3667 - }, - { - "epoch": 0.09, - "learning_rate": 1.9785940609225934e-06, - "loss": 0.957, - "step": 3668 - }, - { - "epoch": 0.09, - "learning_rate": 1.978576973657331e-06, - "loss": 0.9443, - "step": 3669 - }, - { - "epoch": 0.09, - "learning_rate": 1.9785598796486873e-06, - "loss": 0.9033, - "step": 3670 - }, - { - "epoch": 0.09, - "learning_rate": 1.97854277889678e-06, - "loss": 0.9331, - "step": 3671 - }, - { - "epoch": 0.09, - "learning_rate": 1.9785256714017272e-06, - "loss": 0.8008, - "step": 3672 - }, - { - "epoch": 0.09, - "learning_rate": 1.9785085571636466e-06, - "loss": 1.0693, - "step": 3673 - }, - { - "epoch": 0.09, - "learning_rate": 1.978491436182656e-06, - "loss": 0.7695, - "step": 3674 - }, - { - "epoch": 0.09, - "learning_rate": 1.978474308458874e-06, - "loss": 0.8545, - "step": 3675 - }, - { - "epoch": 0.09, - "learning_rate": 1.9784571739924174e-06, - "loss": 1.1025, - "step": 3676 - }, - { - "epoch": 0.09, - "learning_rate": 1.9784400327834055e-06, - "loss": 0.7803, - "step": 3677 - }, - { - "epoch": 0.09, - "learning_rate": 1.9784228848319557e-06, - "loss": 1.0234, - "step": 3678 - }, - { - "epoch": 0.09, - "learning_rate": 1.978405730138187e-06, - "loss": 0.9766, - "step": 3679 - }, - { - "epoch": 0.09, - "learning_rate": 1.978388568702216e-06, - "loss": 0.7783, - "step": 3680 - }, - { - "epoch": 0.09, - "learning_rate": 1.9783714005241626e-06, - "loss": 0.9697, - "step": 3681 - }, - { - "epoch": 0.09, - "learning_rate": 1.9783542256041444e-06, - "loss": 1.0332, - "step": 3682 - }, - { - "epoch": 0.09, - "learning_rate": 1.9783370439422797e-06, - "loss": 0.9961, - "step": 3683 - }, - { - "epoch": 0.09, - "learning_rate": 1.9783198555386874e-06, - "loss": 0.9785, - "step": 3684 - }, - { - "epoch": 0.09, - "learning_rate": 1.9783026603934854e-06, - "loss": 0.7075, - "step": 3685 - }, - { - "epoch": 0.09, - "learning_rate": 1.9782854585067923e-06, - "loss": 1.1289, - "step": 3686 - }, - { - "epoch": 0.09, - "learning_rate": 1.978268249878727e-06, - "loss": 0.6968, - "step": 3687 - }, - { - "epoch": 0.09, - "learning_rate": 1.9782510345094075e-06, - "loss": 1.0898, - "step": 3688 - }, - { - "epoch": 0.09, - "learning_rate": 1.9782338123989527e-06, - "loss": 1.0859, - "step": 3689 - }, - { - "epoch": 0.09, - "learning_rate": 1.9782165835474815e-06, - "loss": 0.79, - "step": 3690 - }, - { - "epoch": 0.09, - "learning_rate": 1.978199347955112e-06, - "loss": 0.915, - "step": 3691 - }, - { - "epoch": 0.09, - "learning_rate": 1.9781821056219638e-06, - "loss": 0.7925, - "step": 3692 - }, - { - "epoch": 0.09, - "learning_rate": 1.9781648565481556e-06, - "loss": 0.8066, - "step": 3693 - }, - { - "epoch": 0.09, - "learning_rate": 1.9781476007338054e-06, - "loss": 1.0156, - "step": 3694 - }, - { - "epoch": 0.09, - "learning_rate": 1.978130338179033e-06, - "loss": 1.124, - "step": 3695 - }, - { - "epoch": 0.09, - "learning_rate": 1.978113068883957e-06, - "loss": 0.9717, - "step": 3696 - }, - { - "epoch": 0.09, - "learning_rate": 1.9780957928486967e-06, - "loss": 1.168, - "step": 3697 - }, - { - "epoch": 0.09, - "learning_rate": 1.9780785100733708e-06, - "loss": 0.6641, - "step": 3698 - }, - { - "epoch": 0.09, - "learning_rate": 1.9780612205580983e-06, - "loss": 0.9961, - "step": 3699 - }, - { - "epoch": 0.09, - "learning_rate": 1.9780439243029986e-06, - "loss": 0.7305, - "step": 3700 - }, - { - "epoch": 0.09, - "learning_rate": 1.9780266213081907e-06, - "loss": 0.8867, - "step": 3701 - }, - { - "epoch": 0.09, - "learning_rate": 1.978009311573794e-06, - "loss": 0.8936, - "step": 3702 - }, - { - "epoch": 0.09, - "learning_rate": 1.977991995099928e-06, - "loss": 0.7646, - "step": 3703 - }, - { - "epoch": 0.09, - "learning_rate": 1.9779746718867114e-06, - "loss": 0.856, - "step": 3704 - }, - { - "epoch": 0.09, - "learning_rate": 1.9779573419342643e-06, - "loss": 0.792, - "step": 3705 - }, - { - "epoch": 0.09, - "learning_rate": 1.9779400052427053e-06, - "loss": 0.8894, - "step": 3706 - }, - { - "epoch": 0.1, - "learning_rate": 1.9779226618121548e-06, - "loss": 0.8242, - "step": 3707 - }, - { - "epoch": 0.1, - "learning_rate": 1.9779053116427316e-06, - "loss": 0.8091, - "step": 3708 - }, - { - "epoch": 0.1, - "learning_rate": 1.9778879547345557e-06, - "loss": 0.9805, - "step": 3709 - }, - { - "epoch": 0.1, - "learning_rate": 1.9778705910877466e-06, - "loss": 0.7881, - "step": 3710 - }, - { - "epoch": 0.1, - "learning_rate": 1.977853220702424e-06, - "loss": 0.8789, - "step": 3711 - }, - { - "epoch": 0.1, - "learning_rate": 1.977835843578707e-06, - "loss": 0.9951, - "step": 3712 - }, - { - "epoch": 0.1, - "learning_rate": 1.9778184597167157e-06, - "loss": 0.8535, - "step": 3713 - }, - { - "epoch": 0.1, - "learning_rate": 1.9778010691165707e-06, - "loss": 1.0898, - "step": 3714 - }, - { - "epoch": 0.1, - "learning_rate": 1.9777836717783908e-06, - "loss": 0.9424, - "step": 3715 - }, - { - "epoch": 0.1, - "learning_rate": 1.9777662677022963e-06, - "loss": 0.793, - "step": 3716 - }, - { - "epoch": 0.1, - "learning_rate": 1.9777488568884066e-06, - "loss": 0.832, - "step": 3717 - }, - { - "epoch": 0.1, - "learning_rate": 1.9777314393368425e-06, - "loss": 1.0088, - "step": 3718 - }, - { - "epoch": 0.1, - "learning_rate": 1.977714015047724e-06, - "loss": 1.0449, - "step": 3719 - }, - { - "epoch": 0.1, - "learning_rate": 1.9776965840211703e-06, - "loss": 0.9414, - "step": 3720 - }, - { - "epoch": 0.1, - "learning_rate": 1.977679146257302e-06, - "loss": 0.6611, - "step": 3721 - }, - { - "epoch": 0.1, - "learning_rate": 1.9776617017562395e-06, - "loss": 0.7129, - "step": 3722 - }, - { - "epoch": 0.1, - "learning_rate": 1.977644250518103e-06, - "loss": 1.1094, - "step": 3723 - }, - { - "epoch": 0.1, - "learning_rate": 1.9776267925430126e-06, - "loss": 0.9404, - "step": 3724 - }, - { - "epoch": 0.1, - "learning_rate": 1.9776093278310884e-06, - "loss": 1.0654, - "step": 3725 - }, - { - "epoch": 0.1, - "learning_rate": 1.977591856382451e-06, - "loss": 1.0811, - "step": 3726 - }, - { - "epoch": 0.1, - "learning_rate": 1.9775743781972205e-06, - "loss": 0.7852, - "step": 3727 - }, - { - "epoch": 0.1, - "learning_rate": 1.9775568932755184e-06, - "loss": 0.8833, - "step": 3728 - }, - { - "epoch": 0.1, - "learning_rate": 1.9775394016174635e-06, - "loss": 0.8271, - "step": 3729 - }, - { - "epoch": 0.1, - "learning_rate": 1.977521903223177e-06, - "loss": 0.9199, - "step": 3730 - }, - { - "epoch": 0.1, - "learning_rate": 1.9775043980927804e-06, - "loss": 1.0264, - "step": 3731 - }, - { - "epoch": 0.1, - "learning_rate": 1.9774868862263935e-06, - "loss": 1.0127, - "step": 3732 - }, - { - "epoch": 0.1, - "learning_rate": 1.977469367624137e-06, - "loss": 1.0791, - "step": 3733 - }, - { - "epoch": 0.1, - "learning_rate": 1.9774518422861317e-06, - "loss": 0.9199, - "step": 3734 - }, - { - "epoch": 0.1, - "learning_rate": 1.9774343102124986e-06, - "loss": 0.9575, - "step": 3735 - }, - { - "epoch": 0.1, - "learning_rate": 1.977416771403358e-06, - "loss": 0.7998, - "step": 3736 - }, - { - "epoch": 0.1, - "learning_rate": 1.977399225858831e-06, - "loss": 0.9448, - "step": 3737 - }, - { - "epoch": 0.1, - "learning_rate": 1.9773816735790383e-06, - "loss": 0.8604, - "step": 3738 - }, - { - "epoch": 0.1, - "learning_rate": 1.9773641145641015e-06, - "loss": 1.0996, - "step": 3739 - }, - { - "epoch": 0.1, - "learning_rate": 1.977346548814141e-06, - "loss": 0.9238, - "step": 3740 - }, - { - "epoch": 0.1, - "learning_rate": 1.9773289763292783e-06, - "loss": 1.0986, - "step": 3741 - }, - { - "epoch": 0.1, - "learning_rate": 1.977311397109634e-06, - "loss": 1.0186, - "step": 3742 - }, - { - "epoch": 0.1, - "learning_rate": 1.9772938111553295e-06, - "loss": 0.9746, - "step": 3743 - }, - { - "epoch": 0.1, - "learning_rate": 1.977276218466486e-06, - "loss": 1.0029, - "step": 3744 - }, - { - "epoch": 0.1, - "learning_rate": 1.977258619043225e-06, - "loss": 0.9932, - "step": 3745 - }, - { - "epoch": 0.1, - "learning_rate": 1.977241012885667e-06, - "loss": 0.6455, - "step": 3746 - }, - { - "epoch": 0.1, - "learning_rate": 1.9772233999939345e-06, - "loss": 0.8579, - "step": 3747 - }, - { - "epoch": 0.1, - "learning_rate": 1.9772057803681473e-06, - "loss": 0.9912, - "step": 3748 - }, - { - "epoch": 0.1, - "learning_rate": 1.977188154008428e-06, - "loss": 0.999, - "step": 3749 - }, - { - "epoch": 0.1, - "learning_rate": 1.9771705209148978e-06, - "loss": 0.8613, - "step": 3750 - }, - { - "epoch": 0.1, - "learning_rate": 1.9771528810876785e-06, - "loss": 1.0586, - "step": 3751 - }, - { - "epoch": 0.1, - "learning_rate": 1.9771352345268907e-06, - "loss": 0.8877, - "step": 3752 - }, - { - "epoch": 0.1, - "learning_rate": 1.977117581232657e-06, - "loss": 0.7451, - "step": 3753 - }, - { - "epoch": 0.1, - "learning_rate": 1.9770999212050986e-06, - "loss": 0.9238, - "step": 3754 - }, - { - "epoch": 0.1, - "learning_rate": 1.9770822544443373e-06, - "loss": 0.9521, - "step": 3755 - }, - { - "epoch": 0.1, - "learning_rate": 1.9770645809504946e-06, - "loss": 0.822, - "step": 3756 - }, - { - "epoch": 0.1, - "learning_rate": 1.977046900723693e-06, - "loss": 0.8496, - "step": 3757 - }, - { - "epoch": 0.1, - "learning_rate": 1.9770292137640532e-06, - "loss": 1.1211, - "step": 3758 - }, - { - "epoch": 0.1, - "learning_rate": 1.977011520071698e-06, - "loss": 0.9736, - "step": 3759 - }, - { - "epoch": 0.1, - "learning_rate": 1.9769938196467486e-06, - "loss": 0.6973, - "step": 3760 - }, - { - "epoch": 0.1, - "learning_rate": 1.976976112489328e-06, - "loss": 1.0176, - "step": 3761 - }, - { - "epoch": 0.1, - "learning_rate": 1.9769583985995574e-06, - "loss": 1.0283, - "step": 3762 - }, - { - "epoch": 0.1, - "learning_rate": 1.976940677977559e-06, - "loss": 0.5742, - "step": 3763 - }, - { - "epoch": 0.1, - "learning_rate": 1.9769229506234553e-06, - "loss": 0.9648, - "step": 3764 - }, - { - "epoch": 0.1, - "learning_rate": 1.9769052165373682e-06, - "loss": 0.9326, - "step": 3765 - }, - { - "epoch": 0.1, - "learning_rate": 1.97688747571942e-06, - "loss": 0.8574, - "step": 3766 - }, - { - "epoch": 0.1, - "learning_rate": 1.9768697281697322e-06, - "loss": 0.8145, - "step": 3767 - }, - { - "epoch": 0.1, - "learning_rate": 1.976851973888428e-06, - "loss": 1.1182, - "step": 3768 - }, - { - "epoch": 0.1, - "learning_rate": 1.9768342128756295e-06, - "loss": 1.0312, - "step": 3769 - }, - { - "epoch": 0.1, - "learning_rate": 1.976816445131459e-06, - "loss": 1.002, - "step": 3770 - }, - { - "epoch": 0.1, - "learning_rate": 1.976798670656039e-06, - "loss": 1.0244, - "step": 3771 - }, - { - "epoch": 0.1, - "learning_rate": 1.9767808894494923e-06, - "loss": 0.9922, - "step": 3772 - }, - { - "epoch": 0.1, - "learning_rate": 1.9767631015119405e-06, - "loss": 1.0879, - "step": 3773 - }, - { - "epoch": 0.1, - "learning_rate": 1.9767453068435075e-06, - "loss": 0.9453, - "step": 3774 - }, - { - "epoch": 0.1, - "learning_rate": 1.9767275054443147e-06, - "loss": 1.0098, - "step": 3775 - }, - { - "epoch": 0.1, - "learning_rate": 1.9767096973144855e-06, - "loss": 0.77, - "step": 3776 - }, - { - "epoch": 0.1, - "learning_rate": 1.9766918824541423e-06, - "loss": 1.0498, - "step": 3777 - }, - { - "epoch": 0.1, - "learning_rate": 1.976674060863408e-06, - "loss": 1.0684, - "step": 3778 - }, - { - "epoch": 0.1, - "learning_rate": 1.9766562325424053e-06, - "loss": 0.9658, - "step": 3779 - }, - { - "epoch": 0.1, - "learning_rate": 1.976638397491257e-06, - "loss": 1.0195, - "step": 3780 - }, - { - "epoch": 0.1, - "learning_rate": 1.9766205557100868e-06, - "loss": 1.0234, - "step": 3781 - }, - { - "epoch": 0.1, - "learning_rate": 1.9766027071990164e-06, - "loss": 0.9033, - "step": 3782 - }, - { - "epoch": 0.1, - "learning_rate": 1.9765848519581692e-06, - "loss": 1.0156, - "step": 3783 - }, - { - "epoch": 0.1, - "learning_rate": 1.9765669899876686e-06, - "loss": 1.0908, - "step": 3784 - }, - { - "epoch": 0.1, - "learning_rate": 1.976549121287638e-06, - "loss": 0.7427, - "step": 3785 - }, - { - "epoch": 0.1, - "learning_rate": 1.976531245858199e-06, - "loss": 0.6909, - "step": 3786 - }, - { - "epoch": 0.1, - "learning_rate": 1.9765133636994768e-06, - "loss": 0.8516, - "step": 3787 - }, - { - "epoch": 0.1, - "learning_rate": 1.976495474811593e-06, - "loss": 0.9834, - "step": 3788 - }, - { - "epoch": 0.1, - "learning_rate": 1.976477579194672e-06, - "loss": 0.8945, - "step": 3789 - }, - { - "epoch": 0.1, - "learning_rate": 1.976459676848836e-06, - "loss": 0.9639, - "step": 3790 - }, - { - "epoch": 0.1, - "learning_rate": 1.9764417677742095e-06, - "loss": 0.7886, - "step": 3791 - }, - { - "epoch": 0.1, - "learning_rate": 1.9764238519709154e-06, - "loss": 0.5181, - "step": 3792 - }, - { - "epoch": 0.1, - "learning_rate": 1.976405929439077e-06, - "loss": 1.1582, - "step": 3793 - }, - { - "epoch": 0.1, - "learning_rate": 1.976388000178818e-06, - "loss": 0.9111, - "step": 3794 - }, - { - "epoch": 0.1, - "learning_rate": 1.976370064190262e-06, - "loss": 1.0, - "step": 3795 - }, - { - "epoch": 0.1, - "learning_rate": 1.976352121473532e-06, - "loss": 0.855, - "step": 3796 - }, - { - "epoch": 0.1, - "learning_rate": 1.976334172028753e-06, - "loss": 0.9062, - "step": 3797 - }, - { - "epoch": 0.1, - "learning_rate": 1.976316215856047e-06, - "loss": 0.7915, - "step": 3798 - }, - { - "epoch": 0.1, - "learning_rate": 1.976298252955539e-06, - "loss": 1.0098, - "step": 3799 - }, - { - "epoch": 0.1, - "learning_rate": 1.9762802833273526e-06, - "loss": 0.8057, - "step": 3800 - }, - { - "epoch": 0.1, - "learning_rate": 1.976262306971611e-06, - "loss": 1.0459, - "step": 3801 - }, - { - "epoch": 0.1, - "learning_rate": 1.9762443238884386e-06, - "loss": 0.9053, - "step": 3802 - }, - { - "epoch": 0.1, - "learning_rate": 1.9762263340779595e-06, - "loss": 1.0508, - "step": 3803 - }, - { - "epoch": 0.1, - "learning_rate": 1.976208337540297e-06, - "loss": 0.9121, - "step": 3804 - }, - { - "epoch": 0.1, - "learning_rate": 1.9761903342755755e-06, - "loss": 0.8271, - "step": 3805 - }, - { - "epoch": 0.1, - "learning_rate": 1.976172324283919e-06, - "loss": 0.7041, - "step": 3806 - }, - { - "epoch": 0.1, - "learning_rate": 1.976154307565452e-06, - "loss": 1.0488, - "step": 3807 - }, - { - "epoch": 0.1, - "learning_rate": 1.9761362841202977e-06, - "loss": 0.9189, - "step": 3808 - }, - { - "epoch": 0.1, - "learning_rate": 1.9761182539485812e-06, - "loss": 0.8799, - "step": 3809 - }, - { - "epoch": 0.1, - "learning_rate": 1.9761002170504263e-06, - "loss": 1.0928, - "step": 3810 - }, - { - "epoch": 0.1, - "learning_rate": 1.9760821734259577e-06, - "loss": 1.0576, - "step": 3811 - }, - { - "epoch": 0.1, - "learning_rate": 1.976064123075299e-06, - "loss": 1.0557, - "step": 3812 - }, - { - "epoch": 0.1, - "learning_rate": 1.9760460659985755e-06, - "loss": 0.9053, - "step": 3813 - }, - { - "epoch": 0.1, - "learning_rate": 1.9760280021959115e-06, - "loss": 0.918, - "step": 3814 - }, - { - "epoch": 0.1, - "learning_rate": 1.9760099316674306e-06, - "loss": 0.9824, - "step": 3815 - }, - { - "epoch": 0.1, - "learning_rate": 1.9759918544132577e-06, - "loss": 0.9766, - "step": 3816 - }, - { - "epoch": 0.1, - "learning_rate": 1.975973770433518e-06, - "loss": 1.0664, - "step": 3817 - }, - { - "epoch": 0.1, - "learning_rate": 1.9759556797283357e-06, - "loss": 1.0635, - "step": 3818 - }, - { - "epoch": 0.1, - "learning_rate": 1.975937582297835e-06, - "loss": 0.8203, - "step": 3819 - }, - { - "epoch": 0.1, - "learning_rate": 1.9759194781421416e-06, - "loss": 0.8423, - "step": 3820 - }, - { - "epoch": 0.1, - "learning_rate": 1.9759013672613795e-06, - "loss": 0.8413, - "step": 3821 - }, - { - "epoch": 0.1, - "learning_rate": 1.9758832496556735e-06, - "loss": 0.7852, - "step": 3822 - }, - { - "epoch": 0.1, - "learning_rate": 1.975865125325149e-06, - "loss": 0.686, - "step": 3823 - }, - { - "epoch": 0.1, - "learning_rate": 1.97584699426993e-06, - "loss": 1.1602, - "step": 3824 - }, - { - "epoch": 0.1, - "learning_rate": 1.9758288564901427e-06, - "loss": 0.8428, - "step": 3825 - }, - { - "epoch": 0.1, - "learning_rate": 1.975810711985911e-06, - "loss": 0.9307, - "step": 3826 - }, - { - "epoch": 0.1, - "learning_rate": 1.9757925607573604e-06, - "loss": 1.0664, - "step": 3827 - }, - { - "epoch": 0.1, - "learning_rate": 1.9757744028046155e-06, - "loss": 1.0195, - "step": 3828 - }, - { - "epoch": 0.1, - "learning_rate": 1.9757562381278025e-06, - "loss": 1.1914, - "step": 3829 - }, - { - "epoch": 0.1, - "learning_rate": 1.9757380667270454e-06, - "loss": 0.8672, - "step": 3830 - }, - { - "epoch": 0.1, - "learning_rate": 1.97571988860247e-06, - "loss": 0.9707, - "step": 3831 - }, - { - "epoch": 0.1, - "learning_rate": 1.9757017037542014e-06, - "loss": 0.7891, - "step": 3832 - }, - { - "epoch": 0.1, - "learning_rate": 1.9756835121823652e-06, - "loss": 0.9746, - "step": 3833 - }, - { - "epoch": 0.1, - "learning_rate": 1.975665313887087e-06, - "loss": 1.124, - "step": 3834 - }, - { - "epoch": 0.1, - "learning_rate": 1.975647108868491e-06, - "loss": 1.0225, - "step": 3835 - }, - { - "epoch": 0.1, - "learning_rate": 1.9756288971267033e-06, - "loss": 1.0117, - "step": 3836 - }, - { - "epoch": 0.1, - "learning_rate": 1.9756106786618497e-06, - "loss": 0.8232, - "step": 3837 - }, - { - "epoch": 0.1, - "learning_rate": 1.9755924534740558e-06, - "loss": 1.0967, - "step": 3838 - }, - { - "epoch": 0.1, - "learning_rate": 1.975574221563447e-06, - "loss": 0.9443, - "step": 3839 - }, - { - "epoch": 0.1, - "learning_rate": 1.975555982930149e-06, - "loss": 0.8965, - "step": 3840 - }, - { - "epoch": 0.1, - "learning_rate": 1.9755377375742866e-06, - "loss": 0.8413, - "step": 3841 - }, - { - "epoch": 0.1, - "learning_rate": 1.9755194854959867e-06, - "loss": 0.8203, - "step": 3842 - }, - { - "epoch": 0.1, - "learning_rate": 1.9755012266953746e-06, - "loss": 1.0498, - "step": 3843 - }, - { - "epoch": 0.1, - "learning_rate": 1.975482961172576e-06, - "loss": 1.0635, - "step": 3844 - }, - { - "epoch": 0.1, - "learning_rate": 1.9754646889277177e-06, - "loss": 1.124, - "step": 3845 - }, - { - "epoch": 0.1, - "learning_rate": 1.975446409960924e-06, - "loss": 1.1738, - "step": 3846 - }, - { - "epoch": 0.1, - "learning_rate": 1.975428124272322e-06, - "loss": 1.1123, - "step": 3847 - }, - { - "epoch": 0.1, - "learning_rate": 1.9754098318620377e-06, - "loss": 0.8955, - "step": 3848 - }, - { - "epoch": 0.1, - "learning_rate": 1.9753915327301966e-06, - "loss": 1.0967, - "step": 3849 - }, - { - "epoch": 0.1, - "learning_rate": 1.975373226876925e-06, - "loss": 0.8691, - "step": 3850 - }, - { - "epoch": 0.1, - "learning_rate": 1.9753549143023496e-06, - "loss": 0.9639, - "step": 3851 - }, - { - "epoch": 0.1, - "learning_rate": 1.9753365950065957e-06, - "loss": 1.1211, - "step": 3852 - }, - { - "epoch": 0.1, - "learning_rate": 1.97531826898979e-06, - "loss": 1.0068, - "step": 3853 - }, - { - "epoch": 0.1, - "learning_rate": 1.975299936252059e-06, - "loss": 1.0361, - "step": 3854 - }, - { - "epoch": 0.1, - "learning_rate": 1.9752815967935285e-06, - "loss": 0.9033, - "step": 3855 - }, - { - "epoch": 0.1, - "learning_rate": 1.9752632506143253e-06, - "loss": 1.1719, - "step": 3856 - }, - { - "epoch": 0.1, - "learning_rate": 1.9752448977145755e-06, - "loss": 0.6787, - "step": 3857 - }, - { - "epoch": 0.1, - "learning_rate": 1.9752265380944057e-06, - "loss": 0.9475, - "step": 3858 - }, - { - "epoch": 0.1, - "learning_rate": 1.9752081717539426e-06, - "loss": 0.8574, - "step": 3859 - }, - { - "epoch": 0.1, - "learning_rate": 1.9751897986933128e-06, - "loss": 0.9268, - "step": 3860 - }, - { - "epoch": 0.1, - "learning_rate": 1.9751714189126425e-06, - "loss": 0.8833, - "step": 3861 - }, - { - "epoch": 0.1, - "learning_rate": 1.9751530324120583e-06, - "loss": 0.8853, - "step": 3862 - }, - { - "epoch": 0.1, - "learning_rate": 1.9751346391916877e-06, - "loss": 0.8984, - "step": 3863 - }, - { - "epoch": 0.1, - "learning_rate": 1.9751162392516565e-06, - "loss": 0.9351, - "step": 3864 - }, - { - "epoch": 0.1, - "learning_rate": 1.9750978325920923e-06, - "loss": 0.7559, - "step": 3865 - }, - { - "epoch": 0.1, - "learning_rate": 1.9750794192131215e-06, - "loss": 1.1113, - "step": 3866 - }, - { - "epoch": 0.1, - "learning_rate": 1.975060999114871e-06, - "loss": 0.7617, - "step": 3867 - }, - { - "epoch": 0.1, - "learning_rate": 1.975042572297468e-06, - "loss": 0.8345, - "step": 3868 - }, - { - "epoch": 0.1, - "learning_rate": 1.975024138761039e-06, - "loss": 0.6475, - "step": 3869 - }, - { - "epoch": 0.1, - "learning_rate": 1.975005698505711e-06, - "loss": 1.0059, - "step": 3870 - }, - { - "epoch": 0.1, - "learning_rate": 1.974987251531612e-06, - "loss": 1.041, - "step": 3871 - }, - { - "epoch": 0.1, - "learning_rate": 1.9749687978388683e-06, - "loss": 0.6875, - "step": 3872 - }, - { - "epoch": 0.1, - "learning_rate": 1.9749503374276067e-06, - "loss": 0.7793, - "step": 3873 - }, - { - "epoch": 0.1, - "learning_rate": 1.9749318702979554e-06, - "loss": 0.8242, - "step": 3874 - }, - { - "epoch": 0.1, - "learning_rate": 1.9749133964500416e-06, - "loss": 0.918, - "step": 3875 - }, - { - "epoch": 0.1, - "learning_rate": 1.9748949158839918e-06, - "loss": 1.001, - "step": 3876 - }, - { - "epoch": 0.1, - "learning_rate": 1.974876428599934e-06, - "loss": 1.085, - "step": 3877 - }, - { - "epoch": 0.1, - "learning_rate": 1.974857934597995e-06, - "loss": 0.8164, - "step": 3878 - }, - { - "epoch": 0.1, - "learning_rate": 1.9748394338783028e-06, - "loss": 0.7246, - "step": 3879 - }, - { - "epoch": 0.1, - "learning_rate": 1.974820926440985e-06, - "loss": 1.04, - "step": 3880 - }, - { - "epoch": 0.1, - "learning_rate": 1.9748024122861684e-06, - "loss": 0.8857, - "step": 3881 - }, - { - "epoch": 0.1, - "learning_rate": 1.974783891413981e-06, - "loss": 0.9473, - "step": 3882 - }, - { - "epoch": 0.1, - "learning_rate": 1.9747653638245505e-06, - "loss": 0.9448, - "step": 3883 - }, - { - "epoch": 0.1, - "learning_rate": 1.9747468295180045e-06, - "loss": 0.9111, - "step": 3884 - }, - { - "epoch": 0.1, - "learning_rate": 1.9747282884944708e-06, - "loss": 0.9209, - "step": 3885 - }, - { - "epoch": 0.1, - "learning_rate": 1.9747097407540775e-06, - "loss": 1.1074, - "step": 3886 - }, - { - "epoch": 0.1, - "learning_rate": 1.9746911862969515e-06, - "loss": 0.8193, - "step": 3887 - }, - { - "epoch": 0.1, - "learning_rate": 1.9746726251232213e-06, - "loss": 0.8555, - "step": 3888 - }, - { - "epoch": 0.1, - "learning_rate": 1.974654057233015e-06, - "loss": 0.9639, - "step": 3889 - }, - { - "epoch": 0.1, - "learning_rate": 1.97463548262646e-06, - "loss": 0.9346, - "step": 3890 - }, - { - "epoch": 0.1, - "learning_rate": 1.974616901303684e-06, - "loss": 0.8291, - "step": 3891 - }, - { - "epoch": 0.1, - "learning_rate": 1.974598313264816e-06, - "loss": 0.8179, - "step": 3892 - }, - { - "epoch": 0.1, - "learning_rate": 1.9745797185099837e-06, - "loss": 1.0742, - "step": 3893 - }, - { - "epoch": 0.1, - "learning_rate": 1.9745611170393155e-06, - "loss": 1.0947, - "step": 3894 - }, - { - "epoch": 0.1, - "learning_rate": 1.974542508852939e-06, - "loss": 0.7578, - "step": 3895 - }, - { - "epoch": 0.1, - "learning_rate": 1.9745238939509826e-06, - "loss": 0.6943, - "step": 3896 - }, - { - "epoch": 0.1, - "learning_rate": 1.9745052723335742e-06, - "loss": 0.5601, - "step": 3897 - }, - { - "epoch": 0.1, - "learning_rate": 1.9744866440008434e-06, - "loss": 0.8633, - "step": 3898 - }, - { - "epoch": 0.1, - "learning_rate": 1.974468008952918e-06, - "loss": 1.1123, - "step": 3899 - }, - { - "epoch": 0.1, - "learning_rate": 1.9744493671899253e-06, - "loss": 0.8223, - "step": 3900 - }, - { - "epoch": 0.1, - "learning_rate": 1.974430718711995e-06, - "loss": 0.8613, - "step": 3901 - }, - { - "epoch": 0.1, - "learning_rate": 1.9744120635192557e-06, - "loss": 0.585, - "step": 3902 - }, - { - "epoch": 0.1, - "learning_rate": 1.974393401611835e-06, - "loss": 0.7217, - "step": 3903 - }, - { - "epoch": 0.1, - "learning_rate": 1.974374732989862e-06, - "loss": 0.9531, - "step": 3904 - }, - { - "epoch": 0.1, - "learning_rate": 1.974356057653466e-06, - "loss": 0.8887, - "step": 3905 - }, - { - "epoch": 0.1, - "learning_rate": 1.974337375602774e-06, - "loss": 1.1221, - "step": 3906 - }, - { - "epoch": 0.1, - "learning_rate": 1.9743186868379164e-06, - "loss": 1.1699, - "step": 3907 - }, - { - "epoch": 0.1, - "learning_rate": 1.9742999913590212e-06, - "loss": 0.8867, - "step": 3908 - }, - { - "epoch": 0.1, - "learning_rate": 1.9742812891662176e-06, - "loss": 0.7773, - "step": 3909 - }, - { - "epoch": 0.1, - "learning_rate": 1.9742625802596343e-06, - "loss": 1.0039, - "step": 3910 - }, - { - "epoch": 0.1, - "learning_rate": 1.9742438646394e-06, - "loss": 1.0684, - "step": 3911 - }, - { - "epoch": 0.1, - "learning_rate": 1.974225142305644e-06, - "loss": 0.729, - "step": 3912 - }, - { - "epoch": 0.1, - "learning_rate": 1.974206413258495e-06, - "loss": 0.5249, - "step": 3913 - }, - { - "epoch": 0.1, - "learning_rate": 1.9741876774980827e-06, - "loss": 1.0332, - "step": 3914 - }, - { - "epoch": 0.1, - "learning_rate": 1.9741689350245353e-06, - "loss": 0.9268, - "step": 3915 - }, - { - "epoch": 0.1, - "learning_rate": 1.9741501858379825e-06, - "loss": 0.7861, - "step": 3916 - }, - { - "epoch": 0.1, - "learning_rate": 1.9741314299385534e-06, - "loss": 0.9463, - "step": 3917 - }, - { - "epoch": 0.1, - "learning_rate": 1.9741126673263776e-06, - "loss": 0.9219, - "step": 3918 - }, - { - "epoch": 0.1, - "learning_rate": 1.9740938980015835e-06, - "loss": 0.9414, - "step": 3919 - }, - { - "epoch": 0.1, - "learning_rate": 1.9740751219643014e-06, - "loss": 0.8174, - "step": 3920 - }, - { - "epoch": 0.1, - "learning_rate": 1.97405633921466e-06, - "loss": 0.8809, - "step": 3921 - }, - { - "epoch": 0.1, - "learning_rate": 1.9740375497527893e-06, - "loss": 0.7959, - "step": 3922 - }, - { - "epoch": 0.1, - "learning_rate": 1.9740187535788185e-06, - "loss": 1.0479, - "step": 3923 - }, - { - "epoch": 0.1, - "learning_rate": 1.973999950692877e-06, - "loss": 0.9932, - "step": 3924 - }, - { - "epoch": 0.1, - "learning_rate": 1.973981141095094e-06, - "loss": 0.8838, - "step": 3925 - }, - { - "epoch": 0.1, - "learning_rate": 1.9739623247856e-06, - "loss": 0.8867, - "step": 3926 - }, - { - "epoch": 0.1, - "learning_rate": 1.9739435017645243e-06, - "loss": 0.9346, - "step": 3927 - }, - { - "epoch": 0.1, - "learning_rate": 1.9739246720319967e-06, - "loss": 1.1387, - "step": 3928 - }, - { - "epoch": 0.1, - "learning_rate": 1.973905835588147e-06, - "loss": 1.126, - "step": 3929 - }, - { - "epoch": 0.1, - "learning_rate": 1.973886992433104e-06, - "loss": 1.0039, - "step": 3930 - }, - { - "epoch": 0.1, - "learning_rate": 1.973868142566999e-06, - "loss": 0.8716, - "step": 3931 - }, - { - "epoch": 0.1, - "learning_rate": 1.9738492859899613e-06, - "loss": 1.0859, - "step": 3932 - }, - { - "epoch": 0.1, - "learning_rate": 1.973830422702121e-06, - "loss": 0.8306, - "step": 3933 - }, - { - "epoch": 0.1, - "learning_rate": 1.973811552703607e-06, - "loss": 1.1133, - "step": 3934 - }, - { - "epoch": 0.1, - "learning_rate": 1.9737926759945508e-06, - "loss": 0.6754, - "step": 3935 - }, - { - "epoch": 0.1, - "learning_rate": 1.9737737925750823e-06, - "loss": 0.9805, - "step": 3936 - }, - { - "epoch": 0.1, - "learning_rate": 1.9737549024453307e-06, - "loss": 0.8906, - "step": 3937 - }, - { - "epoch": 0.1, - "learning_rate": 1.973736005605427e-06, - "loss": 0.791, - "step": 3938 - }, - { - "epoch": 0.1, - "learning_rate": 1.973717102055501e-06, - "loss": 0.8301, - "step": 3939 - }, - { - "epoch": 0.1, - "learning_rate": 1.973698191795683e-06, - "loss": 0.8838, - "step": 3940 - }, - { - "epoch": 0.1, - "learning_rate": 1.973679274826104e-06, - "loss": 0.8711, - "step": 3941 - }, - { - "epoch": 0.1, - "learning_rate": 1.973660351146893e-06, - "loss": 0.8984, - "step": 3942 - }, - { - "epoch": 0.1, - "learning_rate": 1.9736414207581813e-06, - "loss": 1.0605, - "step": 3943 - }, - { - "epoch": 0.1, - "learning_rate": 1.973622483660099e-06, - "loss": 0.9648, - "step": 3944 - }, - { - "epoch": 0.1, - "learning_rate": 1.9736035398527774e-06, - "loss": 0.9365, - "step": 3945 - }, - { - "epoch": 0.1, - "learning_rate": 1.973584589336346e-06, - "loss": 0.8994, - "step": 3946 - }, - { - "epoch": 0.1, - "learning_rate": 1.9735656321109362e-06, - "loss": 1.0713, - "step": 3947 - }, - { - "epoch": 0.1, - "learning_rate": 1.9735466681766785e-06, - "loss": 1.0352, - "step": 3948 - }, - { - "epoch": 0.1, - "learning_rate": 1.973527697533703e-06, - "loss": 0.7363, - "step": 3949 - }, - { - "epoch": 0.1, - "learning_rate": 1.9735087201821406e-06, - "loss": 0.875, - "step": 3950 - }, - { - "epoch": 0.1, - "learning_rate": 1.9734897361221225e-06, - "loss": 0.9492, - "step": 3951 - }, - { - "epoch": 0.1, - "learning_rate": 1.9734707453537793e-06, - "loss": 0.959, - "step": 3952 - }, - { - "epoch": 0.1, - "learning_rate": 1.9734517478772418e-06, - "loss": 0.9004, - "step": 3953 - }, - { - "epoch": 0.1, - "learning_rate": 1.9734327436926408e-06, - "loss": 0.7739, - "step": 3954 - }, - { - "epoch": 0.1, - "learning_rate": 1.9734137328001076e-06, - "loss": 1.2988, - "step": 3955 - }, - { - "epoch": 0.1, - "learning_rate": 1.9733947151997723e-06, - "loss": 0.8765, - "step": 3956 - }, - { - "epoch": 0.1, - "learning_rate": 1.9733756908917674e-06, - "loss": 0.8779, - "step": 3957 - }, - { - "epoch": 0.1, - "learning_rate": 1.9733566598762234e-06, - "loss": 0.9619, - "step": 3958 - }, - { - "epoch": 0.1, - "learning_rate": 1.9733376221532707e-06, - "loss": 1.0342, - "step": 3959 - }, - { - "epoch": 0.1, - "learning_rate": 1.9733185777230415e-06, - "loss": 1.0391, - "step": 3960 - }, - { - "epoch": 0.1, - "learning_rate": 1.973299526585667e-06, - "loss": 0.6128, - "step": 3961 - }, - { - "epoch": 0.1, - "learning_rate": 1.9732804687412776e-06, - "loss": 0.8564, - "step": 3962 - }, - { - "epoch": 0.1, - "learning_rate": 1.973261404190005e-06, - "loss": 1.1143, - "step": 3963 - }, - { - "epoch": 0.1, - "learning_rate": 1.973242332931981e-06, - "loss": 0.9326, - "step": 3964 - }, - { - "epoch": 0.1, - "learning_rate": 1.9732232549673365e-06, - "loss": 1.0537, - "step": 3965 - }, - { - "epoch": 0.1, - "learning_rate": 1.9732041702962037e-06, - "loss": 0.8398, - "step": 3966 - }, - { - "epoch": 0.1, - "learning_rate": 1.9731850789187134e-06, - "loss": 0.9482, - "step": 3967 - }, - { - "epoch": 0.1, - "learning_rate": 1.973165980834997e-06, - "loss": 0.8462, - "step": 3968 - }, - { - "epoch": 0.1, - "learning_rate": 1.9731468760451867e-06, - "loss": 0.6079, - "step": 3969 - }, - { - "epoch": 0.1, - "learning_rate": 1.9731277645494137e-06, - "loss": 0.6143, - "step": 3970 - }, - { - "epoch": 0.1, - "learning_rate": 1.9731086463478104e-06, - "loss": 0.9658, - "step": 3971 - }, - { - "epoch": 0.1, - "learning_rate": 1.9730895214405077e-06, - "loss": 0.915, - "step": 3972 - }, - { - "epoch": 0.1, - "learning_rate": 1.973070389827638e-06, - "loss": 0.9629, - "step": 3973 - }, - { - "epoch": 0.1, - "learning_rate": 1.973051251509333e-06, - "loss": 0.8066, - "step": 3974 - }, - { - "epoch": 0.1, - "learning_rate": 1.973032106485724e-06, - "loss": 0.9629, - "step": 3975 - }, - { - "epoch": 0.1, - "learning_rate": 1.973012954756944e-06, - "loss": 1.0137, - "step": 3976 - }, - { - "epoch": 0.1, - "learning_rate": 1.972993796323124e-06, - "loss": 0.8545, - "step": 3977 - }, - { - "epoch": 0.1, - "learning_rate": 1.972974631184396e-06, - "loss": 0.8154, - "step": 3978 - }, - { - "epoch": 0.1, - "learning_rate": 1.972955459340893e-06, - "loss": 1.0625, - "step": 3979 - }, - { - "epoch": 0.1, - "learning_rate": 1.9729362807927467e-06, - "loss": 0.9111, - "step": 3980 - }, - { - "epoch": 0.1, - "learning_rate": 1.972917095540089e-06, - "loss": 1.0439, - "step": 3981 - }, - { - "epoch": 0.1, - "learning_rate": 1.972897903583052e-06, - "loss": 0.8623, - "step": 3982 - }, - { - "epoch": 0.1, - "learning_rate": 1.9728787049217684e-06, - "loss": 0.876, - "step": 3983 - }, - { - "epoch": 0.1, - "learning_rate": 1.97285949955637e-06, - "loss": 0.96, - "step": 3984 - }, - { - "epoch": 0.1, - "learning_rate": 1.97284028748699e-06, - "loss": 0.7756, - "step": 3985 - }, - { - "epoch": 0.1, - "learning_rate": 1.9728210687137597e-06, - "loss": 0.9248, - "step": 3986 - }, - { - "epoch": 0.1, - "learning_rate": 1.972801843236812e-06, - "loss": 0.8652, - "step": 3987 - }, - { - "epoch": 0.1, - "learning_rate": 1.9727826110562804e-06, - "loss": 1.0176, - "step": 3988 - }, - { - "epoch": 0.1, - "learning_rate": 1.9727633721722955e-06, - "loss": 1.0732, - "step": 3989 - }, - { - "epoch": 0.1, - "learning_rate": 1.9727441265849914e-06, - "loss": 0.9336, - "step": 3990 - }, - { - "epoch": 0.1, - "learning_rate": 1.9727248742945e-06, - "loss": 0.9473, - "step": 3991 - }, - { - "epoch": 0.1, - "learning_rate": 1.972705615300954e-06, - "loss": 1.0498, - "step": 3992 - }, - { - "epoch": 0.1, - "learning_rate": 1.9726863496044864e-06, - "loss": 0.8486, - "step": 3993 - }, - { - "epoch": 0.1, - "learning_rate": 1.97266707720523e-06, - "loss": 1.0439, - "step": 3994 - }, - { - "epoch": 0.1, - "learning_rate": 1.9726477981033168e-06, - "loss": 1.0156, - "step": 3995 - }, - { - "epoch": 0.1, - "learning_rate": 1.9726285122988807e-06, - "loss": 0.9375, - "step": 3996 - }, - { - "epoch": 0.1, - "learning_rate": 1.9726092197920542e-06, - "loss": 0.9775, - "step": 3997 - }, - { - "epoch": 0.1, - "learning_rate": 1.9725899205829703e-06, - "loss": 0.9082, - "step": 3998 - }, - { - "epoch": 0.1, - "learning_rate": 1.9725706146717614e-06, - "loss": 0.9697, - "step": 3999 - }, - { - "epoch": 0.1, - "learning_rate": 1.972551302058562e-06, - "loss": 0.9521, - "step": 4000 - }, - { - "epoch": 0.1, - "learning_rate": 1.9725319827435034e-06, - "loss": 1.0049, - "step": 4001 - }, - { - "epoch": 0.1, - "learning_rate": 1.9725126567267195e-06, - "loss": 0.999, - "step": 4002 - }, - { - "epoch": 0.1, - "learning_rate": 1.9724933240083442e-06, - "loss": 0.8613, - "step": 4003 - }, - { - "epoch": 0.1, - "learning_rate": 1.97247398458851e-06, - "loss": 1.0322, - "step": 4004 - }, - { - "epoch": 0.1, - "learning_rate": 1.9724546384673493e-06, - "loss": 0.8623, - "step": 4005 - }, - { - "epoch": 0.1, - "learning_rate": 1.9724352856449973e-06, - "loss": 1.0869, - "step": 4006 - }, - { - "epoch": 0.1, - "learning_rate": 1.972415926121586e-06, - "loss": 1.0791, - "step": 4007 - }, - { - "epoch": 0.1, - "learning_rate": 1.972396559897249e-06, - "loss": 0.8252, - "step": 4008 - }, - { - "epoch": 0.1, - "learning_rate": 1.9723771869721206e-06, - "loss": 0.9951, - "step": 4009 - }, - { - "epoch": 0.1, - "learning_rate": 1.972357807346333e-06, - "loss": 0.9033, - "step": 4010 - }, - { - "epoch": 0.1, - "learning_rate": 1.972338421020021e-06, - "loss": 0.9199, - "step": 4011 - }, - { - "epoch": 0.1, - "learning_rate": 1.972319027993317e-06, - "loss": 0.8018, - "step": 4012 - }, - { - "epoch": 0.1, - "learning_rate": 1.972299628266356e-06, - "loss": 1.0283, - "step": 4013 - }, - { - "epoch": 0.1, - "learning_rate": 1.97228022183927e-06, - "loss": 0.8584, - "step": 4014 - }, - { - "epoch": 0.1, - "learning_rate": 1.9722608087121945e-06, - "loss": 0.8135, - "step": 4015 - }, - { - "epoch": 0.1, - "learning_rate": 1.972241388885262e-06, - "loss": 1.1162, - "step": 4016 - }, - { - "epoch": 0.1, - "learning_rate": 1.972221962358607e-06, - "loss": 0.7607, - "step": 4017 - }, - { - "epoch": 0.1, - "learning_rate": 1.9722025291323626e-06, - "loss": 1.0449, - "step": 4018 - }, - { - "epoch": 0.1, - "learning_rate": 1.9721830892066637e-06, - "loss": 0.7881, - "step": 4019 - }, - { - "epoch": 0.1, - "learning_rate": 1.972163642581643e-06, - "loss": 0.7793, - "step": 4020 - }, - { - "epoch": 0.1, - "learning_rate": 1.972144189257436e-06, - "loss": 0.8369, - "step": 4021 - }, - { - "epoch": 0.1, - "learning_rate": 1.972124729234176e-06, - "loss": 0.915, - "step": 4022 - }, - { - "epoch": 0.1, - "learning_rate": 1.9721052625119975e-06, - "loss": 0.9043, - "step": 4023 - }, - { - "epoch": 0.1, - "learning_rate": 1.9720857890910338e-06, - "loss": 0.9961, - "step": 4024 - }, - { - "epoch": 0.1, - "learning_rate": 1.972066308971419e-06, - "loss": 0.9932, - "step": 4025 - }, - { - "epoch": 0.1, - "learning_rate": 1.972046822153289e-06, - "loss": 0.8838, - "step": 4026 - }, - { - "epoch": 0.1, - "learning_rate": 1.9720273286367765e-06, - "loss": 0.6909, - "step": 4027 - }, - { - "epoch": 0.1, - "learning_rate": 1.9720078284220167e-06, - "loss": 1.1221, - "step": 4028 - }, - { - "epoch": 0.1, - "learning_rate": 1.9719883215091433e-06, - "loss": 0.9902, - "step": 4029 - }, - { - "epoch": 0.1, - "learning_rate": 1.971968807898291e-06, - "loss": 0.7812, - "step": 4030 - }, - { - "epoch": 0.1, - "learning_rate": 1.971949287589594e-06, - "loss": 1.0889, - "step": 4031 - }, - { - "epoch": 0.1, - "learning_rate": 1.9719297605831878e-06, - "loss": 0.8228, - "step": 4032 - }, - { - "epoch": 0.1, - "learning_rate": 1.971910226879206e-06, - "loss": 0.9961, - "step": 4033 - }, - { - "epoch": 0.1, - "learning_rate": 1.9718906864777838e-06, - "loss": 1.0088, - "step": 4034 - }, - { - "epoch": 0.1, - "learning_rate": 1.971871139379055e-06, - "loss": 0.8945, - "step": 4035 - }, - { - "epoch": 0.1, - "learning_rate": 1.971851585583155e-06, - "loss": 0.8877, - "step": 4036 - }, - { - "epoch": 0.1, - "learning_rate": 1.9718320250902183e-06, - "loss": 0.9531, - "step": 4037 - }, - { - "epoch": 0.1, - "learning_rate": 1.97181245790038e-06, - "loss": 0.873, - "step": 4038 - }, - { - "epoch": 0.1, - "learning_rate": 1.9717928840137744e-06, - "loss": 0.8281, - "step": 4039 - }, - { - "epoch": 0.1, - "learning_rate": 1.971773303430537e-06, - "loss": 0.6963, - "step": 4040 - }, - { - "epoch": 0.1, - "learning_rate": 1.971753716150802e-06, - "loss": 1.0762, - "step": 4041 - }, - { - "epoch": 0.1, - "learning_rate": 1.9717341221747056e-06, - "loss": 1.0059, - "step": 4042 - }, - { - "epoch": 0.1, - "learning_rate": 1.9717145215023818e-06, - "loss": 0.8906, - "step": 4043 - }, - { - "epoch": 0.1, - "learning_rate": 1.971694914133965e-06, - "loss": 1.123, - "step": 4044 - }, - { - "epoch": 0.1, - "learning_rate": 1.971675300069592e-06, - "loss": 1.1104, - "step": 4045 - }, - { - "epoch": 0.1, - "learning_rate": 1.9716556793093974e-06, - "loss": 1.0596, - "step": 4046 - }, - { - "epoch": 0.1, - "learning_rate": 1.9716360518535156e-06, - "loss": 0.833, - "step": 4047 - }, - { - "epoch": 0.1, - "learning_rate": 1.9716164177020828e-06, - "loss": 1.042, - "step": 4048 - }, - { - "epoch": 0.1, - "learning_rate": 1.9715967768552336e-06, - "loss": 0.915, - "step": 4049 - }, - { - "epoch": 0.1, - "learning_rate": 1.9715771293131034e-06, - "loss": 0.9639, - "step": 4050 - }, - { - "epoch": 0.1, - "learning_rate": 1.9715574750758284e-06, - "loss": 0.9453, - "step": 4051 - }, - { - "epoch": 0.1, - "learning_rate": 1.9715378141435435e-06, - "loss": 0.9893, - "step": 4052 - }, - { - "epoch": 0.1, - "learning_rate": 1.971518146516384e-06, - "loss": 0.9365, - "step": 4053 - }, - { - "epoch": 0.1, - "learning_rate": 1.9714984721944856e-06, - "loss": 0.9258, - "step": 4054 - }, - { - "epoch": 0.1, - "learning_rate": 1.9714787911779844e-06, - "loss": 1.1602, - "step": 4055 - }, - { - "epoch": 0.1, - "learning_rate": 1.9714591034670147e-06, - "loss": 1.1182, - "step": 4056 - }, - { - "epoch": 0.1, - "learning_rate": 1.9714394090617136e-06, - "loss": 0.8574, - "step": 4057 - }, - { - "epoch": 0.1, - "learning_rate": 1.9714197079622158e-06, - "loss": 0.9287, - "step": 4058 - }, - { - "epoch": 0.1, - "learning_rate": 1.9714000001686577e-06, - "loss": 0.9258, - "step": 4059 - }, - { - "epoch": 0.1, - "learning_rate": 1.9713802856811744e-06, - "loss": 0.9521, - "step": 4060 - }, - { - "epoch": 0.1, - "learning_rate": 1.971360564499903e-06, - "loss": 0.874, - "step": 4061 - }, - { - "epoch": 0.1, - "learning_rate": 1.971340836624978e-06, - "loss": 0.793, - "step": 4062 - }, - { - "epoch": 0.1, - "learning_rate": 1.9713211020565362e-06, - "loss": 1.1494, - "step": 4063 - }, - { - "epoch": 0.1, - "learning_rate": 1.971301360794713e-06, - "loss": 0.79, - "step": 4064 - }, - { - "epoch": 0.1, - "learning_rate": 1.9712816128396454e-06, - "loss": 0.8965, - "step": 4065 - }, - { - "epoch": 0.1, - "learning_rate": 1.9712618581914684e-06, - "loss": 1.0332, - "step": 4066 - }, - { - "epoch": 0.1, - "learning_rate": 1.971242096850319e-06, - "loss": 0.8359, - "step": 4067 - }, - { - "epoch": 0.1, - "learning_rate": 1.9712223288163326e-06, - "loss": 0.8838, - "step": 4068 - }, - { - "epoch": 0.1, - "learning_rate": 1.971202554089646e-06, - "loss": 0.9189, - "step": 4069 - }, - { - "epoch": 0.1, - "learning_rate": 1.971182772670395e-06, - "loss": 0.7852, - "step": 4070 - }, - { - "epoch": 0.1, - "learning_rate": 1.9711629845587163e-06, - "loss": 0.8828, - "step": 4071 - }, - { - "epoch": 0.1, - "learning_rate": 1.971143189754746e-06, - "loss": 0.8164, - "step": 4072 - }, - { - "epoch": 0.1, - "learning_rate": 1.971123388258621e-06, - "loss": 0.8032, - "step": 4073 - }, - { - "epoch": 0.1, - "learning_rate": 1.9711035800704773e-06, - "loss": 0.8345, - "step": 4074 - }, - { - "epoch": 0.1, - "learning_rate": 1.9710837651904515e-06, - "loss": 0.9355, - "step": 4075 - }, - { - "epoch": 0.1, - "learning_rate": 1.97106394361868e-06, - "loss": 1.042, - "step": 4076 - }, - { - "epoch": 0.1, - "learning_rate": 1.9710441153552993e-06, - "loss": 1.0791, - "step": 4077 - }, - { - "epoch": 0.1, - "learning_rate": 1.971024280400447e-06, - "loss": 0.7861, - "step": 4078 - }, - { - "epoch": 0.1, - "learning_rate": 1.9710044387542583e-06, - "loss": 0.8501, - "step": 4079 - }, - { - "epoch": 0.1, - "learning_rate": 1.970984590416871e-06, - "loss": 0.5171, - "step": 4080 - }, - { - "epoch": 0.1, - "learning_rate": 1.9709647353884217e-06, - "loss": 0.9697, - "step": 4081 - }, - { - "epoch": 0.1, - "learning_rate": 1.970944873669047e-06, - "loss": 0.7319, - "step": 4082 - }, - { - "epoch": 0.1, - "learning_rate": 1.9709250052588838e-06, - "loss": 0.7734, - "step": 4083 - }, - { - "epoch": 0.1, - "learning_rate": 1.970905130158069e-06, - "loss": 0.8809, - "step": 4084 - }, - { - "epoch": 0.1, - "learning_rate": 1.9708852483667393e-06, - "loss": 0.8789, - "step": 4085 - }, - { - "epoch": 0.1, - "learning_rate": 1.970865359885033e-06, - "loss": 0.9688, - "step": 4086 - }, - { - "epoch": 0.1, - "learning_rate": 1.970845464713085e-06, - "loss": 0.7573, - "step": 4087 - }, - { - "epoch": 0.1, - "learning_rate": 1.9708255628510344e-06, - "loss": 1.1367, - "step": 4088 - }, - { - "epoch": 0.1, - "learning_rate": 1.970805654299017e-06, - "loss": 1.0801, - "step": 4089 - }, - { - "epoch": 0.1, - "learning_rate": 1.970785739057171e-06, - "loss": 1.0654, - "step": 4090 - }, - { - "epoch": 0.1, - "learning_rate": 1.9707658171256326e-06, - "loss": 0.8672, - "step": 4091 - }, - { - "epoch": 0.1, - "learning_rate": 1.9707458885045395e-06, - "loss": 1.0713, - "step": 4092 - }, - { - "epoch": 0.1, - "learning_rate": 1.9707259531940295e-06, - "loss": 0.9482, - "step": 4093 - }, - { - "epoch": 0.1, - "learning_rate": 1.97070601119424e-06, - "loss": 0.8809, - "step": 4094 - }, - { - "epoch": 0.1, - "learning_rate": 1.9706860625053078e-06, - "loss": 1.1396, - "step": 4095 - }, - { - "epoch": 0.1, - "learning_rate": 1.97066610712737e-06, - "loss": 0.9102, - "step": 4096 - }, - { - "epoch": 0.11, - "learning_rate": 1.970646145060565e-06, - "loss": 0.8091, - "step": 4097 - }, - { - "epoch": 0.11, - "learning_rate": 1.970626176305031e-06, - "loss": 0.8896, - "step": 4098 - }, - { - "epoch": 0.11, - "learning_rate": 1.970606200860904e-06, - "loss": 0.8682, - "step": 4099 - }, - { - "epoch": 0.11, - "learning_rate": 1.970586218728322e-06, - "loss": 0.7229, - "step": 4100 - }, - { - "epoch": 0.11, - "learning_rate": 1.9705662299074235e-06, - "loss": 0.9893, - "step": 4101 - }, - { - "epoch": 0.11, - "learning_rate": 1.9705462343983454e-06, - "loss": 1.0615, - "step": 4102 - }, - { - "epoch": 0.11, - "learning_rate": 1.970526232201226e-06, - "loss": 1.0566, - "step": 4103 - }, - { - "epoch": 0.11, - "learning_rate": 1.970506223316203e-06, - "loss": 0.8394, - "step": 4104 - }, - { - "epoch": 0.11, - "learning_rate": 1.9704862077434146e-06, - "loss": 0.8198, - "step": 4105 - }, - { - "epoch": 0.11, - "learning_rate": 1.970466185482998e-06, - "loss": 0.7607, - "step": 4106 - }, - { - "epoch": 0.11, - "learning_rate": 1.9704461565350923e-06, - "loss": 0.7827, - "step": 4107 - }, - { - "epoch": 0.11, - "learning_rate": 1.9704261208998337e-06, - "loss": 0.874, - "step": 4108 - }, - { - "epoch": 0.11, - "learning_rate": 1.9704060785773623e-06, - "loss": 0.9248, - "step": 4109 - }, - { - "epoch": 0.11, - "learning_rate": 1.9703860295678147e-06, - "loss": 1.0449, - "step": 4110 - }, - { - "epoch": 0.11, - "learning_rate": 1.97036597387133e-06, - "loss": 1.0264, - "step": 4111 - }, - { - "epoch": 0.11, - "learning_rate": 1.9703459114880458e-06, - "loss": 0.8535, - "step": 4112 - }, - { - "epoch": 0.11, - "learning_rate": 1.970325842418101e-06, - "loss": 0.9912, - "step": 4113 - }, - { - "epoch": 0.11, - "learning_rate": 1.970305766661633e-06, - "loss": 0.917, - "step": 4114 - }, - { - "epoch": 0.11, - "learning_rate": 1.9702856842187807e-06, - "loss": 0.8306, - "step": 4115 - }, - { - "epoch": 0.11, - "learning_rate": 1.970265595089683e-06, - "loss": 0.9561, - "step": 4116 - }, - { - "epoch": 0.11, - "learning_rate": 1.970245499274477e-06, - "loss": 1.0127, - "step": 4117 - }, - { - "epoch": 0.11, - "learning_rate": 1.970225396773302e-06, - "loss": 0.9302, - "step": 4118 - }, - { - "epoch": 0.11, - "learning_rate": 1.9702052875862967e-06, - "loss": 0.6108, - "step": 4119 - }, - { - "epoch": 0.11, - "learning_rate": 1.9701851717135997e-06, - "loss": 1.166, - "step": 4120 - }, - { - "epoch": 0.11, - "learning_rate": 1.970165049155349e-06, - "loss": 0.8994, - "step": 4121 - }, - { - "epoch": 0.11, - "learning_rate": 1.970144919911684e-06, - "loss": 0.9668, - "step": 4122 - }, - { - "epoch": 0.11, - "learning_rate": 1.9701247839827427e-06, - "loss": 0.875, - "step": 4123 - }, - { - "epoch": 0.11, - "learning_rate": 1.970104641368664e-06, - "loss": 0.5879, - "step": 4124 - }, - { - "epoch": 0.11, - "learning_rate": 1.970084492069587e-06, - "loss": 1.083, - "step": 4125 - }, - { - "epoch": 0.11, - "learning_rate": 1.970064336085651e-06, - "loss": 0.9561, - "step": 4126 - }, - { - "epoch": 0.11, - "learning_rate": 1.9700441734169937e-06, - "loss": 0.8184, - "step": 4127 - }, - { - "epoch": 0.11, - "learning_rate": 1.970024004063755e-06, - "loss": 0.8857, - "step": 4128 - }, - { - "epoch": 0.11, - "learning_rate": 1.970003828026073e-06, - "loss": 0.8442, - "step": 4129 - }, - { - "epoch": 0.11, - "learning_rate": 1.969983645304088e-06, - "loss": 0.8438, - "step": 4130 - }, - { - "epoch": 0.11, - "learning_rate": 1.969963455897938e-06, - "loss": 0.9004, - "step": 4131 - }, - { - "epoch": 0.11, - "learning_rate": 1.9699432598077627e-06, - "loss": 0.9053, - "step": 4132 - }, - { - "epoch": 0.11, - "learning_rate": 1.969923057033701e-06, - "loss": 1.0908, - "step": 4133 - }, - { - "epoch": 0.11, - "learning_rate": 1.969902847575892e-06, - "loss": 0.8467, - "step": 4134 - }, - { - "epoch": 0.11, - "learning_rate": 1.9698826314344756e-06, - "loss": 1.0869, - "step": 4135 - }, - { - "epoch": 0.11, - "learning_rate": 1.96986240860959e-06, - "loss": 1.0703, - "step": 4136 - }, - { - "epoch": 0.11, - "learning_rate": 1.969842179101376e-06, - "loss": 1.1797, - "step": 4137 - }, - { - "epoch": 0.11, - "learning_rate": 1.9698219429099713e-06, - "loss": 0.8652, - "step": 4138 - }, - { - "epoch": 0.11, - "learning_rate": 1.969801700035517e-06, - "loss": 0.7227, - "step": 4139 - }, - { - "epoch": 0.11, - "learning_rate": 1.9697814504781514e-06, - "loss": 0.8379, - "step": 4140 - }, - { - "epoch": 0.11, - "learning_rate": 1.969761194238015e-06, - "loss": 0.8564, - "step": 4141 - }, - { - "epoch": 0.11, - "learning_rate": 1.9697409313152465e-06, - "loss": 0.9795, - "step": 4142 - }, - { - "epoch": 0.11, - "learning_rate": 1.969720661709986e-06, - "loss": 0.8955, - "step": 4143 - }, - { - "epoch": 0.11, - "learning_rate": 1.969700385422373e-06, - "loss": 1.0068, - "step": 4144 - }, - { - "epoch": 0.11, - "learning_rate": 1.9696801024525472e-06, - "loss": 1.0479, - "step": 4145 - }, - { - "epoch": 0.11, - "learning_rate": 1.969659812800649e-06, - "loss": 1.0615, - "step": 4146 - }, - { - "epoch": 0.11, - "learning_rate": 1.969639516466817e-06, - "loss": 0.9736, - "step": 4147 - }, - { - "epoch": 0.11, - "learning_rate": 1.9696192134511923e-06, - "loss": 0.8096, - "step": 4148 - }, - { - "epoch": 0.11, - "learning_rate": 1.969598903753914e-06, - "loss": 0.9844, - "step": 4149 - }, - { - "epoch": 0.11, - "learning_rate": 1.969578587375123e-06, - "loss": 0.9385, - "step": 4150 - }, - { - "epoch": 0.11, - "learning_rate": 1.969558264314958e-06, - "loss": 1.0068, - "step": 4151 - }, - { - "epoch": 0.11, - "learning_rate": 1.9695379345735596e-06, - "loss": 0.8867, - "step": 4152 - }, - { - "epoch": 0.11, - "learning_rate": 1.9695175981510684e-06, - "loss": 0.9043, - "step": 4153 - }, - { - "epoch": 0.11, - "learning_rate": 1.969497255047624e-06, - "loss": 0.8574, - "step": 4154 - }, - { - "epoch": 0.11, - "learning_rate": 1.9694769052633666e-06, - "loss": 1.0039, - "step": 4155 - }, - { - "epoch": 0.11, - "learning_rate": 1.9694565487984364e-06, - "loss": 0.9297, - "step": 4156 - }, - { - "epoch": 0.11, - "learning_rate": 1.969436185652974e-06, - "loss": 0.9844, - "step": 4157 - }, - { - "epoch": 0.11, - "learning_rate": 1.9694158158271192e-06, - "loss": 0.96, - "step": 4158 - }, - { - "epoch": 0.11, - "learning_rate": 1.969395439321013e-06, - "loss": 1.0469, - "step": 4159 - }, - { - "epoch": 0.11, - "learning_rate": 1.9693750561347954e-06, - "loss": 0.9756, - "step": 4160 - }, - { - "epoch": 0.11, - "learning_rate": 1.969354666268607e-06, - "loss": 1.0986, - "step": 4161 - }, - { - "epoch": 0.11, - "learning_rate": 1.969334269722588e-06, - "loss": 0.7256, - "step": 4162 - }, - { - "epoch": 0.11, - "learning_rate": 1.9693138664968797e-06, - "loss": 0.9614, - "step": 4163 - }, - { - "epoch": 0.11, - "learning_rate": 1.9692934565916215e-06, - "loss": 0.9912, - "step": 4164 - }, - { - "epoch": 0.11, - "learning_rate": 1.969273040006956e-06, - "loss": 1.1162, - "step": 4165 - }, - { - "epoch": 0.11, - "learning_rate": 1.9692526167430215e-06, - "loss": 0.8979, - "step": 4166 - }, - { - "epoch": 0.11, - "learning_rate": 1.96923218679996e-06, - "loss": 0.877, - "step": 4167 - }, - { - "epoch": 0.11, - "learning_rate": 1.9692117501779127e-06, - "loss": 0.9385, - "step": 4168 - }, - { - "epoch": 0.11, - "learning_rate": 1.9691913068770198e-06, - "loss": 0.731, - "step": 4169 - }, - { - "epoch": 0.11, - "learning_rate": 1.9691708568974224e-06, - "loss": 1.1953, - "step": 4170 - }, - { - "epoch": 0.11, - "learning_rate": 1.9691504002392608e-06, - "loss": 1.0586, - "step": 4171 - }, - { - "epoch": 0.11, - "learning_rate": 1.9691299369026767e-06, - "loss": 0.9844, - "step": 4172 - }, - { - "epoch": 0.11, - "learning_rate": 1.969109466887811e-06, - "loss": 0.9229, - "step": 4173 - }, - { - "epoch": 0.11, - "learning_rate": 1.969088990194805e-06, - "loss": 1.0283, - "step": 4174 - }, - { - "epoch": 0.11, - "learning_rate": 1.9690685068237986e-06, - "loss": 0.8535, - "step": 4175 - }, - { - "epoch": 0.11, - "learning_rate": 1.9690480167749346e-06, - "loss": 0.875, - "step": 4176 - }, - { - "epoch": 0.11, - "learning_rate": 1.969027520048353e-06, - "loss": 0.9121, - "step": 4177 - }, - { - "epoch": 0.11, - "learning_rate": 1.9690070166441954e-06, - "loss": 0.9619, - "step": 4178 - }, - { - "epoch": 0.11, - "learning_rate": 1.968986506562603e-06, - "loss": 0.9756, - "step": 4179 - }, - { - "epoch": 0.11, - "learning_rate": 1.9689659898037173e-06, - "loss": 0.9092, - "step": 4180 - }, - { - "epoch": 0.11, - "learning_rate": 1.96894546636768e-06, - "loss": 0.7373, - "step": 4181 - }, - { - "epoch": 0.11, - "learning_rate": 1.968924936254632e-06, - "loss": 0.9287, - "step": 4182 - }, - { - "epoch": 0.11, - "learning_rate": 1.9689043994647148e-06, - "loss": 0.9824, - "step": 4183 - }, - { - "epoch": 0.11, - "learning_rate": 1.9688838559980702e-06, - "loss": 0.9951, - "step": 4184 - }, - { - "epoch": 0.11, - "learning_rate": 1.9688633058548397e-06, - "loss": 0.9268, - "step": 4185 - }, - { - "epoch": 0.11, - "learning_rate": 1.968842749035165e-06, - "loss": 0.9668, - "step": 4186 - }, - { - "epoch": 0.11, - "learning_rate": 1.9688221855391873e-06, - "loss": 0.8438, - "step": 4187 - }, - { - "epoch": 0.11, - "learning_rate": 1.9688016153670483e-06, - "loss": 0.7729, - "step": 4188 - }, - { - "epoch": 0.11, - "learning_rate": 1.9687810385188904e-06, - "loss": 0.7739, - "step": 4189 - }, - { - "epoch": 0.11, - "learning_rate": 1.968760454994855e-06, - "loss": 0.8457, - "step": 4190 - }, - { - "epoch": 0.11, - "learning_rate": 1.968739864795084e-06, - "loss": 0.6318, - "step": 4191 - }, - { - "epoch": 0.11, - "learning_rate": 1.9687192679197194e-06, - "loss": 0.7949, - "step": 4192 - }, - { - "epoch": 0.11, - "learning_rate": 1.9686986643689033e-06, - "loss": 0.9941, - "step": 4193 - }, - { - "epoch": 0.11, - "learning_rate": 1.968678054142777e-06, - "loss": 0.7578, - "step": 4194 - }, - { - "epoch": 0.11, - "learning_rate": 1.9686574372414827e-06, - "loss": 0.7505, - "step": 4195 - }, - { - "epoch": 0.11, - "learning_rate": 1.968636813665163e-06, - "loss": 1.0195, - "step": 4196 - }, - { - "epoch": 0.11, - "learning_rate": 1.9686161834139594e-06, - "loss": 0.9824, - "step": 4197 - }, - { - "epoch": 0.11, - "learning_rate": 1.9685955464880145e-06, - "loss": 1.0107, - "step": 4198 - }, - { - "epoch": 0.11, - "learning_rate": 1.9685749028874706e-06, - "loss": 0.9053, - "step": 4199 - }, - { - "epoch": 0.11, - "learning_rate": 1.9685542526124698e-06, - "loss": 0.7881, - "step": 4200 - }, - { - "epoch": 0.11, - "learning_rate": 1.968533595663154e-06, - "loss": 0.7734, - "step": 4201 - }, - { - "epoch": 0.11, - "learning_rate": 1.968512932039666e-06, - "loss": 1.0234, - "step": 4202 - }, - { - "epoch": 0.11, - "learning_rate": 1.968492261742148e-06, - "loss": 0.9424, - "step": 4203 - }, - { - "epoch": 0.11, - "learning_rate": 1.9684715847707425e-06, - "loss": 0.9141, - "step": 4204 - }, - { - "epoch": 0.11, - "learning_rate": 1.968450901125592e-06, - "loss": 1.0635, - "step": 4205 - }, - { - "epoch": 0.11, - "learning_rate": 1.9684302108068393e-06, - "loss": 1.0596, - "step": 4206 - }, - { - "epoch": 0.11, - "learning_rate": 1.968409513814626e-06, - "loss": 0.8389, - "step": 4207 - }, - { - "epoch": 0.11, - "learning_rate": 1.9683888101490964e-06, - "loss": 1.0693, - "step": 4208 - }, - { - "epoch": 0.11, - "learning_rate": 1.9683680998103912e-06, - "loss": 0.8076, - "step": 4209 - }, - { - "epoch": 0.11, - "learning_rate": 1.9683473827986547e-06, - "loss": 0.9678, - "step": 4210 - }, - { - "epoch": 0.11, - "learning_rate": 1.968326659114029e-06, - "loss": 1.0166, - "step": 4211 - }, - { - "epoch": 0.11, - "learning_rate": 1.968305928756657e-06, - "loss": 0.877, - "step": 4212 - }, - { - "epoch": 0.11, - "learning_rate": 1.9682851917266815e-06, - "loss": 0.9639, - "step": 4213 - }, - { - "epoch": 0.11, - "learning_rate": 1.968264448024245e-06, - "loss": 0.9414, - "step": 4214 - }, - { - "epoch": 0.11, - "learning_rate": 1.968243697649492e-06, - "loss": 0.9199, - "step": 4215 - }, - { - "epoch": 0.11, - "learning_rate": 1.9682229406025634e-06, - "loss": 0.8164, - "step": 4216 - }, - { - "epoch": 0.11, - "learning_rate": 1.968202176883603e-06, - "loss": 0.9258, - "step": 4217 - }, - { - "epoch": 0.11, - "learning_rate": 1.968181406492755e-06, - "loss": 0.8662, - "step": 4218 - }, - { - "epoch": 0.11, - "learning_rate": 1.968160629430161e-06, - "loss": 0.894, - "step": 4219 - }, - { - "epoch": 0.11, - "learning_rate": 1.968139845695965e-06, - "loss": 1.1016, - "step": 4220 - }, - { - "epoch": 0.11, - "learning_rate": 1.9681190552903096e-06, - "loss": 0.8984, - "step": 4221 - }, - { - "epoch": 0.11, - "learning_rate": 1.968098258213339e-06, - "loss": 1.0225, - "step": 4222 - }, - { - "epoch": 0.11, - "learning_rate": 1.9680774544651956e-06, - "loss": 0.7485, - "step": 4223 - }, - { - "epoch": 0.11, - "learning_rate": 1.9680566440460237e-06, - "loss": 0.7822, - "step": 4224 - }, - { - "epoch": 0.11, - "learning_rate": 1.968035826955966e-06, - "loss": 0.8774, - "step": 4225 - }, - { - "epoch": 0.11, - "learning_rate": 1.9680150031951657e-06, - "loss": 1.0625, - "step": 4226 - }, - { - "epoch": 0.11, - "learning_rate": 1.9679941727637667e-06, - "loss": 1.0195, - "step": 4227 - }, - { - "epoch": 0.11, - "learning_rate": 1.967973335661913e-06, - "loss": 0.8022, - "step": 4228 - }, - { - "epoch": 0.11, - "learning_rate": 1.9679524918897473e-06, - "loss": 0.606, - "step": 4229 - }, - { - "epoch": 0.11, - "learning_rate": 1.967931641447414e-06, - "loss": 1.0977, - "step": 4230 - }, - { - "epoch": 0.11, - "learning_rate": 1.967910784335056e-06, - "loss": 0.9805, - "step": 4231 - }, - { - "epoch": 0.11, - "learning_rate": 1.967889920552818e-06, - "loss": 0.9307, - "step": 4232 - }, - { - "epoch": 0.11, - "learning_rate": 1.967869050100843e-06, - "loss": 0.9131, - "step": 4233 - }, - { - "epoch": 0.11, - "learning_rate": 1.967848172979275e-06, - "loss": 0.999, - "step": 4234 - }, - { - "epoch": 0.11, - "learning_rate": 1.967827289188258e-06, - "loss": 0.9873, - "step": 4235 - }, - { - "epoch": 0.11, - "learning_rate": 1.967806398727936e-06, - "loss": 0.8105, - "step": 4236 - }, - { - "epoch": 0.11, - "learning_rate": 1.9677855015984528e-06, - "loss": 0.9258, - "step": 4237 - }, - { - "epoch": 0.11, - "learning_rate": 1.967764597799952e-06, - "loss": 0.8042, - "step": 4238 - }, - { - "epoch": 0.11, - "learning_rate": 1.967743687332578e-06, - "loss": 0.959, - "step": 4239 - }, - { - "epoch": 0.11, - "learning_rate": 1.9677227701964757e-06, - "loss": 0.9199, - "step": 4240 - }, - { - "epoch": 0.11, - "learning_rate": 1.967701846391788e-06, - "loss": 0.8174, - "step": 4241 - }, - { - "epoch": 0.11, - "learning_rate": 1.9676809159186595e-06, - "loss": 1.0625, - "step": 4242 - }, - { - "epoch": 0.11, - "learning_rate": 1.9676599787772346e-06, - "loss": 0.9053, - "step": 4243 - }, - { - "epoch": 0.11, - "learning_rate": 1.9676390349676576e-06, - "loss": 1.0273, - "step": 4244 - }, - { - "epoch": 0.11, - "learning_rate": 1.9676180844900725e-06, - "loss": 0.8516, - "step": 4245 - }, - { - "epoch": 0.11, - "learning_rate": 1.9675971273446237e-06, - "loss": 0.8772, - "step": 4246 - }, - { - "epoch": 0.11, - "learning_rate": 1.967576163531456e-06, - "loss": 1.1572, - "step": 4247 - }, - { - "epoch": 0.11, - "learning_rate": 1.967555193050714e-06, - "loss": 0.917, - "step": 4248 - }, - { - "epoch": 0.11, - "learning_rate": 1.967534215902541e-06, - "loss": 1.0107, - "step": 4249 - }, - { - "epoch": 0.11, - "learning_rate": 1.967513232087083e-06, - "loss": 1.0303, - "step": 4250 - }, - { - "epoch": 0.11, - "learning_rate": 1.967492241604484e-06, - "loss": 0.9229, - "step": 4251 - }, - { - "epoch": 0.11, - "learning_rate": 1.967471244454889e-06, - "loss": 1.0859, - "step": 4252 - }, - { - "epoch": 0.11, - "learning_rate": 1.9674502406384415e-06, - "loss": 1.0605, - "step": 4253 - }, - { - "epoch": 0.11, - "learning_rate": 1.9674292301552878e-06, - "loss": 0.9468, - "step": 4254 - }, - { - "epoch": 0.11, - "learning_rate": 1.9674082130055714e-06, - "loss": 1.291, - "step": 4255 - }, - { - "epoch": 0.11, - "learning_rate": 1.967387189189438e-06, - "loss": 1.082, - "step": 4256 - }, - { - "epoch": 0.11, - "learning_rate": 1.9673661587070326e-06, - "loss": 1.0449, - "step": 4257 - }, - { - "epoch": 0.11, - "learning_rate": 1.967345121558499e-06, - "loss": 0.9941, - "step": 4258 - }, - { - "epoch": 0.11, - "learning_rate": 1.967324077743983e-06, - "loss": 1.1279, - "step": 4259 - }, - { - "epoch": 0.11, - "learning_rate": 1.9673030272636295e-06, - "loss": 0.7354, - "step": 4260 - }, - { - "epoch": 0.11, - "learning_rate": 1.9672819701175837e-06, - "loss": 0.9336, - "step": 4261 - }, - { - "epoch": 0.11, - "learning_rate": 1.9672609063059907e-06, - "loss": 0.9531, - "step": 4262 - }, - { - "epoch": 0.11, - "learning_rate": 1.967239835828995e-06, - "loss": 0.7742, - "step": 4263 - }, - { - "epoch": 0.11, - "learning_rate": 1.9672187586867426e-06, - "loss": 0.752, - "step": 4264 - }, - { - "epoch": 0.11, - "learning_rate": 1.9671976748793784e-06, - "loss": 0.8975, - "step": 4265 - }, - { - "epoch": 0.11, - "learning_rate": 1.9671765844070478e-06, - "loss": 0.9912, - "step": 4266 - }, - { - "epoch": 0.11, - "learning_rate": 1.967155487269896e-06, - "loss": 0.7002, - "step": 4267 - }, - { - "epoch": 0.11, - "learning_rate": 1.967134383468068e-06, - "loss": 0.9795, - "step": 4268 - }, - { - "epoch": 0.11, - "learning_rate": 1.96711327300171e-06, - "loss": 1.043, - "step": 4269 - }, - { - "epoch": 0.11, - "learning_rate": 1.9670921558709673e-06, - "loss": 0.7002, - "step": 4270 - }, - { - "epoch": 0.11, - "learning_rate": 1.967071032075985e-06, - "loss": 1.1182, - "step": 4271 - }, - { - "epoch": 0.11, - "learning_rate": 1.967049901616909e-06, - "loss": 0.9805, - "step": 4272 - }, - { - "epoch": 0.11, - "learning_rate": 1.967028764493885e-06, - "loss": 1.2305, - "step": 4273 - }, - { - "epoch": 0.11, - "learning_rate": 1.9670076207070583e-06, - "loss": 0.8701, - "step": 4274 - }, - { - "epoch": 0.11, - "learning_rate": 1.9669864702565746e-06, - "loss": 1.0898, - "step": 4275 - }, - { - "epoch": 0.11, - "learning_rate": 1.96696531314258e-06, - "loss": 0.7871, - "step": 4276 - }, - { - "epoch": 0.11, - "learning_rate": 1.9669441493652204e-06, - "loss": 0.9797, - "step": 4277 - }, - { - "epoch": 0.11, - "learning_rate": 1.966922978924641e-06, - "loss": 0.9766, - "step": 4278 - }, - { - "epoch": 0.11, - "learning_rate": 1.966901801820988e-06, - "loss": 0.8799, - "step": 4279 - }, - { - "epoch": 0.11, - "learning_rate": 1.9668806180544074e-06, - "loss": 1.0547, - "step": 4280 - }, - { - "epoch": 0.11, - "learning_rate": 1.9668594276250456e-06, - "loss": 0.7957, - "step": 4281 - }, - { - "epoch": 0.11, - "learning_rate": 1.966838230533048e-06, - "loss": 0.9912, - "step": 4282 - }, - { - "epoch": 0.11, - "learning_rate": 1.9668170267785606e-06, - "loss": 1.0234, - "step": 4283 - }, - { - "epoch": 0.11, - "learning_rate": 1.9667958163617297e-06, - "loss": 0.9336, - "step": 4284 - }, - { - "epoch": 0.11, - "learning_rate": 1.9667745992827017e-06, - "loss": 0.918, - "step": 4285 - }, - { - "epoch": 0.11, - "learning_rate": 1.9667533755416224e-06, - "loss": 0.7212, - "step": 4286 - }, - { - "epoch": 0.11, - "learning_rate": 1.9667321451386387e-06, - "loss": 0.5596, - "step": 4287 - }, - { - "epoch": 0.11, - "learning_rate": 1.9667109080738963e-06, - "loss": 0.9756, - "step": 4288 - }, - { - "epoch": 0.11, - "learning_rate": 1.966689664347542e-06, - "loss": 0.8882, - "step": 4289 - }, - { - "epoch": 0.11, - "learning_rate": 1.966668413959721e-06, - "loss": 1.0371, - "step": 4290 - }, - { - "epoch": 0.11, - "learning_rate": 1.966647156910582e-06, - "loss": 0.8398, - "step": 4291 - }, - { - "epoch": 0.11, - "learning_rate": 1.9666258932002692e-06, - "loss": 0.9688, - "step": 4292 - }, - { - "epoch": 0.11, - "learning_rate": 1.9666046228289306e-06, - "loss": 0.9736, - "step": 4293 - }, - { - "epoch": 0.11, - "learning_rate": 1.9665833457967115e-06, - "loss": 1.0684, - "step": 4294 - }, - { - "epoch": 0.11, - "learning_rate": 1.96656206210376e-06, - "loss": 0.7754, - "step": 4295 - }, - { - "epoch": 0.11, - "learning_rate": 1.9665407717502217e-06, - "loss": 0.8623, - "step": 4296 - }, - { - "epoch": 0.11, - "learning_rate": 1.966519474736244e-06, - "loss": 1.0107, - "step": 4297 - }, - { - "epoch": 0.11, - "learning_rate": 1.9664981710619727e-06, - "loss": 1.0234, - "step": 4298 - }, - { - "epoch": 0.11, - "learning_rate": 1.9664768607275556e-06, - "loss": 1.043, - "step": 4299 - }, - { - "epoch": 0.11, - "learning_rate": 1.966455543733139e-06, - "loss": 0.8408, - "step": 4300 - }, - { - "epoch": 0.11, - "learning_rate": 1.9664342200788697e-06, - "loss": 0.9243, - "step": 4301 - }, - { - "epoch": 0.11, - "learning_rate": 1.9664128897648953e-06, - "loss": 0.9922, - "step": 4302 - }, - { - "epoch": 0.11, - "learning_rate": 1.9663915527913623e-06, - "loss": 0.9316, - "step": 4303 - }, - { - "epoch": 0.11, - "learning_rate": 1.966370209158418e-06, - "loss": 1.0244, - "step": 4304 - }, - { - "epoch": 0.11, - "learning_rate": 1.966348858866209e-06, - "loss": 0.9316, - "step": 4305 - }, - { - "epoch": 0.11, - "learning_rate": 1.9663275019148827e-06, - "loss": 1.0107, - "step": 4306 - }, - { - "epoch": 0.11, - "learning_rate": 1.9663061383045864e-06, - "loss": 1.0469, - "step": 4307 - }, - { - "epoch": 0.11, - "learning_rate": 1.966284768035467e-06, - "loss": 0.7871, - "step": 4308 - }, - { - "epoch": 0.11, - "learning_rate": 1.9662633911076723e-06, - "loss": 0.9307, - "step": 4309 - }, - { - "epoch": 0.11, - "learning_rate": 1.966242007521349e-06, - "loss": 1.0068, - "step": 4310 - }, - { - "epoch": 0.11, - "learning_rate": 1.966220617276645e-06, - "loss": 0.9229, - "step": 4311 - }, - { - "epoch": 0.11, - "learning_rate": 1.966199220373707e-06, - "loss": 0.7954, - "step": 4312 - }, - { - "epoch": 0.11, - "learning_rate": 1.966177816812683e-06, - "loss": 1.0498, - "step": 4313 - }, - { - "epoch": 0.11, - "learning_rate": 1.9661564065937205e-06, - "loss": 0.8594, - "step": 4314 - }, - { - "epoch": 0.11, - "learning_rate": 1.966134989716967e-06, - "loss": 0.832, - "step": 4315 - }, - { - "epoch": 0.11, - "learning_rate": 1.96611356618257e-06, - "loss": 1.0068, - "step": 4316 - }, - { - "epoch": 0.11, - "learning_rate": 1.966092135990677e-06, - "loss": 0.981, - "step": 4317 - }, - { - "epoch": 0.11, - "learning_rate": 1.966070699141436e-06, - "loss": 0.915, - "step": 4318 - }, - { - "epoch": 0.11, - "learning_rate": 1.9660492556349943e-06, - "loss": 0.7178, - "step": 4319 - }, - { - "epoch": 0.11, - "learning_rate": 1.9660278054714995e-06, - "loss": 0.9521, - "step": 4320 - }, - { - "epoch": 0.11, - "learning_rate": 1.9660063486511003e-06, - "loss": 0.8682, - "step": 4321 - }, - { - "epoch": 0.11, - "learning_rate": 1.965984885173944e-06, - "loss": 0.7876, - "step": 4322 - }, - { - "epoch": 0.11, - "learning_rate": 1.9659634150401784e-06, - "loss": 1.0752, - "step": 4323 - }, - { - "epoch": 0.11, - "learning_rate": 1.9659419382499518e-06, - "loss": 0.873, - "step": 4324 - }, - { - "epoch": 0.11, - "learning_rate": 1.965920454803412e-06, - "loss": 0.9727, - "step": 4325 - }, - { - "epoch": 0.11, - "learning_rate": 1.965898964700707e-06, - "loss": 1.0068, - "step": 4326 - }, - { - "epoch": 0.11, - "learning_rate": 1.965877467941985e-06, - "loss": 0.8013, - "step": 4327 - }, - { - "epoch": 0.11, - "learning_rate": 1.9658559645273937e-06, - "loss": 0.7939, - "step": 4328 - }, - { - "epoch": 0.11, - "learning_rate": 1.965834454457082e-06, - "loss": 0.8613, - "step": 4329 - }, - { - "epoch": 0.11, - "learning_rate": 1.9658129377311975e-06, - "loss": 0.8359, - "step": 4330 - }, - { - "epoch": 0.11, - "learning_rate": 1.9657914143498893e-06, - "loss": 0.75, - "step": 4331 - }, - { - "epoch": 0.11, - "learning_rate": 1.9657698843133047e-06, - "loss": 0.833, - "step": 4332 - }, - { - "epoch": 0.11, - "learning_rate": 1.965748347621593e-06, - "loss": 0.7847, - "step": 4333 - }, - { - "epoch": 0.11, - "learning_rate": 1.9657268042749015e-06, - "loss": 0.9785, - "step": 4334 - }, - { - "epoch": 0.11, - "learning_rate": 1.9657052542733793e-06, - "loss": 0.9102, - "step": 4335 - }, - { - "epoch": 0.11, - "learning_rate": 1.9656836976171754e-06, - "loss": 1.335, - "step": 4336 - }, - { - "epoch": 0.11, - "learning_rate": 1.9656621343064376e-06, - "loss": 0.9014, - "step": 4337 - }, - { - "epoch": 0.11, - "learning_rate": 1.965640564341315e-06, - "loss": 0.9253, - "step": 4338 - }, - { - "epoch": 0.11, - "learning_rate": 1.9656189877219556e-06, - "loss": 0.9023, - "step": 4339 - }, - { - "epoch": 0.11, - "learning_rate": 1.965597404448509e-06, - "loss": 0.8857, - "step": 4340 - }, - { - "epoch": 0.11, - "learning_rate": 1.9655758145211226e-06, - "loss": 0.7158, - "step": 4341 - }, - { - "epoch": 0.11, - "learning_rate": 1.9655542179399467e-06, - "loss": 1.0186, - "step": 4342 - }, - { - "epoch": 0.11, - "learning_rate": 1.9655326147051287e-06, - "loss": 1.1797, - "step": 4343 - }, - { - "epoch": 0.11, - "learning_rate": 1.9655110048168186e-06, - "loss": 0.8462, - "step": 4344 - }, - { - "epoch": 0.11, - "learning_rate": 1.9654893882751647e-06, - "loss": 1.0371, - "step": 4345 - }, - { - "epoch": 0.11, - "learning_rate": 1.965467765080316e-06, - "loss": 0.749, - "step": 4346 - }, - { - "epoch": 0.11, - "learning_rate": 1.965446135232422e-06, - "loss": 0.8506, - "step": 4347 - }, - { - "epoch": 0.11, - "learning_rate": 1.9654244987316315e-06, - "loss": 1.0898, - "step": 4348 - }, - { - "epoch": 0.11, - "learning_rate": 1.9654028555780934e-06, - "loss": 0.7068, - "step": 4349 - }, - { - "epoch": 0.11, - "learning_rate": 1.9653812057719564e-06, - "loss": 0.9102, - "step": 4350 - }, - { - "epoch": 0.11, - "learning_rate": 1.965359549313371e-06, - "loss": 0.9521, - "step": 4351 - }, - { - "epoch": 0.11, - "learning_rate": 1.965337886202485e-06, - "loss": 0.9463, - "step": 4352 - }, - { - "epoch": 0.11, - "learning_rate": 1.9653162164394487e-06, - "loss": 0.7939, - "step": 4353 - }, - { - "epoch": 0.11, - "learning_rate": 1.965294540024411e-06, - "loss": 0.915, - "step": 4354 - }, - { - "epoch": 0.11, - "learning_rate": 1.965272856957521e-06, - "loss": 0.9463, - "step": 4355 - }, - { - "epoch": 0.11, - "learning_rate": 1.9652511672389286e-06, - "loss": 1.0742, - "step": 4356 - }, - { - "epoch": 0.11, - "learning_rate": 1.9652294708687833e-06, - "loss": 0.8271, - "step": 4357 - }, - { - "epoch": 0.11, - "learning_rate": 1.9652077678472347e-06, - "loss": 1.1113, - "step": 4358 - }, - { - "epoch": 0.11, - "learning_rate": 1.9651860581744315e-06, - "loss": 1.0225, - "step": 4359 - }, - { - "epoch": 0.11, - "learning_rate": 1.965164341850524e-06, - "loss": 0.8398, - "step": 4360 - }, - { - "epoch": 0.11, - "learning_rate": 1.965142618875662e-06, - "loss": 0.8193, - "step": 4361 - }, - { - "epoch": 0.11, - "learning_rate": 1.9651208892499945e-06, - "loss": 1.0479, - "step": 4362 - }, - { - "epoch": 0.11, - "learning_rate": 1.9650991529736723e-06, - "loss": 0.8623, - "step": 4363 - }, - { - "epoch": 0.11, - "learning_rate": 1.965077410046844e-06, - "loss": 0.8809, - "step": 4364 - }, - { - "epoch": 0.11, - "learning_rate": 1.96505566046966e-06, - "loss": 0.7996, - "step": 4365 - }, - { - "epoch": 0.11, - "learning_rate": 1.9650339042422705e-06, - "loss": 0.9121, - "step": 4366 - }, - { - "epoch": 0.11, - "learning_rate": 1.965012141364825e-06, - "loss": 0.6411, - "step": 4367 - }, - { - "epoch": 0.11, - "learning_rate": 1.9649903718374735e-06, - "loss": 0.8315, - "step": 4368 - }, - { - "epoch": 0.11, - "learning_rate": 1.964968595660366e-06, - "loss": 1.0449, - "step": 4369 - }, - { - "epoch": 0.11, - "learning_rate": 1.964946812833653e-06, - "loss": 0.9277, - "step": 4370 - }, - { - "epoch": 0.11, - "learning_rate": 1.9649250233574833e-06, - "loss": 1.0576, - "step": 4371 - }, - { - "epoch": 0.11, - "learning_rate": 1.9649032272320087e-06, - "loss": 1.083, - "step": 4372 - }, - { - "epoch": 0.11, - "learning_rate": 1.9648814244573783e-06, - "loss": 1.0371, - "step": 4373 - }, - { - "epoch": 0.11, - "learning_rate": 1.964859615033743e-06, - "loss": 0.9893, - "step": 4374 - }, - { - "epoch": 0.11, - "learning_rate": 1.9648377989612527e-06, - "loss": 0.9736, - "step": 4375 - }, - { - "epoch": 0.11, - "learning_rate": 1.9648159762400578e-06, - "loss": 0.9004, - "step": 4376 - }, - { - "epoch": 0.11, - "learning_rate": 1.9647941468703085e-06, - "loss": 1.0762, - "step": 4377 - }, - { - "epoch": 0.11, - "learning_rate": 1.9647723108521557e-06, - "loss": 1.0322, - "step": 4378 - }, - { - "epoch": 0.11, - "learning_rate": 1.96475046818575e-06, - "loss": 0.9692, - "step": 4379 - }, - { - "epoch": 0.11, - "learning_rate": 1.964728618871241e-06, - "loss": 0.8643, - "step": 4380 - }, - { - "epoch": 0.11, - "learning_rate": 1.96470676290878e-06, - "loss": 1.0488, - "step": 4381 - }, - { - "epoch": 0.11, - "learning_rate": 1.964684900298517e-06, - "loss": 1.001, - "step": 4382 - }, - { - "epoch": 0.11, - "learning_rate": 1.9646630310406036e-06, - "loss": 0.9492, - "step": 4383 - }, - { - "epoch": 0.11, - "learning_rate": 1.96464115513519e-06, - "loss": 0.6587, - "step": 4384 - }, - { - "epoch": 0.11, - "learning_rate": 1.9646192725824265e-06, - "loss": 0.958, - "step": 4385 - }, - { - "epoch": 0.11, - "learning_rate": 1.9645973833824647e-06, - "loss": 0.9258, - "step": 4386 - }, - { - "epoch": 0.11, - "learning_rate": 1.964575487535455e-06, - "loss": 0.6914, - "step": 4387 - }, - { - "epoch": 0.11, - "learning_rate": 1.964553585041548e-06, - "loss": 1.1113, - "step": 4388 - }, - { - "epoch": 0.11, - "learning_rate": 1.964531675900895e-06, - "loss": 1.0508, - "step": 4389 - }, - { - "epoch": 0.11, - "learning_rate": 1.9645097601136475e-06, - "loss": 0.998, - "step": 4390 - }, - { - "epoch": 0.11, - "learning_rate": 1.9644878376799555e-06, - "loss": 1.001, - "step": 4391 - }, - { - "epoch": 0.11, - "learning_rate": 1.9644659085999704e-06, - "loss": 1.04, - "step": 4392 - }, - { - "epoch": 0.11, - "learning_rate": 1.9644439728738437e-06, - "loss": 1.0615, - "step": 4393 - }, - { - "epoch": 0.11, - "learning_rate": 1.9644220305017263e-06, - "loss": 0.9648, - "step": 4394 - }, - { - "epoch": 0.11, - "learning_rate": 1.9644000814837693e-06, - "loss": 1.0234, - "step": 4395 - }, - { - "epoch": 0.11, - "learning_rate": 1.964378125820124e-06, - "loss": 1.0264, - "step": 4396 - }, - { - "epoch": 0.11, - "learning_rate": 1.9643561635109414e-06, - "loss": 0.8701, - "step": 4397 - }, - { - "epoch": 0.11, - "learning_rate": 1.964334194556374e-06, - "loss": 0.8916, - "step": 4398 - }, - { - "epoch": 0.11, - "learning_rate": 1.964312218956572e-06, - "loss": 1.0205, - "step": 4399 - }, - { - "epoch": 0.11, - "learning_rate": 1.964290236711687e-06, - "loss": 0.7769, - "step": 4400 - }, - { - "epoch": 0.11, - "learning_rate": 1.964268247821871e-06, - "loss": 0.6143, - "step": 4401 - }, - { - "epoch": 0.11, - "learning_rate": 1.9642462522872753e-06, - "loss": 1.0361, - "step": 4402 - }, - { - "epoch": 0.11, - "learning_rate": 1.964224250108051e-06, - "loss": 0.9717, - "step": 4403 - }, - { - "epoch": 0.11, - "learning_rate": 1.9642022412843504e-06, - "loss": 0.9336, - "step": 4404 - }, - { - "epoch": 0.11, - "learning_rate": 1.9641802258163245e-06, - "loss": 1.0068, - "step": 4405 - }, - { - "epoch": 0.11, - "learning_rate": 1.9641582037041257e-06, - "loss": 1.0283, - "step": 4406 - }, - { - "epoch": 0.11, - "learning_rate": 1.9641361749479054e-06, - "loss": 1.0059, - "step": 4407 - }, - { - "epoch": 0.11, - "learning_rate": 1.9641141395478157e-06, - "loss": 0.8994, - "step": 4408 - }, - { - "epoch": 0.11, - "learning_rate": 1.964092097504008e-06, - "loss": 1.207, - "step": 4409 - }, - { - "epoch": 0.11, - "learning_rate": 1.9640700488166344e-06, - "loss": 0.9023, - "step": 4410 - }, - { - "epoch": 0.11, - "learning_rate": 1.9640479934858463e-06, - "loss": 1.0703, - "step": 4411 - }, - { - "epoch": 0.11, - "learning_rate": 1.9640259315117967e-06, - "loss": 0.9844, - "step": 4412 - }, - { - "epoch": 0.11, - "learning_rate": 1.964003862894637e-06, - "loss": 1.0625, - "step": 4413 - }, - { - "epoch": 0.11, - "learning_rate": 1.9639817876345194e-06, - "loss": 0.9414, - "step": 4414 - }, - { - "epoch": 0.11, - "learning_rate": 1.9639597057315963e-06, - "loss": 1.0703, - "step": 4415 - }, - { - "epoch": 0.11, - "learning_rate": 1.963937617186019e-06, - "loss": 0.8267, - "step": 4416 - }, - { - "epoch": 0.11, - "learning_rate": 1.963915521997941e-06, - "loss": 0.6824, - "step": 4417 - }, - { - "epoch": 0.11, - "learning_rate": 1.9638934201675133e-06, - "loss": 1.0137, - "step": 4418 - }, - { - "epoch": 0.11, - "learning_rate": 1.9638713116948886e-06, - "loss": 1.0693, - "step": 4419 - }, - { - "epoch": 0.11, - "learning_rate": 1.96384919658022e-06, - "loss": 1.04, - "step": 4420 - }, - { - "epoch": 0.11, - "learning_rate": 1.963827074823659e-06, - "loss": 0.833, - "step": 4421 - }, - { - "epoch": 0.11, - "learning_rate": 1.9638049464253584e-06, - "loss": 1.0342, - "step": 4422 - }, - { - "epoch": 0.11, - "learning_rate": 1.963782811385471e-06, - "loss": 1.1064, - "step": 4423 - }, - { - "epoch": 0.11, - "learning_rate": 1.9637606697041483e-06, - "loss": 0.8237, - "step": 4424 - }, - { - "epoch": 0.11, - "learning_rate": 1.9637385213815437e-06, - "loss": 0.7256, - "step": 4425 - }, - { - "epoch": 0.11, - "learning_rate": 1.96371636641781e-06, - "loss": 1.0205, - "step": 4426 - }, - { - "epoch": 0.11, - "learning_rate": 1.963694204813099e-06, - "loss": 0.876, - "step": 4427 - }, - { - "epoch": 0.11, - "learning_rate": 1.9636720365675647e-06, - "loss": 0.9658, - "step": 4428 - }, - { - "epoch": 0.11, - "learning_rate": 1.963649861681359e-06, - "loss": 0.6602, - "step": 4429 - }, - { - "epoch": 0.11, - "learning_rate": 1.963627680154634e-06, - "loss": 0.7637, - "step": 4430 - }, - { - "epoch": 0.11, - "learning_rate": 1.963605491987544e-06, - "loss": 1.0029, - "step": 4431 - }, - { - "epoch": 0.11, - "learning_rate": 1.9635832971802414e-06, - "loss": 1.0508, - "step": 4432 - }, - { - "epoch": 0.11, - "learning_rate": 1.963561095732879e-06, - "loss": 0.9639, - "step": 4433 - }, - { - "epoch": 0.11, - "learning_rate": 1.9635388876456094e-06, - "loss": 0.6597, - "step": 4434 - }, - { - "epoch": 0.11, - "learning_rate": 1.9635166729185863e-06, - "loss": 0.9248, - "step": 4435 - }, - { - "epoch": 0.11, - "learning_rate": 1.9634944515519625e-06, - "loss": 0.707, - "step": 4436 - }, - { - "epoch": 0.11, - "learning_rate": 1.963472223545891e-06, - "loss": 1.0088, - "step": 4437 - }, - { - "epoch": 0.11, - "learning_rate": 1.963449988900526e-06, - "loss": 0.8848, - "step": 4438 - }, - { - "epoch": 0.11, - "learning_rate": 1.9634277476160188e-06, - "loss": 1.0073, - "step": 4439 - }, - { - "epoch": 0.11, - "learning_rate": 1.963405499692524e-06, - "loss": 1.0625, - "step": 4440 - }, - { - "epoch": 0.11, - "learning_rate": 1.9633832451301947e-06, - "loss": 0.8135, - "step": 4441 - }, - { - "epoch": 0.11, - "learning_rate": 1.963360983929184e-06, - "loss": 0.7588, - "step": 4442 - }, - { - "epoch": 0.11, - "learning_rate": 1.9633387160896455e-06, - "loss": 0.9355, - "step": 4443 - }, - { - "epoch": 0.11, - "learning_rate": 1.963316441611733e-06, - "loss": 0.6941, - "step": 4444 - }, - { - "epoch": 0.11, - "learning_rate": 1.9632941604955993e-06, - "loss": 0.9043, - "step": 4445 - }, - { - "epoch": 0.11, - "learning_rate": 1.9632718727413986e-06, - "loss": 1.0498, - "step": 4446 - }, - { - "epoch": 0.11, - "learning_rate": 1.9632495783492835e-06, - "loss": 0.9453, - "step": 4447 - }, - { - "epoch": 0.11, - "learning_rate": 1.9632272773194088e-06, - "loss": 0.957, - "step": 4448 - }, - { - "epoch": 0.11, - "learning_rate": 1.9632049696519276e-06, - "loss": 0.9434, - "step": 4449 - }, - { - "epoch": 0.11, - "learning_rate": 1.963182655346994e-06, - "loss": 0.7002, - "step": 4450 - }, - { - "epoch": 0.11, - "learning_rate": 1.9631603344047606e-06, - "loss": 0.9961, - "step": 4451 - }, - { - "epoch": 0.11, - "learning_rate": 1.9631380068253827e-06, - "loss": 0.9492, - "step": 4452 - }, - { - "epoch": 0.11, - "learning_rate": 1.9631156726090133e-06, - "loss": 0.793, - "step": 4453 - }, - { - "epoch": 0.11, - "learning_rate": 1.9630933317558066e-06, - "loss": 0.9873, - "step": 4454 - }, - { - "epoch": 0.11, - "learning_rate": 1.9630709842659163e-06, - "loss": 0.9268, - "step": 4455 - }, - { - "epoch": 0.11, - "learning_rate": 1.9630486301394967e-06, - "loss": 1.0215, - "step": 4456 - }, - { - "epoch": 0.11, - "learning_rate": 1.963026269376702e-06, - "loss": 1.002, - "step": 4457 - }, - { - "epoch": 0.11, - "learning_rate": 1.963003901977686e-06, - "loss": 0.9766, - "step": 4458 - }, - { - "epoch": 0.11, - "learning_rate": 1.962981527942602e-06, - "loss": 0.8613, - "step": 4459 - }, - { - "epoch": 0.11, - "learning_rate": 1.962959147271606e-06, - "loss": 0.6514, - "step": 4460 - }, - { - "epoch": 0.11, - "learning_rate": 1.9629367599648505e-06, - "loss": 0.7637, - "step": 4461 - }, - { - "epoch": 0.11, - "learning_rate": 1.962914366022491e-06, - "loss": 1.084, - "step": 4462 - }, - { - "epoch": 0.11, - "learning_rate": 1.962891965444681e-06, - "loss": 0.8633, - "step": 4463 - }, - { - "epoch": 0.11, - "learning_rate": 1.9628695582315756e-06, - "loss": 1.0732, - "step": 4464 - }, - { - "epoch": 0.11, - "learning_rate": 1.962847144383328e-06, - "loss": 0.9131, - "step": 4465 - }, - { - "epoch": 0.11, - "learning_rate": 1.962824723900094e-06, - "loss": 0.9961, - "step": 4466 - }, - { - "epoch": 0.11, - "learning_rate": 1.962802296782028e-06, - "loss": 0.6755, - "step": 4467 - }, - { - "epoch": 0.11, - "learning_rate": 1.9627798630292836e-06, - "loss": 0.8174, - "step": 4468 - }, - { - "epoch": 0.11, - "learning_rate": 1.9627574226420162e-06, - "loss": 0.8286, - "step": 4469 - }, - { - "epoch": 0.11, - "learning_rate": 1.96273497562038e-06, - "loss": 0.9111, - "step": 4470 - }, - { - "epoch": 0.11, - "learning_rate": 1.9627125219645294e-06, - "loss": 0.9121, - "step": 4471 - }, - { - "epoch": 0.11, - "learning_rate": 1.96269006167462e-06, - "loss": 1.0605, - "step": 4472 - }, - { - "epoch": 0.11, - "learning_rate": 1.962667594750806e-06, - "loss": 0.7646, - "step": 4473 - }, - { - "epoch": 0.11, - "learning_rate": 1.9626451211932423e-06, - "loss": 0.998, - "step": 4474 - }, - { - "epoch": 0.11, - "learning_rate": 1.962622641002084e-06, - "loss": 0.9463, - "step": 4475 - }, - { - "epoch": 0.11, - "learning_rate": 1.9626001541774856e-06, - "loss": 0.8877, - "step": 4476 - }, - { - "epoch": 0.11, - "learning_rate": 1.9625776607196023e-06, - "loss": 0.9512, - "step": 4477 - }, - { - "epoch": 0.11, - "learning_rate": 1.9625551606285887e-06, - "loss": 0.877, - "step": 4478 - }, - { - "epoch": 0.11, - "learning_rate": 1.9625326539046007e-06, - "loss": 0.9922, - "step": 4479 - }, - { - "epoch": 0.11, - "learning_rate": 1.9625101405477925e-06, - "loss": 1.1797, - "step": 4480 - }, - { - "epoch": 0.11, - "learning_rate": 1.96248762055832e-06, - "loss": 0.9199, - "step": 4481 - }, - { - "epoch": 0.11, - "learning_rate": 1.962465093936338e-06, - "loss": 0.8574, - "step": 4482 - }, - { - "epoch": 0.11, - "learning_rate": 1.962442560682002e-06, - "loss": 0.8701, - "step": 4483 - }, - { - "epoch": 0.11, - "learning_rate": 1.9624200207954663e-06, - "loss": 1.0703, - "step": 4484 - }, - { - "epoch": 0.11, - "learning_rate": 1.9623974742768874e-06, - "loss": 0.8379, - "step": 4485 - }, - { - "epoch": 0.11, - "learning_rate": 1.9623749211264205e-06, - "loss": 0.957, - "step": 4486 - }, - { - "epoch": 0.12, - "learning_rate": 1.9623523613442206e-06, - "loss": 0.835, - "step": 4487 - }, - { - "epoch": 0.12, - "learning_rate": 1.962329794930443e-06, - "loss": 0.8184, - "step": 4488 - }, - { - "epoch": 0.12, - "learning_rate": 1.962307221885244e-06, - "loss": 0.8652, - "step": 4489 - }, - { - "epoch": 0.12, - "learning_rate": 1.962284642208778e-06, - "loss": 0.9028, - "step": 4490 - }, - { - "epoch": 0.12, - "learning_rate": 1.962262055901202e-06, - "loss": 0.9019, - "step": 4491 - }, - { - "epoch": 0.12, - "learning_rate": 1.9622394629626706e-06, - "loss": 0.9492, - "step": 4492 - }, - { - "epoch": 0.12, - "learning_rate": 1.9622168633933396e-06, - "loss": 0.918, - "step": 4493 - }, - { - "epoch": 0.12, - "learning_rate": 1.9621942571933648e-06, - "loss": 0.8682, - "step": 4494 - }, - { - "epoch": 0.12, - "learning_rate": 1.9621716443629025e-06, - "loss": 0.8271, - "step": 4495 - }, - { - "epoch": 0.12, - "learning_rate": 1.962149024902108e-06, - "loss": 1.0273, - "step": 4496 - }, - { - "epoch": 0.12, - "learning_rate": 1.9621263988111375e-06, - "loss": 1.0195, - "step": 4497 - }, - { - "epoch": 0.12, - "learning_rate": 1.962103766090147e-06, - "loss": 0.9287, - "step": 4498 - }, - { - "epoch": 0.12, - "learning_rate": 1.9620811267392914e-06, - "loss": 0.8516, - "step": 4499 - }, - { - "epoch": 0.12, - "learning_rate": 1.9620584807587276e-06, - "loss": 1.0, - "step": 4500 - }, - { - "epoch": 0.12, - "learning_rate": 1.962035828148612e-06, - "loss": 0.9326, - "step": 4501 - }, - { - "epoch": 0.12, - "learning_rate": 1.9620131689090996e-06, - "loss": 0.7256, - "step": 4502 - }, - { - "epoch": 0.12, - "learning_rate": 1.961990503040348e-06, - "loss": 0.9453, - "step": 4503 - }, - { - "epoch": 0.12, - "learning_rate": 1.961967830542512e-06, - "loss": 1.0264, - "step": 4504 - }, - { - "epoch": 0.12, - "learning_rate": 1.9619451514157485e-06, - "loss": 0.6426, - "step": 4505 - }, - { - "epoch": 0.12, - "learning_rate": 1.9619224656602138e-06, - "loss": 0.9912, - "step": 4506 - }, - { - "epoch": 0.12, - "learning_rate": 1.961899773276064e-06, - "loss": 0.9922, - "step": 4507 - }, - { - "epoch": 0.12, - "learning_rate": 1.9618770742634555e-06, - "loss": 0.7822, - "step": 4508 - }, - { - "epoch": 0.12, - "learning_rate": 1.9618543686225454e-06, - "loss": 0.7827, - "step": 4509 - }, - { - "epoch": 0.12, - "learning_rate": 1.961831656353489e-06, - "loss": 0.958, - "step": 4510 - }, - { - "epoch": 0.12, - "learning_rate": 1.9618089374564433e-06, - "loss": 0.8789, - "step": 4511 - }, - { - "epoch": 0.12, - "learning_rate": 1.9617862119315656e-06, - "loss": 0.999, - "step": 4512 - }, - { - "epoch": 0.12, - "learning_rate": 1.9617634797790113e-06, - "loss": 1.0166, - "step": 4513 - }, - { - "epoch": 0.12, - "learning_rate": 1.961740740998938e-06, - "loss": 0.9014, - "step": 4514 - }, - { - "epoch": 0.12, - "learning_rate": 1.9617179955915017e-06, - "loss": 1.0967, - "step": 4515 - }, - { - "epoch": 0.12, - "learning_rate": 1.9616952435568594e-06, - "loss": 1.0166, - "step": 4516 - }, - { - "epoch": 0.12, - "learning_rate": 1.961672484895168e-06, - "loss": 0.8887, - "step": 4517 - }, - { - "epoch": 0.12, - "learning_rate": 1.961649719606584e-06, - "loss": 1.0703, - "step": 4518 - }, - { - "epoch": 0.12, - "learning_rate": 1.961626947691265e-06, - "loss": 0.9277, - "step": 4519 - }, - { - "epoch": 0.12, - "learning_rate": 1.961604169149367e-06, - "loss": 1.0, - "step": 4520 - }, - { - "epoch": 0.12, - "learning_rate": 1.9615813839810474e-06, - "loss": 1.0, - "step": 4521 - }, - { - "epoch": 0.12, - "learning_rate": 1.9615585921864634e-06, - "loss": 1.0752, - "step": 4522 - }, - { - "epoch": 0.12, - "learning_rate": 1.9615357937657723e-06, - "loss": 0.7461, - "step": 4523 - }, - { - "epoch": 0.12, - "learning_rate": 1.96151298871913e-06, - "loss": 0.7222, - "step": 4524 - }, - { - "epoch": 0.12, - "learning_rate": 1.961490177046695e-06, - "loss": 1.0684, - "step": 4525 - }, - { - "epoch": 0.12, - "learning_rate": 1.9614673587486235e-06, - "loss": 0.9727, - "step": 4526 - }, - { - "epoch": 0.12, - "learning_rate": 1.9614445338250737e-06, - "loss": 0.9453, - "step": 4527 - }, - { - "epoch": 0.12, - "learning_rate": 1.961421702276202e-06, - "loss": 0.8232, - "step": 4528 - }, - { - "epoch": 0.12, - "learning_rate": 1.9613988641021662e-06, - "loss": 1.0752, - "step": 4529 - }, - { - "epoch": 0.12, - "learning_rate": 1.9613760193031234e-06, - "loss": 1.0098, - "step": 4530 - }, - { - "epoch": 0.12, - "learning_rate": 1.9613531678792312e-06, - "loss": 0.8506, - "step": 4531 - }, - { - "epoch": 0.12, - "learning_rate": 1.961330309830647e-06, - "loss": 1.0498, - "step": 4532 - }, - { - "epoch": 0.12, - "learning_rate": 1.9613074451575286e-06, - "loss": 0.8496, - "step": 4533 - }, - { - "epoch": 0.12, - "learning_rate": 1.9612845738600332e-06, - "loss": 0.9551, - "step": 4534 - }, - { - "epoch": 0.12, - "learning_rate": 1.9612616959383188e-06, - "loss": 0.7803, - "step": 4535 - }, - { - "epoch": 0.12, - "learning_rate": 1.961238811392543e-06, - "loss": 0.7969, - "step": 4536 - }, - { - "epoch": 0.12, - "learning_rate": 1.9612159202228625e-06, - "loss": 0.9014, - "step": 4537 - }, - { - "epoch": 0.12, - "learning_rate": 1.9611930224294362e-06, - "loss": 1.0986, - "step": 4538 - }, - { - "epoch": 0.12, - "learning_rate": 1.9611701180124215e-06, - "loss": 1.0234, - "step": 4539 - }, - { - "epoch": 0.12, - "learning_rate": 1.9611472069719763e-06, - "loss": 1.0361, - "step": 4540 - }, - { - "epoch": 0.12, - "learning_rate": 1.9611242893082587e-06, - "loss": 0.9512, - "step": 4541 - }, - { - "epoch": 0.12, - "learning_rate": 1.9611013650214256e-06, - "loss": 0.9189, - "step": 4542 - }, - { - "epoch": 0.12, - "learning_rate": 1.9610784341116365e-06, - "loss": 0.9688, - "step": 4543 - }, - { - "epoch": 0.12, - "learning_rate": 1.9610554965790483e-06, - "loss": 0.9199, - "step": 4544 - }, - { - "epoch": 0.12, - "learning_rate": 1.9610325524238196e-06, - "loss": 0.8848, - "step": 4545 - }, - { - "epoch": 0.12, - "learning_rate": 1.961009601646108e-06, - "loss": 0.998, - "step": 4546 - }, - { - "epoch": 0.12, - "learning_rate": 1.960986644246072e-06, - "loss": 0.4448, - "step": 4547 - }, - { - "epoch": 0.12, - "learning_rate": 1.96096368022387e-06, - "loss": 1.0, - "step": 4548 - }, - { - "epoch": 0.12, - "learning_rate": 1.96094070957966e-06, - "loss": 0.834, - "step": 4549 - }, - { - "epoch": 0.12, - "learning_rate": 1.9609177323136005e-06, - "loss": 1.167, - "step": 4550 - }, - { - "epoch": 0.12, - "learning_rate": 1.9608947484258494e-06, - "loss": 0.918, - "step": 4551 - }, - { - "epoch": 0.12, - "learning_rate": 1.9608717579165655e-06, - "loss": 1.0176, - "step": 4552 - }, - { - "epoch": 0.12, - "learning_rate": 1.9608487607859066e-06, - "loss": 0.8828, - "step": 4553 - }, - { - "epoch": 0.12, - "learning_rate": 1.960825757034032e-06, - "loss": 1.0127, - "step": 4554 - }, - { - "epoch": 0.12, - "learning_rate": 1.9608027466611e-06, - "loss": 0.9287, - "step": 4555 - }, - { - "epoch": 0.12, - "learning_rate": 1.960779729667269e-06, - "loss": 0.9219, - "step": 4556 - }, - { - "epoch": 0.12, - "learning_rate": 1.960756706052697e-06, - "loss": 0.9053, - "step": 4557 - }, - { - "epoch": 0.12, - "learning_rate": 1.960733675817544e-06, - "loss": 0.9766, - "step": 4558 - }, - { - "epoch": 0.12, - "learning_rate": 1.9607106389619672e-06, - "loss": 1.0508, - "step": 4559 - }, - { - "epoch": 0.12, - "learning_rate": 1.960687595486127e-06, - "loss": 0.7871, - "step": 4560 - }, - { - "epoch": 0.12, - "learning_rate": 1.960664545390181e-06, - "loss": 0.8428, - "step": 4561 - }, - { - "epoch": 0.12, - "learning_rate": 1.9606414886742883e-06, - "loss": 1.0293, - "step": 4562 - }, - { - "epoch": 0.12, - "learning_rate": 1.960618425338608e-06, - "loss": 0.9014, - "step": 4563 - }, - { - "epoch": 0.12, - "learning_rate": 1.9605953553832986e-06, - "loss": 0.9375, - "step": 4564 - }, - { - "epoch": 0.12, - "learning_rate": 1.9605722788085196e-06, - "loss": 0.6968, - "step": 4565 - }, - { - "epoch": 0.12, - "learning_rate": 1.9605491956144296e-06, - "loss": 1.0156, - "step": 4566 - }, - { - "epoch": 0.12, - "learning_rate": 1.960526105801188e-06, - "loss": 0.8848, - "step": 4567 - }, - { - "epoch": 0.12, - "learning_rate": 1.9605030093689535e-06, - "loss": 0.8506, - "step": 4568 - }, - { - "epoch": 0.12, - "learning_rate": 1.960479906317886e-06, - "loss": 1.0742, - "step": 4569 - }, - { - "epoch": 0.12, - "learning_rate": 1.9604567966481434e-06, - "loss": 0.8174, - "step": 4570 - }, - { - "epoch": 0.12, - "learning_rate": 1.960433680359886e-06, - "loss": 0.9629, - "step": 4571 - }, - { - "epoch": 0.12, - "learning_rate": 1.9604105574532736e-06, - "loss": 0.9609, - "step": 4572 - }, - { - "epoch": 0.12, - "learning_rate": 1.960387427928464e-06, - "loss": 1.0059, - "step": 4573 - }, - { - "epoch": 0.12, - "learning_rate": 1.9603642917856176e-06, - "loss": 0.9287, - "step": 4574 - }, - { - "epoch": 0.12, - "learning_rate": 1.9603411490248936e-06, - "loss": 1.2695, - "step": 4575 - }, - { - "epoch": 0.12, - "learning_rate": 1.9603179996464516e-06, - "loss": 0.7305, - "step": 4576 - }, - { - "epoch": 0.12, - "learning_rate": 1.960294843650451e-06, - "loss": 0.8643, - "step": 4577 - }, - { - "epoch": 0.12, - "learning_rate": 1.9602716810370515e-06, - "loss": 1.0205, - "step": 4578 - }, - { - "epoch": 0.12, - "learning_rate": 1.9602485118064124e-06, - "loss": 0.96, - "step": 4579 - }, - { - "epoch": 0.12, - "learning_rate": 1.9602253359586935e-06, - "loss": 1.0107, - "step": 4580 - }, - { - "epoch": 0.12, - "learning_rate": 1.9602021534940544e-06, - "loss": 0.9839, - "step": 4581 - }, - { - "epoch": 0.12, - "learning_rate": 1.960178964412655e-06, - "loss": 0.8647, - "step": 4582 - }, - { - "epoch": 0.12, - "learning_rate": 1.9601557687146556e-06, - "loss": 0.8672, - "step": 4583 - }, - { - "epoch": 0.12, - "learning_rate": 1.9601325664002157e-06, - "loss": 1.1592, - "step": 4584 - }, - { - "epoch": 0.12, - "learning_rate": 1.9601093574694943e-06, - "loss": 1.0381, - "step": 4585 - }, - { - "epoch": 0.12, - "learning_rate": 1.9600861419226528e-06, - "loss": 1.2871, - "step": 4586 - }, - { - "epoch": 0.12, - "learning_rate": 1.96006291975985e-06, - "loss": 0.917, - "step": 4587 - }, - { - "epoch": 0.12, - "learning_rate": 1.960039690981246e-06, - "loss": 0.9746, - "step": 4588 - }, - { - "epoch": 0.12, - "learning_rate": 1.960016455587002e-06, - "loss": 0.9868, - "step": 4589 - }, - { - "epoch": 0.12, - "learning_rate": 1.959993213577277e-06, - "loss": 0.8584, - "step": 4590 - }, - { - "epoch": 0.12, - "learning_rate": 1.9599699649522312e-06, - "loss": 1.0684, - "step": 4591 - }, - { - "epoch": 0.12, - "learning_rate": 1.9599467097120256e-06, - "loss": 0.9443, - "step": 4592 - }, - { - "epoch": 0.12, - "learning_rate": 1.9599234478568197e-06, - "loss": 0.7471, - "step": 4593 - }, - { - "epoch": 0.12, - "learning_rate": 1.9599001793867743e-06, - "loss": 0.9893, - "step": 4594 - }, - { - "epoch": 0.12, - "learning_rate": 1.959876904302049e-06, - "loss": 0.7896, - "step": 4595 - }, - { - "epoch": 0.12, - "learning_rate": 1.959853622602805e-06, - "loss": 0.835, - "step": 4596 - }, - { - "epoch": 0.12, - "learning_rate": 1.959830334289203e-06, - "loss": 0.8828, - "step": 4597 - }, - { - "epoch": 0.12, - "learning_rate": 1.959807039361402e-06, - "loss": 0.9775, - "step": 4598 - }, - { - "epoch": 0.12, - "learning_rate": 1.959783737819564e-06, - "loss": 0.8535, - "step": 4599 - }, - { - "epoch": 0.12, - "learning_rate": 1.959760429663849e-06, - "loss": 0.9766, - "step": 4600 - }, - { - "epoch": 0.12, - "learning_rate": 1.9597371148944175e-06, - "loss": 0.8906, - "step": 4601 - }, - { - "epoch": 0.12, - "learning_rate": 1.9597137935114305e-06, - "loss": 0.9326, - "step": 4602 - }, - { - "epoch": 0.12, - "learning_rate": 1.9596904655150482e-06, - "loss": 0.9297, - "step": 4603 - }, - { - "epoch": 0.12, - "learning_rate": 1.9596671309054317e-06, - "loss": 0.9971, - "step": 4604 - }, - { - "epoch": 0.12, - "learning_rate": 1.9596437896827418e-06, - "loss": 1.1973, - "step": 4605 - }, - { - "epoch": 0.12, - "learning_rate": 1.9596204418471394e-06, - "loss": 0.959, - "step": 4606 - }, - { - "epoch": 0.12, - "learning_rate": 1.959597087398785e-06, - "loss": 1.2051, - "step": 4607 - }, - { - "epoch": 0.12, - "learning_rate": 1.9595737263378404e-06, - "loss": 1.1426, - "step": 4608 - }, - { - "epoch": 0.12, - "learning_rate": 1.959550358664465e-06, - "loss": 0.8188, - "step": 4609 - }, - { - "epoch": 0.12, - "learning_rate": 1.9595269843788216e-06, - "loss": 1.0508, - "step": 4610 - }, - { - "epoch": 0.12, - "learning_rate": 1.9595036034810708e-06, - "loss": 1.0742, - "step": 4611 - }, - { - "epoch": 0.12, - "learning_rate": 1.9594802159713727e-06, - "loss": 1.0391, - "step": 4612 - }, - { - "epoch": 0.12, - "learning_rate": 1.959456821849889e-06, - "loss": 0.9619, - "step": 4613 - }, - { - "epoch": 0.12, - "learning_rate": 1.959433421116782e-06, - "loss": 1.001, - "step": 4614 - }, - { - "epoch": 0.12, - "learning_rate": 1.959410013772211e-06, - "loss": 0.8486, - "step": 4615 - }, - { - "epoch": 0.12, - "learning_rate": 1.9593865998163395e-06, - "loss": 0.9424, - "step": 4616 - }, - { - "epoch": 0.12, - "learning_rate": 1.959363179249327e-06, - "loss": 0.9287, - "step": 4617 - }, - { - "epoch": 0.12, - "learning_rate": 1.9593397520713357e-06, - "loss": 0.8184, - "step": 4618 - }, - { - "epoch": 0.12, - "learning_rate": 1.959316318282527e-06, - "loss": 0.9648, - "step": 4619 - }, - { - "epoch": 0.12, - "learning_rate": 1.9592928778830623e-06, - "loss": 0.998, - "step": 4620 - }, - { - "epoch": 0.12, - "learning_rate": 1.9592694308731032e-06, - "loss": 0.6064, - "step": 4621 - }, - { - "epoch": 0.12, - "learning_rate": 1.959245977252811e-06, - "loss": 0.9189, - "step": 4622 - }, - { - "epoch": 0.12, - "learning_rate": 1.9592225170223473e-06, - "loss": 0.6179, - "step": 4623 - }, - { - "epoch": 0.12, - "learning_rate": 1.9591990501818745e-06, - "loss": 0.8438, - "step": 4624 - }, - { - "epoch": 0.12, - "learning_rate": 1.9591755767315537e-06, - "loss": 1.1123, - "step": 4625 - }, - { - "epoch": 0.12, - "learning_rate": 1.959152096671547e-06, - "loss": 0.9131, - "step": 4626 - }, - { - "epoch": 0.12, - "learning_rate": 1.9591286100020153e-06, - "loss": 0.8779, - "step": 4627 - }, - { - "epoch": 0.12, - "learning_rate": 1.9591051167231213e-06, - "loss": 0.9531, - "step": 4628 - }, - { - "epoch": 0.12, - "learning_rate": 1.959081616835027e-06, - "loss": 0.8369, - "step": 4629 - }, - { - "epoch": 0.12, - "learning_rate": 1.9590581103378936e-06, - "loss": 0.8218, - "step": 4630 - }, - { - "epoch": 0.12, - "learning_rate": 1.959034597231884e-06, - "loss": 0.7534, - "step": 4631 - }, - { - "epoch": 0.12, - "learning_rate": 1.9590110775171594e-06, - "loss": 0.9355, - "step": 4632 - }, - { - "epoch": 0.12, - "learning_rate": 1.958987551193882e-06, - "loss": 0.9912, - "step": 4633 - }, - { - "epoch": 0.12, - "learning_rate": 1.9589640182622146e-06, - "loss": 0.9355, - "step": 4634 - }, - { - "epoch": 0.12, - "learning_rate": 1.958940478722319e-06, - "loss": 1.002, - "step": 4635 - }, - { - "epoch": 0.12, - "learning_rate": 1.958916932574357e-06, - "loss": 0.9697, - "step": 4636 - }, - { - "epoch": 0.12, - "learning_rate": 1.958893379818491e-06, - "loss": 0.9014, - "step": 4637 - }, - { - "epoch": 0.12, - "learning_rate": 1.958869820454884e-06, - "loss": 1.0049, - "step": 4638 - }, - { - "epoch": 0.12, - "learning_rate": 1.9588462544836974e-06, - "loss": 1.082, - "step": 4639 - }, - { - "epoch": 0.12, - "learning_rate": 1.9588226819050943e-06, - "loss": 1.0547, - "step": 4640 - }, - { - "epoch": 0.12, - "learning_rate": 1.9587991027192365e-06, - "loss": 0.6802, - "step": 4641 - }, - { - "epoch": 0.12, - "learning_rate": 1.958775516926287e-06, - "loss": 0.8682, - "step": 4642 - }, - { - "epoch": 0.12, - "learning_rate": 1.9587519245264084e-06, - "loss": 1.0996, - "step": 4643 - }, - { - "epoch": 0.12, - "learning_rate": 1.958728325519763e-06, - "loss": 0.8994, - "step": 4644 - }, - { - "epoch": 0.12, - "learning_rate": 1.9587047199065136e-06, - "loss": 0.9009, - "step": 4645 - }, - { - "epoch": 0.12, - "learning_rate": 1.9586811076868223e-06, - "loss": 0.7886, - "step": 4646 - }, - { - "epoch": 0.12, - "learning_rate": 1.9586574888608522e-06, - "loss": 1.1826, - "step": 4647 - }, - { - "epoch": 0.12, - "learning_rate": 1.9586338634287663e-06, - "loss": 0.999, - "step": 4648 - }, - { - "epoch": 0.12, - "learning_rate": 1.9586102313907275e-06, - "loss": 0.8564, - "step": 4649 - }, - { - "epoch": 0.12, - "learning_rate": 1.9585865927468982e-06, - "loss": 1.0635, - "step": 4650 - }, - { - "epoch": 0.12, - "learning_rate": 1.9585629474974414e-06, - "loss": 0.7344, - "step": 4651 - }, - { - "epoch": 0.12, - "learning_rate": 1.9585392956425197e-06, - "loss": 0.9814, - "step": 4652 - }, - { - "epoch": 0.12, - "learning_rate": 1.958515637182297e-06, - "loss": 0.8462, - "step": 4653 - }, - { - "epoch": 0.12, - "learning_rate": 1.9584919721169355e-06, - "loss": 0.8906, - "step": 4654 - }, - { - "epoch": 0.12, - "learning_rate": 1.9584683004465987e-06, - "loss": 1.1426, - "step": 4655 - }, - { - "epoch": 0.12, - "learning_rate": 1.9584446221714497e-06, - "loss": 1.0361, - "step": 4656 - }, - { - "epoch": 0.12, - "learning_rate": 1.9584209372916514e-06, - "loss": 0.8989, - "step": 4657 - }, - { - "epoch": 0.12, - "learning_rate": 1.958397245807367e-06, - "loss": 1.0293, - "step": 4658 - }, - { - "epoch": 0.12, - "learning_rate": 1.9583735477187604e-06, - "loss": 0.6797, - "step": 4659 - }, - { - "epoch": 0.12, - "learning_rate": 1.958349843025994e-06, - "loss": 0.9639, - "step": 4660 - }, - { - "epoch": 0.12, - "learning_rate": 1.958326131729232e-06, - "loss": 0.8169, - "step": 4661 - }, - { - "epoch": 0.12, - "learning_rate": 1.9583024138286372e-06, - "loss": 0.9238, - "step": 4662 - }, - { - "epoch": 0.12, - "learning_rate": 1.9582786893243734e-06, - "loss": 0.8262, - "step": 4663 - }, - { - "epoch": 0.12, - "learning_rate": 1.9582549582166035e-06, - "loss": 1.0879, - "step": 4664 - }, - { - "epoch": 0.12, - "learning_rate": 1.958231220505492e-06, - "loss": 1.0332, - "step": 4665 - }, - { - "epoch": 0.12, - "learning_rate": 1.9582074761912013e-06, - "loss": 0.875, - "step": 4666 - }, - { - "epoch": 0.12, - "learning_rate": 1.958183725273896e-06, - "loss": 0.583, - "step": 4667 - }, - { - "epoch": 0.12, - "learning_rate": 1.9581599677537394e-06, - "loss": 1.0625, - "step": 4668 - }, - { - "epoch": 0.12, - "learning_rate": 1.958136203630895e-06, - "loss": 1.1504, - "step": 4669 - }, - { - "epoch": 0.12, - "learning_rate": 1.958112432905527e-06, - "loss": 0.9893, - "step": 4670 - }, - { - "epoch": 0.12, - "learning_rate": 1.9580886555777993e-06, - "loss": 0.9219, - "step": 4671 - }, - { - "epoch": 0.12, - "learning_rate": 1.958064871647875e-06, - "loss": 1.0254, - "step": 4672 - }, - { - "epoch": 0.12, - "learning_rate": 1.9580410811159186e-06, - "loss": 0.7803, - "step": 4673 - }, - { - "epoch": 0.12, - "learning_rate": 1.9580172839820935e-06, - "loss": 0.9102, - "step": 4674 - }, - { - "epoch": 0.12, - "learning_rate": 1.9579934802465647e-06, - "loss": 0.9814, - "step": 4675 - }, - { - "epoch": 0.12, - "learning_rate": 1.9579696699094954e-06, - "loss": 0.8037, - "step": 4676 - }, - { - "epoch": 0.12, - "learning_rate": 1.9579458529710494e-06, - "loss": 0.7871, - "step": 4677 - }, - { - "epoch": 0.12, - "learning_rate": 1.9579220294313914e-06, - "loss": 0.8799, - "step": 4678 - }, - { - "epoch": 0.12, - "learning_rate": 1.957898199290686e-06, - "loss": 0.7114, - "step": 4679 - }, - { - "epoch": 0.12, - "learning_rate": 1.957874362549096e-06, - "loss": 0.915, - "step": 4680 - }, - { - "epoch": 0.12, - "learning_rate": 1.9578505192067875e-06, - "loss": 0.8535, - "step": 4681 - }, - { - "epoch": 0.12, - "learning_rate": 1.9578266692639234e-06, - "loss": 1.1543, - "step": 4682 - }, - { - "epoch": 0.12, - "learning_rate": 1.9578028127206685e-06, - "loss": 0.8857, - "step": 4683 - }, - { - "epoch": 0.12, - "learning_rate": 1.957778949577187e-06, - "loss": 0.7671, - "step": 4684 - }, - { - "epoch": 0.12, - "learning_rate": 1.957755079833644e-06, - "loss": 0.9873, - "step": 4685 - }, - { - "epoch": 0.12, - "learning_rate": 1.957731203490203e-06, - "loss": 1.0654, - "step": 4686 - }, - { - "epoch": 0.12, - "learning_rate": 1.9577073205470293e-06, - "loss": 0.9287, - "step": 4687 - }, - { - "epoch": 0.12, - "learning_rate": 1.9576834310042873e-06, - "loss": 0.8613, - "step": 4688 - }, - { - "epoch": 0.12, - "learning_rate": 1.9576595348621413e-06, - "loss": 1.1543, - "step": 4689 - }, - { - "epoch": 0.12, - "learning_rate": 1.957635632120756e-06, - "loss": 0.8032, - "step": 4690 - }, - { - "epoch": 0.12, - "learning_rate": 1.957611722780297e-06, - "loss": 1.1348, - "step": 4691 - }, - { - "epoch": 0.12, - "learning_rate": 1.957587806840928e-06, - "loss": 1.1133, - "step": 4692 - }, - { - "epoch": 0.12, - "learning_rate": 1.9575638843028142e-06, - "loss": 0.7556, - "step": 4693 - }, - { - "epoch": 0.12, - "learning_rate": 1.9575399551661206e-06, - "loss": 1.0049, - "step": 4694 - }, - { - "epoch": 0.12, - "learning_rate": 1.9575160194310115e-06, - "loss": 0.7139, - "step": 4695 - }, - { - "epoch": 0.12, - "learning_rate": 1.957492077097653e-06, - "loss": 0.7769, - "step": 4696 - }, - { - "epoch": 0.12, - "learning_rate": 1.9574681281662085e-06, - "loss": 1.1074, - "step": 4697 - }, - { - "epoch": 0.12, - "learning_rate": 1.9574441726368445e-06, - "loss": 0.9717, - "step": 4698 - }, - { - "epoch": 0.12, - "learning_rate": 1.9574202105097253e-06, - "loss": 0.9502, - "step": 4699 - }, - { - "epoch": 0.12, - "learning_rate": 1.957396241785016e-06, - "loss": 0.918, - "step": 4700 - }, - { - "epoch": 0.12, - "learning_rate": 1.9573722664628824e-06, - "loss": 0.8145, - "step": 4701 - }, - { - "epoch": 0.12, - "learning_rate": 1.957348284543489e-06, - "loss": 1.0107, - "step": 4702 - }, - { - "epoch": 0.12, - "learning_rate": 1.9573242960270012e-06, - "loss": 0.8828, - "step": 4703 - }, - { - "epoch": 0.12, - "learning_rate": 1.957300300913585e-06, - "loss": 1.0674, - "step": 4704 - }, - { - "epoch": 0.12, - "learning_rate": 1.9572762992034048e-06, - "loss": 0.6616, - "step": 4705 - }, - { - "epoch": 0.12, - "learning_rate": 1.957252290896626e-06, - "loss": 1.1553, - "step": 4706 - }, - { - "epoch": 0.12, - "learning_rate": 1.9572282759934153e-06, - "loss": 0.9678, - "step": 4707 - }, - { - "epoch": 0.12, - "learning_rate": 1.9572042544939367e-06, - "loss": 0.9834, - "step": 4708 - }, - { - "epoch": 0.12, - "learning_rate": 1.9571802263983568e-06, - "loss": 0.9922, - "step": 4709 - }, - { - "epoch": 0.12, - "learning_rate": 1.9571561917068406e-06, - "loss": 1.0732, - "step": 4710 - }, - { - "epoch": 0.12, - "learning_rate": 1.9571321504195534e-06, - "loss": 0.9922, - "step": 4711 - }, - { - "epoch": 0.12, - "learning_rate": 1.9571081025366617e-06, - "loss": 0.9248, - "step": 4712 - }, - { - "epoch": 0.12, - "learning_rate": 1.9570840480583305e-06, - "loss": 1.0625, - "step": 4713 - }, - { - "epoch": 0.12, - "learning_rate": 1.9570599869847264e-06, - "loss": 0.6919, - "step": 4714 - }, - { - "epoch": 0.12, - "learning_rate": 1.9570359193160145e-06, - "loss": 0.8511, - "step": 4715 - }, - { - "epoch": 0.12, - "learning_rate": 1.9570118450523608e-06, - "loss": 1.1348, - "step": 4716 - }, - { - "epoch": 0.12, - "learning_rate": 1.9569877641939313e-06, - "loss": 0.959, - "step": 4717 - }, - { - "epoch": 0.12, - "learning_rate": 1.9569636767408917e-06, - "loss": 0.9609, - "step": 4718 - }, - { - "epoch": 0.12, - "learning_rate": 1.9569395826934083e-06, - "loss": 0.917, - "step": 4719 - }, - { - "epoch": 0.12, - "learning_rate": 1.956915482051647e-06, - "loss": 1.1621, - "step": 4720 - }, - { - "epoch": 0.12, - "learning_rate": 1.956891374815774e-06, - "loss": 0.9238, - "step": 4721 - }, - { - "epoch": 0.12, - "learning_rate": 1.9568672609859553e-06, - "loss": 0.9062, - "step": 4722 - }, - { - "epoch": 0.12, - "learning_rate": 1.956843140562357e-06, - "loss": 1.0615, - "step": 4723 - }, - { - "epoch": 0.12, - "learning_rate": 1.956819013545145e-06, - "loss": 0.8062, - "step": 4724 - }, - { - "epoch": 0.12, - "learning_rate": 1.9567948799344868e-06, - "loss": 0.8086, - "step": 4725 - }, - { - "epoch": 0.12, - "learning_rate": 1.956770739730547e-06, - "loss": 0.7227, - "step": 4726 - }, - { - "epoch": 0.12, - "learning_rate": 1.9567465929334933e-06, - "loss": 0.8799, - "step": 4727 - }, - { - "epoch": 0.12, - "learning_rate": 1.9567224395434915e-06, - "loss": 1.0381, - "step": 4728 - }, - { - "epoch": 0.12, - "learning_rate": 1.956698279560708e-06, - "loss": 1.0557, - "step": 4729 - }, - { - "epoch": 0.12, - "learning_rate": 1.9566741129853098e-06, - "loss": 1.0244, - "step": 4730 - }, - { - "epoch": 0.12, - "learning_rate": 1.956649939817463e-06, - "loss": 1.0986, - "step": 4731 - }, - { - "epoch": 0.12, - "learning_rate": 1.956625760057334e-06, - "loss": 0.6719, - "step": 4732 - }, - { - "epoch": 0.12, - "learning_rate": 1.9566015737050894e-06, - "loss": 0.8057, - "step": 4733 - }, - { - "epoch": 0.12, - "learning_rate": 1.9565773807608966e-06, - "loss": 0.8848, - "step": 4734 - }, - { - "epoch": 0.12, - "learning_rate": 1.9565531812249215e-06, - "loss": 1.1465, - "step": 4735 - }, - { - "epoch": 0.12, - "learning_rate": 1.9565289750973317e-06, - "loss": 0.9331, - "step": 4736 - }, - { - "epoch": 0.12, - "learning_rate": 1.956504762378293e-06, - "loss": 0.8955, - "step": 4737 - }, - { - "epoch": 0.12, - "learning_rate": 1.956480543067973e-06, - "loss": 0.9248, - "step": 4738 - }, - { - "epoch": 0.12, - "learning_rate": 1.9564563171665386e-06, - "loss": 0.7402, - "step": 4739 - }, - { - "epoch": 0.12, - "learning_rate": 1.956432084674156e-06, - "loss": 0.9512, - "step": 4740 - }, - { - "epoch": 0.12, - "learning_rate": 1.956407845590993e-06, - "loss": 1.0938, - "step": 4741 - }, - { - "epoch": 0.12, - "learning_rate": 1.9563835999172163e-06, - "loss": 1.0098, - "step": 4742 - }, - { - "epoch": 0.12, - "learning_rate": 1.956359347652993e-06, - "loss": 1.0762, - "step": 4743 - }, - { - "epoch": 0.12, - "learning_rate": 1.95633508879849e-06, - "loss": 1.0986, - "step": 4744 - }, - { - "epoch": 0.12, - "learning_rate": 1.9563108233538745e-06, - "loss": 1.0938, - "step": 4745 - }, - { - "epoch": 0.12, - "learning_rate": 1.9562865513193143e-06, - "loss": 0.917, - "step": 4746 - }, - { - "epoch": 0.12, - "learning_rate": 1.956262272694976e-06, - "loss": 1.0586, - "step": 4747 - }, - { - "epoch": 0.12, - "learning_rate": 1.9562379874810273e-06, - "loss": 0.9238, - "step": 4748 - }, - { - "epoch": 0.12, - "learning_rate": 1.9562136956776355e-06, - "loss": 0.9365, - "step": 4749 - }, - { - "epoch": 0.12, - "learning_rate": 1.9561893972849677e-06, - "loss": 0.9438, - "step": 4750 - }, - { - "epoch": 0.12, - "learning_rate": 1.9561650923031916e-06, - "loss": 0.9053, - "step": 4751 - }, - { - "epoch": 0.12, - "learning_rate": 1.9561407807324746e-06, - "loss": 0.9023, - "step": 4752 - }, - { - "epoch": 0.12, - "learning_rate": 1.9561164625729843e-06, - "loss": 0.7988, - "step": 4753 - }, - { - "epoch": 0.12, - "learning_rate": 1.9560921378248885e-06, - "loss": 0.9229, - "step": 4754 - }, - { - "epoch": 0.12, - "learning_rate": 1.9560678064883544e-06, - "loss": 0.8467, - "step": 4755 - }, - { - "epoch": 0.12, - "learning_rate": 1.9560434685635494e-06, - "loss": 0.9932, - "step": 4756 - }, - { - "epoch": 0.12, - "learning_rate": 1.956019124050642e-06, - "loss": 1.1113, - "step": 4757 - }, - { - "epoch": 0.12, - "learning_rate": 1.9559947729497997e-06, - "loss": 0.8516, - "step": 4758 - }, - { - "epoch": 0.12, - "learning_rate": 1.95597041526119e-06, - "loss": 1.0107, - "step": 4759 - }, - { - "epoch": 0.12, - "learning_rate": 1.955946050984981e-06, - "loss": 0.7876, - "step": 4760 - }, - { - "epoch": 0.12, - "learning_rate": 1.9559216801213405e-06, - "loss": 1.0537, - "step": 4761 - }, - { - "epoch": 0.12, - "learning_rate": 1.9558973026704367e-06, - "loss": 0.9014, - "step": 4762 - }, - { - "epoch": 0.12, - "learning_rate": 1.955872918632437e-06, - "loss": 0.7114, - "step": 4763 - }, - { - "epoch": 0.12, - "learning_rate": 1.95584852800751e-06, - "loss": 0.9658, - "step": 4764 - }, - { - "epoch": 0.12, - "learning_rate": 1.9558241307958235e-06, - "loss": 0.7617, - "step": 4765 - }, - { - "epoch": 0.12, - "learning_rate": 1.955799726997546e-06, - "loss": 1.0488, - "step": 4766 - }, - { - "epoch": 0.12, - "learning_rate": 1.955775316612845e-06, - "loss": 1.0801, - "step": 4767 - }, - { - "epoch": 0.12, - "learning_rate": 1.955750899641889e-06, - "loss": 1.0605, - "step": 4768 - }, - { - "epoch": 0.12, - "learning_rate": 1.9557264760848465e-06, - "loss": 1.332, - "step": 4769 - }, - { - "epoch": 0.12, - "learning_rate": 1.9557020459418857e-06, - "loss": 0.915, - "step": 4770 - }, - { - "epoch": 0.12, - "learning_rate": 1.955677609213175e-06, - "loss": 0.9707, - "step": 4771 - }, - { - "epoch": 0.12, - "learning_rate": 1.9556531658988824e-06, - "loss": 0.7236, - "step": 4772 - }, - { - "epoch": 0.12, - "learning_rate": 1.9556287159991766e-06, - "loss": 0.6362, - "step": 4773 - }, - { - "epoch": 0.12, - "learning_rate": 1.9556042595142263e-06, - "loss": 0.9648, - "step": 4774 - }, - { - "epoch": 0.12, - "learning_rate": 1.9555797964442e-06, - "loss": 0.9248, - "step": 4775 - }, - { - "epoch": 0.12, - "learning_rate": 1.9555553267892656e-06, - "loss": 0.876, - "step": 4776 - }, - { - "epoch": 0.12, - "learning_rate": 1.9555308505495923e-06, - "loss": 0.9043, - "step": 4777 - }, - { - "epoch": 0.12, - "learning_rate": 1.955506367725349e-06, - "loss": 1.083, - "step": 4778 - }, - { - "epoch": 0.12, - "learning_rate": 1.9554818783167038e-06, - "loss": 1.0527, - "step": 4779 - }, - { - "epoch": 0.12, - "learning_rate": 1.955457382323826e-06, - "loss": 1.0234, - "step": 4780 - }, - { - "epoch": 0.12, - "learning_rate": 1.9554328797468843e-06, - "loss": 0.9131, - "step": 4781 - }, - { - "epoch": 0.12, - "learning_rate": 1.9554083705860473e-06, - "loss": 0.8047, - "step": 4782 - }, - { - "epoch": 0.12, - "learning_rate": 1.9553838548414836e-06, - "loss": 0.9053, - "step": 4783 - }, - { - "epoch": 0.12, - "learning_rate": 1.955359332513363e-06, - "loss": 1.124, - "step": 4784 - }, - { - "epoch": 0.12, - "learning_rate": 1.955334803601854e-06, - "loss": 0.8135, - "step": 4785 - }, - { - "epoch": 0.12, - "learning_rate": 1.9553102681071257e-06, - "loss": 0.9951, - "step": 4786 - }, - { - "epoch": 0.12, - "learning_rate": 1.9552857260293466e-06, - "loss": 0.8604, - "step": 4787 - }, - { - "epoch": 0.12, - "learning_rate": 1.955261177368687e-06, - "loss": 1.042, - "step": 4788 - }, - { - "epoch": 0.12, - "learning_rate": 1.9552366221253147e-06, - "loss": 1.0703, - "step": 4789 - }, - { - "epoch": 0.12, - "learning_rate": 1.9552120602994004e-06, - "loss": 0.8887, - "step": 4790 - }, - { - "epoch": 0.12, - "learning_rate": 1.955187491891112e-06, - "loss": 0.9756, - "step": 4791 - }, - { - "epoch": 0.12, - "learning_rate": 1.9551629169006197e-06, - "loss": 0.9824, - "step": 4792 - }, - { - "epoch": 0.12, - "learning_rate": 1.9551383353280922e-06, - "loss": 1.0107, - "step": 4793 - }, - { - "epoch": 0.12, - "learning_rate": 1.9551137471736995e-06, - "loss": 1.0557, - "step": 4794 - }, - { - "epoch": 0.12, - "learning_rate": 1.955089152437611e-06, - "loss": 0.7991, - "step": 4795 - }, - { - "epoch": 0.12, - "learning_rate": 1.9550645511199953e-06, - "loss": 1.1338, - "step": 4796 - }, - { - "epoch": 0.12, - "learning_rate": 1.9550399432210227e-06, - "loss": 0.9893, - "step": 4797 - }, - { - "epoch": 0.12, - "learning_rate": 1.955015328740863e-06, - "loss": 0.8052, - "step": 4798 - }, - { - "epoch": 0.12, - "learning_rate": 1.9549907076796853e-06, - "loss": 0.7949, - "step": 4799 - }, - { - "epoch": 0.12, - "learning_rate": 1.954966080037659e-06, - "loss": 0.9951, - "step": 4800 - }, - { - "epoch": 0.12, - "learning_rate": 1.954941445814955e-06, - "loss": 0.9209, - "step": 4801 - }, - { - "epoch": 0.12, - "learning_rate": 1.954916805011742e-06, - "loss": 1.0576, - "step": 4802 - }, - { - "epoch": 0.12, - "learning_rate": 1.9548921576281896e-06, - "loss": 0.6929, - "step": 4803 - }, - { - "epoch": 0.12, - "learning_rate": 1.954867503664469e-06, - "loss": 1.0703, - "step": 4804 - }, - { - "epoch": 0.12, - "learning_rate": 1.9548428431207483e-06, - "loss": 0.8975, - "step": 4805 - }, - { - "epoch": 0.12, - "learning_rate": 1.954818175997199e-06, - "loss": 0.8262, - "step": 4806 - }, - { - "epoch": 0.12, - "learning_rate": 1.95479350229399e-06, - "loss": 0.8262, - "step": 4807 - }, - { - "epoch": 0.12, - "learning_rate": 1.9547688220112923e-06, - "loss": 1.0352, - "step": 4808 - }, - { - "epoch": 0.12, - "learning_rate": 1.954744135149275e-06, - "loss": 0.9238, - "step": 4809 - }, - { - "epoch": 0.12, - "learning_rate": 1.9547194417081088e-06, - "loss": 0.7949, - "step": 4810 - }, - { - "epoch": 0.12, - "learning_rate": 1.9546947416879635e-06, - "loss": 0.9805, - "step": 4811 - }, - { - "epoch": 0.12, - "learning_rate": 1.9546700350890095e-06, - "loss": 1.0635, - "step": 4812 - }, - { - "epoch": 0.12, - "learning_rate": 1.9546453219114175e-06, - "loss": 1.0527, - "step": 4813 - }, - { - "epoch": 0.12, - "learning_rate": 1.954620602155357e-06, - "loss": 1.0352, - "step": 4814 - }, - { - "epoch": 0.12, - "learning_rate": 1.9545958758209992e-06, - "loss": 0.8496, - "step": 4815 - }, - { - "epoch": 0.12, - "learning_rate": 1.9545711429085136e-06, - "loss": 0.6333, - "step": 4816 - }, - { - "epoch": 0.12, - "learning_rate": 1.954546403418071e-06, - "loss": 0.9424, - "step": 4817 - }, - { - "epoch": 0.12, - "learning_rate": 1.954521657349842e-06, - "loss": 0.8101, - "step": 4818 - }, - { - "epoch": 0.12, - "learning_rate": 1.9544969047039973e-06, - "loss": 1.1484, - "step": 4819 - }, - { - "epoch": 0.12, - "learning_rate": 1.954472145480707e-06, - "loss": 1.0176, - "step": 4820 - }, - { - "epoch": 0.12, - "learning_rate": 1.954447379680142e-06, - "loss": 1.0684, - "step": 4821 - }, - { - "epoch": 0.12, - "learning_rate": 1.9544226073024727e-06, - "loss": 0.9951, - "step": 4822 - }, - { - "epoch": 0.12, - "learning_rate": 1.9543978283478705e-06, - "loss": 0.8633, - "step": 4823 - }, - { - "epoch": 0.12, - "learning_rate": 1.954373042816505e-06, - "loss": 0.916, - "step": 4824 - }, - { - "epoch": 0.12, - "learning_rate": 1.954348250708548e-06, - "loss": 0.9805, - "step": 4825 - }, - { - "epoch": 0.12, - "learning_rate": 1.95432345202417e-06, - "loss": 1.0361, - "step": 4826 - }, - { - "epoch": 0.12, - "learning_rate": 1.954298646763542e-06, - "loss": 1.0293, - "step": 4827 - }, - { - "epoch": 0.12, - "learning_rate": 1.9542738349268343e-06, - "loss": 1.0889, - "step": 4828 - }, - { - "epoch": 0.12, - "learning_rate": 1.954249016514219e-06, - "loss": 0.9961, - "step": 4829 - }, - { - "epoch": 0.12, - "learning_rate": 1.954224191525866e-06, - "loss": 0.8555, - "step": 4830 - }, - { - "epoch": 0.12, - "learning_rate": 1.954199359961947e-06, - "loss": 1.0273, - "step": 4831 - }, - { - "epoch": 0.12, - "learning_rate": 1.9541745218226334e-06, - "loss": 0.873, - "step": 4832 - }, - { - "epoch": 0.12, - "learning_rate": 1.954149677108096e-06, - "loss": 0.8945, - "step": 4833 - }, - { - "epoch": 0.12, - "learning_rate": 1.9541248258185055e-06, - "loss": 0.8555, - "step": 4834 - }, - { - "epoch": 0.12, - "learning_rate": 1.954099967954034e-06, - "loss": 1.0723, - "step": 4835 - }, - { - "epoch": 0.12, - "learning_rate": 1.954075103514852e-06, - "loss": 0.9971, - "step": 4836 - }, - { - "epoch": 0.12, - "learning_rate": 1.9540502325011317e-06, - "loss": 0.8037, - "step": 4837 - }, - { - "epoch": 0.12, - "learning_rate": 1.9540253549130436e-06, - "loss": 0.8809, - "step": 4838 - }, - { - "epoch": 0.12, - "learning_rate": 1.9540004707507597e-06, - "loss": 0.9277, - "step": 4839 - }, - { - "epoch": 0.12, - "learning_rate": 1.953975580014452e-06, - "loss": 0.8271, - "step": 4840 - }, - { - "epoch": 0.12, - "learning_rate": 1.9539506827042904e-06, - "loss": 0.6279, - "step": 4841 - }, - { - "epoch": 0.12, - "learning_rate": 1.953925778820448e-06, - "loss": 0.9736, - "step": 4842 - }, - { - "epoch": 0.12, - "learning_rate": 1.9539008683630957e-06, - "loss": 1.0596, - "step": 4843 - }, - { - "epoch": 0.12, - "learning_rate": 1.953875951332405e-06, - "loss": 1.0557, - "step": 4844 - }, - { - "epoch": 0.12, - "learning_rate": 1.9538510277285487e-06, - "loss": 0.9365, - "step": 4845 - }, - { - "epoch": 0.12, - "learning_rate": 1.953826097551697e-06, - "loss": 0.7783, - "step": 4846 - }, - { - "epoch": 0.12, - "learning_rate": 1.9538011608020227e-06, - "loss": 1.1475, - "step": 4847 - }, - { - "epoch": 0.12, - "learning_rate": 1.9537762174796975e-06, - "loss": 0.7998, - "step": 4848 - }, - { - "epoch": 0.12, - "learning_rate": 1.953751267584893e-06, - "loss": 0.8745, - "step": 4849 - }, - { - "epoch": 0.12, - "learning_rate": 1.9537263111177815e-06, - "loss": 1.0049, - "step": 4850 - }, - { - "epoch": 0.12, - "learning_rate": 1.9537013480785346e-06, - "loss": 0.7881, - "step": 4851 - }, - { - "epoch": 0.12, - "learning_rate": 1.9536763784673247e-06, - "loss": 0.6265, - "step": 4852 - }, - { - "epoch": 0.12, - "learning_rate": 1.9536514022843237e-06, - "loss": 0.9121, - "step": 4853 - }, - { - "epoch": 0.12, - "learning_rate": 1.9536264195297035e-06, - "loss": 0.916, - "step": 4854 - }, - { - "epoch": 0.12, - "learning_rate": 1.9536014302036366e-06, - "loss": 0.832, - "step": 4855 - }, - { - "epoch": 0.12, - "learning_rate": 1.953576434306295e-06, - "loss": 1.0371, - "step": 4856 - }, - { - "epoch": 0.12, - "learning_rate": 1.9535514318378506e-06, - "loss": 0.7466, - "step": 4857 - }, - { - "epoch": 0.12, - "learning_rate": 1.9535264227984767e-06, - "loss": 0.9502, - "step": 4858 - }, - { - "epoch": 0.12, - "learning_rate": 1.9535014071883447e-06, - "loss": 0.8115, - "step": 4859 - }, - { - "epoch": 0.12, - "learning_rate": 1.9534763850076273e-06, - "loss": 0.9243, - "step": 4860 - }, - { - "epoch": 0.12, - "learning_rate": 1.953451356256497e-06, - "loss": 0.9844, - "step": 4861 - }, - { - "epoch": 0.12, - "learning_rate": 1.9534263209351265e-06, - "loss": 0.9971, - "step": 4862 - }, - { - "epoch": 0.12, - "learning_rate": 1.9534012790436877e-06, - "loss": 0.9541, - "step": 4863 - }, - { - "epoch": 0.12, - "learning_rate": 1.953376230582353e-06, - "loss": 0.7859, - "step": 4864 - }, - { - "epoch": 0.12, - "learning_rate": 1.9533511755512963e-06, - "loss": 1.0, - "step": 4865 - }, - { - "epoch": 0.12, - "learning_rate": 1.9533261139506888e-06, - "loss": 1.1523, - "step": 4866 - }, - { - "epoch": 0.12, - "learning_rate": 1.9533010457807046e-06, - "loss": 1.0869, - "step": 4867 - }, - { - "epoch": 0.12, - "learning_rate": 1.9532759710415154e-06, - "loss": 1.0195, - "step": 4868 - }, - { - "epoch": 0.12, - "learning_rate": 1.953250889733294e-06, - "loss": 0.8398, - "step": 4869 - }, - { - "epoch": 0.12, - "learning_rate": 1.9532258018562136e-06, - "loss": 0.812, - "step": 4870 - }, - { - "epoch": 0.12, - "learning_rate": 1.9532007074104467e-06, - "loss": 0.9531, - "step": 4871 - }, - { - "epoch": 0.12, - "learning_rate": 1.953175606396167e-06, - "loss": 0.8853, - "step": 4872 - }, - { - "epoch": 0.12, - "learning_rate": 1.953150498813547e-06, - "loss": 0.9746, - "step": 4873 - }, - { - "epoch": 0.12, - "learning_rate": 1.9531253846627594e-06, - "loss": 1.0469, - "step": 4874 - }, - { - "epoch": 0.12, - "learning_rate": 1.953100263943978e-06, - "loss": 0.7832, - "step": 4875 - }, - { - "epoch": 0.12, - "learning_rate": 1.953075136657375e-06, - "loss": 0.7559, - "step": 4876 - }, - { - "epoch": 0.12, - "learning_rate": 1.9530500028031245e-06, - "loss": 1.0391, - "step": 4877 - }, - { - "epoch": 0.13, - "learning_rate": 1.953024862381399e-06, - "loss": 1.0439, - "step": 4878 - }, - { - "epoch": 0.13, - "learning_rate": 1.952999715392372e-06, - "loss": 0.8232, - "step": 4879 - }, - { - "epoch": 0.13, - "learning_rate": 1.952974561836217e-06, - "loss": 0.8379, - "step": 4880 - }, - { - "epoch": 0.13, - "learning_rate": 1.9529494017131064e-06, - "loss": 0.8291, - "step": 4881 - }, - { - "epoch": 0.13, - "learning_rate": 1.952924235023215e-06, - "loss": 1.0752, - "step": 4882 - }, - { - "epoch": 0.13, - "learning_rate": 1.952899061766715e-06, - "loss": 1.1074, - "step": 4883 - }, - { - "epoch": 0.13, - "learning_rate": 1.952873881943781e-06, - "loss": 0.9385, - "step": 4884 - }, - { - "epoch": 0.13, - "learning_rate": 1.9528486955545854e-06, - "loss": 0.6804, - "step": 4885 - }, - { - "epoch": 0.13, - "learning_rate": 1.952823502599302e-06, - "loss": 0.9824, - "step": 4886 - }, - { - "epoch": 0.13, - "learning_rate": 1.9527983030781054e-06, - "loss": 0.8164, - "step": 4887 - }, - { - "epoch": 0.13, - "learning_rate": 1.952773096991168e-06, - "loss": 0.8877, - "step": 4888 - }, - { - "epoch": 0.13, - "learning_rate": 1.9527478843386637e-06, - "loss": 1.0732, - "step": 4889 - }, - { - "epoch": 0.13, - "learning_rate": 1.952722665120767e-06, - "loss": 0.8857, - "step": 4890 - }, - { - "epoch": 0.13, - "learning_rate": 1.952697439337651e-06, - "loss": 0.79, - "step": 4891 - }, - { - "epoch": 0.13, - "learning_rate": 1.95267220698949e-06, - "loss": 0.8584, - "step": 4892 - }, - { - "epoch": 0.13, - "learning_rate": 1.9526469680764573e-06, - "loss": 0.917, - "step": 4893 - }, - { - "epoch": 0.13, - "learning_rate": 1.9526217225987273e-06, - "loss": 1.0332, - "step": 4894 - }, - { - "epoch": 0.13, - "learning_rate": 1.952596470556474e-06, - "loss": 0.9053, - "step": 4895 - }, - { - "epoch": 0.13, - "learning_rate": 1.952571211949871e-06, - "loss": 0.8145, - "step": 4896 - }, - { - "epoch": 0.13, - "learning_rate": 1.9525459467790924e-06, - "loss": 0.9531, - "step": 4897 - }, - { - "epoch": 0.13, - "learning_rate": 1.952520675044313e-06, - "loss": 1.0576, - "step": 4898 - }, - { - "epoch": 0.13, - "learning_rate": 1.952495396745706e-06, - "loss": 0.999, - "step": 4899 - }, - { - "epoch": 0.13, - "learning_rate": 1.9524701118834465e-06, - "loss": 1.0303, - "step": 4900 - }, - { - "epoch": 0.13, - "learning_rate": 1.952444820457708e-06, - "loss": 0.9131, - "step": 4901 - }, - { - "epoch": 0.13, - "learning_rate": 1.9524195224686646e-06, - "loss": 0.9795, - "step": 4902 - }, - { - "epoch": 0.13, - "learning_rate": 1.9523942179164916e-06, - "loss": 1.0859, - "step": 4903 - }, - { - "epoch": 0.13, - "learning_rate": 1.952368906801363e-06, - "loss": 0.9082, - "step": 4904 - }, - { - "epoch": 0.13, - "learning_rate": 1.9523435891234525e-06, - "loss": 0.8135, - "step": 4905 - }, - { - "epoch": 0.13, - "learning_rate": 1.9523182648829354e-06, - "loss": 0.9873, - "step": 4906 - }, - { - "epoch": 0.13, - "learning_rate": 1.952292934079986e-06, - "loss": 0.873, - "step": 4907 - }, - { - "epoch": 0.13, - "learning_rate": 1.9522675967147786e-06, - "loss": 0.804, - "step": 4908 - }, - { - "epoch": 0.13, - "learning_rate": 1.9522422527874883e-06, - "loss": 0.8818, - "step": 4909 - }, - { - "epoch": 0.13, - "learning_rate": 1.9522169022982892e-06, - "loss": 0.6587, - "step": 4910 - }, - { - "epoch": 0.13, - "learning_rate": 1.9521915452473563e-06, - "loss": 1.0029, - "step": 4911 - }, - { - "epoch": 0.13, - "learning_rate": 1.9521661816348645e-06, - "loss": 1.2744, - "step": 4912 - }, - { - "epoch": 0.13, - "learning_rate": 1.952140811460988e-06, - "loss": 0.8184, - "step": 4913 - }, - { - "epoch": 0.13, - "learning_rate": 1.952115434725902e-06, - "loss": 1.0098, - "step": 4914 - }, - { - "epoch": 0.13, - "learning_rate": 1.952090051429782e-06, - "loss": 0.9834, - "step": 4915 - }, - { - "epoch": 0.13, - "learning_rate": 1.9520646615728013e-06, - "loss": 0.9058, - "step": 4916 - }, - { - "epoch": 0.13, - "learning_rate": 1.9520392651551363e-06, - "loss": 0.9385, - "step": 4917 - }, - { - "epoch": 0.13, - "learning_rate": 1.9520138621769615e-06, - "loss": 0.999, - "step": 4918 - }, - { - "epoch": 0.13, - "learning_rate": 1.951988452638452e-06, - "loss": 0.8896, - "step": 4919 - }, - { - "epoch": 0.13, - "learning_rate": 1.9519630365397826e-06, - "loss": 0.8584, - "step": 4920 - }, - { - "epoch": 0.13, - "learning_rate": 1.9519376138811293e-06, - "loss": 0.9258, - "step": 4921 - }, - { - "epoch": 0.13, - "learning_rate": 1.9519121846626665e-06, - "loss": 0.8184, - "step": 4922 - }, - { - "epoch": 0.13, - "learning_rate": 1.9518867488845693e-06, - "loss": 0.9492, - "step": 4923 - }, - { - "epoch": 0.13, - "learning_rate": 1.9518613065470134e-06, - "loss": 1.1582, - "step": 4924 - }, - { - "epoch": 0.13, - "learning_rate": 1.9518358576501745e-06, - "loss": 0.9111, - "step": 4925 - }, - { - "epoch": 0.13, - "learning_rate": 1.951810402194227e-06, - "loss": 1.166, - "step": 4926 - }, - { - "epoch": 0.13, - "learning_rate": 1.951784940179347e-06, - "loss": 1.0293, - "step": 4927 - }, - { - "epoch": 0.13, - "learning_rate": 1.95175947160571e-06, - "loss": 0.958, - "step": 4928 - }, - { - "epoch": 0.13, - "learning_rate": 1.951733996473491e-06, - "loss": 1.1025, - "step": 4929 - }, - { - "epoch": 0.13, - "learning_rate": 1.9517085147828665e-06, - "loss": 0.856, - "step": 4930 - }, - { - "epoch": 0.13, - "learning_rate": 1.9516830265340106e-06, - "loss": 0.8232, - "step": 4931 - }, - { - "epoch": 0.13, - "learning_rate": 1.9516575317271e-06, - "loss": 0.918, - "step": 4932 - }, - { - "epoch": 0.13, - "learning_rate": 1.9516320303623103e-06, - "loss": 0.7419, - "step": 4933 - }, - { - "epoch": 0.13, - "learning_rate": 1.951606522439817e-06, - "loss": 0.8706, - "step": 4934 - }, - { - "epoch": 0.13, - "learning_rate": 1.9515810079597962e-06, - "loss": 1.04, - "step": 4935 - }, - { - "epoch": 0.13, - "learning_rate": 1.9515554869224233e-06, - "loss": 0.6313, - "step": 4936 - }, - { - "epoch": 0.13, - "learning_rate": 1.9515299593278744e-06, - "loss": 0.9355, - "step": 4937 - }, - { - "epoch": 0.13, - "learning_rate": 1.951504425176325e-06, - "loss": 1.0703, - "step": 4938 - }, - { - "epoch": 0.13, - "learning_rate": 1.9514788844679517e-06, - "loss": 0.9072, - "step": 4939 - }, - { - "epoch": 0.13, - "learning_rate": 1.9514533372029304e-06, - "loss": 1.0391, - "step": 4940 - }, - { - "epoch": 0.13, - "learning_rate": 1.951427783381437e-06, - "loss": 0.9121, - "step": 4941 - }, - { - "epoch": 0.13, - "learning_rate": 1.9514022230036475e-06, - "loss": 1.0957, - "step": 4942 - }, - { - "epoch": 0.13, - "learning_rate": 1.9513766560697376e-06, - "loss": 0.9062, - "step": 4943 - }, - { - "epoch": 0.13, - "learning_rate": 1.9513510825798845e-06, - "loss": 0.9355, - "step": 4944 - }, - { - "epoch": 0.13, - "learning_rate": 1.9513255025342637e-06, - "loss": 0.9243, - "step": 4945 - }, - { - "epoch": 0.13, - "learning_rate": 1.9512999159330518e-06, - "loss": 1.0723, - "step": 4946 - }, - { - "epoch": 0.13, - "learning_rate": 1.951274322776425e-06, - "loss": 1.0498, - "step": 4947 - }, - { - "epoch": 0.13, - "learning_rate": 1.9512487230645595e-06, - "loss": 0.9453, - "step": 4948 - }, - { - "epoch": 0.13, - "learning_rate": 1.9512231167976315e-06, - "loss": 0.916, - "step": 4949 - }, - { - "epoch": 0.13, - "learning_rate": 1.9511975039758184e-06, - "loss": 0.8035, - "step": 4950 - }, - { - "epoch": 0.13, - "learning_rate": 1.951171884599296e-06, - "loss": 0.8203, - "step": 4951 - }, - { - "epoch": 0.13, - "learning_rate": 1.951146258668241e-06, - "loss": 0.9717, - "step": 4952 - }, - { - "epoch": 0.13, - "learning_rate": 1.95112062618283e-06, - "loss": 1.0596, - "step": 4953 - }, - { - "epoch": 0.13, - "learning_rate": 1.9510949871432396e-06, - "loss": 1.0479, - "step": 4954 - }, - { - "epoch": 0.13, - "learning_rate": 1.951069341549646e-06, - "loss": 0.9463, - "step": 4955 - }, - { - "epoch": 0.13, - "learning_rate": 1.9510436894022267e-06, - "loss": 0.9912, - "step": 4956 - }, - { - "epoch": 0.13, - "learning_rate": 1.951018030701158e-06, - "loss": 1.0049, - "step": 4957 - }, - { - "epoch": 0.13, - "learning_rate": 1.9509923654466174e-06, - "loss": 0.9619, - "step": 4958 - }, - { - "epoch": 0.13, - "learning_rate": 1.9509666936387804e-06, - "loss": 1.0312, - "step": 4959 - }, - { - "epoch": 0.13, - "learning_rate": 1.9509410152778256e-06, - "loss": 0.748, - "step": 4960 - }, - { - "epoch": 0.13, - "learning_rate": 1.9509153303639283e-06, - "loss": 0.8862, - "step": 4961 - }, - { - "epoch": 0.13, - "learning_rate": 1.950889638897267e-06, - "loss": 0.8525, - "step": 4962 - }, - { - "epoch": 0.13, - "learning_rate": 1.9508639408780173e-06, - "loss": 0.7832, - "step": 4963 - }, - { - "epoch": 0.13, - "learning_rate": 1.9508382363063572e-06, - "loss": 1.0703, - "step": 4964 - }, - { - "epoch": 0.13, - "learning_rate": 1.950812525182464e-06, - "loss": 1.0908, - "step": 4965 - }, - { - "epoch": 0.13, - "learning_rate": 1.950786807506514e-06, - "loss": 0.9717, - "step": 4966 - }, - { - "epoch": 0.13, - "learning_rate": 1.9507610832786853e-06, - "loss": 0.9424, - "step": 4967 - }, - { - "epoch": 0.13, - "learning_rate": 1.9507353524991545e-06, - "loss": 1.0547, - "step": 4968 - }, - { - "epoch": 0.13, - "learning_rate": 1.9507096151680997e-06, - "loss": 0.8984, - "step": 4969 - }, - { - "epoch": 0.13, - "learning_rate": 1.9506838712856973e-06, - "loss": 0.9072, - "step": 4970 - }, - { - "epoch": 0.13, - "learning_rate": 1.9506581208521252e-06, - "loss": 1.0518, - "step": 4971 - }, - { - "epoch": 0.13, - "learning_rate": 1.950632363867561e-06, - "loss": 0.6567, - "step": 4972 - }, - { - "epoch": 0.13, - "learning_rate": 1.950606600332182e-06, - "loss": 0.7812, - "step": 4973 - }, - { - "epoch": 0.13, - "learning_rate": 1.9505808302461653e-06, - "loss": 1.04, - "step": 4974 - }, - { - "epoch": 0.13, - "learning_rate": 1.9505550536096896e-06, - "loss": 0.7524, - "step": 4975 - }, - { - "epoch": 0.13, - "learning_rate": 1.9505292704229315e-06, - "loss": 0.9727, - "step": 4976 - }, - { - "epoch": 0.13, - "learning_rate": 1.950503480686069e-06, - "loss": 1.0908, - "step": 4977 - }, - { - "epoch": 0.13, - "learning_rate": 1.95047768439928e-06, - "loss": 1.0566, - "step": 4978 - }, - { - "epoch": 0.13, - "learning_rate": 1.950451881562742e-06, - "loss": 0.9873, - "step": 4979 - }, - { - "epoch": 0.13, - "learning_rate": 1.9504260721766328e-06, - "loss": 0.9414, - "step": 4980 - }, - { - "epoch": 0.13, - "learning_rate": 1.9504002562411305e-06, - "loss": 1.1328, - "step": 4981 - }, - { - "epoch": 0.13, - "learning_rate": 1.9503744337564126e-06, - "loss": 1.1367, - "step": 4982 - }, - { - "epoch": 0.13, - "learning_rate": 1.9503486047226575e-06, - "loss": 0.9619, - "step": 4983 - }, - { - "epoch": 0.13, - "learning_rate": 1.950322769140043e-06, - "loss": 1.0234, - "step": 4984 - }, - { - "epoch": 0.13, - "learning_rate": 1.950296927008747e-06, - "loss": 0.7251, - "step": 4985 - }, - { - "epoch": 0.13, - "learning_rate": 1.950271078328948e-06, - "loss": 0.9648, - "step": 4986 - }, - { - "epoch": 0.13, - "learning_rate": 1.9502452231008234e-06, - "loss": 1.0918, - "step": 4987 - }, - { - "epoch": 0.13, - "learning_rate": 1.950219361324552e-06, - "loss": 0.9961, - "step": 4988 - }, - { - "epoch": 0.13, - "learning_rate": 1.950193493000312e-06, - "loss": 0.9492, - "step": 4989 - }, - { - "epoch": 0.13, - "learning_rate": 1.9501676181282815e-06, - "loss": 1.042, - "step": 4990 - }, - { - "epoch": 0.13, - "learning_rate": 1.9501417367086383e-06, - "loss": 0.8633, - "step": 4991 - }, - { - "epoch": 0.13, - "learning_rate": 1.9501158487415613e-06, - "loss": 0.8525, - "step": 4992 - }, - { - "epoch": 0.13, - "learning_rate": 1.9500899542272292e-06, - "loss": 1.0811, - "step": 4993 - }, - { - "epoch": 0.13, - "learning_rate": 1.9500640531658195e-06, - "loss": 0.7583, - "step": 4994 - }, - { - "epoch": 0.13, - "learning_rate": 1.9500381455575117e-06, - "loss": 0.9961, - "step": 4995 - }, - { - "epoch": 0.13, - "learning_rate": 1.9500122314024838e-06, - "loss": 1.0859, - "step": 4996 - }, - { - "epoch": 0.13, - "learning_rate": 1.9499863107009143e-06, - "loss": 0.7959, - "step": 4997 - }, - { - "epoch": 0.13, - "learning_rate": 1.949960383452982e-06, - "loss": 0.792, - "step": 4998 - }, - { - "epoch": 0.13, - "learning_rate": 1.9499344496588655e-06, - "loss": 0.9727, - "step": 4999 - }, - { - "epoch": 0.13, - "learning_rate": 1.9499085093187436e-06, - "loss": 0.5552, - "step": 5000 - }, - { - "epoch": 0.13, - "learning_rate": 1.999151346260752e-06, - "loss": 1.1875, - "step": 5001 - }, - { - "epoch": 0.13, - "learning_rate": 1.9991502061419393e-06, - "loss": 1.3135, - "step": 5002 - }, - { - "epoch": 0.13, - "learning_rate": 1.9991490652581228e-06, - "loss": 0.833, - "step": 5003 - }, - { - "epoch": 0.13, - "learning_rate": 1.999147923609304e-06, - "loss": 0.96, - "step": 5004 - }, - { - "epoch": 0.13, - "learning_rate": 1.9991467811954844e-06, - "loss": 0.8867, - "step": 5005 - }, - { - "epoch": 0.13, - "learning_rate": 1.9991456380166635e-06, - "loss": 0.9023, - "step": 5006 - }, - { - "epoch": 0.13, - "learning_rate": 1.999144494072842e-06, - "loss": 0.8223, - "step": 5007 - }, - { - "epoch": 0.13, - "learning_rate": 1.9991433493640226e-06, - "loss": 0.915, - "step": 5008 - }, - { - "epoch": 0.13, - "learning_rate": 1.9991422038902045e-06, - "loss": 0.918, - "step": 5009 - }, - { - "epoch": 0.13, - "learning_rate": 1.9991410576513897e-06, - "loss": 0.9062, - "step": 5010 - }, - { - "epoch": 0.13, - "learning_rate": 1.999139910647578e-06, - "loss": 0.8828, - "step": 5011 - }, - { - "epoch": 0.13, - "learning_rate": 1.999138762878771e-06, - "loss": 1.0586, - "step": 5012 - }, - { - "epoch": 0.13, - "learning_rate": 1.9991376143449693e-06, - "loss": 0.8301, - "step": 5013 - }, - { - "epoch": 0.13, - "learning_rate": 1.999136465046174e-06, - "loss": 0.9434, - "step": 5014 - }, - { - "epoch": 0.13, - "learning_rate": 1.999135314982386e-06, - "loss": 1.0273, - "step": 5015 - }, - { - "epoch": 0.13, - "learning_rate": 1.9991341641536055e-06, - "loss": 1.0654, - "step": 5016 - }, - { - "epoch": 0.13, - "learning_rate": 1.999133012559834e-06, - "loss": 0.9531, - "step": 5017 - }, - { - "epoch": 0.13, - "learning_rate": 1.999131860201073e-06, - "loss": 1.04, - "step": 5018 - }, - { - "epoch": 0.13, - "learning_rate": 1.999130707077322e-06, - "loss": 1.0762, - "step": 5019 - }, - { - "epoch": 0.13, - "learning_rate": 1.9991295531885826e-06, - "loss": 0.9863, - "step": 5020 - }, - { - "epoch": 0.13, - "learning_rate": 1.999128398534856e-06, - "loss": 0.9482, - "step": 5021 - }, - { - "epoch": 0.13, - "learning_rate": 1.9991272431161425e-06, - "loss": 0.7305, - "step": 5022 - }, - { - "epoch": 0.13, - "learning_rate": 1.9991260869324427e-06, - "loss": 0.9287, - "step": 5023 - }, - { - "epoch": 0.13, - "learning_rate": 1.999124929983759e-06, - "loss": 0.8789, - "step": 5024 - }, - { - "epoch": 0.13, - "learning_rate": 1.9991237722700907e-06, - "loss": 0.917, - "step": 5025 - }, - { - "epoch": 0.13, - "learning_rate": 1.999122613791439e-06, - "loss": 1.1738, - "step": 5026 - }, - { - "epoch": 0.13, - "learning_rate": 1.9991214545478056e-06, - "loss": 0.8887, - "step": 5027 - }, - { - "epoch": 0.13, - "learning_rate": 1.999120294539191e-06, - "loss": 1.3105, - "step": 5028 - }, - { - "epoch": 0.13, - "learning_rate": 1.9991191337655953e-06, - "loss": 0.9297, - "step": 5029 - }, - { - "epoch": 0.13, - "learning_rate": 1.9991179722270205e-06, - "loss": 0.9941, - "step": 5030 - }, - { - "epoch": 0.13, - "learning_rate": 1.9991168099234666e-06, - "loss": 0.9365, - "step": 5031 - }, - { - "epoch": 0.13, - "learning_rate": 1.999115646854935e-06, - "loss": 0.9414, - "step": 5032 - }, - { - "epoch": 0.13, - "learning_rate": 1.9991144830214267e-06, - "loss": 0.6777, - "step": 5033 - }, - { - "epoch": 0.13, - "learning_rate": 1.9991133184229425e-06, - "loss": 0.8989, - "step": 5034 - }, - { - "epoch": 0.13, - "learning_rate": 1.999112153059483e-06, - "loss": 1.0195, - "step": 5035 - }, - { - "epoch": 0.13, - "learning_rate": 1.999110986931049e-06, - "loss": 0.957, - "step": 5036 - }, - { - "epoch": 0.13, - "learning_rate": 1.9991098200376422e-06, - "loss": 0.8501, - "step": 5037 - }, - { - "epoch": 0.13, - "learning_rate": 1.9991086523792625e-06, - "loss": 0.9111, - "step": 5038 - }, - { - "epoch": 0.13, - "learning_rate": 1.9991074839559116e-06, - "loss": 0.9072, - "step": 5039 - }, - { - "epoch": 0.13, - "learning_rate": 1.9991063147675896e-06, - "loss": 1.0996, - "step": 5040 - }, - { - "epoch": 0.13, - "learning_rate": 1.999105144814298e-06, - "loss": 0.8662, - "step": 5041 - }, - { - "epoch": 0.13, - "learning_rate": 1.9991039740960377e-06, - "loss": 0.8857, - "step": 5042 - }, - { - "epoch": 0.13, - "learning_rate": 1.9991028026128095e-06, - "loss": 0.8481, - "step": 5043 - }, - { - "epoch": 0.13, - "learning_rate": 1.9991016303646136e-06, - "loss": 0.6938, - "step": 5044 - }, - { - "epoch": 0.13, - "learning_rate": 1.999100457351452e-06, - "loss": 1.002, - "step": 5045 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990992835733254e-06, - "loss": 0.9062, - "step": 5046 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990981090302343e-06, - "loss": 0.8906, - "step": 5047 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990969337221793e-06, - "loss": 1.0195, - "step": 5048 - }, - { - "epoch": 0.13, - "learning_rate": 1.999095757649162e-06, - "loss": 0.8633, - "step": 5049 - }, - { - "epoch": 0.13, - "learning_rate": 1.999094580811183e-06, - "loss": 0.8569, - "step": 5050 - }, - { - "epoch": 0.13, - "learning_rate": 1.999093403208243e-06, - "loss": 1.0654, - "step": 5051 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990922248403433e-06, - "loss": 0.7432, - "step": 5052 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990910457074848e-06, - "loss": 0.957, - "step": 5053 - }, - { - "epoch": 0.13, - "learning_rate": 1.999089865809668e-06, - "loss": 1.1035, - "step": 5054 - }, - { - "epoch": 0.13, - "learning_rate": 1.999088685146894e-06, - "loss": 1.0107, - "step": 5055 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990875037191637e-06, - "loss": 0.9521, - "step": 5056 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990863215264783e-06, - "loss": 0.9678, - "step": 5057 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990851385688382e-06, - "loss": 0.8965, - "step": 5058 - }, - { - "epoch": 0.13, - "learning_rate": 1.999083954846245e-06, - "loss": 1.041, - "step": 5059 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990827703586986e-06, - "loss": 0.7783, - "step": 5060 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990815851062006e-06, - "loss": 1.3086, - "step": 5061 - }, - { - "epoch": 0.13, - "learning_rate": 1.999080399088752e-06, - "loss": 0.8311, - "step": 5062 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990792123063532e-06, - "loss": 1.0273, - "step": 5063 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990780247590054e-06, - "loss": 0.8848, - "step": 5064 - }, - { - "epoch": 0.13, - "learning_rate": 1.99907683644671e-06, - "loss": 1.0615, - "step": 5065 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990756473694664e-06, - "loss": 0.7148, - "step": 5066 - }, - { - "epoch": 0.13, - "learning_rate": 1.999074457527277e-06, - "loss": 1.0596, - "step": 5067 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990732669201423e-06, - "loss": 1.0107, - "step": 5068 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990720755480634e-06, - "loss": 0.9238, - "step": 5069 - }, - { - "epoch": 0.13, - "learning_rate": 1.999070883411041e-06, - "loss": 0.7217, - "step": 5070 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990696905090757e-06, - "loss": 0.8779, - "step": 5071 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990684968421686e-06, - "loss": 0.8701, - "step": 5072 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990673024103208e-06, - "loss": 1.1138, - "step": 5073 - }, - { - "epoch": 0.13, - "learning_rate": 1.999066107213533e-06, - "loss": 0.834, - "step": 5074 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990649112518063e-06, - "loss": 0.9551, - "step": 5075 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990637145251413e-06, - "loss": 0.8857, - "step": 5076 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990625170335395e-06, - "loss": 1.0332, - "step": 5077 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990613187770012e-06, - "loss": 1.1074, - "step": 5078 - }, - { - "epoch": 0.13, - "learning_rate": 1.999060119755528e-06, - "loss": 1.0127, - "step": 5079 - }, - { - "epoch": 0.13, - "learning_rate": 1.99905891996912e-06, - "loss": 0.5747, - "step": 5080 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990577194177783e-06, - "loss": 0.9941, - "step": 5081 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990565181015047e-06, - "loss": 0.7622, - "step": 5082 - }, - { - "epoch": 0.13, - "learning_rate": 1.999055316020299e-06, - "loss": 0.9561, - "step": 5083 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990541131741626e-06, - "loss": 0.9453, - "step": 5084 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990529095630967e-06, - "loss": 0.8276, - "step": 5085 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990517051871016e-06, - "loss": 0.8887, - "step": 5086 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990505000461786e-06, - "loss": 1.1504, - "step": 5087 - }, - { - "epoch": 0.13, - "learning_rate": 1.999049294140329e-06, - "loss": 0.9961, - "step": 5088 - }, - { - "epoch": 0.13, - "learning_rate": 1.999048087469553e-06, - "loss": 0.4961, - "step": 5089 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990468800338517e-06, - "loss": 0.9307, - "step": 5090 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990456718332263e-06, - "loss": 1.0977, - "step": 5091 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990444628676777e-06, - "loss": 0.9434, - "step": 5092 - }, - { - "epoch": 0.13, - "learning_rate": 1.999043253137206e-06, - "loss": 0.9688, - "step": 5093 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990420426418135e-06, - "loss": 0.8867, - "step": 5094 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990408313815005e-06, - "loss": 1.0264, - "step": 5095 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990396193562672e-06, - "loss": 0.9961, - "step": 5096 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990384065661158e-06, - "loss": 1.0078, - "step": 5097 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990371930110465e-06, - "loss": 0.7246, - "step": 5098 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990359786910604e-06, - "loss": 0.9688, - "step": 5099 - }, - { - "epoch": 0.13, - "learning_rate": 1.999034763606158e-06, - "loss": 0.7329, - "step": 5100 - }, - { - "epoch": 0.13, - "learning_rate": 1.999033547756341e-06, - "loss": 1.0234, - "step": 5101 - }, - { - "epoch": 0.13, - "learning_rate": 1.99903233114161e-06, - "loss": 0.8496, - "step": 5102 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990311137619654e-06, - "loss": 1.123, - "step": 5103 - }, - { - "epoch": 0.13, - "learning_rate": 1.999029895617409e-06, - "loss": 0.6885, - "step": 5104 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990286767079418e-06, - "loss": 0.9697, - "step": 5105 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990274570335635e-06, - "loss": 0.8306, - "step": 5106 - }, - { - "epoch": 0.13, - "learning_rate": 1.999026236594276e-06, - "loss": 0.8926, - "step": 5107 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990250153900803e-06, - "loss": 1.0654, - "step": 5108 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990237934209767e-06, - "loss": 0.8208, - "step": 5109 - }, - { - "epoch": 0.13, - "learning_rate": 1.999022570686967e-06, - "loss": 1.1445, - "step": 5110 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990213471880514e-06, - "loss": 0.9023, - "step": 5111 - }, - { - "epoch": 0.13, - "learning_rate": 1.999020122924231e-06, - "loss": 0.9727, - "step": 5112 - }, - { - "epoch": 0.13, - "learning_rate": 1.999018897895507e-06, - "loss": 0.8115, - "step": 5113 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990176721018803e-06, - "loss": 1.0293, - "step": 5114 - }, - { - "epoch": 0.13, - "learning_rate": 1.999016445543351e-06, - "loss": 1.0439, - "step": 5115 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990152182199213e-06, - "loss": 1.0586, - "step": 5116 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990139901315916e-06, - "loss": 0.9893, - "step": 5117 - }, - { - "epoch": 0.13, - "learning_rate": 1.999012761278363e-06, - "loss": 1.0605, - "step": 5118 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990115316602358e-06, - "loss": 1.1885, - "step": 5119 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990103012772117e-06, - "loss": 0.957, - "step": 5120 - }, - { - "epoch": 0.13, - "learning_rate": 1.999009070129291e-06, - "loss": 0.8291, - "step": 5121 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990078382164755e-06, - "loss": 1.0938, - "step": 5122 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990066055387654e-06, - "loss": 0.9775, - "step": 5123 - }, - { - "epoch": 0.13, - "learning_rate": 1.999005372096162e-06, - "loss": 0.6768, - "step": 5124 - }, - { - "epoch": 0.13, - "learning_rate": 1.9990041378886654e-06, - "loss": 1.0635, - "step": 5125 - }, - { - "epoch": 0.13, - "learning_rate": 1.999002902916278e-06, - "loss": 0.8721, - "step": 5126 - }, - { - "epoch": 0.13, - "learning_rate": 1.999001667179e-06, - "loss": 0.8867, - "step": 5127 - }, - { - "epoch": 0.13, - "learning_rate": 1.999000430676832e-06, - "loss": 0.7139, - "step": 5128 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989991934097757e-06, - "loss": 0.9941, - "step": 5129 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989979553778315e-06, - "loss": 1.0684, - "step": 5130 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989967165810004e-06, - "loss": 0.8125, - "step": 5131 - }, - { - "epoch": 0.13, - "learning_rate": 1.998995477019284e-06, - "loss": 1.0098, - "step": 5132 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989942366926816e-06, - "loss": 0.9238, - "step": 5133 - }, - { - "epoch": 0.13, - "learning_rate": 1.998992995601196e-06, - "loss": 1.0391, - "step": 5134 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989917537448273e-06, - "loss": 0.679, - "step": 5135 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989905111235764e-06, - "loss": 1.0059, - "step": 5136 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989892677374446e-06, - "loss": 0.8535, - "step": 5137 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989880235864324e-06, - "loss": 1.0225, - "step": 5138 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989867786705413e-06, - "loss": 0.9316, - "step": 5139 - }, - { - "epoch": 0.13, - "learning_rate": 1.998985532989772e-06, - "loss": 0.8936, - "step": 5140 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989842865441253e-06, - "loss": 0.8604, - "step": 5141 - }, - { - "epoch": 0.13, - "learning_rate": 1.998983039333602e-06, - "loss": 0.8896, - "step": 5142 - }, - { - "epoch": 0.13, - "learning_rate": 1.998981791358204e-06, - "loss": 0.7856, - "step": 5143 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989805426179306e-06, - "loss": 0.8516, - "step": 5144 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989792931127846e-06, - "loss": 0.8115, - "step": 5145 - }, - { - "epoch": 0.13, - "learning_rate": 1.998978042842765e-06, - "loss": 0.9619, - "step": 5146 - }, - { - "epoch": 0.13, - "learning_rate": 1.998976791807875e-06, - "loss": 0.9111, - "step": 5147 - }, - { - "epoch": 0.13, - "learning_rate": 1.998975540008114e-06, - "loss": 0.8252, - "step": 5148 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989742874434834e-06, - "loss": 0.7056, - "step": 5149 - }, - { - "epoch": 0.13, - "learning_rate": 1.998973034113984e-06, - "loss": 0.9131, - "step": 5150 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989717800196172e-06, - "loss": 1.1348, - "step": 5151 - }, - { - "epoch": 0.13, - "learning_rate": 1.998970525160383e-06, - "loss": 0.8862, - "step": 5152 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989692695362837e-06, - "loss": 1.082, - "step": 5153 - }, - { - "epoch": 0.13, - "learning_rate": 1.998968013147319e-06, - "loss": 0.8203, - "step": 5154 - }, - { - "epoch": 0.13, - "learning_rate": 1.998966755993491e-06, - "loss": 0.9731, - "step": 5155 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989654980747996e-06, - "loss": 0.9243, - "step": 5156 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989642393912464e-06, - "loss": 0.9189, - "step": 5157 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989629799428323e-06, - "loss": 0.9048, - "step": 5158 - }, - { - "epoch": 0.13, - "learning_rate": 1.998961719729558e-06, - "loss": 0.8735, - "step": 5159 - }, - { - "epoch": 0.13, - "learning_rate": 1.998960458751425e-06, - "loss": 1.0127, - "step": 5160 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989591970084334e-06, - "loss": 1.1953, - "step": 5161 - }, - { - "epoch": 0.13, - "learning_rate": 1.998957934500585e-06, - "loss": 1.0674, - "step": 5162 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989566712278806e-06, - "loss": 0.9531, - "step": 5163 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989554071903206e-06, - "loss": 0.9424, - "step": 5164 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989541423879065e-06, - "loss": 0.8711, - "step": 5165 - }, - { - "epoch": 0.13, - "learning_rate": 1.99895287682064e-06, - "loss": 0.9297, - "step": 5166 - }, - { - "epoch": 0.13, - "learning_rate": 1.99895161048852e-06, - "loss": 0.8135, - "step": 5167 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989503433915493e-06, - "loss": 0.9141, - "step": 5168 - }, - { - "epoch": 0.13, - "learning_rate": 1.998949075529728e-06, - "loss": 0.8662, - "step": 5169 - }, - { - "epoch": 0.13, - "learning_rate": 1.998947806903057e-06, - "loss": 0.8525, - "step": 5170 - }, - { - "epoch": 0.13, - "learning_rate": 1.998946537511538e-06, - "loss": 0.7568, - "step": 5171 - }, - { - "epoch": 0.13, - "learning_rate": 1.998945267355172e-06, - "loss": 1.1768, - "step": 5172 - }, - { - "epoch": 0.13, - "learning_rate": 1.998943996433959e-06, - "loss": 1.0293, - "step": 5173 - }, - { - "epoch": 0.13, - "learning_rate": 1.998942724747901e-06, - "loss": 0.9697, - "step": 5174 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989414522969978e-06, - "loss": 1.0391, - "step": 5175 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989401790812514e-06, - "loss": 1.2441, - "step": 5176 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989389051006623e-06, - "loss": 0.9453, - "step": 5177 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989376303552316e-06, - "loss": 1.0361, - "step": 5178 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989363548449607e-06, - "loss": 0.9062, - "step": 5179 - }, - { - "epoch": 0.13, - "learning_rate": 1.99893507856985e-06, - "loss": 1.0674, - "step": 5180 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989338015299e-06, - "loss": 0.845, - "step": 5181 - }, - { - "epoch": 0.13, - "learning_rate": 1.998932523725113e-06, - "loss": 0.814, - "step": 5182 - }, - { - "epoch": 0.13, - "learning_rate": 1.998931245155489e-06, - "loss": 0.998, - "step": 5183 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989299658210297e-06, - "loss": 0.9375, - "step": 5184 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989286857217354e-06, - "loss": 0.8691, - "step": 5185 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989274048576077e-06, - "loss": 0.9512, - "step": 5186 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989261232286464e-06, - "loss": 0.7051, - "step": 5187 - }, - { - "epoch": 0.13, - "learning_rate": 1.998924840834854e-06, - "loss": 0.7319, - "step": 5188 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989235576762303e-06, - "loss": 0.9736, - "step": 5189 - }, - { - "epoch": 0.13, - "learning_rate": 1.998922273752777e-06, - "loss": 0.834, - "step": 5190 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989209890644946e-06, - "loss": 1.1523, - "step": 5191 - }, - { - "epoch": 0.13, - "learning_rate": 1.998919703611385e-06, - "loss": 1.1191, - "step": 5192 - }, - { - "epoch": 0.13, - "learning_rate": 1.998918417393448e-06, - "loss": 0.72, - "step": 5193 - }, - { - "epoch": 0.13, - "learning_rate": 1.998917130410685e-06, - "loss": 0.9922, - "step": 5194 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989158426630973e-06, - "loss": 1.0303, - "step": 5195 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989145541506856e-06, - "loss": 0.8623, - "step": 5196 - }, - { - "epoch": 0.13, - "learning_rate": 1.998913264873451e-06, - "loss": 1.166, - "step": 5197 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989119748313942e-06, - "loss": 0.8062, - "step": 5198 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989106840245168e-06, - "loss": 0.9648, - "step": 5199 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989093924528194e-06, - "loss": 0.8638, - "step": 5200 - }, - { - "epoch": 0.13, - "learning_rate": 1.998908100116303e-06, - "loss": 0.835, - "step": 5201 - }, - { - "epoch": 0.13, - "learning_rate": 1.998906807014968e-06, - "loss": 0.8535, - "step": 5202 - }, - { - "epoch": 0.13, - "learning_rate": 1.998905513148817e-06, - "loss": 0.917, - "step": 5203 - }, - { - "epoch": 0.13, - "learning_rate": 1.998904218517849e-06, - "loss": 0.7212, - "step": 5204 - }, - { - "epoch": 0.13, - "learning_rate": 1.998902923122067e-06, - "loss": 1.1143, - "step": 5205 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989016269614703e-06, - "loss": 0.7993, - "step": 5206 - }, - { - "epoch": 0.13, - "learning_rate": 1.9989003300360605e-06, - "loss": 0.7148, - "step": 5207 - }, - { - "epoch": 0.13, - "learning_rate": 1.998899032345839e-06, - "loss": 0.6194, - "step": 5208 - }, - { - "epoch": 0.13, - "learning_rate": 1.998897733890806e-06, - "loss": 0.9814, - "step": 5209 - }, - { - "epoch": 0.13, - "learning_rate": 1.998896434670963e-06, - "loss": 0.9277, - "step": 5210 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988951346863114e-06, - "loss": 0.9619, - "step": 5211 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988938339368515e-06, - "loss": 1.0195, - "step": 5212 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988925324225844e-06, - "loss": 0.9141, - "step": 5213 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988912301435113e-06, - "loss": 0.8066, - "step": 5214 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988899270996327e-06, - "loss": 0.9033, - "step": 5215 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988886232909507e-06, - "loss": 0.8545, - "step": 5216 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988873187174653e-06, - "loss": 1.083, - "step": 5217 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988860133791777e-06, - "loss": 0.9805, - "step": 5218 - }, - { - "epoch": 0.13, - "learning_rate": 1.998884707276089e-06, - "loss": 0.9697, - "step": 5219 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988834004082004e-06, - "loss": 1.0488, - "step": 5220 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988820927755127e-06, - "loss": 0.8789, - "step": 5221 - }, - { - "epoch": 0.13, - "learning_rate": 1.998880784378027e-06, - "loss": 0.9629, - "step": 5222 - }, - { - "epoch": 0.13, - "learning_rate": 1.998879475215744e-06, - "loss": 0.5991, - "step": 5223 - }, - { - "epoch": 0.13, - "learning_rate": 1.998878165288665e-06, - "loss": 0.9229, - "step": 5224 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988768545967908e-06, - "loss": 1.2188, - "step": 5225 - }, - { - "epoch": 0.13, - "learning_rate": 1.998875543140123e-06, - "loss": 0.7983, - "step": 5226 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988742309186614e-06, - "loss": 0.9033, - "step": 5227 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988729179324083e-06, - "loss": 0.6704, - "step": 5228 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988716041813637e-06, - "loss": 1.1797, - "step": 5229 - }, - { - "epoch": 0.13, - "learning_rate": 1.998870289665529e-06, - "loss": 1.0195, - "step": 5230 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988689743849057e-06, - "loss": 1.0186, - "step": 5231 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988676583394944e-06, - "loss": 0.915, - "step": 5232 - }, - { - "epoch": 0.13, - "learning_rate": 1.998866341529296e-06, - "loss": 0.7568, - "step": 5233 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988650239543113e-06, - "loss": 0.8887, - "step": 5234 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988637056145414e-06, - "loss": 1.0342, - "step": 5235 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988623865099877e-06, - "loss": 0.666, - "step": 5236 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988610666406513e-06, - "loss": 0.5898, - "step": 5237 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988597460065327e-06, - "loss": 0.9668, - "step": 5238 - }, - { - "epoch": 0.13, - "learning_rate": 1.998858424607633e-06, - "loss": 0.999, - "step": 5239 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988571024439538e-06, - "loss": 0.9727, - "step": 5240 - }, - { - "epoch": 0.13, - "learning_rate": 1.998855779515495e-06, - "loss": 0.8564, - "step": 5241 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988544558222586e-06, - "loss": 0.748, - "step": 5242 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988531313642453e-06, - "loss": 1.0518, - "step": 5243 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988518061414557e-06, - "loss": 1.1045, - "step": 5244 - }, - { - "epoch": 0.13, - "learning_rate": 1.998850480153892e-06, - "loss": 0.8564, - "step": 5245 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988491534015535e-06, - "loss": 0.401, - "step": 5246 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988478258844426e-06, - "loss": 1.1318, - "step": 5247 - }, - { - "epoch": 0.13, - "learning_rate": 1.99884649760256e-06, - "loss": 1.0654, - "step": 5248 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988451685559062e-06, - "loss": 0.8896, - "step": 5249 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988438387444825e-06, - "loss": 0.9336, - "step": 5250 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988425081682905e-06, - "loss": 0.8652, - "step": 5251 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988411768273306e-06, - "loss": 0.6875, - "step": 5252 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988398447216034e-06, - "loss": 1.0332, - "step": 5253 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988385118511113e-06, - "loss": 0.9346, - "step": 5254 - }, - { - "epoch": 0.13, - "learning_rate": 1.998837178215854e-06, - "loss": 0.9316, - "step": 5255 - }, - { - "epoch": 0.13, - "learning_rate": 1.998835843815833e-06, - "loss": 1.0645, - "step": 5256 - }, - { - "epoch": 0.13, - "learning_rate": 1.998834508651049e-06, - "loss": 1.0781, - "step": 5257 - }, - { - "epoch": 0.13, - "learning_rate": 1.998833172721504e-06, - "loss": 0.731, - "step": 5258 - }, - { - "epoch": 0.13, - "learning_rate": 1.998831836027198e-06, - "loss": 0.7827, - "step": 5259 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988304985681322e-06, - "loss": 0.9932, - "step": 5260 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988291603443084e-06, - "loss": 1.0088, - "step": 5261 - }, - { - "epoch": 0.13, - "learning_rate": 1.998827821355727e-06, - "loss": 0.8564, - "step": 5262 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988264816023883e-06, - "loss": 0.8955, - "step": 5263 - }, - { - "epoch": 0.13, - "learning_rate": 1.998825141084295e-06, - "loss": 0.6968, - "step": 5264 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988237998014468e-06, - "loss": 0.7283, - "step": 5265 - }, - { - "epoch": 0.13, - "learning_rate": 1.9988224577538448e-06, - "loss": 0.8438, - "step": 5266 - }, - { - "epoch": 0.13, - "learning_rate": 1.998821114941491e-06, - "loss": 0.9668, - "step": 5267 - }, - { - "epoch": 0.14, - "learning_rate": 1.998819771364385e-06, - "loss": 0.9409, - "step": 5268 - }, - { - "epoch": 0.14, - "learning_rate": 1.9988184270225292e-06, - "loss": 0.9512, - "step": 5269 - }, - { - "epoch": 0.14, - "learning_rate": 1.998817081915924e-06, - "loss": 0.8022, - "step": 5270 - }, - { - "epoch": 0.14, - "learning_rate": 1.9988157360445706e-06, - "loss": 0.8857, - "step": 5271 - }, - { - "epoch": 0.14, - "learning_rate": 1.9988143894084696e-06, - "loss": 0.959, - "step": 5272 - }, - { - "epoch": 0.14, - "learning_rate": 1.9988130420076228e-06, - "loss": 0.936, - "step": 5273 - }, - { - "epoch": 0.14, - "learning_rate": 1.99881169384203e-06, - "loss": 0.6899, - "step": 5274 - }, - { - "epoch": 0.14, - "learning_rate": 1.998810344911694e-06, - "loss": 0.8799, - "step": 5275 - }, - { - "epoch": 0.14, - "learning_rate": 1.9988089952166142e-06, - "loss": 1.0625, - "step": 5276 - }, - { - "epoch": 0.14, - "learning_rate": 1.9988076447567926e-06, - "loss": 0.9053, - "step": 5277 - }, - { - "epoch": 0.14, - "learning_rate": 1.99880629353223e-06, - "loss": 1.0547, - "step": 5278 - }, - { - "epoch": 0.14, - "learning_rate": 1.998804941542927e-06, - "loss": 1.0176, - "step": 5279 - }, - { - "epoch": 0.14, - "learning_rate": 1.998803588788885e-06, - "loss": 0.7144, - "step": 5280 - }, - { - "epoch": 0.14, - "learning_rate": 1.9988022352701052e-06, - "loss": 1.0137, - "step": 5281 - }, - { - "epoch": 0.14, - "learning_rate": 1.998800880986588e-06, - "loss": 1.0049, - "step": 5282 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987995259383356e-06, - "loss": 0.6733, - "step": 5283 - }, - { - "epoch": 0.14, - "learning_rate": 1.998798170125348e-06, - "loss": 0.9434, - "step": 5284 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987968135476267e-06, - "loss": 0.9404, - "step": 5285 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987954562051724e-06, - "loss": 0.9014, - "step": 5286 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987940980979863e-06, - "loss": 0.8105, - "step": 5287 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987927392260695e-06, - "loss": 1.0078, - "step": 5288 - }, - { - "epoch": 0.14, - "learning_rate": 1.998791379589423e-06, - "loss": 0.9346, - "step": 5289 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987900191880482e-06, - "loss": 1.0098, - "step": 5290 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987886580219453e-06, - "loss": 0.8857, - "step": 5291 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987872960911165e-06, - "loss": 1.0547, - "step": 5292 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987859333955618e-06, - "loss": 0.8125, - "step": 5293 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987845699352824e-06, - "loss": 1.0117, - "step": 5294 - }, - { - "epoch": 0.14, - "learning_rate": 1.99878320571028e-06, - "loss": 0.9355, - "step": 5295 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987818407205553e-06, - "loss": 1.0229, - "step": 5296 - }, - { - "epoch": 0.14, - "learning_rate": 1.998780474966109e-06, - "loss": 0.8984, - "step": 5297 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987791084469423e-06, - "loss": 0.9014, - "step": 5298 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987777411630567e-06, - "loss": 1.0762, - "step": 5299 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987763731144528e-06, - "loss": 0.7231, - "step": 5300 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987750043011314e-06, - "loss": 0.7188, - "step": 5301 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987736347230943e-06, - "loss": 0.8174, - "step": 5302 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987722643803424e-06, - "loss": 0.8193, - "step": 5303 - }, - { - "epoch": 0.14, - "learning_rate": 1.998770893272876e-06, - "loss": 0.9229, - "step": 5304 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987695214006967e-06, - "loss": 0.6689, - "step": 5305 - }, - { - "epoch": 0.14, - "learning_rate": 1.998768148763806e-06, - "loss": 0.9971, - "step": 5306 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987667753622037e-06, - "loss": 0.9502, - "step": 5307 - }, - { - "epoch": 0.14, - "learning_rate": 1.998765401195892e-06, - "loss": 0.8848, - "step": 5308 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987640262648714e-06, - "loss": 0.9492, - "step": 5309 - }, - { - "epoch": 0.14, - "learning_rate": 1.998762650569143e-06, - "loss": 0.6956, - "step": 5310 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987612741087084e-06, - "loss": 1.1416, - "step": 5311 - }, - { - "epoch": 0.14, - "learning_rate": 1.998759896883568e-06, - "loss": 0.9463, - "step": 5312 - }, - { - "epoch": 0.14, - "learning_rate": 1.998758518893723e-06, - "loss": 0.7988, - "step": 5313 - }, - { - "epoch": 0.14, - "learning_rate": 1.998757140139175e-06, - "loss": 1.084, - "step": 5314 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987557606199238e-06, - "loss": 0.9727, - "step": 5315 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987543803359717e-06, - "loss": 0.9912, - "step": 5316 - }, - { - "epoch": 0.14, - "learning_rate": 1.998752999287319e-06, - "loss": 1.0469, - "step": 5317 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987516174739674e-06, - "loss": 1.041, - "step": 5318 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987502348959177e-06, - "loss": 1.1094, - "step": 5319 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987488515531704e-06, - "loss": 0.708, - "step": 5320 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987474674457273e-06, - "loss": 0.7935, - "step": 5321 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987460825735892e-06, - "loss": 1.1152, - "step": 5322 - }, - { - "epoch": 0.14, - "learning_rate": 1.998744696936757e-06, - "loss": 0.9707, - "step": 5323 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987433105352323e-06, - "loss": 0.959, - "step": 5324 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987419233690156e-06, - "loss": 0.8125, - "step": 5325 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987405354381077e-06, - "loss": 0.9131, - "step": 5326 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987391467425107e-06, - "loss": 0.9795, - "step": 5327 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987377572822247e-06, - "loss": 1.0371, - "step": 5328 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987363670572513e-06, - "loss": 0.7822, - "step": 5329 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987349760675914e-06, - "loss": 0.8706, - "step": 5330 - }, - { - "epoch": 0.14, - "learning_rate": 1.998733584313246e-06, - "loss": 0.9199, - "step": 5331 - }, - { - "epoch": 0.14, - "learning_rate": 1.998732191794216e-06, - "loss": 1.1055, - "step": 5332 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987307985105027e-06, - "loss": 0.8398, - "step": 5333 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987294044621073e-06, - "loss": 1.0762, - "step": 5334 - }, - { - "epoch": 0.14, - "learning_rate": 1.998728009649031e-06, - "loss": 1.0205, - "step": 5335 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987266140712742e-06, - "loss": 0.8765, - "step": 5336 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987252177288383e-06, - "loss": 0.8394, - "step": 5337 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987238206217243e-06, - "loss": 0.8989, - "step": 5338 - }, - { - "epoch": 0.14, - "learning_rate": 1.998722422749934e-06, - "loss": 0.8579, - "step": 5339 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987210241134673e-06, - "loss": 0.8887, - "step": 5340 - }, - { - "epoch": 0.14, - "learning_rate": 1.998719624712326e-06, - "loss": 0.9131, - "step": 5341 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987182245465112e-06, - "loss": 0.6753, - "step": 5342 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987168236160235e-06, - "loss": 1.0342, - "step": 5343 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987154219208645e-06, - "loss": 1.0459, - "step": 5344 - }, - { - "epoch": 0.14, - "learning_rate": 1.998714019461035e-06, - "loss": 0.8184, - "step": 5345 - }, - { - "epoch": 0.14, - "learning_rate": 1.998712616236536e-06, - "loss": 0.9688, - "step": 5346 - }, - { - "epoch": 0.14, - "learning_rate": 1.998711212247369e-06, - "loss": 1.0986, - "step": 5347 - }, - { - "epoch": 0.14, - "learning_rate": 1.998709807493534e-06, - "loss": 0.9639, - "step": 5348 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987084019750335e-06, - "loss": 0.6875, - "step": 5349 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987069956918676e-06, - "loss": 0.9004, - "step": 5350 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987055886440377e-06, - "loss": 0.6086, - "step": 5351 - }, - { - "epoch": 0.14, - "learning_rate": 1.998704180831545e-06, - "loss": 1.084, - "step": 5352 - }, - { - "epoch": 0.14, - "learning_rate": 1.99870277225439e-06, - "loss": 0.9907, - "step": 5353 - }, - { - "epoch": 0.14, - "learning_rate": 1.9987013629125748e-06, - "loss": 0.8525, - "step": 5354 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986999528060995e-06, - "loss": 0.8813, - "step": 5355 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986985419349657e-06, - "loss": 0.9346, - "step": 5356 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986971302991746e-06, - "loss": 0.9766, - "step": 5357 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986957178987266e-06, - "loss": 0.9443, - "step": 5358 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986943047336234e-06, - "loss": 0.9043, - "step": 5359 - }, - { - "epoch": 0.14, - "learning_rate": 1.998692890803866e-06, - "loss": 0.8301, - "step": 5360 - }, - { - "epoch": 0.14, - "learning_rate": 1.998691476109455e-06, - "loss": 0.9766, - "step": 5361 - }, - { - "epoch": 0.14, - "learning_rate": 1.998690060650392e-06, - "loss": 0.9453, - "step": 5362 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986886444266784e-06, - "loss": 0.9365, - "step": 5363 - }, - { - "epoch": 0.14, - "learning_rate": 1.998687227438314e-06, - "loss": 1.0352, - "step": 5364 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986858096853014e-06, - "loss": 1.0312, - "step": 5365 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986843911676408e-06, - "loss": 0.9023, - "step": 5366 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986829718853334e-06, - "loss": 0.8721, - "step": 5367 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986815518383806e-06, - "loss": 0.9893, - "step": 5368 - }, - { - "epoch": 0.14, - "learning_rate": 1.998680131026783e-06, - "loss": 0.957, - "step": 5369 - }, - { - "epoch": 0.14, - "learning_rate": 1.998678709450542e-06, - "loss": 1.0078, - "step": 5370 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986772871096585e-06, - "loss": 0.9746, - "step": 5371 - }, - { - "epoch": 0.14, - "learning_rate": 1.998675864004134e-06, - "loss": 1.0918, - "step": 5372 - }, - { - "epoch": 0.14, - "learning_rate": 1.998674440133969e-06, - "loss": 0.6768, - "step": 5373 - }, - { - "epoch": 0.14, - "learning_rate": 1.998673015499165e-06, - "loss": 0.877, - "step": 5374 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986715900997234e-06, - "loss": 0.8271, - "step": 5375 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986701639356443e-06, - "loss": 0.9312, - "step": 5376 - }, - { - "epoch": 0.14, - "learning_rate": 1.99866873700693e-06, - "loss": 1.0034, - "step": 5377 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986673093135804e-06, - "loss": 0.7661, - "step": 5378 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986658808555972e-06, - "loss": 0.9971, - "step": 5379 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986644516329817e-06, - "loss": 0.8545, - "step": 5380 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986630216457348e-06, - "loss": 0.8262, - "step": 5381 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986615908938576e-06, - "loss": 1.1045, - "step": 5382 - }, - { - "epoch": 0.14, - "learning_rate": 1.998660159377351e-06, - "loss": 0.958, - "step": 5383 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986587270962157e-06, - "loss": 1.0908, - "step": 5384 - }, - { - "epoch": 0.14, - "learning_rate": 1.998657294050454e-06, - "loss": 0.8262, - "step": 5385 - }, - { - "epoch": 0.14, - "learning_rate": 1.998655860240066e-06, - "loss": 1.001, - "step": 5386 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986544256650536e-06, - "loss": 0.8408, - "step": 5387 - }, - { - "epoch": 0.14, - "learning_rate": 1.998652990325417e-06, - "loss": 0.7534, - "step": 5388 - }, - { - "epoch": 0.14, - "learning_rate": 1.998651554221158e-06, - "loss": 0.957, - "step": 5389 - }, - { - "epoch": 0.14, - "learning_rate": 1.998650117352277e-06, - "loss": 0.8857, - "step": 5390 - }, - { - "epoch": 0.14, - "learning_rate": 1.998648679718776e-06, - "loss": 0.9648, - "step": 5391 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986472413206553e-06, - "loss": 0.6479, - "step": 5392 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986458021579163e-06, - "loss": 1.001, - "step": 5393 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986443622305603e-06, - "loss": 1.0361, - "step": 5394 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986429215385884e-06, - "loss": 0.8916, - "step": 5395 - }, - { - "epoch": 0.14, - "learning_rate": 1.998641480082001e-06, - "loss": 0.9043, - "step": 5396 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986400378608003e-06, - "loss": 0.8037, - "step": 5397 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986385948749866e-06, - "loss": 0.9355, - "step": 5398 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986371511245613e-06, - "loss": 0.9023, - "step": 5399 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986357066095253e-06, - "loss": 1.0752, - "step": 5400 - }, - { - "epoch": 0.14, - "learning_rate": 1.99863426132988e-06, - "loss": 0.8086, - "step": 5401 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986328152856262e-06, - "loss": 0.8662, - "step": 5402 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986313684767653e-06, - "loss": 0.9707, - "step": 5403 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986299209032983e-06, - "loss": 0.7422, - "step": 5404 - }, - { - "epoch": 0.14, - "learning_rate": 1.998628472565226e-06, - "loss": 0.8965, - "step": 5405 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986270234625504e-06, - "loss": 0.699, - "step": 5406 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986255735952716e-06, - "loss": 0.9805, - "step": 5407 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986241229633914e-06, - "loss": 1.0352, - "step": 5408 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986226715669102e-06, - "loss": 1.084, - "step": 5409 - }, - { - "epoch": 0.14, - "learning_rate": 1.99862121940583e-06, - "loss": 1.1396, - "step": 5410 - }, - { - "epoch": 0.14, - "learning_rate": 1.998619766480151e-06, - "loss": 0.6528, - "step": 5411 - }, - { - "epoch": 0.14, - "learning_rate": 1.998618312789875e-06, - "loss": 0.9102, - "step": 5412 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986168583350026e-06, - "loss": 0.7998, - "step": 5413 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986154031155356e-06, - "loss": 0.9316, - "step": 5414 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986139471314744e-06, - "loss": 0.8887, - "step": 5415 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986124903828204e-06, - "loss": 0.875, - "step": 5416 - }, - { - "epoch": 0.14, - "learning_rate": 1.998611032869575e-06, - "loss": 0.8901, - "step": 5417 - }, - { - "epoch": 0.14, - "learning_rate": 1.998609574591739e-06, - "loss": 0.8252, - "step": 5418 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986081155493137e-06, - "loss": 0.96, - "step": 5419 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986066557422998e-06, - "loss": 1.0254, - "step": 5420 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986051951706984e-06, - "loss": 1.0195, - "step": 5421 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986037338345114e-06, - "loss": 0.8428, - "step": 5422 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986022717337394e-06, - "loss": 0.9297, - "step": 5423 - }, - { - "epoch": 0.14, - "learning_rate": 1.9986008088683835e-06, - "loss": 0.7266, - "step": 5424 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985993452384447e-06, - "loss": 0.835, - "step": 5425 - }, - { - "epoch": 0.14, - "learning_rate": 1.998597880843925e-06, - "loss": 1.1396, - "step": 5426 - }, - { - "epoch": 0.14, - "learning_rate": 1.998596415684824e-06, - "loss": 0.8252, - "step": 5427 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985949497611442e-06, - "loss": 0.8721, - "step": 5428 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985934830728855e-06, - "loss": 1.0879, - "step": 5429 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985920156200503e-06, - "loss": 0.7671, - "step": 5430 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985905474026387e-06, - "loss": 0.8169, - "step": 5431 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985890784206524e-06, - "loss": 0.9951, - "step": 5432 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985876086740923e-06, - "loss": 0.9424, - "step": 5433 - }, - { - "epoch": 0.14, - "learning_rate": 1.99858613816296e-06, - "loss": 0.8037, - "step": 5434 - }, - { - "epoch": 0.14, - "learning_rate": 1.998584666887256e-06, - "loss": 0.8408, - "step": 5435 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985831948469813e-06, - "loss": 0.8062, - "step": 5436 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985817220421376e-06, - "loss": 0.7637, - "step": 5437 - }, - { - "epoch": 0.14, - "learning_rate": 1.998580248472726e-06, - "loss": 0.8789, - "step": 5438 - }, - { - "epoch": 0.14, - "learning_rate": 1.998578774138747e-06, - "loss": 0.9609, - "step": 5439 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985772990402024e-06, - "loss": 0.9297, - "step": 5440 - }, - { - "epoch": 0.14, - "learning_rate": 1.998575823177093e-06, - "loss": 1.1426, - "step": 5441 - }, - { - "epoch": 0.14, - "learning_rate": 1.99857434654942e-06, - "loss": 0.917, - "step": 5442 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985728691571847e-06, - "loss": 0.7798, - "step": 5443 - }, - { - "epoch": 0.14, - "learning_rate": 1.998571391000388e-06, - "loss": 0.8818, - "step": 5444 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985699120790306e-06, - "loss": 0.8193, - "step": 5445 - }, - { - "epoch": 0.14, - "learning_rate": 1.998568432393115e-06, - "loss": 0.791, - "step": 5446 - }, - { - "epoch": 0.14, - "learning_rate": 1.998566951942641e-06, - "loss": 0.8403, - "step": 5447 - }, - { - "epoch": 0.14, - "learning_rate": 1.99856547072761e-06, - "loss": 1.165, - "step": 5448 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985639887480233e-06, - "loss": 0.9658, - "step": 5449 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985625060038823e-06, - "loss": 0.7969, - "step": 5450 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985610224951882e-06, - "loss": 0.8955, - "step": 5451 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985595382219415e-06, - "loss": 1.0391, - "step": 5452 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985580531841437e-06, - "loss": 0.9541, - "step": 5453 - }, - { - "epoch": 0.14, - "learning_rate": 1.998556567381796e-06, - "loss": 0.9727, - "step": 5454 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985550808149e-06, - "loss": 0.8975, - "step": 5455 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985535934834554e-06, - "loss": 0.7158, - "step": 5456 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985521053874642e-06, - "loss": 0.8071, - "step": 5457 - }, - { - "epoch": 0.14, - "learning_rate": 1.998550616526928e-06, - "loss": 0.9307, - "step": 5458 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985491269018475e-06, - "loss": 1.166, - "step": 5459 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985476365122237e-06, - "loss": 0.8457, - "step": 5460 - }, - { - "epoch": 0.14, - "learning_rate": 1.998546145358058e-06, - "loss": 1.0645, - "step": 5461 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985446534393514e-06, - "loss": 0.4753, - "step": 5462 - }, - { - "epoch": 0.14, - "learning_rate": 1.998543160756105e-06, - "loss": 0.9912, - "step": 5463 - }, - { - "epoch": 0.14, - "learning_rate": 1.99854166730832e-06, - "loss": 0.9922, - "step": 5464 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985401730959976e-06, - "loss": 0.8828, - "step": 5465 - }, - { - "epoch": 0.14, - "learning_rate": 1.998538678119139e-06, - "loss": 1.0098, - "step": 5466 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985371823777454e-06, - "loss": 0.9883, - "step": 5467 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985356858718173e-06, - "loss": 0.8828, - "step": 5468 - }, - { - "epoch": 0.14, - "learning_rate": 1.998534188601357e-06, - "loss": 1.0322, - "step": 5469 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985326905663646e-06, - "loss": 0.9497, - "step": 5470 - }, - { - "epoch": 0.14, - "learning_rate": 1.998531191766841e-06, - "loss": 1.0654, - "step": 5471 - }, - { - "epoch": 0.14, - "learning_rate": 1.998529692202789e-06, - "loss": 0.9316, - "step": 5472 - }, - { - "epoch": 0.14, - "learning_rate": 1.998528191874208e-06, - "loss": 0.7969, - "step": 5473 - }, - { - "epoch": 0.14, - "learning_rate": 1.998526690781101e-06, - "loss": 0.9639, - "step": 5474 - }, - { - "epoch": 0.14, - "learning_rate": 1.998525188923467e-06, - "loss": 1.1572, - "step": 5475 - }, - { - "epoch": 0.14, - "learning_rate": 1.998523686301308e-06, - "loss": 1.0684, - "step": 5476 - }, - { - "epoch": 0.14, - "learning_rate": 1.998522182914626e-06, - "loss": 1.0635, - "step": 5477 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985206787634213e-06, - "loss": 0.877, - "step": 5478 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985191738476953e-06, - "loss": 0.9668, - "step": 5479 - }, - { - "epoch": 0.14, - "learning_rate": 1.998517668167449e-06, - "loss": 1.0098, - "step": 5480 - }, - { - "epoch": 0.14, - "learning_rate": 1.998516161722683e-06, - "loss": 0.7876, - "step": 5481 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985146545134e-06, - "loss": 0.6973, - "step": 5482 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985131465396e-06, - "loss": 1.0674, - "step": 5483 - }, - { - "epoch": 0.14, - "learning_rate": 1.998511637801284e-06, - "loss": 1.166, - "step": 5484 - }, - { - "epoch": 0.14, - "learning_rate": 1.998510128298454e-06, - "loss": 0.7439, - "step": 5485 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985086180311104e-06, - "loss": 1.0371, - "step": 5486 - }, - { - "epoch": 0.14, - "learning_rate": 1.998507106999255e-06, - "loss": 0.9521, - "step": 5487 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985055952028886e-06, - "loss": 0.8633, - "step": 5488 - }, - { - "epoch": 0.14, - "learning_rate": 1.998504082642012e-06, - "loss": 0.9434, - "step": 5489 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985025693166267e-06, - "loss": 0.8823, - "step": 5490 - }, - { - "epoch": 0.14, - "learning_rate": 1.9985010552267343e-06, - "loss": 0.918, - "step": 5491 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984995403723354e-06, - "loss": 0.918, - "step": 5492 - }, - { - "epoch": 0.14, - "learning_rate": 1.998498024753431e-06, - "loss": 1.0908, - "step": 5493 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984965083700234e-06, - "loss": 0.9575, - "step": 5494 - }, - { - "epoch": 0.14, - "learning_rate": 1.998494991222112e-06, - "loss": 0.8467, - "step": 5495 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984934733096998e-06, - "loss": 0.999, - "step": 5496 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984919546327864e-06, - "loss": 0.8945, - "step": 5497 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984904351913737e-06, - "loss": 1.0918, - "step": 5498 - }, - { - "epoch": 0.14, - "learning_rate": 1.998488914985463e-06, - "loss": 0.9238, - "step": 5499 - }, - { - "epoch": 0.14, - "learning_rate": 1.998487394015055e-06, - "loss": 1.0068, - "step": 5500 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984858722801515e-06, - "loss": 0.8564, - "step": 5501 - }, - { - "epoch": 0.14, - "learning_rate": 1.998484349780753e-06, - "loss": 0.9951, - "step": 5502 - }, - { - "epoch": 0.14, - "learning_rate": 1.998482826516861e-06, - "loss": 0.7705, - "step": 5503 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984813024884764e-06, - "loss": 0.8604, - "step": 5504 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984797776956006e-06, - "loss": 0.8228, - "step": 5505 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984782521382352e-06, - "loss": 0.9932, - "step": 5506 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984767258163807e-06, - "loss": 0.8555, - "step": 5507 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984751987300387e-06, - "loss": 0.9336, - "step": 5508 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984736708792096e-06, - "loss": 0.9326, - "step": 5509 - }, - { - "epoch": 0.14, - "learning_rate": 1.998472142263895e-06, - "loss": 0.8608, - "step": 5510 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984706128840967e-06, - "loss": 0.917, - "step": 5511 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984690827398154e-06, - "loss": 1.0439, - "step": 5512 - }, - { - "epoch": 0.14, - "learning_rate": 1.998467551831052e-06, - "loss": 0.9316, - "step": 5513 - }, - { - "epoch": 0.14, - "learning_rate": 1.998466020157808e-06, - "loss": 0.9375, - "step": 5514 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984644877200843e-06, - "loss": 0.7876, - "step": 5515 - }, - { - "epoch": 0.14, - "learning_rate": 1.998462954517883e-06, - "loss": 1.2334, - "step": 5516 - }, - { - "epoch": 0.14, - "learning_rate": 1.998461420551204e-06, - "loss": 0.8081, - "step": 5517 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984598858200487e-06, - "loss": 0.7246, - "step": 5518 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984583503244186e-06, - "loss": 1.0703, - "step": 5519 - }, - { - "epoch": 0.14, - "learning_rate": 1.998456814064315e-06, - "loss": 1.1152, - "step": 5520 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984552770397393e-06, - "loss": 0.6763, - "step": 5521 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984537392506917e-06, - "loss": 0.9507, - "step": 5522 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984522006971744e-06, - "loss": 0.8491, - "step": 5523 - }, - { - "epoch": 0.14, - "learning_rate": 1.998450661379188e-06, - "loss": 1.0059, - "step": 5524 - }, - { - "epoch": 0.14, - "learning_rate": 1.998449121296734e-06, - "loss": 1.1943, - "step": 5525 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984475804498135e-06, - "loss": 0.9531, - "step": 5526 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984460388384272e-06, - "loss": 0.8242, - "step": 5527 - }, - { - "epoch": 0.14, - "learning_rate": 1.998444496462577e-06, - "loss": 0.8633, - "step": 5528 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984429533222635e-06, - "loss": 0.8447, - "step": 5529 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984414094174885e-06, - "loss": 0.9863, - "step": 5530 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984398647482524e-06, - "loss": 0.626, - "step": 5531 - }, - { - "epoch": 0.14, - "learning_rate": 1.998438319314557e-06, - "loss": 0.9214, - "step": 5532 - }, - { - "epoch": 0.14, - "learning_rate": 1.998436773116403e-06, - "loss": 0.9619, - "step": 5533 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984352261537923e-06, - "loss": 0.9077, - "step": 5534 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984336784267257e-06, - "loss": 0.9272, - "step": 5535 - }, - { - "epoch": 0.14, - "learning_rate": 1.998432129935204e-06, - "loss": 0.9697, - "step": 5536 - }, - { - "epoch": 0.14, - "learning_rate": 1.998430580679229e-06, - "loss": 1.0459, - "step": 5537 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984290306588013e-06, - "loss": 0.9111, - "step": 5538 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984274798739225e-06, - "loss": 0.8916, - "step": 5539 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984259283245943e-06, - "loss": 1.0645, - "step": 5540 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984243760108167e-06, - "loss": 0.8398, - "step": 5541 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984228229325915e-06, - "loss": 0.916, - "step": 5542 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984212690899195e-06, - "loss": 0.9541, - "step": 5543 - }, - { - "epoch": 0.14, - "learning_rate": 1.998419714482803e-06, - "loss": 0.9697, - "step": 5544 - }, - { - "epoch": 0.14, - "learning_rate": 1.998418159111242e-06, - "loss": 0.8975, - "step": 5545 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984166029752382e-06, - "loss": 0.9561, - "step": 5546 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984150460747925e-06, - "loss": 0.9531, - "step": 5547 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984134884099064e-06, - "loss": 0.7285, - "step": 5548 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984119299805814e-06, - "loss": 0.8232, - "step": 5549 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984103707868177e-06, - "loss": 0.9297, - "step": 5550 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984088108286174e-06, - "loss": 0.9902, - "step": 5551 - }, - { - "epoch": 0.14, - "learning_rate": 1.9984072501059812e-06, - "loss": 1.1172, - "step": 5552 - }, - { - "epoch": 0.14, - "learning_rate": 1.998405688618911e-06, - "loss": 0.9609, - "step": 5553 - }, - { - "epoch": 0.14, - "learning_rate": 1.998404126367407e-06, - "loss": 0.8799, - "step": 5554 - }, - { - "epoch": 0.14, - "learning_rate": 1.998402563351471e-06, - "loss": 1.0371, - "step": 5555 - }, - { - "epoch": 0.14, - "learning_rate": 1.998400999571104e-06, - "loss": 1.0469, - "step": 5556 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983994350263075e-06, - "loss": 0.8721, - "step": 5557 - }, - { - "epoch": 0.14, - "learning_rate": 1.998397869717082e-06, - "loss": 0.7549, - "step": 5558 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983963036434296e-06, - "loss": 1.0674, - "step": 5559 - }, - { - "epoch": 0.14, - "learning_rate": 1.998394736805351e-06, - "loss": 0.7539, - "step": 5560 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983931692028473e-06, - "loss": 1.0107, - "step": 5561 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983916008359197e-06, - "loss": 0.6118, - "step": 5562 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983900317045698e-06, - "loss": 0.7656, - "step": 5563 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983884618087985e-06, - "loss": 1.0869, - "step": 5564 - }, - { - "epoch": 0.14, - "learning_rate": 1.998386891148607e-06, - "loss": 0.9062, - "step": 5565 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983853197239968e-06, - "loss": 0.8682, - "step": 5566 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983837475349685e-06, - "loss": 1.0068, - "step": 5567 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983821745815243e-06, - "loss": 0.7998, - "step": 5568 - }, - { - "epoch": 0.14, - "learning_rate": 1.998380600863664e-06, - "loss": 0.9658, - "step": 5569 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983790263813903e-06, - "loss": 0.9502, - "step": 5570 - }, - { - "epoch": 0.14, - "learning_rate": 1.998377451134703e-06, - "loss": 1.1582, - "step": 5571 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983758751236046e-06, - "loss": 0.686, - "step": 5572 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983742983480953e-06, - "loss": 1.0137, - "step": 5573 - }, - { - "epoch": 0.14, - "learning_rate": 1.998372720808177e-06, - "loss": 0.6724, - "step": 5574 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983711425038503e-06, - "loss": 0.8145, - "step": 5575 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983695634351166e-06, - "loss": 0.7446, - "step": 5576 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983679836019776e-06, - "loss": 1.0244, - "step": 5577 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983664030044342e-06, - "loss": 1.0752, - "step": 5578 - }, - { - "epoch": 0.14, - "learning_rate": 1.998364821642487e-06, - "loss": 0.7764, - "step": 5579 - }, - { - "epoch": 0.14, - "learning_rate": 1.998363239516138e-06, - "loss": 0.8948, - "step": 5580 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983616566253886e-06, - "loss": 0.6699, - "step": 5581 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983600729702396e-06, - "loss": 0.6992, - "step": 5582 - }, - { - "epoch": 0.14, - "learning_rate": 1.998358488550692e-06, - "loss": 1.0996, - "step": 5583 - }, - { - "epoch": 0.14, - "learning_rate": 1.998356903366747e-06, - "loss": 0.7119, - "step": 5584 - }, - { - "epoch": 0.14, - "learning_rate": 1.998355317418406e-06, - "loss": 0.9736, - "step": 5585 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983537307056702e-06, - "loss": 0.8557, - "step": 5586 - }, - { - "epoch": 0.14, - "learning_rate": 1.998352143228541e-06, - "loss": 0.9141, - "step": 5587 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983505549870197e-06, - "loss": 1.0527, - "step": 5588 - }, - { - "epoch": 0.14, - "learning_rate": 1.998348965981107e-06, - "loss": 0.8164, - "step": 5589 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983473762108044e-06, - "loss": 0.8193, - "step": 5590 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983457856761135e-06, - "loss": 0.9102, - "step": 5591 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983441943770347e-06, - "loss": 0.7759, - "step": 5592 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983426023135696e-06, - "loss": 0.9277, - "step": 5593 - }, - { - "epoch": 0.14, - "learning_rate": 1.99834100948572e-06, - "loss": 1.0654, - "step": 5594 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983394158934863e-06, - "loss": 0.8208, - "step": 5595 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983378215368697e-06, - "loss": 0.915, - "step": 5596 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983362264158723e-06, - "loss": 0.9414, - "step": 5597 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983346305304942e-06, - "loss": 1.1396, - "step": 5598 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983330338807375e-06, - "loss": 0.8125, - "step": 5599 - }, - { - "epoch": 0.14, - "learning_rate": 1.998331436466603e-06, - "loss": 0.7285, - "step": 5600 - }, - { - "epoch": 0.14, - "learning_rate": 1.998329838288092e-06, - "loss": 0.9951, - "step": 5601 - }, - { - "epoch": 0.14, - "learning_rate": 1.998328239345206e-06, - "loss": 0.9697, - "step": 5602 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983266396379456e-06, - "loss": 0.8652, - "step": 5603 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983250391663127e-06, - "loss": 0.7734, - "step": 5604 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983234379303083e-06, - "loss": 0.918, - "step": 5605 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983218359299334e-06, - "loss": 1.0449, - "step": 5606 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983202331651892e-06, - "loss": 0.9121, - "step": 5607 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983186296360774e-06, - "loss": 0.8613, - "step": 5608 - }, - { - "epoch": 0.14, - "learning_rate": 1.998317025342599e-06, - "loss": 0.7646, - "step": 5609 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983154202847547e-06, - "loss": 0.8799, - "step": 5610 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983138144625464e-06, - "loss": 0.9004, - "step": 5611 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983122078759747e-06, - "loss": 0.9292, - "step": 5612 - }, - { - "epoch": 0.14, - "learning_rate": 1.998310600525042e-06, - "loss": 1.0225, - "step": 5613 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983089924097484e-06, - "loss": 1.0674, - "step": 5614 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983073835300954e-06, - "loss": 1.0449, - "step": 5615 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983057738860846e-06, - "loss": 1.0361, - "step": 5616 - }, - { - "epoch": 0.14, - "learning_rate": 1.998304163477717e-06, - "loss": 0.9658, - "step": 5617 - }, - { - "epoch": 0.14, - "learning_rate": 1.9983025523049936e-06, - "loss": 0.8838, - "step": 5618 - }, - { - "epoch": 0.14, - "learning_rate": 1.998300940367916e-06, - "loss": 0.8496, - "step": 5619 - }, - { - "epoch": 0.14, - "learning_rate": 1.998299327666485e-06, - "loss": 0.8604, - "step": 5620 - }, - { - "epoch": 0.14, - "learning_rate": 1.9982977142007023e-06, - "loss": 0.769, - "step": 5621 - }, - { - "epoch": 0.14, - "learning_rate": 1.998296099970569e-06, - "loss": 1.0312, - "step": 5622 - }, - { - "epoch": 0.14, - "learning_rate": 1.9982944849760864e-06, - "loss": 0.8682, - "step": 5623 - }, - { - "epoch": 0.14, - "learning_rate": 1.9982928692172553e-06, - "loss": 1.0703, - "step": 5624 - }, - { - "epoch": 0.14, - "learning_rate": 1.9982912526940775e-06, - "loss": 0.8555, - "step": 5625 - }, - { - "epoch": 0.14, - "learning_rate": 1.9982896354065536e-06, - "loss": 0.6973, - "step": 5626 - }, - { - "epoch": 0.14, - "learning_rate": 1.9982880173546858e-06, - "loss": 1.002, - "step": 5627 - }, - { - "epoch": 0.14, - "learning_rate": 1.9982863985384745e-06, - "loss": 0.9424, - "step": 5628 - }, - { - "epoch": 0.14, - "learning_rate": 1.998284778957921e-06, - "loss": 0.9043, - "step": 5629 - }, - { - "epoch": 0.14, - "learning_rate": 1.998283158613027e-06, - "loss": 0.6655, - "step": 5630 - }, - { - "epoch": 0.14, - "learning_rate": 1.9982815375037934e-06, - "loss": 0.749, - "step": 5631 - }, - { - "epoch": 0.14, - "learning_rate": 1.9982799156302214e-06, - "loss": 1.082, - "step": 5632 - }, - { - "epoch": 0.14, - "learning_rate": 1.9982782929923127e-06, - "loss": 1.1934, - "step": 5633 - }, - { - "epoch": 0.14, - "learning_rate": 1.998276669590068e-06, - "loss": 0.7783, - "step": 5634 - }, - { - "epoch": 0.14, - "learning_rate": 1.9982750454234885e-06, - "loss": 1.043, - "step": 5635 - }, - { - "epoch": 0.14, - "learning_rate": 1.998273420492576e-06, - "loss": 0.9629, - "step": 5636 - }, - { - "epoch": 0.14, - "learning_rate": 1.9982717947973316e-06, - "loss": 0.9248, - "step": 5637 - }, - { - "epoch": 0.14, - "learning_rate": 1.9982701683377563e-06, - "loss": 1.0654, - "step": 5638 - }, - { - "epoch": 0.14, - "learning_rate": 1.9982685411138515e-06, - "loss": 0.7686, - "step": 5639 - }, - { - "epoch": 0.14, - "learning_rate": 1.998266913125618e-06, - "loss": 0.9639, - "step": 5640 - }, - { - "epoch": 0.14, - "learning_rate": 1.9982652843730577e-06, - "loss": 0.9844, - "step": 5641 - }, - { - "epoch": 0.14, - "learning_rate": 1.9982636548561717e-06, - "loss": 1.1621, - "step": 5642 - }, - { - "epoch": 0.14, - "learning_rate": 1.9982620245749608e-06, - "loss": 0.8892, - "step": 5643 - }, - { - "epoch": 0.14, - "learning_rate": 1.9982603935294267e-06, - "loss": 1.1348, - "step": 5644 - }, - { - "epoch": 0.14, - "learning_rate": 1.9982587617195704e-06, - "loss": 0.7651, - "step": 5645 - }, - { - "epoch": 0.14, - "learning_rate": 1.9982571291453934e-06, - "loss": 0.8701, - "step": 5646 - }, - { - "epoch": 0.14, - "learning_rate": 1.9982554958068967e-06, - "loss": 0.9258, - "step": 5647 - }, - { - "epoch": 0.14, - "learning_rate": 1.998253861704082e-06, - "loss": 0.9941, - "step": 5648 - }, - { - "epoch": 0.14, - "learning_rate": 1.99825222683695e-06, - "loss": 1.0898, - "step": 5649 - }, - { - "epoch": 0.14, - "learning_rate": 1.998250591205502e-06, - "loss": 1.001, - "step": 5650 - }, - { - "epoch": 0.14, - "learning_rate": 1.99824895480974e-06, - "loss": 0.9238, - "step": 5651 - }, - { - "epoch": 0.14, - "learning_rate": 1.998247317649664e-06, - "loss": 0.814, - "step": 5652 - }, - { - "epoch": 0.14, - "learning_rate": 1.998245679725276e-06, - "loss": 1.0332, - "step": 5653 - }, - { - "epoch": 0.14, - "learning_rate": 1.9982440410365776e-06, - "loss": 0.8652, - "step": 5654 - }, - { - "epoch": 0.14, - "learning_rate": 1.9982424015835694e-06, - "loss": 0.8906, - "step": 5655 - }, - { - "epoch": 0.14, - "learning_rate": 1.998240761366253e-06, - "loss": 0.8398, - "step": 5656 - }, - { - "epoch": 0.14, - "learning_rate": 1.9982391203846294e-06, - "loss": 0.9912, - "step": 5657 - }, - { - "epoch": 0.15, - "learning_rate": 1.9982374786387e-06, - "loss": 0.8174, - "step": 5658 - }, - { - "epoch": 0.15, - "learning_rate": 1.9982358361284663e-06, - "loss": 1.0352, - "step": 5659 - }, - { - "epoch": 0.15, - "learning_rate": 1.998234192853929e-06, - "loss": 0.9736, - "step": 5660 - }, - { - "epoch": 0.15, - "learning_rate": 1.99823254881509e-06, - "loss": 0.918, - "step": 5661 - }, - { - "epoch": 0.15, - "learning_rate": 1.99823090401195e-06, - "loss": 0.9609, - "step": 5662 - }, - { - "epoch": 0.15, - "learning_rate": 1.9982292584445104e-06, - "loss": 0.9065, - "step": 5663 - }, - { - "epoch": 0.15, - "learning_rate": 1.9982276121127727e-06, - "loss": 0.7937, - "step": 5664 - }, - { - "epoch": 0.15, - "learning_rate": 1.998225965016738e-06, - "loss": 1.0566, - "step": 5665 - }, - { - "epoch": 0.15, - "learning_rate": 1.998224317156408e-06, - "loss": 0.8208, - "step": 5666 - }, - { - "epoch": 0.15, - "learning_rate": 1.998222668531783e-06, - "loss": 0.7832, - "step": 5667 - }, - { - "epoch": 0.15, - "learning_rate": 1.998221019142865e-06, - "loss": 0.8389, - "step": 5668 - }, - { - "epoch": 0.15, - "learning_rate": 1.998219368989655e-06, - "loss": 0.9092, - "step": 5669 - }, - { - "epoch": 0.15, - "learning_rate": 1.9982177180721544e-06, - "loss": 0.8916, - "step": 5670 - }, - { - "epoch": 0.15, - "learning_rate": 1.9982160663903643e-06, - "loss": 1.0381, - "step": 5671 - }, - { - "epoch": 0.15, - "learning_rate": 1.998214413944286e-06, - "loss": 1.1406, - "step": 5672 - }, - { - "epoch": 0.15, - "learning_rate": 1.9982127607339213e-06, - "loss": 0.7715, - "step": 5673 - }, - { - "epoch": 0.15, - "learning_rate": 1.99821110675927e-06, - "loss": 1.082, - "step": 5674 - }, - { - "epoch": 0.15, - "learning_rate": 1.9982094520203353e-06, - "loss": 0.9482, - "step": 5675 - }, - { - "epoch": 0.15, - "learning_rate": 1.9982077965171175e-06, - "loss": 0.9092, - "step": 5676 - }, - { - "epoch": 0.15, - "learning_rate": 1.9982061402496172e-06, - "loss": 0.9675, - "step": 5677 - }, - { - "epoch": 0.15, - "learning_rate": 1.998204483217837e-06, - "loss": 1.1006, - "step": 5678 - }, - { - "epoch": 0.15, - "learning_rate": 1.9982028254217773e-06, - "loss": 0.7075, - "step": 5679 - }, - { - "epoch": 0.15, - "learning_rate": 1.9982011668614393e-06, - "loss": 0.8594, - "step": 5680 - }, - { - "epoch": 0.15, - "learning_rate": 1.998199507536825e-06, - "loss": 0.8931, - "step": 5681 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981978474479353e-06, - "loss": 0.835, - "step": 5682 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981961865947706e-06, - "loss": 0.9268, - "step": 5683 - }, - { - "epoch": 0.15, - "learning_rate": 1.998194524977334e-06, - "loss": 0.9727, - "step": 5684 - }, - { - "epoch": 0.15, - "learning_rate": 1.998192862595625e-06, - "loss": 0.875, - "step": 5685 - }, - { - "epoch": 0.15, - "learning_rate": 1.998191199449646e-06, - "loss": 0.9863, - "step": 5686 - }, - { - "epoch": 0.15, - "learning_rate": 1.998189535539398e-06, - "loss": 0.959, - "step": 5687 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981878708648817e-06, - "loss": 1.0586, - "step": 5688 - }, - { - "epoch": 0.15, - "learning_rate": 1.998186205426099e-06, - "loss": 1.0186, - "step": 5689 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981845392230514e-06, - "loss": 0.8906, - "step": 5690 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981828722557395e-06, - "loss": 0.9004, - "step": 5691 - }, - { - "epoch": 0.15, - "learning_rate": 1.998181204524165e-06, - "loss": 0.8311, - "step": 5692 - }, - { - "epoch": 0.15, - "learning_rate": 1.998179536028329e-06, - "loss": 0.8716, - "step": 5693 - }, - { - "epoch": 0.15, - "learning_rate": 1.998177866768233e-06, - "loss": 0.8711, - "step": 5694 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981761967438773e-06, - "loss": 0.9189, - "step": 5695 - }, - { - "epoch": 0.15, - "learning_rate": 1.998174525955265e-06, - "loss": 1.0, - "step": 5696 - }, - { - "epoch": 0.15, - "learning_rate": 1.998172854402396e-06, - "loss": 1.0029, - "step": 5697 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981711820852717e-06, - "loss": 0.9834, - "step": 5698 - }, - { - "epoch": 0.15, - "learning_rate": 1.998169509003894e-06, - "loss": 1.0547, - "step": 5699 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981678351582635e-06, - "loss": 0.9883, - "step": 5700 - }, - { - "epoch": 0.15, - "learning_rate": 1.998166160548382e-06, - "loss": 1.0166, - "step": 5701 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981644851742504e-06, - "loss": 0.7046, - "step": 5702 - }, - { - "epoch": 0.15, - "learning_rate": 1.99816280903587e-06, - "loss": 0.8657, - "step": 5703 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981611321332428e-06, - "loss": 1.1777, - "step": 5704 - }, - { - "epoch": 0.15, - "learning_rate": 1.998159454466369e-06, - "loss": 0.9902, - "step": 5705 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981577760352505e-06, - "loss": 0.9043, - "step": 5706 - }, - { - "epoch": 0.15, - "learning_rate": 1.998156096839889e-06, - "loss": 0.9639, - "step": 5707 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981544168802845e-06, - "loss": 0.9302, - "step": 5708 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981527361564396e-06, - "loss": 0.9004, - "step": 5709 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981510546683546e-06, - "loss": 0.793, - "step": 5710 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981493724160316e-06, - "loss": 0.8105, - "step": 5711 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981476893994714e-06, - "loss": 0.9912, - "step": 5712 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981460056186753e-06, - "loss": 0.9531, - "step": 5713 - }, - { - "epoch": 0.15, - "learning_rate": 1.998144321073645e-06, - "loss": 0.7188, - "step": 5714 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981426357643813e-06, - "loss": 0.999, - "step": 5715 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981409496908856e-06, - "loss": 1.0771, - "step": 5716 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981392628531594e-06, - "loss": 0.9629, - "step": 5717 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981375752512037e-06, - "loss": 0.9766, - "step": 5718 - }, - { - "epoch": 0.15, - "learning_rate": 1.99813588688502e-06, - "loss": 0.9941, - "step": 5719 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981341977546096e-06, - "loss": 0.9932, - "step": 5720 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981325078599738e-06, - "loss": 0.916, - "step": 5721 - }, - { - "epoch": 0.15, - "learning_rate": 1.998130817201114e-06, - "loss": 1.0947, - "step": 5722 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981291257780307e-06, - "loss": 0.8359, - "step": 5723 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981274335907266e-06, - "loss": 0.7358, - "step": 5724 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981257406392017e-06, - "loss": 1.042, - "step": 5725 - }, - { - "epoch": 0.15, - "learning_rate": 1.998124046923458e-06, - "loss": 1.0703, - "step": 5726 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981223524434965e-06, - "loss": 1.0811, - "step": 5727 - }, - { - "epoch": 0.15, - "learning_rate": 1.998120657199319e-06, - "loss": 0.7292, - "step": 5728 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981189611909255e-06, - "loss": 0.5605, - "step": 5729 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981172644183194e-06, - "loss": 0.9463, - "step": 5730 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981155668815e-06, - "loss": 0.9688, - "step": 5731 - }, - { - "epoch": 0.15, - "learning_rate": 1.99811386858047e-06, - "loss": 0.8096, - "step": 5732 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981121695152294e-06, - "loss": 1.0918, - "step": 5733 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981104696857805e-06, - "loss": 0.7705, - "step": 5734 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981087690921245e-06, - "loss": 1.0625, - "step": 5735 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981070677342623e-06, - "loss": 1.0537, - "step": 5736 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981053656121955e-06, - "loss": 1.0029, - "step": 5737 - }, - { - "epoch": 0.15, - "learning_rate": 1.998103662725925e-06, - "loss": 1.083, - "step": 5738 - }, - { - "epoch": 0.15, - "learning_rate": 1.998101959075453e-06, - "loss": 0.8877, - "step": 5739 - }, - { - "epoch": 0.15, - "learning_rate": 1.9981002546607796e-06, - "loss": 0.6938, - "step": 5740 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980985494819072e-06, - "loss": 0.8203, - "step": 5741 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980968435388363e-06, - "loss": 0.8184, - "step": 5742 - }, - { - "epoch": 0.15, - "learning_rate": 1.998095136831569e-06, - "loss": 0.7871, - "step": 5743 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980934293601056e-06, - "loss": 0.9902, - "step": 5744 - }, - { - "epoch": 0.15, - "learning_rate": 1.998091721124448e-06, - "loss": 0.9121, - "step": 5745 - }, - { - "epoch": 0.15, - "learning_rate": 1.998090012124598e-06, - "loss": 0.9688, - "step": 5746 - }, - { - "epoch": 0.15, - "learning_rate": 1.998088302360556e-06, - "loss": 0.9014, - "step": 5747 - }, - { - "epoch": 0.15, - "learning_rate": 1.998086591832324e-06, - "loss": 0.8398, - "step": 5748 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980848805399024e-06, - "loss": 0.8623, - "step": 5749 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980831684832936e-06, - "loss": 0.9814, - "step": 5750 - }, - { - "epoch": 0.15, - "learning_rate": 1.998081455662498e-06, - "loss": 0.7002, - "step": 5751 - }, - { - "epoch": 0.15, - "learning_rate": 1.998079742077518e-06, - "loss": 1.1357, - "step": 5752 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980780277283535e-06, - "loss": 0.8818, - "step": 5753 - }, - { - "epoch": 0.15, - "learning_rate": 1.998076312615007e-06, - "loss": 0.8652, - "step": 5754 - }, - { - "epoch": 0.15, - "learning_rate": 1.998074596737479e-06, - "loss": 0.7339, - "step": 5755 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980728800957713e-06, - "loss": 0.999, - "step": 5756 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980711626898852e-06, - "loss": 0.9707, - "step": 5757 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980694445198217e-06, - "loss": 1.145, - "step": 5758 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980677255855828e-06, - "loss": 1.0674, - "step": 5759 - }, - { - "epoch": 0.15, - "learning_rate": 1.998066005887169e-06, - "loss": 0.9795, - "step": 5760 - }, - { - "epoch": 0.15, - "learning_rate": 1.998064285424582e-06, - "loss": 0.9717, - "step": 5761 - }, - { - "epoch": 0.15, - "learning_rate": 1.998062564197823e-06, - "loss": 1.125, - "step": 5762 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980608422068933e-06, - "loss": 0.9326, - "step": 5763 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980591194517947e-06, - "loss": 0.8506, - "step": 5764 - }, - { - "epoch": 0.15, - "learning_rate": 1.998057395932528e-06, - "loss": 0.8726, - "step": 5765 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980556716490943e-06, - "loss": 0.6884, - "step": 5766 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980539466014955e-06, - "loss": 0.657, - "step": 5767 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980522207897327e-06, - "loss": 0.9351, - "step": 5768 - }, - { - "epoch": 0.15, - "learning_rate": 1.998050494213807e-06, - "loss": 0.6743, - "step": 5769 - }, - { - "epoch": 0.15, - "learning_rate": 1.99804876687372e-06, - "loss": 1.0264, - "step": 5770 - }, - { - "epoch": 0.15, - "learning_rate": 1.998047038769473e-06, - "loss": 0.843, - "step": 5771 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980453099010674e-06, - "loss": 0.9971, - "step": 5772 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980435802685042e-06, - "loss": 0.9609, - "step": 5773 - }, - { - "epoch": 0.15, - "learning_rate": 1.998041849871785e-06, - "loss": 1.0547, - "step": 5774 - }, - { - "epoch": 0.15, - "learning_rate": 1.998040118710911e-06, - "loss": 1.0732, - "step": 5775 - }, - { - "epoch": 0.15, - "learning_rate": 1.998038386785884e-06, - "loss": 0.7661, - "step": 5776 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980366540967044e-06, - "loss": 0.9004, - "step": 5777 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980349206433743e-06, - "loss": 0.8403, - "step": 5778 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980331864258946e-06, - "loss": 0.8955, - "step": 5779 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980314514442667e-06, - "loss": 1.2197, - "step": 5780 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980297156984923e-06, - "loss": 0.9902, - "step": 5781 - }, - { - "epoch": 0.15, - "learning_rate": 1.998027979188572e-06, - "loss": 0.9453, - "step": 5782 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980262419145076e-06, - "loss": 0.8555, - "step": 5783 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980245038763007e-06, - "loss": 0.9766, - "step": 5784 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980227650739524e-06, - "loss": 0.8027, - "step": 5785 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980210255074635e-06, - "loss": 0.9697, - "step": 5786 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980192851768365e-06, - "loss": 1.1484, - "step": 5787 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980175440820714e-06, - "loss": 0.8652, - "step": 5788 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980158022231704e-06, - "loss": 1.0176, - "step": 5789 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980140596001343e-06, - "loss": 0.9639, - "step": 5790 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980123162129652e-06, - "loss": 1.0664, - "step": 5791 - }, - { - "epoch": 0.15, - "learning_rate": 1.998010572061664e-06, - "loss": 0.9658, - "step": 5792 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980088271462315e-06, - "loss": 0.8262, - "step": 5793 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980070814666698e-06, - "loss": 0.832, - "step": 5794 - }, - { - "epoch": 0.15, - "learning_rate": 1.99800533502298e-06, - "loss": 0.9404, - "step": 5795 - }, - { - "epoch": 0.15, - "learning_rate": 1.9980035878151635e-06, - "loss": 0.957, - "step": 5796 - }, - { - "epoch": 0.15, - "learning_rate": 1.998001839843221e-06, - "loss": 0.96, - "step": 5797 - }, - { - "epoch": 0.15, - "learning_rate": 1.998000091107155e-06, - "loss": 1.0234, - "step": 5798 - }, - { - "epoch": 0.15, - "learning_rate": 1.997998341606966e-06, - "loss": 0.8574, - "step": 5799 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979965913426555e-06, - "loss": 0.7944, - "step": 5800 - }, - { - "epoch": 0.15, - "learning_rate": 1.997994840314225e-06, - "loss": 0.8198, - "step": 5801 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979930885216754e-06, - "loss": 0.9746, - "step": 5802 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979913359650087e-06, - "loss": 1.1738, - "step": 5803 - }, - { - "epoch": 0.15, - "learning_rate": 1.997989582644226e-06, - "loss": 1.0107, - "step": 5804 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979878285593285e-06, - "loss": 0.8584, - "step": 5805 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979860737103175e-06, - "loss": 0.8906, - "step": 5806 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979843180971943e-06, - "loss": 0.938, - "step": 5807 - }, - { - "epoch": 0.15, - "learning_rate": 1.997982561719961e-06, - "loss": 0.998, - "step": 5808 - }, - { - "epoch": 0.15, - "learning_rate": 1.997980804578618e-06, - "loss": 0.9404, - "step": 5809 - }, - { - "epoch": 0.15, - "learning_rate": 1.997979046673167e-06, - "loss": 1.0811, - "step": 5810 - }, - { - "epoch": 0.15, - "learning_rate": 1.997977288003609e-06, - "loss": 0.7686, - "step": 5811 - }, - { - "epoch": 0.15, - "learning_rate": 1.997975528569946e-06, - "loss": 0.9199, - "step": 5812 - }, - { - "epoch": 0.15, - "learning_rate": 1.997973768372179e-06, - "loss": 0.8555, - "step": 5813 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979720074103095e-06, - "loss": 1.0078, - "step": 5814 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979702456843384e-06, - "loss": 1.3057, - "step": 5815 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979684831942673e-06, - "loss": 0.8164, - "step": 5816 - }, - { - "epoch": 0.15, - "learning_rate": 1.997966719940098e-06, - "loss": 0.7744, - "step": 5817 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979649559218313e-06, - "loss": 1.1133, - "step": 5818 - }, - { - "epoch": 0.15, - "learning_rate": 1.997963191139469e-06, - "loss": 0.8906, - "step": 5819 - }, - { - "epoch": 0.15, - "learning_rate": 1.997961425593012e-06, - "loss": 0.6958, - "step": 5820 - }, - { - "epoch": 0.15, - "learning_rate": 1.997959659282462e-06, - "loss": 0.8047, - "step": 5821 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979578922078194e-06, - "loss": 0.7695, - "step": 5822 - }, - { - "epoch": 0.15, - "learning_rate": 1.997956124369087e-06, - "loss": 1.0596, - "step": 5823 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979543557662653e-06, - "loss": 0.9346, - "step": 5824 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979525863993556e-06, - "loss": 0.8818, - "step": 5825 - }, - { - "epoch": 0.15, - "learning_rate": 1.99795081626836e-06, - "loss": 1.041, - "step": 5826 - }, - { - "epoch": 0.15, - "learning_rate": 1.997949045373279e-06, - "loss": 0.9365, - "step": 5827 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979472737141147e-06, - "loss": 0.9507, - "step": 5828 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979455012908675e-06, - "loss": 0.9238, - "step": 5829 - }, - { - "epoch": 0.15, - "learning_rate": 1.99794372810354e-06, - "loss": 0.8428, - "step": 5830 - }, - { - "epoch": 0.15, - "learning_rate": 1.997941954152132e-06, - "loss": 0.752, - "step": 5831 - }, - { - "epoch": 0.15, - "learning_rate": 1.997940179436646e-06, - "loss": 0.8003, - "step": 5832 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979384039570837e-06, - "loss": 0.9834, - "step": 5833 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979366277134452e-06, - "loss": 0.792, - "step": 5834 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979348507057326e-06, - "loss": 0.9385, - "step": 5835 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979330729339475e-06, - "loss": 1.0068, - "step": 5836 - }, - { - "epoch": 0.15, - "learning_rate": 1.997931294398091e-06, - "loss": 0.9053, - "step": 5837 - }, - { - "epoch": 0.15, - "learning_rate": 1.997929515098164e-06, - "loss": 0.4937, - "step": 5838 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979277350341683e-06, - "loss": 0.8457, - "step": 5839 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979259542061054e-06, - "loss": 0.854, - "step": 5840 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979241726139765e-06, - "loss": 0.7764, - "step": 5841 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979223902577827e-06, - "loss": 0.9517, - "step": 5842 - }, - { - "epoch": 0.15, - "learning_rate": 1.997920607137526e-06, - "loss": 0.752, - "step": 5843 - }, - { - "epoch": 0.15, - "learning_rate": 1.997918823253207e-06, - "loss": 0.9385, - "step": 5844 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979170386048274e-06, - "loss": 1.2168, - "step": 5845 - }, - { - "epoch": 0.15, - "learning_rate": 1.997915253192389e-06, - "loss": 0.9678, - "step": 5846 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979134670158927e-06, - "loss": 1.0557, - "step": 5847 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979116800753397e-06, - "loss": 0.855, - "step": 5848 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979098923707318e-06, - "loss": 1.1055, - "step": 5849 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979081039020696e-06, - "loss": 1.1562, - "step": 5850 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979063146693557e-06, - "loss": 0.9775, - "step": 5851 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979045246725906e-06, - "loss": 0.9141, - "step": 5852 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979027339117764e-06, - "loss": 0.9473, - "step": 5853 - }, - { - "epoch": 0.15, - "learning_rate": 1.9979009423869134e-06, - "loss": 0.8447, - "step": 5854 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978991500980035e-06, - "loss": 0.8174, - "step": 5855 - }, - { - "epoch": 0.15, - "learning_rate": 1.997897357045048e-06, - "loss": 0.7744, - "step": 5856 - }, - { - "epoch": 0.15, - "learning_rate": 1.997895563228049e-06, - "loss": 1.0127, - "step": 5857 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978937686470068e-06, - "loss": 0.8984, - "step": 5858 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978919733019236e-06, - "loss": 1.042, - "step": 5859 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978901771927997e-06, - "loss": 1.001, - "step": 5860 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978883803196378e-06, - "loss": 0.9902, - "step": 5861 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978865826824386e-06, - "loss": 1.0078, - "step": 5862 - }, - { - "epoch": 0.15, - "learning_rate": 1.997884784281203e-06, - "loss": 0.9844, - "step": 5863 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978829851159334e-06, - "loss": 0.9707, - "step": 5864 - }, - { - "epoch": 0.15, - "learning_rate": 1.997881185186631e-06, - "loss": 1.0605, - "step": 5865 - }, - { - "epoch": 0.15, - "learning_rate": 1.997879384493296e-06, - "loss": 1.001, - "step": 5866 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978775830359308e-06, - "loss": 0.9121, - "step": 5867 - }, - { - "epoch": 0.15, - "learning_rate": 1.997875780814537e-06, - "loss": 0.8418, - "step": 5868 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978739778291156e-06, - "loss": 0.9551, - "step": 5869 - }, - { - "epoch": 0.15, - "learning_rate": 1.997872174079668e-06, - "loss": 0.9023, - "step": 5870 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978703695661953e-06, - "loss": 0.8081, - "step": 5871 - }, - { - "epoch": 0.15, - "learning_rate": 1.997868564288699e-06, - "loss": 1.0547, - "step": 5872 - }, - { - "epoch": 0.15, - "learning_rate": 1.997866758247181e-06, - "loss": 0.8564, - "step": 5873 - }, - { - "epoch": 0.15, - "learning_rate": 1.997864951441642e-06, - "loss": 0.8228, - "step": 5874 - }, - { - "epoch": 0.15, - "learning_rate": 1.997863143872084e-06, - "loss": 0.8438, - "step": 5875 - }, - { - "epoch": 0.15, - "learning_rate": 1.997861335538508e-06, - "loss": 0.8701, - "step": 5876 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978595264409157e-06, - "loss": 1.123, - "step": 5877 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978577165793077e-06, - "loss": 1.1562, - "step": 5878 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978559059536862e-06, - "loss": 0.8613, - "step": 5879 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978540945640525e-06, - "loss": 0.9834, - "step": 5880 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978522824104072e-06, - "loss": 1.0273, - "step": 5881 - }, - { - "epoch": 0.15, - "learning_rate": 1.997850469492753e-06, - "loss": 0.9648, - "step": 5882 - }, - { - "epoch": 0.15, - "learning_rate": 1.99784865581109e-06, - "loss": 1.0996, - "step": 5883 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978468413654207e-06, - "loss": 1.1465, - "step": 5884 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978450261557455e-06, - "loss": 0.981, - "step": 5885 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978432101820663e-06, - "loss": 0.9346, - "step": 5886 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978413934443847e-06, - "loss": 0.9648, - "step": 5887 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978395759427018e-06, - "loss": 1.2129, - "step": 5888 - }, - { - "epoch": 0.15, - "learning_rate": 1.997837757677019e-06, - "loss": 1.0273, - "step": 5889 - }, - { - "epoch": 0.15, - "learning_rate": 1.997835938647337e-06, - "loss": 0.9297, - "step": 5890 - }, - { - "epoch": 0.15, - "learning_rate": 1.997834118853659e-06, - "loss": 1.1816, - "step": 5891 - }, - { - "epoch": 0.15, - "learning_rate": 1.997832298295985e-06, - "loss": 0.9365, - "step": 5892 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978304769743163e-06, - "loss": 0.8877, - "step": 5893 - }, - { - "epoch": 0.15, - "learning_rate": 1.997828654888655e-06, - "loss": 1.0811, - "step": 5894 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978268320390017e-06, - "loss": 0.9639, - "step": 5895 - }, - { - "epoch": 0.15, - "learning_rate": 1.997825008425359e-06, - "loss": 0.9375, - "step": 5896 - }, - { - "epoch": 0.15, - "learning_rate": 1.997823184047727e-06, - "loss": 1.2168, - "step": 5897 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978213589061083e-06, - "loss": 1.1064, - "step": 5898 - }, - { - "epoch": 0.15, - "learning_rate": 1.997819533000503e-06, - "loss": 0.8052, - "step": 5899 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978177063309136e-06, - "loss": 0.6492, - "step": 5900 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978158788973407e-06, - "loss": 0.7031, - "step": 5901 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978140506997865e-06, - "loss": 0.8032, - "step": 5902 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978122217382514e-06, - "loss": 0.895, - "step": 5903 - }, - { - "epoch": 0.15, - "learning_rate": 1.997810392012738e-06, - "loss": 0.9844, - "step": 5904 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978085615232463e-06, - "loss": 1.1484, - "step": 5905 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978067302697794e-06, - "loss": 0.9219, - "step": 5906 - }, - { - "epoch": 0.15, - "learning_rate": 1.997804898252337e-06, - "loss": 0.9756, - "step": 5907 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978030654709217e-06, - "loss": 0.9463, - "step": 5908 - }, - { - "epoch": 0.15, - "learning_rate": 1.9978012319255343e-06, - "loss": 0.8813, - "step": 5909 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977993976161767e-06, - "loss": 0.8008, - "step": 5910 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977975625428494e-06, - "loss": 0.9531, - "step": 5911 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977957267055544e-06, - "loss": 1.0938, - "step": 5912 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977938901042933e-06, - "loss": 0.8271, - "step": 5913 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977920527390673e-06, - "loss": 0.9688, - "step": 5914 - }, - { - "epoch": 0.15, - "learning_rate": 1.997790214609878e-06, - "loss": 0.8584, - "step": 5915 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977883757167263e-06, - "loss": 1.0342, - "step": 5916 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977865360596146e-06, - "loss": 0.9688, - "step": 5917 - }, - { - "epoch": 0.15, - "learning_rate": 1.997784695638543e-06, - "loss": 0.9238, - "step": 5918 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977828544535137e-06, - "loss": 0.9443, - "step": 5919 - }, - { - "epoch": 0.15, - "learning_rate": 1.997781012504528e-06, - "loss": 0.8359, - "step": 5920 - }, - { - "epoch": 0.15, - "learning_rate": 1.997779169791587e-06, - "loss": 0.7622, - "step": 5921 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977773263146925e-06, - "loss": 0.9736, - "step": 5922 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977754820738456e-06, - "loss": 0.9834, - "step": 5923 - }, - { - "epoch": 0.15, - "learning_rate": 1.997773637069048e-06, - "loss": 0.6057, - "step": 5924 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977717913003016e-06, - "loss": 0.771, - "step": 5925 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977699447676062e-06, - "loss": 0.9561, - "step": 5926 - }, - { - "epoch": 0.15, - "learning_rate": 1.997768097470965e-06, - "loss": 1.1084, - "step": 5927 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977662494103786e-06, - "loss": 0.9824, - "step": 5928 - }, - { - "epoch": 0.15, - "learning_rate": 1.997764400585848e-06, - "loss": 1.1426, - "step": 5929 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977625509973754e-06, - "loss": 0.8076, - "step": 5930 - }, - { - "epoch": 0.15, - "learning_rate": 1.997760700644962e-06, - "loss": 0.8037, - "step": 5931 - }, - { - "epoch": 0.15, - "learning_rate": 1.997758849528609e-06, - "loss": 0.8643, - "step": 5932 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977569976483177e-06, - "loss": 1.002, - "step": 5933 - }, - { - "epoch": 0.15, - "learning_rate": 1.99775514500409e-06, - "loss": 1.1338, - "step": 5934 - }, - { - "epoch": 0.15, - "learning_rate": 1.997753291595927e-06, - "loss": 0.9238, - "step": 5935 - }, - { - "epoch": 0.15, - "learning_rate": 1.99775143742383e-06, - "loss": 1.0869, - "step": 5936 - }, - { - "epoch": 0.15, - "learning_rate": 1.997749582487801e-06, - "loss": 1.1289, - "step": 5937 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977477267878402e-06, - "loss": 1.041, - "step": 5938 - }, - { - "epoch": 0.15, - "learning_rate": 1.997745870323951e-06, - "loss": 1.1162, - "step": 5939 - }, - { - "epoch": 0.15, - "learning_rate": 1.997744013096133e-06, - "loss": 1.0361, - "step": 5940 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977421551043884e-06, - "loss": 0.8281, - "step": 5941 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977402963487184e-06, - "loss": 1.1104, - "step": 5942 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977384368291246e-06, - "loss": 0.7705, - "step": 5943 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977365765456083e-06, - "loss": 0.9414, - "step": 5944 - }, - { - "epoch": 0.15, - "learning_rate": 1.997734715498171e-06, - "loss": 1.0469, - "step": 5945 - }, - { - "epoch": 0.15, - "learning_rate": 1.997732853686814e-06, - "loss": 0.7827, - "step": 5946 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977309911115392e-06, - "loss": 1.0264, - "step": 5947 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977291277723473e-06, - "loss": 0.9541, - "step": 5948 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977272636692406e-06, - "loss": 0.8125, - "step": 5949 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977253988022194e-06, - "loss": 0.8887, - "step": 5950 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977235331712862e-06, - "loss": 0.998, - "step": 5951 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977216667764416e-06, - "loss": 0.7949, - "step": 5952 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977197996176876e-06, - "loss": 0.7363, - "step": 5953 - }, - { - "epoch": 0.15, - "learning_rate": 1.997717931695025e-06, - "loss": 0.8057, - "step": 5954 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977160630084562e-06, - "loss": 0.8076, - "step": 5955 - }, - { - "epoch": 0.15, - "learning_rate": 1.997714193557982e-06, - "loss": 0.9863, - "step": 5956 - }, - { - "epoch": 0.15, - "learning_rate": 1.997712323343604e-06, - "loss": 0.8623, - "step": 5957 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977104523653234e-06, - "loss": 0.9287, - "step": 5958 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977085806231415e-06, - "loss": 0.8789, - "step": 5959 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977067081170605e-06, - "loss": 0.9131, - "step": 5960 - }, - { - "epoch": 0.15, - "learning_rate": 1.997704834847081e-06, - "loss": 0.9805, - "step": 5961 - }, - { - "epoch": 0.15, - "learning_rate": 1.997702960813205e-06, - "loss": 1.127, - "step": 5962 - }, - { - "epoch": 0.15, - "learning_rate": 1.9977010860154337e-06, - "loss": 1.1543, - "step": 5963 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976992104537685e-06, - "loss": 0.9863, - "step": 5964 - }, - { - "epoch": 0.15, - "learning_rate": 1.997697334128211e-06, - "loss": 0.9434, - "step": 5965 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976954570387622e-06, - "loss": 0.7144, - "step": 5966 - }, - { - "epoch": 0.15, - "learning_rate": 1.997693579185424e-06, - "loss": 0.8506, - "step": 5967 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976917005681977e-06, - "loss": 0.9248, - "step": 5968 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976898211870848e-06, - "loss": 1.1562, - "step": 5969 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976879410420867e-06, - "loss": 1.0156, - "step": 5970 - }, - { - "epoch": 0.15, - "learning_rate": 1.997686060133205e-06, - "loss": 0.9707, - "step": 5971 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976841784604407e-06, - "loss": 1.0186, - "step": 5972 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976822960237954e-06, - "loss": 0.7423, - "step": 5973 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976804128232708e-06, - "loss": 1.1357, - "step": 5974 - }, - { - "epoch": 0.15, - "learning_rate": 1.997678528858868e-06, - "loss": 0.7515, - "step": 5975 - }, - { - "epoch": 0.15, - "learning_rate": 1.997676644130589e-06, - "loss": 0.8828, - "step": 5976 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976747586384346e-06, - "loss": 1.0527, - "step": 5977 - }, - { - "epoch": 0.15, - "learning_rate": 1.997672872382407e-06, - "loss": 0.9688, - "step": 5978 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976709853625064e-06, - "loss": 0.9043, - "step": 5979 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976690975787352e-06, - "loss": 0.7217, - "step": 5980 - }, - { - "epoch": 0.15, - "learning_rate": 1.997667209031095e-06, - "loss": 1.0508, - "step": 5981 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976653197195867e-06, - "loss": 0.7021, - "step": 5982 - }, - { - "epoch": 0.15, - "learning_rate": 1.997663429644212e-06, - "loss": 1.0781, - "step": 5983 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976615388049722e-06, - "loss": 0.8633, - "step": 5984 - }, - { - "epoch": 0.15, - "learning_rate": 1.997659647201869e-06, - "loss": 0.9258, - "step": 5985 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976577548349032e-06, - "loss": 0.8369, - "step": 5986 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976558617040773e-06, - "loss": 0.8179, - "step": 5987 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976539678093916e-06, - "loss": 0.9912, - "step": 5988 - }, - { - "epoch": 0.15, - "learning_rate": 1.997652073150849e-06, - "loss": 0.9473, - "step": 5989 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976501777284496e-06, - "loss": 1.0928, - "step": 5990 - }, - { - "epoch": 0.15, - "learning_rate": 1.997648281542195e-06, - "loss": 0.7959, - "step": 5991 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976463845920873e-06, - "loss": 0.9805, - "step": 5992 - }, - { - "epoch": 0.15, - "learning_rate": 1.997644486878128e-06, - "loss": 0.7324, - "step": 5993 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976425884003176e-06, - "loss": 0.7036, - "step": 5994 - }, - { - "epoch": 0.15, - "learning_rate": 1.997640689158658e-06, - "loss": 0.7578, - "step": 5995 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976387891531513e-06, - "loss": 1.0557, - "step": 5996 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976368883837984e-06, - "loss": 1.083, - "step": 5997 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976349868506004e-06, - "loss": 0.752, - "step": 5998 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976330845535596e-06, - "loss": 0.9023, - "step": 5999 - }, - { - "epoch": 0.15, - "learning_rate": 1.997631181492677e-06, - "loss": 1.207, - "step": 6000 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976292776679536e-06, - "loss": 0.8984, - "step": 6001 - }, - { - "epoch": 0.15, - "learning_rate": 1.997627373079392e-06, - "loss": 1.1162, - "step": 6002 - }, - { - "epoch": 0.15, - "learning_rate": 1.997625467726992e-06, - "loss": 0.9453, - "step": 6003 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976235616107573e-06, - "loss": 0.8877, - "step": 6004 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976216547306876e-06, - "loss": 1.084, - "step": 6005 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976197470867848e-06, - "loss": 0.9902, - "step": 6006 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976178386790505e-06, - "loss": 1.0879, - "step": 6007 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976159295074856e-06, - "loss": 0.8984, - "step": 6008 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976140195720927e-06, - "loss": 0.9736, - "step": 6009 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976121088728726e-06, - "loss": 0.7651, - "step": 6010 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976101974098265e-06, - "loss": 0.8232, - "step": 6011 - }, - { - "epoch": 0.15, - "learning_rate": 1.997608285182956e-06, - "loss": 0.5034, - "step": 6012 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976063721922633e-06, - "loss": 1.1406, - "step": 6013 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976044584377488e-06, - "loss": 0.8652, - "step": 6014 - }, - { - "epoch": 0.15, - "learning_rate": 1.997602543919414e-06, - "loss": 1.0342, - "step": 6015 - }, - { - "epoch": 0.15, - "learning_rate": 1.9976006286372617e-06, - "loss": 1.1182, - "step": 6016 - }, - { - "epoch": 0.15, - "learning_rate": 1.9975987125912922e-06, - "loss": 1.0283, - "step": 6017 - }, - { - "epoch": 0.15, - "learning_rate": 1.9975967957815074e-06, - "loss": 0.6411, - "step": 6018 - }, - { - "epoch": 0.15, - "learning_rate": 1.997594878207908e-06, - "loss": 0.835, - "step": 6019 - }, - { - "epoch": 0.15, - "learning_rate": 1.9975929598704967e-06, - "loss": 0.6238, - "step": 6020 - }, - { - "epoch": 0.15, - "learning_rate": 1.997591040769274e-06, - "loss": 0.8291, - "step": 6021 - }, - { - "epoch": 0.15, - "learning_rate": 1.9975891209042416e-06, - "loss": 0.9355, - "step": 6022 - }, - { - "epoch": 0.15, - "learning_rate": 1.9975872002754012e-06, - "loss": 0.8369, - "step": 6023 - }, - { - "epoch": 0.15, - "learning_rate": 1.9975852788827543e-06, - "loss": 0.9453, - "step": 6024 - }, - { - "epoch": 0.15, - "learning_rate": 1.9975833567263023e-06, - "loss": 1.2227, - "step": 6025 - }, - { - "epoch": 0.15, - "learning_rate": 1.9975814338060463e-06, - "loss": 1.2393, - "step": 6026 - }, - { - "epoch": 0.15, - "learning_rate": 1.997579510121988e-06, - "loss": 1.1514, - "step": 6027 - }, - { - "epoch": 0.15, - "learning_rate": 1.9975775856741294e-06, - "loss": 1.0146, - "step": 6028 - }, - { - "epoch": 0.15, - "learning_rate": 1.997575660462471e-06, - "loss": 0.9941, - "step": 6029 - }, - { - "epoch": 0.15, - "learning_rate": 1.997573734487015e-06, - "loss": 0.9287, - "step": 6030 - }, - { - "epoch": 0.15, - "learning_rate": 1.997571807747763e-06, - "loss": 0.918, - "step": 6031 - }, - { - "epoch": 0.15, - "learning_rate": 1.9975698802447156e-06, - "loss": 1.0469, - "step": 6032 - }, - { - "epoch": 0.15, - "learning_rate": 1.997567951977875e-06, - "loss": 0.8262, - "step": 6033 - }, - { - "epoch": 0.15, - "learning_rate": 1.997566022947243e-06, - "loss": 0.7939, - "step": 6034 - }, - { - "epoch": 0.15, - "learning_rate": 1.99756409315282e-06, - "loss": 1.5156, - "step": 6035 - }, - { - "epoch": 0.15, - "learning_rate": 1.997562162594608e-06, - "loss": 0.7715, - "step": 6036 - }, - { - "epoch": 0.15, - "learning_rate": 1.9975602312726087e-06, - "loss": 0.917, - "step": 6037 - }, - { - "epoch": 0.15, - "learning_rate": 1.9975582991868235e-06, - "loss": 0.9785, - "step": 6038 - }, - { - "epoch": 0.15, - "learning_rate": 1.9975563663372534e-06, - "loss": 1.1123, - "step": 6039 - }, - { - "epoch": 0.15, - "learning_rate": 1.9975544327239006e-06, - "loss": 0.9365, - "step": 6040 - }, - { - "epoch": 0.15, - "learning_rate": 1.9975524983467664e-06, - "loss": 0.8003, - "step": 6041 - }, - { - "epoch": 0.15, - "learning_rate": 1.9975505632058515e-06, - "loss": 0.6558, - "step": 6042 - }, - { - "epoch": 0.15, - "learning_rate": 1.997548627301158e-06, - "loss": 0.9121, - "step": 6043 - }, - { - "epoch": 0.15, - "learning_rate": 1.997546690632688e-06, - "loss": 0.9473, - "step": 6044 - }, - { - "epoch": 0.15, - "learning_rate": 1.9975447532004423e-06, - "loss": 0.9512, - "step": 6045 - }, - { - "epoch": 0.15, - "learning_rate": 1.9975428150044223e-06, - "loss": 0.8652, - "step": 6046 - }, - { - "epoch": 0.15, - "learning_rate": 1.9975408760446293e-06, - "loss": 0.7344, - "step": 6047 - }, - { - "epoch": 0.16, - "learning_rate": 1.9975389363210654e-06, - "loss": 0.6387, - "step": 6048 - }, - { - "epoch": 0.16, - "learning_rate": 1.997536995833732e-06, - "loss": 0.9805, - "step": 6049 - }, - { - "epoch": 0.16, - "learning_rate": 1.9975350545826306e-06, - "loss": 0.9082, - "step": 6050 - }, - { - "epoch": 0.16, - "learning_rate": 1.9975331125677617e-06, - "loss": 0.7764, - "step": 6051 - }, - { - "epoch": 0.16, - "learning_rate": 1.997531169789128e-06, - "loss": 0.7139, - "step": 6052 - }, - { - "epoch": 0.16, - "learning_rate": 1.9975292262467304e-06, - "loss": 0.7407, - "step": 6053 - }, - { - "epoch": 0.16, - "learning_rate": 1.9975272819405705e-06, - "loss": 1.0215, - "step": 6054 - }, - { - "epoch": 0.16, - "learning_rate": 1.9975253368706503e-06, - "loss": 0.6831, - "step": 6055 - }, - { - "epoch": 0.16, - "learning_rate": 1.9975233910369706e-06, - "loss": 0.9609, - "step": 6056 - }, - { - "epoch": 0.16, - "learning_rate": 1.997521444439533e-06, - "loss": 0.8252, - "step": 6057 - }, - { - "epoch": 0.16, - "learning_rate": 1.997519497078339e-06, - "loss": 1.0186, - "step": 6058 - }, - { - "epoch": 0.16, - "learning_rate": 1.99751754895339e-06, - "loss": 0.8232, - "step": 6059 - }, - { - "epoch": 0.16, - "learning_rate": 1.997515600064688e-06, - "loss": 0.833, - "step": 6060 - }, - { - "epoch": 0.16, - "learning_rate": 1.997513650412234e-06, - "loss": 0.9502, - "step": 6061 - }, - { - "epoch": 0.16, - "learning_rate": 1.99751169999603e-06, - "loss": 0.8306, - "step": 6062 - }, - { - "epoch": 0.16, - "learning_rate": 1.997509748816077e-06, - "loss": 0.8267, - "step": 6063 - }, - { - "epoch": 0.16, - "learning_rate": 1.9975077968723764e-06, - "loss": 0.873, - "step": 6064 - }, - { - "epoch": 0.16, - "learning_rate": 1.99750584416493e-06, - "loss": 0.9688, - "step": 6065 - }, - { - "epoch": 0.16, - "learning_rate": 1.9975038906937397e-06, - "loss": 0.7876, - "step": 6066 - }, - { - "epoch": 0.16, - "learning_rate": 1.997501936458806e-06, - "loss": 1.0996, - "step": 6067 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974999814601313e-06, - "loss": 0.8438, - "step": 6068 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974980256977166e-06, - "loss": 0.9287, - "step": 6069 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974960691715635e-06, - "loss": 0.8984, - "step": 6070 - }, - { - "epoch": 0.16, - "learning_rate": 1.997494111881674e-06, - "loss": 0.9111, - "step": 6071 - }, - { - "epoch": 0.16, - "learning_rate": 1.997492153828048e-06, - "loss": 0.8896, - "step": 6072 - }, - { - "epoch": 0.16, - "learning_rate": 1.997490195010689e-06, - "loss": 0.8926, - "step": 6073 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974882354295975e-06, - "loss": 0.9497, - "step": 6074 - }, - { - "epoch": 0.16, - "learning_rate": 1.997486275084775e-06, - "loss": 1.0039, - "step": 6075 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974843139762234e-06, - "loss": 0.8687, - "step": 6076 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974823521039435e-06, - "loss": 0.8877, - "step": 6077 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974803894679377e-06, - "loss": 1.0664, - "step": 6078 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974784260682063e-06, - "loss": 1.0508, - "step": 6079 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974764619047523e-06, - "loss": 0.8857, - "step": 6080 - }, - { - "epoch": 0.16, - "learning_rate": 1.997474496977576e-06, - "loss": 1.1621, - "step": 6081 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974725312866795e-06, - "loss": 0.9443, - "step": 6082 - }, - { - "epoch": 0.16, - "learning_rate": 1.997470564832064e-06, - "loss": 0.812, - "step": 6083 - }, - { - "epoch": 0.16, - "learning_rate": 1.997468597613731e-06, - "loss": 0.9893, - "step": 6084 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974666296316828e-06, - "loss": 1.0479, - "step": 6085 - }, - { - "epoch": 0.16, - "learning_rate": 1.99746466088592e-06, - "loss": 0.8945, - "step": 6086 - }, - { - "epoch": 0.16, - "learning_rate": 1.997462691376444e-06, - "loss": 0.8916, - "step": 6087 - }, - { - "epoch": 0.16, - "learning_rate": 1.997460721103257e-06, - "loss": 0.7891, - "step": 6088 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974587500663604e-06, - "loss": 0.9385, - "step": 6089 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974567782657554e-06, - "loss": 1.002, - "step": 6090 - }, - { - "epoch": 0.16, - "learning_rate": 1.997454805701443e-06, - "loss": 0.8818, - "step": 6091 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974528323734263e-06, - "loss": 0.9033, - "step": 6092 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974508582817047e-06, - "loss": 0.8086, - "step": 6093 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974488834262817e-06, - "loss": 1.0479, - "step": 6094 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974469078071577e-06, - "loss": 0.9492, - "step": 6095 - }, - { - "epoch": 0.16, - "learning_rate": 1.997444931424335e-06, - "loss": 1.0381, - "step": 6096 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974429542778136e-06, - "loss": 0.6196, - "step": 6097 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974409763675968e-06, - "loss": 0.9922, - "step": 6098 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974389976936844e-06, - "loss": 0.9248, - "step": 6099 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974370182560796e-06, - "loss": 1.0166, - "step": 6100 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974350380547827e-06, - "loss": 1.0244, - "step": 6101 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974330570897957e-06, - "loss": 0.8926, - "step": 6102 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974310753611205e-06, - "loss": 0.9668, - "step": 6103 - }, - { - "epoch": 0.16, - "learning_rate": 1.997429092868758e-06, - "loss": 0.8682, - "step": 6104 - }, - { - "epoch": 0.16, - "learning_rate": 1.99742710961271e-06, - "loss": 0.9619, - "step": 6105 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974251255929774e-06, - "loss": 1.1807, - "step": 6106 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974231408095625e-06, - "loss": 0.8633, - "step": 6107 - }, - { - "epoch": 0.16, - "learning_rate": 1.997421155262467e-06, - "loss": 0.8838, - "step": 6108 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974191689516913e-06, - "loss": 0.9248, - "step": 6109 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974171818772382e-06, - "loss": 1.0469, - "step": 6110 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974151940391083e-06, - "loss": 0.8906, - "step": 6111 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974132054373037e-06, - "loss": 1.1123, - "step": 6112 - }, - { - "epoch": 0.16, - "learning_rate": 1.997411216071825e-06, - "loss": 0.8789, - "step": 6113 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974092259426753e-06, - "loss": 0.915, - "step": 6114 - }, - { - "epoch": 0.16, - "learning_rate": 1.997407235049855e-06, - "loss": 1.1377, - "step": 6115 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974052433933653e-06, - "loss": 0.9229, - "step": 6116 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974032509732085e-06, - "loss": 0.7988, - "step": 6117 - }, - { - "epoch": 0.16, - "learning_rate": 1.9974012577893864e-06, - "loss": 1.042, - "step": 6118 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973992638418996e-06, - "loss": 1.1035, - "step": 6119 - }, - { - "epoch": 0.16, - "learning_rate": 1.99739726913075e-06, - "loss": 0.9531, - "step": 6120 - }, - { - "epoch": 0.16, - "learning_rate": 1.997395273655939e-06, - "loss": 0.7847, - "step": 6121 - }, - { - "epoch": 0.16, - "learning_rate": 1.997393277417469e-06, - "loss": 1.0, - "step": 6122 - }, - { - "epoch": 0.16, - "learning_rate": 1.99739128041534e-06, - "loss": 0.8086, - "step": 6123 - }, - { - "epoch": 0.16, - "learning_rate": 1.997389282649555e-06, - "loss": 0.9512, - "step": 6124 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973872841201145e-06, - "loss": 1.0156, - "step": 6125 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973852848270206e-06, - "loss": 0.8906, - "step": 6126 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973832847702745e-06, - "loss": 0.7642, - "step": 6127 - }, - { - "epoch": 0.16, - "learning_rate": 1.997381283949878e-06, - "loss": 1.0859, - "step": 6128 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973792823658324e-06, - "loss": 0.8135, - "step": 6129 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973772800181395e-06, - "loss": 0.873, - "step": 6130 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973752769068003e-06, - "loss": 0.8418, - "step": 6131 - }, - { - "epoch": 0.16, - "learning_rate": 1.997373273031817e-06, - "loss": 1.0645, - "step": 6132 - }, - { - "epoch": 0.16, - "learning_rate": 1.997371268393191e-06, - "loss": 0.877, - "step": 6133 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973692629909237e-06, - "loss": 0.8857, - "step": 6134 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973672568250164e-06, - "loss": 1.0557, - "step": 6135 - }, - { - "epoch": 0.16, - "learning_rate": 1.997365249895471e-06, - "loss": 0.6982, - "step": 6136 - }, - { - "epoch": 0.16, - "learning_rate": 1.997363242202289e-06, - "loss": 0.8804, - "step": 6137 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973612337454716e-06, - "loss": 0.9961, - "step": 6138 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973592245250203e-06, - "loss": 0.9365, - "step": 6139 - }, - { - "epoch": 0.16, - "learning_rate": 1.997357214540937e-06, - "loss": 0.8926, - "step": 6140 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973552037932234e-06, - "loss": 0.8828, - "step": 6141 - }, - { - "epoch": 0.16, - "learning_rate": 1.997353192281881e-06, - "loss": 0.8301, - "step": 6142 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973511800069106e-06, - "loss": 0.8477, - "step": 6143 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973491669683143e-06, - "loss": 0.895, - "step": 6144 - }, - { - "epoch": 0.16, - "learning_rate": 1.997347153166094e-06, - "loss": 0.8037, - "step": 6145 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973451386002507e-06, - "loss": 1.3008, - "step": 6146 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973431232707856e-06, - "loss": 1.083, - "step": 6147 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973411071777016e-06, - "loss": 1.1016, - "step": 6148 - }, - { - "epoch": 0.16, - "learning_rate": 1.997339090320999e-06, - "loss": 0.9375, - "step": 6149 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973370727006793e-06, - "loss": 1.1846, - "step": 6150 - }, - { - "epoch": 0.16, - "learning_rate": 1.997335054316745e-06, - "loss": 0.9932, - "step": 6151 - }, - { - "epoch": 0.16, - "learning_rate": 1.997333035169197e-06, - "loss": 0.9473, - "step": 6152 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973310152580366e-06, - "loss": 0.9326, - "step": 6153 - }, - { - "epoch": 0.16, - "learning_rate": 1.997328994583266e-06, - "loss": 0.6665, - "step": 6154 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973269731448865e-06, - "loss": 0.9951, - "step": 6155 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973249509428997e-06, - "loss": 0.9639, - "step": 6156 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973229279773064e-06, - "loss": 0.7725, - "step": 6157 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973209042481094e-06, - "loss": 1.1455, - "step": 6158 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973188797553093e-06, - "loss": 1.0137, - "step": 6159 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973168544989086e-06, - "loss": 1.0, - "step": 6160 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973148284789077e-06, - "loss": 0.9482, - "step": 6161 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973128016953087e-06, - "loss": 1.0342, - "step": 6162 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973107741481133e-06, - "loss": 0.9854, - "step": 6163 - }, - { - "epoch": 0.16, - "learning_rate": 1.9973087458373228e-06, - "loss": 0.9062, - "step": 6164 - }, - { - "epoch": 0.16, - "learning_rate": 1.997306716762939e-06, - "loss": 0.9648, - "step": 6165 - }, - { - "epoch": 0.16, - "learning_rate": 1.997304686924963e-06, - "loss": 1.0986, - "step": 6166 - }, - { - "epoch": 0.16, - "learning_rate": 1.997302656323397e-06, - "loss": 0.9268, - "step": 6167 - }, - { - "epoch": 0.16, - "learning_rate": 1.997300624958242e-06, - "loss": 1.2861, - "step": 6168 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972985928294997e-06, - "loss": 0.9307, - "step": 6169 - }, - { - "epoch": 0.16, - "learning_rate": 1.997296559937172e-06, - "loss": 0.8818, - "step": 6170 - }, - { - "epoch": 0.16, - "learning_rate": 1.99729452628126e-06, - "loss": 0.8252, - "step": 6171 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972924918617657e-06, - "loss": 1.0098, - "step": 6172 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972904566786903e-06, - "loss": 0.7153, - "step": 6173 - }, - { - "epoch": 0.16, - "learning_rate": 1.997288420732035e-06, - "loss": 1.21, - "step": 6174 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972863840218023e-06, - "loss": 1.0703, - "step": 6175 - }, - { - "epoch": 0.16, - "learning_rate": 1.997284346547993e-06, - "loss": 0.918, - "step": 6176 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972823083106092e-06, - "loss": 0.9233, - "step": 6177 - }, - { - "epoch": 0.16, - "learning_rate": 1.997280269309652e-06, - "loss": 0.999, - "step": 6178 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972782295451233e-06, - "loss": 1.0225, - "step": 6179 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972761890170244e-06, - "loss": 0.875, - "step": 6180 - }, - { - "epoch": 0.16, - "learning_rate": 1.997274147725357e-06, - "loss": 0.832, - "step": 6181 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972721056701223e-06, - "loss": 1.0156, - "step": 6182 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972700628513227e-06, - "loss": 0.9941, - "step": 6183 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972680192689593e-06, - "loss": 1.1543, - "step": 6184 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972659749230333e-06, - "loss": 1.04, - "step": 6185 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972639298135466e-06, - "loss": 0.8623, - "step": 6186 - }, - { - "epoch": 0.16, - "learning_rate": 1.997261883940501e-06, - "loss": 1.0137, - "step": 6187 - }, - { - "epoch": 0.16, - "learning_rate": 1.997259837303898e-06, - "loss": 1.0996, - "step": 6188 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972577899037384e-06, - "loss": 1.0791, - "step": 6189 - }, - { - "epoch": 0.16, - "learning_rate": 1.997255741740025e-06, - "loss": 0.918, - "step": 6190 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972536928127583e-06, - "loss": 0.9785, - "step": 6191 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972516431219405e-06, - "loss": 0.9453, - "step": 6192 - }, - { - "epoch": 0.16, - "learning_rate": 1.997249592667573e-06, - "loss": 0.9268, - "step": 6193 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972475414496573e-06, - "loss": 1.0303, - "step": 6194 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972454894681948e-06, - "loss": 0.9648, - "step": 6195 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972434367231876e-06, - "loss": 0.9238, - "step": 6196 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972413832146365e-06, - "loss": 0.8821, - "step": 6197 - }, - { - "epoch": 0.16, - "learning_rate": 1.997239328942544e-06, - "loss": 0.7886, - "step": 6198 - }, - { - "epoch": 0.16, - "learning_rate": 1.997237273906911e-06, - "loss": 0.8242, - "step": 6199 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972352181077394e-06, - "loss": 1.0586, - "step": 6200 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972331615450306e-06, - "loss": 1.0195, - "step": 6201 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972311042187864e-06, - "loss": 1.0439, - "step": 6202 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972290461290076e-06, - "loss": 0.7812, - "step": 6203 - }, - { - "epoch": 0.16, - "learning_rate": 1.997226987275697e-06, - "loss": 1.0732, - "step": 6204 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972249276588553e-06, - "loss": 0.877, - "step": 6205 - }, - { - "epoch": 0.16, - "learning_rate": 1.997222867278484e-06, - "loss": 0.7075, - "step": 6206 - }, - { - "epoch": 0.16, - "learning_rate": 1.997220806134585e-06, - "loss": 0.9482, - "step": 6207 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972187442271606e-06, - "loss": 0.7344, - "step": 6208 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972166815562113e-06, - "loss": 0.96, - "step": 6209 - }, - { - "epoch": 0.16, - "learning_rate": 1.997214618121739e-06, - "loss": 1.0605, - "step": 6210 - }, - { - "epoch": 0.16, - "learning_rate": 1.997212553923745e-06, - "loss": 1.0645, - "step": 6211 - }, - { - "epoch": 0.16, - "learning_rate": 1.997210488962232e-06, - "loss": 0.894, - "step": 6212 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972084232372e-06, - "loss": 0.9043, - "step": 6213 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972063567486517e-06, - "loss": 1.1406, - "step": 6214 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972042894965882e-06, - "loss": 0.9023, - "step": 6215 - }, - { - "epoch": 0.16, - "learning_rate": 1.9972022214810114e-06, - "loss": 0.9233, - "step": 6216 - }, - { - "epoch": 0.16, - "learning_rate": 1.997200152701923e-06, - "loss": 0.9424, - "step": 6217 - }, - { - "epoch": 0.16, - "learning_rate": 1.997198083159324e-06, - "loss": 1.1523, - "step": 6218 - }, - { - "epoch": 0.16, - "learning_rate": 1.997196012853216e-06, - "loss": 1.0303, - "step": 6219 - }, - { - "epoch": 0.16, - "learning_rate": 1.997193941783601e-06, - "loss": 0.9385, - "step": 6220 - }, - { - "epoch": 0.16, - "learning_rate": 1.9971918699504804e-06, - "loss": 0.8931, - "step": 6221 - }, - { - "epoch": 0.16, - "learning_rate": 1.9971897973538563e-06, - "loss": 0.8115, - "step": 6222 - }, - { - "epoch": 0.16, - "learning_rate": 1.9971877239937295e-06, - "loss": 0.707, - "step": 6223 - }, - { - "epoch": 0.16, - "learning_rate": 1.9971856498701015e-06, - "loss": 0.7227, - "step": 6224 - }, - { - "epoch": 0.16, - "learning_rate": 1.997183574982975e-06, - "loss": 0.8389, - "step": 6225 - }, - { - "epoch": 0.16, - "learning_rate": 1.9971814993323508e-06, - "loss": 0.9854, - "step": 6226 - }, - { - "epoch": 0.16, - "learning_rate": 1.99717942291823e-06, - "loss": 0.8657, - "step": 6227 - }, - { - "epoch": 0.16, - "learning_rate": 1.9971773457406155e-06, - "loss": 1.1572, - "step": 6228 - }, - { - "epoch": 0.16, - "learning_rate": 1.997175267799508e-06, - "loss": 0.8472, - "step": 6229 - }, - { - "epoch": 0.16, - "learning_rate": 1.9971731890949085e-06, - "loss": 0.9844, - "step": 6230 - }, - { - "epoch": 0.16, - "learning_rate": 1.9971711096268203e-06, - "loss": 1.1318, - "step": 6231 - }, - { - "epoch": 0.16, - "learning_rate": 1.9971690293952433e-06, - "loss": 0.9883, - "step": 6232 - }, - { - "epoch": 0.16, - "learning_rate": 1.9971669484001804e-06, - "loss": 0.7383, - "step": 6233 - }, - { - "epoch": 0.16, - "learning_rate": 1.9971648666416325e-06, - "loss": 1.0439, - "step": 6234 - }, - { - "epoch": 0.16, - "learning_rate": 1.997162784119601e-06, - "loss": 0.8867, - "step": 6235 - }, - { - "epoch": 0.16, - "learning_rate": 1.997160700834088e-06, - "loss": 0.9307, - "step": 6236 - }, - { - "epoch": 0.16, - "learning_rate": 1.997158616785095e-06, - "loss": 1.1113, - "step": 6237 - }, - { - "epoch": 0.16, - "learning_rate": 1.997156531972623e-06, - "loss": 0.9028, - "step": 6238 - }, - { - "epoch": 0.16, - "learning_rate": 1.9971544463966747e-06, - "loss": 0.9814, - "step": 6239 - }, - { - "epoch": 0.16, - "learning_rate": 1.997152360057251e-06, - "loss": 0.8213, - "step": 6240 - }, - { - "epoch": 0.16, - "learning_rate": 1.997150272954353e-06, - "loss": 0.8311, - "step": 6241 - }, - { - "epoch": 0.16, - "learning_rate": 1.9971481850879835e-06, - "loss": 0.8252, - "step": 6242 - }, - { - "epoch": 0.16, - "learning_rate": 1.9971460964581434e-06, - "loss": 1.0547, - "step": 6243 - }, - { - "epoch": 0.16, - "learning_rate": 1.9971440070648344e-06, - "loss": 1.0742, - "step": 6244 - }, - { - "epoch": 0.16, - "learning_rate": 1.997141916908058e-06, - "loss": 0.9111, - "step": 6245 - }, - { - "epoch": 0.16, - "learning_rate": 1.997139825987816e-06, - "loss": 0.877, - "step": 6246 - }, - { - "epoch": 0.16, - "learning_rate": 1.99713773430411e-06, - "loss": 1.2109, - "step": 6247 - }, - { - "epoch": 0.16, - "learning_rate": 1.997135641856941e-06, - "loss": 1.0264, - "step": 6248 - }, - { - "epoch": 0.16, - "learning_rate": 1.997133548646311e-06, - "loss": 0.8447, - "step": 6249 - }, - { - "epoch": 0.16, - "learning_rate": 1.9971314546722226e-06, - "loss": 1.0107, - "step": 6250 - }, - { - "epoch": 0.16, - "learning_rate": 1.997129359934676e-06, - "loss": 0.8008, - "step": 6251 - }, - { - "epoch": 0.16, - "learning_rate": 1.997127264433673e-06, - "loss": 0.9072, - "step": 6252 - }, - { - "epoch": 0.16, - "learning_rate": 1.9971251681692157e-06, - "loss": 1.1299, - "step": 6253 - }, - { - "epoch": 0.16, - "learning_rate": 1.9971230711413057e-06, - "loss": 0.7422, - "step": 6254 - }, - { - "epoch": 0.16, - "learning_rate": 1.997120973349944e-06, - "loss": 0.9316, - "step": 6255 - }, - { - "epoch": 0.16, - "learning_rate": 1.997118874795133e-06, - "loss": 1.041, - "step": 6256 - }, - { - "epoch": 0.16, - "learning_rate": 1.997116775476874e-06, - "loss": 0.7578, - "step": 6257 - }, - { - "epoch": 0.16, - "learning_rate": 1.9971146753951683e-06, - "loss": 1.0781, - "step": 6258 - }, - { - "epoch": 0.16, - "learning_rate": 1.997112574550018e-06, - "loss": 0.9863, - "step": 6259 - }, - { - "epoch": 0.16, - "learning_rate": 1.997110472941424e-06, - "loss": 0.9199, - "step": 6260 - }, - { - "epoch": 0.16, - "learning_rate": 1.9971083705693882e-06, - "loss": 0.9238, - "step": 6261 - }, - { - "epoch": 0.16, - "learning_rate": 1.997106267433913e-06, - "loss": 0.8672, - "step": 6262 - }, - { - "epoch": 0.16, - "learning_rate": 1.997104163534999e-06, - "loss": 0.8906, - "step": 6263 - }, - { - "epoch": 0.16, - "learning_rate": 1.9971020588726485e-06, - "loss": 0.8848, - "step": 6264 - }, - { - "epoch": 0.16, - "learning_rate": 1.997099953446863e-06, - "loss": 1.0127, - "step": 6265 - }, - { - "epoch": 0.16, - "learning_rate": 1.997097847257643e-06, - "loss": 0.9326, - "step": 6266 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970957403049917e-06, - "loss": 0.7383, - "step": 6267 - }, - { - "epoch": 0.16, - "learning_rate": 1.99709363258891e-06, - "loss": 1.0166, - "step": 6268 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970915241093995e-06, - "loss": 0.8174, - "step": 6269 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970894148664616e-06, - "loss": 0.6146, - "step": 6270 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970873048600984e-06, - "loss": 0.9229, - "step": 6271 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970851940903117e-06, - "loss": 0.8159, - "step": 6272 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970830825571018e-06, - "loss": 1.0537, - "step": 6273 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970809702604716e-06, - "loss": 0.8779, - "step": 6274 - }, - { - "epoch": 0.16, - "learning_rate": 1.997078857200423e-06, - "loss": 1.1484, - "step": 6275 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970767433769563e-06, - "loss": 0.9824, - "step": 6276 - }, - { - "epoch": 0.16, - "learning_rate": 1.997074628790074e-06, - "loss": 0.8208, - "step": 6277 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970725134397774e-06, - "loss": 1.0469, - "step": 6278 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970703973260683e-06, - "loss": 0.6956, - "step": 6279 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970682804489483e-06, - "loss": 0.8428, - "step": 6280 - }, - { - "epoch": 0.16, - "learning_rate": 1.997066162808419e-06, - "loss": 0.8516, - "step": 6281 - }, - { - "epoch": 0.16, - "learning_rate": 1.997064044404482e-06, - "loss": 0.9736, - "step": 6282 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970619252371385e-06, - "loss": 0.8154, - "step": 6283 - }, - { - "epoch": 0.16, - "learning_rate": 1.997059805306391e-06, - "loss": 0.875, - "step": 6284 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970576846122402e-06, - "loss": 1.001, - "step": 6285 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970555631546887e-06, - "loss": 0.7803, - "step": 6286 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970534409337373e-06, - "loss": 0.8389, - "step": 6287 - }, - { - "epoch": 0.16, - "learning_rate": 1.997051317949388e-06, - "loss": 0.8105, - "step": 6288 - }, - { - "epoch": 0.16, - "learning_rate": 1.997049194201642e-06, - "loss": 0.8633, - "step": 6289 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970470696905017e-06, - "loss": 0.9004, - "step": 6290 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970449444159682e-06, - "loss": 1.0557, - "step": 6291 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970428183780433e-06, - "loss": 0.8716, - "step": 6292 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970406915767282e-06, - "loss": 0.9473, - "step": 6293 - }, - { - "epoch": 0.16, - "learning_rate": 1.997038564012025e-06, - "loss": 1.0986, - "step": 6294 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970364356839357e-06, - "loss": 1.0342, - "step": 6295 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970343065924613e-06, - "loss": 1.0957, - "step": 6296 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970321767376034e-06, - "loss": 1.0996, - "step": 6297 - }, - { - "epoch": 0.16, - "learning_rate": 1.997030046119364e-06, - "loss": 0.7466, - "step": 6298 - }, - { - "epoch": 0.16, - "learning_rate": 1.997027914737744e-06, - "loss": 0.8574, - "step": 6299 - }, - { - "epoch": 0.16, - "learning_rate": 1.997025782592746e-06, - "loss": 0.7256, - "step": 6300 - }, - { - "epoch": 0.16, - "learning_rate": 1.997023649684371e-06, - "loss": 0.8271, - "step": 6301 - }, - { - "epoch": 0.16, - "learning_rate": 1.997021516012621e-06, - "loss": 0.9551, - "step": 6302 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970193815774977e-06, - "loss": 1.0371, - "step": 6303 - }, - { - "epoch": 0.16, - "learning_rate": 1.997017246379002e-06, - "loss": 0.9912, - "step": 6304 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970151104171363e-06, - "loss": 0.9609, - "step": 6305 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970129736919023e-06, - "loss": 1.0068, - "step": 6306 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970108362033006e-06, - "loss": 0.7581, - "step": 6307 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970086979513343e-06, - "loss": 0.835, - "step": 6308 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970065589360036e-06, - "loss": 0.9326, - "step": 6309 - }, - { - "epoch": 0.16, - "learning_rate": 1.997004419157311e-06, - "loss": 1.0117, - "step": 6310 - }, - { - "epoch": 0.16, - "learning_rate": 1.997002278615258e-06, - "loss": 0.7842, - "step": 6311 - }, - { - "epoch": 0.16, - "learning_rate": 1.9970001373098464e-06, - "loss": 0.8525, - "step": 6312 - }, - { - "epoch": 0.16, - "learning_rate": 1.9969979952410776e-06, - "loss": 0.9297, - "step": 6313 - }, - { - "epoch": 0.16, - "learning_rate": 1.9969958524089533e-06, - "loss": 0.8848, - "step": 6314 - }, - { - "epoch": 0.16, - "learning_rate": 1.996993708813475e-06, - "loss": 0.9424, - "step": 6315 - }, - { - "epoch": 0.16, - "learning_rate": 1.9969915644546445e-06, - "loss": 0.9619, - "step": 6316 - }, - { - "epoch": 0.16, - "learning_rate": 1.9969894193324633e-06, - "loss": 0.7539, - "step": 6317 - }, - { - "epoch": 0.16, - "learning_rate": 1.996987273446933e-06, - "loss": 0.874, - "step": 6318 - }, - { - "epoch": 0.16, - "learning_rate": 1.996985126798056e-06, - "loss": 0.9834, - "step": 6319 - }, - { - "epoch": 0.16, - "learning_rate": 1.9969829793858327e-06, - "loss": 0.7891, - "step": 6320 - }, - { - "epoch": 0.16, - "learning_rate": 1.9969808312102655e-06, - "loss": 0.875, - "step": 6321 - }, - { - "epoch": 0.16, - "learning_rate": 1.996978682271356e-06, - "loss": 0.8232, - "step": 6322 - }, - { - "epoch": 0.16, - "learning_rate": 1.996976532569106e-06, - "loss": 0.9346, - "step": 6323 - }, - { - "epoch": 0.16, - "learning_rate": 1.9969743821035165e-06, - "loss": 1.0186, - "step": 6324 - }, - { - "epoch": 0.16, - "learning_rate": 1.99697223087459e-06, - "loss": 0.877, - "step": 6325 - }, - { - "epoch": 0.16, - "learning_rate": 1.9969700788823273e-06, - "loss": 0.9902, - "step": 6326 - }, - { - "epoch": 0.16, - "learning_rate": 1.9969679261267305e-06, - "loss": 1.0928, - "step": 6327 - }, - { - "epoch": 0.16, - "learning_rate": 1.9969657726078017e-06, - "loss": 1.041, - "step": 6328 - }, - { - "epoch": 0.16, - "learning_rate": 1.9969636183255415e-06, - "loss": 0.7871, - "step": 6329 - }, - { - "epoch": 0.16, - "learning_rate": 1.996961463279952e-06, - "loss": 0.9082, - "step": 6330 - }, - { - "epoch": 0.16, - "learning_rate": 1.9969593074710354e-06, - "loss": 0.9932, - "step": 6331 - }, - { - "epoch": 0.16, - "learning_rate": 1.996957150898793e-06, - "loss": 0.9141, - "step": 6332 - }, - { - "epoch": 0.16, - "learning_rate": 1.996954993563226e-06, - "loss": 1.0479, - "step": 6333 - }, - { - "epoch": 0.16, - "learning_rate": 1.9969528354643365e-06, - "loss": 1.0488, - "step": 6334 - }, - { - "epoch": 0.16, - "learning_rate": 1.996950676602126e-06, - "loss": 0.8613, - "step": 6335 - }, - { - "epoch": 0.16, - "learning_rate": 1.996948516976596e-06, - "loss": 0.7979, - "step": 6336 - }, - { - "epoch": 0.16, - "learning_rate": 1.996946356587749e-06, - "loss": 0.9268, - "step": 6337 - }, - { - "epoch": 0.16, - "learning_rate": 1.9969441954355856e-06, - "loss": 1.0605, - "step": 6338 - }, - { - "epoch": 0.16, - "learning_rate": 1.9969420335201077e-06, - "loss": 0.9688, - "step": 6339 - }, - { - "epoch": 0.16, - "learning_rate": 1.996939870841317e-06, - "loss": 1.0615, - "step": 6340 - }, - { - "epoch": 0.16, - "learning_rate": 1.996937707399216e-06, - "loss": 0.8652, - "step": 6341 - }, - { - "epoch": 0.16, - "learning_rate": 1.996935543193805e-06, - "loss": 0.915, - "step": 6342 - }, - { - "epoch": 0.16, - "learning_rate": 1.9969333782250864e-06, - "loss": 1.1572, - "step": 6343 - }, - { - "epoch": 0.16, - "learning_rate": 1.996931212493062e-06, - "loss": 0.8389, - "step": 6344 - }, - { - "epoch": 0.16, - "learning_rate": 1.9969290459977333e-06, - "loss": 0.7471, - "step": 6345 - }, - { - "epoch": 0.16, - "learning_rate": 1.9969268787391017e-06, - "loss": 1.0117, - "step": 6346 - }, - { - "epoch": 0.16, - "learning_rate": 1.9969247107171688e-06, - "loss": 0.8779, - "step": 6347 - }, - { - "epoch": 0.16, - "learning_rate": 1.996922541931937e-06, - "loss": 0.8154, - "step": 6348 - }, - { - "epoch": 0.16, - "learning_rate": 1.996920372383407e-06, - "loss": 0.9561, - "step": 6349 - }, - { - "epoch": 0.16, - "learning_rate": 1.9969182020715807e-06, - "loss": 1.124, - "step": 6350 - }, - { - "epoch": 0.16, - "learning_rate": 1.9969160309964604e-06, - "loss": 1.0205, - "step": 6351 - }, - { - "epoch": 0.16, - "learning_rate": 1.9969138591580473e-06, - "loss": 0.9395, - "step": 6352 - }, - { - "epoch": 0.16, - "learning_rate": 1.9969116865563432e-06, - "loss": 0.8706, - "step": 6353 - }, - { - "epoch": 0.16, - "learning_rate": 1.9969095131913494e-06, - "loss": 0.9092, - "step": 6354 - }, - { - "epoch": 0.16, - "learning_rate": 1.996907339063068e-06, - "loss": 0.8008, - "step": 6355 - }, - { - "epoch": 0.16, - "learning_rate": 1.9969051641715004e-06, - "loss": 0.9756, - "step": 6356 - }, - { - "epoch": 0.16, - "learning_rate": 1.9969029885166483e-06, - "loss": 0.8838, - "step": 6357 - }, - { - "epoch": 0.16, - "learning_rate": 1.996900812098513e-06, - "loss": 0.9741, - "step": 6358 - }, - { - "epoch": 0.16, - "learning_rate": 1.996898634917097e-06, - "loss": 1.1738, - "step": 6359 - }, - { - "epoch": 0.16, - "learning_rate": 1.996896456972402e-06, - "loss": 0.7871, - "step": 6360 - }, - { - "epoch": 0.16, - "learning_rate": 1.996894278264429e-06, - "loss": 0.8726, - "step": 6361 - }, - { - "epoch": 0.16, - "learning_rate": 1.9968920987931797e-06, - "loss": 0.8018, - "step": 6362 - }, - { - "epoch": 0.16, - "learning_rate": 1.996889918558656e-06, - "loss": 1.0713, - "step": 6363 - }, - { - "epoch": 0.16, - "learning_rate": 1.9968877375608597e-06, - "loss": 1.0811, - "step": 6364 - }, - { - "epoch": 0.16, - "learning_rate": 1.996885555799792e-06, - "loss": 0.9482, - "step": 6365 - }, - { - "epoch": 0.16, - "learning_rate": 1.9968833732754547e-06, - "loss": 1.0879, - "step": 6366 - }, - { - "epoch": 0.16, - "learning_rate": 1.9968811899878502e-06, - "loss": 0.9551, - "step": 6367 - }, - { - "epoch": 0.16, - "learning_rate": 1.9968790059369792e-06, - "loss": 0.9316, - "step": 6368 - }, - { - "epoch": 0.16, - "learning_rate": 1.996876821122844e-06, - "loss": 0.8623, - "step": 6369 - }, - { - "epoch": 0.16, - "learning_rate": 1.996874635545446e-06, - "loss": 0.8101, - "step": 6370 - }, - { - "epoch": 0.16, - "learning_rate": 1.996872449204787e-06, - "loss": 1.1143, - "step": 6371 - }, - { - "epoch": 0.16, - "learning_rate": 1.9968702621008683e-06, - "loss": 0.645, - "step": 6372 - }, - { - "epoch": 0.16, - "learning_rate": 1.996868074233692e-06, - "loss": 0.8955, - "step": 6373 - }, - { - "epoch": 0.16, - "learning_rate": 1.99686588560326e-06, - "loss": 1.1309, - "step": 6374 - }, - { - "epoch": 0.16, - "learning_rate": 1.9968636962095732e-06, - "loss": 0.8711, - "step": 6375 - }, - { - "epoch": 0.16, - "learning_rate": 1.996861506052634e-06, - "loss": 0.9092, - "step": 6376 - }, - { - "epoch": 0.16, - "learning_rate": 1.9968593151324436e-06, - "loss": 1.0264, - "step": 6377 - }, - { - "epoch": 0.16, - "learning_rate": 1.996857123449004e-06, - "loss": 0.916, - "step": 6378 - }, - { - "epoch": 0.16, - "learning_rate": 1.9968549310023166e-06, - "loss": 0.9902, - "step": 6379 - }, - { - "epoch": 0.16, - "learning_rate": 1.996852737792383e-06, - "loss": 1.123, - "step": 6380 - }, - { - "epoch": 0.16, - "learning_rate": 1.9968505438192055e-06, - "loss": 0.8965, - "step": 6381 - }, - { - "epoch": 0.16, - "learning_rate": 1.9968483490827852e-06, - "loss": 0.8457, - "step": 6382 - }, - { - "epoch": 0.16, - "learning_rate": 1.996846153583124e-06, - "loss": 0.8975, - "step": 6383 - }, - { - "epoch": 0.16, - "learning_rate": 1.9968439573202235e-06, - "loss": 1.0332, - "step": 6384 - }, - { - "epoch": 0.16, - "learning_rate": 1.9968417602940856e-06, - "loss": 0.8154, - "step": 6385 - }, - { - "epoch": 0.16, - "learning_rate": 1.9968395625047116e-06, - "loss": 0.9316, - "step": 6386 - }, - { - "epoch": 0.16, - "learning_rate": 1.9968373639521034e-06, - "loss": 1.0498, - "step": 6387 - }, - { - "epoch": 0.16, - "learning_rate": 1.9968351646362625e-06, - "loss": 1.0127, - "step": 6388 - }, - { - "epoch": 0.16, - "learning_rate": 1.9968329645571912e-06, - "loss": 0.8799, - "step": 6389 - }, - { - "epoch": 0.16, - "learning_rate": 1.9968307637148903e-06, - "loss": 0.8184, - "step": 6390 - }, - { - "epoch": 0.16, - "learning_rate": 1.9968285621093623e-06, - "loss": 0.9658, - "step": 6391 - }, - { - "epoch": 0.16, - "learning_rate": 1.9968263597406084e-06, - "loss": 0.876, - "step": 6392 - }, - { - "epoch": 0.16, - "learning_rate": 1.99682415660863e-06, - "loss": 0.8955, - "step": 6393 - }, - { - "epoch": 0.16, - "learning_rate": 1.9968219527134297e-06, - "loss": 0.918, - "step": 6394 - }, - { - "epoch": 0.16, - "learning_rate": 1.9968197480550086e-06, - "loss": 0.9355, - "step": 6395 - }, - { - "epoch": 0.16, - "learning_rate": 1.996817542633368e-06, - "loss": 0.7949, - "step": 6396 - }, - { - "epoch": 0.16, - "learning_rate": 1.9968153364485105e-06, - "loss": 0.9604, - "step": 6397 - }, - { - "epoch": 0.16, - "learning_rate": 1.996813129500437e-06, - "loss": 1.1455, - "step": 6398 - }, - { - "epoch": 0.16, - "learning_rate": 1.99681092178915e-06, - "loss": 0.9883, - "step": 6399 - }, - { - "epoch": 0.16, - "learning_rate": 1.99680871331465e-06, - "loss": 1.0557, - "step": 6400 - }, - { - "epoch": 0.16, - "learning_rate": 1.9968065040769398e-06, - "loss": 1.1699, - "step": 6401 - }, - { - "epoch": 0.16, - "learning_rate": 1.996804294076021e-06, - "loss": 1.043, - "step": 6402 - }, - { - "epoch": 0.16, - "learning_rate": 1.9968020833118946e-06, - "loss": 0.8438, - "step": 6403 - }, - { - "epoch": 0.16, - "learning_rate": 1.9967998717845627e-06, - "loss": 0.9814, - "step": 6404 - }, - { - "epoch": 0.16, - "learning_rate": 1.996797659494027e-06, - "loss": 1.1953, - "step": 6405 - }, - { - "epoch": 0.16, - "learning_rate": 1.9967954464402893e-06, - "loss": 0.9336, - "step": 6406 - }, - { - "epoch": 0.16, - "learning_rate": 1.996793232623351e-06, - "loss": 0.959, - "step": 6407 - }, - { - "epoch": 0.16, - "learning_rate": 1.9967910180432143e-06, - "loss": 0.8877, - "step": 6408 - }, - { - "epoch": 0.16, - "learning_rate": 1.9967888026998804e-06, - "loss": 0.998, - "step": 6409 - }, - { - "epoch": 0.16, - "learning_rate": 1.9967865865933507e-06, - "loss": 0.8799, - "step": 6410 - }, - { - "epoch": 0.16, - "learning_rate": 1.996784369723628e-06, - "loss": 0.9597, - "step": 6411 - }, - { - "epoch": 0.16, - "learning_rate": 1.9967821520907127e-06, - "loss": 0.8857, - "step": 6412 - }, - { - "epoch": 0.16, - "learning_rate": 1.9967799336946073e-06, - "loss": 0.8716, - "step": 6413 - }, - { - "epoch": 0.16, - "learning_rate": 1.9967777145353137e-06, - "loss": 0.873, - "step": 6414 - }, - { - "epoch": 0.16, - "learning_rate": 1.996775494612833e-06, - "loss": 0.9395, - "step": 6415 - }, - { - "epoch": 0.16, - "learning_rate": 1.9967732739271674e-06, - "loss": 0.8901, - "step": 6416 - }, - { - "epoch": 0.16, - "learning_rate": 1.996771052478318e-06, - "loss": 0.9326, - "step": 6417 - }, - { - "epoch": 0.16, - "learning_rate": 1.9967688302662867e-06, - "loss": 0.9912, - "step": 6418 - }, - { - "epoch": 0.16, - "learning_rate": 1.9967666072910754e-06, - "loss": 0.8301, - "step": 6419 - }, - { - "epoch": 0.16, - "learning_rate": 1.996764383552686e-06, - "loss": 1.0166, - "step": 6420 - }, - { - "epoch": 0.16, - "learning_rate": 1.9967621590511203e-06, - "loss": 1.1211, - "step": 6421 - }, - { - "epoch": 0.16, - "learning_rate": 1.996759933786379e-06, - "loss": 0.896, - "step": 6422 - }, - { - "epoch": 0.16, - "learning_rate": 1.9967577077584647e-06, - "loss": 0.6357, - "step": 6423 - }, - { - "epoch": 0.16, - "learning_rate": 1.9967554809673785e-06, - "loss": 0.959, - "step": 6424 - }, - { - "epoch": 0.16, - "learning_rate": 1.9967532534131228e-06, - "loss": 0.75, - "step": 6425 - }, - { - "epoch": 0.16, - "learning_rate": 1.996751025095699e-06, - "loss": 0.8955, - "step": 6426 - }, - { - "epoch": 0.16, - "learning_rate": 1.996748796015109e-06, - "loss": 0.8506, - "step": 6427 - }, - { - "epoch": 0.16, - "learning_rate": 1.9967465661713535e-06, - "loss": 0.8428, - "step": 6428 - }, - { - "epoch": 0.16, - "learning_rate": 1.996744335564436e-06, - "loss": 0.8545, - "step": 6429 - }, - { - "epoch": 0.16, - "learning_rate": 1.9967421041943565e-06, - "loss": 0.8237, - "step": 6430 - }, - { - "epoch": 0.16, - "learning_rate": 1.9967398720611173e-06, - "loss": 0.7686, - "step": 6431 - }, - { - "epoch": 0.16, - "learning_rate": 1.9967376391647205e-06, - "loss": 0.8018, - "step": 6432 - }, - { - "epoch": 0.16, - "learning_rate": 1.9967354055051678e-06, - "loss": 1.1006, - "step": 6433 - }, - { - "epoch": 0.16, - "learning_rate": 1.9967331710824604e-06, - "loss": 0.7974, - "step": 6434 - }, - { - "epoch": 0.16, - "learning_rate": 1.9967309358966e-06, - "loss": 0.7788, - "step": 6435 - }, - { - "epoch": 0.16, - "learning_rate": 1.9967286999475888e-06, - "loss": 1.001, - "step": 6436 - }, - { - "epoch": 0.16, - "learning_rate": 1.996726463235428e-06, - "loss": 1.0625, - "step": 6437 - }, - { - "epoch": 0.17, - "learning_rate": 1.9967242257601197e-06, - "loss": 0.8262, - "step": 6438 - }, - { - "epoch": 0.17, - "learning_rate": 1.9967219875216657e-06, - "loss": 0.6118, - "step": 6439 - }, - { - "epoch": 0.17, - "learning_rate": 1.996719748520067e-06, - "loss": 1.0381, - "step": 6440 - }, - { - "epoch": 0.17, - "learning_rate": 1.9967175087553267e-06, - "loss": 0.9844, - "step": 6441 - }, - { - "epoch": 0.17, - "learning_rate": 1.996715268227445e-06, - "loss": 0.9404, - "step": 6442 - }, - { - "epoch": 0.17, - "learning_rate": 1.9967130269364245e-06, - "loss": 0.6919, - "step": 6443 - }, - { - "epoch": 0.17, - "learning_rate": 1.9967107848822666e-06, - "loss": 1.0918, - "step": 6444 - }, - { - "epoch": 0.17, - "learning_rate": 1.9967085420649727e-06, - "loss": 0.7017, - "step": 6445 - }, - { - "epoch": 0.17, - "learning_rate": 1.9967062984845453e-06, - "loss": 1.125, - "step": 6446 - }, - { - "epoch": 0.17, - "learning_rate": 1.9967040541409856e-06, - "loss": 0.7422, - "step": 6447 - }, - { - "epoch": 0.17, - "learning_rate": 1.9967018090342955e-06, - "loss": 0.8975, - "step": 6448 - }, - { - "epoch": 0.17, - "learning_rate": 1.996699563164477e-06, - "loss": 0.9033, - "step": 6449 - }, - { - "epoch": 0.17, - "learning_rate": 1.9966973165315304e-06, - "loss": 0.9717, - "step": 6450 - }, - { - "epoch": 0.17, - "learning_rate": 1.9966950691354593e-06, - "loss": 0.9268, - "step": 6451 - }, - { - "epoch": 0.17, - "learning_rate": 1.9966928209762644e-06, - "loss": 1.1016, - "step": 6452 - }, - { - "epoch": 0.17, - "learning_rate": 1.996690572053948e-06, - "loss": 0.8779, - "step": 6453 - }, - { - "epoch": 0.17, - "learning_rate": 1.996688322368511e-06, - "loss": 1.0664, - "step": 6454 - }, - { - "epoch": 0.17, - "learning_rate": 1.996686071919956e-06, - "loss": 0.9004, - "step": 6455 - }, - { - "epoch": 0.17, - "learning_rate": 1.996683820708284e-06, - "loss": 0.8984, - "step": 6456 - }, - { - "epoch": 0.17, - "learning_rate": 1.9966815687334974e-06, - "loss": 0.9014, - "step": 6457 - }, - { - "epoch": 0.17, - "learning_rate": 1.996679315995597e-06, - "loss": 0.8501, - "step": 6458 - }, - { - "epoch": 0.17, - "learning_rate": 1.9966770624945854e-06, - "loss": 0.96, - "step": 6459 - }, - { - "epoch": 0.17, - "learning_rate": 1.9966748082304637e-06, - "loss": 0.9805, - "step": 6460 - }, - { - "epoch": 0.17, - "learning_rate": 1.9966725532032343e-06, - "loss": 0.9482, - "step": 6461 - }, - { - "epoch": 0.17, - "learning_rate": 1.9966702974128985e-06, - "loss": 1.0703, - "step": 6462 - }, - { - "epoch": 0.17, - "learning_rate": 1.996668040859458e-06, - "loss": 1.0303, - "step": 6463 - }, - { - "epoch": 0.17, - "learning_rate": 1.9966657835429146e-06, - "loss": 0.9668, - "step": 6464 - }, - { - "epoch": 0.17, - "learning_rate": 1.99666352546327e-06, - "loss": 0.915, - "step": 6465 - }, - { - "epoch": 0.17, - "learning_rate": 1.996661266620526e-06, - "loss": 0.8291, - "step": 6466 - }, - { - "epoch": 0.17, - "learning_rate": 1.9966590070146845e-06, - "loss": 0.8877, - "step": 6467 - }, - { - "epoch": 0.17, - "learning_rate": 1.996656746645747e-06, - "loss": 0.8838, - "step": 6468 - }, - { - "epoch": 0.17, - "learning_rate": 1.9966544855137147e-06, - "loss": 1.1133, - "step": 6469 - }, - { - "epoch": 0.17, - "learning_rate": 1.99665222361859e-06, - "loss": 1.0146, - "step": 6470 - }, - { - "epoch": 0.17, - "learning_rate": 1.9966499609603753e-06, - "loss": 0.9326, - "step": 6471 - }, - { - "epoch": 0.17, - "learning_rate": 1.996647697539071e-06, - "loss": 0.9346, - "step": 6472 - }, - { - "epoch": 0.17, - "learning_rate": 1.9966454333546794e-06, - "loss": 0.9844, - "step": 6473 - }, - { - "epoch": 0.17, - "learning_rate": 1.996643168407202e-06, - "loss": 0.9541, - "step": 6474 - }, - { - "epoch": 0.17, - "learning_rate": 1.996640902696641e-06, - "loss": 0.9165, - "step": 6475 - }, - { - "epoch": 0.17, - "learning_rate": 1.996638636222998e-06, - "loss": 0.8203, - "step": 6476 - }, - { - "epoch": 0.17, - "learning_rate": 1.9966363689862744e-06, - "loss": 0.957, - "step": 6477 - }, - { - "epoch": 0.17, - "learning_rate": 1.9966341009864725e-06, - "loss": 0.8901, - "step": 6478 - }, - { - "epoch": 0.17, - "learning_rate": 1.9966318322235933e-06, - "loss": 0.833, - "step": 6479 - }, - { - "epoch": 0.17, - "learning_rate": 1.996629562697639e-06, - "loss": 1.0762, - "step": 6480 - }, - { - "epoch": 0.17, - "learning_rate": 1.9966272924086116e-06, - "loss": 0.9014, - "step": 6481 - }, - { - "epoch": 0.17, - "learning_rate": 1.9966250213565125e-06, - "loss": 1.1367, - "step": 6482 - }, - { - "epoch": 0.17, - "learning_rate": 1.996622749541343e-06, - "loss": 0.6929, - "step": 6483 - }, - { - "epoch": 0.17, - "learning_rate": 1.9966204769631055e-06, - "loss": 0.8105, - "step": 6484 - }, - { - "epoch": 0.17, - "learning_rate": 1.996618203621802e-06, - "loss": 0.7129, - "step": 6485 - }, - { - "epoch": 0.17, - "learning_rate": 1.996615929517433e-06, - "loss": 1.1006, - "step": 6486 - }, - { - "epoch": 0.17, - "learning_rate": 1.996613654650001e-06, - "loss": 1.1992, - "step": 6487 - }, - { - "epoch": 0.17, - "learning_rate": 1.9966113790195084e-06, - "loss": 1.0059, - "step": 6488 - }, - { - "epoch": 0.17, - "learning_rate": 1.996609102625956e-06, - "loss": 0.9121, - "step": 6489 - }, - { - "epoch": 0.17, - "learning_rate": 1.9966068254693454e-06, - "loss": 0.832, - "step": 6490 - }, - { - "epoch": 0.17, - "learning_rate": 1.9966045475496792e-06, - "loss": 0.9077, - "step": 6491 - }, - { - "epoch": 0.17, - "learning_rate": 1.9966022688669592e-06, - "loss": 0.791, - "step": 6492 - }, - { - "epoch": 0.17, - "learning_rate": 1.9965999894211862e-06, - "loss": 0.8594, - "step": 6493 - }, - { - "epoch": 0.17, - "learning_rate": 1.996597709212362e-06, - "loss": 0.9971, - "step": 6494 - }, - { - "epoch": 0.17, - "learning_rate": 1.996595428240489e-06, - "loss": 1.0986, - "step": 6495 - }, - { - "epoch": 0.17, - "learning_rate": 1.9965931465055694e-06, - "loss": 0.9072, - "step": 6496 - }, - { - "epoch": 0.17, - "learning_rate": 1.9965908640076034e-06, - "loss": 0.8477, - "step": 6497 - }, - { - "epoch": 0.17, - "learning_rate": 1.996588580746594e-06, - "loss": 0.8984, - "step": 6498 - }, - { - "epoch": 0.17, - "learning_rate": 1.9965862967225423e-06, - "loss": 0.6973, - "step": 6499 - }, - { - "epoch": 0.17, - "learning_rate": 1.9965840119354503e-06, - "loss": 1.0225, - "step": 6500 - }, - { - "epoch": 0.17, - "learning_rate": 1.99658172638532e-06, - "loss": 0.9058, - "step": 6501 - }, - { - "epoch": 0.17, - "learning_rate": 1.996579440072153e-06, - "loss": 0.8584, - "step": 6502 - }, - { - "epoch": 0.17, - "learning_rate": 1.9965771529959504e-06, - "loss": 0.6104, - "step": 6503 - }, - { - "epoch": 0.17, - "learning_rate": 1.996574865156715e-06, - "loss": 0.8447, - "step": 6504 - }, - { - "epoch": 0.17, - "learning_rate": 1.996572576554448e-06, - "loss": 0.6143, - "step": 6505 - }, - { - "epoch": 0.17, - "learning_rate": 1.996570287189151e-06, - "loss": 0.9668, - "step": 6506 - }, - { - "epoch": 0.17, - "learning_rate": 1.996567997060826e-06, - "loss": 0.7373, - "step": 6507 - }, - { - "epoch": 0.17, - "learning_rate": 1.9965657061694748e-06, - "loss": 0.8442, - "step": 6508 - }, - { - "epoch": 0.17, - "learning_rate": 1.996563414515099e-06, - "loss": 0.6055, - "step": 6509 - }, - { - "epoch": 0.17, - "learning_rate": 1.9965611220977005e-06, - "loss": 0.9355, - "step": 6510 - }, - { - "epoch": 0.17, - "learning_rate": 1.9965588289172806e-06, - "loss": 1.0137, - "step": 6511 - }, - { - "epoch": 0.17, - "learning_rate": 1.996556534973842e-06, - "loss": 1.0029, - "step": 6512 - }, - { - "epoch": 0.17, - "learning_rate": 1.9965542402673855e-06, - "loss": 0.8228, - "step": 6513 - }, - { - "epoch": 0.17, - "learning_rate": 1.9965519447979133e-06, - "loss": 0.7617, - "step": 6514 - }, - { - "epoch": 0.17, - "learning_rate": 1.996549648565427e-06, - "loss": 0.9053, - "step": 6515 - }, - { - "epoch": 0.17, - "learning_rate": 1.996547351569929e-06, - "loss": 0.8662, - "step": 6516 - }, - { - "epoch": 0.17, - "learning_rate": 1.99654505381142e-06, - "loss": 1.1113, - "step": 6517 - }, - { - "epoch": 0.17, - "learning_rate": 1.996542755289902e-06, - "loss": 0.959, - "step": 6518 - }, - { - "epoch": 0.17, - "learning_rate": 1.996540456005378e-06, - "loss": 0.9854, - "step": 6519 - }, - { - "epoch": 0.17, - "learning_rate": 1.996538155957848e-06, - "loss": 0.8896, - "step": 6520 - }, - { - "epoch": 0.17, - "learning_rate": 1.9965358551473147e-06, - "loss": 1.0771, - "step": 6521 - }, - { - "epoch": 0.17, - "learning_rate": 1.99653355357378e-06, - "loss": 1.042, - "step": 6522 - }, - { - "epoch": 0.17, - "learning_rate": 1.996531251237245e-06, - "loss": 0.8857, - "step": 6523 - }, - { - "epoch": 0.17, - "learning_rate": 1.9965289481377117e-06, - "loss": 1.0039, - "step": 6524 - }, - { - "epoch": 0.17, - "learning_rate": 1.9965266442751827e-06, - "loss": 0.8174, - "step": 6525 - }, - { - "epoch": 0.17, - "learning_rate": 1.9965243396496583e-06, - "loss": 0.8916, - "step": 6526 - }, - { - "epoch": 0.17, - "learning_rate": 1.996522034261142e-06, - "loss": 0.8667, - "step": 6527 - }, - { - "epoch": 0.17, - "learning_rate": 1.996519728109634e-06, - "loss": 0.9131, - "step": 6528 - }, - { - "epoch": 0.17, - "learning_rate": 1.9965174211951363e-06, - "loss": 0.6948, - "step": 6529 - }, - { - "epoch": 0.17, - "learning_rate": 1.996515113517652e-06, - "loss": 0.8213, - "step": 6530 - }, - { - "epoch": 0.17, - "learning_rate": 1.996512805077181e-06, - "loss": 1.1201, - "step": 6531 - }, - { - "epoch": 0.17, - "learning_rate": 1.9965104958737263e-06, - "loss": 1.0059, - "step": 6532 - }, - { - "epoch": 0.17, - "learning_rate": 1.9965081859072894e-06, - "loss": 0.957, - "step": 6533 - }, - { - "epoch": 0.17, - "learning_rate": 1.996505875177872e-06, - "loss": 1.0039, - "step": 6534 - }, - { - "epoch": 0.17, - "learning_rate": 1.9965035636854756e-06, - "loss": 1.0137, - "step": 6535 - }, - { - "epoch": 0.17, - "learning_rate": 1.9965012514301024e-06, - "loss": 1.0156, - "step": 6536 - }, - { - "epoch": 0.17, - "learning_rate": 1.9964989384117538e-06, - "loss": 0.7607, - "step": 6537 - }, - { - "epoch": 0.17, - "learning_rate": 1.996496624630432e-06, - "loss": 0.8857, - "step": 6538 - }, - { - "epoch": 0.17, - "learning_rate": 1.9964943100861388e-06, - "loss": 0.7485, - "step": 6539 - }, - { - "epoch": 0.17, - "learning_rate": 1.9964919947788754e-06, - "loss": 1.1875, - "step": 6540 - }, - { - "epoch": 0.17, - "learning_rate": 1.996489678708644e-06, - "loss": 1.0137, - "step": 6541 - }, - { - "epoch": 0.17, - "learning_rate": 1.9964873618754467e-06, - "loss": 0.9453, - "step": 6542 - }, - { - "epoch": 0.17, - "learning_rate": 1.9964850442792844e-06, - "loss": 1.0039, - "step": 6543 - }, - { - "epoch": 0.17, - "learning_rate": 1.996482725920159e-06, - "loss": 0.8579, - "step": 6544 - }, - { - "epoch": 0.17, - "learning_rate": 1.996480406798073e-06, - "loss": 1.0586, - "step": 6545 - }, - { - "epoch": 0.17, - "learning_rate": 1.9964780869130276e-06, - "loss": 0.8389, - "step": 6546 - }, - { - "epoch": 0.17, - "learning_rate": 1.996475766265025e-06, - "loss": 1.3164, - "step": 6547 - }, - { - "epoch": 0.17, - "learning_rate": 1.996473444854067e-06, - "loss": 0.8145, - "step": 6548 - }, - { - "epoch": 0.17, - "learning_rate": 1.9964711226801547e-06, - "loss": 0.8389, - "step": 6549 - }, - { - "epoch": 0.17, - "learning_rate": 1.99646879974329e-06, - "loss": 1.0762, - "step": 6550 - }, - { - "epoch": 0.17, - "learning_rate": 1.996466476043475e-06, - "loss": 1.0264, - "step": 6551 - }, - { - "epoch": 0.17, - "learning_rate": 1.9964641515807118e-06, - "loss": 0.9404, - "step": 6552 - }, - { - "epoch": 0.17, - "learning_rate": 1.9964618263550018e-06, - "loss": 0.7397, - "step": 6553 - }, - { - "epoch": 0.17, - "learning_rate": 1.9964595003663467e-06, - "loss": 0.9473, - "step": 6554 - }, - { - "epoch": 0.17, - "learning_rate": 1.9964571736147484e-06, - "loss": 0.873, - "step": 6555 - }, - { - "epoch": 0.17, - "learning_rate": 1.9964548461002084e-06, - "loss": 0.9961, - "step": 6556 - }, - { - "epoch": 0.17, - "learning_rate": 1.9964525178227293e-06, - "loss": 0.9014, - "step": 6557 - }, - { - "epoch": 0.17, - "learning_rate": 1.9964501887823116e-06, - "loss": 0.9873, - "step": 6558 - }, - { - "epoch": 0.17, - "learning_rate": 1.9964478589789586e-06, - "loss": 0.8423, - "step": 6559 - }, - { - "epoch": 0.17, - "learning_rate": 1.9964455284126707e-06, - "loss": 0.9336, - "step": 6560 - }, - { - "epoch": 0.17, - "learning_rate": 1.9964431970834505e-06, - "loss": 0.9727, - "step": 6561 - }, - { - "epoch": 0.17, - "learning_rate": 1.9964408649912997e-06, - "loss": 1.1426, - "step": 6562 - }, - { - "epoch": 0.17, - "learning_rate": 1.9964385321362195e-06, - "loss": 0.7136, - "step": 6563 - }, - { - "epoch": 0.17, - "learning_rate": 1.9964361985182125e-06, - "loss": 1.0742, - "step": 6564 - }, - { - "epoch": 0.17, - "learning_rate": 1.99643386413728e-06, - "loss": 0.8398, - "step": 6565 - }, - { - "epoch": 0.17, - "learning_rate": 1.996431528993424e-06, - "loss": 1.0449, - "step": 6566 - }, - { - "epoch": 0.17, - "learning_rate": 1.996429193086646e-06, - "loss": 0.8555, - "step": 6567 - }, - { - "epoch": 0.17, - "learning_rate": 1.9964268564169482e-06, - "loss": 0.9033, - "step": 6568 - }, - { - "epoch": 0.17, - "learning_rate": 1.996424518984332e-06, - "loss": 1.1035, - "step": 6569 - }, - { - "epoch": 0.17, - "learning_rate": 1.9964221807888e-06, - "loss": 0.9482, - "step": 6570 - }, - { - "epoch": 0.17, - "learning_rate": 1.9964198418303523e-06, - "loss": 1.0615, - "step": 6571 - }, - { - "epoch": 0.17, - "learning_rate": 1.996417502108992e-06, - "loss": 1.0762, - "step": 6572 - }, - { - "epoch": 0.17, - "learning_rate": 1.9964151616247214e-06, - "loss": 0.8154, - "step": 6573 - }, - { - "epoch": 0.17, - "learning_rate": 1.996412820377541e-06, - "loss": 0.7856, - "step": 6574 - }, - { - "epoch": 0.17, - "learning_rate": 1.9964104783674532e-06, - "loss": 0.8926, - "step": 6575 - }, - { - "epoch": 0.17, - "learning_rate": 1.9964081355944596e-06, - "loss": 1.1016, - "step": 6576 - }, - { - "epoch": 0.17, - "learning_rate": 1.996405792058562e-06, - "loss": 0.9014, - "step": 6577 - }, - { - "epoch": 0.17, - "learning_rate": 1.9964034477597623e-06, - "loss": 0.8018, - "step": 6578 - }, - { - "epoch": 0.17, - "learning_rate": 1.9964011026980628e-06, - "loss": 0.9951, - "step": 6579 - }, - { - "epoch": 0.17, - "learning_rate": 1.9963987568734644e-06, - "loss": 0.959, - "step": 6580 - }, - { - "epoch": 0.17, - "learning_rate": 1.9963964102859693e-06, - "loss": 0.9346, - "step": 6581 - }, - { - "epoch": 0.17, - "learning_rate": 1.996394062935579e-06, - "loss": 0.9424, - "step": 6582 - }, - { - "epoch": 0.17, - "learning_rate": 1.996391714822296e-06, - "loss": 0.8545, - "step": 6583 - }, - { - "epoch": 0.17, - "learning_rate": 1.9963893659461217e-06, - "loss": 0.937, - "step": 6584 - }, - { - "epoch": 0.17, - "learning_rate": 1.996387016307058e-06, - "loss": 0.9502, - "step": 6585 - }, - { - "epoch": 0.17, - "learning_rate": 1.996384665905106e-06, - "loss": 0.9941, - "step": 6586 - }, - { - "epoch": 0.17, - "learning_rate": 1.9963823147402683e-06, - "loss": 1.0098, - "step": 6587 - }, - { - "epoch": 0.17, - "learning_rate": 1.996379962812547e-06, - "loss": 0.9014, - "step": 6588 - }, - { - "epoch": 0.17, - "learning_rate": 1.996377610121943e-06, - "loss": 0.9961, - "step": 6589 - }, - { - "epoch": 0.17, - "learning_rate": 1.9963752566684586e-06, - "loss": 0.8774, - "step": 6590 - }, - { - "epoch": 0.17, - "learning_rate": 1.996372902452095e-06, - "loss": 0.8892, - "step": 6591 - }, - { - "epoch": 0.17, - "learning_rate": 1.996370547472855e-06, - "loss": 0.96, - "step": 6592 - }, - { - "epoch": 0.17, - "learning_rate": 1.9963681917307395e-06, - "loss": 1.002, - "step": 6593 - }, - { - "epoch": 0.17, - "learning_rate": 1.9963658352257507e-06, - "loss": 0.876, - "step": 6594 - }, - { - "epoch": 0.17, - "learning_rate": 1.9963634779578905e-06, - "loss": 0.8013, - "step": 6595 - }, - { - "epoch": 0.17, - "learning_rate": 1.9963611199271607e-06, - "loss": 0.9932, - "step": 6596 - }, - { - "epoch": 0.17, - "learning_rate": 1.9963587611335634e-06, - "loss": 1.0645, - "step": 6597 - }, - { - "epoch": 0.17, - "learning_rate": 1.9963564015770994e-06, - "loss": 0.8672, - "step": 6598 - }, - { - "epoch": 0.17, - "learning_rate": 1.9963540412577713e-06, - "loss": 0.9658, - "step": 6599 - }, - { - "epoch": 0.17, - "learning_rate": 1.9963516801755807e-06, - "loss": 1.0684, - "step": 6600 - }, - { - "epoch": 0.17, - "learning_rate": 1.9963493183305294e-06, - "loss": 1.0293, - "step": 6601 - }, - { - "epoch": 0.17, - "learning_rate": 1.9963469557226195e-06, - "loss": 0.8496, - "step": 6602 - }, - { - "epoch": 0.17, - "learning_rate": 1.9963445923518522e-06, - "loss": 0.8779, - "step": 6603 - }, - { - "epoch": 0.17, - "learning_rate": 1.9963422282182297e-06, - "loss": 0.9053, - "step": 6604 - }, - { - "epoch": 0.17, - "learning_rate": 1.996339863321754e-06, - "loss": 0.9258, - "step": 6605 - }, - { - "epoch": 0.17, - "learning_rate": 1.9963374976624266e-06, - "loss": 1.083, - "step": 6606 - }, - { - "epoch": 0.17, - "learning_rate": 1.9963351312402494e-06, - "loss": 0.8184, - "step": 6607 - }, - { - "epoch": 0.17, - "learning_rate": 1.996332764055224e-06, - "loss": 0.7705, - "step": 6608 - }, - { - "epoch": 0.17, - "learning_rate": 1.9963303961073525e-06, - "loss": 0.6948, - "step": 6609 - }, - { - "epoch": 0.17, - "learning_rate": 1.996328027396637e-06, - "loss": 0.7383, - "step": 6610 - }, - { - "epoch": 0.17, - "learning_rate": 1.9963256579230784e-06, - "loss": 0.9258, - "step": 6611 - }, - { - "epoch": 0.17, - "learning_rate": 1.9963232876866796e-06, - "loss": 0.8945, - "step": 6612 - }, - { - "epoch": 0.17, - "learning_rate": 1.9963209166874413e-06, - "loss": 1.0166, - "step": 6613 - }, - { - "epoch": 0.17, - "learning_rate": 1.996318544925366e-06, - "loss": 0.876, - "step": 6614 - }, - { - "epoch": 0.17, - "learning_rate": 1.9963161724004556e-06, - "loss": 1.1016, - "step": 6615 - }, - { - "epoch": 0.17, - "learning_rate": 1.9963137991127117e-06, - "loss": 0.7764, - "step": 6616 - }, - { - "epoch": 0.17, - "learning_rate": 1.9963114250621363e-06, - "loss": 1.0664, - "step": 6617 - }, - { - "epoch": 0.17, - "learning_rate": 1.996309050248731e-06, - "loss": 1.1133, - "step": 6618 - }, - { - "epoch": 0.17, - "learning_rate": 1.9963066746724973e-06, - "loss": 0.8018, - "step": 6619 - }, - { - "epoch": 0.17, - "learning_rate": 1.996304298333438e-06, - "loss": 0.7847, - "step": 6620 - }, - { - "epoch": 0.17, - "learning_rate": 1.9963019212315533e-06, - "loss": 0.8906, - "step": 6621 - }, - { - "epoch": 0.17, - "learning_rate": 1.996299543366847e-06, - "loss": 0.9932, - "step": 6622 - }, - { - "epoch": 0.17, - "learning_rate": 1.9962971647393197e-06, - "loss": 0.9609, - "step": 6623 - }, - { - "epoch": 0.17, - "learning_rate": 1.9962947853489732e-06, - "loss": 0.8926, - "step": 6624 - }, - { - "epoch": 0.17, - "learning_rate": 1.99629240519581e-06, - "loss": 0.6577, - "step": 6625 - }, - { - "epoch": 0.17, - "learning_rate": 1.996290024279831e-06, - "loss": 1.002, - "step": 6626 - }, - { - "epoch": 0.17, - "learning_rate": 1.996287642601039e-06, - "loss": 1.0479, - "step": 6627 - }, - { - "epoch": 0.17, - "learning_rate": 1.996285260159435e-06, - "loss": 1.0371, - "step": 6628 - }, - { - "epoch": 0.17, - "learning_rate": 1.9962828769550216e-06, - "loss": 1.0391, - "step": 6629 - }, - { - "epoch": 0.17, - "learning_rate": 1.9962804929878e-06, - "loss": 0.9004, - "step": 6630 - }, - { - "epoch": 0.17, - "learning_rate": 1.996278108257772e-06, - "loss": 0.8223, - "step": 6631 - }, - { - "epoch": 0.17, - "learning_rate": 1.99627572276494e-06, - "loss": 0.7305, - "step": 6632 - }, - { - "epoch": 0.17, - "learning_rate": 1.9962733365093058e-06, - "loss": 0.8799, - "step": 6633 - }, - { - "epoch": 0.17, - "learning_rate": 1.9962709494908702e-06, - "loss": 1.1211, - "step": 6634 - }, - { - "epoch": 0.17, - "learning_rate": 1.996268561709636e-06, - "loss": 0.8755, - "step": 6635 - }, - { - "epoch": 0.17, - "learning_rate": 1.996266173165605e-06, - "loss": 0.7661, - "step": 6636 - }, - { - "epoch": 0.17, - "learning_rate": 1.9962637838587786e-06, - "loss": 1.0527, - "step": 6637 - }, - { - "epoch": 0.17, - "learning_rate": 1.9962613937891584e-06, - "loss": 1.0781, - "step": 6638 - }, - { - "epoch": 0.17, - "learning_rate": 1.9962590029567474e-06, - "loss": 1.0586, - "step": 6639 - }, - { - "epoch": 0.17, - "learning_rate": 1.9962566113615464e-06, - "loss": 0.916, - "step": 6640 - }, - { - "epoch": 0.17, - "learning_rate": 1.9962542190035574e-06, - "loss": 0.9131, - "step": 6641 - }, - { - "epoch": 0.17, - "learning_rate": 1.9962518258827827e-06, - "loss": 0.6523, - "step": 6642 - }, - { - "epoch": 0.17, - "learning_rate": 1.9962494319992235e-06, - "loss": 0.9883, - "step": 6643 - }, - { - "epoch": 0.17, - "learning_rate": 1.996247037352882e-06, - "loss": 0.832, - "step": 6644 - }, - { - "epoch": 0.17, - "learning_rate": 1.9962446419437595e-06, - "loss": 0.9111, - "step": 6645 - }, - { - "epoch": 0.17, - "learning_rate": 1.996242245771859e-06, - "loss": 0.9482, - "step": 6646 - }, - { - "epoch": 0.17, - "learning_rate": 1.9962398488371813e-06, - "loss": 0.8008, - "step": 6647 - }, - { - "epoch": 0.17, - "learning_rate": 1.9962374511397287e-06, - "loss": 1.0186, - "step": 6648 - }, - { - "epoch": 0.17, - "learning_rate": 1.9962350526795027e-06, - "loss": 0.8516, - "step": 6649 - }, - { - "epoch": 0.17, - "learning_rate": 1.9962326534565057e-06, - "loss": 0.8857, - "step": 6650 - }, - { - "epoch": 0.17, - "learning_rate": 1.9962302534707386e-06, - "loss": 0.9404, - "step": 6651 - }, - { - "epoch": 0.17, - "learning_rate": 1.996227852722204e-06, - "loss": 0.9072, - "step": 6652 - }, - { - "epoch": 0.17, - "learning_rate": 1.9962254512109037e-06, - "loss": 1.0166, - "step": 6653 - }, - { - "epoch": 0.17, - "learning_rate": 1.9962230489368394e-06, - "loss": 0.9004, - "step": 6654 - }, - { - "epoch": 0.17, - "learning_rate": 1.996220645900013e-06, - "loss": 0.9473, - "step": 6655 - }, - { - "epoch": 0.17, - "learning_rate": 1.996218242100426e-06, - "loss": 0.5815, - "step": 6656 - }, - { - "epoch": 0.17, - "learning_rate": 1.9962158375380804e-06, - "loss": 0.8896, - "step": 6657 - }, - { - "epoch": 0.17, - "learning_rate": 1.9962134322129785e-06, - "loss": 0.9814, - "step": 6658 - }, - { - "epoch": 0.17, - "learning_rate": 1.9962110261251216e-06, - "loss": 0.8418, - "step": 6659 - }, - { - "epoch": 0.17, - "learning_rate": 1.9962086192745116e-06, - "loss": 1.0615, - "step": 6660 - }, - { - "epoch": 0.17, - "learning_rate": 1.9962062116611505e-06, - "loss": 0.9717, - "step": 6661 - }, - { - "epoch": 0.17, - "learning_rate": 1.9962038032850405e-06, - "loss": 1.0303, - "step": 6662 - }, - { - "epoch": 0.17, - "learning_rate": 1.9962013941461825e-06, - "loss": 0.9092, - "step": 6663 - }, - { - "epoch": 0.17, - "learning_rate": 1.9961989842445792e-06, - "loss": 0.8994, - "step": 6664 - }, - { - "epoch": 0.17, - "learning_rate": 1.9961965735802318e-06, - "loss": 0.833, - "step": 6665 - }, - { - "epoch": 0.17, - "learning_rate": 1.996194162153143e-06, - "loss": 0.8945, - "step": 6666 - }, - { - "epoch": 0.17, - "learning_rate": 1.996191749963314e-06, - "loss": 1.1377, - "step": 6667 - }, - { - "epoch": 0.17, - "learning_rate": 1.996189337010747e-06, - "loss": 0.8018, - "step": 6668 - }, - { - "epoch": 0.17, - "learning_rate": 1.996186923295443e-06, - "loss": 0.916, - "step": 6669 - }, - { - "epoch": 0.17, - "learning_rate": 1.9961845088174048e-06, - "loss": 0.8525, - "step": 6670 - }, - { - "epoch": 0.17, - "learning_rate": 1.996182093576634e-06, - "loss": 0.7646, - "step": 6671 - }, - { - "epoch": 0.17, - "learning_rate": 1.9961796775731325e-06, - "loss": 0.8887, - "step": 6672 - }, - { - "epoch": 0.17, - "learning_rate": 1.9961772608069015e-06, - "loss": 0.9189, - "step": 6673 - }, - { - "epoch": 0.17, - "learning_rate": 1.996174843277944e-06, - "loss": 0.8721, - "step": 6674 - }, - { - "epoch": 0.17, - "learning_rate": 1.996172424986261e-06, - "loss": 0.8467, - "step": 6675 - }, - { - "epoch": 0.17, - "learning_rate": 1.9961700059318544e-06, - "loss": 0.9854, - "step": 6676 - }, - { - "epoch": 0.17, - "learning_rate": 1.9961675861147264e-06, - "loss": 1.0059, - "step": 6677 - }, - { - "epoch": 0.17, - "learning_rate": 1.9961651655348786e-06, - "loss": 0.8311, - "step": 6678 - }, - { - "epoch": 0.17, - "learning_rate": 1.996162744192313e-06, - "loss": 0.9434, - "step": 6679 - }, - { - "epoch": 0.17, - "learning_rate": 1.9961603220870313e-06, - "loss": 0.9863, - "step": 6680 - }, - { - "epoch": 0.17, - "learning_rate": 1.996157899219036e-06, - "loss": 0.7812, - "step": 6681 - }, - { - "epoch": 0.17, - "learning_rate": 1.9961554755883275e-06, - "loss": 1.166, - "step": 6682 - }, - { - "epoch": 0.17, - "learning_rate": 1.996153051194909e-06, - "loss": 1.0332, - "step": 6683 - }, - { - "epoch": 0.17, - "learning_rate": 1.996150626038782e-06, - "loss": 0.9102, - "step": 6684 - }, - { - "epoch": 0.17, - "learning_rate": 1.996148200119948e-06, - "loss": 0.8403, - "step": 6685 - }, - { - "epoch": 0.17, - "learning_rate": 1.9961457734384096e-06, - "loss": 0.9434, - "step": 6686 - }, - { - "epoch": 0.17, - "learning_rate": 1.9961433459941675e-06, - "loss": 1.0762, - "step": 6687 - }, - { - "epoch": 0.17, - "learning_rate": 1.9961409177872247e-06, - "loss": 0.9736, - "step": 6688 - }, - { - "epoch": 0.17, - "learning_rate": 1.9961384888175826e-06, - "loss": 1.2139, - "step": 6689 - }, - { - "epoch": 0.17, - "learning_rate": 1.996136059085243e-06, - "loss": 0.8682, - "step": 6690 - }, - { - "epoch": 0.17, - "learning_rate": 1.9961336285902077e-06, - "loss": 0.8281, - "step": 6691 - }, - { - "epoch": 0.17, - "learning_rate": 1.996131197332479e-06, - "loss": 0.8413, - "step": 6692 - }, - { - "epoch": 0.17, - "learning_rate": 1.9961287653120583e-06, - "loss": 0.75, - "step": 6693 - }, - { - "epoch": 0.17, - "learning_rate": 1.9961263325289476e-06, - "loss": 1.0264, - "step": 6694 - }, - { - "epoch": 0.17, - "learning_rate": 1.9961238989831485e-06, - "loss": 1.0576, - "step": 6695 - }, - { - "epoch": 0.17, - "learning_rate": 1.996121464674663e-06, - "loss": 1.0088, - "step": 6696 - }, - { - "epoch": 0.17, - "learning_rate": 1.996119029603494e-06, - "loss": 0.7788, - "step": 6697 - }, - { - "epoch": 0.17, - "learning_rate": 1.9961165937696414e-06, - "loss": 0.9004, - "step": 6698 - }, - { - "epoch": 0.17, - "learning_rate": 1.9961141571731092e-06, - "loss": 1.0332, - "step": 6699 - }, - { - "epoch": 0.17, - "learning_rate": 1.996111719813897e-06, - "loss": 0.8955, - "step": 6700 - }, - { - "epoch": 0.17, - "learning_rate": 1.996109281692009e-06, - "loss": 0.9209, - "step": 6701 - }, - { - "epoch": 0.17, - "learning_rate": 1.996106842807445e-06, - "loss": 1.0049, - "step": 6702 - }, - { - "epoch": 0.17, - "learning_rate": 1.9961044031602085e-06, - "loss": 0.8115, - "step": 6703 - }, - { - "epoch": 0.17, - "learning_rate": 1.9961019627503005e-06, - "loss": 0.8579, - "step": 6704 - }, - { - "epoch": 0.17, - "learning_rate": 1.9960995215777227e-06, - "loss": 0.7529, - "step": 6705 - }, - { - "epoch": 0.17, - "learning_rate": 1.996097079642478e-06, - "loss": 0.8369, - "step": 6706 - }, - { - "epoch": 0.17, - "learning_rate": 1.9960946369445665e-06, - "loss": 0.9121, - "step": 6707 - }, - { - "epoch": 0.17, - "learning_rate": 1.996092193483992e-06, - "loss": 0.9644, - "step": 6708 - }, - { - "epoch": 0.17, - "learning_rate": 1.996089749260755e-06, - "loss": 1.0078, - "step": 6709 - }, - { - "epoch": 0.17, - "learning_rate": 1.9960873042748583e-06, - "loss": 0.9521, - "step": 6710 - }, - { - "epoch": 0.17, - "learning_rate": 1.9960848585263032e-06, - "loss": 0.8652, - "step": 6711 - }, - { - "epoch": 0.17, - "learning_rate": 1.9960824120150916e-06, - "loss": 0.9199, - "step": 6712 - }, - { - "epoch": 0.17, - "learning_rate": 1.9960799647412254e-06, - "loss": 1.002, - "step": 6713 - }, - { - "epoch": 0.17, - "learning_rate": 1.996077516704707e-06, - "loss": 0.9258, - "step": 6714 - }, - { - "epoch": 0.17, - "learning_rate": 1.9960750679055372e-06, - "loss": 0.8594, - "step": 6715 - }, - { - "epoch": 0.17, - "learning_rate": 1.996072618343719e-06, - "loss": 0.7705, - "step": 6716 - }, - { - "epoch": 0.17, - "learning_rate": 1.996070168019254e-06, - "loss": 0.959, - "step": 6717 - }, - { - "epoch": 0.17, - "learning_rate": 1.9960677169321433e-06, - "loss": 0.9766, - "step": 6718 - }, - { - "epoch": 0.17, - "learning_rate": 1.9960652650823896e-06, - "loss": 0.8457, - "step": 6719 - }, - { - "epoch": 0.17, - "learning_rate": 1.9960628124699945e-06, - "loss": 0.9814, - "step": 6720 - }, - { - "epoch": 0.17, - "learning_rate": 1.99606035909496e-06, - "loss": 0.9404, - "step": 6721 - }, - { - "epoch": 0.17, - "learning_rate": 1.996057904957288e-06, - "loss": 0.7598, - "step": 6722 - }, - { - "epoch": 0.17, - "learning_rate": 1.99605545005698e-06, - "loss": 0.9453, - "step": 6723 - }, - { - "epoch": 0.17, - "learning_rate": 1.9960529943940382e-06, - "loss": 1.0889, - "step": 6724 - }, - { - "epoch": 0.17, - "learning_rate": 1.9960505379684643e-06, - "loss": 0.7617, - "step": 6725 - }, - { - "epoch": 0.17, - "learning_rate": 1.9960480807802604e-06, - "loss": 0.8945, - "step": 6726 - }, - { - "epoch": 0.17, - "learning_rate": 1.9960456228294284e-06, - "loss": 0.8848, - "step": 6727 - }, - { - "epoch": 0.17, - "learning_rate": 1.99604316411597e-06, - "loss": 0.9199, - "step": 6728 - }, - { - "epoch": 0.17, - "learning_rate": 1.9960407046398875e-06, - "loss": 0.9756, - "step": 6729 - }, - { - "epoch": 0.17, - "learning_rate": 1.9960382444011818e-06, - "loss": 0.9609, - "step": 6730 - }, - { - "epoch": 0.17, - "learning_rate": 1.996035783399856e-06, - "loss": 0.7988, - "step": 6731 - }, - { - "epoch": 0.17, - "learning_rate": 1.996033321635911e-06, - "loss": 0.9463, - "step": 6732 - }, - { - "epoch": 0.17, - "learning_rate": 1.9960308591093493e-06, - "loss": 0.7773, - "step": 6733 - }, - { - "epoch": 0.17, - "learning_rate": 1.9960283958201725e-06, - "loss": 0.7422, - "step": 6734 - }, - { - "epoch": 0.17, - "learning_rate": 1.9960259317683823e-06, - "loss": 0.876, - "step": 6735 - }, - { - "epoch": 0.17, - "learning_rate": 1.9960234669539813e-06, - "loss": 0.9775, - "step": 6736 - }, - { - "epoch": 0.17, - "learning_rate": 1.9960210013769706e-06, - "loss": 0.9482, - "step": 6737 - }, - { - "epoch": 0.17, - "learning_rate": 1.9960185350373525e-06, - "loss": 0.8862, - "step": 6738 - }, - { - "epoch": 0.17, - "learning_rate": 1.9960160679351286e-06, - "loss": 1.1367, - "step": 6739 - }, - { - "epoch": 0.17, - "learning_rate": 1.9960136000703014e-06, - "loss": 0.8428, - "step": 6740 - }, - { - "epoch": 0.17, - "learning_rate": 1.9960111314428723e-06, - "loss": 0.8613, - "step": 6741 - }, - { - "epoch": 0.17, - "learning_rate": 1.9960086620528433e-06, - "loss": 0.8643, - "step": 6742 - }, - { - "epoch": 0.17, - "learning_rate": 1.996006191900216e-06, - "loss": 0.9932, - "step": 6743 - }, - { - "epoch": 0.17, - "learning_rate": 1.9960037209849926e-06, - "loss": 1.0557, - "step": 6744 - }, - { - "epoch": 0.17, - "learning_rate": 1.996001249307175e-06, - "loss": 0.8042, - "step": 6745 - }, - { - "epoch": 0.17, - "learning_rate": 1.9959987768667653e-06, - "loss": 0.9707, - "step": 6746 - }, - { - "epoch": 0.17, - "learning_rate": 1.9959963036637645e-06, - "loss": 1.0312, - "step": 6747 - }, - { - "epoch": 0.17, - "learning_rate": 1.995993829698176e-06, - "loss": 0.833, - "step": 6748 - }, - { - "epoch": 0.17, - "learning_rate": 1.99599135497e-06, - "loss": 1.0615, - "step": 6749 - }, - { - "epoch": 0.17, - "learning_rate": 1.99598887947924e-06, - "loss": 1.0908, - "step": 6750 - }, - { - "epoch": 0.17, - "learning_rate": 1.9959864032258964e-06, - "loss": 0.8369, - "step": 6751 - }, - { - "epoch": 0.17, - "learning_rate": 1.9959839262099722e-06, - "loss": 1.1025, - "step": 6752 - }, - { - "epoch": 0.17, - "learning_rate": 1.995981448431469e-06, - "loss": 0.6089, - "step": 6753 - }, - { - "epoch": 0.17, - "learning_rate": 1.995978969890388e-06, - "loss": 0.9414, - "step": 6754 - }, - { - "epoch": 0.17, - "learning_rate": 1.995976490586732e-06, - "loss": 1.0537, - "step": 6755 - }, - { - "epoch": 0.17, - "learning_rate": 1.995974010520503e-06, - "loss": 1.0283, - "step": 6756 - }, - { - "epoch": 0.17, - "learning_rate": 1.9959715296917023e-06, - "loss": 1.0908, - "step": 6757 - }, - { - "epoch": 0.17, - "learning_rate": 1.995969048100332e-06, - "loss": 1.001, - "step": 6758 - }, - { - "epoch": 0.17, - "learning_rate": 1.9959665657463938e-06, - "loss": 0.9434, - "step": 6759 - }, - { - "epoch": 0.17, - "learning_rate": 1.9959640826298897e-06, - "loss": 0.9092, - "step": 6760 - }, - { - "epoch": 0.17, - "learning_rate": 1.995961598750822e-06, - "loss": 0.8887, - "step": 6761 - }, - { - "epoch": 0.17, - "learning_rate": 1.995959114109192e-06, - "loss": 0.6328, - "step": 6762 - }, - { - "epoch": 0.17, - "learning_rate": 1.9959566287050023e-06, - "loss": 0.9473, - "step": 6763 - }, - { - "epoch": 0.17, - "learning_rate": 1.995954142538254e-06, - "loss": 0.9062, - "step": 6764 - }, - { - "epoch": 0.17, - "learning_rate": 1.9959516556089495e-06, - "loss": 0.7866, - "step": 6765 - }, - { - "epoch": 0.17, - "learning_rate": 1.9959491679170906e-06, - "loss": 1.0811, - "step": 6766 - }, - { - "epoch": 0.17, - "learning_rate": 1.9959466794626797e-06, - "loss": 0.9688, - "step": 6767 - }, - { - "epoch": 0.17, - "learning_rate": 1.9959441902457177e-06, - "loss": 1.0791, - "step": 6768 - }, - { - "epoch": 0.17, - "learning_rate": 1.9959417002662075e-06, - "loss": 0.8955, - "step": 6769 - }, - { - "epoch": 0.17, - "learning_rate": 1.99593920952415e-06, - "loss": 0.8271, - "step": 6770 - }, - { - "epoch": 0.17, - "learning_rate": 1.9959367180195476e-06, - "loss": 0.7935, - "step": 6771 - }, - { - "epoch": 0.17, - "learning_rate": 1.9959342257524026e-06, - "loss": 0.7725, - "step": 6772 - }, - { - "epoch": 0.17, - "learning_rate": 1.9959317327227166e-06, - "loss": 0.9043, - "step": 6773 - }, - { - "epoch": 0.17, - "learning_rate": 1.9959292389304913e-06, - "loss": 0.9619, - "step": 6774 - }, - { - "epoch": 0.17, - "learning_rate": 1.995926744375729e-06, - "loss": 0.9014, - "step": 6775 - }, - { - "epoch": 0.17, - "learning_rate": 1.9959242490584313e-06, - "loss": 0.7729, - "step": 6776 - }, - { - "epoch": 0.17, - "learning_rate": 1.9959217529786e-06, - "loss": 0.8857, - "step": 6777 - }, - { - "epoch": 0.17, - "learning_rate": 1.9959192561362374e-06, - "loss": 1.0605, - "step": 6778 - }, - { - "epoch": 0.17, - "learning_rate": 1.995916758531345e-06, - "loss": 0.9746, - "step": 6779 - }, - { - "epoch": 0.17, - "learning_rate": 1.995914260163925e-06, - "loss": 0.6294, - "step": 6780 - }, - { - "epoch": 0.17, - "learning_rate": 1.995911761033979e-06, - "loss": 1.04, - "step": 6781 - }, - { - "epoch": 0.17, - "learning_rate": 1.9959092611415094e-06, - "loss": 0.7773, - "step": 6782 - }, - { - "epoch": 0.17, - "learning_rate": 1.995906760486518e-06, - "loss": 0.875, - "step": 6783 - }, - { - "epoch": 0.17, - "learning_rate": 1.9959042590690066e-06, - "loss": 1.0566, - "step": 6784 - }, - { - "epoch": 0.17, - "learning_rate": 1.995901756888977e-06, - "loss": 0.6748, - "step": 6785 - }, - { - "epoch": 0.17, - "learning_rate": 1.9958992539464314e-06, - "loss": 0.9912, - "step": 6786 - }, - { - "epoch": 0.17, - "learning_rate": 1.9958967502413714e-06, - "loss": 0.7979, - "step": 6787 - }, - { - "epoch": 0.17, - "learning_rate": 1.995894245773799e-06, - "loss": 0.9482, - "step": 6788 - }, - { - "epoch": 0.17, - "learning_rate": 1.995891740543716e-06, - "loss": 0.9248, - "step": 6789 - }, - { - "epoch": 0.17, - "learning_rate": 1.995889234551125e-06, - "loss": 1.2266, - "step": 6790 - }, - { - "epoch": 0.17, - "learning_rate": 1.995886727796027e-06, - "loss": 1.002, - "step": 6791 - }, - { - "epoch": 0.17, - "learning_rate": 1.995884220278424e-06, - "loss": 0.9414, - "step": 6792 - }, - { - "epoch": 0.17, - "learning_rate": 1.9958817119983186e-06, - "loss": 0.916, - "step": 6793 - }, - { - "epoch": 0.17, - "learning_rate": 1.9958792029557127e-06, - "loss": 1.082, - "step": 6794 - }, - { - "epoch": 0.17, - "learning_rate": 1.9958766931506074e-06, - "loss": 0.8037, - "step": 6795 - }, - { - "epoch": 0.17, - "learning_rate": 1.995874182583005e-06, - "loss": 0.6543, - "step": 6796 - }, - { - "epoch": 0.17, - "learning_rate": 1.995871671252908e-06, - "loss": 0.8264, - "step": 6797 - }, - { - "epoch": 0.17, - "learning_rate": 1.9958691591603178e-06, - "loss": 0.8584, - "step": 6798 - }, - { - "epoch": 0.17, - "learning_rate": 1.995866646305236e-06, - "loss": 0.833, - "step": 6799 - }, - { - "epoch": 0.17, - "learning_rate": 1.995864132687665e-06, - "loss": 1.1445, - "step": 6800 - }, - { - "epoch": 0.17, - "learning_rate": 1.9958616183076073e-06, - "loss": 0.6812, - "step": 6801 - }, - { - "epoch": 0.17, - "learning_rate": 1.9958591031650636e-06, - "loss": 0.7637, - "step": 6802 - }, - { - "epoch": 0.17, - "learning_rate": 1.9958565872600366e-06, - "loss": 0.9111, - "step": 6803 - }, - { - "epoch": 0.17, - "learning_rate": 1.9958540705925274e-06, - "loss": 0.8857, - "step": 6804 - }, - { - "epoch": 0.17, - "learning_rate": 1.995851553162539e-06, - "loss": 1.1641, - "step": 6805 - }, - { - "epoch": 0.17, - "learning_rate": 1.9958490349700728e-06, - "loss": 0.6763, - "step": 6806 - }, - { - "epoch": 0.17, - "learning_rate": 1.9958465160151307e-06, - "loss": 0.7061, - "step": 6807 - }, - { - "epoch": 0.17, - "learning_rate": 1.995843996297715e-06, - "loss": 0.9385, - "step": 6808 - }, - { - "epoch": 0.17, - "learning_rate": 1.995841475817827e-06, - "loss": 0.9834, - "step": 6809 - }, - { - "epoch": 0.17, - "learning_rate": 1.995838954575469e-06, - "loss": 0.8657, - "step": 6810 - }, - { - "epoch": 0.17, - "learning_rate": 1.995836432570643e-06, - "loss": 0.8799, - "step": 6811 - }, - { - "epoch": 0.17, - "learning_rate": 1.995833909803351e-06, - "loss": 0.8174, - "step": 6812 - }, - { - "epoch": 0.17, - "learning_rate": 1.9958313862735948e-06, - "loss": 1.0234, - "step": 6813 - }, - { - "epoch": 0.17, - "learning_rate": 1.9958288619813758e-06, - "loss": 0.9175, - "step": 6814 - }, - { - "epoch": 0.17, - "learning_rate": 1.9958263369266967e-06, - "loss": 0.9033, - "step": 6815 - }, - { - "epoch": 0.17, - "learning_rate": 1.995823811109559e-06, - "loss": 1.0391, - "step": 6816 - }, - { - "epoch": 0.17, - "learning_rate": 1.9958212845299654e-06, - "loss": 0.8223, - "step": 6817 - }, - { - "epoch": 0.17, - "learning_rate": 1.995818757187917e-06, - "loss": 0.9258, - "step": 6818 - }, - { - "epoch": 0.17, - "learning_rate": 1.9958162290834157e-06, - "loss": 0.7725, - "step": 6819 - }, - { - "epoch": 0.17, - "learning_rate": 1.9958137002164637e-06, - "loss": 0.7998, - "step": 6820 - }, - { - "epoch": 0.17, - "learning_rate": 1.995811170587063e-06, - "loss": 1.0156, - "step": 6821 - }, - { - "epoch": 0.17, - "learning_rate": 1.9958086401952157e-06, - "loss": 0.748, - "step": 6822 - }, - { - "epoch": 0.17, - "learning_rate": 1.995806109040923e-06, - "loss": 0.5327, - "step": 6823 - }, - { - "epoch": 0.17, - "learning_rate": 1.995803577124188e-06, - "loss": 1.1523, - "step": 6824 - }, - { - "epoch": 0.17, - "learning_rate": 1.995801044445011e-06, - "loss": 0.957, - "step": 6825 - }, - { - "epoch": 0.17, - "learning_rate": 1.995798511003396e-06, - "loss": 0.7397, - "step": 6826 - }, - { - "epoch": 0.17, - "learning_rate": 1.9957959767993435e-06, - "loss": 0.8174, - "step": 6827 - }, - { - "epoch": 0.18, - "learning_rate": 1.995793441832856e-06, - "loss": 0.915, - "step": 6828 - }, - { - "epoch": 0.18, - "learning_rate": 1.995790906103935e-06, - "loss": 0.8252, - "step": 6829 - }, - { - "epoch": 0.18, - "learning_rate": 1.9957883696125823e-06, - "loss": 1.1699, - "step": 6830 - }, - { - "epoch": 0.18, - "learning_rate": 1.995785832358801e-06, - "loss": 1.0635, - "step": 6831 - }, - { - "epoch": 0.18, - "learning_rate": 1.995783294342592e-06, - "loss": 1.0068, - "step": 6832 - }, - { - "epoch": 0.18, - "learning_rate": 1.9957807555639573e-06, - "loss": 0.917, - "step": 6833 - }, - { - "epoch": 0.18, - "learning_rate": 1.995778216022899e-06, - "loss": 0.8682, - "step": 6834 - }, - { - "epoch": 0.18, - "learning_rate": 1.9957756757194194e-06, - "loss": 0.9229, - "step": 6835 - }, - { - "epoch": 0.18, - "learning_rate": 1.99577313465352e-06, - "loss": 1.1426, - "step": 6836 - }, - { - "epoch": 0.18, - "learning_rate": 1.995770592825203e-06, - "loss": 1.0576, - "step": 6837 - }, - { - "epoch": 0.18, - "learning_rate": 1.99576805023447e-06, - "loss": 0.9395, - "step": 6838 - }, - { - "epoch": 0.18, - "learning_rate": 1.9957655068813234e-06, - "loss": 0.7998, - "step": 6839 - }, - { - "epoch": 0.18, - "learning_rate": 1.995762962765765e-06, - "loss": 0.897, - "step": 6840 - }, - { - "epoch": 0.18, - "learning_rate": 1.9957604178877967e-06, - "loss": 1.1846, - "step": 6841 - }, - { - "epoch": 0.18, - "learning_rate": 1.99575787224742e-06, - "loss": 0.916, - "step": 6842 - }, - { - "epoch": 0.18, - "learning_rate": 1.9957553258446376e-06, - "loss": 1.1016, - "step": 6843 - }, - { - "epoch": 0.18, - "learning_rate": 1.9957527786794513e-06, - "loss": 0.9033, - "step": 6844 - }, - { - "epoch": 0.18, - "learning_rate": 1.995750230751863e-06, - "loss": 0.855, - "step": 6845 - }, - { - "epoch": 0.18, - "learning_rate": 1.9957476820618742e-06, - "loss": 1.0049, - "step": 6846 - }, - { - "epoch": 0.18, - "learning_rate": 1.9957451326094873e-06, - "loss": 0.7783, - "step": 6847 - }, - { - "epoch": 0.18, - "learning_rate": 1.995742582394704e-06, - "loss": 1.0312, - "step": 6848 - }, - { - "epoch": 0.18, - "learning_rate": 1.9957400314175265e-06, - "loss": 0.9531, - "step": 6849 - }, - { - "epoch": 0.18, - "learning_rate": 1.9957374796779566e-06, - "loss": 0.7256, - "step": 6850 - }, - { - "epoch": 0.18, - "learning_rate": 1.9957349271759965e-06, - "loss": 0.9688, - "step": 6851 - }, - { - "epoch": 0.18, - "learning_rate": 1.995732373911648e-06, - "loss": 1.0889, - "step": 6852 - }, - { - "epoch": 0.18, - "learning_rate": 1.9957298198849128e-06, - "loss": 0.9004, - "step": 6853 - }, - { - "epoch": 0.18, - "learning_rate": 1.995727265095793e-06, - "loss": 0.9326, - "step": 6854 - }, - { - "epoch": 0.18, - "learning_rate": 1.99572470954429e-06, - "loss": 0.6863, - "step": 6855 - }, - { - "epoch": 0.18, - "learning_rate": 1.995722153230408e-06, - "loss": 0.9912, - "step": 6856 - }, - { - "epoch": 0.18, - "learning_rate": 1.9957195961541458e-06, - "loss": 1.0615, - "step": 6857 - }, - { - "epoch": 0.18, - "learning_rate": 1.9957170383155075e-06, - "loss": 1.0176, - "step": 6858 - }, - { - "epoch": 0.18, - "learning_rate": 1.9957144797144942e-06, - "loss": 0.9619, - "step": 6859 - }, - { - "epoch": 0.18, - "learning_rate": 1.9957119203511085e-06, - "loss": 1.0615, - "step": 6860 - }, - { - "epoch": 0.18, - "learning_rate": 1.9957093602253517e-06, - "loss": 0.7285, - "step": 6861 - }, - { - "epoch": 0.18, - "learning_rate": 1.9957067993372263e-06, - "loss": 0.7402, - "step": 6862 - }, - { - "epoch": 0.18, - "learning_rate": 1.9957042376867335e-06, - "loss": 0.96, - "step": 6863 - }, - { - "epoch": 0.18, - "learning_rate": 1.9957016752738763e-06, - "loss": 0.8965, - "step": 6864 - }, - { - "epoch": 0.18, - "learning_rate": 1.9956991120986556e-06, - "loss": 0.8677, - "step": 6865 - }, - { - "epoch": 0.18, - "learning_rate": 1.9956965481610743e-06, - "loss": 0.6758, - "step": 6866 - }, - { - "epoch": 0.18, - "learning_rate": 1.9956939834611337e-06, - "loss": 0.9912, - "step": 6867 - }, - { - "epoch": 0.18, - "learning_rate": 1.9956914179988364e-06, - "loss": 1.0762, - "step": 6868 - }, - { - "epoch": 0.18, - "learning_rate": 1.9956888517741836e-06, - "loss": 0.8555, - "step": 6869 - }, - { - "epoch": 0.18, - "learning_rate": 1.9956862847871774e-06, - "loss": 0.958, - "step": 6870 - }, - { - "epoch": 0.18, - "learning_rate": 1.9956837170378204e-06, - "loss": 1.002, - "step": 6871 - }, - { - "epoch": 0.18, - "learning_rate": 1.9956811485261138e-06, - "loss": 0.6783, - "step": 6872 - }, - { - "epoch": 0.18, - "learning_rate": 1.99567857925206e-06, - "loss": 1.0459, - "step": 6873 - }, - { - "epoch": 0.18, - "learning_rate": 1.9956760092156613e-06, - "loss": 1.001, - "step": 6874 - }, - { - "epoch": 0.18, - "learning_rate": 1.995673438416919e-06, - "loss": 1.0166, - "step": 6875 - }, - { - "epoch": 0.18, - "learning_rate": 1.9956708668558355e-06, - "loss": 0.9219, - "step": 6876 - }, - { - "epoch": 0.18, - "learning_rate": 1.9956682945324125e-06, - "loss": 0.8047, - "step": 6877 - }, - { - "epoch": 0.18, - "learning_rate": 1.9956657214466518e-06, - "loss": 0.9727, - "step": 6878 - }, - { - "epoch": 0.18, - "learning_rate": 1.995663147598556e-06, - "loss": 0.9307, - "step": 6879 - }, - { - "epoch": 0.18, - "learning_rate": 1.9956605729881265e-06, - "loss": 0.9814, - "step": 6880 - }, - { - "epoch": 0.18, - "learning_rate": 1.9956579976153654e-06, - "loss": 1.0908, - "step": 6881 - }, - { - "epoch": 0.18, - "learning_rate": 1.9956554214802746e-06, - "loss": 0.9746, - "step": 6882 - }, - { - "epoch": 0.18, - "learning_rate": 1.9956528445828568e-06, - "loss": 0.917, - "step": 6883 - }, - { - "epoch": 0.18, - "learning_rate": 1.995650266923113e-06, - "loss": 0.8003, - "step": 6884 - }, - { - "epoch": 0.18, - "learning_rate": 1.995647688501046e-06, - "loss": 0.7876, - "step": 6885 - }, - { - "epoch": 0.18, - "learning_rate": 1.995645109316657e-06, - "loss": 1.1377, - "step": 6886 - }, - { - "epoch": 0.18, - "learning_rate": 1.995642529369948e-06, - "loss": 0.7495, - "step": 6887 - }, - { - "epoch": 0.18, - "learning_rate": 1.995639948660922e-06, - "loss": 1.0527, - "step": 6888 - }, - { - "epoch": 0.18, - "learning_rate": 1.9956373671895797e-06, - "loss": 1.043, - "step": 6889 - }, - { - "epoch": 0.18, - "learning_rate": 1.9956347849559237e-06, - "loss": 1.1318, - "step": 6890 - }, - { - "epoch": 0.18, - "learning_rate": 1.9956322019599562e-06, - "loss": 1.1699, - "step": 6891 - }, - { - "epoch": 0.18, - "learning_rate": 1.9956296182016786e-06, - "loss": 0.8506, - "step": 6892 - }, - { - "epoch": 0.18, - "learning_rate": 1.995627033681094e-06, - "loss": 0.6597, - "step": 6893 - }, - { - "epoch": 0.18, - "learning_rate": 1.9956244483982026e-06, - "loss": 0.9746, - "step": 6894 - }, - { - "epoch": 0.18, - "learning_rate": 1.9956218623530077e-06, - "loss": 0.8818, - "step": 6895 - }, - { - "epoch": 0.18, - "learning_rate": 1.995619275545511e-06, - "loss": 1.0781, - "step": 6896 - }, - { - "epoch": 0.18, - "learning_rate": 1.9956166879757143e-06, - "loss": 1.0537, - "step": 6897 - }, - { - "epoch": 0.18, - "learning_rate": 1.9956140996436197e-06, - "loss": 1.0195, - "step": 6898 - }, - { - "epoch": 0.18, - "learning_rate": 1.995611510549229e-06, - "loss": 0.8101, - "step": 6899 - }, - { - "epoch": 0.18, - "learning_rate": 1.9956089206925445e-06, - "loss": 0.6479, - "step": 6900 - }, - { - "epoch": 0.18, - "learning_rate": 1.995606330073568e-06, - "loss": 0.7568, - "step": 6901 - }, - { - "epoch": 0.18, - "learning_rate": 1.9956037386923014e-06, - "loss": 0.7002, - "step": 6902 - }, - { - "epoch": 0.18, - "learning_rate": 1.995601146548747e-06, - "loss": 0.9277, - "step": 6903 - }, - { - "epoch": 0.18, - "learning_rate": 1.995598553642906e-06, - "loss": 0.8271, - "step": 6904 - }, - { - "epoch": 0.18, - "learning_rate": 1.995595959974782e-06, - "loss": 0.8599, - "step": 6905 - }, - { - "epoch": 0.18, - "learning_rate": 1.9955933655443753e-06, - "loss": 0.7793, - "step": 6906 - }, - { - "epoch": 0.18, - "learning_rate": 1.9955907703516887e-06, - "loss": 0.877, - "step": 6907 - }, - { - "epoch": 0.18, - "learning_rate": 1.995588174396724e-06, - "loss": 0.9482, - "step": 6908 - }, - { - "epoch": 0.18, - "learning_rate": 1.995585577679483e-06, - "loss": 0.8623, - "step": 6909 - }, - { - "epoch": 0.18, - "learning_rate": 1.9955829801999685e-06, - "loss": 0.835, - "step": 6910 - }, - { - "epoch": 0.18, - "learning_rate": 1.9955803819581813e-06, - "loss": 0.7461, - "step": 6911 - }, - { - "epoch": 0.18, - "learning_rate": 1.9955777829541243e-06, - "loss": 0.8789, - "step": 6912 - }, - { - "epoch": 0.18, - "learning_rate": 1.9955751831877985e-06, - "loss": 0.9795, - "step": 6913 - }, - { - "epoch": 0.18, - "learning_rate": 1.9955725826592075e-06, - "loss": 0.9668, - "step": 6914 - }, - { - "epoch": 0.18, - "learning_rate": 1.995569981368352e-06, - "loss": 0.9199, - "step": 6915 - }, - { - "epoch": 0.18, - "learning_rate": 1.9955673793152343e-06, - "loss": 0.915, - "step": 6916 - }, - { - "epoch": 0.18, - "learning_rate": 1.9955647764998563e-06, - "loss": 1.0107, - "step": 6917 - }, - { - "epoch": 0.18, - "learning_rate": 1.9955621729222203e-06, - "loss": 0.9219, - "step": 6918 - }, - { - "epoch": 0.18, - "learning_rate": 1.9955595685823282e-06, - "loss": 1.0098, - "step": 6919 - }, - { - "epoch": 0.18, - "learning_rate": 1.9955569634801816e-06, - "loss": 0.689, - "step": 6920 - }, - { - "epoch": 0.18, - "learning_rate": 1.995554357615783e-06, - "loss": 0.7676, - "step": 6921 - }, - { - "epoch": 0.18, - "learning_rate": 1.9955517509891343e-06, - "loss": 0.9873, - "step": 6922 - }, - { - "epoch": 0.18, - "learning_rate": 1.9955491436002375e-06, - "loss": 1.2285, - "step": 6923 - }, - { - "epoch": 0.18, - "learning_rate": 1.995546535449094e-06, - "loss": 1.1064, - "step": 6924 - }, - { - "epoch": 0.18, - "learning_rate": 1.995543926535707e-06, - "loss": 0.9453, - "step": 6925 - }, - { - "epoch": 0.18, - "learning_rate": 1.995541316860077e-06, - "loss": 1.1211, - "step": 6926 - }, - { - "epoch": 0.18, - "learning_rate": 1.995538706422207e-06, - "loss": 0.874, - "step": 6927 - }, - { - "epoch": 0.18, - "learning_rate": 1.995536095222099e-06, - "loss": 0.8975, - "step": 6928 - }, - { - "epoch": 0.18, - "learning_rate": 1.995533483259755e-06, - "loss": 1.0654, - "step": 6929 - }, - { - "epoch": 0.18, - "learning_rate": 1.9955308705351763e-06, - "loss": 0.8301, - "step": 6930 - }, - { - "epoch": 0.18, - "learning_rate": 1.9955282570483657e-06, - "loss": 0.8447, - "step": 6931 - }, - { - "epoch": 0.18, - "learning_rate": 1.995525642799325e-06, - "loss": 0.9609, - "step": 6932 - }, - { - "epoch": 0.18, - "learning_rate": 1.9955230277880557e-06, - "loss": 0.8989, - "step": 6933 - }, - { - "epoch": 0.18, - "learning_rate": 1.9955204120145606e-06, - "loss": 0.7607, - "step": 6934 - }, - { - "epoch": 0.18, - "learning_rate": 1.9955177954788413e-06, - "loss": 0.7568, - "step": 6935 - }, - { - "epoch": 0.18, - "learning_rate": 1.9955151781808996e-06, - "loss": 0.9521, - "step": 6936 - }, - { - "epoch": 0.18, - "learning_rate": 1.9955125601207374e-06, - "loss": 1.04, - "step": 6937 - }, - { - "epoch": 0.18, - "learning_rate": 1.9955099412983578e-06, - "loss": 0.8076, - "step": 6938 - }, - { - "epoch": 0.18, - "learning_rate": 1.995507321713761e-06, - "loss": 1.2461, - "step": 6939 - }, - { - "epoch": 0.18, - "learning_rate": 1.9955047013669506e-06, - "loss": 0.8564, - "step": 6940 - }, - { - "epoch": 0.18, - "learning_rate": 1.995502080257928e-06, - "loss": 0.9912, - "step": 6941 - }, - { - "epoch": 0.18, - "learning_rate": 1.9954994583866953e-06, - "loss": 0.8232, - "step": 6942 - }, - { - "epoch": 0.18, - "learning_rate": 1.9954968357532544e-06, - "loss": 0.9229, - "step": 6943 - }, - { - "epoch": 0.18, - "learning_rate": 1.995494212357607e-06, - "loss": 0.6648, - "step": 6944 - }, - { - "epoch": 0.18, - "learning_rate": 1.995491588199756e-06, - "loss": 0.9688, - "step": 6945 - }, - { - "epoch": 0.18, - "learning_rate": 1.9954889632797026e-06, - "loss": 0.916, - "step": 6946 - }, - { - "epoch": 0.18, - "learning_rate": 1.9954863375974493e-06, - "loss": 1.0469, - "step": 6947 - }, - { - "epoch": 0.18, - "learning_rate": 1.9954837111529975e-06, - "loss": 0.957, - "step": 6948 - }, - { - "epoch": 0.18, - "learning_rate": 1.9954810839463496e-06, - "loss": 0.79, - "step": 6949 - }, - { - "epoch": 0.18, - "learning_rate": 1.995478455977508e-06, - "loss": 0.6865, - "step": 6950 - }, - { - "epoch": 0.18, - "learning_rate": 1.9954758272464738e-06, - "loss": 1.0439, - "step": 6951 - }, - { - "epoch": 0.18, - "learning_rate": 1.99547319775325e-06, - "loss": 0.9463, - "step": 6952 - }, - { - "epoch": 0.18, - "learning_rate": 1.995470567497838e-06, - "loss": 1.0039, - "step": 6953 - }, - { - "epoch": 0.18, - "learning_rate": 1.9954679364802397e-06, - "loss": 0.8799, - "step": 6954 - }, - { - "epoch": 0.18, - "learning_rate": 1.995465304700458e-06, - "loss": 1.0098, - "step": 6955 - }, - { - "epoch": 0.18, - "learning_rate": 1.9954626721584933e-06, - "loss": 0.9438, - "step": 6956 - }, - { - "epoch": 0.18, - "learning_rate": 1.9954600388543495e-06, - "loss": 0.9678, - "step": 6957 - }, - { - "epoch": 0.18, - "learning_rate": 1.9954574047880276e-06, - "loss": 0.8896, - "step": 6958 - }, - { - "epoch": 0.18, - "learning_rate": 1.9954547699595294e-06, - "loss": 0.7705, - "step": 6959 - }, - { - "epoch": 0.18, - "learning_rate": 1.9954521343688574e-06, - "loss": 0.8389, - "step": 6960 - }, - { - "epoch": 0.18, - "learning_rate": 1.9954494980160133e-06, - "loss": 0.8779, - "step": 6961 - }, - { - "epoch": 0.18, - "learning_rate": 1.9954468609009997e-06, - "loss": 0.9893, - "step": 6962 - }, - { - "epoch": 0.18, - "learning_rate": 1.995444223023818e-06, - "loss": 0.8398, - "step": 6963 - }, - { - "epoch": 0.18, - "learning_rate": 1.9954415843844704e-06, - "loss": 0.875, - "step": 6964 - }, - { - "epoch": 0.18, - "learning_rate": 1.995438944982959e-06, - "loss": 1.0039, - "step": 6965 - }, - { - "epoch": 0.18, - "learning_rate": 1.9954363048192854e-06, - "loss": 1.0557, - "step": 6966 - }, - { - "epoch": 0.18, - "learning_rate": 1.9954336638934523e-06, - "loss": 0.8657, - "step": 6967 - }, - { - "epoch": 0.18, - "learning_rate": 1.995431022205462e-06, - "loss": 0.8799, - "step": 6968 - }, - { - "epoch": 0.18, - "learning_rate": 1.995428379755315e-06, - "loss": 0.9316, - "step": 6969 - }, - { - "epoch": 0.18, - "learning_rate": 1.9954257365430144e-06, - "loss": 0.7437, - "step": 6970 - }, - { - "epoch": 0.18, - "learning_rate": 1.9954230925685627e-06, - "loss": 0.958, - "step": 6971 - }, - { - "epoch": 0.18, - "learning_rate": 1.995420447831961e-06, - "loss": 0.8008, - "step": 6972 - }, - { - "epoch": 0.18, - "learning_rate": 1.9954178023332113e-06, - "loss": 1.1416, - "step": 6973 - }, - { - "epoch": 0.18, - "learning_rate": 1.995415156072316e-06, - "loss": 0.8613, - "step": 6974 - }, - { - "epoch": 0.18, - "learning_rate": 1.9954125090492778e-06, - "loss": 0.8828, - "step": 6975 - }, - { - "epoch": 0.18, - "learning_rate": 1.9954098612640973e-06, - "loss": 0.7534, - "step": 6976 - }, - { - "epoch": 0.18, - "learning_rate": 1.9954072127167774e-06, - "loss": 0.9336, - "step": 6977 - }, - { - "epoch": 0.18, - "learning_rate": 1.99540456340732e-06, - "loss": 1.1201, - "step": 6978 - }, - { - "epoch": 0.18, - "learning_rate": 1.995401913335727e-06, - "loss": 0.8652, - "step": 6979 - }, - { - "epoch": 0.18, - "learning_rate": 1.995399262502001e-06, - "loss": 1.0762, - "step": 6980 - }, - { - "epoch": 0.18, - "learning_rate": 1.995396610906143e-06, - "loss": 0.8213, - "step": 6981 - }, - { - "epoch": 0.18, - "learning_rate": 1.995393958548156e-06, - "loss": 1.0088, - "step": 6982 - }, - { - "epoch": 0.18, - "learning_rate": 1.995391305428041e-06, - "loss": 0.5601, - "step": 6983 - }, - { - "epoch": 0.18, - "learning_rate": 1.9953886515458014e-06, - "loss": 0.9199, - "step": 6984 - }, - { - "epoch": 0.18, - "learning_rate": 1.995385996901438e-06, - "loss": 0.7734, - "step": 6985 - }, - { - "epoch": 0.18, - "learning_rate": 1.9953833414949536e-06, - "loss": 1.1084, - "step": 6986 - }, - { - "epoch": 0.18, - "learning_rate": 1.9953806853263496e-06, - "loss": 1.0635, - "step": 6987 - }, - { - "epoch": 0.18, - "learning_rate": 1.9953780283956287e-06, - "loss": 0.873, - "step": 6988 - }, - { - "epoch": 0.18, - "learning_rate": 1.9953753707027923e-06, - "loss": 1.0547, - "step": 6989 - }, - { - "epoch": 0.18, - "learning_rate": 1.995372712247843e-06, - "loss": 0.9106, - "step": 6990 - }, - { - "epoch": 0.18, - "learning_rate": 1.9953700530307825e-06, - "loss": 0.9443, - "step": 6991 - }, - { - "epoch": 0.18, - "learning_rate": 1.995367393051613e-06, - "loss": 0.8184, - "step": 6992 - }, - { - "epoch": 0.18, - "learning_rate": 1.9953647323103363e-06, - "loss": 0.8018, - "step": 6993 - }, - { - "epoch": 0.18, - "learning_rate": 1.9953620708069546e-06, - "loss": 0.9912, - "step": 6994 - }, - { - "epoch": 0.18, - "learning_rate": 1.99535940854147e-06, - "loss": 0.8154, - "step": 6995 - }, - { - "epoch": 0.18, - "learning_rate": 1.9953567455138844e-06, - "loss": 1.0557, - "step": 6996 - }, - { - "epoch": 0.18, - "learning_rate": 1.9953540817242002e-06, - "loss": 1.0098, - "step": 6997 - }, - { - "epoch": 0.18, - "learning_rate": 1.995351417172419e-06, - "loss": 1.0166, - "step": 6998 - }, - { - "epoch": 0.18, - "learning_rate": 1.995348751858543e-06, - "loss": 0.9814, - "step": 6999 - }, - { - "epoch": 0.18, - "learning_rate": 1.9953460857825737e-06, - "loss": 1.0566, - "step": 7000 - }, - { - "epoch": 0.18, - "learning_rate": 1.995343418944514e-06, - "loss": 0.9453, - "step": 7001 - }, - { - "epoch": 0.18, - "learning_rate": 1.9953407513443662e-06, - "loss": 0.7954, - "step": 7002 - }, - { - "epoch": 0.18, - "learning_rate": 1.995338082982131e-06, - "loss": 0.9316, - "step": 7003 - }, - { - "epoch": 0.18, - "learning_rate": 1.9953354138578117e-06, - "loss": 0.8838, - "step": 7004 - }, - { - "epoch": 0.18, - "learning_rate": 1.9953327439714096e-06, - "loss": 1.0303, - "step": 7005 - }, - { - "epoch": 0.18, - "learning_rate": 1.995330073322927e-06, - "loss": 0.8828, - "step": 7006 - }, - { - "epoch": 0.18, - "learning_rate": 1.995327401912366e-06, - "loss": 1.0205, - "step": 7007 - }, - { - "epoch": 0.18, - "learning_rate": 1.9953247297397283e-06, - "loss": 0.8809, - "step": 7008 - }, - { - "epoch": 0.18, - "learning_rate": 1.9953220568050165e-06, - "loss": 1.0391, - "step": 7009 - }, - { - "epoch": 0.18, - "learning_rate": 1.995319383108232e-06, - "loss": 0.9043, - "step": 7010 - }, - { - "epoch": 0.18, - "learning_rate": 1.9953167086493776e-06, - "loss": 0.9492, - "step": 7011 - }, - { - "epoch": 0.18, - "learning_rate": 1.9953140334284553e-06, - "loss": 0.7075, - "step": 7012 - }, - { - "epoch": 0.18, - "learning_rate": 1.9953113574454663e-06, - "loss": 0.9512, - "step": 7013 - }, - { - "epoch": 0.18, - "learning_rate": 1.9953086807004127e-06, - "loss": 0.7505, - "step": 7014 - }, - { - "epoch": 0.18, - "learning_rate": 1.9953060031932976e-06, - "loss": 0.875, - "step": 7015 - }, - { - "epoch": 0.18, - "learning_rate": 1.9953033249241227e-06, - "loss": 0.6748, - "step": 7016 - }, - { - "epoch": 0.18, - "learning_rate": 1.9953006458928895e-06, - "loss": 0.9043, - "step": 7017 - }, - { - "epoch": 0.18, - "learning_rate": 1.9952979660996003e-06, - "loss": 1.1992, - "step": 7018 - }, - { - "epoch": 0.18, - "learning_rate": 1.995295285544257e-06, - "loss": 0.813, - "step": 7019 - }, - { - "epoch": 0.18, - "learning_rate": 1.9952926042268626e-06, - "loss": 0.7881, - "step": 7020 - }, - { - "epoch": 0.18, - "learning_rate": 1.995289922147418e-06, - "loss": 0.8633, - "step": 7021 - }, - { - "epoch": 0.18, - "learning_rate": 1.9952872393059256e-06, - "loss": 0.8291, - "step": 7022 - }, - { - "epoch": 0.18, - "learning_rate": 1.9952845557023874e-06, - "loss": 0.5107, - "step": 7023 - }, - { - "epoch": 0.18, - "learning_rate": 1.995281871336806e-06, - "loss": 1.0156, - "step": 7024 - }, - { - "epoch": 0.18, - "learning_rate": 1.9952791862091827e-06, - "loss": 1.0176, - "step": 7025 - }, - { - "epoch": 0.18, - "learning_rate": 1.99527650031952e-06, - "loss": 0.8389, - "step": 7026 - }, - { - "epoch": 0.18, - "learning_rate": 1.99527381366782e-06, - "loss": 0.8599, - "step": 7027 - }, - { - "epoch": 0.18, - "learning_rate": 1.9952711262540843e-06, - "loss": 0.916, - "step": 7028 - }, - { - "epoch": 0.18, - "learning_rate": 1.9952684380783152e-06, - "loss": 0.9717, - "step": 7029 - }, - { - "epoch": 0.18, - "learning_rate": 1.995265749140515e-06, - "loss": 0.79, - "step": 7030 - }, - { - "epoch": 0.18, - "learning_rate": 1.9952630594406855e-06, - "loss": 1.0303, - "step": 7031 - }, - { - "epoch": 0.18, - "learning_rate": 1.995260368978829e-06, - "loss": 0.8184, - "step": 7032 - }, - { - "epoch": 0.18, - "learning_rate": 1.995257677754947e-06, - "loss": 0.7476, - "step": 7033 - }, - { - "epoch": 0.18, - "learning_rate": 1.9952549857690427e-06, - "loss": 0.6899, - "step": 7034 - }, - { - "epoch": 0.18, - "learning_rate": 1.9952522930211168e-06, - "loss": 0.9414, - "step": 7035 - }, - { - "epoch": 0.18, - "learning_rate": 1.995249599511172e-06, - "loss": 0.9385, - "step": 7036 - }, - { - "epoch": 0.18, - "learning_rate": 1.9952469052392108e-06, - "loss": 0.791, - "step": 7037 - }, - { - "epoch": 0.18, - "learning_rate": 1.9952442102052344e-06, - "loss": 0.8965, - "step": 7038 - }, - { - "epoch": 0.18, - "learning_rate": 1.9952415144092452e-06, - "loss": 0.8906, - "step": 7039 - }, - { - "epoch": 0.18, - "learning_rate": 1.9952388178512457e-06, - "loss": 0.9561, - "step": 7040 - }, - { - "epoch": 0.18, - "learning_rate": 1.9952361205312376e-06, - "loss": 0.8633, - "step": 7041 - }, - { - "epoch": 0.18, - "learning_rate": 1.995233422449223e-06, - "loss": 0.9346, - "step": 7042 - }, - { - "epoch": 0.18, - "learning_rate": 1.9952307236052035e-06, - "loss": 0.9727, - "step": 7043 - }, - { - "epoch": 0.18, - "learning_rate": 1.9952280239991818e-06, - "loss": 0.9873, - "step": 7044 - }, - { - "epoch": 0.18, - "learning_rate": 1.99522532363116e-06, - "loss": 0.8281, - "step": 7045 - }, - { - "epoch": 0.18, - "learning_rate": 1.9952226225011395e-06, - "loss": 0.9033, - "step": 7046 - }, - { - "epoch": 0.18, - "learning_rate": 1.9952199206091232e-06, - "loss": 0.9209, - "step": 7047 - }, - { - "epoch": 0.18, - "learning_rate": 1.9952172179551127e-06, - "loss": 0.9756, - "step": 7048 - }, - { - "epoch": 0.18, - "learning_rate": 1.9952145145391097e-06, - "loss": 0.7114, - "step": 7049 - }, - { - "epoch": 0.18, - "learning_rate": 1.995211810361117e-06, - "loss": 0.8398, - "step": 7050 - }, - { - "epoch": 0.18, - "learning_rate": 1.9952091054211366e-06, - "loss": 0.9062, - "step": 7051 - }, - { - "epoch": 0.18, - "learning_rate": 1.9952063997191704e-06, - "loss": 0.9512, - "step": 7052 - }, - { - "epoch": 0.18, - "learning_rate": 1.99520369325522e-06, - "loss": 1.1426, - "step": 7053 - }, - { - "epoch": 0.18, - "learning_rate": 1.995200986029288e-06, - "loss": 0.9473, - "step": 7054 - }, - { - "epoch": 0.18, - "learning_rate": 1.9951982780413766e-06, - "loss": 0.9941, - "step": 7055 - }, - { - "epoch": 0.18, - "learning_rate": 1.9951955692914876e-06, - "loss": 0.9092, - "step": 7056 - }, - { - "epoch": 0.18, - "learning_rate": 1.9951928597796227e-06, - "loss": 0.8154, - "step": 7057 - }, - { - "epoch": 0.18, - "learning_rate": 1.9951901495057847e-06, - "loss": 1.0791, - "step": 7058 - }, - { - "epoch": 0.18, - "learning_rate": 1.9951874384699753e-06, - "loss": 0.8726, - "step": 7059 - }, - { - "epoch": 0.18, - "learning_rate": 1.9951847266721967e-06, - "loss": 0.8818, - "step": 7060 - }, - { - "epoch": 0.18, - "learning_rate": 1.995182014112451e-06, - "loss": 0.9902, - "step": 7061 - }, - { - "epoch": 0.18, - "learning_rate": 1.99517930079074e-06, - "loss": 0.9395, - "step": 7062 - }, - { - "epoch": 0.18, - "learning_rate": 1.995176586707066e-06, - "loss": 0.8213, - "step": 7063 - }, - { - "epoch": 0.18, - "learning_rate": 1.9951738718614314e-06, - "loss": 0.7573, - "step": 7064 - }, - { - "epoch": 0.18, - "learning_rate": 1.9951711562538375e-06, - "loss": 0.8237, - "step": 7065 - }, - { - "epoch": 0.18, - "learning_rate": 1.995168439884287e-06, - "loss": 0.9629, - "step": 7066 - }, - { - "epoch": 0.18, - "learning_rate": 1.9951657227527814e-06, - "loss": 0.9609, - "step": 7067 - }, - { - "epoch": 0.18, - "learning_rate": 1.995163004859324e-06, - "loss": 0.8652, - "step": 7068 - }, - { - "epoch": 0.18, - "learning_rate": 1.9951602862039153e-06, - "loss": 0.8086, - "step": 7069 - }, - { - "epoch": 0.18, - "learning_rate": 1.995157566786558e-06, - "loss": 0.8369, - "step": 7070 - }, - { - "epoch": 0.18, - "learning_rate": 1.995154846607255e-06, - "loss": 0.6631, - "step": 7071 - }, - { - "epoch": 0.18, - "learning_rate": 1.9951521256660074e-06, - "loss": 0.7676, - "step": 7072 - }, - { - "epoch": 0.18, - "learning_rate": 1.995149403962817e-06, - "loss": 0.8218, - "step": 7073 - }, - { - "epoch": 0.18, - "learning_rate": 1.9951466814976878e-06, - "loss": 0.9121, - "step": 7074 - }, - { - "epoch": 0.18, - "learning_rate": 1.995143958270619e-06, - "loss": 1.0596, - "step": 7075 - }, - { - "epoch": 0.18, - "learning_rate": 1.995141234281615e-06, - "loss": 0.9072, - "step": 7076 - }, - { - "epoch": 0.18, - "learning_rate": 1.9951385095306776e-06, - "loss": 0.9326, - "step": 7077 - }, - { - "epoch": 0.18, - "learning_rate": 1.995135784017808e-06, - "loss": 0.7854, - "step": 7078 - }, - { - "epoch": 0.18, - "learning_rate": 1.9951330577430085e-06, - "loss": 1.1006, - "step": 7079 - }, - { - "epoch": 0.18, - "learning_rate": 1.9951303307062814e-06, - "loss": 0.563, - "step": 7080 - }, - { - "epoch": 0.18, - "learning_rate": 1.9951276029076286e-06, - "loss": 1.0605, - "step": 7081 - }, - { - "epoch": 0.18, - "learning_rate": 1.9951248743470527e-06, - "loss": 0.748, - "step": 7082 - }, - { - "epoch": 0.18, - "learning_rate": 1.9951221450245554e-06, - "loss": 0.8906, - "step": 7083 - }, - { - "epoch": 0.18, - "learning_rate": 1.995119414940139e-06, - "loss": 0.9375, - "step": 7084 - }, - { - "epoch": 0.18, - "learning_rate": 1.995116684093805e-06, - "loss": 0.6401, - "step": 7085 - }, - { - "epoch": 0.18, - "learning_rate": 1.995113952485556e-06, - "loss": 0.8809, - "step": 7086 - }, - { - "epoch": 0.18, - "learning_rate": 1.995111220115394e-06, - "loss": 1.1152, - "step": 7087 - }, - { - "epoch": 0.18, - "learning_rate": 1.9951084869833212e-06, - "loss": 0.8447, - "step": 7088 - }, - { - "epoch": 0.18, - "learning_rate": 1.9951057530893393e-06, - "loss": 0.9277, - "step": 7089 - }, - { - "epoch": 0.18, - "learning_rate": 1.995103018433451e-06, - "loss": 1.1357, - "step": 7090 - }, - { - "epoch": 0.18, - "learning_rate": 1.9951002830156583e-06, - "loss": 0.8564, - "step": 7091 - }, - { - "epoch": 0.18, - "learning_rate": 1.9950975468359626e-06, - "loss": 0.9121, - "step": 7092 - }, - { - "epoch": 0.18, - "learning_rate": 1.9950948098943667e-06, - "loss": 0.7568, - "step": 7093 - }, - { - "epoch": 0.18, - "learning_rate": 1.9950920721908723e-06, - "loss": 0.9619, - "step": 7094 - }, - { - "epoch": 0.18, - "learning_rate": 1.995089333725482e-06, - "loss": 0.8184, - "step": 7095 - }, - { - "epoch": 0.18, - "learning_rate": 1.995086594498197e-06, - "loss": 0.9932, - "step": 7096 - }, - { - "epoch": 0.18, - "learning_rate": 1.9950838545090205e-06, - "loss": 0.8848, - "step": 7097 - }, - { - "epoch": 0.18, - "learning_rate": 1.9950811137579536e-06, - "loss": 0.7493, - "step": 7098 - }, - { - "epoch": 0.18, - "learning_rate": 1.9950783722449993e-06, - "loss": 0.8135, - "step": 7099 - }, - { - "epoch": 0.18, - "learning_rate": 1.995075629970159e-06, - "loss": 0.75, - "step": 7100 - }, - { - "epoch": 0.18, - "learning_rate": 1.995072886933435e-06, - "loss": 1.2041, - "step": 7101 - }, - { - "epoch": 0.18, - "learning_rate": 1.9950701431348294e-06, - "loss": 1.0693, - "step": 7102 - }, - { - "epoch": 0.18, - "learning_rate": 1.995067398574344e-06, - "loss": 0.7173, - "step": 7103 - }, - { - "epoch": 0.18, - "learning_rate": 1.9950646532519823e-06, - "loss": 0.7988, - "step": 7104 - }, - { - "epoch": 0.18, - "learning_rate": 1.9950619071677445e-06, - "loss": 1.0146, - "step": 7105 - }, - { - "epoch": 0.18, - "learning_rate": 1.995059160321634e-06, - "loss": 1.0312, - "step": 7106 - }, - { - "epoch": 0.18, - "learning_rate": 1.995056412713652e-06, - "loss": 1.04, - "step": 7107 - }, - { - "epoch": 0.18, - "learning_rate": 1.9950536643438016e-06, - "loss": 0.959, - "step": 7108 - }, - { - "epoch": 0.18, - "learning_rate": 1.9950509152120836e-06, - "loss": 0.8564, - "step": 7109 - }, - { - "epoch": 0.18, - "learning_rate": 1.9950481653185014e-06, - "loss": 0.8662, - "step": 7110 - }, - { - "epoch": 0.18, - "learning_rate": 1.9950454146630567e-06, - "loss": 1.0713, - "step": 7111 - }, - { - "epoch": 0.18, - "learning_rate": 1.995042663245751e-06, - "loss": 0.7812, - "step": 7112 - }, - { - "epoch": 0.18, - "learning_rate": 1.9950399110665874e-06, - "loss": 0.874, - "step": 7113 - }, - { - "epoch": 0.18, - "learning_rate": 1.995037158125567e-06, - "loss": 1.1416, - "step": 7114 - }, - { - "epoch": 0.18, - "learning_rate": 1.995034404422693e-06, - "loss": 0.8652, - "step": 7115 - }, - { - "epoch": 0.18, - "learning_rate": 1.9950316499579666e-06, - "loss": 1.0664, - "step": 7116 - }, - { - "epoch": 0.18, - "learning_rate": 1.9950288947313905e-06, - "loss": 0.7529, - "step": 7117 - }, - { - "epoch": 0.18, - "learning_rate": 1.9950261387429657e-06, - "loss": 1.002, - "step": 7118 - }, - { - "epoch": 0.18, - "learning_rate": 1.995023381992696e-06, - "loss": 1.0205, - "step": 7119 - }, - { - "epoch": 0.18, - "learning_rate": 1.995020624480582e-06, - "loss": 0.8364, - "step": 7120 - }, - { - "epoch": 0.18, - "learning_rate": 1.9950178662066267e-06, - "loss": 1.0166, - "step": 7121 - }, - { - "epoch": 0.18, - "learning_rate": 1.995015107170832e-06, - "loss": 0.7754, - "step": 7122 - }, - { - "epoch": 0.18, - "learning_rate": 1.9950123473732e-06, - "loss": 0.9766, - "step": 7123 - }, - { - "epoch": 0.18, - "learning_rate": 1.995009586813733e-06, - "loss": 0.833, - "step": 7124 - }, - { - "epoch": 0.18, - "learning_rate": 1.9950068254924324e-06, - "loss": 0.8438, - "step": 7125 - }, - { - "epoch": 0.18, - "learning_rate": 1.9950040634093015e-06, - "loss": 0.8965, - "step": 7126 - }, - { - "epoch": 0.18, - "learning_rate": 1.9950013005643412e-06, - "loss": 0.7837, - "step": 7127 - }, - { - "epoch": 0.18, - "learning_rate": 1.994998536957555e-06, - "loss": 1.1055, - "step": 7128 - }, - { - "epoch": 0.18, - "learning_rate": 1.994995772588943e-06, - "loss": 0.8145, - "step": 7129 - }, - { - "epoch": 0.18, - "learning_rate": 1.994993007458509e-06, - "loss": 0.8496, - "step": 7130 - }, - { - "epoch": 0.18, - "learning_rate": 1.9949902415662547e-06, - "loss": 0.7461, - "step": 7131 - }, - { - "epoch": 0.18, - "learning_rate": 1.994987474912182e-06, - "loss": 0.8174, - "step": 7132 - }, - { - "epoch": 0.18, - "learning_rate": 1.994984707496293e-06, - "loss": 1.0664, - "step": 7133 - }, - { - "epoch": 0.18, - "learning_rate": 1.9949819393185905e-06, - "loss": 0.9561, - "step": 7134 - }, - { - "epoch": 0.18, - "learning_rate": 1.9949791703790756e-06, - "loss": 0.9453, - "step": 7135 - }, - { - "epoch": 0.18, - "learning_rate": 1.9949764006777508e-06, - "loss": 1.04, - "step": 7136 - }, - { - "epoch": 0.18, - "learning_rate": 1.994973630214619e-06, - "loss": 1.0078, - "step": 7137 - }, - { - "epoch": 0.18, - "learning_rate": 1.994970858989681e-06, - "loss": 0.9229, - "step": 7138 - }, - { - "epoch": 0.18, - "learning_rate": 1.9949680870029395e-06, - "loss": 0.8486, - "step": 7139 - }, - { - "epoch": 0.18, - "learning_rate": 1.994965314254397e-06, - "loss": 1.0635, - "step": 7140 - }, - { - "epoch": 0.18, - "learning_rate": 1.9949625407440554e-06, - "loss": 0.834, - "step": 7141 - }, - { - "epoch": 0.18, - "learning_rate": 1.9949597664719167e-06, - "loss": 0.8262, - "step": 7142 - }, - { - "epoch": 0.18, - "learning_rate": 1.994956991437983e-06, - "loss": 0.8408, - "step": 7143 - }, - { - "epoch": 0.18, - "learning_rate": 1.9949542156422564e-06, - "loss": 0.9033, - "step": 7144 - }, - { - "epoch": 0.18, - "learning_rate": 1.994951439084739e-06, - "loss": 1.0947, - "step": 7145 - }, - { - "epoch": 0.18, - "learning_rate": 1.994948661765433e-06, - "loss": 0.8262, - "step": 7146 - }, - { - "epoch": 0.18, - "learning_rate": 1.9949458836843406e-06, - "loss": 0.7266, - "step": 7147 - }, - { - "epoch": 0.18, - "learning_rate": 1.994943104841464e-06, - "loss": 0.9121, - "step": 7148 - }, - { - "epoch": 0.18, - "learning_rate": 1.9949403252368052e-06, - "loss": 0.9111, - "step": 7149 - }, - { - "epoch": 0.18, - "learning_rate": 1.9949375448703666e-06, - "loss": 0.9023, - "step": 7150 - }, - { - "epoch": 0.18, - "learning_rate": 1.9949347637421497e-06, - "loss": 0.8794, - "step": 7151 - }, - { - "epoch": 0.18, - "learning_rate": 1.994931981852157e-06, - "loss": 0.9229, - "step": 7152 - }, - { - "epoch": 0.18, - "learning_rate": 1.9949291992003905e-06, - "loss": 0.8164, - "step": 7153 - }, - { - "epoch": 0.18, - "learning_rate": 1.994926415786853e-06, - "loss": 1.0439, - "step": 7154 - }, - { - "epoch": 0.18, - "learning_rate": 1.994923631611546e-06, - "loss": 1.0391, - "step": 7155 - }, - { - "epoch": 0.18, - "learning_rate": 1.9949208466744713e-06, - "loss": 0.521, - "step": 7156 - }, - { - "epoch": 0.18, - "learning_rate": 1.9949180609756316e-06, - "loss": 0.9307, - "step": 7157 - }, - { - "epoch": 0.18, - "learning_rate": 1.994915274515029e-06, - "loss": 0.9014, - "step": 7158 - }, - { - "epoch": 0.18, - "learning_rate": 1.9949124872926654e-06, - "loss": 0.9453, - "step": 7159 - }, - { - "epoch": 0.18, - "learning_rate": 1.994909699308543e-06, - "loss": 0.7358, - "step": 7160 - }, - { - "epoch": 0.18, - "learning_rate": 1.9949069105626645e-06, - "loss": 0.9111, - "step": 7161 - }, - { - "epoch": 0.18, - "learning_rate": 1.994904121055031e-06, - "loss": 0.9932, - "step": 7162 - }, - { - "epoch": 0.18, - "learning_rate": 1.9949013307856456e-06, - "loss": 1.0146, - "step": 7163 - }, - { - "epoch": 0.18, - "learning_rate": 1.9948985397545095e-06, - "loss": 0.8325, - "step": 7164 - }, - { - "epoch": 0.18, - "learning_rate": 1.9948957479616256e-06, - "loss": 0.8965, - "step": 7165 - }, - { - "epoch": 0.18, - "learning_rate": 1.9948929554069956e-06, - "loss": 1.0391, - "step": 7166 - }, - { - "epoch": 0.18, - "learning_rate": 1.994890162090622e-06, - "loss": 0.6484, - "step": 7167 - }, - { - "epoch": 0.18, - "learning_rate": 1.994887368012507e-06, - "loss": 0.7886, - "step": 7168 - }, - { - "epoch": 0.18, - "learning_rate": 1.994884573172652e-06, - "loss": 0.8848, - "step": 7169 - }, - { - "epoch": 0.18, - "learning_rate": 1.99488177757106e-06, - "loss": 0.96, - "step": 7170 - }, - { - "epoch": 0.18, - "learning_rate": 1.9948789812077323e-06, - "loss": 0.9023, - "step": 7171 - }, - { - "epoch": 0.18, - "learning_rate": 1.994876184082672e-06, - "loss": 0.8535, - "step": 7172 - }, - { - "epoch": 0.18, - "learning_rate": 1.99487338619588e-06, - "loss": 0.9541, - "step": 7173 - }, - { - "epoch": 0.18, - "learning_rate": 1.99487058754736e-06, - "loss": 0.9487, - "step": 7174 - }, - { - "epoch": 0.18, - "learning_rate": 1.994867788137113e-06, - "loss": 0.8975, - "step": 7175 - }, - { - "epoch": 0.18, - "learning_rate": 1.9948649879651414e-06, - "loss": 0.8369, - "step": 7176 - }, - { - "epoch": 0.18, - "learning_rate": 1.994862187031448e-06, - "loss": 0.8005, - "step": 7177 - }, - { - "epoch": 0.18, - "learning_rate": 1.9948593853360337e-06, - "loss": 0.9316, - "step": 7178 - }, - { - "epoch": 0.18, - "learning_rate": 1.9948565828789013e-06, - "loss": 0.7136, - "step": 7179 - }, - { - "epoch": 0.18, - "learning_rate": 1.9948537796600533e-06, - "loss": 0.8613, - "step": 7180 - }, - { - "epoch": 0.18, - "learning_rate": 1.9948509756794914e-06, - "loss": 1.0352, - "step": 7181 - }, - { - "epoch": 0.18, - "learning_rate": 1.9948481709372182e-06, - "loss": 0.8926, - "step": 7182 - }, - { - "epoch": 0.18, - "learning_rate": 1.994845365433235e-06, - "loss": 0.8857, - "step": 7183 - }, - { - "epoch": 0.18, - "learning_rate": 1.9948425591675447e-06, - "loss": 0.9629, - "step": 7184 - }, - { - "epoch": 0.18, - "learning_rate": 1.994839752140149e-06, - "loss": 0.9014, - "step": 7185 - }, - { - "epoch": 0.18, - "learning_rate": 1.9948369443510504e-06, - "loss": 1.1328, - "step": 7186 - }, - { - "epoch": 0.18, - "learning_rate": 1.994834135800251e-06, - "loss": 0.719, - "step": 7187 - }, - { - "epoch": 0.18, - "learning_rate": 1.9948313264877524e-06, - "loss": 0.9141, - "step": 7188 - }, - { - "epoch": 0.18, - "learning_rate": 1.9948285164135575e-06, - "loss": 0.9414, - "step": 7189 - }, - { - "epoch": 0.18, - "learning_rate": 1.9948257055776683e-06, - "loss": 0.9443, - "step": 7190 - }, - { - "epoch": 0.18, - "learning_rate": 1.9948228939800864e-06, - "loss": 0.9404, - "step": 7191 - }, - { - "epoch": 0.18, - "learning_rate": 1.994820081620815e-06, - "loss": 0.9492, - "step": 7192 - }, - { - "epoch": 0.18, - "learning_rate": 1.994817268499855e-06, - "loss": 0.9619, - "step": 7193 - }, - { - "epoch": 0.18, - "learning_rate": 1.9948144546172093e-06, - "loss": 0.8218, - "step": 7194 - }, - { - "epoch": 0.18, - "learning_rate": 1.99481163997288e-06, - "loss": 0.793, - "step": 7195 - }, - { - "epoch": 0.18, - "learning_rate": 1.9948088245668694e-06, - "loss": 0.9922, - "step": 7196 - }, - { - "epoch": 0.18, - "learning_rate": 1.994806008399179e-06, - "loss": 1.0967, - "step": 7197 - }, - { - "epoch": 0.18, - "learning_rate": 1.9948031914698117e-06, - "loss": 0.8188, - "step": 7198 - }, - { - "epoch": 0.18, - "learning_rate": 1.9948003737787688e-06, - "loss": 1.0088, - "step": 7199 - }, - { - "epoch": 0.18, - "learning_rate": 1.9947975553260535e-06, - "loss": 0.9053, - "step": 7200 - }, - { - "epoch": 0.18, - "learning_rate": 1.9947947361116672e-06, - "loss": 0.9307, - "step": 7201 - }, - { - "epoch": 0.18, - "learning_rate": 1.9947919161356128e-06, - "loss": 0.9033, - "step": 7202 - }, - { - "epoch": 0.18, - "learning_rate": 1.9947890953978915e-06, - "loss": 0.8857, - "step": 7203 - }, - { - "epoch": 0.18, - "learning_rate": 1.994786273898506e-06, - "loss": 0.8311, - "step": 7204 - }, - { - "epoch": 0.18, - "learning_rate": 1.9947834516374585e-06, - "loss": 1.0156, - "step": 7205 - }, - { - "epoch": 0.18, - "learning_rate": 1.9947806286147507e-06, - "loss": 1.1172, - "step": 7206 - }, - { - "epoch": 0.18, - "learning_rate": 1.9947778048303857e-06, - "loss": 0.8281, - "step": 7207 - }, - { - "epoch": 0.18, - "learning_rate": 1.994774980284365e-06, - "loss": 0.915, - "step": 7208 - }, - { - "epoch": 0.18, - "learning_rate": 1.9947721549766903e-06, - "loss": 0.8955, - "step": 7209 - }, - { - "epoch": 0.18, - "learning_rate": 1.9947693289073646e-06, - "loss": 0.7788, - "step": 7210 - }, - { - "epoch": 0.18, - "learning_rate": 1.99476650207639e-06, - "loss": 0.7622, - "step": 7211 - }, - { - "epoch": 0.18, - "learning_rate": 1.994763674483768e-06, - "loss": 0.8833, - "step": 7212 - }, - { - "epoch": 0.18, - "learning_rate": 1.9947608461295016e-06, - "loss": 0.7998, - "step": 7213 - }, - { - "epoch": 0.18, - "learning_rate": 1.9947580170135923e-06, - "loss": 0.8906, - "step": 7214 - }, - { - "epoch": 0.18, - "learning_rate": 1.9947551871360425e-06, - "loss": 0.8906, - "step": 7215 - }, - { - "epoch": 0.18, - "learning_rate": 1.9947523564968546e-06, - "loss": 0.9287, - "step": 7216 - }, - { - "epoch": 0.18, - "learning_rate": 1.9947495250960308e-06, - "loss": 0.8115, - "step": 7217 - }, - { - "epoch": 0.19, - "learning_rate": 1.9947466929335723e-06, - "loss": 0.7881, - "step": 7218 - }, - { - "epoch": 0.19, - "learning_rate": 1.9947438600094825e-06, - "loss": 0.9492, - "step": 7219 - }, - { - "epoch": 0.19, - "learning_rate": 1.9947410263237628e-06, - "loss": 1.0107, - "step": 7220 - }, - { - "epoch": 0.19, - "learning_rate": 1.994738191876416e-06, - "loss": 0.7556, - "step": 7221 - }, - { - "epoch": 0.19, - "learning_rate": 1.994735356667444e-06, - "loss": 0.874, - "step": 7222 - }, - { - "epoch": 0.19, - "learning_rate": 1.994732520696848e-06, - "loss": 0.689, - "step": 7223 - }, - { - "epoch": 0.19, - "learning_rate": 1.994729683964632e-06, - "loss": 0.8447, - "step": 7224 - }, - { - "epoch": 0.19, - "learning_rate": 1.9947268464707965e-06, - "loss": 0.6499, - "step": 7225 - }, - { - "epoch": 0.19, - "learning_rate": 1.994724008215345e-06, - "loss": 1.0762, - "step": 7226 - }, - { - "epoch": 0.19, - "learning_rate": 1.9947211691982787e-06, - "loss": 0.7109, - "step": 7227 - }, - { - "epoch": 0.19, - "learning_rate": 1.9947183294196003e-06, - "loss": 0.8511, - "step": 7228 - }, - { - "epoch": 0.19, - "learning_rate": 1.9947154888793117e-06, - "loss": 0.877, - "step": 7229 - }, - { - "epoch": 0.19, - "learning_rate": 1.994712647577415e-06, - "loss": 1.0337, - "step": 7230 - }, - { - "epoch": 0.19, - "learning_rate": 1.994709805513913e-06, - "loss": 0.875, - "step": 7231 - }, - { - "epoch": 0.19, - "learning_rate": 1.994706962688807e-06, - "loss": 1.1074, - "step": 7232 - }, - { - "epoch": 0.19, - "learning_rate": 1.9947041191021e-06, - "loss": 0.9453, - "step": 7233 - }, - { - "epoch": 0.19, - "learning_rate": 1.994701274753794e-06, - "loss": 0.9209, - "step": 7234 - }, - { - "epoch": 0.19, - "learning_rate": 1.99469842964389e-06, - "loss": 1.0293, - "step": 7235 - }, - { - "epoch": 0.19, - "learning_rate": 1.9946955837723923e-06, - "loss": 0.8037, - "step": 7236 - }, - { - "epoch": 0.19, - "learning_rate": 1.9946927371393013e-06, - "loss": 0.8916, - "step": 7237 - }, - { - "epoch": 0.19, - "learning_rate": 1.9946898897446197e-06, - "loss": 0.707, - "step": 7238 - }, - { - "epoch": 0.19, - "learning_rate": 1.9946870415883504e-06, - "loss": 0.8994, - "step": 7239 - }, - { - "epoch": 0.19, - "learning_rate": 1.9946841926704943e-06, - "loss": 0.8955, - "step": 7240 - }, - { - "epoch": 0.19, - "learning_rate": 1.9946813429910544e-06, - "loss": 0.7695, - "step": 7241 - }, - { - "epoch": 0.19, - "learning_rate": 1.994678492550033e-06, - "loss": 0.7661, - "step": 7242 - }, - { - "epoch": 0.19, - "learning_rate": 1.994675641347432e-06, - "loss": 0.8838, - "step": 7243 - }, - { - "epoch": 0.19, - "learning_rate": 1.994672789383253e-06, - "loss": 0.876, - "step": 7244 - }, - { - "epoch": 0.19, - "learning_rate": 1.9946699366574995e-06, - "loss": 0.877, - "step": 7245 - }, - { - "epoch": 0.19, - "learning_rate": 1.9946670831701726e-06, - "loss": 0.9756, - "step": 7246 - }, - { - "epoch": 0.19, - "learning_rate": 1.9946642289212754e-06, - "loss": 0.9648, - "step": 7247 - }, - { - "epoch": 0.19, - "learning_rate": 1.9946613739108087e-06, - "loss": 0.7588, - "step": 7248 - }, - { - "epoch": 0.19, - "learning_rate": 1.994658518138776e-06, - "loss": 0.8223, - "step": 7249 - }, - { - "epoch": 0.19, - "learning_rate": 1.994655661605179e-06, - "loss": 1.0186, - "step": 7250 - }, - { - "epoch": 0.19, - "learning_rate": 1.9946528043100196e-06, - "loss": 1.0996, - "step": 7251 - }, - { - "epoch": 0.19, - "learning_rate": 1.994649946253301e-06, - "loss": 0.9053, - "step": 7252 - }, - { - "epoch": 0.19, - "learning_rate": 1.994647087435024e-06, - "loss": 0.9951, - "step": 7253 - }, - { - "epoch": 0.19, - "learning_rate": 1.9946442278551915e-06, - "loss": 0.9541, - "step": 7254 - }, - { - "epoch": 0.19, - "learning_rate": 1.9946413675138057e-06, - "loss": 0.8594, - "step": 7255 - }, - { - "epoch": 0.19, - "learning_rate": 1.9946385064108686e-06, - "loss": 0.8604, - "step": 7256 - }, - { - "epoch": 0.19, - "learning_rate": 1.994635644546383e-06, - "loss": 0.833, - "step": 7257 - }, - { - "epoch": 0.19, - "learning_rate": 1.99463278192035e-06, - "loss": 0.8291, - "step": 7258 - }, - { - "epoch": 0.19, - "learning_rate": 1.9946299185327734e-06, - "loss": 1.0762, - "step": 7259 - }, - { - "epoch": 0.19, - "learning_rate": 1.9946270543836534e-06, - "loss": 0.916, - "step": 7260 - }, - { - "epoch": 0.19, - "learning_rate": 1.9946241894729937e-06, - "loss": 0.8955, - "step": 7261 - }, - { - "epoch": 0.19, - "learning_rate": 1.9946213238007963e-06, - "loss": 1.0254, - "step": 7262 - }, - { - "epoch": 0.19, - "learning_rate": 1.9946184573670624e-06, - "loss": 0.96, - "step": 7263 - }, - { - "epoch": 0.19, - "learning_rate": 1.994615590171795e-06, - "loss": 0.7593, - "step": 7264 - }, - { - "epoch": 0.19, - "learning_rate": 1.9946127222149966e-06, - "loss": 0.8069, - "step": 7265 - }, - { - "epoch": 0.19, - "learning_rate": 1.9946098534966683e-06, - "loss": 0.8857, - "step": 7266 - }, - { - "epoch": 0.19, - "learning_rate": 1.994606984016814e-06, - "loss": 0.915, - "step": 7267 - }, - { - "epoch": 0.19, - "learning_rate": 1.994604113775434e-06, - "loss": 0.7969, - "step": 7268 - }, - { - "epoch": 0.19, - "learning_rate": 1.9946012427725317e-06, - "loss": 0.9639, - "step": 7269 - }, - { - "epoch": 0.19, - "learning_rate": 1.9945983710081087e-06, - "loss": 0.9639, - "step": 7270 - }, - { - "epoch": 0.19, - "learning_rate": 1.9945954984821675e-06, - "loss": 0.7949, - "step": 7271 - }, - { - "epoch": 0.19, - "learning_rate": 1.9945926251947106e-06, - "loss": 0.8667, - "step": 7272 - }, - { - "epoch": 0.19, - "learning_rate": 1.9945897511457393e-06, - "loss": 0.8604, - "step": 7273 - }, - { - "epoch": 0.19, - "learning_rate": 1.994586876335257e-06, - "loss": 0.7852, - "step": 7274 - }, - { - "epoch": 0.19, - "learning_rate": 1.9945840007632647e-06, - "loss": 0.8643, - "step": 7275 - }, - { - "epoch": 0.19, - "learning_rate": 1.9945811244297655e-06, - "loss": 0.9043, - "step": 7276 - }, - { - "epoch": 0.19, - "learning_rate": 1.9945782473347613e-06, - "loss": 0.8428, - "step": 7277 - }, - { - "epoch": 0.19, - "learning_rate": 1.994575369478254e-06, - "loss": 1.0312, - "step": 7278 - }, - { - "epoch": 0.19, - "learning_rate": 1.9945724908602465e-06, - "loss": 0.8804, - "step": 7279 - }, - { - "epoch": 0.19, - "learning_rate": 1.9945696114807402e-06, - "loss": 0.9688, - "step": 7280 - }, - { - "epoch": 0.19, - "learning_rate": 1.9945667313397378e-06, - "loss": 0.9893, - "step": 7281 - }, - { - "epoch": 0.19, - "learning_rate": 1.9945638504372412e-06, - "loss": 0.9072, - "step": 7282 - }, - { - "epoch": 0.19, - "learning_rate": 1.9945609687732528e-06, - "loss": 0.9717, - "step": 7283 - }, - { - "epoch": 0.19, - "learning_rate": 1.994558086347775e-06, - "loss": 1.0977, - "step": 7284 - }, - { - "epoch": 0.19, - "learning_rate": 1.99455520316081e-06, - "loss": 0.8975, - "step": 7285 - }, - { - "epoch": 0.19, - "learning_rate": 1.9945523192123595e-06, - "loss": 0.9971, - "step": 7286 - }, - { - "epoch": 0.19, - "learning_rate": 1.994549434502426e-06, - "loss": 0.9355, - "step": 7287 - }, - { - "epoch": 0.19, - "learning_rate": 1.994546549031012e-06, - "loss": 0.8955, - "step": 7288 - }, - { - "epoch": 0.19, - "learning_rate": 1.9945436627981192e-06, - "loss": 1.1318, - "step": 7289 - }, - { - "epoch": 0.19, - "learning_rate": 1.9945407758037503e-06, - "loss": 0.8936, - "step": 7290 - }, - { - "epoch": 0.19, - "learning_rate": 1.994537888047907e-06, - "loss": 0.71, - "step": 7291 - }, - { - "epoch": 0.19, - "learning_rate": 1.9945349995305917e-06, - "loss": 0.9395, - "step": 7292 - }, - { - "epoch": 0.19, - "learning_rate": 1.9945321102518067e-06, - "loss": 1.0449, - "step": 7293 - }, - { - "epoch": 0.19, - "learning_rate": 1.9945292202115543e-06, - "loss": 0.8389, - "step": 7294 - }, - { - "epoch": 0.19, - "learning_rate": 1.9945263294098367e-06, - "loss": 0.6997, - "step": 7295 - }, - { - "epoch": 0.19, - "learning_rate": 1.994523437846656e-06, - "loss": 1.0391, - "step": 7296 - }, - { - "epoch": 0.19, - "learning_rate": 1.9945205455220146e-06, - "loss": 0.9619, - "step": 7297 - }, - { - "epoch": 0.19, - "learning_rate": 1.9945176524359143e-06, - "loss": 0.8037, - "step": 7298 - }, - { - "epoch": 0.19, - "learning_rate": 1.9945147585883576e-06, - "loss": 0.9805, - "step": 7299 - }, - { - "epoch": 0.19, - "learning_rate": 1.9945118639793463e-06, - "loss": 0.7705, - "step": 7300 - }, - { - "epoch": 0.19, - "learning_rate": 1.9945089686088833e-06, - "loss": 0.9082, - "step": 7301 - }, - { - "epoch": 0.19, - "learning_rate": 1.9945060724769707e-06, - "loss": 0.7349, - "step": 7302 - }, - { - "epoch": 0.19, - "learning_rate": 1.9945031755836107e-06, - "loss": 0.9961, - "step": 7303 - }, - { - "epoch": 0.19, - "learning_rate": 1.994500277928805e-06, - "loss": 1.0137, - "step": 7304 - }, - { - "epoch": 0.19, - "learning_rate": 1.9944973795125558e-06, - "loss": 0.959, - "step": 7305 - }, - { - "epoch": 0.19, - "learning_rate": 1.994494480334866e-06, - "loss": 1.0039, - "step": 7306 - }, - { - "epoch": 0.19, - "learning_rate": 1.9944915803957377e-06, - "loss": 1.0146, - "step": 7307 - }, - { - "epoch": 0.19, - "learning_rate": 1.994488679695173e-06, - "loss": 1.083, - "step": 7308 - }, - { - "epoch": 0.19, - "learning_rate": 1.9944857782331738e-06, - "loss": 0.6694, - "step": 7309 - }, - { - "epoch": 0.19, - "learning_rate": 1.9944828760097424e-06, - "loss": 0.998, - "step": 7310 - }, - { - "epoch": 0.19, - "learning_rate": 1.9944799730248814e-06, - "loss": 0.7983, - "step": 7311 - }, - { - "epoch": 0.19, - "learning_rate": 1.9944770692785932e-06, - "loss": 0.7266, - "step": 7312 - }, - { - "epoch": 0.19, - "learning_rate": 1.994474164770879e-06, - "loss": 0.9531, - "step": 7313 - }, - { - "epoch": 0.19, - "learning_rate": 1.9944712595017422e-06, - "loss": 0.6921, - "step": 7314 - }, - { - "epoch": 0.19, - "learning_rate": 1.994468353471184e-06, - "loss": 1.0596, - "step": 7315 - }, - { - "epoch": 0.19, - "learning_rate": 1.9944654466792073e-06, - "loss": 0.8262, - "step": 7316 - }, - { - "epoch": 0.19, - "learning_rate": 1.9944625391258143e-06, - "loss": 0.9326, - "step": 7317 - }, - { - "epoch": 0.19, - "learning_rate": 1.994459630811007e-06, - "loss": 1.0967, - "step": 7318 - }, - { - "epoch": 0.19, - "learning_rate": 1.9944567217347873e-06, - "loss": 1.082, - "step": 7319 - }, - { - "epoch": 0.19, - "learning_rate": 1.9944538118971582e-06, - "loss": 1.0322, - "step": 7320 - }, - { - "epoch": 0.19, - "learning_rate": 1.9944509012981215e-06, - "loss": 0.8164, - "step": 7321 - }, - { - "epoch": 0.19, - "learning_rate": 1.9944479899376793e-06, - "loss": 0.9023, - "step": 7322 - }, - { - "epoch": 0.19, - "learning_rate": 1.9944450778158345e-06, - "loss": 0.8965, - "step": 7323 - }, - { - "epoch": 0.19, - "learning_rate": 1.9944421649325883e-06, - "loss": 0.9541, - "step": 7324 - }, - { - "epoch": 0.19, - "learning_rate": 1.9944392512879434e-06, - "loss": 0.7109, - "step": 7325 - }, - { - "epoch": 0.19, - "learning_rate": 1.9944363368819028e-06, - "loss": 1.0537, - "step": 7326 - }, - { - "epoch": 0.19, - "learning_rate": 1.994433421714467e-06, - "loss": 0.8486, - "step": 7327 - }, - { - "epoch": 0.19, - "learning_rate": 1.99443050578564e-06, - "loss": 0.8633, - "step": 7328 - }, - { - "epoch": 0.19, - "learning_rate": 1.994427589095423e-06, - "loss": 0.8267, - "step": 7329 - }, - { - "epoch": 0.19, - "learning_rate": 1.9944246716438185e-06, - "loss": 1.0576, - "step": 7330 - }, - { - "epoch": 0.19, - "learning_rate": 1.994421753430829e-06, - "loss": 0.7739, - "step": 7331 - }, - { - "epoch": 0.19, - "learning_rate": 1.994418834456456e-06, - "loss": 0.8457, - "step": 7332 - }, - { - "epoch": 0.19, - "learning_rate": 1.994415914720703e-06, - "loss": 0.9775, - "step": 7333 - }, - { - "epoch": 0.19, - "learning_rate": 1.994412994223571e-06, - "loss": 0.582, - "step": 7334 - }, - { - "epoch": 0.19, - "learning_rate": 1.9944100729650628e-06, - "loss": 0.9688, - "step": 7335 - }, - { - "epoch": 0.19, - "learning_rate": 1.99440715094518e-06, - "loss": 0.8457, - "step": 7336 - }, - { - "epoch": 0.19, - "learning_rate": 1.9944042281639263e-06, - "loss": 1.0566, - "step": 7337 - }, - { - "epoch": 0.19, - "learning_rate": 1.994401304621302e-06, - "loss": 1.25, - "step": 7338 - }, - { - "epoch": 0.19, - "learning_rate": 1.9943983803173112e-06, - "loss": 0.9736, - "step": 7339 - }, - { - "epoch": 0.19, - "learning_rate": 1.9943954552519547e-06, - "loss": 1.0752, - "step": 7340 - }, - { - "epoch": 0.19, - "learning_rate": 1.9943925294252358e-06, - "loss": 0.9326, - "step": 7341 - }, - { - "epoch": 0.19, - "learning_rate": 1.9943896028371562e-06, - "loss": 1.0645, - "step": 7342 - }, - { - "epoch": 0.19, - "learning_rate": 1.9943866754877177e-06, - "loss": 0.6782, - "step": 7343 - }, - { - "epoch": 0.19, - "learning_rate": 1.9943837473769232e-06, - "loss": 0.7925, - "step": 7344 - }, - { - "epoch": 0.19, - "learning_rate": 1.9943808185047753e-06, - "loss": 0.7178, - "step": 7345 - }, - { - "epoch": 0.19, - "learning_rate": 1.994377888871275e-06, - "loss": 1.0166, - "step": 7346 - }, - { - "epoch": 0.19, - "learning_rate": 1.994374958476426e-06, - "loss": 0.9385, - "step": 7347 - }, - { - "epoch": 0.19, - "learning_rate": 1.9943720273202295e-06, - "loss": 1.1289, - "step": 7348 - }, - { - "epoch": 0.19, - "learning_rate": 1.994369095402688e-06, - "loss": 0.9521, - "step": 7349 - }, - { - "epoch": 0.19, - "learning_rate": 1.994366162723804e-06, - "loss": 1.1465, - "step": 7350 - }, - { - "epoch": 0.19, - "learning_rate": 1.9943632292835797e-06, - "loss": 0.8701, - "step": 7351 - }, - { - "epoch": 0.19, - "learning_rate": 1.9943602950820165e-06, - "loss": 0.7788, - "step": 7352 - }, - { - "epoch": 0.19, - "learning_rate": 1.994357360119118e-06, - "loss": 0.8955, - "step": 7353 - }, - { - "epoch": 0.19, - "learning_rate": 1.9943544243948852e-06, - "loss": 1.0029, - "step": 7354 - }, - { - "epoch": 0.19, - "learning_rate": 1.9943514879093214e-06, - "loss": 1.001, - "step": 7355 - }, - { - "epoch": 0.19, - "learning_rate": 1.9943485506624283e-06, - "loss": 0.8691, - "step": 7356 - }, - { - "epoch": 0.19, - "learning_rate": 1.994345612654208e-06, - "loss": 0.9512, - "step": 7357 - }, - { - "epoch": 0.19, - "learning_rate": 1.9943426738846635e-06, - "loss": 1.0195, - "step": 7358 - }, - { - "epoch": 0.19, - "learning_rate": 1.994339734353796e-06, - "loss": 0.917, - "step": 7359 - }, - { - "epoch": 0.19, - "learning_rate": 1.9943367940616085e-06, - "loss": 1.0186, - "step": 7360 - }, - { - "epoch": 0.19, - "learning_rate": 1.994333853008103e-06, - "loss": 0.9756, - "step": 7361 - }, - { - "epoch": 0.19, - "learning_rate": 1.994330911193282e-06, - "loss": 0.6533, - "step": 7362 - }, - { - "epoch": 0.19, - "learning_rate": 1.9943279686171473e-06, - "loss": 0.7783, - "step": 7363 - }, - { - "epoch": 0.19, - "learning_rate": 1.994325025279702e-06, - "loss": 1.5605, - "step": 7364 - }, - { - "epoch": 0.19, - "learning_rate": 1.9943220811809466e-06, - "loss": 0.834, - "step": 7365 - }, - { - "epoch": 0.19, - "learning_rate": 1.9943191363208854e-06, - "loss": 0.9365, - "step": 7366 - }, - { - "epoch": 0.19, - "learning_rate": 1.9943161906995194e-06, - "loss": 0.8403, - "step": 7367 - }, - { - "epoch": 0.19, - "learning_rate": 1.994313244316851e-06, - "loss": 0.9189, - "step": 7368 - }, - { - "epoch": 0.19, - "learning_rate": 1.9943102971728833e-06, - "loss": 1.0781, - "step": 7369 - }, - { - "epoch": 0.19, - "learning_rate": 1.9943073492676175e-06, - "loss": 0.8613, - "step": 7370 - }, - { - "epoch": 0.19, - "learning_rate": 1.9943044006010563e-06, - "loss": 1.0049, - "step": 7371 - }, - { - "epoch": 0.19, - "learning_rate": 1.994301451173202e-06, - "loss": 0.8955, - "step": 7372 - }, - { - "epoch": 0.19, - "learning_rate": 1.994298500984057e-06, - "loss": 0.9014, - "step": 7373 - }, - { - "epoch": 0.19, - "learning_rate": 1.9942955500336233e-06, - "loss": 0.7783, - "step": 7374 - }, - { - "epoch": 0.19, - "learning_rate": 1.9942925983219027e-06, - "loss": 0.6914, - "step": 7375 - }, - { - "epoch": 0.19, - "learning_rate": 1.9942896458488987e-06, - "loss": 1.0244, - "step": 7376 - }, - { - "epoch": 0.19, - "learning_rate": 1.9942866926146123e-06, - "loss": 0.8857, - "step": 7377 - }, - { - "epoch": 0.19, - "learning_rate": 1.9942837386190466e-06, - "loss": 0.9277, - "step": 7378 - }, - { - "epoch": 0.19, - "learning_rate": 1.9942807838622033e-06, - "loss": 0.9038, - "step": 7379 - }, - { - "epoch": 0.19, - "learning_rate": 1.9942778283440853e-06, - "loss": 0.9028, - "step": 7380 - }, - { - "epoch": 0.19, - "learning_rate": 1.994274872064694e-06, - "loss": 0.9639, - "step": 7381 - }, - { - "epoch": 0.19, - "learning_rate": 1.9942719150240324e-06, - "loss": 0.9912, - "step": 7382 - }, - { - "epoch": 0.19, - "learning_rate": 1.9942689572221027e-06, - "loss": 0.8687, - "step": 7383 - }, - { - "epoch": 0.19, - "learning_rate": 1.9942659986589067e-06, - "loss": 0.9717, - "step": 7384 - }, - { - "epoch": 0.19, - "learning_rate": 1.994263039334447e-06, - "loss": 0.7974, - "step": 7385 - }, - { - "epoch": 0.19, - "learning_rate": 1.994260079248726e-06, - "loss": 0.6245, - "step": 7386 - }, - { - "epoch": 0.19, - "learning_rate": 1.9942571184017454e-06, - "loss": 1.1426, - "step": 7387 - }, - { - "epoch": 0.19, - "learning_rate": 1.994254156793508e-06, - "loss": 0.8594, - "step": 7388 - }, - { - "epoch": 0.19, - "learning_rate": 1.994251194424016e-06, - "loss": 0.8174, - "step": 7389 - }, - { - "epoch": 0.19, - "learning_rate": 1.9942482312932717e-06, - "loss": 0.9873, - "step": 7390 - }, - { - "epoch": 0.19, - "learning_rate": 1.994245267401277e-06, - "loss": 0.6895, - "step": 7391 - }, - { - "epoch": 0.19, - "learning_rate": 1.9942423027480345e-06, - "loss": 1.0361, - "step": 7392 - }, - { - "epoch": 0.19, - "learning_rate": 1.9942393373335465e-06, - "loss": 0.9521, - "step": 7393 - }, - { - "epoch": 0.19, - "learning_rate": 1.9942363711578147e-06, - "loss": 0.8557, - "step": 7394 - }, - { - "epoch": 0.19, - "learning_rate": 1.9942334042208426e-06, - "loss": 0.7202, - "step": 7395 - }, - { - "epoch": 0.19, - "learning_rate": 1.9942304365226314e-06, - "loss": 0.7256, - "step": 7396 - }, - { - "epoch": 0.19, - "learning_rate": 1.994227468063183e-06, - "loss": 0.9971, - "step": 7397 - }, - { - "epoch": 0.19, - "learning_rate": 1.9942244988425014e-06, - "loss": 0.9131, - "step": 7398 - }, - { - "epoch": 0.19, - "learning_rate": 1.9942215288605872e-06, - "loss": 0.9756, - "step": 7399 - }, - { - "epoch": 0.19, - "learning_rate": 1.9942185581174433e-06, - "loss": 1.0547, - "step": 7400 - }, - { - "epoch": 0.19, - "learning_rate": 1.994215586613072e-06, - "loss": 0.8662, - "step": 7401 - }, - { - "epoch": 0.19, - "learning_rate": 1.9942126143474755e-06, - "loss": 0.9355, - "step": 7402 - }, - { - "epoch": 0.19, - "learning_rate": 1.9942096413206562e-06, - "loss": 0.9717, - "step": 7403 - }, - { - "epoch": 0.19, - "learning_rate": 1.9942066675326165e-06, - "loss": 0.877, - "step": 7404 - }, - { - "epoch": 0.19, - "learning_rate": 1.9942036929833584e-06, - "loss": 0.9004, - "step": 7405 - }, - { - "epoch": 0.19, - "learning_rate": 1.994200717672884e-06, - "loss": 1.0322, - "step": 7406 - }, - { - "epoch": 0.19, - "learning_rate": 1.994197741601196e-06, - "loss": 1.0264, - "step": 7407 - }, - { - "epoch": 0.19, - "learning_rate": 1.9941947647682965e-06, - "loss": 0.8984, - "step": 7408 - }, - { - "epoch": 0.19, - "learning_rate": 1.994191787174188e-06, - "loss": 0.7466, - "step": 7409 - }, - { - "epoch": 0.19, - "learning_rate": 1.994188808818872e-06, - "loss": 0.9873, - "step": 7410 - }, - { - "epoch": 0.19, - "learning_rate": 1.9941858297023517e-06, - "loss": 0.8062, - "step": 7411 - }, - { - "epoch": 0.19, - "learning_rate": 1.9941828498246288e-06, - "loss": 0.7295, - "step": 7412 - }, - { - "epoch": 0.19, - "learning_rate": 1.994179869185706e-06, - "loss": 0.6675, - "step": 7413 - }, - { - "epoch": 0.19, - "learning_rate": 1.9941768877855854e-06, - "loss": 0.7119, - "step": 7414 - }, - { - "epoch": 0.19, - "learning_rate": 1.994173905624269e-06, - "loss": 0.8906, - "step": 7415 - }, - { - "epoch": 0.19, - "learning_rate": 1.9941709227017597e-06, - "loss": 0.8887, - "step": 7416 - }, - { - "epoch": 0.19, - "learning_rate": 1.9941679390180598e-06, - "loss": 0.647, - "step": 7417 - }, - { - "epoch": 0.19, - "learning_rate": 1.9941649545731703e-06, - "loss": 0.9014, - "step": 7418 - }, - { - "epoch": 0.19, - "learning_rate": 1.994161969367095e-06, - "loss": 0.8574, - "step": 7419 - }, - { - "epoch": 0.19, - "learning_rate": 1.9941589833998354e-06, - "loss": 0.8516, - "step": 7420 - }, - { - "epoch": 0.19, - "learning_rate": 1.9941559966713943e-06, - "loss": 0.9648, - "step": 7421 - }, - { - "epoch": 0.19, - "learning_rate": 1.9941530091817733e-06, - "loss": 0.752, - "step": 7422 - }, - { - "epoch": 0.19, - "learning_rate": 1.994150020930975e-06, - "loss": 0.9902, - "step": 7423 - }, - { - "epoch": 0.19, - "learning_rate": 1.994147031919002e-06, - "loss": 0.9414, - "step": 7424 - }, - { - "epoch": 0.19, - "learning_rate": 1.994144042145856e-06, - "loss": 0.8643, - "step": 7425 - }, - { - "epoch": 0.19, - "learning_rate": 1.99414105161154e-06, - "loss": 0.748, - "step": 7426 - }, - { - "epoch": 0.19, - "learning_rate": 1.9941380603160556e-06, - "loss": 1.002, - "step": 7427 - }, - { - "epoch": 0.19, - "learning_rate": 1.994135068259406e-06, - "loss": 1.0176, - "step": 7428 - }, - { - "epoch": 0.19, - "learning_rate": 1.994132075441592e-06, - "loss": 0.8223, - "step": 7429 - }, - { - "epoch": 0.19, - "learning_rate": 1.9941290818626175e-06, - "loss": 0.9873, - "step": 7430 - }, - { - "epoch": 0.19, - "learning_rate": 1.9941260875224838e-06, - "loss": 0.9893, - "step": 7431 - }, - { - "epoch": 0.19, - "learning_rate": 1.9941230924211935e-06, - "loss": 0.8389, - "step": 7432 - }, - { - "epoch": 0.19, - "learning_rate": 1.9941200965587484e-06, - "loss": 1.0654, - "step": 7433 - }, - { - "epoch": 0.19, - "learning_rate": 1.994117099935152e-06, - "loss": 1.0889, - "step": 7434 - }, - { - "epoch": 0.19, - "learning_rate": 1.994114102550405e-06, - "loss": 1.0, - "step": 7435 - }, - { - "epoch": 0.19, - "learning_rate": 1.9941111044045113e-06, - "loss": 0.8447, - "step": 7436 - }, - { - "epoch": 0.19, - "learning_rate": 1.9941081054974724e-06, - "loss": 0.8379, - "step": 7437 - }, - { - "epoch": 0.19, - "learning_rate": 1.9941051058292905e-06, - "loss": 0.8301, - "step": 7438 - }, - { - "epoch": 0.19, - "learning_rate": 1.9941021053999677e-06, - "loss": 0.9785, - "step": 7439 - }, - { - "epoch": 0.19, - "learning_rate": 1.994099104209507e-06, - "loss": 1.0283, - "step": 7440 - }, - { - "epoch": 0.19, - "learning_rate": 1.9940961022579102e-06, - "loss": 0.877, - "step": 7441 - }, - { - "epoch": 0.19, - "learning_rate": 1.99409309954518e-06, - "loss": 0.8828, - "step": 7442 - }, - { - "epoch": 0.19, - "learning_rate": 1.994090096071318e-06, - "loss": 0.8896, - "step": 7443 - }, - { - "epoch": 0.19, - "learning_rate": 1.9940870918363273e-06, - "loss": 0.958, - "step": 7444 - }, - { - "epoch": 0.19, - "learning_rate": 1.9940840868402094e-06, - "loss": 0.8154, - "step": 7445 - }, - { - "epoch": 0.19, - "learning_rate": 1.9940810810829673e-06, - "loss": 0.9277, - "step": 7446 - }, - { - "epoch": 0.19, - "learning_rate": 1.994078074564603e-06, - "loss": 0.7729, - "step": 7447 - }, - { - "epoch": 0.19, - "learning_rate": 1.9940750672851185e-06, - "loss": 0.9639, - "step": 7448 - }, - { - "epoch": 0.19, - "learning_rate": 1.994072059244517e-06, - "loss": 1.041, - "step": 7449 - }, - { - "epoch": 0.19, - "learning_rate": 1.9940690504428e-06, - "loss": 0.9199, - "step": 7450 - }, - { - "epoch": 0.19, - "learning_rate": 1.9940660408799696e-06, - "loss": 1.0669, - "step": 7451 - }, - { - "epoch": 0.19, - "learning_rate": 1.994063030556029e-06, - "loss": 0.9043, - "step": 7452 - }, - { - "epoch": 0.19, - "learning_rate": 1.99406001947098e-06, - "loss": 0.7607, - "step": 7453 - }, - { - "epoch": 0.19, - "learning_rate": 1.994057007624825e-06, - "loss": 0.9385, - "step": 7454 - }, - { - "epoch": 0.19, - "learning_rate": 1.994053995017566e-06, - "loss": 0.9775, - "step": 7455 - }, - { - "epoch": 0.19, - "learning_rate": 1.994050981649206e-06, - "loss": 0.7441, - "step": 7456 - }, - { - "epoch": 0.19, - "learning_rate": 1.9940479675197465e-06, - "loss": 0.9658, - "step": 7457 - }, - { - "epoch": 0.19, - "learning_rate": 1.9940449526291904e-06, - "loss": 0.8457, - "step": 7458 - }, - { - "epoch": 0.19, - "learning_rate": 1.9940419369775395e-06, - "loss": 1.1104, - "step": 7459 - }, - { - "epoch": 0.19, - "learning_rate": 1.9940389205647965e-06, - "loss": 1.1836, - "step": 7460 - }, - { - "epoch": 0.19, - "learning_rate": 1.994035903390964e-06, - "loss": 1.0303, - "step": 7461 - }, - { - "epoch": 0.19, - "learning_rate": 1.9940328854560434e-06, - "loss": 0.9443, - "step": 7462 - }, - { - "epoch": 0.19, - "learning_rate": 1.9940298667600376e-06, - "loss": 1.1094, - "step": 7463 - }, - { - "epoch": 0.19, - "learning_rate": 1.994026847302949e-06, - "loss": 0.8555, - "step": 7464 - }, - { - "epoch": 0.19, - "learning_rate": 1.99402382708478e-06, - "loss": 0.9473, - "step": 7465 - }, - { - "epoch": 0.19, - "learning_rate": 1.994020806105532e-06, - "loss": 0.9502, - "step": 7466 - }, - { - "epoch": 0.19, - "learning_rate": 1.9940177843652084e-06, - "loss": 1.0439, - "step": 7467 - }, - { - "epoch": 0.19, - "learning_rate": 1.994014761863811e-06, - "loss": 0.7959, - "step": 7468 - }, - { - "epoch": 0.19, - "learning_rate": 1.9940117386013425e-06, - "loss": 0.96, - "step": 7469 - }, - { - "epoch": 0.19, - "learning_rate": 1.9940087145778043e-06, - "loss": 1.0293, - "step": 7470 - }, - { - "epoch": 0.19, - "learning_rate": 1.9940056897932e-06, - "loss": 0.7441, - "step": 7471 - }, - { - "epoch": 0.19, - "learning_rate": 1.9940026642475308e-06, - "loss": 0.9111, - "step": 7472 - }, - { - "epoch": 0.19, - "learning_rate": 1.9939996379407996e-06, - "loss": 0.8877, - "step": 7473 - }, - { - "epoch": 0.19, - "learning_rate": 1.9939966108730086e-06, - "loss": 1.0498, - "step": 7474 - }, - { - "epoch": 0.19, - "learning_rate": 1.99399358304416e-06, - "loss": 1.0127, - "step": 7475 - }, - { - "epoch": 0.19, - "learning_rate": 1.9939905544542563e-06, - "loss": 0.9961, - "step": 7476 - }, - { - "epoch": 0.19, - "learning_rate": 1.9939875251032997e-06, - "loss": 0.8228, - "step": 7477 - }, - { - "epoch": 0.19, - "learning_rate": 1.9939844949912926e-06, - "loss": 1.1348, - "step": 7478 - }, - { - "epoch": 0.19, - "learning_rate": 1.9939814641182373e-06, - "loss": 0.9082, - "step": 7479 - }, - { - "epoch": 0.19, - "learning_rate": 1.993978432484136e-06, - "loss": 1.0264, - "step": 7480 - }, - { - "epoch": 0.19, - "learning_rate": 1.9939754000889914e-06, - "loss": 0.9473, - "step": 7481 - }, - { - "epoch": 0.19, - "learning_rate": 1.9939723669328054e-06, - "loss": 0.8496, - "step": 7482 - }, - { - "epoch": 0.19, - "learning_rate": 1.9939693330155802e-06, - "loss": 1.04, - "step": 7483 - }, - { - "epoch": 0.19, - "learning_rate": 1.993966298337319e-06, - "loss": 0.8682, - "step": 7484 - }, - { - "epoch": 0.19, - "learning_rate": 1.993963262898023e-06, - "loss": 0.8789, - "step": 7485 - }, - { - "epoch": 0.19, - "learning_rate": 1.993960226697695e-06, - "loss": 1.0908, - "step": 7486 - }, - { - "epoch": 0.19, - "learning_rate": 1.9939571897363375e-06, - "loss": 0.8169, - "step": 7487 - }, - { - "epoch": 0.19, - "learning_rate": 1.9939541520139523e-06, - "loss": 0.6921, - "step": 7488 - }, - { - "epoch": 0.19, - "learning_rate": 1.993951113530543e-06, - "loss": 0.999, - "step": 7489 - }, - { - "epoch": 0.19, - "learning_rate": 1.99394807428611e-06, - "loss": 0.877, - "step": 7490 - }, - { - "epoch": 0.19, - "learning_rate": 1.9939450342806573e-06, - "loss": 0.7354, - "step": 7491 - }, - { - "epoch": 0.19, - "learning_rate": 1.9939419935141865e-06, - "loss": 1.0332, - "step": 7492 - }, - { - "epoch": 0.19, - "learning_rate": 1.9939389519867002e-06, - "loss": 0.8486, - "step": 7493 - }, - { - "epoch": 0.19, - "learning_rate": 1.9939359096982e-06, - "loss": 0.9082, - "step": 7494 - }, - { - "epoch": 0.19, - "learning_rate": 1.9939328666486893e-06, - "loss": 0.8667, - "step": 7495 - }, - { - "epoch": 0.19, - "learning_rate": 1.9939298228381697e-06, - "loss": 0.8711, - "step": 7496 - }, - { - "epoch": 0.19, - "learning_rate": 1.9939267782666435e-06, - "loss": 0.9961, - "step": 7497 - }, - { - "epoch": 0.19, - "learning_rate": 1.993923732934114e-06, - "loss": 1.002, - "step": 7498 - }, - { - "epoch": 0.19, - "learning_rate": 1.993920686840582e-06, - "loss": 1.0225, - "step": 7499 - }, - { - "epoch": 0.19, - "learning_rate": 1.9939176399860508e-06, - "loss": 1.0195, - "step": 7500 - }, - { - "epoch": 0.19, - "learning_rate": 1.9939145923705228e-06, - "loss": 0.8218, - "step": 7501 - }, - { - "epoch": 0.19, - "learning_rate": 1.993911543994e-06, - "loss": 0.9629, - "step": 7502 - }, - { - "epoch": 0.19, - "learning_rate": 1.9939084948564848e-06, - "loss": 1.1094, - "step": 7503 - }, - { - "epoch": 0.19, - "learning_rate": 1.99390544495798e-06, - "loss": 0.9727, - "step": 7504 - }, - { - "epoch": 0.19, - "learning_rate": 1.993902394298487e-06, - "loss": 0.9658, - "step": 7505 - }, - { - "epoch": 0.19, - "learning_rate": 1.9938993428780085e-06, - "loss": 0.9619, - "step": 7506 - }, - { - "epoch": 0.19, - "learning_rate": 1.9938962906965473e-06, - "loss": 0.8838, - "step": 7507 - }, - { - "epoch": 0.19, - "learning_rate": 1.9938932377541054e-06, - "loss": 0.876, - "step": 7508 - }, - { - "epoch": 0.19, - "learning_rate": 1.993890184050685e-06, - "loss": 0.9385, - "step": 7509 - }, - { - "epoch": 0.19, - "learning_rate": 1.9938871295862886e-06, - "loss": 0.8809, - "step": 7510 - }, - { - "epoch": 0.19, - "learning_rate": 1.9938840743609187e-06, - "loss": 0.8579, - "step": 7511 - }, - { - "epoch": 0.19, - "learning_rate": 1.9938810183745775e-06, - "loss": 0.6924, - "step": 7512 - }, - { - "epoch": 0.19, - "learning_rate": 1.993877961627267e-06, - "loss": 0.9336, - "step": 7513 - }, - { - "epoch": 0.19, - "learning_rate": 1.99387490411899e-06, - "loss": 0.9761, - "step": 7514 - }, - { - "epoch": 0.19, - "learning_rate": 1.993871845849749e-06, - "loss": 1.04, - "step": 7515 - }, - { - "epoch": 0.19, - "learning_rate": 1.9938687868195456e-06, - "loss": 0.814, - "step": 7516 - }, - { - "epoch": 0.19, - "learning_rate": 1.9938657270283823e-06, - "loss": 0.7646, - "step": 7517 - }, - { - "epoch": 0.19, - "learning_rate": 1.993862666476262e-06, - "loss": 0.7485, - "step": 7518 - }, - { - "epoch": 0.19, - "learning_rate": 1.9938596051631872e-06, - "loss": 0.7847, - "step": 7519 - }, - { - "epoch": 0.19, - "learning_rate": 1.9938565430891592e-06, - "loss": 1.0908, - "step": 7520 - }, - { - "epoch": 0.19, - "learning_rate": 1.9938534802541814e-06, - "loss": 0.8213, - "step": 7521 - }, - { - "epoch": 0.19, - "learning_rate": 1.9938504166582554e-06, - "loss": 1.1855, - "step": 7522 - }, - { - "epoch": 0.19, - "learning_rate": 1.9938473523013838e-06, - "loss": 0.8867, - "step": 7523 - }, - { - "epoch": 0.19, - "learning_rate": 1.993844287183569e-06, - "loss": 0.9268, - "step": 7524 - }, - { - "epoch": 0.19, - "learning_rate": 1.9938412213048135e-06, - "loss": 1.0293, - "step": 7525 - }, - { - "epoch": 0.19, - "learning_rate": 1.9938381546651195e-06, - "loss": 0.7129, - "step": 7526 - }, - { - "epoch": 0.19, - "learning_rate": 1.993835087264489e-06, - "loss": 0.7842, - "step": 7527 - }, - { - "epoch": 0.19, - "learning_rate": 1.993832019102925e-06, - "loss": 1.0938, - "step": 7528 - }, - { - "epoch": 0.19, - "learning_rate": 1.9938289501804295e-06, - "loss": 0.9336, - "step": 7529 - }, - { - "epoch": 0.19, - "learning_rate": 1.9938258804970048e-06, - "loss": 0.9209, - "step": 7530 - }, - { - "epoch": 0.19, - "learning_rate": 1.9938228100526535e-06, - "loss": 1.0977, - "step": 7531 - }, - { - "epoch": 0.19, - "learning_rate": 1.9938197388473774e-06, - "loss": 1.0957, - "step": 7532 - }, - { - "epoch": 0.19, - "learning_rate": 1.9938166668811794e-06, - "loss": 0.8789, - "step": 7533 - }, - { - "epoch": 0.19, - "learning_rate": 1.9938135941540616e-06, - "loss": 1.0234, - "step": 7534 - }, - { - "epoch": 0.19, - "learning_rate": 1.9938105206660266e-06, - "loss": 1.0132, - "step": 7535 - }, - { - "epoch": 0.19, - "learning_rate": 1.9938074464170765e-06, - "loss": 0.8574, - "step": 7536 - }, - { - "epoch": 0.19, - "learning_rate": 1.993804371407214e-06, - "loss": 0.8525, - "step": 7537 - }, - { - "epoch": 0.19, - "learning_rate": 1.9938012956364407e-06, - "loss": 1.2109, - "step": 7538 - }, - { - "epoch": 0.19, - "learning_rate": 1.9937982191047596e-06, - "loss": 0.9805, - "step": 7539 - }, - { - "epoch": 0.19, - "learning_rate": 1.993795141812173e-06, - "loss": 0.9863, - "step": 7540 - }, - { - "epoch": 0.19, - "learning_rate": 1.993792063758683e-06, - "loss": 0.7451, - "step": 7541 - }, - { - "epoch": 0.19, - "learning_rate": 1.993788984944292e-06, - "loss": 0.8193, - "step": 7542 - }, - { - "epoch": 0.19, - "learning_rate": 1.993785905369003e-06, - "loss": 0.8154, - "step": 7543 - }, - { - "epoch": 0.19, - "learning_rate": 1.9937828250328176e-06, - "loss": 0.7625, - "step": 7544 - }, - { - "epoch": 0.19, - "learning_rate": 1.9937797439357382e-06, - "loss": 0.8931, - "step": 7545 - }, - { - "epoch": 0.19, - "learning_rate": 1.9937766620777675e-06, - "loss": 0.833, - "step": 7546 - }, - { - "epoch": 0.19, - "learning_rate": 1.9937735794589075e-06, - "loss": 0.7761, - "step": 7547 - }, - { - "epoch": 0.19, - "learning_rate": 1.993770496079161e-06, - "loss": 0.9268, - "step": 7548 - }, - { - "epoch": 0.19, - "learning_rate": 1.9937674119385298e-06, - "loss": 0.6821, - "step": 7549 - }, - { - "epoch": 0.19, - "learning_rate": 1.993764327037017e-06, - "loss": 0.8516, - "step": 7550 - }, - { - "epoch": 0.19, - "learning_rate": 1.9937612413746242e-06, - "loss": 0.7202, - "step": 7551 - }, - { - "epoch": 0.19, - "learning_rate": 1.9937581549513543e-06, - "loss": 0.7627, - "step": 7552 - }, - { - "epoch": 0.19, - "learning_rate": 1.99375506776721e-06, - "loss": 0.8574, - "step": 7553 - }, - { - "epoch": 0.19, - "learning_rate": 1.9937519798221923e-06, - "loss": 0.8896, - "step": 7554 - }, - { - "epoch": 0.19, - "learning_rate": 1.993748891116305e-06, - "loss": 0.7217, - "step": 7555 - }, - { - "epoch": 0.19, - "learning_rate": 1.9937458016495494e-06, - "loss": 0.7354, - "step": 7556 - }, - { - "epoch": 0.19, - "learning_rate": 1.9937427114219284e-06, - "loss": 1.1484, - "step": 7557 - }, - { - "epoch": 0.19, - "learning_rate": 1.9937396204334443e-06, - "loss": 0.7231, - "step": 7558 - }, - { - "epoch": 0.19, - "learning_rate": 1.9937365286841e-06, - "loss": 0.915, - "step": 7559 - }, - { - "epoch": 0.19, - "learning_rate": 1.9937334361738965e-06, - "loss": 0.9111, - "step": 7560 - }, - { - "epoch": 0.19, - "learning_rate": 1.9937303429028374e-06, - "loss": 0.8486, - "step": 7561 - }, - { - "epoch": 0.19, - "learning_rate": 1.993727248870925e-06, - "loss": 0.9082, - "step": 7562 - }, - { - "epoch": 0.19, - "learning_rate": 1.993724154078161e-06, - "loss": 0.8853, - "step": 7563 - }, - { - "epoch": 0.19, - "learning_rate": 1.993721058524548e-06, - "loss": 0.9258, - "step": 7564 - }, - { - "epoch": 0.19, - "learning_rate": 1.9937179622100885e-06, - "loss": 1.0195, - "step": 7565 - }, - { - "epoch": 0.19, - "learning_rate": 1.993714865134785e-06, - "loss": 0.8613, - "step": 7566 - }, - { - "epoch": 0.19, - "learning_rate": 1.9937117672986398e-06, - "loss": 0.5889, - "step": 7567 - }, - { - "epoch": 0.19, - "learning_rate": 1.9937086687016547e-06, - "loss": 0.8091, - "step": 7568 - }, - { - "epoch": 0.19, - "learning_rate": 1.993705569343833e-06, - "loss": 0.7026, - "step": 7569 - }, - { - "epoch": 0.19, - "learning_rate": 1.9937024692251765e-06, - "loss": 0.9756, - "step": 7570 - }, - { - "epoch": 0.19, - "learning_rate": 1.993699368345688e-06, - "loss": 0.9385, - "step": 7571 - }, - { - "epoch": 0.19, - "learning_rate": 1.9936962667053695e-06, - "loss": 0.9189, - "step": 7572 - }, - { - "epoch": 0.19, - "learning_rate": 1.993693164304223e-06, - "loss": 0.6958, - "step": 7573 - }, - { - "epoch": 0.19, - "learning_rate": 1.993690061142252e-06, - "loss": 1.1611, - "step": 7574 - }, - { - "epoch": 0.19, - "learning_rate": 1.993686957219458e-06, - "loss": 1.0537, - "step": 7575 - }, - { - "epoch": 0.19, - "learning_rate": 1.993683852535843e-06, - "loss": 0.9297, - "step": 7576 - }, - { - "epoch": 0.19, - "learning_rate": 1.9936807470914107e-06, - "loss": 0.8281, - "step": 7577 - }, - { - "epoch": 0.19, - "learning_rate": 1.9936776408861623e-06, - "loss": 0.7202, - "step": 7578 - }, - { - "epoch": 0.19, - "learning_rate": 1.993674533920101e-06, - "loss": 0.6978, - "step": 7579 - }, - { - "epoch": 0.19, - "learning_rate": 1.9936714261932285e-06, - "loss": 1.0078, - "step": 7580 - }, - { - "epoch": 0.19, - "learning_rate": 1.9936683177055478e-06, - "loss": 1.1035, - "step": 7581 - }, - { - "epoch": 0.19, - "learning_rate": 1.9936652084570603e-06, - "loss": 1.0137, - "step": 7582 - }, - { - "epoch": 0.19, - "learning_rate": 1.9936620984477696e-06, - "loss": 0.7036, - "step": 7583 - }, - { - "epoch": 0.19, - "learning_rate": 1.9936589876776772e-06, - "loss": 0.749, - "step": 7584 - }, - { - "epoch": 0.19, - "learning_rate": 1.9936558761467863e-06, - "loss": 1.0049, - "step": 7585 - }, - { - "epoch": 0.19, - "learning_rate": 1.9936527638550983e-06, - "loss": 0.8452, - "step": 7586 - }, - { - "epoch": 0.19, - "learning_rate": 1.993649650802616e-06, - "loss": 0.8818, - "step": 7587 - }, - { - "epoch": 0.19, - "learning_rate": 1.993646536989342e-06, - "loss": 0.8887, - "step": 7588 - }, - { - "epoch": 0.19, - "learning_rate": 1.993643422415279e-06, - "loss": 0.7583, - "step": 7589 - }, - { - "epoch": 0.19, - "learning_rate": 1.993640307080429e-06, - "loss": 0.7622, - "step": 7590 - }, - { - "epoch": 0.19, - "learning_rate": 1.9936371909847934e-06, - "loss": 1.3301, - "step": 7591 - }, - { - "epoch": 0.19, - "learning_rate": 1.993634074128376e-06, - "loss": 0.9873, - "step": 7592 - }, - { - "epoch": 0.19, - "learning_rate": 1.993630956511179e-06, - "loss": 1.0977, - "step": 7593 - }, - { - "epoch": 0.19, - "learning_rate": 1.993627838133204e-06, - "loss": 1.0986, - "step": 7594 - }, - { - "epoch": 0.19, - "learning_rate": 1.993624718994454e-06, - "loss": 0.8262, - "step": 7595 - }, - { - "epoch": 0.19, - "learning_rate": 1.9936215990949308e-06, - "loss": 0.9673, - "step": 7596 - }, - { - "epoch": 0.19, - "learning_rate": 1.9936184784346378e-06, - "loss": 0.7715, - "step": 7597 - }, - { - "epoch": 0.19, - "learning_rate": 1.9936153570135766e-06, - "loss": 0.9102, - "step": 7598 - }, - { - "epoch": 0.19, - "learning_rate": 1.9936122348317495e-06, - "loss": 0.9736, - "step": 7599 - }, - { - "epoch": 0.19, - "learning_rate": 1.9936091118891597e-06, - "loss": 0.9883, - "step": 7600 - }, - { - "epoch": 0.19, - "learning_rate": 1.9936059881858085e-06, - "loss": 0.7705, - "step": 7601 - }, - { - "epoch": 0.19, - "learning_rate": 1.9936028637216998e-06, - "loss": 0.728, - "step": 7602 - }, - { - "epoch": 0.19, - "learning_rate": 1.9935997384968343e-06, - "loss": 1.0303, - "step": 7603 - }, - { - "epoch": 0.19, - "learning_rate": 1.9935966125112156e-06, - "loss": 0.7861, - "step": 7604 - }, - { - "epoch": 0.19, - "learning_rate": 1.9935934857648456e-06, - "loss": 0.8818, - "step": 7605 - }, - { - "epoch": 0.19, - "learning_rate": 1.9935903582577265e-06, - "loss": 0.9443, - "step": 7606 - }, - { - "epoch": 0.19, - "learning_rate": 1.993587229989861e-06, - "loss": 1.0977, - "step": 7607 - }, - { - "epoch": 0.19, - "learning_rate": 1.9935841009612517e-06, - "loss": 0.8057, - "step": 7608 - }, - { - "epoch": 0.2, - "learning_rate": 1.9935809711719006e-06, - "loss": 0.8545, - "step": 7609 - }, - { - "epoch": 0.2, - "learning_rate": 1.9935778406218106e-06, - "loss": 0.6428, - "step": 7610 - }, - { - "epoch": 0.2, - "learning_rate": 1.993574709310983e-06, - "loss": 1.0625, - "step": 7611 - }, - { - "epoch": 0.2, - "learning_rate": 1.9935715772394215e-06, - "loss": 0.8813, - "step": 7612 - }, - { - "epoch": 0.2, - "learning_rate": 1.993568444407128e-06, - "loss": 0.8467, - "step": 7613 - }, - { - "epoch": 0.2, - "learning_rate": 1.993565310814104e-06, - "loss": 0.6943, - "step": 7614 - }, - { - "epoch": 0.2, - "learning_rate": 1.9935621764603534e-06, - "loss": 1.082, - "step": 7615 - }, - { - "epoch": 0.2, - "learning_rate": 1.9935590413458777e-06, - "loss": 1.0879, - "step": 7616 - }, - { - "epoch": 0.2, - "learning_rate": 1.99355590547068e-06, - "loss": 1.3418, - "step": 7617 - }, - { - "epoch": 0.2, - "learning_rate": 1.9935527688347616e-06, - "loss": 1.0107, - "step": 7618 - }, - { - "epoch": 0.2, - "learning_rate": 1.993549631438126e-06, - "loss": 0.9961, - "step": 7619 - }, - { - "epoch": 0.2, - "learning_rate": 1.9935464932807745e-06, - "loss": 1.0469, - "step": 7620 - }, - { - "epoch": 0.2, - "learning_rate": 1.993543354362711e-06, - "loss": 1.2129, - "step": 7621 - }, - { - "epoch": 0.2, - "learning_rate": 1.9935402146839364e-06, - "loss": 0.8018, - "step": 7622 - }, - { - "epoch": 0.2, - "learning_rate": 1.9935370742444538e-06, - "loss": 1.0801, - "step": 7623 - }, - { - "epoch": 0.2, - "learning_rate": 1.993533933044266e-06, - "loss": 0.9404, - "step": 7624 - }, - { - "epoch": 0.2, - "learning_rate": 1.9935307910833743e-06, - "loss": 0.9414, - "step": 7625 - }, - { - "epoch": 0.2, - "learning_rate": 1.993527648361782e-06, - "loss": 0.8481, - "step": 7626 - }, - { - "epoch": 0.2, - "learning_rate": 1.9935245048794917e-06, - "loss": 1.1602, - "step": 7627 - }, - { - "epoch": 0.2, - "learning_rate": 1.993521360636505e-06, - "loss": 1.043, - "step": 7628 - }, - { - "epoch": 0.2, - "learning_rate": 1.993518215632825e-06, - "loss": 0.8921, - "step": 7629 - }, - { - "epoch": 0.2, - "learning_rate": 1.993515069868453e-06, - "loss": 0.9258, - "step": 7630 - }, - { - "epoch": 0.2, - "learning_rate": 1.993511923343393e-06, - "loss": 0.5981, - "step": 7631 - }, - { - "epoch": 0.2, - "learning_rate": 1.9935087760576462e-06, - "loss": 0.7261, - "step": 7632 - }, - { - "epoch": 0.2, - "learning_rate": 1.9935056280112153e-06, - "loss": 0.6523, - "step": 7633 - }, - { - "epoch": 0.2, - "learning_rate": 1.9935024792041034e-06, - "loss": 1.0098, - "step": 7634 - }, - { - "epoch": 0.2, - "learning_rate": 1.993499329636312e-06, - "loss": 1.0146, - "step": 7635 - }, - { - "epoch": 0.2, - "learning_rate": 1.9934961793078434e-06, - "loss": 1.0684, - "step": 7636 - }, - { - "epoch": 0.2, - "learning_rate": 1.993493028218701e-06, - "loss": 0.9824, - "step": 7637 - }, - { - "epoch": 0.2, - "learning_rate": 1.9934898763688864e-06, - "loss": 0.7939, - "step": 7638 - }, - { - "epoch": 0.2, - "learning_rate": 1.9934867237584027e-06, - "loss": 1.1719, - "step": 7639 - }, - { - "epoch": 0.2, - "learning_rate": 1.9934835703872516e-06, - "loss": 0.9072, - "step": 7640 - }, - { - "epoch": 0.2, - "learning_rate": 1.9934804162554357e-06, - "loss": 0.9951, - "step": 7641 - }, - { - "epoch": 0.2, - "learning_rate": 1.993477261362958e-06, - "loss": 0.9668, - "step": 7642 - }, - { - "epoch": 0.2, - "learning_rate": 1.99347410570982e-06, - "loss": 0.7773, - "step": 7643 - }, - { - "epoch": 0.2, - "learning_rate": 1.9934709492960245e-06, - "loss": 1.0264, - "step": 7644 - }, - { - "epoch": 0.2, - "learning_rate": 1.993467792121574e-06, - "loss": 0.9248, - "step": 7645 - }, - { - "epoch": 0.2, - "learning_rate": 1.9934646341864712e-06, - "loss": 1.0742, - "step": 7646 - }, - { - "epoch": 0.2, - "learning_rate": 1.9934614754907177e-06, - "loss": 1.0117, - "step": 7647 - }, - { - "epoch": 0.2, - "learning_rate": 1.9934583160343167e-06, - "loss": 0.9844, - "step": 7648 - }, - { - "epoch": 0.2, - "learning_rate": 1.9934551558172704e-06, - "loss": 0.8916, - "step": 7649 - }, - { - "epoch": 0.2, - "learning_rate": 1.9934519948395814e-06, - "loss": 0.7622, - "step": 7650 - }, - { - "epoch": 0.2, - "learning_rate": 1.9934488331012516e-06, - "loss": 0.8345, - "step": 7651 - }, - { - "epoch": 0.2, - "learning_rate": 1.9934456706022837e-06, - "loss": 0.896, - "step": 7652 - }, - { - "epoch": 0.2, - "learning_rate": 1.9934425073426803e-06, - "loss": 0.8779, - "step": 7653 - }, - { - "epoch": 0.2, - "learning_rate": 1.9934393433224438e-06, - "loss": 0.875, - "step": 7654 - }, - { - "epoch": 0.2, - "learning_rate": 1.993436178541576e-06, - "loss": 0.8955, - "step": 7655 - }, - { - "epoch": 0.2, - "learning_rate": 1.99343301300008e-06, - "loss": 1.0996, - "step": 7656 - }, - { - "epoch": 0.2, - "learning_rate": 1.993429846697958e-06, - "loss": 0.7637, - "step": 7657 - }, - { - "epoch": 0.2, - "learning_rate": 1.9934266796352126e-06, - "loss": 0.3926, - "step": 7658 - }, - { - "epoch": 0.2, - "learning_rate": 1.993423511811846e-06, - "loss": 0.9941, - "step": 7659 - }, - { - "epoch": 0.2, - "learning_rate": 1.993420343227861e-06, - "loss": 0.9014, - "step": 7660 - }, - { - "epoch": 0.2, - "learning_rate": 1.993417173883259e-06, - "loss": 0.6885, - "step": 7661 - }, - { - "epoch": 0.2, - "learning_rate": 1.9934140037780437e-06, - "loss": 1.0312, - "step": 7662 - }, - { - "epoch": 0.2, - "learning_rate": 1.993410832912217e-06, - "loss": 0.8086, - "step": 7663 - }, - { - "epoch": 0.2, - "learning_rate": 1.9934076612857804e-06, - "loss": 0.8765, - "step": 7664 - }, - { - "epoch": 0.2, - "learning_rate": 1.9934044888987384e-06, - "loss": 1.0996, - "step": 7665 - }, - { - "epoch": 0.2, - "learning_rate": 1.9934013157510917e-06, - "loss": 0.8442, - "step": 7666 - }, - { - "epoch": 0.2, - "learning_rate": 1.9933981418428433e-06, - "loss": 0.6479, - "step": 7667 - }, - { - "epoch": 0.2, - "learning_rate": 1.9933949671739957e-06, - "loss": 1.0205, - "step": 7668 - }, - { - "epoch": 0.2, - "learning_rate": 1.993391791744551e-06, - "loss": 0.9004, - "step": 7669 - }, - { - "epoch": 0.2, - "learning_rate": 1.9933886155545124e-06, - "loss": 0.8813, - "step": 7670 - }, - { - "epoch": 0.2, - "learning_rate": 1.9933854386038817e-06, - "loss": 0.7908, - "step": 7671 - }, - { - "epoch": 0.2, - "learning_rate": 1.993382260892661e-06, - "loss": 0.9775, - "step": 7672 - }, - { - "epoch": 0.2, - "learning_rate": 1.993379082420854e-06, - "loss": 0.8691, - "step": 7673 - }, - { - "epoch": 0.2, - "learning_rate": 1.9933759031884616e-06, - "loss": 0.77, - "step": 7674 - }, - { - "epoch": 0.2, - "learning_rate": 1.9933727231954873e-06, - "loss": 1.0059, - "step": 7675 - }, - { - "epoch": 0.2, - "learning_rate": 1.9933695424419328e-06, - "loss": 0.6592, - "step": 7676 - }, - { - "epoch": 0.2, - "learning_rate": 1.993366360927801e-06, - "loss": 0.7876, - "step": 7677 - }, - { - "epoch": 0.2, - "learning_rate": 1.9933631786530945e-06, - "loss": 1.0254, - "step": 7678 - }, - { - "epoch": 0.2, - "learning_rate": 1.9933599956178153e-06, - "loss": 0.6318, - "step": 7679 - }, - { - "epoch": 0.2, - "learning_rate": 1.9933568118219663e-06, - "loss": 0.9727, - "step": 7680 - }, - { - "epoch": 0.2, - "learning_rate": 1.9933536272655498e-06, - "loss": 0.9268, - "step": 7681 - }, - { - "epoch": 0.2, - "learning_rate": 1.9933504419485676e-06, - "loss": 0.9502, - "step": 7682 - }, - { - "epoch": 0.2, - "learning_rate": 1.9933472558710227e-06, - "loss": 0.8877, - "step": 7683 - }, - { - "epoch": 0.2, - "learning_rate": 1.9933440690329175e-06, - "loss": 1.1348, - "step": 7684 - }, - { - "epoch": 0.2, - "learning_rate": 1.9933408814342547e-06, - "loss": 1.1367, - "step": 7685 - }, - { - "epoch": 0.2, - "learning_rate": 1.9933376930750364e-06, - "loss": 0.7573, - "step": 7686 - }, - { - "epoch": 0.2, - "learning_rate": 1.993334503955265e-06, - "loss": 0.749, - "step": 7687 - }, - { - "epoch": 0.2, - "learning_rate": 1.993331314074943e-06, - "loss": 0.8428, - "step": 7688 - }, - { - "epoch": 0.2, - "learning_rate": 1.9933281234340727e-06, - "loss": 0.958, - "step": 7689 - }, - { - "epoch": 0.2, - "learning_rate": 1.993324932032657e-06, - "loss": 1.0088, - "step": 7690 - }, - { - "epoch": 0.2, - "learning_rate": 1.993321739870698e-06, - "loss": 0.8555, - "step": 7691 - }, - { - "epoch": 0.2, - "learning_rate": 1.993318546948198e-06, - "loss": 0.9229, - "step": 7692 - }, - { - "epoch": 0.2, - "learning_rate": 1.99331535326516e-06, - "loss": 0.6309, - "step": 7693 - }, - { - "epoch": 0.2, - "learning_rate": 1.9933121588215863e-06, - "loss": 0.9287, - "step": 7694 - }, - { - "epoch": 0.2, - "learning_rate": 1.993308963617479e-06, - "loss": 0.728, - "step": 7695 - }, - { - "epoch": 0.2, - "learning_rate": 1.9933057676528404e-06, - "loss": 0.9355, - "step": 7696 - }, - { - "epoch": 0.2, - "learning_rate": 1.9933025709276733e-06, - "loss": 0.8867, - "step": 7697 - }, - { - "epoch": 0.2, - "learning_rate": 1.9932993734419803e-06, - "loss": 0.7249, - "step": 7698 - }, - { - "epoch": 0.2, - "learning_rate": 1.9932961751957635e-06, - "loss": 1.1113, - "step": 7699 - }, - { - "epoch": 0.2, - "learning_rate": 1.9932929761890255e-06, - "loss": 0.8193, - "step": 7700 - }, - { - "epoch": 0.2, - "learning_rate": 1.993289776421769e-06, - "loss": 0.8789, - "step": 7701 - }, - { - "epoch": 0.2, - "learning_rate": 1.993286575893996e-06, - "loss": 1.0537, - "step": 7702 - }, - { - "epoch": 0.2, - "learning_rate": 1.993283374605709e-06, - "loss": 1.0615, - "step": 7703 - }, - { - "epoch": 0.2, - "learning_rate": 1.9932801725569107e-06, - "loss": 0.9316, - "step": 7704 - }, - { - "epoch": 0.2, - "learning_rate": 1.9932769697476034e-06, - "loss": 0.8428, - "step": 7705 - }, - { - "epoch": 0.2, - "learning_rate": 1.99327376617779e-06, - "loss": 0.749, - "step": 7706 - }, - { - "epoch": 0.2, - "learning_rate": 1.993270561847472e-06, - "loss": 0.7554, - "step": 7707 - }, - { - "epoch": 0.2, - "learning_rate": 1.9932673567566526e-06, - "loss": 1.0176, - "step": 7708 - }, - { - "epoch": 0.2, - "learning_rate": 1.993264150905334e-06, - "loss": 0.7839, - "step": 7709 - }, - { - "epoch": 0.2, - "learning_rate": 1.9932609442935188e-06, - "loss": 0.8398, - "step": 7710 - }, - { - "epoch": 0.2, - "learning_rate": 1.9932577369212094e-06, - "loss": 1.0322, - "step": 7711 - }, - { - "epoch": 0.2, - "learning_rate": 1.993254528788408e-06, - "loss": 1.0625, - "step": 7712 - }, - { - "epoch": 0.2, - "learning_rate": 1.9932513198951175e-06, - "loss": 0.9307, - "step": 7713 - }, - { - "epoch": 0.2, - "learning_rate": 1.99324811024134e-06, - "loss": 0.9717, - "step": 7714 - }, - { - "epoch": 0.2, - "learning_rate": 1.9932448998270783e-06, - "loss": 0.9766, - "step": 7715 - }, - { - "epoch": 0.2, - "learning_rate": 1.9932416886523347e-06, - "loss": 0.9395, - "step": 7716 - }, - { - "epoch": 0.2, - "learning_rate": 1.9932384767171113e-06, - "loss": 1.0537, - "step": 7717 - }, - { - "epoch": 0.2, - "learning_rate": 1.993235264021411e-06, - "loss": 1.0273, - "step": 7718 - }, - { - "epoch": 0.2, - "learning_rate": 1.993232050565236e-06, - "loss": 0.7852, - "step": 7719 - }, - { - "epoch": 0.2, - "learning_rate": 1.993228836348589e-06, - "loss": 0.7793, - "step": 7720 - }, - { - "epoch": 0.2, - "learning_rate": 1.9932256213714726e-06, - "loss": 1.2559, - "step": 7721 - }, - { - "epoch": 0.2, - "learning_rate": 1.9932224056338886e-06, - "loss": 0.8447, - "step": 7722 - }, - { - "epoch": 0.2, - "learning_rate": 1.9932191891358402e-06, - "loss": 0.7266, - "step": 7723 - }, - { - "epoch": 0.2, - "learning_rate": 1.9932159718773295e-06, - "loss": 1.0488, - "step": 7724 - }, - { - "epoch": 0.2, - "learning_rate": 1.9932127538583584e-06, - "loss": 0.8296, - "step": 7725 - }, - { - "epoch": 0.2, - "learning_rate": 1.9932095350789306e-06, - "loss": 1.0225, - "step": 7726 - }, - { - "epoch": 0.2, - "learning_rate": 1.993206315539048e-06, - "loss": 0.8281, - "step": 7727 - }, - { - "epoch": 0.2, - "learning_rate": 1.9932030952387127e-06, - "loss": 0.7461, - "step": 7728 - }, - { - "epoch": 0.2, - "learning_rate": 1.9931998741779273e-06, - "loss": 1.125, - "step": 7729 - }, - { - "epoch": 0.2, - "learning_rate": 1.993196652356695e-06, - "loss": 0.9717, - "step": 7730 - }, - { - "epoch": 0.2, - "learning_rate": 1.993193429775017e-06, - "loss": 0.9727, - "step": 7731 - }, - { - "epoch": 0.2, - "learning_rate": 1.993190206432897e-06, - "loss": 1.1777, - "step": 7732 - }, - { - "epoch": 0.2, - "learning_rate": 1.9931869823303367e-06, - "loss": 0.6738, - "step": 7733 - }, - { - "epoch": 0.2, - "learning_rate": 1.9931837574673387e-06, - "loss": 0.8496, - "step": 7734 - }, - { - "epoch": 0.2, - "learning_rate": 1.9931805318439057e-06, - "loss": 0.8408, - "step": 7735 - }, - { - "epoch": 0.2, - "learning_rate": 1.99317730546004e-06, - "loss": 1.0244, - "step": 7736 - }, - { - "epoch": 0.2, - "learning_rate": 1.9931740783157443e-06, - "loss": 1.0732, - "step": 7737 - }, - { - "epoch": 0.2, - "learning_rate": 1.993170850411021e-06, - "loss": 1.0459, - "step": 7738 - }, - { - "epoch": 0.2, - "learning_rate": 1.993167621745872e-06, - "loss": 0.7803, - "step": 7739 - }, - { - "epoch": 0.2, - "learning_rate": 1.9931643923203003e-06, - "loss": 0.9824, - "step": 7740 - }, - { - "epoch": 0.2, - "learning_rate": 1.9931611621343083e-06, - "loss": 0.9766, - "step": 7741 - }, - { - "epoch": 0.2, - "learning_rate": 1.9931579311878984e-06, - "loss": 0.8691, - "step": 7742 - }, - { - "epoch": 0.2, - "learning_rate": 1.9931546994810736e-06, - "loss": 0.9639, - "step": 7743 - }, - { - "epoch": 0.2, - "learning_rate": 1.9931514670138355e-06, - "loss": 0.7578, - "step": 7744 - }, - { - "epoch": 0.2, - "learning_rate": 1.9931482337861867e-06, - "loss": 0.9883, - "step": 7745 - }, - { - "epoch": 0.2, - "learning_rate": 1.9931449997981302e-06, - "loss": 1.124, - "step": 7746 - }, - { - "epoch": 0.2, - "learning_rate": 1.993141765049669e-06, - "loss": 1.0391, - "step": 7747 - }, - { - "epoch": 0.2, - "learning_rate": 1.993138529540804e-06, - "loss": 0.8682, - "step": 7748 - }, - { - "epoch": 0.2, - "learning_rate": 1.9931352932715385e-06, - "loss": 0.9697, - "step": 7749 - }, - { - "epoch": 0.2, - "learning_rate": 1.993132056241875e-06, - "loss": 0.9185, - "step": 7750 - }, - { - "epoch": 0.2, - "learning_rate": 1.9931288184518164e-06, - "loss": 1.04, - "step": 7751 - }, - { - "epoch": 0.2, - "learning_rate": 1.9931255799013644e-06, - "loss": 1.0449, - "step": 7752 - }, - { - "epoch": 0.2, - "learning_rate": 1.993122340590522e-06, - "loss": 0.645, - "step": 7753 - }, - { - "epoch": 0.2, - "learning_rate": 1.993119100519291e-06, - "loss": 0.9717, - "step": 7754 - }, - { - "epoch": 0.2, - "learning_rate": 1.9931158596876748e-06, - "loss": 1.0127, - "step": 7755 - }, - { - "epoch": 0.2, - "learning_rate": 1.9931126180956756e-06, - "loss": 0.7959, - "step": 7756 - }, - { - "epoch": 0.2, - "learning_rate": 1.9931093757432954e-06, - "loss": 0.8994, - "step": 7757 - }, - { - "epoch": 0.2, - "learning_rate": 1.993106132630537e-06, - "loss": 0.9307, - "step": 7758 - }, - { - "epoch": 0.2, - "learning_rate": 1.9931028887574032e-06, - "loss": 1.1133, - "step": 7759 - }, - { - "epoch": 0.2, - "learning_rate": 1.993099644123896e-06, - "loss": 0.8457, - "step": 7760 - }, - { - "epoch": 0.2, - "learning_rate": 1.9930963987300178e-06, - "loss": 1.1172, - "step": 7761 - }, - { - "epoch": 0.2, - "learning_rate": 1.9930931525757717e-06, - "loss": 0.8057, - "step": 7762 - }, - { - "epoch": 0.2, - "learning_rate": 1.9930899056611598e-06, - "loss": 0.9912, - "step": 7763 - }, - { - "epoch": 0.2, - "learning_rate": 1.9930866579861846e-06, - "loss": 1.1367, - "step": 7764 - }, - { - "epoch": 0.2, - "learning_rate": 1.9930834095508483e-06, - "loss": 0.8975, - "step": 7765 - }, - { - "epoch": 0.2, - "learning_rate": 1.993080160355154e-06, - "loss": 0.5972, - "step": 7766 - }, - { - "epoch": 0.2, - "learning_rate": 1.993076910399104e-06, - "loss": 0.8662, - "step": 7767 - }, - { - "epoch": 0.2, - "learning_rate": 1.9930736596827004e-06, - "loss": 0.9824, - "step": 7768 - }, - { - "epoch": 0.2, - "learning_rate": 1.993070408205946e-06, - "loss": 1.1523, - "step": 7769 - }, - { - "epoch": 0.2, - "learning_rate": 1.9930671559688435e-06, - "loss": 0.9482, - "step": 7770 - }, - { - "epoch": 0.2, - "learning_rate": 1.993063902971395e-06, - "loss": 0.8955, - "step": 7771 - }, - { - "epoch": 0.2, - "learning_rate": 1.993060649213603e-06, - "loss": 1.1592, - "step": 7772 - }, - { - "epoch": 0.2, - "learning_rate": 1.9930573946954702e-06, - "loss": 0.9297, - "step": 7773 - }, - { - "epoch": 0.2, - "learning_rate": 1.993054139416999e-06, - "loss": 1.0781, - "step": 7774 - }, - { - "epoch": 0.2, - "learning_rate": 1.993050883378192e-06, - "loss": 0.8125, - "step": 7775 - }, - { - "epoch": 0.2, - "learning_rate": 1.9930476265790516e-06, - "loss": 0.8828, - "step": 7776 - }, - { - "epoch": 0.2, - "learning_rate": 1.9930443690195806e-06, - "loss": 1.2207, - "step": 7777 - }, - { - "epoch": 0.2, - "learning_rate": 1.9930411106997806e-06, - "loss": 0.9365, - "step": 7778 - }, - { - "epoch": 0.2, - "learning_rate": 1.993037851619655e-06, - "loss": 0.8848, - "step": 7779 - }, - { - "epoch": 0.2, - "learning_rate": 1.9930345917792055e-06, - "loss": 0.8086, - "step": 7780 - }, - { - "epoch": 0.2, - "learning_rate": 1.9930313311784356e-06, - "loss": 1.166, - "step": 7781 - }, - { - "epoch": 0.2, - "learning_rate": 1.9930280698173473e-06, - "loss": 0.7744, - "step": 7782 - }, - { - "epoch": 0.2, - "learning_rate": 1.9930248076959427e-06, - "loss": 0.7322, - "step": 7783 - }, - { - "epoch": 0.2, - "learning_rate": 1.993021544814225e-06, - "loss": 0.8462, - "step": 7784 - }, - { - "epoch": 0.2, - "learning_rate": 1.9930182811721962e-06, - "loss": 1.0127, - "step": 7785 - }, - { - "epoch": 0.2, - "learning_rate": 1.993015016769859e-06, - "loss": 0.7891, - "step": 7786 - }, - { - "epoch": 0.2, - "learning_rate": 1.993011751607216e-06, - "loss": 0.8955, - "step": 7787 - }, - { - "epoch": 0.2, - "learning_rate": 1.993008485684269e-06, - "loss": 1.1992, - "step": 7788 - }, - { - "epoch": 0.2, - "learning_rate": 1.9930052190010217e-06, - "loss": 0.9512, - "step": 7789 - }, - { - "epoch": 0.2, - "learning_rate": 1.993001951557476e-06, - "loss": 1.0361, - "step": 7790 - }, - { - "epoch": 0.2, - "learning_rate": 1.992998683353634e-06, - "loss": 0.9697, - "step": 7791 - }, - { - "epoch": 0.2, - "learning_rate": 1.9929954143894987e-06, - "loss": 1.2949, - "step": 7792 - }, - { - "epoch": 0.2, - "learning_rate": 1.992992144665072e-06, - "loss": 0.8877, - "step": 7793 - }, - { - "epoch": 0.2, - "learning_rate": 1.9929888741803578e-06, - "loss": 0.9023, - "step": 7794 - }, - { - "epoch": 0.2, - "learning_rate": 1.992985602935357e-06, - "loss": 0.7646, - "step": 7795 - }, - { - "epoch": 0.2, - "learning_rate": 1.992982330930073e-06, - "loss": 0.7959, - "step": 7796 - }, - { - "epoch": 0.2, - "learning_rate": 1.9929790581645085e-06, - "loss": 1.0547, - "step": 7797 - }, - { - "epoch": 0.2, - "learning_rate": 1.992975784638665e-06, - "loss": 0.9863, - "step": 7798 - }, - { - "epoch": 0.2, - "learning_rate": 1.9929725103525455e-06, - "loss": 0.9697, - "step": 7799 - }, - { - "epoch": 0.2, - "learning_rate": 1.992969235306153e-06, - "loss": 0.5564, - "step": 7800 - }, - { - "epoch": 0.2, - "learning_rate": 1.9929659594994895e-06, - "loss": 0.7539, - "step": 7801 - }, - { - "epoch": 0.2, - "learning_rate": 1.9929626829325576e-06, - "loss": 0.9434, - "step": 7802 - }, - { - "epoch": 0.2, - "learning_rate": 1.99295940560536e-06, - "loss": 0.8691, - "step": 7803 - }, - { - "epoch": 0.2, - "learning_rate": 1.992956127517899e-06, - "loss": 0.9785, - "step": 7804 - }, - { - "epoch": 0.2, - "learning_rate": 1.9929528486701766e-06, - "loss": 1.1084, - "step": 7805 - }, - { - "epoch": 0.2, - "learning_rate": 1.9929495690621965e-06, - "loss": 0.9121, - "step": 7806 - }, - { - "epoch": 0.2, - "learning_rate": 1.9929462886939603e-06, - "loss": 0.8535, - "step": 7807 - }, - { - "epoch": 0.2, - "learning_rate": 1.9929430075654706e-06, - "loss": 0.9248, - "step": 7808 - }, - { - "epoch": 0.2, - "learning_rate": 1.9929397256767306e-06, - "loss": 0.8691, - "step": 7809 - }, - { - "epoch": 0.2, - "learning_rate": 1.992936443027742e-06, - "loss": 0.9648, - "step": 7810 - }, - { - "epoch": 0.2, - "learning_rate": 1.992933159618508e-06, - "loss": 0.9854, - "step": 7811 - }, - { - "epoch": 0.2, - "learning_rate": 1.9929298754490304e-06, - "loss": 0.9697, - "step": 7812 - }, - { - "epoch": 0.2, - "learning_rate": 1.9929265905193118e-06, - "loss": 1.0254, - "step": 7813 - }, - { - "epoch": 0.2, - "learning_rate": 1.9929233048293552e-06, - "loss": 0.8545, - "step": 7814 - }, - { - "epoch": 0.2, - "learning_rate": 1.992920018379163e-06, - "loss": 0.7227, - "step": 7815 - }, - { - "epoch": 0.2, - "learning_rate": 1.9929167311687373e-06, - "loss": 1.0166, - "step": 7816 - }, - { - "epoch": 0.2, - "learning_rate": 1.9929134431980814e-06, - "loss": 0.6182, - "step": 7817 - }, - { - "epoch": 0.2, - "learning_rate": 1.992910154467197e-06, - "loss": 0.8477, - "step": 7818 - }, - { - "epoch": 0.2, - "learning_rate": 1.992906864976087e-06, - "loss": 0.9531, - "step": 7819 - }, - { - "epoch": 0.2, - "learning_rate": 1.9929035747247536e-06, - "loss": 0.9355, - "step": 7820 - }, - { - "epoch": 0.2, - "learning_rate": 1.9929002837132e-06, - "loss": 0.9834, - "step": 7821 - }, - { - "epoch": 0.2, - "learning_rate": 1.992896991941428e-06, - "loss": 1.1465, - "step": 7822 - }, - { - "epoch": 0.2, - "learning_rate": 1.9928936994094406e-06, - "loss": 0.7935, - "step": 7823 - }, - { - "epoch": 0.2, - "learning_rate": 1.99289040611724e-06, - "loss": 0.75, - "step": 7824 - }, - { - "epoch": 0.2, - "learning_rate": 1.992887112064829e-06, - "loss": 0.9746, - "step": 7825 - }, - { - "epoch": 0.2, - "learning_rate": 1.99288381725221e-06, - "loss": 1.0332, - "step": 7826 - }, - { - "epoch": 0.2, - "learning_rate": 1.9928805216793856e-06, - "loss": 1.1416, - "step": 7827 - }, - { - "epoch": 0.2, - "learning_rate": 1.9928772253463584e-06, - "loss": 0.9658, - "step": 7828 - }, - { - "epoch": 0.2, - "learning_rate": 1.9928739282531306e-06, - "loss": 0.9912, - "step": 7829 - }, - { - "epoch": 0.2, - "learning_rate": 1.9928706303997047e-06, - "loss": 0.7046, - "step": 7830 - }, - { - "epoch": 0.2, - "learning_rate": 1.9928673317860836e-06, - "loss": 0.9463, - "step": 7831 - }, - { - "epoch": 0.2, - "learning_rate": 1.9928640324122696e-06, - "loss": 0.6748, - "step": 7832 - }, - { - "epoch": 0.2, - "learning_rate": 1.992860732278265e-06, - "loss": 0.7695, - "step": 7833 - }, - { - "epoch": 0.2, - "learning_rate": 1.992857431384073e-06, - "loss": 0.9512, - "step": 7834 - }, - { - "epoch": 0.2, - "learning_rate": 1.9928541297296955e-06, - "loss": 0.9414, - "step": 7835 - }, - { - "epoch": 0.2, - "learning_rate": 1.9928508273151353e-06, - "loss": 0.8193, - "step": 7836 - }, - { - "epoch": 0.2, - "learning_rate": 1.9928475241403947e-06, - "loss": 0.8721, - "step": 7837 - }, - { - "epoch": 0.2, - "learning_rate": 1.9928442202054768e-06, - "loss": 0.918, - "step": 7838 - }, - { - "epoch": 0.2, - "learning_rate": 1.992840915510383e-06, - "loss": 0.9707, - "step": 7839 - }, - { - "epoch": 0.2, - "learning_rate": 1.9928376100551173e-06, - "loss": 0.7158, - "step": 7840 - }, - { - "epoch": 0.2, - "learning_rate": 1.9928343038396814e-06, - "loss": 0.9561, - "step": 7841 - }, - { - "epoch": 0.2, - "learning_rate": 1.9928309968640774e-06, - "loss": 0.656, - "step": 7842 - }, - { - "epoch": 0.2, - "learning_rate": 1.992827689128309e-06, - "loss": 1.0508, - "step": 7843 - }, - { - "epoch": 0.2, - "learning_rate": 1.9928243806323776e-06, - "loss": 0.8467, - "step": 7844 - }, - { - "epoch": 0.2, - "learning_rate": 1.992821071376287e-06, - "loss": 0.9102, - "step": 7845 - }, - { - "epoch": 0.2, - "learning_rate": 1.9928177613600383e-06, - "loss": 1.1172, - "step": 7846 - }, - { - "epoch": 0.2, - "learning_rate": 1.9928144505836344e-06, - "loss": 0.9678, - "step": 7847 - }, - { - "epoch": 0.2, - "learning_rate": 1.9928111390470786e-06, - "loss": 0.7988, - "step": 7848 - }, - { - "epoch": 0.2, - "learning_rate": 1.992807826750373e-06, - "loss": 1.0645, - "step": 7849 - }, - { - "epoch": 0.2, - "learning_rate": 1.99280451369352e-06, - "loss": 0.8926, - "step": 7850 - }, - { - "epoch": 0.2, - "learning_rate": 1.992801199876522e-06, - "loss": 0.7915, - "step": 7851 - }, - { - "epoch": 0.2, - "learning_rate": 1.992797885299382e-06, - "loss": 0.8506, - "step": 7852 - }, - { - "epoch": 0.2, - "learning_rate": 1.9927945699621023e-06, - "loss": 1.0508, - "step": 7853 - }, - { - "epoch": 0.2, - "learning_rate": 1.9927912538646857e-06, - "loss": 0.9512, - "step": 7854 - }, - { - "epoch": 0.2, - "learning_rate": 1.9927879370071337e-06, - "loss": 0.8564, - "step": 7855 - }, - { - "epoch": 0.2, - "learning_rate": 1.9927846193894505e-06, - "loss": 0.9453, - "step": 7856 - }, - { - "epoch": 0.2, - "learning_rate": 1.9927813010116374e-06, - "loss": 0.957, - "step": 7857 - }, - { - "epoch": 0.2, - "learning_rate": 1.992777981873697e-06, - "loss": 1.0195, - "step": 7858 - }, - { - "epoch": 0.2, - "learning_rate": 1.9927746619756325e-06, - "loss": 0.8682, - "step": 7859 - }, - { - "epoch": 0.2, - "learning_rate": 1.9927713413174463e-06, - "loss": 0.9404, - "step": 7860 - }, - { - "epoch": 0.2, - "learning_rate": 1.9927680198991402e-06, - "loss": 1.1758, - "step": 7861 - }, - { - "epoch": 0.2, - "learning_rate": 1.992764697720718e-06, - "loss": 0.9629, - "step": 7862 - }, - { - "epoch": 0.2, - "learning_rate": 1.992761374782181e-06, - "loss": 0.6934, - "step": 7863 - }, - { - "epoch": 0.2, - "learning_rate": 1.992758051083532e-06, - "loss": 0.9463, - "step": 7864 - }, - { - "epoch": 0.2, - "learning_rate": 1.9927547266247746e-06, - "loss": 0.916, - "step": 7865 - }, - { - "epoch": 0.2, - "learning_rate": 1.99275140140591e-06, - "loss": 0.6348, - "step": 7866 - }, - { - "epoch": 0.2, - "learning_rate": 1.992748075426941e-06, - "loss": 1.0879, - "step": 7867 - }, - { - "epoch": 0.2, - "learning_rate": 1.9927447486878713e-06, - "loss": 1.0312, - "step": 7868 - }, - { - "epoch": 0.2, - "learning_rate": 1.9927414211887022e-06, - "loss": 0.8086, - "step": 7869 - }, - { - "epoch": 0.2, - "learning_rate": 1.9927380929294362e-06, - "loss": 0.832, - "step": 7870 - }, - { - "epoch": 0.2, - "learning_rate": 1.9927347639100768e-06, - "loss": 1.0244, - "step": 7871 - }, - { - "epoch": 0.2, - "learning_rate": 1.992731434130626e-06, - "loss": 0.9531, - "step": 7872 - }, - { - "epoch": 0.2, - "learning_rate": 1.9927281035910863e-06, - "loss": 0.9229, - "step": 7873 - }, - { - "epoch": 0.2, - "learning_rate": 1.9927247722914603e-06, - "loss": 1.2012, - "step": 7874 - }, - { - "epoch": 0.2, - "learning_rate": 1.9927214402317506e-06, - "loss": 1.0488, - "step": 7875 - }, - { - "epoch": 0.2, - "learning_rate": 1.9927181074119597e-06, - "loss": 0.957, - "step": 7876 - }, - { - "epoch": 0.2, - "learning_rate": 1.9927147738320906e-06, - "loss": 0.8677, - "step": 7877 - }, - { - "epoch": 0.2, - "learning_rate": 1.992711439492145e-06, - "loss": 0.9463, - "step": 7878 - }, - { - "epoch": 0.2, - "learning_rate": 1.992708104392126e-06, - "loss": 1.0049, - "step": 7879 - }, - { - "epoch": 0.2, - "learning_rate": 1.992704768532036e-06, - "loss": 1.0596, - "step": 7880 - }, - { - "epoch": 0.2, - "learning_rate": 1.9927014319118778e-06, - "loss": 0.8633, - "step": 7881 - }, - { - "epoch": 0.2, - "learning_rate": 1.9926980945316534e-06, - "loss": 0.8594, - "step": 7882 - }, - { - "epoch": 0.2, - "learning_rate": 1.992694756391366e-06, - "loss": 0.9814, - "step": 7883 - }, - { - "epoch": 0.2, - "learning_rate": 1.992691417491018e-06, - "loss": 1.1025, - "step": 7884 - }, - { - "epoch": 0.2, - "learning_rate": 1.9926880778306114e-06, - "loss": 1.2188, - "step": 7885 - }, - { - "epoch": 0.2, - "learning_rate": 1.9926847374101495e-06, - "loss": 0.6938, - "step": 7886 - }, - { - "epoch": 0.2, - "learning_rate": 1.9926813962296343e-06, - "loss": 0.9072, - "step": 7887 - }, - { - "epoch": 0.2, - "learning_rate": 1.992678054289069e-06, - "loss": 0.7349, - "step": 7888 - }, - { - "epoch": 0.2, - "learning_rate": 1.9926747115884557e-06, - "loss": 0.7964, - "step": 7889 - }, - { - "epoch": 0.2, - "learning_rate": 1.992671368127797e-06, - "loss": 0.8652, - "step": 7890 - }, - { - "epoch": 0.2, - "learning_rate": 1.992668023907095e-06, - "loss": 0.9424, - "step": 7891 - }, - { - "epoch": 0.2, - "learning_rate": 1.992664678926353e-06, - "loss": 0.751, - "step": 7892 - }, - { - "epoch": 0.2, - "learning_rate": 1.9926613331855733e-06, - "loss": 0.8359, - "step": 7893 - }, - { - "epoch": 0.2, - "learning_rate": 1.9926579866847586e-06, - "loss": 0.8936, - "step": 7894 - }, - { - "epoch": 0.2, - "learning_rate": 1.992654639423911e-06, - "loss": 0.9414, - "step": 7895 - }, - { - "epoch": 0.2, - "learning_rate": 1.9926512914030335e-06, - "loss": 0.7412, - "step": 7896 - }, - { - "epoch": 0.2, - "learning_rate": 1.992647942622129e-06, - "loss": 1.0723, - "step": 7897 - }, - { - "epoch": 0.2, - "learning_rate": 1.992644593081199e-06, - "loss": 0.9766, - "step": 7898 - }, - { - "epoch": 0.2, - "learning_rate": 1.9926412427802475e-06, - "loss": 0.6621, - "step": 7899 - }, - { - "epoch": 0.2, - "learning_rate": 1.9926378917192755e-06, - "loss": 1.1191, - "step": 7900 - }, - { - "epoch": 0.2, - "learning_rate": 1.9926345398982863e-06, - "loss": 0.9668, - "step": 7901 - }, - { - "epoch": 0.2, - "learning_rate": 1.992631187317283e-06, - "loss": 1.0381, - "step": 7902 - }, - { - "epoch": 0.2, - "learning_rate": 1.992627833976267e-06, - "loss": 0.7043, - "step": 7903 - }, - { - "epoch": 0.2, - "learning_rate": 1.992624479875242e-06, - "loss": 1.0303, - "step": 7904 - }, - { - "epoch": 0.2, - "learning_rate": 1.99262112501421e-06, - "loss": 0.998, - "step": 7905 - }, - { - "epoch": 0.2, - "learning_rate": 1.9926177693931734e-06, - "loss": 0.9014, - "step": 7906 - }, - { - "epoch": 0.2, - "learning_rate": 1.9926144130121353e-06, - "loss": 1.0156, - "step": 7907 - }, - { - "epoch": 0.2, - "learning_rate": 1.9926110558710978e-06, - "loss": 0.8613, - "step": 7908 - }, - { - "epoch": 0.2, - "learning_rate": 1.9926076979700637e-06, - "loss": 1.082, - "step": 7909 - }, - { - "epoch": 0.2, - "learning_rate": 1.9926043393090357e-06, - "loss": 0.8457, - "step": 7910 - }, - { - "epoch": 0.2, - "learning_rate": 1.992600979888016e-06, - "loss": 0.915, - "step": 7911 - }, - { - "epoch": 0.2, - "learning_rate": 1.9925976197070075e-06, - "loss": 0.8213, - "step": 7912 - }, - { - "epoch": 0.2, - "learning_rate": 1.9925942587660125e-06, - "loss": 0.6411, - "step": 7913 - }, - { - "epoch": 0.2, - "learning_rate": 1.9925908970650336e-06, - "loss": 0.9082, - "step": 7914 - }, - { - "epoch": 0.2, - "learning_rate": 1.9925875346040735e-06, - "loss": 1.0107, - "step": 7915 - }, - { - "epoch": 0.2, - "learning_rate": 1.992584171383135e-06, - "loss": 0.832, - "step": 7916 - }, - { - "epoch": 0.2, - "learning_rate": 1.9925808074022205e-06, - "loss": 1.0415, - "step": 7917 - }, - { - "epoch": 0.2, - "learning_rate": 1.9925774426613323e-06, - "loss": 0.8525, - "step": 7918 - }, - { - "epoch": 0.2, - "learning_rate": 1.9925740771604734e-06, - "loss": 1.083, - "step": 7919 - }, - { - "epoch": 0.2, - "learning_rate": 1.992570710899646e-06, - "loss": 1.0098, - "step": 7920 - }, - { - "epoch": 0.2, - "learning_rate": 1.992567343878853e-06, - "loss": 0.8516, - "step": 7921 - }, - { - "epoch": 0.2, - "learning_rate": 1.9925639760980965e-06, - "loss": 1.0693, - "step": 7922 - }, - { - "epoch": 0.2, - "learning_rate": 1.9925606075573796e-06, - "loss": 0.8564, - "step": 7923 - }, - { - "epoch": 0.2, - "learning_rate": 1.9925572382567046e-06, - "loss": 0.812, - "step": 7924 - }, - { - "epoch": 0.2, - "learning_rate": 1.9925538681960747e-06, - "loss": 0.8965, - "step": 7925 - }, - { - "epoch": 0.2, - "learning_rate": 1.9925504973754915e-06, - "loss": 1.1162, - "step": 7926 - }, - { - "epoch": 0.2, - "learning_rate": 1.992547125794958e-06, - "loss": 0.771, - "step": 7927 - }, - { - "epoch": 0.2, - "learning_rate": 1.9925437534544766e-06, - "loss": 1.0322, - "step": 7928 - }, - { - "epoch": 0.2, - "learning_rate": 1.9925403803540504e-06, - "loss": 1.1221, - "step": 7929 - }, - { - "epoch": 0.2, - "learning_rate": 1.9925370064936815e-06, - "loss": 0.7432, - "step": 7930 - }, - { - "epoch": 0.2, - "learning_rate": 1.992533631873373e-06, - "loss": 0.9814, - "step": 7931 - }, - { - "epoch": 0.2, - "learning_rate": 1.9925302564931265e-06, - "loss": 0.9473, - "step": 7932 - }, - { - "epoch": 0.2, - "learning_rate": 1.992526880352946e-06, - "loss": 0.9531, - "step": 7933 - }, - { - "epoch": 0.2, - "learning_rate": 1.9925235034528325e-06, - "loss": 0.7305, - "step": 7934 - }, - { - "epoch": 0.2, - "learning_rate": 1.99252012579279e-06, - "loss": 0.8438, - "step": 7935 - }, - { - "epoch": 0.2, - "learning_rate": 1.99251674737282e-06, - "loss": 1.0312, - "step": 7936 - }, - { - "epoch": 0.2, - "learning_rate": 1.992513368192926e-06, - "loss": 0.9385, - "step": 7937 - }, - { - "epoch": 0.2, - "learning_rate": 1.99250998825311e-06, - "loss": 1.1953, - "step": 7938 - }, - { - "epoch": 0.2, - "learning_rate": 1.9925066075533746e-06, - "loss": 0.9971, - "step": 7939 - }, - { - "epoch": 0.2, - "learning_rate": 1.992503226093723e-06, - "loss": 0.7983, - "step": 7940 - }, - { - "epoch": 0.2, - "learning_rate": 1.9924998438741566e-06, - "loss": 0.6494, - "step": 7941 - }, - { - "epoch": 0.2, - "learning_rate": 1.9924964608946792e-06, - "loss": 0.9834, - "step": 7942 - }, - { - "epoch": 0.2, - "learning_rate": 1.9924930771552927e-06, - "loss": 0.814, - "step": 7943 - }, - { - "epoch": 0.2, - "learning_rate": 1.9924896926559998e-06, - "loss": 0.8174, - "step": 7944 - }, - { - "epoch": 0.2, - "learning_rate": 1.9924863073968036e-06, - "loss": 1.0469, - "step": 7945 - }, - { - "epoch": 0.2, - "learning_rate": 1.9924829213777057e-06, - "loss": 0.9014, - "step": 7946 - }, - { - "epoch": 0.2, - "learning_rate": 1.99247953459871e-06, - "loss": 0.9668, - "step": 7947 - }, - { - "epoch": 0.2, - "learning_rate": 1.992476147059818e-06, - "loss": 1.1182, - "step": 7948 - }, - { - "epoch": 0.2, - "learning_rate": 1.9924727587610325e-06, - "loss": 0.9082, - "step": 7949 - }, - { - "epoch": 0.2, - "learning_rate": 1.992469369702356e-06, - "loss": 0.752, - "step": 7950 - }, - { - "epoch": 0.2, - "learning_rate": 1.992465979883792e-06, - "loss": 0.9648, - "step": 7951 - }, - { - "epoch": 0.2, - "learning_rate": 1.992462589305342e-06, - "loss": 0.7842, - "step": 7952 - }, - { - "epoch": 0.2, - "learning_rate": 1.9924591979670093e-06, - "loss": 1.0088, - "step": 7953 - }, - { - "epoch": 0.2, - "learning_rate": 1.992455805868796e-06, - "loss": 0.9072, - "step": 7954 - }, - { - "epoch": 0.2, - "learning_rate": 1.992452413010705e-06, - "loss": 0.7559, - "step": 7955 - }, - { - "epoch": 0.2, - "learning_rate": 1.9924490193927385e-06, - "loss": 0.7046, - "step": 7956 - }, - { - "epoch": 0.2, - "learning_rate": 1.9924456250148997e-06, - "loss": 1.124, - "step": 7957 - }, - { - "epoch": 0.2, - "learning_rate": 1.992442229877191e-06, - "loss": 0.8623, - "step": 7958 - }, - { - "epoch": 0.2, - "learning_rate": 1.992438833979615e-06, - "loss": 0.7188, - "step": 7959 - }, - { - "epoch": 0.2, - "learning_rate": 1.992435437322174e-06, - "loss": 0.8945, - "step": 7960 - }, - { - "epoch": 0.2, - "learning_rate": 1.992432039904871e-06, - "loss": 0.9043, - "step": 7961 - }, - { - "epoch": 0.2, - "learning_rate": 1.9924286417277082e-06, - "loss": 0.5986, - "step": 7962 - }, - { - "epoch": 0.2, - "learning_rate": 1.9924252427906884e-06, - "loss": 0.8657, - "step": 7963 - }, - { - "epoch": 0.2, - "learning_rate": 1.9924218430938143e-06, - "loss": 1.0166, - "step": 7964 - }, - { - "epoch": 0.2, - "learning_rate": 1.9924184426370886e-06, - "loss": 0.8242, - "step": 7965 - }, - { - "epoch": 0.2, - "learning_rate": 1.9924150414205137e-06, - "loss": 0.7017, - "step": 7966 - }, - { - "epoch": 0.2, - "learning_rate": 1.992411639444092e-06, - "loss": 0.832, - "step": 7967 - }, - { - "epoch": 0.2, - "learning_rate": 1.9924082367078265e-06, - "loss": 0.7437, - "step": 7968 - }, - { - "epoch": 0.2, - "learning_rate": 1.9924048332117195e-06, - "loss": 0.957, - "step": 7969 - }, - { - "epoch": 0.2, - "learning_rate": 1.992401428955774e-06, - "loss": 0.8711, - "step": 7970 - }, - { - "epoch": 0.2, - "learning_rate": 1.992398023939992e-06, - "loss": 0.7881, - "step": 7971 - }, - { - "epoch": 0.2, - "learning_rate": 1.992394618164377e-06, - "loss": 1.0996, - "step": 7972 - }, - { - "epoch": 0.2, - "learning_rate": 1.9923912116289306e-06, - "loss": 0.8496, - "step": 7973 - }, - { - "epoch": 0.2, - "learning_rate": 1.9923878043336564e-06, - "loss": 0.9082, - "step": 7974 - }, - { - "epoch": 0.2, - "learning_rate": 1.992384396278556e-06, - "loss": 0.8369, - "step": 7975 - }, - { - "epoch": 0.2, - "learning_rate": 1.9923809874636327e-06, - "loss": 0.8545, - "step": 7976 - }, - { - "epoch": 0.2, - "learning_rate": 1.992377577888889e-06, - "loss": 0.9922, - "step": 7977 - }, - { - "epoch": 0.2, - "learning_rate": 1.992374167554327e-06, - "loss": 1.0117, - "step": 7978 - }, - { - "epoch": 0.2, - "learning_rate": 1.9923707564599503e-06, - "loss": 0.8936, - "step": 7979 - }, - { - "epoch": 0.2, - "learning_rate": 1.9923673446057606e-06, - "loss": 0.8311, - "step": 7980 - }, - { - "epoch": 0.2, - "learning_rate": 1.9923639319917607e-06, - "loss": 0.9365, - "step": 7981 - }, - { - "epoch": 0.2, - "learning_rate": 1.9923605186179536e-06, - "loss": 1.0273, - "step": 7982 - }, - { - "epoch": 0.2, - "learning_rate": 1.9923571044843415e-06, - "loss": 0.9302, - "step": 7983 - }, - { - "epoch": 0.2, - "learning_rate": 1.9923536895909273e-06, - "loss": 0.9102, - "step": 7984 - }, - { - "epoch": 0.2, - "learning_rate": 1.992350273937714e-06, - "loss": 0.9902, - "step": 7985 - }, - { - "epoch": 0.2, - "learning_rate": 1.992346857524703e-06, - "loss": 0.875, - "step": 7986 - }, - { - "epoch": 0.2, - "learning_rate": 1.992343440351898e-06, - "loss": 1.0352, - "step": 7987 - }, - { - "epoch": 0.2, - "learning_rate": 1.992340022419301e-06, - "loss": 0.9697, - "step": 7988 - }, - { - "epoch": 0.2, - "learning_rate": 1.992336603726915e-06, - "loss": 0.9707, - "step": 7989 - }, - { - "epoch": 0.2, - "learning_rate": 1.992333184274743e-06, - "loss": 0.9434, - "step": 7990 - }, - { - "epoch": 0.2, - "learning_rate": 1.9923297640627867e-06, - "loss": 1.0381, - "step": 7991 - }, - { - "epoch": 0.2, - "learning_rate": 1.9923263430910488e-06, - "loss": 0.8784, - "step": 7992 - }, - { - "epoch": 0.2, - "learning_rate": 1.9923229213595324e-06, - "loss": 0.8311, - "step": 7993 - }, - { - "epoch": 0.2, - "learning_rate": 1.9923194988682403e-06, - "loss": 0.8408, - "step": 7994 - }, - { - "epoch": 0.2, - "learning_rate": 1.9923160756171744e-06, - "loss": 1.0732, - "step": 7995 - }, - { - "epoch": 0.2, - "learning_rate": 1.992312651606338e-06, - "loss": 0.8271, - "step": 7996 - }, - { - "epoch": 0.2, - "learning_rate": 1.9923092268357333e-06, - "loss": 1.0371, - "step": 7997 - }, - { - "epoch": 0.2, - "learning_rate": 1.992305801305363e-06, - "loss": 0.8193, - "step": 7998 - }, - { - "epoch": 0.21, - "learning_rate": 1.99230237501523e-06, - "loss": 0.9004, - "step": 7999 - }, - { - "epoch": 0.21, - "learning_rate": 1.9922989479653364e-06, - "loss": 0.7939, - "step": 8000 - }, - { - "epoch": 0.21, - "learning_rate": 1.9922955201556853e-06, - "loss": 0.8057, - "step": 8001 - }, - { - "epoch": 0.21, - "learning_rate": 1.992292091586279e-06, - "loss": 0.9766, - "step": 8002 - }, - { - "epoch": 0.21, - "learning_rate": 1.9922886622571204e-06, - "loss": 0.9658, - "step": 8003 - }, - { - "epoch": 0.21, - "learning_rate": 1.992285232168212e-06, - "loss": 0.75, - "step": 8004 - }, - { - "epoch": 0.21, - "learning_rate": 1.9922818013195566e-06, - "loss": 0.9785, - "step": 8005 - }, - { - "epoch": 0.21, - "learning_rate": 1.9922783697111563e-06, - "loss": 0.8662, - "step": 8006 - }, - { - "epoch": 0.21, - "learning_rate": 1.9922749373430145e-06, - "loss": 0.6714, - "step": 8007 - }, - { - "epoch": 0.21, - "learning_rate": 1.992271504215133e-06, - "loss": 1.0996, - "step": 8008 - }, - { - "epoch": 0.21, - "learning_rate": 1.992268070327515e-06, - "loss": 0.8213, - "step": 8009 - }, - { - "epoch": 0.21, - "learning_rate": 1.992264635680163e-06, - "loss": 0.8545, - "step": 8010 - }, - { - "epoch": 0.21, - "learning_rate": 1.9922612002730794e-06, - "loss": 1.041, - "step": 8011 - }, - { - "epoch": 0.21, - "learning_rate": 1.992257764106267e-06, - "loss": 1.0723, - "step": 8012 - }, - { - "epoch": 0.21, - "learning_rate": 1.992254327179729e-06, - "loss": 1.001, - "step": 8013 - }, - { - "epoch": 0.21, - "learning_rate": 1.992250889493467e-06, - "loss": 1.2529, - "step": 8014 - }, - { - "epoch": 0.21, - "learning_rate": 1.992247451047484e-06, - "loss": 0.8394, - "step": 8015 - }, - { - "epoch": 0.21, - "learning_rate": 1.9922440118417833e-06, - "loss": 1.0225, - "step": 8016 - }, - { - "epoch": 0.21, - "learning_rate": 1.9922405718763666e-06, - "loss": 0.9512, - "step": 8017 - }, - { - "epoch": 0.21, - "learning_rate": 1.9922371311512368e-06, - "loss": 1.0469, - "step": 8018 - }, - { - "epoch": 0.21, - "learning_rate": 1.992233689666397e-06, - "loss": 0.9316, - "step": 8019 - }, - { - "epoch": 0.21, - "learning_rate": 1.9922302474218494e-06, - "loss": 0.9663, - "step": 8020 - }, - { - "epoch": 0.21, - "learning_rate": 1.9922268044175966e-06, - "loss": 1.0283, - "step": 8021 - }, - { - "epoch": 0.21, - "learning_rate": 1.992223360653641e-06, - "loss": 0.9014, - "step": 8022 - }, - { - "epoch": 0.21, - "learning_rate": 1.9922199161299865e-06, - "loss": 0.9111, - "step": 8023 - }, - { - "epoch": 0.21, - "learning_rate": 1.992216470846634e-06, - "loss": 0.7363, - "step": 8024 - }, - { - "epoch": 0.21, - "learning_rate": 1.9922130248035873e-06, - "loss": 0.874, - "step": 8025 - }, - { - "epoch": 0.21, - "learning_rate": 1.9922095780008487e-06, - "loss": 0.9521, - "step": 8026 - }, - { - "epoch": 0.21, - "learning_rate": 1.992206130438421e-06, - "loss": 0.9209, - "step": 8027 - }, - { - "epoch": 0.21, - "learning_rate": 1.992202682116307e-06, - "loss": 0.8184, - "step": 8028 - }, - { - "epoch": 0.21, - "learning_rate": 1.9921992330345084e-06, - "loss": 0.7949, - "step": 8029 - }, - { - "epoch": 0.21, - "learning_rate": 1.9921957831930284e-06, - "loss": 0.853, - "step": 8030 - }, - { - "epoch": 0.21, - "learning_rate": 1.99219233259187e-06, - "loss": 0.8652, - "step": 8031 - }, - { - "epoch": 0.21, - "learning_rate": 1.9921888812310354e-06, - "loss": 0.8818, - "step": 8032 - }, - { - "epoch": 0.21, - "learning_rate": 1.9921854291105274e-06, - "loss": 0.7266, - "step": 8033 - }, - { - "epoch": 0.21, - "learning_rate": 1.992181976230349e-06, - "loss": 1.2266, - "step": 8034 - }, - { - "epoch": 0.21, - "learning_rate": 1.9921785225905022e-06, - "loss": 0.8906, - "step": 8035 - }, - { - "epoch": 0.21, - "learning_rate": 1.99217506819099e-06, - "loss": 1.1748, - "step": 8036 - }, - { - "epoch": 0.21, - "learning_rate": 1.992171613031815e-06, - "loss": 1.0283, - "step": 8037 - }, - { - "epoch": 0.21, - "learning_rate": 1.99216815711298e-06, - "loss": 1.0146, - "step": 8038 - }, - { - "epoch": 0.21, - "learning_rate": 1.992164700434487e-06, - "loss": 1.0869, - "step": 8039 - }, - { - "epoch": 0.21, - "learning_rate": 1.9921612429963394e-06, - "loss": 0.7754, - "step": 8040 - }, - { - "epoch": 0.21, - "learning_rate": 1.992157784798539e-06, - "loss": 0.6963, - "step": 8041 - }, - { - "epoch": 0.21, - "learning_rate": 1.9921543258410897e-06, - "loss": 0.8291, - "step": 8042 - }, - { - "epoch": 0.21, - "learning_rate": 1.9921508661239934e-06, - "loss": 1.0674, - "step": 8043 - }, - { - "epoch": 0.21, - "learning_rate": 1.992147405647253e-06, - "loss": 0.7642, - "step": 8044 - }, - { - "epoch": 0.21, - "learning_rate": 1.9921439444108704e-06, - "loss": 0.7529, - "step": 8045 - }, - { - "epoch": 0.21, - "learning_rate": 1.992140482414849e-06, - "loss": 0.9082, - "step": 8046 - }, - { - "epoch": 0.21, - "learning_rate": 1.992137019659191e-06, - "loss": 1.0596, - "step": 8047 - }, - { - "epoch": 0.21, - "learning_rate": 1.9921335561438996e-06, - "loss": 0.8501, - "step": 8048 - }, - { - "epoch": 0.21, - "learning_rate": 1.992130091868977e-06, - "loss": 0.957, - "step": 8049 - }, - { - "epoch": 0.21, - "learning_rate": 1.9921266268344263e-06, - "loss": 1.209, - "step": 8050 - }, - { - "epoch": 0.21, - "learning_rate": 1.9921231610402497e-06, - "loss": 0.835, - "step": 8051 - }, - { - "epoch": 0.21, - "learning_rate": 1.9921196944864498e-06, - "loss": 0.6782, - "step": 8052 - }, - { - "epoch": 0.21, - "learning_rate": 1.99211622717303e-06, - "loss": 1.0127, - "step": 8053 - }, - { - "epoch": 0.21, - "learning_rate": 1.9921127590999916e-06, - "loss": 0.8955, - "step": 8054 - }, - { - "epoch": 0.21, - "learning_rate": 1.992109290267339e-06, - "loss": 0.7397, - "step": 8055 - }, - { - "epoch": 0.21, - "learning_rate": 1.9921058206750733e-06, - "loss": 1.0557, - "step": 8056 - }, - { - "epoch": 0.21, - "learning_rate": 1.992102350323198e-06, - "loss": 1.1055, - "step": 8057 - }, - { - "epoch": 0.21, - "learning_rate": 1.9920988792117157e-06, - "loss": 0.6382, - "step": 8058 - }, - { - "epoch": 0.21, - "learning_rate": 1.9920954073406287e-06, - "loss": 1.0977, - "step": 8059 - }, - { - "epoch": 0.21, - "learning_rate": 1.9920919347099395e-06, - "loss": 1.1797, - "step": 8060 - }, - { - "epoch": 0.21, - "learning_rate": 1.9920884613196515e-06, - "loss": 0.896, - "step": 8061 - }, - { - "epoch": 0.21, - "learning_rate": 1.9920849871697672e-06, - "loss": 1.1133, - "step": 8062 - }, - { - "epoch": 0.21, - "learning_rate": 1.992081512260289e-06, - "loss": 1.0254, - "step": 8063 - }, - { - "epoch": 0.21, - "learning_rate": 1.992078036591219e-06, - "loss": 0.9219, - "step": 8064 - }, - { - "epoch": 0.21, - "learning_rate": 1.9920745601625613e-06, - "loss": 0.666, - "step": 8065 - }, - { - "epoch": 0.21, - "learning_rate": 1.9920710829743173e-06, - "loss": 0.9111, - "step": 8066 - }, - { - "epoch": 0.21, - "learning_rate": 1.99206760502649e-06, - "loss": 0.9756, - "step": 8067 - }, - { - "epoch": 0.21, - "learning_rate": 1.9920641263190824e-06, - "loss": 1.0127, - "step": 8068 - }, - { - "epoch": 0.21, - "learning_rate": 1.9920606468520966e-06, - "loss": 0.9619, - "step": 8069 - }, - { - "epoch": 0.21, - "learning_rate": 1.9920571666255357e-06, - "loss": 0.8535, - "step": 8070 - }, - { - "epoch": 0.21, - "learning_rate": 1.9920536856394027e-06, - "loss": 0.752, - "step": 8071 - }, - { - "epoch": 0.21, - "learning_rate": 1.9920502038936996e-06, - "loss": 0.9883, - "step": 8072 - }, - { - "epoch": 0.21, - "learning_rate": 1.9920467213884287e-06, - "loss": 1.0732, - "step": 8073 - }, - { - "epoch": 0.21, - "learning_rate": 1.992043238123594e-06, - "loss": 0.7256, - "step": 8074 - }, - { - "epoch": 0.21, - "learning_rate": 1.992039754099197e-06, - "loss": 1.1094, - "step": 8075 - }, - { - "epoch": 0.21, - "learning_rate": 1.992036269315241e-06, - "loss": 0.8452, - "step": 8076 - }, - { - "epoch": 0.21, - "learning_rate": 1.992032783771728e-06, - "loss": 0.7515, - "step": 8077 - }, - { - "epoch": 0.21, - "learning_rate": 1.9920292974686612e-06, - "loss": 0.9248, - "step": 8078 - }, - { - "epoch": 0.21, - "learning_rate": 1.9920258104060434e-06, - "loss": 0.8223, - "step": 8079 - }, - { - "epoch": 0.21, - "learning_rate": 1.992022322583877e-06, - "loss": 0.6875, - "step": 8080 - }, - { - "epoch": 0.21, - "learning_rate": 1.9920188340021647e-06, - "loss": 0.7139, - "step": 8081 - }, - { - "epoch": 0.21, - "learning_rate": 1.9920153446609092e-06, - "loss": 1.0894, - "step": 8082 - }, - { - "epoch": 0.21, - "learning_rate": 1.9920118545601134e-06, - "loss": 0.8701, - "step": 8083 - }, - { - "epoch": 0.21, - "learning_rate": 1.9920083636997798e-06, - "loss": 0.8105, - "step": 8084 - }, - { - "epoch": 0.21, - "learning_rate": 1.9920048720799104e-06, - "loss": 0.9727, - "step": 8085 - }, - { - "epoch": 0.21, - "learning_rate": 1.9920013797005087e-06, - "loss": 0.8604, - "step": 8086 - }, - { - "epoch": 0.21, - "learning_rate": 1.9919978865615772e-06, - "loss": 0.709, - "step": 8087 - }, - { - "epoch": 0.21, - "learning_rate": 1.991994392663119e-06, - "loss": 1.3594, - "step": 8088 - }, - { - "epoch": 0.21, - "learning_rate": 1.991990898005136e-06, - "loss": 0.9873, - "step": 8089 - }, - { - "epoch": 0.21, - "learning_rate": 1.991987402587631e-06, - "loss": 0.8179, - "step": 8090 - }, - { - "epoch": 0.21, - "learning_rate": 1.991983906410607e-06, - "loss": 1.0439, - "step": 8091 - }, - { - "epoch": 0.21, - "learning_rate": 1.9919804094740663e-06, - "loss": 0.8594, - "step": 8092 - }, - { - "epoch": 0.21, - "learning_rate": 1.9919769117780124e-06, - "loss": 0.7881, - "step": 8093 - }, - { - "epoch": 0.21, - "learning_rate": 1.991973413322447e-06, - "loss": 0.9629, - "step": 8094 - }, - { - "epoch": 0.21, - "learning_rate": 1.991969914107373e-06, - "loss": 0.8789, - "step": 8095 - }, - { - "epoch": 0.21, - "learning_rate": 1.9919664141327933e-06, - "loss": 0.957, - "step": 8096 - }, - { - "epoch": 0.21, - "learning_rate": 1.991962913398711e-06, - "loss": 1.1064, - "step": 8097 - }, - { - "epoch": 0.21, - "learning_rate": 1.9919594119051275e-06, - "loss": 0.9658, - "step": 8098 - }, - { - "epoch": 0.21, - "learning_rate": 1.991955909652047e-06, - "loss": 0.9531, - "step": 8099 - }, - { - "epoch": 0.21, - "learning_rate": 1.9919524066394714e-06, - "loss": 0.8311, - "step": 8100 - }, - { - "epoch": 0.21, - "learning_rate": 1.991948902867403e-06, - "loss": 0.7354, - "step": 8101 - }, - { - "epoch": 0.21, - "learning_rate": 1.9919453983358453e-06, - "loss": 0.876, - "step": 8102 - }, - { - "epoch": 0.21, - "learning_rate": 1.9919418930448006e-06, - "loss": 1.1562, - "step": 8103 - }, - { - "epoch": 0.21, - "learning_rate": 1.9919383869942715e-06, - "loss": 0.7207, - "step": 8104 - }, - { - "epoch": 0.21, - "learning_rate": 1.991934880184261e-06, - "loss": 0.8721, - "step": 8105 - }, - { - "epoch": 0.21, - "learning_rate": 1.9919313726147712e-06, - "loss": 1.0186, - "step": 8106 - }, - { - "epoch": 0.21, - "learning_rate": 1.9919278642858052e-06, - "loss": 1.0332, - "step": 8107 - }, - { - "epoch": 0.21, - "learning_rate": 1.9919243551973658e-06, - "loss": 1.1494, - "step": 8108 - }, - { - "epoch": 0.21, - "learning_rate": 1.9919208453494558e-06, - "loss": 1.1309, - "step": 8109 - }, - { - "epoch": 0.21, - "learning_rate": 1.9919173347420774e-06, - "loss": 0.9307, - "step": 8110 - }, - { - "epoch": 0.21, - "learning_rate": 1.9919138233752333e-06, - "loss": 0.8467, - "step": 8111 - }, - { - "epoch": 0.21, - "learning_rate": 1.9919103112489262e-06, - "loss": 0.8936, - "step": 8112 - }, - { - "epoch": 0.21, - "learning_rate": 1.9919067983631597e-06, - "loss": 0.8057, - "step": 8113 - }, - { - "epoch": 0.21, - "learning_rate": 1.9919032847179354e-06, - "loss": 0.9043, - "step": 8114 - }, - { - "epoch": 0.21, - "learning_rate": 1.9918997703132562e-06, - "loss": 0.8242, - "step": 8115 - }, - { - "epoch": 0.21, - "learning_rate": 1.9918962551491252e-06, - "loss": 0.8071, - "step": 8116 - }, - { - "epoch": 0.21, - "learning_rate": 1.9918927392255445e-06, - "loss": 0.9277, - "step": 8117 - }, - { - "epoch": 0.21, - "learning_rate": 1.991889222542518e-06, - "loss": 0.625, - "step": 8118 - }, - { - "epoch": 0.21, - "learning_rate": 1.9918857051000465e-06, - "loss": 0.7041, - "step": 8119 - }, - { - "epoch": 0.21, - "learning_rate": 1.9918821868981343e-06, - "loss": 0.7625, - "step": 8120 - }, - { - "epoch": 0.21, - "learning_rate": 1.9918786679367834e-06, - "loss": 0.7959, - "step": 8121 - }, - { - "epoch": 0.21, - "learning_rate": 1.9918751482159964e-06, - "loss": 1.1445, - "step": 8122 - }, - { - "epoch": 0.21, - "learning_rate": 1.9918716277357765e-06, - "loss": 0.8276, - "step": 8123 - }, - { - "epoch": 0.21, - "learning_rate": 1.9918681064961263e-06, - "loss": 0.876, - "step": 8124 - }, - { - "epoch": 0.21, - "learning_rate": 1.9918645844970476e-06, - "loss": 0.9932, - "step": 8125 - }, - { - "epoch": 0.21, - "learning_rate": 1.9918610617385446e-06, - "loss": 0.707, - "step": 8126 - }, - { - "epoch": 0.21, - "learning_rate": 1.9918575382206185e-06, - "loss": 0.9775, - "step": 8127 - }, - { - "epoch": 0.21, - "learning_rate": 1.991854013943273e-06, - "loss": 0.8589, - "step": 8128 - }, - { - "epoch": 0.21, - "learning_rate": 1.9918504889065107e-06, - "loss": 1.0469, - "step": 8129 - }, - { - "epoch": 0.21, - "learning_rate": 1.9918469631103336e-06, - "loss": 0.9775, - "step": 8130 - }, - { - "epoch": 0.21, - "learning_rate": 1.9918434365547453e-06, - "loss": 1.0781, - "step": 8131 - }, - { - "epoch": 0.21, - "learning_rate": 1.991839909239748e-06, - "loss": 0.8945, - "step": 8132 - }, - { - "epoch": 0.21, - "learning_rate": 1.991836381165344e-06, - "loss": 0.918, - "step": 8133 - }, - { - "epoch": 0.21, - "learning_rate": 1.991832852331537e-06, - "loss": 1.0264, - "step": 8134 - }, - { - "epoch": 0.21, - "learning_rate": 1.9918293227383294e-06, - "loss": 0.8662, - "step": 8135 - }, - { - "epoch": 0.21, - "learning_rate": 1.9918257923857232e-06, - "loss": 0.9277, - "step": 8136 - }, - { - "epoch": 0.21, - "learning_rate": 1.9918222612737216e-06, - "loss": 0.9492, - "step": 8137 - }, - { - "epoch": 0.21, - "learning_rate": 1.9918187294023277e-06, - "loss": 0.8223, - "step": 8138 - }, - { - "epoch": 0.21, - "learning_rate": 1.9918151967715435e-06, - "loss": 0.8042, - "step": 8139 - }, - { - "epoch": 0.21, - "learning_rate": 1.991811663381372e-06, - "loss": 0.7676, - "step": 8140 - }, - { - "epoch": 0.21, - "learning_rate": 1.9918081292318163e-06, - "loss": 0.7969, - "step": 8141 - }, - { - "epoch": 0.21, - "learning_rate": 1.9918045943228784e-06, - "loss": 1.002, - "step": 8142 - }, - { - "epoch": 0.21, - "learning_rate": 1.991801058654561e-06, - "loss": 1.1504, - "step": 8143 - }, - { - "epoch": 0.21, - "learning_rate": 1.991797522226868e-06, - "loss": 0.9043, - "step": 8144 - }, - { - "epoch": 0.21, - "learning_rate": 1.9917939850398006e-06, - "loss": 0.6736, - "step": 8145 - }, - { - "epoch": 0.21, - "learning_rate": 1.991790447093362e-06, - "loss": 0.7134, - "step": 8146 - }, - { - "epoch": 0.21, - "learning_rate": 1.9917869083875558e-06, - "loss": 1.0957, - "step": 8147 - }, - { - "epoch": 0.21, - "learning_rate": 1.9917833689223833e-06, - "loss": 0.9678, - "step": 8148 - }, - { - "epoch": 0.21, - "learning_rate": 1.991779828697848e-06, - "loss": 0.9453, - "step": 8149 - }, - { - "epoch": 0.21, - "learning_rate": 1.9917762877139524e-06, - "loss": 0.7793, - "step": 8150 - }, - { - "epoch": 0.21, - "learning_rate": 1.9917727459706996e-06, - "loss": 0.9775, - "step": 8151 - }, - { - "epoch": 0.21, - "learning_rate": 1.991769203468092e-06, - "loss": 0.9639, - "step": 8152 - }, - { - "epoch": 0.21, - "learning_rate": 1.9917656602061323e-06, - "loss": 0.75, - "step": 8153 - }, - { - "epoch": 0.21, - "learning_rate": 1.991762116184823e-06, - "loss": 0.6724, - "step": 8154 - }, - { - "epoch": 0.21, - "learning_rate": 1.991758571404167e-06, - "loss": 1.1475, - "step": 8155 - }, - { - "epoch": 0.21, - "learning_rate": 1.9917550258641675e-06, - "loss": 1.0518, - "step": 8156 - }, - { - "epoch": 0.21, - "learning_rate": 1.991751479564826e-06, - "loss": 1.0938, - "step": 8157 - }, - { - "epoch": 0.21, - "learning_rate": 1.9917479325061472e-06, - "loss": 1.1475, - "step": 8158 - }, - { - "epoch": 0.21, - "learning_rate": 1.9917443846881317e-06, - "loss": 0.9536, - "step": 8159 - }, - { - "epoch": 0.21, - "learning_rate": 1.9917408361107833e-06, - "loss": 0.8506, - "step": 8160 - }, - { - "epoch": 0.21, - "learning_rate": 1.9917372867741045e-06, - "loss": 0.9541, - "step": 8161 - }, - { - "epoch": 0.21, - "learning_rate": 1.9917337366780985e-06, - "loss": 0.8994, - "step": 8162 - }, - { - "epoch": 0.21, - "learning_rate": 1.991730185822767e-06, - "loss": 0.9023, - "step": 8163 - }, - { - "epoch": 0.21, - "learning_rate": 1.9917266342081136e-06, - "loss": 0.8643, - "step": 8164 - }, - { - "epoch": 0.21, - "learning_rate": 1.991723081834141e-06, - "loss": 0.8945, - "step": 8165 - }, - { - "epoch": 0.21, - "learning_rate": 1.9917195287008508e-06, - "loss": 1.1543, - "step": 8166 - }, - { - "epoch": 0.21, - "learning_rate": 1.9917159748082474e-06, - "loss": 0.8555, - "step": 8167 - }, - { - "epoch": 0.21, - "learning_rate": 1.991712420156332e-06, - "loss": 0.7251, - "step": 8168 - }, - { - "epoch": 0.21, - "learning_rate": 1.9917088647451085e-06, - "loss": 0.6892, - "step": 8169 - }, - { - "epoch": 0.21, - "learning_rate": 1.991705308574579e-06, - "loss": 0.9229, - "step": 8170 - }, - { - "epoch": 0.21, - "learning_rate": 1.9917017516447463e-06, - "loss": 0.7617, - "step": 8171 - }, - { - "epoch": 0.21, - "learning_rate": 1.9916981939556133e-06, - "loss": 0.7363, - "step": 8172 - }, - { - "epoch": 0.21, - "learning_rate": 1.991694635507182e-06, - "loss": 0.9131, - "step": 8173 - }, - { - "epoch": 0.21, - "learning_rate": 1.9916910762994564e-06, - "loss": 1.0146, - "step": 8174 - }, - { - "epoch": 0.21, - "learning_rate": 1.9916875163324384e-06, - "loss": 0.8516, - "step": 8175 - }, - { - "epoch": 0.21, - "learning_rate": 1.9916839556061307e-06, - "loss": 0.9346, - "step": 8176 - }, - { - "epoch": 0.21, - "learning_rate": 1.9916803941205363e-06, - "loss": 0.6929, - "step": 8177 - }, - { - "epoch": 0.21, - "learning_rate": 1.991676831875658e-06, - "loss": 0.7659, - "step": 8178 - }, - { - "epoch": 0.21, - "learning_rate": 1.9916732688714977e-06, - "loss": 0.7939, - "step": 8179 - }, - { - "epoch": 0.21, - "learning_rate": 1.9916697051080594e-06, - "loss": 0.7644, - "step": 8180 - }, - { - "epoch": 0.21, - "learning_rate": 1.9916661405853454e-06, - "loss": 0.7583, - "step": 8181 - }, - { - "epoch": 0.21, - "learning_rate": 1.9916625753033574e-06, - "loss": 0.8613, - "step": 8182 - }, - { - "epoch": 0.21, - "learning_rate": 1.9916590092620997e-06, - "loss": 0.917, - "step": 8183 - }, - { - "epoch": 0.21, - "learning_rate": 1.991655442461574e-06, - "loss": 0.9082, - "step": 8184 - }, - { - "epoch": 0.21, - "learning_rate": 1.9916518749017835e-06, - "loss": 0.751, - "step": 8185 - }, - { - "epoch": 0.21, - "learning_rate": 1.99164830658273e-06, - "loss": 1.1953, - "step": 8186 - }, - { - "epoch": 0.21, - "learning_rate": 1.991644737504418e-06, - "loss": 0.8516, - "step": 8187 - }, - { - "epoch": 0.21, - "learning_rate": 1.9916411676668488e-06, - "loss": 1.0576, - "step": 8188 - }, - { - "epoch": 0.21, - "learning_rate": 1.9916375970700255e-06, - "loss": 1.041, - "step": 8189 - }, - { - "epoch": 0.21, - "learning_rate": 1.991634025713951e-06, - "loss": 0.9463, - "step": 8190 - }, - { - "epoch": 0.21, - "learning_rate": 1.991630453598628e-06, - "loss": 1.0146, - "step": 8191 - }, - { - "epoch": 0.21, - "learning_rate": 1.9916268807240592e-06, - "loss": 0.9287, - "step": 8192 - }, - { - "epoch": 0.21, - "learning_rate": 1.991623307090247e-06, - "loss": 0.9111, - "step": 8193 - }, - { - "epoch": 0.21, - "learning_rate": 1.9916197326971942e-06, - "loss": 1.0986, - "step": 8194 - }, - { - "epoch": 0.21, - "learning_rate": 1.9916161575449045e-06, - "loss": 0.7168, - "step": 8195 - }, - { - "epoch": 0.21, - "learning_rate": 1.9916125816333794e-06, - "loss": 0.7607, - "step": 8196 - }, - { - "epoch": 0.21, - "learning_rate": 1.991609004962622e-06, - "loss": 0.9766, - "step": 8197 - }, - { - "epoch": 0.21, - "learning_rate": 1.991605427532636e-06, - "loss": 0.9082, - "step": 8198 - }, - { - "epoch": 0.21, - "learning_rate": 1.9916018493434227e-06, - "loss": 0.7344, - "step": 8199 - }, - { - "epoch": 0.21, - "learning_rate": 1.9915982703949854e-06, - "loss": 0.915, - "step": 8200 - }, - { - "epoch": 0.21, - "learning_rate": 1.991594690687327e-06, - "loss": 0.8281, - "step": 8201 - }, - { - "epoch": 0.21, - "learning_rate": 1.99159111022045e-06, - "loss": 1.0146, - "step": 8202 - }, - { - "epoch": 0.21, - "learning_rate": 1.9915875289943576e-06, - "loss": 0.749, - "step": 8203 - }, - { - "epoch": 0.21, - "learning_rate": 1.9915839470090523e-06, - "loss": 0.9072, - "step": 8204 - }, - { - "epoch": 0.21, - "learning_rate": 1.9915803642645365e-06, - "loss": 0.689, - "step": 8205 - }, - { - "epoch": 0.21, - "learning_rate": 1.9915767807608132e-06, - "loss": 1.0322, - "step": 8206 - }, - { - "epoch": 0.21, - "learning_rate": 1.9915731964978854e-06, - "loss": 0.7505, - "step": 8207 - }, - { - "epoch": 0.21, - "learning_rate": 1.9915696114757552e-06, - "loss": 0.918, - "step": 8208 - }, - { - "epoch": 0.21, - "learning_rate": 1.991566025694426e-06, - "loss": 0.9268, - "step": 8209 - }, - { - "epoch": 0.21, - "learning_rate": 1.9915624391539003e-06, - "loss": 0.9697, - "step": 8210 - }, - { - "epoch": 0.21, - "learning_rate": 1.9915588518541807e-06, - "loss": 1.0342, - "step": 8211 - }, - { - "epoch": 0.21, - "learning_rate": 1.99155526379527e-06, - "loss": 0.7822, - "step": 8212 - }, - { - "epoch": 0.21, - "learning_rate": 1.991551674977171e-06, - "loss": 1.1123, - "step": 8213 - }, - { - "epoch": 0.21, - "learning_rate": 1.991548085399887e-06, - "loss": 0.7744, - "step": 8214 - }, - { - "epoch": 0.21, - "learning_rate": 1.9915444950634195e-06, - "loss": 0.9336, - "step": 8215 - }, - { - "epoch": 0.21, - "learning_rate": 1.9915409039677726e-06, - "loss": 1.0615, - "step": 8216 - }, - { - "epoch": 0.21, - "learning_rate": 1.9915373121129486e-06, - "loss": 0.9551, - "step": 8217 - }, - { - "epoch": 0.21, - "learning_rate": 1.9915337194989493e-06, - "loss": 1.0723, - "step": 8218 - }, - { - "epoch": 0.21, - "learning_rate": 1.9915301261257786e-06, - "loss": 0.8506, - "step": 8219 - }, - { - "epoch": 0.21, - "learning_rate": 1.991526531993439e-06, - "loss": 0.9951, - "step": 8220 - }, - { - "epoch": 0.21, - "learning_rate": 1.9915229371019328e-06, - "loss": 0.8877, - "step": 8221 - }, - { - "epoch": 0.21, - "learning_rate": 1.9915193414512632e-06, - "loss": 0.7739, - "step": 8222 - }, - { - "epoch": 0.21, - "learning_rate": 1.991515745041433e-06, - "loss": 0.7705, - "step": 8223 - }, - { - "epoch": 0.21, - "learning_rate": 1.9915121478724444e-06, - "loss": 0.9678, - "step": 8224 - }, - { - "epoch": 0.21, - "learning_rate": 1.991508549944301e-06, - "loss": 0.7607, - "step": 8225 - }, - { - "epoch": 0.21, - "learning_rate": 1.9915049512570052e-06, - "loss": 0.9004, - "step": 8226 - }, - { - "epoch": 0.21, - "learning_rate": 1.991501351810559e-06, - "loss": 1.084, - "step": 8227 - }, - { - "epoch": 0.21, - "learning_rate": 1.991497751604966e-06, - "loss": 0.6821, - "step": 8228 - }, - { - "epoch": 0.21, - "learning_rate": 1.991494150640229e-06, - "loss": 0.9287, - "step": 8229 - }, - { - "epoch": 0.21, - "learning_rate": 1.9914905489163507e-06, - "loss": 0.6323, - "step": 8230 - }, - { - "epoch": 0.21, - "learning_rate": 1.9914869464333334e-06, - "loss": 0.9561, - "step": 8231 - }, - { - "epoch": 0.21, - "learning_rate": 1.99148334319118e-06, - "loss": 1.0176, - "step": 8232 - }, - { - "epoch": 0.21, - "learning_rate": 1.9914797391898936e-06, - "loss": 0.7373, - "step": 8233 - }, - { - "epoch": 0.21, - "learning_rate": 1.9914761344294766e-06, - "loss": 0.8857, - "step": 8234 - }, - { - "epoch": 0.21, - "learning_rate": 1.991472528909932e-06, - "loss": 1.0557, - "step": 8235 - }, - { - "epoch": 0.21, - "learning_rate": 1.9914689226312624e-06, - "loss": 0.9814, - "step": 8236 - }, - { - "epoch": 0.21, - "learning_rate": 1.9914653155934706e-06, - "loss": 1.0254, - "step": 8237 - }, - { - "epoch": 0.21, - "learning_rate": 1.9914617077965595e-06, - "loss": 0.6997, - "step": 8238 - }, - { - "epoch": 0.21, - "learning_rate": 1.991458099240532e-06, - "loss": 0.7012, - "step": 8239 - }, - { - "epoch": 0.21, - "learning_rate": 1.9914544899253906e-06, - "loss": 0.8159, - "step": 8240 - }, - { - "epoch": 0.21, - "learning_rate": 1.9914508798511374e-06, - "loss": 0.8535, - "step": 8241 - }, - { - "epoch": 0.21, - "learning_rate": 1.991447269017776e-06, - "loss": 0.8916, - "step": 8242 - }, - { - "epoch": 0.21, - "learning_rate": 1.99144365742531e-06, - "loss": 0.874, - "step": 8243 - }, - { - "epoch": 0.21, - "learning_rate": 1.9914400450737406e-06, - "loss": 0.9453, - "step": 8244 - }, - { - "epoch": 0.21, - "learning_rate": 1.9914364319630708e-06, - "loss": 0.6169, - "step": 8245 - }, - { - "epoch": 0.21, - "learning_rate": 1.991432818093304e-06, - "loss": 1.0771, - "step": 8246 - }, - { - "epoch": 0.21, - "learning_rate": 1.991429203464443e-06, - "loss": 0.6748, - "step": 8247 - }, - { - "epoch": 0.21, - "learning_rate": 1.99142558807649e-06, - "loss": 0.9775, - "step": 8248 - }, - { - "epoch": 0.21, - "learning_rate": 1.9914219719294474e-06, - "loss": 0.7437, - "step": 8249 - }, - { - "epoch": 0.21, - "learning_rate": 1.991418355023319e-06, - "loss": 0.9404, - "step": 8250 - }, - { - "epoch": 0.21, - "learning_rate": 1.9914147373581074e-06, - "loss": 0.7734, - "step": 8251 - }, - { - "epoch": 0.21, - "learning_rate": 1.991411118933815e-06, - "loss": 0.9658, - "step": 8252 - }, - { - "epoch": 0.21, - "learning_rate": 1.991407499750445e-06, - "loss": 1.1846, - "step": 8253 - }, - { - "epoch": 0.21, - "learning_rate": 1.9914038798079994e-06, - "loss": 0.9736, - "step": 8254 - }, - { - "epoch": 0.21, - "learning_rate": 1.9914002591064812e-06, - "loss": 0.8699, - "step": 8255 - }, - { - "epoch": 0.21, - "learning_rate": 1.991396637645894e-06, - "loss": 0.9971, - "step": 8256 - }, - { - "epoch": 0.21, - "learning_rate": 1.9913930154262396e-06, - "loss": 1.1465, - "step": 8257 - }, - { - "epoch": 0.21, - "learning_rate": 1.9913893924475216e-06, - "loss": 0.937, - "step": 8258 - }, - { - "epoch": 0.21, - "learning_rate": 1.9913857687097418e-06, - "loss": 0.9912, - "step": 8259 - }, - { - "epoch": 0.21, - "learning_rate": 1.9913821442129036e-06, - "loss": 0.875, - "step": 8260 - }, - { - "epoch": 0.21, - "learning_rate": 1.99137851895701e-06, - "loss": 0.9844, - "step": 8261 - }, - { - "epoch": 0.21, - "learning_rate": 1.9913748929420634e-06, - "loss": 1.1055, - "step": 8262 - }, - { - "epoch": 0.21, - "learning_rate": 1.991371266168066e-06, - "loss": 1.0674, - "step": 8263 - }, - { - "epoch": 0.21, - "learning_rate": 1.991367638635022e-06, - "loss": 0.9824, - "step": 8264 - }, - { - "epoch": 0.21, - "learning_rate": 1.991364010342933e-06, - "loss": 0.8037, - "step": 8265 - }, - { - "epoch": 0.21, - "learning_rate": 1.9913603812918023e-06, - "loss": 0.7632, - "step": 8266 - }, - { - "epoch": 0.21, - "learning_rate": 1.9913567514816327e-06, - "loss": 1.002, - "step": 8267 - }, - { - "epoch": 0.21, - "learning_rate": 1.9913531209124263e-06, - "loss": 0.7412, - "step": 8268 - }, - { - "epoch": 0.21, - "learning_rate": 1.991349489584187e-06, - "loss": 0.9404, - "step": 8269 - }, - { - "epoch": 0.21, - "learning_rate": 1.9913458574969162e-06, - "loss": 0.8672, - "step": 8270 - }, - { - "epoch": 0.21, - "learning_rate": 1.991342224650618e-06, - "loss": 0.8008, - "step": 8271 - }, - { - "epoch": 0.21, - "learning_rate": 1.9913385910452945e-06, - "loss": 0.9385, - "step": 8272 - }, - { - "epoch": 0.21, - "learning_rate": 1.991334956680949e-06, - "loss": 1.0371, - "step": 8273 - }, - { - "epoch": 0.21, - "learning_rate": 1.9913313215575835e-06, - "loss": 0.9912, - "step": 8274 - }, - { - "epoch": 0.21, - "learning_rate": 1.9913276856752016e-06, - "loss": 1.0137, - "step": 8275 - }, - { - "epoch": 0.21, - "learning_rate": 1.991324049033805e-06, - "loss": 0.8506, - "step": 8276 - }, - { - "epoch": 0.21, - "learning_rate": 1.9913204116333976e-06, - "loss": 0.6814, - "step": 8277 - }, - { - "epoch": 0.21, - "learning_rate": 1.991316773473982e-06, - "loss": 1.0811, - "step": 8278 - }, - { - "epoch": 0.21, - "learning_rate": 1.9913131345555603e-06, - "loss": 0.9014, - "step": 8279 - }, - { - "epoch": 0.21, - "learning_rate": 1.991309494878136e-06, - "loss": 1.0176, - "step": 8280 - }, - { - "epoch": 0.21, - "learning_rate": 1.9913058544417113e-06, - "loss": 0.96, - "step": 8281 - }, - { - "epoch": 0.21, - "learning_rate": 1.991302213246289e-06, - "loss": 0.8994, - "step": 8282 - }, - { - "epoch": 0.21, - "learning_rate": 1.991298571291873e-06, - "loss": 1.042, - "step": 8283 - }, - { - "epoch": 0.21, - "learning_rate": 1.9912949285784648e-06, - "loss": 0.8965, - "step": 8284 - }, - { - "epoch": 0.21, - "learning_rate": 1.9912912851060675e-06, - "loss": 0.6812, - "step": 8285 - }, - { - "epoch": 0.21, - "learning_rate": 1.9912876408746843e-06, - "loss": 0.8296, - "step": 8286 - }, - { - "epoch": 0.21, - "learning_rate": 1.9912839958843176e-06, - "loss": 1.0537, - "step": 8287 - }, - { - "epoch": 0.21, - "learning_rate": 1.9912803501349704e-06, - "loss": 0.6904, - "step": 8288 - }, - { - "epoch": 0.21, - "learning_rate": 1.9912767036266453e-06, - "loss": 0.8652, - "step": 8289 - }, - { - "epoch": 0.21, - "learning_rate": 1.9912730563593457e-06, - "loss": 1.04, - "step": 8290 - }, - { - "epoch": 0.21, - "learning_rate": 1.9912694083330736e-06, - "loss": 0.7061, - "step": 8291 - }, - { - "epoch": 0.21, - "learning_rate": 1.991265759547832e-06, - "loss": 0.8926, - "step": 8292 - }, - { - "epoch": 0.21, - "learning_rate": 1.9912621100036235e-06, - "loss": 0.7725, - "step": 8293 - }, - { - "epoch": 0.21, - "learning_rate": 1.9912584597004514e-06, - "loss": 0.8662, - "step": 8294 - }, - { - "epoch": 0.21, - "learning_rate": 1.9912548086383184e-06, - "loss": 0.9402, - "step": 8295 - }, - { - "epoch": 0.21, - "learning_rate": 1.9912511568172273e-06, - "loss": 0.7788, - "step": 8296 - }, - { - "epoch": 0.21, - "learning_rate": 1.9912475042371807e-06, - "loss": 0.9844, - "step": 8297 - }, - { - "epoch": 0.21, - "learning_rate": 1.991243850898181e-06, - "loss": 0.6172, - "step": 8298 - }, - { - "epoch": 0.21, - "learning_rate": 1.991240196800232e-06, - "loss": 0.9609, - "step": 8299 - }, - { - "epoch": 0.21, - "learning_rate": 1.991236541943336e-06, - "loss": 0.8677, - "step": 8300 - }, - { - "epoch": 0.21, - "learning_rate": 1.9912328863274953e-06, - "loss": 0.9014, - "step": 8301 - }, - { - "epoch": 0.21, - "learning_rate": 1.9912292299527136e-06, - "loss": 0.7817, - "step": 8302 - }, - { - "epoch": 0.21, - "learning_rate": 1.991225572818993e-06, - "loss": 0.9121, - "step": 8303 - }, - { - "epoch": 0.21, - "learning_rate": 1.9912219149263366e-06, - "loss": 1.1172, - "step": 8304 - }, - { - "epoch": 0.21, - "learning_rate": 1.9912182562747472e-06, - "loss": 0.813, - "step": 8305 - }, - { - "epoch": 0.21, - "learning_rate": 1.9912145968642274e-06, - "loss": 1.0986, - "step": 8306 - }, - { - "epoch": 0.21, - "learning_rate": 1.9912109366947804e-06, - "loss": 0.6729, - "step": 8307 - }, - { - "epoch": 0.21, - "learning_rate": 1.991207275766409e-06, - "loss": 1.1035, - "step": 8308 - }, - { - "epoch": 0.21, - "learning_rate": 1.9912036140791153e-06, - "loss": 0.6245, - "step": 8309 - }, - { - "epoch": 0.21, - "learning_rate": 1.9911999516329026e-06, - "loss": 0.8379, - "step": 8310 - }, - { - "epoch": 0.21, - "learning_rate": 1.991196288427774e-06, - "loss": 0.8701, - "step": 8311 - }, - { - "epoch": 0.21, - "learning_rate": 1.9911926244637315e-06, - "loss": 1.1504, - "step": 8312 - }, - { - "epoch": 0.21, - "learning_rate": 1.9911889597407786e-06, - "loss": 1.0996, - "step": 8313 - }, - { - "epoch": 0.21, - "learning_rate": 1.991185294258918e-06, - "loss": 0.8223, - "step": 8314 - }, - { - "epoch": 0.21, - "learning_rate": 1.9911816280181523e-06, - "loss": 1.0195, - "step": 8315 - }, - { - "epoch": 0.21, - "learning_rate": 1.9911779610184845e-06, - "loss": 0.9121, - "step": 8316 - }, - { - "epoch": 0.21, - "learning_rate": 1.991174293259917e-06, - "loss": 0.9336, - "step": 8317 - }, - { - "epoch": 0.21, - "learning_rate": 1.9911706247424534e-06, - "loss": 0.96, - "step": 8318 - }, - { - "epoch": 0.21, - "learning_rate": 1.9911669554660957e-06, - "loss": 0.7017, - "step": 8319 - }, - { - "epoch": 0.21, - "learning_rate": 1.991163285430847e-06, - "loss": 0.915, - "step": 8320 - }, - { - "epoch": 0.21, - "learning_rate": 1.9911596146367104e-06, - "loss": 0.8701, - "step": 8321 - }, - { - "epoch": 0.21, - "learning_rate": 1.9911559430836886e-06, - "loss": 0.8809, - "step": 8322 - }, - { - "epoch": 0.21, - "learning_rate": 1.9911522707717838e-06, - "loss": 0.8496, - "step": 8323 - }, - { - "epoch": 0.21, - "learning_rate": 1.9911485977009993e-06, - "loss": 0.9121, - "step": 8324 - }, - { - "epoch": 0.21, - "learning_rate": 1.9911449238713384e-06, - "loss": 0.8135, - "step": 8325 - }, - { - "epoch": 0.21, - "learning_rate": 1.9911412492828026e-06, - "loss": 0.7778, - "step": 8326 - }, - { - "epoch": 0.21, - "learning_rate": 1.991137573935396e-06, - "loss": 0.9805, - "step": 8327 - }, - { - "epoch": 0.21, - "learning_rate": 1.991133897829121e-06, - "loss": 0.9189, - "step": 8328 - }, - { - "epoch": 0.21, - "learning_rate": 1.9911302209639805e-06, - "loss": 0.9473, - "step": 8329 - }, - { - "epoch": 0.21, - "learning_rate": 1.9911265433399767e-06, - "loss": 0.77, - "step": 8330 - }, - { - "epoch": 0.21, - "learning_rate": 1.991122864957113e-06, - "loss": 0.9883, - "step": 8331 - }, - { - "epoch": 0.21, - "learning_rate": 1.9911191858153928e-06, - "loss": 0.9756, - "step": 8332 - }, - { - "epoch": 0.21, - "learning_rate": 1.9911155059148173e-06, - "loss": 0.8428, - "step": 8333 - }, - { - "epoch": 0.21, - "learning_rate": 1.9911118252553905e-06, - "loss": 0.9375, - "step": 8334 - }, - { - "epoch": 0.21, - "learning_rate": 1.991108143837115e-06, - "loss": 0.8662, - "step": 8335 - }, - { - "epoch": 0.21, - "learning_rate": 1.9911044616599935e-06, - "loss": 0.7402, - "step": 8336 - }, - { - "epoch": 0.21, - "learning_rate": 1.991100778724029e-06, - "loss": 1.2109, - "step": 8337 - }, - { - "epoch": 0.21, - "learning_rate": 1.9910970950292244e-06, - "loss": 0.835, - "step": 8338 - }, - { - "epoch": 0.21, - "learning_rate": 1.991093410575582e-06, - "loss": 1.1143, - "step": 8339 - }, - { - "epoch": 0.21, - "learning_rate": 1.991089725363105e-06, - "loss": 0.9326, - "step": 8340 - }, - { - "epoch": 0.21, - "learning_rate": 1.991086039391796e-06, - "loss": 0.791, - "step": 8341 - }, - { - "epoch": 0.21, - "learning_rate": 1.9910823526616583e-06, - "loss": 0.7998, - "step": 8342 - }, - { - "epoch": 0.21, - "learning_rate": 1.9910786651726947e-06, - "loss": 0.9805, - "step": 8343 - }, - { - "epoch": 0.21, - "learning_rate": 1.9910749769249068e-06, - "loss": 0.8174, - "step": 8344 - }, - { - "epoch": 0.21, - "learning_rate": 1.9910712879182993e-06, - "loss": 0.8223, - "step": 8345 - }, - { - "epoch": 0.21, - "learning_rate": 1.9910675981528736e-06, - "loss": 0.9521, - "step": 8346 - }, - { - "epoch": 0.21, - "learning_rate": 1.991063907628633e-06, - "loss": 0.9023, - "step": 8347 - }, - { - "epoch": 0.21, - "learning_rate": 1.9910602163455805e-06, - "loss": 0.9766, - "step": 8348 - }, - { - "epoch": 0.21, - "learning_rate": 1.9910565243037186e-06, - "loss": 0.8867, - "step": 8349 - }, - { - "epoch": 0.21, - "learning_rate": 1.9910528315030503e-06, - "loss": 0.998, - "step": 8350 - }, - { - "epoch": 0.21, - "learning_rate": 1.9910491379435785e-06, - "loss": 0.9248, - "step": 8351 - }, - { - "epoch": 0.21, - "learning_rate": 1.991045443625306e-06, - "loss": 0.6685, - "step": 8352 - }, - { - "epoch": 0.21, - "learning_rate": 1.9910417485482356e-06, - "loss": 0.6826, - "step": 8353 - }, - { - "epoch": 0.21, - "learning_rate": 1.99103805271237e-06, - "loss": 1.1162, - "step": 8354 - }, - { - "epoch": 0.21, - "learning_rate": 1.991034356117712e-06, - "loss": 0.874, - "step": 8355 - }, - { - "epoch": 0.21, - "learning_rate": 1.991030658764265e-06, - "loss": 0.8721, - "step": 8356 - }, - { - "epoch": 0.21, - "learning_rate": 1.9910269606520308e-06, - "loss": 0.8506, - "step": 8357 - }, - { - "epoch": 0.21, - "learning_rate": 1.9910232617810136e-06, - "loss": 1.1592, - "step": 8358 - }, - { - "epoch": 0.21, - "learning_rate": 1.9910195621512145e-06, - "loss": 0.811, - "step": 8359 - }, - { - "epoch": 0.21, - "learning_rate": 1.991015861762638e-06, - "loss": 0.9463, - "step": 8360 - }, - { - "epoch": 0.21, - "learning_rate": 1.9910121606152857e-06, - "loss": 1.0596, - "step": 8361 - }, - { - "epoch": 0.21, - "learning_rate": 1.9910084587091615e-06, - "loss": 0.915, - "step": 8362 - }, - { - "epoch": 0.21, - "learning_rate": 1.9910047560442676e-06, - "loss": 0.8501, - "step": 8363 - }, - { - "epoch": 0.21, - "learning_rate": 1.9910010526206067e-06, - "loss": 1.0576, - "step": 8364 - }, - { - "epoch": 0.21, - "learning_rate": 1.9909973484381818e-06, - "loss": 1.0166, - "step": 8365 - }, - { - "epoch": 0.21, - "learning_rate": 1.990993643496996e-06, - "loss": 0.9458, - "step": 8366 - }, - { - "epoch": 0.21, - "learning_rate": 1.990989937797052e-06, - "loss": 0.8438, - "step": 8367 - }, - { - "epoch": 0.21, - "learning_rate": 1.990986231338352e-06, - "loss": 0.8047, - "step": 8368 - }, - { - "epoch": 0.21, - "learning_rate": 1.9909825241209e-06, - "loss": 0.9365, - "step": 8369 - }, - { - "epoch": 0.21, - "learning_rate": 1.9909788161446985e-06, - "loss": 1.0107, - "step": 8370 - }, - { - "epoch": 0.21, - "learning_rate": 1.9909751074097497e-06, - "loss": 1.1514, - "step": 8371 - }, - { - "epoch": 0.21, - "learning_rate": 1.990971397916057e-06, - "loss": 0.915, - "step": 8372 - }, - { - "epoch": 0.21, - "learning_rate": 1.9909676876636226e-06, - "loss": 0.7808, - "step": 8373 - }, - { - "epoch": 0.21, - "learning_rate": 1.9909639766524503e-06, - "loss": 1.0, - "step": 8374 - }, - { - "epoch": 0.21, - "learning_rate": 1.9909602648825418e-06, - "loss": 0.9209, - "step": 8375 - }, - { - "epoch": 0.21, - "learning_rate": 1.9909565523539014e-06, - "loss": 0.8564, - "step": 8376 - }, - { - "epoch": 0.21, - "learning_rate": 1.9909528390665304e-06, - "loss": 1.0977, - "step": 8377 - }, - { - "epoch": 0.21, - "learning_rate": 1.990949125020433e-06, - "loss": 0.998, - "step": 8378 - }, - { - "epoch": 0.21, - "learning_rate": 1.990945410215611e-06, - "loss": 0.7964, - "step": 8379 - }, - { - "epoch": 0.21, - "learning_rate": 1.990941694652068e-06, - "loss": 0.9058, - "step": 8380 - }, - { - "epoch": 0.21, - "learning_rate": 1.990937978329806e-06, - "loss": 0.7168, - "step": 8381 - }, - { - "epoch": 0.21, - "learning_rate": 1.990934261248829e-06, - "loss": 1.0156, - "step": 8382 - }, - { - "epoch": 0.21, - "learning_rate": 1.9909305434091387e-06, - "loss": 1.1191, - "step": 8383 - }, - { - "epoch": 0.21, - "learning_rate": 1.9909268248107386e-06, - "loss": 0.8091, - "step": 8384 - }, - { - "epoch": 0.21, - "learning_rate": 1.9909231054536316e-06, - "loss": 0.6785, - "step": 8385 - }, - { - "epoch": 0.21, - "learning_rate": 1.9909193853378202e-06, - "loss": 0.7217, - "step": 8386 - }, - { - "epoch": 0.21, - "learning_rate": 1.9909156644633075e-06, - "loss": 0.8594, - "step": 8387 - }, - { - "epoch": 0.21, - "learning_rate": 1.990911942830096e-06, - "loss": 1.0547, - "step": 8388 - }, - { - "epoch": 0.22, - "learning_rate": 1.990908220438189e-06, - "loss": 0.9326, - "step": 8389 - }, - { - "epoch": 0.22, - "learning_rate": 1.990904497287589e-06, - "loss": 0.8887, - "step": 8390 - }, - { - "epoch": 0.22, - "learning_rate": 1.990900773378299e-06, - "loss": 0.8438, - "step": 8391 - }, - { - "epoch": 0.22, - "learning_rate": 1.990897048710322e-06, - "loss": 0.9238, - "step": 8392 - }, - { - "epoch": 0.22, - "learning_rate": 1.9908933232836606e-06, - "loss": 0.8594, - "step": 8393 - }, - { - "epoch": 0.22, - "learning_rate": 1.9908895970983174e-06, - "loss": 0.8213, - "step": 8394 - }, - { - "epoch": 0.22, - "learning_rate": 1.990885870154296e-06, - "loss": 0.9873, - "step": 8395 - }, - { - "epoch": 0.22, - "learning_rate": 1.9908821424515987e-06, - "loss": 0.9688, - "step": 8396 - }, - { - "epoch": 0.22, - "learning_rate": 1.9908784139902287e-06, - "loss": 0.8169, - "step": 8397 - }, - { - "epoch": 0.22, - "learning_rate": 1.9908746847701884e-06, - "loss": 0.6599, - "step": 8398 - }, - { - "epoch": 0.22, - "learning_rate": 1.990870954791481e-06, - "loss": 0.9023, - "step": 8399 - }, - { - "epoch": 0.22, - "learning_rate": 1.9908672240541093e-06, - "loss": 1.1543, - "step": 8400 - }, - { - "epoch": 0.22, - "learning_rate": 1.990863492558076e-06, - "loss": 0.7109, - "step": 8401 - }, - { - "epoch": 0.22, - "learning_rate": 1.990859760303384e-06, - "loss": 0.8467, - "step": 8402 - }, - { - "epoch": 0.22, - "learning_rate": 1.990856027290037e-06, - "loss": 0.8965, - "step": 8403 - }, - { - "epoch": 0.22, - "learning_rate": 1.9908522935180364e-06, - "loss": 0.8926, - "step": 8404 - }, - { - "epoch": 0.22, - "learning_rate": 1.9908485589873857e-06, - "loss": 0.6917, - "step": 8405 - }, - { - "epoch": 0.22, - "learning_rate": 1.990844823698088e-06, - "loss": 0.9473, - "step": 8406 - }, - { - "epoch": 0.22, - "learning_rate": 1.990841087650146e-06, - "loss": 1.0254, - "step": 8407 - }, - { - "epoch": 0.22, - "learning_rate": 1.9908373508435625e-06, - "loss": 0.9873, - "step": 8408 - }, - { - "epoch": 0.22, - "learning_rate": 1.990833613278341e-06, - "loss": 0.9238, - "step": 8409 - }, - { - "epoch": 0.22, - "learning_rate": 1.9908298749544827e-06, - "loss": 0.9014, - "step": 8410 - }, - { - "epoch": 0.22, - "learning_rate": 1.990826135871992e-06, - "loss": 1.0947, - "step": 8411 - }, - { - "epoch": 0.22, - "learning_rate": 1.9908223960308714e-06, - "loss": 1.1416, - "step": 8412 - }, - { - "epoch": 0.22, - "learning_rate": 1.9908186554311233e-06, - "loss": 0.7837, - "step": 8413 - }, - { - "epoch": 0.22, - "learning_rate": 1.9908149140727514e-06, - "loss": 0.9492, - "step": 8414 - }, - { - "epoch": 0.22, - "learning_rate": 1.9908111719557577e-06, - "loss": 0.8496, - "step": 8415 - }, - { - "epoch": 0.22, - "learning_rate": 1.9908074290801456e-06, - "loss": 0.9541, - "step": 8416 - }, - { - "epoch": 0.22, - "learning_rate": 1.990803685445918e-06, - "loss": 0.9141, - "step": 8417 - }, - { - "epoch": 0.22, - "learning_rate": 1.9907999410530774e-06, - "loss": 0.9648, - "step": 8418 - }, - { - "epoch": 0.22, - "learning_rate": 1.9907961959016267e-06, - "loss": 0.7979, - "step": 8419 - }, - { - "epoch": 0.22, - "learning_rate": 1.9907924499915695e-06, - "loss": 1.0195, - "step": 8420 - }, - { - "epoch": 0.22, - "learning_rate": 1.9907887033229074e-06, - "loss": 0.8604, - "step": 8421 - }, - { - "epoch": 0.22, - "learning_rate": 1.9907849558956444e-06, - "loss": 0.8301, - "step": 8422 - }, - { - "epoch": 0.22, - "learning_rate": 1.9907812077097825e-06, - "loss": 0.9092, - "step": 8423 - }, - { - "epoch": 0.22, - "learning_rate": 1.990777458765325e-06, - "loss": 0.7646, - "step": 8424 - }, - { - "epoch": 0.22, - "learning_rate": 1.990773709062275e-06, - "loss": 1.043, - "step": 8425 - }, - { - "epoch": 0.22, - "learning_rate": 1.9907699586006354e-06, - "loss": 0.8135, - "step": 8426 - }, - { - "epoch": 0.22, - "learning_rate": 1.990766207380408e-06, - "loss": 0.9941, - "step": 8427 - }, - { - "epoch": 0.22, - "learning_rate": 1.9907624554015973e-06, - "loss": 0.9189, - "step": 8428 - }, - { - "epoch": 0.22, - "learning_rate": 1.990758702664205e-06, - "loss": 1.0596, - "step": 8429 - }, - { - "epoch": 0.22, - "learning_rate": 1.990754949168234e-06, - "loss": 0.9355, - "step": 8430 - }, - { - "epoch": 0.22, - "learning_rate": 1.9907511949136884e-06, - "loss": 0.8062, - "step": 8431 - }, - { - "epoch": 0.22, - "learning_rate": 1.990747439900569e-06, - "loss": 1.0557, - "step": 8432 - }, - { - "epoch": 0.22, - "learning_rate": 1.9907436841288806e-06, - "loss": 1.0801, - "step": 8433 - }, - { - "epoch": 0.22, - "learning_rate": 1.990739927598625e-06, - "loss": 1.1729, - "step": 8434 - }, - { - "epoch": 0.22, - "learning_rate": 1.9907361703098057e-06, - "loss": 0.8057, - "step": 8435 - }, - { - "epoch": 0.22, - "learning_rate": 1.990732412262425e-06, - "loss": 0.8633, - "step": 8436 - }, - { - "epoch": 0.22, - "learning_rate": 1.990728653456486e-06, - "loss": 0.7568, - "step": 8437 - }, - { - "epoch": 0.22, - "learning_rate": 1.990724893891992e-06, - "loss": 0.8564, - "step": 8438 - }, - { - "epoch": 0.22, - "learning_rate": 1.990721133568945e-06, - "loss": 1.0234, - "step": 8439 - }, - { - "epoch": 0.22, - "learning_rate": 1.9907173724873486e-06, - "loss": 0.8613, - "step": 8440 - }, - { - "epoch": 0.22, - "learning_rate": 1.9907136106472055e-06, - "loss": 0.9209, - "step": 8441 - }, - { - "epoch": 0.22, - "learning_rate": 1.990709848048519e-06, - "loss": 0.8242, - "step": 8442 - }, - { - "epoch": 0.22, - "learning_rate": 1.9907060846912906e-06, - "loss": 1.0371, - "step": 8443 - }, - { - "epoch": 0.22, - "learning_rate": 1.990702320575525e-06, - "loss": 0.917, - "step": 8444 - }, - { - "epoch": 0.22, - "learning_rate": 1.9906985557012236e-06, - "loss": 0.8525, - "step": 8445 - }, - { - "epoch": 0.22, - "learning_rate": 1.99069479006839e-06, - "loss": 0.9746, - "step": 8446 - }, - { - "epoch": 0.22, - "learning_rate": 1.990691023677027e-06, - "loss": 1.0508, - "step": 8447 - }, - { - "epoch": 0.22, - "learning_rate": 1.990687256527137e-06, - "loss": 0.8477, - "step": 8448 - }, - { - "epoch": 0.22, - "learning_rate": 1.990683488618724e-06, - "loss": 0.8115, - "step": 8449 - }, - { - "epoch": 0.22, - "learning_rate": 1.99067971995179e-06, - "loss": 0.7705, - "step": 8450 - }, - { - "epoch": 0.22, - "learning_rate": 1.990675950526338e-06, - "loss": 0.8799, - "step": 8451 - }, - { - "epoch": 0.22, - "learning_rate": 1.990672180342371e-06, - "loss": 0.9922, - "step": 8452 - }, - { - "epoch": 0.22, - "learning_rate": 1.990668409399892e-06, - "loss": 0.918, - "step": 8453 - }, - { - "epoch": 0.22, - "learning_rate": 1.9906646376989036e-06, - "loss": 0.8252, - "step": 8454 - }, - { - "epoch": 0.22, - "learning_rate": 1.990660865239409e-06, - "loss": 0.9541, - "step": 8455 - }, - { - "epoch": 0.22, - "learning_rate": 1.9906570920214105e-06, - "loss": 0.8564, - "step": 8456 - }, - { - "epoch": 0.22, - "learning_rate": 1.9906533180449115e-06, - "loss": 0.7817, - "step": 8457 - }, - { - "epoch": 0.22, - "learning_rate": 1.9906495433099153e-06, - "loss": 0.9453, - "step": 8458 - }, - { - "epoch": 0.22, - "learning_rate": 1.990645767816424e-06, - "loss": 1.0771, - "step": 8459 - }, - { - "epoch": 0.22, - "learning_rate": 1.9906419915644407e-06, - "loss": 0.8174, - "step": 8460 - }, - { - "epoch": 0.22, - "learning_rate": 1.9906382145539684e-06, - "loss": 0.9561, - "step": 8461 - }, - { - "epoch": 0.22, - "learning_rate": 1.9906344367850103e-06, - "loss": 0.8369, - "step": 8462 - }, - { - "epoch": 0.22, - "learning_rate": 1.990630658257569e-06, - "loss": 0.6333, - "step": 8463 - }, - { - "epoch": 0.22, - "learning_rate": 1.9906268789716467e-06, - "loss": 1.0645, - "step": 8464 - }, - { - "epoch": 0.22, - "learning_rate": 1.990623098927247e-06, - "loss": 0.8867, - "step": 8465 - }, - { - "epoch": 0.22, - "learning_rate": 1.9906193181243733e-06, - "loss": 0.8779, - "step": 8466 - }, - { - "epoch": 0.22, - "learning_rate": 1.9906155365630275e-06, - "loss": 1.0195, - "step": 8467 - }, - { - "epoch": 0.22, - "learning_rate": 1.9906117542432134e-06, - "loss": 0.7412, - "step": 8468 - }, - { - "epoch": 0.22, - "learning_rate": 1.9906079711649333e-06, - "loss": 0.9463, - "step": 8469 - }, - { - "epoch": 0.22, - "learning_rate": 1.99060418732819e-06, - "loss": 0.9932, - "step": 8470 - }, - { - "epoch": 0.22, - "learning_rate": 1.9906004027329868e-06, - "loss": 0.9189, - "step": 8471 - }, - { - "epoch": 0.22, - "learning_rate": 1.990596617379326e-06, - "loss": 0.9375, - "step": 8472 - }, - { - "epoch": 0.22, - "learning_rate": 1.9905928312672114e-06, - "loss": 1.0, - "step": 8473 - }, - { - "epoch": 0.22, - "learning_rate": 1.9905890443966453e-06, - "loss": 1.0791, - "step": 8474 - }, - { - "epoch": 0.22, - "learning_rate": 1.9905852567676303e-06, - "loss": 0.7695, - "step": 8475 - }, - { - "epoch": 0.22, - "learning_rate": 1.99058146838017e-06, - "loss": 0.9658, - "step": 8476 - }, - { - "epoch": 0.22, - "learning_rate": 1.9905776792342674e-06, - "loss": 1.0771, - "step": 8477 - }, - { - "epoch": 0.22, - "learning_rate": 1.9905738893299245e-06, - "loss": 0.999, - "step": 8478 - }, - { - "epoch": 0.22, - "learning_rate": 1.9905700986671454e-06, - "loss": 0.8887, - "step": 8479 - }, - { - "epoch": 0.22, - "learning_rate": 1.9905663072459317e-06, - "loss": 0.9668, - "step": 8480 - }, - { - "epoch": 0.22, - "learning_rate": 1.9905625150662872e-06, - "loss": 1.1006, - "step": 8481 - }, - { - "epoch": 0.22, - "learning_rate": 1.990558722128214e-06, - "loss": 0.9697, - "step": 8482 - }, - { - "epoch": 0.22, - "learning_rate": 1.990554928431716e-06, - "loss": 1.1328, - "step": 8483 - }, - { - "epoch": 0.22, - "learning_rate": 1.9905511339767956e-06, - "loss": 0.6729, - "step": 8484 - }, - { - "epoch": 0.22, - "learning_rate": 1.990547338763456e-06, - "loss": 0.9736, - "step": 8485 - }, - { - "epoch": 0.22, - "learning_rate": 1.9905435427916997e-06, - "loss": 0.7842, - "step": 8486 - }, - { - "epoch": 0.22, - "learning_rate": 1.9905397460615295e-06, - "loss": 0.8926, - "step": 8487 - }, - { - "epoch": 0.22, - "learning_rate": 1.990535948572949e-06, - "loss": 1.0967, - "step": 8488 - }, - { - "epoch": 0.22, - "learning_rate": 1.99053215032596e-06, - "loss": 1.0029, - "step": 8489 - }, - { - "epoch": 0.22, - "learning_rate": 1.9905283513205667e-06, - "loss": 1.0098, - "step": 8490 - }, - { - "epoch": 0.22, - "learning_rate": 1.990524551556771e-06, - "loss": 1.1494, - "step": 8491 - }, - { - "epoch": 0.22, - "learning_rate": 1.990520751034576e-06, - "loss": 1.0664, - "step": 8492 - }, - { - "epoch": 0.22, - "learning_rate": 1.9905169497539858e-06, - "loss": 0.8096, - "step": 8493 - }, - { - "epoch": 0.22, - "learning_rate": 1.9905131477150015e-06, - "loss": 0.8945, - "step": 8494 - }, - { - "epoch": 0.22, - "learning_rate": 1.990509344917627e-06, - "loss": 0.9004, - "step": 8495 - }, - { - "epoch": 0.22, - "learning_rate": 1.990505541361865e-06, - "loss": 1.0576, - "step": 8496 - }, - { - "epoch": 0.22, - "learning_rate": 1.9905017370477185e-06, - "loss": 1.1602, - "step": 8497 - }, - { - "epoch": 0.22, - "learning_rate": 1.9904979319751904e-06, - "loss": 0.8447, - "step": 8498 - }, - { - "epoch": 0.22, - "learning_rate": 1.9904941261442835e-06, - "loss": 0.9028, - "step": 8499 - }, - { - "epoch": 0.22, - "learning_rate": 1.990490319555001e-06, - "loss": 1.2139, - "step": 8500 - }, - { - "epoch": 0.22, - "learning_rate": 1.9904865122073452e-06, - "loss": 0.7651, - "step": 8501 - }, - { - "epoch": 0.22, - "learning_rate": 1.9904827041013197e-06, - "loss": 0.8555, - "step": 8502 - }, - { - "epoch": 0.22, - "learning_rate": 1.990478895236927e-06, - "loss": 0.9424, - "step": 8503 - }, - { - "epoch": 0.22, - "learning_rate": 1.9904750856141704e-06, - "loss": 0.958, - "step": 8504 - }, - { - "epoch": 0.22, - "learning_rate": 1.990471275233052e-06, - "loss": 0.9785, - "step": 8505 - }, - { - "epoch": 0.22, - "learning_rate": 1.990467464093576e-06, - "loss": 1.0566, - "step": 8506 - }, - { - "epoch": 0.22, - "learning_rate": 1.9904636521957443e-06, - "loss": 0.9102, - "step": 8507 - }, - { - "epoch": 0.22, - "learning_rate": 1.99045983953956e-06, - "loss": 1.0137, - "step": 8508 - }, - { - "epoch": 0.22, - "learning_rate": 1.9904560261250265e-06, - "loss": 0.8071, - "step": 8509 - }, - { - "epoch": 0.22, - "learning_rate": 1.9904522119521457e-06, - "loss": 0.6309, - "step": 8510 - }, - { - "epoch": 0.22, - "learning_rate": 1.990448397020922e-06, - "loss": 0.8379, - "step": 8511 - }, - { - "epoch": 0.22, - "learning_rate": 1.990444581331357e-06, - "loss": 0.748, - "step": 8512 - }, - { - "epoch": 0.22, - "learning_rate": 1.990440764883454e-06, - "loss": 0.957, - "step": 8513 - }, - { - "epoch": 0.22, - "learning_rate": 1.9904369476772163e-06, - "loss": 0.9629, - "step": 8514 - }, - { - "epoch": 0.22, - "learning_rate": 1.9904331297126468e-06, - "loss": 0.9766, - "step": 8515 - }, - { - "epoch": 0.22, - "learning_rate": 1.9904293109897477e-06, - "loss": 1.1738, - "step": 8516 - }, - { - "epoch": 0.22, - "learning_rate": 1.990425491508523e-06, - "loss": 0.8662, - "step": 8517 - }, - { - "epoch": 0.22, - "learning_rate": 1.990421671268975e-06, - "loss": 0.7451, - "step": 8518 - }, - { - "epoch": 0.22, - "learning_rate": 1.9904178502711062e-06, - "loss": 0.9111, - "step": 8519 - }, - { - "epoch": 0.22, - "learning_rate": 1.99041402851492e-06, - "loss": 0.9053, - "step": 8520 - }, - { - "epoch": 0.22, - "learning_rate": 1.9904102060004197e-06, - "loss": 0.6328, - "step": 8521 - }, - { - "epoch": 0.22, - "learning_rate": 1.9904063827276073e-06, - "loss": 1.0049, - "step": 8522 - }, - { - "epoch": 0.22, - "learning_rate": 1.9904025586964866e-06, - "loss": 0.9785, - "step": 8523 - }, - { - "epoch": 0.22, - "learning_rate": 1.9903987339070605e-06, - "loss": 1.0508, - "step": 8524 - }, - { - "epoch": 0.22, - "learning_rate": 1.9903949083593315e-06, - "loss": 0.9033, - "step": 8525 - }, - { - "epoch": 0.22, - "learning_rate": 1.990391082053302e-06, - "loss": 0.7344, - "step": 8526 - }, - { - "epoch": 0.22, - "learning_rate": 1.9903872549889764e-06, - "loss": 0.6831, - "step": 8527 - }, - { - "epoch": 0.22, - "learning_rate": 1.9903834271663566e-06, - "loss": 0.8682, - "step": 8528 - }, - { - "epoch": 0.22, - "learning_rate": 1.9903795985854454e-06, - "loss": 0.8418, - "step": 8529 - }, - { - "epoch": 0.22, - "learning_rate": 1.9903757692462466e-06, - "loss": 0.7979, - "step": 8530 - }, - { - "epoch": 0.22, - "learning_rate": 1.9903719391487623e-06, - "loss": 0.9199, - "step": 8531 - }, - { - "epoch": 0.22, - "learning_rate": 1.990368108292996e-06, - "loss": 1.0547, - "step": 8532 - }, - { - "epoch": 0.22, - "learning_rate": 1.99036427667895e-06, - "loss": 1.1504, - "step": 8533 - }, - { - "epoch": 0.22, - "learning_rate": 1.9903604443066277e-06, - "loss": 1.0322, - "step": 8534 - }, - { - "epoch": 0.22, - "learning_rate": 1.990356611176032e-06, - "loss": 0.8232, - "step": 8535 - }, - { - "epoch": 0.22, - "learning_rate": 1.990352777287166e-06, - "loss": 0.9795, - "step": 8536 - }, - { - "epoch": 0.22, - "learning_rate": 1.990348942640032e-06, - "loss": 1.0283, - "step": 8537 - }, - { - "epoch": 0.22, - "learning_rate": 1.9903451072346337e-06, - "loss": 0.7808, - "step": 8538 - }, - { - "epoch": 0.22, - "learning_rate": 1.9903412710709734e-06, - "loss": 1.0195, - "step": 8539 - }, - { - "epoch": 0.22, - "learning_rate": 1.990337434149055e-06, - "loss": 0.9321, - "step": 8540 - }, - { - "epoch": 0.22, - "learning_rate": 1.99033359646888e-06, - "loss": 0.9629, - "step": 8541 - }, - { - "epoch": 0.22, - "learning_rate": 1.990329758030452e-06, - "loss": 0.8203, - "step": 8542 - }, - { - "epoch": 0.22, - "learning_rate": 1.990325918833775e-06, - "loss": 0.999, - "step": 8543 - }, - { - "epoch": 0.22, - "learning_rate": 1.99032207887885e-06, - "loss": 0.9727, - "step": 8544 - }, - { - "epoch": 0.22, - "learning_rate": 1.9903182381656815e-06, - "loss": 0.8066, - "step": 8545 - }, - { - "epoch": 0.22, - "learning_rate": 1.9903143966942713e-06, - "loss": 0.7305, - "step": 8546 - }, - { - "epoch": 0.22, - "learning_rate": 1.9903105544646236e-06, - "loss": 0.8906, - "step": 8547 - }, - { - "epoch": 0.22, - "learning_rate": 1.99030671147674e-06, - "loss": 0.7673, - "step": 8548 - }, - { - "epoch": 0.22, - "learning_rate": 1.9903028677306245e-06, - "loss": 0.7578, - "step": 8549 - }, - { - "epoch": 0.22, - "learning_rate": 1.9902990232262795e-06, - "loss": 0.7344, - "step": 8550 - }, - { - "epoch": 0.22, - "learning_rate": 1.9902951779637084e-06, - "loss": 0.6953, - "step": 8551 - }, - { - "epoch": 0.22, - "learning_rate": 1.9902913319429135e-06, - "loss": 0.8994, - "step": 8552 - }, - { - "epoch": 0.22, - "learning_rate": 1.990287485163898e-06, - "loss": 1.042, - "step": 8553 - }, - { - "epoch": 0.22, - "learning_rate": 1.990283637626665e-06, - "loss": 0.8516, - "step": 8554 - }, - { - "epoch": 0.22, - "learning_rate": 1.9902797893312175e-06, - "loss": 0.8154, - "step": 8555 - }, - { - "epoch": 0.22, - "learning_rate": 1.990275940277558e-06, - "loss": 0.9492, - "step": 8556 - }, - { - "epoch": 0.22, - "learning_rate": 1.9902720904656894e-06, - "loss": 0.8186, - "step": 8557 - }, - { - "epoch": 0.22, - "learning_rate": 1.9902682398956157e-06, - "loss": 0.9404, - "step": 8558 - }, - { - "epoch": 0.22, - "learning_rate": 1.990264388567339e-06, - "loss": 0.9751, - "step": 8559 - }, - { - "epoch": 0.22, - "learning_rate": 1.9902605364808625e-06, - "loss": 0.811, - "step": 8560 - }, - { - "epoch": 0.22, - "learning_rate": 1.9902566836361886e-06, - "loss": 0.8877, - "step": 8561 - }, - { - "epoch": 0.22, - "learning_rate": 1.990252830033321e-06, - "loss": 0.8721, - "step": 8562 - }, - { - "epoch": 0.22, - "learning_rate": 1.9902489756722624e-06, - "loss": 1.0312, - "step": 8563 - }, - { - "epoch": 0.22, - "learning_rate": 1.9902451205530153e-06, - "loss": 1.1191, - "step": 8564 - }, - { - "epoch": 0.22, - "learning_rate": 1.9902412646755835e-06, - "loss": 0.9717, - "step": 8565 - }, - { - "epoch": 0.22, - "learning_rate": 1.990237408039969e-06, - "loss": 1.0127, - "step": 8566 - }, - { - "epoch": 0.22, - "learning_rate": 1.990233550646176e-06, - "loss": 1.2324, - "step": 8567 - }, - { - "epoch": 0.22, - "learning_rate": 1.990229692494206e-06, - "loss": 0.8369, - "step": 8568 - }, - { - "epoch": 0.22, - "learning_rate": 1.990225833584063e-06, - "loss": 0.8506, - "step": 8569 - }, - { - "epoch": 0.22, - "learning_rate": 1.9902219739157493e-06, - "loss": 0.9746, - "step": 8570 - }, - { - "epoch": 0.22, - "learning_rate": 1.9902181134892687e-06, - "loss": 1.1689, - "step": 8571 - }, - { - "epoch": 0.22, - "learning_rate": 1.990214252304623e-06, - "loss": 0.8501, - "step": 8572 - }, - { - "epoch": 0.22, - "learning_rate": 1.9902103903618163e-06, - "loss": 0.7725, - "step": 8573 - }, - { - "epoch": 0.22, - "learning_rate": 1.990206527660851e-06, - "loss": 1.0879, - "step": 8574 - }, - { - "epoch": 0.22, - "learning_rate": 1.99020266420173e-06, - "loss": 1.0547, - "step": 8575 - }, - { - "epoch": 0.22, - "learning_rate": 1.9901987999844564e-06, - "loss": 0.8535, - "step": 8576 - }, - { - "epoch": 0.22, - "learning_rate": 1.9901949350090327e-06, - "loss": 1.0713, - "step": 8577 - }, - { - "epoch": 0.22, - "learning_rate": 1.9901910692754624e-06, - "loss": 0.9062, - "step": 8578 - }, - { - "epoch": 0.22, - "learning_rate": 1.9901872027837485e-06, - "loss": 0.7256, - "step": 8579 - }, - { - "epoch": 0.22, - "learning_rate": 1.990183335533894e-06, - "loss": 0.9678, - "step": 8580 - }, - { - "epoch": 0.22, - "learning_rate": 1.9901794675259013e-06, - "loss": 0.8672, - "step": 8581 - }, - { - "epoch": 0.22, - "learning_rate": 1.990175598759774e-06, - "loss": 0.9526, - "step": 8582 - }, - { - "epoch": 0.22, - "learning_rate": 1.990171729235515e-06, - "loss": 0.9189, - "step": 8583 - }, - { - "epoch": 0.22, - "learning_rate": 1.9901678589531265e-06, - "loss": 0.9722, - "step": 8584 - }, - { - "epoch": 0.22, - "learning_rate": 1.990163987912612e-06, - "loss": 1.1699, - "step": 8585 - }, - { - "epoch": 0.22, - "learning_rate": 1.9901601161139744e-06, - "loss": 0.8311, - "step": 8586 - }, - { - "epoch": 0.22, - "learning_rate": 1.990156243557217e-06, - "loss": 0.9736, - "step": 8587 - }, - { - "epoch": 0.22, - "learning_rate": 1.9901523702423423e-06, - "loss": 1.0195, - "step": 8588 - }, - { - "epoch": 0.22, - "learning_rate": 1.9901484961693536e-06, - "loss": 0.7905, - "step": 8589 - }, - { - "epoch": 0.22, - "learning_rate": 1.990144621338254e-06, - "loss": 0.9961, - "step": 8590 - }, - { - "epoch": 0.22, - "learning_rate": 1.9901407457490457e-06, - "loss": 0.999, - "step": 8591 - }, - { - "epoch": 0.22, - "learning_rate": 1.9901368694017325e-06, - "loss": 0.8535, - "step": 8592 - }, - { - "epoch": 0.22, - "learning_rate": 1.9901329922963167e-06, - "loss": 0.7939, - "step": 8593 - }, - { - "epoch": 0.22, - "learning_rate": 1.990129114432802e-06, - "loss": 0.8701, - "step": 8594 - }, - { - "epoch": 0.22, - "learning_rate": 1.9901252358111907e-06, - "loss": 0.9639, - "step": 8595 - }, - { - "epoch": 0.22, - "learning_rate": 1.990121356431486e-06, - "loss": 0.9404, - "step": 8596 - }, - { - "epoch": 0.22, - "learning_rate": 1.990117476293691e-06, - "loss": 0.9062, - "step": 8597 - }, - { - "epoch": 0.22, - "learning_rate": 1.9901135953978087e-06, - "loss": 0.8711, - "step": 8598 - }, - { - "epoch": 0.22, - "learning_rate": 1.9901097137438417e-06, - "loss": 0.9697, - "step": 8599 - }, - { - "epoch": 0.22, - "learning_rate": 1.9901058313317933e-06, - "loss": 0.8042, - "step": 8600 - }, - { - "epoch": 0.22, - "learning_rate": 1.9901019481616665e-06, - "loss": 0.9404, - "step": 8601 - }, - { - "epoch": 0.22, - "learning_rate": 1.990098064233464e-06, - "loss": 0.9795, - "step": 8602 - }, - { - "epoch": 0.22, - "learning_rate": 1.990094179547189e-06, - "loss": 0.9785, - "step": 8603 - }, - { - "epoch": 0.22, - "learning_rate": 1.9900902941028446e-06, - "loss": 0.8984, - "step": 8604 - }, - { - "epoch": 0.22, - "learning_rate": 1.990086407900433e-06, - "loss": 0.6182, - "step": 8605 - }, - { - "epoch": 0.22, - "learning_rate": 1.9900825209399583e-06, - "loss": 0.8569, - "step": 8606 - }, - { - "epoch": 0.22, - "learning_rate": 1.990078633221423e-06, - "loss": 0.8691, - "step": 8607 - }, - { - "epoch": 0.22, - "learning_rate": 1.99007474474483e-06, - "loss": 0.6846, - "step": 8608 - }, - { - "epoch": 0.22, - "learning_rate": 1.990070855510182e-06, - "loss": 0.9023, - "step": 8609 - }, - { - "epoch": 0.22, - "learning_rate": 1.9900669655174826e-06, - "loss": 0.9922, - "step": 8610 - }, - { - "epoch": 0.22, - "learning_rate": 1.990063074766734e-06, - "loss": 0.957, - "step": 8611 - }, - { - "epoch": 0.22, - "learning_rate": 1.99005918325794e-06, - "loss": 0.9873, - "step": 8612 - }, - { - "epoch": 0.22, - "learning_rate": 1.990055290991103e-06, - "loss": 0.9072, - "step": 8613 - }, - { - "epoch": 0.22, - "learning_rate": 1.990051397966226e-06, - "loss": 1.0156, - "step": 8614 - }, - { - "epoch": 0.22, - "learning_rate": 1.9900475041833127e-06, - "loss": 0.9541, - "step": 8615 - }, - { - "epoch": 0.22, - "learning_rate": 1.9900436096423653e-06, - "loss": 0.9473, - "step": 8616 - }, - { - "epoch": 0.22, - "learning_rate": 1.990039714343387e-06, - "loss": 0.9292, - "step": 8617 - }, - { - "epoch": 0.22, - "learning_rate": 1.9900358182863807e-06, - "loss": 1.1035, - "step": 8618 - }, - { - "epoch": 0.22, - "learning_rate": 1.9900319214713498e-06, - "loss": 0.635, - "step": 8619 - }, - { - "epoch": 0.22, - "learning_rate": 1.9900280238982968e-06, - "loss": 0.9297, - "step": 8620 - }, - { - "epoch": 0.22, - "learning_rate": 1.990024125567225e-06, - "loss": 0.8818, - "step": 8621 - }, - { - "epoch": 0.22, - "learning_rate": 1.990020226478137e-06, - "loss": 0.9629, - "step": 8622 - }, - { - "epoch": 0.22, - "learning_rate": 1.9900163266310363e-06, - "loss": 1.0098, - "step": 8623 - }, - { - "epoch": 0.22, - "learning_rate": 1.990012426025925e-06, - "loss": 0.7712, - "step": 8624 - }, - { - "epoch": 0.22, - "learning_rate": 1.9900085246628075e-06, - "loss": 0.8457, - "step": 8625 - }, - { - "epoch": 0.22, - "learning_rate": 1.9900046225416857e-06, - "loss": 0.9316, - "step": 8626 - }, - { - "epoch": 0.22, - "learning_rate": 1.990000719662563e-06, - "loss": 0.9883, - "step": 8627 - }, - { - "epoch": 0.22, - "learning_rate": 1.989996816025442e-06, - "loss": 0.833, - "step": 8628 - }, - { - "epoch": 0.22, - "learning_rate": 1.989992911630326e-06, - "loss": 0.9023, - "step": 8629 - }, - { - "epoch": 0.22, - "learning_rate": 1.989989006477218e-06, - "loss": 0.5591, - "step": 8630 - }, - { - "epoch": 0.22, - "learning_rate": 1.989985100566121e-06, - "loss": 0.9146, - "step": 8631 - }, - { - "epoch": 0.22, - "learning_rate": 1.9899811938970382e-06, - "loss": 0.9463, - "step": 8632 - }, - { - "epoch": 0.22, - "learning_rate": 1.9899772864699716e-06, - "loss": 0.9062, - "step": 8633 - }, - { - "epoch": 0.22, - "learning_rate": 1.9899733782849256e-06, - "loss": 0.833, - "step": 8634 - }, - { - "epoch": 0.22, - "learning_rate": 1.9899694693419024e-06, - "loss": 1.0137, - "step": 8635 - }, - { - "epoch": 0.22, - "learning_rate": 1.989965559640905e-06, - "loss": 0.875, - "step": 8636 - }, - { - "epoch": 0.22, - "learning_rate": 1.989961649181936e-06, - "loss": 0.751, - "step": 8637 - }, - { - "epoch": 0.22, - "learning_rate": 1.9899577379649996e-06, - "loss": 0.9111, - "step": 8638 - }, - { - "epoch": 0.22, - "learning_rate": 1.9899538259900978e-06, - "loss": 1.1406, - "step": 8639 - }, - { - "epoch": 0.22, - "learning_rate": 1.989949913257234e-06, - "loss": 0.6367, - "step": 8640 - }, - { - "epoch": 0.22, - "learning_rate": 1.989945999766411e-06, - "loss": 0.8955, - "step": 8641 - }, - { - "epoch": 0.22, - "learning_rate": 1.9899420855176315e-06, - "loss": 1.0576, - "step": 8642 - }, - { - "epoch": 0.22, - "learning_rate": 1.9899381705108993e-06, - "loss": 0.9355, - "step": 8643 - }, - { - "epoch": 0.22, - "learning_rate": 1.9899342547462167e-06, - "loss": 0.9502, - "step": 8644 - }, - { - "epoch": 0.22, - "learning_rate": 1.9899303382235874e-06, - "loss": 0.6582, - "step": 8645 - }, - { - "epoch": 0.22, - "learning_rate": 1.9899264209430135e-06, - "loss": 0.9624, - "step": 8646 - }, - { - "epoch": 0.22, - "learning_rate": 1.989922502904499e-06, - "loss": 0.8789, - "step": 8647 - }, - { - "epoch": 0.22, - "learning_rate": 1.9899185841080457e-06, - "loss": 0.918, - "step": 8648 - }, - { - "epoch": 0.22, - "learning_rate": 1.9899146645536576e-06, - "loss": 1.1162, - "step": 8649 - }, - { - "epoch": 0.22, - "learning_rate": 1.9899107442413373e-06, - "loss": 0.9619, - "step": 8650 - }, - { - "epoch": 0.22, - "learning_rate": 1.9899068231710876e-06, - "loss": 0.8145, - "step": 8651 - }, - { - "epoch": 0.22, - "learning_rate": 1.989902901342912e-06, - "loss": 0.8467, - "step": 8652 - }, - { - "epoch": 0.22, - "learning_rate": 1.9898989787568135e-06, - "loss": 0.7344, - "step": 8653 - }, - { - "epoch": 0.22, - "learning_rate": 1.9898950554127945e-06, - "loss": 0.8516, - "step": 8654 - }, - { - "epoch": 0.22, - "learning_rate": 1.9898911313108585e-06, - "loss": 0.9326, - "step": 8655 - }, - { - "epoch": 0.22, - "learning_rate": 1.989887206451009e-06, - "loss": 0.7969, - "step": 8656 - }, - { - "epoch": 0.22, - "learning_rate": 1.989883280833247e-06, - "loss": 0.7949, - "step": 8657 - }, - { - "epoch": 0.22, - "learning_rate": 1.989879354457578e-06, - "loss": 0.8359, - "step": 8658 - }, - { - "epoch": 0.22, - "learning_rate": 1.9898754273240033e-06, - "loss": 0.9551, - "step": 8659 - }, - { - "epoch": 0.22, - "learning_rate": 1.989871499432527e-06, - "loss": 0.9697, - "step": 8660 - }, - { - "epoch": 0.22, - "learning_rate": 1.9898675707831515e-06, - "loss": 1.0137, - "step": 8661 - }, - { - "epoch": 0.22, - "learning_rate": 1.9898636413758797e-06, - "loss": 1.0, - "step": 8662 - }, - { - "epoch": 0.22, - "learning_rate": 1.9898597112107145e-06, - "loss": 0.8857, - "step": 8663 - }, - { - "epoch": 0.22, - "learning_rate": 1.98985578028766e-06, - "loss": 0.8662, - "step": 8664 - }, - { - "epoch": 0.22, - "learning_rate": 1.989851848606718e-06, - "loss": 0.8291, - "step": 8665 - }, - { - "epoch": 0.22, - "learning_rate": 1.9898479161678923e-06, - "loss": 0.9043, - "step": 8666 - }, - { - "epoch": 0.22, - "learning_rate": 1.989843982971185e-06, - "loss": 0.79, - "step": 8667 - }, - { - "epoch": 0.22, - "learning_rate": 1.9898400490166e-06, - "loss": 0.9385, - "step": 8668 - }, - { - "epoch": 0.22, - "learning_rate": 1.9898361143041402e-06, - "loss": 0.834, - "step": 8669 - }, - { - "epoch": 0.22, - "learning_rate": 1.989832178833808e-06, - "loss": 0.9233, - "step": 8670 - }, - { - "epoch": 0.22, - "learning_rate": 1.989828242605607e-06, - "loss": 1.1445, - "step": 8671 - }, - { - "epoch": 0.22, - "learning_rate": 1.98982430561954e-06, - "loss": 0.7607, - "step": 8672 - }, - { - "epoch": 0.22, - "learning_rate": 1.9898203678756104e-06, - "loss": 1.2188, - "step": 8673 - }, - { - "epoch": 0.22, - "learning_rate": 1.9898164293738204e-06, - "loss": 0.917, - "step": 8674 - }, - { - "epoch": 0.22, - "learning_rate": 1.9898124901141735e-06, - "loss": 0.9326, - "step": 8675 - }, - { - "epoch": 0.22, - "learning_rate": 1.9898085500966726e-06, - "loss": 0.8018, - "step": 8676 - }, - { - "epoch": 0.22, - "learning_rate": 1.989804609321321e-06, - "loss": 0.9346, - "step": 8677 - }, - { - "epoch": 0.22, - "learning_rate": 1.9898006677881218e-06, - "loss": 1.0918, - "step": 8678 - }, - { - "epoch": 0.22, - "learning_rate": 1.9897967254970773e-06, - "loss": 0.9131, - "step": 8679 - }, - { - "epoch": 0.22, - "learning_rate": 1.9897927824481912e-06, - "loss": 0.834, - "step": 8680 - }, - { - "epoch": 0.22, - "learning_rate": 1.989788838641466e-06, - "loss": 0.9844, - "step": 8681 - }, - { - "epoch": 0.22, - "learning_rate": 1.989784894076905e-06, - "loss": 0.999, - "step": 8682 - }, - { - "epoch": 0.22, - "learning_rate": 1.9897809487545115e-06, - "loss": 1.0146, - "step": 8683 - }, - { - "epoch": 0.22, - "learning_rate": 1.9897770026742884e-06, - "loss": 0.7725, - "step": 8684 - }, - { - "epoch": 0.22, - "learning_rate": 1.989773055836238e-06, - "loss": 1.1777, - "step": 8685 - }, - { - "epoch": 0.22, - "learning_rate": 1.9897691082403644e-06, - "loss": 0.8643, - "step": 8686 - }, - { - "epoch": 0.22, - "learning_rate": 1.9897651598866698e-06, - "loss": 0.8975, - "step": 8687 - }, - { - "epoch": 0.22, - "learning_rate": 1.9897612107751576e-06, - "loss": 0.9648, - "step": 8688 - }, - { - "epoch": 0.22, - "learning_rate": 1.989757260905831e-06, - "loss": 0.8867, - "step": 8689 - }, - { - "epoch": 0.22, - "learning_rate": 1.9897533102786923e-06, - "loss": 0.6387, - "step": 8690 - }, - { - "epoch": 0.22, - "learning_rate": 1.9897493588937454e-06, - "loss": 0.96, - "step": 8691 - }, - { - "epoch": 0.22, - "learning_rate": 1.989745406750993e-06, - "loss": 0.7822, - "step": 8692 - }, - { - "epoch": 0.22, - "learning_rate": 1.9897414538504377e-06, - "loss": 1.0244, - "step": 8693 - }, - { - "epoch": 0.22, - "learning_rate": 1.9897375001920828e-06, - "loss": 0.9453, - "step": 8694 - }, - { - "epoch": 0.22, - "learning_rate": 1.9897335457759315e-06, - "loss": 1.1924, - "step": 8695 - }, - { - "epoch": 0.22, - "learning_rate": 1.989729590601987e-06, - "loss": 0.8623, - "step": 8696 - }, - { - "epoch": 0.22, - "learning_rate": 1.989725634670252e-06, - "loss": 0.7881, - "step": 8697 - }, - { - "epoch": 0.22, - "learning_rate": 1.9897216779807294e-06, - "loss": 0.8853, - "step": 8698 - }, - { - "epoch": 0.22, - "learning_rate": 1.9897177205334225e-06, - "loss": 0.9521, - "step": 8699 - }, - { - "epoch": 0.22, - "learning_rate": 1.989713762328334e-06, - "loss": 1.0137, - "step": 8700 - }, - { - "epoch": 0.22, - "learning_rate": 1.989709803365468e-06, - "loss": 0.916, - "step": 8701 - }, - { - "epoch": 0.22, - "learning_rate": 1.9897058436448258e-06, - "loss": 0.8564, - "step": 8702 - }, - { - "epoch": 0.22, - "learning_rate": 1.989701883166412e-06, - "loss": 0.9365, - "step": 8703 - }, - { - "epoch": 0.22, - "learning_rate": 1.9896979219302287e-06, - "loss": 0.8281, - "step": 8704 - }, - { - "epoch": 0.22, - "learning_rate": 1.989693959936279e-06, - "loss": 1.2402, - "step": 8705 - }, - { - "epoch": 0.22, - "learning_rate": 1.989689997184566e-06, - "loss": 0.8711, - "step": 8706 - }, - { - "epoch": 0.22, - "learning_rate": 1.9896860336750936e-06, - "loss": 1.0254, - "step": 8707 - }, - { - "epoch": 0.22, - "learning_rate": 1.9896820694078636e-06, - "loss": 0.9268, - "step": 8708 - }, - { - "epoch": 0.22, - "learning_rate": 1.9896781043828796e-06, - "loss": 0.9346, - "step": 8709 - }, - { - "epoch": 0.22, - "learning_rate": 1.9896741386001446e-06, - "loss": 0.7163, - "step": 8710 - }, - { - "epoch": 0.22, - "learning_rate": 1.9896701720596616e-06, - "loss": 0.8359, - "step": 8711 - }, - { - "epoch": 0.22, - "learning_rate": 1.989666204761434e-06, - "loss": 0.8809, - "step": 8712 - }, - { - "epoch": 0.22, - "learning_rate": 1.989662236705464e-06, - "loss": 0.6641, - "step": 8713 - }, - { - "epoch": 0.22, - "learning_rate": 1.989658267891755e-06, - "loss": 1.0029, - "step": 8714 - }, - { - "epoch": 0.22, - "learning_rate": 1.989654298320311e-06, - "loss": 0.8232, - "step": 8715 - }, - { - "epoch": 0.22, - "learning_rate": 1.9896503279911337e-06, - "loss": 0.9141, - "step": 8716 - }, - { - "epoch": 0.22, - "learning_rate": 1.9896463569042267e-06, - "loss": 0.9648, - "step": 8717 - }, - { - "epoch": 0.22, - "learning_rate": 1.989642385059593e-06, - "loss": 1.0674, - "step": 8718 - }, - { - "epoch": 0.22, - "learning_rate": 1.9896384124572356e-06, - "loss": 0.8799, - "step": 8719 - }, - { - "epoch": 0.22, - "learning_rate": 1.9896344390971573e-06, - "loss": 1.0, - "step": 8720 - }, - { - "epoch": 0.22, - "learning_rate": 1.9896304649793615e-06, - "loss": 0.958, - "step": 8721 - }, - { - "epoch": 0.22, - "learning_rate": 1.9896264901038515e-06, - "loss": 0.9961, - "step": 8722 - }, - { - "epoch": 0.22, - "learning_rate": 1.98962251447063e-06, - "loss": 0.9395, - "step": 8723 - }, - { - "epoch": 0.22, - "learning_rate": 1.9896185380797e-06, - "loss": 0.9814, - "step": 8724 - }, - { - "epoch": 0.22, - "learning_rate": 1.989614560931064e-06, - "loss": 0.9536, - "step": 8725 - }, - { - "epoch": 0.22, - "learning_rate": 1.989610583024726e-06, - "loss": 1.0391, - "step": 8726 - }, - { - "epoch": 0.22, - "learning_rate": 1.9896066043606893e-06, - "loss": 0.9492, - "step": 8727 - }, - { - "epoch": 0.22, - "learning_rate": 1.9896026249389557e-06, - "loss": 0.7646, - "step": 8728 - }, - { - "epoch": 0.22, - "learning_rate": 1.9895986447595287e-06, - "loss": 0.9912, - "step": 8729 - }, - { - "epoch": 0.22, - "learning_rate": 1.989594663822412e-06, - "loss": 0.6636, - "step": 8730 - }, - { - "epoch": 0.22, - "learning_rate": 1.989590682127608e-06, - "loss": 0.8926, - "step": 8731 - }, - { - "epoch": 0.22, - "learning_rate": 1.9895866996751197e-06, - "loss": 1.123, - "step": 8732 - }, - { - "epoch": 0.22, - "learning_rate": 1.9895827164649507e-06, - "loss": 1.0566, - "step": 8733 - }, - { - "epoch": 0.22, - "learning_rate": 1.9895787324971036e-06, - "loss": 0.7632, - "step": 8734 - }, - { - "epoch": 0.22, - "learning_rate": 1.9895747477715817e-06, - "loss": 0.4839, - "step": 8735 - }, - { - "epoch": 0.22, - "learning_rate": 1.9895707622883876e-06, - "loss": 0.7407, - "step": 8736 - }, - { - "epoch": 0.22, - "learning_rate": 1.9895667760475246e-06, - "loss": 0.9414, - "step": 8737 - }, - { - "epoch": 0.22, - "learning_rate": 1.989562789048996e-06, - "loss": 0.874, - "step": 8738 - }, - { - "epoch": 0.22, - "learning_rate": 1.9895588012928052e-06, - "loss": 0.873, - "step": 8739 - }, - { - "epoch": 0.22, - "learning_rate": 1.989554812778954e-06, - "loss": 0.6748, - "step": 8740 - }, - { - "epoch": 0.22, - "learning_rate": 1.9895508235074464e-06, - "loss": 1.166, - "step": 8741 - }, - { - "epoch": 0.22, - "learning_rate": 1.9895468334782853e-06, - "loss": 1.084, - "step": 8742 - }, - { - "epoch": 0.22, - "learning_rate": 1.9895428426914736e-06, - "loss": 0.7529, - "step": 8743 - }, - { - "epoch": 0.22, - "learning_rate": 1.9895388511470146e-06, - "loss": 0.8213, - "step": 8744 - }, - { - "epoch": 0.22, - "learning_rate": 1.989534858844911e-06, - "loss": 0.7275, - "step": 8745 - }, - { - "epoch": 0.22, - "learning_rate": 1.9895308657851663e-06, - "loss": 0.96, - "step": 8746 - }, - { - "epoch": 0.22, - "learning_rate": 1.989526871967783e-06, - "loss": 0.918, - "step": 8747 - }, - { - "epoch": 0.22, - "learning_rate": 1.9895228773927646e-06, - "loss": 1.1074, - "step": 8748 - }, - { - "epoch": 0.22, - "learning_rate": 1.989518882060114e-06, - "loss": 0.875, - "step": 8749 - }, - { - "epoch": 0.22, - "learning_rate": 1.9895148859698344e-06, - "loss": 0.7515, - "step": 8750 - }, - { - "epoch": 0.22, - "learning_rate": 1.989510889121929e-06, - "loss": 1.0205, - "step": 8751 - }, - { - "epoch": 0.22, - "learning_rate": 1.9895068915164003e-06, - "loss": 0.8711, - "step": 8752 - }, - { - "epoch": 0.22, - "learning_rate": 1.9895028931532515e-06, - "loss": 1.2109, - "step": 8753 - }, - { - "epoch": 0.22, - "learning_rate": 1.989498894032486e-06, - "loss": 0.8584, - "step": 8754 - }, - { - "epoch": 0.22, - "learning_rate": 1.9894948941541067e-06, - "loss": 0.6992, - "step": 8755 - }, - { - "epoch": 0.22, - "learning_rate": 1.9894908935181166e-06, - "loss": 0.8237, - "step": 8756 - }, - { - "epoch": 0.22, - "learning_rate": 1.989486892124519e-06, - "loss": 0.876, - "step": 8757 - }, - { - "epoch": 0.22, - "learning_rate": 1.989482889973317e-06, - "loss": 0.9707, - "step": 8758 - }, - { - "epoch": 0.22, - "learning_rate": 1.989478887064513e-06, - "loss": 0.9023, - "step": 8759 - }, - { - "epoch": 0.22, - "learning_rate": 1.9894748833981104e-06, - "loss": 0.9502, - "step": 8760 - }, - { - "epoch": 0.22, - "learning_rate": 1.9894708789741127e-06, - "loss": 0.9141, - "step": 8761 - }, - { - "epoch": 0.22, - "learning_rate": 1.9894668737925227e-06, - "loss": 1.0273, - "step": 8762 - }, - { - "epoch": 0.22, - "learning_rate": 1.989462867853343e-06, - "loss": 0.8672, - "step": 8763 - }, - { - "epoch": 0.22, - "learning_rate": 1.9894588611565778e-06, - "loss": 0.791, - "step": 8764 - }, - { - "epoch": 0.22, - "learning_rate": 1.989454853702229e-06, - "loss": 0.8169, - "step": 8765 - }, - { - "epoch": 0.22, - "learning_rate": 1.9894508454903e-06, - "loss": 0.7939, - "step": 8766 - }, - { - "epoch": 0.22, - "learning_rate": 1.989446836520794e-06, - "loss": 1.2529, - "step": 8767 - }, - { - "epoch": 0.22, - "learning_rate": 1.9894428267937144e-06, - "loss": 0.9199, - "step": 8768 - }, - { - "epoch": 0.22, - "learning_rate": 1.9894388163090634e-06, - "loss": 0.8037, - "step": 8769 - }, - { - "epoch": 0.22, - "learning_rate": 1.989434805066845e-06, - "loss": 0.8809, - "step": 8770 - }, - { - "epoch": 0.22, - "learning_rate": 1.989430793067062e-06, - "loss": 0.9941, - "step": 8771 - }, - { - "epoch": 0.22, - "learning_rate": 1.9894267803097173e-06, - "loss": 0.677, - "step": 8772 - }, - { - "epoch": 0.22, - "learning_rate": 1.9894227667948135e-06, - "loss": 0.9375, - "step": 8773 - }, - { - "epoch": 0.22, - "learning_rate": 1.9894187525223544e-06, - "loss": 0.7764, - "step": 8774 - }, - { - "epoch": 0.22, - "learning_rate": 1.989414737492343e-06, - "loss": 1.0225, - "step": 8775 - }, - { - "epoch": 0.22, - "learning_rate": 1.989410721704782e-06, - "loss": 0.8467, - "step": 8776 - }, - { - "epoch": 0.22, - "learning_rate": 1.989406705159675e-06, - "loss": 0.6572, - "step": 8777 - }, - { - "epoch": 0.22, - "learning_rate": 1.9894026878570246e-06, - "loss": 0.7974, - "step": 8778 - }, - { - "epoch": 0.23, - "learning_rate": 1.989398669796834e-06, - "loss": 0.769, - "step": 8779 - }, - { - "epoch": 0.23, - "learning_rate": 1.989394650979107e-06, - "loss": 0.6606, - "step": 8780 - }, - { - "epoch": 0.23, - "learning_rate": 1.989390631403845e-06, - "loss": 0.8496, - "step": 8781 - }, - { - "epoch": 0.23, - "learning_rate": 1.9893866110710523e-06, - "loss": 1.0693, - "step": 8782 - }, - { - "epoch": 0.23, - "learning_rate": 1.9893825899807322e-06, - "loss": 0.9883, - "step": 8783 - }, - { - "epoch": 0.23, - "learning_rate": 1.9893785681328873e-06, - "loss": 0.9648, - "step": 8784 - }, - { - "epoch": 0.23, - "learning_rate": 1.9893745455275205e-06, - "loss": 1.001, - "step": 8785 - }, - { - "epoch": 0.23, - "learning_rate": 1.9893705221646352e-06, - "loss": 0.8594, - "step": 8786 - }, - { - "epoch": 0.23, - "learning_rate": 1.9893664980442344e-06, - "loss": 1.0361, - "step": 8787 - }, - { - "epoch": 0.23, - "learning_rate": 1.989362473166321e-06, - "loss": 0.825, - "step": 8788 - }, - { - "epoch": 0.23, - "learning_rate": 1.9893584475308983e-06, - "loss": 0.9922, - "step": 8789 - }, - { - "epoch": 0.23, - "learning_rate": 1.9893544211379695e-06, - "loss": 1.043, - "step": 8790 - }, - { - "epoch": 0.23, - "learning_rate": 1.9893503939875374e-06, - "loss": 0.6387, - "step": 8791 - }, - { - "epoch": 0.23, - "learning_rate": 1.9893463660796054e-06, - "loss": 0.9814, - "step": 8792 - }, - { - "epoch": 0.23, - "learning_rate": 1.989342337414176e-06, - "loss": 0.9092, - "step": 8793 - }, - { - "epoch": 0.23, - "learning_rate": 1.989338307991253e-06, - "loss": 0.7793, - "step": 8794 - }, - { - "epoch": 0.23, - "learning_rate": 1.9893342778108387e-06, - "loss": 1.001, - "step": 8795 - }, - { - "epoch": 0.23, - "learning_rate": 1.989330246872937e-06, - "loss": 0.6812, - "step": 8796 - }, - { - "epoch": 0.23, - "learning_rate": 1.9893262151775505e-06, - "loss": 0.8428, - "step": 8797 - }, - { - "epoch": 0.23, - "learning_rate": 1.9893221827246824e-06, - "loss": 0.834, - "step": 8798 - }, - { - "epoch": 0.23, - "learning_rate": 1.989318149514336e-06, - "loss": 0.8662, - "step": 8799 - }, - { - "epoch": 0.23, - "learning_rate": 1.989314115546514e-06, - "loss": 0.8369, - "step": 8800 - }, - { - "epoch": 0.23, - "learning_rate": 1.98931008082122e-06, - "loss": 0.7808, - "step": 8801 - }, - { - "epoch": 0.23, - "learning_rate": 1.989306045338456e-06, - "loss": 0.9902, - "step": 8802 - }, - { - "epoch": 0.23, - "learning_rate": 1.9893020090982263e-06, - "loss": 0.7793, - "step": 8803 - }, - { - "epoch": 0.23, - "learning_rate": 1.989297972100534e-06, - "loss": 0.9824, - "step": 8804 - }, - { - "epoch": 0.23, - "learning_rate": 1.989293934345381e-06, - "loss": 0.9268, - "step": 8805 - }, - { - "epoch": 0.23, - "learning_rate": 1.9892898958327715e-06, - "loss": 0.8916, - "step": 8806 - }, - { - "epoch": 0.23, - "learning_rate": 1.989285856562708e-06, - "loss": 0.9043, - "step": 8807 - }, - { - "epoch": 0.23, - "learning_rate": 1.9892818165351942e-06, - "loss": 0.9473, - "step": 8808 - }, - { - "epoch": 0.23, - "learning_rate": 1.9892777757502324e-06, - "loss": 0.9932, - "step": 8809 - }, - { - "epoch": 0.23, - "learning_rate": 1.9892737342078263e-06, - "loss": 0.8857, - "step": 8810 - }, - { - "epoch": 0.23, - "learning_rate": 1.9892696919079787e-06, - "loss": 0.7578, - "step": 8811 - }, - { - "epoch": 0.23, - "learning_rate": 1.9892656488506926e-06, - "loss": 0.8125, - "step": 8812 - }, - { - "epoch": 0.23, - "learning_rate": 1.9892616050359715e-06, - "loss": 0.9346, - "step": 8813 - }, - { - "epoch": 0.23, - "learning_rate": 1.9892575604638183e-06, - "loss": 0.8672, - "step": 8814 - }, - { - "epoch": 0.23, - "learning_rate": 1.9892535151342363e-06, - "loss": 0.9424, - "step": 8815 - }, - { - "epoch": 0.23, - "learning_rate": 1.9892494690472277e-06, - "loss": 0.8193, - "step": 8816 - }, - { - "epoch": 0.23, - "learning_rate": 1.989245422202797e-06, - "loss": 0.8838, - "step": 8817 - }, - { - "epoch": 0.23, - "learning_rate": 1.989241374600946e-06, - "loss": 1.0146, - "step": 8818 - }, - { - "epoch": 0.23, - "learning_rate": 1.9892373262416784e-06, - "loss": 1.0283, - "step": 8819 - }, - { - "epoch": 0.23, - "learning_rate": 1.9892332771249978e-06, - "loss": 0.9863, - "step": 8820 - }, - { - "epoch": 0.23, - "learning_rate": 1.989229227250906e-06, - "loss": 0.7998, - "step": 8821 - }, - { - "epoch": 0.23, - "learning_rate": 1.989225176619408e-06, - "loss": 0.9023, - "step": 8822 - }, - { - "epoch": 0.23, - "learning_rate": 1.9892211252305046e-06, - "loss": 1.0791, - "step": 8823 - }, - { - "epoch": 0.23, - "learning_rate": 1.989217073084201e-06, - "loss": 0.5728, - "step": 8824 - }, - { - "epoch": 0.23, - "learning_rate": 1.9892130201804987e-06, - "loss": 0.9697, - "step": 8825 - }, - { - "epoch": 0.23, - "learning_rate": 1.9892089665194015e-06, - "loss": 1.1338, - "step": 8826 - }, - { - "epoch": 0.23, - "learning_rate": 1.989204912100913e-06, - "loss": 1.0273, - "step": 8827 - }, - { - "epoch": 0.23, - "learning_rate": 1.989200856925035e-06, - "loss": 0.7637, - "step": 8828 - }, - { - "epoch": 0.23, - "learning_rate": 1.989196800991772e-06, - "loss": 1.0371, - "step": 8829 - }, - { - "epoch": 0.23, - "learning_rate": 1.9891927443011264e-06, - "loss": 1.1943, - "step": 8830 - }, - { - "epoch": 0.23, - "learning_rate": 1.9891886868531013e-06, - "loss": 1.0918, - "step": 8831 - }, - { - "epoch": 0.23, - "learning_rate": 1.9891846286477e-06, - "loss": 1.0352, - "step": 8832 - }, - { - "epoch": 0.23, - "learning_rate": 1.9891805696849257e-06, - "loss": 1.0029, - "step": 8833 - }, - { - "epoch": 0.23, - "learning_rate": 1.989176509964781e-06, - "loss": 1.1289, - "step": 8834 - }, - { - "epoch": 0.23, - "learning_rate": 1.989172449487269e-06, - "loss": 0.9639, - "step": 8835 - }, - { - "epoch": 0.23, - "learning_rate": 1.989168388252394e-06, - "loss": 0.9648, - "step": 8836 - }, - { - "epoch": 0.23, - "learning_rate": 1.9891643262601576e-06, - "loss": 0.9053, - "step": 8837 - }, - { - "epoch": 0.23, - "learning_rate": 1.989160263510564e-06, - "loss": 0.9219, - "step": 8838 - }, - { - "epoch": 0.23, - "learning_rate": 1.9891562000036154e-06, - "loss": 0.8311, - "step": 8839 - }, - { - "epoch": 0.23, - "learning_rate": 1.9891521357393154e-06, - "loss": 0.7231, - "step": 8840 - }, - { - "epoch": 0.23, - "learning_rate": 1.9891480707176675e-06, - "loss": 0.8169, - "step": 8841 - }, - { - "epoch": 0.23, - "learning_rate": 1.9891440049386744e-06, - "loss": 1.1465, - "step": 8842 - }, - { - "epoch": 0.23, - "learning_rate": 1.989139938402339e-06, - "loss": 1.1562, - "step": 8843 - }, - { - "epoch": 0.23, - "learning_rate": 1.9891358711086645e-06, - "loss": 0.7529, - "step": 8844 - }, - { - "epoch": 0.23, - "learning_rate": 1.989131803057654e-06, - "loss": 0.8091, - "step": 8845 - }, - { - "epoch": 0.23, - "learning_rate": 1.989127734249311e-06, - "loss": 1.082, - "step": 8846 - }, - { - "epoch": 0.23, - "learning_rate": 1.989123664683639e-06, - "loss": 0.7505, - "step": 8847 - }, - { - "epoch": 0.23, - "learning_rate": 1.98911959436064e-06, - "loss": 0.8252, - "step": 8848 - }, - { - "epoch": 0.23, - "learning_rate": 1.9891155232803173e-06, - "loss": 0.8916, - "step": 8849 - }, - { - "epoch": 0.23, - "learning_rate": 1.9891114514426745e-06, - "loss": 0.9268, - "step": 8850 - }, - { - "epoch": 0.23, - "learning_rate": 1.989107378847715e-06, - "loss": 0.8911, - "step": 8851 - }, - { - "epoch": 0.23, - "learning_rate": 1.9891033054954403e-06, - "loss": 1.1719, - "step": 8852 - }, - { - "epoch": 0.23, - "learning_rate": 1.9890992313858557e-06, - "loss": 0.9717, - "step": 8853 - }, - { - "epoch": 0.23, - "learning_rate": 1.989095156518963e-06, - "loss": 0.9346, - "step": 8854 - }, - { - "epoch": 0.23, - "learning_rate": 1.9890910808947658e-06, - "loss": 0.998, - "step": 8855 - }, - { - "epoch": 0.23, - "learning_rate": 1.989087004513267e-06, - "loss": 0.6006, - "step": 8856 - }, - { - "epoch": 0.23, - "learning_rate": 1.989082927374469e-06, - "loss": 0.7793, - "step": 8857 - }, - { - "epoch": 0.23, - "learning_rate": 1.9890788494783767e-06, - "loss": 0.6191, - "step": 8858 - }, - { - "epoch": 0.23, - "learning_rate": 1.9890747708249918e-06, - "loss": 1.1904, - "step": 8859 - }, - { - "epoch": 0.23, - "learning_rate": 1.989070691414318e-06, - "loss": 0.9248, - "step": 8860 - }, - { - "epoch": 0.23, - "learning_rate": 1.989066611246358e-06, - "loss": 0.8076, - "step": 8861 - }, - { - "epoch": 0.23, - "learning_rate": 1.9890625303211157e-06, - "loss": 0.9355, - "step": 8862 - }, - { - "epoch": 0.23, - "learning_rate": 1.9890584486385927e-06, - "loss": 0.7852, - "step": 8863 - }, - { - "epoch": 0.23, - "learning_rate": 1.989054366198794e-06, - "loss": 0.7642, - "step": 8864 - }, - { - "epoch": 0.23, - "learning_rate": 1.9890502830017215e-06, - "loss": 0.9561, - "step": 8865 - }, - { - "epoch": 0.23, - "learning_rate": 1.9890461990473787e-06, - "loss": 0.8174, - "step": 8866 - }, - { - "epoch": 0.23, - "learning_rate": 1.9890421143357685e-06, - "loss": 0.9971, - "step": 8867 - }, - { - "epoch": 0.23, - "learning_rate": 1.989038028866895e-06, - "loss": 0.7598, - "step": 8868 - }, - { - "epoch": 0.23, - "learning_rate": 1.9890339426407597e-06, - "loss": 0.9243, - "step": 8869 - }, - { - "epoch": 0.23, - "learning_rate": 1.989029855657367e-06, - "loss": 0.9072, - "step": 8870 - }, - { - "epoch": 0.23, - "learning_rate": 1.9890257679167195e-06, - "loss": 0.9785, - "step": 8871 - }, - { - "epoch": 0.23, - "learning_rate": 1.9890216794188204e-06, - "loss": 0.9028, - "step": 8872 - }, - { - "epoch": 0.23, - "learning_rate": 1.989017590163673e-06, - "loss": 0.7422, - "step": 8873 - }, - { - "epoch": 0.23, - "learning_rate": 1.9890135001512803e-06, - "loss": 0.6768, - "step": 8874 - }, - { - "epoch": 0.23, - "learning_rate": 1.9890094093816456e-06, - "loss": 0.7676, - "step": 8875 - }, - { - "epoch": 0.23, - "learning_rate": 1.9890053178547715e-06, - "loss": 0.853, - "step": 8876 - }, - { - "epoch": 0.23, - "learning_rate": 1.989001225570662e-06, - "loss": 1.0752, - "step": 8877 - }, - { - "epoch": 0.23, - "learning_rate": 1.988997132529319e-06, - "loss": 0.7222, - "step": 8878 - }, - { - "epoch": 0.23, - "learning_rate": 1.9889930387307466e-06, - "loss": 0.8662, - "step": 8879 - }, - { - "epoch": 0.23, - "learning_rate": 1.988988944174948e-06, - "loss": 0.8242, - "step": 8880 - }, - { - "epoch": 0.23, - "learning_rate": 1.988984848861926e-06, - "loss": 0.6709, - "step": 8881 - }, - { - "epoch": 0.23, - "learning_rate": 1.9889807527916836e-06, - "loss": 0.8896, - "step": 8882 - }, - { - "epoch": 0.23, - "learning_rate": 1.9889766559642242e-06, - "loss": 0.9521, - "step": 8883 - }, - { - "epoch": 0.23, - "learning_rate": 1.988972558379551e-06, - "loss": 0.959, - "step": 8884 - }, - { - "epoch": 0.23, - "learning_rate": 1.988968460037667e-06, - "loss": 0.834, - "step": 8885 - }, - { - "epoch": 0.23, - "learning_rate": 1.988964360938575e-06, - "loss": 0.915, - "step": 8886 - }, - { - "epoch": 0.23, - "learning_rate": 1.9889602610822788e-06, - "loss": 0.7803, - "step": 8887 - }, - { - "epoch": 0.23, - "learning_rate": 1.988956160468781e-06, - "loss": 1.0967, - "step": 8888 - }, - { - "epoch": 0.23, - "learning_rate": 1.988952059098085e-06, - "loss": 0.9307, - "step": 8889 - }, - { - "epoch": 0.23, - "learning_rate": 1.9889479569701937e-06, - "loss": 0.9492, - "step": 8890 - }, - { - "epoch": 0.23, - "learning_rate": 1.9889438540851105e-06, - "loss": 0.8184, - "step": 8891 - }, - { - "epoch": 0.23, - "learning_rate": 1.9889397504428387e-06, - "loss": 0.8711, - "step": 8892 - }, - { - "epoch": 0.23, - "learning_rate": 1.988935646043381e-06, - "loss": 0.7944, - "step": 8893 - }, - { - "epoch": 0.23, - "learning_rate": 1.9889315408867408e-06, - "loss": 0.9102, - "step": 8894 - }, - { - "epoch": 0.23, - "learning_rate": 1.9889274349729214e-06, - "loss": 0.9697, - "step": 8895 - }, - { - "epoch": 0.23, - "learning_rate": 1.9889233283019254e-06, - "loss": 0.7744, - "step": 8896 - }, - { - "epoch": 0.23, - "learning_rate": 1.9889192208737564e-06, - "loss": 1.0, - "step": 8897 - }, - { - "epoch": 0.23, - "learning_rate": 1.9889151126884175e-06, - "loss": 0.9697, - "step": 8898 - }, - { - "epoch": 0.23, - "learning_rate": 1.988911003745912e-06, - "loss": 1.0605, - "step": 8899 - }, - { - "epoch": 0.23, - "learning_rate": 1.9889068940462424e-06, - "loss": 1.0078, - "step": 8900 - }, - { - "epoch": 0.23, - "learning_rate": 1.9889027835894123e-06, - "loss": 0.875, - "step": 8901 - }, - { - "epoch": 0.23, - "learning_rate": 1.988898672375425e-06, - "loss": 0.9736, - "step": 8902 - }, - { - "epoch": 0.23, - "learning_rate": 1.988894560404283e-06, - "loss": 0.627, - "step": 8903 - }, - { - "epoch": 0.23, - "learning_rate": 1.9888904476759906e-06, - "loss": 0.9434, - "step": 8904 - }, - { - "epoch": 0.23, - "learning_rate": 1.9888863341905497e-06, - "loss": 1.0098, - "step": 8905 - }, - { - "epoch": 0.23, - "learning_rate": 1.988882219947964e-06, - "loss": 0.9727, - "step": 8906 - }, - { - "epoch": 0.23, - "learning_rate": 1.988878104948237e-06, - "loss": 0.6646, - "step": 8907 - }, - { - "epoch": 0.23, - "learning_rate": 1.988873989191371e-06, - "loss": 0.9932, - "step": 8908 - }, - { - "epoch": 0.23, - "learning_rate": 1.9888698726773707e-06, - "loss": 1.0576, - "step": 8909 - }, - { - "epoch": 0.23, - "learning_rate": 1.988865755406237e-06, - "loss": 0.9385, - "step": 8910 - }, - { - "epoch": 0.23, - "learning_rate": 1.988861637377975e-06, - "loss": 0.6936, - "step": 8911 - }, - { - "epoch": 0.23, - "learning_rate": 1.9888575185925868e-06, - "loss": 0.9893, - "step": 8912 - }, - { - "epoch": 0.23, - "learning_rate": 1.9888533990500763e-06, - "loss": 1.1094, - "step": 8913 - }, - { - "epoch": 0.23, - "learning_rate": 1.988849278750446e-06, - "loss": 0.8076, - "step": 8914 - }, - { - "epoch": 0.23, - "learning_rate": 1.988845157693699e-06, - "loss": 0.9023, - "step": 8915 - }, - { - "epoch": 0.23, - "learning_rate": 1.9888410358798388e-06, - "loss": 0.9395, - "step": 8916 - }, - { - "epoch": 0.23, - "learning_rate": 1.9888369133088683e-06, - "loss": 1.0244, - "step": 8917 - }, - { - "epoch": 0.23, - "learning_rate": 1.9888327899807915e-06, - "loss": 0.8066, - "step": 8918 - }, - { - "epoch": 0.23, - "learning_rate": 1.9888286658956103e-06, - "loss": 1.1074, - "step": 8919 - }, - { - "epoch": 0.23, - "learning_rate": 1.9888245410533287e-06, - "loss": 0.6292, - "step": 8920 - }, - { - "epoch": 0.23, - "learning_rate": 1.98882041545395e-06, - "loss": 0.8408, - "step": 8921 - }, - { - "epoch": 0.23, - "learning_rate": 1.9888162890974766e-06, - "loss": 0.7258, - "step": 8922 - }, - { - "epoch": 0.23, - "learning_rate": 1.9888121619839117e-06, - "loss": 0.9961, - "step": 8923 - }, - { - "epoch": 0.23, - "learning_rate": 1.988808034113259e-06, - "loss": 0.6824, - "step": 8924 - }, - { - "epoch": 0.23, - "learning_rate": 1.988803905485522e-06, - "loss": 0.7637, - "step": 8925 - }, - { - "epoch": 0.23, - "learning_rate": 1.9887997761007024e-06, - "loss": 0.9248, - "step": 8926 - }, - { - "epoch": 0.23, - "learning_rate": 1.988795645958805e-06, - "loss": 1.0283, - "step": 8927 - }, - { - "epoch": 0.23, - "learning_rate": 1.988791515059832e-06, - "loss": 1.0459, - "step": 8928 - }, - { - "epoch": 0.23, - "learning_rate": 1.9887873834037865e-06, - "loss": 0.8975, - "step": 8929 - }, - { - "epoch": 0.23, - "learning_rate": 1.9887832509906727e-06, - "loss": 1.1592, - "step": 8930 - }, - { - "epoch": 0.23, - "learning_rate": 1.9887791178204923e-06, - "loss": 0.8311, - "step": 8931 - }, - { - "epoch": 0.23, - "learning_rate": 1.9887749838932495e-06, - "loss": 1.0557, - "step": 8932 - }, - { - "epoch": 0.23, - "learning_rate": 1.9887708492089473e-06, - "loss": 1.0781, - "step": 8933 - }, - { - "epoch": 0.23, - "learning_rate": 1.9887667137675886e-06, - "loss": 0.855, - "step": 8934 - }, - { - "epoch": 0.23, - "learning_rate": 1.988762577569177e-06, - "loss": 0.9727, - "step": 8935 - }, - { - "epoch": 0.23, - "learning_rate": 1.9887584406137147e-06, - "loss": 0.9199, - "step": 8936 - }, - { - "epoch": 0.23, - "learning_rate": 1.9887543029012057e-06, - "loss": 0.791, - "step": 8937 - }, - { - "epoch": 0.23, - "learning_rate": 1.9887501644316535e-06, - "loss": 0.9258, - "step": 8938 - }, - { - "epoch": 0.23, - "learning_rate": 1.98874602520506e-06, - "loss": 0.9766, - "step": 8939 - }, - { - "epoch": 0.23, - "learning_rate": 1.98874188522143e-06, - "loss": 0.9375, - "step": 8940 - }, - { - "epoch": 0.23, - "learning_rate": 1.988737744480765e-06, - "loss": 0.9453, - "step": 8941 - }, - { - "epoch": 0.23, - "learning_rate": 1.9887336029830697e-06, - "loss": 0.9531, - "step": 8942 - }, - { - "epoch": 0.23, - "learning_rate": 1.9887294607283457e-06, - "loss": 0.9268, - "step": 8943 - }, - { - "epoch": 0.23, - "learning_rate": 1.988725317716598e-06, - "loss": 0.9336, - "step": 8944 - }, - { - "epoch": 0.23, - "learning_rate": 1.988721173947828e-06, - "loss": 1.0869, - "step": 8945 - }, - { - "epoch": 0.23, - "learning_rate": 1.98871702942204e-06, - "loss": 0.7227, - "step": 8946 - }, - { - "epoch": 0.23, - "learning_rate": 1.988712884139237e-06, - "loss": 0.9219, - "step": 8947 - }, - { - "epoch": 0.23, - "learning_rate": 1.9887087380994216e-06, - "loss": 0.7529, - "step": 8948 - }, - { - "epoch": 0.23, - "learning_rate": 1.9887045913025974e-06, - "loss": 0.8433, - "step": 8949 - }, - { - "epoch": 0.23, - "learning_rate": 1.9887004437487675e-06, - "loss": 0.8853, - "step": 8950 - }, - { - "epoch": 0.23, - "learning_rate": 1.9886962954379354e-06, - "loss": 0.9307, - "step": 8951 - }, - { - "epoch": 0.23, - "learning_rate": 1.988692146370104e-06, - "loss": 0.8809, - "step": 8952 - }, - { - "epoch": 0.23, - "learning_rate": 1.9886879965452764e-06, - "loss": 0.96, - "step": 8953 - }, - { - "epoch": 0.23, - "learning_rate": 1.9886838459634562e-06, - "loss": 1.0005, - "step": 8954 - }, - { - "epoch": 0.23, - "learning_rate": 1.9886796946246457e-06, - "loss": 0.7349, - "step": 8955 - }, - { - "epoch": 0.23, - "learning_rate": 1.988675542528849e-06, - "loss": 0.7949, - "step": 8956 - }, - { - "epoch": 0.23, - "learning_rate": 1.9886713896760687e-06, - "loss": 0.8955, - "step": 8957 - }, - { - "epoch": 0.23, - "learning_rate": 1.988667236066308e-06, - "loss": 0.9883, - "step": 8958 - }, - { - "epoch": 0.23, - "learning_rate": 1.9886630816995704e-06, - "loss": 1.0664, - "step": 8959 - }, - { - "epoch": 0.23, - "learning_rate": 1.988658926575859e-06, - "loss": 0.9727, - "step": 8960 - }, - { - "epoch": 0.23, - "learning_rate": 1.9886547706951775e-06, - "loss": 0.8213, - "step": 8961 - }, - { - "epoch": 0.23, - "learning_rate": 1.988650614057528e-06, - "loss": 1.0059, - "step": 8962 - }, - { - "epoch": 0.23, - "learning_rate": 1.9886464566629137e-06, - "loss": 0.9417, - "step": 8963 - }, - { - "epoch": 0.23, - "learning_rate": 1.9886422985113388e-06, - "loss": 0.6252, - "step": 8964 - }, - { - "epoch": 0.23, - "learning_rate": 1.9886381396028057e-06, - "loss": 1.0137, - "step": 8965 - }, - { - "epoch": 0.23, - "learning_rate": 1.9886339799373178e-06, - "loss": 0.8682, - "step": 8966 - }, - { - "epoch": 0.23, - "learning_rate": 1.988629819514879e-06, - "loss": 1.0957, - "step": 8967 - }, - { - "epoch": 0.23, - "learning_rate": 1.988625658335491e-06, - "loss": 0.8081, - "step": 8968 - }, - { - "epoch": 0.23, - "learning_rate": 1.9886214963991583e-06, - "loss": 0.5977, - "step": 8969 - }, - { - "epoch": 0.23, - "learning_rate": 1.988617333705883e-06, - "loss": 0.9219, - "step": 8970 - }, - { - "epoch": 0.23, - "learning_rate": 1.9886131702556693e-06, - "loss": 1.1387, - "step": 8971 - }, - { - "epoch": 0.23, - "learning_rate": 1.98860900604852e-06, - "loss": 1.1836, - "step": 8972 - }, - { - "epoch": 0.23, - "learning_rate": 1.988604841084438e-06, - "loss": 0.8916, - "step": 8973 - }, - { - "epoch": 0.23, - "learning_rate": 1.988600675363427e-06, - "loss": 0.812, - "step": 8974 - }, - { - "epoch": 0.23, - "learning_rate": 1.98859650888549e-06, - "loss": 0.5825, - "step": 8975 - }, - { - "epoch": 0.23, - "learning_rate": 1.9885923416506297e-06, - "loss": 1.0, - "step": 8976 - }, - { - "epoch": 0.23, - "learning_rate": 1.98858817365885e-06, - "loss": 1.126, - "step": 8977 - }, - { - "epoch": 0.23, - "learning_rate": 1.9885840049101533e-06, - "loss": 1.0801, - "step": 8978 - }, - { - "epoch": 0.23, - "learning_rate": 1.988579835404544e-06, - "loss": 0.7852, - "step": 8979 - }, - { - "epoch": 0.23, - "learning_rate": 1.988575665142024e-06, - "loss": 0.9736, - "step": 8980 - }, - { - "epoch": 0.23, - "learning_rate": 1.9885714941225975e-06, - "loss": 0.8066, - "step": 8981 - }, - { - "epoch": 0.23, - "learning_rate": 1.9885673223462672e-06, - "loss": 0.9131, - "step": 8982 - }, - { - "epoch": 0.23, - "learning_rate": 1.9885631498130364e-06, - "loss": 1.0059, - "step": 8983 - }, - { - "epoch": 0.23, - "learning_rate": 1.988558976522908e-06, - "loss": 0.8047, - "step": 8984 - }, - { - "epoch": 0.23, - "learning_rate": 1.988554802475885e-06, - "loss": 0.6328, - "step": 8985 - }, - { - "epoch": 0.23, - "learning_rate": 1.988550627671972e-06, - "loss": 1.126, - "step": 8986 - }, - { - "epoch": 0.23, - "learning_rate": 1.9885464521111706e-06, - "loss": 0.8496, - "step": 8987 - }, - { - "epoch": 0.23, - "learning_rate": 1.988542275793485e-06, - "loss": 0.998, - "step": 8988 - }, - { - "epoch": 0.23, - "learning_rate": 1.988538098718918e-06, - "loss": 0.5942, - "step": 8989 - }, - { - "epoch": 0.23, - "learning_rate": 1.9885339208874727e-06, - "loss": 1.1025, - "step": 8990 - }, - { - "epoch": 0.23, - "learning_rate": 1.9885297422991523e-06, - "loss": 0.9658, - "step": 8991 - }, - { - "epoch": 0.23, - "learning_rate": 1.98852556295396e-06, - "loss": 0.8496, - "step": 8992 - }, - { - "epoch": 0.23, - "learning_rate": 1.9885213828519e-06, - "loss": 0.7386, - "step": 8993 - }, - { - "epoch": 0.23, - "learning_rate": 1.9885172019929735e-06, - "loss": 0.8745, - "step": 8994 - }, - { - "epoch": 0.23, - "learning_rate": 1.988513020377186e-06, - "loss": 0.8, - "step": 8995 - }, - { - "epoch": 0.23, - "learning_rate": 1.9885088380045386e-06, - "loss": 0.7332, - "step": 8996 - }, - { - "epoch": 0.23, - "learning_rate": 1.9885046548750357e-06, - "loss": 0.9219, - "step": 8997 - }, - { - "epoch": 0.23, - "learning_rate": 1.98850047098868e-06, - "loss": 0.8525, - "step": 8998 - }, - { - "epoch": 0.23, - "learning_rate": 1.9884962863454755e-06, - "loss": 1.0957, - "step": 8999 - }, - { - "epoch": 0.23, - "learning_rate": 1.9884921009454245e-06, - "loss": 1.0293, - "step": 9000 - }, - { - "epoch": 0.23, - "learning_rate": 1.9884879147885306e-06, - "loss": 0.8711, - "step": 9001 - }, - { - "epoch": 0.23, - "learning_rate": 1.988483727874797e-06, - "loss": 0.8857, - "step": 9002 - }, - { - "epoch": 0.23, - "learning_rate": 1.988479540204227e-06, - "loss": 1.0088, - "step": 9003 - }, - { - "epoch": 0.23, - "learning_rate": 1.9884753517768234e-06, - "loss": 0.916, - "step": 9004 - }, - { - "epoch": 0.23, - "learning_rate": 1.9884711625925896e-06, - "loss": 0.9268, - "step": 9005 - }, - { - "epoch": 0.23, - "learning_rate": 1.9884669726515294e-06, - "loss": 0.8232, - "step": 9006 - }, - { - "epoch": 0.23, - "learning_rate": 1.988462781953645e-06, - "loss": 0.8389, - "step": 9007 - }, - { - "epoch": 0.23, - "learning_rate": 1.98845859049894e-06, - "loss": 0.9805, - "step": 9008 - }, - { - "epoch": 0.23, - "learning_rate": 1.988454398287418e-06, - "loss": 0.9541, - "step": 9009 - }, - { - "epoch": 0.23, - "learning_rate": 1.9884502053190818e-06, - "loss": 0.7974, - "step": 9010 - }, - { - "epoch": 0.23, - "learning_rate": 1.988446011593935e-06, - "loss": 1.0381, - "step": 9011 - }, - { - "epoch": 0.23, - "learning_rate": 1.98844181711198e-06, - "loss": 1.0781, - "step": 9012 - }, - { - "epoch": 0.23, - "learning_rate": 1.9884376218732214e-06, - "loss": 0.9219, - "step": 9013 - }, - { - "epoch": 0.23, - "learning_rate": 1.988433425877661e-06, - "loss": 0.9238, - "step": 9014 - }, - { - "epoch": 0.23, - "learning_rate": 1.9884292291253028e-06, - "loss": 0.9893, - "step": 9015 - }, - { - "epoch": 0.23, - "learning_rate": 1.9884250316161493e-06, - "loss": 0.647, - "step": 9016 - }, - { - "epoch": 0.23, - "learning_rate": 1.9884208333502045e-06, - "loss": 0.8467, - "step": 9017 - }, - { - "epoch": 0.23, - "learning_rate": 1.9884166343274713e-06, - "loss": 0.918, - "step": 9018 - }, - { - "epoch": 0.23, - "learning_rate": 1.988412434547953e-06, - "loss": 0.6909, - "step": 9019 - }, - { - "epoch": 0.23, - "learning_rate": 1.988408234011653e-06, - "loss": 0.9854, - "step": 9020 - }, - { - "epoch": 0.23, - "learning_rate": 1.9884040327185737e-06, - "loss": 1.1836, - "step": 9021 - }, - { - "epoch": 0.23, - "learning_rate": 1.9883998306687193e-06, - "loss": 0.9121, - "step": 9022 - }, - { - "epoch": 0.23, - "learning_rate": 1.9883956278620926e-06, - "loss": 0.7378, - "step": 9023 - }, - { - "epoch": 0.23, - "learning_rate": 1.9883914242986965e-06, - "loss": 0.8525, - "step": 9024 - }, - { - "epoch": 0.23, - "learning_rate": 1.9883872199785346e-06, - "loss": 0.8887, - "step": 9025 - }, - { - "epoch": 0.23, - "learning_rate": 1.98838301490161e-06, - "loss": 0.8284, - "step": 9026 - }, - { - "epoch": 0.23, - "learning_rate": 1.9883788090679265e-06, - "loss": 0.8497, - "step": 9027 - }, - { - "epoch": 0.23, - "learning_rate": 1.9883746024774863e-06, - "loss": 0.8145, - "step": 9028 - }, - { - "epoch": 0.23, - "learning_rate": 1.988370395130293e-06, - "loss": 1.002, - "step": 9029 - }, - { - "epoch": 0.23, - "learning_rate": 1.9883661870263505e-06, - "loss": 0.6392, - "step": 9030 - }, - { - "epoch": 0.23, - "learning_rate": 1.9883619781656612e-06, - "loss": 0.6111, - "step": 9031 - }, - { - "epoch": 0.23, - "learning_rate": 1.988357768548228e-06, - "loss": 0.8975, - "step": 9032 - }, - { - "epoch": 0.23, - "learning_rate": 1.9883535581740553e-06, - "loss": 0.7441, - "step": 9033 - }, - { - "epoch": 0.23, - "learning_rate": 1.988349347043146e-06, - "loss": 0.957, - "step": 9034 - }, - { - "epoch": 0.23, - "learning_rate": 1.9883451351555026e-06, - "loss": 0.8093, - "step": 9035 - }, - { - "epoch": 0.23, - "learning_rate": 1.9883409225111286e-06, - "loss": 0.8936, - "step": 9036 - }, - { - "epoch": 0.23, - "learning_rate": 1.9883367091100276e-06, - "loss": 0.9307, - "step": 9037 - }, - { - "epoch": 0.23, - "learning_rate": 1.9883324949522027e-06, - "loss": 0.8438, - "step": 9038 - }, - { - "epoch": 0.23, - "learning_rate": 1.988328280037657e-06, - "loss": 0.7598, - "step": 9039 - }, - { - "epoch": 0.23, - "learning_rate": 1.988324064366394e-06, - "loss": 0.864, - "step": 9040 - }, - { - "epoch": 0.23, - "learning_rate": 1.9883198479384166e-06, - "loss": 0.8203, - "step": 9041 - }, - { - "epoch": 0.23, - "learning_rate": 1.988315630753728e-06, - "loss": 0.8984, - "step": 9042 - }, - { - "epoch": 0.23, - "learning_rate": 1.9883114128123317e-06, - "loss": 0.8369, - "step": 9043 - }, - { - "epoch": 0.23, - "learning_rate": 1.9883071941142306e-06, - "loss": 0.999, - "step": 9044 - }, - { - "epoch": 0.23, - "learning_rate": 1.9883029746594284e-06, - "loss": 0.7842, - "step": 9045 - }, - { - "epoch": 0.23, - "learning_rate": 1.988298754447928e-06, - "loss": 1.0186, - "step": 9046 - }, - { - "epoch": 0.23, - "learning_rate": 1.9882945334797324e-06, - "loss": 0.7549, - "step": 9047 - }, - { - "epoch": 0.23, - "learning_rate": 1.9882903117548455e-06, - "loss": 1.0664, - "step": 9048 - }, - { - "epoch": 0.23, - "learning_rate": 1.9882860892732697e-06, - "loss": 0.8672, - "step": 9049 - }, - { - "epoch": 0.23, - "learning_rate": 1.9882818660350093e-06, - "loss": 0.9395, - "step": 9050 - }, - { - "epoch": 0.23, - "learning_rate": 1.9882776420400664e-06, - "loss": 0.9287, - "step": 9051 - }, - { - "epoch": 0.23, - "learning_rate": 1.988273417288445e-06, - "loss": 0.8955, - "step": 9052 - }, - { - "epoch": 0.23, - "learning_rate": 1.988269191780148e-06, - "loss": 0.748, - "step": 9053 - }, - { - "epoch": 0.23, - "learning_rate": 1.9882649655151785e-06, - "loss": 0.8662, - "step": 9054 - }, - { - "epoch": 0.23, - "learning_rate": 1.9882607384935404e-06, - "loss": 0.9922, - "step": 9055 - }, - { - "epoch": 0.23, - "learning_rate": 1.988256510715236e-06, - "loss": 1.0508, - "step": 9056 - }, - { - "epoch": 0.23, - "learning_rate": 1.9882522821802694e-06, - "loss": 0.9463, - "step": 9057 - }, - { - "epoch": 0.23, - "learning_rate": 1.9882480528886436e-06, - "loss": 1.0742, - "step": 9058 - }, - { - "epoch": 0.23, - "learning_rate": 1.988243822840361e-06, - "loss": 1.0146, - "step": 9059 - }, - { - "epoch": 0.23, - "learning_rate": 1.9882395920354266e-06, - "loss": 0.959, - "step": 9060 - }, - { - "epoch": 0.23, - "learning_rate": 1.988235360473842e-06, - "loss": 0.8496, - "step": 9061 - }, - { - "epoch": 0.23, - "learning_rate": 1.9882311281556107e-06, - "loss": 0.9531, - "step": 9062 - }, - { - "epoch": 0.23, - "learning_rate": 1.9882268950807368e-06, - "loss": 0.918, - "step": 9063 - }, - { - "epoch": 0.23, - "learning_rate": 1.9882226612492227e-06, - "loss": 0.8555, - "step": 9064 - }, - { - "epoch": 0.23, - "learning_rate": 1.988218426661072e-06, - "loss": 0.8496, - "step": 9065 - }, - { - "epoch": 0.23, - "learning_rate": 1.988214191316288e-06, - "loss": 0.833, - "step": 9066 - }, - { - "epoch": 0.23, - "learning_rate": 1.9882099552148737e-06, - "loss": 0.9854, - "step": 9067 - }, - { - "epoch": 0.23, - "learning_rate": 1.9882057183568326e-06, - "loss": 0.75, - "step": 9068 - }, - { - "epoch": 0.23, - "learning_rate": 1.988201480742168e-06, - "loss": 0.8701, - "step": 9069 - }, - { - "epoch": 0.23, - "learning_rate": 1.9881972423708825e-06, - "loss": 1.0342, - "step": 9070 - }, - { - "epoch": 0.23, - "learning_rate": 1.9881930032429803e-06, - "loss": 0.9424, - "step": 9071 - }, - { - "epoch": 0.23, - "learning_rate": 1.988188763358464e-06, - "loss": 1.0693, - "step": 9072 - }, - { - "epoch": 0.23, - "learning_rate": 1.988184522717337e-06, - "loss": 0.874, - "step": 9073 - }, - { - "epoch": 0.23, - "learning_rate": 1.988180281319602e-06, - "loss": 1.2021, - "step": 9074 - }, - { - "epoch": 0.23, - "learning_rate": 1.988176039165263e-06, - "loss": 0.9492, - "step": 9075 - }, - { - "epoch": 0.23, - "learning_rate": 1.988171796254324e-06, - "loss": 1.2012, - "step": 9076 - }, - { - "epoch": 0.23, - "learning_rate": 1.9881675525867862e-06, - "loss": 0.8799, - "step": 9077 - }, - { - "epoch": 0.23, - "learning_rate": 1.9881633081626542e-06, - "loss": 0.8516, - "step": 9078 - }, - { - "epoch": 0.23, - "learning_rate": 1.9881590629819312e-06, - "loss": 0.9541, - "step": 9079 - }, - { - "epoch": 0.23, - "learning_rate": 1.98815481704462e-06, - "loss": 0.7065, - "step": 9080 - }, - { - "epoch": 0.23, - "learning_rate": 1.9881505703507245e-06, - "loss": 1.0264, - "step": 9081 - }, - { - "epoch": 0.23, - "learning_rate": 1.988146322900247e-06, - "loss": 0.9502, - "step": 9082 - }, - { - "epoch": 0.23, - "learning_rate": 1.988142074693192e-06, - "loss": 0.9424, - "step": 9083 - }, - { - "epoch": 0.23, - "learning_rate": 1.9881378257295617e-06, - "loss": 0.9199, - "step": 9084 - }, - { - "epoch": 0.23, - "learning_rate": 1.9881335760093596e-06, - "loss": 1.0176, - "step": 9085 - }, - { - "epoch": 0.23, - "learning_rate": 1.988129325532589e-06, - "loss": 0.9414, - "step": 9086 - }, - { - "epoch": 0.23, - "learning_rate": 1.9881250742992535e-06, - "loss": 1.0586, - "step": 9087 - }, - { - "epoch": 0.23, - "learning_rate": 1.988120822309356e-06, - "loss": 0.8457, - "step": 9088 - }, - { - "epoch": 0.23, - "learning_rate": 1.9881165695628995e-06, - "loss": 0.9473, - "step": 9089 - }, - { - "epoch": 0.23, - "learning_rate": 1.9881123160598876e-06, - "loss": 0.9541, - "step": 9090 - }, - { - "epoch": 0.23, - "learning_rate": 1.9881080618003237e-06, - "loss": 0.9531, - "step": 9091 - }, - { - "epoch": 0.23, - "learning_rate": 1.988103806784211e-06, - "loss": 0.592, - "step": 9092 - }, - { - "epoch": 0.23, - "learning_rate": 1.988099551011553e-06, - "loss": 0.7852, - "step": 9093 - }, - { - "epoch": 0.23, - "learning_rate": 1.9880952944823515e-06, - "loss": 0.8975, - "step": 9094 - }, - { - "epoch": 0.23, - "learning_rate": 1.9880910371966117e-06, - "loss": 0.9336, - "step": 9095 - }, - { - "epoch": 0.23, - "learning_rate": 1.9880867791543363e-06, - "loss": 1.1074, - "step": 9096 - }, - { - "epoch": 0.23, - "learning_rate": 1.9880825203555274e-06, - "loss": 1.0879, - "step": 9097 - }, - { - "epoch": 0.23, - "learning_rate": 1.98807826080019e-06, - "loss": 0.8042, - "step": 9098 - }, - { - "epoch": 0.23, - "learning_rate": 1.9880740004883257e-06, - "loss": 1.0781, - "step": 9099 - }, - { - "epoch": 0.23, - "learning_rate": 1.988069739419939e-06, - "loss": 0.9062, - "step": 9100 - }, - { - "epoch": 0.23, - "learning_rate": 1.988065477595033e-06, - "loss": 0.7451, - "step": 9101 - }, - { - "epoch": 0.23, - "learning_rate": 1.9880612150136102e-06, - "loss": 0.7354, - "step": 9102 - }, - { - "epoch": 0.23, - "learning_rate": 1.9880569516756747e-06, - "loss": 1.0254, - "step": 9103 - }, - { - "epoch": 0.23, - "learning_rate": 1.9880526875812294e-06, - "loss": 0.8799, - "step": 9104 - }, - { - "epoch": 0.23, - "learning_rate": 1.9880484227302775e-06, - "loss": 0.8984, - "step": 9105 - }, - { - "epoch": 0.23, - "learning_rate": 1.988044157122822e-06, - "loss": 0.8789, - "step": 9106 - }, - { - "epoch": 0.23, - "learning_rate": 1.9880398907588673e-06, - "loss": 0.8184, - "step": 9107 - }, - { - "epoch": 0.23, - "learning_rate": 1.988035623638415e-06, - "loss": 0.9756, - "step": 9108 - }, - { - "epoch": 0.23, - "learning_rate": 1.9880313557614697e-06, - "loss": 0.8018, - "step": 9109 - }, - { - "epoch": 0.23, - "learning_rate": 1.988027087128034e-06, - "loss": 0.8994, - "step": 9110 - }, - { - "epoch": 0.23, - "learning_rate": 1.988022817738112e-06, - "loss": 1.0098, - "step": 9111 - }, - { - "epoch": 0.23, - "learning_rate": 1.9880185475917058e-06, - "loss": 0.9082, - "step": 9112 - }, - { - "epoch": 0.23, - "learning_rate": 1.9880142766888194e-06, - "loss": 0.915, - "step": 9113 - }, - { - "epoch": 0.23, - "learning_rate": 1.988010005029456e-06, - "loss": 0.9492, - "step": 9114 - }, - { - "epoch": 0.23, - "learning_rate": 1.9880057326136185e-06, - "loss": 1.0859, - "step": 9115 - }, - { - "epoch": 0.23, - "learning_rate": 1.9880014594413107e-06, - "loss": 0.9766, - "step": 9116 - }, - { - "epoch": 0.23, - "learning_rate": 1.9879971855125355e-06, - "loss": 0.7783, - "step": 9117 - }, - { - "epoch": 0.23, - "learning_rate": 1.9879929108272964e-06, - "loss": 0.9795, - "step": 9118 - }, - { - "epoch": 0.23, - "learning_rate": 1.9879886353855967e-06, - "loss": 0.916, - "step": 9119 - }, - { - "epoch": 0.23, - "learning_rate": 1.987984359187439e-06, - "loss": 0.9922, - "step": 9120 - }, - { - "epoch": 0.23, - "learning_rate": 1.9879800822328276e-06, - "loss": 0.9541, - "step": 9121 - }, - { - "epoch": 0.23, - "learning_rate": 1.987975804521765e-06, - "loss": 0.7598, - "step": 9122 - }, - { - "epoch": 0.23, - "learning_rate": 1.9879715260542547e-06, - "loss": 0.8037, - "step": 9123 - }, - { - "epoch": 0.23, - "learning_rate": 1.9879672468303e-06, - "loss": 1.1074, - "step": 9124 - }, - { - "epoch": 0.23, - "learning_rate": 1.9879629668499044e-06, - "loss": 0.7017, - "step": 9125 - }, - { - "epoch": 0.23, - "learning_rate": 1.987958686113071e-06, - "loss": 0.8389, - "step": 9126 - }, - { - "epoch": 0.23, - "learning_rate": 1.9879544046198033e-06, - "loss": 0.9844, - "step": 9127 - }, - { - "epoch": 0.23, - "learning_rate": 1.987950122370104e-06, - "loss": 0.79, - "step": 9128 - }, - { - "epoch": 0.23, - "learning_rate": 1.9879458393639764e-06, - "loss": 0.8262, - "step": 9129 - }, - { - "epoch": 0.23, - "learning_rate": 1.9879415556014244e-06, - "loss": 0.9316, - "step": 9130 - }, - { - "epoch": 0.23, - "learning_rate": 1.9879372710824513e-06, - "loss": 0.9238, - "step": 9131 - }, - { - "epoch": 0.23, - "learning_rate": 1.9879329858070595e-06, - "loss": 1.1885, - "step": 9132 - }, - { - "epoch": 0.23, - "learning_rate": 1.9879286997752533e-06, - "loss": 0.833, - "step": 9133 - }, - { - "epoch": 0.23, - "learning_rate": 1.9879244129870357e-06, - "loss": 0.8335, - "step": 9134 - }, - { - "epoch": 0.23, - "learning_rate": 1.9879201254424092e-06, - "loss": 1.0273, - "step": 9135 - }, - { - "epoch": 0.23, - "learning_rate": 1.987915837141378e-06, - "loss": 1.001, - "step": 9136 - }, - { - "epoch": 0.23, - "learning_rate": 1.9879115480839452e-06, - "loss": 0.8174, - "step": 9137 - }, - { - "epoch": 0.23, - "learning_rate": 1.9879072582701136e-06, - "loss": 0.7651, - "step": 9138 - }, - { - "epoch": 0.23, - "learning_rate": 1.9879029676998867e-06, - "loss": 0.8828, - "step": 9139 - }, - { - "epoch": 0.23, - "learning_rate": 1.9878986763732683e-06, - "loss": 0.9219, - "step": 9140 - }, - { - "epoch": 0.23, - "learning_rate": 1.9878943842902617e-06, - "loss": 1.0576, - "step": 9141 - }, - { - "epoch": 0.23, - "learning_rate": 1.987890091450869e-06, - "loss": 0.9258, - "step": 9142 - }, - { - "epoch": 0.23, - "learning_rate": 1.9878857978550947e-06, - "loss": 0.9658, - "step": 9143 - }, - { - "epoch": 0.23, - "learning_rate": 1.987881503502942e-06, - "loss": 0.8594, - "step": 9144 - }, - { - "epoch": 0.23, - "learning_rate": 1.987877208394413e-06, - "loss": 0.8242, - "step": 9145 - }, - { - "epoch": 0.23, - "learning_rate": 1.987872912529512e-06, - "loss": 0.9658, - "step": 9146 - }, - { - "epoch": 0.23, - "learning_rate": 1.9878686159082428e-06, - "loss": 0.8564, - "step": 9147 - }, - { - "epoch": 0.23, - "learning_rate": 1.9878643185306077e-06, - "loss": 0.9043, - "step": 9148 - }, - { - "epoch": 0.23, - "learning_rate": 1.98786002039661e-06, - "loss": 0.7559, - "step": 9149 - }, - { - "epoch": 0.23, - "learning_rate": 1.9878557215062536e-06, - "loss": 1.001, - "step": 9150 - }, - { - "epoch": 0.23, - "learning_rate": 1.9878514218595414e-06, - "loss": 1.0381, - "step": 9151 - }, - { - "epoch": 0.23, - "learning_rate": 1.987847121456477e-06, - "loss": 0.6719, - "step": 9152 - }, - { - "epoch": 0.23, - "learning_rate": 1.987842820297063e-06, - "loss": 0.79, - "step": 9153 - }, - { - "epoch": 0.23, - "learning_rate": 1.987838518381304e-06, - "loss": 0.8828, - "step": 9154 - }, - { - "epoch": 0.23, - "learning_rate": 1.987834215709202e-06, - "loss": 0.7593, - "step": 9155 - }, - { - "epoch": 0.23, - "learning_rate": 1.987829912280761e-06, - "loss": 0.959, - "step": 9156 - }, - { - "epoch": 0.23, - "learning_rate": 1.9878256080959832e-06, - "loss": 0.8799, - "step": 9157 - }, - { - "epoch": 0.23, - "learning_rate": 1.9878213031548733e-06, - "loss": 0.9775, - "step": 9158 - }, - { - "epoch": 0.23, - "learning_rate": 1.987816997457434e-06, - "loss": 0.8643, - "step": 9159 - }, - { - "epoch": 0.23, - "learning_rate": 1.987812691003669e-06, - "loss": 0.9189, - "step": 9160 - }, - { - "epoch": 0.23, - "learning_rate": 1.9878083837935812e-06, - "loss": 0.8281, - "step": 9161 - }, - { - "epoch": 0.23, - "learning_rate": 1.9878040758271733e-06, - "loss": 1.0, - "step": 9162 - }, - { - "epoch": 0.23, - "learning_rate": 1.98779976710445e-06, - "loss": 1.042, - "step": 9163 - }, - { - "epoch": 0.23, - "learning_rate": 1.9877954576254133e-06, - "loss": 0.8555, - "step": 9164 - }, - { - "epoch": 0.23, - "learning_rate": 1.987791147390067e-06, - "loss": 1.0088, - "step": 9165 - }, - { - "epoch": 0.23, - "learning_rate": 1.987786836398415e-06, - "loss": 0.8711, - "step": 9166 - }, - { - "epoch": 0.23, - "learning_rate": 1.98778252465046e-06, - "loss": 0.7246, - "step": 9167 - }, - { - "epoch": 0.23, - "learning_rate": 1.987778212146205e-06, - "loss": 0.7979, - "step": 9168 - }, - { - "epoch": 0.24, - "learning_rate": 1.9877738988856536e-06, - "loss": 0.9697, - "step": 9169 - }, - { - "epoch": 0.24, - "learning_rate": 1.9877695848688094e-06, - "loss": 1.04, - "step": 9170 - }, - { - "epoch": 0.24, - "learning_rate": 1.987765270095675e-06, - "loss": 0.918, - "step": 9171 - }, - { - "epoch": 0.24, - "learning_rate": 1.9877609545662545e-06, - "loss": 0.959, - "step": 9172 - }, - { - "epoch": 0.24, - "learning_rate": 1.9877566382805507e-06, - "loss": 0.8701, - "step": 9173 - }, - { - "epoch": 0.24, - "learning_rate": 1.9877523212385673e-06, - "loss": 1.0298, - "step": 9174 - }, - { - "epoch": 0.24, - "learning_rate": 1.9877480034403074e-06, - "loss": 0.9067, - "step": 9175 - }, - { - "epoch": 0.24, - "learning_rate": 1.987743684885774e-06, - "loss": 0.9365, - "step": 9176 - }, - { - "epoch": 0.24, - "learning_rate": 1.9877393655749706e-06, - "loss": 0.8018, - "step": 9177 - }, - { - "epoch": 0.24, - "learning_rate": 1.987735045507901e-06, - "loss": 0.8906, - "step": 9178 - }, - { - "epoch": 0.24, - "learning_rate": 1.987730724684568e-06, - "loss": 0.8262, - "step": 9179 - }, - { - "epoch": 0.24, - "learning_rate": 1.9877264031049747e-06, - "loss": 0.8389, - "step": 9180 - }, - { - "epoch": 0.24, - "learning_rate": 1.9877220807691246e-06, - "loss": 1.0137, - "step": 9181 - }, - { - "epoch": 0.24, - "learning_rate": 1.9877177576770216e-06, - "loss": 0.9521, - "step": 9182 - }, - { - "epoch": 0.24, - "learning_rate": 1.9877134338286684e-06, - "loss": 1.1621, - "step": 9183 - }, - { - "epoch": 0.24, - "learning_rate": 1.987709109224068e-06, - "loss": 0.8799, - "step": 9184 - }, - { - "epoch": 0.24, - "learning_rate": 1.987704783863225e-06, - "loss": 1.0957, - "step": 9185 - }, - { - "epoch": 0.24, - "learning_rate": 1.987700457746141e-06, - "loss": 0.8438, - "step": 9186 - }, - { - "epoch": 0.24, - "learning_rate": 1.9876961308728206e-06, - "loss": 0.877, - "step": 9187 - }, - { - "epoch": 0.24, - "learning_rate": 1.9876918032432667e-06, - "loss": 0.644, - "step": 9188 - }, - { - "epoch": 0.24, - "learning_rate": 1.9876874748574825e-06, - "loss": 0.6123, - "step": 9189 - }, - { - "epoch": 0.24, - "learning_rate": 1.9876831457154716e-06, - "loss": 0.8301, - "step": 9190 - }, - { - "epoch": 0.24, - "learning_rate": 1.987678815817237e-06, - "loss": 0.9609, - "step": 9191 - }, - { - "epoch": 0.24, - "learning_rate": 1.987674485162782e-06, - "loss": 0.6943, - "step": 9192 - }, - { - "epoch": 0.24, - "learning_rate": 1.9876701537521103e-06, - "loss": 0.9229, - "step": 9193 - }, - { - "epoch": 0.24, - "learning_rate": 1.987665821585225e-06, - "loss": 0.8662, - "step": 9194 - }, - { - "epoch": 0.24, - "learning_rate": 1.987661488662129e-06, - "loss": 1.0166, - "step": 9195 - }, - { - "epoch": 0.24, - "learning_rate": 1.987657154982826e-06, - "loss": 1.001, - "step": 9196 - }, - { - "epoch": 0.24, - "learning_rate": 1.98765282054732e-06, - "loss": 0.7109, - "step": 9197 - }, - { - "epoch": 0.24, - "learning_rate": 1.987648485355613e-06, - "loss": 1.0928, - "step": 9198 - }, - { - "epoch": 0.24, - "learning_rate": 1.9876441494077093e-06, - "loss": 0.9287, - "step": 9199 - }, - { - "epoch": 0.24, - "learning_rate": 1.987639812703612e-06, - "loss": 0.9482, - "step": 9200 - }, - { - "epoch": 0.24, - "learning_rate": 1.987635475243324e-06, - "loss": 1.1084, - "step": 9201 - }, - { - "epoch": 0.24, - "learning_rate": 1.987631137026849e-06, - "loss": 0.6577, - "step": 9202 - }, - { - "epoch": 0.24, - "learning_rate": 1.9876267980541905e-06, - "loss": 0.9121, - "step": 9203 - }, - { - "epoch": 0.24, - "learning_rate": 1.9876224583253515e-06, - "loss": 0.8877, - "step": 9204 - }, - { - "epoch": 0.24, - "learning_rate": 1.9876181178403353e-06, - "loss": 1.1387, - "step": 9205 - }, - { - "epoch": 0.24, - "learning_rate": 1.9876137765991448e-06, - "loss": 0.7637, - "step": 9206 - }, - { - "epoch": 0.24, - "learning_rate": 1.9876094346017843e-06, - "loss": 0.9473, - "step": 9207 - }, - { - "epoch": 0.24, - "learning_rate": 1.9876050918482567e-06, - "loss": 0.9473, - "step": 9208 - }, - { - "epoch": 0.24, - "learning_rate": 1.9876007483385654e-06, - "loss": 0.9043, - "step": 9209 - }, - { - "epoch": 0.24, - "learning_rate": 1.9875964040727135e-06, - "loss": 1.2295, - "step": 9210 - }, - { - "epoch": 0.24, - "learning_rate": 1.9875920590507046e-06, - "loss": 0.958, - "step": 9211 - }, - { - "epoch": 0.24, - "learning_rate": 1.9875877132725418e-06, - "loss": 1.0127, - "step": 9212 - }, - { - "epoch": 0.24, - "learning_rate": 1.9875833667382284e-06, - "loss": 0.8945, - "step": 9213 - }, - { - "epoch": 0.24, - "learning_rate": 1.987579019447768e-06, - "loss": 0.8936, - "step": 9214 - }, - { - "epoch": 0.24, - "learning_rate": 1.9875746714011632e-06, - "loss": 1.0, - "step": 9215 - }, - { - "epoch": 0.24, - "learning_rate": 1.9875703225984186e-06, - "loss": 0.7671, - "step": 9216 - }, - { - "epoch": 0.24, - "learning_rate": 1.9875659730395365e-06, - "loss": 0.8027, - "step": 9217 - }, - { - "epoch": 0.24, - "learning_rate": 1.9875616227245204e-06, - "loss": 1.0098, - "step": 9218 - }, - { - "epoch": 0.24, - "learning_rate": 1.9875572716533736e-06, - "loss": 0.8408, - "step": 9219 - }, - { - "epoch": 0.24, - "learning_rate": 1.9875529198261e-06, - "loss": 0.6987, - "step": 9220 - }, - { - "epoch": 0.24, - "learning_rate": 1.9875485672427026e-06, - "loss": 1.0186, - "step": 9221 - }, - { - "epoch": 0.24, - "learning_rate": 1.9875442139031847e-06, - "loss": 0.9766, - "step": 9222 - }, - { - "epoch": 0.24, - "learning_rate": 1.9875398598075492e-06, - "loss": 1.0371, - "step": 9223 - }, - { - "epoch": 0.24, - "learning_rate": 1.9875355049558e-06, - "loss": 0.7357, - "step": 9224 - }, - { - "epoch": 0.24, - "learning_rate": 1.9875311493479406e-06, - "loss": 1.0713, - "step": 9225 - }, - { - "epoch": 0.24, - "learning_rate": 1.987526792983974e-06, - "loss": 1.0684, - "step": 9226 - }, - { - "epoch": 0.24, - "learning_rate": 1.987522435863903e-06, - "loss": 0.9346, - "step": 9227 - }, - { - "epoch": 0.24, - "learning_rate": 1.9875180779877317e-06, - "loss": 0.8643, - "step": 9228 - }, - { - "epoch": 0.24, - "learning_rate": 1.9875137193554632e-06, - "loss": 0.7808, - "step": 9229 - }, - { - "epoch": 0.24, - "learning_rate": 1.987509359967101e-06, - "loss": 1.0566, - "step": 9230 - }, - { - "epoch": 0.24, - "learning_rate": 1.987504999822648e-06, - "loss": 0.9668, - "step": 9231 - }, - { - "epoch": 0.24, - "learning_rate": 1.9875006389221085e-06, - "loss": 0.6887, - "step": 9232 - }, - { - "epoch": 0.24, - "learning_rate": 1.9874962772654842e-06, - "loss": 0.8027, - "step": 9233 - }, - { - "epoch": 0.24, - "learning_rate": 1.9874919148527806e-06, - "loss": 0.9199, - "step": 9234 - }, - { - "epoch": 0.24, - "learning_rate": 1.987487551683999e-06, - "loss": 0.832, - "step": 9235 - }, - { - "epoch": 0.24, - "learning_rate": 1.9874831877591437e-06, - "loss": 0.7275, - "step": 9236 - }, - { - "epoch": 0.24, - "learning_rate": 1.987478823078218e-06, - "loss": 0.8545, - "step": 9237 - }, - { - "epoch": 0.24, - "learning_rate": 1.987474457641225e-06, - "loss": 0.9023, - "step": 9238 - }, - { - "epoch": 0.24, - "learning_rate": 1.9874700914481686e-06, - "loss": 1.1055, - "step": 9239 - }, - { - "epoch": 0.24, - "learning_rate": 1.9874657244990513e-06, - "loss": 0.79, - "step": 9240 - }, - { - "epoch": 0.24, - "learning_rate": 1.987461356793877e-06, - "loss": 0.8789, - "step": 9241 - }, - { - "epoch": 0.24, - "learning_rate": 1.987456988332649e-06, - "loss": 1.0352, - "step": 9242 - }, - { - "epoch": 0.24, - "learning_rate": 1.987452619115371e-06, - "loss": 0.8164, - "step": 9243 - }, - { - "epoch": 0.24, - "learning_rate": 1.9874482491420455e-06, - "loss": 1.0518, - "step": 9244 - }, - { - "epoch": 0.24, - "learning_rate": 1.9874438784126765e-06, - "loss": 1.0557, - "step": 9245 - }, - { - "epoch": 0.24, - "learning_rate": 1.987439506927267e-06, - "loss": 1.0381, - "step": 9246 - }, - { - "epoch": 0.24, - "learning_rate": 1.9874351346858205e-06, - "loss": 0.792, - "step": 9247 - }, - { - "epoch": 0.24, - "learning_rate": 1.98743076168834e-06, - "loss": 0.9609, - "step": 9248 - }, - { - "epoch": 0.24, - "learning_rate": 1.9874263879348295e-06, - "loss": 0.8232, - "step": 9249 - }, - { - "epoch": 0.24, - "learning_rate": 1.9874220134252922e-06, - "loss": 0.8604, - "step": 9250 - }, - { - "epoch": 0.24, - "learning_rate": 1.987417638159731e-06, - "loss": 0.9805, - "step": 9251 - }, - { - "epoch": 0.24, - "learning_rate": 1.9874132621381497e-06, - "loss": 0.9043, - "step": 9252 - }, - { - "epoch": 0.24, - "learning_rate": 1.987408885360551e-06, - "loss": 0.9893, - "step": 9253 - }, - { - "epoch": 0.24, - "learning_rate": 1.9874045078269394e-06, - "loss": 0.5669, - "step": 9254 - }, - { - "epoch": 0.24, - "learning_rate": 1.9874001295373172e-06, - "loss": 0.7163, - "step": 9255 - }, - { - "epoch": 0.24, - "learning_rate": 1.987395750491688e-06, - "loss": 0.9707, - "step": 9256 - }, - { - "epoch": 0.24, - "learning_rate": 1.9873913706900558e-06, - "loss": 0.751, - "step": 9257 - }, - { - "epoch": 0.24, - "learning_rate": 1.987386990132423e-06, - "loss": 0.8354, - "step": 9258 - }, - { - "epoch": 0.24, - "learning_rate": 1.987382608818793e-06, - "loss": 0.916, - "step": 9259 - }, - { - "epoch": 0.24, - "learning_rate": 1.98737822674917e-06, - "loss": 0.8135, - "step": 9260 - }, - { - "epoch": 0.24, - "learning_rate": 1.987373843923557e-06, - "loss": 0.9482, - "step": 9261 - }, - { - "epoch": 0.24, - "learning_rate": 1.987369460341957e-06, - "loss": 1.1562, - "step": 9262 - }, - { - "epoch": 0.24, - "learning_rate": 1.987365076004374e-06, - "loss": 0.9854, - "step": 9263 - }, - { - "epoch": 0.24, - "learning_rate": 1.9873606909108104e-06, - "loss": 0.9385, - "step": 9264 - }, - { - "epoch": 0.24, - "learning_rate": 1.9873563050612706e-06, - "loss": 0.7842, - "step": 9265 - }, - { - "epoch": 0.24, - "learning_rate": 1.987351918455757e-06, - "loss": 0.8491, - "step": 9266 - }, - { - "epoch": 0.24, - "learning_rate": 1.987347531094274e-06, - "loss": 0.6943, - "step": 9267 - }, - { - "epoch": 0.24, - "learning_rate": 1.9873431429768243e-06, - "loss": 0.9883, - "step": 9268 - }, - { - "epoch": 0.24, - "learning_rate": 1.987338754103411e-06, - "loss": 0.835, - "step": 9269 - }, - { - "epoch": 0.24, - "learning_rate": 1.987334364474038e-06, - "loss": 0.9775, - "step": 9270 - }, - { - "epoch": 0.24, - "learning_rate": 1.9873299740887086e-06, - "loss": 0.876, - "step": 9271 - }, - { - "epoch": 0.24, - "learning_rate": 1.9873255829474257e-06, - "loss": 0.7861, - "step": 9272 - }, - { - "epoch": 0.24, - "learning_rate": 1.987321191050193e-06, - "loss": 1.123, - "step": 9273 - }, - { - "epoch": 0.24, - "learning_rate": 1.9873167983970143e-06, - "loss": 1.1172, - "step": 9274 - }, - { - "epoch": 0.24, - "learning_rate": 1.987312404987892e-06, - "loss": 0.9531, - "step": 9275 - }, - { - "epoch": 0.24, - "learning_rate": 1.9873080108228307e-06, - "loss": 0.7893, - "step": 9276 - }, - { - "epoch": 0.24, - "learning_rate": 1.9873036159018323e-06, - "loss": 0.9531, - "step": 9277 - }, - { - "epoch": 0.24, - "learning_rate": 1.9872992202249014e-06, - "loss": 0.9062, - "step": 9278 - }, - { - "epoch": 0.24, - "learning_rate": 1.9872948237920406e-06, - "loss": 1.1621, - "step": 9279 - }, - { - "epoch": 0.24, - "learning_rate": 1.9872904266032537e-06, - "loss": 1.0234, - "step": 9280 - }, - { - "epoch": 0.24, - "learning_rate": 1.987286028658544e-06, - "loss": 0.9395, - "step": 9281 - }, - { - "epoch": 0.24, - "learning_rate": 1.9872816299579144e-06, - "loss": 0.917, - "step": 9282 - }, - { - "epoch": 0.24, - "learning_rate": 1.987277230501369e-06, - "loss": 1.123, - "step": 9283 - }, - { - "epoch": 0.24, - "learning_rate": 1.987272830288911e-06, - "loss": 1.0654, - "step": 9284 - }, - { - "epoch": 0.24, - "learning_rate": 1.9872684293205433e-06, - "loss": 0.9053, - "step": 9285 - }, - { - "epoch": 0.24, - "learning_rate": 1.9872640275962693e-06, - "loss": 0.7354, - "step": 9286 - }, - { - "epoch": 0.24, - "learning_rate": 1.987259625116093e-06, - "loss": 0.916, - "step": 9287 - }, - { - "epoch": 0.24, - "learning_rate": 1.9872552218800178e-06, - "loss": 0.9609, - "step": 9288 - }, - { - "epoch": 0.24, - "learning_rate": 1.987250817888046e-06, - "loss": 1.0615, - "step": 9289 - }, - { - "epoch": 0.24, - "learning_rate": 1.9872464131401818e-06, - "loss": 0.917, - "step": 9290 - }, - { - "epoch": 0.24, - "learning_rate": 1.9872420076364286e-06, - "loss": 0.8633, - "step": 9291 - }, - { - "epoch": 0.24, - "learning_rate": 1.987237601376789e-06, - "loss": 0.9072, - "step": 9292 - }, - { - "epoch": 0.24, - "learning_rate": 1.9872331943612677e-06, - "loss": 1.0273, - "step": 9293 - }, - { - "epoch": 0.24, - "learning_rate": 1.9872287865898668e-06, - "loss": 0.793, - "step": 9294 - }, - { - "epoch": 0.24, - "learning_rate": 1.987224378062591e-06, - "loss": 0.7305, - "step": 9295 - }, - { - "epoch": 0.24, - "learning_rate": 1.987219968779442e-06, - "loss": 0.9668, - "step": 9296 - }, - { - "epoch": 0.24, - "learning_rate": 1.9872155587404246e-06, - "loss": 1.0049, - "step": 9297 - }, - { - "epoch": 0.24, - "learning_rate": 1.9872111479455413e-06, - "loss": 1.0283, - "step": 9298 - }, - { - "epoch": 0.24, - "learning_rate": 1.987206736394796e-06, - "loss": 0.5579, - "step": 9299 - }, - { - "epoch": 0.24, - "learning_rate": 1.987202324088192e-06, - "loss": 1.0264, - "step": 9300 - }, - { - "epoch": 0.24, - "learning_rate": 1.9871979110257324e-06, - "loss": 0.8145, - "step": 9301 - }, - { - "epoch": 0.24, - "learning_rate": 1.987193497207421e-06, - "loss": 0.8574, - "step": 9302 - }, - { - "epoch": 0.24, - "learning_rate": 1.9871890826332603e-06, - "loss": 1.082, - "step": 9303 - }, - { - "epoch": 0.24, - "learning_rate": 1.987184667303255e-06, - "loss": 1.0439, - "step": 9304 - }, - { - "epoch": 0.24, - "learning_rate": 1.9871802512174074e-06, - "loss": 0.624, - "step": 9305 - }, - { - "epoch": 0.24, - "learning_rate": 1.9871758343757214e-06, - "loss": 1.082, - "step": 9306 - }, - { - "epoch": 0.24, - "learning_rate": 1.9871714167782004e-06, - "loss": 1.1514, - "step": 9307 - }, - { - "epoch": 0.24, - "learning_rate": 1.9871669984248473e-06, - "loss": 0.8154, - "step": 9308 - }, - { - "epoch": 0.24, - "learning_rate": 1.987162579315666e-06, - "loss": 0.7529, - "step": 9309 - }, - { - "epoch": 0.24, - "learning_rate": 1.98715815945066e-06, - "loss": 1.0615, - "step": 9310 - }, - { - "epoch": 0.24, - "learning_rate": 1.9871537388298317e-06, - "loss": 0.9199, - "step": 9311 - }, - { - "epoch": 0.24, - "learning_rate": 1.9871493174531856e-06, - "loss": 1.1094, - "step": 9312 - }, - { - "epoch": 0.24, - "learning_rate": 1.9871448953207247e-06, - "loss": 0.9697, - "step": 9313 - }, - { - "epoch": 0.24, - "learning_rate": 1.987140472432452e-06, - "loss": 0.7871, - "step": 9314 - }, - { - "epoch": 0.24, - "learning_rate": 1.987136048788372e-06, - "loss": 0.9033, - "step": 9315 - }, - { - "epoch": 0.24, - "learning_rate": 1.987131624388487e-06, - "loss": 1.0146, - "step": 9316 - }, - { - "epoch": 0.24, - "learning_rate": 1.9871271992328003e-06, - "loss": 1.166, - "step": 9317 - }, - { - "epoch": 0.24, - "learning_rate": 1.987122773321316e-06, - "loss": 0.8799, - "step": 9318 - }, - { - "epoch": 0.24, - "learning_rate": 1.987118346654037e-06, - "loss": 0.832, - "step": 9319 - }, - { - "epoch": 0.24, - "learning_rate": 1.987113919230967e-06, - "loss": 0.6704, - "step": 9320 - }, - { - "epoch": 0.24, - "learning_rate": 1.9871094910521093e-06, - "loss": 1.2793, - "step": 9321 - }, - { - "epoch": 0.24, - "learning_rate": 1.9871050621174673e-06, - "loss": 1.0957, - "step": 9322 - }, - { - "epoch": 0.24, - "learning_rate": 1.9871006324270437e-06, - "loss": 0.8252, - "step": 9323 - }, - { - "epoch": 0.24, - "learning_rate": 1.987096201980843e-06, - "loss": 0.8174, - "step": 9324 - }, - { - "epoch": 0.24, - "learning_rate": 1.9870917707788684e-06, - "loss": 1.2246, - "step": 9325 - }, - { - "epoch": 0.24, - "learning_rate": 1.987087338821123e-06, - "loss": 0.9785, - "step": 9326 - }, - { - "epoch": 0.24, - "learning_rate": 1.98708290610761e-06, - "loss": 0.75, - "step": 9327 - }, - { - "epoch": 0.24, - "learning_rate": 1.987078472638333e-06, - "loss": 0.9092, - "step": 9328 - }, - { - "epoch": 0.24, - "learning_rate": 1.9870740384132954e-06, - "loss": 0.9053, - "step": 9329 - }, - { - "epoch": 0.24, - "learning_rate": 1.987069603432501e-06, - "loss": 1.0098, - "step": 9330 - }, - { - "epoch": 0.24, - "learning_rate": 1.987065167695952e-06, - "loss": 0.8613, - "step": 9331 - }, - { - "epoch": 0.24, - "learning_rate": 1.987060731203653e-06, - "loss": 0.9404, - "step": 9332 - }, - { - "epoch": 0.24, - "learning_rate": 1.987056293955607e-06, - "loss": 0.9707, - "step": 9333 - }, - { - "epoch": 0.24, - "learning_rate": 1.9870518559518176e-06, - "loss": 0.8223, - "step": 9334 - }, - { - "epoch": 0.24, - "learning_rate": 1.9870474171922876e-06, - "loss": 0.9766, - "step": 9335 - }, - { - "epoch": 0.24, - "learning_rate": 1.987042977677021e-06, - "loss": 0.8154, - "step": 9336 - }, - { - "epoch": 0.24, - "learning_rate": 1.987038537406021e-06, - "loss": 0.8447, - "step": 9337 - }, - { - "epoch": 0.24, - "learning_rate": 1.9870340963792906e-06, - "loss": 0.8418, - "step": 9338 - }, - { - "epoch": 0.24, - "learning_rate": 1.9870296545968342e-06, - "loss": 0.9268, - "step": 9339 - }, - { - "epoch": 0.24, - "learning_rate": 1.9870252120586542e-06, - "loss": 0.9404, - "step": 9340 - }, - { - "epoch": 0.24, - "learning_rate": 1.987020768764754e-06, - "loss": 1.0303, - "step": 9341 - }, - { - "epoch": 0.24, - "learning_rate": 1.9870163247151378e-06, - "loss": 1.0381, - "step": 9342 - }, - { - "epoch": 0.24, - "learning_rate": 1.987011879909809e-06, - "loss": 0.8018, - "step": 9343 - }, - { - "epoch": 0.24, - "learning_rate": 1.98700743434877e-06, - "loss": 0.8672, - "step": 9344 - }, - { - "epoch": 0.24, - "learning_rate": 1.987002988032025e-06, - "loss": 0.8066, - "step": 9345 - }, - { - "epoch": 0.24, - "learning_rate": 1.986998540959577e-06, - "loss": 0.8408, - "step": 9346 - }, - { - "epoch": 0.24, - "learning_rate": 1.9869940931314297e-06, - "loss": 1.1885, - "step": 9347 - }, - { - "epoch": 0.24, - "learning_rate": 1.986989644547587e-06, - "loss": 1.1172, - "step": 9348 - }, - { - "epoch": 0.24, - "learning_rate": 1.9869851952080507e-06, - "loss": 1.1416, - "step": 9349 - }, - { - "epoch": 0.24, - "learning_rate": 1.986980745112826e-06, - "loss": 1.2637, - "step": 9350 - }, - { - "epoch": 0.24, - "learning_rate": 1.986976294261915e-06, - "loss": 1.1592, - "step": 9351 - }, - { - "epoch": 0.24, - "learning_rate": 1.9869718426553218e-06, - "loss": 0.9277, - "step": 9352 - }, - { - "epoch": 0.24, - "learning_rate": 1.9869673902930495e-06, - "loss": 1.1191, - "step": 9353 - }, - { - "epoch": 0.24, - "learning_rate": 1.986962937175102e-06, - "loss": 0.5625, - "step": 9354 - }, - { - "epoch": 0.24, - "learning_rate": 1.9869584833014824e-06, - "loss": 0.9355, - "step": 9355 - }, - { - "epoch": 0.24, - "learning_rate": 1.986954028672194e-06, - "loss": 0.7939, - "step": 9356 - }, - { - "epoch": 0.24, - "learning_rate": 1.98694957328724e-06, - "loss": 0.9551, - "step": 9357 - }, - { - "epoch": 0.24, - "learning_rate": 1.9869451171466244e-06, - "loss": 1.084, - "step": 9358 - }, - { - "epoch": 0.24, - "learning_rate": 1.98694066025035e-06, - "loss": 1.0234, - "step": 9359 - }, - { - "epoch": 0.24, - "learning_rate": 1.9869362025984205e-06, - "loss": 0.6665, - "step": 9360 - }, - { - "epoch": 0.24, - "learning_rate": 1.98693174419084e-06, - "loss": 0.8535, - "step": 9361 - }, - { - "epoch": 0.24, - "learning_rate": 1.9869272850276105e-06, - "loss": 0.8193, - "step": 9362 - }, - { - "epoch": 0.24, - "learning_rate": 1.9869228251087363e-06, - "loss": 0.9844, - "step": 9363 - }, - { - "epoch": 0.24, - "learning_rate": 1.986918364434221e-06, - "loss": 1.0059, - "step": 9364 - }, - { - "epoch": 0.24, - "learning_rate": 1.986913903004067e-06, - "loss": 0.9834, - "step": 9365 - }, - { - "epoch": 0.24, - "learning_rate": 1.986909440818279e-06, - "loss": 1.0332, - "step": 9366 - }, - { - "epoch": 0.24, - "learning_rate": 1.9869049778768597e-06, - "loss": 0.8799, - "step": 9367 - }, - { - "epoch": 0.24, - "learning_rate": 1.9869005141798128e-06, - "loss": 0.9756, - "step": 9368 - }, - { - "epoch": 0.24, - "learning_rate": 1.9868960497271413e-06, - "loss": 1.0527, - "step": 9369 - }, - { - "epoch": 0.24, - "learning_rate": 1.986891584518849e-06, - "loss": 0.8906, - "step": 9370 - }, - { - "epoch": 0.24, - "learning_rate": 1.986887118554939e-06, - "loss": 1.0176, - "step": 9371 - }, - { - "epoch": 0.24, - "learning_rate": 1.9868826518354153e-06, - "loss": 0.9458, - "step": 9372 - }, - { - "epoch": 0.24, - "learning_rate": 1.986878184360281e-06, - "loss": 0.96, - "step": 9373 - }, - { - "epoch": 0.24, - "learning_rate": 1.986873716129539e-06, - "loss": 0.7852, - "step": 9374 - }, - { - "epoch": 0.24, - "learning_rate": 1.986869247143193e-06, - "loss": 1.0645, - "step": 9375 - }, - { - "epoch": 0.24, - "learning_rate": 1.986864777401247e-06, - "loss": 0.7744, - "step": 9376 - }, - { - "epoch": 0.24, - "learning_rate": 1.986860306903704e-06, - "loss": 0.9883, - "step": 9377 - }, - { - "epoch": 0.24, - "learning_rate": 1.9868558356505674e-06, - "loss": 0.9473, - "step": 9378 - }, - { - "epoch": 0.24, - "learning_rate": 1.9868513636418408e-06, - "loss": 0.7764, - "step": 9379 - }, - { - "epoch": 0.24, - "learning_rate": 1.9868468908775272e-06, - "loss": 0.8057, - "step": 9380 - }, - { - "epoch": 0.24, - "learning_rate": 1.9868424173576302e-06, - "loss": 0.8643, - "step": 9381 - }, - { - "epoch": 0.24, - "learning_rate": 1.9868379430821536e-06, - "loss": 1.0352, - "step": 9382 - }, - { - "epoch": 0.24, - "learning_rate": 1.9868334680511007e-06, - "loss": 0.916, - "step": 9383 - }, - { - "epoch": 0.24, - "learning_rate": 1.9868289922644745e-06, - "loss": 1.0547, - "step": 9384 - }, - { - "epoch": 0.24, - "learning_rate": 1.986824515722279e-06, - "loss": 0.7979, - "step": 9385 - }, - { - "epoch": 0.24, - "learning_rate": 1.986820038424517e-06, - "loss": 0.958, - "step": 9386 - }, - { - "epoch": 0.24, - "learning_rate": 1.9868155603711926e-06, - "loss": 0.9297, - "step": 9387 - }, - { - "epoch": 0.24, - "learning_rate": 1.986811081562309e-06, - "loss": 0.8633, - "step": 9388 - }, - { - "epoch": 0.24, - "learning_rate": 1.986806601997869e-06, - "loss": 1.0117, - "step": 9389 - }, - { - "epoch": 0.24, - "learning_rate": 1.986802121677877e-06, - "loss": 0.9678, - "step": 9390 - }, - { - "epoch": 0.24, - "learning_rate": 1.986797640602336e-06, - "loss": 0.7827, - "step": 9391 - }, - { - "epoch": 0.24, - "learning_rate": 1.986793158771249e-06, - "loss": 0.959, - "step": 9392 - }, - { - "epoch": 0.24, - "learning_rate": 1.98678867618462e-06, - "loss": 1.0352, - "step": 9393 - }, - { - "epoch": 0.24, - "learning_rate": 1.9867841928424526e-06, - "loss": 0.9404, - "step": 9394 - }, - { - "epoch": 0.24, - "learning_rate": 1.9867797087447498e-06, - "loss": 0.9092, - "step": 9395 - }, - { - "epoch": 0.24, - "learning_rate": 1.9867752238915147e-06, - "loss": 0.9482, - "step": 9396 - }, - { - "epoch": 0.24, - "learning_rate": 1.9867707382827516e-06, - "loss": 0.8096, - "step": 9397 - }, - { - "epoch": 0.24, - "learning_rate": 1.9867662519184635e-06, - "loss": 0.9863, - "step": 9398 - }, - { - "epoch": 0.24, - "learning_rate": 1.986761764798654e-06, - "loss": 0.8135, - "step": 9399 - }, - { - "epoch": 0.24, - "learning_rate": 1.9867572769233263e-06, - "loss": 0.8486, - "step": 9400 - }, - { - "epoch": 0.24, - "learning_rate": 1.986752788292484e-06, - "loss": 0.9209, - "step": 9401 - }, - { - "epoch": 0.24, - "learning_rate": 1.98674829890613e-06, - "loss": 0.9502, - "step": 9402 - }, - { - "epoch": 0.24, - "learning_rate": 1.9867438087642686e-06, - "loss": 0.8838, - "step": 9403 - }, - { - "epoch": 0.24, - "learning_rate": 1.9867393178669024e-06, - "loss": 0.9668, - "step": 9404 - }, - { - "epoch": 0.24, - "learning_rate": 1.986734826214036e-06, - "loss": 1.1484, - "step": 9405 - }, - { - "epoch": 0.24, - "learning_rate": 1.9867303338056717e-06, - "loss": 1.0195, - "step": 9406 - }, - { - "epoch": 0.24, - "learning_rate": 1.986725840641813e-06, - "loss": 0.9463, - "step": 9407 - }, - { - "epoch": 0.24, - "learning_rate": 1.986721346722464e-06, - "loss": 1.0439, - "step": 9408 - }, - { - "epoch": 0.24, - "learning_rate": 1.9867168520476284e-06, - "loss": 0.876, - "step": 9409 - }, - { - "epoch": 0.24, - "learning_rate": 1.986712356617308e-06, - "loss": 0.9463, - "step": 9410 - }, - { - "epoch": 0.24, - "learning_rate": 1.9867078604315083e-06, - "loss": 0.9785, - "step": 9411 - }, - { - "epoch": 0.24, - "learning_rate": 1.9867033634902313e-06, - "loss": 1.0635, - "step": 9412 - }, - { - "epoch": 0.24, - "learning_rate": 1.986698865793481e-06, - "loss": 0.9131, - "step": 9413 - }, - { - "epoch": 0.24, - "learning_rate": 1.9866943673412607e-06, - "loss": 0.8428, - "step": 9414 - }, - { - "epoch": 0.24, - "learning_rate": 1.9866898681335738e-06, - "loss": 0.8467, - "step": 9415 - }, - { - "epoch": 0.24, - "learning_rate": 1.986685368170424e-06, - "loss": 0.9004, - "step": 9416 - }, - { - "epoch": 0.24, - "learning_rate": 1.9866808674518147e-06, - "loss": 0.9014, - "step": 9417 - }, - { - "epoch": 0.24, - "learning_rate": 1.986676365977749e-06, - "loss": 1.1855, - "step": 9418 - }, - { - "epoch": 0.24, - "learning_rate": 1.9866718637482304e-06, - "loss": 0.8496, - "step": 9419 - }, - { - "epoch": 0.24, - "learning_rate": 1.986667360763263e-06, - "loss": 0.8994, - "step": 9420 - }, - { - "epoch": 0.24, - "learning_rate": 1.9866628570228494e-06, - "loss": 0.7085, - "step": 9421 - }, - { - "epoch": 0.24, - "learning_rate": 1.9866583525269935e-06, - "loss": 0.8643, - "step": 9422 - }, - { - "epoch": 0.24, - "learning_rate": 1.986653847275699e-06, - "loss": 1.0352, - "step": 9423 - }, - { - "epoch": 0.24, - "learning_rate": 1.9866493412689684e-06, - "loss": 0.833, - "step": 9424 - }, - { - "epoch": 0.24, - "learning_rate": 1.9866448345068065e-06, - "loss": 1.0312, - "step": 9425 - }, - { - "epoch": 0.24, - "learning_rate": 1.986640326989215e-06, - "loss": 0.9072, - "step": 9426 - }, - { - "epoch": 0.24, - "learning_rate": 1.9866358187161993e-06, - "loss": 0.833, - "step": 9427 - }, - { - "epoch": 0.24, - "learning_rate": 1.9866313096877617e-06, - "loss": 1.1279, - "step": 9428 - }, - { - "epoch": 0.24, - "learning_rate": 1.9866267999039058e-06, - "loss": 0.9961, - "step": 9429 - }, - { - "epoch": 0.24, - "learning_rate": 1.986622289364635e-06, - "loss": 1.0146, - "step": 9430 - }, - { - "epoch": 0.24, - "learning_rate": 1.9866177780699527e-06, - "loss": 0.9297, - "step": 9431 - }, - { - "epoch": 0.24, - "learning_rate": 1.986613266019863e-06, - "loss": 0.8823, - "step": 9432 - }, - { - "epoch": 0.24, - "learning_rate": 1.986608753214369e-06, - "loss": 0.771, - "step": 9433 - }, - { - "epoch": 0.24, - "learning_rate": 1.9866042396534736e-06, - "loss": 0.7119, - "step": 9434 - }, - { - "epoch": 0.24, - "learning_rate": 1.986599725337181e-06, - "loss": 0.7178, - "step": 9435 - }, - { - "epoch": 0.24, - "learning_rate": 1.986595210265494e-06, - "loss": 0.9395, - "step": 9436 - }, - { - "epoch": 0.24, - "learning_rate": 1.9865906944384167e-06, - "loss": 0.7607, - "step": 9437 - }, - { - "epoch": 0.24, - "learning_rate": 1.986586177855952e-06, - "loss": 1.0088, - "step": 9438 - }, - { - "epoch": 0.24, - "learning_rate": 1.986581660518104e-06, - "loss": 0.9766, - "step": 9439 - }, - { - "epoch": 0.24, - "learning_rate": 1.9865771424248756e-06, - "loss": 0.897, - "step": 9440 - }, - { - "epoch": 0.24, - "learning_rate": 1.9865726235762705e-06, - "loss": 1.0654, - "step": 9441 - }, - { - "epoch": 0.24, - "learning_rate": 1.9865681039722915e-06, - "loss": 0.9521, - "step": 9442 - }, - { - "epoch": 0.24, - "learning_rate": 1.9865635836129434e-06, - "loss": 0.9092, - "step": 9443 - }, - { - "epoch": 0.24, - "learning_rate": 1.9865590624982287e-06, - "loss": 1.0947, - "step": 9444 - }, - { - "epoch": 0.24, - "learning_rate": 1.9865545406281516e-06, - "loss": 0.876, - "step": 9445 - }, - { - "epoch": 0.24, - "learning_rate": 1.9865500180027142e-06, - "loss": 0.8052, - "step": 9446 - }, - { - "epoch": 0.24, - "learning_rate": 1.9865454946219213e-06, - "loss": 0.8525, - "step": 9447 - }, - { - "epoch": 0.24, - "learning_rate": 1.9865409704857756e-06, - "loss": 1.0068, - "step": 9448 - }, - { - "epoch": 0.24, - "learning_rate": 1.986536445594281e-06, - "loss": 0.7773, - "step": 9449 - }, - { - "epoch": 0.24, - "learning_rate": 1.986531919947441e-06, - "loss": 0.7542, - "step": 9450 - }, - { - "epoch": 0.24, - "learning_rate": 1.9865273935452585e-06, - "loss": 0.9346, - "step": 9451 - }, - { - "epoch": 0.24, - "learning_rate": 1.986522866387738e-06, - "loss": 0.8506, - "step": 9452 - }, - { - "epoch": 0.24, - "learning_rate": 1.9865183384748816e-06, - "loss": 0.9521, - "step": 9453 - }, - { - "epoch": 0.24, - "learning_rate": 1.9865138098066934e-06, - "loss": 0.9336, - "step": 9454 - }, - { - "epoch": 0.24, - "learning_rate": 1.9865092803831775e-06, - "loss": 0.8535, - "step": 9455 - }, - { - "epoch": 0.24, - "learning_rate": 1.9865047502043366e-06, - "loss": 1.0996, - "step": 9456 - }, - { - "epoch": 0.24, - "learning_rate": 1.9865002192701743e-06, - "loss": 0.916, - "step": 9457 - }, - { - "epoch": 0.24, - "learning_rate": 1.986495687580694e-06, - "loss": 1.001, - "step": 9458 - }, - { - "epoch": 0.24, - "learning_rate": 1.9864911551358994e-06, - "loss": 0.958, - "step": 9459 - }, - { - "epoch": 0.24, - "learning_rate": 1.986486621935794e-06, - "loss": 1.3447, - "step": 9460 - }, - { - "epoch": 0.24, - "learning_rate": 1.9864820879803812e-06, - "loss": 0.918, - "step": 9461 - }, - { - "epoch": 0.24, - "learning_rate": 1.986477553269664e-06, - "loss": 0.8623, - "step": 9462 - }, - { - "epoch": 0.24, - "learning_rate": 1.986473017803647e-06, - "loss": 0.8828, - "step": 9463 - }, - { - "epoch": 0.24, - "learning_rate": 1.9864684815823325e-06, - "loss": 1.084, - "step": 9464 - }, - { - "epoch": 0.24, - "learning_rate": 1.9864639446057247e-06, - "loss": 0.8242, - "step": 9465 - }, - { - "epoch": 0.24, - "learning_rate": 1.9864594068738266e-06, - "loss": 0.9658, - "step": 9466 - }, - { - "epoch": 0.24, - "learning_rate": 1.986454868386642e-06, - "loss": 1.1035, - "step": 9467 - }, - { - "epoch": 0.24, - "learning_rate": 1.986450329144174e-06, - "loss": 0.6523, - "step": 9468 - }, - { - "epoch": 0.24, - "learning_rate": 1.9864457891464267e-06, - "loss": 1.0381, - "step": 9469 - }, - { - "epoch": 0.24, - "learning_rate": 1.986441248393403e-06, - "loss": 0.7769, - "step": 9470 - }, - { - "epoch": 0.24, - "learning_rate": 1.9864367068851068e-06, - "loss": 0.957, - "step": 9471 - }, - { - "epoch": 0.24, - "learning_rate": 1.986432164621541e-06, - "loss": 1.1064, - "step": 9472 - }, - { - "epoch": 0.24, - "learning_rate": 1.9864276216027096e-06, - "loss": 0.8657, - "step": 9473 - }, - { - "epoch": 0.24, - "learning_rate": 1.9864230778286162e-06, - "loss": 0.7979, - "step": 9474 - }, - { - "epoch": 0.24, - "learning_rate": 1.986418533299264e-06, - "loss": 0.8359, - "step": 9475 - }, - { - "epoch": 0.24, - "learning_rate": 1.986413988014656e-06, - "loss": 1.1172, - "step": 9476 - }, - { - "epoch": 0.24, - "learning_rate": 1.9864094419747964e-06, - "loss": 0.8008, - "step": 9477 - }, - { - "epoch": 0.24, - "learning_rate": 1.986404895179689e-06, - "loss": 1.1816, - "step": 9478 - }, - { - "epoch": 0.24, - "learning_rate": 1.986400347629336e-06, - "loss": 1.0869, - "step": 9479 - }, - { - "epoch": 0.24, - "learning_rate": 1.9863957993237418e-06, - "loss": 0.6968, - "step": 9480 - }, - { - "epoch": 0.24, - "learning_rate": 1.9863912502629097e-06, - "loss": 1.1426, - "step": 9481 - }, - { - "epoch": 0.24, - "learning_rate": 1.986386700446843e-06, - "loss": 1.0332, - "step": 9482 - }, - { - "epoch": 0.24, - "learning_rate": 1.986382149875546e-06, - "loss": 0.8643, - "step": 9483 - }, - { - "epoch": 0.24, - "learning_rate": 1.986377598549021e-06, - "loss": 0.9072, - "step": 9484 - }, - { - "epoch": 0.24, - "learning_rate": 1.986373046467272e-06, - "loss": 0.7617, - "step": 9485 - }, - { - "epoch": 0.24, - "learning_rate": 1.9863684936303027e-06, - "loss": 0.9658, - "step": 9486 - }, - { - "epoch": 0.24, - "learning_rate": 1.9863639400381163e-06, - "loss": 0.9258, - "step": 9487 - }, - { - "epoch": 0.24, - "learning_rate": 1.9863593856907165e-06, - "loss": 0.6582, - "step": 9488 - }, - { - "epoch": 0.24, - "learning_rate": 1.9863548305881064e-06, - "loss": 0.958, - "step": 9489 - }, - { - "epoch": 0.24, - "learning_rate": 1.98635027473029e-06, - "loss": 1.0557, - "step": 9490 - }, - { - "epoch": 0.24, - "learning_rate": 1.986345718117271e-06, - "loss": 0.7773, - "step": 9491 - }, - { - "epoch": 0.24, - "learning_rate": 1.9863411607490517e-06, - "loss": 0.9756, - "step": 9492 - }, - { - "epoch": 0.24, - "learning_rate": 1.9863366026256367e-06, - "loss": 0.9648, - "step": 9493 - }, - { - "epoch": 0.24, - "learning_rate": 1.986332043747029e-06, - "loss": 0.8945, - "step": 9494 - }, - { - "epoch": 0.24, - "learning_rate": 1.986327484113232e-06, - "loss": 0.8037, - "step": 9495 - }, - { - "epoch": 0.24, - "learning_rate": 1.9863229237242498e-06, - "loss": 0.8877, - "step": 9496 - }, - { - "epoch": 0.24, - "learning_rate": 1.9863183625800853e-06, - "loss": 0.9443, - "step": 9497 - }, - { - "epoch": 0.24, - "learning_rate": 1.986313800680742e-06, - "loss": 0.834, - "step": 9498 - }, - { - "epoch": 0.24, - "learning_rate": 1.986309238026224e-06, - "loss": 0.8896, - "step": 9499 - }, - { - "epoch": 0.24, - "learning_rate": 1.986304674616534e-06, - "loss": 1.0518, - "step": 9500 - }, - { - "epoch": 0.24, - "learning_rate": 1.9863001104516758e-06, - "loss": 1.0762, - "step": 9501 - }, - { - "epoch": 0.24, - "learning_rate": 1.986295545531653e-06, - "loss": 0.9766, - "step": 9502 - }, - { - "epoch": 0.24, - "learning_rate": 1.9862909798564697e-06, - "loss": 0.8706, - "step": 9503 - }, - { - "epoch": 0.24, - "learning_rate": 1.986286413426128e-06, - "loss": 0.9062, - "step": 9504 - }, - { - "epoch": 0.24, - "learning_rate": 1.9862818462406327e-06, - "loss": 1.0205, - "step": 9505 - }, - { - "epoch": 0.24, - "learning_rate": 1.9862772782999863e-06, - "loss": 0.8096, - "step": 9506 - }, - { - "epoch": 0.24, - "learning_rate": 1.9862727096041928e-06, - "loss": 0.9854, - "step": 9507 - }, - { - "epoch": 0.24, - "learning_rate": 1.9862681401532554e-06, - "loss": 0.6694, - "step": 9508 - }, - { - "epoch": 0.24, - "learning_rate": 1.9862635699471783e-06, - "loss": 0.9053, - "step": 9509 - }, - { - "epoch": 0.24, - "learning_rate": 1.986258998985964e-06, - "loss": 0.9658, - "step": 9510 - }, - { - "epoch": 0.24, - "learning_rate": 1.9862544272696173e-06, - "loss": 1.0303, - "step": 9511 - }, - { - "epoch": 0.24, - "learning_rate": 1.9862498547981404e-06, - "loss": 0.8574, - "step": 9512 - }, - { - "epoch": 0.24, - "learning_rate": 1.9862452815715376e-06, - "loss": 0.9102, - "step": 9513 - }, - { - "epoch": 0.24, - "learning_rate": 1.986240707589812e-06, - "loss": 0.7461, - "step": 9514 - }, - { - "epoch": 0.24, - "learning_rate": 1.986236132852967e-06, - "loss": 0.8594, - "step": 9515 - }, - { - "epoch": 0.24, - "learning_rate": 1.986231557361007e-06, - "loss": 0.9492, - "step": 9516 - }, - { - "epoch": 0.24, - "learning_rate": 1.9862269811139345e-06, - "loss": 0.8682, - "step": 9517 - }, - { - "epoch": 0.24, - "learning_rate": 1.986222404111753e-06, - "loss": 0.8799, - "step": 9518 - }, - { - "epoch": 0.24, - "learning_rate": 1.986217826354467e-06, - "loss": 0.9199, - "step": 9519 - }, - { - "epoch": 0.24, - "learning_rate": 1.9862132478420787e-06, - "loss": 1.0293, - "step": 9520 - }, - { - "epoch": 0.24, - "learning_rate": 1.9862086685745927e-06, - "loss": 0.5576, - "step": 9521 - }, - { - "epoch": 0.24, - "learning_rate": 1.9862040885520115e-06, - "loss": 0.7969, - "step": 9522 - }, - { - "epoch": 0.24, - "learning_rate": 1.98619950777434e-06, - "loss": 0.8999, - "step": 9523 - }, - { - "epoch": 0.24, - "learning_rate": 1.9861949262415803e-06, - "loss": 0.7305, - "step": 9524 - }, - { - "epoch": 0.24, - "learning_rate": 1.9861903439537366e-06, - "loss": 0.8223, - "step": 9525 - }, - { - "epoch": 0.24, - "learning_rate": 1.9861857609108126e-06, - "loss": 0.5046, - "step": 9526 - }, - { - "epoch": 0.24, - "learning_rate": 1.986181177112811e-06, - "loss": 1.001, - "step": 9527 - }, - { - "epoch": 0.24, - "learning_rate": 1.9861765925597362e-06, - "loss": 0.8135, - "step": 9528 - }, - { - "epoch": 0.24, - "learning_rate": 1.9861720072515916e-06, - "loss": 0.9463, - "step": 9529 - }, - { - "epoch": 0.24, - "learning_rate": 1.9861674211883797e-06, - "loss": 1.0742, - "step": 9530 - }, - { - "epoch": 0.24, - "learning_rate": 1.9861628343701053e-06, - "loss": 1.084, - "step": 9531 - }, - { - "epoch": 0.24, - "learning_rate": 1.986158246796771e-06, - "loss": 0.7549, - "step": 9532 - }, - { - "epoch": 0.24, - "learning_rate": 1.986153658468381e-06, - "loss": 0.834, - "step": 9533 - }, - { - "epoch": 0.24, - "learning_rate": 1.9861490693849383e-06, - "loss": 1.0527, - "step": 9534 - }, - { - "epoch": 0.24, - "learning_rate": 1.986144479546447e-06, - "loss": 0.8828, - "step": 9535 - }, - { - "epoch": 0.24, - "learning_rate": 1.9861398889529097e-06, - "loss": 1.0449, - "step": 9536 - }, - { - "epoch": 0.24, - "learning_rate": 1.9861352976043304e-06, - "loss": 0.9863, - "step": 9537 - }, - { - "epoch": 0.24, - "learning_rate": 1.986130705500713e-06, - "loss": 0.9492, - "step": 9538 - }, - { - "epoch": 0.24, - "learning_rate": 1.9861261126420605e-06, - "loss": 0.7227, - "step": 9539 - }, - { - "epoch": 0.24, - "learning_rate": 1.9861215190283766e-06, - "loss": 0.7803, - "step": 9540 - }, - { - "epoch": 0.24, - "learning_rate": 1.986116924659665e-06, - "loss": 1.0527, - "step": 9541 - }, - { - "epoch": 0.24, - "learning_rate": 1.9861123295359284e-06, - "loss": 0.6318, - "step": 9542 - }, - { - "epoch": 0.24, - "learning_rate": 1.9861077336571713e-06, - "loss": 1.125, - "step": 9543 - }, - { - "epoch": 0.24, - "learning_rate": 1.986103137023397e-06, - "loss": 0.8438, - "step": 9544 - }, - { - "epoch": 0.24, - "learning_rate": 1.9860985396346088e-06, - "loss": 0.8887, - "step": 9545 - }, - { - "epoch": 0.24, - "learning_rate": 1.98609394149081e-06, - "loss": 0.7842, - "step": 9546 - }, - { - "epoch": 0.24, - "learning_rate": 1.986089342592005e-06, - "loss": 0.8398, - "step": 9547 - }, - { - "epoch": 0.24, - "learning_rate": 1.986084742938196e-06, - "loss": 0.8464, - "step": 9548 - }, - { - "epoch": 0.24, - "learning_rate": 1.986080142529388e-06, - "loss": 0.834, - "step": 9549 - }, - { - "epoch": 0.24, - "learning_rate": 1.9860755413655833e-06, - "loss": 0.9043, - "step": 9550 - }, - { - "epoch": 0.24, - "learning_rate": 1.9860709394467862e-06, - "loss": 0.9629, - "step": 9551 - }, - { - "epoch": 0.24, - "learning_rate": 1.9860663367729995e-06, - "loss": 0.8809, - "step": 9552 - }, - { - "epoch": 0.24, - "learning_rate": 1.9860617333442273e-06, - "loss": 0.9609, - "step": 9553 - }, - { - "epoch": 0.24, - "learning_rate": 1.986057129160473e-06, - "loss": 0.8076, - "step": 9554 - }, - { - "epoch": 0.24, - "learning_rate": 1.98605252422174e-06, - "loss": 0.8018, - "step": 9555 - }, - { - "epoch": 0.24, - "learning_rate": 1.9860479185280324e-06, - "loss": 1.1982, - "step": 9556 - }, - { - "epoch": 0.24, - "learning_rate": 1.986043312079353e-06, - "loss": 0.8643, - "step": 9557 - }, - { - "epoch": 0.24, - "learning_rate": 1.9860387048757054e-06, - "loss": 0.8301, - "step": 9558 - }, - { - "epoch": 0.25, - "learning_rate": 1.9860340969170933e-06, - "loss": 0.8965, - "step": 9559 - }, - { - "epoch": 0.25, - "learning_rate": 1.9860294882035204e-06, - "loss": 0.8525, - "step": 9560 - }, - { - "epoch": 0.25, - "learning_rate": 1.98602487873499e-06, - "loss": 0.9307, - "step": 9561 - }, - { - "epoch": 0.25, - "learning_rate": 1.986020268511506e-06, - "loss": 1.001, - "step": 9562 - }, - { - "epoch": 0.25, - "learning_rate": 1.986015657533071e-06, - "loss": 1.043, - "step": 9563 - }, - { - "epoch": 0.25, - "learning_rate": 1.9860110457996896e-06, - "loss": 0.8364, - "step": 9564 - }, - { - "epoch": 0.25, - "learning_rate": 1.9860064333113647e-06, - "loss": 0.6614, - "step": 9565 - }, - { - "epoch": 0.25, - "learning_rate": 1.9860018200680997e-06, - "loss": 0.6748, - "step": 9566 - }, - { - "epoch": 0.25, - "learning_rate": 1.9859972060698992e-06, - "loss": 0.9717, - "step": 9567 - }, - { - "epoch": 0.25, - "learning_rate": 1.9859925913167654e-06, - "loss": 1.0039, - "step": 9568 - }, - { - "epoch": 0.25, - "learning_rate": 1.9859879758087024e-06, - "loss": 0.8643, - "step": 9569 - }, - { - "epoch": 0.25, - "learning_rate": 1.985983359545714e-06, - "loss": 0.8281, - "step": 9570 - }, - { - "epoch": 0.25, - "learning_rate": 1.9859787425278035e-06, - "loss": 1.0693, - "step": 9571 - }, - { - "epoch": 0.25, - "learning_rate": 1.9859741247549743e-06, - "loss": 0.9316, - "step": 9572 - }, - { - "epoch": 0.25, - "learning_rate": 1.98596950622723e-06, - "loss": 1.042, - "step": 9573 - }, - { - "epoch": 0.25, - "learning_rate": 1.9859648869445743e-06, - "loss": 0.8643, - "step": 9574 - }, - { - "epoch": 0.25, - "learning_rate": 1.9859602669070107e-06, - "loss": 0.9854, - "step": 9575 - }, - { - "epoch": 0.25, - "learning_rate": 1.9859556461145425e-06, - "loss": 1.0586, - "step": 9576 - }, - { - "epoch": 0.25, - "learning_rate": 1.985951024567173e-06, - "loss": 0.71, - "step": 9577 - }, - { - "epoch": 0.25, - "learning_rate": 1.985946402264907e-06, - "loss": 1.082, - "step": 9578 - }, - { - "epoch": 0.25, - "learning_rate": 1.9859417792077462e-06, - "loss": 0.7676, - "step": 9579 - }, - { - "epoch": 0.25, - "learning_rate": 1.985937155395696e-06, - "loss": 0.8564, - "step": 9580 - }, - { - "epoch": 0.25, - "learning_rate": 1.9859325308287586e-06, - "loss": 1.0146, - "step": 9581 - }, - { - "epoch": 0.25, - "learning_rate": 1.985927905506938e-06, - "loss": 0.7969, - "step": 9582 - }, - { - "epoch": 0.25, - "learning_rate": 1.985923279430238e-06, - "loss": 0.9229, - "step": 9583 - }, - { - "epoch": 0.25, - "learning_rate": 1.9859186525986615e-06, - "loss": 0.9482, - "step": 9584 - }, - { - "epoch": 0.25, - "learning_rate": 1.985914025012213e-06, - "loss": 0.9492, - "step": 9585 - }, - { - "epoch": 0.25, - "learning_rate": 1.9859093966708947e-06, - "loss": 0.8682, - "step": 9586 - }, - { - "epoch": 0.25, - "learning_rate": 1.9859047675747114e-06, - "loss": 1.0166, - "step": 9587 - }, - { - "epoch": 0.25, - "learning_rate": 1.9859001377236663e-06, - "loss": 0.9375, - "step": 9588 - }, - { - "epoch": 0.25, - "learning_rate": 1.9858955071177624e-06, - "loss": 0.8154, - "step": 9589 - }, - { - "epoch": 0.25, - "learning_rate": 1.9858908757570035e-06, - "loss": 0.8848, - "step": 9590 - }, - { - "epoch": 0.25, - "learning_rate": 1.9858862436413938e-06, - "loss": 0.7988, - "step": 9591 - }, - { - "epoch": 0.25, - "learning_rate": 1.985881610770936e-06, - "loss": 1.0029, - "step": 9592 - }, - { - "epoch": 0.25, - "learning_rate": 1.9858769771456343e-06, - "loss": 0.8975, - "step": 9593 - }, - { - "epoch": 0.25, - "learning_rate": 1.9858723427654914e-06, - "loss": 1.1973, - "step": 9594 - }, - { - "epoch": 0.25, - "learning_rate": 1.985867707630512e-06, - "loss": 1.0625, - "step": 9595 - }, - { - "epoch": 0.25, - "learning_rate": 1.985863071740699e-06, - "loss": 0.9756, - "step": 9596 - }, - { - "epoch": 0.25, - "learning_rate": 1.9858584350960552e-06, - "loss": 1.0254, - "step": 9597 - }, - { - "epoch": 0.25, - "learning_rate": 1.985853797696586e-06, - "loss": 0.6426, - "step": 9598 - }, - { - "epoch": 0.25, - "learning_rate": 1.985849159542293e-06, - "loss": 0.8682, - "step": 9599 - }, - { - "epoch": 0.25, - "learning_rate": 1.985844520633181e-06, - "loss": 0.8406, - "step": 9600 - }, - { - "epoch": 0.25, - "learning_rate": 1.985839880969253e-06, - "loss": 1.0967, - "step": 9601 - }, - { - "epoch": 0.25, - "learning_rate": 1.985835240550513e-06, - "loss": 0.7356, - "step": 9602 - }, - { - "epoch": 0.25, - "learning_rate": 1.985830599376964e-06, - "loss": 0.998, - "step": 9603 - }, - { - "epoch": 0.25, - "learning_rate": 1.98582595744861e-06, - "loss": 0.916, - "step": 9604 - }, - { - "epoch": 0.25, - "learning_rate": 1.9858213147654545e-06, - "loss": 0.6084, - "step": 9605 - }, - { - "epoch": 0.25, - "learning_rate": 1.9858166713275008e-06, - "loss": 0.877, - "step": 9606 - }, - { - "epoch": 0.25, - "learning_rate": 1.9858120271347526e-06, - "loss": 0.6006, - "step": 9607 - }, - { - "epoch": 0.25, - "learning_rate": 1.9858073821872133e-06, - "loss": 0.8916, - "step": 9608 - }, - { - "epoch": 0.25, - "learning_rate": 1.985802736484887e-06, - "loss": 0.9492, - "step": 9609 - }, - { - "epoch": 0.25, - "learning_rate": 1.9857980900277765e-06, - "loss": 1.0117, - "step": 9610 - }, - { - "epoch": 0.25, - "learning_rate": 1.985793442815886e-06, - "loss": 1.0732, - "step": 9611 - }, - { - "epoch": 0.25, - "learning_rate": 1.9857887948492186e-06, - "loss": 0.7246, - "step": 9612 - }, - { - "epoch": 0.25, - "learning_rate": 1.9857841461277783e-06, - "loss": 0.8633, - "step": 9613 - }, - { - "epoch": 0.25, - "learning_rate": 1.985779496651568e-06, - "loss": 0.5659, - "step": 9614 - }, - { - "epoch": 0.25, - "learning_rate": 1.9857748464205922e-06, - "loss": 1.1445, - "step": 9615 - }, - { - "epoch": 0.25, - "learning_rate": 1.9857701954348537e-06, - "loss": 0.9707, - "step": 9616 - }, - { - "epoch": 0.25, - "learning_rate": 1.9857655436943563e-06, - "loss": 1.0244, - "step": 9617 - }, - { - "epoch": 0.25, - "learning_rate": 1.9857608911991034e-06, - "loss": 1.0088, - "step": 9618 - }, - { - "epoch": 0.25, - "learning_rate": 1.985756237949099e-06, - "loss": 0.7681, - "step": 9619 - }, - { - "epoch": 0.25, - "learning_rate": 1.985751583944346e-06, - "loss": 0.9092, - "step": 9620 - }, - { - "epoch": 0.25, - "learning_rate": 1.9857469291848486e-06, - "loss": 0.8877, - "step": 9621 - }, - { - "epoch": 0.25, - "learning_rate": 1.9857422736706098e-06, - "loss": 0.8682, - "step": 9622 - }, - { - "epoch": 0.25, - "learning_rate": 1.9857376174016337e-06, - "loss": 1.0859, - "step": 9623 - }, - { - "epoch": 0.25, - "learning_rate": 1.9857329603779237e-06, - "loss": 0.9009, - "step": 9624 - }, - { - "epoch": 0.25, - "learning_rate": 1.985728302599483e-06, - "loss": 0.8047, - "step": 9625 - }, - { - "epoch": 0.25, - "learning_rate": 1.985723644066316e-06, - "loss": 0.7139, - "step": 9626 - }, - { - "epoch": 0.25, - "learning_rate": 1.985718984778425e-06, - "loss": 0.9805, - "step": 9627 - }, - { - "epoch": 0.25, - "learning_rate": 1.985714324735815e-06, - "loss": 1.0615, - "step": 9628 - }, - { - "epoch": 0.25, - "learning_rate": 1.9857096639384887e-06, - "loss": 0.9688, - "step": 9629 - }, - { - "epoch": 0.25, - "learning_rate": 1.9857050023864495e-06, - "loss": 0.915, - "step": 9630 - }, - { - "epoch": 0.25, - "learning_rate": 1.985700340079702e-06, - "loss": 0.8564, - "step": 9631 - }, - { - "epoch": 0.25, - "learning_rate": 1.9856956770182483e-06, - "loss": 0.8047, - "step": 9632 - }, - { - "epoch": 0.25, - "learning_rate": 1.985691013202093e-06, - "loss": 0.7314, - "step": 9633 - }, - { - "epoch": 0.25, - "learning_rate": 1.9856863486312394e-06, - "loss": 0.96, - "step": 9634 - }, - { - "epoch": 0.25, - "learning_rate": 1.9856816833056913e-06, - "loss": 0.9736, - "step": 9635 - }, - { - "epoch": 0.25, - "learning_rate": 1.9856770172254516e-06, - "loss": 0.7871, - "step": 9636 - }, - { - "epoch": 0.25, - "learning_rate": 1.9856723503905247e-06, - "loss": 0.8242, - "step": 9637 - }, - { - "epoch": 0.25, - "learning_rate": 1.985667682800914e-06, - "loss": 0.9375, - "step": 9638 - }, - { - "epoch": 0.25, - "learning_rate": 1.985663014456622e-06, - "loss": 0.8945, - "step": 9639 - }, - { - "epoch": 0.25, - "learning_rate": 1.985658345357654e-06, - "loss": 0.9287, - "step": 9640 - }, - { - "epoch": 0.25, - "learning_rate": 1.9856536755040126e-06, - "loss": 1.1426, - "step": 9641 - }, - { - "epoch": 0.25, - "learning_rate": 1.9856490048957013e-06, - "loss": 0.8623, - "step": 9642 - }, - { - "epoch": 0.25, - "learning_rate": 1.985644333532724e-06, - "loss": 0.7964, - "step": 9643 - }, - { - "epoch": 0.25, - "learning_rate": 1.985639661415084e-06, - "loss": 0.9922, - "step": 9644 - }, - { - "epoch": 0.25, - "learning_rate": 1.985634988542785e-06, - "loss": 0.8594, - "step": 9645 - }, - { - "epoch": 0.25, - "learning_rate": 1.9856303149158312e-06, - "loss": 0.8809, - "step": 9646 - }, - { - "epoch": 0.25, - "learning_rate": 1.985625640534225e-06, - "loss": 0.7393, - "step": 9647 - }, - { - "epoch": 0.25, - "learning_rate": 1.9856209653979706e-06, - "loss": 0.833, - "step": 9648 - }, - { - "epoch": 0.25, - "learning_rate": 1.9856162895070714e-06, - "loss": 1.0801, - "step": 9649 - }, - { - "epoch": 0.25, - "learning_rate": 1.9856116128615315e-06, - "loss": 0.8838, - "step": 9650 - }, - { - "epoch": 0.25, - "learning_rate": 1.9856069354613542e-06, - "loss": 0.959, - "step": 9651 - }, - { - "epoch": 0.25, - "learning_rate": 1.9856022573065426e-06, - "loss": 0.9111, - "step": 9652 - }, - { - "epoch": 0.25, - "learning_rate": 1.985597578397101e-06, - "loss": 0.8613, - "step": 9653 - }, - { - "epoch": 0.25, - "learning_rate": 1.9855928987330324e-06, - "loss": 0.9844, - "step": 9654 - }, - { - "epoch": 0.25, - "learning_rate": 1.9855882183143406e-06, - "loss": 0.8311, - "step": 9655 - }, - { - "epoch": 0.25, - "learning_rate": 1.9855835371410293e-06, - "loss": 0.9365, - "step": 9656 - }, - { - "epoch": 0.25, - "learning_rate": 1.9855788552131022e-06, - "loss": 0.9287, - "step": 9657 - }, - { - "epoch": 0.25, - "learning_rate": 1.985574172530563e-06, - "loss": 0.9238, - "step": 9658 - }, - { - "epoch": 0.25, - "learning_rate": 1.985569489093414e-06, - "loss": 0.688, - "step": 9659 - }, - { - "epoch": 0.25, - "learning_rate": 1.9855648049016605e-06, - "loss": 0.8535, - "step": 9660 - }, - { - "epoch": 0.25, - "learning_rate": 1.9855601199553053e-06, - "loss": 1.0059, - "step": 9661 - }, - { - "epoch": 0.25, - "learning_rate": 1.9855554342543517e-06, - "loss": 0.874, - "step": 9662 - }, - { - "epoch": 0.25, - "learning_rate": 1.9855507477988036e-06, - "loss": 0.7598, - "step": 9663 - }, - { - "epoch": 0.25, - "learning_rate": 1.985546060588665e-06, - "loss": 0.8413, - "step": 9664 - }, - { - "epoch": 0.25, - "learning_rate": 1.985541372623939e-06, - "loss": 0.7529, - "step": 9665 - }, - { - "epoch": 0.25, - "learning_rate": 1.985536683904629e-06, - "loss": 1.0127, - "step": 9666 - }, - { - "epoch": 0.25, - "learning_rate": 1.985531994430739e-06, - "loss": 0.9844, - "step": 9667 - }, - { - "epoch": 0.25, - "learning_rate": 1.9855273042022726e-06, - "loss": 0.8174, - "step": 9668 - }, - { - "epoch": 0.25, - "learning_rate": 1.985522613219233e-06, - "loss": 0.7163, - "step": 9669 - }, - { - "epoch": 0.25, - "learning_rate": 1.9855179214816246e-06, - "loss": 0.9805, - "step": 9670 - }, - { - "epoch": 0.25, - "learning_rate": 1.9855132289894497e-06, - "loss": 1.1084, - "step": 9671 - }, - { - "epoch": 0.25, - "learning_rate": 1.9855085357427132e-06, - "loss": 1.249, - "step": 9672 - }, - { - "epoch": 0.25, - "learning_rate": 1.985503841741418e-06, - "loss": 0.9375, - "step": 9673 - }, - { - "epoch": 0.25, - "learning_rate": 1.9854991469855677e-06, - "loss": 0.4714, - "step": 9674 - }, - { - "epoch": 0.25, - "learning_rate": 1.985494451475166e-06, - "loss": 0.7324, - "step": 9675 - }, - { - "epoch": 0.25, - "learning_rate": 1.9854897552102167e-06, - "loss": 1.0967, - "step": 9676 - }, - { - "epoch": 0.25, - "learning_rate": 1.985485058190723e-06, - "loss": 0.8623, - "step": 9677 - }, - { - "epoch": 0.25, - "learning_rate": 1.9854803604166888e-06, - "loss": 1.04, - "step": 9678 - }, - { - "epoch": 0.25, - "learning_rate": 1.985475661888118e-06, - "loss": 0.7583, - "step": 9679 - }, - { - "epoch": 0.25, - "learning_rate": 1.9854709626050134e-06, - "loss": 0.8486, - "step": 9680 - }, - { - "epoch": 0.25, - "learning_rate": 1.9854662625673788e-06, - "loss": 1.0801, - "step": 9681 - }, - { - "epoch": 0.25, - "learning_rate": 1.985461561775218e-06, - "loss": 0.9141, - "step": 9682 - }, - { - "epoch": 0.25, - "learning_rate": 1.9854568602285347e-06, - "loss": 0.7109, - "step": 9683 - }, - { - "epoch": 0.25, - "learning_rate": 1.985452157927333e-06, - "loss": 0.7915, - "step": 9684 - }, - { - "epoch": 0.25, - "learning_rate": 1.985447454871615e-06, - "loss": 0.582, - "step": 9685 - }, - { - "epoch": 0.25, - "learning_rate": 1.985442751061386e-06, - "loss": 0.7012, - "step": 9686 - }, - { - "epoch": 0.25, - "learning_rate": 1.985438046496648e-06, - "loss": 0.8345, - "step": 9687 - }, - { - "epoch": 0.25, - "learning_rate": 1.9854333411774058e-06, - "loss": 1.0732, - "step": 9688 - }, - { - "epoch": 0.25, - "learning_rate": 1.9854286351036627e-06, - "loss": 1.1338, - "step": 9689 - }, - { - "epoch": 0.25, - "learning_rate": 1.985423928275422e-06, - "loss": 0.9951, - "step": 9690 - }, - { - "epoch": 0.25, - "learning_rate": 1.9854192206926874e-06, - "loss": 0.8291, - "step": 9691 - }, - { - "epoch": 0.25, - "learning_rate": 1.9854145123554627e-06, - "loss": 0.9209, - "step": 9692 - }, - { - "epoch": 0.25, - "learning_rate": 1.985409803263752e-06, - "loss": 1.0361, - "step": 9693 - }, - { - "epoch": 0.25, - "learning_rate": 1.985405093417558e-06, - "loss": 0.7808, - "step": 9694 - }, - { - "epoch": 0.25, - "learning_rate": 1.985400382816884e-06, - "loss": 0.603, - "step": 9695 - }, - { - "epoch": 0.25, - "learning_rate": 1.9853956714617348e-06, - "loss": 0.7021, - "step": 9696 - }, - { - "epoch": 0.25, - "learning_rate": 1.9853909593521133e-06, - "loss": 0.8105, - "step": 9697 - }, - { - "epoch": 0.25, - "learning_rate": 1.9853862464880235e-06, - "loss": 0.9463, - "step": 9698 - }, - { - "epoch": 0.25, - "learning_rate": 1.9853815328694683e-06, - "loss": 0.8652, - "step": 9699 - }, - { - "epoch": 0.25, - "learning_rate": 1.9853768184964524e-06, - "loss": 1.0381, - "step": 9700 - }, - { - "epoch": 0.25, - "learning_rate": 1.9853721033689784e-06, - "loss": 1.0898, - "step": 9701 - }, - { - "epoch": 0.25, - "learning_rate": 1.9853673874870503e-06, - "loss": 1.043, - "step": 9702 - }, - { - "epoch": 0.25, - "learning_rate": 1.9853626708506718e-06, - "loss": 1.0254, - "step": 9703 - }, - { - "epoch": 0.25, - "learning_rate": 1.985357953459846e-06, - "loss": 0.9922, - "step": 9704 - }, - { - "epoch": 0.25, - "learning_rate": 1.9853532353145774e-06, - "loss": 1.082, - "step": 9705 - }, - { - "epoch": 0.25, - "learning_rate": 1.985348516414869e-06, - "loss": 0.96, - "step": 9706 - }, - { - "epoch": 0.25, - "learning_rate": 1.9853437967607244e-06, - "loss": 0.6548, - "step": 9707 - }, - { - "epoch": 0.25, - "learning_rate": 1.9853390763521478e-06, - "loss": 0.5996, - "step": 9708 - }, - { - "epoch": 0.25, - "learning_rate": 1.985334355189142e-06, - "loss": 1.085, - "step": 9709 - }, - { - "epoch": 0.25, - "learning_rate": 1.985329633271711e-06, - "loss": 0.873, - "step": 9710 - }, - { - "epoch": 0.25, - "learning_rate": 1.9853249105998584e-06, - "loss": 0.9082, - "step": 9711 - }, - { - "epoch": 0.25, - "learning_rate": 1.985320187173588e-06, - "loss": 0.832, - "step": 9712 - }, - { - "epoch": 0.25, - "learning_rate": 1.985315462992903e-06, - "loss": 1.1104, - "step": 9713 - }, - { - "epoch": 0.25, - "learning_rate": 1.9853107380578075e-06, - "loss": 0.9795, - "step": 9714 - }, - { - "epoch": 0.25, - "learning_rate": 1.9853060123683044e-06, - "loss": 1.0322, - "step": 9715 - }, - { - "epoch": 0.25, - "learning_rate": 1.9853012859243986e-06, - "loss": 0.7207, - "step": 9716 - }, - { - "epoch": 0.25, - "learning_rate": 1.985296558726092e-06, - "loss": 0.8252, - "step": 9717 - }, - { - "epoch": 0.25, - "learning_rate": 1.98529183077339e-06, - "loss": 0.9238, - "step": 9718 - }, - { - "epoch": 0.25, - "learning_rate": 1.985287102066295e-06, - "loss": 0.9189, - "step": 9719 - }, - { - "epoch": 0.25, - "learning_rate": 1.9852823726048106e-06, - "loss": 0.7373, - "step": 9720 - }, - { - "epoch": 0.25, - "learning_rate": 1.985277642388941e-06, - "loss": 0.8096, - "step": 9721 - }, - { - "epoch": 0.25, - "learning_rate": 1.98527291141869e-06, - "loss": 1.0371, - "step": 9722 - }, - { - "epoch": 0.25, - "learning_rate": 1.9852681796940607e-06, - "loss": 0.8125, - "step": 9723 - }, - { - "epoch": 0.25, - "learning_rate": 1.9852634472150565e-06, - "loss": 0.8833, - "step": 9724 - }, - { - "epoch": 0.25, - "learning_rate": 1.9852587139816815e-06, - "loss": 0.9033, - "step": 9725 - }, - { - "epoch": 0.25, - "learning_rate": 1.9852539799939393e-06, - "loss": 0.9404, - "step": 9726 - }, - { - "epoch": 0.25, - "learning_rate": 1.9852492452518334e-06, - "loss": 1.0742, - "step": 9727 - }, - { - "epoch": 0.25, - "learning_rate": 1.9852445097553675e-06, - "loss": 0.8647, - "step": 9728 - }, - { - "epoch": 0.25, - "learning_rate": 1.985239773504545e-06, - "loss": 0.9053, - "step": 9729 - }, - { - "epoch": 0.25, - "learning_rate": 1.98523503649937e-06, - "loss": 0.8779, - "step": 9730 - }, - { - "epoch": 0.25, - "learning_rate": 1.9852302987398457e-06, - "loss": 0.9795, - "step": 9731 - }, - { - "epoch": 0.25, - "learning_rate": 1.985225560225976e-06, - "loss": 0.6963, - "step": 9732 - }, - { - "epoch": 0.25, - "learning_rate": 1.9852208209577645e-06, - "loss": 0.8867, - "step": 9733 - }, - { - "epoch": 0.25, - "learning_rate": 1.985216080935214e-06, - "loss": 0.6108, - "step": 9734 - }, - { - "epoch": 0.25, - "learning_rate": 1.9852113401583296e-06, - "loss": 1.0225, - "step": 9735 - }, - { - "epoch": 0.25, - "learning_rate": 1.9852065986271136e-06, - "loss": 0.8633, - "step": 9736 - }, - { - "epoch": 0.25, - "learning_rate": 1.9852018563415707e-06, - "loss": 0.9414, - "step": 9737 - }, - { - "epoch": 0.25, - "learning_rate": 1.985197113301704e-06, - "loss": 0.7415, - "step": 9738 - }, - { - "epoch": 0.25, - "learning_rate": 1.985192369507517e-06, - "loss": 0.8999, - "step": 9739 - }, - { - "epoch": 0.25, - "learning_rate": 1.9851876249590137e-06, - "loss": 0.7119, - "step": 9740 - }, - { - "epoch": 0.25, - "learning_rate": 1.985182879656197e-06, - "loss": 0.9092, - "step": 9741 - }, - { - "epoch": 0.25, - "learning_rate": 1.9851781335990715e-06, - "loss": 1.0312, - "step": 9742 - }, - { - "epoch": 0.25, - "learning_rate": 1.98517338678764e-06, - "loss": 0.9473, - "step": 9743 - }, - { - "epoch": 0.25, - "learning_rate": 1.9851686392219073e-06, - "loss": 0.9297, - "step": 9744 - }, - { - "epoch": 0.25, - "learning_rate": 1.985163890901876e-06, - "loss": 0.9248, - "step": 9745 - }, - { - "epoch": 0.25, - "learning_rate": 1.9851591418275495e-06, - "loss": 0.7666, - "step": 9746 - }, - { - "epoch": 0.25, - "learning_rate": 1.9851543919989325e-06, - "loss": 0.7891, - "step": 9747 - }, - { - "epoch": 0.25, - "learning_rate": 1.9851496414160277e-06, - "loss": 0.8271, - "step": 9748 - }, - { - "epoch": 0.25, - "learning_rate": 1.9851448900788396e-06, - "loss": 0.9536, - "step": 9749 - }, - { - "epoch": 0.25, - "learning_rate": 1.9851401379873707e-06, - "loss": 0.7583, - "step": 9750 - }, - { - "epoch": 0.25, - "learning_rate": 1.985135385141626e-06, - "loss": 0.8311, - "step": 9751 - }, - { - "epoch": 0.25, - "learning_rate": 1.985130631541608e-06, - "loss": 1.0186, - "step": 9752 - }, - { - "epoch": 0.25, - "learning_rate": 1.985125877187321e-06, - "loss": 0.9414, - "step": 9753 - }, - { - "epoch": 0.25, - "learning_rate": 1.985121122078768e-06, - "loss": 0.9434, - "step": 9754 - }, - { - "epoch": 0.25, - "learning_rate": 1.9851163662159533e-06, - "loss": 0.7927, - "step": 9755 - }, - { - "epoch": 0.25, - "learning_rate": 1.9851116095988806e-06, - "loss": 0.8003, - "step": 9756 - }, - { - "epoch": 0.25, - "learning_rate": 1.9851068522275526e-06, - "loss": 1.1436, - "step": 9757 - }, - { - "epoch": 0.25, - "learning_rate": 1.985102094101974e-06, - "loss": 0.9053, - "step": 9758 - }, - { - "epoch": 0.25, - "learning_rate": 1.985097335222148e-06, - "loss": 0.9961, - "step": 9759 - }, - { - "epoch": 0.25, - "learning_rate": 1.985092575588078e-06, - "loss": 0.958, - "step": 9760 - }, - { - "epoch": 0.25, - "learning_rate": 1.9850878151997683e-06, - "loss": 0.7378, - "step": 9761 - }, - { - "epoch": 0.25, - "learning_rate": 1.985083054057222e-06, - "loss": 0.8799, - "step": 9762 - }, - { - "epoch": 0.25, - "learning_rate": 1.985078292160443e-06, - "loss": 1.0361, - "step": 9763 - }, - { - "epoch": 0.25, - "learning_rate": 1.9850735295094347e-06, - "loss": 0.876, - "step": 9764 - }, - { - "epoch": 0.25, - "learning_rate": 1.985068766104201e-06, - "loss": 0.9102, - "step": 9765 - }, - { - "epoch": 0.25, - "learning_rate": 1.985064001944745e-06, - "loss": 0.8892, - "step": 9766 - }, - { - "epoch": 0.25, - "learning_rate": 1.9850592370310714e-06, - "loss": 0.8213, - "step": 9767 - }, - { - "epoch": 0.25, - "learning_rate": 1.985054471363183e-06, - "loss": 0.957, - "step": 9768 - }, - { - "epoch": 0.25, - "learning_rate": 1.9850497049410836e-06, - "loss": 0.8486, - "step": 9769 - }, - { - "epoch": 0.25, - "learning_rate": 1.985044937764777e-06, - "loss": 0.8643, - "step": 9770 - }, - { - "epoch": 0.25, - "learning_rate": 1.985040169834267e-06, - "loss": 0.8237, - "step": 9771 - }, - { - "epoch": 0.25, - "learning_rate": 1.985035401149557e-06, - "loss": 1.0322, - "step": 9772 - }, - { - "epoch": 0.25, - "learning_rate": 1.9850306317106504e-06, - "loss": 1.1445, - "step": 9773 - }, - { - "epoch": 0.25, - "learning_rate": 1.985025861517551e-06, - "loss": 0.7529, - "step": 9774 - }, - { - "epoch": 0.25, - "learning_rate": 1.985021090570263e-06, - "loss": 0.9736, - "step": 9775 - }, - { - "epoch": 0.25, - "learning_rate": 1.9850163188687896e-06, - "loss": 0.9531, - "step": 9776 - }, - { - "epoch": 0.25, - "learning_rate": 1.985011546413134e-06, - "loss": 0.9146, - "step": 9777 - }, - { - "epoch": 0.25, - "learning_rate": 1.985006773203301e-06, - "loss": 1.0605, - "step": 9778 - }, - { - "epoch": 0.25, - "learning_rate": 1.9850019992392934e-06, - "loss": 0.9575, - "step": 9779 - }, - { - "epoch": 0.25, - "learning_rate": 1.9849972245211147e-06, - "loss": 1.0605, - "step": 9780 - }, - { - "epoch": 0.25, - "learning_rate": 1.9849924490487693e-06, - "loss": 0.9365, - "step": 9781 - }, - { - "epoch": 0.25, - "learning_rate": 1.9849876728222604e-06, - "loss": 1.0625, - "step": 9782 - }, - { - "epoch": 0.25, - "learning_rate": 1.984982895841592e-06, - "loss": 0.8525, - "step": 9783 - }, - { - "epoch": 0.25, - "learning_rate": 1.984978118106767e-06, - "loss": 1.0088, - "step": 9784 - }, - { - "epoch": 0.25, - "learning_rate": 1.98497333961779e-06, - "loss": 1.0801, - "step": 9785 - }, - { - "epoch": 0.25, - "learning_rate": 1.9849685603746638e-06, - "loss": 0.9453, - "step": 9786 - }, - { - "epoch": 0.25, - "learning_rate": 1.9849637803773925e-06, - "loss": 0.8103, - "step": 9787 - }, - { - "epoch": 0.25, - "learning_rate": 1.98495899962598e-06, - "loss": 0.5916, - "step": 9788 - }, - { - "epoch": 0.25, - "learning_rate": 1.9849542181204292e-06, - "loss": 0.9414, - "step": 9789 - }, - { - "epoch": 0.25, - "learning_rate": 1.984949435860745e-06, - "loss": 0.707, - "step": 9790 - }, - { - "epoch": 0.25, - "learning_rate": 1.9849446528469296e-06, - "loss": 0.9756, - "step": 9791 - }, - { - "epoch": 0.25, - "learning_rate": 1.984939869078988e-06, - "loss": 1.0195, - "step": 9792 - }, - { - "epoch": 0.25, - "learning_rate": 1.9849350845569225e-06, - "loss": 1.0107, - "step": 9793 - }, - { - "epoch": 0.25, - "learning_rate": 1.984930299280738e-06, - "loss": 0.8623, - "step": 9794 - }, - { - "epoch": 0.25, - "learning_rate": 1.9849255132504375e-06, - "loss": 0.9805, - "step": 9795 - }, - { - "epoch": 0.25, - "learning_rate": 1.9849207264660247e-06, - "loss": 0.9883, - "step": 9796 - }, - { - "epoch": 0.25, - "learning_rate": 1.9849159389275035e-06, - "loss": 0.998, - "step": 9797 - }, - { - "epoch": 0.25, - "learning_rate": 1.9849111506348777e-06, - "loss": 0.877, - "step": 9798 - }, - { - "epoch": 0.25, - "learning_rate": 1.9849063615881504e-06, - "loss": 0.8237, - "step": 9799 - }, - { - "epoch": 0.25, - "learning_rate": 1.9849015717873257e-06, - "loss": 0.9873, - "step": 9800 - }, - { - "epoch": 0.25, - "learning_rate": 1.9848967812324075e-06, - "loss": 1.1543, - "step": 9801 - }, - { - "epoch": 0.25, - "learning_rate": 1.9848919899233984e-06, - "loss": 0.9316, - "step": 9802 - }, - { - "epoch": 0.25, - "learning_rate": 1.9848871978603033e-06, - "loss": 0.8936, - "step": 9803 - }, - { - "epoch": 0.25, - "learning_rate": 1.9848824050431253e-06, - "loss": 0.9717, - "step": 9804 - }, - { - "epoch": 0.25, - "learning_rate": 1.984877611471868e-06, - "loss": 0.9038, - "step": 9805 - }, - { - "epoch": 0.25, - "learning_rate": 1.9848728171465352e-06, - "loss": 1.123, - "step": 9806 - }, - { - "epoch": 0.25, - "learning_rate": 1.984868022067131e-06, - "loss": 0.9482, - "step": 9807 - }, - { - "epoch": 0.25, - "learning_rate": 1.984863226233658e-06, - "loss": 1.0381, - "step": 9808 - }, - { - "epoch": 0.25, - "learning_rate": 1.9848584296461207e-06, - "loss": 1.0801, - "step": 9809 - }, - { - "epoch": 0.25, - "learning_rate": 1.9848536323045225e-06, - "loss": 1.0166, - "step": 9810 - }, - { - "epoch": 0.25, - "learning_rate": 1.9848488342088677e-06, - "loss": 0.6909, - "step": 9811 - }, - { - "epoch": 0.25, - "learning_rate": 1.9848440353591587e-06, - "loss": 0.8545, - "step": 9812 - }, - { - "epoch": 0.25, - "learning_rate": 1.9848392357554007e-06, - "loss": 0.9434, - "step": 9813 - }, - { - "epoch": 0.25, - "learning_rate": 1.9848344353975957e-06, - "loss": 0.9893, - "step": 9814 - }, - { - "epoch": 0.25, - "learning_rate": 1.984829634285749e-06, - "loss": 0.8105, - "step": 9815 - }, - { - "epoch": 0.25, - "learning_rate": 1.984824832419863e-06, - "loss": 1.1211, - "step": 9816 - }, - { - "epoch": 0.25, - "learning_rate": 1.9848200297999423e-06, - "loss": 0.9678, - "step": 9817 - }, - { - "epoch": 0.25, - "learning_rate": 1.9848152264259902e-06, - "loss": 0.624, - "step": 9818 - }, - { - "epoch": 0.25, - "learning_rate": 1.98481042229801e-06, - "loss": 1.2012, - "step": 9819 - }, - { - "epoch": 0.25, - "learning_rate": 1.984805617416006e-06, - "loss": 1.0557, - "step": 9820 - }, - { - "epoch": 0.25, - "learning_rate": 1.9848008117799815e-06, - "loss": 0.9922, - "step": 9821 - }, - { - "epoch": 0.25, - "learning_rate": 1.9847960053899404e-06, - "loss": 0.7622, - "step": 9822 - }, - { - "epoch": 0.25, - "learning_rate": 1.984791198245886e-06, - "loss": 0.7114, - "step": 9823 - }, - { - "epoch": 0.25, - "learning_rate": 1.9847863903478227e-06, - "loss": 0.9189, - "step": 9824 - }, - { - "epoch": 0.25, - "learning_rate": 1.9847815816957537e-06, - "loss": 1.001, - "step": 9825 - }, - { - "epoch": 0.25, - "learning_rate": 1.9847767722896824e-06, - "loss": 0.9404, - "step": 9826 - }, - { - "epoch": 0.25, - "learning_rate": 1.984771962129613e-06, - "loss": 1.0, - "step": 9827 - }, - { - "epoch": 0.25, - "learning_rate": 1.9847671512155487e-06, - "loss": 0.8779, - "step": 9828 - }, - { - "epoch": 0.25, - "learning_rate": 1.984762339547494e-06, - "loss": 1.0088, - "step": 9829 - }, - { - "epoch": 0.25, - "learning_rate": 1.9847575271254517e-06, - "loss": 0.873, - "step": 9830 - }, - { - "epoch": 0.25, - "learning_rate": 1.984752713949426e-06, - "loss": 0.8706, - "step": 9831 - }, - { - "epoch": 0.25, - "learning_rate": 1.9847479000194203e-06, - "loss": 1.0234, - "step": 9832 - }, - { - "epoch": 0.25, - "learning_rate": 1.9847430853354387e-06, - "loss": 0.4941, - "step": 9833 - }, - { - "epoch": 0.25, - "learning_rate": 1.984738269897484e-06, - "loss": 1.0977, - "step": 9834 - }, - { - "epoch": 0.25, - "learning_rate": 1.984733453705561e-06, - "loss": 0.9902, - "step": 9835 - }, - { - "epoch": 0.25, - "learning_rate": 1.984728636759673e-06, - "loss": 0.9219, - "step": 9836 - }, - { - "epoch": 0.25, - "learning_rate": 1.984723819059823e-06, - "loss": 1.1699, - "step": 9837 - }, - { - "epoch": 0.25, - "learning_rate": 1.9847190006060154e-06, - "loss": 0.7988, - "step": 9838 - }, - { - "epoch": 0.25, - "learning_rate": 1.984714181398254e-06, - "loss": 1.0137, - "step": 9839 - }, - { - "epoch": 0.25, - "learning_rate": 1.984709361436542e-06, - "loss": 0.8281, - "step": 9840 - }, - { - "epoch": 0.25, - "learning_rate": 1.9847045407208837e-06, - "loss": 0.8633, - "step": 9841 - }, - { - "epoch": 0.25, - "learning_rate": 1.984699719251282e-06, - "loss": 0.9893, - "step": 9842 - }, - { - "epoch": 0.25, - "learning_rate": 1.984694897027741e-06, - "loss": 0.833, - "step": 9843 - }, - { - "epoch": 0.25, - "learning_rate": 1.9846900740502647e-06, - "loss": 1.1484, - "step": 9844 - }, - { - "epoch": 0.25, - "learning_rate": 1.9846852503188565e-06, - "loss": 0.8975, - "step": 9845 - }, - { - "epoch": 0.25, - "learning_rate": 1.9846804258335197e-06, - "loss": 0.751, - "step": 9846 - }, - { - "epoch": 0.25, - "learning_rate": 1.9846756005942587e-06, - "loss": 0.9287, - "step": 9847 - }, - { - "epoch": 0.25, - "learning_rate": 1.9846707746010765e-06, - "loss": 0.9336, - "step": 9848 - }, - { - "epoch": 0.25, - "learning_rate": 1.9846659478539774e-06, - "loss": 0.8882, - "step": 9849 - }, - { - "epoch": 0.25, - "learning_rate": 1.9846611203529652e-06, - "loss": 1.1914, - "step": 9850 - }, - { - "epoch": 0.25, - "learning_rate": 1.984656292098043e-06, - "loss": 0.8647, - "step": 9851 - }, - { - "epoch": 0.25, - "learning_rate": 1.984651463089214e-06, - "loss": 0.9824, - "step": 9852 - }, - { - "epoch": 0.25, - "learning_rate": 1.984646633326484e-06, - "loss": 0.9219, - "step": 9853 - }, - { - "epoch": 0.25, - "learning_rate": 1.9846418028098544e-06, - "loss": 1.0986, - "step": 9854 - }, - { - "epoch": 0.25, - "learning_rate": 1.9846369715393304e-06, - "loss": 1.0557, - "step": 9855 - }, - { - "epoch": 0.25, - "learning_rate": 1.9846321395149145e-06, - "loss": 0.9697, - "step": 9856 - }, - { - "epoch": 0.25, - "learning_rate": 1.984627306736612e-06, - "loss": 0.8945, - "step": 9857 - }, - { - "epoch": 0.25, - "learning_rate": 1.9846224732044247e-06, - "loss": 0.96, - "step": 9858 - }, - { - "epoch": 0.25, - "learning_rate": 1.9846176389183576e-06, - "loss": 1.0977, - "step": 9859 - }, - { - "epoch": 0.25, - "learning_rate": 1.9846128038784142e-06, - "loss": 0.9355, - "step": 9860 - }, - { - "epoch": 0.25, - "learning_rate": 1.9846079680845975e-06, - "loss": 0.9941, - "step": 9861 - }, - { - "epoch": 0.25, - "learning_rate": 1.9846031315369126e-06, - "loss": 1.1016, - "step": 9862 - }, - { - "epoch": 0.25, - "learning_rate": 1.984598294235362e-06, - "loss": 0.9463, - "step": 9863 - }, - { - "epoch": 0.25, - "learning_rate": 1.9845934561799496e-06, - "loss": 0.7002, - "step": 9864 - }, - { - "epoch": 0.25, - "learning_rate": 1.984588617370679e-06, - "loss": 1.0166, - "step": 9865 - }, - { - "epoch": 0.25, - "learning_rate": 1.984583777807555e-06, - "loss": 1.0801, - "step": 9866 - }, - { - "epoch": 0.25, - "learning_rate": 1.9845789374905796e-06, - "loss": 0.8809, - "step": 9867 - }, - { - "epoch": 0.25, - "learning_rate": 1.984574096419758e-06, - "loss": 0.7832, - "step": 9868 - }, - { - "epoch": 0.25, - "learning_rate": 1.984569254595093e-06, - "loss": 1.041, - "step": 9869 - }, - { - "epoch": 0.25, - "learning_rate": 1.9845644120165884e-06, - "loss": 0.9443, - "step": 9870 - }, - { - "epoch": 0.25, - "learning_rate": 1.9845595686842484e-06, - "loss": 0.7676, - "step": 9871 - }, - { - "epoch": 0.25, - "learning_rate": 1.9845547245980765e-06, - "loss": 0.9189, - "step": 9872 - }, - { - "epoch": 0.25, - "learning_rate": 1.984549879758076e-06, - "loss": 1.0371, - "step": 9873 - }, - { - "epoch": 0.25, - "learning_rate": 1.984545034164251e-06, - "loss": 0.874, - "step": 9874 - }, - { - "epoch": 0.25, - "learning_rate": 1.9845401878166054e-06, - "loss": 1.041, - "step": 9875 - }, - { - "epoch": 0.25, - "learning_rate": 1.9845353407151424e-06, - "loss": 1.001, - "step": 9876 - }, - { - "epoch": 0.25, - "learning_rate": 1.9845304928598662e-06, - "loss": 0.8955, - "step": 9877 - }, - { - "epoch": 0.25, - "learning_rate": 1.98452564425078e-06, - "loss": 1.0068, - "step": 9878 - }, - { - "epoch": 0.25, - "learning_rate": 1.984520794887888e-06, - "loss": 0.9658, - "step": 9879 - }, - { - "epoch": 0.25, - "learning_rate": 1.9845159447711935e-06, - "loss": 0.9038, - "step": 9880 - }, - { - "epoch": 0.25, - "learning_rate": 1.9845110939007007e-06, - "loss": 0.8945, - "step": 9881 - }, - { - "epoch": 0.25, - "learning_rate": 1.984506242276413e-06, - "loss": 1.0693, - "step": 9882 - }, - { - "epoch": 0.25, - "learning_rate": 1.984501389898334e-06, - "loss": 0.7183, - "step": 9883 - }, - { - "epoch": 0.25, - "learning_rate": 1.9844965367664674e-06, - "loss": 1.1465, - "step": 9884 - }, - { - "epoch": 0.25, - "learning_rate": 1.9844916828808168e-06, - "loss": 0.832, - "step": 9885 - }, - { - "epoch": 0.25, - "learning_rate": 1.984486828241387e-06, - "loss": 0.6868, - "step": 9886 - }, - { - "epoch": 0.25, - "learning_rate": 1.9844819728481803e-06, - "loss": 0.9111, - "step": 9887 - }, - { - "epoch": 0.25, - "learning_rate": 1.984477116701201e-06, - "loss": 0.666, - "step": 9888 - }, - { - "epoch": 0.25, - "learning_rate": 1.9844722598004534e-06, - "loss": 0.7856, - "step": 9889 - }, - { - "epoch": 0.25, - "learning_rate": 1.9844674021459403e-06, - "loss": 0.9961, - "step": 9890 - }, - { - "epoch": 0.25, - "learning_rate": 1.9844625437376657e-06, - "loss": 0.8652, - "step": 9891 - }, - { - "epoch": 0.25, - "learning_rate": 1.9844576845756335e-06, - "loss": 0.8203, - "step": 9892 - }, - { - "epoch": 0.25, - "learning_rate": 1.984452824659847e-06, - "loss": 0.8398, - "step": 9893 - }, - { - "epoch": 0.25, - "learning_rate": 1.9844479639903107e-06, - "loss": 0.7646, - "step": 9894 - }, - { - "epoch": 0.25, - "learning_rate": 1.984443102567028e-06, - "loss": 0.9233, - "step": 9895 - }, - { - "epoch": 0.25, - "learning_rate": 1.984438240390002e-06, - "loss": 0.9814, - "step": 9896 - }, - { - "epoch": 0.25, - "learning_rate": 1.984433377459237e-06, - "loss": 0.8887, - "step": 9897 - }, - { - "epoch": 0.25, - "learning_rate": 1.9844285137747366e-06, - "loss": 0.7207, - "step": 9898 - }, - { - "epoch": 0.25, - "learning_rate": 1.984423649336505e-06, - "loss": 1.041, - "step": 9899 - }, - { - "epoch": 0.25, - "learning_rate": 1.984418784144545e-06, - "loss": 0.7065, - "step": 9900 - }, - { - "epoch": 0.25, - "learning_rate": 1.9844139181988608e-06, - "loss": 1.0391, - "step": 9901 - }, - { - "epoch": 0.25, - "learning_rate": 1.9844090514994563e-06, - "loss": 0.6558, - "step": 9902 - }, - { - "epoch": 0.25, - "learning_rate": 1.984404184046335e-06, - "loss": 0.9619, - "step": 9903 - }, - { - "epoch": 0.25, - "learning_rate": 1.984399315839501e-06, - "loss": 0.916, - "step": 9904 - }, - { - "epoch": 0.25, - "learning_rate": 1.984394446878957e-06, - "loss": 0.9746, - "step": 9905 - }, - { - "epoch": 0.25, - "learning_rate": 1.9843895771647083e-06, - "loss": 0.9404, - "step": 9906 - }, - { - "epoch": 0.25, - "learning_rate": 1.984384706696757e-06, - "loss": 0.936, - "step": 9907 - }, - { - "epoch": 0.25, - "learning_rate": 1.984379835475108e-06, - "loss": 0.8428, - "step": 9908 - }, - { - "epoch": 0.25, - "learning_rate": 1.9843749634997646e-06, - "loss": 0.8828, - "step": 9909 - }, - { - "epoch": 0.25, - "learning_rate": 1.9843700907707302e-06, - "loss": 0.8838, - "step": 9910 - }, - { - "epoch": 0.25, - "learning_rate": 1.9843652172880093e-06, - "loss": 0.7754, - "step": 9911 - }, - { - "epoch": 0.25, - "learning_rate": 1.9843603430516053e-06, - "loss": 0.8662, - "step": 9912 - }, - { - "epoch": 0.25, - "learning_rate": 1.9843554680615215e-06, - "loss": 0.8857, - "step": 9913 - }, - { - "epoch": 0.25, - "learning_rate": 1.984350592317762e-06, - "loss": 0.8843, - "step": 9914 - }, - { - "epoch": 0.25, - "learning_rate": 1.9843457158203308e-06, - "loss": 0.7432, - "step": 9915 - }, - { - "epoch": 0.25, - "learning_rate": 1.984340838569231e-06, - "loss": 1.1094, - "step": 9916 - }, - { - "epoch": 0.25, - "learning_rate": 1.9843359605644668e-06, - "loss": 0.9766, - "step": 9917 - }, - { - "epoch": 0.25, - "learning_rate": 1.984331081806042e-06, - "loss": 0.9668, - "step": 9918 - }, - { - "epoch": 0.25, - "learning_rate": 1.98432620229396e-06, - "loss": 0.8799, - "step": 9919 - }, - { - "epoch": 0.25, - "learning_rate": 1.9843213220282247e-06, - "loss": 0.7783, - "step": 9920 - }, - { - "epoch": 0.25, - "learning_rate": 1.9843164410088397e-06, - "loss": 1.1426, - "step": 9921 - }, - { - "epoch": 0.25, - "learning_rate": 1.984311559235809e-06, - "loss": 0.8047, - "step": 9922 - }, - { - "epoch": 0.25, - "learning_rate": 1.9843066767091363e-06, - "loss": 0.9482, - "step": 9923 - }, - { - "epoch": 0.25, - "learning_rate": 1.984301793428825e-06, - "loss": 0.9424, - "step": 9924 - }, - { - "epoch": 0.25, - "learning_rate": 1.9842969093948795e-06, - "loss": 0.8071, - "step": 9925 - }, - { - "epoch": 0.25, - "learning_rate": 1.984292024607303e-06, - "loss": 0.8279, - "step": 9926 - }, - { - "epoch": 0.25, - "learning_rate": 1.984287139066099e-06, - "loss": 0.917, - "step": 9927 - }, - { - "epoch": 0.25, - "learning_rate": 1.9842822527712716e-06, - "loss": 1.0234, - "step": 9928 - }, - { - "epoch": 0.25, - "learning_rate": 1.9842773657228246e-06, - "loss": 0.9404, - "step": 9929 - }, - { - "epoch": 0.25, - "learning_rate": 1.984272477920762e-06, - "loss": 0.9551, - "step": 9930 - }, - { - "epoch": 0.25, - "learning_rate": 1.9842675893650867e-06, - "loss": 0.9648, - "step": 9931 - }, - { - "epoch": 0.25, - "learning_rate": 1.9842627000558034e-06, - "loss": 0.9717, - "step": 9932 - }, - { - "epoch": 0.25, - "learning_rate": 1.9842578099929153e-06, - "loss": 0.96, - "step": 9933 - }, - { - "epoch": 0.25, - "learning_rate": 1.984252919176426e-06, - "loss": 0.8604, - "step": 9934 - }, - { - "epoch": 0.25, - "learning_rate": 1.98424802760634e-06, - "loss": 0.8145, - "step": 9935 - }, - { - "epoch": 0.25, - "learning_rate": 1.9842431352826603e-06, - "loss": 0.8604, - "step": 9936 - }, - { - "epoch": 0.25, - "learning_rate": 1.9842382422053907e-06, - "loss": 1.0244, - "step": 9937 - }, - { - "epoch": 0.25, - "learning_rate": 1.9842333483745354e-06, - "loss": 0.8262, - "step": 9938 - }, - { - "epoch": 0.25, - "learning_rate": 1.9842284537900977e-06, - "loss": 0.8721, - "step": 9939 - }, - { - "epoch": 0.25, - "learning_rate": 1.9842235584520815e-06, - "loss": 0.6067, - "step": 9940 - }, - { - "epoch": 0.25, - "learning_rate": 1.984218662360491e-06, - "loss": 0.9639, - "step": 9941 - }, - { - "epoch": 0.25, - "learning_rate": 1.984213765515329e-06, - "loss": 1.0078, - "step": 9942 - }, - { - "epoch": 0.25, - "learning_rate": 1.9842088679166e-06, - "loss": 1.0107, - "step": 9943 - }, - { - "epoch": 0.25, - "learning_rate": 1.984203969564307e-06, - "loss": 1.0469, - "step": 9944 - }, - { - "epoch": 0.25, - "learning_rate": 1.984199070458455e-06, - "loss": 0.7285, - "step": 9945 - }, - { - "epoch": 0.25, - "learning_rate": 1.9841941705990473e-06, - "loss": 0.9336, - "step": 9946 - }, - { - "epoch": 0.25, - "learning_rate": 1.984189269986087e-06, - "loss": 1.0244, - "step": 9947 - }, - { - "epoch": 0.25, - "learning_rate": 1.984184368619578e-06, - "loss": 0.918, - "step": 9948 - }, - { - "epoch": 0.25, - "learning_rate": 1.984179466499524e-06, - "loss": 0.9043, - "step": 9949 - }, - { - "epoch": 0.26, - "learning_rate": 1.9841745636259295e-06, - "loss": 0.6816, - "step": 9950 - }, - { - "epoch": 0.26, - "learning_rate": 1.9841696599987977e-06, - "loss": 0.7852, - "step": 9951 - }, - { - "epoch": 0.26, - "learning_rate": 1.9841647556181326e-06, - "loss": 0.9639, - "step": 9952 - }, - { - "epoch": 0.26, - "learning_rate": 1.9841598504839377e-06, - "loss": 0.9248, - "step": 9953 - }, - { - "epoch": 0.26, - "learning_rate": 1.9841549445962168e-06, - "loss": 0.96, - "step": 9954 - }, - { - "epoch": 0.26, - "learning_rate": 1.9841500379549737e-06, - "loss": 0.8345, - "step": 9955 - }, - { - "epoch": 0.26, - "learning_rate": 1.984145130560212e-06, - "loss": 0.9121, - "step": 9956 - }, - { - "epoch": 0.26, - "learning_rate": 1.984140222411936e-06, - "loss": 0.9717, - "step": 9957 - }, - { - "epoch": 0.26, - "learning_rate": 1.984135313510149e-06, - "loss": 0.9082, - "step": 9958 - }, - { - "epoch": 0.26, - "learning_rate": 1.984130403854855e-06, - "loss": 1.0498, - "step": 9959 - }, - { - "epoch": 0.26, - "learning_rate": 1.984125493446057e-06, - "loss": 0.8691, - "step": 9960 - }, - { - "epoch": 0.26, - "learning_rate": 1.98412058228376e-06, - "loss": 0.9126, - "step": 9961 - }, - { - "epoch": 0.26, - "learning_rate": 1.984115670367967e-06, - "loss": 0.9102, - "step": 9962 - }, - { - "epoch": 0.26, - "learning_rate": 1.984110757698681e-06, - "loss": 0.917, - "step": 9963 - }, - { - "epoch": 0.26, - "learning_rate": 1.9841058442759077e-06, - "loss": 0.8867, - "step": 9964 - }, - { - "epoch": 0.26, - "learning_rate": 1.9841009300996496e-06, - "loss": 0.7539, - "step": 9965 - }, - { - "epoch": 0.26, - "learning_rate": 1.984096015169911e-06, - "loss": 0.6943, - "step": 9966 - }, - { - "epoch": 0.26, - "learning_rate": 1.9840910994866943e-06, - "loss": 1.0908, - "step": 9967 - }, - { - "epoch": 0.26, - "learning_rate": 1.9840861830500047e-06, - "loss": 0.834, - "step": 9968 - }, - { - "epoch": 0.26, - "learning_rate": 1.984081265859846e-06, - "loss": 0.6274, - "step": 9969 - }, - { - "epoch": 0.26, - "learning_rate": 1.984076347916221e-06, - "loss": 0.9307, - "step": 9970 - }, - { - "epoch": 0.26, - "learning_rate": 1.9840714292191344e-06, - "loss": 1.0996, - "step": 9971 - }, - { - "epoch": 0.26, - "learning_rate": 1.9840665097685894e-06, - "loss": 0.8945, - "step": 9972 - }, - { - "epoch": 0.26, - "learning_rate": 1.98406158956459e-06, - "loss": 0.7686, - "step": 9973 - }, - { - "epoch": 0.26, - "learning_rate": 1.98405666860714e-06, - "loss": 1.1143, - "step": 9974 - }, - { - "epoch": 0.26, - "learning_rate": 1.9840517468962425e-06, - "loss": 1.1055, - "step": 9975 - }, - { - "epoch": 0.26, - "learning_rate": 1.9840468244319025e-06, - "loss": 1.1602, - "step": 9976 - }, - { - "epoch": 0.26, - "learning_rate": 1.9840419012141226e-06, - "loss": 1.0293, - "step": 9977 - }, - { - "epoch": 0.26, - "learning_rate": 1.984036977242907e-06, - "loss": 0.8281, - "step": 9978 - }, - { - "epoch": 0.26, - "learning_rate": 1.98403205251826e-06, - "loss": 0.7861, - "step": 9979 - }, - { - "epoch": 0.26, - "learning_rate": 1.9840271270401847e-06, - "loss": 0.8525, - "step": 9980 - }, - { - "epoch": 0.26, - "learning_rate": 1.9840222008086853e-06, - "loss": 0.623, - "step": 9981 - }, - { - "epoch": 0.26, - "learning_rate": 1.984017273823765e-06, - "loss": 1.0342, - "step": 9982 - }, - { - "epoch": 0.26, - "learning_rate": 1.984012346085428e-06, - "loss": 0.9492, - "step": 9983 - }, - { - "epoch": 0.26, - "learning_rate": 1.984007417593678e-06, - "loss": 0.7852, - "step": 9984 - }, - { - "epoch": 0.26, - "learning_rate": 1.9840024883485186e-06, - "loss": 0.9531, - "step": 9985 - }, - { - "epoch": 0.26, - "learning_rate": 1.983997558349954e-06, - "loss": 0.9023, - "step": 9986 - }, - { - "epoch": 0.26, - "learning_rate": 1.9839926275979875e-06, - "loss": 1.0781, - "step": 9987 - }, - { - "epoch": 0.26, - "learning_rate": 1.9839876960926233e-06, - "loss": 0.7373, - "step": 9988 - }, - { - "epoch": 0.26, - "learning_rate": 1.983982763833865e-06, - "loss": 1.0713, - "step": 9989 - }, - { - "epoch": 0.26, - "learning_rate": 1.9839778308217162e-06, - "loss": 0.8223, - "step": 9990 - }, - { - "epoch": 0.26, - "learning_rate": 1.983972897056181e-06, - "loss": 0.9902, - "step": 9991 - }, - { - "epoch": 0.26, - "learning_rate": 1.983967962537263e-06, - "loss": 1.0117, - "step": 9992 - }, - { - "epoch": 0.26, - "learning_rate": 1.9839630272649653e-06, - "loss": 0.9824, - "step": 9993 - }, - { - "epoch": 0.26, - "learning_rate": 1.9839580912392933e-06, - "loss": 0.8672, - "step": 9994 - }, - { - "epoch": 0.26, - "learning_rate": 1.9839531544602494e-06, - "loss": 1.2695, - "step": 9995 - }, - { - "epoch": 0.26, - "learning_rate": 1.9839482169278375e-06, - "loss": 1.1426, - "step": 9996 - }, - { - "epoch": 0.26, - "learning_rate": 1.9839432786420622e-06, - "loss": 1.0713, - "step": 9997 - }, - { - "epoch": 0.26, - "learning_rate": 1.9839383396029265e-06, - "loss": 0.8125, - "step": 9998 - }, - { - "epoch": 0.26, - "learning_rate": 1.9839333998104347e-06, - "loss": 0.9385, - "step": 9999 - }, - { - "epoch": 0.26, - "learning_rate": 1.98392845926459e-06, - "loss": 0.8252, - "step": 10000 - }, - { - "epoch": 0.26, - "learning_rate": 1.9839235179653967e-06, - "loss": 0.8003, - "step": 10001 - }, - { - "epoch": 0.26, - "learning_rate": 1.9839185759128587e-06, - "loss": 0.7197, - "step": 10002 - }, - { - "epoch": 0.26, - "learning_rate": 1.983913633106979e-06, - "loss": 0.9688, - "step": 10003 - }, - { - "epoch": 0.26, - "learning_rate": 1.983908689547762e-06, - "loss": 1.041, - "step": 10004 - }, - { - "epoch": 0.26, - "learning_rate": 1.9839037452352114e-06, - "loss": 0.9365, - "step": 10005 - }, - { - "epoch": 0.26, - "learning_rate": 1.9838988001693313e-06, - "loss": 0.7334, - "step": 10006 - }, - { - "epoch": 0.26, - "learning_rate": 1.9838938543501246e-06, - "loss": 0.7178, - "step": 10007 - }, - { - "epoch": 0.26, - "learning_rate": 1.983888907777596e-06, - "loss": 0.8301, - "step": 10008 - }, - { - "epoch": 0.26, - "learning_rate": 1.983883960451749e-06, - "loss": 0.9375, - "step": 10009 - }, - { - "epoch": 0.26, - "learning_rate": 1.9838790123725868e-06, - "loss": 1.0332, - "step": 10010 - }, - { - "epoch": 0.26, - "learning_rate": 1.9838740635401137e-06, - "loss": 0.9736, - "step": 10011 - }, - { - "epoch": 0.26, - "learning_rate": 1.9838691139543337e-06, - "loss": 1.0303, - "step": 10012 - }, - { - "epoch": 0.26, - "learning_rate": 1.9838641636152503e-06, - "loss": 0.9448, - "step": 10013 - }, - { - "epoch": 0.26, - "learning_rate": 1.9838592125228675e-06, - "loss": 1.0264, - "step": 10014 - }, - { - "epoch": 0.26, - "learning_rate": 1.9838542606771887e-06, - "loss": 1.1133, - "step": 10015 - }, - { - "epoch": 0.26, - "learning_rate": 1.983849308078218e-06, - "loss": 0.7732, - "step": 10016 - }, - { - "epoch": 0.26, - "learning_rate": 1.983844354725959e-06, - "loss": 0.75, - "step": 10017 - }, - { - "epoch": 0.26, - "learning_rate": 1.983839400620416e-06, - "loss": 1.0098, - "step": 10018 - }, - { - "epoch": 0.26, - "learning_rate": 1.983834445761592e-06, - "loss": 0.8257, - "step": 10019 - }, - { - "epoch": 0.26, - "learning_rate": 1.9838294901494916e-06, - "loss": 1.0498, - "step": 10020 - }, - { - "epoch": 0.26, - "learning_rate": 1.983824533784118e-06, - "loss": 0.9375, - "step": 10021 - }, - { - "epoch": 0.26, - "learning_rate": 1.983819576665475e-06, - "loss": 0.9043, - "step": 10022 - }, - { - "epoch": 0.26, - "learning_rate": 1.9838146187935672e-06, - "loss": 1.0283, - "step": 10023 - }, - { - "epoch": 0.26, - "learning_rate": 1.983809660168397e-06, - "loss": 0.7183, - "step": 10024 - }, - { - "epoch": 0.26, - "learning_rate": 1.9838047007899697e-06, - "loss": 0.9434, - "step": 10025 - }, - { - "epoch": 0.26, - "learning_rate": 1.9837997406582876e-06, - "loss": 0.793, - "step": 10026 - }, - { - "epoch": 0.26, - "learning_rate": 1.983794779773356e-06, - "loss": 0.9502, - "step": 10027 - }, - { - "epoch": 0.26, - "learning_rate": 1.9837898181351777e-06, - "loss": 0.7549, - "step": 10028 - }, - { - "epoch": 0.26, - "learning_rate": 1.9837848557437565e-06, - "loss": 0.8564, - "step": 10029 - }, - { - "epoch": 0.26, - "learning_rate": 1.983779892599097e-06, - "loss": 1.001, - "step": 10030 - }, - { - "epoch": 0.26, - "learning_rate": 1.983774928701202e-06, - "loss": 0.9629, - "step": 10031 - }, - { - "epoch": 0.26, - "learning_rate": 1.983769964050076e-06, - "loss": 0.7061, - "step": 10032 - }, - { - "epoch": 0.26, - "learning_rate": 1.9837649986457227e-06, - "loss": 0.9229, - "step": 10033 - }, - { - "epoch": 0.26, - "learning_rate": 1.9837600324881453e-06, - "loss": 0.916, - "step": 10034 - }, - { - "epoch": 0.26, - "learning_rate": 1.9837550655773486e-06, - "loss": 0.7119, - "step": 10035 - }, - { - "epoch": 0.26, - "learning_rate": 1.983750097913336e-06, - "loss": 0.9004, - "step": 10036 - }, - { - "epoch": 0.26, - "learning_rate": 1.9837451294961105e-06, - "loss": 0.7559, - "step": 10037 - }, - { - "epoch": 0.26, - "learning_rate": 1.9837401603256767e-06, - "loss": 0.9707, - "step": 10038 - }, - { - "epoch": 0.26, - "learning_rate": 1.983735190402039e-06, - "loss": 1.0566, - "step": 10039 - }, - { - "epoch": 0.26, - "learning_rate": 1.9837302197251997e-06, - "loss": 0.9678, - "step": 10040 - }, - { - "epoch": 0.26, - "learning_rate": 1.9837252482951637e-06, - "loss": 0.8438, - "step": 10041 - }, - { - "epoch": 0.26, - "learning_rate": 1.9837202761119346e-06, - "loss": 1.0264, - "step": 10042 - }, - { - "epoch": 0.26, - "learning_rate": 1.9837153031755157e-06, - "loss": 0.8252, - "step": 10043 - }, - { - "epoch": 0.26, - "learning_rate": 1.9837103294859117e-06, - "loss": 0.7646, - "step": 10044 - }, - { - "epoch": 0.26, - "learning_rate": 1.983705355043126e-06, - "loss": 0.9316, - "step": 10045 - }, - { - "epoch": 0.26, - "learning_rate": 1.983700379847162e-06, - "loss": 0.8047, - "step": 10046 - }, - { - "epoch": 0.26, - "learning_rate": 1.9836954038980244e-06, - "loss": 0.9814, - "step": 10047 - }, - { - "epoch": 0.26, - "learning_rate": 1.9836904271957157e-06, - "loss": 0.9346, - "step": 10048 - }, - { - "epoch": 0.26, - "learning_rate": 1.983685449740241e-06, - "loss": 0.7183, - "step": 10049 - }, - { - "epoch": 0.26, - "learning_rate": 1.9836804715316035e-06, - "loss": 1.0146, - "step": 10050 - }, - { - "epoch": 0.26, - "learning_rate": 1.983675492569807e-06, - "loss": 1.0898, - "step": 10051 - }, - { - "epoch": 0.26, - "learning_rate": 1.9836705128548552e-06, - "loss": 0.8613, - "step": 10052 - }, - { - "epoch": 0.26, - "learning_rate": 1.9836655323867524e-06, - "loss": 0.916, - "step": 10053 - }, - { - "epoch": 0.26, - "learning_rate": 1.983660551165502e-06, - "loss": 0.9873, - "step": 10054 - }, - { - "epoch": 0.26, - "learning_rate": 1.9836555691911082e-06, - "loss": 1.0205, - "step": 10055 - }, - { - "epoch": 0.26, - "learning_rate": 1.983650586463574e-06, - "loss": 1.1758, - "step": 10056 - }, - { - "epoch": 0.26, - "learning_rate": 1.9836456029829046e-06, - "loss": 0.834, - "step": 10057 - }, - { - "epoch": 0.26, - "learning_rate": 1.9836406187491025e-06, - "loss": 0.8359, - "step": 10058 - }, - { - "epoch": 0.26, - "learning_rate": 1.983635633762172e-06, - "loss": 0.9346, - "step": 10059 - }, - { - "epoch": 0.26, - "learning_rate": 1.983630648022117e-06, - "loss": 0.917, - "step": 10060 - }, - { - "epoch": 0.26, - "learning_rate": 1.983625661528941e-06, - "loss": 0.7803, - "step": 10061 - }, - { - "epoch": 0.26, - "learning_rate": 1.9836206742826483e-06, - "loss": 1.0859, - "step": 10062 - }, - { - "epoch": 0.26, - "learning_rate": 1.9836156862832426e-06, - "loss": 0.8691, - "step": 10063 - }, - { - "epoch": 0.26, - "learning_rate": 1.9836106975307272e-06, - "loss": 0.9453, - "step": 10064 - }, - { - "epoch": 0.26, - "learning_rate": 1.983605708025107e-06, - "loss": 0.7979, - "step": 10065 - }, - { - "epoch": 0.26, - "learning_rate": 1.9836007177663843e-06, - "loss": 0.8428, - "step": 10066 - }, - { - "epoch": 0.26, - "learning_rate": 1.9835957267545644e-06, - "loss": 0.8594, - "step": 10067 - }, - { - "epoch": 0.26, - "learning_rate": 1.98359073498965e-06, - "loss": 0.793, - "step": 10068 - }, - { - "epoch": 0.26, - "learning_rate": 1.983585742471646e-06, - "loss": 0.8325, - "step": 10069 - }, - { - "epoch": 0.26, - "learning_rate": 1.9835807492005553e-06, - "loss": 0.9043, - "step": 10070 - }, - { - "epoch": 0.26, - "learning_rate": 1.9835757551763817e-06, - "loss": 0.731, - "step": 10071 - }, - { - "epoch": 0.26, - "learning_rate": 1.9835707603991297e-06, - "loss": 0.9854, - "step": 10072 - }, - { - "epoch": 0.26, - "learning_rate": 1.983565764868803e-06, - "loss": 0.9629, - "step": 10073 - }, - { - "epoch": 0.26, - "learning_rate": 1.9835607685854047e-06, - "loss": 1.1221, - "step": 10074 - }, - { - "epoch": 0.26, - "learning_rate": 1.9835557715489393e-06, - "loss": 0.8926, - "step": 10075 - }, - { - "epoch": 0.26, - "learning_rate": 1.9835507737594108e-06, - "loss": 0.8486, - "step": 10076 - }, - { - "epoch": 0.26, - "learning_rate": 1.9835457752168225e-06, - "loss": 1.0625, - "step": 10077 - }, - { - "epoch": 0.26, - "learning_rate": 1.9835407759211783e-06, - "loss": 0.918, - "step": 10078 - }, - { - "epoch": 0.26, - "learning_rate": 1.9835357758724825e-06, - "loss": 1.0762, - "step": 10079 - }, - { - "epoch": 0.26, - "learning_rate": 1.9835307750707383e-06, - "loss": 0.7852, - "step": 10080 - }, - { - "epoch": 0.26, - "learning_rate": 1.9835257735159497e-06, - "loss": 0.9648, - "step": 10081 - }, - { - "epoch": 0.26, - "learning_rate": 1.983520771208121e-06, - "loss": 1.0605, - "step": 10082 - }, - { - "epoch": 0.26, - "learning_rate": 1.9835157681472556e-06, - "loss": 0.8481, - "step": 10083 - }, - { - "epoch": 0.26, - "learning_rate": 1.9835107643333573e-06, - "loss": 0.9102, - "step": 10084 - }, - { - "epoch": 0.26, - "learning_rate": 1.9835057597664297e-06, - "loss": 0.8623, - "step": 10085 - }, - { - "epoch": 0.26, - "learning_rate": 1.9835007544464776e-06, - "loss": 0.9619, - "step": 10086 - }, - { - "epoch": 0.26, - "learning_rate": 1.983495748373504e-06, - "loss": 0.8994, - "step": 10087 - }, - { - "epoch": 0.26, - "learning_rate": 1.9834907415475123e-06, - "loss": 0.9087, - "step": 10088 - }, - { - "epoch": 0.26, - "learning_rate": 1.9834857339685076e-06, - "loss": 1.0078, - "step": 10089 - }, - { - "epoch": 0.26, - "learning_rate": 1.983480725636493e-06, - "loss": 0.9424, - "step": 10090 - }, - { - "epoch": 0.26, - "learning_rate": 1.9834757165514724e-06, - "loss": 0.8174, - "step": 10091 - }, - { - "epoch": 0.26, - "learning_rate": 1.9834707067134495e-06, - "loss": 1.0947, - "step": 10092 - }, - { - "epoch": 0.26, - "learning_rate": 1.9834656961224287e-06, - "loss": 1.0283, - "step": 10093 - }, - { - "epoch": 0.26, - "learning_rate": 1.983460684778413e-06, - "loss": 0.8916, - "step": 10094 - }, - { - "epoch": 0.26, - "learning_rate": 1.983455672681407e-06, - "loss": 1.0078, - "step": 10095 - }, - { - "epoch": 0.26, - "learning_rate": 1.983450659831414e-06, - "loss": 0.7437, - "step": 10096 - }, - { - "epoch": 0.26, - "learning_rate": 1.983445646228438e-06, - "loss": 1.1309, - "step": 10097 - }, - { - "epoch": 0.26, - "learning_rate": 1.983440631872483e-06, - "loss": 1.002, - "step": 10098 - }, - { - "epoch": 0.26, - "learning_rate": 1.9834356167635527e-06, - "loss": 0.873, - "step": 10099 - }, - { - "epoch": 0.26, - "learning_rate": 1.9834306009016513e-06, - "loss": 0.9106, - "step": 10100 - }, - { - "epoch": 0.26, - "learning_rate": 1.983425584286782e-06, - "loss": 1.0049, - "step": 10101 - }, - { - "epoch": 0.26, - "learning_rate": 1.983420566918949e-06, - "loss": 1.1025, - "step": 10102 - }, - { - "epoch": 0.26, - "learning_rate": 1.983415548798156e-06, - "loss": 0.9033, - "step": 10103 - }, - { - "epoch": 0.26, - "learning_rate": 1.983410529924407e-06, - "loss": 1.04, - "step": 10104 - }, - { - "epoch": 0.26, - "learning_rate": 1.9834055102977056e-06, - "loss": 0.8027, - "step": 10105 - }, - { - "epoch": 0.26, - "learning_rate": 1.983400489918056e-06, - "loss": 1.0518, - "step": 10106 - }, - { - "epoch": 0.26, - "learning_rate": 1.983395468785462e-06, - "loss": 1.082, - "step": 10107 - }, - { - "epoch": 0.26, - "learning_rate": 1.983390446899927e-06, - "loss": 0.7646, - "step": 10108 - }, - { - "epoch": 0.26, - "learning_rate": 1.9833854242614554e-06, - "loss": 1.0596, - "step": 10109 - }, - { - "epoch": 0.26, - "learning_rate": 1.9833804008700506e-06, - "loss": 0.8011, - "step": 10110 - }, - { - "epoch": 0.26, - "learning_rate": 1.983375376725717e-06, - "loss": 0.9814, - "step": 10111 - }, - { - "epoch": 0.26, - "learning_rate": 1.9833703518284576e-06, - "loss": 0.7432, - "step": 10112 - }, - { - "epoch": 0.26, - "learning_rate": 1.983365326178277e-06, - "loss": 1.0078, - "step": 10113 - }, - { - "epoch": 0.26, - "learning_rate": 1.9833602997751787e-06, - "loss": 0.9609, - "step": 10114 - }, - { - "epoch": 0.26, - "learning_rate": 1.9833552726191666e-06, - "loss": 0.9609, - "step": 10115 - }, - { - "epoch": 0.26, - "learning_rate": 1.983350244710245e-06, - "loss": 0.9756, - "step": 10116 - }, - { - "epoch": 0.26, - "learning_rate": 1.9833452160484167e-06, - "loss": 0.8867, - "step": 10117 - }, - { - "epoch": 0.26, - "learning_rate": 1.9833401866336865e-06, - "loss": 0.8877, - "step": 10118 - }, - { - "epoch": 0.26, - "learning_rate": 1.983335156466058e-06, - "loss": 1.167, - "step": 10119 - }, - { - "epoch": 0.26, - "learning_rate": 1.983330125545535e-06, - "loss": 0.8008, - "step": 10120 - }, - { - "epoch": 0.26, - "learning_rate": 1.9833250938721212e-06, - "loss": 0.8047, - "step": 10121 - }, - { - "epoch": 0.26, - "learning_rate": 1.983320061445821e-06, - "loss": 0.8398, - "step": 10122 - }, - { - "epoch": 0.26, - "learning_rate": 1.983315028266637e-06, - "loss": 0.5034, - "step": 10123 - }, - { - "epoch": 0.26, - "learning_rate": 1.9833099943345744e-06, - "loss": 1.0859, - "step": 10124 - }, - { - "epoch": 0.26, - "learning_rate": 1.9833049596496366e-06, - "loss": 0.8252, - "step": 10125 - }, - { - "epoch": 0.26, - "learning_rate": 1.9832999242118276e-06, - "loss": 0.6182, - "step": 10126 - }, - { - "epoch": 0.26, - "learning_rate": 1.9832948880211506e-06, - "loss": 0.8428, - "step": 10127 - }, - { - "epoch": 0.26, - "learning_rate": 1.98328985107761e-06, - "loss": 0.7676, - "step": 10128 - }, - { - "epoch": 0.26, - "learning_rate": 1.9832848133812097e-06, - "loss": 1.0068, - "step": 10129 - }, - { - "epoch": 0.26, - "learning_rate": 1.9832797749319538e-06, - "loss": 0.8452, - "step": 10130 - }, - { - "epoch": 0.26, - "learning_rate": 1.983274735729845e-06, - "loss": 0.9082, - "step": 10131 - }, - { - "epoch": 0.26, - "learning_rate": 1.9832696957748886e-06, - "loss": 0.9453, - "step": 10132 - }, - { - "epoch": 0.26, - "learning_rate": 1.983264655067088e-06, - "loss": 0.7085, - "step": 10133 - }, - { - "epoch": 0.26, - "learning_rate": 1.983259613606446e-06, - "loss": 0.9688, - "step": 10134 - }, - { - "epoch": 0.26, - "learning_rate": 1.983254571392968e-06, - "loss": 1.0, - "step": 10135 - }, - { - "epoch": 0.26, - "learning_rate": 1.983249528426657e-06, - "loss": 1.127, - "step": 10136 - }, - { - "epoch": 0.26, - "learning_rate": 1.983244484707517e-06, - "loss": 1.0039, - "step": 10137 - }, - { - "epoch": 0.26, - "learning_rate": 1.9832394402355517e-06, - "loss": 0.77, - "step": 10138 - }, - { - "epoch": 0.26, - "learning_rate": 1.9832343950107652e-06, - "loss": 0.7734, - "step": 10139 - }, - { - "epoch": 0.26, - "learning_rate": 1.9832293490331617e-06, - "loss": 0.834, - "step": 10140 - }, - { - "epoch": 0.26, - "learning_rate": 1.9832243023027446e-06, - "loss": 1.209, - "step": 10141 - }, - { - "epoch": 0.26, - "learning_rate": 1.9832192548195176e-06, - "loss": 0.9224, - "step": 10142 - }, - { - "epoch": 0.26, - "learning_rate": 1.983214206583485e-06, - "loss": 1.1025, - "step": 10143 - }, - { - "epoch": 0.26, - "learning_rate": 1.9832091575946506e-06, - "loss": 0.9023, - "step": 10144 - }, - { - "epoch": 0.26, - "learning_rate": 1.9832041078530178e-06, - "loss": 0.5852, - "step": 10145 - }, - { - "epoch": 0.26, - "learning_rate": 1.983199057358591e-06, - "loss": 0.9521, - "step": 10146 - }, - { - "epoch": 0.26, - "learning_rate": 1.9831940061113742e-06, - "loss": 0.9307, - "step": 10147 - }, - { - "epoch": 0.26, - "learning_rate": 1.9831889541113703e-06, - "loss": 0.8369, - "step": 10148 - }, - { - "epoch": 0.26, - "learning_rate": 1.9831839013585845e-06, - "loss": 0.9561, - "step": 10149 - }, - { - "epoch": 0.26, - "learning_rate": 1.9831788478530197e-06, - "loss": 0.7988, - "step": 10150 - }, - { - "epoch": 0.26, - "learning_rate": 1.9831737935946803e-06, - "loss": 1.042, - "step": 10151 - }, - { - "epoch": 0.26, - "learning_rate": 1.9831687385835695e-06, - "loss": 0.8125, - "step": 10152 - }, - { - "epoch": 0.26, - "learning_rate": 1.983163682819692e-06, - "loss": 1.0264, - "step": 10153 - }, - { - "epoch": 0.26, - "learning_rate": 1.983158626303051e-06, - "loss": 0.9512, - "step": 10154 - }, - { - "epoch": 0.26, - "learning_rate": 1.983153569033651e-06, - "loss": 0.8975, - "step": 10155 - }, - { - "epoch": 0.26, - "learning_rate": 1.983148511011495e-06, - "loss": 1.0381, - "step": 10156 - }, - { - "epoch": 0.26, - "learning_rate": 1.983143452236588e-06, - "loss": 0.9043, - "step": 10157 - }, - { - "epoch": 0.26, - "learning_rate": 1.9831383927089327e-06, - "loss": 0.918, - "step": 10158 - }, - { - "epoch": 0.26, - "learning_rate": 1.9831333324285338e-06, - "loss": 1.0898, - "step": 10159 - }, - { - "epoch": 0.26, - "learning_rate": 1.983128271395395e-06, - "loss": 0.9473, - "step": 10160 - }, - { - "epoch": 0.26, - "learning_rate": 1.9831232096095198e-06, - "loss": 0.8945, - "step": 10161 - }, - { - "epoch": 0.26, - "learning_rate": 1.9831181470709123e-06, - "loss": 1.0781, - "step": 10162 - }, - { - "epoch": 0.26, - "learning_rate": 1.9831130837795768e-06, - "loss": 0.96, - "step": 10163 - }, - { - "epoch": 0.26, - "learning_rate": 1.983108019735517e-06, - "loss": 1.0791, - "step": 10164 - }, - { - "epoch": 0.26, - "learning_rate": 1.983102954938736e-06, - "loss": 0.9404, - "step": 10165 - }, - { - "epoch": 0.26, - "learning_rate": 1.9830978893892383e-06, - "loss": 0.6255, - "step": 10166 - }, - { - "epoch": 0.26, - "learning_rate": 1.9830928230870284e-06, - "loss": 1.1006, - "step": 10167 - }, - { - "epoch": 0.26, - "learning_rate": 1.983087756032109e-06, - "loss": 0.959, - "step": 10168 - }, - { - "epoch": 0.26, - "learning_rate": 1.9830826882244845e-06, - "loss": 0.8838, - "step": 10169 - }, - { - "epoch": 0.26, - "learning_rate": 1.9830776196641593e-06, - "loss": 0.9512, - "step": 10170 - }, - { - "epoch": 0.26, - "learning_rate": 1.983072550351136e-06, - "loss": 1.0977, - "step": 10171 - }, - { - "epoch": 0.26, - "learning_rate": 1.98306748028542e-06, - "loss": 0.9658, - "step": 10172 - }, - { - "epoch": 0.26, - "learning_rate": 1.9830624094670138e-06, - "loss": 1.0352, - "step": 10173 - }, - { - "epoch": 0.26, - "learning_rate": 1.9830573378959223e-06, - "loss": 0.71, - "step": 10174 - }, - { - "epoch": 0.26, - "learning_rate": 1.983052265572149e-06, - "loss": 0.7783, - "step": 10175 - }, - { - "epoch": 0.26, - "learning_rate": 1.9830471924956976e-06, - "loss": 1.2266, - "step": 10176 - }, - { - "epoch": 0.26, - "learning_rate": 1.983042118666572e-06, - "loss": 1.0488, - "step": 10177 - }, - { - "epoch": 0.26, - "learning_rate": 1.9830370440847766e-06, - "loss": 0.7393, - "step": 10178 - }, - { - "epoch": 0.26, - "learning_rate": 1.983031968750315e-06, - "loss": 1.0078, - "step": 10179 - }, - { - "epoch": 0.26, - "learning_rate": 1.983026892663191e-06, - "loss": 0.7935, - "step": 10180 - }, - { - "epoch": 0.26, - "learning_rate": 1.9830218158234083e-06, - "loss": 0.8682, - "step": 10181 - }, - { - "epoch": 0.26, - "learning_rate": 1.983016738230971e-06, - "loss": 0.8994, - "step": 10182 - }, - { - "epoch": 0.26, - "learning_rate": 1.983011659885883e-06, - "loss": 1.1191, - "step": 10183 - }, - { - "epoch": 0.26, - "learning_rate": 1.983006580788148e-06, - "loss": 0.8408, - "step": 10184 - }, - { - "epoch": 0.26, - "learning_rate": 1.9830015009377703e-06, - "loss": 0.8926, - "step": 10185 - }, - { - "epoch": 0.26, - "learning_rate": 1.982996420334754e-06, - "loss": 1.0801, - "step": 10186 - }, - { - "epoch": 0.26, - "learning_rate": 1.982991338979102e-06, - "loss": 0.917, - "step": 10187 - }, - { - "epoch": 0.26, - "learning_rate": 1.9829862568708185e-06, - "loss": 0.8926, - "step": 10188 - }, - { - "epoch": 0.26, - "learning_rate": 1.982981174009908e-06, - "loss": 0.9922, - "step": 10189 - }, - { - "epoch": 0.26, - "learning_rate": 1.9829760903963744e-06, - "loss": 0.9795, - "step": 10190 - }, - { - "epoch": 0.26, - "learning_rate": 1.9829710060302204e-06, - "loss": 1.0068, - "step": 10191 - }, - { - "epoch": 0.26, - "learning_rate": 1.982965920911451e-06, - "loss": 0.9307, - "step": 10192 - }, - { - "epoch": 0.26, - "learning_rate": 1.9829608350400696e-06, - "loss": 1.0371, - "step": 10193 - }, - { - "epoch": 0.26, - "learning_rate": 1.9829557484160807e-06, - "loss": 0.9336, - "step": 10194 - }, - { - "epoch": 0.26, - "learning_rate": 1.982950661039488e-06, - "loss": 0.8452, - "step": 10195 - }, - { - "epoch": 0.26, - "learning_rate": 1.9829455729102947e-06, - "loss": 0.8223, - "step": 10196 - }, - { - "epoch": 0.26, - "learning_rate": 1.9829404840285048e-06, - "loss": 0.9053, - "step": 10197 - }, - { - "epoch": 0.26, - "learning_rate": 1.9829353943941235e-06, - "loss": 1.0371, - "step": 10198 - }, - { - "epoch": 0.26, - "learning_rate": 1.982930304007153e-06, - "loss": 0.9473, - "step": 10199 - }, - { - "epoch": 0.26, - "learning_rate": 1.9829252128675986e-06, - "loss": 1.0283, - "step": 10200 - }, - { - "epoch": 0.26, - "learning_rate": 1.982920120975463e-06, - "loss": 0.7871, - "step": 10201 - }, - { - "epoch": 0.26, - "learning_rate": 1.9829150283307507e-06, - "loss": 0.9385, - "step": 10202 - }, - { - "epoch": 0.26, - "learning_rate": 1.982909934933466e-06, - "loss": 0.9307, - "step": 10203 - }, - { - "epoch": 0.26, - "learning_rate": 1.982904840783612e-06, - "loss": 0.9604, - "step": 10204 - }, - { - "epoch": 0.26, - "learning_rate": 1.982899745881193e-06, - "loss": 0.8291, - "step": 10205 - }, - { - "epoch": 0.26, - "learning_rate": 1.982894650226213e-06, - "loss": 0.9341, - "step": 10206 - }, - { - "epoch": 0.26, - "learning_rate": 1.9828895538186754e-06, - "loss": 0.8789, - "step": 10207 - }, - { - "epoch": 0.26, - "learning_rate": 1.9828844566585847e-06, - "loss": 0.9746, - "step": 10208 - }, - { - "epoch": 0.26, - "learning_rate": 1.9828793587459446e-06, - "loss": 1.043, - "step": 10209 - }, - { - "epoch": 0.26, - "learning_rate": 1.982874260080759e-06, - "loss": 0.8735, - "step": 10210 - }, - { - "epoch": 0.26, - "learning_rate": 1.9828691606630316e-06, - "loss": 0.8926, - "step": 10211 - }, - { - "epoch": 0.26, - "learning_rate": 1.9828640604927667e-06, - "loss": 0.9766, - "step": 10212 - }, - { - "epoch": 0.26, - "learning_rate": 1.982858959569968e-06, - "loss": 1.0723, - "step": 10213 - }, - { - "epoch": 0.26, - "learning_rate": 1.982853857894639e-06, - "loss": 0.9473, - "step": 10214 - }, - { - "epoch": 0.26, - "learning_rate": 1.9828487554667844e-06, - "loss": 1.0439, - "step": 10215 - }, - { - "epoch": 0.26, - "learning_rate": 1.982843652286408e-06, - "loss": 0.8301, - "step": 10216 - }, - { - "epoch": 0.26, - "learning_rate": 1.982838548353513e-06, - "loss": 0.8809, - "step": 10217 - }, - { - "epoch": 0.26, - "learning_rate": 1.9828334436681033e-06, - "loss": 0.8623, - "step": 10218 - }, - { - "epoch": 0.26, - "learning_rate": 1.9828283382301837e-06, - "loss": 1.2178, - "step": 10219 - }, - { - "epoch": 0.26, - "learning_rate": 1.9828232320397575e-06, - "loss": 0.9033, - "step": 10220 - }, - { - "epoch": 0.26, - "learning_rate": 1.982818125096829e-06, - "loss": 0.8965, - "step": 10221 - }, - { - "epoch": 0.26, - "learning_rate": 1.9828130174014017e-06, - "loss": 1.0215, - "step": 10222 - }, - { - "epoch": 0.26, - "learning_rate": 1.9828079089534794e-06, - "loss": 0.915, - "step": 10223 - }, - { - "epoch": 0.26, - "learning_rate": 1.9828027997530665e-06, - "loss": 0.9111, - "step": 10224 - }, - { - "epoch": 0.26, - "learning_rate": 1.982797689800167e-06, - "loss": 0.8594, - "step": 10225 - }, - { - "epoch": 0.26, - "learning_rate": 1.982792579094784e-06, - "loss": 0.8677, - "step": 10226 - }, - { - "epoch": 0.26, - "learning_rate": 1.982787467636922e-06, - "loss": 0.9365, - "step": 10227 - }, - { - "epoch": 0.26, - "learning_rate": 1.9827823554265848e-06, - "loss": 0.9404, - "step": 10228 - }, - { - "epoch": 0.26, - "learning_rate": 1.9827772424637765e-06, - "loss": 0.4443, - "step": 10229 - }, - { - "epoch": 0.26, - "learning_rate": 1.982772128748501e-06, - "loss": 0.8965, - "step": 10230 - }, - { - "epoch": 0.26, - "learning_rate": 1.9827670142807617e-06, - "loss": 0.8848, - "step": 10231 - }, - { - "epoch": 0.26, - "learning_rate": 1.982761899060563e-06, - "loss": 0.9424, - "step": 10232 - }, - { - "epoch": 0.26, - "learning_rate": 1.982756783087909e-06, - "loss": 0.8418, - "step": 10233 - }, - { - "epoch": 0.26, - "learning_rate": 1.982751666362803e-06, - "loss": 1.0098, - "step": 10234 - }, - { - "epoch": 0.26, - "learning_rate": 1.9827465488852493e-06, - "loss": 0.9209, - "step": 10235 - }, - { - "epoch": 0.26, - "learning_rate": 1.982741430655252e-06, - "loss": 0.9248, - "step": 10236 - }, - { - "epoch": 0.26, - "learning_rate": 1.982736311672814e-06, - "loss": 1.0117, - "step": 10237 - }, - { - "epoch": 0.26, - "learning_rate": 1.9827311919379406e-06, - "loss": 1.0283, - "step": 10238 - }, - { - "epoch": 0.26, - "learning_rate": 1.982726071450635e-06, - "loss": 0.9863, - "step": 10239 - }, - { - "epoch": 0.26, - "learning_rate": 1.9827209502109015e-06, - "loss": 0.9668, - "step": 10240 - }, - { - "epoch": 0.26, - "learning_rate": 1.9827158282187436e-06, - "loss": 1.0254, - "step": 10241 - }, - { - "epoch": 0.26, - "learning_rate": 1.982710705474165e-06, - "loss": 0.9131, - "step": 10242 - }, - { - "epoch": 0.26, - "learning_rate": 1.9827055819771706e-06, - "loss": 0.8281, - "step": 10243 - }, - { - "epoch": 0.26, - "learning_rate": 1.9827004577277635e-06, - "loss": 0.8438, - "step": 10244 - }, - { - "epoch": 0.26, - "learning_rate": 1.9826953327259476e-06, - "loss": 1.04, - "step": 10245 - }, - { - "epoch": 0.26, - "learning_rate": 1.9826902069717276e-06, - "loss": 0.8633, - "step": 10246 - }, - { - "epoch": 0.26, - "learning_rate": 1.9826850804651064e-06, - "loss": 1.082, - "step": 10247 - }, - { - "epoch": 0.26, - "learning_rate": 1.9826799532060887e-06, - "loss": 0.752, - "step": 10248 - }, - { - "epoch": 0.26, - "learning_rate": 1.982674825194678e-06, - "loss": 0.8828, - "step": 10249 - }, - { - "epoch": 0.26, - "learning_rate": 1.9826696964308783e-06, - "loss": 1.002, - "step": 10250 - }, - { - "epoch": 0.26, - "learning_rate": 1.9826645669146936e-06, - "loss": 0.9736, - "step": 10251 - }, - { - "epoch": 0.26, - "learning_rate": 1.982659436646128e-06, - "loss": 1.085, - "step": 10252 - }, - { - "epoch": 0.26, - "learning_rate": 1.982654305625185e-06, - "loss": 0.9883, - "step": 10253 - }, - { - "epoch": 0.26, - "learning_rate": 1.9826491738518693e-06, - "loss": 0.8818, - "step": 10254 - }, - { - "epoch": 0.26, - "learning_rate": 1.9826440413261838e-06, - "loss": 0.9043, - "step": 10255 - }, - { - "epoch": 0.26, - "learning_rate": 1.982638908048133e-06, - "loss": 0.8408, - "step": 10256 - }, - { - "epoch": 0.26, - "learning_rate": 1.982633774017721e-06, - "loss": 0.8501, - "step": 10257 - }, - { - "epoch": 0.26, - "learning_rate": 1.982628639234951e-06, - "loss": 0.811, - "step": 10258 - }, - { - "epoch": 0.26, - "learning_rate": 1.982623503699828e-06, - "loss": 0.8521, - "step": 10259 - }, - { - "epoch": 0.26, - "learning_rate": 1.9826183674123552e-06, - "loss": 0.7627, - "step": 10260 - }, - { - "epoch": 0.26, - "learning_rate": 1.9826132303725367e-06, - "loss": 0.9355, - "step": 10261 - }, - { - "epoch": 0.26, - "learning_rate": 1.9826080925803764e-06, - "loss": 0.9033, - "step": 10262 - }, - { - "epoch": 0.26, - "learning_rate": 1.982602954035878e-06, - "loss": 1.0557, - "step": 10263 - }, - { - "epoch": 0.26, - "learning_rate": 1.982597814739046e-06, - "loss": 0.8955, - "step": 10264 - }, - { - "epoch": 0.26, - "learning_rate": 1.9825926746898844e-06, - "loss": 1.0049, - "step": 10265 - }, - { - "epoch": 0.26, - "learning_rate": 1.982587533888396e-06, - "loss": 0.7205, - "step": 10266 - }, - { - "epoch": 0.26, - "learning_rate": 1.982582392334586e-06, - "loss": 0.7046, - "step": 10267 - }, - { - "epoch": 0.26, - "learning_rate": 1.982577250028458e-06, - "loss": 1.0439, - "step": 10268 - }, - { - "epoch": 0.26, - "learning_rate": 1.982572106970015e-06, - "loss": 1.0205, - "step": 10269 - }, - { - "epoch": 0.26, - "learning_rate": 1.9825669631592625e-06, - "loss": 0.9746, - "step": 10270 - }, - { - "epoch": 0.26, - "learning_rate": 1.9825618185962033e-06, - "loss": 0.7451, - "step": 10271 - }, - { - "epoch": 0.26, - "learning_rate": 1.982556673280842e-06, - "loss": 0.7002, - "step": 10272 - }, - { - "epoch": 0.26, - "learning_rate": 1.982551527213182e-06, - "loss": 1.0439, - "step": 10273 - }, - { - "epoch": 0.26, - "learning_rate": 1.982546380393227e-06, - "loss": 0.8877, - "step": 10274 - }, - { - "epoch": 0.26, - "learning_rate": 1.982541232820982e-06, - "loss": 0.8906, - "step": 10275 - }, - { - "epoch": 0.26, - "learning_rate": 1.9825360844964504e-06, - "loss": 0.9883, - "step": 10276 - }, - { - "epoch": 0.26, - "learning_rate": 1.982530935419636e-06, - "loss": 1.0225, - "step": 10277 - }, - { - "epoch": 0.26, - "learning_rate": 1.982525785590543e-06, - "loss": 1.0381, - "step": 10278 - }, - { - "epoch": 0.26, - "learning_rate": 1.9825206350091747e-06, - "loss": 0.8848, - "step": 10279 - }, - { - "epoch": 0.26, - "learning_rate": 1.982515483675536e-06, - "loss": 0.9756, - "step": 10280 - }, - { - "epoch": 0.26, - "learning_rate": 1.9825103315896298e-06, - "loss": 0.8145, - "step": 10281 - }, - { - "epoch": 0.26, - "learning_rate": 1.9825051787514614e-06, - "loss": 0.7739, - "step": 10282 - }, - { - "epoch": 0.26, - "learning_rate": 1.9825000251610333e-06, - "loss": 0.7622, - "step": 10283 - }, - { - "epoch": 0.26, - "learning_rate": 1.9824948708183506e-06, - "loss": 0.8115, - "step": 10284 - }, - { - "epoch": 0.26, - "learning_rate": 1.9824897157234163e-06, - "loss": 0.8896, - "step": 10285 - }, - { - "epoch": 0.26, - "learning_rate": 1.982484559876235e-06, - "loss": 0.833, - "step": 10286 - }, - { - "epoch": 0.26, - "learning_rate": 1.9824794032768104e-06, - "loss": 0.9062, - "step": 10287 - }, - { - "epoch": 0.26, - "learning_rate": 1.9824742459251465e-06, - "loss": 0.8154, - "step": 10288 - }, - { - "epoch": 0.26, - "learning_rate": 1.9824690878212474e-06, - "loss": 0.9463, - "step": 10289 - }, - { - "epoch": 0.26, - "learning_rate": 1.9824639289651166e-06, - "loss": 0.7402, - "step": 10290 - }, - { - "epoch": 0.26, - "learning_rate": 1.9824587693567587e-06, - "loss": 0.9629, - "step": 10291 - }, - { - "epoch": 0.26, - "learning_rate": 1.982453608996177e-06, - "loss": 1.2344, - "step": 10292 - }, - { - "epoch": 0.26, - "learning_rate": 1.982448447883376e-06, - "loss": 0.8008, - "step": 10293 - }, - { - "epoch": 0.26, - "learning_rate": 1.9824432860183594e-06, - "loss": 1.1494, - "step": 10294 - }, - { - "epoch": 0.26, - "learning_rate": 1.982438123401131e-06, - "loss": 0.7915, - "step": 10295 - }, - { - "epoch": 0.26, - "learning_rate": 1.9824329600316947e-06, - "loss": 0.8662, - "step": 10296 - }, - { - "epoch": 0.26, - "learning_rate": 1.982427795910055e-06, - "loss": 0.8608, - "step": 10297 - }, - { - "epoch": 0.26, - "learning_rate": 1.9824226310362152e-06, - "loss": 0.9395, - "step": 10298 - }, - { - "epoch": 0.26, - "learning_rate": 1.98241746541018e-06, - "loss": 1.0684, - "step": 10299 - }, - { - "epoch": 0.26, - "learning_rate": 1.9824122990319523e-06, - "loss": 1.0322, - "step": 10300 - }, - { - "epoch": 0.26, - "learning_rate": 1.9824071319015374e-06, - "loss": 1.1611, - "step": 10301 - }, - { - "epoch": 0.26, - "learning_rate": 1.982401964018938e-06, - "loss": 0.7871, - "step": 10302 - }, - { - "epoch": 0.26, - "learning_rate": 1.982396795384159e-06, - "loss": 0.9326, - "step": 10303 - }, - { - "epoch": 0.26, - "learning_rate": 1.9823916259972037e-06, - "loss": 0.8701, - "step": 10304 - }, - { - "epoch": 0.26, - "learning_rate": 1.982386455858076e-06, - "loss": 0.7422, - "step": 10305 - }, - { - "epoch": 0.26, - "learning_rate": 1.982381284966781e-06, - "loss": 0.6772, - "step": 10306 - }, - { - "epoch": 0.26, - "learning_rate": 1.9823761133233213e-06, - "loss": 0.7617, - "step": 10307 - }, - { - "epoch": 0.26, - "learning_rate": 1.9823709409277013e-06, - "loss": 1.0337, - "step": 10308 - }, - { - "epoch": 0.26, - "learning_rate": 1.982365767779925e-06, - "loss": 1.001, - "step": 10309 - }, - { - "epoch": 0.26, - "learning_rate": 1.9823605938799965e-06, - "loss": 0.8994, - "step": 10310 - }, - { - "epoch": 0.26, - "learning_rate": 1.9823554192279197e-06, - "loss": 0.8213, - "step": 10311 - }, - { - "epoch": 0.26, - "learning_rate": 1.9823502438236983e-06, - "loss": 0.7253, - "step": 10312 - }, - { - "epoch": 0.26, - "learning_rate": 1.982345067667337e-06, - "loss": 0.8403, - "step": 10313 - }, - { - "epoch": 0.26, - "learning_rate": 1.9823398907588387e-06, - "loss": 0.8047, - "step": 10314 - }, - { - "epoch": 0.26, - "learning_rate": 1.982334713098208e-06, - "loss": 1.2227, - "step": 10315 - }, - { - "epoch": 0.26, - "learning_rate": 1.982329534685449e-06, - "loss": 0.9482, - "step": 10316 - }, - { - "epoch": 0.26, - "learning_rate": 1.9823243555205657e-06, - "loss": 0.7639, - "step": 10317 - }, - { - "epoch": 0.26, - "learning_rate": 1.9823191756035612e-06, - "loss": 0.9609, - "step": 10318 - }, - { - "epoch": 0.26, - "learning_rate": 1.9823139949344406e-06, - "loss": 0.9834, - "step": 10319 - }, - { - "epoch": 0.26, - "learning_rate": 1.9823088135132073e-06, - "loss": 0.9883, - "step": 10320 - }, - { - "epoch": 0.26, - "learning_rate": 1.982303631339865e-06, - "loss": 0.7153, - "step": 10321 - }, - { - "epoch": 0.26, - "learning_rate": 1.982298448414418e-06, - "loss": 1.1318, - "step": 10322 - }, - { - "epoch": 0.26, - "learning_rate": 1.9822932647368706e-06, - "loss": 0.9102, - "step": 10323 - }, - { - "epoch": 0.26, - "learning_rate": 1.982288080307226e-06, - "loss": 0.7764, - "step": 10324 - }, - { - "epoch": 0.26, - "learning_rate": 1.9822828951254887e-06, - "loss": 0.9316, - "step": 10325 - }, - { - "epoch": 0.26, - "learning_rate": 1.982277709191663e-06, - "loss": 0.7441, - "step": 10326 - }, - { - "epoch": 0.26, - "learning_rate": 1.9822725225057516e-06, - "loss": 1.0029, - "step": 10327 - }, - { - "epoch": 0.26, - "learning_rate": 1.98226733506776e-06, - "loss": 0.646, - "step": 10328 - }, - { - "epoch": 0.26, - "learning_rate": 1.982262146877691e-06, - "loss": 0.5181, - "step": 10329 - }, - { - "epoch": 0.26, - "learning_rate": 1.9822569579355493e-06, - "loss": 0.9561, - "step": 10330 - }, - { - "epoch": 0.26, - "learning_rate": 1.9822517682413383e-06, - "loss": 0.8525, - "step": 10331 - }, - { - "epoch": 0.26, - "learning_rate": 1.982246577795063e-06, - "loss": 0.9336, - "step": 10332 - }, - { - "epoch": 0.26, - "learning_rate": 1.9822413865967257e-06, - "loss": 0.8052, - "step": 10333 - }, - { - "epoch": 0.26, - "learning_rate": 1.9822361946463324e-06, - "loss": 1.0352, - "step": 10334 - }, - { - "epoch": 0.26, - "learning_rate": 1.982231001943885e-06, - "loss": 0.79, - "step": 10335 - }, - { - "epoch": 0.26, - "learning_rate": 1.982225808489389e-06, - "loss": 0.6455, - "step": 10336 - }, - { - "epoch": 0.26, - "learning_rate": 1.982220614282848e-06, - "loss": 1.0977, - "step": 10337 - }, - { - "epoch": 0.26, - "learning_rate": 1.9822154193242654e-06, - "loss": 0.7891, - "step": 10338 - }, - { - "epoch": 0.26, - "learning_rate": 1.982210223613646e-06, - "loss": 1.0293, - "step": 10339 - }, - { - "epoch": 0.27, - "learning_rate": 1.982205027150993e-06, - "loss": 0.8867, - "step": 10340 - }, - { - "epoch": 0.27, - "learning_rate": 1.982199829936311e-06, - "loss": 0.8877, - "step": 10341 - }, - { - "epoch": 0.27, - "learning_rate": 1.982194631969604e-06, - "loss": 0.8599, - "step": 10342 - }, - { - "epoch": 0.27, - "learning_rate": 1.9821894332508754e-06, - "loss": 0.8652, - "step": 10343 - }, - { - "epoch": 0.27, - "learning_rate": 1.9821842337801298e-06, - "loss": 0.8223, - "step": 10344 - }, - { - "epoch": 0.27, - "learning_rate": 1.9821790335573705e-06, - "loss": 0.8701, - "step": 10345 - }, - { - "epoch": 0.27, - "learning_rate": 1.9821738325826018e-06, - "loss": 0.9551, - "step": 10346 - }, - { - "epoch": 0.27, - "learning_rate": 1.982168630855828e-06, - "loss": 0.9775, - "step": 10347 - }, - { - "epoch": 0.27, - "learning_rate": 1.982163428377053e-06, - "loss": 0.958, - "step": 10348 - }, - { - "epoch": 0.27, - "learning_rate": 1.9821582251462807e-06, - "loss": 0.9209, - "step": 10349 - }, - { - "epoch": 0.27, - "learning_rate": 1.9821530211635146e-06, - "loss": 0.8193, - "step": 10350 - }, - { - "epoch": 0.27, - "learning_rate": 1.9821478164287595e-06, - "loss": 0.9775, - "step": 10351 - }, - { - "epoch": 0.27, - "learning_rate": 1.9821426109420186e-06, - "loss": 0.6221, - "step": 10352 - }, - { - "epoch": 0.27, - "learning_rate": 1.9821374047032963e-06, - "loss": 1.1152, - "step": 10353 - }, - { - "epoch": 0.27, - "learning_rate": 1.982132197712597e-06, - "loss": 0.9053, - "step": 10354 - }, - { - "epoch": 0.27, - "learning_rate": 1.982126989969924e-06, - "loss": 1.1475, - "step": 10355 - }, - { - "epoch": 0.27, - "learning_rate": 1.9821217814752814e-06, - "loss": 0.8799, - "step": 10356 - }, - { - "epoch": 0.27, - "learning_rate": 1.982116572228673e-06, - "loss": 0.7275, - "step": 10357 - }, - { - "epoch": 0.27, - "learning_rate": 1.9821113622301037e-06, - "loss": 0.8936, - "step": 10358 - }, - { - "epoch": 0.27, - "learning_rate": 1.9821061514795765e-06, - "loss": 0.9102, - "step": 10359 - }, - { - "epoch": 0.27, - "learning_rate": 1.982100939977096e-06, - "loss": 0.9365, - "step": 10360 - }, - { - "epoch": 0.27, - "learning_rate": 1.982095727722666e-06, - "loss": 0.6919, - "step": 10361 - }, - { - "epoch": 0.27, - "learning_rate": 1.98209051471629e-06, - "loss": 1.1367, - "step": 10362 - }, - { - "epoch": 0.27, - "learning_rate": 1.982085300957973e-06, - "loss": 1.1172, - "step": 10363 - }, - { - "epoch": 0.27, - "learning_rate": 1.9820800864477183e-06, - "loss": 1.0527, - "step": 10364 - }, - { - "epoch": 0.27, - "learning_rate": 1.9820748711855303e-06, - "loss": 0.6191, - "step": 10365 - }, - { - "epoch": 0.27, - "learning_rate": 1.982069655171412e-06, - "loss": 1.0273, - "step": 10366 - }, - { - "epoch": 0.27, - "learning_rate": 1.982064438405369e-06, - "loss": 0.9707, - "step": 10367 - }, - { - "epoch": 0.27, - "learning_rate": 1.9820592208874037e-06, - "loss": 1.0596, - "step": 10368 - }, - { - "epoch": 0.27, - "learning_rate": 1.982054002617521e-06, - "loss": 0.7534, - "step": 10369 - }, - { - "epoch": 0.27, - "learning_rate": 1.982048783595725e-06, - "loss": 0.8369, - "step": 10370 - }, - { - "epoch": 0.27, - "learning_rate": 1.9820435638220188e-06, - "loss": 0.5999, - "step": 10371 - }, - { - "epoch": 0.27, - "learning_rate": 1.9820383432964074e-06, - "loss": 1.0391, - "step": 10372 - }, - { - "epoch": 0.27, - "learning_rate": 1.9820331220188943e-06, - "loss": 0.7764, - "step": 10373 - }, - { - "epoch": 0.27, - "learning_rate": 1.982027899989484e-06, - "loss": 0.7363, - "step": 10374 - }, - { - "epoch": 0.27, - "learning_rate": 1.9820226772081793e-06, - "loss": 0.6836, - "step": 10375 - }, - { - "epoch": 0.27, - "learning_rate": 1.9820174536749857e-06, - "loss": 0.9834, - "step": 10376 - }, - { - "epoch": 0.27, - "learning_rate": 1.9820122293899062e-06, - "loss": 0.9194, - "step": 10377 - }, - { - "epoch": 0.27, - "learning_rate": 1.982007004352945e-06, - "loss": 1.0879, - "step": 10378 - }, - { - "epoch": 0.27, - "learning_rate": 1.9820017785641063e-06, - "loss": 1.1309, - "step": 10379 - }, - { - "epoch": 0.27, - "learning_rate": 1.9819965520233942e-06, - "loss": 0.8037, - "step": 10380 - }, - { - "epoch": 0.27, - "learning_rate": 1.981991324730812e-06, - "loss": 0.8301, - "step": 10381 - }, - { - "epoch": 0.27, - "learning_rate": 1.9819860966863646e-06, - "loss": 0.9902, - "step": 10382 - }, - { - "epoch": 0.27, - "learning_rate": 1.9819808678900554e-06, - "loss": 0.4985, - "step": 10383 - }, - { - "epoch": 0.27, - "learning_rate": 1.981975638341889e-06, - "loss": 0.7568, - "step": 10384 - }, - { - "epoch": 0.27, - "learning_rate": 1.9819704080418685e-06, - "loss": 0.7842, - "step": 10385 - }, - { - "epoch": 0.27, - "learning_rate": 1.9819651769899987e-06, - "loss": 0.8672, - "step": 10386 - }, - { - "epoch": 0.27, - "learning_rate": 1.981959945186283e-06, - "loss": 0.8359, - "step": 10387 - }, - { - "epoch": 0.27, - "learning_rate": 1.981954712630726e-06, - "loss": 0.9658, - "step": 10388 - }, - { - "epoch": 0.27, - "learning_rate": 1.9819494793233316e-06, - "loss": 0.7188, - "step": 10389 - }, - { - "epoch": 0.27, - "learning_rate": 1.9819442452641035e-06, - "loss": 0.834, - "step": 10390 - }, - { - "epoch": 0.27, - "learning_rate": 1.9819390104530456e-06, - "loss": 0.9824, - "step": 10391 - }, - { - "epoch": 0.27, - "learning_rate": 1.9819337748901625e-06, - "loss": 0.8916, - "step": 10392 - }, - { - "epoch": 0.27, - "learning_rate": 1.9819285385754572e-06, - "loss": 0.8584, - "step": 10393 - }, - { - "epoch": 0.27, - "learning_rate": 1.9819233015089353e-06, - "loss": 1.0098, - "step": 10394 - }, - { - "epoch": 0.27, - "learning_rate": 1.981918063690599e-06, - "loss": 0.8828, - "step": 10395 - }, - { - "epoch": 0.27, - "learning_rate": 1.981912825120454e-06, - "loss": 1.0068, - "step": 10396 - }, - { - "epoch": 0.27, - "learning_rate": 1.981907585798503e-06, - "loss": 0.9736, - "step": 10397 - }, - { - "epoch": 0.27, - "learning_rate": 1.98190234572475e-06, - "loss": 0.79, - "step": 10398 - }, - { - "epoch": 0.27, - "learning_rate": 1.9818971048992006e-06, - "loss": 0.8848, - "step": 10399 - }, - { - "epoch": 0.27, - "learning_rate": 1.981891863321857e-06, - "loss": 0.8223, - "step": 10400 - }, - { - "epoch": 0.27, - "learning_rate": 1.9818866209927245e-06, - "loss": 0.8467, - "step": 10401 - }, - { - "epoch": 0.27, - "learning_rate": 1.981881377911806e-06, - "loss": 0.9893, - "step": 10402 - }, - { - "epoch": 0.27, - "learning_rate": 1.9818761340791066e-06, - "loss": 1.0293, - "step": 10403 - }, - { - "epoch": 0.27, - "learning_rate": 1.9818708894946298e-06, - "loss": 0.9346, - "step": 10404 - }, - { - "epoch": 0.27, - "learning_rate": 1.981865644158379e-06, - "loss": 0.793, - "step": 10405 - }, - { - "epoch": 0.27, - "learning_rate": 1.9818603980703594e-06, - "loss": 0.8926, - "step": 10406 - }, - { - "epoch": 0.27, - "learning_rate": 1.9818551512305743e-06, - "loss": 1.0918, - "step": 10407 - }, - { - "epoch": 0.27, - "learning_rate": 1.9818499036390276e-06, - "loss": 0.9248, - "step": 10408 - }, - { - "epoch": 0.27, - "learning_rate": 1.9818446552957235e-06, - "loss": 0.9375, - "step": 10409 - }, - { - "epoch": 0.27, - "learning_rate": 1.9818394062006666e-06, - "loss": 0.9453, - "step": 10410 - }, - { - "epoch": 0.27, - "learning_rate": 1.98183415635386e-06, - "loss": 0.8828, - "step": 10411 - }, - { - "epoch": 0.27, - "learning_rate": 1.9818289057553085e-06, - "loss": 0.751, - "step": 10412 - }, - { - "epoch": 0.27, - "learning_rate": 1.9818236544050154e-06, - "loss": 0.8594, - "step": 10413 - }, - { - "epoch": 0.27, - "learning_rate": 1.9818184023029852e-06, - "loss": 1.0, - "step": 10414 - }, - { - "epoch": 0.27, - "learning_rate": 1.9818131494492218e-06, - "loss": 0.8408, - "step": 10415 - }, - { - "epoch": 0.27, - "learning_rate": 1.9818078958437293e-06, - "loss": 1.0254, - "step": 10416 - }, - { - "epoch": 0.27, - "learning_rate": 1.9818026414865116e-06, - "loss": 1.0723, - "step": 10417 - }, - { - "epoch": 0.27, - "learning_rate": 1.981797386377573e-06, - "loss": 0.5859, - "step": 10418 - }, - { - "epoch": 0.27, - "learning_rate": 1.9817921305169165e-06, - "loss": 0.9326, - "step": 10419 - }, - { - "epoch": 0.27, - "learning_rate": 1.9817868739045477e-06, - "loss": 0.9512, - "step": 10420 - }, - { - "epoch": 0.27, - "learning_rate": 1.9817816165404693e-06, - "loss": 1.0908, - "step": 10421 - }, - { - "epoch": 0.27, - "learning_rate": 1.9817763584246865e-06, - "loss": 0.8394, - "step": 10422 - }, - { - "epoch": 0.27, - "learning_rate": 1.981771099557202e-06, - "loss": 1.0508, - "step": 10423 - }, - { - "epoch": 0.27, - "learning_rate": 1.981765839938021e-06, - "loss": 0.8218, - "step": 10424 - }, - { - "epoch": 0.27, - "learning_rate": 1.9817605795671466e-06, - "loss": 0.9263, - "step": 10425 - }, - { - "epoch": 0.27, - "learning_rate": 1.9817553184445836e-06, - "loss": 0.8848, - "step": 10426 - }, - { - "epoch": 0.27, - "learning_rate": 1.9817500565703356e-06, - "loss": 0.6201, - "step": 10427 - }, - { - "epoch": 0.27, - "learning_rate": 1.9817447939444068e-06, - "loss": 0.8779, - "step": 10428 - }, - { - "epoch": 0.27, - "learning_rate": 1.981739530566801e-06, - "loss": 0.8555, - "step": 10429 - }, - { - "epoch": 0.27, - "learning_rate": 1.9817342664375226e-06, - "loss": 0.8374, - "step": 10430 - }, - { - "epoch": 0.27, - "learning_rate": 1.9817290015565753e-06, - "loss": 0.897, - "step": 10431 - }, - { - "epoch": 0.27, - "learning_rate": 1.9817237359239633e-06, - "loss": 0.9248, - "step": 10432 - }, - { - "epoch": 0.27, - "learning_rate": 1.9817184695396904e-06, - "loss": 1.1494, - "step": 10433 - }, - { - "epoch": 0.27, - "learning_rate": 1.981713202403761e-06, - "loss": 0.9219, - "step": 10434 - }, - { - "epoch": 0.27, - "learning_rate": 1.9817079345161787e-06, - "loss": 0.8799, - "step": 10435 - }, - { - "epoch": 0.27, - "learning_rate": 1.981702665876948e-06, - "loss": 0.9385, - "step": 10436 - }, - { - "epoch": 0.27, - "learning_rate": 1.9816973964860727e-06, - "loss": 1.0215, - "step": 10437 - }, - { - "epoch": 0.27, - "learning_rate": 1.9816921263435566e-06, - "loss": 0.9238, - "step": 10438 - }, - { - "epoch": 0.27, - "learning_rate": 1.9816868554494042e-06, - "loss": 0.7822, - "step": 10439 - }, - { - "epoch": 0.27, - "learning_rate": 1.9816815838036194e-06, - "loss": 1.0078, - "step": 10440 - }, - { - "epoch": 0.27, - "learning_rate": 1.981676311406206e-06, - "loss": 0.9121, - "step": 10441 - }, - { - "epoch": 0.27, - "learning_rate": 1.981671038257168e-06, - "loss": 1.0718, - "step": 10442 - }, - { - "epoch": 0.27, - "learning_rate": 1.98166576435651e-06, - "loss": 0.9775, - "step": 10443 - }, - { - "epoch": 0.27, - "learning_rate": 1.9816604897042356e-06, - "loss": 0.689, - "step": 10444 - }, - { - "epoch": 0.27, - "learning_rate": 1.9816552143003485e-06, - "loss": 0.9053, - "step": 10445 - }, - { - "epoch": 0.27, - "learning_rate": 1.9816499381448535e-06, - "loss": 0.9443, - "step": 10446 - }, - { - "epoch": 0.27, - "learning_rate": 1.9816446612377544e-06, - "loss": 1.1562, - "step": 10447 - }, - { - "epoch": 0.27, - "learning_rate": 1.9816393835790546e-06, - "loss": 0.958, - "step": 10448 - }, - { - "epoch": 0.27, - "learning_rate": 1.981634105168759e-06, - "loss": 0.9346, - "step": 10449 - }, - { - "epoch": 0.27, - "learning_rate": 1.9816288260068715e-06, - "loss": 0.9844, - "step": 10450 - }, - { - "epoch": 0.27, - "learning_rate": 1.981623546093396e-06, - "loss": 0.7563, - "step": 10451 - }, - { - "epoch": 0.27, - "learning_rate": 1.981618265428336e-06, - "loss": 0.9023, - "step": 10452 - }, - { - "epoch": 0.27, - "learning_rate": 1.981612984011696e-06, - "loss": 0.7944, - "step": 10453 - }, - { - "epoch": 0.27, - "learning_rate": 1.9816077018434806e-06, - "loss": 0.9893, - "step": 10454 - }, - { - "epoch": 0.27, - "learning_rate": 1.981602418923693e-06, - "loss": 0.999, - "step": 10455 - }, - { - "epoch": 0.27, - "learning_rate": 1.9815971352523376e-06, - "loss": 0.8774, - "step": 10456 - }, - { - "epoch": 0.27, - "learning_rate": 1.9815918508294186e-06, - "loss": 1.0791, - "step": 10457 - }, - { - "epoch": 0.27, - "learning_rate": 1.9815865656549395e-06, - "loss": 0.9307, - "step": 10458 - }, - { - "epoch": 0.27, - "learning_rate": 1.981581279728905e-06, - "loss": 1.0234, - "step": 10459 - }, - { - "epoch": 0.27, - "learning_rate": 1.9815759930513186e-06, - "loss": 0.8926, - "step": 10460 - }, - { - "epoch": 0.27, - "learning_rate": 1.981570705622185e-06, - "loss": 1.0586, - "step": 10461 - }, - { - "epoch": 0.27, - "learning_rate": 1.9815654174415075e-06, - "loss": 1.043, - "step": 10462 - }, - { - "epoch": 0.27, - "learning_rate": 1.9815601285092904e-06, - "loss": 1.0312, - "step": 10463 - }, - { - "epoch": 0.27, - "learning_rate": 1.981554838825538e-06, - "loss": 0.7996, - "step": 10464 - }, - { - "epoch": 0.27, - "learning_rate": 1.981549548390254e-06, - "loss": 0.8315, - "step": 10465 - }, - { - "epoch": 0.27, - "learning_rate": 1.9815442572034433e-06, - "loss": 0.8125, - "step": 10466 - }, - { - "epoch": 0.27, - "learning_rate": 1.981538965265109e-06, - "loss": 0.9346, - "step": 10467 - }, - { - "epoch": 0.27, - "learning_rate": 1.981533672575255e-06, - "loss": 0.9824, - "step": 10468 - }, - { - "epoch": 0.27, - "learning_rate": 1.981528379133886e-06, - "loss": 1.0947, - "step": 10469 - }, - { - "epoch": 0.27, - "learning_rate": 1.9815230849410056e-06, - "loss": 1.1025, - "step": 10470 - }, - { - "epoch": 0.27, - "learning_rate": 1.981517789996619e-06, - "loss": 1.1113, - "step": 10471 - }, - { - "epoch": 0.27, - "learning_rate": 1.9815124943007287e-06, - "loss": 0.8633, - "step": 10472 - }, - { - "epoch": 0.27, - "learning_rate": 1.9815071978533397e-06, - "loss": 0.7578, - "step": 10473 - }, - { - "epoch": 0.27, - "learning_rate": 1.9815019006544555e-06, - "loss": 1.0986, - "step": 10474 - }, - { - "epoch": 0.27, - "learning_rate": 1.9814966027040802e-06, - "loss": 0.8799, - "step": 10475 - }, - { - "epoch": 0.27, - "learning_rate": 1.9814913040022186e-06, - "loss": 1.0596, - "step": 10476 - }, - { - "epoch": 0.27, - "learning_rate": 1.981486004548874e-06, - "loss": 0.8613, - "step": 10477 - }, - { - "epoch": 0.27, - "learning_rate": 1.9814807043440507e-06, - "loss": 0.6587, - "step": 10478 - }, - { - "epoch": 0.27, - "learning_rate": 1.981475403387753e-06, - "loss": 1.0059, - "step": 10479 - }, - { - "epoch": 0.27, - "learning_rate": 1.9814701016799844e-06, - "loss": 0.7305, - "step": 10480 - }, - { - "epoch": 0.27, - "learning_rate": 1.9814647992207494e-06, - "loss": 1.0527, - "step": 10481 - }, - { - "epoch": 0.27, - "learning_rate": 1.9814594960100518e-06, - "loss": 1.0859, - "step": 10482 - }, - { - "epoch": 0.27, - "learning_rate": 1.981454192047896e-06, - "loss": 0.7754, - "step": 10483 - }, - { - "epoch": 0.27, - "learning_rate": 1.9814488873342856e-06, - "loss": 0.7202, - "step": 10484 - }, - { - "epoch": 0.27, - "learning_rate": 1.981443581869225e-06, - "loss": 0.7979, - "step": 10485 - }, - { - "epoch": 0.27, - "learning_rate": 1.9814382756527183e-06, - "loss": 0.9141, - "step": 10486 - }, - { - "epoch": 0.27, - "learning_rate": 1.9814329686847693e-06, - "loss": 0.9404, - "step": 10487 - }, - { - "epoch": 0.27, - "learning_rate": 1.9814276609653823e-06, - "loss": 0.9404, - "step": 10488 - }, - { - "epoch": 0.27, - "learning_rate": 1.9814223524945613e-06, - "loss": 0.8018, - "step": 10489 - }, - { - "epoch": 0.27, - "learning_rate": 1.9814170432723104e-06, - "loss": 0.9258, - "step": 10490 - }, - { - "epoch": 0.27, - "learning_rate": 1.981411733298633e-06, - "loss": 1.1484, - "step": 10491 - }, - { - "epoch": 0.27, - "learning_rate": 1.9814064225735345e-06, - "loss": 0.9385, - "step": 10492 - }, - { - "epoch": 0.27, - "learning_rate": 1.981401111097018e-06, - "loss": 0.958, - "step": 10493 - }, - { - "epoch": 0.27, - "learning_rate": 1.9813957988690876e-06, - "loss": 1.0576, - "step": 10494 - }, - { - "epoch": 0.27, - "learning_rate": 1.9813904858897483e-06, - "loss": 0.8521, - "step": 10495 - }, - { - "epoch": 0.27, - "learning_rate": 1.9813851721590023e-06, - "loss": 0.9697, - "step": 10496 - }, - { - "epoch": 0.27, - "learning_rate": 1.981379857676856e-06, - "loss": 0.9824, - "step": 10497 - }, - { - "epoch": 0.27, - "learning_rate": 1.981374542443311e-06, - "loss": 0.6826, - "step": 10498 - }, - { - "epoch": 0.27, - "learning_rate": 1.9813692264583733e-06, - "loss": 0.5854, - "step": 10499 - }, - { - "epoch": 0.27, - "learning_rate": 1.9813639097220465e-06, - "loss": 0.834, - "step": 10500 - }, - { - "epoch": 0.27, - "learning_rate": 1.981358592234334e-06, - "loss": 0.6577, - "step": 10501 - }, - { - "epoch": 0.27, - "learning_rate": 1.981353273995241e-06, - "loss": 0.8481, - "step": 10502 - }, - { - "epoch": 0.27, - "learning_rate": 1.98134795500477e-06, - "loss": 1.1094, - "step": 10503 - }, - { - "epoch": 0.27, - "learning_rate": 1.981342635262927e-06, - "loss": 0.9209, - "step": 10504 - }, - { - "epoch": 0.27, - "learning_rate": 1.9813373147697145e-06, - "loss": 0.9814, - "step": 10505 - }, - { - "epoch": 0.27, - "learning_rate": 1.981331993525137e-06, - "loss": 0.9062, - "step": 10506 - }, - { - "epoch": 0.27, - "learning_rate": 1.981326671529199e-06, - "loss": 0.877, - "step": 10507 - }, - { - "epoch": 0.27, - "learning_rate": 1.981321348781904e-06, - "loss": 1.0156, - "step": 10508 - }, - { - "epoch": 0.27, - "learning_rate": 1.9813160252832567e-06, - "loss": 0.7354, - "step": 10509 - }, - { - "epoch": 0.27, - "learning_rate": 1.9813107010332606e-06, - "loss": 1.1396, - "step": 10510 - }, - { - "epoch": 0.27, - "learning_rate": 1.9813053760319204e-06, - "loss": 1.0225, - "step": 10511 - }, - { - "epoch": 0.27, - "learning_rate": 1.9813000502792396e-06, - "loss": 0.9678, - "step": 10512 - }, - { - "epoch": 0.27, - "learning_rate": 1.9812947237752223e-06, - "loss": 1.0166, - "step": 10513 - }, - { - "epoch": 0.27, - "learning_rate": 1.9812893965198733e-06, - "loss": 0.8711, - "step": 10514 - }, - { - "epoch": 0.27, - "learning_rate": 1.9812840685131955e-06, - "loss": 1.0234, - "step": 10515 - }, - { - "epoch": 0.27, - "learning_rate": 1.981278739755194e-06, - "loss": 0.9443, - "step": 10516 - }, - { - "epoch": 0.27, - "learning_rate": 1.981273410245872e-06, - "loss": 1.0859, - "step": 10517 - }, - { - "epoch": 0.27, - "learning_rate": 1.9812680799852343e-06, - "loss": 1.0703, - "step": 10518 - }, - { - "epoch": 0.27, - "learning_rate": 1.981262748973285e-06, - "loss": 0.8115, - "step": 10519 - }, - { - "epoch": 0.27, - "learning_rate": 1.9812574172100277e-06, - "loss": 0.8779, - "step": 10520 - }, - { - "epoch": 0.27, - "learning_rate": 1.981252084695467e-06, - "loss": 0.9248, - "step": 10521 - }, - { - "epoch": 0.27, - "learning_rate": 1.9812467514296063e-06, - "loss": 0.9824, - "step": 10522 - }, - { - "epoch": 0.27, - "learning_rate": 1.98124141741245e-06, - "loss": 0.9824, - "step": 10523 - }, - { - "epoch": 0.27, - "learning_rate": 1.9812360826440025e-06, - "loss": 0.9795, - "step": 10524 - }, - { - "epoch": 0.27, - "learning_rate": 1.981230747124268e-06, - "loss": 1.0908, - "step": 10525 - }, - { - "epoch": 0.27, - "learning_rate": 1.98122541085325e-06, - "loss": 0.9531, - "step": 10526 - }, - { - "epoch": 0.27, - "learning_rate": 1.9812200738309525e-06, - "loss": 0.875, - "step": 10527 - }, - { - "epoch": 0.27, - "learning_rate": 1.98121473605738e-06, - "loss": 0.8799, - "step": 10528 - }, - { - "epoch": 0.27, - "learning_rate": 1.9812093975325367e-06, - "loss": 0.8672, - "step": 10529 - }, - { - "epoch": 0.27, - "learning_rate": 1.9812040582564264e-06, - "loss": 0.8916, - "step": 10530 - }, - { - "epoch": 0.27, - "learning_rate": 1.9811987182290534e-06, - "loss": 0.916, - "step": 10531 - }, - { - "epoch": 0.27, - "learning_rate": 1.9811933774504214e-06, - "loss": 0.8525, - "step": 10532 - }, - { - "epoch": 0.27, - "learning_rate": 1.9811880359205347e-06, - "loss": 0.9863, - "step": 10533 - }, - { - "epoch": 0.27, - "learning_rate": 1.9811826936393976e-06, - "loss": 1.1143, - "step": 10534 - }, - { - "epoch": 0.27, - "learning_rate": 1.9811773506070143e-06, - "loss": 0.833, - "step": 10535 - }, - { - "epoch": 0.27, - "learning_rate": 1.9811720068233885e-06, - "loss": 0.957, - "step": 10536 - }, - { - "epoch": 0.27, - "learning_rate": 1.981166662288524e-06, - "loss": 0.9854, - "step": 10537 - }, - { - "epoch": 0.27, - "learning_rate": 1.981161317002426e-06, - "loss": 0.8682, - "step": 10538 - }, - { - "epoch": 0.27, - "learning_rate": 1.981155970965097e-06, - "loss": 0.792, - "step": 10539 - }, - { - "epoch": 0.27, - "learning_rate": 1.9811506241765426e-06, - "loss": 1.1172, - "step": 10540 - }, - { - "epoch": 0.27, - "learning_rate": 1.981145276636766e-06, - "loss": 0.9785, - "step": 10541 - }, - { - "epoch": 0.27, - "learning_rate": 1.981139928345772e-06, - "loss": 0.9971, - "step": 10542 - }, - { - "epoch": 0.27, - "learning_rate": 1.981134579303564e-06, - "loss": 0.9551, - "step": 10543 - }, - { - "epoch": 0.27, - "learning_rate": 1.981129229510146e-06, - "loss": 0.9248, - "step": 10544 - }, - { - "epoch": 0.27, - "learning_rate": 1.981123878965523e-06, - "loss": 0.959, - "step": 10545 - }, - { - "epoch": 0.27, - "learning_rate": 1.9811185276696985e-06, - "loss": 0.7686, - "step": 10546 - }, - { - "epoch": 0.27, - "learning_rate": 1.9811131756226764e-06, - "loss": 0.8813, - "step": 10547 - }, - { - "epoch": 0.27, - "learning_rate": 1.981107822824461e-06, - "loss": 0.8408, - "step": 10548 - }, - { - "epoch": 0.27, - "learning_rate": 1.981102469275057e-06, - "loss": 0.8643, - "step": 10549 - }, - { - "epoch": 0.27, - "learning_rate": 1.9810971149744672e-06, - "loss": 0.9551, - "step": 10550 - }, - { - "epoch": 0.27, - "learning_rate": 1.981091759922697e-06, - "loss": 0.9863, - "step": 10551 - }, - { - "epoch": 0.27, - "learning_rate": 1.98108640411975e-06, - "loss": 0.9463, - "step": 10552 - }, - { - "epoch": 0.27, - "learning_rate": 1.98108104756563e-06, - "loss": 1.0391, - "step": 10553 - }, - { - "epoch": 0.27, - "learning_rate": 1.981075690260341e-06, - "loss": 0.8857, - "step": 10554 - }, - { - "epoch": 0.27, - "learning_rate": 1.9810703322038884e-06, - "loss": 0.7388, - "step": 10555 - }, - { - "epoch": 0.27, - "learning_rate": 1.9810649733962745e-06, - "loss": 1.0215, - "step": 10556 - }, - { - "epoch": 0.27, - "learning_rate": 1.9810596138375046e-06, - "loss": 0.6738, - "step": 10557 - }, - { - "epoch": 0.27, - "learning_rate": 1.9810542535275825e-06, - "loss": 0.6782, - "step": 10558 - }, - { - "epoch": 0.27, - "learning_rate": 1.981048892466512e-06, - "loss": 0.5791, - "step": 10559 - }, - { - "epoch": 0.27, - "learning_rate": 1.9810435306542977e-06, - "loss": 0.9746, - "step": 10560 - }, - { - "epoch": 0.27, - "learning_rate": 1.9810381680909435e-06, - "loss": 1.0557, - "step": 10561 - }, - { - "epoch": 0.27, - "learning_rate": 1.9810328047764537e-06, - "loss": 0.9639, - "step": 10562 - }, - { - "epoch": 0.27, - "learning_rate": 1.981027440710832e-06, - "loss": 0.8262, - "step": 10563 - }, - { - "epoch": 0.27, - "learning_rate": 1.981022075894082e-06, - "loss": 0.7852, - "step": 10564 - }, - { - "epoch": 0.27, - "learning_rate": 1.9810167103262093e-06, - "loss": 0.9023, - "step": 10565 - }, - { - "epoch": 0.27, - "learning_rate": 1.9810113440072174e-06, - "loss": 0.7744, - "step": 10566 - }, - { - "epoch": 0.27, - "learning_rate": 1.9810059769371097e-06, - "loss": 0.8799, - "step": 10567 - }, - { - "epoch": 0.27, - "learning_rate": 1.9810006091158908e-06, - "loss": 0.8203, - "step": 10568 - }, - { - "epoch": 0.27, - "learning_rate": 1.980995240543565e-06, - "loss": 0.959, - "step": 10569 - }, - { - "epoch": 0.27, - "learning_rate": 1.9809898712201366e-06, - "loss": 0.8838, - "step": 10570 - }, - { - "epoch": 0.27, - "learning_rate": 1.980984501145609e-06, - "loss": 0.9189, - "step": 10571 - }, - { - "epoch": 0.27, - "learning_rate": 1.9809791303199867e-06, - "loss": 0.834, - "step": 10572 - }, - { - "epoch": 0.27, - "learning_rate": 1.9809737587432736e-06, - "loss": 1.0234, - "step": 10573 - }, - { - "epoch": 0.27, - "learning_rate": 1.9809683864154744e-06, - "loss": 0.8857, - "step": 10574 - }, - { - "epoch": 0.27, - "learning_rate": 1.980963013336593e-06, - "loss": 1.1973, - "step": 10575 - }, - { - "epoch": 0.27, - "learning_rate": 1.9809576395066324e-06, - "loss": 0.875, - "step": 10576 - }, - { - "epoch": 0.27, - "learning_rate": 1.9809522649255985e-06, - "loss": 0.9248, - "step": 10577 - }, - { - "epoch": 0.27, - "learning_rate": 1.980946889593494e-06, - "loss": 1.0703, - "step": 10578 - }, - { - "epoch": 0.27, - "learning_rate": 1.980941513510324e-06, - "loss": 0.9736, - "step": 10579 - }, - { - "epoch": 0.27, - "learning_rate": 1.980936136676092e-06, - "loss": 0.8916, - "step": 10580 - }, - { - "epoch": 0.27, - "learning_rate": 1.980930759090802e-06, - "loss": 0.9463, - "step": 10581 - }, - { - "epoch": 0.27, - "learning_rate": 1.980925380754459e-06, - "loss": 0.9961, - "step": 10582 - }, - { - "epoch": 0.27, - "learning_rate": 1.9809200016670664e-06, - "loss": 0.8857, - "step": 10583 - }, - { - "epoch": 0.27, - "learning_rate": 1.980914621828628e-06, - "loss": 0.6204, - "step": 10584 - }, - { - "epoch": 0.27, - "learning_rate": 1.980909241239149e-06, - "loss": 0.9561, - "step": 10585 - }, - { - "epoch": 0.27, - "learning_rate": 1.9809038598986326e-06, - "loss": 0.7666, - "step": 10586 - }, - { - "epoch": 0.27, - "learning_rate": 1.980898477807083e-06, - "loss": 0.9463, - "step": 10587 - }, - { - "epoch": 0.27, - "learning_rate": 1.9808930949645047e-06, - "loss": 0.9756, - "step": 10588 - }, - { - "epoch": 0.27, - "learning_rate": 1.980887711370902e-06, - "loss": 0.9297, - "step": 10589 - }, - { - "epoch": 0.27, - "learning_rate": 1.9808823270262783e-06, - "loss": 1.207, - "step": 10590 - }, - { - "epoch": 0.27, - "learning_rate": 1.980876941930638e-06, - "loss": 1.0205, - "step": 10591 - }, - { - "epoch": 0.27, - "learning_rate": 1.9808715560839855e-06, - "loss": 0.7939, - "step": 10592 - }, - { - "epoch": 0.27, - "learning_rate": 1.980866169486325e-06, - "loss": 0.8906, - "step": 10593 - }, - { - "epoch": 0.27, - "learning_rate": 1.98086078213766e-06, - "loss": 1.0664, - "step": 10594 - }, - { - "epoch": 0.27, - "learning_rate": 1.9808553940379955e-06, - "loss": 0.9443, - "step": 10595 - }, - { - "epoch": 0.27, - "learning_rate": 1.9808500051873346e-06, - "loss": 0.8921, - "step": 10596 - }, - { - "epoch": 0.27, - "learning_rate": 1.980844615585682e-06, - "loss": 0.8965, - "step": 10597 - }, - { - "epoch": 0.27, - "learning_rate": 1.980839225233042e-06, - "loss": 0.8105, - "step": 10598 - }, - { - "epoch": 0.27, - "learning_rate": 1.9808338341294184e-06, - "loss": 0.7417, - "step": 10599 - }, - { - "epoch": 0.27, - "learning_rate": 1.980828442274816e-06, - "loss": 0.9033, - "step": 10600 - }, - { - "epoch": 0.27, - "learning_rate": 1.9808230496692376e-06, - "loss": 1.0225, - "step": 10601 - }, - { - "epoch": 0.27, - "learning_rate": 1.980817656312688e-06, - "loss": 1.1035, - "step": 10602 - }, - { - "epoch": 0.27, - "learning_rate": 1.980812262205172e-06, - "loss": 0.9395, - "step": 10603 - }, - { - "epoch": 0.27, - "learning_rate": 1.980806867346693e-06, - "loss": 0.6216, - "step": 10604 - }, - { - "epoch": 0.27, - "learning_rate": 1.980801471737255e-06, - "loss": 0.9219, - "step": 10605 - }, - { - "epoch": 0.27, - "learning_rate": 1.9807960753768623e-06, - "loss": 0.958, - "step": 10606 - }, - { - "epoch": 0.27, - "learning_rate": 1.9807906782655194e-06, - "loss": 0.7266, - "step": 10607 - }, - { - "epoch": 0.27, - "learning_rate": 1.98078528040323e-06, - "loss": 0.9863, - "step": 10608 - }, - { - "epoch": 0.27, - "learning_rate": 1.980779881789999e-06, - "loss": 0.8535, - "step": 10609 - }, - { - "epoch": 0.27, - "learning_rate": 1.9807744824258294e-06, - "loss": 1.1914, - "step": 10610 - }, - { - "epoch": 0.27, - "learning_rate": 1.980769082310726e-06, - "loss": 0.9229, - "step": 10611 - }, - { - "epoch": 0.27, - "learning_rate": 1.980763681444693e-06, - "loss": 0.7285, - "step": 10612 - }, - { - "epoch": 0.27, - "learning_rate": 1.980758279827734e-06, - "loss": 0.9541, - "step": 10613 - }, - { - "epoch": 0.27, - "learning_rate": 1.980752877459854e-06, - "loss": 1.1641, - "step": 10614 - }, - { - "epoch": 0.27, - "learning_rate": 1.980747474341056e-06, - "loss": 0.9854, - "step": 10615 - }, - { - "epoch": 0.27, - "learning_rate": 1.980742070471345e-06, - "loss": 1.0049, - "step": 10616 - }, - { - "epoch": 0.27, - "learning_rate": 1.980736665850725e-06, - "loss": 0.9492, - "step": 10617 - }, - { - "epoch": 0.27, - "learning_rate": 1.9807312604792e-06, - "loss": 0.7822, - "step": 10618 - }, - { - "epoch": 0.27, - "learning_rate": 1.980725854356774e-06, - "loss": 1.1279, - "step": 10619 - }, - { - "epoch": 0.27, - "learning_rate": 1.9807204474834514e-06, - "loss": 0.7456, - "step": 10620 - }, - { - "epoch": 0.27, - "learning_rate": 1.980715039859236e-06, - "loss": 0.916, - "step": 10621 - }, - { - "epoch": 0.27, - "learning_rate": 1.980709631484133e-06, - "loss": 0.7778, - "step": 10622 - }, - { - "epoch": 0.27, - "learning_rate": 1.980704222358145e-06, - "loss": 0.8438, - "step": 10623 - }, - { - "epoch": 0.27, - "learning_rate": 1.9806988124812772e-06, - "loss": 0.9023, - "step": 10624 - }, - { - "epoch": 0.27, - "learning_rate": 1.980693401853533e-06, - "loss": 1.043, - "step": 10625 - }, - { - "epoch": 0.27, - "learning_rate": 1.9806879904749176e-06, - "loss": 0.9111, - "step": 10626 - }, - { - "epoch": 0.27, - "learning_rate": 1.980682578345434e-06, - "loss": 1.0869, - "step": 10627 - }, - { - "epoch": 0.27, - "learning_rate": 1.9806771654650867e-06, - "loss": 0.9717, - "step": 10628 - }, - { - "epoch": 0.27, - "learning_rate": 1.9806717518338803e-06, - "loss": 0.8311, - "step": 10629 - }, - { - "epoch": 0.27, - "learning_rate": 1.9806663374518185e-06, - "loss": 0.915, - "step": 10630 - }, - { - "epoch": 0.27, - "learning_rate": 1.980660922318906e-06, - "loss": 0.6211, - "step": 10631 - }, - { - "epoch": 0.27, - "learning_rate": 1.9806555064351463e-06, - "loss": 0.7217, - "step": 10632 - }, - { - "epoch": 0.27, - "learning_rate": 1.9806500898005436e-06, - "loss": 0.8965, - "step": 10633 - }, - { - "epoch": 0.27, - "learning_rate": 1.980644672415102e-06, - "loss": 0.9238, - "step": 10634 - }, - { - "epoch": 0.27, - "learning_rate": 1.9806392542788263e-06, - "loss": 0.7446, - "step": 10635 - }, - { - "epoch": 0.27, - "learning_rate": 1.98063383539172e-06, - "loss": 0.6826, - "step": 10636 - }, - { - "epoch": 0.27, - "learning_rate": 1.9806284157537877e-06, - "loss": 0.9736, - "step": 10637 - }, - { - "epoch": 0.27, - "learning_rate": 1.980622995365033e-06, - "loss": 1.0156, - "step": 10638 - }, - { - "epoch": 0.27, - "learning_rate": 1.9806175742254604e-06, - "loss": 0.8135, - "step": 10639 - }, - { - "epoch": 0.27, - "learning_rate": 1.980612152335074e-06, - "loss": 0.9219, - "step": 10640 - }, - { - "epoch": 0.27, - "learning_rate": 1.9806067296938783e-06, - "loss": 0.4023, - "step": 10641 - }, - { - "epoch": 0.27, - "learning_rate": 1.980601306301877e-06, - "loss": 1.1582, - "step": 10642 - }, - { - "epoch": 0.27, - "learning_rate": 1.9805958821590743e-06, - "loss": 0.9502, - "step": 10643 - }, - { - "epoch": 0.27, - "learning_rate": 1.9805904572654743e-06, - "loss": 0.873, - "step": 10644 - }, - { - "epoch": 0.27, - "learning_rate": 1.980585031621081e-06, - "loss": 0.9961, - "step": 10645 - }, - { - "epoch": 0.27, - "learning_rate": 1.9805796052258996e-06, - "loss": 0.958, - "step": 10646 - }, - { - "epoch": 0.27, - "learning_rate": 1.980574178079933e-06, - "loss": 0.9883, - "step": 10647 - }, - { - "epoch": 0.27, - "learning_rate": 1.980568750183186e-06, - "loss": 0.915, - "step": 10648 - }, - { - "epoch": 0.27, - "learning_rate": 1.9805633215356623e-06, - "loss": 0.7598, - "step": 10649 - }, - { - "epoch": 0.27, - "learning_rate": 1.9805578921373666e-06, - "loss": 1.0205, - "step": 10650 - }, - { - "epoch": 0.27, - "learning_rate": 1.9805524619883028e-06, - "loss": 0.999, - "step": 10651 - }, - { - "epoch": 0.27, - "learning_rate": 1.980547031088475e-06, - "loss": 1.0127, - "step": 10652 - }, - { - "epoch": 0.27, - "learning_rate": 1.9805415994378874e-06, - "loss": 0.8438, - "step": 10653 - }, - { - "epoch": 0.27, - "learning_rate": 1.9805361670365443e-06, - "loss": 0.8701, - "step": 10654 - }, - { - "epoch": 0.27, - "learning_rate": 1.9805307338844497e-06, - "loss": 0.834, - "step": 10655 - }, - { - "epoch": 0.27, - "learning_rate": 1.980525299981608e-06, - "loss": 0.6772, - "step": 10656 - }, - { - "epoch": 0.27, - "learning_rate": 1.9805198653280227e-06, - "loss": 0.6511, - "step": 10657 - }, - { - "epoch": 0.27, - "learning_rate": 1.980514429923699e-06, - "loss": 0.9023, - "step": 10658 - }, - { - "epoch": 0.27, - "learning_rate": 1.9805089937686403e-06, - "loss": 0.731, - "step": 10659 - }, - { - "epoch": 0.27, - "learning_rate": 1.9805035568628506e-06, - "loss": 1.0654, - "step": 10660 - }, - { - "epoch": 0.27, - "learning_rate": 1.9804981192063347e-06, - "loss": 0.9258, - "step": 10661 - }, - { - "epoch": 0.27, - "learning_rate": 1.9804926807990964e-06, - "loss": 0.9382, - "step": 10662 - }, - { - "epoch": 0.27, - "learning_rate": 1.9804872416411397e-06, - "loss": 0.8242, - "step": 10663 - }, - { - "epoch": 0.27, - "learning_rate": 1.9804818017324695e-06, - "loss": 1.0801, - "step": 10664 - }, - { - "epoch": 0.27, - "learning_rate": 1.980476361073089e-06, - "loss": 1.0312, - "step": 10665 - }, - { - "epoch": 0.27, - "learning_rate": 1.980470919663003e-06, - "loss": 0.8545, - "step": 10666 - }, - { - "epoch": 0.27, - "learning_rate": 1.9804654775022155e-06, - "loss": 0.9004, - "step": 10667 - }, - { - "epoch": 0.27, - "learning_rate": 1.980460034590731e-06, - "loss": 0.9541, - "step": 10668 - }, - { - "epoch": 0.27, - "learning_rate": 1.9804545909285533e-06, - "loss": 0.9688, - "step": 10669 - }, - { - "epoch": 0.27, - "learning_rate": 1.980449146515686e-06, - "loss": 0.9531, - "step": 10670 - }, - { - "epoch": 0.27, - "learning_rate": 1.980443701352134e-06, - "loss": 0.8574, - "step": 10671 - }, - { - "epoch": 0.27, - "learning_rate": 1.9804382554379017e-06, - "loss": 1.0654, - "step": 10672 - }, - { - "epoch": 0.27, - "learning_rate": 1.980432808772993e-06, - "loss": 0.9678, - "step": 10673 - }, - { - "epoch": 0.27, - "learning_rate": 1.9804273613574117e-06, - "loss": 0.8262, - "step": 10674 - }, - { - "epoch": 0.27, - "learning_rate": 1.980421913191162e-06, - "loss": 0.9424, - "step": 10675 - }, - { - "epoch": 0.27, - "learning_rate": 1.9804164642742487e-06, - "loss": 1.1562, - "step": 10676 - }, - { - "epoch": 0.27, - "learning_rate": 1.9804110146066756e-06, - "loss": 0.6128, - "step": 10677 - }, - { - "epoch": 0.27, - "learning_rate": 1.9804055641884466e-06, - "loss": 1.0293, - "step": 10678 - }, - { - "epoch": 0.27, - "learning_rate": 1.9804001130195665e-06, - "loss": 0.707, - "step": 10679 - }, - { - "epoch": 0.27, - "learning_rate": 1.980394661100039e-06, - "loss": 1.0732, - "step": 10680 - }, - { - "epoch": 0.27, - "learning_rate": 1.9803892084298683e-06, - "loss": 0.7646, - "step": 10681 - }, - { - "epoch": 0.27, - "learning_rate": 1.9803837550090583e-06, - "loss": 0.8552, - "step": 10682 - }, - { - "epoch": 0.27, - "learning_rate": 1.980378300837614e-06, - "loss": 0.9272, - "step": 10683 - }, - { - "epoch": 0.27, - "learning_rate": 1.9803728459155395e-06, - "loss": 0.9473, - "step": 10684 - }, - { - "epoch": 0.27, - "learning_rate": 1.9803673902428378e-06, - "loss": 0.8799, - "step": 10685 - }, - { - "epoch": 0.27, - "learning_rate": 1.980361933819514e-06, - "loss": 1.1592, - "step": 10686 - }, - { - "epoch": 0.27, - "learning_rate": 1.9803564766455727e-06, - "loss": 0.8516, - "step": 10687 - }, - { - "epoch": 0.27, - "learning_rate": 1.9803510187210174e-06, - "loss": 0.8242, - "step": 10688 - }, - { - "epoch": 0.27, - "learning_rate": 1.980345560045852e-06, - "loss": 0.688, - "step": 10689 - }, - { - "epoch": 0.27, - "learning_rate": 1.980340100620081e-06, - "loss": 0.9014, - "step": 10690 - }, - { - "epoch": 0.27, - "learning_rate": 1.980334640443709e-06, - "loss": 0.8311, - "step": 10691 - }, - { - "epoch": 0.27, - "learning_rate": 1.9803291795167396e-06, - "loss": 1.0029, - "step": 10692 - }, - { - "epoch": 0.27, - "learning_rate": 1.9803237178391774e-06, - "loss": 0.6018, - "step": 10693 - }, - { - "epoch": 0.27, - "learning_rate": 1.9803182554110267e-06, - "loss": 1.0859, - "step": 10694 - }, - { - "epoch": 0.27, - "learning_rate": 1.980312792232291e-06, - "loss": 0.8682, - "step": 10695 - }, - { - "epoch": 0.27, - "learning_rate": 1.980307328302975e-06, - "loss": 0.8926, - "step": 10696 - }, - { - "epoch": 0.27, - "learning_rate": 1.9803018636230825e-06, - "loss": 0.7026, - "step": 10697 - }, - { - "epoch": 0.27, - "learning_rate": 1.9802963981926184e-06, - "loss": 0.9893, - "step": 10698 - }, - { - "epoch": 0.27, - "learning_rate": 1.980290932011586e-06, - "loss": 0.8242, - "step": 10699 - }, - { - "epoch": 0.27, - "learning_rate": 1.9802854650799904e-06, - "loss": 1.0176, - "step": 10700 - }, - { - "epoch": 0.27, - "learning_rate": 1.980279997397835e-06, - "loss": 0.9307, - "step": 10701 - }, - { - "epoch": 0.27, - "learning_rate": 1.980274528965124e-06, - "loss": 1.126, - "step": 10702 - }, - { - "epoch": 0.27, - "learning_rate": 1.9802690597818622e-06, - "loss": 0.8848, - "step": 10703 - }, - { - "epoch": 0.27, - "learning_rate": 1.9802635898480535e-06, - "loss": 0.5903, - "step": 10704 - }, - { - "epoch": 0.27, - "learning_rate": 1.9802581191637015e-06, - "loss": 0.9932, - "step": 10705 - }, - { - "epoch": 0.27, - "learning_rate": 1.9802526477288115e-06, - "loss": 1.0469, - "step": 10706 - }, - { - "epoch": 0.27, - "learning_rate": 1.980247175543387e-06, - "loss": 0.9854, - "step": 10707 - }, - { - "epoch": 0.27, - "learning_rate": 1.980241702607432e-06, - "loss": 0.8223, - "step": 10708 - }, - { - "epoch": 0.27, - "learning_rate": 1.9802362289209516e-06, - "loss": 0.814, - "step": 10709 - }, - { - "epoch": 0.27, - "learning_rate": 1.980230754483949e-06, - "loss": 0.7461, - "step": 10710 - }, - { - "epoch": 0.27, - "learning_rate": 1.980225279296429e-06, - "loss": 0.9326, - "step": 10711 - }, - { - "epoch": 0.27, - "learning_rate": 1.9802198033583954e-06, - "loss": 0.8438, - "step": 10712 - }, - { - "epoch": 0.27, - "learning_rate": 1.9802143266698525e-06, - "loss": 0.7168, - "step": 10713 - }, - { - "epoch": 0.27, - "learning_rate": 1.9802088492308045e-06, - "loss": 0.728, - "step": 10714 - }, - { - "epoch": 0.27, - "learning_rate": 1.9802033710412558e-06, - "loss": 1.0107, - "step": 10715 - }, - { - "epoch": 0.27, - "learning_rate": 1.9801978921012104e-06, - "loss": 0.832, - "step": 10716 - }, - { - "epoch": 0.27, - "learning_rate": 1.9801924124106726e-06, - "loss": 0.7754, - "step": 10717 - }, - { - "epoch": 0.27, - "learning_rate": 1.9801869319696467e-06, - "loss": 1.1289, - "step": 10718 - }, - { - "epoch": 0.27, - "learning_rate": 1.9801814507781365e-06, - "loss": 0.958, - "step": 10719 - }, - { - "epoch": 0.27, - "learning_rate": 1.9801759688361466e-06, - "loss": 0.8774, - "step": 10720 - }, - { - "epoch": 0.27, - "learning_rate": 1.980170486143681e-06, - "loss": 0.8354, - "step": 10721 - }, - { - "epoch": 0.27, - "learning_rate": 1.980165002700744e-06, - "loss": 1.1582, - "step": 10722 - }, - { - "epoch": 0.27, - "learning_rate": 1.9801595185073393e-06, - "loss": 0.9102, - "step": 10723 - }, - { - "epoch": 0.27, - "learning_rate": 1.9801540335634723e-06, - "loss": 0.708, - "step": 10724 - }, - { - "epoch": 0.27, - "learning_rate": 1.980148547869146e-06, - "loss": 0.9766, - "step": 10725 - }, - { - "epoch": 0.27, - "learning_rate": 1.9801430614243645e-06, - "loss": 0.9736, - "step": 10726 - }, - { - "epoch": 0.27, - "learning_rate": 1.980137574229133e-06, - "loss": 0.7041, - "step": 10727 - }, - { - "epoch": 0.27, - "learning_rate": 1.9801320862834554e-06, - "loss": 0.8354, - "step": 10728 - }, - { - "epoch": 0.27, - "learning_rate": 1.9801265975873353e-06, - "loss": 0.9043, - "step": 10729 - }, - { - "epoch": 0.28, - "learning_rate": 1.9801211081407775e-06, - "loss": 0.9155, - "step": 10730 - }, - { - "epoch": 0.28, - "learning_rate": 1.9801156179437862e-06, - "loss": 0.8213, - "step": 10731 - }, - { - "epoch": 0.28, - "learning_rate": 1.9801101269963657e-06, - "loss": 0.7065, - "step": 10732 - }, - { - "epoch": 0.28, - "learning_rate": 1.9801046352985193e-06, - "loss": 1.0791, - "step": 10733 - }, - { - "epoch": 0.28, - "learning_rate": 1.980099142850252e-06, - "loss": 1.0342, - "step": 10734 - }, - { - "epoch": 0.28, - "learning_rate": 1.9800936496515683e-06, - "loss": 1.0781, - "step": 10735 - }, - { - "epoch": 0.28, - "learning_rate": 1.9800881557024718e-06, - "loss": 0.9316, - "step": 10736 - }, - { - "epoch": 0.28, - "learning_rate": 1.9800826610029667e-06, - "loss": 0.8662, - "step": 10737 - }, - { - "epoch": 0.28, - "learning_rate": 1.9800771655530574e-06, - "loss": 0.9033, - "step": 10738 - }, - { - "epoch": 0.28, - "learning_rate": 1.980071669352748e-06, - "loss": 0.833, - "step": 10739 - }, - { - "epoch": 0.28, - "learning_rate": 1.980066172402043e-06, - "loss": 0.7676, - "step": 10740 - }, - { - "epoch": 0.28, - "learning_rate": 1.980060674700946e-06, - "loss": 0.9502, - "step": 10741 - }, - { - "epoch": 0.28, - "learning_rate": 1.980055176249462e-06, - "loss": 0.8799, - "step": 10742 - }, - { - "epoch": 0.28, - "learning_rate": 1.9800496770475946e-06, - "loss": 0.9551, - "step": 10743 - }, - { - "epoch": 0.28, - "learning_rate": 1.9800441770953485e-06, - "loss": 1.0605, - "step": 10744 - }, - { - "epoch": 0.28, - "learning_rate": 1.9800386763927275e-06, - "loss": 0.9707, - "step": 10745 - }, - { - "epoch": 0.28, - "learning_rate": 1.9800331749397356e-06, - "loss": 0.9814, - "step": 10746 - }, - { - "epoch": 0.28, - "learning_rate": 1.980027672736378e-06, - "loss": 0.8662, - "step": 10747 - }, - { - "epoch": 0.28, - "learning_rate": 1.9800221697826575e-06, - "loss": 1.1064, - "step": 10748 - }, - { - "epoch": 0.28, - "learning_rate": 1.98001666607858e-06, - "loss": 1.0859, - "step": 10749 - }, - { - "epoch": 0.28, - "learning_rate": 1.980011161624148e-06, - "loss": 0.8574, - "step": 10750 - }, - { - "epoch": 0.28, - "learning_rate": 1.980005656419367e-06, - "loss": 0.8838, - "step": 10751 - }, - { - "epoch": 0.28, - "learning_rate": 1.9800001504642406e-06, - "loss": 0.8447, - "step": 10752 - }, - { - "epoch": 0.28, - "learning_rate": 1.979994643758773e-06, - "loss": 0.7378, - "step": 10753 - }, - { - "epoch": 0.28, - "learning_rate": 1.9799891363029685e-06, - "loss": 0.7124, - "step": 10754 - }, - { - "epoch": 0.28, - "learning_rate": 1.9799836280968315e-06, - "loss": 0.8271, - "step": 10755 - }, - { - "epoch": 0.28, - "learning_rate": 1.9799781191403665e-06, - "loss": 0.6528, - "step": 10756 - }, - { - "epoch": 0.28, - "learning_rate": 1.979972609433577e-06, - "loss": 0.8232, - "step": 10757 - }, - { - "epoch": 0.28, - "learning_rate": 1.979967098976467e-06, - "loss": 0.6895, - "step": 10758 - }, - { - "epoch": 0.28, - "learning_rate": 1.979961587769042e-06, - "loss": 1.1191, - "step": 10759 - }, - { - "epoch": 0.28, - "learning_rate": 1.979956075811305e-06, - "loss": 0.957, - "step": 10760 - }, - { - "epoch": 0.28, - "learning_rate": 1.979950563103261e-06, - "loss": 0.8594, - "step": 10761 - }, - { - "epoch": 0.28, - "learning_rate": 1.979945049644914e-06, - "loss": 0.7451, - "step": 10762 - }, - { - "epoch": 0.28, - "learning_rate": 1.979939535436268e-06, - "loss": 0.874, - "step": 10763 - }, - { - "epoch": 0.28, - "learning_rate": 1.9799340204773273e-06, - "loss": 0.916, - "step": 10764 - }, - { - "epoch": 0.28, - "learning_rate": 1.979928504768096e-06, - "loss": 0.9043, - "step": 10765 - }, - { - "epoch": 0.28, - "learning_rate": 1.979922988308579e-06, - "loss": 1.001, - "step": 10766 - }, - { - "epoch": 0.28, - "learning_rate": 1.9799174710987795e-06, - "loss": 1.0029, - "step": 10767 - }, - { - "epoch": 0.28, - "learning_rate": 1.9799119531387024e-06, - "loss": 0.8906, - "step": 10768 - }, - { - "epoch": 0.28, - "learning_rate": 1.979906434428352e-06, - "loss": 1.0195, - "step": 10769 - }, - { - "epoch": 0.28, - "learning_rate": 1.979900914967732e-06, - "loss": 0.752, - "step": 10770 - }, - { - "epoch": 0.28, - "learning_rate": 1.979895394756847e-06, - "loss": 1.0146, - "step": 10771 - }, - { - "epoch": 0.28, - "learning_rate": 1.9798898737957014e-06, - "loss": 0.8154, - "step": 10772 - }, - { - "epoch": 0.28, - "learning_rate": 1.979884352084299e-06, - "loss": 0.8379, - "step": 10773 - }, - { - "epoch": 0.28, - "learning_rate": 1.9798788296226447e-06, - "loss": 0.8203, - "step": 10774 - }, - { - "epoch": 0.28, - "learning_rate": 1.9798733064107418e-06, - "loss": 0.7744, - "step": 10775 - }, - { - "epoch": 0.28, - "learning_rate": 1.9798677824485947e-06, - "loss": 0.8525, - "step": 10776 - }, - { - "epoch": 0.28, - "learning_rate": 1.979862257736208e-06, - "loss": 0.9785, - "step": 10777 - }, - { - "epoch": 0.28, - "learning_rate": 1.9798567322735858e-06, - "loss": 0.8535, - "step": 10778 - }, - { - "epoch": 0.28, - "learning_rate": 1.979851206060733e-06, - "loss": 1.1855, - "step": 10779 - }, - { - "epoch": 0.28, - "learning_rate": 1.979845679097652e-06, - "loss": 0.7964, - "step": 10780 - }, - { - "epoch": 0.28, - "learning_rate": 1.9798401513843494e-06, - "loss": 0.9883, - "step": 10781 - }, - { - "epoch": 0.28, - "learning_rate": 1.9798346229208274e-06, - "loss": 0.8408, - "step": 10782 - }, - { - "epoch": 0.28, - "learning_rate": 1.9798290937070917e-06, - "loss": 0.8809, - "step": 10783 - }, - { - "epoch": 0.28, - "learning_rate": 1.9798235637431453e-06, - "loss": 0.8828, - "step": 10784 - }, - { - "epoch": 0.28, - "learning_rate": 1.9798180330289937e-06, - "loss": 0.8672, - "step": 10785 - }, - { - "epoch": 0.28, - "learning_rate": 1.9798125015646402e-06, - "loss": 0.9814, - "step": 10786 - }, - { - "epoch": 0.28, - "learning_rate": 1.9798069693500896e-06, - "loss": 0.9902, - "step": 10787 - }, - { - "epoch": 0.28, - "learning_rate": 1.979801436385345e-06, - "loss": 0.8018, - "step": 10788 - }, - { - "epoch": 0.28, - "learning_rate": 1.9797959026704124e-06, - "loss": 0.9297, - "step": 10789 - }, - { - "epoch": 0.28, - "learning_rate": 1.9797903682052944e-06, - "loss": 0.8892, - "step": 10790 - }, - { - "epoch": 0.28, - "learning_rate": 1.9797848329899966e-06, - "loss": 0.832, - "step": 10791 - }, - { - "epoch": 0.28, - "learning_rate": 1.9797792970245223e-06, - "loss": 1.0205, - "step": 10792 - }, - { - "epoch": 0.28, - "learning_rate": 1.979773760308876e-06, - "loss": 1.0234, - "step": 10793 - }, - { - "epoch": 0.28, - "learning_rate": 1.9797682228430623e-06, - "loss": 0.9492, - "step": 10794 - }, - { - "epoch": 0.28, - "learning_rate": 1.9797626846270846e-06, - "loss": 0.6768, - "step": 10795 - }, - { - "epoch": 0.28, - "learning_rate": 1.9797571456609482e-06, - "loss": 0.8213, - "step": 10796 - }, - { - "epoch": 0.28, - "learning_rate": 1.9797516059446566e-06, - "loss": 0.8486, - "step": 10797 - }, - { - "epoch": 0.28, - "learning_rate": 1.9797460654782145e-06, - "loss": 0.9453, - "step": 10798 - }, - { - "epoch": 0.28, - "learning_rate": 1.979740524261625e-06, - "loss": 0.8711, - "step": 10799 - }, - { - "epoch": 0.28, - "learning_rate": 1.979734982294894e-06, - "loss": 0.9395, - "step": 10800 - }, - { - "epoch": 0.28, - "learning_rate": 1.979729439578025e-06, - "loss": 0.9902, - "step": 10801 - }, - { - "epoch": 0.28, - "learning_rate": 1.979723896111022e-06, - "loss": 0.9473, - "step": 10802 - }, - { - "epoch": 0.28, - "learning_rate": 1.9797183518938896e-06, - "loss": 0.8584, - "step": 10803 - }, - { - "epoch": 0.28, - "learning_rate": 1.979712806926632e-06, - "loss": 0.918, - "step": 10804 - }, - { - "epoch": 0.28, - "learning_rate": 1.9797072612092526e-06, - "loss": 1.0176, - "step": 10805 - }, - { - "epoch": 0.28, - "learning_rate": 1.9797017147417573e-06, - "loss": 1.0078, - "step": 10806 - }, - { - "epoch": 0.28, - "learning_rate": 1.9796961675241487e-06, - "loss": 0.9541, - "step": 10807 - }, - { - "epoch": 0.28, - "learning_rate": 1.9796906195564323e-06, - "loss": 0.8755, - "step": 10808 - }, - { - "epoch": 0.28, - "learning_rate": 1.979685070838612e-06, - "loss": 0.9434, - "step": 10809 - }, - { - "epoch": 0.28, - "learning_rate": 1.9796795213706913e-06, - "loss": 1.2549, - "step": 10810 - }, - { - "epoch": 0.28, - "learning_rate": 1.9796739711526756e-06, - "loss": 0.9775, - "step": 10811 - }, - { - "epoch": 0.28, - "learning_rate": 1.979668420184568e-06, - "loss": 0.8809, - "step": 10812 - }, - { - "epoch": 0.28, - "learning_rate": 1.979662868466374e-06, - "loss": 0.7524, - "step": 10813 - }, - { - "epoch": 0.28, - "learning_rate": 1.9796573159980968e-06, - "loss": 0.8335, - "step": 10814 - }, - { - "epoch": 0.28, - "learning_rate": 1.9796517627797413e-06, - "loss": 1.002, - "step": 10815 - }, - { - "epoch": 0.28, - "learning_rate": 1.979646208811311e-06, - "loss": 1.0312, - "step": 10816 - }, - { - "epoch": 0.28, - "learning_rate": 1.979640654092811e-06, - "loss": 0.8506, - "step": 10817 - }, - { - "epoch": 0.28, - "learning_rate": 1.979635098624245e-06, - "loss": 0.6201, - "step": 10818 - }, - { - "epoch": 0.28, - "learning_rate": 1.9796295424056177e-06, - "loss": 1.1016, - "step": 10819 - }, - { - "epoch": 0.28, - "learning_rate": 1.9796239854369328e-06, - "loss": 0.9932, - "step": 10820 - }, - { - "epoch": 0.28, - "learning_rate": 1.979618427718195e-06, - "loss": 0.9561, - "step": 10821 - }, - { - "epoch": 0.28, - "learning_rate": 1.979612869249409e-06, - "loss": 0.8652, - "step": 10822 - }, - { - "epoch": 0.28, - "learning_rate": 1.9796073100305776e-06, - "loss": 1.1582, - "step": 10823 - }, - { - "epoch": 0.28, - "learning_rate": 1.979601750061706e-06, - "loss": 0.9854, - "step": 10824 - }, - { - "epoch": 0.28, - "learning_rate": 1.979596189342799e-06, - "loss": 0.8242, - "step": 10825 - }, - { - "epoch": 0.28, - "learning_rate": 1.97959062787386e-06, - "loss": 1.041, - "step": 10826 - }, - { - "epoch": 0.28, - "learning_rate": 1.9795850656548933e-06, - "loss": 1.0684, - "step": 10827 - }, - { - "epoch": 0.28, - "learning_rate": 1.979579502685903e-06, - "loss": 0.9902, - "step": 10828 - }, - { - "epoch": 0.28, - "learning_rate": 1.9795739389668946e-06, - "loss": 0.9941, - "step": 10829 - }, - { - "epoch": 0.28, - "learning_rate": 1.979568374497871e-06, - "loss": 0.7158, - "step": 10830 - }, - { - "epoch": 0.28, - "learning_rate": 1.9795628092788366e-06, - "loss": 0.9873, - "step": 10831 - }, - { - "epoch": 0.28, - "learning_rate": 1.979557243309797e-06, - "loss": 1.0244, - "step": 10832 - }, - { - "epoch": 0.28, - "learning_rate": 1.9795516765907543e-06, - "loss": 0.9404, - "step": 10833 - }, - { - "epoch": 0.28, - "learning_rate": 1.9795461091217145e-06, - "loss": 1.0791, - "step": 10834 - }, - { - "epoch": 0.28, - "learning_rate": 1.9795405409026813e-06, - "loss": 0.8101, - "step": 10835 - }, - { - "epoch": 0.28, - "learning_rate": 1.9795349719336588e-06, - "loss": 1.0771, - "step": 10836 - }, - { - "epoch": 0.28, - "learning_rate": 1.9795294022146517e-06, - "loss": 0.8516, - "step": 10837 - }, - { - "epoch": 0.28, - "learning_rate": 1.979523831745664e-06, - "loss": 0.7349, - "step": 10838 - }, - { - "epoch": 0.28, - "learning_rate": 1.9795182605266995e-06, - "loss": 0.9006, - "step": 10839 - }, - { - "epoch": 0.28, - "learning_rate": 1.979512688557763e-06, - "loss": 1.0693, - "step": 10840 - }, - { - "epoch": 0.28, - "learning_rate": 1.9795071158388586e-06, - "loss": 0.999, - "step": 10841 - }, - { - "epoch": 0.28, - "learning_rate": 1.979501542369991e-06, - "loss": 0.916, - "step": 10842 - }, - { - "epoch": 0.28, - "learning_rate": 1.979495968151164e-06, - "loss": 0.637, - "step": 10843 - }, - { - "epoch": 0.28, - "learning_rate": 1.979490393182382e-06, - "loss": 0.728, - "step": 10844 - }, - { - "epoch": 0.28, - "learning_rate": 1.979484817463649e-06, - "loss": 0.8955, - "step": 10845 - }, - { - "epoch": 0.28, - "learning_rate": 1.9794792409949697e-06, - "loss": 1.0215, - "step": 10846 - }, - { - "epoch": 0.28, - "learning_rate": 1.979473663776348e-06, - "loss": 0.9326, - "step": 10847 - }, - { - "epoch": 0.28, - "learning_rate": 1.9794680858077887e-06, - "loss": 0.9717, - "step": 10848 - }, - { - "epoch": 0.28, - "learning_rate": 1.979462507089296e-06, - "loss": 0.8252, - "step": 10849 - }, - { - "epoch": 0.28, - "learning_rate": 1.9794569276208726e-06, - "loss": 0.9082, - "step": 10850 - }, - { - "epoch": 0.28, - "learning_rate": 1.9794513474025254e-06, - "loss": 0.9395, - "step": 10851 - }, - { - "epoch": 0.28, - "learning_rate": 1.9794457664342567e-06, - "loss": 0.9482, - "step": 10852 - }, - { - "epoch": 0.28, - "learning_rate": 1.9794401847160716e-06, - "loss": 0.9346, - "step": 10853 - }, - { - "epoch": 0.28, - "learning_rate": 1.979434602247974e-06, - "loss": 0.9258, - "step": 10854 - }, - { - "epoch": 0.28, - "learning_rate": 1.9794290190299684e-06, - "loss": 0.8965, - "step": 10855 - }, - { - "epoch": 0.28, - "learning_rate": 1.979423435062059e-06, - "loss": 0.8557, - "step": 10856 - }, - { - "epoch": 0.28, - "learning_rate": 1.9794178503442505e-06, - "loss": 0.8481, - "step": 10857 - }, - { - "epoch": 0.28, - "learning_rate": 1.9794122648765466e-06, - "loss": 0.71, - "step": 10858 - }, - { - "epoch": 0.28, - "learning_rate": 1.9794066786589518e-06, - "loss": 0.7812, - "step": 10859 - }, - { - "epoch": 0.28, - "learning_rate": 1.97940109169147e-06, - "loss": 0.7588, - "step": 10860 - }, - { - "epoch": 0.28, - "learning_rate": 1.979395503974106e-06, - "loss": 0.8003, - "step": 10861 - }, - { - "epoch": 0.28, - "learning_rate": 1.979389915506864e-06, - "loss": 0.9395, - "step": 10862 - }, - { - "epoch": 0.28, - "learning_rate": 1.979384326289748e-06, - "loss": 1.0195, - "step": 10863 - }, - { - "epoch": 0.28, - "learning_rate": 1.9793787363227628e-06, - "loss": 0.9473, - "step": 10864 - }, - { - "epoch": 0.28, - "learning_rate": 1.979373145605912e-06, - "loss": 0.8965, - "step": 10865 - }, - { - "epoch": 0.28, - "learning_rate": 1.9793675541392004e-06, - "loss": 0.7817, - "step": 10866 - }, - { - "epoch": 0.28, - "learning_rate": 1.979361961922632e-06, - "loss": 0.9238, - "step": 10867 - }, - { - "epoch": 0.28, - "learning_rate": 1.979356368956211e-06, - "loss": 0.9629, - "step": 10868 - }, - { - "epoch": 0.28, - "learning_rate": 1.979350775239942e-06, - "loss": 1.0684, - "step": 10869 - }, - { - "epoch": 0.28, - "learning_rate": 1.9793451807738296e-06, - "loss": 0.9668, - "step": 10870 - }, - { - "epoch": 0.28, - "learning_rate": 1.9793395855578773e-06, - "loss": 0.6836, - "step": 10871 - }, - { - "epoch": 0.28, - "learning_rate": 1.9793339895920894e-06, - "loss": 0.822, - "step": 10872 - }, - { - "epoch": 0.28, - "learning_rate": 1.9793283928764706e-06, - "loss": 0.5303, - "step": 10873 - }, - { - "epoch": 0.28, - "learning_rate": 1.9793227954110253e-06, - "loss": 1.0029, - "step": 10874 - }, - { - "epoch": 0.28, - "learning_rate": 1.9793171971957572e-06, - "loss": 1.0459, - "step": 10875 - }, - { - "epoch": 0.28, - "learning_rate": 1.979311598230672e-06, - "loss": 1.1064, - "step": 10876 - }, - { - "epoch": 0.28, - "learning_rate": 1.9793059985157717e-06, - "loss": 0.9033, - "step": 10877 - }, - { - "epoch": 0.28, - "learning_rate": 1.9793003980510623e-06, - "loss": 1.0029, - "step": 10878 - }, - { - "epoch": 0.28, - "learning_rate": 1.9792947968365475e-06, - "loss": 0.793, - "step": 10879 - }, - { - "epoch": 0.28, - "learning_rate": 1.979289194872232e-06, - "loss": 0.812, - "step": 10880 - }, - { - "epoch": 0.28, - "learning_rate": 1.9792835921581195e-06, - "loss": 0.7998, - "step": 10881 - }, - { - "epoch": 0.28, - "learning_rate": 1.9792779886942147e-06, - "loss": 0.7935, - "step": 10882 - }, - { - "epoch": 0.28, - "learning_rate": 1.979272384480522e-06, - "loss": 0.8096, - "step": 10883 - }, - { - "epoch": 0.28, - "learning_rate": 1.979266779517045e-06, - "loss": 1.0801, - "step": 10884 - }, - { - "epoch": 0.28, - "learning_rate": 1.979261173803789e-06, - "loss": 0.8242, - "step": 10885 - }, - { - "epoch": 0.28, - "learning_rate": 1.9792555673407572e-06, - "loss": 0.9365, - "step": 10886 - }, - { - "epoch": 0.28, - "learning_rate": 1.9792499601279545e-06, - "loss": 0.9883, - "step": 10887 - }, - { - "epoch": 0.28, - "learning_rate": 1.9792443521653853e-06, - "loss": 0.8691, - "step": 10888 - }, - { - "epoch": 0.28, - "learning_rate": 1.979238743453054e-06, - "loss": 0.9297, - "step": 10889 - }, - { - "epoch": 0.28, - "learning_rate": 1.9792331339909644e-06, - "loss": 0.75, - "step": 10890 - }, - { - "epoch": 0.28, - "learning_rate": 1.979227523779121e-06, - "loss": 0.9287, - "step": 10891 - }, - { - "epoch": 0.28, - "learning_rate": 1.9792219128175277e-06, - "loss": 1.0674, - "step": 10892 - }, - { - "epoch": 0.28, - "learning_rate": 1.9792163011061898e-06, - "loss": 0.9639, - "step": 10893 - }, - { - "epoch": 0.28, - "learning_rate": 1.9792106886451107e-06, - "loss": 0.7783, - "step": 10894 - }, - { - "epoch": 0.28, - "learning_rate": 1.979205075434295e-06, - "loss": 0.8994, - "step": 10895 - }, - { - "epoch": 0.28, - "learning_rate": 1.979199461473747e-06, - "loss": 1.3086, - "step": 10896 - }, - { - "epoch": 0.28, - "learning_rate": 1.9791938467634714e-06, - "loss": 0.8081, - "step": 10897 - }, - { - "epoch": 0.28, - "learning_rate": 1.9791882313034714e-06, - "loss": 0.8149, - "step": 10898 - }, - { - "epoch": 0.28, - "learning_rate": 1.9791826150937523e-06, - "loss": 0.9824, - "step": 10899 - }, - { - "epoch": 0.28, - "learning_rate": 1.9791769981343185e-06, - "loss": 1.002, - "step": 10900 - }, - { - "epoch": 0.28, - "learning_rate": 1.9791713804251737e-06, - "loss": 0.9131, - "step": 10901 - }, - { - "epoch": 0.28, - "learning_rate": 1.979165761966322e-06, - "loss": 0.7334, - "step": 10902 - }, - { - "epoch": 0.28, - "learning_rate": 1.9791601427577685e-06, - "loss": 0.8896, - "step": 10903 - }, - { - "epoch": 0.28, - "learning_rate": 1.979154522799517e-06, - "loss": 0.8467, - "step": 10904 - }, - { - "epoch": 0.28, - "learning_rate": 1.979148902091572e-06, - "loss": 1.0674, - "step": 10905 - }, - { - "epoch": 0.28, - "learning_rate": 1.9791432806339374e-06, - "loss": 0.7495, - "step": 10906 - }, - { - "epoch": 0.28, - "learning_rate": 1.979137658426618e-06, - "loss": 0.9453, - "step": 10907 - }, - { - "epoch": 0.28, - "learning_rate": 1.9791320354696176e-06, - "loss": 0.8916, - "step": 10908 - }, - { - "epoch": 0.28, - "learning_rate": 1.9791264117629412e-06, - "loss": 0.708, - "step": 10909 - }, - { - "epoch": 0.28, - "learning_rate": 1.979120787306593e-06, - "loss": 1.0615, - "step": 10910 - }, - { - "epoch": 0.28, - "learning_rate": 1.9791151621005767e-06, - "loss": 0.6472, - "step": 10911 - }, - { - "epoch": 0.28, - "learning_rate": 1.9791095361448965e-06, - "loss": 0.9365, - "step": 10912 - }, - { - "epoch": 0.28, - "learning_rate": 1.979103909439558e-06, - "loss": 1.0469, - "step": 10913 - }, - { - "epoch": 0.28, - "learning_rate": 1.9790982819845642e-06, - "loss": 0.8008, - "step": 10914 - }, - { - "epoch": 0.28, - "learning_rate": 1.9790926537799197e-06, - "loss": 0.8154, - "step": 10915 - }, - { - "epoch": 0.28, - "learning_rate": 1.9790870248256295e-06, - "loss": 0.8159, - "step": 10916 - }, - { - "epoch": 0.28, - "learning_rate": 1.979081395121697e-06, - "loss": 1.123, - "step": 10917 - }, - { - "epoch": 0.28, - "learning_rate": 1.979075764668127e-06, - "loss": 0.8125, - "step": 10918 - }, - { - "epoch": 0.28, - "learning_rate": 1.9790701334649235e-06, - "loss": 0.9893, - "step": 10919 - }, - { - "epoch": 0.28, - "learning_rate": 1.979064501512091e-06, - "loss": 0.8271, - "step": 10920 - }, - { - "epoch": 0.28, - "learning_rate": 1.979058868809634e-06, - "loss": 1.1162, - "step": 10921 - }, - { - "epoch": 0.28, - "learning_rate": 1.979053235357557e-06, - "loss": 0.9834, - "step": 10922 - }, - { - "epoch": 0.28, - "learning_rate": 1.9790476011558636e-06, - "loss": 0.7778, - "step": 10923 - }, - { - "epoch": 0.28, - "learning_rate": 1.9790419662045585e-06, - "loss": 0.8926, - "step": 10924 - }, - { - "epoch": 0.28, - "learning_rate": 1.9790363305036457e-06, - "loss": 0.9932, - "step": 10925 - }, - { - "epoch": 0.28, - "learning_rate": 1.97903069405313e-06, - "loss": 0.7163, - "step": 10926 - }, - { - "epoch": 0.28, - "learning_rate": 1.9790250568530154e-06, - "loss": 0.9551, - "step": 10927 - }, - { - "epoch": 0.28, - "learning_rate": 1.979019418903307e-06, - "loss": 0.9785, - "step": 10928 - }, - { - "epoch": 0.28, - "learning_rate": 1.9790137802040075e-06, - "loss": 0.9746, - "step": 10929 - }, - { - "epoch": 0.28, - "learning_rate": 1.979008140755123e-06, - "loss": 0.915, - "step": 10930 - }, - { - "epoch": 0.28, - "learning_rate": 1.9790025005566563e-06, - "loss": 1.042, - "step": 10931 - }, - { - "epoch": 0.28, - "learning_rate": 1.978996859608613e-06, - "loss": 0.8535, - "step": 10932 - }, - { - "epoch": 0.28, - "learning_rate": 1.9789912179109965e-06, - "loss": 1.0938, - "step": 10933 - }, - { - "epoch": 0.28, - "learning_rate": 1.9789855754638114e-06, - "loss": 0.9238, - "step": 10934 - }, - { - "epoch": 0.28, - "learning_rate": 1.978979932267062e-06, - "loss": 1.0361, - "step": 10935 - }, - { - "epoch": 0.28, - "learning_rate": 1.978974288320753e-06, - "loss": 0.9697, - "step": 10936 - }, - { - "epoch": 0.28, - "learning_rate": 1.978968643624888e-06, - "loss": 0.959, - "step": 10937 - }, - { - "epoch": 0.28, - "learning_rate": 1.978962998179472e-06, - "loss": 0.639, - "step": 10938 - }, - { - "epoch": 0.28, - "learning_rate": 1.978957351984509e-06, - "loss": 0.9023, - "step": 10939 - }, - { - "epoch": 0.28, - "learning_rate": 1.9789517050400033e-06, - "loss": 0.8872, - "step": 10940 - }, - { - "epoch": 0.28, - "learning_rate": 1.9789460573459595e-06, - "loss": 1.0156, - "step": 10941 - }, - { - "epoch": 0.28, - "learning_rate": 1.9789404089023813e-06, - "loss": 0.6934, - "step": 10942 - }, - { - "epoch": 0.28, - "learning_rate": 1.978934759709274e-06, - "loss": 0.7681, - "step": 10943 - }, - { - "epoch": 0.28, - "learning_rate": 1.978929109766641e-06, - "loss": 0.7148, - "step": 10944 - }, - { - "epoch": 0.28, - "learning_rate": 1.978923459074487e-06, - "loss": 0.8848, - "step": 10945 - }, - { - "epoch": 0.28, - "learning_rate": 1.9789178076328163e-06, - "loss": 0.915, - "step": 10946 - }, - { - "epoch": 0.28, - "learning_rate": 1.9789121554416336e-06, - "loss": 0.8047, - "step": 10947 - }, - { - "epoch": 0.28, - "learning_rate": 1.9789065025009424e-06, - "loss": 0.8262, - "step": 10948 - }, - { - "epoch": 0.28, - "learning_rate": 1.9789008488107477e-06, - "loss": 0.9678, - "step": 10949 - }, - { - "epoch": 0.28, - "learning_rate": 1.9788951943710533e-06, - "loss": 0.834, - "step": 10950 - }, - { - "epoch": 0.28, - "learning_rate": 1.9788895391818644e-06, - "loss": 0.7842, - "step": 10951 - }, - { - "epoch": 0.28, - "learning_rate": 1.9788838832431847e-06, - "loss": 0.8105, - "step": 10952 - }, - { - "epoch": 0.28, - "learning_rate": 1.9788782265550186e-06, - "loss": 0.8818, - "step": 10953 - }, - { - "epoch": 0.28, - "learning_rate": 1.97887256911737e-06, - "loss": 1.0449, - "step": 10954 - }, - { - "epoch": 0.28, - "learning_rate": 1.9788669109302445e-06, - "loss": 1.0508, - "step": 10955 - }, - { - "epoch": 0.28, - "learning_rate": 1.9788612519936446e-06, - "loss": 1.1582, - "step": 10956 - }, - { - "epoch": 0.28, - "learning_rate": 1.9788555923075764e-06, - "loss": 0.9561, - "step": 10957 - }, - { - "epoch": 0.28, - "learning_rate": 1.9788499318720433e-06, - "loss": 0.8125, - "step": 10958 - }, - { - "epoch": 0.28, - "learning_rate": 1.97884427068705e-06, - "loss": 0.7495, - "step": 10959 - }, - { - "epoch": 0.28, - "learning_rate": 1.9788386087526005e-06, - "loss": 0.918, - "step": 10960 - }, - { - "epoch": 0.28, - "learning_rate": 1.978832946068699e-06, - "loss": 0.7744, - "step": 10961 - }, - { - "epoch": 0.28, - "learning_rate": 1.9788272826353506e-06, - "loss": 0.8242, - "step": 10962 - }, - { - "epoch": 0.28, - "learning_rate": 1.978821618452559e-06, - "loss": 0.9629, - "step": 10963 - }, - { - "epoch": 0.28, - "learning_rate": 1.9788159535203283e-06, - "loss": 1.0049, - "step": 10964 - }, - { - "epoch": 0.28, - "learning_rate": 1.9788102878386636e-06, - "loss": 0.918, - "step": 10965 - }, - { - "epoch": 0.28, - "learning_rate": 1.9788046214075687e-06, - "loss": 1.1797, - "step": 10966 - }, - { - "epoch": 0.28, - "learning_rate": 1.9787989542270483e-06, - "loss": 0.71, - "step": 10967 - }, - { - "epoch": 0.28, - "learning_rate": 1.9787932862971066e-06, - "loss": 0.9512, - "step": 10968 - }, - { - "epoch": 0.28, - "learning_rate": 1.9787876176177478e-06, - "loss": 0.8164, - "step": 10969 - }, - { - "epoch": 0.28, - "learning_rate": 1.978781948188976e-06, - "loss": 1.0039, - "step": 10970 - }, - { - "epoch": 0.28, - "learning_rate": 1.978776278010796e-06, - "loss": 1.0225, - "step": 10971 - }, - { - "epoch": 0.28, - "learning_rate": 1.9787706070832123e-06, - "loss": 0.832, - "step": 10972 - }, - { - "epoch": 0.28, - "learning_rate": 1.978764935406229e-06, - "loss": 0.9961, - "step": 10973 - }, - { - "epoch": 0.28, - "learning_rate": 1.97875926297985e-06, - "loss": 0.877, - "step": 10974 - }, - { - "epoch": 0.28, - "learning_rate": 1.9787535898040804e-06, - "loss": 0.8652, - "step": 10975 - }, - { - "epoch": 0.28, - "learning_rate": 1.978747915878924e-06, - "loss": 0.9062, - "step": 10976 - }, - { - "epoch": 0.28, - "learning_rate": 1.9787422412043853e-06, - "loss": 0.9199, - "step": 10977 - }, - { - "epoch": 0.28, - "learning_rate": 1.9787365657804686e-06, - "loss": 0.696, - "step": 10978 - }, - { - "epoch": 0.28, - "learning_rate": 1.9787308896071786e-06, - "loss": 0.7852, - "step": 10979 - }, - { - "epoch": 0.28, - "learning_rate": 1.9787252126845193e-06, - "loss": 1.0703, - "step": 10980 - }, - { - "epoch": 0.28, - "learning_rate": 1.9787195350124946e-06, - "loss": 0.7822, - "step": 10981 - }, - { - "epoch": 0.28, - "learning_rate": 1.97871385659111e-06, - "loss": 1.2539, - "step": 10982 - }, - { - "epoch": 0.28, - "learning_rate": 1.978708177420369e-06, - "loss": 0.8721, - "step": 10983 - }, - { - "epoch": 0.28, - "learning_rate": 1.978702497500276e-06, - "loss": 0.9971, - "step": 10984 - }, - { - "epoch": 0.28, - "learning_rate": 1.9786968168308357e-06, - "loss": 1.0605, - "step": 10985 - }, - { - "epoch": 0.28, - "learning_rate": 1.9786911354120522e-06, - "loss": 0.9775, - "step": 10986 - }, - { - "epoch": 0.28, - "learning_rate": 1.9786854532439297e-06, - "loss": 0.7686, - "step": 10987 - }, - { - "epoch": 0.28, - "learning_rate": 1.9786797703264726e-06, - "loss": 1.0977, - "step": 10988 - }, - { - "epoch": 0.28, - "learning_rate": 1.9786740866596862e-06, - "loss": 0.8223, - "step": 10989 - }, - { - "epoch": 0.28, - "learning_rate": 1.9786684022435734e-06, - "loss": 0.8672, - "step": 10990 - }, - { - "epoch": 0.28, - "learning_rate": 1.978662717078139e-06, - "loss": 1.0312, - "step": 10991 - }, - { - "epoch": 0.28, - "learning_rate": 1.9786570311633883e-06, - "loss": 0.8096, - "step": 10992 - }, - { - "epoch": 0.28, - "learning_rate": 1.9786513444993246e-06, - "loss": 0.9893, - "step": 10993 - }, - { - "epoch": 0.28, - "learning_rate": 1.9786456570859526e-06, - "loss": 0.6323, - "step": 10994 - }, - { - "epoch": 0.28, - "learning_rate": 1.9786399689232762e-06, - "loss": 1.0234, - "step": 10995 - }, - { - "epoch": 0.28, - "learning_rate": 1.9786342800113005e-06, - "loss": 0.8584, - "step": 10996 - }, - { - "epoch": 0.28, - "learning_rate": 1.9786285903500297e-06, - "loss": 0.8037, - "step": 10997 - }, - { - "epoch": 0.28, - "learning_rate": 1.9786228999394677e-06, - "loss": 0.5598, - "step": 10998 - }, - { - "epoch": 0.28, - "learning_rate": 1.978617208779619e-06, - "loss": 0.7178, - "step": 10999 - }, - { - "epoch": 0.28, - "learning_rate": 1.9786115168704884e-06, - "loss": 0.9238, - "step": 11000 - }, - { - "epoch": 0.28, - "learning_rate": 1.97860582421208e-06, - "loss": 0.7578, - "step": 11001 - }, - { - "epoch": 0.28, - "learning_rate": 1.9786001308043982e-06, - "loss": 0.7539, - "step": 11002 - }, - { - "epoch": 0.28, - "learning_rate": 1.978594436647447e-06, - "loss": 0.8916, - "step": 11003 - }, - { - "epoch": 0.28, - "learning_rate": 1.978588741741231e-06, - "loss": 0.9824, - "step": 11004 - }, - { - "epoch": 0.28, - "learning_rate": 1.978583046085755e-06, - "loss": 1.125, - "step": 11005 - }, - { - "epoch": 0.28, - "learning_rate": 1.9785773496810224e-06, - "loss": 0.7593, - "step": 11006 - }, - { - "epoch": 0.28, - "learning_rate": 1.978571652527039e-06, - "loss": 0.9521, - "step": 11007 - }, - { - "epoch": 0.28, - "learning_rate": 1.978565954623807e-06, - "loss": 0.8486, - "step": 11008 - }, - { - "epoch": 0.28, - "learning_rate": 1.978560255971333e-06, - "loss": 1.0908, - "step": 11009 - }, - { - "epoch": 0.28, - "learning_rate": 1.97855455656962e-06, - "loss": 0.9316, - "step": 11010 - }, - { - "epoch": 0.28, - "learning_rate": 1.978548856418673e-06, - "loss": 0.8105, - "step": 11011 - }, - { - "epoch": 0.28, - "learning_rate": 1.978543155518496e-06, - "loss": 0.8848, - "step": 11012 - }, - { - "epoch": 0.28, - "learning_rate": 1.9785374538690935e-06, - "loss": 0.8994, - "step": 11013 - }, - { - "epoch": 0.28, - "learning_rate": 1.97853175147047e-06, - "loss": 0.7295, - "step": 11014 - }, - { - "epoch": 0.28, - "learning_rate": 1.97852604832263e-06, - "loss": 0.9849, - "step": 11015 - }, - { - "epoch": 0.28, - "learning_rate": 1.9785203444255768e-06, - "loss": 0.9404, - "step": 11016 - }, - { - "epoch": 0.28, - "learning_rate": 1.978514639779316e-06, - "loss": 0.7871, - "step": 11017 - }, - { - "epoch": 0.28, - "learning_rate": 1.978508934383852e-06, - "loss": 0.8838, - "step": 11018 - }, - { - "epoch": 0.28, - "learning_rate": 1.978503228239188e-06, - "loss": 0.8896, - "step": 11019 - }, - { - "epoch": 0.28, - "learning_rate": 1.9784975213453294e-06, - "loss": 0.8945, - "step": 11020 - }, - { - "epoch": 0.28, - "learning_rate": 1.97849181370228e-06, - "loss": 0.8418, - "step": 11021 - }, - { - "epoch": 0.28, - "learning_rate": 1.9784861053100446e-06, - "loss": 0.7764, - "step": 11022 - }, - { - "epoch": 0.28, - "learning_rate": 1.9784803961686276e-06, - "loss": 0.8013, - "step": 11023 - }, - { - "epoch": 0.28, - "learning_rate": 1.9784746862780327e-06, - "loss": 0.9941, - "step": 11024 - }, - { - "epoch": 0.28, - "learning_rate": 1.978468975638265e-06, - "loss": 1.0703, - "step": 11025 - }, - { - "epoch": 0.28, - "learning_rate": 1.9784632642493287e-06, - "loss": 0.8867, - "step": 11026 - }, - { - "epoch": 0.28, - "learning_rate": 1.9784575521112277e-06, - "loss": 0.7881, - "step": 11027 - }, - { - "epoch": 0.28, - "learning_rate": 1.978451839223967e-06, - "loss": 1.0098, - "step": 11028 - }, - { - "epoch": 0.28, - "learning_rate": 1.9784461255875507e-06, - "loss": 0.8926, - "step": 11029 - }, - { - "epoch": 0.28, - "learning_rate": 1.978440411201983e-06, - "loss": 0.9238, - "step": 11030 - }, - { - "epoch": 0.28, - "learning_rate": 1.9784346960672684e-06, - "loss": 0.9141, - "step": 11031 - }, - { - "epoch": 0.28, - "learning_rate": 1.978428980183412e-06, - "loss": 0.9243, - "step": 11032 - }, - { - "epoch": 0.28, - "learning_rate": 1.9784232635504166e-06, - "loss": 0.915, - "step": 11033 - }, - { - "epoch": 0.28, - "learning_rate": 1.978417546168288e-06, - "loss": 0.9717, - "step": 11034 - }, - { - "epoch": 0.28, - "learning_rate": 1.9784118280370303e-06, - "loss": 0.8994, - "step": 11035 - }, - { - "epoch": 0.28, - "learning_rate": 1.9784061091566473e-06, - "loss": 0.8682, - "step": 11036 - }, - { - "epoch": 0.28, - "learning_rate": 1.9784003895271438e-06, - "loss": 0.8955, - "step": 11037 - }, - { - "epoch": 0.28, - "learning_rate": 1.9783946691485243e-06, - "loss": 0.6479, - "step": 11038 - }, - { - "epoch": 0.28, - "learning_rate": 1.9783889480207927e-06, - "loss": 0.8008, - "step": 11039 - }, - { - "epoch": 0.28, - "learning_rate": 1.978383226143954e-06, - "loss": 0.8184, - "step": 11040 - }, - { - "epoch": 0.28, - "learning_rate": 1.978377503518012e-06, - "loss": 0.9814, - "step": 11041 - }, - { - "epoch": 0.28, - "learning_rate": 1.9783717801429712e-06, - "loss": 1.0127, - "step": 11042 - }, - { - "epoch": 0.28, - "learning_rate": 1.9783660560188364e-06, - "loss": 0.666, - "step": 11043 - }, - { - "epoch": 0.28, - "learning_rate": 1.9783603311456115e-06, - "loss": 1.0166, - "step": 11044 - }, - { - "epoch": 0.28, - "learning_rate": 1.9783546055233016e-06, - "loss": 0.7251, - "step": 11045 - }, - { - "epoch": 0.28, - "learning_rate": 1.97834887915191e-06, - "loss": 0.9482, - "step": 11046 - }, - { - "epoch": 0.28, - "learning_rate": 1.978343152031442e-06, - "loss": 0.9268, - "step": 11047 - }, - { - "epoch": 0.28, - "learning_rate": 1.978337424161901e-06, - "loss": 0.7124, - "step": 11048 - }, - { - "epoch": 0.28, - "learning_rate": 1.9783316955432925e-06, - "loss": 0.8848, - "step": 11049 - }, - { - "epoch": 0.28, - "learning_rate": 1.9783259661756206e-06, - "loss": 0.791, - "step": 11050 - }, - { - "epoch": 0.28, - "learning_rate": 1.978320236058889e-06, - "loss": 0.7925, - "step": 11051 - }, - { - "epoch": 0.28, - "learning_rate": 1.978314505193103e-06, - "loss": 0.792, - "step": 11052 - }, - { - "epoch": 0.28, - "learning_rate": 1.9783087735782666e-06, - "loss": 0.8818, - "step": 11053 - }, - { - "epoch": 0.28, - "learning_rate": 1.9783030412143837e-06, - "loss": 0.9385, - "step": 11054 - }, - { - "epoch": 0.28, - "learning_rate": 1.9782973081014595e-06, - "loss": 0.8896, - "step": 11055 - }, - { - "epoch": 0.28, - "learning_rate": 1.9782915742394976e-06, - "loss": 1.0117, - "step": 11056 - }, - { - "epoch": 0.28, - "learning_rate": 1.9782858396285033e-06, - "loss": 0.8564, - "step": 11057 - }, - { - "epoch": 0.28, - "learning_rate": 1.9782801042684802e-06, - "loss": 1.0596, - "step": 11058 - }, - { - "epoch": 0.28, - "learning_rate": 1.9782743681594336e-06, - "loss": 1.0205, - "step": 11059 - }, - { - "epoch": 0.28, - "learning_rate": 1.9782686313013667e-06, - "loss": 1.0166, - "step": 11060 - }, - { - "epoch": 0.28, - "learning_rate": 1.9782628936942847e-06, - "loss": 1.1738, - "step": 11061 - }, - { - "epoch": 0.28, - "learning_rate": 1.9782571553381918e-06, - "loss": 0.7129, - "step": 11062 - }, - { - "epoch": 0.28, - "learning_rate": 1.978251416233092e-06, - "loss": 1.0527, - "step": 11063 - }, - { - "epoch": 0.28, - "learning_rate": 1.9782456763789906e-06, - "loss": 0.8633, - "step": 11064 - }, - { - "epoch": 0.28, - "learning_rate": 1.978239935775891e-06, - "loss": 0.752, - "step": 11065 - }, - { - "epoch": 0.28, - "learning_rate": 1.9782341944237982e-06, - "loss": 1.0137, - "step": 11066 - }, - { - "epoch": 0.28, - "learning_rate": 1.978228452322717e-06, - "loss": 0.8574, - "step": 11067 - }, - { - "epoch": 0.28, - "learning_rate": 1.978222709472651e-06, - "loss": 0.6001, - "step": 11068 - }, - { - "epoch": 0.28, - "learning_rate": 1.9782169658736044e-06, - "loss": 0.9541, - "step": 11069 - }, - { - "epoch": 0.28, - "learning_rate": 1.978211221525582e-06, - "loss": 0.7397, - "step": 11070 - }, - { - "epoch": 0.28, - "learning_rate": 1.978205476428589e-06, - "loss": 0.917, - "step": 11071 - }, - { - "epoch": 0.28, - "learning_rate": 1.9781997305826287e-06, - "loss": 0.9316, - "step": 11072 - }, - { - "epoch": 0.28, - "learning_rate": 1.9781939839877055e-06, - "loss": 0.8584, - "step": 11073 - }, - { - "epoch": 0.28, - "learning_rate": 1.9781882366438243e-06, - "loss": 0.8154, - "step": 11074 - }, - { - "epoch": 0.28, - "learning_rate": 1.97818248855099e-06, - "loss": 1.0312, - "step": 11075 - }, - { - "epoch": 0.28, - "learning_rate": 1.9781767397092054e-06, - "loss": 0.9834, - "step": 11076 - }, - { - "epoch": 0.28, - "learning_rate": 1.9781709901184766e-06, - "loss": 1.1348, - "step": 11077 - }, - { - "epoch": 0.28, - "learning_rate": 1.9781652397788067e-06, - "loss": 0.9678, - "step": 11078 - }, - { - "epoch": 0.28, - "learning_rate": 1.978159488690201e-06, - "loss": 0.6294, - "step": 11079 - }, - { - "epoch": 0.28, - "learning_rate": 1.978153736852663e-06, - "loss": 1.0791, - "step": 11080 - }, - { - "epoch": 0.28, - "learning_rate": 1.9781479842661985e-06, - "loss": 1.0957, - "step": 11081 - }, - { - "epoch": 0.28, - "learning_rate": 1.9781422309308103e-06, - "loss": 0.9834, - "step": 11082 - }, - { - "epoch": 0.28, - "learning_rate": 1.978136476846504e-06, - "loss": 0.8184, - "step": 11083 - }, - { - "epoch": 0.28, - "learning_rate": 1.9781307220132836e-06, - "loss": 1.0479, - "step": 11084 - }, - { - "epoch": 0.28, - "learning_rate": 1.9781249664311536e-06, - "loss": 1.0957, - "step": 11085 - }, - { - "epoch": 0.28, - "learning_rate": 1.9781192101001178e-06, - "loss": 0.9443, - "step": 11086 - }, - { - "epoch": 0.28, - "learning_rate": 1.978113453020181e-06, - "loss": 0.9067, - "step": 11087 - }, - { - "epoch": 0.28, - "learning_rate": 1.9781076951913484e-06, - "loss": 0.9434, - "step": 11088 - }, - { - "epoch": 0.28, - "learning_rate": 1.9781019366136233e-06, - "loss": 0.7773, - "step": 11089 - }, - { - "epoch": 0.28, - "learning_rate": 1.9780961772870105e-06, - "loss": 0.7056, - "step": 11090 - }, - { - "epoch": 0.28, - "learning_rate": 1.9780904172115147e-06, - "loss": 0.8242, - "step": 11091 - }, - { - "epoch": 0.28, - "learning_rate": 1.9780846563871398e-06, - "loss": 0.9248, - "step": 11092 - }, - { - "epoch": 0.28, - "learning_rate": 1.9780788948138903e-06, - "loss": 0.8218, - "step": 11093 - }, - { - "epoch": 0.28, - "learning_rate": 1.9780731324917714e-06, - "loss": 0.9688, - "step": 11094 - }, - { - "epoch": 0.28, - "learning_rate": 1.9780673694207863e-06, - "loss": 0.874, - "step": 11095 - }, - { - "epoch": 0.28, - "learning_rate": 1.9780616056009404e-06, - "loss": 0.9795, - "step": 11096 - }, - { - "epoch": 0.28, - "learning_rate": 1.978055841032237e-06, - "loss": 0.7837, - "step": 11097 - }, - { - "epoch": 0.28, - "learning_rate": 1.978050075714682e-06, - "loss": 0.8633, - "step": 11098 - }, - { - "epoch": 0.28, - "learning_rate": 1.9780443096482784e-06, - "loss": 0.9648, - "step": 11099 - }, - { - "epoch": 0.28, - "learning_rate": 1.9780385428330317e-06, - "loss": 1.0205, - "step": 11100 - }, - { - "epoch": 0.28, - "learning_rate": 1.9780327752689456e-06, - "loss": 0.8242, - "step": 11101 - }, - { - "epoch": 0.28, - "learning_rate": 1.9780270069560248e-06, - "loss": 0.9619, - "step": 11102 - }, - { - "epoch": 0.28, - "learning_rate": 1.978021237894274e-06, - "loss": 0.9385, - "step": 11103 - }, - { - "epoch": 0.28, - "learning_rate": 1.9780154680836968e-06, - "loss": 0.959, - "step": 11104 - }, - { - "epoch": 0.28, - "learning_rate": 1.9780096975242984e-06, - "loss": 1.0098, - "step": 11105 - }, - { - "epoch": 0.28, - "learning_rate": 1.978003926216083e-06, - "loss": 0.9062, - "step": 11106 - }, - { - "epoch": 0.28, - "learning_rate": 1.977998154159055e-06, - "loss": 0.9932, - "step": 11107 - }, - { - "epoch": 0.28, - "learning_rate": 1.977992381353219e-06, - "loss": 1.0498, - "step": 11108 - }, - { - "epoch": 0.28, - "learning_rate": 1.9779866077985786e-06, - "loss": 0.7393, - "step": 11109 - }, - { - "epoch": 0.28, - "learning_rate": 1.9779808334951392e-06, - "loss": 0.6968, - "step": 11110 - }, - { - "epoch": 0.28, - "learning_rate": 1.9779750584429045e-06, - "loss": 0.8945, - "step": 11111 - }, - { - "epoch": 0.28, - "learning_rate": 1.9779692826418796e-06, - "loss": 1.002, - "step": 11112 - }, - { - "epoch": 0.28, - "learning_rate": 1.9779635060920686e-06, - "loss": 0.7588, - "step": 11113 - }, - { - "epoch": 0.28, - "learning_rate": 1.977957728793476e-06, - "loss": 0.8994, - "step": 11114 - }, - { - "epoch": 0.28, - "learning_rate": 1.977951950746106e-06, - "loss": 1.0566, - "step": 11115 - }, - { - "epoch": 0.28, - "learning_rate": 1.9779461719499627e-06, - "loss": 0.9473, - "step": 11116 - }, - { - "epoch": 0.28, - "learning_rate": 1.9779403924050513e-06, - "loss": 1.0117, - "step": 11117 - }, - { - "epoch": 0.28, - "learning_rate": 1.9779346121113763e-06, - "loss": 0.6704, - "step": 11118 - }, - { - "epoch": 0.28, - "learning_rate": 1.9779288310689415e-06, - "loss": 0.8994, - "step": 11119 - }, - { - "epoch": 0.29, - "learning_rate": 1.9779230492777512e-06, - "loss": 0.998, - "step": 11120 - }, - { - "epoch": 0.29, - "learning_rate": 1.9779172667378105e-06, - "loss": 0.9678, - "step": 11121 - }, - { - "epoch": 0.29, - "learning_rate": 1.9779114834491235e-06, - "loss": 0.5981, - "step": 11122 - }, - { - "epoch": 0.29, - "learning_rate": 1.977905699411695e-06, - "loss": 0.7705, - "step": 11123 - }, - { - "epoch": 0.29, - "learning_rate": 1.9778999146255284e-06, - "loss": 0.7725, - "step": 11124 - }, - { - "epoch": 0.29, - "learning_rate": 1.977894129090629e-06, - "loss": 0.8506, - "step": 11125 - }, - { - "epoch": 0.29, - "learning_rate": 1.9778883428070013e-06, - "loss": 0.9912, - "step": 11126 - }, - { - "epoch": 0.29, - "learning_rate": 1.9778825557746494e-06, - "loss": 0.7676, - "step": 11127 - }, - { - "epoch": 0.29, - "learning_rate": 1.9778767679935775e-06, - "loss": 0.7295, - "step": 11128 - }, - { - "epoch": 0.29, - "learning_rate": 1.977870979463791e-06, - "loss": 0.9912, - "step": 11129 - }, - { - "epoch": 0.29, - "learning_rate": 1.9778651901852926e-06, - "loss": 0.9463, - "step": 11130 - }, - { - "epoch": 0.29, - "learning_rate": 1.977859400158089e-06, - "loss": 0.8672, - "step": 11131 - }, - { - "epoch": 0.29, - "learning_rate": 1.9778536093821824e-06, - "loss": 0.9824, - "step": 11132 - }, - { - "epoch": 0.29, - "learning_rate": 1.9778478178575786e-06, - "loss": 0.9844, - "step": 11133 - }, - { - "epoch": 0.29, - "learning_rate": 1.977842025584282e-06, - "loss": 0.8633, - "step": 11134 - }, - { - "epoch": 0.29, - "learning_rate": 1.9778362325622965e-06, - "loss": 0.9932, - "step": 11135 - }, - { - "epoch": 0.29, - "learning_rate": 1.9778304387916264e-06, - "loss": 1.082, - "step": 11136 - }, - { - "epoch": 0.29, - "learning_rate": 1.9778246442722766e-06, - "loss": 0.9199, - "step": 11137 - }, - { - "epoch": 0.29, - "learning_rate": 1.9778188490042517e-06, - "loss": 0.8823, - "step": 11138 - }, - { - "epoch": 0.29, - "learning_rate": 1.977813052987556e-06, - "loss": 1.0088, - "step": 11139 - }, - { - "epoch": 0.29, - "learning_rate": 1.9778072562221933e-06, - "loss": 0.79, - "step": 11140 - }, - { - "epoch": 0.29, - "learning_rate": 1.977801458708169e-06, - "loss": 1.0957, - "step": 11141 - }, - { - "epoch": 0.29, - "learning_rate": 1.977795660445487e-06, - "loss": 1.042, - "step": 11142 - }, - { - "epoch": 0.29, - "learning_rate": 1.977789861434152e-06, - "loss": 0.8975, - "step": 11143 - }, - { - "epoch": 0.29, - "learning_rate": 1.977784061674168e-06, - "loss": 0.79, - "step": 11144 - }, - { - "epoch": 0.29, - "learning_rate": 1.9777782611655396e-06, - "loss": 0.9463, - "step": 11145 - }, - { - "epoch": 0.29, - "learning_rate": 1.9777724599082714e-06, - "loss": 0.9521, - "step": 11146 - }, - { - "epoch": 0.29, - "learning_rate": 1.977766657902368e-06, - "loss": 1.0908, - "step": 11147 - }, - { - "epoch": 0.29, - "learning_rate": 1.9777608551478334e-06, - "loss": 0.8779, - "step": 11148 - }, - { - "epoch": 0.29, - "learning_rate": 1.9777550516446726e-06, - "loss": 0.8379, - "step": 11149 - }, - { - "epoch": 0.29, - "learning_rate": 1.977749247392889e-06, - "loss": 0.6709, - "step": 11150 - }, - { - "epoch": 0.29, - "learning_rate": 1.9777434423924888e-06, - "loss": 0.9902, - "step": 11151 - }, - { - "epoch": 0.29, - "learning_rate": 1.9777376366434747e-06, - "loss": 0.9727, - "step": 11152 - }, - { - "epoch": 0.29, - "learning_rate": 1.977731830145852e-06, - "loss": 0.9521, - "step": 11153 - }, - { - "epoch": 0.29, - "learning_rate": 1.9777260228996247e-06, - "loss": 0.7026, - "step": 11154 - }, - { - "epoch": 0.29, - "learning_rate": 1.977720214904798e-06, - "loss": 0.7578, - "step": 11155 - }, - { - "epoch": 0.29, - "learning_rate": 1.9777144061613755e-06, - "loss": 0.8926, - "step": 11156 - }, - { - "epoch": 0.29, - "learning_rate": 1.9777085966693627e-06, - "loss": 0.958, - "step": 11157 - }, - { - "epoch": 0.29, - "learning_rate": 1.977702786428763e-06, - "loss": 0.6636, - "step": 11158 - }, - { - "epoch": 0.29, - "learning_rate": 1.9776969754395807e-06, - "loss": 1.0303, - "step": 11159 - }, - { - "epoch": 0.29, - "learning_rate": 1.9776911637018214e-06, - "loss": 0.9121, - "step": 11160 - }, - { - "epoch": 0.29, - "learning_rate": 1.9776853512154886e-06, - "loss": 1.0303, - "step": 11161 - }, - { - "epoch": 0.29, - "learning_rate": 1.977679537980587e-06, - "loss": 0.9199, - "step": 11162 - }, - { - "epoch": 0.29, - "learning_rate": 1.977673723997122e-06, - "loss": 0.7549, - "step": 11163 - }, - { - "epoch": 0.29, - "learning_rate": 1.9776679092650964e-06, - "loss": 0.7607, - "step": 11164 - }, - { - "epoch": 0.29, - "learning_rate": 1.9776620937845157e-06, - "loss": 0.875, - "step": 11165 - }, - { - "epoch": 0.29, - "learning_rate": 1.977656277555384e-06, - "loss": 0.8252, - "step": 11166 - }, - { - "epoch": 0.29, - "learning_rate": 1.9776504605777057e-06, - "loss": 1.0332, - "step": 11167 - }, - { - "epoch": 0.29, - "learning_rate": 1.9776446428514857e-06, - "loss": 0.7988, - "step": 11168 - }, - { - "epoch": 0.29, - "learning_rate": 1.977638824376728e-06, - "loss": 0.6409, - "step": 11169 - }, - { - "epoch": 0.29, - "learning_rate": 1.977633005153437e-06, - "loss": 0.9121, - "step": 11170 - }, - { - "epoch": 0.29, - "learning_rate": 1.9776271851816176e-06, - "loss": 1.0078, - "step": 11171 - }, - { - "epoch": 0.29, - "learning_rate": 1.977621364461274e-06, - "loss": 0.9424, - "step": 11172 - }, - { - "epoch": 0.29, - "learning_rate": 1.9776155429924107e-06, - "loss": 0.9512, - "step": 11173 - }, - { - "epoch": 0.29, - "learning_rate": 1.9776097207750318e-06, - "loss": 0.9023, - "step": 11174 - }, - { - "epoch": 0.29, - "learning_rate": 1.9776038978091426e-06, - "loss": 0.7568, - "step": 11175 - }, - { - "epoch": 0.29, - "learning_rate": 1.9775980740947465e-06, - "loss": 0.8955, - "step": 11176 - }, - { - "epoch": 0.29, - "learning_rate": 1.977592249631849e-06, - "loss": 0.7764, - "step": 11177 - }, - { - "epoch": 0.29, - "learning_rate": 1.977586424420454e-06, - "loss": 0.9141, - "step": 11178 - }, - { - "epoch": 0.29, - "learning_rate": 1.9775805984605658e-06, - "loss": 0.8037, - "step": 11179 - }, - { - "epoch": 0.29, - "learning_rate": 1.9775747717521894e-06, - "loss": 1.0918, - "step": 11180 - }, - { - "epoch": 0.29, - "learning_rate": 1.9775689442953285e-06, - "loss": 1.0049, - "step": 11181 - }, - { - "epoch": 0.29, - "learning_rate": 1.9775631160899883e-06, - "loss": 0.7715, - "step": 11182 - }, - { - "epoch": 0.29, - "learning_rate": 1.977557287136173e-06, - "loss": 0.7681, - "step": 11183 - }, - { - "epoch": 0.29, - "learning_rate": 1.9775514574338866e-06, - "loss": 0.7746, - "step": 11184 - }, - { - "epoch": 0.29, - "learning_rate": 1.977545626983135e-06, - "loss": 0.9375, - "step": 11185 - }, - { - "epoch": 0.29, - "learning_rate": 1.9775397957839207e-06, - "loss": 1.0205, - "step": 11186 - }, - { - "epoch": 0.29, - "learning_rate": 1.9775339638362496e-06, - "loss": 0.8623, - "step": 11187 - }, - { - "epoch": 0.29, - "learning_rate": 1.9775281311401253e-06, - "loss": 1.0811, - "step": 11188 - }, - { - "epoch": 0.29, - "learning_rate": 1.977522297695553e-06, - "loss": 0.9229, - "step": 11189 - }, - { - "epoch": 0.29, - "learning_rate": 1.977516463502537e-06, - "loss": 0.9688, - "step": 11190 - }, - { - "epoch": 0.29, - "learning_rate": 1.977510628561081e-06, - "loss": 0.8975, - "step": 11191 - }, - { - "epoch": 0.29, - "learning_rate": 1.9775047928711905e-06, - "loss": 0.9141, - "step": 11192 - }, - { - "epoch": 0.29, - "learning_rate": 1.977498956432869e-06, - "loss": 0.8569, - "step": 11193 - }, - { - "epoch": 0.29, - "learning_rate": 1.977493119246122e-06, - "loss": 1.0654, - "step": 11194 - }, - { - "epoch": 0.29, - "learning_rate": 1.9774872813109535e-06, - "loss": 0.9072, - "step": 11195 - }, - { - "epoch": 0.29, - "learning_rate": 1.977481442627368e-06, - "loss": 0.6484, - "step": 11196 - }, - { - "epoch": 0.29, - "learning_rate": 1.9774756031953692e-06, - "loss": 1.0137, - "step": 11197 - }, - { - "epoch": 0.29, - "learning_rate": 1.977469763014963e-06, - "loss": 0.8037, - "step": 11198 - }, - { - "epoch": 0.29, - "learning_rate": 1.977463922086153e-06, - "loss": 0.7891, - "step": 11199 - }, - { - "epoch": 0.29, - "learning_rate": 1.977458080408944e-06, - "loss": 0.8525, - "step": 11200 - }, - { - "epoch": 0.29, - "learning_rate": 1.9774522379833396e-06, - "loss": 0.9453, - "step": 11201 - }, - { - "epoch": 0.29, - "learning_rate": 1.9774463948093458e-06, - "loss": 0.9883, - "step": 11202 - }, - { - "epoch": 0.29, - "learning_rate": 1.9774405508869657e-06, - "loss": 0.8906, - "step": 11203 - }, - { - "epoch": 0.29, - "learning_rate": 1.977434706216204e-06, - "loss": 0.9785, - "step": 11204 - }, - { - "epoch": 0.29, - "learning_rate": 1.977428860797066e-06, - "loss": 0.9844, - "step": 11205 - }, - { - "epoch": 0.29, - "learning_rate": 1.9774230146295557e-06, - "loss": 0.8096, - "step": 11206 - }, - { - "epoch": 0.29, - "learning_rate": 1.9774171677136774e-06, - "loss": 0.9961, - "step": 11207 - }, - { - "epoch": 0.29, - "learning_rate": 1.977411320049436e-06, - "loss": 0.9038, - "step": 11208 - }, - { - "epoch": 0.29, - "learning_rate": 1.9774054716368353e-06, - "loss": 0.7363, - "step": 11209 - }, - { - "epoch": 0.29, - "learning_rate": 1.9773996224758805e-06, - "loss": 1.0791, - "step": 11210 - }, - { - "epoch": 0.29, - "learning_rate": 1.977393772566576e-06, - "loss": 0.9756, - "step": 11211 - }, - { - "epoch": 0.29, - "learning_rate": 1.9773879219089253e-06, - "loss": 0.7827, - "step": 11212 - }, - { - "epoch": 0.29, - "learning_rate": 1.9773820705029337e-06, - "loss": 0.7495, - "step": 11213 - }, - { - "epoch": 0.29, - "learning_rate": 1.977376218348606e-06, - "loss": 0.8486, - "step": 11214 - }, - { - "epoch": 0.29, - "learning_rate": 1.9773703654459458e-06, - "loss": 0.7783, - "step": 11215 - }, - { - "epoch": 0.29, - "learning_rate": 1.9773645117949587e-06, - "loss": 0.8252, - "step": 11216 - }, - { - "epoch": 0.29, - "learning_rate": 1.977358657395648e-06, - "loss": 0.8535, - "step": 11217 - }, - { - "epoch": 0.29, - "learning_rate": 1.977352802248019e-06, - "loss": 0.6978, - "step": 11218 - }, - { - "epoch": 0.29, - "learning_rate": 1.9773469463520755e-06, - "loss": 0.957, - "step": 11219 - }, - { - "epoch": 0.29, - "learning_rate": 1.977341089707823e-06, - "loss": 0.8823, - "step": 11220 - }, - { - "epoch": 0.29, - "learning_rate": 1.977335232315265e-06, - "loss": 0.8174, - "step": 11221 - }, - { - "epoch": 0.29, - "learning_rate": 1.9773293741744064e-06, - "loss": 0.9473, - "step": 11222 - }, - { - "epoch": 0.29, - "learning_rate": 1.9773235152852514e-06, - "loss": 0.9277, - "step": 11223 - }, - { - "epoch": 0.29, - "learning_rate": 1.977317655647805e-06, - "loss": 0.7871, - "step": 11224 - }, - { - "epoch": 0.29, - "learning_rate": 1.9773117952620714e-06, - "loss": 1.2305, - "step": 11225 - }, - { - "epoch": 0.29, - "learning_rate": 1.977305934128055e-06, - "loss": 0.5601, - "step": 11226 - }, - { - "epoch": 0.29, - "learning_rate": 1.9773000722457606e-06, - "loss": 0.7622, - "step": 11227 - }, - { - "epoch": 0.29, - "learning_rate": 1.977294209615192e-06, - "loss": 0.8018, - "step": 11228 - }, - { - "epoch": 0.29, - "learning_rate": 1.9772883462363544e-06, - "loss": 0.9951, - "step": 11229 - }, - { - "epoch": 0.29, - "learning_rate": 1.9772824821092523e-06, - "loss": 0.6323, - "step": 11230 - }, - { - "epoch": 0.29, - "learning_rate": 1.97727661723389e-06, - "loss": 0.9814, - "step": 11231 - }, - { - "epoch": 0.29, - "learning_rate": 1.9772707516102716e-06, - "loss": 0.7441, - "step": 11232 - }, - { - "epoch": 0.29, - "learning_rate": 1.9772648852384018e-06, - "loss": 0.8975, - "step": 11233 - }, - { - "epoch": 0.29, - "learning_rate": 1.9772590181182855e-06, - "loss": 0.8574, - "step": 11234 - }, - { - "epoch": 0.29, - "learning_rate": 1.9772531502499266e-06, - "loss": 0.6782, - "step": 11235 - }, - { - "epoch": 0.29, - "learning_rate": 1.97724728163333e-06, - "loss": 0.9893, - "step": 11236 - }, - { - "epoch": 0.29, - "learning_rate": 1.9772414122685003e-06, - "loss": 0.8574, - "step": 11237 - }, - { - "epoch": 0.29, - "learning_rate": 1.9772355421554423e-06, - "loss": 1.0645, - "step": 11238 - }, - { - "epoch": 0.29, - "learning_rate": 1.9772296712941594e-06, - "loss": 0.9316, - "step": 11239 - }, - { - "epoch": 0.29, - "learning_rate": 1.9772237996846562e-06, - "loss": 0.9482, - "step": 11240 - }, - { - "epoch": 0.29, - "learning_rate": 1.9772179273269384e-06, - "loss": 0.895, - "step": 11241 - }, - { - "epoch": 0.29, - "learning_rate": 1.9772120542210093e-06, - "loss": 0.9443, - "step": 11242 - }, - { - "epoch": 0.29, - "learning_rate": 1.977206180366874e-06, - "loss": 0.4089, - "step": 11243 - }, - { - "epoch": 0.29, - "learning_rate": 1.977200305764537e-06, - "loss": 0.6807, - "step": 11244 - }, - { - "epoch": 0.29, - "learning_rate": 1.9771944304140024e-06, - "loss": 0.959, - "step": 11245 - }, - { - "epoch": 0.29, - "learning_rate": 1.9771885543152755e-06, - "loss": 0.8848, - "step": 11246 - }, - { - "epoch": 0.29, - "learning_rate": 1.9771826774683597e-06, - "loss": 0.8936, - "step": 11247 - }, - { - "epoch": 0.29, - "learning_rate": 1.97717679987326e-06, - "loss": 0.8037, - "step": 11248 - }, - { - "epoch": 0.29, - "learning_rate": 1.9771709215299815e-06, - "loss": 0.9121, - "step": 11249 - }, - { - "epoch": 0.29, - "learning_rate": 1.977165042438528e-06, - "loss": 0.8647, - "step": 11250 - }, - { - "epoch": 0.29, - "learning_rate": 1.9771591625989037e-06, - "loss": 0.9521, - "step": 11251 - }, - { - "epoch": 0.29, - "learning_rate": 1.977153282011114e-06, - "loss": 1.0215, - "step": 11252 - }, - { - "epoch": 0.29, - "learning_rate": 1.977147400675163e-06, - "loss": 0.9385, - "step": 11253 - }, - { - "epoch": 0.29, - "learning_rate": 1.977141518591055e-06, - "loss": 0.7822, - "step": 11254 - }, - { - "epoch": 0.29, - "learning_rate": 1.9771356357587944e-06, - "loss": 0.9004, - "step": 11255 - }, - { - "epoch": 0.29, - "learning_rate": 1.9771297521783864e-06, - "loss": 1.1484, - "step": 11256 - }, - { - "epoch": 0.29, - "learning_rate": 1.977123867849835e-06, - "loss": 1.1091, - "step": 11257 - }, - { - "epoch": 0.29, - "learning_rate": 1.9771179827731445e-06, - "loss": 0.9316, - "step": 11258 - }, - { - "epoch": 0.29, - "learning_rate": 1.97711209694832e-06, - "loss": 0.9082, - "step": 11259 - }, - { - "epoch": 0.29, - "learning_rate": 1.9771062103753656e-06, - "loss": 1.04, - "step": 11260 - }, - { - "epoch": 0.29, - "learning_rate": 1.977100323054286e-06, - "loss": 0.853, - "step": 11261 - }, - { - "epoch": 0.29, - "learning_rate": 1.9770944349850854e-06, - "loss": 0.7334, - "step": 11262 - }, - { - "epoch": 0.29, - "learning_rate": 1.9770885461677687e-06, - "loss": 0.8213, - "step": 11263 - }, - { - "epoch": 0.29, - "learning_rate": 1.9770826566023402e-06, - "loss": 0.7622, - "step": 11264 - }, - { - "epoch": 0.29, - "learning_rate": 1.9770767662888042e-06, - "loss": 0.9658, - "step": 11265 - }, - { - "epoch": 0.29, - "learning_rate": 1.9770708752271658e-06, - "loss": 0.8594, - "step": 11266 - }, - { - "epoch": 0.29, - "learning_rate": 1.977064983417429e-06, - "loss": 0.834, - "step": 11267 - }, - { - "epoch": 0.29, - "learning_rate": 1.9770590908595984e-06, - "loss": 0.7637, - "step": 11268 - }, - { - "epoch": 0.29, - "learning_rate": 1.977053197553679e-06, - "loss": 0.8979, - "step": 11269 - }, - { - "epoch": 0.29, - "learning_rate": 1.977047303499674e-06, - "loss": 0.7842, - "step": 11270 - }, - { - "epoch": 0.29, - "learning_rate": 1.9770414086975894e-06, - "loss": 1.0938, - "step": 11271 - }, - { - "epoch": 0.29, - "learning_rate": 1.9770355131474293e-06, - "loss": 1.124, - "step": 11272 - }, - { - "epoch": 0.29, - "learning_rate": 1.9770296168491977e-06, - "loss": 0.9541, - "step": 11273 - }, - { - "epoch": 0.29, - "learning_rate": 1.9770237198028996e-06, - "loss": 1.1426, - "step": 11274 - }, - { - "epoch": 0.29, - "learning_rate": 1.9770178220085393e-06, - "loss": 0.7383, - "step": 11275 - }, - { - "epoch": 0.29, - "learning_rate": 1.9770119234661214e-06, - "loss": 0.8125, - "step": 11276 - }, - { - "epoch": 0.29, - "learning_rate": 1.97700602417565e-06, - "loss": 1.0244, - "step": 11277 - }, - { - "epoch": 0.29, - "learning_rate": 1.9770001241371307e-06, - "loss": 0.9199, - "step": 11278 - }, - { - "epoch": 0.29, - "learning_rate": 1.9769942233505672e-06, - "loss": 0.7959, - "step": 11279 - }, - { - "epoch": 0.29, - "learning_rate": 1.976988321815964e-06, - "loss": 0.8008, - "step": 11280 - }, - { - "epoch": 0.29, - "learning_rate": 1.9769824195333256e-06, - "loss": 0.7373, - "step": 11281 - }, - { - "epoch": 0.29, - "learning_rate": 1.9769765165026567e-06, - "loss": 1.0312, - "step": 11282 - }, - { - "epoch": 0.29, - "learning_rate": 1.976970612723962e-06, - "loss": 0.6875, - "step": 11283 - }, - { - "epoch": 0.29, - "learning_rate": 1.9769647081972458e-06, - "loss": 0.7422, - "step": 11284 - }, - { - "epoch": 0.29, - "learning_rate": 1.9769588029225126e-06, - "loss": 1.0156, - "step": 11285 - }, - { - "epoch": 0.29, - "learning_rate": 1.976952896899767e-06, - "loss": 0.7134, - "step": 11286 - }, - { - "epoch": 0.29, - "learning_rate": 1.9769469901290134e-06, - "loss": 0.8477, - "step": 11287 - }, - { - "epoch": 0.29, - "learning_rate": 1.9769410826102566e-06, - "loss": 0.9424, - "step": 11288 - }, - { - "epoch": 0.29, - "learning_rate": 1.9769351743435006e-06, - "loss": 0.7231, - "step": 11289 - }, - { - "epoch": 0.29, - "learning_rate": 1.9769292653287507e-06, - "loss": 0.6748, - "step": 11290 - }, - { - "epoch": 0.29, - "learning_rate": 1.9769233555660105e-06, - "loss": 1.0391, - "step": 11291 - }, - { - "epoch": 0.29, - "learning_rate": 1.976917445055285e-06, - "loss": 1.0264, - "step": 11292 - }, - { - "epoch": 0.29, - "learning_rate": 1.9769115337965793e-06, - "loss": 0.7861, - "step": 11293 - }, - { - "epoch": 0.29, - "learning_rate": 1.976905621789897e-06, - "loss": 1.1475, - "step": 11294 - }, - { - "epoch": 0.29, - "learning_rate": 1.9768997090352427e-06, - "loss": 0.8281, - "step": 11295 - }, - { - "epoch": 0.29, - "learning_rate": 1.976893795532622e-06, - "loss": 0.9424, - "step": 11296 - }, - { - "epoch": 0.29, - "learning_rate": 1.976887881282038e-06, - "loss": 0.9316, - "step": 11297 - }, - { - "epoch": 0.29, - "learning_rate": 1.976881966283496e-06, - "loss": 0.9443, - "step": 11298 - }, - { - "epoch": 0.29, - "learning_rate": 1.9768760505370005e-06, - "loss": 0.8584, - "step": 11299 - }, - { - "epoch": 0.29, - "learning_rate": 1.9768701340425557e-06, - "loss": 0.7727, - "step": 11300 - }, - { - "epoch": 0.29, - "learning_rate": 1.9768642168001665e-06, - "loss": 0.8691, - "step": 11301 - }, - { - "epoch": 0.29, - "learning_rate": 1.9768582988098374e-06, - "loss": 0.9619, - "step": 11302 - }, - { - "epoch": 0.29, - "learning_rate": 1.9768523800715727e-06, - "loss": 1.0449, - "step": 11303 - }, - { - "epoch": 0.29, - "learning_rate": 1.976846460585377e-06, - "loss": 1.0693, - "step": 11304 - }, - { - "epoch": 0.29, - "learning_rate": 1.9768405403512548e-06, - "loss": 1.083, - "step": 11305 - }, - { - "epoch": 0.29, - "learning_rate": 1.9768346193692113e-06, - "loss": 1.1006, - "step": 11306 - }, - { - "epoch": 0.29, - "learning_rate": 1.9768286976392495e-06, - "loss": 1.1113, - "step": 11307 - }, - { - "epoch": 0.29, - "learning_rate": 1.976822775161376e-06, - "loss": 0.9258, - "step": 11308 - }, - { - "epoch": 0.29, - "learning_rate": 1.9768168519355933e-06, - "loss": 0.8779, - "step": 11309 - }, - { - "epoch": 0.29, - "learning_rate": 1.9768109279619073e-06, - "loss": 0.8545, - "step": 11310 - }, - { - "epoch": 0.29, - "learning_rate": 1.9768050032403218e-06, - "loss": 0.8955, - "step": 11311 - }, - { - "epoch": 0.29, - "learning_rate": 1.9767990777708417e-06, - "loss": 0.7383, - "step": 11312 - }, - { - "epoch": 0.29, - "learning_rate": 1.9767931515534718e-06, - "loss": 0.7651, - "step": 11313 - }, - { - "epoch": 0.29, - "learning_rate": 1.9767872245882158e-06, - "loss": 0.9517, - "step": 11314 - }, - { - "epoch": 0.29, - "learning_rate": 1.976781296875079e-06, - "loss": 0.8564, - "step": 11315 - }, - { - "epoch": 0.29, - "learning_rate": 1.9767753684140656e-06, - "loss": 1.0479, - "step": 11316 - }, - { - "epoch": 0.29, - "learning_rate": 1.9767694392051802e-06, - "loss": 0.7622, - "step": 11317 - }, - { - "epoch": 0.29, - "learning_rate": 1.9767635092484275e-06, - "loss": 0.9033, - "step": 11318 - }, - { - "epoch": 0.29, - "learning_rate": 1.9767575785438116e-06, - "loss": 0.7617, - "step": 11319 - }, - { - "epoch": 0.29, - "learning_rate": 1.9767516470913376e-06, - "loss": 0.8735, - "step": 11320 - }, - { - "epoch": 0.29, - "learning_rate": 1.9767457148910097e-06, - "loss": 0.7563, - "step": 11321 - }, - { - "epoch": 0.29, - "learning_rate": 1.9767397819428326e-06, - "loss": 0.6709, - "step": 11322 - }, - { - "epoch": 0.29, - "learning_rate": 1.9767338482468106e-06, - "loss": 0.9082, - "step": 11323 - }, - { - "epoch": 0.29, - "learning_rate": 1.9767279138029487e-06, - "loss": 1.0625, - "step": 11324 - }, - { - "epoch": 0.29, - "learning_rate": 1.9767219786112507e-06, - "loss": 0.8662, - "step": 11325 - }, - { - "epoch": 0.29, - "learning_rate": 1.976716042671722e-06, - "loss": 0.9062, - "step": 11326 - }, - { - "epoch": 0.29, - "learning_rate": 1.9767101059843664e-06, - "loss": 0.9023, - "step": 11327 - }, - { - "epoch": 0.29, - "learning_rate": 1.976704168549189e-06, - "loss": 0.8496, - "step": 11328 - }, - { - "epoch": 0.29, - "learning_rate": 1.976698230366194e-06, - "loss": 0.917, - "step": 11329 - }, - { - "epoch": 0.29, - "learning_rate": 1.976692291435386e-06, - "loss": 0.8281, - "step": 11330 - }, - { - "epoch": 0.29, - "learning_rate": 1.9766863517567704e-06, - "loss": 0.9463, - "step": 11331 - }, - { - "epoch": 0.29, - "learning_rate": 1.9766804113303503e-06, - "loss": 0.8506, - "step": 11332 - }, - { - "epoch": 0.29, - "learning_rate": 1.9766744701561306e-06, - "loss": 1.0225, - "step": 11333 - }, - { - "epoch": 0.29, - "learning_rate": 1.9766685282341168e-06, - "loss": 1.0244, - "step": 11334 - }, - { - "epoch": 0.29, - "learning_rate": 1.976662585564312e-06, - "loss": 1.0312, - "step": 11335 - }, - { - "epoch": 0.29, - "learning_rate": 1.9766566421467227e-06, - "loss": 0.8965, - "step": 11336 - }, - { - "epoch": 0.29, - "learning_rate": 1.9766506979813515e-06, - "loss": 0.9443, - "step": 11337 - }, - { - "epoch": 0.29, - "learning_rate": 1.976644753068204e-06, - "loss": 1.0068, - "step": 11338 - }, - { - "epoch": 0.29, - "learning_rate": 1.9766388074072845e-06, - "loss": 1.0, - "step": 11339 - }, - { - "epoch": 0.29, - "learning_rate": 1.9766328609985977e-06, - "loss": 0.9141, - "step": 11340 - }, - { - "epoch": 0.29, - "learning_rate": 1.976626913842148e-06, - "loss": 0.7842, - "step": 11341 - }, - { - "epoch": 0.29, - "learning_rate": 1.97662096593794e-06, - "loss": 0.8906, - "step": 11342 - }, - { - "epoch": 0.29, - "learning_rate": 1.976615017285978e-06, - "loss": 0.8838, - "step": 11343 - }, - { - "epoch": 0.29, - "learning_rate": 1.976609067886267e-06, - "loss": 1.0459, - "step": 11344 - }, - { - "epoch": 0.29, - "learning_rate": 1.976603117738811e-06, - "loss": 0.9316, - "step": 11345 - }, - { - "epoch": 0.29, - "learning_rate": 1.976597166843615e-06, - "loss": 0.7778, - "step": 11346 - }, - { - "epoch": 0.29, - "learning_rate": 1.976591215200684e-06, - "loss": 1.0146, - "step": 11347 - }, - { - "epoch": 0.29, - "learning_rate": 1.9765852628100214e-06, - "loss": 0.8613, - "step": 11348 - }, - { - "epoch": 0.29, - "learning_rate": 1.9765793096716324e-06, - "loss": 0.8955, - "step": 11349 - }, - { - "epoch": 0.29, - "learning_rate": 1.976573355785522e-06, - "loss": 0.9561, - "step": 11350 - }, - { - "epoch": 0.29, - "learning_rate": 1.976567401151694e-06, - "loss": 0.9893, - "step": 11351 - }, - { - "epoch": 0.29, - "learning_rate": 1.9765614457701533e-06, - "loss": 0.8877, - "step": 11352 - }, - { - "epoch": 0.29, - "learning_rate": 1.976555489640904e-06, - "loss": 0.8232, - "step": 11353 - }, - { - "epoch": 0.29, - "learning_rate": 1.9765495327639515e-06, - "loss": 0.9287, - "step": 11354 - }, - { - "epoch": 0.29, - "learning_rate": 1.9765435751393e-06, - "loss": 1.0029, - "step": 11355 - }, - { - "epoch": 0.29, - "learning_rate": 1.9765376167669537e-06, - "loss": 1.2188, - "step": 11356 - }, - { - "epoch": 0.29, - "learning_rate": 1.9765316576469176e-06, - "loss": 0.8613, - "step": 11357 - }, - { - "epoch": 0.29, - "learning_rate": 1.976525697779196e-06, - "loss": 0.6992, - "step": 11358 - }, - { - "epoch": 0.29, - "learning_rate": 1.9765197371637937e-06, - "loss": 0.752, - "step": 11359 - }, - { - "epoch": 0.29, - "learning_rate": 1.9765137758007152e-06, - "loss": 0.9492, - "step": 11360 - }, - { - "epoch": 0.29, - "learning_rate": 1.976507813689965e-06, - "loss": 0.8389, - "step": 11361 - }, - { - "epoch": 0.29, - "learning_rate": 1.9765018508315477e-06, - "loss": 0.77, - "step": 11362 - }, - { - "epoch": 0.29, - "learning_rate": 1.9764958872254675e-06, - "loss": 0.8594, - "step": 11363 - }, - { - "epoch": 0.29, - "learning_rate": 1.9764899228717296e-06, - "loss": 1.0508, - "step": 11364 - }, - { - "epoch": 0.29, - "learning_rate": 1.976483957770338e-06, - "loss": 0.7266, - "step": 11365 - }, - { - "epoch": 0.29, - "learning_rate": 1.9764779919212978e-06, - "loss": 1.1133, - "step": 11366 - }, - { - "epoch": 0.29, - "learning_rate": 1.976472025324613e-06, - "loss": 1.1289, - "step": 11367 - }, - { - "epoch": 0.29, - "learning_rate": 1.9764660579802887e-06, - "loss": 0.752, - "step": 11368 - }, - { - "epoch": 0.29, - "learning_rate": 1.9764600898883296e-06, - "loss": 0.9404, - "step": 11369 - }, - { - "epoch": 0.29, - "learning_rate": 1.9764541210487395e-06, - "loss": 1.0215, - "step": 11370 - }, - { - "epoch": 0.29, - "learning_rate": 1.9764481514615234e-06, - "loss": 0.9468, - "step": 11371 - }, - { - "epoch": 0.29, - "learning_rate": 1.9764421811266855e-06, - "loss": 0.8867, - "step": 11372 - }, - { - "epoch": 0.29, - "learning_rate": 1.9764362100442313e-06, - "loss": 0.9395, - "step": 11373 - }, - { - "epoch": 0.29, - "learning_rate": 1.9764302382141643e-06, - "loss": 0.9365, - "step": 11374 - }, - { - "epoch": 0.29, - "learning_rate": 1.97642426563649e-06, - "loss": 0.7734, - "step": 11375 - }, - { - "epoch": 0.29, - "learning_rate": 1.9764182923112123e-06, - "loss": 0.7246, - "step": 11376 - }, - { - "epoch": 0.29, - "learning_rate": 1.9764123182383363e-06, - "loss": 0.9023, - "step": 11377 - }, - { - "epoch": 0.29, - "learning_rate": 1.976406343417866e-06, - "loss": 1.0352, - "step": 11378 - }, - { - "epoch": 0.29, - "learning_rate": 1.976400367849806e-06, - "loss": 0.874, - "step": 11379 - }, - { - "epoch": 0.29, - "learning_rate": 1.9763943915341618e-06, - "loss": 1.0059, - "step": 11380 - }, - { - "epoch": 0.29, - "learning_rate": 1.9763884144709367e-06, - "loss": 0.666, - "step": 11381 - }, - { - "epoch": 0.29, - "learning_rate": 1.9763824366601365e-06, - "loss": 0.7412, - "step": 11382 - }, - { - "epoch": 0.29, - "learning_rate": 1.9763764581017644e-06, - "loss": 1.0444, - "step": 11383 - }, - { - "epoch": 0.29, - "learning_rate": 1.9763704787958265e-06, - "loss": 1.1289, - "step": 11384 - }, - { - "epoch": 0.29, - "learning_rate": 1.976364498742326e-06, - "loss": 0.7964, - "step": 11385 - }, - { - "epoch": 0.29, - "learning_rate": 1.9763585179412683e-06, - "loss": 0.7363, - "step": 11386 - }, - { - "epoch": 0.29, - "learning_rate": 1.9763525363926582e-06, - "loss": 0.916, - "step": 11387 - }, - { - "epoch": 0.29, - "learning_rate": 1.9763465540964992e-06, - "loss": 0.9971, - "step": 11388 - }, - { - "epoch": 0.29, - "learning_rate": 1.9763405710527968e-06, - "loss": 0.7627, - "step": 11389 - }, - { - "epoch": 0.29, - "learning_rate": 1.9763345872615555e-06, - "loss": 1.0381, - "step": 11390 - }, - { - "epoch": 0.29, - "learning_rate": 1.97632860272278e-06, - "loss": 0.9844, - "step": 11391 - }, - { - "epoch": 0.29, - "learning_rate": 1.9763226174364738e-06, - "loss": 0.7385, - "step": 11392 - }, - { - "epoch": 0.29, - "learning_rate": 1.9763166314026425e-06, - "loss": 0.9023, - "step": 11393 - }, - { - "epoch": 0.29, - "learning_rate": 1.9763106446212907e-06, - "loss": 0.835, - "step": 11394 - }, - { - "epoch": 0.29, - "learning_rate": 1.9763046570924226e-06, - "loss": 1.0049, - "step": 11395 - }, - { - "epoch": 0.29, - "learning_rate": 1.976298668816043e-06, - "loss": 0.8867, - "step": 11396 - }, - { - "epoch": 0.29, - "learning_rate": 1.976292679792156e-06, - "loss": 0.9531, - "step": 11397 - }, - { - "epoch": 0.29, - "learning_rate": 1.976286690020767e-06, - "loss": 1.0273, - "step": 11398 - }, - { - "epoch": 0.29, - "learning_rate": 1.9762806995018797e-06, - "loss": 1.0352, - "step": 11399 - }, - { - "epoch": 0.29, - "learning_rate": 1.9762747082355e-06, - "loss": 1.0156, - "step": 11400 - }, - { - "epoch": 0.29, - "learning_rate": 1.976268716221631e-06, - "loss": 1.083, - "step": 11401 - }, - { - "epoch": 0.29, - "learning_rate": 1.976262723460278e-06, - "loss": 0.8965, - "step": 11402 - }, - { - "epoch": 0.29, - "learning_rate": 1.9762567299514455e-06, - "loss": 0.7744, - "step": 11403 - }, - { - "epoch": 0.29, - "learning_rate": 1.9762507356951385e-06, - "loss": 1.0234, - "step": 11404 - }, - { - "epoch": 0.29, - "learning_rate": 1.976244740691361e-06, - "loss": 0.8232, - "step": 11405 - }, - { - "epoch": 0.29, - "learning_rate": 1.976238744940118e-06, - "loss": 0.8984, - "step": 11406 - }, - { - "epoch": 0.29, - "learning_rate": 1.976232748441413e-06, - "loss": 1.0684, - "step": 11407 - }, - { - "epoch": 0.29, - "learning_rate": 1.9762267511952525e-06, - "loss": 0.7146, - "step": 11408 - }, - { - "epoch": 0.29, - "learning_rate": 1.9762207532016396e-06, - "loss": 0.8311, - "step": 11409 - }, - { - "epoch": 0.29, - "learning_rate": 1.9762147544605794e-06, - "loss": 1.1826, - "step": 11410 - }, - { - "epoch": 0.29, - "learning_rate": 1.976208754972076e-06, - "loss": 0.7529, - "step": 11411 - }, - { - "epoch": 0.29, - "learning_rate": 1.976202754736135e-06, - "loss": 1.0527, - "step": 11412 - }, - { - "epoch": 0.29, - "learning_rate": 1.9761967537527605e-06, - "loss": 0.8682, - "step": 11413 - }, - { - "epoch": 0.29, - "learning_rate": 1.976190752021957e-06, - "loss": 0.9482, - "step": 11414 - }, - { - "epoch": 0.29, - "learning_rate": 1.976184749543729e-06, - "loss": 0.7686, - "step": 11415 - }, - { - "epoch": 0.29, - "learning_rate": 1.976178746318081e-06, - "loss": 0.875, - "step": 11416 - }, - { - "epoch": 0.29, - "learning_rate": 1.9761727423450184e-06, - "loss": 0.8799, - "step": 11417 - }, - { - "epoch": 0.29, - "learning_rate": 1.9761667376245447e-06, - "loss": 1.0215, - "step": 11418 - }, - { - "epoch": 0.29, - "learning_rate": 1.976160732156665e-06, - "loss": 0.9746, - "step": 11419 - }, - { - "epoch": 0.29, - "learning_rate": 1.976154725941384e-06, - "loss": 0.999, - "step": 11420 - }, - { - "epoch": 0.29, - "learning_rate": 1.9761487189787067e-06, - "loss": 0.9336, - "step": 11421 - }, - { - "epoch": 0.29, - "learning_rate": 1.9761427112686366e-06, - "loss": 0.8423, - "step": 11422 - }, - { - "epoch": 0.29, - "learning_rate": 1.976136702811179e-06, - "loss": 0.9678, - "step": 11423 - }, - { - "epoch": 0.29, - "learning_rate": 1.9761306936063382e-06, - "loss": 1.0361, - "step": 11424 - }, - { - "epoch": 0.29, - "learning_rate": 1.97612468365412e-06, - "loss": 0.8604, - "step": 11425 - }, - { - "epoch": 0.29, - "learning_rate": 1.9761186729545273e-06, - "loss": 1.0068, - "step": 11426 - }, - { - "epoch": 0.29, - "learning_rate": 1.976112661507565e-06, - "loss": 0.9385, - "step": 11427 - }, - { - "epoch": 0.29, - "learning_rate": 1.9761066493132386e-06, - "loss": 0.876, - "step": 11428 - }, - { - "epoch": 0.29, - "learning_rate": 1.9761006363715525e-06, - "loss": 1.0303, - "step": 11429 - }, - { - "epoch": 0.29, - "learning_rate": 1.9760946226825106e-06, - "loss": 1.1357, - "step": 11430 - }, - { - "epoch": 0.29, - "learning_rate": 1.976088608246118e-06, - "loss": 0.8711, - "step": 11431 - }, - { - "epoch": 0.29, - "learning_rate": 1.9760825930623796e-06, - "loss": 0.6274, - "step": 11432 - }, - { - "epoch": 0.29, - "learning_rate": 1.976076577131299e-06, - "loss": 0.7412, - "step": 11433 - }, - { - "epoch": 0.29, - "learning_rate": 1.9760705604528818e-06, - "loss": 0.8232, - "step": 11434 - }, - { - "epoch": 0.29, - "learning_rate": 1.9760645430271324e-06, - "loss": 0.8936, - "step": 11435 - }, - { - "epoch": 0.29, - "learning_rate": 1.9760585248540548e-06, - "loss": 1.1602, - "step": 11436 - }, - { - "epoch": 0.29, - "learning_rate": 1.9760525059336548e-06, - "loss": 0.917, - "step": 11437 - }, - { - "epoch": 0.29, - "learning_rate": 1.976046486265936e-06, - "loss": 0.6792, - "step": 11438 - }, - { - "epoch": 0.29, - "learning_rate": 1.9760404658509026e-06, - "loss": 0.7144, - "step": 11439 - }, - { - "epoch": 0.29, - "learning_rate": 1.9760344446885605e-06, - "loss": 0.7168, - "step": 11440 - }, - { - "epoch": 0.29, - "learning_rate": 1.9760284227789135e-06, - "loss": 0.7754, - "step": 11441 - }, - { - "epoch": 0.29, - "learning_rate": 1.9760224001219666e-06, - "loss": 0.834, - "step": 11442 - }, - { - "epoch": 0.29, - "learning_rate": 1.976016376717724e-06, - "loss": 1.0166, - "step": 11443 - }, - { - "epoch": 0.29, - "learning_rate": 1.9760103525661908e-06, - "loss": 1.2617, - "step": 11444 - }, - { - "epoch": 0.29, - "learning_rate": 1.9760043276673713e-06, - "loss": 0.8994, - "step": 11445 - }, - { - "epoch": 0.29, - "learning_rate": 1.9759983020212705e-06, - "loss": 1.0693, - "step": 11446 - }, - { - "epoch": 0.29, - "learning_rate": 1.975992275627892e-06, - "loss": 1.1963, - "step": 11447 - }, - { - "epoch": 0.29, - "learning_rate": 1.975986248487241e-06, - "loss": 0.958, - "step": 11448 - }, - { - "epoch": 0.29, - "learning_rate": 1.975980220599323e-06, - "loss": 0.9189, - "step": 11449 - }, - { - "epoch": 0.29, - "learning_rate": 1.9759741919641415e-06, - "loss": 0.9629, - "step": 11450 - }, - { - "epoch": 0.29, - "learning_rate": 1.9759681625817013e-06, - "loss": 0.9346, - "step": 11451 - }, - { - "epoch": 0.29, - "learning_rate": 1.975962132452007e-06, - "loss": 0.5938, - "step": 11452 - }, - { - "epoch": 0.29, - "learning_rate": 1.9759561015750635e-06, - "loss": 0.9756, - "step": 11453 - }, - { - "epoch": 0.29, - "learning_rate": 1.9759500699508756e-06, - "loss": 1.1289, - "step": 11454 - }, - { - "epoch": 0.29, - "learning_rate": 1.975944037579447e-06, - "loss": 0.7905, - "step": 11455 - }, - { - "epoch": 0.29, - "learning_rate": 1.9759380044607836e-06, - "loss": 0.9297, - "step": 11456 - }, - { - "epoch": 0.29, - "learning_rate": 1.9759319705948887e-06, - "loss": 0.8032, - "step": 11457 - }, - { - "epoch": 0.29, - "learning_rate": 1.975925935981768e-06, - "loss": 1.0986, - "step": 11458 - }, - { - "epoch": 0.29, - "learning_rate": 1.975919900621426e-06, - "loss": 0.8848, - "step": 11459 - }, - { - "epoch": 0.29, - "learning_rate": 1.9759138645138664e-06, - "loss": 0.665, - "step": 11460 - }, - { - "epoch": 0.29, - "learning_rate": 1.9759078276590947e-06, - "loss": 0.9922, - "step": 11461 - }, - { - "epoch": 0.29, - "learning_rate": 1.975901790057115e-06, - "loss": 0.9697, - "step": 11462 - }, - { - "epoch": 0.29, - "learning_rate": 1.9758957517079323e-06, - "loss": 0.9248, - "step": 11463 - }, - { - "epoch": 0.29, - "learning_rate": 1.9758897126115514e-06, - "loss": 0.7427, - "step": 11464 - }, - { - "epoch": 0.29, - "learning_rate": 1.9758836727679765e-06, - "loss": 0.9697, - "step": 11465 - }, - { - "epoch": 0.29, - "learning_rate": 1.9758776321772118e-06, - "loss": 0.6082, - "step": 11466 - }, - { - "epoch": 0.29, - "learning_rate": 1.9758715908392628e-06, - "loss": 1.0557, - "step": 11467 - }, - { - "epoch": 0.29, - "learning_rate": 1.975865548754134e-06, - "loss": 0.9502, - "step": 11468 - }, - { - "epoch": 0.29, - "learning_rate": 1.9758595059218297e-06, - "loss": 0.9014, - "step": 11469 - }, - { - "epoch": 0.29, - "learning_rate": 1.975853462342355e-06, - "loss": 0.875, - "step": 11470 - }, - { - "epoch": 0.29, - "learning_rate": 1.9758474180157134e-06, - "loss": 1.0547, - "step": 11471 - }, - { - "epoch": 0.29, - "learning_rate": 1.975841372941911e-06, - "loss": 0.832, - "step": 11472 - }, - { - "epoch": 0.29, - "learning_rate": 1.975835327120951e-06, - "loss": 0.79, - "step": 11473 - }, - { - "epoch": 0.29, - "learning_rate": 1.9758292805528395e-06, - "loss": 0.8037, - "step": 11474 - }, - { - "epoch": 0.29, - "learning_rate": 1.97582323323758e-06, - "loss": 1.0312, - "step": 11475 - }, - { - "epoch": 0.29, - "learning_rate": 1.9758171851751776e-06, - "loss": 0.7975, - "step": 11476 - }, - { - "epoch": 0.29, - "learning_rate": 1.975811136365637e-06, - "loss": 1.0723, - "step": 11477 - }, - { - "epoch": 0.29, - "learning_rate": 1.9758050868089624e-06, - "loss": 0.8486, - "step": 11478 - }, - { - "epoch": 0.29, - "learning_rate": 1.975799036505159e-06, - "loss": 0.8584, - "step": 11479 - }, - { - "epoch": 0.29, - "learning_rate": 1.975792985454231e-06, - "loss": 0.7942, - "step": 11480 - }, - { - "epoch": 0.29, - "learning_rate": 1.975786933656183e-06, - "loss": 0.7246, - "step": 11481 - }, - { - "epoch": 0.29, - "learning_rate": 1.97578088111102e-06, - "loss": 1.0176, - "step": 11482 - }, - { - "epoch": 0.29, - "learning_rate": 1.9757748278187468e-06, - "loss": 0.8667, - "step": 11483 - }, - { - "epoch": 0.29, - "learning_rate": 1.975768773779367e-06, - "loss": 1.0898, - "step": 11484 - }, - { - "epoch": 0.29, - "learning_rate": 1.9757627189928864e-06, - "loss": 0.9189, - "step": 11485 - }, - { - "epoch": 0.29, - "learning_rate": 1.975756663459309e-06, - "loss": 1.0527, - "step": 11486 - }, - { - "epoch": 0.29, - "learning_rate": 1.9757506071786395e-06, - "loss": 0.8486, - "step": 11487 - }, - { - "epoch": 0.29, - "learning_rate": 1.975744550150883e-06, - "loss": 1.0742, - "step": 11488 - }, - { - "epoch": 0.29, - "learning_rate": 1.975738492376043e-06, - "loss": 1.1816, - "step": 11489 - }, - { - "epoch": 0.29, - "learning_rate": 1.975732433854126e-06, - "loss": 1.0879, - "step": 11490 - }, - { - "epoch": 0.29, - "learning_rate": 1.9757263745851348e-06, - "loss": 0.9482, - "step": 11491 - }, - { - "epoch": 0.29, - "learning_rate": 1.9757203145690746e-06, - "loss": 1.0088, - "step": 11492 - }, - { - "epoch": 0.29, - "learning_rate": 1.9757142538059505e-06, - "loss": 1.0264, - "step": 11493 - }, - { - "epoch": 0.29, - "learning_rate": 1.975708192295767e-06, - "loss": 0.8384, - "step": 11494 - }, - { - "epoch": 0.29, - "learning_rate": 1.9757021300385284e-06, - "loss": 0.9268, - "step": 11495 - }, - { - "epoch": 0.29, - "learning_rate": 1.9756960670342394e-06, - "loss": 0.7544, - "step": 11496 - }, - { - "epoch": 0.29, - "learning_rate": 1.975690003282905e-06, - "loss": 1.0713, - "step": 11497 - }, - { - "epoch": 0.29, - "learning_rate": 1.97568393878453e-06, - "loss": 0.9453, - "step": 11498 - }, - { - "epoch": 0.29, - "learning_rate": 1.9756778735391183e-06, - "loss": 0.9414, - "step": 11499 - }, - { - "epoch": 0.29, - "learning_rate": 1.975671807546675e-06, - "loss": 0.8081, - "step": 11500 - }, - { - "epoch": 0.29, - "learning_rate": 1.9756657408072044e-06, - "loss": 0.8271, - "step": 11501 - }, - { - "epoch": 0.29, - "learning_rate": 1.975659673320712e-06, - "loss": 1.0303, - "step": 11502 - }, - { - "epoch": 0.29, - "learning_rate": 1.975653605087201e-06, - "loss": 0.6865, - "step": 11503 - }, - { - "epoch": 0.29, - "learning_rate": 1.9756475361066777e-06, - "loss": 0.9971, - "step": 11504 - }, - { - "epoch": 0.29, - "learning_rate": 1.9756414663791456e-06, - "loss": 0.9167, - "step": 11505 - }, - { - "epoch": 0.29, - "learning_rate": 1.9756353959046095e-06, - "loss": 0.8486, - "step": 11506 - }, - { - "epoch": 0.29, - "learning_rate": 1.9756293246830743e-06, - "loss": 0.7622, - "step": 11507 - }, - { - "epoch": 0.29, - "learning_rate": 1.9756232527145445e-06, - "loss": 0.8125, - "step": 11508 - }, - { - "epoch": 0.29, - "learning_rate": 1.975617179999025e-06, - "loss": 0.7146, - "step": 11509 - }, - { - "epoch": 0.3, - "learning_rate": 1.9756111065365204e-06, - "loss": 0.7915, - "step": 11510 - }, - { - "epoch": 0.3, - "learning_rate": 1.9756050323270354e-06, - "loss": 0.7783, - "step": 11511 - }, - { - "epoch": 0.3, - "learning_rate": 1.975598957370574e-06, - "loss": 0.8013, - "step": 11512 - }, - { - "epoch": 0.3, - "learning_rate": 1.9755928816671415e-06, - "loss": 0.9033, - "step": 11513 - }, - { - "epoch": 0.3, - "learning_rate": 1.9755868052167427e-06, - "loss": 0.6582, - "step": 11514 - }, - { - "epoch": 0.3, - "learning_rate": 1.9755807280193815e-06, - "loss": 1.0459, - "step": 11515 - }, - { - "epoch": 0.3, - "learning_rate": 1.9755746500750636e-06, - "loss": 0.8237, - "step": 11516 - }, - { - "epoch": 0.3, - "learning_rate": 1.9755685713837925e-06, - "loss": 0.9297, - "step": 11517 - }, - { - "epoch": 0.3, - "learning_rate": 1.9755624919455736e-06, - "loss": 0.7891, - "step": 11518 - }, - { - "epoch": 0.3, - "learning_rate": 1.9755564117604113e-06, - "loss": 0.8447, - "step": 11519 - }, - { - "epoch": 0.3, - "learning_rate": 1.97555033082831e-06, - "loss": 0.9795, - "step": 11520 - }, - { - "epoch": 0.3, - "learning_rate": 1.975544249149275e-06, - "loss": 0.8652, - "step": 11521 - }, - { - "epoch": 0.3, - "learning_rate": 1.975538166723311e-06, - "loss": 0.832, - "step": 11522 - }, - { - "epoch": 0.3, - "learning_rate": 1.9755320835504215e-06, - "loss": 1.0635, - "step": 11523 - }, - { - "epoch": 0.3, - "learning_rate": 1.9755259996306126e-06, - "loss": 0.7441, - "step": 11524 - }, - { - "epoch": 0.3, - "learning_rate": 1.975519914963888e-06, - "loss": 0.959, - "step": 11525 - }, - { - "epoch": 0.3, - "learning_rate": 1.9755138295502526e-06, - "loss": 0.8022, - "step": 11526 - }, - { - "epoch": 0.3, - "learning_rate": 1.975507743389711e-06, - "loss": 1.0234, - "step": 11527 - }, - { - "epoch": 0.3, - "learning_rate": 1.9755016564822684e-06, - "loss": 0.8252, - "step": 11528 - }, - { - "epoch": 0.3, - "learning_rate": 1.9754955688279285e-06, - "loss": 1.1387, - "step": 11529 - }, - { - "epoch": 0.3, - "learning_rate": 1.975489480426697e-06, - "loss": 0.9033, - "step": 11530 - }, - { - "epoch": 0.3, - "learning_rate": 1.975483391278578e-06, - "loss": 0.9326, - "step": 11531 - }, - { - "epoch": 0.3, - "learning_rate": 1.975477301383576e-06, - "loss": 0.9277, - "step": 11532 - }, - { - "epoch": 0.3, - "learning_rate": 1.9754712107416963e-06, - "loss": 1.0195, - "step": 11533 - }, - { - "epoch": 0.3, - "learning_rate": 1.9754651193529427e-06, - "loss": 0.96, - "step": 11534 - }, - { - "epoch": 0.3, - "learning_rate": 1.9754590272173204e-06, - "loss": 1.0615, - "step": 11535 - }, - { - "epoch": 0.3, - "learning_rate": 1.975452934334834e-06, - "loss": 0.8013, - "step": 11536 - }, - { - "epoch": 0.3, - "learning_rate": 1.975446840705488e-06, - "loss": 0.708, - "step": 11537 - }, - { - "epoch": 0.3, - "learning_rate": 1.9754407463292874e-06, - "loss": 0.9844, - "step": 11538 - }, - { - "epoch": 0.3, - "learning_rate": 1.9754346512062366e-06, - "loss": 0.8135, - "step": 11539 - }, - { - "epoch": 0.3, - "learning_rate": 1.9754285553363404e-06, - "loss": 1.0713, - "step": 11540 - }, - { - "epoch": 0.3, - "learning_rate": 1.9754224587196037e-06, - "loss": 0.9092, - "step": 11541 - }, - { - "epoch": 0.3, - "learning_rate": 1.9754163613560305e-06, - "loss": 1.001, - "step": 11542 - }, - { - "epoch": 0.3, - "learning_rate": 1.975410263245626e-06, - "loss": 0.9541, - "step": 11543 - }, - { - "epoch": 0.3, - "learning_rate": 1.9754041643883943e-06, - "loss": 0.8047, - "step": 11544 - }, - { - "epoch": 0.3, - "learning_rate": 1.975398064784341e-06, - "loss": 0.7129, - "step": 11545 - }, - { - "epoch": 0.3, - "learning_rate": 1.97539196443347e-06, - "loss": 0.8086, - "step": 11546 - }, - { - "epoch": 0.3, - "learning_rate": 1.975385863335786e-06, - "loss": 0.7983, - "step": 11547 - }, - { - "epoch": 0.3, - "learning_rate": 1.9753797614912943e-06, - "loss": 1.0391, - "step": 11548 - }, - { - "epoch": 0.3, - "learning_rate": 1.9753736588999993e-06, - "loss": 0.957, - "step": 11549 - }, - { - "epoch": 0.3, - "learning_rate": 1.975367555561905e-06, - "loss": 0.7744, - "step": 11550 - }, - { - "epoch": 0.3, - "learning_rate": 1.975361451477017e-06, - "loss": 0.7168, - "step": 11551 - }, - { - "epoch": 0.3, - "learning_rate": 1.9753553466453393e-06, - "loss": 0.8818, - "step": 11552 - }, - { - "epoch": 0.3, - "learning_rate": 1.9753492410668772e-06, - "loss": 1.2031, - "step": 11553 - }, - { - "epoch": 0.3, - "learning_rate": 1.975343134741635e-06, - "loss": 1.0469, - "step": 11554 - }, - { - "epoch": 0.3, - "learning_rate": 1.975337027669617e-06, - "loss": 0.7178, - "step": 11555 - }, - { - "epoch": 0.3, - "learning_rate": 1.9753309198508285e-06, - "loss": 0.793, - "step": 11556 - }, - { - "epoch": 0.3, - "learning_rate": 1.975324811285274e-06, - "loss": 0.7727, - "step": 11557 - }, - { - "epoch": 0.3, - "learning_rate": 1.9753187019729583e-06, - "loss": 0.7705, - "step": 11558 - }, - { - "epoch": 0.3, - "learning_rate": 1.9753125919138854e-06, - "loss": 0.8364, - "step": 11559 - }, - { - "epoch": 0.3, - "learning_rate": 1.975306481108061e-06, - "loss": 0.8643, - "step": 11560 - }, - { - "epoch": 0.3, - "learning_rate": 1.975300369555489e-06, - "loss": 0.8279, - "step": 11561 - }, - { - "epoch": 0.3, - "learning_rate": 1.9752942572561747e-06, - "loss": 0.9404, - "step": 11562 - }, - { - "epoch": 0.3, - "learning_rate": 1.9752881442101223e-06, - "loss": 1.0732, - "step": 11563 - }, - { - "epoch": 0.3, - "learning_rate": 1.9752820304173367e-06, - "loss": 0.9395, - "step": 11564 - }, - { - "epoch": 0.3, - "learning_rate": 1.975275915877822e-06, - "loss": 0.8506, - "step": 11565 - }, - { - "epoch": 0.3, - "learning_rate": 1.9752698005915836e-06, - "loss": 1.1201, - "step": 11566 - }, - { - "epoch": 0.3, - "learning_rate": 1.9752636845586262e-06, - "loss": 1.0283, - "step": 11567 - }, - { - "epoch": 0.3, - "learning_rate": 1.975257567778954e-06, - "loss": 0.9199, - "step": 11568 - }, - { - "epoch": 0.3, - "learning_rate": 1.975251450252572e-06, - "loss": 0.9375, - "step": 11569 - }, - { - "epoch": 0.3, - "learning_rate": 1.9752453319794847e-06, - "loss": 0.9893, - "step": 11570 - }, - { - "epoch": 0.3, - "learning_rate": 1.9752392129596973e-06, - "loss": 0.8088, - "step": 11571 - }, - { - "epoch": 0.3, - "learning_rate": 1.9752330931932135e-06, - "loss": 0.9619, - "step": 11572 - }, - { - "epoch": 0.3, - "learning_rate": 1.9752269726800393e-06, - "loss": 0.9775, - "step": 11573 - }, - { - "epoch": 0.3, - "learning_rate": 1.975220851420178e-06, - "loss": 0.9717, - "step": 11574 - }, - { - "epoch": 0.3, - "learning_rate": 1.975214729413635e-06, - "loss": 0.8457, - "step": 11575 - }, - { - "epoch": 0.3, - "learning_rate": 1.9752086066604153e-06, - "loss": 0.9648, - "step": 11576 - }, - { - "epoch": 0.3, - "learning_rate": 1.975202483160523e-06, - "loss": 0.9893, - "step": 11577 - }, - { - "epoch": 0.3, - "learning_rate": 1.975196358913963e-06, - "loss": 0.9053, - "step": 11578 - }, - { - "epoch": 0.3, - "learning_rate": 1.97519023392074e-06, - "loss": 0.7979, - "step": 11579 - }, - { - "epoch": 0.3, - "learning_rate": 1.9751841081808586e-06, - "loss": 0.9243, - "step": 11580 - }, - { - "epoch": 0.3, - "learning_rate": 1.9751779816943233e-06, - "loss": 0.9834, - "step": 11581 - }, - { - "epoch": 0.3, - "learning_rate": 1.9751718544611395e-06, - "loss": 1.0938, - "step": 11582 - }, - { - "epoch": 0.3, - "learning_rate": 1.9751657264813114e-06, - "loss": 0.9736, - "step": 11583 - }, - { - "epoch": 0.3, - "learning_rate": 1.975159597754844e-06, - "loss": 0.958, - "step": 11584 - }, - { - "epoch": 0.3, - "learning_rate": 1.975153468281741e-06, - "loss": 0.8154, - "step": 11585 - }, - { - "epoch": 0.3, - "learning_rate": 1.9751473380620082e-06, - "loss": 1.0645, - "step": 11586 - }, - { - "epoch": 0.3, - "learning_rate": 1.97514120709565e-06, - "loss": 0.96, - "step": 11587 - }, - { - "epoch": 0.3, - "learning_rate": 1.975135075382671e-06, - "loss": 0.8027, - "step": 11588 - }, - { - "epoch": 0.3, - "learning_rate": 1.975128942923076e-06, - "loss": 0.8525, - "step": 11589 - }, - { - "epoch": 0.3, - "learning_rate": 1.9751228097168694e-06, - "loss": 0.9541, - "step": 11590 - }, - { - "epoch": 0.3, - "learning_rate": 1.9751166757640563e-06, - "loss": 0.7722, - "step": 11591 - }, - { - "epoch": 0.3, - "learning_rate": 1.975110541064641e-06, - "loss": 1.1426, - "step": 11592 - }, - { - "epoch": 0.3, - "learning_rate": 1.9751044056186285e-06, - "loss": 0.875, - "step": 11593 - }, - { - "epoch": 0.3, - "learning_rate": 1.9750982694260236e-06, - "loss": 0.9199, - "step": 11594 - }, - { - "epoch": 0.3, - "learning_rate": 1.9750921324868303e-06, - "loss": 0.8613, - "step": 11595 - }, - { - "epoch": 0.3, - "learning_rate": 1.975085994801054e-06, - "loss": 0.6284, - "step": 11596 - }, - { - "epoch": 0.3, - "learning_rate": 1.9750798563686996e-06, - "loss": 0.9277, - "step": 11597 - }, - { - "epoch": 0.3, - "learning_rate": 1.9750737171897707e-06, - "loss": 0.9697, - "step": 11598 - }, - { - "epoch": 0.3, - "learning_rate": 1.9750675772642734e-06, - "loss": 0.9785, - "step": 11599 - }, - { - "epoch": 0.3, - "learning_rate": 1.975061436592211e-06, - "loss": 0.9961, - "step": 11600 - }, - { - "epoch": 0.3, - "learning_rate": 1.9750552951735893e-06, - "loss": 0.5579, - "step": 11601 - }, - { - "epoch": 0.3, - "learning_rate": 1.9750491530084124e-06, - "loss": 0.9951, - "step": 11602 - }, - { - "epoch": 0.3, - "learning_rate": 1.9750430100966855e-06, - "loss": 1.0137, - "step": 11603 - }, - { - "epoch": 0.3, - "learning_rate": 1.9750368664384127e-06, - "loss": 0.9873, - "step": 11604 - }, - { - "epoch": 0.3, - "learning_rate": 1.9750307220335993e-06, - "loss": 1.043, - "step": 11605 - }, - { - "epoch": 0.3, - "learning_rate": 1.975024576882249e-06, - "loss": 0.8877, - "step": 11606 - }, - { - "epoch": 0.3, - "learning_rate": 1.975018430984368e-06, - "loss": 0.8008, - "step": 11607 - }, - { - "epoch": 0.3, - "learning_rate": 1.97501228433996e-06, - "loss": 0.9458, - "step": 11608 - }, - { - "epoch": 0.3, - "learning_rate": 1.9750061369490297e-06, - "loss": 0.6963, - "step": 11609 - }, - { - "epoch": 0.3, - "learning_rate": 1.974999988811582e-06, - "loss": 0.8398, - "step": 11610 - }, - { - "epoch": 0.3, - "learning_rate": 1.974993839927622e-06, - "loss": 0.5505, - "step": 11611 - }, - { - "epoch": 0.3, - "learning_rate": 1.974987690297154e-06, - "loss": 0.9043, - "step": 11612 - }, - { - "epoch": 0.3, - "learning_rate": 1.974981539920183e-06, - "loss": 0.6816, - "step": 11613 - }, - { - "epoch": 0.3, - "learning_rate": 1.974975388796713e-06, - "loss": 1.0049, - "step": 11614 - }, - { - "epoch": 0.3, - "learning_rate": 1.9749692369267493e-06, - "loss": 0.8418, - "step": 11615 - }, - { - "epoch": 0.3, - "learning_rate": 1.974963084310296e-06, - "loss": 0.833, - "step": 11616 - }, - { - "epoch": 0.3, - "learning_rate": 1.9749569309473593e-06, - "loss": 0.7441, - "step": 11617 - }, - { - "epoch": 0.3, - "learning_rate": 1.974950776837942e-06, - "loss": 0.7334, - "step": 11618 - }, - { - "epoch": 0.3, - "learning_rate": 1.9749446219820503e-06, - "loss": 0.7114, - "step": 11619 - }, - { - "epoch": 0.3, - "learning_rate": 1.9749384663796884e-06, - "loss": 1.041, - "step": 11620 - }, - { - "epoch": 0.3, - "learning_rate": 1.9749323100308604e-06, - "loss": 0.7979, - "step": 11621 - }, - { - "epoch": 0.3, - "learning_rate": 1.974926152935572e-06, - "loss": 1.0625, - "step": 11622 - }, - { - "epoch": 0.3, - "learning_rate": 1.9749199950938273e-06, - "loss": 0.8711, - "step": 11623 - }, - { - "epoch": 0.3, - "learning_rate": 1.9749138365056314e-06, - "loss": 0.8145, - "step": 11624 - }, - { - "epoch": 0.3, - "learning_rate": 1.974907677170988e-06, - "loss": 1.0781, - "step": 11625 - }, - { - "epoch": 0.3, - "learning_rate": 1.9749015170899035e-06, - "loss": 0.8613, - "step": 11626 - }, - { - "epoch": 0.3, - "learning_rate": 1.974895356262381e-06, - "loss": 0.7827, - "step": 11627 - }, - { - "epoch": 0.3, - "learning_rate": 1.9748891946884268e-06, - "loss": 0.9727, - "step": 11628 - }, - { - "epoch": 0.3, - "learning_rate": 1.9748830323680445e-06, - "loss": 0.9795, - "step": 11629 - }, - { - "epoch": 0.3, - "learning_rate": 1.974876869301239e-06, - "loss": 0.9297, - "step": 11630 - }, - { - "epoch": 0.3, - "learning_rate": 1.9748707054880154e-06, - "loss": 0.9395, - "step": 11631 - }, - { - "epoch": 0.3, - "learning_rate": 1.9748645409283774e-06, - "loss": 0.9941, - "step": 11632 - }, - { - "epoch": 0.3, - "learning_rate": 1.9748583756223306e-06, - "loss": 0.5496, - "step": 11633 - }, - { - "epoch": 0.3, - "learning_rate": 1.97485220956988e-06, - "loss": 1.0146, - "step": 11634 - }, - { - "epoch": 0.3, - "learning_rate": 1.9748460427710296e-06, - "loss": 0.8613, - "step": 11635 - }, - { - "epoch": 0.3, - "learning_rate": 1.9748398752257847e-06, - "loss": 0.9219, - "step": 11636 - }, - { - "epoch": 0.3, - "learning_rate": 1.9748337069341497e-06, - "loss": 0.8228, - "step": 11637 - }, - { - "epoch": 0.3, - "learning_rate": 1.974827537896129e-06, - "loss": 0.9707, - "step": 11638 - }, - { - "epoch": 0.3, - "learning_rate": 1.974821368111728e-06, - "loss": 0.5952, - "step": 11639 - }, - { - "epoch": 0.3, - "learning_rate": 1.974815197580951e-06, - "loss": 0.8828, - "step": 11640 - }, - { - "epoch": 0.3, - "learning_rate": 1.974809026303803e-06, - "loss": 1.0723, - "step": 11641 - }, - { - "epoch": 0.3, - "learning_rate": 1.974802854280288e-06, - "loss": 0.9326, - "step": 11642 - }, - { - "epoch": 0.3, - "learning_rate": 1.9747966815104117e-06, - "loss": 0.7422, - "step": 11643 - }, - { - "epoch": 0.3, - "learning_rate": 1.9747905079941783e-06, - "loss": 0.9346, - "step": 11644 - }, - { - "epoch": 0.3, - "learning_rate": 1.9747843337315925e-06, - "loss": 0.8945, - "step": 11645 - }, - { - "epoch": 0.3, - "learning_rate": 1.9747781587226596e-06, - "loss": 0.7686, - "step": 11646 - }, - { - "epoch": 0.3, - "learning_rate": 1.9747719829673836e-06, - "loss": 1.0225, - "step": 11647 - }, - { - "epoch": 0.3, - "learning_rate": 1.9747658064657694e-06, - "loss": 0.7275, - "step": 11648 - }, - { - "epoch": 0.3, - "learning_rate": 1.974759629217822e-06, - "loss": 0.6787, - "step": 11649 - }, - { - "epoch": 0.3, - "learning_rate": 1.974753451223546e-06, - "loss": 0.8945, - "step": 11650 - }, - { - "epoch": 0.3, - "learning_rate": 1.9747472724829463e-06, - "loss": 0.8281, - "step": 11651 - }, - { - "epoch": 0.3, - "learning_rate": 1.9747410929960268e-06, - "loss": 0.6997, - "step": 11652 - }, - { - "epoch": 0.3, - "learning_rate": 1.9747349127627933e-06, - "loss": 1.1699, - "step": 11653 - }, - { - "epoch": 0.3, - "learning_rate": 1.97472873178325e-06, - "loss": 0.8994, - "step": 11654 - }, - { - "epoch": 0.3, - "learning_rate": 1.974722550057402e-06, - "loss": 0.8242, - "step": 11655 - }, - { - "epoch": 0.3, - "learning_rate": 1.9747163675852533e-06, - "loss": 1.0117, - "step": 11656 - }, - { - "epoch": 0.3, - "learning_rate": 1.9747101843668093e-06, - "loss": 0.875, - "step": 11657 - }, - { - "epoch": 0.3, - "learning_rate": 1.9747040004020747e-06, - "loss": 0.998, - "step": 11658 - }, - { - "epoch": 0.3, - "learning_rate": 1.9746978156910537e-06, - "loss": 0.9727, - "step": 11659 - }, - { - "epoch": 0.3, - "learning_rate": 1.9746916302337517e-06, - "loss": 0.9736, - "step": 11660 - }, - { - "epoch": 0.3, - "learning_rate": 1.974685444030173e-06, - "loss": 0.7573, - "step": 11661 - }, - { - "epoch": 0.3, - "learning_rate": 1.974679257080323e-06, - "loss": 0.9053, - "step": 11662 - }, - { - "epoch": 0.3, - "learning_rate": 1.974673069384205e-06, - "loss": 0.8447, - "step": 11663 - }, - { - "epoch": 0.3, - "learning_rate": 1.9746668809418253e-06, - "loss": 0.7227, - "step": 11664 - }, - { - "epoch": 0.3, - "learning_rate": 1.9746606917531878e-06, - "loss": 0.8589, - "step": 11665 - }, - { - "epoch": 0.3, - "learning_rate": 1.9746545018182973e-06, - "loss": 0.7759, - "step": 11666 - }, - { - "epoch": 0.3, - "learning_rate": 1.974648311137159e-06, - "loss": 1.0879, - "step": 11667 - }, - { - "epoch": 0.3, - "learning_rate": 1.974642119709777e-06, - "loss": 1.001, - "step": 11668 - }, - { - "epoch": 0.3, - "learning_rate": 1.9746359275361563e-06, - "loss": 0.7068, - "step": 11669 - }, - { - "epoch": 0.3, - "learning_rate": 1.974629734616302e-06, - "loss": 0.8765, - "step": 11670 - }, - { - "epoch": 0.3, - "learning_rate": 1.974623540950218e-06, - "loss": 0.9141, - "step": 11671 - }, - { - "epoch": 0.3, - "learning_rate": 1.9746173465379097e-06, - "loss": 0.9365, - "step": 11672 - }, - { - "epoch": 0.3, - "learning_rate": 1.9746111513793823e-06, - "loss": 0.9521, - "step": 11673 - }, - { - "epoch": 0.3, - "learning_rate": 1.9746049554746396e-06, - "loss": 0.8086, - "step": 11674 - }, - { - "epoch": 0.3, - "learning_rate": 1.9745987588236862e-06, - "loss": 0.6948, - "step": 11675 - }, - { - "epoch": 0.3, - "learning_rate": 1.9745925614265282e-06, - "loss": 0.9619, - "step": 11676 - }, - { - "epoch": 0.3, - "learning_rate": 1.974586363283169e-06, - "loss": 0.9814, - "step": 11677 - }, - { - "epoch": 0.3, - "learning_rate": 1.974580164393614e-06, - "loss": 0.9102, - "step": 11678 - }, - { - "epoch": 0.3, - "learning_rate": 1.9745739647578676e-06, - "loss": 0.6841, - "step": 11679 - }, - { - "epoch": 0.3, - "learning_rate": 1.974567764375935e-06, - "loss": 1.0742, - "step": 11680 - }, - { - "epoch": 0.3, - "learning_rate": 1.9745615632478204e-06, - "loss": 1.1406, - "step": 11681 - }, - { - "epoch": 0.3, - "learning_rate": 1.9745553613735287e-06, - "loss": 0.8057, - "step": 11682 - }, - { - "epoch": 0.3, - "learning_rate": 1.9745491587530654e-06, - "loss": 0.8652, - "step": 11683 - }, - { - "epoch": 0.3, - "learning_rate": 1.9745429553864338e-06, - "loss": 0.8486, - "step": 11684 - }, - { - "epoch": 0.3, - "learning_rate": 1.9745367512736403e-06, - "loss": 0.8799, - "step": 11685 - }, - { - "epoch": 0.3, - "learning_rate": 1.9745305464146882e-06, - "loss": 0.9854, - "step": 11686 - }, - { - "epoch": 0.3, - "learning_rate": 1.974524340809583e-06, - "loss": 0.9775, - "step": 11687 - }, - { - "epoch": 0.3, - "learning_rate": 1.9745181344583294e-06, - "loss": 1.0518, - "step": 11688 - }, - { - "epoch": 0.3, - "learning_rate": 1.9745119273609322e-06, - "loss": 0.6113, - "step": 11689 - }, - { - "epoch": 0.3, - "learning_rate": 1.974505719517396e-06, - "loss": 0.7791, - "step": 11690 - }, - { - "epoch": 0.3, - "learning_rate": 1.974499510927725e-06, - "loss": 1.1094, - "step": 11691 - }, - { - "epoch": 0.3, - "learning_rate": 1.9744933015919253e-06, - "loss": 0.79, - "step": 11692 - }, - { - "epoch": 0.3, - "learning_rate": 1.974487091510001e-06, - "loss": 0.9443, - "step": 11693 - }, - { - "epoch": 0.3, - "learning_rate": 1.974480880681956e-06, - "loss": 1.0752, - "step": 11694 - }, - { - "epoch": 0.3, - "learning_rate": 1.974474669107796e-06, - "loss": 0.834, - "step": 11695 - }, - { - "epoch": 0.3, - "learning_rate": 1.9744684567875257e-06, - "loss": 0.7578, - "step": 11696 - }, - { - "epoch": 0.3, - "learning_rate": 1.9744622437211497e-06, - "loss": 0.9248, - "step": 11697 - }, - { - "epoch": 0.3, - "learning_rate": 1.9744560299086728e-06, - "loss": 1.0938, - "step": 11698 - }, - { - "epoch": 0.3, - "learning_rate": 1.9744498153500995e-06, - "loss": 0.9316, - "step": 11699 - }, - { - "epoch": 0.3, - "learning_rate": 1.9744436000454356e-06, - "loss": 0.6265, - "step": 11700 - }, - { - "epoch": 0.3, - "learning_rate": 1.9744373839946838e-06, - "loss": 0.8252, - "step": 11701 - }, - { - "epoch": 0.3, - "learning_rate": 1.974431167197851e-06, - "loss": 0.9082, - "step": 11702 - }, - { - "epoch": 0.3, - "learning_rate": 1.9744249496549406e-06, - "loss": 0.8662, - "step": 11703 - }, - { - "epoch": 0.3, - "learning_rate": 1.974418731365958e-06, - "loss": 1.0566, - "step": 11704 - }, - { - "epoch": 0.3, - "learning_rate": 1.974412512330908e-06, - "loss": 0.9873, - "step": 11705 - }, - { - "epoch": 0.3, - "learning_rate": 1.9744062925497947e-06, - "loss": 0.9814, - "step": 11706 - }, - { - "epoch": 0.3, - "learning_rate": 1.9744000720226238e-06, - "loss": 0.8838, - "step": 11707 - }, - { - "epoch": 0.3, - "learning_rate": 1.9743938507493993e-06, - "loss": 0.7029, - "step": 11708 - }, - { - "epoch": 0.3, - "learning_rate": 1.974387628730126e-06, - "loss": 1.0303, - "step": 11709 - }, - { - "epoch": 0.3, - "learning_rate": 1.9743814059648094e-06, - "loss": 0.4863, - "step": 11710 - }, - { - "epoch": 0.3, - "learning_rate": 1.9743751824534532e-06, - "loss": 1.002, - "step": 11711 - }, - { - "epoch": 0.3, - "learning_rate": 1.974368958196063e-06, - "loss": 0.9688, - "step": 11712 - }, - { - "epoch": 0.3, - "learning_rate": 1.9743627331926436e-06, - "loss": 1.0176, - "step": 11713 - }, - { - "epoch": 0.3, - "learning_rate": 1.974356507443199e-06, - "loss": 0.793, - "step": 11714 - }, - { - "epoch": 0.3, - "learning_rate": 1.9743502809477347e-06, - "loss": 0.9004, - "step": 11715 - }, - { - "epoch": 0.3, - "learning_rate": 1.974344053706255e-06, - "loss": 1.0215, - "step": 11716 - }, - { - "epoch": 0.3, - "learning_rate": 1.9743378257187652e-06, - "loss": 0.8052, - "step": 11717 - }, - { - "epoch": 0.3, - "learning_rate": 1.9743315969852693e-06, - "loss": 0.9785, - "step": 11718 - }, - { - "epoch": 0.3, - "learning_rate": 1.974325367505773e-06, - "loss": 0.7012, - "step": 11719 - }, - { - "epoch": 0.3, - "learning_rate": 1.97431913728028e-06, - "loss": 1.0566, - "step": 11720 - }, - { - "epoch": 0.3, - "learning_rate": 1.974312906308796e-06, - "loss": 0.7383, - "step": 11721 - }, - { - "epoch": 0.3, - "learning_rate": 1.974306674591325e-06, - "loss": 0.8438, - "step": 11722 - }, - { - "epoch": 0.3, - "learning_rate": 1.9743004421278723e-06, - "loss": 0.8574, - "step": 11723 - }, - { - "epoch": 0.3, - "learning_rate": 1.974294208918443e-06, - "loss": 0.833, - "step": 11724 - }, - { - "epoch": 0.3, - "learning_rate": 1.9742879749630414e-06, - "loss": 0.9014, - "step": 11725 - }, - { - "epoch": 0.3, - "learning_rate": 1.974281740261672e-06, - "loss": 0.8984, - "step": 11726 - }, - { - "epoch": 0.3, - "learning_rate": 1.9742755048143396e-06, - "loss": 0.8154, - "step": 11727 - }, - { - "epoch": 0.3, - "learning_rate": 1.9742692686210494e-06, - "loss": 1.0518, - "step": 11728 - }, - { - "epoch": 0.3, - "learning_rate": 1.974263031681806e-06, - "loss": 1.2412, - "step": 11729 - }, - { - "epoch": 0.3, - "learning_rate": 1.9742567939966145e-06, - "loss": 0.9834, - "step": 11730 - }, - { - "epoch": 0.3, - "learning_rate": 1.9742505555654794e-06, - "loss": 1.0469, - "step": 11731 - }, - { - "epoch": 0.3, - "learning_rate": 1.974244316388405e-06, - "loss": 0.7417, - "step": 11732 - }, - { - "epoch": 0.3, - "learning_rate": 1.9742380764653973e-06, - "loss": 0.9102, - "step": 11733 - }, - { - "epoch": 0.3, - "learning_rate": 1.9742318357964596e-06, - "loss": 0.8789, - "step": 11734 - }, - { - "epoch": 0.3, - "learning_rate": 1.9742255943815976e-06, - "loss": 0.9863, - "step": 11735 - }, - { - "epoch": 0.3, - "learning_rate": 1.9742193522208155e-06, - "loss": 0.8013, - "step": 11736 - }, - { - "epoch": 0.3, - "learning_rate": 1.9742131093141193e-06, - "loss": 0.959, - "step": 11737 - }, - { - "epoch": 0.3, - "learning_rate": 1.9742068656615123e-06, - "loss": 1.2422, - "step": 11738 - }, - { - "epoch": 0.3, - "learning_rate": 1.9742006212629996e-06, - "loss": 0.9902, - "step": 11739 - }, - { - "epoch": 0.3, - "learning_rate": 1.974194376118587e-06, - "loss": 0.9678, - "step": 11740 - }, - { - "epoch": 0.3, - "learning_rate": 1.974188130228278e-06, - "loss": 0.7495, - "step": 11741 - }, - { - "epoch": 0.3, - "learning_rate": 1.9741818835920783e-06, - "loss": 0.6851, - "step": 11742 - }, - { - "epoch": 0.3, - "learning_rate": 1.9741756362099924e-06, - "loss": 0.9697, - "step": 11743 - }, - { - "epoch": 0.3, - "learning_rate": 1.9741693880820246e-06, - "loss": 0.7119, - "step": 11744 - }, - { - "epoch": 0.3, - "learning_rate": 1.9741631392081803e-06, - "loss": 1.0234, - "step": 11745 - }, - { - "epoch": 0.3, - "learning_rate": 1.974156889588464e-06, - "loss": 0.7842, - "step": 11746 - }, - { - "epoch": 0.3, - "learning_rate": 1.974150639222881e-06, - "loss": 0.8203, - "step": 11747 - }, - { - "epoch": 0.3, - "learning_rate": 1.974144388111435e-06, - "loss": 0.8193, - "step": 11748 - }, - { - "epoch": 0.3, - "learning_rate": 1.9741381362541316e-06, - "loss": 0.7793, - "step": 11749 - }, - { - "epoch": 0.3, - "learning_rate": 1.9741318836509757e-06, - "loss": 0.9365, - "step": 11750 - }, - { - "epoch": 0.3, - "learning_rate": 1.9741256303019718e-06, - "loss": 0.9893, - "step": 11751 - }, - { - "epoch": 0.3, - "learning_rate": 1.9741193762071244e-06, - "loss": 0.7461, - "step": 11752 - }, - { - "epoch": 0.3, - "learning_rate": 1.9741131213664387e-06, - "loss": 0.7339, - "step": 11753 - }, - { - "epoch": 0.3, - "learning_rate": 1.9741068657799197e-06, - "loss": 1.1426, - "step": 11754 - }, - { - "epoch": 0.3, - "learning_rate": 1.9741006094475712e-06, - "loss": 1.042, - "step": 11755 - }, - { - "epoch": 0.3, - "learning_rate": 1.9740943523693992e-06, - "loss": 0.7451, - "step": 11756 - }, - { - "epoch": 0.3, - "learning_rate": 1.974088094545408e-06, - "loss": 0.9111, - "step": 11757 - }, - { - "epoch": 0.3, - "learning_rate": 1.974081835975602e-06, - "loss": 0.9678, - "step": 11758 - }, - { - "epoch": 0.3, - "learning_rate": 1.9740755766599863e-06, - "loss": 0.8879, - "step": 11759 - }, - { - "epoch": 0.3, - "learning_rate": 1.974069316598566e-06, - "loss": 0.9863, - "step": 11760 - }, - { - "epoch": 0.3, - "learning_rate": 1.9740630557913454e-06, - "loss": 0.79, - "step": 11761 - }, - { - "epoch": 0.3, - "learning_rate": 1.9740567942383297e-06, - "loss": 1.1592, - "step": 11762 - }, - { - "epoch": 0.3, - "learning_rate": 1.974050531939523e-06, - "loss": 0.8125, - "step": 11763 - }, - { - "epoch": 0.3, - "learning_rate": 1.974044268894931e-06, - "loss": 1.0977, - "step": 11764 - }, - { - "epoch": 0.3, - "learning_rate": 1.9740380051045584e-06, - "loss": 0.9805, - "step": 11765 - }, - { - "epoch": 0.3, - "learning_rate": 1.974031740568409e-06, - "loss": 0.7979, - "step": 11766 - }, - { - "epoch": 0.3, - "learning_rate": 1.974025475286489e-06, - "loss": 0.9736, - "step": 11767 - }, - { - "epoch": 0.3, - "learning_rate": 1.974019209258802e-06, - "loss": 1.084, - "step": 11768 - }, - { - "epoch": 0.3, - "learning_rate": 1.9740129424853535e-06, - "loss": 0.9365, - "step": 11769 - }, - { - "epoch": 0.3, - "learning_rate": 1.9740066749661477e-06, - "loss": 0.6792, - "step": 11770 - }, - { - "epoch": 0.3, - "learning_rate": 1.97400040670119e-06, - "loss": 0.9141, - "step": 11771 - }, - { - "epoch": 0.3, - "learning_rate": 1.9739941376904855e-06, - "loss": 0.8086, - "step": 11772 - }, - { - "epoch": 0.3, - "learning_rate": 1.9739878679340374e-06, - "loss": 1.1094, - "step": 11773 - }, - { - "epoch": 0.3, - "learning_rate": 1.9739815974318527e-06, - "loss": 0.7383, - "step": 11774 - }, - { - "epoch": 0.3, - "learning_rate": 1.973975326183934e-06, - "loss": 0.793, - "step": 11775 - }, - { - "epoch": 0.3, - "learning_rate": 1.973969054190288e-06, - "loss": 0.957, - "step": 11776 - }, - { - "epoch": 0.3, - "learning_rate": 1.9739627814509185e-06, - "loss": 0.9307, - "step": 11777 - }, - { - "epoch": 0.3, - "learning_rate": 1.9739565079658305e-06, - "loss": 0.7393, - "step": 11778 - }, - { - "epoch": 0.3, - "learning_rate": 1.9739502337350284e-06, - "loss": 0.7871, - "step": 11779 - }, - { - "epoch": 0.3, - "learning_rate": 1.973943958758518e-06, - "loss": 0.8154, - "step": 11780 - }, - { - "epoch": 0.3, - "learning_rate": 1.973937683036303e-06, - "loss": 0.9443, - "step": 11781 - }, - { - "epoch": 0.3, - "learning_rate": 1.973931406568389e-06, - "loss": 0.8643, - "step": 11782 - }, - { - "epoch": 0.3, - "learning_rate": 1.97392512935478e-06, - "loss": 0.6235, - "step": 11783 - }, - { - "epoch": 0.3, - "learning_rate": 1.973918851395482e-06, - "loss": 1.0674, - "step": 11784 - }, - { - "epoch": 0.3, - "learning_rate": 1.9739125726904984e-06, - "loss": 1.0137, - "step": 11785 - }, - { - "epoch": 0.3, - "learning_rate": 1.9739062932398354e-06, - "loss": 1.0342, - "step": 11786 - }, - { - "epoch": 0.3, - "learning_rate": 1.973900013043497e-06, - "loss": 0.6802, - "step": 11787 - }, - { - "epoch": 0.3, - "learning_rate": 1.9738937321014877e-06, - "loss": 1.0195, - "step": 11788 - }, - { - "epoch": 0.3, - "learning_rate": 1.973887450413813e-06, - "loss": 0.8691, - "step": 11789 - }, - { - "epoch": 0.3, - "learning_rate": 1.9738811679804773e-06, - "loss": 0.8496, - "step": 11790 - }, - { - "epoch": 0.3, - "learning_rate": 1.973874884801486e-06, - "loss": 0.8584, - "step": 11791 - }, - { - "epoch": 0.3, - "learning_rate": 1.9738686008768433e-06, - "loss": 1.0166, - "step": 11792 - }, - { - "epoch": 0.3, - "learning_rate": 1.973862316206554e-06, - "loss": 0.9883, - "step": 11793 - }, - { - "epoch": 0.3, - "learning_rate": 1.9738560307906233e-06, - "loss": 0.9478, - "step": 11794 - }, - { - "epoch": 0.3, - "learning_rate": 1.9738497446290555e-06, - "loss": 0.9199, - "step": 11795 - }, - { - "epoch": 0.3, - "learning_rate": 1.9738434577218563e-06, - "loss": 1.1553, - "step": 11796 - }, - { - "epoch": 0.3, - "learning_rate": 1.9738371700690294e-06, - "loss": 0.9941, - "step": 11797 - }, - { - "epoch": 0.3, - "learning_rate": 1.9738308816705805e-06, - "loss": 0.7529, - "step": 11798 - }, - { - "epoch": 0.3, - "learning_rate": 1.973824592526514e-06, - "loss": 1.0488, - "step": 11799 - }, - { - "epoch": 0.3, - "learning_rate": 1.9738183026368347e-06, - "loss": 0.8936, - "step": 11800 - }, - { - "epoch": 0.3, - "learning_rate": 1.973812012001548e-06, - "loss": 0.9893, - "step": 11801 - }, - { - "epoch": 0.3, - "learning_rate": 1.9738057206206575e-06, - "loss": 0.9932, - "step": 11802 - }, - { - "epoch": 0.3, - "learning_rate": 1.973799428494169e-06, - "loss": 1.0107, - "step": 11803 - }, - { - "epoch": 0.3, - "learning_rate": 1.973793135622087e-06, - "loss": 0.8652, - "step": 11804 - }, - { - "epoch": 0.3, - "learning_rate": 1.9737868420044164e-06, - "loss": 0.7969, - "step": 11805 - }, - { - "epoch": 0.3, - "learning_rate": 1.973780547641162e-06, - "loss": 0.7393, - "step": 11806 - }, - { - "epoch": 0.3, - "learning_rate": 1.9737742525323287e-06, - "loss": 0.8584, - "step": 11807 - }, - { - "epoch": 0.3, - "learning_rate": 1.973767956677921e-06, - "loss": 0.8682, - "step": 11808 - }, - { - "epoch": 0.3, - "learning_rate": 1.9737616600779443e-06, - "loss": 0.9492, - "step": 11809 - }, - { - "epoch": 0.3, - "learning_rate": 1.973755362732403e-06, - "loss": 1.0342, - "step": 11810 - }, - { - "epoch": 0.3, - "learning_rate": 1.9737490646413017e-06, - "loss": 0.7695, - "step": 11811 - }, - { - "epoch": 0.3, - "learning_rate": 1.9737427658046456e-06, - "loss": 1.1406, - "step": 11812 - }, - { - "epoch": 0.3, - "learning_rate": 1.9737364662224395e-06, - "loss": 0.8804, - "step": 11813 - }, - { - "epoch": 0.3, - "learning_rate": 1.973730165894688e-06, - "loss": 0.8252, - "step": 11814 - }, - { - "epoch": 0.3, - "learning_rate": 1.9737238648213967e-06, - "loss": 0.9697, - "step": 11815 - }, - { - "epoch": 0.3, - "learning_rate": 1.973717563002569e-06, - "loss": 0.916, - "step": 11816 - }, - { - "epoch": 0.3, - "learning_rate": 1.9737112604382113e-06, - "loss": 0.6758, - "step": 11817 - }, - { - "epoch": 0.3, - "learning_rate": 1.973704957128327e-06, - "loss": 0.585, - "step": 11818 - }, - { - "epoch": 0.3, - "learning_rate": 1.973698653072922e-06, - "loss": 0.8467, - "step": 11819 - }, - { - "epoch": 0.3, - "learning_rate": 1.9736923482720005e-06, - "loss": 0.8271, - "step": 11820 - }, - { - "epoch": 0.3, - "learning_rate": 1.973686042725568e-06, - "loss": 0.9297, - "step": 11821 - }, - { - "epoch": 0.3, - "learning_rate": 1.9736797364336284e-06, - "loss": 0.8672, - "step": 11822 - }, - { - "epoch": 0.3, - "learning_rate": 1.973673429396187e-06, - "loss": 1.0293, - "step": 11823 - }, - { - "epoch": 0.3, - "learning_rate": 1.9736671216132484e-06, - "loss": 1.1523, - "step": 11824 - }, - { - "epoch": 0.3, - "learning_rate": 1.9736608130848184e-06, - "loss": 0.7495, - "step": 11825 - }, - { - "epoch": 0.3, - "learning_rate": 1.9736545038109003e-06, - "loss": 0.9551, - "step": 11826 - }, - { - "epoch": 0.3, - "learning_rate": 1.9736481937915e-06, - "loss": 1.0078, - "step": 11827 - }, - { - "epoch": 0.3, - "learning_rate": 1.9736418830266223e-06, - "loss": 0.874, - "step": 11828 - }, - { - "epoch": 0.3, - "learning_rate": 1.9736355715162717e-06, - "loss": 1.0732, - "step": 11829 - }, - { - "epoch": 0.3, - "learning_rate": 1.973629259260453e-06, - "loss": 1.0645, - "step": 11830 - }, - { - "epoch": 0.3, - "learning_rate": 1.973622946259171e-06, - "loss": 1.0723, - "step": 11831 - }, - { - "epoch": 0.3, - "learning_rate": 1.973616632512431e-06, - "loss": 0.9561, - "step": 11832 - }, - { - "epoch": 0.3, - "learning_rate": 1.9736103180202373e-06, - "loss": 0.9268, - "step": 11833 - }, - { - "epoch": 0.3, - "learning_rate": 1.973604002782595e-06, - "loss": 0.9482, - "step": 11834 - }, - { - "epoch": 0.3, - "learning_rate": 1.973597686799509e-06, - "loss": 0.9639, - "step": 11835 - }, - { - "epoch": 0.3, - "learning_rate": 1.9735913700709838e-06, - "loss": 1.0068, - "step": 11836 - }, - { - "epoch": 0.3, - "learning_rate": 1.9735850525970244e-06, - "loss": 0.7676, - "step": 11837 - }, - { - "epoch": 0.3, - "learning_rate": 1.973578734377636e-06, - "loss": 0.8389, - "step": 11838 - }, - { - "epoch": 0.3, - "learning_rate": 1.9735724154128227e-06, - "loss": 0.9277, - "step": 11839 - }, - { - "epoch": 0.3, - "learning_rate": 1.97356609570259e-06, - "loss": 0.6328, - "step": 11840 - }, - { - "epoch": 0.3, - "learning_rate": 1.9735597752469426e-06, - "loss": 0.9678, - "step": 11841 - }, - { - "epoch": 0.3, - "learning_rate": 1.973553454045885e-06, - "loss": 0.9102, - "step": 11842 - }, - { - "epoch": 0.3, - "learning_rate": 1.9735471320994227e-06, - "loss": 1.04, - "step": 11843 - }, - { - "epoch": 0.3, - "learning_rate": 1.97354080940756e-06, - "loss": 1.0166, - "step": 11844 - }, - { - "epoch": 0.3, - "learning_rate": 1.9735344859703015e-06, - "loss": 0.9902, - "step": 11845 - }, - { - "epoch": 0.3, - "learning_rate": 1.9735281617876528e-06, - "loss": 0.79, - "step": 11846 - }, - { - "epoch": 0.3, - "learning_rate": 1.9735218368596184e-06, - "loss": 0.8052, - "step": 11847 - }, - { - "epoch": 0.3, - "learning_rate": 1.973515511186203e-06, - "loss": 0.832, - "step": 11848 - }, - { - "epoch": 0.3, - "learning_rate": 1.973509184767411e-06, - "loss": 0.9717, - "step": 11849 - }, - { - "epoch": 0.3, - "learning_rate": 1.9735028576032487e-06, - "loss": 0.8447, - "step": 11850 - }, - { - "epoch": 0.3, - "learning_rate": 1.9734965296937194e-06, - "loss": 0.6902, - "step": 11851 - }, - { - "epoch": 0.3, - "learning_rate": 1.9734902010388286e-06, - "loss": 0.9297, - "step": 11852 - }, - { - "epoch": 0.3, - "learning_rate": 1.9734838716385814e-06, - "loss": 0.7563, - "step": 11853 - }, - { - "epoch": 0.3, - "learning_rate": 1.9734775414929825e-06, - "loss": 0.9795, - "step": 11854 - }, - { - "epoch": 0.3, - "learning_rate": 1.973471210602036e-06, - "loss": 0.8779, - "step": 11855 - }, - { - "epoch": 0.3, - "learning_rate": 1.9734648789657477e-06, - "loss": 1.1826, - "step": 11856 - }, - { - "epoch": 0.3, - "learning_rate": 1.973458546584122e-06, - "loss": 0.8613, - "step": 11857 - }, - { - "epoch": 0.3, - "learning_rate": 1.973452213457164e-06, - "loss": 1.1455, - "step": 11858 - }, - { - "epoch": 0.3, - "learning_rate": 1.9734458795848785e-06, - "loss": 0.9775, - "step": 11859 - }, - { - "epoch": 0.3, - "learning_rate": 1.97343954496727e-06, - "loss": 1.2812, - "step": 11860 - }, - { - "epoch": 0.3, - "learning_rate": 1.9734332096043437e-06, - "loss": 1.1191, - "step": 11861 - }, - { - "epoch": 0.3, - "learning_rate": 1.9734268734961042e-06, - "loss": 0.9629, - "step": 11862 - }, - { - "epoch": 0.3, - "learning_rate": 1.9734205366425566e-06, - "loss": 1.0283, - "step": 11863 - }, - { - "epoch": 0.3, - "learning_rate": 1.9734141990437056e-06, - "loss": 1.0674, - "step": 11864 - }, - { - "epoch": 0.3, - "learning_rate": 1.973407860699556e-06, - "loss": 0.8677, - "step": 11865 - }, - { - "epoch": 0.3, - "learning_rate": 1.973401521610113e-06, - "loss": 0.7812, - "step": 11866 - }, - { - "epoch": 0.3, - "learning_rate": 1.9733951817753814e-06, - "loss": 0.7871, - "step": 11867 - }, - { - "epoch": 0.3, - "learning_rate": 1.9733888411953657e-06, - "loss": 1.0781, - "step": 11868 - }, - { - "epoch": 0.3, - "learning_rate": 1.9733824998700707e-06, - "loss": 0.9043, - "step": 11869 - }, - { - "epoch": 0.3, - "learning_rate": 1.9733761577995015e-06, - "loss": 0.9932, - "step": 11870 - }, - { - "epoch": 0.3, - "learning_rate": 1.973369814983663e-06, - "loss": 0.6987, - "step": 11871 - }, - { - "epoch": 0.3, - "learning_rate": 1.9733634714225604e-06, - "loss": 0.9648, - "step": 11872 - }, - { - "epoch": 0.3, - "learning_rate": 1.9733571271161977e-06, - "loss": 0.9502, - "step": 11873 - }, - { - "epoch": 0.3, - "learning_rate": 1.9733507820645803e-06, - "loss": 0.8218, - "step": 11874 - }, - { - "epoch": 0.3, - "learning_rate": 1.973344436267713e-06, - "loss": 0.9658, - "step": 11875 - }, - { - "epoch": 0.3, - "learning_rate": 1.9733380897256004e-06, - "loss": 0.7773, - "step": 11876 - }, - { - "epoch": 0.3, - "learning_rate": 1.973331742438248e-06, - "loss": 0.7725, - "step": 11877 - }, - { - "epoch": 0.3, - "learning_rate": 1.97332539440566e-06, - "loss": 0.8262, - "step": 11878 - }, - { - "epoch": 0.3, - "learning_rate": 1.9733190456278413e-06, - "loss": 0.874, - "step": 11879 - }, - { - "epoch": 0.3, - "learning_rate": 1.973312696104797e-06, - "loss": 0.7102, - "step": 11880 - }, - { - "epoch": 0.3, - "learning_rate": 1.973306345836532e-06, - "loss": 1.0557, - "step": 11881 - }, - { - "epoch": 0.3, - "learning_rate": 1.9732999948230517e-06, - "loss": 0.9277, - "step": 11882 - }, - { - "epoch": 0.3, - "learning_rate": 1.97329364306436e-06, - "loss": 0.876, - "step": 11883 - }, - { - "epoch": 0.3, - "learning_rate": 1.9732872905604615e-06, - "loss": 0.9414, - "step": 11884 - }, - { - "epoch": 0.3, - "learning_rate": 1.973280937311362e-06, - "loss": 1.0723, - "step": 11885 - }, - { - "epoch": 0.3, - "learning_rate": 1.9732745833170665e-06, - "loss": 0.9531, - "step": 11886 - }, - { - "epoch": 0.3, - "learning_rate": 1.973268228577579e-06, - "loss": 0.8135, - "step": 11887 - }, - { - "epoch": 0.3, - "learning_rate": 1.9732618730929046e-06, - "loss": 1.0977, - "step": 11888 - }, - { - "epoch": 0.3, - "learning_rate": 1.973255516863049e-06, - "loss": 0.7798, - "step": 11889 - }, - { - "epoch": 0.3, - "learning_rate": 1.9732491598880155e-06, - "loss": 1.0, - "step": 11890 - }, - { - "epoch": 0.3, - "learning_rate": 1.9732428021678104e-06, - "loss": 0.8525, - "step": 11891 - }, - { - "epoch": 0.3, - "learning_rate": 1.973236443702438e-06, - "loss": 0.9092, - "step": 11892 - }, - { - "epoch": 0.3, - "learning_rate": 1.9732300844919032e-06, - "loss": 1.0381, - "step": 11893 - }, - { - "epoch": 0.3, - "learning_rate": 1.973223724536211e-06, - "loss": 1.043, - "step": 11894 - }, - { - "epoch": 0.3, - "learning_rate": 1.973217363835366e-06, - "loss": 0.8506, - "step": 11895 - }, - { - "epoch": 0.3, - "learning_rate": 1.973211002389373e-06, - "loss": 0.8809, - "step": 11896 - }, - { - "epoch": 0.3, - "learning_rate": 1.9732046401982374e-06, - "loss": 0.9072, - "step": 11897 - }, - { - "epoch": 0.3, - "learning_rate": 1.9731982772619636e-06, - "loss": 0.9736, - "step": 11898 - }, - { - "epoch": 0.3, - "learning_rate": 1.973191913580556e-06, - "loss": 1.083, - "step": 11899 - }, - { - "epoch": 0.31, - "learning_rate": 1.973185549154021e-06, - "loss": 0.9619, - "step": 11900 - }, - { - "epoch": 0.31, - "learning_rate": 1.9731791839823625e-06, - "loss": 0.9082, - "step": 11901 - }, - { - "epoch": 0.31, - "learning_rate": 1.9731728180655852e-06, - "loss": 0.9551, - "step": 11902 - }, - { - "epoch": 0.31, - "learning_rate": 1.9731664514036946e-06, - "loss": 0.9697, - "step": 11903 - }, - { - "epoch": 0.31, - "learning_rate": 1.973160083996695e-06, - "loss": 1.1357, - "step": 11904 - }, - { - "epoch": 0.31, - "learning_rate": 1.9731537158445913e-06, - "loss": 0.9199, - "step": 11905 - }, - { - "epoch": 0.31, - "learning_rate": 1.9731473469473884e-06, - "loss": 0.7739, - "step": 11906 - }, - { - "epoch": 0.31, - "learning_rate": 1.9731409773050916e-06, - "loss": 1.0117, - "step": 11907 - }, - { - "epoch": 0.31, - "learning_rate": 1.9731346069177053e-06, - "loss": 1.0596, - "step": 11908 - }, - { - "epoch": 0.31, - "learning_rate": 1.973128235785235e-06, - "loss": 0.8306, - "step": 11909 - }, - { - "epoch": 0.31, - "learning_rate": 1.9731218639076848e-06, - "loss": 0.8906, - "step": 11910 - }, - { - "epoch": 0.31, - "learning_rate": 1.9731154912850602e-06, - "loss": 0.918, - "step": 11911 - }, - { - "epoch": 0.31, - "learning_rate": 1.9731091179173656e-06, - "loss": 0.6396, - "step": 11912 - }, - { - "epoch": 0.31, - "learning_rate": 1.973102743804606e-06, - "loss": 1.0684, - "step": 11913 - }, - { - "epoch": 0.31, - "learning_rate": 1.9730963689467865e-06, - "loss": 0.9961, - "step": 11914 - }, - { - "epoch": 0.31, - "learning_rate": 1.9730899933439117e-06, - "loss": 0.8906, - "step": 11915 - }, - { - "epoch": 0.31, - "learning_rate": 1.973083616995987e-06, - "loss": 0.7925, - "step": 11916 - }, - { - "epoch": 0.31, - "learning_rate": 1.9730772399030167e-06, - "loss": 0.6987, - "step": 11917 - }, - { - "epoch": 0.31, - "learning_rate": 1.9730708620650057e-06, - "loss": 1.0469, - "step": 11918 - }, - { - "epoch": 0.31, - "learning_rate": 1.9730644834819594e-06, - "loss": 1.0244, - "step": 11919 - }, - { - "epoch": 0.31, - "learning_rate": 1.9730581041538825e-06, - "loss": 0.7046, - "step": 11920 - }, - { - "epoch": 0.31, - "learning_rate": 1.973051724080779e-06, - "loss": 0.8057, - "step": 11921 - }, - { - "epoch": 0.31, - "learning_rate": 1.9730453432626554e-06, - "loss": 0.8359, - "step": 11922 - }, - { - "epoch": 0.31, - "learning_rate": 1.973038961699515e-06, - "loss": 0.8369, - "step": 11923 - }, - { - "epoch": 0.31, - "learning_rate": 1.973032579391364e-06, - "loss": 0.9912, - "step": 11924 - }, - { - "epoch": 0.31, - "learning_rate": 1.9730261963382064e-06, - "loss": 0.9126, - "step": 11925 - }, - { - "epoch": 0.31, - "learning_rate": 1.9730198125400473e-06, - "loss": 0.8271, - "step": 11926 - }, - { - "epoch": 0.31, - "learning_rate": 1.973013427996892e-06, - "loss": 0.9531, - "step": 11927 - }, - { - "epoch": 0.31, - "learning_rate": 1.973007042708745e-06, - "loss": 0.4449, - "step": 11928 - }, - { - "epoch": 0.31, - "learning_rate": 1.973000656675611e-06, - "loss": 0.8262, - "step": 11929 - }, - { - "epoch": 0.31, - "learning_rate": 1.9729942698974952e-06, - "loss": 0.8594, - "step": 11930 - }, - { - "epoch": 0.31, - "learning_rate": 1.9729878823744024e-06, - "loss": 0.7881, - "step": 11931 - }, - { - "epoch": 0.31, - "learning_rate": 1.9729814941063378e-06, - "loss": 0.8604, - "step": 11932 - }, - { - "epoch": 0.31, - "learning_rate": 1.972975105093306e-06, - "loss": 0.8215, - "step": 11933 - }, - { - "epoch": 0.31, - "learning_rate": 1.9729687153353117e-06, - "loss": 0.9883, - "step": 11934 - }, - { - "epoch": 0.31, - "learning_rate": 1.97296232483236e-06, - "loss": 0.7305, - "step": 11935 - }, - { - "epoch": 0.31, - "learning_rate": 1.972955933584456e-06, - "loss": 1.0273, - "step": 11936 - }, - { - "epoch": 0.31, - "learning_rate": 1.9729495415916036e-06, - "loss": 1.043, - "step": 11937 - }, - { - "epoch": 0.31, - "learning_rate": 1.9729431488538092e-06, - "loss": 0.8438, - "step": 11938 - }, - { - "epoch": 0.31, - "learning_rate": 1.972936755371077e-06, - "loss": 0.9307, - "step": 11939 - }, - { - "epoch": 0.31, - "learning_rate": 1.9729303611434117e-06, - "loss": 0.8809, - "step": 11940 - }, - { - "epoch": 0.31, - "learning_rate": 1.9729239661708183e-06, - "loss": 1.0586, - "step": 11941 - }, - { - "epoch": 0.31, - "learning_rate": 1.9729175704533017e-06, - "loss": 0.9746, - "step": 11942 - }, - { - "epoch": 0.31, - "learning_rate": 1.972911173990867e-06, - "loss": 0.853, - "step": 11943 - }, - { - "epoch": 0.31, - "learning_rate": 1.9729047767835188e-06, - "loss": 0.9902, - "step": 11944 - }, - { - "epoch": 0.31, - "learning_rate": 1.9728983788312625e-06, - "loss": 1.248, - "step": 11945 - }, - { - "epoch": 0.31, - "learning_rate": 1.972891980134102e-06, - "loss": 0.592, - "step": 11946 - }, - { - "epoch": 0.31, - "learning_rate": 1.9728855806920433e-06, - "loss": 0.8252, - "step": 11947 - }, - { - "epoch": 0.31, - "learning_rate": 1.972879180505091e-06, - "loss": 0.8193, - "step": 11948 - }, - { - "epoch": 0.31, - "learning_rate": 1.9728727795732497e-06, - "loss": 0.8867, - "step": 11949 - }, - { - "epoch": 0.31, - "learning_rate": 1.9728663778965243e-06, - "loss": 0.7637, - "step": 11950 - }, - { - "epoch": 0.31, - "learning_rate": 1.97285997547492e-06, - "loss": 0.9395, - "step": 11951 - }, - { - "epoch": 0.31, - "learning_rate": 1.9728535723084415e-06, - "loss": 1.0029, - "step": 11952 - }, - { - "epoch": 0.31, - "learning_rate": 1.9728471683970937e-06, - "loss": 1.0117, - "step": 11953 - }, - { - "epoch": 0.31, - "learning_rate": 1.9728407637408817e-06, - "loss": 0.9902, - "step": 11954 - }, - { - "epoch": 0.31, - "learning_rate": 1.97283435833981e-06, - "loss": 1.0869, - "step": 11955 - }, - { - "epoch": 0.31, - "learning_rate": 1.972827952193884e-06, - "loss": 1.1104, - "step": 11956 - }, - { - "epoch": 0.31, - "learning_rate": 1.972821545303108e-06, - "loss": 0.7969, - "step": 11957 - }, - { - "epoch": 0.31, - "learning_rate": 1.972815137667488e-06, - "loss": 0.7759, - "step": 11958 - }, - { - "epoch": 0.31, - "learning_rate": 1.972808729287027e-06, - "loss": 0.7588, - "step": 11959 - }, - { - "epoch": 0.31, - "learning_rate": 1.9728023201617324e-06, - "loss": 0.8574, - "step": 11960 - }, - { - "epoch": 0.31, - "learning_rate": 1.972795910291607e-06, - "loss": 0.9297, - "step": 11961 - }, - { - "epoch": 0.31, - "learning_rate": 1.9727894996766566e-06, - "loss": 1.0625, - "step": 11962 - }, - { - "epoch": 0.31, - "learning_rate": 1.9727830883168865e-06, - "loss": 0.9365, - "step": 11963 - }, - { - "epoch": 0.31, - "learning_rate": 1.9727766762123004e-06, - "loss": 0.7852, - "step": 11964 - }, - { - "epoch": 0.31, - "learning_rate": 1.9727702633629043e-06, - "loss": 0.9453, - "step": 11965 - }, - { - "epoch": 0.31, - "learning_rate": 1.9727638497687028e-06, - "loss": 1.0059, - "step": 11966 - }, - { - "epoch": 0.31, - "learning_rate": 1.972757435429701e-06, - "loss": 0.9111, - "step": 11967 - }, - { - "epoch": 0.31, - "learning_rate": 1.9727510203459026e-06, - "loss": 0.7705, - "step": 11968 - }, - { - "epoch": 0.31, - "learning_rate": 1.9727446045173146e-06, - "loss": 0.8271, - "step": 11969 - }, - { - "epoch": 0.31, - "learning_rate": 1.9727381879439398e-06, - "loss": 0.9775, - "step": 11970 - }, - { - "epoch": 0.31, - "learning_rate": 1.972731770625785e-06, - "loss": 0.6309, - "step": 11971 - }, - { - "epoch": 0.31, - "learning_rate": 1.9727253525628536e-06, - "loss": 0.7441, - "step": 11972 - }, - { - "epoch": 0.31, - "learning_rate": 1.972718933755151e-06, - "loss": 1.0752, - "step": 11973 - }, - { - "epoch": 0.31, - "learning_rate": 1.9727125142026828e-06, - "loss": 0.8657, - "step": 11974 - }, - { - "epoch": 0.31, - "learning_rate": 1.972706093905453e-06, - "loss": 0.7085, - "step": 11975 - }, - { - "epoch": 0.31, - "learning_rate": 1.972699672863467e-06, - "loss": 0.8506, - "step": 11976 - }, - { - "epoch": 0.31, - "learning_rate": 1.9726932510767297e-06, - "loss": 0.8896, - "step": 11977 - }, - { - "epoch": 0.31, - "learning_rate": 1.9726868285452455e-06, - "loss": 0.7402, - "step": 11978 - }, - { - "epoch": 0.31, - "learning_rate": 1.97268040526902e-06, - "loss": 0.9639, - "step": 11979 - }, - { - "epoch": 0.31, - "learning_rate": 1.972673981248058e-06, - "loss": 1.251, - "step": 11980 - }, - { - "epoch": 0.31, - "learning_rate": 1.972667556482364e-06, - "loss": 1.0859, - "step": 11981 - }, - { - "epoch": 0.31, - "learning_rate": 1.9726611309719436e-06, - "loss": 0.688, - "step": 11982 - }, - { - "epoch": 0.31, - "learning_rate": 1.9726547047168006e-06, - "loss": 0.8887, - "step": 11983 - }, - { - "epoch": 0.31, - "learning_rate": 1.972648277716941e-06, - "loss": 1.0684, - "step": 11984 - }, - { - "epoch": 0.31, - "learning_rate": 1.9726418499723693e-06, - "loss": 1.042, - "step": 11985 - }, - { - "epoch": 0.31, - "learning_rate": 1.9726354214830904e-06, - "loss": 0.9121, - "step": 11986 - }, - { - "epoch": 0.31, - "learning_rate": 1.972628992249109e-06, - "loss": 0.9268, - "step": 11987 - }, - { - "epoch": 0.31, - "learning_rate": 1.972622562270431e-06, - "loss": 0.8535, - "step": 11988 - }, - { - "epoch": 0.31, - "learning_rate": 1.97261613154706e-06, - "loss": 0.9385, - "step": 11989 - }, - { - "epoch": 0.31, - "learning_rate": 1.972609700079002e-06, - "loss": 1.1182, - "step": 11990 - }, - { - "epoch": 0.31, - "learning_rate": 1.9726032678662615e-06, - "loss": 0.8604, - "step": 11991 - }, - { - "epoch": 0.31, - "learning_rate": 1.972596834908843e-06, - "loss": 0.96, - "step": 11992 - }, - { - "epoch": 0.31, - "learning_rate": 1.972590401206752e-06, - "loss": 1.0273, - "step": 11993 - }, - { - "epoch": 0.31, - "learning_rate": 1.9725839667599936e-06, - "loss": 0.9883, - "step": 11994 - }, - { - "epoch": 0.31, - "learning_rate": 1.972577531568572e-06, - "loss": 0.8804, - "step": 11995 - }, - { - "epoch": 0.31, - "learning_rate": 1.9725710956324925e-06, - "loss": 0.6748, - "step": 11996 - }, - { - "epoch": 0.31, - "learning_rate": 1.97256465895176e-06, - "loss": 1.0068, - "step": 11997 - }, - { - "epoch": 0.31, - "learning_rate": 1.9725582215263797e-06, - "loss": 0.8281, - "step": 11998 - }, - { - "epoch": 0.31, - "learning_rate": 1.9725517833563557e-06, - "loss": 1.0498, - "step": 11999 - }, - { - "epoch": 0.31, - "learning_rate": 1.972545344441694e-06, - "loss": 0.8564, - "step": 12000 - }, - { - "epoch": 0.31, - "learning_rate": 1.972538904782399e-06, - "loss": 1.042, - "step": 12001 - }, - { - "epoch": 0.31, - "learning_rate": 1.9725324643784757e-06, - "loss": 0.9512, - "step": 12002 - }, - { - "epoch": 0.31, - "learning_rate": 1.972526023229929e-06, - "loss": 0.8662, - "step": 12003 - }, - { - "epoch": 0.31, - "learning_rate": 1.972519581336764e-06, - "loss": 1.127, - "step": 12004 - }, - { - "epoch": 0.31, - "learning_rate": 1.9725131386989853e-06, - "loss": 0.7861, - "step": 12005 - }, - { - "epoch": 0.31, - "learning_rate": 1.972506695316598e-06, - "loss": 1.1016, - "step": 12006 - }, - { - "epoch": 0.31, - "learning_rate": 1.972500251189607e-06, - "loss": 0.8643, - "step": 12007 - }, - { - "epoch": 0.31, - "learning_rate": 1.9724938063180176e-06, - "loss": 1.0518, - "step": 12008 - }, - { - "epoch": 0.31, - "learning_rate": 1.9724873607018338e-06, - "loss": 0.8374, - "step": 12009 - }, - { - "epoch": 0.31, - "learning_rate": 1.9724809143410614e-06, - "loss": 0.9053, - "step": 12010 - }, - { - "epoch": 0.31, - "learning_rate": 1.9724744672357055e-06, - "loss": 1.0107, - "step": 12011 - }, - { - "epoch": 0.31, - "learning_rate": 1.97246801938577e-06, - "loss": 0.7119, - "step": 12012 - }, - { - "epoch": 0.31, - "learning_rate": 1.972461570791261e-06, - "loss": 0.9111, - "step": 12013 - }, - { - "epoch": 0.31, - "learning_rate": 1.9724551214521825e-06, - "loss": 0.8867, - "step": 12014 - }, - { - "epoch": 0.31, - "learning_rate": 1.97244867136854e-06, - "loss": 0.873, - "step": 12015 - }, - { - "epoch": 0.31, - "learning_rate": 1.972442220540338e-06, - "loss": 0.7695, - "step": 12016 - }, - { - "epoch": 0.31, - "learning_rate": 1.972435768967582e-06, - "loss": 1.041, - "step": 12017 - }, - { - "epoch": 0.31, - "learning_rate": 1.9724293166502765e-06, - "loss": 1.1064, - "step": 12018 - }, - { - "epoch": 0.31, - "learning_rate": 1.972422863588427e-06, - "loss": 1.0947, - "step": 12019 - }, - { - "epoch": 0.31, - "learning_rate": 1.9724164097820376e-06, - "loss": 0.752, - "step": 12020 - }, - { - "epoch": 0.31, - "learning_rate": 1.9724099552311135e-06, - "loss": 1.0459, - "step": 12021 - }, - { - "epoch": 0.31, - "learning_rate": 1.97240349993566e-06, - "loss": 0.9258, - "step": 12022 - }, - { - "epoch": 0.31, - "learning_rate": 1.972397043895682e-06, - "loss": 0.7654, - "step": 12023 - }, - { - "epoch": 0.31, - "learning_rate": 1.9723905871111843e-06, - "loss": 0.8555, - "step": 12024 - }, - { - "epoch": 0.31, - "learning_rate": 1.9723841295821715e-06, - "loss": 0.9204, - "step": 12025 - }, - { - "epoch": 0.31, - "learning_rate": 1.9723776713086494e-06, - "loss": 0.6177, - "step": 12026 - }, - { - "epoch": 0.31, - "learning_rate": 1.9723712122906222e-06, - "loss": 0.9688, - "step": 12027 - }, - { - "epoch": 0.31, - "learning_rate": 1.972364752528095e-06, - "loss": 1.0254, - "step": 12028 - }, - { - "epoch": 0.31, - "learning_rate": 1.9723582920210728e-06, - "loss": 0.8555, - "step": 12029 - }, - { - "epoch": 0.31, - "learning_rate": 1.9723518307695607e-06, - "loss": 1.0244, - "step": 12030 - }, - { - "epoch": 0.31, - "learning_rate": 1.9723453687735634e-06, - "loss": 1.04, - "step": 12031 - }, - { - "epoch": 0.31, - "learning_rate": 1.972338906033086e-06, - "loss": 0.9492, - "step": 12032 - }, - { - "epoch": 0.31, - "learning_rate": 1.9723324425481335e-06, - "loss": 0.7998, - "step": 12033 - }, - { - "epoch": 0.31, - "learning_rate": 1.9723259783187107e-06, - "loss": 1.0293, - "step": 12034 - }, - { - "epoch": 0.31, - "learning_rate": 1.972319513344822e-06, - "loss": 0.8428, - "step": 12035 - }, - { - "epoch": 0.31, - "learning_rate": 1.972313047626474e-06, - "loss": 0.8662, - "step": 12036 - }, - { - "epoch": 0.31, - "learning_rate": 1.9723065811636703e-06, - "loss": 0.7783, - "step": 12037 - }, - { - "epoch": 0.31, - "learning_rate": 1.9723001139564154e-06, - "loss": 1.1758, - "step": 12038 - }, - { - "epoch": 0.31, - "learning_rate": 1.972293646004716e-06, - "loss": 0.752, - "step": 12039 - }, - { - "epoch": 0.31, - "learning_rate": 1.9722871773085755e-06, - "loss": 1.0195, - "step": 12040 - }, - { - "epoch": 0.31, - "learning_rate": 1.9722807078679997e-06, - "loss": 0.959, - "step": 12041 - }, - { - "epoch": 0.31, - "learning_rate": 1.972274237682993e-06, - "loss": 1.0693, - "step": 12042 - }, - { - "epoch": 0.31, - "learning_rate": 1.9722677667535607e-06, - "loss": 1.0029, - "step": 12043 - }, - { - "epoch": 0.31, - "learning_rate": 1.9722612950797075e-06, - "loss": 0.7959, - "step": 12044 - }, - { - "epoch": 0.31, - "learning_rate": 1.972254822661439e-06, - "loss": 0.7854, - "step": 12045 - }, - { - "epoch": 0.31, - "learning_rate": 1.9722483494987596e-06, - "loss": 0.8779, - "step": 12046 - }, - { - "epoch": 0.31, - "learning_rate": 1.972241875591674e-06, - "loss": 1.0645, - "step": 12047 - }, - { - "epoch": 0.31, - "learning_rate": 1.972235400940188e-06, - "loss": 0.834, - "step": 12048 - }, - { - "epoch": 0.31, - "learning_rate": 1.9722289255443056e-06, - "loss": 0.9736, - "step": 12049 - }, - { - "epoch": 0.31, - "learning_rate": 1.9722224494040325e-06, - "loss": 0.9258, - "step": 12050 - }, - { - "epoch": 0.31, - "learning_rate": 1.9722159725193734e-06, - "loss": 1.0449, - "step": 12051 - }, - { - "epoch": 0.31, - "learning_rate": 1.972209494890333e-06, - "loss": 0.9746, - "step": 12052 - }, - { - "epoch": 0.31, - "learning_rate": 1.9722030165169165e-06, - "loss": 1.1592, - "step": 12053 - }, - { - "epoch": 0.31, - "learning_rate": 1.972196537399129e-06, - "loss": 0.9355, - "step": 12054 - }, - { - "epoch": 0.31, - "learning_rate": 1.972190057536975e-06, - "loss": 1.0654, - "step": 12055 - }, - { - "epoch": 0.31, - "learning_rate": 1.97218357693046e-06, - "loss": 1.0059, - "step": 12056 - }, - { - "epoch": 0.31, - "learning_rate": 1.972177095579589e-06, - "loss": 0.9082, - "step": 12057 - }, - { - "epoch": 0.31, - "learning_rate": 1.9721706134843664e-06, - "loss": 0.6075, - "step": 12058 - }, - { - "epoch": 0.31, - "learning_rate": 1.9721641306447975e-06, - "loss": 1.2324, - "step": 12059 - }, - { - "epoch": 0.31, - "learning_rate": 1.972157647060887e-06, - "loss": 0.9062, - "step": 12060 - }, - { - "epoch": 0.31, - "learning_rate": 1.9721511627326407e-06, - "loss": 0.7871, - "step": 12061 - }, - { - "epoch": 0.31, - "learning_rate": 1.972144677660062e-06, - "loss": 0.9521, - "step": 12062 - }, - { - "epoch": 0.31, - "learning_rate": 1.972138191843158e-06, - "loss": 0.9893, - "step": 12063 - }, - { - "epoch": 0.31, - "learning_rate": 1.972131705281932e-06, - "loss": 1.0537, - "step": 12064 - }, - { - "epoch": 0.31, - "learning_rate": 1.972125217976389e-06, - "loss": 1.0664, - "step": 12065 - }, - { - "epoch": 0.31, - "learning_rate": 1.972118729926535e-06, - "loss": 0.9736, - "step": 12066 - }, - { - "epoch": 0.31, - "learning_rate": 1.972112241132374e-06, - "loss": 0.8027, - "step": 12067 - }, - { - "epoch": 0.31, - "learning_rate": 1.9721057515939115e-06, - "loss": 0.8906, - "step": 12068 - }, - { - "epoch": 0.31, - "learning_rate": 1.9720992613111524e-06, - "loss": 1.0029, - "step": 12069 - }, - { - "epoch": 0.31, - "learning_rate": 1.9720927702841016e-06, - "loss": 0.9111, - "step": 12070 - }, - { - "epoch": 0.31, - "learning_rate": 1.972086278512764e-06, - "loss": 0.8281, - "step": 12071 - }, - { - "epoch": 0.31, - "learning_rate": 1.9720797859971445e-06, - "loss": 0.9951, - "step": 12072 - }, - { - "epoch": 0.31, - "learning_rate": 1.9720732927372484e-06, - "loss": 0.5347, - "step": 12073 - }, - { - "epoch": 0.31, - "learning_rate": 1.9720667987330805e-06, - "loss": 1.0234, - "step": 12074 - }, - { - "epoch": 0.31, - "learning_rate": 1.9720603039846456e-06, - "loss": 0.7734, - "step": 12075 - }, - { - "epoch": 0.31, - "learning_rate": 1.972053808491949e-06, - "loss": 0.7988, - "step": 12076 - }, - { - "epoch": 0.31, - "learning_rate": 1.9720473122549955e-06, - "loss": 0.8259, - "step": 12077 - }, - { - "epoch": 0.31, - "learning_rate": 1.9720408152737897e-06, - "loss": 1.126, - "step": 12078 - }, - { - "epoch": 0.31, - "learning_rate": 1.972034317548337e-06, - "loss": 1.0449, - "step": 12079 - }, - { - "epoch": 0.31, - "learning_rate": 1.972027819078643e-06, - "loss": 0.8848, - "step": 12080 - }, - { - "epoch": 0.31, - "learning_rate": 1.9720213198647112e-06, - "loss": 0.9277, - "step": 12081 - }, - { - "epoch": 0.31, - "learning_rate": 1.9720148199065476e-06, - "loss": 1.0146, - "step": 12082 - }, - { - "epoch": 0.31, - "learning_rate": 1.972008319204157e-06, - "loss": 0.9932, - "step": 12083 - }, - { - "epoch": 0.31, - "learning_rate": 1.9720018177575444e-06, - "loss": 0.7344, - "step": 12084 - }, - { - "epoch": 0.31, - "learning_rate": 1.971995315566715e-06, - "loss": 0.9541, - "step": 12085 - }, - { - "epoch": 0.31, - "learning_rate": 1.971988812631673e-06, - "loss": 0.9668, - "step": 12086 - }, - { - "epoch": 0.31, - "learning_rate": 1.971982308952424e-06, - "loss": 1.0215, - "step": 12087 - }, - { - "epoch": 0.31, - "learning_rate": 1.9719758045289727e-06, - "loss": 0.9863, - "step": 12088 - }, - { - "epoch": 0.31, - "learning_rate": 1.9719692993613244e-06, - "loss": 0.8467, - "step": 12089 - }, - { - "epoch": 0.31, - "learning_rate": 1.971962793449484e-06, - "loss": 0.9922, - "step": 12090 - }, - { - "epoch": 0.31, - "learning_rate": 1.971956286793456e-06, - "loss": 1.0249, - "step": 12091 - }, - { - "epoch": 0.31, - "learning_rate": 1.971949779393246e-06, - "loss": 0.8516, - "step": 12092 - }, - { - "epoch": 0.31, - "learning_rate": 1.9719432712488588e-06, - "loss": 0.749, - "step": 12093 - }, - { - "epoch": 0.31, - "learning_rate": 1.9719367623602993e-06, - "loss": 0.8311, - "step": 12094 - }, - { - "epoch": 0.31, - "learning_rate": 1.9719302527275727e-06, - "loss": 0.8696, - "step": 12095 - }, - { - "epoch": 0.31, - "learning_rate": 1.9719237423506836e-06, - "loss": 0.7227, - "step": 12096 - }, - { - "epoch": 0.31, - "learning_rate": 1.9719172312296366e-06, - "loss": 0.772, - "step": 12097 - }, - { - "epoch": 0.31, - "learning_rate": 1.9719107193644378e-06, - "loss": 1.0322, - "step": 12098 - }, - { - "epoch": 0.31, - "learning_rate": 1.971904206755092e-06, - "loss": 1.0479, - "step": 12099 - }, - { - "epoch": 0.31, - "learning_rate": 1.9718976934016034e-06, - "loss": 1.0635, - "step": 12100 - }, - { - "epoch": 0.31, - "learning_rate": 1.9718911793039777e-06, - "loss": 1.1211, - "step": 12101 - }, - { - "epoch": 0.31, - "learning_rate": 1.9718846644622195e-06, - "loss": 0.9365, - "step": 12102 - }, - { - "epoch": 0.31, - "learning_rate": 1.9718781488763336e-06, - "loss": 0.7354, - "step": 12103 - }, - { - "epoch": 0.31, - "learning_rate": 1.971871632546326e-06, - "loss": 0.8789, - "step": 12104 - }, - { - "epoch": 0.31, - "learning_rate": 1.9718651154722e-06, - "loss": 1.0586, - "step": 12105 - }, - { - "epoch": 0.31, - "learning_rate": 1.971858597653962e-06, - "loss": 0.7705, - "step": 12106 - }, - { - "epoch": 0.31, - "learning_rate": 1.971852079091617e-06, - "loss": 0.8389, - "step": 12107 - }, - { - "epoch": 0.31, - "learning_rate": 1.971845559785169e-06, - "loss": 0.7593, - "step": 12108 - }, - { - "epoch": 0.31, - "learning_rate": 1.971839039734624e-06, - "loss": 0.5977, - "step": 12109 - }, - { - "epoch": 0.31, - "learning_rate": 1.971832518939986e-06, - "loss": 0.9492, - "step": 12110 - }, - { - "epoch": 0.31, - "learning_rate": 1.971825997401261e-06, - "loss": 0.9346, - "step": 12111 - }, - { - "epoch": 0.31, - "learning_rate": 1.9718194751184533e-06, - "loss": 0.9561, - "step": 12112 - }, - { - "epoch": 0.31, - "learning_rate": 1.971812952091568e-06, - "loss": 0.6294, - "step": 12113 - }, - { - "epoch": 0.31, - "learning_rate": 1.9718064283206104e-06, - "loss": 1.0879, - "step": 12114 - }, - { - "epoch": 0.31, - "learning_rate": 1.971799903805585e-06, - "loss": 0.7031, - "step": 12115 - }, - { - "epoch": 0.31, - "learning_rate": 1.9717933785464974e-06, - "loss": 0.917, - "step": 12116 - }, - { - "epoch": 0.31, - "learning_rate": 1.9717868525433526e-06, - "loss": 0.9502, - "step": 12117 - }, - { - "epoch": 0.31, - "learning_rate": 1.9717803257961546e-06, - "loss": 0.7205, - "step": 12118 - }, - { - "epoch": 0.31, - "learning_rate": 1.9717737983049094e-06, - "loss": 0.9941, - "step": 12119 - }, - { - "epoch": 0.31, - "learning_rate": 1.971767270069622e-06, - "loss": 0.9229, - "step": 12120 - }, - { - "epoch": 0.31, - "learning_rate": 1.971760741090297e-06, - "loss": 0.8379, - "step": 12121 - }, - { - "epoch": 0.31, - "learning_rate": 1.971754211366939e-06, - "loss": 0.7959, - "step": 12122 - }, - { - "epoch": 0.31, - "learning_rate": 1.9717476808995535e-06, - "loss": 1.0195, - "step": 12123 - }, - { - "epoch": 0.31, - "learning_rate": 1.971741149688146e-06, - "loss": 1.0615, - "step": 12124 - }, - { - "epoch": 0.31, - "learning_rate": 1.9717346177327206e-06, - "loss": 0.834, - "step": 12125 - }, - { - "epoch": 0.31, - "learning_rate": 1.9717280850332827e-06, - "loss": 1.1074, - "step": 12126 - }, - { - "epoch": 0.31, - "learning_rate": 1.9717215515898374e-06, - "loss": 0.9326, - "step": 12127 - }, - { - "epoch": 0.31, - "learning_rate": 1.9717150174023896e-06, - "loss": 1.0088, - "step": 12128 - }, - { - "epoch": 0.31, - "learning_rate": 1.9717084824709446e-06, - "loss": 1.1934, - "step": 12129 - }, - { - "epoch": 0.31, - "learning_rate": 1.9717019467955064e-06, - "loss": 1.0757, - "step": 12130 - }, - { - "epoch": 0.31, - "learning_rate": 1.971695410376081e-06, - "loss": 0.9102, - "step": 12131 - }, - { - "epoch": 0.31, - "learning_rate": 1.9716888732126733e-06, - "loss": 1.0127, - "step": 12132 - }, - { - "epoch": 0.31, - "learning_rate": 1.9716823353052877e-06, - "loss": 0.6724, - "step": 12133 - }, - { - "epoch": 0.31, - "learning_rate": 1.97167579665393e-06, - "loss": 1.0098, - "step": 12134 - }, - { - "epoch": 0.31, - "learning_rate": 1.971669257258605e-06, - "loss": 0.9414, - "step": 12135 - }, - { - "epoch": 0.31, - "learning_rate": 1.971662717119317e-06, - "loss": 1.1797, - "step": 12136 - }, - { - "epoch": 0.31, - "learning_rate": 1.971656176236072e-06, - "loss": 0.9497, - "step": 12137 - }, - { - "epoch": 0.31, - "learning_rate": 1.971649634608874e-06, - "loss": 1.0938, - "step": 12138 - }, - { - "epoch": 0.31, - "learning_rate": 1.971643092237729e-06, - "loss": 0.9619, - "step": 12139 - }, - { - "epoch": 0.31, - "learning_rate": 1.9716365491226417e-06, - "loss": 0.9766, - "step": 12140 - }, - { - "epoch": 0.31, - "learning_rate": 1.9716300052636168e-06, - "loss": 0.907, - "step": 12141 - }, - { - "epoch": 0.31, - "learning_rate": 1.971623460660659e-06, - "loss": 0.9053, - "step": 12142 - }, - { - "epoch": 0.31, - "learning_rate": 1.9716169153137744e-06, - "loss": 0.9707, - "step": 12143 - }, - { - "epoch": 0.31, - "learning_rate": 1.971610369222967e-06, - "loss": 0.7295, - "step": 12144 - }, - { - "epoch": 0.31, - "learning_rate": 1.9716038223882426e-06, - "loss": 0.6226, - "step": 12145 - }, - { - "epoch": 0.31, - "learning_rate": 1.9715972748096055e-06, - "loss": 0.79, - "step": 12146 - }, - { - "epoch": 0.31, - "learning_rate": 1.9715907264870612e-06, - "loss": 0.8115, - "step": 12147 - }, - { - "epoch": 0.31, - "learning_rate": 1.9715841774206145e-06, - "loss": 0.8994, - "step": 12148 - }, - { - "epoch": 0.31, - "learning_rate": 1.9715776276102705e-06, - "loss": 0.8042, - "step": 12149 - }, - { - "epoch": 0.31, - "learning_rate": 1.9715710770560345e-06, - "loss": 0.707, - "step": 12150 - }, - { - "epoch": 0.31, - "learning_rate": 1.9715645257579105e-06, - "loss": 0.7451, - "step": 12151 - }, - { - "epoch": 0.31, - "learning_rate": 1.9715579737159044e-06, - "loss": 1.0205, - "step": 12152 - }, - { - "epoch": 0.31, - "learning_rate": 1.9715514209300213e-06, - "loss": 0.7954, - "step": 12153 - }, - { - "epoch": 0.31, - "learning_rate": 1.9715448674002657e-06, - "loss": 1.0586, - "step": 12154 - }, - { - "epoch": 0.31, - "learning_rate": 1.9715383131266433e-06, - "loss": 0.8203, - "step": 12155 - }, - { - "epoch": 0.31, - "learning_rate": 1.9715317581091587e-06, - "loss": 0.7598, - "step": 12156 - }, - { - "epoch": 0.31, - "learning_rate": 1.9715252023478165e-06, - "loss": 1.0684, - "step": 12157 - }, - { - "epoch": 0.31, - "learning_rate": 1.9715186458426223e-06, - "loss": 0.8374, - "step": 12158 - }, - { - "epoch": 0.31, - "learning_rate": 1.971512088593581e-06, - "loss": 0.8828, - "step": 12159 - }, - { - "epoch": 0.31, - "learning_rate": 1.971505530600697e-06, - "loss": 0.8486, - "step": 12160 - }, - { - "epoch": 0.31, - "learning_rate": 1.971498971863977e-06, - "loss": 0.9814, - "step": 12161 - }, - { - "epoch": 0.31, - "learning_rate": 1.971492412383424e-06, - "loss": 1.0742, - "step": 12162 - }, - { - "epoch": 0.31, - "learning_rate": 1.971485852159044e-06, - "loss": 0.7622, - "step": 12163 - }, - { - "epoch": 0.31, - "learning_rate": 1.9714792911908425e-06, - "loss": 0.874, - "step": 12164 - }, - { - "epoch": 0.31, - "learning_rate": 1.9714727294788232e-06, - "loss": 0.9072, - "step": 12165 - }, - { - "epoch": 0.31, - "learning_rate": 1.9714661670229926e-06, - "loss": 0.8438, - "step": 12166 - }, - { - "epoch": 0.31, - "learning_rate": 1.9714596038233548e-06, - "loss": 0.8945, - "step": 12167 - }, - { - "epoch": 0.31, - "learning_rate": 1.971453039879915e-06, - "loss": 0.9346, - "step": 12168 - }, - { - "epoch": 0.31, - "learning_rate": 1.9714464751926784e-06, - "loss": 0.71, - "step": 12169 - }, - { - "epoch": 0.31, - "learning_rate": 1.9714399097616496e-06, - "loss": 1.1592, - "step": 12170 - }, - { - "epoch": 0.31, - "learning_rate": 1.9714333435868344e-06, - "loss": 0.9346, - "step": 12171 - }, - { - "epoch": 0.31, - "learning_rate": 1.971426776668237e-06, - "loss": 0.8369, - "step": 12172 - }, - { - "epoch": 0.31, - "learning_rate": 1.9714202090058626e-06, - "loss": 0.7871, - "step": 12173 - }, - { - "epoch": 0.31, - "learning_rate": 1.9714136405997165e-06, - "loss": 0.8281, - "step": 12174 - }, - { - "epoch": 0.31, - "learning_rate": 1.971407071449804e-06, - "loss": 0.8013, - "step": 12175 - }, - { - "epoch": 0.31, - "learning_rate": 1.9714005015561295e-06, - "loss": 0.8672, - "step": 12176 - }, - { - "epoch": 0.31, - "learning_rate": 1.9713939309186984e-06, - "loss": 0.7803, - "step": 12177 - }, - { - "epoch": 0.31, - "learning_rate": 1.9713873595375155e-06, - "loss": 1.0947, - "step": 12178 - }, - { - "epoch": 0.31, - "learning_rate": 1.971380787412586e-06, - "loss": 0.8633, - "step": 12179 - }, - { - "epoch": 0.31, - "learning_rate": 1.971374214543915e-06, - "loss": 0.8564, - "step": 12180 - }, - { - "epoch": 0.31, - "learning_rate": 1.9713676409315078e-06, - "loss": 0.7168, - "step": 12181 - }, - { - "epoch": 0.31, - "learning_rate": 1.9713610665753686e-06, - "loss": 0.7637, - "step": 12182 - }, - { - "epoch": 0.31, - "learning_rate": 1.9713544914755028e-06, - "loss": 0.9648, - "step": 12183 - }, - { - "epoch": 0.31, - "learning_rate": 1.9713479156319157e-06, - "loss": 0.8096, - "step": 12184 - }, - { - "epoch": 0.31, - "learning_rate": 1.971341339044612e-06, - "loss": 0.8262, - "step": 12185 - }, - { - "epoch": 0.31, - "learning_rate": 1.971334761713597e-06, - "loss": 0.7017, - "step": 12186 - }, - { - "epoch": 0.31, - "learning_rate": 1.971328183638876e-06, - "loss": 0.7271, - "step": 12187 - }, - { - "epoch": 0.31, - "learning_rate": 1.971321604820453e-06, - "loss": 0.9102, - "step": 12188 - }, - { - "epoch": 0.31, - "learning_rate": 1.9713150252583343e-06, - "loss": 0.9873, - "step": 12189 - }, - { - "epoch": 0.31, - "learning_rate": 1.971308444952524e-06, - "loss": 0.8955, - "step": 12190 - }, - { - "epoch": 0.31, - "learning_rate": 1.9713018639030275e-06, - "loss": 1.0469, - "step": 12191 - }, - { - "epoch": 0.31, - "learning_rate": 1.97129528210985e-06, - "loss": 0.8965, - "step": 12192 - }, - { - "epoch": 0.31, - "learning_rate": 1.9712886995729965e-06, - "loss": 0.8896, - "step": 12193 - }, - { - "epoch": 0.31, - "learning_rate": 1.9712821162924716e-06, - "loss": 0.8335, - "step": 12194 - }, - { - "epoch": 0.31, - "learning_rate": 1.971275532268281e-06, - "loss": 1.1934, - "step": 12195 - }, - { - "epoch": 0.31, - "learning_rate": 1.971268947500429e-06, - "loss": 1.043, - "step": 12196 - }, - { - "epoch": 0.31, - "learning_rate": 1.9712623619889214e-06, - "loss": 0.7119, - "step": 12197 - }, - { - "epoch": 0.31, - "learning_rate": 1.971255775733762e-06, - "loss": 0.8203, - "step": 12198 - }, - { - "epoch": 0.31, - "learning_rate": 1.9712491887349578e-06, - "loss": 0.8457, - "step": 12199 - }, - { - "epoch": 0.31, - "learning_rate": 1.9712426009925124e-06, - "loss": 0.9492, - "step": 12200 - }, - { - "epoch": 0.31, - "learning_rate": 1.971236012506431e-06, - "loss": 0.9932, - "step": 12201 - }, - { - "epoch": 0.31, - "learning_rate": 1.971229423276719e-06, - "loss": 0.8232, - "step": 12202 - }, - { - "epoch": 0.31, - "learning_rate": 1.971222833303381e-06, - "loss": 0.9072, - "step": 12203 - }, - { - "epoch": 0.31, - "learning_rate": 1.9712162425864226e-06, - "loss": 1.2363, - "step": 12204 - }, - { - "epoch": 0.31, - "learning_rate": 1.9712096511258486e-06, - "loss": 1.0635, - "step": 12205 - }, - { - "epoch": 0.31, - "learning_rate": 1.971203058921664e-06, - "loss": 0.8652, - "step": 12206 - }, - { - "epoch": 0.31, - "learning_rate": 1.9711964659738737e-06, - "loss": 1.0596, - "step": 12207 - }, - { - "epoch": 0.31, - "learning_rate": 1.971189872282483e-06, - "loss": 0.875, - "step": 12208 - }, - { - "epoch": 0.31, - "learning_rate": 1.971183277847497e-06, - "loss": 0.8284, - "step": 12209 - }, - { - "epoch": 0.31, - "learning_rate": 1.9711766826689207e-06, - "loss": 0.833, - "step": 12210 - }, - { - "epoch": 0.31, - "learning_rate": 1.971170086746759e-06, - "loss": 0.7715, - "step": 12211 - }, - { - "epoch": 0.31, - "learning_rate": 1.9711634900810168e-06, - "loss": 0.75, - "step": 12212 - }, - { - "epoch": 0.31, - "learning_rate": 1.9711568926716994e-06, - "loss": 1.0566, - "step": 12213 - }, - { - "epoch": 0.31, - "learning_rate": 1.971150294518812e-06, - "loss": 0.8469, - "step": 12214 - }, - { - "epoch": 0.31, - "learning_rate": 1.9711436956223594e-06, - "loss": 0.7222, - "step": 12215 - }, - { - "epoch": 0.31, - "learning_rate": 1.971137095982347e-06, - "loss": 0.8623, - "step": 12216 - }, - { - "epoch": 0.31, - "learning_rate": 1.9711304955987793e-06, - "loss": 0.8262, - "step": 12217 - }, - { - "epoch": 0.31, - "learning_rate": 1.9711238944716615e-06, - "loss": 0.6489, - "step": 12218 - }, - { - "epoch": 0.31, - "learning_rate": 1.971117292600999e-06, - "loss": 1.0762, - "step": 12219 - }, - { - "epoch": 0.31, - "learning_rate": 1.9711106899867965e-06, - "loss": 0.9971, - "step": 12220 - }, - { - "epoch": 0.31, - "learning_rate": 1.9711040866290595e-06, - "loss": 0.9238, - "step": 12221 - }, - { - "epoch": 0.31, - "learning_rate": 1.971097482527792e-06, - "loss": 0.9824, - "step": 12222 - }, - { - "epoch": 0.31, - "learning_rate": 1.9710908776830007e-06, - "loss": 0.8418, - "step": 12223 - }, - { - "epoch": 0.31, - "learning_rate": 1.971084272094689e-06, - "loss": 0.8716, - "step": 12224 - }, - { - "epoch": 0.31, - "learning_rate": 1.9710776657628635e-06, - "loss": 1.0293, - "step": 12225 - }, - { - "epoch": 0.31, - "learning_rate": 1.971071058687528e-06, - "loss": 1.1289, - "step": 12226 - }, - { - "epoch": 0.31, - "learning_rate": 1.9710644508686883e-06, - "loss": 0.9551, - "step": 12227 - }, - { - "epoch": 0.31, - "learning_rate": 1.971057842306349e-06, - "loss": 0.7793, - "step": 12228 - }, - { - "epoch": 0.31, - "learning_rate": 1.9710512330005155e-06, - "loss": 1.0576, - "step": 12229 - }, - { - "epoch": 0.31, - "learning_rate": 1.9710446229511927e-06, - "loss": 0.7266, - "step": 12230 - }, - { - "epoch": 0.31, - "learning_rate": 1.9710380121583855e-06, - "loss": 0.7319, - "step": 12231 - }, - { - "epoch": 0.31, - "learning_rate": 1.9710314006220994e-06, - "loss": 0.8047, - "step": 12232 - }, - { - "epoch": 0.31, - "learning_rate": 1.971024788342339e-06, - "loss": 0.96, - "step": 12233 - }, - { - "epoch": 0.31, - "learning_rate": 1.9710181753191093e-06, - "loss": 1.041, - "step": 12234 - }, - { - "epoch": 0.31, - "learning_rate": 1.9710115615524164e-06, - "loss": 1.0293, - "step": 12235 - }, - { - "epoch": 0.31, - "learning_rate": 1.971004947042264e-06, - "loss": 1.0166, - "step": 12236 - }, - { - "epoch": 0.31, - "learning_rate": 1.9709983317886582e-06, - "loss": 0.9771, - "step": 12237 - }, - { - "epoch": 0.31, - "learning_rate": 1.970991715791603e-06, - "loss": 0.9453, - "step": 12238 - }, - { - "epoch": 0.31, - "learning_rate": 1.9709850990511046e-06, - "loss": 0.8633, - "step": 12239 - }, - { - "epoch": 0.31, - "learning_rate": 1.9709784815671674e-06, - "loss": 0.8594, - "step": 12240 - }, - { - "epoch": 0.31, - "learning_rate": 1.9709718633397965e-06, - "loss": 0.7881, - "step": 12241 - }, - { - "epoch": 0.31, - "learning_rate": 1.970965244368997e-06, - "loss": 0.9658, - "step": 12242 - }, - { - "epoch": 0.31, - "learning_rate": 1.9709586246547744e-06, - "loss": 0.8115, - "step": 12243 - }, - { - "epoch": 0.31, - "learning_rate": 1.9709520041971336e-06, - "loss": 0.8447, - "step": 12244 - }, - { - "epoch": 0.31, - "learning_rate": 1.970945382996079e-06, - "loss": 0.8462, - "step": 12245 - }, - { - "epoch": 0.31, - "learning_rate": 1.9709387610516164e-06, - "loss": 0.9502, - "step": 12246 - }, - { - "epoch": 0.31, - "learning_rate": 1.9709321383637506e-06, - "loss": 1.084, - "step": 12247 - }, - { - "epoch": 0.31, - "learning_rate": 1.9709255149324868e-06, - "loss": 1.0508, - "step": 12248 - }, - { - "epoch": 0.31, - "learning_rate": 1.97091889075783e-06, - "loss": 0.8682, - "step": 12249 - }, - { - "epoch": 0.31, - "learning_rate": 1.970912265839785e-06, - "loss": 0.8599, - "step": 12250 - }, - { - "epoch": 0.31, - "learning_rate": 1.970905640178357e-06, - "loss": 0.7217, - "step": 12251 - }, - { - "epoch": 0.31, - "learning_rate": 1.9708990137735517e-06, - "loss": 0.918, - "step": 12252 - }, - { - "epoch": 0.31, - "learning_rate": 1.9708923866253735e-06, - "loss": 1.1875, - "step": 12253 - }, - { - "epoch": 0.31, - "learning_rate": 1.9708857587338273e-06, - "loss": 1.0791, - "step": 12254 - }, - { - "epoch": 0.31, - "learning_rate": 1.970879130098919e-06, - "loss": 0.8271, - "step": 12255 - }, - { - "epoch": 0.31, - "learning_rate": 1.970872500720653e-06, - "loss": 0.9766, - "step": 12256 - }, - { - "epoch": 0.31, - "learning_rate": 1.9708658705990345e-06, - "loss": 0.9297, - "step": 12257 - }, - { - "epoch": 0.31, - "learning_rate": 1.9708592397340685e-06, - "loss": 0.8887, - "step": 12258 - }, - { - "epoch": 0.31, - "learning_rate": 1.9708526081257608e-06, - "loss": 0.7148, - "step": 12259 - }, - { - "epoch": 0.31, - "learning_rate": 1.970845975774115e-06, - "loss": 0.8564, - "step": 12260 - }, - { - "epoch": 0.31, - "learning_rate": 1.9708393426791375e-06, - "loss": 0.6367, - "step": 12261 - }, - { - "epoch": 0.31, - "learning_rate": 1.970832708840833e-06, - "loss": 0.8027, - "step": 12262 - }, - { - "epoch": 0.31, - "learning_rate": 1.970826074259207e-06, - "loss": 0.7896, - "step": 12263 - }, - { - "epoch": 0.31, - "learning_rate": 1.9708194389342636e-06, - "loss": 0.8672, - "step": 12264 - }, - { - "epoch": 0.31, - "learning_rate": 1.970812802866008e-06, - "loss": 0.8506, - "step": 12265 - }, - { - "epoch": 0.31, - "learning_rate": 1.9708061660544464e-06, - "loss": 0.8809, - "step": 12266 - }, - { - "epoch": 0.31, - "learning_rate": 1.9707995284995832e-06, - "loss": 0.8867, - "step": 12267 - }, - { - "epoch": 0.31, - "learning_rate": 1.970792890201423e-06, - "loss": 0.9199, - "step": 12268 - }, - { - "epoch": 0.31, - "learning_rate": 1.9707862511599715e-06, - "loss": 0.8936, - "step": 12269 - }, - { - "epoch": 0.31, - "learning_rate": 1.9707796113752336e-06, - "loss": 1.082, - "step": 12270 - }, - { - "epoch": 0.31, - "learning_rate": 1.9707729708472145e-06, - "loss": 1.0137, - "step": 12271 - }, - { - "epoch": 0.31, - "learning_rate": 1.970766329575919e-06, - "loss": 0.8359, - "step": 12272 - }, - { - "epoch": 0.31, - "learning_rate": 1.9707596875613523e-06, - "loss": 0.9902, - "step": 12273 - }, - { - "epoch": 0.31, - "learning_rate": 1.9707530448035198e-06, - "loss": 1.1123, - "step": 12274 - }, - { - "epoch": 0.31, - "learning_rate": 1.970746401302426e-06, - "loss": 1.1592, - "step": 12275 - }, - { - "epoch": 0.31, - "learning_rate": 1.9707397570580765e-06, - "loss": 0.9287, - "step": 12276 - }, - { - "epoch": 0.31, - "learning_rate": 1.9707331120704764e-06, - "loss": 1.0068, - "step": 12277 - }, - { - "epoch": 0.31, - "learning_rate": 1.9707264663396303e-06, - "loss": 1.0605, - "step": 12278 - }, - { - "epoch": 0.31, - "learning_rate": 1.9707198198655436e-06, - "loss": 0.8894, - "step": 12279 - }, - { - "epoch": 0.31, - "learning_rate": 1.970713172648221e-06, - "loss": 0.8066, - "step": 12280 - }, - { - "epoch": 0.31, - "learning_rate": 1.9707065246876688e-06, - "loss": 1.0439, - "step": 12281 - }, - { - "epoch": 0.31, - "learning_rate": 1.9706998759838907e-06, - "loss": 0.9443, - "step": 12282 - }, - { - "epoch": 0.31, - "learning_rate": 1.9706932265368925e-06, - "loss": 0.8975, - "step": 12283 - }, - { - "epoch": 0.31, - "learning_rate": 1.970686576346679e-06, - "loss": 0.8945, - "step": 12284 - }, - { - "epoch": 0.31, - "learning_rate": 1.970679925413256e-06, - "loss": 0.7195, - "step": 12285 - }, - { - "epoch": 0.31, - "learning_rate": 1.9706732737366272e-06, - "loss": 0.8988, - "step": 12286 - }, - { - "epoch": 0.31, - "learning_rate": 1.9706666213167988e-06, - "loss": 0.8628, - "step": 12287 - }, - { - "epoch": 0.31, - "learning_rate": 1.9706599681537755e-06, - "loss": 0.8691, - "step": 12288 - }, - { - "epoch": 0.31, - "learning_rate": 1.970653314247563e-06, - "loss": 0.9165, - "step": 12289 - }, - { - "epoch": 0.31, - "learning_rate": 1.9706466595981655e-06, - "loss": 0.8721, - "step": 12290 - }, - { - "epoch": 0.32, - "learning_rate": 1.9706400042055885e-06, - "loss": 0.8525, - "step": 12291 - }, - { - "epoch": 0.32, - "learning_rate": 1.970633348069837e-06, - "loss": 0.7505, - "step": 12292 - }, - { - "epoch": 0.32, - "learning_rate": 1.9706266911909163e-06, - "loss": 1.0049, - "step": 12293 - }, - { - "epoch": 0.32, - "learning_rate": 1.9706200335688313e-06, - "loss": 1.1172, - "step": 12294 - }, - { - "epoch": 0.32, - "learning_rate": 1.9706133752035875e-06, - "loss": 0.7031, - "step": 12295 - }, - { - "epoch": 0.32, - "learning_rate": 1.970606716095189e-06, - "loss": 0.7812, - "step": 12296 - }, - { - "epoch": 0.32, - "learning_rate": 1.9706000562436423e-06, - "loss": 0.9573, - "step": 12297 - }, - { - "epoch": 0.32, - "learning_rate": 1.9705933956489514e-06, - "loss": 1.0391, - "step": 12298 - }, - { - "epoch": 0.32, - "learning_rate": 1.9705867343111217e-06, - "loss": 0.8867, - "step": 12299 - }, - { - "epoch": 0.32, - "learning_rate": 1.9705800722301583e-06, - "loss": 0.7183, - "step": 12300 - }, - { - "epoch": 0.32, - "learning_rate": 1.9705734094060666e-06, - "loss": 0.9443, - "step": 12301 - }, - { - "epoch": 0.32, - "learning_rate": 1.9705667458388512e-06, - "loss": 1.0146, - "step": 12302 - }, - { - "epoch": 0.32, - "learning_rate": 1.970560081528518e-06, - "loss": 0.7317, - "step": 12303 - }, - { - "epoch": 0.32, - "learning_rate": 1.970553416475071e-06, - "loss": 0.9648, - "step": 12304 - }, - { - "epoch": 0.32, - "learning_rate": 1.970546750678516e-06, - "loss": 0.8418, - "step": 12305 - }, - { - "epoch": 0.32, - "learning_rate": 1.970540084138858e-06, - "loss": 0.9229, - "step": 12306 - }, - { - "epoch": 0.32, - "learning_rate": 1.9705334168561027e-06, - "loss": 0.7744, - "step": 12307 - }, - { - "epoch": 0.32, - "learning_rate": 1.970526748830254e-06, - "loss": 1.125, - "step": 12308 - }, - { - "epoch": 0.32, - "learning_rate": 1.9705200800613176e-06, - "loss": 0.9648, - "step": 12309 - }, - { - "epoch": 0.32, - "learning_rate": 1.9705134105492985e-06, - "loss": 0.9062, - "step": 12310 - }, - { - "epoch": 0.32, - "learning_rate": 1.970506740294202e-06, - "loss": 0.9189, - "step": 12311 - }, - { - "epoch": 0.32, - "learning_rate": 1.970500069296033e-06, - "loss": 0.9668, - "step": 12312 - }, - { - "epoch": 0.32, - "learning_rate": 1.9704933975547974e-06, - "loss": 0.8574, - "step": 12313 - }, - { - "epoch": 0.32, - "learning_rate": 1.970486725070499e-06, - "loss": 0.835, - "step": 12314 - }, - { - "epoch": 0.32, - "learning_rate": 1.9704800518431436e-06, - "loss": 0.8564, - "step": 12315 - }, - { - "epoch": 0.32, - "learning_rate": 1.970473377872736e-06, - "loss": 0.8486, - "step": 12316 - }, - { - "epoch": 0.32, - "learning_rate": 1.9704667031592825e-06, - "loss": 0.8555, - "step": 12317 - }, - { - "epoch": 0.32, - "learning_rate": 1.970460027702786e-06, - "loss": 0.8281, - "step": 12318 - }, - { - "epoch": 0.32, - "learning_rate": 1.970453351503254e-06, - "loss": 0.7549, - "step": 12319 - }, - { - "epoch": 0.32, - "learning_rate": 1.97044667456069e-06, - "loss": 1.0068, - "step": 12320 - }, - { - "epoch": 0.32, - "learning_rate": 1.9704399968750994e-06, - "loss": 0.8164, - "step": 12321 - }, - { - "epoch": 0.32, - "learning_rate": 1.9704333184464878e-06, - "loss": 1.0156, - "step": 12322 - }, - { - "epoch": 0.32, - "learning_rate": 1.97042663927486e-06, - "loss": 0.8032, - "step": 12323 - }, - { - "epoch": 0.32, - "learning_rate": 1.970419959360221e-06, - "loss": 0.9209, - "step": 12324 - }, - { - "epoch": 0.32, - "learning_rate": 1.970413278702576e-06, - "loss": 0.8096, - "step": 12325 - }, - { - "epoch": 0.32, - "learning_rate": 1.9704065973019307e-06, - "loss": 0.9268, - "step": 12326 - }, - { - "epoch": 0.32, - "learning_rate": 1.9703999151582893e-06, - "loss": 0.6699, - "step": 12327 - }, - { - "epoch": 0.32, - "learning_rate": 1.9703932322716573e-06, - "loss": 0.7109, - "step": 12328 - }, - { - "epoch": 0.32, - "learning_rate": 1.97038654864204e-06, - "loss": 0.9834, - "step": 12329 - }, - { - "epoch": 0.32, - "learning_rate": 1.970379864269442e-06, - "loss": 0.9053, - "step": 12330 - }, - { - "epoch": 0.32, - "learning_rate": 1.970373179153869e-06, - "loss": 0.6991, - "step": 12331 - }, - { - "epoch": 0.32, - "learning_rate": 1.9703664932953258e-06, - "loss": 0.9854, - "step": 12332 - }, - { - "epoch": 0.32, - "learning_rate": 1.9703598066938177e-06, - "loss": 1.1475, - "step": 12333 - }, - { - "epoch": 0.32, - "learning_rate": 1.9703531193493495e-06, - "loss": 0.8804, - "step": 12334 - }, - { - "epoch": 0.32, - "learning_rate": 1.9703464312619267e-06, - "loss": 0.7207, - "step": 12335 - }, - { - "epoch": 0.32, - "learning_rate": 1.9703397424315544e-06, - "loss": 1.1084, - "step": 12336 - }, - { - "epoch": 0.32, - "learning_rate": 1.9703330528582375e-06, - "loss": 0.8984, - "step": 12337 - }, - { - "epoch": 0.32, - "learning_rate": 1.970326362541981e-06, - "loss": 0.9844, - "step": 12338 - }, - { - "epoch": 0.32, - "learning_rate": 1.9703196714827905e-06, - "loss": 0.8418, - "step": 12339 - }, - { - "epoch": 0.32, - "learning_rate": 1.9703129796806704e-06, - "loss": 1.0762, - "step": 12340 - }, - { - "epoch": 0.32, - "learning_rate": 1.9703062871356265e-06, - "loss": 0.8818, - "step": 12341 - }, - { - "epoch": 0.32, - "learning_rate": 1.9702995938476637e-06, - "loss": 0.7051, - "step": 12342 - }, - { - "epoch": 0.32, - "learning_rate": 1.9702928998167873e-06, - "loss": 1.0215, - "step": 12343 - }, - { - "epoch": 0.32, - "learning_rate": 1.970286205043002e-06, - "loss": 1.1895, - "step": 12344 - }, - { - "epoch": 0.32, - "learning_rate": 1.9702795095263133e-06, - "loss": 1.124, - "step": 12345 - }, - { - "epoch": 0.32, - "learning_rate": 1.970272813266726e-06, - "loss": 0.7139, - "step": 12346 - }, - { - "epoch": 0.32, - "learning_rate": 1.970266116264246e-06, - "loss": 1.0957, - "step": 12347 - }, - { - "epoch": 0.32, - "learning_rate": 1.970259418518877e-06, - "loss": 0.9141, - "step": 12348 - }, - { - "epoch": 0.32, - "learning_rate": 1.9702527200306258e-06, - "loss": 0.8452, - "step": 12349 - }, - { - "epoch": 0.32, - "learning_rate": 1.970246020799496e-06, - "loss": 0.7974, - "step": 12350 - }, - { - "epoch": 0.32, - "learning_rate": 1.970239320825494e-06, - "loss": 0.9355, - "step": 12351 - }, - { - "epoch": 0.32, - "learning_rate": 1.970232620108624e-06, - "loss": 0.8838, - "step": 12352 - }, - { - "epoch": 0.32, - "learning_rate": 1.9702259186488916e-06, - "loss": 1.0, - "step": 12353 - }, - { - "epoch": 0.32, - "learning_rate": 1.9702192164463017e-06, - "loss": 0.9355, - "step": 12354 - }, - { - "epoch": 0.32, - "learning_rate": 1.9702125135008597e-06, - "loss": 0.873, - "step": 12355 - }, - { - "epoch": 0.32, - "learning_rate": 1.9702058098125706e-06, - "loss": 0.7065, - "step": 12356 - }, - { - "epoch": 0.32, - "learning_rate": 1.9701991053814395e-06, - "loss": 0.7021, - "step": 12357 - }, - { - "epoch": 0.32, - "learning_rate": 1.9701924002074716e-06, - "loss": 0.5825, - "step": 12358 - }, - { - "epoch": 0.32, - "learning_rate": 1.970185694290672e-06, - "loss": 0.9268, - "step": 12359 - }, - { - "epoch": 0.32, - "learning_rate": 1.9701789876310454e-06, - "loss": 0.915, - "step": 12360 - }, - { - "epoch": 0.32, - "learning_rate": 1.9701722802285977e-06, - "loss": 0.8721, - "step": 12361 - }, - { - "epoch": 0.32, - "learning_rate": 1.970165572083334e-06, - "loss": 1.1406, - "step": 12362 - }, - { - "epoch": 0.32, - "learning_rate": 1.9701588631952586e-06, - "loss": 0.8398, - "step": 12363 - }, - { - "epoch": 0.32, - "learning_rate": 1.970152153564378e-06, - "loss": 0.8359, - "step": 12364 - }, - { - "epoch": 0.32, - "learning_rate": 1.9701454431906957e-06, - "loss": 0.9619, - "step": 12365 - }, - { - "epoch": 0.32, - "learning_rate": 1.9701387320742173e-06, - "loss": 0.9717, - "step": 12366 - }, - { - "epoch": 0.32, - "learning_rate": 1.970132020214949e-06, - "loss": 0.7261, - "step": 12367 - }, - { - "epoch": 0.32, - "learning_rate": 1.9701253076128952e-06, - "loss": 0.9009, - "step": 12368 - }, - { - "epoch": 0.32, - "learning_rate": 1.970118594268061e-06, - "loss": 0.8076, - "step": 12369 - }, - { - "epoch": 0.32, - "learning_rate": 1.9701118801804514e-06, - "loss": 0.8516, - "step": 12370 - }, - { - "epoch": 0.32, - "learning_rate": 1.970105165350072e-06, - "loss": 0.8125, - "step": 12371 - }, - { - "epoch": 0.32, - "learning_rate": 1.9700984497769276e-06, - "loss": 0.9785, - "step": 12372 - }, - { - "epoch": 0.32, - "learning_rate": 1.9700917334610235e-06, - "loss": 0.6285, - "step": 12373 - }, - { - "epoch": 0.32, - "learning_rate": 1.9700850164023642e-06, - "loss": 0.9326, - "step": 12374 - }, - { - "epoch": 0.32, - "learning_rate": 1.970078298600956e-06, - "loss": 1.0264, - "step": 12375 - }, - { - "epoch": 0.32, - "learning_rate": 1.970071580056803e-06, - "loss": 0.7915, - "step": 12376 - }, - { - "epoch": 0.32, - "learning_rate": 1.9700648607699114e-06, - "loss": 0.7793, - "step": 12377 - }, - { - "epoch": 0.32, - "learning_rate": 1.9700581407402854e-06, - "loss": 0.915, - "step": 12378 - }, - { - "epoch": 0.32, - "learning_rate": 1.9700514199679304e-06, - "loss": 0.9463, - "step": 12379 - }, - { - "epoch": 0.32, - "learning_rate": 1.970044698452852e-06, - "loss": 0.7705, - "step": 12380 - }, - { - "epoch": 0.32, - "learning_rate": 1.9700379761950546e-06, - "loss": 0.7122, - "step": 12381 - }, - { - "epoch": 0.32, - "learning_rate": 1.970031253194544e-06, - "loss": 0.8389, - "step": 12382 - }, - { - "epoch": 0.32, - "learning_rate": 1.970024529451325e-06, - "loss": 0.7559, - "step": 12383 - }, - { - "epoch": 0.32, - "learning_rate": 1.9700178049654024e-06, - "loss": 0.8994, - "step": 12384 - }, - { - "epoch": 0.32, - "learning_rate": 1.9700110797367825e-06, - "loss": 0.875, - "step": 12385 - }, - { - "epoch": 0.32, - "learning_rate": 1.970004353765469e-06, - "loss": 0.8857, - "step": 12386 - }, - { - "epoch": 0.32, - "learning_rate": 1.969997627051468e-06, - "loss": 0.8154, - "step": 12387 - }, - { - "epoch": 0.32, - "learning_rate": 1.9699908995947847e-06, - "loss": 1.1162, - "step": 12388 - }, - { - "epoch": 0.32, - "learning_rate": 1.969984171395424e-06, - "loss": 0.9912, - "step": 12389 - }, - { - "epoch": 0.32, - "learning_rate": 1.969977442453391e-06, - "loss": 0.916, - "step": 12390 - }, - { - "epoch": 0.32, - "learning_rate": 1.9699707127686903e-06, - "loss": 1.1074, - "step": 12391 - }, - { - "epoch": 0.32, - "learning_rate": 1.9699639823413282e-06, - "loss": 0.9922, - "step": 12392 - }, - { - "epoch": 0.32, - "learning_rate": 1.969957251171309e-06, - "loss": 1.0469, - "step": 12393 - }, - { - "epoch": 0.32, - "learning_rate": 1.969950519258638e-06, - "loss": 1.1299, - "step": 12394 - }, - { - "epoch": 0.32, - "learning_rate": 1.969943786603321e-06, - "loss": 0.9072, - "step": 12395 - }, - { - "epoch": 0.32, - "learning_rate": 1.969937053205362e-06, - "loss": 1.0703, - "step": 12396 - }, - { - "epoch": 0.32, - "learning_rate": 1.9699303190647675e-06, - "loss": 1.3232, - "step": 12397 - }, - { - "epoch": 0.32, - "learning_rate": 1.969923584181541e-06, - "loss": 0.7891, - "step": 12398 - }, - { - "epoch": 0.32, - "learning_rate": 1.9699168485556897e-06, - "loss": 0.5786, - "step": 12399 - }, - { - "epoch": 0.32, - "learning_rate": 1.9699101121872174e-06, - "loss": 0.9644, - "step": 12400 - }, - { - "epoch": 0.32, - "learning_rate": 1.9699033750761292e-06, - "loss": 0.7744, - "step": 12401 - }, - { - "epoch": 0.32, - "learning_rate": 1.969896637222431e-06, - "loss": 0.9248, - "step": 12402 - }, - { - "epoch": 0.32, - "learning_rate": 1.9698898986261267e-06, - "loss": 1.0596, - "step": 12403 - }, - { - "epoch": 0.32, - "learning_rate": 1.969883159287223e-06, - "loss": 0.812, - "step": 12404 - }, - { - "epoch": 0.32, - "learning_rate": 1.969876419205724e-06, - "loss": 0.8232, - "step": 12405 - }, - { - "epoch": 0.32, - "learning_rate": 1.9698696783816352e-06, - "loss": 0.7949, - "step": 12406 - }, - { - "epoch": 0.32, - "learning_rate": 1.9698629368149624e-06, - "loss": 0.9053, - "step": 12407 - }, - { - "epoch": 0.32, - "learning_rate": 1.9698561945057097e-06, - "loss": 0.8057, - "step": 12408 - }, - { - "epoch": 0.32, - "learning_rate": 1.9698494514538827e-06, - "loss": 0.688, - "step": 12409 - }, - { - "epoch": 0.32, - "learning_rate": 1.9698427076594865e-06, - "loss": 0.8516, - "step": 12410 - }, - { - "epoch": 0.32, - "learning_rate": 1.9698359631225266e-06, - "loss": 0.7012, - "step": 12411 - }, - { - "epoch": 0.32, - "learning_rate": 1.969829217843008e-06, - "loss": 0.9385, - "step": 12412 - }, - { - "epoch": 0.32, - "learning_rate": 1.9698224718209355e-06, - "loss": 1.0518, - "step": 12413 - }, - { - "epoch": 0.32, - "learning_rate": 1.969815725056314e-06, - "loss": 1.0356, - "step": 12414 - }, - { - "epoch": 0.32, - "learning_rate": 1.96980897754915e-06, - "loss": 0.8174, - "step": 12415 - }, - { - "epoch": 0.32, - "learning_rate": 1.9698022292994474e-06, - "loss": 0.8408, - "step": 12416 - }, - { - "epoch": 0.32, - "learning_rate": 1.969795480307212e-06, - "loss": 1.0771, - "step": 12417 - }, - { - "epoch": 0.32, - "learning_rate": 1.969788730572449e-06, - "loss": 0.834, - "step": 12418 - }, - { - "epoch": 0.32, - "learning_rate": 1.9697819800951633e-06, - "loss": 0.688, - "step": 12419 - }, - { - "epoch": 0.32, - "learning_rate": 1.9697752288753595e-06, - "loss": 0.7839, - "step": 12420 - }, - { - "epoch": 0.32, - "learning_rate": 1.969768476913044e-06, - "loss": 0.8691, - "step": 12421 - }, - { - "epoch": 0.32, - "learning_rate": 1.9697617242082213e-06, - "loss": 0.7561, - "step": 12422 - }, - { - "epoch": 0.32, - "learning_rate": 1.969754970760897e-06, - "loss": 0.9287, - "step": 12423 - }, - { - "epoch": 0.32, - "learning_rate": 1.969748216571075e-06, - "loss": 0.835, - "step": 12424 - }, - { - "epoch": 0.32, - "learning_rate": 1.9697414616387623e-06, - "loss": 0.9658, - "step": 12425 - }, - { - "epoch": 0.32, - "learning_rate": 1.9697347059639624e-06, - "loss": 0.8506, - "step": 12426 - }, - { - "epoch": 0.32, - "learning_rate": 1.969727949546682e-06, - "loss": 1.0176, - "step": 12427 - }, - { - "epoch": 0.32, - "learning_rate": 1.969721192386925e-06, - "loss": 0.8711, - "step": 12428 - }, - { - "epoch": 0.32, - "learning_rate": 1.969714434484697e-06, - "loss": 0.9307, - "step": 12429 - }, - { - "epoch": 0.32, - "learning_rate": 1.9697076758400034e-06, - "loss": 0.7114, - "step": 12430 - }, - { - "epoch": 0.32, - "learning_rate": 1.969700916452849e-06, - "loss": 0.7559, - "step": 12431 - }, - { - "epoch": 0.32, - "learning_rate": 1.9696941563232396e-06, - "loss": 0.8071, - "step": 12432 - }, - { - "epoch": 0.32, - "learning_rate": 1.96968739545118e-06, - "loss": 0.9463, - "step": 12433 - }, - { - "epoch": 0.32, - "learning_rate": 1.969680633836675e-06, - "loss": 0.7587, - "step": 12434 - }, - { - "epoch": 0.32, - "learning_rate": 1.9696738714797304e-06, - "loss": 0.9121, - "step": 12435 - }, - { - "epoch": 0.32, - "learning_rate": 1.9696671083803505e-06, - "loss": 1.123, - "step": 12436 - }, - { - "epoch": 0.32, - "learning_rate": 1.969660344538542e-06, - "loss": 0.832, - "step": 12437 - }, - { - "epoch": 0.32, - "learning_rate": 1.9696535799543086e-06, - "loss": 0.9736, - "step": 12438 - }, - { - "epoch": 0.32, - "learning_rate": 1.969646814627656e-06, - "loss": 0.5723, - "step": 12439 - }, - { - "epoch": 0.32, - "learning_rate": 1.9696400485585896e-06, - "loss": 0.8701, - "step": 12440 - }, - { - "epoch": 0.32, - "learning_rate": 1.9696332817471145e-06, - "loss": 0.9199, - "step": 12441 - }, - { - "epoch": 0.32, - "learning_rate": 1.9696265141932353e-06, - "loss": 0.7754, - "step": 12442 - }, - { - "epoch": 0.32, - "learning_rate": 1.969619745896958e-06, - "loss": 0.8477, - "step": 12443 - }, - { - "epoch": 0.32, - "learning_rate": 1.9696129768582877e-06, - "loss": 0.6147, - "step": 12444 - }, - { - "epoch": 0.32, - "learning_rate": 1.969606207077229e-06, - "loss": 0.9375, - "step": 12445 - }, - { - "epoch": 0.32, - "learning_rate": 1.9695994365537874e-06, - "loss": 1.0352, - "step": 12446 - }, - { - "epoch": 0.32, - "learning_rate": 1.969592665287968e-06, - "loss": 0.999, - "step": 12447 - }, - { - "epoch": 0.32, - "learning_rate": 1.9695858932797764e-06, - "loss": 0.7656, - "step": 12448 - }, - { - "epoch": 0.32, - "learning_rate": 1.9695791205292175e-06, - "loss": 0.833, - "step": 12449 - }, - { - "epoch": 0.32, - "learning_rate": 1.969572347036296e-06, - "loss": 0.8633, - "step": 12450 - }, - { - "epoch": 0.32, - "learning_rate": 1.9695655728010177e-06, - "loss": 0.8691, - "step": 12451 - }, - { - "epoch": 0.32, - "learning_rate": 1.9695587978233877e-06, - "loss": 0.916, - "step": 12452 - }, - { - "epoch": 0.32, - "learning_rate": 1.9695520221034113e-06, - "loss": 0.7827, - "step": 12453 - }, - { - "epoch": 0.32, - "learning_rate": 1.9695452456410935e-06, - "loss": 1.1787, - "step": 12454 - }, - { - "epoch": 0.32, - "learning_rate": 1.9695384684364394e-06, - "loss": 0.7998, - "step": 12455 - }, - { - "epoch": 0.32, - "learning_rate": 1.969531690489454e-06, - "loss": 0.6958, - "step": 12456 - }, - { - "epoch": 0.32, - "learning_rate": 1.969524911800143e-06, - "loss": 0.8418, - "step": 12457 - }, - { - "epoch": 0.32, - "learning_rate": 1.9695181323685115e-06, - "loss": 0.874, - "step": 12458 - }, - { - "epoch": 0.32, - "learning_rate": 1.9695113521945644e-06, - "loss": 0.9189, - "step": 12459 - }, - { - "epoch": 0.32, - "learning_rate": 1.9695045712783068e-06, - "loss": 0.9307, - "step": 12460 - }, - { - "epoch": 0.32, - "learning_rate": 1.9694977896197442e-06, - "loss": 0.9492, - "step": 12461 - }, - { - "epoch": 0.32, - "learning_rate": 1.969491007218882e-06, - "loss": 0.7266, - "step": 12462 - }, - { - "epoch": 0.32, - "learning_rate": 1.969484224075725e-06, - "loss": 0.7305, - "step": 12463 - }, - { - "epoch": 0.32, - "learning_rate": 1.969477440190278e-06, - "loss": 0.9404, - "step": 12464 - }, - { - "epoch": 0.32, - "learning_rate": 1.9694706555625475e-06, - "loss": 0.8691, - "step": 12465 - }, - { - "epoch": 0.32, - "learning_rate": 1.9694638701925378e-06, - "loss": 0.9248, - "step": 12466 - }, - { - "epoch": 0.32, - "learning_rate": 1.969457084080254e-06, - "loss": 0.6606, - "step": 12467 - }, - { - "epoch": 0.32, - "learning_rate": 1.9694502972257016e-06, - "loss": 0.9434, - "step": 12468 - }, - { - "epoch": 0.32, - "learning_rate": 1.9694435096288854e-06, - "loss": 0.9951, - "step": 12469 - }, - { - "epoch": 0.32, - "learning_rate": 1.969436721289811e-06, - "loss": 0.8018, - "step": 12470 - }, - { - "epoch": 0.32, - "learning_rate": 1.9694299322084835e-06, - "loss": 0.7998, - "step": 12471 - }, - { - "epoch": 0.32, - "learning_rate": 1.969423142384908e-06, - "loss": 0.7383, - "step": 12472 - }, - { - "epoch": 0.32, - "learning_rate": 1.9694163518190896e-06, - "loss": 0.877, - "step": 12473 - }, - { - "epoch": 0.32, - "learning_rate": 1.969409560511034e-06, - "loss": 0.9111, - "step": 12474 - }, - { - "epoch": 0.32, - "learning_rate": 1.969402768460746e-06, - "loss": 0.8984, - "step": 12475 - }, - { - "epoch": 0.32, - "learning_rate": 1.969395975668231e-06, - "loss": 1.1514, - "step": 12476 - }, - { - "epoch": 0.32, - "learning_rate": 1.9693891821334937e-06, - "loss": 0.9824, - "step": 12477 - }, - { - "epoch": 0.32, - "learning_rate": 1.96938238785654e-06, - "loss": 0.8516, - "step": 12478 - }, - { - "epoch": 0.32, - "learning_rate": 1.9693755928373748e-06, - "loss": 0.9585, - "step": 12479 - }, - { - "epoch": 0.32, - "learning_rate": 1.969368797076003e-06, - "loss": 0.877, - "step": 12480 - }, - { - "epoch": 0.32, - "learning_rate": 1.9693620005724303e-06, - "loss": 0.9268, - "step": 12481 - }, - { - "epoch": 0.32, - "learning_rate": 1.969355203326662e-06, - "loss": 0.8721, - "step": 12482 - }, - { - "epoch": 0.32, - "learning_rate": 1.9693484053387023e-06, - "loss": 0.8975, - "step": 12483 - }, - { - "epoch": 0.32, - "learning_rate": 1.9693416066085575e-06, - "loss": 0.7686, - "step": 12484 - }, - { - "epoch": 0.32, - "learning_rate": 1.9693348071362322e-06, - "loss": 0.8818, - "step": 12485 - }, - { - "epoch": 0.32, - "learning_rate": 1.969328006921732e-06, - "loss": 0.9531, - "step": 12486 - }, - { - "epoch": 0.32, - "learning_rate": 1.969321205965062e-06, - "loss": 0.9707, - "step": 12487 - }, - { - "epoch": 0.32, - "learning_rate": 1.969314404266227e-06, - "loss": 0.9316, - "step": 12488 - }, - { - "epoch": 0.32, - "learning_rate": 1.9693076018252327e-06, - "loss": 0.7881, - "step": 12489 - }, - { - "epoch": 0.32, - "learning_rate": 1.9693007986420845e-06, - "loss": 0.7231, - "step": 12490 - }, - { - "epoch": 0.32, - "learning_rate": 1.9692939947167868e-06, - "loss": 0.9434, - "step": 12491 - }, - { - "epoch": 0.32, - "learning_rate": 1.9692871900493454e-06, - "loss": 0.9766, - "step": 12492 - }, - { - "epoch": 0.32, - "learning_rate": 1.969280384639765e-06, - "loss": 1.1758, - "step": 12493 - }, - { - "epoch": 0.32, - "learning_rate": 1.969273578488052e-06, - "loss": 1.0762, - "step": 12494 - }, - { - "epoch": 0.32, - "learning_rate": 1.9692667715942103e-06, - "loss": 0.957, - "step": 12495 - }, - { - "epoch": 0.32, - "learning_rate": 1.9692599639582455e-06, - "loss": 1.002, - "step": 12496 - }, - { - "epoch": 0.32, - "learning_rate": 1.969253155580163e-06, - "loss": 0.54, - "step": 12497 - }, - { - "epoch": 0.32, - "learning_rate": 1.969246346459968e-06, - "loss": 1.1357, - "step": 12498 - }, - { - "epoch": 0.32, - "learning_rate": 1.9692395365976656e-06, - "loss": 0.8955, - "step": 12499 - }, - { - "epoch": 0.32, - "learning_rate": 1.9692327259932606e-06, - "loss": 0.6982, - "step": 12500 - }, - { - "epoch": 0.32, - "learning_rate": 1.9692259146467595e-06, - "loss": 1.0537, - "step": 12501 - }, - { - "epoch": 0.32, - "learning_rate": 1.969219102558166e-06, - "loss": 0.7075, - "step": 12502 - }, - { - "epoch": 0.32, - "learning_rate": 1.9692122897274867e-06, - "loss": 0.9756, - "step": 12503 - }, - { - "epoch": 0.32, - "learning_rate": 1.9692054761547255e-06, - "loss": 0.8789, - "step": 12504 - }, - { - "epoch": 0.32, - "learning_rate": 1.9691986618398885e-06, - "loss": 1.0537, - "step": 12505 - }, - { - "epoch": 0.32, - "learning_rate": 1.9691918467829807e-06, - "loss": 0.959, - "step": 12506 - }, - { - "epoch": 0.32, - "learning_rate": 1.9691850309840073e-06, - "loss": 0.8848, - "step": 12507 - }, - { - "epoch": 0.32, - "learning_rate": 1.9691782144429733e-06, - "loss": 0.8369, - "step": 12508 - }, - { - "epoch": 0.32, - "learning_rate": 1.969171397159884e-06, - "loss": 0.8867, - "step": 12509 - }, - { - "epoch": 0.32, - "learning_rate": 1.969164579134745e-06, - "loss": 0.8628, - "step": 12510 - }, - { - "epoch": 0.32, - "learning_rate": 1.969157760367561e-06, - "loss": 0.8965, - "step": 12511 - }, - { - "epoch": 0.32, - "learning_rate": 1.9691509408583375e-06, - "loss": 0.8218, - "step": 12512 - }, - { - "epoch": 0.32, - "learning_rate": 1.96914412060708e-06, - "loss": 0.873, - "step": 12513 - }, - { - "epoch": 0.32, - "learning_rate": 1.9691372996137933e-06, - "loss": 1.1299, - "step": 12514 - }, - { - "epoch": 0.32, - "learning_rate": 1.9691304778784823e-06, - "loss": 0.9141, - "step": 12515 - }, - { - "epoch": 0.32, - "learning_rate": 1.969123655401153e-06, - "loss": 0.9229, - "step": 12516 - }, - { - "epoch": 0.32, - "learning_rate": 1.96911683218181e-06, - "loss": 0.9648, - "step": 12517 - }, - { - "epoch": 0.32, - "learning_rate": 1.969110008220459e-06, - "loss": 0.7832, - "step": 12518 - }, - { - "epoch": 0.32, - "learning_rate": 1.9691031835171053e-06, - "loss": 0.9961, - "step": 12519 - }, - { - "epoch": 0.32, - "learning_rate": 1.9690963580717535e-06, - "loss": 0.876, - "step": 12520 - }, - { - "epoch": 0.32, - "learning_rate": 1.9690895318844097e-06, - "loss": 0.7627, - "step": 12521 - }, - { - "epoch": 0.32, - "learning_rate": 1.969082704955078e-06, - "loss": 0.959, - "step": 12522 - }, - { - "epoch": 0.32, - "learning_rate": 1.9690758772837645e-06, - "loss": 1.0078, - "step": 12523 - }, - { - "epoch": 0.32, - "learning_rate": 1.969069048870474e-06, - "loss": 0.8408, - "step": 12524 - }, - { - "epoch": 0.32, - "learning_rate": 1.969062219715212e-06, - "loss": 0.7822, - "step": 12525 - }, - { - "epoch": 0.32, - "learning_rate": 1.9690553898179837e-06, - "loss": 1.0078, - "step": 12526 - }, - { - "epoch": 0.32, - "learning_rate": 1.969048559178794e-06, - "loss": 0.9023, - "step": 12527 - }, - { - "epoch": 0.32, - "learning_rate": 1.9690417277976484e-06, - "loss": 0.8931, - "step": 12528 - }, - { - "epoch": 0.32, - "learning_rate": 1.9690348956745522e-06, - "loss": 1.0176, - "step": 12529 - }, - { - "epoch": 0.32, - "learning_rate": 1.9690280628095107e-06, - "loss": 0.9434, - "step": 12530 - }, - { - "epoch": 0.32, - "learning_rate": 1.969021229202529e-06, - "loss": 1.0244, - "step": 12531 - }, - { - "epoch": 0.32, - "learning_rate": 1.9690143948536123e-06, - "loss": 0.9219, - "step": 12532 - }, - { - "epoch": 0.32, - "learning_rate": 1.9690075597627656e-06, - "loss": 0.9629, - "step": 12533 - }, - { - "epoch": 0.32, - "learning_rate": 1.969000723929994e-06, - "loss": 1.0127, - "step": 12534 - }, - { - "epoch": 0.32, - "learning_rate": 1.968993887355304e-06, - "loss": 0.8774, - "step": 12535 - }, - { - "epoch": 0.32, - "learning_rate": 1.9689870500386996e-06, - "loss": 1.0195, - "step": 12536 - }, - { - "epoch": 0.32, - "learning_rate": 1.968980211980186e-06, - "loss": 1.1582, - "step": 12537 - }, - { - "epoch": 0.32, - "learning_rate": 1.968973373179769e-06, - "loss": 0.9883, - "step": 12538 - }, - { - "epoch": 0.32, - "learning_rate": 1.968966533637454e-06, - "loss": 1.0977, - "step": 12539 - }, - { - "epoch": 0.32, - "learning_rate": 1.9689596933532453e-06, - "loss": 0.9316, - "step": 12540 - }, - { - "epoch": 0.32, - "learning_rate": 1.968952852327149e-06, - "loss": 0.7031, - "step": 12541 - }, - { - "epoch": 0.32, - "learning_rate": 1.9689460105591702e-06, - "loss": 0.9326, - "step": 12542 - }, - { - "epoch": 0.32, - "learning_rate": 1.9689391680493135e-06, - "loss": 0.957, - "step": 12543 - }, - { - "epoch": 0.32, - "learning_rate": 1.968932324797585e-06, - "loss": 0.7988, - "step": 12544 - }, - { - "epoch": 0.32, - "learning_rate": 1.9689254808039897e-06, - "loss": 0.7725, - "step": 12545 - }, - { - "epoch": 0.32, - "learning_rate": 1.9689186360685328e-06, - "loss": 1.1494, - "step": 12546 - }, - { - "epoch": 0.32, - "learning_rate": 1.968911790591219e-06, - "loss": 0.9941, - "step": 12547 - }, - { - "epoch": 0.32, - "learning_rate": 1.9689049443720546e-06, - "loss": 1.0479, - "step": 12548 - }, - { - "epoch": 0.32, - "learning_rate": 1.9688980974110436e-06, - "loss": 1.1631, - "step": 12549 - }, - { - "epoch": 0.32, - "learning_rate": 1.968891249708192e-06, - "loss": 0.8818, - "step": 12550 - }, - { - "epoch": 0.32, - "learning_rate": 1.968884401263505e-06, - "loss": 0.7939, - "step": 12551 - }, - { - "epoch": 0.32, - "learning_rate": 1.968877552076988e-06, - "loss": 0.9482, - "step": 12552 - }, - { - "epoch": 0.32, - "learning_rate": 1.968870702148646e-06, - "loss": 0.8027, - "step": 12553 - }, - { - "epoch": 0.32, - "learning_rate": 1.968863851478484e-06, - "loss": 0.7832, - "step": 12554 - }, - { - "epoch": 0.32, - "learning_rate": 1.9688570000665075e-06, - "loss": 0.5684, - "step": 12555 - }, - { - "epoch": 0.32, - "learning_rate": 1.9688501479127216e-06, - "loss": 0.7842, - "step": 12556 - }, - { - "epoch": 0.32, - "learning_rate": 1.9688432950171322e-06, - "loss": 0.9268, - "step": 12557 - }, - { - "epoch": 0.32, - "learning_rate": 1.968836441379744e-06, - "loss": 0.9434, - "step": 12558 - }, - { - "epoch": 0.32, - "learning_rate": 1.968829587000562e-06, - "loss": 1.0117, - "step": 12559 - }, - { - "epoch": 0.32, - "learning_rate": 1.9688227318795913e-06, - "loss": 1.0908, - "step": 12560 - }, - { - "epoch": 0.32, - "learning_rate": 1.9688158760168383e-06, - "loss": 0.8066, - "step": 12561 - }, - { - "epoch": 0.32, - "learning_rate": 1.968809019412307e-06, - "loss": 0.999, - "step": 12562 - }, - { - "epoch": 0.32, - "learning_rate": 1.968802162066004e-06, - "loss": 0.8135, - "step": 12563 - }, - { - "epoch": 0.32, - "learning_rate": 1.9687953039779327e-06, - "loss": 0.7349, - "step": 12564 - }, - { - "epoch": 0.32, - "learning_rate": 1.9687884451481e-06, - "loss": 0.9678, - "step": 12565 - }, - { - "epoch": 0.32, - "learning_rate": 1.9687815855765102e-06, - "loss": 0.7949, - "step": 12566 - }, - { - "epoch": 0.32, - "learning_rate": 1.968774725263169e-06, - "loss": 1.0625, - "step": 12567 - }, - { - "epoch": 0.32, - "learning_rate": 1.968767864208082e-06, - "loss": 0.6665, - "step": 12568 - }, - { - "epoch": 0.32, - "learning_rate": 1.9687610024112534e-06, - "loss": 1.0068, - "step": 12569 - }, - { - "epoch": 0.32, - "learning_rate": 1.9687541398726894e-06, - "loss": 0.8262, - "step": 12570 - }, - { - "epoch": 0.32, - "learning_rate": 1.968747276592395e-06, - "loss": 0.8052, - "step": 12571 - }, - { - "epoch": 0.32, - "learning_rate": 1.968740412570375e-06, - "loss": 0.9004, - "step": 12572 - }, - { - "epoch": 0.32, - "learning_rate": 1.968733547806635e-06, - "loss": 0.7832, - "step": 12573 - }, - { - "epoch": 0.32, - "learning_rate": 1.9687266823011807e-06, - "loss": 0.9092, - "step": 12574 - }, - { - "epoch": 0.32, - "learning_rate": 1.9687198160540163e-06, - "loss": 0.7715, - "step": 12575 - }, - { - "epoch": 0.32, - "learning_rate": 1.968712949065148e-06, - "loss": 0.812, - "step": 12576 - }, - { - "epoch": 0.32, - "learning_rate": 1.968706081334581e-06, - "loss": 0.8721, - "step": 12577 - }, - { - "epoch": 0.32, - "learning_rate": 1.9686992128623198e-06, - "loss": 0.8862, - "step": 12578 - }, - { - "epoch": 0.32, - "learning_rate": 1.9686923436483704e-06, - "loss": 0.8408, - "step": 12579 - }, - { - "epoch": 0.32, - "learning_rate": 1.9686854736927374e-06, - "loss": 0.5581, - "step": 12580 - }, - { - "epoch": 0.32, - "learning_rate": 1.9686786029954276e-06, - "loss": 1.0166, - "step": 12581 - }, - { - "epoch": 0.32, - "learning_rate": 1.9686717315564443e-06, - "loss": 1.0713, - "step": 12582 - }, - { - "epoch": 0.32, - "learning_rate": 1.9686648593757934e-06, - "loss": 0.9253, - "step": 12583 - }, - { - "epoch": 0.32, - "learning_rate": 1.968657986453481e-06, - "loss": 1.0371, - "step": 12584 - }, - { - "epoch": 0.32, - "learning_rate": 1.968651112789511e-06, - "loss": 0.9707, - "step": 12585 - }, - { - "epoch": 0.32, - "learning_rate": 1.96864423838389e-06, - "loss": 0.8755, - "step": 12586 - }, - { - "epoch": 0.32, - "learning_rate": 1.9686373632366222e-06, - "loss": 0.834, - "step": 12587 - }, - { - "epoch": 0.32, - "learning_rate": 1.9686304873477136e-06, - "loss": 0.8242, - "step": 12588 - }, - { - "epoch": 0.32, - "learning_rate": 1.9686236107171692e-06, - "loss": 0.9697, - "step": 12589 - }, - { - "epoch": 0.32, - "learning_rate": 1.968616733344994e-06, - "loss": 1.0098, - "step": 12590 - }, - { - "epoch": 0.32, - "learning_rate": 1.9686098552311938e-06, - "loss": 0.958, - "step": 12591 - }, - { - "epoch": 0.32, - "learning_rate": 1.9686029763757733e-06, - "loss": 0.9531, - "step": 12592 - }, - { - "epoch": 0.32, - "learning_rate": 1.968596096778738e-06, - "loss": 1.0342, - "step": 12593 - }, - { - "epoch": 0.32, - "learning_rate": 1.9685892164400933e-06, - "loss": 0.8062, - "step": 12594 - }, - { - "epoch": 0.32, - "learning_rate": 1.9685823353598447e-06, - "loss": 0.8271, - "step": 12595 - }, - { - "epoch": 0.32, - "learning_rate": 1.9685754535379967e-06, - "loss": 0.8477, - "step": 12596 - }, - { - "epoch": 0.32, - "learning_rate": 1.9685685709745552e-06, - "loss": 0.9814, - "step": 12597 - }, - { - "epoch": 0.32, - "learning_rate": 1.9685616876695255e-06, - "loss": 0.7627, - "step": 12598 - }, - { - "epoch": 0.32, - "learning_rate": 1.9685548036229124e-06, - "loss": 1.0566, - "step": 12599 - }, - { - "epoch": 0.32, - "learning_rate": 1.968547918834721e-06, - "loss": 1.0088, - "step": 12600 - }, - { - "epoch": 0.32, - "learning_rate": 1.968541033304958e-06, - "loss": 0.8604, - "step": 12601 - }, - { - "epoch": 0.32, - "learning_rate": 1.968534147033627e-06, - "loss": 0.7959, - "step": 12602 - }, - { - "epoch": 0.32, - "learning_rate": 1.9685272600207338e-06, - "loss": 0.7656, - "step": 12603 - }, - { - "epoch": 0.32, - "learning_rate": 1.9685203722662844e-06, - "loss": 1.1494, - "step": 12604 - }, - { - "epoch": 0.32, - "learning_rate": 1.9685134837702826e-06, - "loss": 0.8848, - "step": 12605 - }, - { - "epoch": 0.32, - "learning_rate": 1.9685065945327353e-06, - "loss": 0.9863, - "step": 12606 - }, - { - "epoch": 0.32, - "learning_rate": 1.968499704553647e-06, - "loss": 0.8408, - "step": 12607 - }, - { - "epoch": 0.32, - "learning_rate": 1.9684928138330226e-06, - "loss": 1.0146, - "step": 12608 - }, - { - "epoch": 0.32, - "learning_rate": 1.968485922370868e-06, - "loss": 0.9756, - "step": 12609 - }, - { - "epoch": 0.32, - "learning_rate": 1.9684790301671885e-06, - "loss": 0.8984, - "step": 12610 - }, - { - "epoch": 0.32, - "learning_rate": 1.9684721372219886e-06, - "loss": 0.6523, - "step": 12611 - }, - { - "epoch": 0.32, - "learning_rate": 1.9684652435352745e-06, - "loss": 0.998, - "step": 12612 - }, - { - "epoch": 0.32, - "learning_rate": 1.9684583491070513e-06, - "loss": 0.8838, - "step": 12613 - }, - { - "epoch": 0.32, - "learning_rate": 1.9684514539373235e-06, - "loss": 0.8359, - "step": 12614 - }, - { - "epoch": 0.32, - "learning_rate": 1.9684445580260976e-06, - "loss": 0.6777, - "step": 12615 - }, - { - "epoch": 0.32, - "learning_rate": 1.968437661373378e-06, - "loss": 0.9395, - "step": 12616 - }, - { - "epoch": 0.32, - "learning_rate": 1.9684307639791696e-06, - "loss": 0.6689, - "step": 12617 - }, - { - "epoch": 0.32, - "learning_rate": 1.968423865843479e-06, - "loss": 0.8926, - "step": 12618 - }, - { - "epoch": 0.32, - "learning_rate": 1.9684169669663104e-06, - "loss": 0.9766, - "step": 12619 - }, - { - "epoch": 0.32, - "learning_rate": 1.9684100673476696e-06, - "loss": 1.2344, - "step": 12620 - }, - { - "epoch": 0.32, - "learning_rate": 1.968403166987562e-06, - "loss": 0.8882, - "step": 12621 - }, - { - "epoch": 0.32, - "learning_rate": 1.9683962658859926e-06, - "loss": 0.9653, - "step": 12622 - }, - { - "epoch": 0.32, - "learning_rate": 1.968389364042966e-06, - "loss": 0.9531, - "step": 12623 - }, - { - "epoch": 0.32, - "learning_rate": 1.968382461458489e-06, - "loss": 0.9756, - "step": 12624 - }, - { - "epoch": 0.32, - "learning_rate": 1.968375558132566e-06, - "loss": 0.9092, - "step": 12625 - }, - { - "epoch": 0.32, - "learning_rate": 1.9683686540652017e-06, - "loss": 0.9727, - "step": 12626 - }, - { - "epoch": 0.32, - "learning_rate": 1.9683617492564025e-06, - "loss": 0.9385, - "step": 12627 - }, - { - "epoch": 0.32, - "learning_rate": 1.9683548437061733e-06, - "loss": 0.8389, - "step": 12628 - }, - { - "epoch": 0.32, - "learning_rate": 1.9683479374145193e-06, - "loss": 0.7266, - "step": 12629 - }, - { - "epoch": 0.32, - "learning_rate": 1.968341030381446e-06, - "loss": 1.0566, - "step": 12630 - }, - { - "epoch": 0.32, - "learning_rate": 1.9683341226069577e-06, - "loss": 0.9473, - "step": 12631 - }, - { - "epoch": 0.32, - "learning_rate": 1.9683272140910612e-06, - "loss": 0.9189, - "step": 12632 - }, - { - "epoch": 0.32, - "learning_rate": 1.968320304833761e-06, - "loss": 1.0361, - "step": 12633 - }, - { - "epoch": 0.32, - "learning_rate": 1.968313394835062e-06, - "loss": 1.002, - "step": 12634 - }, - { - "epoch": 0.32, - "learning_rate": 1.9683064840949707e-06, - "loss": 0.9883, - "step": 12635 - }, - { - "epoch": 0.32, - "learning_rate": 1.968299572613491e-06, - "loss": 0.9053, - "step": 12636 - }, - { - "epoch": 0.32, - "learning_rate": 1.9682926603906295e-06, - "loss": 0.6416, - "step": 12637 - }, - { - "epoch": 0.32, - "learning_rate": 1.9682857474263904e-06, - "loss": 0.8838, - "step": 12638 - }, - { - "epoch": 0.32, - "learning_rate": 1.9682788337207793e-06, - "loss": 0.701, - "step": 12639 - }, - { - "epoch": 0.32, - "learning_rate": 1.968271919273802e-06, - "loss": 0.7666, - "step": 12640 - }, - { - "epoch": 0.32, - "learning_rate": 1.968265004085463e-06, - "loss": 0.7891, - "step": 12641 - }, - { - "epoch": 0.32, - "learning_rate": 1.9682580881557684e-06, - "loss": 1.0664, - "step": 12642 - }, - { - "epoch": 0.32, - "learning_rate": 1.968251171484723e-06, - "loss": 0.738, - "step": 12643 - }, - { - "epoch": 0.32, - "learning_rate": 1.968244254072332e-06, - "loss": 0.9629, - "step": 12644 - }, - { - "epoch": 0.32, - "learning_rate": 1.968237335918601e-06, - "loss": 0.8213, - "step": 12645 - }, - { - "epoch": 0.32, - "learning_rate": 1.9682304170235354e-06, - "loss": 0.7095, - "step": 12646 - }, - { - "epoch": 0.32, - "learning_rate": 1.96822349738714e-06, - "loss": 0.897, - "step": 12647 - }, - { - "epoch": 0.32, - "learning_rate": 1.9682165770094206e-06, - "loss": 0.8374, - "step": 12648 - }, - { - "epoch": 0.32, - "learning_rate": 1.968209655890382e-06, - "loss": 0.9756, - "step": 12649 - }, - { - "epoch": 0.32, - "learning_rate": 1.96820273403003e-06, - "loss": 0.8438, - "step": 12650 - }, - { - "epoch": 0.32, - "learning_rate": 1.9681958114283693e-06, - "loss": 0.9443, - "step": 12651 - }, - { - "epoch": 0.32, - "learning_rate": 1.9681888880854063e-06, - "loss": 0.9404, - "step": 12652 - }, - { - "epoch": 0.32, - "learning_rate": 1.968181964001145e-06, - "loss": 0.9873, - "step": 12653 - }, - { - "epoch": 0.32, - "learning_rate": 1.9681750391755915e-06, - "loss": 0.9688, - "step": 12654 - }, - { - "epoch": 0.32, - "learning_rate": 1.968168113608751e-06, - "loss": 0.918, - "step": 12655 - }, - { - "epoch": 0.32, - "learning_rate": 1.9681611873006285e-06, - "loss": 0.7568, - "step": 12656 - }, - { - "epoch": 0.32, - "learning_rate": 1.9681542602512297e-06, - "loss": 0.9062, - "step": 12657 - }, - { - "epoch": 0.32, - "learning_rate": 1.9681473324605594e-06, - "loss": 0.6234, - "step": 12658 - }, - { - "epoch": 0.32, - "learning_rate": 1.9681404039286234e-06, - "loss": 0.5459, - "step": 12659 - }, - { - "epoch": 0.32, - "learning_rate": 1.968133474655427e-06, - "loss": 0.9863, - "step": 12660 - }, - { - "epoch": 0.32, - "learning_rate": 1.9681265446409752e-06, - "loss": 0.7598, - "step": 12661 - }, - { - "epoch": 0.32, - "learning_rate": 1.9681196138852733e-06, - "loss": 0.8301, - "step": 12662 - }, - { - "epoch": 0.32, - "learning_rate": 1.968112682388327e-06, - "loss": 0.8945, - "step": 12663 - }, - { - "epoch": 0.32, - "learning_rate": 1.968105750150141e-06, - "loss": 0.9668, - "step": 12664 - }, - { - "epoch": 0.32, - "learning_rate": 1.968098817170721e-06, - "loss": 0.9443, - "step": 12665 - }, - { - "epoch": 0.32, - "learning_rate": 1.968091883450072e-06, - "loss": 0.9258, - "step": 12666 - }, - { - "epoch": 0.32, - "learning_rate": 1.9680849489882e-06, - "loss": 0.834, - "step": 12667 - }, - { - "epoch": 0.32, - "learning_rate": 1.9680780137851098e-06, - "loss": 0.8633, - "step": 12668 - }, - { - "epoch": 0.32, - "learning_rate": 1.9680710778408067e-06, - "loss": 0.7632, - "step": 12669 - }, - { - "epoch": 0.32, - "learning_rate": 1.968064141155296e-06, - "loss": 1.0479, - "step": 12670 - }, - { - "epoch": 0.32, - "learning_rate": 1.968057203728583e-06, - "loss": 0.8232, - "step": 12671 - }, - { - "epoch": 0.32, - "learning_rate": 1.9680502655606737e-06, - "loss": 1.0771, - "step": 12672 - }, - { - "epoch": 0.32, - "learning_rate": 1.968043326651572e-06, - "loss": 0.9336, - "step": 12673 - }, - { - "epoch": 0.32, - "learning_rate": 1.968036387001285e-06, - "loss": 0.9844, - "step": 12674 - }, - { - "epoch": 0.32, - "learning_rate": 1.9680294466098162e-06, - "loss": 0.9473, - "step": 12675 - }, - { - "epoch": 0.32, - "learning_rate": 1.968022505477172e-06, - "loss": 1.042, - "step": 12676 - }, - { - "epoch": 0.32, - "learning_rate": 1.9680155636033575e-06, - "loss": 0.793, - "step": 12677 - }, - { - "epoch": 0.32, - "learning_rate": 1.968008620988378e-06, - "loss": 0.9131, - "step": 12678 - }, - { - "epoch": 0.32, - "learning_rate": 1.968001677632239e-06, - "loss": 0.9756, - "step": 12679 - }, - { - "epoch": 0.32, - "learning_rate": 1.9679947335349457e-06, - "loss": 0.7002, - "step": 12680 - }, - { - "epoch": 0.33, - "learning_rate": 1.9679877886965027e-06, - "loss": 0.9463, - "step": 12681 - }, - { - "epoch": 0.33, - "learning_rate": 1.9679808431169165e-06, - "loss": 0.9766, - "step": 12682 - }, - { - "epoch": 0.33, - "learning_rate": 1.9679738967961917e-06, - "loss": 0.7119, - "step": 12683 - }, - { - "epoch": 0.33, - "learning_rate": 1.967966949734334e-06, - "loss": 0.9707, - "step": 12684 - }, - { - "epoch": 0.33, - "learning_rate": 1.9679600019313484e-06, - "loss": 1.001, - "step": 12685 - }, - { - "epoch": 0.33, - "learning_rate": 1.9679530533872405e-06, - "loss": 0.7539, - "step": 12686 - }, - { - "epoch": 0.33, - "learning_rate": 1.9679461041020147e-06, - "loss": 0.843, - "step": 12687 - }, - { - "epoch": 0.33, - "learning_rate": 1.967939154075678e-06, - "loss": 0.9912, - "step": 12688 - }, - { - "epoch": 0.33, - "learning_rate": 1.9679322033082343e-06, - "loss": 1.0352, - "step": 12689 - }, - { - "epoch": 0.33, - "learning_rate": 1.9679252517996898e-06, - "loss": 0.54, - "step": 12690 - }, - { - "epoch": 0.33, - "learning_rate": 1.967918299550049e-06, - "loss": 0.9111, - "step": 12691 - }, - { - "epoch": 0.33, - "learning_rate": 1.967911346559318e-06, - "loss": 0.8242, - "step": 12692 - }, - { - "epoch": 0.33, - "learning_rate": 1.9679043928275013e-06, - "loss": 0.7283, - "step": 12693 - }, - { - "epoch": 0.33, - "learning_rate": 1.9678974383546053e-06, - "loss": 0.9023, - "step": 12694 - }, - { - "epoch": 0.33, - "learning_rate": 1.9678904831406343e-06, - "loss": 0.8135, - "step": 12695 - }, - { - "epoch": 0.33, - "learning_rate": 1.967883527185594e-06, - "loss": 0.9141, - "step": 12696 - }, - { - "epoch": 0.33, - "learning_rate": 1.9678765704894903e-06, - "loss": 0.8838, - "step": 12697 - }, - { - "epoch": 0.33, - "learning_rate": 1.9678696130523276e-06, - "loss": 1.0391, - "step": 12698 - }, - { - "epoch": 0.33, - "learning_rate": 1.967862654874112e-06, - "loss": 0.9277, - "step": 12699 - }, - { - "epoch": 0.33, - "learning_rate": 1.967855695954848e-06, - "loss": 0.8525, - "step": 12700 - }, - { - "epoch": 0.33, - "learning_rate": 1.967848736294542e-06, - "loss": 0.8296, - "step": 12701 - }, - { - "epoch": 0.33, - "learning_rate": 1.9678417758931984e-06, - "loss": 0.9883, - "step": 12702 - }, - { - "epoch": 0.33, - "learning_rate": 1.9678348147508226e-06, - "loss": 0.8389, - "step": 12703 - }, - { - "epoch": 0.33, - "learning_rate": 1.9678278528674205e-06, - "loss": 1.0801, - "step": 12704 - }, - { - "epoch": 0.33, - "learning_rate": 1.967820890242997e-06, - "loss": 0.8691, - "step": 12705 - }, - { - "epoch": 0.33, - "learning_rate": 1.967813926877558e-06, - "loss": 0.8408, - "step": 12706 - }, - { - "epoch": 0.33, - "learning_rate": 1.9678069627711075e-06, - "loss": 0.7632, - "step": 12707 - }, - { - "epoch": 0.33, - "learning_rate": 1.9677999979236525e-06, - "loss": 1.0918, - "step": 12708 - }, - { - "epoch": 0.33, - "learning_rate": 1.967793032335197e-06, - "loss": 0.7209, - "step": 12709 - }, - { - "epoch": 0.33, - "learning_rate": 1.9677860660057472e-06, - "loss": 0.7104, - "step": 12710 - }, - { - "epoch": 0.33, - "learning_rate": 1.967779098935308e-06, - "loss": 0.8193, - "step": 12711 - }, - { - "epoch": 0.33, - "learning_rate": 1.9677721311238848e-06, - "loss": 0.7559, - "step": 12712 - }, - { - "epoch": 0.33, - "learning_rate": 1.967765162571483e-06, - "loss": 1.0947, - "step": 12713 - }, - { - "epoch": 0.33, - "learning_rate": 1.967758193278108e-06, - "loss": 0.9854, - "step": 12714 - }, - { - "epoch": 0.33, - "learning_rate": 1.967751223243765e-06, - "loss": 0.7354, - "step": 12715 - }, - { - "epoch": 0.33, - "learning_rate": 1.9677442524684594e-06, - "loss": 0.9033, - "step": 12716 - }, - { - "epoch": 0.33, - "learning_rate": 1.9677372809521963e-06, - "loss": 0.8906, - "step": 12717 - }, - { - "epoch": 0.33, - "learning_rate": 1.9677303086949813e-06, - "loss": 1.0664, - "step": 12718 - }, - { - "epoch": 0.33, - "learning_rate": 1.96772333569682e-06, - "loss": 0.9277, - "step": 12719 - }, - { - "epoch": 0.33, - "learning_rate": 1.9677163619577175e-06, - "loss": 1.1201, - "step": 12720 - }, - { - "epoch": 0.33, - "learning_rate": 1.967709387477679e-06, - "loss": 0.8486, - "step": 12721 - }, - { - "epoch": 0.33, - "learning_rate": 1.9677024122567095e-06, - "loss": 0.8818, - "step": 12722 - }, - { - "epoch": 0.33, - "learning_rate": 1.967695436294815e-06, - "loss": 0.9814, - "step": 12723 - }, - { - "epoch": 0.33, - "learning_rate": 1.9676884595920006e-06, - "loss": 1.1309, - "step": 12724 - }, - { - "epoch": 0.33, - "learning_rate": 1.9676814821482716e-06, - "loss": 0.9609, - "step": 12725 - }, - { - "epoch": 0.33, - "learning_rate": 1.9676745039636336e-06, - "loss": 0.8291, - "step": 12726 - }, - { - "epoch": 0.33, - "learning_rate": 1.9676675250380916e-06, - "loss": 0.73, - "step": 12727 - }, - { - "epoch": 0.33, - "learning_rate": 1.967660545371651e-06, - "loss": 0.9346, - "step": 12728 - }, - { - "epoch": 0.33, - "learning_rate": 1.9676535649643173e-06, - "loss": 0.8848, - "step": 12729 - }, - { - "epoch": 0.33, - "learning_rate": 1.967646583816096e-06, - "loss": 0.791, - "step": 12730 - }, - { - "epoch": 0.33, - "learning_rate": 1.967639601926992e-06, - "loss": 0.8018, - "step": 12731 - }, - { - "epoch": 0.33, - "learning_rate": 1.9676326192970107e-06, - "loss": 1.0693, - "step": 12732 - }, - { - "epoch": 0.33, - "learning_rate": 1.9676256359261576e-06, - "loss": 0.752, - "step": 12733 - }, - { - "epoch": 0.33, - "learning_rate": 1.9676186518144383e-06, - "loss": 0.8428, - "step": 12734 - }, - { - "epoch": 0.33, - "learning_rate": 1.9676116669618578e-06, - "loss": 0.8672, - "step": 12735 - }, - { - "epoch": 0.33, - "learning_rate": 1.967604681368421e-06, - "loss": 0.9873, - "step": 12736 - }, - { - "epoch": 0.33, - "learning_rate": 1.967597695034135e-06, - "loss": 0.8623, - "step": 12737 - }, - { - "epoch": 0.33, - "learning_rate": 1.967590707959003e-06, - "loss": 0.9121, - "step": 12738 - }, - { - "epoch": 0.33, - "learning_rate": 1.967583720143031e-06, - "loss": 0.9902, - "step": 12739 - }, - { - "epoch": 0.33, - "learning_rate": 1.9675767315862256e-06, - "loss": 0.7617, - "step": 12740 - }, - { - "epoch": 0.33, - "learning_rate": 1.9675697422885906e-06, - "loss": 0.793, - "step": 12741 - }, - { - "epoch": 0.33, - "learning_rate": 1.967562752250132e-06, - "loss": 0.7388, - "step": 12742 - }, - { - "epoch": 0.33, - "learning_rate": 1.967555761470855e-06, - "loss": 0.856, - "step": 12743 - }, - { - "epoch": 0.33, - "learning_rate": 1.9675487699507653e-06, - "loss": 0.9209, - "step": 12744 - }, - { - "epoch": 0.33, - "learning_rate": 1.9675417776898677e-06, - "loss": 0.9033, - "step": 12745 - }, - { - "epoch": 0.33, - "learning_rate": 1.9675347846881683e-06, - "loss": 0.8975, - "step": 12746 - }, - { - "epoch": 0.33, - "learning_rate": 1.9675277909456716e-06, - "loss": 0.7114, - "step": 12747 - }, - { - "epoch": 0.33, - "learning_rate": 1.9675207964623833e-06, - "loss": 0.9072, - "step": 12748 - }, - { - "epoch": 0.33, - "learning_rate": 1.967513801238309e-06, - "loss": 1.0088, - "step": 12749 - }, - { - "epoch": 0.33, - "learning_rate": 1.9675068052734542e-06, - "loss": 0.9795, - "step": 12750 - }, - { - "epoch": 0.33, - "learning_rate": 1.9674998085678233e-06, - "loss": 1.1504, - "step": 12751 - }, - { - "epoch": 0.33, - "learning_rate": 1.9674928111214227e-06, - "loss": 0.8975, - "step": 12752 - }, - { - "epoch": 0.33, - "learning_rate": 1.967485812934257e-06, - "loss": 0.9512, - "step": 12753 - }, - { - "epoch": 0.33, - "learning_rate": 1.9674788140063322e-06, - "loss": 0.6968, - "step": 12754 - }, - { - "epoch": 0.33, - "learning_rate": 1.9674718143376534e-06, - "loss": 0.959, - "step": 12755 - }, - { - "epoch": 0.33, - "learning_rate": 1.9674648139282257e-06, - "loss": 0.8369, - "step": 12756 - }, - { - "epoch": 0.33, - "learning_rate": 1.967457812778055e-06, - "loss": 1.0742, - "step": 12757 - }, - { - "epoch": 0.33, - "learning_rate": 1.9674508108871458e-06, - "loss": 0.8135, - "step": 12758 - }, - { - "epoch": 0.33, - "learning_rate": 1.9674438082555046e-06, - "loss": 1.0703, - "step": 12759 - }, - { - "epoch": 0.33, - "learning_rate": 1.9674368048831357e-06, - "loss": 0.6216, - "step": 12760 - }, - { - "epoch": 0.33, - "learning_rate": 1.967429800770045e-06, - "loss": 0.9609, - "step": 12761 - }, - { - "epoch": 0.33, - "learning_rate": 1.967422795916238e-06, - "loss": 0.9971, - "step": 12762 - }, - { - "epoch": 0.33, - "learning_rate": 1.9674157903217195e-06, - "loss": 0.8193, - "step": 12763 - }, - { - "epoch": 0.33, - "learning_rate": 1.967408783986496e-06, - "loss": 1.04, - "step": 12764 - }, - { - "epoch": 0.33, - "learning_rate": 1.967401776910571e-06, - "loss": 0.8496, - "step": 12765 - }, - { - "epoch": 0.33, - "learning_rate": 1.9673947690939516e-06, - "loss": 1.0645, - "step": 12766 - }, - { - "epoch": 0.33, - "learning_rate": 1.9673877605366425e-06, - "loss": 1.0176, - "step": 12767 - }, - { - "epoch": 0.33, - "learning_rate": 1.9673807512386487e-06, - "loss": 0.9502, - "step": 12768 - }, - { - "epoch": 0.33, - "learning_rate": 1.9673737411999764e-06, - "loss": 0.8877, - "step": 12769 - }, - { - "epoch": 0.33, - "learning_rate": 1.9673667304206304e-06, - "loss": 1.0459, - "step": 12770 - }, - { - "epoch": 0.33, - "learning_rate": 1.967359718900616e-06, - "loss": 0.793, - "step": 12771 - }, - { - "epoch": 0.33, - "learning_rate": 1.9673527066399387e-06, - "loss": 0.9883, - "step": 12772 - }, - { - "epoch": 0.33, - "learning_rate": 1.967345693638604e-06, - "loss": 0.8262, - "step": 12773 - }, - { - "epoch": 0.33, - "learning_rate": 1.967338679896617e-06, - "loss": 0.8447, - "step": 12774 - }, - { - "epoch": 0.33, - "learning_rate": 1.9673316654139837e-06, - "loss": 0.9443, - "step": 12775 - }, - { - "epoch": 0.33, - "learning_rate": 1.9673246501907087e-06, - "loss": 1.0459, - "step": 12776 - }, - { - "epoch": 0.33, - "learning_rate": 1.9673176342267977e-06, - "loss": 0.8633, - "step": 12777 - }, - { - "epoch": 0.33, - "learning_rate": 1.9673106175222564e-06, - "loss": 0.5034, - "step": 12778 - }, - { - "epoch": 0.33, - "learning_rate": 1.9673036000770895e-06, - "loss": 0.957, - "step": 12779 - }, - { - "epoch": 0.33, - "learning_rate": 1.9672965818913027e-06, - "loss": 0.6245, - "step": 12780 - }, - { - "epoch": 0.33, - "learning_rate": 1.9672895629649012e-06, - "loss": 0.8379, - "step": 12781 - }, - { - "epoch": 0.33, - "learning_rate": 1.967282543297891e-06, - "loss": 0.7422, - "step": 12782 - }, - { - "epoch": 0.33, - "learning_rate": 1.9672755228902767e-06, - "loss": 1.0723, - "step": 12783 - }, - { - "epoch": 0.33, - "learning_rate": 1.967268501742064e-06, - "loss": 0.707, - "step": 12784 - }, - { - "epoch": 0.33, - "learning_rate": 1.9672614798532586e-06, - "loss": 0.9062, - "step": 12785 - }, - { - "epoch": 0.33, - "learning_rate": 1.9672544572238654e-06, - "loss": 0.9043, - "step": 12786 - }, - { - "epoch": 0.33, - "learning_rate": 1.96724743385389e-06, - "loss": 1.1074, - "step": 12787 - }, - { - "epoch": 0.33, - "learning_rate": 1.967240409743338e-06, - "loss": 0.7471, - "step": 12788 - }, - { - "epoch": 0.33, - "learning_rate": 1.9672333848922136e-06, - "loss": 0.9355, - "step": 12789 - }, - { - "epoch": 0.33, - "learning_rate": 1.967226359300524e-06, - "loss": 0.8723, - "step": 12790 - }, - { - "epoch": 0.33, - "learning_rate": 1.9672193329682732e-06, - "loss": 0.9951, - "step": 12791 - }, - { - "epoch": 0.33, - "learning_rate": 1.967212305895467e-06, - "loss": 0.9678, - "step": 12792 - }, - { - "epoch": 0.33, - "learning_rate": 1.967205278082111e-06, - "loss": 0.9912, - "step": 12793 - }, - { - "epoch": 0.33, - "learning_rate": 1.96719824952821e-06, - "loss": 0.9307, - "step": 12794 - }, - { - "epoch": 0.33, - "learning_rate": 1.9671912202337704e-06, - "loss": 0.9385, - "step": 12795 - }, - { - "epoch": 0.33, - "learning_rate": 1.9671841901987965e-06, - "loss": 0.9893, - "step": 12796 - }, - { - "epoch": 0.33, - "learning_rate": 1.9671771594232944e-06, - "loss": 0.7598, - "step": 12797 - }, - { - "epoch": 0.33, - "learning_rate": 1.967170127907269e-06, - "loss": 0.8384, - "step": 12798 - }, - { - "epoch": 0.33, - "learning_rate": 1.9671630956507263e-06, - "loss": 0.7095, - "step": 12799 - }, - { - "epoch": 0.33, - "learning_rate": 1.9671560626536706e-06, - "loss": 0.9355, - "step": 12800 - }, - { - "epoch": 0.33, - "learning_rate": 1.9671490289161086e-06, - "loss": 0.9053, - "step": 12801 - }, - { - "epoch": 0.33, - "learning_rate": 1.967141994438045e-06, - "loss": 0.7764, - "step": 12802 - }, - { - "epoch": 0.33, - "learning_rate": 1.967134959219485e-06, - "loss": 0.7529, - "step": 12803 - }, - { - "epoch": 0.33, - "learning_rate": 1.967127923260434e-06, - "loss": 0.915, - "step": 12804 - }, - { - "epoch": 0.33, - "learning_rate": 1.967120886560898e-06, - "loss": 0.8457, - "step": 12805 - }, - { - "epoch": 0.33, - "learning_rate": 1.967113849120882e-06, - "loss": 0.8975, - "step": 12806 - }, - { - "epoch": 0.33, - "learning_rate": 1.9671068109403913e-06, - "loss": 0.9131, - "step": 12807 - }, - { - "epoch": 0.33, - "learning_rate": 1.9670997720194316e-06, - "loss": 1.1436, - "step": 12808 - }, - { - "epoch": 0.33, - "learning_rate": 1.967092732358008e-06, - "loss": 0.8203, - "step": 12809 - }, - { - "epoch": 0.33, - "learning_rate": 1.9670856919561258e-06, - "loss": 0.877, - "step": 12810 - }, - { - "epoch": 0.33, - "learning_rate": 1.9670786508137903e-06, - "loss": 1.3301, - "step": 12811 - }, - { - "epoch": 0.33, - "learning_rate": 1.9670716089310075e-06, - "loss": 0.8086, - "step": 12812 - }, - { - "epoch": 0.33, - "learning_rate": 1.9670645663077823e-06, - "loss": 0.8359, - "step": 12813 - }, - { - "epoch": 0.33, - "learning_rate": 1.9670575229441203e-06, - "loss": 1.0811, - "step": 12814 - }, - { - "epoch": 0.33, - "learning_rate": 1.967050478840027e-06, - "loss": 0.793, - "step": 12815 - }, - { - "epoch": 0.33, - "learning_rate": 1.9670434339955075e-06, - "loss": 0.8047, - "step": 12816 - }, - { - "epoch": 0.33, - "learning_rate": 1.967036388410567e-06, - "loss": 0.707, - "step": 12817 - }, - { - "epoch": 0.33, - "learning_rate": 1.9670293420852114e-06, - "loss": 0.7739, - "step": 12818 - }, - { - "epoch": 0.33, - "learning_rate": 1.9670222950194462e-06, - "loss": 0.9961, - "step": 12819 - }, - { - "epoch": 0.33, - "learning_rate": 1.967015247213276e-06, - "loss": 0.8423, - "step": 12820 - }, - { - "epoch": 0.33, - "learning_rate": 1.967008198666707e-06, - "loss": 0.8223, - "step": 12821 - }, - { - "epoch": 0.33, - "learning_rate": 1.967001149379744e-06, - "loss": 0.7871, - "step": 12822 - }, - { - "epoch": 0.33, - "learning_rate": 1.966994099352393e-06, - "loss": 0.999, - "step": 12823 - }, - { - "epoch": 0.33, - "learning_rate": 1.9669870485846594e-06, - "loss": 1.0713, - "step": 12824 - }, - { - "epoch": 0.33, - "learning_rate": 1.9669799970765478e-06, - "loss": 1.04, - "step": 12825 - }, - { - "epoch": 0.33, - "learning_rate": 1.9669729448280637e-06, - "loss": 1.1016, - "step": 12826 - }, - { - "epoch": 0.33, - "learning_rate": 1.9669658918392136e-06, - "loss": 0.8818, - "step": 12827 - }, - { - "epoch": 0.33, - "learning_rate": 1.966958838110002e-06, - "loss": 0.8125, - "step": 12828 - }, - { - "epoch": 0.33, - "learning_rate": 1.9669517836404345e-06, - "loss": 0.917, - "step": 12829 - }, - { - "epoch": 0.33, - "learning_rate": 1.966944728430516e-06, - "loss": 0.9189, - "step": 12830 - }, - { - "epoch": 0.33, - "learning_rate": 1.966937672480253e-06, - "loss": 1.0303, - "step": 12831 - }, - { - "epoch": 0.33, - "learning_rate": 1.96693061578965e-06, - "loss": 0.8643, - "step": 12832 - }, - { - "epoch": 0.33, - "learning_rate": 1.966923558358713e-06, - "loss": 0.8125, - "step": 12833 - }, - { - "epoch": 0.33, - "learning_rate": 1.966916500187446e-06, - "loss": 0.8018, - "step": 12834 - }, - { - "epoch": 0.33, - "learning_rate": 1.966909441275857e-06, - "loss": 1.002, - "step": 12835 - }, - { - "epoch": 0.33, - "learning_rate": 1.966902381623949e-06, - "loss": 0.8311, - "step": 12836 - }, - { - "epoch": 0.33, - "learning_rate": 1.9668953212317283e-06, - "loss": 0.8701, - "step": 12837 - }, - { - "epoch": 0.33, - "learning_rate": 1.9668882600992006e-06, - "loss": 0.5903, - "step": 12838 - }, - { - "epoch": 0.33, - "learning_rate": 1.966881198226371e-06, - "loss": 0.8105, - "step": 12839 - }, - { - "epoch": 0.33, - "learning_rate": 1.966874135613245e-06, - "loss": 0.8945, - "step": 12840 - }, - { - "epoch": 0.33, - "learning_rate": 1.966867072259828e-06, - "loss": 1.0098, - "step": 12841 - }, - { - "epoch": 0.33, - "learning_rate": 1.9668600081661247e-06, - "loss": 0.8525, - "step": 12842 - }, - { - "epoch": 0.33, - "learning_rate": 1.9668529433321418e-06, - "loss": 0.5835, - "step": 12843 - }, - { - "epoch": 0.33, - "learning_rate": 1.966845877757884e-06, - "loss": 0.8223, - "step": 12844 - }, - { - "epoch": 0.33, - "learning_rate": 1.9668388114433563e-06, - "loss": 1.0352, - "step": 12845 - }, - { - "epoch": 0.33, - "learning_rate": 1.966831744388565e-06, - "loss": 0.957, - "step": 12846 - }, - { - "epoch": 0.33, - "learning_rate": 1.966824676593515e-06, - "loss": 0.7607, - "step": 12847 - }, - { - "epoch": 0.33, - "learning_rate": 1.966817608058212e-06, - "loss": 0.7148, - "step": 12848 - }, - { - "epoch": 0.33, - "learning_rate": 1.966810538782661e-06, - "loss": 1.0225, - "step": 12849 - }, - { - "epoch": 0.33, - "learning_rate": 1.9668034687668675e-06, - "loss": 0.8545, - "step": 12850 - }, - { - "epoch": 0.33, - "learning_rate": 1.966796398010837e-06, - "loss": 0.7783, - "step": 12851 - }, - { - "epoch": 0.33, - "learning_rate": 1.966789326514575e-06, - "loss": 0.8398, - "step": 12852 - }, - { - "epoch": 0.33, - "learning_rate": 1.966782254278087e-06, - "loss": 0.9385, - "step": 12853 - }, - { - "epoch": 0.33, - "learning_rate": 1.9667751813013786e-06, - "loss": 0.9463, - "step": 12854 - }, - { - "epoch": 0.33, - "learning_rate": 1.9667681075844544e-06, - "loss": 0.9697, - "step": 12855 - }, - { - "epoch": 0.33, - "learning_rate": 1.9667610331273204e-06, - "loss": 1.0107, - "step": 12856 - }, - { - "epoch": 0.33, - "learning_rate": 1.966753957929982e-06, - "loss": 0.9731, - "step": 12857 - }, - { - "epoch": 0.33, - "learning_rate": 1.9667468819924446e-06, - "loss": 1.0713, - "step": 12858 - }, - { - "epoch": 0.33, - "learning_rate": 1.9667398053147134e-06, - "loss": 1.0869, - "step": 12859 - }, - { - "epoch": 0.33, - "learning_rate": 1.9667327278967944e-06, - "loss": 0.7471, - "step": 12860 - }, - { - "epoch": 0.33, - "learning_rate": 1.9667256497386923e-06, - "loss": 1.0771, - "step": 12861 - }, - { - "epoch": 0.33, - "learning_rate": 1.9667185708404125e-06, - "loss": 1.0205, - "step": 12862 - }, - { - "epoch": 0.33, - "learning_rate": 1.9667114912019615e-06, - "loss": 0.6924, - "step": 12863 - }, - { - "epoch": 0.33, - "learning_rate": 1.9667044108233434e-06, - "loss": 0.8003, - "step": 12864 - }, - { - "epoch": 0.33, - "learning_rate": 1.9666973297045642e-06, - "loss": 0.7876, - "step": 12865 - }, - { - "epoch": 0.33, - "learning_rate": 1.9666902478456295e-06, - "loss": 0.8184, - "step": 12866 - }, - { - "epoch": 0.33, - "learning_rate": 1.966683165246544e-06, - "loss": 0.9814, - "step": 12867 - }, - { - "epoch": 0.33, - "learning_rate": 1.9666760819073143e-06, - "loss": 0.6562, - "step": 12868 - }, - { - "epoch": 0.33, - "learning_rate": 1.966668997827945e-06, - "loss": 0.9053, - "step": 12869 - }, - { - "epoch": 0.33, - "learning_rate": 1.9666619130084415e-06, - "loss": 0.8408, - "step": 12870 - }, - { - "epoch": 0.33, - "learning_rate": 1.9666548274488096e-06, - "loss": 0.7461, - "step": 12871 - }, - { - "epoch": 0.33, - "learning_rate": 1.9666477411490547e-06, - "loss": 0.8574, - "step": 12872 - }, - { - "epoch": 0.33, - "learning_rate": 1.966640654109182e-06, - "loss": 1.1758, - "step": 12873 - }, - { - "epoch": 0.33, - "learning_rate": 1.9666335663291968e-06, - "loss": 0.8301, - "step": 12874 - }, - { - "epoch": 0.33, - "learning_rate": 1.9666264778091047e-06, - "loss": 1.0322, - "step": 12875 - }, - { - "epoch": 0.33, - "learning_rate": 1.966619388548911e-06, - "loss": 1.0625, - "step": 12876 - }, - { - "epoch": 0.33, - "learning_rate": 1.966612298548622e-06, - "loss": 0.832, - "step": 12877 - }, - { - "epoch": 0.33, - "learning_rate": 1.966605207808242e-06, - "loss": 1.0439, - "step": 12878 - }, - { - "epoch": 0.33, - "learning_rate": 1.9665981163277766e-06, - "loss": 0.9268, - "step": 12879 - }, - { - "epoch": 0.33, - "learning_rate": 1.966591024107232e-06, - "loss": 1.0264, - "step": 12880 - }, - { - "epoch": 0.33, - "learning_rate": 1.9665839311466127e-06, - "loss": 0.8525, - "step": 12881 - }, - { - "epoch": 0.33, - "learning_rate": 1.9665768374459244e-06, - "loss": 1.1865, - "step": 12882 - }, - { - "epoch": 0.33, - "learning_rate": 1.966569743005173e-06, - "loss": 0.9951, - "step": 12883 - }, - { - "epoch": 0.33, - "learning_rate": 1.9665626478243635e-06, - "loss": 0.835, - "step": 12884 - }, - { - "epoch": 0.33, - "learning_rate": 1.966555551903501e-06, - "loss": 1.0723, - "step": 12885 - }, - { - "epoch": 0.33, - "learning_rate": 1.9665484552425918e-06, - "loss": 0.8179, - "step": 12886 - }, - { - "epoch": 0.33, - "learning_rate": 1.966541357841641e-06, - "loss": 0.8965, - "step": 12887 - }, - { - "epoch": 0.33, - "learning_rate": 1.9665342597006534e-06, - "loss": 1.1055, - "step": 12888 - }, - { - "epoch": 0.33, - "learning_rate": 1.9665271608196357e-06, - "loss": 0.7405, - "step": 12889 - }, - { - "epoch": 0.33, - "learning_rate": 1.9665200611985923e-06, - "loss": 0.8311, - "step": 12890 - }, - { - "epoch": 0.33, - "learning_rate": 1.9665129608375285e-06, - "loss": 1.0264, - "step": 12891 - }, - { - "epoch": 0.33, - "learning_rate": 1.9665058597364506e-06, - "loss": 0.9238, - "step": 12892 - }, - { - "epoch": 0.33, - "learning_rate": 1.9664987578953636e-06, - "loss": 0.9082, - "step": 12893 - }, - { - "epoch": 0.33, - "learning_rate": 1.9664916553142726e-06, - "loss": 0.8325, - "step": 12894 - }, - { - "epoch": 0.33, - "learning_rate": 1.966484551993184e-06, - "loss": 0.8828, - "step": 12895 - }, - { - "epoch": 0.33, - "learning_rate": 1.966477447932102e-06, - "loss": 0.647, - "step": 12896 - }, - { - "epoch": 0.33, - "learning_rate": 1.966470343131033e-06, - "loss": 0.8301, - "step": 12897 - }, - { - "epoch": 0.33, - "learning_rate": 1.966463237589982e-06, - "loss": 0.916, - "step": 12898 - }, - { - "epoch": 0.33, - "learning_rate": 1.9664561313089544e-06, - "loss": 0.9121, - "step": 12899 - }, - { - "epoch": 0.33, - "learning_rate": 1.966449024287956e-06, - "loss": 0.7578, - "step": 12900 - }, - { - "epoch": 0.33, - "learning_rate": 1.966441916526992e-06, - "loss": 0.8887, - "step": 12901 - }, - { - "epoch": 0.33, - "learning_rate": 1.966434808026068e-06, - "loss": 0.7749, - "step": 12902 - }, - { - "epoch": 0.33, - "learning_rate": 1.9664276987851888e-06, - "loss": 1.1934, - "step": 12903 - }, - { - "epoch": 0.33, - "learning_rate": 1.9664205888043608e-06, - "loss": 0.9082, - "step": 12904 - }, - { - "epoch": 0.33, - "learning_rate": 1.966413478083589e-06, - "loss": 0.9678, - "step": 12905 - }, - { - "epoch": 0.33, - "learning_rate": 1.9664063666228783e-06, - "loss": 1.1504, - "step": 12906 - }, - { - "epoch": 0.33, - "learning_rate": 1.9663992544222353e-06, - "loss": 0.96, - "step": 12907 - }, - { - "epoch": 0.33, - "learning_rate": 1.9663921414816645e-06, - "loss": 0.8594, - "step": 12908 - }, - { - "epoch": 0.33, - "learning_rate": 1.966385027801172e-06, - "loss": 0.7559, - "step": 12909 - }, - { - "epoch": 0.33, - "learning_rate": 1.9663779133807627e-06, - "loss": 1.1572, - "step": 12910 - }, - { - "epoch": 0.33, - "learning_rate": 1.966370798220442e-06, - "loss": 0.7202, - "step": 12911 - }, - { - "epoch": 0.33, - "learning_rate": 1.966363682320216e-06, - "loss": 0.6108, - "step": 12912 - }, - { - "epoch": 0.33, - "learning_rate": 1.9663565656800898e-06, - "loss": 1.04, - "step": 12913 - }, - { - "epoch": 0.33, - "learning_rate": 1.966349448300068e-06, - "loss": 0.9951, - "step": 12914 - }, - { - "epoch": 0.33, - "learning_rate": 1.9663423301801577e-06, - "loss": 0.8232, - "step": 12915 - }, - { - "epoch": 0.33, - "learning_rate": 1.966335211320363e-06, - "loss": 0.8848, - "step": 12916 - }, - { - "epoch": 0.33, - "learning_rate": 1.9663280917206904e-06, - "loss": 0.8682, - "step": 12917 - }, - { - "epoch": 0.33, - "learning_rate": 1.966320971381145e-06, - "loss": 1.0537, - "step": 12918 - }, - { - "epoch": 0.33, - "learning_rate": 1.9663138503017315e-06, - "loss": 0.8237, - "step": 12919 - }, - { - "epoch": 0.33, - "learning_rate": 1.966306728482456e-06, - "loss": 1.041, - "step": 12920 - }, - { - "epoch": 0.33, - "learning_rate": 1.966299605923324e-06, - "loss": 1.1426, - "step": 12921 - }, - { - "epoch": 0.33, - "learning_rate": 1.9662924826243405e-06, - "loss": 1.0205, - "step": 12922 - }, - { - "epoch": 0.33, - "learning_rate": 1.9662853585855117e-06, - "loss": 0.9863, - "step": 12923 - }, - { - "epoch": 0.33, - "learning_rate": 1.9662782338068428e-06, - "loss": 0.917, - "step": 12924 - }, - { - "epoch": 0.33, - "learning_rate": 1.9662711082883384e-06, - "loss": 0.8701, - "step": 12925 - }, - { - "epoch": 0.33, - "learning_rate": 1.966263982030005e-06, - "loss": 0.9053, - "step": 12926 - }, - { - "epoch": 0.33, - "learning_rate": 1.966256855031848e-06, - "loss": 1.0615, - "step": 12927 - }, - { - "epoch": 0.33, - "learning_rate": 1.966249727293872e-06, - "loss": 0.9619, - "step": 12928 - }, - { - "epoch": 0.33, - "learning_rate": 1.9662425988160833e-06, - "loss": 0.9121, - "step": 12929 - }, - { - "epoch": 0.33, - "learning_rate": 1.966235469598487e-06, - "loss": 0.9697, - "step": 12930 - }, - { - "epoch": 0.33, - "learning_rate": 1.9662283396410886e-06, - "loss": 1.0293, - "step": 12931 - }, - { - "epoch": 0.33, - "learning_rate": 1.9662212089438935e-06, - "loss": 1.0264, - "step": 12932 - }, - { - "epoch": 0.33, - "learning_rate": 1.9662140775069078e-06, - "loss": 0.7783, - "step": 12933 - }, - { - "epoch": 0.33, - "learning_rate": 1.966206945330136e-06, - "loss": 1.0352, - "step": 12934 - }, - { - "epoch": 0.33, - "learning_rate": 1.966199812413584e-06, - "loss": 1.124, - "step": 12935 - }, - { - "epoch": 0.33, - "learning_rate": 1.966192678757257e-06, - "loss": 0.9346, - "step": 12936 - }, - { - "epoch": 0.33, - "learning_rate": 1.966185544361161e-06, - "loss": 0.7754, - "step": 12937 - }, - { - "epoch": 0.33, - "learning_rate": 1.9661784092253013e-06, - "loss": 1.043, - "step": 12938 - }, - { - "epoch": 0.33, - "learning_rate": 1.9661712733496825e-06, - "loss": 0.8301, - "step": 12939 - }, - { - "epoch": 0.33, - "learning_rate": 1.9661641367343113e-06, - "loss": 0.7925, - "step": 12940 - }, - { - "epoch": 0.33, - "learning_rate": 1.966156999379193e-06, - "loss": 0.7356, - "step": 12941 - }, - { - "epoch": 0.33, - "learning_rate": 1.966149861284332e-06, - "loss": 0.7852, - "step": 12942 - }, - { - "epoch": 0.33, - "learning_rate": 1.966142722449735e-06, - "loss": 0.9121, - "step": 12943 - }, - { - "epoch": 0.33, - "learning_rate": 1.9661355828754067e-06, - "loss": 0.7573, - "step": 12944 - }, - { - "epoch": 0.33, - "learning_rate": 1.9661284425613526e-06, - "loss": 0.8311, - "step": 12945 - }, - { - "epoch": 0.33, - "learning_rate": 1.9661213015075788e-06, - "loss": 0.9922, - "step": 12946 - }, - { - "epoch": 0.33, - "learning_rate": 1.96611415971409e-06, - "loss": 0.7751, - "step": 12947 - }, - { - "epoch": 0.33, - "learning_rate": 1.9661070171808924e-06, - "loss": 1.0518, - "step": 12948 - }, - { - "epoch": 0.33, - "learning_rate": 1.966099873907991e-06, - "loss": 0.9463, - "step": 12949 - }, - { - "epoch": 0.33, - "learning_rate": 1.966092729895391e-06, - "loss": 0.7915, - "step": 12950 - }, - { - "epoch": 0.33, - "learning_rate": 1.9660855851430984e-06, - "loss": 0.8682, - "step": 12951 - }, - { - "epoch": 0.33, - "learning_rate": 1.9660784396511184e-06, - "loss": 0.9336, - "step": 12952 - }, - { - "epoch": 0.33, - "learning_rate": 1.966071293419457e-06, - "loss": 0.7729, - "step": 12953 - }, - { - "epoch": 0.33, - "learning_rate": 1.966064146448119e-06, - "loss": 0.7227, - "step": 12954 - }, - { - "epoch": 0.33, - "learning_rate": 1.96605699873711e-06, - "loss": 0.8708, - "step": 12955 - }, - { - "epoch": 0.33, - "learning_rate": 1.9660498502864353e-06, - "loss": 0.7578, - "step": 12956 - }, - { - "epoch": 0.33, - "learning_rate": 1.966042701096101e-06, - "loss": 0.7446, - "step": 12957 - }, - { - "epoch": 0.33, - "learning_rate": 1.966035551166112e-06, - "loss": 0.8623, - "step": 12958 - }, - { - "epoch": 0.33, - "learning_rate": 1.9660284004964744e-06, - "loss": 0.7659, - "step": 12959 - }, - { - "epoch": 0.33, - "learning_rate": 1.966021249087193e-06, - "loss": 0.8262, - "step": 12960 - }, - { - "epoch": 0.33, - "learning_rate": 1.9660140969382734e-06, - "loss": 0.9971, - "step": 12961 - }, - { - "epoch": 0.33, - "learning_rate": 1.9660069440497214e-06, - "loss": 0.918, - "step": 12962 - }, - { - "epoch": 0.33, - "learning_rate": 1.9659997904215422e-06, - "loss": 0.9258, - "step": 12963 - }, - { - "epoch": 0.33, - "learning_rate": 1.9659926360537416e-06, - "loss": 0.8184, - "step": 12964 - }, - { - "epoch": 0.33, - "learning_rate": 1.965985480946325e-06, - "loss": 0.9893, - "step": 12965 - }, - { - "epoch": 0.33, - "learning_rate": 1.965978325099297e-06, - "loss": 0.9336, - "step": 12966 - }, - { - "epoch": 0.33, - "learning_rate": 1.9659711685126645e-06, - "loss": 0.6787, - "step": 12967 - }, - { - "epoch": 0.33, - "learning_rate": 1.9659640111864323e-06, - "loss": 0.8838, - "step": 12968 - }, - { - "epoch": 0.33, - "learning_rate": 1.9659568531206056e-06, - "loss": 0.6665, - "step": 12969 - }, - { - "epoch": 0.33, - "learning_rate": 1.96594969431519e-06, - "loss": 0.9883, - "step": 12970 - }, - { - "epoch": 0.33, - "learning_rate": 1.9659425347701914e-06, - "loss": 0.8467, - "step": 12971 - }, - { - "epoch": 0.33, - "learning_rate": 1.965935374485615e-06, - "loss": 0.7236, - "step": 12972 - }, - { - "epoch": 0.33, - "learning_rate": 1.965928213461466e-06, - "loss": 0.7256, - "step": 12973 - }, - { - "epoch": 0.33, - "learning_rate": 1.9659210516977505e-06, - "loss": 1.04, - "step": 12974 - }, - { - "epoch": 0.33, - "learning_rate": 1.9659138891944737e-06, - "loss": 0.8652, - "step": 12975 - }, - { - "epoch": 0.33, - "learning_rate": 1.965906725951641e-06, - "loss": 1.0684, - "step": 12976 - }, - { - "epoch": 0.33, - "learning_rate": 1.9658995619692578e-06, - "loss": 0.9551, - "step": 12977 - }, - { - "epoch": 0.33, - "learning_rate": 1.9658923972473298e-06, - "loss": 0.8408, - "step": 12978 - }, - { - "epoch": 0.33, - "learning_rate": 1.9658852317858623e-06, - "loss": 1.1289, - "step": 12979 - }, - { - "epoch": 0.33, - "learning_rate": 1.965878065584861e-06, - "loss": 0.9893, - "step": 12980 - }, - { - "epoch": 0.33, - "learning_rate": 1.9658708986443314e-06, - "loss": 0.7905, - "step": 12981 - }, - { - "epoch": 0.33, - "learning_rate": 1.965863730964279e-06, - "loss": 0.7632, - "step": 12982 - }, - { - "epoch": 0.33, - "learning_rate": 1.9658565625447085e-06, - "loss": 0.8486, - "step": 12983 - }, - { - "epoch": 0.33, - "learning_rate": 1.965849393385627e-06, - "loss": 0.8252, - "step": 12984 - }, - { - "epoch": 0.33, - "learning_rate": 1.965842223487038e-06, - "loss": 0.8652, - "step": 12985 - }, - { - "epoch": 0.33, - "learning_rate": 1.9658350528489485e-06, - "loss": 1.0693, - "step": 12986 - }, - { - "epoch": 0.33, - "learning_rate": 1.9658278814713638e-06, - "loss": 0.9121, - "step": 12987 - }, - { - "epoch": 0.33, - "learning_rate": 1.9658207093542884e-06, - "loss": 0.7603, - "step": 12988 - }, - { - "epoch": 0.33, - "learning_rate": 1.965813536497729e-06, - "loss": 0.7332, - "step": 12989 - }, - { - "epoch": 0.33, - "learning_rate": 1.9658063629016906e-06, - "loss": 1.0576, - "step": 12990 - }, - { - "epoch": 0.33, - "learning_rate": 1.9657991885661783e-06, - "loss": 0.9688, - "step": 12991 - }, - { - "epoch": 0.33, - "learning_rate": 1.9657920134911982e-06, - "loss": 0.8018, - "step": 12992 - }, - { - "epoch": 0.33, - "learning_rate": 1.9657848376767554e-06, - "loss": 0.7502, - "step": 12993 - }, - { - "epoch": 0.33, - "learning_rate": 1.965777661122856e-06, - "loss": 0.8164, - "step": 12994 - }, - { - "epoch": 0.33, - "learning_rate": 1.965770483829505e-06, - "loss": 0.6963, - "step": 12995 - }, - { - "epoch": 0.33, - "learning_rate": 1.965763305796708e-06, - "loss": 1.04, - "step": 12996 - }, - { - "epoch": 0.33, - "learning_rate": 1.9657561270244696e-06, - "loss": 0.9541, - "step": 12997 - }, - { - "epoch": 0.33, - "learning_rate": 1.965748947512797e-06, - "loss": 0.9102, - "step": 12998 - }, - { - "epoch": 0.33, - "learning_rate": 1.9657417672616943e-06, - "loss": 0.9326, - "step": 12999 - }, - { - "epoch": 0.33, - "learning_rate": 1.9657345862711683e-06, - "loss": 0.5737, - "step": 13000 - }, - { - "epoch": 0.33, - "learning_rate": 1.9657274045412227e-06, - "loss": 0.689, - "step": 13001 - }, - { - "epoch": 0.33, - "learning_rate": 1.9657202220718648e-06, - "loss": 0.6602, - "step": 13002 - }, - { - "epoch": 0.33, - "learning_rate": 1.9657130388630988e-06, - "loss": 1.0063, - "step": 13003 - }, - { - "epoch": 0.33, - "learning_rate": 1.965705854914931e-06, - "loss": 0.8545, - "step": 13004 - }, - { - "epoch": 0.33, - "learning_rate": 1.965698670227367e-06, - "loss": 0.8013, - "step": 13005 - }, - { - "epoch": 0.33, - "learning_rate": 1.9656914848004115e-06, - "loss": 1.0518, - "step": 13006 - }, - { - "epoch": 0.33, - "learning_rate": 1.9656842986340707e-06, - "loss": 0.7798, - "step": 13007 - }, - { - "epoch": 0.33, - "learning_rate": 1.9656771117283494e-06, - "loss": 0.8291, - "step": 13008 - }, - { - "epoch": 0.33, - "learning_rate": 1.965669924083254e-06, - "loss": 0.7939, - "step": 13009 - }, - { - "epoch": 0.33, - "learning_rate": 1.965662735698789e-06, - "loss": 0.9785, - "step": 13010 - }, - { - "epoch": 0.33, - "learning_rate": 1.9656555465749613e-06, - "loss": 0.8838, - "step": 13011 - }, - { - "epoch": 0.33, - "learning_rate": 1.965648356711775e-06, - "loss": 0.8418, - "step": 13012 - }, - { - "epoch": 0.33, - "learning_rate": 1.965641166109236e-06, - "loss": 0.9883, - "step": 13013 - }, - { - "epoch": 0.33, - "learning_rate": 1.96563397476735e-06, - "loss": 0.7642, - "step": 13014 - }, - { - "epoch": 0.33, - "learning_rate": 1.9656267826861228e-06, - "loss": 0.8716, - "step": 13015 - }, - { - "epoch": 0.33, - "learning_rate": 1.9656195898655593e-06, - "loss": 0.8965, - "step": 13016 - }, - { - "epoch": 0.33, - "learning_rate": 1.9656123963056653e-06, - "loss": 1.0439, - "step": 13017 - }, - { - "epoch": 0.33, - "learning_rate": 1.9656052020064462e-06, - "loss": 0.9346, - "step": 13018 - }, - { - "epoch": 0.33, - "learning_rate": 1.965598006967908e-06, - "loss": 0.9951, - "step": 13019 - }, - { - "epoch": 0.33, - "learning_rate": 1.9655908111900557e-06, - "loss": 0.8403, - "step": 13020 - }, - { - "epoch": 0.33, - "learning_rate": 1.9655836146728948e-06, - "loss": 0.5229, - "step": 13021 - }, - { - "epoch": 0.33, - "learning_rate": 1.965576417416431e-06, - "loss": 0.668, - "step": 13022 - }, - { - "epoch": 0.33, - "learning_rate": 1.9655692194206693e-06, - "loss": 0.9756, - "step": 13023 - }, - { - "epoch": 0.33, - "learning_rate": 1.965562020685616e-06, - "loss": 0.8018, - "step": 13024 - }, - { - "epoch": 0.33, - "learning_rate": 1.965554821211276e-06, - "loss": 0.9746, - "step": 13025 - }, - { - "epoch": 0.33, - "learning_rate": 1.9655476209976553e-06, - "loss": 0.9268, - "step": 13026 - }, - { - "epoch": 0.33, - "learning_rate": 1.9655404200447595e-06, - "loss": 0.8906, - "step": 13027 - }, - { - "epoch": 0.33, - "learning_rate": 1.9655332183525936e-06, - "loss": 1.1348, - "step": 13028 - }, - { - "epoch": 0.33, - "learning_rate": 1.9655260159211633e-06, - "loss": 0.9941, - "step": 13029 - }, - { - "epoch": 0.33, - "learning_rate": 1.965518812750474e-06, - "loss": 0.9189, - "step": 13030 - }, - { - "epoch": 0.33, - "learning_rate": 1.965511608840531e-06, - "loss": 0.875, - "step": 13031 - }, - { - "epoch": 0.33, - "learning_rate": 1.9655044041913405e-06, - "loss": 0.7832, - "step": 13032 - }, - { - "epoch": 0.33, - "learning_rate": 1.965497198802908e-06, - "loss": 0.8936, - "step": 13033 - }, - { - "epoch": 0.33, - "learning_rate": 1.9654899926752383e-06, - "loss": 0.9375, - "step": 13034 - }, - { - "epoch": 0.33, - "learning_rate": 1.9654827858083373e-06, - "loss": 1.0449, - "step": 13035 - }, - { - "epoch": 0.33, - "learning_rate": 1.9654755782022107e-06, - "loss": 0.7539, - "step": 13036 - }, - { - "epoch": 0.33, - "learning_rate": 1.9654683698568636e-06, - "loss": 0.7776, - "step": 13037 - }, - { - "epoch": 0.33, - "learning_rate": 1.965461160772302e-06, - "loss": 0.7988, - "step": 13038 - }, - { - "epoch": 0.33, - "learning_rate": 1.965453950948531e-06, - "loss": 0.8193, - "step": 13039 - }, - { - "epoch": 0.33, - "learning_rate": 1.9654467403855563e-06, - "loss": 0.9023, - "step": 13040 - }, - { - "epoch": 0.33, - "learning_rate": 1.9654395290833836e-06, - "loss": 0.8169, - "step": 13041 - }, - { - "epoch": 0.33, - "learning_rate": 1.965432317042018e-06, - "loss": 0.7354, - "step": 13042 - }, - { - "epoch": 0.33, - "learning_rate": 1.965425104261466e-06, - "loss": 0.833, - "step": 13043 - }, - { - "epoch": 0.33, - "learning_rate": 1.9654178907417317e-06, - "loss": 1.0225, - "step": 13044 - }, - { - "epoch": 0.33, - "learning_rate": 1.9654106764828215e-06, - "loss": 0.9951, - "step": 13045 - }, - { - "epoch": 0.33, - "learning_rate": 1.9654034614847405e-06, - "loss": 0.8135, - "step": 13046 - }, - { - "epoch": 0.33, - "learning_rate": 1.965396245747495e-06, - "loss": 1.0928, - "step": 13047 - }, - { - "epoch": 0.33, - "learning_rate": 1.9653890292710893e-06, - "loss": 0.9297, - "step": 13048 - }, - { - "epoch": 0.33, - "learning_rate": 1.9653818120555297e-06, - "loss": 0.8545, - "step": 13049 - }, - { - "epoch": 0.33, - "learning_rate": 1.965374594100822e-06, - "loss": 0.8994, - "step": 13050 - }, - { - "epoch": 0.33, - "learning_rate": 1.965367375406971e-06, - "loss": 1.1162, - "step": 13051 - }, - { - "epoch": 0.33, - "learning_rate": 1.965360155973983e-06, - "loss": 0.9453, - "step": 13052 - }, - { - "epoch": 0.33, - "learning_rate": 1.965352935801863e-06, - "loss": 0.8491, - "step": 13053 - }, - { - "epoch": 0.33, - "learning_rate": 1.9653457148906167e-06, - "loss": 0.9072, - "step": 13054 - }, - { - "epoch": 0.33, - "learning_rate": 1.9653384932402493e-06, - "loss": 0.5557, - "step": 13055 - }, - { - "epoch": 0.33, - "learning_rate": 1.965331270850767e-06, - "loss": 0.9238, - "step": 13056 - }, - { - "epoch": 0.33, - "learning_rate": 1.9653240477221745e-06, - "loss": 0.9404, - "step": 13057 - }, - { - "epoch": 0.33, - "learning_rate": 1.965316823854478e-06, - "loss": 0.7246, - "step": 13058 - }, - { - "epoch": 0.33, - "learning_rate": 1.965309599247683e-06, - "loss": 0.8047, - "step": 13059 - }, - { - "epoch": 0.33, - "learning_rate": 1.965302373901794e-06, - "loss": 0.4795, - "step": 13060 - }, - { - "epoch": 0.33, - "learning_rate": 1.9652951478168184e-06, - "loss": 0.9443, - "step": 13061 - }, - { - "epoch": 0.33, - "learning_rate": 1.96528792099276e-06, - "loss": 1.0161, - "step": 13062 - }, - { - "epoch": 0.33, - "learning_rate": 1.9652806934296255e-06, - "loss": 0.8701, - "step": 13063 - }, - { - "epoch": 0.33, - "learning_rate": 1.9652734651274194e-06, - "loss": 0.9043, - "step": 13064 - }, - { - "epoch": 0.33, - "learning_rate": 1.9652662360861483e-06, - "loss": 0.7939, - "step": 13065 - }, - { - "epoch": 0.33, - "learning_rate": 1.965259006305817e-06, - "loss": 0.9434, - "step": 13066 - }, - { - "epoch": 0.33, - "learning_rate": 1.9652517757864313e-06, - "loss": 0.8857, - "step": 13067 - }, - { - "epoch": 0.33, - "learning_rate": 1.9652445445279968e-06, - "loss": 0.7578, - "step": 13068 - }, - { - "epoch": 0.33, - "learning_rate": 1.965237312530519e-06, - "loss": 0.9854, - "step": 13069 - }, - { - "epoch": 0.33, - "learning_rate": 1.965230079794003e-06, - "loss": 0.9951, - "step": 13070 - }, - { - "epoch": 0.34, - "learning_rate": 1.9652228463184547e-06, - "loss": 0.832, - "step": 13071 - }, - { - "epoch": 0.34, - "learning_rate": 1.9652156121038803e-06, - "loss": 0.5474, - "step": 13072 - }, - { - "epoch": 0.34, - "learning_rate": 1.965208377150284e-06, - "loss": 0.8037, - "step": 13073 - }, - { - "epoch": 0.34, - "learning_rate": 1.9652011414576723e-06, - "loss": 0.7322, - "step": 13074 - }, - { - "epoch": 0.34, - "learning_rate": 1.96519390502605e-06, - "loss": 0.8662, - "step": 13075 - }, - { - "epoch": 0.34, - "learning_rate": 1.965186667855424e-06, - "loss": 0.9258, - "step": 13076 - }, - { - "epoch": 0.34, - "learning_rate": 1.9651794299457983e-06, - "loss": 0.7827, - "step": 13077 - }, - { - "epoch": 0.34, - "learning_rate": 1.9651721912971793e-06, - "loss": 1.0078, - "step": 13078 - }, - { - "epoch": 0.34, - "learning_rate": 1.965164951909572e-06, - "loss": 0.7529, - "step": 13079 - }, - { - "epoch": 0.34, - "learning_rate": 1.965157711782983e-06, - "loss": 1.0166, - "step": 13080 - }, - { - "epoch": 0.34, - "learning_rate": 1.9651504709174167e-06, - "loss": 0.6934, - "step": 13081 - }, - { - "epoch": 0.34, - "learning_rate": 1.965143229312879e-06, - "loss": 0.915, - "step": 13082 - }, - { - "epoch": 0.34, - "learning_rate": 1.9651359869693753e-06, - "loss": 0.917, - "step": 13083 - }, - { - "epoch": 0.34, - "learning_rate": 1.965128743886912e-06, - "loss": 0.7383, - "step": 13084 - }, - { - "epoch": 0.34, - "learning_rate": 1.9651215000654935e-06, - "loss": 0.8926, - "step": 13085 - }, - { - "epoch": 0.34, - "learning_rate": 1.965114255505126e-06, - "loss": 0.7295, - "step": 13086 - }, - { - "epoch": 0.34, - "learning_rate": 1.965107010205815e-06, - "loss": 0.9834, - "step": 13087 - }, - { - "epoch": 0.34, - "learning_rate": 1.9650997641675656e-06, - "loss": 0.8184, - "step": 13088 - }, - { - "epoch": 0.34, - "learning_rate": 1.9650925173903843e-06, - "loss": 0.9141, - "step": 13089 - }, - { - "epoch": 0.34, - "learning_rate": 1.9650852698742755e-06, - "loss": 0.959, - "step": 13090 - }, - { - "epoch": 0.34, - "learning_rate": 1.9650780216192453e-06, - "loss": 0.916, - "step": 13091 - }, - { - "epoch": 0.34, - "learning_rate": 1.965070772625299e-06, - "loss": 0.9971, - "step": 13092 - }, - { - "epoch": 0.34, - "learning_rate": 1.965063522892443e-06, - "loss": 1.0693, - "step": 13093 - }, - { - "epoch": 0.34, - "learning_rate": 1.965056272420682e-06, - "loss": 0.7739, - "step": 13094 - }, - { - "epoch": 0.34, - "learning_rate": 1.965049021210022e-06, - "loss": 0.8711, - "step": 13095 - }, - { - "epoch": 0.34, - "learning_rate": 1.9650417692604678e-06, - "loss": 0.8701, - "step": 13096 - }, - { - "epoch": 0.34, - "learning_rate": 1.965034516572026e-06, - "loss": 0.7974, - "step": 13097 - }, - { - "epoch": 0.34, - "learning_rate": 1.9650272631447013e-06, - "loss": 1.0186, - "step": 13098 - }, - { - "epoch": 0.34, - "learning_rate": 1.9650200089784996e-06, - "loss": 0.7202, - "step": 13099 - }, - { - "epoch": 0.34, - "learning_rate": 1.965012754073427e-06, - "loss": 0.9678, - "step": 13100 - }, - { - "epoch": 0.34, - "learning_rate": 1.965005498429488e-06, - "loss": 0.9229, - "step": 13101 - }, - { - "epoch": 0.34, - "learning_rate": 1.9649982420466885e-06, - "loss": 0.8145, - "step": 13102 - }, - { - "epoch": 0.34, - "learning_rate": 1.9649909849250347e-06, - "loss": 0.7666, - "step": 13103 - }, - { - "epoch": 0.34, - "learning_rate": 1.9649837270645314e-06, - "loss": 0.9678, - "step": 13104 - }, - { - "epoch": 0.34, - "learning_rate": 1.9649764684651846e-06, - "loss": 0.8506, - "step": 13105 - }, - { - "epoch": 0.34, - "learning_rate": 1.9649692091269993e-06, - "loss": 0.5674, - "step": 13106 - }, - { - "epoch": 0.34, - "learning_rate": 1.964961949049982e-06, - "loss": 0.9902, - "step": 13107 - }, - { - "epoch": 0.34, - "learning_rate": 1.964954688234137e-06, - "loss": 1.0371, - "step": 13108 - }, - { - "epoch": 0.34, - "learning_rate": 1.964947426679471e-06, - "loss": 0.9053, - "step": 13109 - }, - { - "epoch": 0.34, - "learning_rate": 1.964940164385989e-06, - "loss": 0.8276, - "step": 13110 - }, - { - "epoch": 0.34, - "learning_rate": 1.964932901353697e-06, - "loss": 1.083, - "step": 13111 - }, - { - "epoch": 0.34, - "learning_rate": 1.9649256375826e-06, - "loss": 0.7529, - "step": 13112 - }, - { - "epoch": 0.34, - "learning_rate": 1.964918373072704e-06, - "loss": 1.1309, - "step": 13113 - }, - { - "epoch": 0.34, - "learning_rate": 1.964911107824014e-06, - "loss": 0.8833, - "step": 13114 - }, - { - "epoch": 0.34, - "learning_rate": 1.9649038418365364e-06, - "loss": 0.9395, - "step": 13115 - }, - { - "epoch": 0.34, - "learning_rate": 1.964896575110276e-06, - "loss": 0.9629, - "step": 13116 - }, - { - "epoch": 0.34, - "learning_rate": 1.9648893076452387e-06, - "loss": 1.1055, - "step": 13117 - }, - { - "epoch": 0.34, - "learning_rate": 1.9648820394414297e-06, - "loss": 0.9219, - "step": 13118 - }, - { - "epoch": 0.34, - "learning_rate": 1.9648747704988556e-06, - "loss": 0.9561, - "step": 13119 - }, - { - "epoch": 0.34, - "learning_rate": 1.9648675008175205e-06, - "loss": 1.0547, - "step": 13120 - }, - { - "epoch": 0.34, - "learning_rate": 1.9648602303974312e-06, - "loss": 1.0068, - "step": 13121 - }, - { - "epoch": 0.34, - "learning_rate": 1.964852959238593e-06, - "loss": 0.9814, - "step": 13122 - }, - { - "epoch": 0.34, - "learning_rate": 1.9648456873410104e-06, - "loss": 0.8154, - "step": 13123 - }, - { - "epoch": 0.34, - "learning_rate": 1.9648384147046908e-06, - "loss": 0.8018, - "step": 13124 - }, - { - "epoch": 0.34, - "learning_rate": 1.9648311413296386e-06, - "loss": 0.8506, - "step": 13125 - }, - { - "epoch": 0.34, - "learning_rate": 1.964823867215859e-06, - "loss": 0.8369, - "step": 13126 - }, - { - "epoch": 0.34, - "learning_rate": 1.9648165923633584e-06, - "loss": 0.998, - "step": 13127 - }, - { - "epoch": 0.34, - "learning_rate": 1.964809316772142e-06, - "loss": 0.8535, - "step": 13128 - }, - { - "epoch": 0.34, - "learning_rate": 1.964802040442216e-06, - "loss": 0.8887, - "step": 13129 - }, - { - "epoch": 0.34, - "learning_rate": 1.9647947633735847e-06, - "loss": 0.873, - "step": 13130 - }, - { - "epoch": 0.34, - "learning_rate": 1.964787485566255e-06, - "loss": 0.9092, - "step": 13131 - }, - { - "epoch": 0.34, - "learning_rate": 1.9647802070202315e-06, - "loss": 0.96, - "step": 13132 - }, - { - "epoch": 0.34, - "learning_rate": 1.96477292773552e-06, - "loss": 0.8447, - "step": 13133 - }, - { - "epoch": 0.34, - "learning_rate": 1.9647656477121267e-06, - "loss": 0.9268, - "step": 13134 - }, - { - "epoch": 0.34, - "learning_rate": 1.964758366950057e-06, - "loss": 1.0029, - "step": 13135 - }, - { - "epoch": 0.34, - "learning_rate": 1.964751085449315e-06, - "loss": 0.7109, - "step": 13136 - }, - { - "epoch": 0.34, - "learning_rate": 1.9647438032099085e-06, - "loss": 0.9111, - "step": 13137 - }, - { - "epoch": 0.34, - "learning_rate": 1.9647365202318417e-06, - "loss": 0.8027, - "step": 13138 - }, - { - "epoch": 0.34, - "learning_rate": 1.9647292365151203e-06, - "loss": 0.8115, - "step": 13139 - }, - { - "epoch": 0.34, - "learning_rate": 1.9647219520597506e-06, - "loss": 1.0674, - "step": 13140 - }, - { - "epoch": 0.34, - "learning_rate": 1.964714666865737e-06, - "loss": 0.9648, - "step": 13141 - }, - { - "epoch": 0.34, - "learning_rate": 1.964707380933086e-06, - "loss": 0.959, - "step": 13142 - }, - { - "epoch": 0.34, - "learning_rate": 1.964700094261803e-06, - "loss": 0.9023, - "step": 13143 - }, - { - "epoch": 0.34, - "learning_rate": 1.9646928068518936e-06, - "loss": 0.9746, - "step": 13144 - }, - { - "epoch": 0.34, - "learning_rate": 1.9646855187033632e-06, - "loss": 0.9814, - "step": 13145 - }, - { - "epoch": 0.34, - "learning_rate": 1.9646782298162176e-06, - "loss": 0.8184, - "step": 13146 - }, - { - "epoch": 0.34, - "learning_rate": 1.964670940190462e-06, - "loss": 0.7446, - "step": 13147 - }, - { - "epoch": 0.34, - "learning_rate": 1.964663649826102e-06, - "loss": 0.8486, - "step": 13148 - }, - { - "epoch": 0.34, - "learning_rate": 1.964656358723144e-06, - "loss": 0.9131, - "step": 13149 - }, - { - "epoch": 0.34, - "learning_rate": 1.964649066881593e-06, - "loss": 0.8926, - "step": 13150 - }, - { - "epoch": 0.34, - "learning_rate": 1.964641774301454e-06, - "loss": 0.7383, - "step": 13151 - }, - { - "epoch": 0.34, - "learning_rate": 1.9646344809827335e-06, - "loss": 0.9307, - "step": 13152 - }, - { - "epoch": 0.34, - "learning_rate": 1.9646271869254364e-06, - "loss": 0.9463, - "step": 13153 - }, - { - "epoch": 0.34, - "learning_rate": 1.964619892129569e-06, - "loss": 0.9688, - "step": 13154 - }, - { - "epoch": 0.34, - "learning_rate": 1.964612596595136e-06, - "loss": 1.0996, - "step": 13155 - }, - { - "epoch": 0.34, - "learning_rate": 1.964605300322144e-06, - "loss": 0.8496, - "step": 13156 - }, - { - "epoch": 0.34, - "learning_rate": 1.964598003310598e-06, - "loss": 0.918, - "step": 13157 - }, - { - "epoch": 0.34, - "learning_rate": 1.964590705560503e-06, - "loss": 0.6428, - "step": 13158 - }, - { - "epoch": 0.34, - "learning_rate": 1.964583407071866e-06, - "loss": 1.1318, - "step": 13159 - }, - { - "epoch": 0.34, - "learning_rate": 1.964576107844692e-06, - "loss": 0.8076, - "step": 13160 - }, - { - "epoch": 0.34, - "learning_rate": 1.964568807878986e-06, - "loss": 0.8442, - "step": 13161 - }, - { - "epoch": 0.34, - "learning_rate": 1.964561507174754e-06, - "loss": 0.9609, - "step": 13162 - }, - { - "epoch": 0.34, - "learning_rate": 1.9645542057320016e-06, - "loss": 0.8252, - "step": 13163 - }, - { - "epoch": 0.34, - "learning_rate": 1.9645469035507345e-06, - "loss": 0.9219, - "step": 13164 - }, - { - "epoch": 0.34, - "learning_rate": 1.9645396006309583e-06, - "loss": 1.0518, - "step": 13165 - }, - { - "epoch": 0.34, - "learning_rate": 1.9645322969726783e-06, - "loss": 0.7969, - "step": 13166 - }, - { - "epoch": 0.34, - "learning_rate": 1.9645249925759003e-06, - "loss": 0.9014, - "step": 13167 - }, - { - "epoch": 0.34, - "learning_rate": 1.96451768744063e-06, - "loss": 0.9004, - "step": 13168 - }, - { - "epoch": 0.34, - "learning_rate": 1.9645103815668724e-06, - "loss": 0.9521, - "step": 13169 - }, - { - "epoch": 0.34, - "learning_rate": 1.964503074954634e-06, - "loss": 0.8438, - "step": 13170 - }, - { - "epoch": 0.34, - "learning_rate": 1.9644957676039197e-06, - "loss": 0.7275, - "step": 13171 - }, - { - "epoch": 0.34, - "learning_rate": 1.9644884595147357e-06, - "loss": 0.7805, - "step": 13172 - }, - { - "epoch": 0.34, - "learning_rate": 1.964481150687087e-06, - "loss": 0.9492, - "step": 13173 - }, - { - "epoch": 0.34, - "learning_rate": 1.9644738411209795e-06, - "loss": 1.0645, - "step": 13174 - }, - { - "epoch": 0.34, - "learning_rate": 1.9644665308164186e-06, - "loss": 0.918, - "step": 13175 - }, - { - "epoch": 0.34, - "learning_rate": 1.96445921977341e-06, - "loss": 0.8691, - "step": 13176 - }, - { - "epoch": 0.34, - "learning_rate": 1.9644519079919596e-06, - "loss": 0.6343, - "step": 13177 - }, - { - "epoch": 0.34, - "learning_rate": 1.9644445954720725e-06, - "loss": 0.7588, - "step": 13178 - }, - { - "epoch": 0.34, - "learning_rate": 1.964437282213755e-06, - "loss": 0.9985, - "step": 13179 - }, - { - "epoch": 0.34, - "learning_rate": 1.964429968217011e-06, - "loss": 0.9346, - "step": 13180 - }, - { - "epoch": 0.34, - "learning_rate": 1.9644226534818483e-06, - "loss": 0.8984, - "step": 13181 - }, - { - "epoch": 0.34, - "learning_rate": 1.9644153380082714e-06, - "loss": 0.8467, - "step": 13182 - }, - { - "epoch": 0.34, - "learning_rate": 1.964408021796286e-06, - "loss": 0.7373, - "step": 13183 - }, - { - "epoch": 0.34, - "learning_rate": 1.9644007048458973e-06, - "loss": 1.0605, - "step": 13184 - }, - { - "epoch": 0.34, - "learning_rate": 1.964393387157112e-06, - "loss": 0.9258, - "step": 13185 - }, - { - "epoch": 0.34, - "learning_rate": 1.964386068729935e-06, - "loss": 0.7725, - "step": 13186 - }, - { - "epoch": 0.34, - "learning_rate": 1.9643787495643714e-06, - "loss": 0.7432, - "step": 13187 - }, - { - "epoch": 0.34, - "learning_rate": 1.9643714296604276e-06, - "loss": 0.8364, - "step": 13188 - }, - { - "epoch": 0.34, - "learning_rate": 1.964364109018109e-06, - "loss": 0.9678, - "step": 13189 - }, - { - "epoch": 0.34, - "learning_rate": 1.964356787637421e-06, - "loss": 0.8096, - "step": 13190 - }, - { - "epoch": 0.34, - "learning_rate": 1.9643494655183695e-06, - "loss": 1.0195, - "step": 13191 - }, - { - "epoch": 0.34, - "learning_rate": 1.9643421426609595e-06, - "loss": 0.9424, - "step": 13192 - }, - { - "epoch": 0.34, - "learning_rate": 1.9643348190651976e-06, - "loss": 1.1621, - "step": 13193 - }, - { - "epoch": 0.34, - "learning_rate": 1.964327494731089e-06, - "loss": 1.0977, - "step": 13194 - }, - { - "epoch": 0.34, - "learning_rate": 1.9643201696586386e-06, - "loss": 0.7432, - "step": 13195 - }, - { - "epoch": 0.34, - "learning_rate": 1.964312843847853e-06, - "loss": 0.9805, - "step": 13196 - }, - { - "epoch": 0.34, - "learning_rate": 1.964305517298737e-06, - "loss": 1.1309, - "step": 13197 - }, - { - "epoch": 0.34, - "learning_rate": 1.964298190011297e-06, - "loss": 0.8027, - "step": 13198 - }, - { - "epoch": 0.34, - "learning_rate": 1.9642908619855383e-06, - "loss": 0.7842, - "step": 13199 - }, - { - "epoch": 0.34, - "learning_rate": 1.964283533221466e-06, - "loss": 0.8613, - "step": 13200 - }, - { - "epoch": 0.34, - "learning_rate": 1.9642762037190862e-06, - "loss": 0.9043, - "step": 13201 - }, - { - "epoch": 0.34, - "learning_rate": 1.9642688734784047e-06, - "loss": 0.8477, - "step": 13202 - }, - { - "epoch": 0.34, - "learning_rate": 1.9642615424994267e-06, - "loss": 0.8877, - "step": 13203 - }, - { - "epoch": 0.34, - "learning_rate": 1.964254210782158e-06, - "loss": 0.6704, - "step": 13204 - }, - { - "epoch": 0.34, - "learning_rate": 1.9642468783266042e-06, - "loss": 0.8994, - "step": 13205 - }, - { - "epoch": 0.34, - "learning_rate": 1.964239545132771e-06, - "loss": 0.8174, - "step": 13206 - }, - { - "epoch": 0.34, - "learning_rate": 1.964232211200664e-06, - "loss": 0.8955, - "step": 13207 - }, - { - "epoch": 0.34, - "learning_rate": 1.9642248765302886e-06, - "loss": 0.6753, - "step": 13208 - }, - { - "epoch": 0.34, - "learning_rate": 1.96421754112165e-06, - "loss": 0.9248, - "step": 13209 - }, - { - "epoch": 0.34, - "learning_rate": 1.9642102049747553e-06, - "loss": 0.7415, - "step": 13210 - }, - { - "epoch": 0.34, - "learning_rate": 1.964202868089609e-06, - "loss": 0.6934, - "step": 13211 - }, - { - "epoch": 0.34, - "learning_rate": 1.9641955304662165e-06, - "loss": 0.8945, - "step": 13212 - }, - { - "epoch": 0.34, - "learning_rate": 1.9641881921045837e-06, - "loss": 0.8535, - "step": 13213 - }, - { - "epoch": 0.34, - "learning_rate": 1.9641808530047168e-06, - "loss": 0.9785, - "step": 13214 - }, - { - "epoch": 0.34, - "learning_rate": 1.964173513166621e-06, - "loss": 0.9365, - "step": 13215 - }, - { - "epoch": 0.34, - "learning_rate": 1.9641661725903014e-06, - "loss": 1.0693, - "step": 13216 - }, - { - "epoch": 0.34, - "learning_rate": 1.9641588312757643e-06, - "loss": 0.6865, - "step": 13217 - }, - { - "epoch": 0.34, - "learning_rate": 1.964151489223015e-06, - "loss": 0.9561, - "step": 13218 - }, - { - "epoch": 0.34, - "learning_rate": 1.9641441464320595e-06, - "loss": 0.9014, - "step": 13219 - }, - { - "epoch": 0.34, - "learning_rate": 1.964136802902903e-06, - "loss": 0.9785, - "step": 13220 - }, - { - "epoch": 0.34, - "learning_rate": 1.9641294586355516e-06, - "loss": 0.8174, - "step": 13221 - }, - { - "epoch": 0.34, - "learning_rate": 1.9641221136300104e-06, - "loss": 0.7476, - "step": 13222 - }, - { - "epoch": 0.34, - "learning_rate": 1.964114767886285e-06, - "loss": 0.9092, - "step": 13223 - }, - { - "epoch": 0.34, - "learning_rate": 1.9641074214043812e-06, - "loss": 0.832, - "step": 13224 - }, - { - "epoch": 0.34, - "learning_rate": 1.964100074184305e-06, - "loss": 1.1523, - "step": 13225 - }, - { - "epoch": 0.34, - "learning_rate": 1.9640927262260617e-06, - "loss": 0.9844, - "step": 13226 - }, - { - "epoch": 0.34, - "learning_rate": 1.9640853775296567e-06, - "loss": 1.0879, - "step": 13227 - }, - { - "epoch": 0.34, - "learning_rate": 1.9640780280950963e-06, - "loss": 0.9277, - "step": 13228 - }, - { - "epoch": 0.34, - "learning_rate": 1.9640706779223852e-06, - "loss": 0.9155, - "step": 13229 - }, - { - "epoch": 0.34, - "learning_rate": 1.96406332701153e-06, - "loss": 0.895, - "step": 13230 - }, - { - "epoch": 0.34, - "learning_rate": 1.9640559753625352e-06, - "loss": 0.7778, - "step": 13231 - }, - { - "epoch": 0.34, - "learning_rate": 1.9640486229754073e-06, - "loss": 0.8052, - "step": 13232 - }, - { - "epoch": 0.34, - "learning_rate": 1.964041269850152e-06, - "loss": 0.7529, - "step": 13233 - }, - { - "epoch": 0.34, - "learning_rate": 1.9640339159867744e-06, - "loss": 0.8311, - "step": 13234 - }, - { - "epoch": 0.34, - "learning_rate": 1.9640265613852804e-06, - "loss": 0.7432, - "step": 13235 - }, - { - "epoch": 0.34, - "learning_rate": 1.9640192060456756e-06, - "loss": 1.0654, - "step": 13236 - }, - { - "epoch": 0.34, - "learning_rate": 1.9640118499679654e-06, - "loss": 0.9502, - "step": 13237 - }, - { - "epoch": 0.34, - "learning_rate": 1.964004493152156e-06, - "loss": 1.207, - "step": 13238 - }, - { - "epoch": 0.34, - "learning_rate": 1.9639971355982526e-06, - "loss": 0.9487, - "step": 13239 - }, - { - "epoch": 0.34, - "learning_rate": 1.9639897773062607e-06, - "loss": 0.9473, - "step": 13240 - }, - { - "epoch": 0.34, - "learning_rate": 1.9639824182761862e-06, - "loss": 0.9014, - "step": 13241 - }, - { - "epoch": 0.34, - "learning_rate": 1.963975058508035e-06, - "loss": 0.8125, - "step": 13242 - }, - { - "epoch": 0.34, - "learning_rate": 1.963967698001812e-06, - "loss": 0.9238, - "step": 13243 - }, - { - "epoch": 0.34, - "learning_rate": 1.963960336757524e-06, - "loss": 1.0146, - "step": 13244 - }, - { - "epoch": 0.34, - "learning_rate": 1.963952974775175e-06, - "loss": 0.8633, - "step": 13245 - }, - { - "epoch": 0.34, - "learning_rate": 1.963945612054772e-06, - "loss": 0.959, - "step": 13246 - }, - { - "epoch": 0.34, - "learning_rate": 1.96393824859632e-06, - "loss": 1.2422, - "step": 13247 - }, - { - "epoch": 0.34, - "learning_rate": 1.9639308843998247e-06, - "loss": 0.7485, - "step": 13248 - }, - { - "epoch": 0.34, - "learning_rate": 1.963923519465292e-06, - "loss": 0.9072, - "step": 13249 - }, - { - "epoch": 0.34, - "learning_rate": 1.9639161537927275e-06, - "loss": 0.8701, - "step": 13250 - }, - { - "epoch": 0.34, - "learning_rate": 1.9639087873821365e-06, - "loss": 0.9092, - "step": 13251 - }, - { - "epoch": 0.34, - "learning_rate": 1.9639014202335253e-06, - "loss": 1.0195, - "step": 13252 - }, - { - "epoch": 0.34, - "learning_rate": 1.9638940523468985e-06, - "loss": 1.0215, - "step": 13253 - }, - { - "epoch": 0.34, - "learning_rate": 1.963886683722263e-06, - "loss": 0.9395, - "step": 13254 - }, - { - "epoch": 0.34, - "learning_rate": 1.963879314359623e-06, - "loss": 0.854, - "step": 13255 - }, - { - "epoch": 0.34, - "learning_rate": 1.9638719442589852e-06, - "loss": 0.8984, - "step": 13256 - }, - { - "epoch": 0.34, - "learning_rate": 1.963864573420355e-06, - "loss": 0.4907, - "step": 13257 - }, - { - "epoch": 0.34, - "learning_rate": 1.9638572018437384e-06, - "loss": 0.7969, - "step": 13258 - }, - { - "epoch": 0.34, - "learning_rate": 1.9638498295291406e-06, - "loss": 0.7437, - "step": 13259 - }, - { - "epoch": 0.34, - "learning_rate": 1.963842456476567e-06, - "loss": 0.9082, - "step": 13260 - }, - { - "epoch": 0.34, - "learning_rate": 1.9638350826860236e-06, - "loss": 1.0205, - "step": 13261 - }, - { - "epoch": 0.34, - "learning_rate": 1.9638277081575162e-06, - "loss": 0.9639, - "step": 13262 - }, - { - "epoch": 0.34, - "learning_rate": 1.96382033289105e-06, - "loss": 0.9775, - "step": 13263 - }, - { - "epoch": 0.34, - "learning_rate": 1.963812956886631e-06, - "loss": 0.6929, - "step": 13264 - }, - { - "epoch": 0.34, - "learning_rate": 1.9638055801442646e-06, - "loss": 0.8516, - "step": 13265 - }, - { - "epoch": 0.34, - "learning_rate": 1.9637982026639567e-06, - "loss": 0.9785, - "step": 13266 - }, - { - "epoch": 0.34, - "learning_rate": 1.963790824445713e-06, - "loss": 1.1416, - "step": 13267 - }, - { - "epoch": 0.34, - "learning_rate": 1.9637834454895386e-06, - "loss": 0.6143, - "step": 13268 - }, - { - "epoch": 0.34, - "learning_rate": 1.96377606579544e-06, - "loss": 0.8994, - "step": 13269 - }, - { - "epoch": 0.34, - "learning_rate": 1.963768685363422e-06, - "loss": 0.959, - "step": 13270 - }, - { - "epoch": 0.34, - "learning_rate": 1.9637613041934907e-06, - "loss": 0.6519, - "step": 13271 - }, - { - "epoch": 0.34, - "learning_rate": 1.9637539222856518e-06, - "loss": 0.9395, - "step": 13272 - }, - { - "epoch": 0.34, - "learning_rate": 1.963746539639911e-06, - "loss": 0.9062, - "step": 13273 - }, - { - "epoch": 0.34, - "learning_rate": 1.9637391562562733e-06, - "loss": 0.9375, - "step": 13274 - }, - { - "epoch": 0.34, - "learning_rate": 1.963731772134745e-06, - "loss": 1.082, - "step": 13275 - }, - { - "epoch": 0.34, - "learning_rate": 1.963724387275332e-06, - "loss": 0.9863, - "step": 13276 - }, - { - "epoch": 0.34, - "learning_rate": 1.963717001678039e-06, - "loss": 0.7229, - "step": 13277 - }, - { - "epoch": 0.34, - "learning_rate": 1.9637096153428724e-06, - "loss": 0.915, - "step": 13278 - }, - { - "epoch": 0.34, - "learning_rate": 1.9637022282698376e-06, - "loss": 0.874, - "step": 13279 - }, - { - "epoch": 0.34, - "learning_rate": 1.9636948404589405e-06, - "loss": 1.1396, - "step": 13280 - }, - { - "epoch": 0.34, - "learning_rate": 1.9636874519101867e-06, - "loss": 0.8438, - "step": 13281 - }, - { - "epoch": 0.34, - "learning_rate": 1.9636800626235812e-06, - "loss": 0.9146, - "step": 13282 - }, - { - "epoch": 0.34, - "learning_rate": 1.963672672599131e-06, - "loss": 0.9854, - "step": 13283 - }, - { - "epoch": 0.34, - "learning_rate": 1.9636652818368403e-06, - "loss": 0.9424, - "step": 13284 - }, - { - "epoch": 0.34, - "learning_rate": 1.9636578903367154e-06, - "loss": 0.916, - "step": 13285 - }, - { - "epoch": 0.34, - "learning_rate": 1.963650498098762e-06, - "loss": 0.7432, - "step": 13286 - }, - { - "epoch": 0.34, - "learning_rate": 1.963643105122986e-06, - "loss": 0.8047, - "step": 13287 - }, - { - "epoch": 0.34, - "learning_rate": 1.963635711409393e-06, - "loss": 0.8164, - "step": 13288 - }, - { - "epoch": 0.34, - "learning_rate": 1.963628316957988e-06, - "loss": 0.7095, - "step": 13289 - }, - { - "epoch": 0.34, - "learning_rate": 1.963620921768777e-06, - "loss": 1.0742, - "step": 13290 - }, - { - "epoch": 0.34, - "learning_rate": 1.963613525841766e-06, - "loss": 0.6787, - "step": 13291 - }, - { - "epoch": 0.34, - "learning_rate": 1.9636061291769607e-06, - "loss": 1.0371, - "step": 13292 - }, - { - "epoch": 0.34, - "learning_rate": 1.963598731774366e-06, - "loss": 0.8682, - "step": 13293 - }, - { - "epoch": 0.34, - "learning_rate": 1.963591333633988e-06, - "loss": 0.8389, - "step": 13294 - }, - { - "epoch": 0.34, - "learning_rate": 1.963583934755833e-06, - "loss": 0.8262, - "step": 13295 - }, - { - "epoch": 0.34, - "learning_rate": 1.9635765351399055e-06, - "loss": 0.8506, - "step": 13296 - }, - { - "epoch": 0.34, - "learning_rate": 1.963569134786212e-06, - "loss": 0.9033, - "step": 13297 - }, - { - "epoch": 0.34, - "learning_rate": 1.963561733694758e-06, - "loss": 1.0713, - "step": 13298 - }, - { - "epoch": 0.34, - "learning_rate": 1.963554331865549e-06, - "loss": 0.8691, - "step": 13299 - }, - { - "epoch": 0.34, - "learning_rate": 1.9635469292985908e-06, - "loss": 0.9922, - "step": 13300 - }, - { - "epoch": 0.34, - "learning_rate": 1.963539525993889e-06, - "loss": 1.209, - "step": 13301 - }, - { - "epoch": 0.34, - "learning_rate": 1.963532121951449e-06, - "loss": 0.9922, - "step": 13302 - }, - { - "epoch": 0.34, - "learning_rate": 1.9635247171712774e-06, - "loss": 0.9414, - "step": 13303 - }, - { - "epoch": 0.34, - "learning_rate": 1.963517311653379e-06, - "loss": 0.7749, - "step": 13304 - }, - { - "epoch": 0.34, - "learning_rate": 1.9635099053977592e-06, - "loss": 1.1143, - "step": 13305 - }, - { - "epoch": 0.34, - "learning_rate": 1.9635024984044247e-06, - "loss": 0.7578, - "step": 13306 - }, - { - "epoch": 0.34, - "learning_rate": 1.9634950906733803e-06, - "loss": 0.7388, - "step": 13307 - }, - { - "epoch": 0.34, - "learning_rate": 1.9634876822046325e-06, - "loss": 0.7998, - "step": 13308 - }, - { - "epoch": 0.34, - "learning_rate": 1.963480272998186e-06, - "loss": 0.7651, - "step": 13309 - }, - { - "epoch": 0.34, - "learning_rate": 1.9634728630540473e-06, - "loss": 0.7334, - "step": 13310 - }, - { - "epoch": 0.34, - "learning_rate": 1.9634654523722214e-06, - "loss": 1.0439, - "step": 13311 - }, - { - "epoch": 0.34, - "learning_rate": 1.9634580409527145e-06, - "loss": 0.8442, - "step": 13312 - }, - { - "epoch": 0.34, - "learning_rate": 1.963450628795532e-06, - "loss": 0.6587, - "step": 13313 - }, - { - "epoch": 0.34, - "learning_rate": 1.9634432159006796e-06, - "loss": 0.998, - "step": 13314 - }, - { - "epoch": 0.34, - "learning_rate": 1.963435802268163e-06, - "loss": 0.8867, - "step": 13315 - }, - { - "epoch": 0.34, - "learning_rate": 1.963428387897988e-06, - "loss": 0.9561, - "step": 13316 - }, - { - "epoch": 0.34, - "learning_rate": 1.9634209727901606e-06, - "loss": 1.1445, - "step": 13317 - }, - { - "epoch": 0.34, - "learning_rate": 1.9634135569446854e-06, - "loss": 1.0, - "step": 13318 - }, - { - "epoch": 0.34, - "learning_rate": 1.963406140361569e-06, - "loss": 0.8647, - "step": 13319 - }, - { - "epoch": 0.34, - "learning_rate": 1.963398723040817e-06, - "loss": 0.9717, - "step": 13320 - }, - { - "epoch": 0.34, - "learning_rate": 1.963391304982435e-06, - "loss": 0.8721, - "step": 13321 - }, - { - "epoch": 0.34, - "learning_rate": 1.963383886186428e-06, - "loss": 0.6763, - "step": 13322 - }, - { - "epoch": 0.34, - "learning_rate": 1.9633764666528025e-06, - "loss": 1.1094, - "step": 13323 - }, - { - "epoch": 0.34, - "learning_rate": 1.963369046381564e-06, - "loss": 0.876, - "step": 13324 - }, - { - "epoch": 0.34, - "learning_rate": 1.9633616253727184e-06, - "loss": 0.9297, - "step": 13325 - }, - { - "epoch": 0.34, - "learning_rate": 1.963354203626271e-06, - "loss": 0.7186, - "step": 13326 - }, - { - "epoch": 0.34, - "learning_rate": 1.9633467811422267e-06, - "loss": 1.1621, - "step": 13327 - }, - { - "epoch": 0.34, - "learning_rate": 1.963339357920593e-06, - "loss": 0.8711, - "step": 13328 - }, - { - "epoch": 0.34, - "learning_rate": 1.9633319339613744e-06, - "loss": 0.7876, - "step": 13329 - }, - { - "epoch": 0.34, - "learning_rate": 1.963324509264577e-06, - "loss": 0.8809, - "step": 13330 - }, - { - "epoch": 0.34, - "learning_rate": 1.9633170838302064e-06, - "loss": 0.8486, - "step": 13331 - }, - { - "epoch": 0.34, - "learning_rate": 1.9633096576582675e-06, - "loss": 0.9385, - "step": 13332 - }, - { - "epoch": 0.34, - "learning_rate": 1.963302230748767e-06, - "loss": 0.8447, - "step": 13333 - }, - { - "epoch": 0.34, - "learning_rate": 1.9632948031017107e-06, - "loss": 0.5957, - "step": 13334 - }, - { - "epoch": 0.34, - "learning_rate": 1.9632873747171037e-06, - "loss": 0.9131, - "step": 13335 - }, - { - "epoch": 0.34, - "learning_rate": 1.9632799455949516e-06, - "loss": 0.7935, - "step": 13336 - }, - { - "epoch": 0.34, - "learning_rate": 1.9632725157352604e-06, - "loss": 0.6377, - "step": 13337 - }, - { - "epoch": 0.34, - "learning_rate": 1.963265085138036e-06, - "loss": 0.9512, - "step": 13338 - }, - { - "epoch": 0.34, - "learning_rate": 1.9632576538032836e-06, - "loss": 0.79, - "step": 13339 - }, - { - "epoch": 0.34, - "learning_rate": 1.963250221731009e-06, - "loss": 0.8203, - "step": 13340 - }, - { - "epoch": 0.34, - "learning_rate": 1.963242788921218e-06, - "loss": 0.8066, - "step": 13341 - }, - { - "epoch": 0.34, - "learning_rate": 1.963235355373917e-06, - "loss": 0.8691, - "step": 13342 - }, - { - "epoch": 0.34, - "learning_rate": 1.96322792108911e-06, - "loss": 1.0088, - "step": 13343 - }, - { - "epoch": 0.34, - "learning_rate": 1.9632204860668043e-06, - "loss": 0.918, - "step": 13344 - }, - { - "epoch": 0.34, - "learning_rate": 1.9632130503070048e-06, - "loss": 1.0029, - "step": 13345 - }, - { - "epoch": 0.34, - "learning_rate": 1.963205613809717e-06, - "loss": 0.8662, - "step": 13346 - }, - { - "epoch": 0.34, - "learning_rate": 1.963198176574947e-06, - "loss": 0.8154, - "step": 13347 - }, - { - "epoch": 0.34, - "learning_rate": 1.963190738602701e-06, - "loss": 0.8086, - "step": 13348 - }, - { - "epoch": 0.34, - "learning_rate": 1.963183299892984e-06, - "loss": 0.9446, - "step": 13349 - }, - { - "epoch": 0.34, - "learning_rate": 1.9631758604458013e-06, - "loss": 0.9941, - "step": 13350 - }, - { - "epoch": 0.34, - "learning_rate": 1.9631684202611596e-06, - "loss": 0.9932, - "step": 13351 - }, - { - "epoch": 0.34, - "learning_rate": 1.963160979339064e-06, - "loss": 0.9551, - "step": 13352 - }, - { - "epoch": 0.34, - "learning_rate": 1.9631535376795203e-06, - "loss": 0.8979, - "step": 13353 - }, - { - "epoch": 0.34, - "learning_rate": 1.963146095282534e-06, - "loss": 0.8447, - "step": 13354 - }, - { - "epoch": 0.34, - "learning_rate": 1.9631386521481117e-06, - "loss": 0.7734, - "step": 13355 - }, - { - "epoch": 0.34, - "learning_rate": 1.963131208276258e-06, - "loss": 1.1309, - "step": 13356 - }, - { - "epoch": 0.34, - "learning_rate": 1.963123763666979e-06, - "loss": 0.9512, - "step": 13357 - }, - { - "epoch": 0.34, - "learning_rate": 1.9631163183202805e-06, - "loss": 1.0771, - "step": 13358 - }, - { - "epoch": 0.34, - "learning_rate": 1.9631088722361683e-06, - "loss": 0.9141, - "step": 13359 - }, - { - "epoch": 0.34, - "learning_rate": 1.9631014254146475e-06, - "loss": 0.8555, - "step": 13360 - }, - { - "epoch": 0.34, - "learning_rate": 1.9630939778557243e-06, - "loss": 0.9497, - "step": 13361 - }, - { - "epoch": 0.34, - "learning_rate": 1.9630865295594043e-06, - "loss": 1.1094, - "step": 13362 - }, - { - "epoch": 0.34, - "learning_rate": 1.9630790805256934e-06, - "loss": 0.7798, - "step": 13363 - }, - { - "epoch": 0.34, - "learning_rate": 1.963071630754597e-06, - "loss": 0.6733, - "step": 13364 - }, - { - "epoch": 0.34, - "learning_rate": 1.963064180246121e-06, - "loss": 0.8193, - "step": 13365 - }, - { - "epoch": 0.34, - "learning_rate": 1.9630567290002714e-06, - "loss": 0.8496, - "step": 13366 - }, - { - "epoch": 0.34, - "learning_rate": 1.963049277017053e-06, - "loss": 0.6421, - "step": 13367 - }, - { - "epoch": 0.34, - "learning_rate": 1.9630418242964723e-06, - "loss": 0.8496, - "step": 13368 - }, - { - "epoch": 0.34, - "learning_rate": 1.9630343708385347e-06, - "loss": 0.8809, - "step": 13369 - }, - { - "epoch": 0.34, - "learning_rate": 1.9630269166432465e-06, - "loss": 0.7485, - "step": 13370 - }, - { - "epoch": 0.34, - "learning_rate": 1.963019461710612e-06, - "loss": 0.917, - "step": 13371 - }, - { - "epoch": 0.34, - "learning_rate": 1.963012006040638e-06, - "loss": 0.9219, - "step": 13372 - }, - { - "epoch": 0.34, - "learning_rate": 1.9630045496333303e-06, - "loss": 1.0146, - "step": 13373 - }, - { - "epoch": 0.34, - "learning_rate": 1.962997092488694e-06, - "loss": 1.1221, - "step": 13374 - }, - { - "epoch": 0.34, - "learning_rate": 1.962989634606735e-06, - "loss": 0.9668, - "step": 13375 - }, - { - "epoch": 0.34, - "learning_rate": 1.96298217598746e-06, - "loss": 0.8135, - "step": 13376 - }, - { - "epoch": 0.34, - "learning_rate": 1.962974716630873e-06, - "loss": 0.9912, - "step": 13377 - }, - { - "epoch": 0.34, - "learning_rate": 1.9629672565369807e-06, - "loss": 0.96, - "step": 13378 - }, - { - "epoch": 0.34, - "learning_rate": 1.9629597957057886e-06, - "loss": 0.8574, - "step": 13379 - }, - { - "epoch": 0.34, - "learning_rate": 1.9629523341373025e-06, - "loss": 0.5601, - "step": 13380 - }, - { - "epoch": 0.34, - "learning_rate": 1.962944871831528e-06, - "loss": 0.9492, - "step": 13381 - }, - { - "epoch": 0.34, - "learning_rate": 1.9629374087884713e-06, - "loss": 0.7998, - "step": 13382 - }, - { - "epoch": 0.34, - "learning_rate": 1.962929945008137e-06, - "loss": 0.8965, - "step": 13383 - }, - { - "epoch": 0.34, - "learning_rate": 1.962922480490532e-06, - "loss": 0.9219, - "step": 13384 - }, - { - "epoch": 0.34, - "learning_rate": 1.9629150152356613e-06, - "loss": 0.811, - "step": 13385 - }, - { - "epoch": 0.34, - "learning_rate": 1.9629075492435313e-06, - "loss": 0.8779, - "step": 13386 - }, - { - "epoch": 0.34, - "learning_rate": 1.962900082514147e-06, - "loss": 0.8926, - "step": 13387 - }, - { - "epoch": 0.34, - "learning_rate": 1.962892615047514e-06, - "loss": 0.6348, - "step": 13388 - }, - { - "epoch": 0.34, - "learning_rate": 1.962885146843639e-06, - "loss": 0.8398, - "step": 13389 - }, - { - "epoch": 0.34, - "learning_rate": 1.962877677902527e-06, - "loss": 0.7173, - "step": 13390 - }, - { - "epoch": 0.34, - "learning_rate": 1.9628702082241836e-06, - "loss": 1.0244, - "step": 13391 - }, - { - "epoch": 0.34, - "learning_rate": 1.962862737808615e-06, - "loss": 0.8633, - "step": 13392 - }, - { - "epoch": 0.34, - "learning_rate": 1.9628552666558263e-06, - "loss": 0.9902, - "step": 13393 - }, - { - "epoch": 0.34, - "learning_rate": 1.9628477947658237e-06, - "loss": 0.8818, - "step": 13394 - }, - { - "epoch": 0.34, - "learning_rate": 1.962840322138613e-06, - "loss": 1.0293, - "step": 13395 - }, - { - "epoch": 0.34, - "learning_rate": 1.9628328487741998e-06, - "loss": 0.8184, - "step": 13396 - }, - { - "epoch": 0.34, - "learning_rate": 1.9628253746725895e-06, - "loss": 0.9619, - "step": 13397 - }, - { - "epoch": 0.34, - "learning_rate": 1.962817899833788e-06, - "loss": 0.7764, - "step": 13398 - }, - { - "epoch": 0.34, - "learning_rate": 1.9628104242578015e-06, - "loss": 0.917, - "step": 13399 - }, - { - "epoch": 0.34, - "learning_rate": 1.962802947944635e-06, - "loss": 0.9707, - "step": 13400 - }, - { - "epoch": 0.34, - "learning_rate": 1.962795470894295e-06, - "loss": 0.8096, - "step": 13401 - }, - { - "epoch": 0.34, - "learning_rate": 1.9627879931067868e-06, - "loss": 0.8662, - "step": 13402 - }, - { - "epoch": 0.34, - "learning_rate": 1.9627805145821153e-06, - "loss": 0.9658, - "step": 13403 - }, - { - "epoch": 0.34, - "learning_rate": 1.9627730353202875e-06, - "loss": 0.917, - "step": 13404 - }, - { - "epoch": 0.34, - "learning_rate": 1.9627655553213086e-06, - "loss": 0.6838, - "step": 13405 - }, - { - "epoch": 0.34, - "learning_rate": 1.962758074585185e-06, - "loss": 0.7944, - "step": 13406 - }, - { - "epoch": 0.34, - "learning_rate": 1.962750593111921e-06, - "loss": 1.1201, - "step": 13407 - }, - { - "epoch": 0.34, - "learning_rate": 1.962743110901523e-06, - "loss": 0.8369, - "step": 13408 - }, - { - "epoch": 0.34, - "learning_rate": 1.9627356279539976e-06, - "loss": 0.9102, - "step": 13409 - }, - { - "epoch": 0.34, - "learning_rate": 1.9627281442693496e-06, - "loss": 0.7275, - "step": 13410 - }, - { - "epoch": 0.34, - "learning_rate": 1.9627206598475843e-06, - "loss": 0.7412, - "step": 13411 - }, - { - "epoch": 0.34, - "learning_rate": 1.962713174688709e-06, - "loss": 0.8289, - "step": 13412 - }, - { - "epoch": 0.34, - "learning_rate": 1.962705688792728e-06, - "loss": 0.8389, - "step": 13413 - }, - { - "epoch": 0.34, - "learning_rate": 1.962698202159648e-06, - "loss": 0.8945, - "step": 13414 - }, - { - "epoch": 0.34, - "learning_rate": 1.9626907147894735e-06, - "loss": 0.9014, - "step": 13415 - }, - { - "epoch": 0.34, - "learning_rate": 1.962683226682211e-06, - "loss": 0.9072, - "step": 13416 - }, - { - "epoch": 0.34, - "learning_rate": 1.9626757378378666e-06, - "loss": 0.9463, - "step": 13417 - }, - { - "epoch": 0.34, - "learning_rate": 1.9626682482564455e-06, - "loss": 0.8867, - "step": 13418 - }, - { - "epoch": 0.34, - "learning_rate": 1.9626607579379536e-06, - "loss": 0.9893, - "step": 13419 - }, - { - "epoch": 0.34, - "learning_rate": 1.962653266882397e-06, - "loss": 0.6162, - "step": 13420 - }, - { - "epoch": 0.34, - "learning_rate": 1.9626457750897806e-06, - "loss": 1.1484, - "step": 13421 - }, - { - "epoch": 0.34, - "learning_rate": 1.962638282560111e-06, - "loss": 0.8208, - "step": 13422 - }, - { - "epoch": 0.34, - "learning_rate": 1.962630789293393e-06, - "loss": 0.8252, - "step": 13423 - }, - { - "epoch": 0.34, - "learning_rate": 1.962623295289633e-06, - "loss": 0.9834, - "step": 13424 - }, - { - "epoch": 0.34, - "learning_rate": 1.962615800548837e-06, - "loss": 0.9746, - "step": 13425 - }, - { - "epoch": 0.34, - "learning_rate": 1.96260830507101e-06, - "loss": 0.8516, - "step": 13426 - }, - { - "epoch": 0.34, - "learning_rate": 1.962600808856158e-06, - "loss": 0.9795, - "step": 13427 - }, - { - "epoch": 0.34, - "learning_rate": 1.9625933119042873e-06, - "loss": 0.8516, - "step": 13428 - }, - { - "epoch": 0.34, - "learning_rate": 1.9625858142154027e-06, - "loss": 0.8574, - "step": 13429 - }, - { - "epoch": 0.34, - "learning_rate": 1.962578315789511e-06, - "loss": 0.8887, - "step": 13430 - }, - { - "epoch": 0.34, - "learning_rate": 1.9625708166266164e-06, - "loss": 1.0332, - "step": 13431 - }, - { - "epoch": 0.34, - "learning_rate": 1.9625633167267263e-06, - "loss": 0.9404, - "step": 13432 - }, - { - "epoch": 0.34, - "learning_rate": 1.9625558160898455e-06, - "loss": 1.0381, - "step": 13433 - }, - { - "epoch": 0.34, - "learning_rate": 1.96254831471598e-06, - "loss": 0.8735, - "step": 13434 - }, - { - "epoch": 0.34, - "learning_rate": 1.9625408126051352e-06, - "loss": 0.8203, - "step": 13435 - }, - { - "epoch": 0.34, - "learning_rate": 1.9625333097573176e-06, - "loss": 0.9492, - "step": 13436 - }, - { - "epoch": 0.34, - "learning_rate": 1.9625258061725326e-06, - "loss": 0.8359, - "step": 13437 - }, - { - "epoch": 0.34, - "learning_rate": 1.9625183018507854e-06, - "loss": 0.749, - "step": 13438 - }, - { - "epoch": 0.34, - "learning_rate": 1.9625107967920826e-06, - "loss": 0.7173, - "step": 13439 - }, - { - "epoch": 0.34, - "learning_rate": 1.962503290996429e-06, - "loss": 0.9385, - "step": 13440 - }, - { - "epoch": 0.34, - "learning_rate": 1.9624957844638312e-06, - "loss": 0.7812, - "step": 13441 - }, - { - "epoch": 0.34, - "learning_rate": 1.962488277194295e-06, - "loss": 1.166, - "step": 13442 - }, - { - "epoch": 0.34, - "learning_rate": 1.962480769187825e-06, - "loss": 0.8291, - "step": 13443 - }, - { - "epoch": 0.34, - "learning_rate": 1.9624732604444283e-06, - "loss": 0.8848, - "step": 13444 - }, - { - "epoch": 0.34, - "learning_rate": 1.96246575096411e-06, - "loss": 0.8652, - "step": 13445 - }, - { - "epoch": 0.34, - "learning_rate": 1.962458240746876e-06, - "loss": 0.8125, - "step": 13446 - }, - { - "epoch": 0.34, - "learning_rate": 1.962450729792732e-06, - "loss": 1.084, - "step": 13447 - }, - { - "epoch": 0.34, - "learning_rate": 1.9624432181016833e-06, - "loss": 0.8691, - "step": 13448 - }, - { - "epoch": 0.34, - "learning_rate": 1.9624357056737362e-06, - "loss": 0.8662, - "step": 13449 - }, - { - "epoch": 0.34, - "learning_rate": 1.962428192508897e-06, - "loss": 0.8047, - "step": 13450 - }, - { - "epoch": 0.34, - "learning_rate": 1.96242067860717e-06, - "loss": 0.9482, - "step": 13451 - }, - { - "epoch": 0.34, - "learning_rate": 1.9624131639685623e-06, - "loss": 1.0654, - "step": 13452 - }, - { - "epoch": 0.34, - "learning_rate": 1.9624056485930787e-06, - "loss": 0.9932, - "step": 13453 - }, - { - "epoch": 0.34, - "learning_rate": 1.9623981324807256e-06, - "loss": 0.8701, - "step": 13454 - }, - { - "epoch": 0.34, - "learning_rate": 1.9623906156315084e-06, - "loss": 0.8574, - "step": 13455 - }, - { - "epoch": 0.34, - "learning_rate": 1.9623830980454327e-06, - "loss": 1.0557, - "step": 13456 - }, - { - "epoch": 0.34, - "learning_rate": 1.9623755797225048e-06, - "loss": 0.918, - "step": 13457 - }, - { - "epoch": 0.34, - "learning_rate": 1.9623680606627302e-06, - "loss": 0.7041, - "step": 13458 - }, - { - "epoch": 0.34, - "learning_rate": 1.9623605408661145e-06, - "loss": 0.666, - "step": 13459 - }, - { - "epoch": 0.34, - "learning_rate": 1.9623530203326636e-06, - "loss": 1.1211, - "step": 13460 - }, - { - "epoch": 0.35, - "learning_rate": 1.9623454990623834e-06, - "loss": 0.6279, - "step": 13461 - }, - { - "epoch": 0.35, - "learning_rate": 1.9623379770552793e-06, - "loss": 1.0098, - "step": 13462 - }, - { - "epoch": 0.35, - "learning_rate": 1.9623304543113574e-06, - "loss": 1.0605, - "step": 13463 - }, - { - "epoch": 0.35, - "learning_rate": 1.962322930830623e-06, - "loss": 0.9043, - "step": 13464 - }, - { - "epoch": 0.35, - "learning_rate": 1.962315406613083e-06, - "loss": 0.8799, - "step": 13465 - }, - { - "epoch": 0.35, - "learning_rate": 1.9623078816587417e-06, - "loss": 0.7598, - "step": 13466 - }, - { - "epoch": 0.35, - "learning_rate": 1.9623003559676055e-06, - "loss": 0.6401, - "step": 13467 - }, - { - "epoch": 0.35, - "learning_rate": 1.9622928295396802e-06, - "loss": 1.0039, - "step": 13468 - }, - { - "epoch": 0.35, - "learning_rate": 1.9622853023749714e-06, - "loss": 0.8486, - "step": 13469 - }, - { - "epoch": 0.35, - "learning_rate": 1.9622777744734854e-06, - "loss": 0.874, - "step": 13470 - }, - { - "epoch": 0.35, - "learning_rate": 1.962270245835227e-06, - "loss": 0.8096, - "step": 13471 - }, - { - "epoch": 0.35, - "learning_rate": 1.962262716460203e-06, - "loss": 0.7852, - "step": 13472 - }, - { - "epoch": 0.35, - "learning_rate": 1.9622551863484186e-06, - "loss": 0.8711, - "step": 13473 - }, - { - "epoch": 0.35, - "learning_rate": 1.9622476554998797e-06, - "loss": 0.9678, - "step": 13474 - }, - { - "epoch": 0.35, - "learning_rate": 1.962240123914592e-06, - "loss": 0.8789, - "step": 13475 - }, - { - "epoch": 0.35, - "learning_rate": 1.9622325915925607e-06, - "loss": 0.8857, - "step": 13476 - }, - { - "epoch": 0.35, - "learning_rate": 1.962225058533793e-06, - "loss": 0.7725, - "step": 13477 - }, - { - "epoch": 0.35, - "learning_rate": 1.9622175247382935e-06, - "loss": 0.6416, - "step": 13478 - }, - { - "epoch": 0.35, - "learning_rate": 1.962209990206068e-06, - "loss": 0.9111, - "step": 13479 - }, - { - "epoch": 0.35, - "learning_rate": 1.9622024549371228e-06, - "loss": 0.9688, - "step": 13480 - }, - { - "epoch": 0.35, - "learning_rate": 1.9621949189314635e-06, - "loss": 0.9736, - "step": 13481 - }, - { - "epoch": 0.35, - "learning_rate": 1.9621873821890957e-06, - "loss": 0.8154, - "step": 13482 - }, - { - "epoch": 0.35, - "learning_rate": 1.962179844710025e-06, - "loss": 1.0996, - "step": 13483 - }, - { - "epoch": 0.35, - "learning_rate": 1.962172306494258e-06, - "loss": 0.9072, - "step": 13484 - }, - { - "epoch": 0.35, - "learning_rate": 1.9621647675417994e-06, - "loss": 0.7144, - "step": 13485 - }, - { - "epoch": 0.35, - "learning_rate": 1.9621572278526555e-06, - "loss": 0.8472, - "step": 13486 - }, - { - "epoch": 0.35, - "learning_rate": 1.9621496874268323e-06, - "loss": 0.6958, - "step": 13487 - }, - { - "epoch": 0.35, - "learning_rate": 1.9621421462643353e-06, - "loss": 0.9893, - "step": 13488 - }, - { - "epoch": 0.35, - "learning_rate": 1.9621346043651703e-06, - "loss": 1.1025, - "step": 13489 - }, - { - "epoch": 0.35, - "learning_rate": 1.9621270617293433e-06, - "loss": 0.8682, - "step": 13490 - }, - { - "epoch": 0.35, - "learning_rate": 1.9621195183568593e-06, - "loss": 0.8896, - "step": 13491 - }, - { - "epoch": 0.35, - "learning_rate": 1.9621119742477252e-06, - "loss": 0.6711, - "step": 13492 - }, - { - "epoch": 0.35, - "learning_rate": 1.9621044294019456e-06, - "loss": 0.8066, - "step": 13493 - }, - { - "epoch": 0.35, - "learning_rate": 1.9620968838195273e-06, - "loss": 0.918, - "step": 13494 - }, - { - "epoch": 0.35, - "learning_rate": 1.9620893375004753e-06, - "loss": 0.8672, - "step": 13495 - }, - { - "epoch": 0.35, - "learning_rate": 1.962081790444796e-06, - "loss": 0.8682, - "step": 13496 - }, - { - "epoch": 0.35, - "learning_rate": 1.962074242652495e-06, - "loss": 0.8965, - "step": 13497 - }, - { - "epoch": 0.35, - "learning_rate": 1.9620666941235778e-06, - "loss": 0.7543, - "step": 13498 - }, - { - "epoch": 0.35, - "learning_rate": 1.9620591448580506e-06, - "loss": 0.957, - "step": 13499 - }, - { - "epoch": 0.35, - "learning_rate": 1.962051594855919e-06, - "loss": 0.8799, - "step": 13500 - }, - { - "epoch": 0.35, - "learning_rate": 1.962044044117188e-06, - "loss": 0.7432, - "step": 13501 - }, - { - "epoch": 0.35, - "learning_rate": 1.962036492641865e-06, - "loss": 1.2236, - "step": 13502 - }, - { - "epoch": 0.35, - "learning_rate": 1.9620289404299543e-06, - "loss": 0.998, - "step": 13503 - }, - { - "epoch": 0.35, - "learning_rate": 1.9620213874814626e-06, - "loss": 0.9951, - "step": 13504 - }, - { - "epoch": 0.35, - "learning_rate": 1.9620138337963953e-06, - "loss": 0.8408, - "step": 13505 - }, - { - "epoch": 0.35, - "learning_rate": 1.962006279374758e-06, - "loss": 0.8223, - "step": 13506 - }, - { - "epoch": 0.35, - "learning_rate": 1.961998724216557e-06, - "loss": 0.8682, - "step": 13507 - }, - { - "epoch": 0.35, - "learning_rate": 1.9619911683217977e-06, - "loss": 0.7495, - "step": 13508 - }, - { - "epoch": 0.35, - "learning_rate": 1.9619836116904864e-06, - "loss": 0.8887, - "step": 13509 - }, - { - "epoch": 0.35, - "learning_rate": 1.961976054322628e-06, - "loss": 0.999, - "step": 13510 - }, - { - "epoch": 0.35, - "learning_rate": 1.961968496218229e-06, - "loss": 1.0137, - "step": 13511 - }, - { - "epoch": 0.35, - "learning_rate": 1.9619609373772944e-06, - "loss": 0.7275, - "step": 13512 - }, - { - "epoch": 0.35, - "learning_rate": 1.961953377799831e-06, - "loss": 0.7695, - "step": 13513 - }, - { - "epoch": 0.35, - "learning_rate": 1.9619458174858444e-06, - "loss": 0.5688, - "step": 13514 - }, - { - "epoch": 0.35, - "learning_rate": 1.96193825643534e-06, - "loss": 1.0205, - "step": 13515 - }, - { - "epoch": 0.35, - "learning_rate": 1.9619306946483232e-06, - "loss": 1.0654, - "step": 13516 - }, - { - "epoch": 0.35, - "learning_rate": 1.961923132124801e-06, - "loss": 0.7798, - "step": 13517 - }, - { - "epoch": 0.35, - "learning_rate": 1.961915568864778e-06, - "loss": 0.9521, - "step": 13518 - }, - { - "epoch": 0.35, - "learning_rate": 1.9619080048682605e-06, - "loss": 0.9072, - "step": 13519 - }, - { - "epoch": 0.35, - "learning_rate": 1.9619004401352543e-06, - "loss": 0.8291, - "step": 13520 - }, - { - "epoch": 0.35, - "learning_rate": 1.9618928746657654e-06, - "loss": 0.6948, - "step": 13521 - }, - { - "epoch": 0.35, - "learning_rate": 1.961885308459799e-06, - "loss": 0.9004, - "step": 13522 - }, - { - "epoch": 0.35, - "learning_rate": 1.9618777415173616e-06, - "loss": 0.7407, - "step": 13523 - }, - { - "epoch": 0.35, - "learning_rate": 1.9618701738384583e-06, - "loss": 0.9248, - "step": 13524 - }, - { - "epoch": 0.35, - "learning_rate": 1.9618626054230955e-06, - "loss": 0.8838, - "step": 13525 - }, - { - "epoch": 0.35, - "learning_rate": 1.9618550362712786e-06, - "loss": 1.0186, - "step": 13526 - }, - { - "epoch": 0.35, - "learning_rate": 1.9618474663830135e-06, - "loss": 0.7705, - "step": 13527 - }, - { - "epoch": 0.35, - "learning_rate": 1.961839895758306e-06, - "loss": 0.9209, - "step": 13528 - }, - { - "epoch": 0.35, - "learning_rate": 1.9618323243971623e-06, - "loss": 0.9707, - "step": 13529 - }, - { - "epoch": 0.35, - "learning_rate": 1.9618247522995875e-06, - "loss": 0.9326, - "step": 13530 - }, - { - "epoch": 0.35, - "learning_rate": 1.9618171794655875e-06, - "loss": 1.0781, - "step": 13531 - }, - { - "epoch": 0.35, - "learning_rate": 1.9618096058951686e-06, - "loss": 1.0439, - "step": 13532 - }, - { - "epoch": 0.35, - "learning_rate": 1.9618020315883362e-06, - "loss": 0.8193, - "step": 13533 - }, - { - "epoch": 0.35, - "learning_rate": 1.9617944565450964e-06, - "loss": 0.7607, - "step": 13534 - }, - { - "epoch": 0.35, - "learning_rate": 1.9617868807654546e-06, - "loss": 1.0244, - "step": 13535 - }, - { - "epoch": 0.35, - "learning_rate": 1.9617793042494172e-06, - "loss": 0.9502, - "step": 13536 - }, - { - "epoch": 0.35, - "learning_rate": 1.961771726996989e-06, - "loss": 0.7412, - "step": 13537 - }, - { - "epoch": 0.35, - "learning_rate": 1.9617641490081767e-06, - "loss": 0.7395, - "step": 13538 - }, - { - "epoch": 0.35, - "learning_rate": 1.961756570282986e-06, - "loss": 0.7756, - "step": 13539 - }, - { - "epoch": 0.35, - "learning_rate": 1.9617489908214223e-06, - "loss": 1.0156, - "step": 13540 - }, - { - "epoch": 0.35, - "learning_rate": 1.9617414106234915e-06, - "loss": 0.9395, - "step": 13541 - }, - { - "epoch": 0.35, - "learning_rate": 1.9617338296892e-06, - "loss": 0.9482, - "step": 13542 - }, - { - "epoch": 0.35, - "learning_rate": 1.9617262480185527e-06, - "loss": 0.9297, - "step": 13543 - }, - { - "epoch": 0.35, - "learning_rate": 1.9617186656115557e-06, - "loss": 0.7773, - "step": 13544 - }, - { - "epoch": 0.35, - "learning_rate": 1.9617110824682152e-06, - "loss": 0.9727, - "step": 13545 - }, - { - "epoch": 0.35, - "learning_rate": 1.9617034985885367e-06, - "loss": 0.7578, - "step": 13546 - }, - { - "epoch": 0.35, - "learning_rate": 1.961695913972526e-06, - "loss": 0.9844, - "step": 13547 - }, - { - "epoch": 0.35, - "learning_rate": 1.9616883286201893e-06, - "loss": 0.874, - "step": 13548 - }, - { - "epoch": 0.35, - "learning_rate": 1.9616807425315314e-06, - "loss": 1.0127, - "step": 13549 - }, - { - "epoch": 0.35, - "learning_rate": 1.9616731557065597e-06, - "loss": 0.918, - "step": 13550 - }, - { - "epoch": 0.35, - "learning_rate": 1.9616655681452783e-06, - "loss": 0.9214, - "step": 13551 - }, - { - "epoch": 0.35, - "learning_rate": 1.9616579798476944e-06, - "loss": 0.8257, - "step": 13552 - }, - { - "epoch": 0.35, - "learning_rate": 1.9616503908138123e-06, - "loss": 0.9404, - "step": 13553 - }, - { - "epoch": 0.35, - "learning_rate": 1.9616428010436397e-06, - "loss": 0.998, - "step": 13554 - }, - { - "epoch": 0.35, - "learning_rate": 1.9616352105371807e-06, - "loss": 0.6592, - "step": 13555 - }, - { - "epoch": 0.35, - "learning_rate": 1.961627619294442e-06, - "loss": 1.0283, - "step": 13556 - }, - { - "epoch": 0.35, - "learning_rate": 1.96162002731543e-06, - "loss": 0.9326, - "step": 13557 - }, - { - "epoch": 0.35, - "learning_rate": 1.9616124346001487e-06, - "loss": 0.9082, - "step": 13558 - }, - { - "epoch": 0.35, - "learning_rate": 1.9616048411486057e-06, - "loss": 0.9111, - "step": 13559 - }, - { - "epoch": 0.35, - "learning_rate": 1.961597246960806e-06, - "loss": 0.9053, - "step": 13560 - }, - { - "epoch": 0.35, - "learning_rate": 1.961589652036755e-06, - "loss": 0.7529, - "step": 13561 - }, - { - "epoch": 0.35, - "learning_rate": 1.9615820563764593e-06, - "loss": 0.9912, - "step": 13562 - }, - { - "epoch": 0.35, - "learning_rate": 1.9615744599799246e-06, - "loss": 0.9814, - "step": 13563 - }, - { - "epoch": 0.35, - "learning_rate": 1.961566862847156e-06, - "loss": 1.0938, - "step": 13564 - }, - { - "epoch": 0.35, - "learning_rate": 1.9615592649781605e-06, - "loss": 1.124, - "step": 13565 - }, - { - "epoch": 0.35, - "learning_rate": 1.961551666372943e-06, - "loss": 0.9404, - "step": 13566 - }, - { - "epoch": 0.35, - "learning_rate": 1.96154406703151e-06, - "loss": 0.8145, - "step": 13567 - }, - { - "epoch": 0.35, - "learning_rate": 1.9615364669538664e-06, - "loss": 0.9951, - "step": 13568 - }, - { - "epoch": 0.35, - "learning_rate": 1.961528866140019e-06, - "loss": 0.7407, - "step": 13569 - }, - { - "epoch": 0.35, - "learning_rate": 1.9615212645899727e-06, - "loss": 0.9902, - "step": 13570 - }, - { - "epoch": 0.35, - "learning_rate": 1.961513662303734e-06, - "loss": 1.04, - "step": 13571 - }, - { - "epoch": 0.35, - "learning_rate": 1.9615060592813084e-06, - "loss": 0.7183, - "step": 13572 - }, - { - "epoch": 0.35, - "learning_rate": 1.9614984555227017e-06, - "loss": 0.9746, - "step": 13573 - }, - { - "epoch": 0.35, - "learning_rate": 1.96149085102792e-06, - "loss": 0.9258, - "step": 13574 - }, - { - "epoch": 0.35, - "learning_rate": 1.9614832457969694e-06, - "loss": 0.9268, - "step": 13575 - }, - { - "epoch": 0.35, - "learning_rate": 1.9614756398298547e-06, - "loss": 0.8496, - "step": 13576 - }, - { - "epoch": 0.35, - "learning_rate": 1.9614680331265825e-06, - "loss": 0.7734, - "step": 13577 - }, - { - "epoch": 0.35, - "learning_rate": 1.9614604256871585e-06, - "loss": 0.8218, - "step": 13578 - }, - { - "epoch": 0.35, - "learning_rate": 1.9614528175115885e-06, - "loss": 0.9688, - "step": 13579 - }, - { - "epoch": 0.35, - "learning_rate": 1.961445208599878e-06, - "loss": 0.9951, - "step": 13580 - }, - { - "epoch": 0.35, - "learning_rate": 1.9614375989520335e-06, - "loss": 0.8467, - "step": 13581 - }, - { - "epoch": 0.35, - "learning_rate": 1.96142998856806e-06, - "loss": 0.9834, - "step": 13582 - }, - { - "epoch": 0.35, - "learning_rate": 1.961422377447964e-06, - "loss": 0.8359, - "step": 13583 - }, - { - "epoch": 0.35, - "learning_rate": 1.9614147655917513e-06, - "loss": 0.9297, - "step": 13584 - }, - { - "epoch": 0.35, - "learning_rate": 1.961407152999427e-06, - "loss": 1.0303, - "step": 13585 - }, - { - "epoch": 0.35, - "learning_rate": 1.961399539670998e-06, - "loss": 0.7236, - "step": 13586 - }, - { - "epoch": 0.35, - "learning_rate": 1.9613919256064695e-06, - "loss": 0.8838, - "step": 13587 - }, - { - "epoch": 0.35, - "learning_rate": 1.961384310805847e-06, - "loss": 0.7715, - "step": 13588 - }, - { - "epoch": 0.35, - "learning_rate": 1.961376695269137e-06, - "loss": 1.0625, - "step": 13589 - }, - { - "epoch": 0.35, - "learning_rate": 1.961369078996345e-06, - "loss": 0.9453, - "step": 13590 - }, - { - "epoch": 0.35, - "learning_rate": 1.961361461987477e-06, - "loss": 0.8555, - "step": 13591 - }, - { - "epoch": 0.35, - "learning_rate": 1.961353844242539e-06, - "loss": 0.8447, - "step": 13592 - }, - { - "epoch": 0.35, - "learning_rate": 1.961346225761536e-06, - "loss": 1.0195, - "step": 13593 - }, - { - "epoch": 0.35, - "learning_rate": 1.9613386065444747e-06, - "loss": 1.0762, - "step": 13594 - }, - { - "epoch": 0.35, - "learning_rate": 1.9613309865913604e-06, - "loss": 0.9014, - "step": 13595 - }, - { - "epoch": 0.35, - "learning_rate": 1.9613233659021995e-06, - "loss": 1.1543, - "step": 13596 - }, - { - "epoch": 0.35, - "learning_rate": 1.9613157444769974e-06, - "loss": 1.0, - "step": 13597 - }, - { - "epoch": 0.35, - "learning_rate": 1.96130812231576e-06, - "loss": 1.083, - "step": 13598 - }, - { - "epoch": 0.35, - "learning_rate": 1.961300499418493e-06, - "loss": 0.8877, - "step": 13599 - }, - { - "epoch": 0.35, - "learning_rate": 1.9612928757852028e-06, - "loss": 0.7822, - "step": 13600 - }, - { - "epoch": 0.35, - "learning_rate": 1.9612852514158946e-06, - "loss": 1.1025, - "step": 13601 - }, - { - "epoch": 0.35, - "learning_rate": 1.9612776263105745e-06, - "loss": 0.9014, - "step": 13602 - }, - { - "epoch": 0.35, - "learning_rate": 1.9612700004692484e-06, - "loss": 1.2051, - "step": 13603 - }, - { - "epoch": 0.35, - "learning_rate": 1.961262373891922e-06, - "loss": 1.0244, - "step": 13604 - }, - { - "epoch": 0.35, - "learning_rate": 1.961254746578601e-06, - "loss": 0.9893, - "step": 13605 - }, - { - "epoch": 0.35, - "learning_rate": 1.961247118529292e-06, - "loss": 0.9902, - "step": 13606 - }, - { - "epoch": 0.35, - "learning_rate": 1.961239489744e-06, - "loss": 0.9775, - "step": 13607 - }, - { - "epoch": 0.35, - "learning_rate": 1.9612318602227306e-06, - "loss": 0.7627, - "step": 13608 - }, - { - "epoch": 0.35, - "learning_rate": 1.9612242299654906e-06, - "loss": 0.8398, - "step": 13609 - }, - { - "epoch": 0.35, - "learning_rate": 1.9612165989722856e-06, - "loss": 0.9453, - "step": 13610 - }, - { - "epoch": 0.35, - "learning_rate": 1.9612089672431213e-06, - "loss": 1.125, - "step": 13611 - }, - { - "epoch": 0.35, - "learning_rate": 1.961201334778003e-06, - "loss": 0.9229, - "step": 13612 - }, - { - "epoch": 0.35, - "learning_rate": 1.961193701576937e-06, - "loss": 0.9531, - "step": 13613 - }, - { - "epoch": 0.35, - "learning_rate": 1.9611860676399295e-06, - "loss": 0.8691, - "step": 13614 - }, - { - "epoch": 0.35, - "learning_rate": 1.961178432966986e-06, - "loss": 0.7915, - "step": 13615 - }, - { - "epoch": 0.35, - "learning_rate": 1.9611707975581123e-06, - "loss": 0.9795, - "step": 13616 - }, - { - "epoch": 0.35, - "learning_rate": 1.9611631614133144e-06, - "loss": 0.709, - "step": 13617 - }, - { - "epoch": 0.35, - "learning_rate": 1.961155524532598e-06, - "loss": 0.7988, - "step": 13618 - }, - { - "epoch": 0.35, - "learning_rate": 1.961147886915969e-06, - "loss": 1.0127, - "step": 13619 - }, - { - "epoch": 0.35, - "learning_rate": 1.9611402485634337e-06, - "loss": 0.6426, - "step": 13620 - }, - { - "epoch": 0.35, - "learning_rate": 1.9611326094749968e-06, - "loss": 0.8535, - "step": 13621 - }, - { - "epoch": 0.35, - "learning_rate": 1.9611249696506653e-06, - "loss": 0.8711, - "step": 13622 - }, - { - "epoch": 0.35, - "learning_rate": 1.9611173290904443e-06, - "loss": 0.8389, - "step": 13623 - }, - { - "epoch": 0.35, - "learning_rate": 1.96110968779434e-06, - "loss": 0.6367, - "step": 13624 - }, - { - "epoch": 0.35, - "learning_rate": 1.9611020457623587e-06, - "loss": 0.5769, - "step": 13625 - }, - { - "epoch": 0.35, - "learning_rate": 1.961094402994505e-06, - "loss": 0.6895, - "step": 13626 - }, - { - "epoch": 0.35, - "learning_rate": 1.9610867594907862e-06, - "loss": 0.8818, - "step": 13627 - }, - { - "epoch": 0.35, - "learning_rate": 1.961079115251207e-06, - "loss": 0.873, - "step": 13628 - }, - { - "epoch": 0.35, - "learning_rate": 1.961071470275774e-06, - "loss": 0.9727, - "step": 13629 - }, - { - "epoch": 0.35, - "learning_rate": 1.9610638245644926e-06, - "loss": 0.9287, - "step": 13630 - }, - { - "epoch": 0.35, - "learning_rate": 1.961056178117369e-06, - "loss": 0.8096, - "step": 13631 - }, - { - "epoch": 0.35, - "learning_rate": 1.9610485309344086e-06, - "loss": 0.8955, - "step": 13632 - }, - { - "epoch": 0.35, - "learning_rate": 1.9610408830156177e-06, - "loss": 0.9243, - "step": 13633 - }, - { - "epoch": 0.35, - "learning_rate": 1.961033234361002e-06, - "loss": 1.1406, - "step": 13634 - }, - { - "epoch": 0.35, - "learning_rate": 1.961025584970567e-06, - "loss": 0.7974, - "step": 13635 - }, - { - "epoch": 0.35, - "learning_rate": 1.9610179348443195e-06, - "loss": 1.041, - "step": 13636 - }, - { - "epoch": 0.35, - "learning_rate": 1.9610102839822644e-06, - "loss": 1.0596, - "step": 13637 - }, - { - "epoch": 0.35, - "learning_rate": 1.961002632384408e-06, - "loss": 0.8848, - "step": 13638 - }, - { - "epoch": 0.35, - "learning_rate": 1.960994980050756e-06, - "loss": 1.1914, - "step": 13639 - }, - { - "epoch": 0.35, - "learning_rate": 1.9609873269813143e-06, - "loss": 0.707, - "step": 13640 - }, - { - "epoch": 0.35, - "learning_rate": 1.9609796731760886e-06, - "loss": 1.0303, - "step": 13641 - }, - { - "epoch": 0.35, - "learning_rate": 1.9609720186350853e-06, - "loss": 0.7241, - "step": 13642 - }, - { - "epoch": 0.35, - "learning_rate": 1.96096436335831e-06, - "loss": 0.9883, - "step": 13643 - }, - { - "epoch": 0.35, - "learning_rate": 1.9609567073457683e-06, - "loss": 1.1582, - "step": 13644 - }, - { - "epoch": 0.35, - "learning_rate": 1.960949050597466e-06, - "loss": 0.8828, - "step": 13645 - }, - { - "epoch": 0.35, - "learning_rate": 1.9609413931134095e-06, - "loss": 0.8164, - "step": 13646 - }, - { - "epoch": 0.35, - "learning_rate": 1.9609337348936044e-06, - "loss": 0.877, - "step": 13647 - }, - { - "epoch": 0.35, - "learning_rate": 1.9609260759380564e-06, - "loss": 0.8408, - "step": 13648 - }, - { - "epoch": 0.35, - "learning_rate": 1.9609184162467712e-06, - "loss": 0.7529, - "step": 13649 - }, - { - "epoch": 0.35, - "learning_rate": 1.9609107558197554e-06, - "loss": 1.0127, - "step": 13650 - }, - { - "epoch": 0.35, - "learning_rate": 1.9609030946570144e-06, - "loss": 0.8442, - "step": 13651 - }, - { - "epoch": 0.35, - "learning_rate": 1.9608954327585537e-06, - "loss": 0.7554, - "step": 13652 - }, - { - "epoch": 0.35, - "learning_rate": 1.9608877701243796e-06, - "loss": 1.0215, - "step": 13653 - }, - { - "epoch": 0.35, - "learning_rate": 1.9608801067544986e-06, - "loss": 1.0059, - "step": 13654 - }, - { - "epoch": 0.35, - "learning_rate": 1.9608724426489152e-06, - "loss": 0.8574, - "step": 13655 - }, - { - "epoch": 0.35, - "learning_rate": 1.9608647778076363e-06, - "loss": 0.8442, - "step": 13656 - }, - { - "epoch": 0.35, - "learning_rate": 1.960857112230667e-06, - "loss": 0.9834, - "step": 13657 - }, - { - "epoch": 0.35, - "learning_rate": 1.960849445918014e-06, - "loss": 0.9814, - "step": 13658 - }, - { - "epoch": 0.35, - "learning_rate": 1.9608417788696827e-06, - "loss": 0.8809, - "step": 13659 - }, - { - "epoch": 0.35, - "learning_rate": 1.960834111085679e-06, - "loss": 0.9009, - "step": 13660 - }, - { - "epoch": 0.35, - "learning_rate": 1.9608264425660085e-06, - "loss": 0.9062, - "step": 13661 - }, - { - "epoch": 0.35, - "learning_rate": 1.960818773310678e-06, - "loss": 0.9287, - "step": 13662 - }, - { - "epoch": 0.35, - "learning_rate": 1.9608111033196923e-06, - "loss": 0.8486, - "step": 13663 - }, - { - "epoch": 0.35, - "learning_rate": 1.9608034325930574e-06, - "loss": 0.731, - "step": 13664 - }, - { - "epoch": 0.35, - "learning_rate": 1.9607957611307803e-06, - "loss": 0.9092, - "step": 13665 - }, - { - "epoch": 0.35, - "learning_rate": 1.9607880889328653e-06, - "loss": 0.8145, - "step": 13666 - }, - { - "epoch": 0.35, - "learning_rate": 1.9607804159993194e-06, - "loss": 0.9648, - "step": 13667 - }, - { - "epoch": 0.35, - "learning_rate": 1.9607727423301484e-06, - "loss": 0.9863, - "step": 13668 - }, - { - "epoch": 0.35, - "learning_rate": 1.9607650679253576e-06, - "loss": 0.9307, - "step": 13669 - }, - { - "epoch": 0.35, - "learning_rate": 1.960757392784953e-06, - "loss": 0.8916, - "step": 13670 - }, - { - "epoch": 0.35, - "learning_rate": 1.960749716908941e-06, - "loss": 0.7764, - "step": 13671 - }, - { - "epoch": 0.35, - "learning_rate": 1.9607420402973265e-06, - "loss": 0.6411, - "step": 13672 - }, - { - "epoch": 0.35, - "learning_rate": 1.9607343629501165e-06, - "loss": 0.8379, - "step": 13673 - }, - { - "epoch": 0.35, - "learning_rate": 1.9607266848673164e-06, - "loss": 0.7837, - "step": 13674 - }, - { - "epoch": 0.35, - "learning_rate": 1.960719006048932e-06, - "loss": 0.9541, - "step": 13675 - }, - { - "epoch": 0.35, - "learning_rate": 1.960711326494969e-06, - "loss": 0.6724, - "step": 13676 - }, - { - "epoch": 0.35, - "learning_rate": 1.9607036462054335e-06, - "loss": 0.8296, - "step": 13677 - }, - { - "epoch": 0.35, - "learning_rate": 1.960695965180332e-06, - "loss": 0.7871, - "step": 13678 - }, - { - "epoch": 0.35, - "learning_rate": 1.9606882834196693e-06, - "loss": 0.8994, - "step": 13679 - }, - { - "epoch": 0.35, - "learning_rate": 1.960680600923452e-06, - "loss": 0.8145, - "step": 13680 - }, - { - "epoch": 0.35, - "learning_rate": 1.960672917691685e-06, - "loss": 0.8662, - "step": 13681 - }, - { - "epoch": 0.35, - "learning_rate": 1.9606652337243755e-06, - "loss": 0.9395, - "step": 13682 - }, - { - "epoch": 0.35, - "learning_rate": 1.960657549021529e-06, - "loss": 0.8018, - "step": 13683 - }, - { - "epoch": 0.35, - "learning_rate": 1.960649863583151e-06, - "loss": 0.959, - "step": 13684 - }, - { - "epoch": 0.35, - "learning_rate": 1.9606421774092473e-06, - "loss": 0.7344, - "step": 13685 - }, - { - "epoch": 0.35, - "learning_rate": 1.9606344904998243e-06, - "loss": 0.6802, - "step": 13686 - }, - { - "epoch": 0.35, - "learning_rate": 1.9606268028548874e-06, - "loss": 1.0234, - "step": 13687 - }, - { - "epoch": 0.35, - "learning_rate": 1.960619114474443e-06, - "loss": 0.8267, - "step": 13688 - }, - { - "epoch": 0.35, - "learning_rate": 1.9606114253584967e-06, - "loss": 0.8525, - "step": 13689 - }, - { - "epoch": 0.35, - "learning_rate": 1.9606037355070547e-06, - "loss": 0.9072, - "step": 13690 - }, - { - "epoch": 0.35, - "learning_rate": 1.960596044920122e-06, - "loss": 1.0977, - "step": 13691 - }, - { - "epoch": 0.35, - "learning_rate": 1.9605883535977053e-06, - "loss": 0.6934, - "step": 13692 - }, - { - "epoch": 0.35, - "learning_rate": 1.9605806615398102e-06, - "loss": 0.9346, - "step": 13693 - }, - { - "epoch": 0.35, - "learning_rate": 1.960572968746443e-06, - "loss": 0.8906, - "step": 13694 - }, - { - "epoch": 0.35, - "learning_rate": 1.960565275217609e-06, - "loss": 1.0127, - "step": 13695 - }, - { - "epoch": 0.35, - "learning_rate": 1.960557580953314e-06, - "loss": 1.0439, - "step": 13696 - }, - { - "epoch": 0.35, - "learning_rate": 1.960549885953565e-06, - "loss": 0.9121, - "step": 13697 - }, - { - "epoch": 0.35, - "learning_rate": 1.9605421902183664e-06, - "loss": 0.7959, - "step": 13698 - }, - { - "epoch": 0.35, - "learning_rate": 1.960534493747725e-06, - "loss": 0.6616, - "step": 13699 - }, - { - "epoch": 0.35, - "learning_rate": 1.9605267965416466e-06, - "loss": 0.8345, - "step": 13700 - }, - { - "epoch": 0.35, - "learning_rate": 1.960519098600137e-06, - "loss": 1.124, - "step": 13701 - }, - { - "epoch": 0.35, - "learning_rate": 1.960511399923202e-06, - "loss": 0.9268, - "step": 13702 - }, - { - "epoch": 0.35, - "learning_rate": 1.9605037005108477e-06, - "loss": 0.7529, - "step": 13703 - }, - { - "epoch": 0.35, - "learning_rate": 1.96049600036308e-06, - "loss": 0.9277, - "step": 13704 - }, - { - "epoch": 0.35, - "learning_rate": 1.9604882994799044e-06, - "loss": 0.9668, - "step": 13705 - }, - { - "epoch": 0.35, - "learning_rate": 1.9604805978613274e-06, - "loss": 0.9785, - "step": 13706 - }, - { - "epoch": 0.35, - "learning_rate": 1.9604728955073543e-06, - "loss": 0.8506, - "step": 13707 - }, - { - "epoch": 0.35, - "learning_rate": 1.9604651924179913e-06, - "loss": 0.6016, - "step": 13708 - }, - { - "epoch": 0.35, - "learning_rate": 1.960457488593244e-06, - "loss": 0.7788, - "step": 13709 - }, - { - "epoch": 0.35, - "learning_rate": 1.9604497840331195e-06, - "loss": 0.6895, - "step": 13710 - }, - { - "epoch": 0.35, - "learning_rate": 1.9604420787376216e-06, - "loss": 1.042, - "step": 13711 - }, - { - "epoch": 0.35, - "learning_rate": 1.960434372706758e-06, - "loss": 0.9023, - "step": 13712 - }, - { - "epoch": 0.35, - "learning_rate": 1.960426665940534e-06, - "loss": 0.8477, - "step": 13713 - }, - { - "epoch": 0.35, - "learning_rate": 1.9604189584389556e-06, - "loss": 0.8066, - "step": 13714 - }, - { - "epoch": 0.35, - "learning_rate": 1.960411250202028e-06, - "loss": 0.9062, - "step": 13715 - }, - { - "epoch": 0.35, - "learning_rate": 1.960403541229758e-06, - "loss": 0.9561, - "step": 13716 - }, - { - "epoch": 0.35, - "learning_rate": 1.960395831522151e-06, - "loss": 0.998, - "step": 13717 - }, - { - "epoch": 0.35, - "learning_rate": 1.960388121079213e-06, - "loss": 1.1309, - "step": 13718 - }, - { - "epoch": 0.35, - "learning_rate": 1.9603804099009503e-06, - "loss": 0.9277, - "step": 13719 - }, - { - "epoch": 0.35, - "learning_rate": 1.9603726979873684e-06, - "loss": 1.1289, - "step": 13720 - }, - { - "epoch": 0.35, - "learning_rate": 1.9603649853384734e-06, - "loss": 1.0049, - "step": 13721 - }, - { - "epoch": 0.35, - "learning_rate": 1.9603572719542707e-06, - "loss": 0.6719, - "step": 13722 - }, - { - "epoch": 0.35, - "learning_rate": 1.9603495578347673e-06, - "loss": 0.8647, - "step": 13723 - }, - { - "epoch": 0.35, - "learning_rate": 1.9603418429799676e-06, - "loss": 1.0605, - "step": 13724 - }, - { - "epoch": 0.35, - "learning_rate": 1.9603341273898786e-06, - "loss": 0.918, - "step": 13725 - }, - { - "epoch": 0.35, - "learning_rate": 1.960326411064506e-06, - "loss": 0.9868, - "step": 13726 - }, - { - "epoch": 0.35, - "learning_rate": 1.9603186940038556e-06, - "loss": 0.8623, - "step": 13727 - }, - { - "epoch": 0.35, - "learning_rate": 1.960310976207933e-06, - "loss": 0.9141, - "step": 13728 - }, - { - "epoch": 0.35, - "learning_rate": 1.960303257676745e-06, - "loss": 0.627, - "step": 13729 - }, - { - "epoch": 0.35, - "learning_rate": 1.9602955384102966e-06, - "loss": 0.9531, - "step": 13730 - }, - { - "epoch": 0.35, - "learning_rate": 1.960287818408594e-06, - "loss": 0.918, - "step": 13731 - }, - { - "epoch": 0.35, - "learning_rate": 1.9602800976716436e-06, - "loss": 0.9717, - "step": 13732 - }, - { - "epoch": 0.35, - "learning_rate": 1.9602723761994503e-06, - "loss": 0.8467, - "step": 13733 - }, - { - "epoch": 0.35, - "learning_rate": 1.960264653992021e-06, - "loss": 0.6885, - "step": 13734 - }, - { - "epoch": 0.35, - "learning_rate": 1.960256931049361e-06, - "loss": 0.7534, - "step": 13735 - }, - { - "epoch": 0.35, - "learning_rate": 1.960249207371477e-06, - "loss": 0.8809, - "step": 13736 - }, - { - "epoch": 0.35, - "learning_rate": 1.9602414829583735e-06, - "loss": 0.9121, - "step": 13737 - }, - { - "epoch": 0.35, - "learning_rate": 1.9602337578100577e-06, - "loss": 0.8633, - "step": 13738 - }, - { - "epoch": 0.35, - "learning_rate": 1.960226031926535e-06, - "loss": 0.7759, - "step": 13739 - }, - { - "epoch": 0.35, - "learning_rate": 1.9602183053078115e-06, - "loss": 0.7, - "step": 13740 - }, - { - "epoch": 0.35, - "learning_rate": 1.9602105779538925e-06, - "loss": 0.6655, - "step": 13741 - }, - { - "epoch": 0.35, - "learning_rate": 1.960202849864785e-06, - "loss": 0.7451, - "step": 13742 - }, - { - "epoch": 0.35, - "learning_rate": 1.960195121040494e-06, - "loss": 0.9395, - "step": 13743 - }, - { - "epoch": 0.35, - "learning_rate": 1.960187391481026e-06, - "loss": 0.8672, - "step": 13744 - }, - { - "epoch": 0.35, - "learning_rate": 1.9601796611863867e-06, - "loss": 0.9111, - "step": 13745 - }, - { - "epoch": 0.35, - "learning_rate": 1.9601719301565816e-06, - "loss": 0.7715, - "step": 13746 - }, - { - "epoch": 0.35, - "learning_rate": 1.9601641983916175e-06, - "loss": 1.083, - "step": 13747 - }, - { - "epoch": 0.35, - "learning_rate": 1.9601564658914995e-06, - "loss": 0.7773, - "step": 13748 - }, - { - "epoch": 0.35, - "learning_rate": 1.9601487326562335e-06, - "loss": 0.7158, - "step": 13749 - }, - { - "epoch": 0.35, - "learning_rate": 1.9601409986858264e-06, - "loss": 0.6836, - "step": 13750 - }, - { - "epoch": 0.35, - "learning_rate": 1.9601332639802832e-06, - "loss": 0.8154, - "step": 13751 - }, - { - "epoch": 0.35, - "learning_rate": 1.96012552853961e-06, - "loss": 0.8848, - "step": 13752 - }, - { - "epoch": 0.35, - "learning_rate": 1.960117792363813e-06, - "loss": 0.9326, - "step": 13753 - }, - { - "epoch": 0.35, - "learning_rate": 1.960110055452898e-06, - "loss": 0.8652, - "step": 13754 - }, - { - "epoch": 0.35, - "learning_rate": 1.9601023178068704e-06, - "loss": 0.915, - "step": 13755 - }, - { - "epoch": 0.35, - "learning_rate": 1.9600945794257374e-06, - "loss": 0.9902, - "step": 13756 - }, - { - "epoch": 0.35, - "learning_rate": 1.9600868403095035e-06, - "loss": 1.0557, - "step": 13757 - }, - { - "epoch": 0.35, - "learning_rate": 1.9600791004581755e-06, - "loss": 0.8672, - "step": 13758 - }, - { - "epoch": 0.35, - "learning_rate": 1.960071359871759e-06, - "loss": 0.9688, - "step": 13759 - }, - { - "epoch": 0.35, - "learning_rate": 1.96006361855026e-06, - "loss": 1.002, - "step": 13760 - }, - { - "epoch": 0.35, - "learning_rate": 1.960055876493685e-06, - "loss": 1.082, - "step": 13761 - }, - { - "epoch": 0.35, - "learning_rate": 1.9600481337020386e-06, - "loss": 0.9951, - "step": 13762 - }, - { - "epoch": 0.35, - "learning_rate": 1.960040390175328e-06, - "loss": 0.6831, - "step": 13763 - }, - { - "epoch": 0.35, - "learning_rate": 1.960032645913558e-06, - "loss": 0.6016, - "step": 13764 - }, - { - "epoch": 0.35, - "learning_rate": 1.9600249009167357e-06, - "loss": 0.6465, - "step": 13765 - }, - { - "epoch": 0.35, - "learning_rate": 1.9600171551848657e-06, - "loss": 0.7819, - "step": 13766 - }, - { - "epoch": 0.35, - "learning_rate": 1.960009408717956e-06, - "loss": 0.8428, - "step": 13767 - }, - { - "epoch": 0.35, - "learning_rate": 1.96000166151601e-06, - "loss": 0.918, - "step": 13768 - }, - { - "epoch": 0.35, - "learning_rate": 1.9599939135790357e-06, - "loss": 0.7969, - "step": 13769 - }, - { - "epoch": 0.35, - "learning_rate": 1.9599861649070377e-06, - "loss": 0.9424, - "step": 13770 - }, - { - "epoch": 0.35, - "learning_rate": 1.9599784155000226e-06, - "loss": 0.8291, - "step": 13771 - }, - { - "epoch": 0.35, - "learning_rate": 1.959970665357996e-06, - "loss": 0.9395, - "step": 13772 - }, - { - "epoch": 0.35, - "learning_rate": 1.9599629144809646e-06, - "loss": 1.0439, - "step": 13773 - }, - { - "epoch": 0.35, - "learning_rate": 1.959955162868933e-06, - "loss": 1.1465, - "step": 13774 - }, - { - "epoch": 0.35, - "learning_rate": 1.9599474105219086e-06, - "loss": 0.8057, - "step": 13775 - }, - { - "epoch": 0.35, - "learning_rate": 1.9599396574398962e-06, - "loss": 0.832, - "step": 13776 - }, - { - "epoch": 0.35, - "learning_rate": 1.959931903622902e-06, - "loss": 1.1562, - "step": 13777 - }, - { - "epoch": 0.35, - "learning_rate": 1.959924149070932e-06, - "loss": 0.8008, - "step": 13778 - }, - { - "epoch": 0.35, - "learning_rate": 1.9599163937839927e-06, - "loss": 1.0195, - "step": 13779 - }, - { - "epoch": 0.35, - "learning_rate": 1.959908637762089e-06, - "loss": 1.1787, - "step": 13780 - }, - { - "epoch": 0.35, - "learning_rate": 1.959900881005228e-06, - "loss": 0.8965, - "step": 13781 - }, - { - "epoch": 0.35, - "learning_rate": 1.9598931235134144e-06, - "loss": 0.7617, - "step": 13782 - }, - { - "epoch": 0.35, - "learning_rate": 1.9598853652866552e-06, - "loss": 0.7666, - "step": 13783 - }, - { - "epoch": 0.35, - "learning_rate": 1.959877606324956e-06, - "loss": 1.2031, - "step": 13784 - }, - { - "epoch": 0.35, - "learning_rate": 1.9598698466283224e-06, - "loss": 1.0449, - "step": 13785 - }, - { - "epoch": 0.35, - "learning_rate": 1.9598620861967606e-06, - "loss": 0.8115, - "step": 13786 - }, - { - "epoch": 0.35, - "learning_rate": 1.9598543250302766e-06, - "loss": 1.0537, - "step": 13787 - }, - { - "epoch": 0.35, - "learning_rate": 1.9598465631288764e-06, - "loss": 0.9814, - "step": 13788 - }, - { - "epoch": 0.35, - "learning_rate": 1.9598388004925657e-06, - "loss": 0.9062, - "step": 13789 - }, - { - "epoch": 0.35, - "learning_rate": 1.9598310371213507e-06, - "loss": 0.8418, - "step": 13790 - }, - { - "epoch": 0.35, - "learning_rate": 1.9598232730152367e-06, - "loss": 0.8623, - "step": 13791 - }, - { - "epoch": 0.35, - "learning_rate": 1.959815508174231e-06, - "loss": 0.9082, - "step": 13792 - }, - { - "epoch": 0.35, - "learning_rate": 1.959807742598338e-06, - "loss": 1.1201, - "step": 13793 - }, - { - "epoch": 0.35, - "learning_rate": 1.9597999762875645e-06, - "loss": 0.8438, - "step": 13794 - }, - { - "epoch": 0.35, - "learning_rate": 1.9597922092419163e-06, - "loss": 0.9854, - "step": 13795 - }, - { - "epoch": 0.35, - "learning_rate": 1.9597844414613997e-06, - "loss": 0.8984, - "step": 13796 - }, - { - "epoch": 0.35, - "learning_rate": 1.9597766729460197e-06, - "loss": 0.4937, - "step": 13797 - }, - { - "epoch": 0.35, - "learning_rate": 1.959768903695783e-06, - "loss": 0.916, - "step": 13798 - }, - { - "epoch": 0.35, - "learning_rate": 1.9597611337106956e-06, - "loss": 0.7285, - "step": 13799 - }, - { - "epoch": 0.35, - "learning_rate": 1.9597533629907633e-06, - "loss": 0.8516, - "step": 13800 - }, - { - "epoch": 0.35, - "learning_rate": 1.959745591535992e-06, - "loss": 0.9683, - "step": 13801 - }, - { - "epoch": 0.35, - "learning_rate": 1.959737819346387e-06, - "loss": 0.8389, - "step": 13802 - }, - { - "epoch": 0.35, - "learning_rate": 1.9597300464219554e-06, - "loss": 0.8074, - "step": 13803 - }, - { - "epoch": 0.35, - "learning_rate": 1.9597222727627027e-06, - "loss": 0.6816, - "step": 13804 - }, - { - "epoch": 0.35, - "learning_rate": 1.9597144983686346e-06, - "loss": 0.7695, - "step": 13805 - }, - { - "epoch": 0.35, - "learning_rate": 1.9597067232397573e-06, - "loss": 0.6978, - "step": 13806 - }, - { - "epoch": 0.35, - "learning_rate": 1.9596989473760764e-06, - "loss": 0.9023, - "step": 13807 - }, - { - "epoch": 0.35, - "learning_rate": 1.9596911707775987e-06, - "loss": 0.9912, - "step": 13808 - }, - { - "epoch": 0.35, - "learning_rate": 1.959683393444329e-06, - "loss": 1.1367, - "step": 13809 - }, - { - "epoch": 0.35, - "learning_rate": 1.9596756153762747e-06, - "loss": 0.665, - "step": 13810 - }, - { - "epoch": 0.35, - "learning_rate": 1.9596678365734403e-06, - "loss": 1.0068, - "step": 13811 - }, - { - "epoch": 0.35, - "learning_rate": 1.9596600570358324e-06, - "loss": 0.8994, - "step": 13812 - }, - { - "epoch": 0.35, - "learning_rate": 1.9596522767634568e-06, - "loss": 0.71, - "step": 13813 - }, - { - "epoch": 0.35, - "learning_rate": 1.95964449575632e-06, - "loss": 0.7754, - "step": 13814 - }, - { - "epoch": 0.35, - "learning_rate": 1.9596367140144273e-06, - "loss": 0.915, - "step": 13815 - }, - { - "epoch": 0.35, - "learning_rate": 1.9596289315377845e-06, - "loss": 0.7861, - "step": 13816 - }, - { - "epoch": 0.35, - "learning_rate": 1.9596211483263985e-06, - "loss": 0.876, - "step": 13817 - }, - { - "epoch": 0.35, - "learning_rate": 1.959613364380274e-06, - "loss": 0.6665, - "step": 13818 - }, - { - "epoch": 0.35, - "learning_rate": 1.9596055796994187e-06, - "loss": 1.0117, - "step": 13819 - }, - { - "epoch": 0.35, - "learning_rate": 1.959597794283837e-06, - "loss": 1.1328, - "step": 13820 - }, - { - "epoch": 0.35, - "learning_rate": 1.9595900081335356e-06, - "loss": 0.8379, - "step": 13821 - }, - { - "epoch": 0.35, - "learning_rate": 1.95958222124852e-06, - "loss": 0.958, - "step": 13822 - }, - { - "epoch": 0.35, - "learning_rate": 1.9595744336287963e-06, - "loss": 0.9307, - "step": 13823 - }, - { - "epoch": 0.35, - "learning_rate": 1.9595666452743708e-06, - "loss": 1.2324, - "step": 13824 - }, - { - "epoch": 0.35, - "learning_rate": 1.959558856185249e-06, - "loss": 0.8701, - "step": 13825 - }, - { - "epoch": 0.35, - "learning_rate": 1.9595510663614374e-06, - "loss": 0.7192, - "step": 13826 - }, - { - "epoch": 0.35, - "learning_rate": 1.959543275802942e-06, - "loss": 0.9102, - "step": 13827 - }, - { - "epoch": 0.35, - "learning_rate": 1.959535484509768e-06, - "loss": 0.8779, - "step": 13828 - }, - { - "epoch": 0.35, - "learning_rate": 1.9595276924819216e-06, - "loss": 0.9346, - "step": 13829 - }, - { - "epoch": 0.35, - "learning_rate": 1.959519899719409e-06, - "loss": 0.8936, - "step": 13830 - }, - { - "epoch": 0.35, - "learning_rate": 1.9595121062222366e-06, - "loss": 0.8345, - "step": 13831 - }, - { - "epoch": 0.35, - "learning_rate": 1.95950431199041e-06, - "loss": 0.771, - "step": 13832 - }, - { - "epoch": 0.35, - "learning_rate": 1.959496517023934e-06, - "loss": 0.9609, - "step": 13833 - }, - { - "epoch": 0.35, - "learning_rate": 1.9594887213228166e-06, - "loss": 0.7471, - "step": 13834 - }, - { - "epoch": 0.35, - "learning_rate": 1.9594809248870623e-06, - "loss": 0.8584, - "step": 13835 - }, - { - "epoch": 0.35, - "learning_rate": 1.959473127716678e-06, - "loss": 0.9238, - "step": 13836 - }, - { - "epoch": 0.35, - "learning_rate": 1.9594653298116693e-06, - "loss": 0.8184, - "step": 13837 - }, - { - "epoch": 0.35, - "learning_rate": 1.959457531172042e-06, - "loss": 0.8672, - "step": 13838 - }, - { - "epoch": 0.35, - "learning_rate": 1.9594497317978016e-06, - "loss": 1.0391, - "step": 13839 - }, - { - "epoch": 0.35, - "learning_rate": 1.9594419316889554e-06, - "loss": 1.1914, - "step": 13840 - }, - { - "epoch": 0.35, - "learning_rate": 1.959434130845508e-06, - "loss": 0.8877, - "step": 13841 - }, - { - "epoch": 0.35, - "learning_rate": 1.9594263292674667e-06, - "loss": 0.9629, - "step": 13842 - }, - { - "epoch": 0.35, - "learning_rate": 1.9594185269548364e-06, - "loss": 1.0352, - "step": 13843 - }, - { - "epoch": 0.35, - "learning_rate": 1.959410723907623e-06, - "loss": 0.5269, - "step": 13844 - }, - { - "epoch": 0.35, - "learning_rate": 1.9594029201258338e-06, - "loss": 1.123, - "step": 13845 - }, - { - "epoch": 0.35, - "learning_rate": 1.9593951156094732e-06, - "loss": 0.9004, - "step": 13846 - }, - { - "epoch": 0.35, - "learning_rate": 1.9593873103585484e-06, - "loss": 0.9976, - "step": 13847 - }, - { - "epoch": 0.35, - "learning_rate": 1.9593795043730647e-06, - "loss": 0.9346, - "step": 13848 - }, - { - "epoch": 0.35, - "learning_rate": 1.959371697653028e-06, - "loss": 0.9355, - "step": 13849 - }, - { - "epoch": 0.35, - "learning_rate": 1.9593638901984445e-06, - "loss": 0.7612, - "step": 13850 - }, - { - "epoch": 0.36, - "learning_rate": 1.9593560820093203e-06, - "loss": 0.8975, - "step": 13851 - }, - { - "epoch": 0.36, - "learning_rate": 1.9593482730856614e-06, - "loss": 0.8496, - "step": 13852 - }, - { - "epoch": 0.36, - "learning_rate": 1.9593404634274733e-06, - "loss": 0.7382, - "step": 13853 - }, - { - "epoch": 0.36, - "learning_rate": 1.959332653034763e-06, - "loss": 0.8887, - "step": 13854 - }, - { - "epoch": 0.36, - "learning_rate": 1.959324841907535e-06, - "loss": 0.7725, - "step": 13855 - }, - { - "epoch": 0.36, - "learning_rate": 1.9593170300457963e-06, - "loss": 1.0381, - "step": 13856 - }, - { - "epoch": 0.36, - "learning_rate": 1.9593092174495533e-06, - "loss": 0.957, - "step": 13857 - }, - { - "epoch": 0.36, - "learning_rate": 1.9593014041188104e-06, - "loss": 0.7656, - "step": 13858 - }, - { - "epoch": 0.36, - "learning_rate": 1.959293590053575e-06, - "loss": 0.79, - "step": 13859 - }, - { - "epoch": 0.36, - "learning_rate": 1.9592857752538526e-06, - "loss": 0.9521, - "step": 13860 - }, - { - "epoch": 0.36, - "learning_rate": 1.959277959719649e-06, - "loss": 0.7637, - "step": 13861 - }, - { - "epoch": 0.36, - "learning_rate": 1.9592701434509708e-06, - "loss": 0.8411, - "step": 13862 - }, - { - "epoch": 0.36, - "learning_rate": 1.9592623264478233e-06, - "loss": 0.8223, - "step": 13863 - }, - { - "epoch": 0.36, - "learning_rate": 1.9592545087102127e-06, - "loss": 0.9453, - "step": 13864 - }, - { - "epoch": 0.36, - "learning_rate": 1.959246690238145e-06, - "loss": 0.9814, - "step": 13865 - }, - { - "epoch": 0.36, - "learning_rate": 1.9592388710316264e-06, - "loss": 0.6138, - "step": 13866 - }, - { - "epoch": 0.36, - "learning_rate": 1.9592310510906625e-06, - "loss": 0.9551, - "step": 13867 - }, - { - "epoch": 0.36, - "learning_rate": 1.959223230415259e-06, - "loss": 0.7119, - "step": 13868 - }, - { - "epoch": 0.36, - "learning_rate": 1.9592154090054237e-06, - "loss": 0.9756, - "step": 13869 - }, - { - "epoch": 0.36, - "learning_rate": 1.95920758686116e-06, - "loss": 0.6836, - "step": 13870 - }, - { - "epoch": 0.36, - "learning_rate": 1.959199763982476e-06, - "loss": 0.9165, - "step": 13871 - }, - { - "epoch": 0.36, - "learning_rate": 1.9591919403693765e-06, - "loss": 0.7842, - "step": 13872 - }, - { - "epoch": 0.36, - "learning_rate": 1.9591841160218676e-06, - "loss": 0.6294, - "step": 13873 - }, - { - "epoch": 0.36, - "learning_rate": 1.959176290939956e-06, - "loss": 0.7451, - "step": 13874 - }, - { - "epoch": 0.36, - "learning_rate": 1.959168465123647e-06, - "loss": 0.8564, - "step": 13875 - }, - { - "epoch": 0.36, - "learning_rate": 1.9591606385729466e-06, - "loss": 0.9365, - "step": 13876 - }, - { - "epoch": 0.36, - "learning_rate": 1.9591528112878614e-06, - "loss": 0.9297, - "step": 13877 - }, - { - "epoch": 0.36, - "learning_rate": 1.9591449832683966e-06, - "loss": 0.9277, - "step": 13878 - }, - { - "epoch": 0.36, - "learning_rate": 1.959137154514559e-06, - "loss": 0.8433, - "step": 13879 - }, - { - "epoch": 0.36, - "learning_rate": 1.959129325026354e-06, - "loss": 0.9863, - "step": 13880 - }, - { - "epoch": 0.36, - "learning_rate": 1.959121494803788e-06, - "loss": 0.9922, - "step": 13881 - }, - { - "epoch": 0.36, - "learning_rate": 1.9591136638468662e-06, - "loss": 0.8623, - "step": 13882 - }, - { - "epoch": 0.36, - "learning_rate": 1.9591058321555957e-06, - "loss": 0.8867, - "step": 13883 - }, - { - "epoch": 0.36, - "learning_rate": 1.9590979997299815e-06, - "loss": 0.9883, - "step": 13884 - }, - { - "epoch": 0.36, - "learning_rate": 1.9590901665700304e-06, - "loss": 0.8633, - "step": 13885 - }, - { - "epoch": 0.36, - "learning_rate": 1.959082332675748e-06, - "loss": 0.8789, - "step": 13886 - }, - { - "epoch": 0.36, - "learning_rate": 1.9590744980471404e-06, - "loss": 0.957, - "step": 13887 - }, - { - "epoch": 0.36, - "learning_rate": 1.9590666626842133e-06, - "loss": 0.96, - "step": 13888 - }, - { - "epoch": 0.36, - "learning_rate": 1.959058826586973e-06, - "loss": 0.6309, - "step": 13889 - }, - { - "epoch": 0.36, - "learning_rate": 1.959050989755426e-06, - "loss": 1.0625, - "step": 13890 - }, - { - "epoch": 0.36, - "learning_rate": 1.959043152189577e-06, - "loss": 1.1113, - "step": 13891 - }, - { - "epoch": 0.36, - "learning_rate": 1.959035313889433e-06, - "loss": 0.8184, - "step": 13892 - }, - { - "epoch": 0.36, - "learning_rate": 1.9590274748550003e-06, - "loss": 0.708, - "step": 13893 - }, - { - "epoch": 0.36, - "learning_rate": 1.959019635086284e-06, - "loss": 0.7344, - "step": 13894 - }, - { - "epoch": 0.36, - "learning_rate": 1.95901179458329e-06, - "loss": 0.9521, - "step": 13895 - }, - { - "epoch": 0.36, - "learning_rate": 1.9590039533460253e-06, - "loss": 0.8799, - "step": 13896 - }, - { - "epoch": 0.36, - "learning_rate": 1.9589961113744955e-06, - "loss": 0.9717, - "step": 13897 - }, - { - "epoch": 0.36, - "learning_rate": 1.958988268668706e-06, - "loss": 0.8828, - "step": 13898 - }, - { - "epoch": 0.36, - "learning_rate": 1.9589804252286636e-06, - "loss": 1.0312, - "step": 13899 - }, - { - "epoch": 0.36, - "learning_rate": 1.9589725810543738e-06, - "loss": 1.1504, - "step": 13900 - }, - { - "epoch": 0.36, - "learning_rate": 1.9589647361458428e-06, - "loss": 0.9111, - "step": 13901 - }, - { - "epoch": 0.36, - "learning_rate": 1.9589568905030765e-06, - "loss": 0.7568, - "step": 13902 - }, - { - "epoch": 0.36, - "learning_rate": 1.9589490441260813e-06, - "loss": 0.8799, - "step": 13903 - }, - { - "epoch": 0.36, - "learning_rate": 1.9589411970148627e-06, - "loss": 0.8721, - "step": 13904 - }, - { - "epoch": 0.36, - "learning_rate": 1.958933349169427e-06, - "loss": 1.1797, - "step": 13905 - }, - { - "epoch": 0.36, - "learning_rate": 1.9589255005897803e-06, - "loss": 0.7651, - "step": 13906 - }, - { - "epoch": 0.36, - "learning_rate": 1.9589176512759284e-06, - "loss": 1.04, - "step": 13907 - }, - { - "epoch": 0.36, - "learning_rate": 1.958909801227877e-06, - "loss": 0.7803, - "step": 13908 - }, - { - "epoch": 0.36, - "learning_rate": 1.9589019504456326e-06, - "loss": 0.9248, - "step": 13909 - }, - { - "epoch": 0.36, - "learning_rate": 1.958894098929201e-06, - "loss": 1.1035, - "step": 13910 - }, - { - "epoch": 0.36, - "learning_rate": 1.9588862466785885e-06, - "loss": 0.9209, - "step": 13911 - }, - { - "epoch": 0.36, - "learning_rate": 1.9588783936938007e-06, - "loss": 0.9189, - "step": 13912 - }, - { - "epoch": 0.36, - "learning_rate": 1.958870539974844e-06, - "loss": 0.9424, - "step": 13913 - }, - { - "epoch": 0.36, - "learning_rate": 1.958862685521724e-06, - "loss": 0.7524, - "step": 13914 - }, - { - "epoch": 0.36, - "learning_rate": 1.9588548303344474e-06, - "loss": 0.9795, - "step": 13915 - }, - { - "epoch": 0.36, - "learning_rate": 1.9588469744130193e-06, - "loss": 1.0381, - "step": 13916 - }, - { - "epoch": 0.36, - "learning_rate": 1.958839117757446e-06, - "loss": 0.8818, - "step": 13917 - }, - { - "epoch": 0.36, - "learning_rate": 1.958831260367734e-06, - "loss": 1.1152, - "step": 13918 - }, - { - "epoch": 0.36, - "learning_rate": 1.958823402243889e-06, - "loss": 0.8794, - "step": 13919 - }, - { - "epoch": 0.36, - "learning_rate": 1.958815543385917e-06, - "loss": 0.8281, - "step": 13920 - }, - { - "epoch": 0.36, - "learning_rate": 1.958807683793824e-06, - "loss": 0.8799, - "step": 13921 - }, - { - "epoch": 0.36, - "learning_rate": 1.9587998234676156e-06, - "loss": 0.7896, - "step": 13922 - }, - { - "epoch": 0.36, - "learning_rate": 1.958791962407299e-06, - "loss": 0.7422, - "step": 13923 - }, - { - "epoch": 0.36, - "learning_rate": 1.958784100612879e-06, - "loss": 0.9414, - "step": 13924 - }, - { - "epoch": 0.36, - "learning_rate": 1.958776238084362e-06, - "loss": 0.8818, - "step": 13925 - }, - { - "epoch": 0.36, - "learning_rate": 1.9587683748217546e-06, - "loss": 0.8223, - "step": 13926 - }, - { - "epoch": 0.36, - "learning_rate": 1.958760510825062e-06, - "loss": 0.8525, - "step": 13927 - }, - { - "epoch": 0.36, - "learning_rate": 1.958752646094291e-06, - "loss": 0.8311, - "step": 13928 - }, - { - "epoch": 0.36, - "learning_rate": 1.9587447806294465e-06, - "loss": 0.9912, - "step": 13929 - }, - { - "epoch": 0.36, - "learning_rate": 1.9587369144305357e-06, - "loss": 0.998, - "step": 13930 - }, - { - "epoch": 0.36, - "learning_rate": 1.958729047497564e-06, - "loss": 1.1558, - "step": 13931 - }, - { - "epoch": 0.36, - "learning_rate": 1.9587211798305377e-06, - "loss": 0.9668, - "step": 13932 - }, - { - "epoch": 0.36, - "learning_rate": 1.9587133114294623e-06, - "loss": 0.9844, - "step": 13933 - }, - { - "epoch": 0.36, - "learning_rate": 1.9587054422943444e-06, - "loss": 0.9648, - "step": 13934 - }, - { - "epoch": 0.36, - "learning_rate": 1.95869757242519e-06, - "loss": 0.7881, - "step": 13935 - }, - { - "epoch": 0.36, - "learning_rate": 1.9586897018220046e-06, - "loss": 0.6758, - "step": 13936 - }, - { - "epoch": 0.36, - "learning_rate": 1.9586818304847946e-06, - "loss": 0.9551, - "step": 13937 - }, - { - "epoch": 0.36, - "learning_rate": 1.958673958413566e-06, - "loss": 0.9766, - "step": 13938 - }, - { - "epoch": 0.36, - "learning_rate": 1.958666085608325e-06, - "loss": 0.7725, - "step": 13939 - }, - { - "epoch": 0.36, - "learning_rate": 1.9586582120690777e-06, - "loss": 0.9834, - "step": 13940 - }, - { - "epoch": 0.36, - "learning_rate": 1.95865033779583e-06, - "loss": 1.21, - "step": 13941 - }, - { - "epoch": 0.36, - "learning_rate": 1.958642462788587e-06, - "loss": 1.1436, - "step": 13942 - }, - { - "epoch": 0.36, - "learning_rate": 1.9586345870473563e-06, - "loss": 0.9492, - "step": 13943 - }, - { - "epoch": 0.36, - "learning_rate": 1.9586267105721427e-06, - "loss": 1.0068, - "step": 13944 - }, - { - "epoch": 0.36, - "learning_rate": 1.958618833362953e-06, - "loss": 0.9512, - "step": 13945 - }, - { - "epoch": 0.36, - "learning_rate": 1.9586109554197927e-06, - "loss": 0.9688, - "step": 13946 - }, - { - "epoch": 0.36, - "learning_rate": 1.9586030767426682e-06, - "loss": 0.8701, - "step": 13947 - }, - { - "epoch": 0.36, - "learning_rate": 1.9585951973315855e-06, - "loss": 0.8252, - "step": 13948 - }, - { - "epoch": 0.36, - "learning_rate": 1.9585873171865503e-06, - "loss": 0.8203, - "step": 13949 - }, - { - "epoch": 0.36, - "learning_rate": 1.9585794363075692e-06, - "loss": 0.958, - "step": 13950 - }, - { - "epoch": 0.36, - "learning_rate": 1.9585715546946476e-06, - "loss": 0.9219, - "step": 13951 - }, - { - "epoch": 0.36, - "learning_rate": 1.958563672347792e-06, - "loss": 0.9756, - "step": 13952 - }, - { - "epoch": 0.36, - "learning_rate": 1.9585557892670083e-06, - "loss": 1.0586, - "step": 13953 - }, - { - "epoch": 0.36, - "learning_rate": 1.958547905452302e-06, - "loss": 1.0586, - "step": 13954 - }, - { - "epoch": 0.36, - "learning_rate": 1.9585400209036803e-06, - "loss": 0.9062, - "step": 13955 - }, - { - "epoch": 0.36, - "learning_rate": 1.9585321356211485e-06, - "loss": 1.1533, - "step": 13956 - }, - { - "epoch": 0.36, - "learning_rate": 1.9585242496047126e-06, - "loss": 0.896, - "step": 13957 - }, - { - "epoch": 0.36, - "learning_rate": 1.9585163628543787e-06, - "loss": 0.6743, - "step": 13958 - }, - { - "epoch": 0.36, - "learning_rate": 1.958508475370153e-06, - "loss": 0.6572, - "step": 13959 - }, - { - "epoch": 0.36, - "learning_rate": 1.9585005871520412e-06, - "loss": 0.8623, - "step": 13960 - }, - { - "epoch": 0.36, - "learning_rate": 1.9584926982000497e-06, - "loss": 0.8691, - "step": 13961 - }, - { - "epoch": 0.36, - "learning_rate": 1.9584848085141845e-06, - "loss": 0.8252, - "step": 13962 - }, - { - "epoch": 0.36, - "learning_rate": 1.9584769180944513e-06, - "loss": 0.8374, - "step": 13963 - }, - { - "epoch": 0.36, - "learning_rate": 1.9584690269408567e-06, - "loss": 0.833, - "step": 13964 - }, - { - "epoch": 0.36, - "learning_rate": 1.9584611350534064e-06, - "loss": 0.5725, - "step": 13965 - }, - { - "epoch": 0.36, - "learning_rate": 1.958453242432106e-06, - "loss": 0.6519, - "step": 13966 - }, - { - "epoch": 0.36, - "learning_rate": 1.9584453490769625e-06, - "loss": 0.9736, - "step": 13967 - }, - { - "epoch": 0.36, - "learning_rate": 1.9584374549879816e-06, - "loss": 0.8047, - "step": 13968 - }, - { - "epoch": 0.36, - "learning_rate": 1.958429560165169e-06, - "loss": 0.9932, - "step": 13969 - }, - { - "epoch": 0.36, - "learning_rate": 1.958421664608531e-06, - "loss": 1.0078, - "step": 13970 - }, - { - "epoch": 0.36, - "learning_rate": 1.9584137683180733e-06, - "loss": 0.8799, - "step": 13971 - }, - { - "epoch": 0.36, - "learning_rate": 1.9584058712938027e-06, - "loss": 0.8706, - "step": 13972 - }, - { - "epoch": 0.36, - "learning_rate": 1.9583979735357245e-06, - "loss": 0.8945, - "step": 13973 - }, - { - "epoch": 0.36, - "learning_rate": 1.9583900750438452e-06, - "loss": 0.9014, - "step": 13974 - }, - { - "epoch": 0.36, - "learning_rate": 1.9583821758181707e-06, - "loss": 0.7852, - "step": 13975 - }, - { - "epoch": 0.36, - "learning_rate": 1.958374275858707e-06, - "loss": 0.7251, - "step": 13976 - }, - { - "epoch": 0.36, - "learning_rate": 1.95836637516546e-06, - "loss": 0.7842, - "step": 13977 - }, - { - "epoch": 0.36, - "learning_rate": 1.958358473738436e-06, - "loss": 0.7002, - "step": 13978 - }, - { - "epoch": 0.36, - "learning_rate": 1.958350571577641e-06, - "loss": 0.9407, - "step": 13979 - }, - { - "epoch": 0.36, - "learning_rate": 1.9583426686830814e-06, - "loss": 0.9639, - "step": 13980 - }, - { - "epoch": 0.36, - "learning_rate": 1.9583347650547625e-06, - "loss": 1.0674, - "step": 13981 - }, - { - "epoch": 0.36, - "learning_rate": 1.958326860692691e-06, - "loss": 0.8965, - "step": 13982 - }, - { - "epoch": 0.36, - "learning_rate": 1.9583189555968726e-06, - "loss": 0.8379, - "step": 13983 - }, - { - "epoch": 0.36, - "learning_rate": 1.958311049767313e-06, - "loss": 1.0195, - "step": 13984 - }, - { - "epoch": 0.36, - "learning_rate": 1.958303143204019e-06, - "loss": 0.8569, - "step": 13985 - }, - { - "epoch": 0.36, - "learning_rate": 1.9582952359069967e-06, - "loss": 0.833, - "step": 13986 - }, - { - "epoch": 0.36, - "learning_rate": 1.958287327876251e-06, - "loss": 0.6816, - "step": 13987 - }, - { - "epoch": 0.36, - "learning_rate": 1.9582794191117897e-06, - "loss": 0.7156, - "step": 13988 - }, - { - "epoch": 0.36, - "learning_rate": 1.958271509613617e-06, - "loss": 0.9189, - "step": 13989 - }, - { - "epoch": 0.36, - "learning_rate": 1.9582635993817405e-06, - "loss": 0.9619, - "step": 13990 - }, - { - "epoch": 0.36, - "learning_rate": 1.9582556884161656e-06, - "loss": 0.7622, - "step": 13991 - }, - { - "epoch": 0.36, - "learning_rate": 1.958247776716898e-06, - "loss": 1.0654, - "step": 13992 - }, - { - "epoch": 0.36, - "learning_rate": 1.9582398642839444e-06, - "loss": 0.7246, - "step": 13993 - }, - { - "epoch": 0.36, - "learning_rate": 1.958231951117311e-06, - "loss": 0.9238, - "step": 13994 - }, - { - "epoch": 0.36, - "learning_rate": 1.9582240372170026e-06, - "loss": 0.7598, - "step": 13995 - }, - { - "epoch": 0.36, - "learning_rate": 1.9582161225830263e-06, - "loss": 1.0244, - "step": 13996 - }, - { - "epoch": 0.36, - "learning_rate": 1.9582082072153886e-06, - "loss": 0.8301, - "step": 13997 - }, - { - "epoch": 0.36, - "learning_rate": 1.9582002911140945e-06, - "loss": 0.9043, - "step": 13998 - }, - { - "epoch": 0.36, - "learning_rate": 1.9581923742791505e-06, - "loss": 0.7119, - "step": 13999 - }, - { - "epoch": 0.36, - "learning_rate": 1.958184456710563e-06, - "loss": 0.7344, - "step": 14000 - }, - { - "epoch": 0.36, - "learning_rate": 1.958176538408337e-06, - "loss": 0.8574, - "step": 14001 - }, - { - "epoch": 0.36, - "learning_rate": 1.9581686193724797e-06, - "loss": 0.4805, - "step": 14002 - }, - { - "epoch": 0.36, - "learning_rate": 1.958160699602997e-06, - "loss": 1.0078, - "step": 14003 - }, - { - "epoch": 0.36, - "learning_rate": 1.9581527790998945e-06, - "loss": 0.9795, - "step": 14004 - }, - { - "epoch": 0.36, - "learning_rate": 1.958144857863178e-06, - "loss": 0.9277, - "step": 14005 - }, - { - "epoch": 0.36, - "learning_rate": 1.9581369358928547e-06, - "loss": 0.7671, - "step": 14006 - }, - { - "epoch": 0.36, - "learning_rate": 1.95812901318893e-06, - "loss": 0.9199, - "step": 14007 - }, - { - "epoch": 0.36, - "learning_rate": 1.9581210897514094e-06, - "loss": 0.8335, - "step": 14008 - }, - { - "epoch": 0.36, - "learning_rate": 1.9581131655803e-06, - "loss": 0.835, - "step": 14009 - }, - { - "epoch": 0.36, - "learning_rate": 1.9581052406756073e-06, - "loss": 0.7573, - "step": 14010 - }, - { - "epoch": 0.36, - "learning_rate": 1.9580973150373373e-06, - "loss": 0.9385, - "step": 14011 - }, - { - "epoch": 0.36, - "learning_rate": 1.9580893886654964e-06, - "loss": 0.9189, - "step": 14012 - }, - { - "epoch": 0.36, - "learning_rate": 1.9580814615600907e-06, - "loss": 0.916, - "step": 14013 - }, - { - "epoch": 0.36, - "learning_rate": 1.9580735337211257e-06, - "loss": 0.7671, - "step": 14014 - }, - { - "epoch": 0.36, - "learning_rate": 1.958065605148608e-06, - "loss": 0.5688, - "step": 14015 - }, - { - "epoch": 0.36, - "learning_rate": 1.958057675842544e-06, - "loss": 0.8096, - "step": 14016 - }, - { - "epoch": 0.36, - "learning_rate": 1.9580497458029386e-06, - "loss": 0.7793, - "step": 14017 - }, - { - "epoch": 0.36, - "learning_rate": 1.958041815029799e-06, - "loss": 0.8232, - "step": 14018 - }, - { - "epoch": 0.36, - "learning_rate": 1.9580338835231304e-06, - "loss": 0.8896, - "step": 14019 - }, - { - "epoch": 0.36, - "learning_rate": 1.9580259512829394e-06, - "loss": 0.9131, - "step": 14020 - }, - { - "epoch": 0.36, - "learning_rate": 1.9580180183092323e-06, - "loss": 0.9531, - "step": 14021 - }, - { - "epoch": 0.36, - "learning_rate": 1.9580100846020146e-06, - "loss": 1.1016, - "step": 14022 - }, - { - "epoch": 0.36, - "learning_rate": 1.9580021501612925e-06, - "loss": 0.7764, - "step": 14023 - }, - { - "epoch": 0.36, - "learning_rate": 1.9579942149870726e-06, - "loss": 0.752, - "step": 14024 - }, - { - "epoch": 0.36, - "learning_rate": 1.9579862790793602e-06, - "loss": 0.9053, - "step": 14025 - }, - { - "epoch": 0.36, - "learning_rate": 1.9579783424381622e-06, - "loss": 0.708, - "step": 14026 - }, - { - "epoch": 0.36, - "learning_rate": 1.957970405063484e-06, - "loss": 1.0195, - "step": 14027 - }, - { - "epoch": 0.36, - "learning_rate": 1.9579624669553318e-06, - "loss": 0.9863, - "step": 14028 - }, - { - "epoch": 0.36, - "learning_rate": 1.957954528113712e-06, - "loss": 0.5334, - "step": 14029 - }, - { - "epoch": 0.36, - "learning_rate": 1.9579465885386303e-06, - "loss": 1.0488, - "step": 14030 - }, - { - "epoch": 0.36, - "learning_rate": 1.957938648230093e-06, - "loss": 0.8428, - "step": 14031 - }, - { - "epoch": 0.36, - "learning_rate": 1.957930707188106e-06, - "loss": 0.9385, - "step": 14032 - }, - { - "epoch": 0.36, - "learning_rate": 1.957922765412676e-06, - "loss": 0.8625, - "step": 14033 - }, - { - "epoch": 0.36, - "learning_rate": 1.957914822903808e-06, - "loss": 0.9668, - "step": 14034 - }, - { - "epoch": 0.36, - "learning_rate": 1.957906879661509e-06, - "loss": 0.9482, - "step": 14035 - }, - { - "epoch": 0.36, - "learning_rate": 1.9578989356857845e-06, - "loss": 0.8916, - "step": 14036 - }, - { - "epoch": 0.36, - "learning_rate": 1.957890990976641e-06, - "loss": 1.1172, - "step": 14037 - }, - { - "epoch": 0.36, - "learning_rate": 1.957883045534084e-06, - "loss": 0.8447, - "step": 14038 - }, - { - "epoch": 0.36, - "learning_rate": 1.9578750993581204e-06, - "loss": 0.6487, - "step": 14039 - }, - { - "epoch": 0.36, - "learning_rate": 1.957867152448756e-06, - "loss": 0.8184, - "step": 14040 - }, - { - "epoch": 0.36, - "learning_rate": 1.9578592048059965e-06, - "loss": 0.8545, - "step": 14041 - }, - { - "epoch": 0.36, - "learning_rate": 1.957851256429848e-06, - "loss": 0.7061, - "step": 14042 - }, - { - "epoch": 0.36, - "learning_rate": 1.9578433073203176e-06, - "loss": 0.9248, - "step": 14043 - }, - { - "epoch": 0.36, - "learning_rate": 1.95783535747741e-06, - "loss": 0.8936, - "step": 14044 - }, - { - "epoch": 0.36, - "learning_rate": 1.9578274069011323e-06, - "loss": 0.7686, - "step": 14045 - }, - { - "epoch": 0.36, - "learning_rate": 1.95781945559149e-06, - "loss": 1.127, - "step": 14046 - }, - { - "epoch": 0.36, - "learning_rate": 1.9578115035484894e-06, - "loss": 0.9355, - "step": 14047 - }, - { - "epoch": 0.36, - "learning_rate": 1.9578035507721367e-06, - "loss": 0.7671, - "step": 14048 - }, - { - "epoch": 0.36, - "learning_rate": 1.9577955972624376e-06, - "loss": 0.9326, - "step": 14049 - }, - { - "epoch": 0.36, - "learning_rate": 1.9577876430193986e-06, - "loss": 0.77, - "step": 14050 - }, - { - "epoch": 0.36, - "learning_rate": 1.9577796880430256e-06, - "loss": 0.8013, - "step": 14051 - }, - { - "epoch": 0.36, - "learning_rate": 1.957771732333325e-06, - "loss": 0.9648, - "step": 14052 - }, - { - "epoch": 0.36, - "learning_rate": 1.957763775890302e-06, - "loss": 1.0205, - "step": 14053 - }, - { - "epoch": 0.36, - "learning_rate": 1.957755818713964e-06, - "loss": 0.8613, - "step": 14054 - }, - { - "epoch": 0.36, - "learning_rate": 1.957747860804316e-06, - "loss": 0.9077, - "step": 14055 - }, - { - "epoch": 0.36, - "learning_rate": 1.957739902161365e-06, - "loss": 0.8076, - "step": 14056 - }, - { - "epoch": 0.36, - "learning_rate": 1.957731942785116e-06, - "loss": 0.9551, - "step": 14057 - }, - { - "epoch": 0.36, - "learning_rate": 1.9577239826755756e-06, - "loss": 0.7021, - "step": 14058 - }, - { - "epoch": 0.36, - "learning_rate": 1.9577160218327506e-06, - "loss": 0.7607, - "step": 14059 - }, - { - "epoch": 0.36, - "learning_rate": 1.957708060256646e-06, - "loss": 0.8384, - "step": 14060 - }, - { - "epoch": 0.36, - "learning_rate": 1.9577000979472684e-06, - "loss": 1.0391, - "step": 14061 - }, - { - "epoch": 0.36, - "learning_rate": 1.957692134904624e-06, - "loss": 0.9297, - "step": 14062 - }, - { - "epoch": 0.36, - "learning_rate": 1.9576841711287187e-06, - "loss": 1.0625, - "step": 14063 - }, - { - "epoch": 0.36, - "learning_rate": 1.957676206619559e-06, - "loss": 0.761, - "step": 14064 - }, - { - "epoch": 0.36, - "learning_rate": 1.9576682413771505e-06, - "loss": 0.8555, - "step": 14065 - }, - { - "epoch": 0.36, - "learning_rate": 1.9576602754014995e-06, - "loss": 0.918, - "step": 14066 - }, - { - "epoch": 0.36, - "learning_rate": 1.9576523086926118e-06, - "loss": 1.0176, - "step": 14067 - }, - { - "epoch": 0.36, - "learning_rate": 1.957644341250494e-06, - "loss": 0.8867, - "step": 14068 - }, - { - "epoch": 0.36, - "learning_rate": 1.9576363730751515e-06, - "loss": 0.7632, - "step": 14069 - }, - { - "epoch": 0.36, - "learning_rate": 1.9576284041665913e-06, - "loss": 0.709, - "step": 14070 - }, - { - "epoch": 0.36, - "learning_rate": 1.957620434524819e-06, - "loss": 0.8398, - "step": 14071 - }, - { - "epoch": 0.36, - "learning_rate": 1.957612464149841e-06, - "loss": 0.9805, - "step": 14072 - }, - { - "epoch": 0.36, - "learning_rate": 1.957604493041663e-06, - "loss": 0.9404, - "step": 14073 - }, - { - "epoch": 0.36, - "learning_rate": 1.9575965212002908e-06, - "loss": 0.8267, - "step": 14074 - }, - { - "epoch": 0.36, - "learning_rate": 1.9575885486257313e-06, - "loss": 1.1465, - "step": 14075 - }, - { - "epoch": 0.36, - "learning_rate": 1.95758057531799e-06, - "loss": 0.9565, - "step": 14076 - }, - { - "epoch": 0.36, - "learning_rate": 1.957572601277074e-06, - "loss": 0.9287, - "step": 14077 - }, - { - "epoch": 0.36, - "learning_rate": 1.957564626502988e-06, - "loss": 0.8779, - "step": 14078 - }, - { - "epoch": 0.36, - "learning_rate": 1.957556650995739e-06, - "loss": 0.8887, - "step": 14079 - }, - { - "epoch": 0.36, - "learning_rate": 1.9575486747553332e-06, - "loss": 0.7363, - "step": 14080 - }, - { - "epoch": 0.36, - "learning_rate": 1.9575406977817767e-06, - "loss": 0.7988, - "step": 14081 - }, - { - "epoch": 0.36, - "learning_rate": 1.9575327200750746e-06, - "loss": 0.6392, - "step": 14082 - }, - { - "epoch": 0.36, - "learning_rate": 1.957524741635234e-06, - "loss": 1.1758, - "step": 14083 - }, - { - "epoch": 0.36, - "learning_rate": 1.9575167624622605e-06, - "loss": 0.8955, - "step": 14084 - }, - { - "epoch": 0.36, - "learning_rate": 1.9575087825561608e-06, - "loss": 0.9199, - "step": 14085 - }, - { - "epoch": 0.36, - "learning_rate": 1.9575008019169404e-06, - "loss": 0.918, - "step": 14086 - }, - { - "epoch": 0.36, - "learning_rate": 1.957492820544606e-06, - "loss": 0.9697, - "step": 14087 - }, - { - "epoch": 0.36, - "learning_rate": 1.957484838439163e-06, - "loss": 0.8369, - "step": 14088 - }, - { - "epoch": 0.36, - "learning_rate": 1.957476855600618e-06, - "loss": 0.9248, - "step": 14089 - }, - { - "epoch": 0.36, - "learning_rate": 1.957468872028977e-06, - "loss": 0.9072, - "step": 14090 - }, - { - "epoch": 0.36, - "learning_rate": 1.957460887724246e-06, - "loss": 0.9502, - "step": 14091 - }, - { - "epoch": 0.36, - "learning_rate": 1.957452902686431e-06, - "loss": 0.8428, - "step": 14092 - }, - { - "epoch": 0.36, - "learning_rate": 1.9574449169155393e-06, - "loss": 1.0225, - "step": 14093 - }, - { - "epoch": 0.36, - "learning_rate": 1.957436930411575e-06, - "loss": 1.0898, - "step": 14094 - }, - { - "epoch": 0.36, - "learning_rate": 1.9574289431745457e-06, - "loss": 0.9106, - "step": 14095 - }, - { - "epoch": 0.36, - "learning_rate": 1.9574209552044572e-06, - "loss": 1.0039, - "step": 14096 - }, - { - "epoch": 0.36, - "learning_rate": 1.9574129665013155e-06, - "loss": 0.877, - "step": 14097 - }, - { - "epoch": 0.36, - "learning_rate": 1.9574049770651265e-06, - "loss": 1.0488, - "step": 14098 - }, - { - "epoch": 0.36, - "learning_rate": 1.9573969868958965e-06, - "loss": 0.6309, - "step": 14099 - }, - { - "epoch": 0.36, - "learning_rate": 1.957388995993632e-06, - "loss": 0.9092, - "step": 14100 - }, - { - "epoch": 0.36, - "learning_rate": 1.9573810043583384e-06, - "loss": 0.9229, - "step": 14101 - }, - { - "epoch": 0.36, - "learning_rate": 1.9573730119900224e-06, - "loss": 0.8711, - "step": 14102 - }, - { - "epoch": 0.36, - "learning_rate": 1.95736501888869e-06, - "loss": 1.0762, - "step": 14103 - }, - { - "epoch": 0.36, - "learning_rate": 1.957357025054347e-06, - "loss": 0.916, - "step": 14104 - }, - { - "epoch": 0.36, - "learning_rate": 1.9573490304869995e-06, - "loss": 0.8262, - "step": 14105 - }, - { - "epoch": 0.36, - "learning_rate": 1.9573410351866545e-06, - "loss": 0.9102, - "step": 14106 - }, - { - "epoch": 0.36, - "learning_rate": 1.9573330391533168e-06, - "loss": 0.7803, - "step": 14107 - }, - { - "epoch": 0.36, - "learning_rate": 1.957325042386994e-06, - "loss": 0.8496, - "step": 14108 - }, - { - "epoch": 0.36, - "learning_rate": 1.957317044887691e-06, - "loss": 0.9404, - "step": 14109 - }, - { - "epoch": 0.36, - "learning_rate": 1.957309046655414e-06, - "loss": 0.875, - "step": 14110 - }, - { - "epoch": 0.36, - "learning_rate": 1.95730104769017e-06, - "loss": 0.8926, - "step": 14111 - }, - { - "epoch": 0.36, - "learning_rate": 1.9572930479919647e-06, - "loss": 0.8535, - "step": 14112 - }, - { - "epoch": 0.36, - "learning_rate": 1.9572850475608035e-06, - "loss": 0.832, - "step": 14113 - }, - { - "epoch": 0.36, - "learning_rate": 1.9572770463966933e-06, - "loss": 0.5476, - "step": 14114 - }, - { - "epoch": 0.36, - "learning_rate": 1.9572690444996404e-06, - "loss": 0.9219, - "step": 14115 - }, - { - "epoch": 0.36, - "learning_rate": 1.9572610418696507e-06, - "loss": 0.5986, - "step": 14116 - }, - { - "epoch": 0.36, - "learning_rate": 1.9572530385067302e-06, - "loss": 0.8096, - "step": 14117 - }, - { - "epoch": 0.36, - "learning_rate": 1.957245034410885e-06, - "loss": 0.8955, - "step": 14118 - }, - { - "epoch": 0.36, - "learning_rate": 1.957237029582121e-06, - "loss": 0.6021, - "step": 14119 - }, - { - "epoch": 0.36, - "learning_rate": 1.957229024020445e-06, - "loss": 0.8877, - "step": 14120 - }, - { - "epoch": 0.36, - "learning_rate": 1.9572210177258627e-06, - "loss": 1.0098, - "step": 14121 - }, - { - "epoch": 0.36, - "learning_rate": 1.95721301069838e-06, - "loss": 0.8999, - "step": 14122 - }, - { - "epoch": 0.36, - "learning_rate": 1.9572050029380037e-06, - "loss": 0.709, - "step": 14123 - }, - { - "epoch": 0.36, - "learning_rate": 1.957196994444739e-06, - "loss": 0.6538, - "step": 14124 - }, - { - "epoch": 0.36, - "learning_rate": 1.957188985218593e-06, - "loss": 1.0527, - "step": 14125 - }, - { - "epoch": 0.36, - "learning_rate": 1.9571809752595713e-06, - "loss": 0.8965, - "step": 14126 - }, - { - "epoch": 0.36, - "learning_rate": 1.95717296456768e-06, - "loss": 0.8525, - "step": 14127 - }, - { - "epoch": 0.36, - "learning_rate": 1.9571649531429257e-06, - "loss": 0.9688, - "step": 14128 - }, - { - "epoch": 0.36, - "learning_rate": 1.9571569409853138e-06, - "loss": 0.9775, - "step": 14129 - }, - { - "epoch": 0.36, - "learning_rate": 1.957148928094851e-06, - "loss": 0.9561, - "step": 14130 - }, - { - "epoch": 0.36, - "learning_rate": 1.9571409144715435e-06, - "loss": 0.8022, - "step": 14131 - }, - { - "epoch": 0.36, - "learning_rate": 1.957132900115397e-06, - "loss": 1.1396, - "step": 14132 - }, - { - "epoch": 0.36, - "learning_rate": 1.9571248850264184e-06, - "loss": 0.8042, - "step": 14133 - }, - { - "epoch": 0.36, - "learning_rate": 1.957116869204612e-06, - "loss": 0.9072, - "step": 14134 - }, - { - "epoch": 0.36, - "learning_rate": 1.957108852649986e-06, - "loss": 0.8721, - "step": 14135 - }, - { - "epoch": 0.36, - "learning_rate": 1.9571008353625462e-06, - "loss": 0.96, - "step": 14136 - }, - { - "epoch": 0.36, - "learning_rate": 1.957092817342298e-06, - "loss": 0.7969, - "step": 14137 - }, - { - "epoch": 0.36, - "learning_rate": 1.9570847985892478e-06, - "loss": 0.9092, - "step": 14138 - }, - { - "epoch": 0.36, - "learning_rate": 1.9570767791034016e-06, - "loss": 0.8887, - "step": 14139 - }, - { - "epoch": 0.36, - "learning_rate": 1.9570687588847655e-06, - "loss": 0.833, - "step": 14140 - }, - { - "epoch": 0.36, - "learning_rate": 1.9570607379333465e-06, - "loss": 0.8564, - "step": 14141 - }, - { - "epoch": 0.36, - "learning_rate": 1.9570527162491495e-06, - "loss": 0.8135, - "step": 14142 - }, - { - "epoch": 0.36, - "learning_rate": 1.957044693832182e-06, - "loss": 0.9111, - "step": 14143 - }, - { - "epoch": 0.36, - "learning_rate": 1.9570366706824484e-06, - "loss": 1.0098, - "step": 14144 - }, - { - "epoch": 0.36, - "learning_rate": 1.9570286467999566e-06, - "loss": 0.9287, - "step": 14145 - }, - { - "epoch": 0.36, - "learning_rate": 1.9570206221847118e-06, - "loss": 0.7449, - "step": 14146 - }, - { - "epoch": 0.36, - "learning_rate": 1.95701259683672e-06, - "loss": 1.1621, - "step": 14147 - }, - { - "epoch": 0.36, - "learning_rate": 1.957004570755988e-06, - "loss": 1.0586, - "step": 14148 - }, - { - "epoch": 0.36, - "learning_rate": 1.9569965439425214e-06, - "loss": 0.8662, - "step": 14149 - }, - { - "epoch": 0.36, - "learning_rate": 1.9569885163963266e-06, - "loss": 0.5864, - "step": 14150 - }, - { - "epoch": 0.36, - "learning_rate": 1.95698048811741e-06, - "loss": 0.9326, - "step": 14151 - }, - { - "epoch": 0.36, - "learning_rate": 1.956972459105777e-06, - "loss": 0.6548, - "step": 14152 - }, - { - "epoch": 0.36, - "learning_rate": 1.956964429361434e-06, - "loss": 0.9189, - "step": 14153 - }, - { - "epoch": 0.36, - "learning_rate": 1.9569563988843876e-06, - "loss": 0.748, - "step": 14154 - }, - { - "epoch": 0.36, - "learning_rate": 1.956948367674644e-06, - "loss": 0.9492, - "step": 14155 - }, - { - "epoch": 0.36, - "learning_rate": 1.956940335732209e-06, - "loss": 0.772, - "step": 14156 - }, - { - "epoch": 0.36, - "learning_rate": 1.956932303057088e-06, - "loss": 0.8643, - "step": 14157 - }, - { - "epoch": 0.36, - "learning_rate": 1.956924269649289e-06, - "loss": 0.7998, - "step": 14158 - }, - { - "epoch": 0.36, - "learning_rate": 1.9569162355088165e-06, - "loss": 0.748, - "step": 14159 - }, - { - "epoch": 0.36, - "learning_rate": 1.9569082006356774e-06, - "loss": 0.8887, - "step": 14160 - }, - { - "epoch": 0.36, - "learning_rate": 1.9569001650298777e-06, - "loss": 1.0039, - "step": 14161 - }, - { - "epoch": 0.36, - "learning_rate": 1.9568921286914233e-06, - "loss": 0.999, - "step": 14162 - }, - { - "epoch": 0.36, - "learning_rate": 1.956884091620321e-06, - "loss": 0.9902, - "step": 14163 - }, - { - "epoch": 0.36, - "learning_rate": 1.9568760538165763e-06, - "loss": 0.7368, - "step": 14164 - }, - { - "epoch": 0.36, - "learning_rate": 1.956868015280196e-06, - "loss": 1.1533, - "step": 14165 - }, - { - "epoch": 0.36, - "learning_rate": 1.9568599760111854e-06, - "loss": 0.8242, - "step": 14166 - }, - { - "epoch": 0.36, - "learning_rate": 1.956851936009551e-06, - "loss": 0.8828, - "step": 14167 - }, - { - "epoch": 0.36, - "learning_rate": 1.9568438952752994e-06, - "loss": 0.9277, - "step": 14168 - }, - { - "epoch": 0.36, - "learning_rate": 1.956835853808436e-06, - "loss": 0.8896, - "step": 14169 - }, - { - "epoch": 0.36, - "learning_rate": 1.956827811608968e-06, - "loss": 0.9551, - "step": 14170 - }, - { - "epoch": 0.36, - "learning_rate": 1.9568197686769006e-06, - "loss": 0.9619, - "step": 14171 - }, - { - "epoch": 0.36, - "learning_rate": 1.95681172501224e-06, - "loss": 0.8496, - "step": 14172 - }, - { - "epoch": 0.36, - "learning_rate": 1.956803680614993e-06, - "loss": 0.9375, - "step": 14173 - }, - { - "epoch": 0.36, - "learning_rate": 1.9567956354851656e-06, - "loss": 0.9043, - "step": 14174 - }, - { - "epoch": 0.36, - "learning_rate": 1.956787589622764e-06, - "loss": 0.8257, - "step": 14175 - }, - { - "epoch": 0.36, - "learning_rate": 1.9567795430277933e-06, - "loss": 0.7627, - "step": 14176 - }, - { - "epoch": 0.36, - "learning_rate": 1.956771495700261e-06, - "loss": 0.5884, - "step": 14177 - }, - { - "epoch": 0.36, - "learning_rate": 1.9567634476401724e-06, - "loss": 0.8223, - "step": 14178 - }, - { - "epoch": 0.36, - "learning_rate": 1.9567553988475346e-06, - "loss": 0.7148, - "step": 14179 - }, - { - "epoch": 0.36, - "learning_rate": 1.9567473493223527e-06, - "loss": 0.7832, - "step": 14180 - }, - { - "epoch": 0.36, - "learning_rate": 1.9567392990646335e-06, - "loss": 1.0439, - "step": 14181 - }, - { - "epoch": 0.36, - "learning_rate": 1.956731248074383e-06, - "loss": 0.8257, - "step": 14182 - }, - { - "epoch": 0.36, - "learning_rate": 1.9567231963516077e-06, - "loss": 1.0439, - "step": 14183 - }, - { - "epoch": 0.36, - "learning_rate": 1.956715143896313e-06, - "loss": 0.9678, - "step": 14184 - }, - { - "epoch": 0.36, - "learning_rate": 1.9567070907085057e-06, - "loss": 0.9922, - "step": 14185 - }, - { - "epoch": 0.36, - "learning_rate": 1.956699036788192e-06, - "loss": 0.9668, - "step": 14186 - }, - { - "epoch": 0.36, - "learning_rate": 1.9566909821353774e-06, - "loss": 1.0547, - "step": 14187 - }, - { - "epoch": 0.36, - "learning_rate": 1.9566829267500684e-06, - "loss": 0.7656, - "step": 14188 - }, - { - "epoch": 0.36, - "learning_rate": 1.9566748706322715e-06, - "loss": 0.8984, - "step": 14189 - }, - { - "epoch": 0.36, - "learning_rate": 1.9566668137819927e-06, - "loss": 0.7126, - "step": 14190 - }, - { - "epoch": 0.36, - "learning_rate": 1.9566587561992384e-06, - "loss": 0.6553, - "step": 14191 - }, - { - "epoch": 0.36, - "learning_rate": 1.956650697884014e-06, - "loss": 0.9688, - "step": 14192 - }, - { - "epoch": 0.36, - "learning_rate": 1.9566426388363264e-06, - "loss": 0.8779, - "step": 14193 - }, - { - "epoch": 0.36, - "learning_rate": 1.9566345790561814e-06, - "loss": 0.8232, - "step": 14194 - }, - { - "epoch": 0.36, - "learning_rate": 1.9566265185435854e-06, - "loss": 0.8506, - "step": 14195 - }, - { - "epoch": 0.36, - "learning_rate": 1.9566184572985444e-06, - "loss": 0.9204, - "step": 14196 - }, - { - "epoch": 0.36, - "learning_rate": 1.9566103953210646e-06, - "loss": 0.9785, - "step": 14197 - }, - { - "epoch": 0.36, - "learning_rate": 1.956602332611152e-06, - "loss": 0.9043, - "step": 14198 - }, - { - "epoch": 0.36, - "learning_rate": 1.956594269168813e-06, - "loss": 0.9282, - "step": 14199 - }, - { - "epoch": 0.36, - "learning_rate": 1.956586204994054e-06, - "loss": 0.9033, - "step": 14200 - }, - { - "epoch": 0.36, - "learning_rate": 1.9565781400868814e-06, - "loss": 0.8174, - "step": 14201 - }, - { - "epoch": 0.36, - "learning_rate": 1.9565700744473004e-06, - "loss": 0.8525, - "step": 14202 - }, - { - "epoch": 0.36, - "learning_rate": 1.9565620080753176e-06, - "loss": 0.9404, - "step": 14203 - }, - { - "epoch": 0.36, - "learning_rate": 1.9565539409709393e-06, - "loss": 0.8281, - "step": 14204 - }, - { - "epoch": 0.36, - "learning_rate": 1.956545873134172e-06, - "loss": 0.835, - "step": 14205 - }, - { - "epoch": 0.36, - "learning_rate": 1.9565378045650207e-06, - "loss": 0.8779, - "step": 14206 - }, - { - "epoch": 0.36, - "learning_rate": 1.9565297352634927e-06, - "loss": 0.9111, - "step": 14207 - }, - { - "epoch": 0.36, - "learning_rate": 1.9565216652295946e-06, - "loss": 0.5991, - "step": 14208 - }, - { - "epoch": 0.36, - "learning_rate": 1.956513594463331e-06, - "loss": 0.748, - "step": 14209 - }, - { - "epoch": 0.36, - "learning_rate": 1.9565055229647093e-06, - "loss": 1.0239, - "step": 14210 - }, - { - "epoch": 0.36, - "learning_rate": 1.956497450733735e-06, - "loss": 1.0166, - "step": 14211 - }, - { - "epoch": 0.36, - "learning_rate": 1.9564893777704147e-06, - "loss": 0.9658, - "step": 14212 - }, - { - "epoch": 0.36, - "learning_rate": 1.9564813040747547e-06, - "loss": 0.8408, - "step": 14213 - }, - { - "epoch": 0.36, - "learning_rate": 1.956473229646761e-06, - "loss": 0.8428, - "step": 14214 - }, - { - "epoch": 0.36, - "learning_rate": 1.9564651544864394e-06, - "loss": 0.7939, - "step": 14215 - }, - { - "epoch": 0.36, - "learning_rate": 1.9564570785937965e-06, - "loss": 0.8301, - "step": 14216 - }, - { - "epoch": 0.36, - "learning_rate": 1.9564490019688386e-06, - "loss": 1.2012, - "step": 14217 - }, - { - "epoch": 0.36, - "learning_rate": 1.956440924611571e-06, - "loss": 0.9248, - "step": 14218 - }, - { - "epoch": 0.36, - "learning_rate": 1.9564328465220014e-06, - "loss": 0.9893, - "step": 14219 - }, - { - "epoch": 0.36, - "learning_rate": 1.9564247677001347e-06, - "loss": 0.833, - "step": 14220 - }, - { - "epoch": 0.36, - "learning_rate": 1.9564166881459777e-06, - "loss": 0.7607, - "step": 14221 - }, - { - "epoch": 0.36, - "learning_rate": 1.956408607859536e-06, - "loss": 0.9111, - "step": 14222 - }, - { - "epoch": 0.36, - "learning_rate": 1.9564005268408166e-06, - "loss": 0.9062, - "step": 14223 - }, - { - "epoch": 0.36, - "learning_rate": 1.9563924450898253e-06, - "loss": 0.9238, - "step": 14224 - }, - { - "epoch": 0.36, - "learning_rate": 1.956384362606568e-06, - "loss": 0.9414, - "step": 14225 - }, - { - "epoch": 0.36, - "learning_rate": 1.9563762793910514e-06, - "loss": 0.8691, - "step": 14226 - }, - { - "epoch": 0.36, - "learning_rate": 1.956368195443282e-06, - "loss": 1.0928, - "step": 14227 - }, - { - "epoch": 0.36, - "learning_rate": 1.9563601107632647e-06, - "loss": 1.0312, - "step": 14228 - }, - { - "epoch": 0.36, - "learning_rate": 1.9563520253510066e-06, - "loss": 0.8721, - "step": 14229 - }, - { - "epoch": 0.36, - "learning_rate": 1.956343939206514e-06, - "loss": 0.5947, - "step": 14230 - }, - { - "epoch": 0.36, - "learning_rate": 1.9563358523297925e-06, - "loss": 0.6338, - "step": 14231 - }, - { - "epoch": 0.36, - "learning_rate": 1.956327764720849e-06, - "loss": 0.9092, - "step": 14232 - }, - { - "epoch": 0.36, - "learning_rate": 1.956319676379689e-06, - "loss": 0.9062, - "step": 14233 - }, - { - "epoch": 0.36, - "learning_rate": 1.9563115873063185e-06, - "loss": 0.8682, - "step": 14234 - }, - { - "epoch": 0.36, - "learning_rate": 1.956303497500745e-06, - "loss": 0.8506, - "step": 14235 - }, - { - "epoch": 0.36, - "learning_rate": 1.9562954069629734e-06, - "loss": 1.0576, - "step": 14236 - }, - { - "epoch": 0.36, - "learning_rate": 1.9562873156930107e-06, - "loss": 0.9839, - "step": 14237 - }, - { - "epoch": 0.36, - "learning_rate": 1.9562792236908624e-06, - "loss": 0.7385, - "step": 14238 - }, - { - "epoch": 0.36, - "learning_rate": 1.9562711309565356e-06, - "loss": 0.7295, - "step": 14239 - }, - { - "epoch": 0.36, - "learning_rate": 1.9562630374900355e-06, - "loss": 0.8965, - "step": 14240 - }, - { - "epoch": 0.37, - "learning_rate": 1.9562549432913687e-06, - "loss": 0.9922, - "step": 14241 - }, - { - "epoch": 0.37, - "learning_rate": 1.956246848360542e-06, - "loss": 0.7656, - "step": 14242 - }, - { - "epoch": 0.37, - "learning_rate": 1.9562387526975604e-06, - "loss": 1.0293, - "step": 14243 - }, - { - "epoch": 0.37, - "learning_rate": 1.9562306563024312e-06, - "loss": 0.9717, - "step": 14244 - }, - { - "epoch": 0.37, - "learning_rate": 1.9562225591751603e-06, - "loss": 0.9902, - "step": 14245 - }, - { - "epoch": 0.37, - "learning_rate": 1.9562144613157534e-06, - "loss": 1.0225, - "step": 14246 - }, - { - "epoch": 0.37, - "learning_rate": 1.956206362724217e-06, - "loss": 0.8906, - "step": 14247 - }, - { - "epoch": 0.37, - "learning_rate": 1.956198263400558e-06, - "loss": 0.9473, - "step": 14248 - }, - { - "epoch": 0.37, - "learning_rate": 1.956190163344781e-06, - "loss": 0.8916, - "step": 14249 - }, - { - "epoch": 0.37, - "learning_rate": 1.956182062556894e-06, - "loss": 0.9639, - "step": 14250 - }, - { - "epoch": 0.37, - "learning_rate": 1.9561739610369017e-06, - "loss": 0.9141, - "step": 14251 - }, - { - "epoch": 0.37, - "learning_rate": 1.9561658587848112e-06, - "loss": 0.8496, - "step": 14252 - }, - { - "epoch": 0.37, - "learning_rate": 1.956157755800629e-06, - "loss": 0.8301, - "step": 14253 - }, - { - "epoch": 0.37, - "learning_rate": 1.95614965208436e-06, - "loss": 0.9111, - "step": 14254 - }, - { - "epoch": 0.37, - "learning_rate": 1.9561415476360115e-06, - "loss": 0.9346, - "step": 14255 - }, - { - "epoch": 0.37, - "learning_rate": 1.956133442455589e-06, - "loss": 0.8037, - "step": 14256 - }, - { - "epoch": 0.37, - "learning_rate": 1.9561253365431e-06, - "loss": 0.9746, - "step": 14257 - }, - { - "epoch": 0.37, - "learning_rate": 1.956117229898549e-06, - "loss": 0.9609, - "step": 14258 - }, - { - "epoch": 0.37, - "learning_rate": 1.9561091225219435e-06, - "loss": 0.8633, - "step": 14259 - }, - { - "epoch": 0.37, - "learning_rate": 1.956101014413289e-06, - "loss": 0.6567, - "step": 14260 - }, - { - "epoch": 0.37, - "learning_rate": 1.9560929055725915e-06, - "loss": 0.79, - "step": 14261 - }, - { - "epoch": 0.37, - "learning_rate": 1.9560847959998582e-06, - "loss": 1.0996, - "step": 14262 - }, - { - "epoch": 0.37, - "learning_rate": 1.9560766856950945e-06, - "loss": 0.7998, - "step": 14263 - }, - { - "epoch": 0.37, - "learning_rate": 1.9560685746583067e-06, - "loss": 1.0273, - "step": 14264 - }, - { - "epoch": 0.37, - "learning_rate": 1.9560604628895016e-06, - "loss": 1.0664, - "step": 14265 - }, - { - "epoch": 0.37, - "learning_rate": 1.9560523503886843e-06, - "loss": 1.0518, - "step": 14266 - }, - { - "epoch": 0.37, - "learning_rate": 1.9560442371558624e-06, - "loss": 1.2109, - "step": 14267 - }, - { - "epoch": 0.37, - "learning_rate": 1.956036123191041e-06, - "loss": 0.8906, - "step": 14268 - }, - { - "epoch": 0.37, - "learning_rate": 1.9560280084942267e-06, - "loss": 0.8291, - "step": 14269 - }, - { - "epoch": 0.37, - "learning_rate": 1.9560198930654257e-06, - "loss": 1.0078, - "step": 14270 - }, - { - "epoch": 0.37, - "learning_rate": 1.9560117769046443e-06, - "loss": 1.0977, - "step": 14271 - }, - { - "epoch": 0.37, - "learning_rate": 1.9560036600118887e-06, - "loss": 0.8096, - "step": 14272 - }, - { - "epoch": 0.37, - "learning_rate": 1.955995542387165e-06, - "loss": 1.0498, - "step": 14273 - }, - { - "epoch": 0.37, - "learning_rate": 1.9559874240304793e-06, - "loss": 1.1191, - "step": 14274 - }, - { - "epoch": 0.37, - "learning_rate": 1.9559793049418383e-06, - "loss": 0.8223, - "step": 14275 - }, - { - "epoch": 0.37, - "learning_rate": 1.9559711851212477e-06, - "loss": 1.0518, - "step": 14276 - }, - { - "epoch": 0.37, - "learning_rate": 1.955963064568714e-06, - "loss": 0.8066, - "step": 14277 - }, - { - "epoch": 0.37, - "learning_rate": 1.9559549432842432e-06, - "loss": 1.1152, - "step": 14278 - }, - { - "epoch": 0.37, - "learning_rate": 1.9559468212678417e-06, - "loss": 1.2012, - "step": 14279 - }, - { - "epoch": 0.37, - "learning_rate": 1.955938698519516e-06, - "loss": 0.8359, - "step": 14280 - }, - { - "epoch": 0.37, - "learning_rate": 1.9559305750392717e-06, - "loss": 1.0146, - "step": 14281 - }, - { - "epoch": 0.37, - "learning_rate": 1.955922450827115e-06, - "loss": 0.8643, - "step": 14282 - }, - { - "epoch": 0.37, - "learning_rate": 1.955914325883053e-06, - "loss": 0.8125, - "step": 14283 - }, - { - "epoch": 0.37, - "learning_rate": 1.955906200207091e-06, - "loss": 0.7188, - "step": 14284 - }, - { - "epoch": 0.37, - "learning_rate": 1.955898073799236e-06, - "loss": 1.0225, - "step": 14285 - }, - { - "epoch": 0.37, - "learning_rate": 1.9558899466594934e-06, - "loss": 0.9795, - "step": 14286 - }, - { - "epoch": 0.37, - "learning_rate": 1.95588181878787e-06, - "loss": 0.8965, - "step": 14287 - }, - { - "epoch": 0.37, - "learning_rate": 1.955873690184372e-06, - "loss": 0.7666, - "step": 14288 - }, - { - "epoch": 0.37, - "learning_rate": 1.955865560849005e-06, - "loss": 0.5674, - "step": 14289 - }, - { - "epoch": 0.37, - "learning_rate": 1.955857430781776e-06, - "loss": 0.9609, - "step": 14290 - }, - { - "epoch": 0.37, - "learning_rate": 1.955849299982691e-06, - "loss": 0.9111, - "step": 14291 - }, - { - "epoch": 0.37, - "learning_rate": 1.9558411684517555e-06, - "loss": 0.8975, - "step": 14292 - }, - { - "epoch": 0.37, - "learning_rate": 1.955833036188977e-06, - "loss": 0.6123, - "step": 14293 - }, - { - "epoch": 0.37, - "learning_rate": 1.955824903194361e-06, - "loss": 1.1064, - "step": 14294 - }, - { - "epoch": 0.37, - "learning_rate": 1.955816769467914e-06, - "loss": 1.0312, - "step": 14295 - }, - { - "epoch": 0.37, - "learning_rate": 1.9558086350096414e-06, - "loss": 0.9004, - "step": 14296 - }, - { - "epoch": 0.37, - "learning_rate": 1.9558004998195507e-06, - "loss": 0.7832, - "step": 14297 - }, - { - "epoch": 0.37, - "learning_rate": 1.9557923638976473e-06, - "loss": 0.9287, - "step": 14298 - }, - { - "epoch": 0.37, - "learning_rate": 1.9557842272439375e-06, - "loss": 0.9863, - "step": 14299 - }, - { - "epoch": 0.37, - "learning_rate": 1.955776089858428e-06, - "loss": 0.8843, - "step": 14300 - }, - { - "epoch": 0.37, - "learning_rate": 1.9557679517411245e-06, - "loss": 0.8789, - "step": 14301 - }, - { - "epoch": 0.37, - "learning_rate": 1.955759812892033e-06, - "loss": 0.7363, - "step": 14302 - }, - { - "epoch": 0.37, - "learning_rate": 1.955751673311161e-06, - "loss": 0.8877, - "step": 14303 - }, - { - "epoch": 0.37, - "learning_rate": 1.955743532998513e-06, - "loss": 0.7822, - "step": 14304 - }, - { - "epoch": 0.37, - "learning_rate": 1.955735391954097e-06, - "loss": 0.8804, - "step": 14305 - }, - { - "epoch": 0.37, - "learning_rate": 1.9557272501779177e-06, - "loss": 0.874, - "step": 14306 - }, - { - "epoch": 0.37, - "learning_rate": 1.9557191076699824e-06, - "loss": 0.9736, - "step": 14307 - }, - { - "epoch": 0.37, - "learning_rate": 1.9557109644302967e-06, - "loss": 0.8291, - "step": 14308 - }, - { - "epoch": 0.37, - "learning_rate": 1.9557028204588672e-06, - "loss": 1.2051, - "step": 14309 - }, - { - "epoch": 0.37, - "learning_rate": 1.9556946757557e-06, - "loss": 0.9658, - "step": 14310 - }, - { - "epoch": 0.37, - "learning_rate": 1.9556865303208013e-06, - "loss": 0.8418, - "step": 14311 - }, - { - "epoch": 0.37, - "learning_rate": 1.9556783841541775e-06, - "loss": 0.7126, - "step": 14312 - }, - { - "epoch": 0.37, - "learning_rate": 1.955670237255834e-06, - "loss": 0.9492, - "step": 14313 - }, - { - "epoch": 0.37, - "learning_rate": 1.9556620896257784e-06, - "loss": 0.9736, - "step": 14314 - }, - { - "epoch": 0.37, - "learning_rate": 1.9556539412640162e-06, - "loss": 0.9141, - "step": 14315 - }, - { - "epoch": 0.37, - "learning_rate": 1.955645792170554e-06, - "loss": 0.8857, - "step": 14316 - }, - { - "epoch": 0.37, - "learning_rate": 1.955637642345397e-06, - "loss": 1.0244, - "step": 14317 - }, - { - "epoch": 0.37, - "learning_rate": 1.955629491788553e-06, - "loss": 0.6914, - "step": 14318 - }, - { - "epoch": 0.37, - "learning_rate": 1.955621340500027e-06, - "loss": 0.9043, - "step": 14319 - }, - { - "epoch": 0.37, - "learning_rate": 1.955613188479826e-06, - "loss": 0.9268, - "step": 14320 - }, - { - "epoch": 0.37, - "learning_rate": 1.9556050357279555e-06, - "loss": 1.0908, - "step": 14321 - }, - { - "epoch": 0.37, - "learning_rate": 1.9555968822444222e-06, - "loss": 1.0508, - "step": 14322 - }, - { - "epoch": 0.37, - "learning_rate": 1.9555887280292325e-06, - "loss": 0.7529, - "step": 14323 - }, - { - "epoch": 0.37, - "learning_rate": 1.9555805730823923e-06, - "loss": 0.7192, - "step": 14324 - }, - { - "epoch": 0.37, - "learning_rate": 1.9555724174039083e-06, - "loss": 0.9082, - "step": 14325 - }, - { - "epoch": 0.37, - "learning_rate": 1.955564260993786e-06, - "loss": 0.917, - "step": 14326 - }, - { - "epoch": 0.37, - "learning_rate": 1.955556103852032e-06, - "loss": 0.8389, - "step": 14327 - }, - { - "epoch": 0.37, - "learning_rate": 1.9555479459786533e-06, - "loss": 0.9639, - "step": 14328 - }, - { - "epoch": 0.37, - "learning_rate": 1.955539787373655e-06, - "loss": 0.771, - "step": 14329 - }, - { - "epoch": 0.37, - "learning_rate": 1.955531628037044e-06, - "loss": 1.042, - "step": 14330 - }, - { - "epoch": 0.37, - "learning_rate": 1.955523467968826e-06, - "loss": 1.0176, - "step": 14331 - }, - { - "epoch": 0.37, - "learning_rate": 1.955515307169008e-06, - "loss": 0.7451, - "step": 14332 - }, - { - "epoch": 0.37, - "learning_rate": 1.955507145637596e-06, - "loss": 0.7715, - "step": 14333 - }, - { - "epoch": 0.37, - "learning_rate": 1.955498983374596e-06, - "loss": 0.9932, - "step": 14334 - }, - { - "epoch": 0.37, - "learning_rate": 1.955490820380014e-06, - "loss": 0.7725, - "step": 14335 - }, - { - "epoch": 0.37, - "learning_rate": 1.955482656653857e-06, - "loss": 0.813, - "step": 14336 - }, - { - "epoch": 0.37, - "learning_rate": 1.9554744921961304e-06, - "loss": 0.8457, - "step": 14337 - }, - { - "epoch": 0.37, - "learning_rate": 1.9554663270068416e-06, - "loss": 0.9756, - "step": 14338 - }, - { - "epoch": 0.37, - "learning_rate": 1.9554581610859958e-06, - "loss": 1.0576, - "step": 14339 - }, - { - "epoch": 0.37, - "learning_rate": 1.9554499944336e-06, - "loss": 0.8506, - "step": 14340 - }, - { - "epoch": 0.37, - "learning_rate": 1.955441827049659e-06, - "loss": 0.6606, - "step": 14341 - }, - { - "epoch": 0.37, - "learning_rate": 1.955433658934181e-06, - "loss": 0.8542, - "step": 14342 - }, - { - "epoch": 0.37, - "learning_rate": 1.9554254900871714e-06, - "loss": 0.958, - "step": 14343 - }, - { - "epoch": 0.37, - "learning_rate": 1.955417320508636e-06, - "loss": 0.8428, - "step": 14344 - }, - { - "epoch": 0.37, - "learning_rate": 1.9554091501985817e-06, - "loss": 1.0918, - "step": 14345 - }, - { - "epoch": 0.37, - "learning_rate": 1.955400979157015e-06, - "loss": 1.0273, - "step": 14346 - }, - { - "epoch": 0.37, - "learning_rate": 1.955392807383941e-06, - "loss": 0.8242, - "step": 14347 - }, - { - "epoch": 0.37, - "learning_rate": 1.955384634879367e-06, - "loss": 1.0137, - "step": 14348 - }, - { - "epoch": 0.37, - "learning_rate": 1.9553764616432987e-06, - "loss": 0.8779, - "step": 14349 - }, - { - "epoch": 0.37, - "learning_rate": 1.9553682876757428e-06, - "loss": 0.6497, - "step": 14350 - }, - { - "epoch": 0.37, - "learning_rate": 1.9553601129767053e-06, - "loss": 0.5366, - "step": 14351 - }, - { - "epoch": 0.37, - "learning_rate": 1.9553519375461922e-06, - "loss": 0.9058, - "step": 14352 - }, - { - "epoch": 0.37, - "learning_rate": 1.9553437613842107e-06, - "loss": 0.96, - "step": 14353 - }, - { - "epoch": 0.37, - "learning_rate": 1.955335584490766e-06, - "loss": 0.5698, - "step": 14354 - }, - { - "epoch": 0.37, - "learning_rate": 1.955327406865865e-06, - "loss": 0.8027, - "step": 14355 - }, - { - "epoch": 0.37, - "learning_rate": 1.955319228509513e-06, - "loss": 0.8242, - "step": 14356 - }, - { - "epoch": 0.37, - "learning_rate": 1.9553110494217177e-06, - "loss": 0.9707, - "step": 14357 - }, - { - "epoch": 0.37, - "learning_rate": 1.9553028696024847e-06, - "loss": 1.125, - "step": 14358 - }, - { - "epoch": 0.37, - "learning_rate": 1.9552946890518196e-06, - "loss": 0.8203, - "step": 14359 - }, - { - "epoch": 0.37, - "learning_rate": 1.9552865077697298e-06, - "loss": 0.8662, - "step": 14360 - }, - { - "epoch": 0.37, - "learning_rate": 1.955278325756221e-06, - "loss": 0.7529, - "step": 14361 - }, - { - "epoch": 0.37, - "learning_rate": 1.9552701430112994e-06, - "loss": 1.2188, - "step": 14362 - }, - { - "epoch": 0.37, - "learning_rate": 1.9552619595349715e-06, - "loss": 0.8232, - "step": 14363 - }, - { - "epoch": 0.37, - "learning_rate": 1.955253775327243e-06, - "loss": 0.7241, - "step": 14364 - }, - { - "epoch": 0.37, - "learning_rate": 1.955245590388121e-06, - "loss": 0.7676, - "step": 14365 - }, - { - "epoch": 0.37, - "learning_rate": 1.9552374047176115e-06, - "loss": 0.8555, - "step": 14366 - }, - { - "epoch": 0.37, - "learning_rate": 1.9552292183157203e-06, - "loss": 0.8091, - "step": 14367 - }, - { - "epoch": 0.37, - "learning_rate": 1.9552210311824544e-06, - "loss": 0.7744, - "step": 14368 - }, - { - "epoch": 0.37, - "learning_rate": 1.9552128433178195e-06, - "loss": 0.8369, - "step": 14369 - }, - { - "epoch": 0.37, - "learning_rate": 1.9552046547218217e-06, - "loss": 0.9834, - "step": 14370 - }, - { - "epoch": 0.37, - "learning_rate": 1.955196465394468e-06, - "loss": 0.8496, - "step": 14371 - }, - { - "epoch": 0.37, - "learning_rate": 1.955188275335764e-06, - "loss": 0.7114, - "step": 14372 - }, - { - "epoch": 0.37, - "learning_rate": 1.9551800845457168e-06, - "loss": 0.9912, - "step": 14373 - }, - { - "epoch": 0.37, - "learning_rate": 1.955171893024332e-06, - "loss": 0.7871, - "step": 14374 - }, - { - "epoch": 0.37, - "learning_rate": 1.9551637007716156e-06, - "loss": 0.835, - "step": 14375 - }, - { - "epoch": 0.37, - "learning_rate": 1.955155507787574e-06, - "loss": 0.7983, - "step": 14376 - }, - { - "epoch": 0.37, - "learning_rate": 1.9551473140722147e-06, - "loss": 1.1182, - "step": 14377 - }, - { - "epoch": 0.37, - "learning_rate": 1.955139119625542e-06, - "loss": 0.9448, - "step": 14378 - }, - { - "epoch": 0.37, - "learning_rate": 1.9551309244475642e-06, - "loss": 0.9219, - "step": 14379 - }, - { - "epoch": 0.37, - "learning_rate": 1.955122728538286e-06, - "loss": 1.0879, - "step": 14380 - }, - { - "epoch": 0.37, - "learning_rate": 1.9551145318977143e-06, - "loss": 1.0195, - "step": 14381 - }, - { - "epoch": 0.37, - "learning_rate": 1.9551063345258554e-06, - "loss": 1.0381, - "step": 14382 - }, - { - "epoch": 0.37, - "learning_rate": 1.9550981364227153e-06, - "loss": 0.8159, - "step": 14383 - }, - { - "epoch": 0.37, - "learning_rate": 1.9550899375883008e-06, - "loss": 0.8711, - "step": 14384 - }, - { - "epoch": 0.37, - "learning_rate": 1.9550817380226176e-06, - "loss": 0.7769, - "step": 14385 - }, - { - "epoch": 0.37, - "learning_rate": 1.9550735377256724e-06, - "loss": 0.8691, - "step": 14386 - }, - { - "epoch": 0.37, - "learning_rate": 1.9550653366974712e-06, - "loss": 0.7559, - "step": 14387 - }, - { - "epoch": 0.37, - "learning_rate": 1.9550571349380202e-06, - "loss": 0.6904, - "step": 14388 - }, - { - "epoch": 0.37, - "learning_rate": 1.955048932447326e-06, - "loss": 0.9346, - "step": 14389 - }, - { - "epoch": 0.37, - "learning_rate": 1.955040729225395e-06, - "loss": 1.0654, - "step": 14390 - }, - { - "epoch": 0.37, - "learning_rate": 1.9550325252722335e-06, - "loss": 0.8701, - "step": 14391 - }, - { - "epoch": 0.37, - "learning_rate": 1.955024320587847e-06, - "loss": 0.8496, - "step": 14392 - }, - { - "epoch": 0.37, - "learning_rate": 1.955016115172242e-06, - "loss": 0.9531, - "step": 14393 - }, - { - "epoch": 0.37, - "learning_rate": 1.9550079090254255e-06, - "loss": 0.8203, - "step": 14394 - }, - { - "epoch": 0.37, - "learning_rate": 1.954999702147403e-06, - "loss": 0.7827, - "step": 14395 - }, - { - "epoch": 0.37, - "learning_rate": 1.9549914945381816e-06, - "loss": 0.9365, - "step": 14396 - }, - { - "epoch": 0.37, - "learning_rate": 1.954983286197767e-06, - "loss": 1.0488, - "step": 14397 - }, - { - "epoch": 0.37, - "learning_rate": 1.9549750771261656e-06, - "loss": 0.9766, - "step": 14398 - }, - { - "epoch": 0.37, - "learning_rate": 1.9549668673233833e-06, - "loss": 0.8965, - "step": 14399 - }, - { - "epoch": 0.37, - "learning_rate": 1.9549586567894274e-06, - "loss": 0.665, - "step": 14400 - }, - { - "epoch": 0.37, - "learning_rate": 1.9549504455243033e-06, - "loss": 0.8887, - "step": 14401 - }, - { - "epoch": 0.37, - "learning_rate": 1.954942233528018e-06, - "loss": 1.1357, - "step": 14402 - }, - { - "epoch": 0.37, - "learning_rate": 1.9549340208005764e-06, - "loss": 0.8477, - "step": 14403 - }, - { - "epoch": 0.37, - "learning_rate": 1.9549258073419864e-06, - "loss": 0.7959, - "step": 14404 - }, - { - "epoch": 0.37, - "learning_rate": 1.954917593152253e-06, - "loss": 0.875, - "step": 14405 - }, - { - "epoch": 0.37, - "learning_rate": 1.9549093782313836e-06, - "loss": 1.1475, - "step": 14406 - }, - { - "epoch": 0.37, - "learning_rate": 1.954901162579384e-06, - "loss": 0.8516, - "step": 14407 - }, - { - "epoch": 0.37, - "learning_rate": 1.9548929461962602e-06, - "loss": 0.9268, - "step": 14408 - }, - { - "epoch": 0.37, - "learning_rate": 1.9548847290820196e-06, - "loss": 1.1777, - "step": 14409 - }, - { - "epoch": 0.37, - "learning_rate": 1.9548765112366667e-06, - "loss": 0.627, - "step": 14410 - }, - { - "epoch": 0.37, - "learning_rate": 1.954868292660209e-06, - "loss": 1.0273, - "step": 14411 - }, - { - "epoch": 0.37, - "learning_rate": 1.954860073352653e-06, - "loss": 0.9033, - "step": 14412 - }, - { - "epoch": 0.37, - "learning_rate": 1.9548518533140043e-06, - "loss": 1.1758, - "step": 14413 - }, - { - "epoch": 0.37, - "learning_rate": 1.9548436325442693e-06, - "loss": 0.9248, - "step": 14414 - }, - { - "epoch": 0.37, - "learning_rate": 1.954835411043454e-06, - "loss": 0.7185, - "step": 14415 - }, - { - "epoch": 0.37, - "learning_rate": 1.9548271888115663e-06, - "loss": 0.8652, - "step": 14416 - }, - { - "epoch": 0.37, - "learning_rate": 1.9548189658486105e-06, - "loss": 0.8193, - "step": 14417 - }, - { - "epoch": 0.37, - "learning_rate": 1.954810742154594e-06, - "loss": 0.7275, - "step": 14418 - }, - { - "epoch": 0.37, - "learning_rate": 1.954802517729523e-06, - "loss": 0.9141, - "step": 14419 - }, - { - "epoch": 0.37, - "learning_rate": 1.9547942925734027e-06, - "loss": 1.0273, - "step": 14420 - }, - { - "epoch": 0.37, - "learning_rate": 1.954786066686241e-06, - "loss": 0.6997, - "step": 14421 - }, - { - "epoch": 0.37, - "learning_rate": 1.9547778400680434e-06, - "loss": 0.8115, - "step": 14422 - }, - { - "epoch": 0.37, - "learning_rate": 1.9547696127188165e-06, - "loss": 0.8799, - "step": 14423 - }, - { - "epoch": 0.37, - "learning_rate": 1.9547613846385663e-06, - "loss": 1.0605, - "step": 14424 - }, - { - "epoch": 0.37, - "learning_rate": 1.954753155827299e-06, - "loss": 0.9102, - "step": 14425 - }, - { - "epoch": 0.37, - "learning_rate": 1.9547449262850213e-06, - "loss": 0.7666, - "step": 14426 - }, - { - "epoch": 0.37, - "learning_rate": 1.9547366960117397e-06, - "loss": 0.9775, - "step": 14427 - }, - { - "epoch": 0.37, - "learning_rate": 1.9547284650074593e-06, - "loss": 0.8281, - "step": 14428 - }, - { - "epoch": 0.37, - "learning_rate": 1.954720233272188e-06, - "loss": 0.6035, - "step": 14429 - }, - { - "epoch": 0.37, - "learning_rate": 1.9547120008059307e-06, - "loss": 0.9824, - "step": 14430 - }, - { - "epoch": 0.37, - "learning_rate": 1.9547037676086947e-06, - "loss": 1.0811, - "step": 14431 - }, - { - "epoch": 0.37, - "learning_rate": 1.9546955336804854e-06, - "loss": 1.1816, - "step": 14432 - }, - { - "epoch": 0.37, - "learning_rate": 1.95468729902131e-06, - "loss": 0.8345, - "step": 14433 - }, - { - "epoch": 0.37, - "learning_rate": 1.9546790636311747e-06, - "loss": 0.9177, - "step": 14434 - }, - { - "epoch": 0.37, - "learning_rate": 1.954670827510085e-06, - "loss": 1.0225, - "step": 14435 - }, - { - "epoch": 0.37, - "learning_rate": 1.954662590658048e-06, - "loss": 0.8525, - "step": 14436 - }, - { - "epoch": 0.37, - "learning_rate": 1.95465435307507e-06, - "loss": 0.748, - "step": 14437 - }, - { - "epoch": 0.37, - "learning_rate": 1.954646114761157e-06, - "loss": 0.8779, - "step": 14438 - }, - { - "epoch": 0.37, - "learning_rate": 1.954637875716315e-06, - "loss": 0.9912, - "step": 14439 - }, - { - "epoch": 0.37, - "learning_rate": 1.954629635940551e-06, - "loss": 1.0215, - "step": 14440 - }, - { - "epoch": 0.37, - "learning_rate": 1.9546213954338707e-06, - "loss": 0.6445, - "step": 14441 - }, - { - "epoch": 0.37, - "learning_rate": 1.954613154196281e-06, - "loss": 0.9727, - "step": 14442 - }, - { - "epoch": 0.37, - "learning_rate": 1.954604912227788e-06, - "loss": 0.7471, - "step": 14443 - }, - { - "epoch": 0.37, - "learning_rate": 1.9545966695283973e-06, - "loss": 0.9404, - "step": 14444 - }, - { - "epoch": 0.37, - "learning_rate": 1.954588426098116e-06, - "loss": 0.7568, - "step": 14445 - }, - { - "epoch": 0.37, - "learning_rate": 1.954580181936951e-06, - "loss": 1.0713, - "step": 14446 - }, - { - "epoch": 0.37, - "learning_rate": 1.9545719370449068e-06, - "loss": 0.9893, - "step": 14447 - }, - { - "epoch": 0.37, - "learning_rate": 1.9545636914219914e-06, - "loss": 0.6655, - "step": 14448 - }, - { - "epoch": 0.37, - "learning_rate": 1.9545554450682102e-06, - "loss": 0.7947, - "step": 14449 - }, - { - "epoch": 0.37, - "learning_rate": 1.95454719798357e-06, - "loss": 1.0723, - "step": 14450 - }, - { - "epoch": 0.37, - "learning_rate": 1.954538950168077e-06, - "loss": 0.6992, - "step": 14451 - }, - { - "epoch": 0.37, - "learning_rate": 1.954530701621737e-06, - "loss": 0.8584, - "step": 14452 - }, - { - "epoch": 0.37, - "learning_rate": 1.954522452344557e-06, - "loss": 0.8838, - "step": 14453 - }, - { - "epoch": 0.37, - "learning_rate": 1.954514202336543e-06, - "loss": 0.6987, - "step": 14454 - }, - { - "epoch": 0.37, - "learning_rate": 1.9545059515977014e-06, - "loss": 0.9482, - "step": 14455 - }, - { - "epoch": 0.37, - "learning_rate": 1.954497700128038e-06, - "loss": 0.9902, - "step": 14456 - }, - { - "epoch": 0.37, - "learning_rate": 1.9544894479275604e-06, - "loss": 1.0117, - "step": 14457 - }, - { - "epoch": 0.37, - "learning_rate": 1.9544811949962736e-06, - "loss": 0.9248, - "step": 14458 - }, - { - "epoch": 0.37, - "learning_rate": 1.9544729413341847e-06, - "loss": 0.6807, - "step": 14459 - }, - { - "epoch": 0.37, - "learning_rate": 1.9544646869412993e-06, - "loss": 0.7695, - "step": 14460 - }, - { - "epoch": 0.37, - "learning_rate": 1.954456431817625e-06, - "loss": 0.7764, - "step": 14461 - }, - { - "epoch": 0.37, - "learning_rate": 1.954448175963167e-06, - "loss": 0.7505, - "step": 14462 - }, - { - "epoch": 0.37, - "learning_rate": 1.9544399193779312e-06, - "loss": 0.8984, - "step": 14463 - }, - { - "epoch": 0.37, - "learning_rate": 1.954431662061925e-06, - "loss": 0.8789, - "step": 14464 - }, - { - "epoch": 0.37, - "learning_rate": 1.9544234040151548e-06, - "loss": 0.8584, - "step": 14465 - }, - { - "epoch": 0.37, - "learning_rate": 1.9544151452376263e-06, - "loss": 0.752, - "step": 14466 - }, - { - "epoch": 0.37, - "learning_rate": 1.954406885729346e-06, - "loss": 0.6335, - "step": 14467 - }, - { - "epoch": 0.37, - "learning_rate": 1.95439862549032e-06, - "loss": 0.7612, - "step": 14468 - }, - { - "epoch": 0.37, - "learning_rate": 1.954390364520555e-06, - "loss": 0.835, - "step": 14469 - }, - { - "epoch": 0.37, - "learning_rate": 1.9543821028200574e-06, - "loss": 0.7104, - "step": 14470 - }, - { - "epoch": 0.37, - "learning_rate": 1.954373840388833e-06, - "loss": 0.8828, - "step": 14471 - }, - { - "epoch": 0.37, - "learning_rate": 1.9543655772268886e-06, - "loss": 0.835, - "step": 14472 - }, - { - "epoch": 0.37, - "learning_rate": 1.9543573133342302e-06, - "loss": 0.9336, - "step": 14473 - }, - { - "epoch": 0.37, - "learning_rate": 1.9543490487108645e-06, - "loss": 0.9531, - "step": 14474 - }, - { - "epoch": 0.37, - "learning_rate": 1.9543407833567977e-06, - "loss": 0.7827, - "step": 14475 - }, - { - "epoch": 0.37, - "learning_rate": 1.954332517272036e-06, - "loss": 0.751, - "step": 14476 - }, - { - "epoch": 0.37, - "learning_rate": 1.9543242504565852e-06, - "loss": 0.7568, - "step": 14477 - }, - { - "epoch": 0.37, - "learning_rate": 1.9543159829104527e-06, - "loss": 1.0947, - "step": 14478 - }, - { - "epoch": 0.37, - "learning_rate": 1.954307714633644e-06, - "loss": 0.9258, - "step": 14479 - }, - { - "epoch": 0.37, - "learning_rate": 1.9542994456261662e-06, - "loss": 0.7832, - "step": 14480 - }, - { - "epoch": 0.37, - "learning_rate": 1.954291175888025e-06, - "loss": 1.0, - "step": 14481 - }, - { - "epoch": 0.37, - "learning_rate": 1.9542829054192273e-06, - "loss": 0.9014, - "step": 14482 - }, - { - "epoch": 0.37, - "learning_rate": 1.9542746342197785e-06, - "loss": 0.7715, - "step": 14483 - }, - { - "epoch": 0.37, - "learning_rate": 1.954266362289686e-06, - "loss": 0.9922, - "step": 14484 - }, - { - "epoch": 0.37, - "learning_rate": 1.954258089628955e-06, - "loss": 0.6709, - "step": 14485 - }, - { - "epoch": 0.37, - "learning_rate": 1.954249816237593e-06, - "loss": 0.918, - "step": 14486 - }, - { - "epoch": 0.37, - "learning_rate": 1.954241542115605e-06, - "loss": 0.7173, - "step": 14487 - }, - { - "epoch": 0.37, - "learning_rate": 1.954233267262999e-06, - "loss": 0.708, - "step": 14488 - }, - { - "epoch": 0.37, - "learning_rate": 1.9542249916797803e-06, - "loss": 0.8911, - "step": 14489 - }, - { - "epoch": 0.37, - "learning_rate": 1.954216715365955e-06, - "loss": 0.6816, - "step": 14490 - }, - { - "epoch": 0.37, - "learning_rate": 1.95420843832153e-06, - "loss": 0.957, - "step": 14491 - }, - { - "epoch": 0.37, - "learning_rate": 1.9542001605465116e-06, - "loss": 0.7969, - "step": 14492 - }, - { - "epoch": 0.37, - "learning_rate": 1.954191882040906e-06, - "loss": 0.8848, - "step": 14493 - }, - { - "epoch": 0.37, - "learning_rate": 1.9541836028047197e-06, - "loss": 0.9795, - "step": 14494 - }, - { - "epoch": 0.37, - "learning_rate": 1.9541753228379586e-06, - "loss": 1.0898, - "step": 14495 - }, - { - "epoch": 0.37, - "learning_rate": 1.9541670421406294e-06, - "loss": 0.9521, - "step": 14496 - }, - { - "epoch": 0.37, - "learning_rate": 1.9541587607127386e-06, - "loss": 0.8506, - "step": 14497 - }, - { - "epoch": 0.37, - "learning_rate": 1.9541504785542924e-06, - "loss": 0.9258, - "step": 14498 - }, - { - "epoch": 0.37, - "learning_rate": 1.9541421956652964e-06, - "loss": 0.9346, - "step": 14499 - }, - { - "epoch": 0.37, - "learning_rate": 1.9541339120457582e-06, - "loss": 0.9395, - "step": 14500 - }, - { - "epoch": 0.37, - "learning_rate": 1.9541256276956834e-06, - "loss": 0.7554, - "step": 14501 - }, - { - "epoch": 0.37, - "learning_rate": 1.954117342615078e-06, - "loss": 1.0537, - "step": 14502 - }, - { - "epoch": 0.37, - "learning_rate": 1.9541090568039493e-06, - "loss": 0.7256, - "step": 14503 - }, - { - "epoch": 0.37, - "learning_rate": 1.9541007702623033e-06, - "loss": 0.9824, - "step": 14504 - }, - { - "epoch": 0.37, - "learning_rate": 1.954092482990146e-06, - "loss": 0.8408, - "step": 14505 - }, - { - "epoch": 0.37, - "learning_rate": 1.954084194987484e-06, - "loss": 0.9795, - "step": 14506 - }, - { - "epoch": 0.37, - "learning_rate": 1.9540759062543235e-06, - "loss": 1.1113, - "step": 14507 - }, - { - "epoch": 0.37, - "learning_rate": 1.9540676167906713e-06, - "loss": 1.0049, - "step": 14508 - }, - { - "epoch": 0.37, - "learning_rate": 1.954059326596533e-06, - "loss": 0.8027, - "step": 14509 - }, - { - "epoch": 0.37, - "learning_rate": 1.9540510356719152e-06, - "loss": 1.0322, - "step": 14510 - }, - { - "epoch": 0.37, - "learning_rate": 1.954042744016825e-06, - "loss": 0.9541, - "step": 14511 - }, - { - "epoch": 0.37, - "learning_rate": 1.9540344516312674e-06, - "loss": 0.7871, - "step": 14512 - }, - { - "epoch": 0.37, - "learning_rate": 1.95402615851525e-06, - "loss": 0.8525, - "step": 14513 - }, - { - "epoch": 0.37, - "learning_rate": 1.9540178646687785e-06, - "loss": 0.792, - "step": 14514 - }, - { - "epoch": 0.37, - "learning_rate": 1.9540095700918595e-06, - "loss": 0.7656, - "step": 14515 - }, - { - "epoch": 0.37, - "learning_rate": 1.954001274784499e-06, - "loss": 0.7764, - "step": 14516 - }, - { - "epoch": 0.37, - "learning_rate": 1.9539929787467036e-06, - "loss": 0.9775, - "step": 14517 - }, - { - "epoch": 0.37, - "learning_rate": 1.95398468197848e-06, - "loss": 0.8857, - "step": 14518 - }, - { - "epoch": 0.37, - "learning_rate": 1.9539763844798337e-06, - "loss": 0.9209, - "step": 14519 - }, - { - "epoch": 0.37, - "learning_rate": 1.953968086250772e-06, - "loss": 0.8955, - "step": 14520 - }, - { - "epoch": 0.37, - "learning_rate": 1.9539597872913003e-06, - "loss": 1.084, - "step": 14521 - }, - { - "epoch": 0.37, - "learning_rate": 1.9539514876014257e-06, - "loss": 0.8418, - "step": 14522 - }, - { - "epoch": 0.37, - "learning_rate": 1.9539431871811546e-06, - "loss": 0.9639, - "step": 14523 - }, - { - "epoch": 0.37, - "learning_rate": 1.9539348860304925e-06, - "loss": 0.8096, - "step": 14524 - }, - { - "epoch": 0.37, - "learning_rate": 1.953926584149447e-06, - "loss": 0.7778, - "step": 14525 - }, - { - "epoch": 0.37, - "learning_rate": 1.9539182815380232e-06, - "loss": 0.7881, - "step": 14526 - }, - { - "epoch": 0.37, - "learning_rate": 1.9539099781962283e-06, - "loss": 0.9863, - "step": 14527 - }, - { - "epoch": 0.37, - "learning_rate": 1.9539016741240687e-06, - "loss": 0.9199, - "step": 14528 - }, - { - "epoch": 0.37, - "learning_rate": 1.95389336932155e-06, - "loss": 0.8828, - "step": 14529 - }, - { - "epoch": 0.37, - "learning_rate": 1.953885063788679e-06, - "loss": 0.7876, - "step": 14530 - }, - { - "epoch": 0.37, - "learning_rate": 1.9538767575254623e-06, - "loss": 0.9521, - "step": 14531 - }, - { - "epoch": 0.37, - "learning_rate": 1.953868450531906e-06, - "loss": 1.0488, - "step": 14532 - }, - { - "epoch": 0.37, - "learning_rate": 1.953860142808016e-06, - "loss": 1.0664, - "step": 14533 - }, - { - "epoch": 0.37, - "learning_rate": 1.9538518343537998e-06, - "loss": 0.7295, - "step": 14534 - }, - { - "epoch": 0.37, - "learning_rate": 1.9538435251692627e-06, - "loss": 1.0195, - "step": 14535 - }, - { - "epoch": 0.37, - "learning_rate": 1.9538352152544116e-06, - "loss": 0.8984, - "step": 14536 - }, - { - "epoch": 0.37, - "learning_rate": 1.953826904609253e-06, - "loss": 0.8691, - "step": 14537 - }, - { - "epoch": 0.37, - "learning_rate": 1.9538185932337928e-06, - "loss": 1.0977, - "step": 14538 - }, - { - "epoch": 0.37, - "learning_rate": 1.9538102811280372e-06, - "loss": 0.8174, - "step": 14539 - }, - { - "epoch": 0.37, - "learning_rate": 1.953801968291993e-06, - "loss": 0.916, - "step": 14540 - }, - { - "epoch": 0.37, - "learning_rate": 1.953793654725667e-06, - "loss": 1.0215, - "step": 14541 - }, - { - "epoch": 0.37, - "learning_rate": 1.9537853404290646e-06, - "loss": 0.9443, - "step": 14542 - }, - { - "epoch": 0.37, - "learning_rate": 1.953777025402193e-06, - "loss": 0.8262, - "step": 14543 - }, - { - "epoch": 0.37, - "learning_rate": 1.953768709645058e-06, - "loss": 0.7871, - "step": 14544 - }, - { - "epoch": 0.37, - "learning_rate": 1.9537603931576663e-06, - "loss": 0.7676, - "step": 14545 - }, - { - "epoch": 0.37, - "learning_rate": 1.9537520759400238e-06, - "loss": 0.9883, - "step": 14546 - }, - { - "epoch": 0.37, - "learning_rate": 1.9537437579921376e-06, - "loss": 0.7734, - "step": 14547 - }, - { - "epoch": 0.37, - "learning_rate": 1.9537354393140133e-06, - "loss": 1.0713, - "step": 14548 - }, - { - "epoch": 0.37, - "learning_rate": 1.9537271199056576e-06, - "loss": 1.0107, - "step": 14549 - }, - { - "epoch": 0.37, - "learning_rate": 1.9537187997670774e-06, - "loss": 0.9229, - "step": 14550 - }, - { - "epoch": 0.37, - "learning_rate": 1.9537104788982777e-06, - "loss": 0.8525, - "step": 14551 - }, - { - "epoch": 0.37, - "learning_rate": 1.9537021572992666e-06, - "loss": 1.0752, - "step": 14552 - }, - { - "epoch": 0.37, - "learning_rate": 1.953693834970049e-06, - "loss": 1.0723, - "step": 14553 - }, - { - "epoch": 0.37, - "learning_rate": 1.953685511910632e-06, - "loss": 1.1221, - "step": 14554 - }, - { - "epoch": 0.37, - "learning_rate": 1.9536771881210222e-06, - "loss": 0.9775, - "step": 14555 - }, - { - "epoch": 0.37, - "learning_rate": 1.9536688636012255e-06, - "loss": 0.9229, - "step": 14556 - }, - { - "epoch": 0.37, - "learning_rate": 1.9536605383512483e-06, - "loss": 0.9707, - "step": 14557 - }, - { - "epoch": 0.37, - "learning_rate": 1.953652212371097e-06, - "loss": 0.9561, - "step": 14558 - }, - { - "epoch": 0.37, - "learning_rate": 1.9536438856607785e-06, - "loss": 0.7974, - "step": 14559 - }, - { - "epoch": 0.37, - "learning_rate": 1.9536355582202983e-06, - "loss": 0.6421, - "step": 14560 - }, - { - "epoch": 0.37, - "learning_rate": 1.9536272300496634e-06, - "loss": 0.8662, - "step": 14561 - }, - { - "epoch": 0.37, - "learning_rate": 1.9536189011488797e-06, - "loss": 1.0029, - "step": 14562 - }, - { - "epoch": 0.37, - "learning_rate": 1.953610571517954e-06, - "loss": 0.9658, - "step": 14563 - }, - { - "epoch": 0.37, - "learning_rate": 1.9536022411568927e-06, - "loss": 0.8115, - "step": 14564 - }, - { - "epoch": 0.37, - "learning_rate": 1.9535939100657013e-06, - "loss": 0.8545, - "step": 14565 - }, - { - "epoch": 0.37, - "learning_rate": 1.953585578244388e-06, - "loss": 0.8633, - "step": 14566 - }, - { - "epoch": 0.37, - "learning_rate": 1.9535772456929574e-06, - "loss": 1.0059, - "step": 14567 - }, - { - "epoch": 0.37, - "learning_rate": 1.9535689124114167e-06, - "loss": 1.0078, - "step": 14568 - }, - { - "epoch": 0.37, - "learning_rate": 1.9535605783997718e-06, - "loss": 0.7871, - "step": 14569 - }, - { - "epoch": 0.37, - "learning_rate": 1.9535522436580297e-06, - "loss": 1.0107, - "step": 14570 - }, - { - "epoch": 0.37, - "learning_rate": 1.9535439081861965e-06, - "loss": 0.7949, - "step": 14571 - }, - { - "epoch": 0.37, - "learning_rate": 1.953535571984279e-06, - "loss": 0.875, - "step": 14572 - }, - { - "epoch": 0.37, - "learning_rate": 1.9535272350522825e-06, - "loss": 0.7822, - "step": 14573 - }, - { - "epoch": 0.37, - "learning_rate": 1.9535188973902144e-06, - "loss": 0.877, - "step": 14574 - }, - { - "epoch": 0.37, - "learning_rate": 1.9535105589980805e-06, - "loss": 0.5229, - "step": 14575 - }, - { - "epoch": 0.37, - "learning_rate": 1.9535022198758877e-06, - "loss": 0.6836, - "step": 14576 - }, - { - "epoch": 0.37, - "learning_rate": 1.953493880023642e-06, - "loss": 0.7515, - "step": 14577 - }, - { - "epoch": 0.37, - "learning_rate": 1.9534855394413492e-06, - "loss": 0.9629, - "step": 14578 - }, - { - "epoch": 0.37, - "learning_rate": 1.9534771981290176e-06, - "loss": 0.9023, - "step": 14579 - }, - { - "epoch": 0.37, - "learning_rate": 1.9534688560866516e-06, - "loss": 0.7585, - "step": 14580 - }, - { - "epoch": 0.37, - "learning_rate": 1.9534605133142584e-06, - "loss": 0.7891, - "step": 14581 - }, - { - "epoch": 0.37, - "learning_rate": 1.9534521698118443e-06, - "loss": 0.9336, - "step": 14582 - }, - { - "epoch": 0.37, - "learning_rate": 1.9534438255794157e-06, - "loss": 0.8584, - "step": 14583 - }, - { - "epoch": 0.37, - "learning_rate": 1.9534354806169794e-06, - "loss": 0.8438, - "step": 14584 - }, - { - "epoch": 0.37, - "learning_rate": 1.953427134924541e-06, - "loss": 0.5938, - "step": 14585 - }, - { - "epoch": 0.37, - "learning_rate": 1.9534187885021073e-06, - "loss": 1.0234, - "step": 14586 - }, - { - "epoch": 0.37, - "learning_rate": 1.9534104413496847e-06, - "loss": 0.9648, - "step": 14587 - }, - { - "epoch": 0.37, - "learning_rate": 1.9534020934672794e-06, - "loss": 0.9268, - "step": 14588 - }, - { - "epoch": 0.37, - "learning_rate": 1.9533937448548985e-06, - "loss": 0.7153, - "step": 14589 - }, - { - "epoch": 0.37, - "learning_rate": 1.953385395512547e-06, - "loss": 0.686, - "step": 14590 - }, - { - "epoch": 0.37, - "learning_rate": 1.953377045440233e-06, - "loss": 1.1748, - "step": 14591 - }, - { - "epoch": 0.37, - "learning_rate": 1.9533686946379614e-06, - "loss": 1.1523, - "step": 14592 - }, - { - "epoch": 0.37, - "learning_rate": 1.95336034310574e-06, - "loss": 0.8013, - "step": 14593 - }, - { - "epoch": 0.37, - "learning_rate": 1.9533519908435736e-06, - "loss": 0.9375, - "step": 14594 - }, - { - "epoch": 0.37, - "learning_rate": 1.9533436378514695e-06, - "loss": 0.916, - "step": 14595 - }, - { - "epoch": 0.37, - "learning_rate": 1.9533352841294348e-06, - "loss": 0.8721, - "step": 14596 - }, - { - "epoch": 0.37, - "learning_rate": 1.953326929677474e-06, - "loss": 0.6052, - "step": 14597 - }, - { - "epoch": 0.37, - "learning_rate": 1.9533185744955954e-06, - "loss": 0.9248, - "step": 14598 - }, - { - "epoch": 0.37, - "learning_rate": 1.9533102185838043e-06, - "loss": 0.8787, - "step": 14599 - }, - { - "epoch": 0.37, - "learning_rate": 1.9533018619421076e-06, - "loss": 0.9209, - "step": 14600 - }, - { - "epoch": 0.37, - "learning_rate": 1.953293504570511e-06, - "loss": 0.833, - "step": 14601 - }, - { - "epoch": 0.37, - "learning_rate": 1.953285146469022e-06, - "loss": 0.8564, - "step": 14602 - }, - { - "epoch": 0.37, - "learning_rate": 1.953276787637646e-06, - "loss": 0.834, - "step": 14603 - }, - { - "epoch": 0.37, - "learning_rate": 1.9532684280763903e-06, - "loss": 0.9551, - "step": 14604 - }, - { - "epoch": 0.37, - "learning_rate": 1.95326006778526e-06, - "loss": 0.769, - "step": 14605 - }, - { - "epoch": 0.37, - "learning_rate": 1.953251706764263e-06, - "loss": 0.8682, - "step": 14606 - }, - { - "epoch": 0.37, - "learning_rate": 1.953243345013405e-06, - "loss": 0.873, - "step": 14607 - }, - { - "epoch": 0.37, - "learning_rate": 1.953234982532692e-06, - "loss": 0.8994, - "step": 14608 - }, - { - "epoch": 0.37, - "learning_rate": 1.9532266193221308e-06, - "loss": 0.9102, - "step": 14609 - }, - { - "epoch": 0.37, - "learning_rate": 1.953218255381728e-06, - "loss": 0.8818, - "step": 14610 - }, - { - "epoch": 0.37, - "learning_rate": 1.95320989071149e-06, - "loss": 0.7803, - "step": 14611 - }, - { - "epoch": 0.37, - "learning_rate": 1.953201525311423e-06, - "loss": 0.9482, - "step": 14612 - }, - { - "epoch": 0.37, - "learning_rate": 1.9531931591815328e-06, - "loss": 1.0801, - "step": 14613 - }, - { - "epoch": 0.37, - "learning_rate": 1.953184792321827e-06, - "loss": 0.8633, - "step": 14614 - }, - { - "epoch": 0.37, - "learning_rate": 1.9531764247323115e-06, - "loss": 0.915, - "step": 14615 - }, - { - "epoch": 0.37, - "learning_rate": 1.953168056412992e-06, - "loss": 0.8711, - "step": 14616 - }, - { - "epoch": 0.37, - "learning_rate": 1.9531596873638762e-06, - "loss": 0.7539, - "step": 14617 - }, - { - "epoch": 0.37, - "learning_rate": 1.9531513175849695e-06, - "loss": 0.8477, - "step": 14618 - }, - { - "epoch": 0.37, - "learning_rate": 1.9531429470762787e-06, - "loss": 1.0518, - "step": 14619 - }, - { - "epoch": 0.37, - "learning_rate": 1.95313457583781e-06, - "loss": 0.9302, - "step": 14620 - }, - { - "epoch": 0.37, - "learning_rate": 1.9531262038695707e-06, - "loss": 0.8457, - "step": 14621 - }, - { - "epoch": 0.37, - "learning_rate": 1.953117831171566e-06, - "loss": 0.8325, - "step": 14622 - }, - { - "epoch": 0.37, - "learning_rate": 1.953109457743803e-06, - "loss": 0.8408, - "step": 14623 - }, - { - "epoch": 0.37, - "learning_rate": 1.953101083586287e-06, - "loss": 0.9077, - "step": 14624 - }, - { - "epoch": 0.37, - "learning_rate": 1.9530927086990264e-06, - "loss": 0.7532, - "step": 14625 - }, - { - "epoch": 0.37, - "learning_rate": 1.9530843330820265e-06, - "loss": 0.8037, - "step": 14626 - }, - { - "epoch": 0.37, - "learning_rate": 1.9530759567352932e-06, - "loss": 0.5752, - "step": 14627 - }, - { - "epoch": 0.37, - "learning_rate": 1.953067579658834e-06, - "loss": 0.76, - "step": 14628 - }, - { - "epoch": 0.37, - "learning_rate": 1.9530592018526544e-06, - "loss": 1.0117, - "step": 14629 - }, - { - "epoch": 0.37, - "learning_rate": 1.953050823316761e-06, - "loss": 0.6641, - "step": 14630 - }, - { - "epoch": 0.38, - "learning_rate": 1.953042444051161e-06, - "loss": 1.0098, - "step": 14631 - }, - { - "epoch": 0.38, - "learning_rate": 1.95303406405586e-06, - "loss": 0.7395, - "step": 14632 - }, - { - "epoch": 0.38, - "learning_rate": 1.9530256833308645e-06, - "loss": 0.9111, - "step": 14633 - }, - { - "epoch": 0.38, - "learning_rate": 1.9530173018761808e-06, - "loss": 1.0957, - "step": 14634 - }, - { - "epoch": 0.38, - "learning_rate": 1.953008919691816e-06, - "loss": 0.9629, - "step": 14635 - }, - { - "epoch": 0.38, - "learning_rate": 1.953000536777776e-06, - "loss": 0.9551, - "step": 14636 - }, - { - "epoch": 0.38, - "learning_rate": 1.952992153134067e-06, - "loss": 0.8398, - "step": 14637 - }, - { - "epoch": 0.38, - "learning_rate": 1.9529837687606963e-06, - "loss": 0.9287, - "step": 14638 - }, - { - "epoch": 0.38, - "learning_rate": 1.9529753836576694e-06, - "loss": 1.0889, - "step": 14639 - }, - { - "epoch": 0.38, - "learning_rate": 1.9529669978249934e-06, - "loss": 0.9072, - "step": 14640 - }, - { - "epoch": 0.38, - "learning_rate": 1.952958611262674e-06, - "loss": 0.873, - "step": 14641 - }, - { - "epoch": 0.38, - "learning_rate": 1.952950223970718e-06, - "loss": 0.9863, - "step": 14642 - }, - { - "epoch": 0.38, - "learning_rate": 1.952941835949132e-06, - "loss": 0.7153, - "step": 14643 - }, - { - "epoch": 0.38, - "learning_rate": 1.9529334471979222e-06, - "loss": 0.834, - "step": 14644 - }, - { - "epoch": 0.38, - "learning_rate": 1.952925057717095e-06, - "loss": 0.9277, - "step": 14645 - }, - { - "epoch": 0.38, - "learning_rate": 1.952916667506657e-06, - "loss": 0.9209, - "step": 14646 - }, - { - "epoch": 0.38, - "learning_rate": 1.9529082765666146e-06, - "loss": 0.9434, - "step": 14647 - }, - { - "epoch": 0.38, - "learning_rate": 1.9528998848969744e-06, - "loss": 0.6096, - "step": 14648 - }, - { - "epoch": 0.38, - "learning_rate": 1.952891492497742e-06, - "loss": 0.998, - "step": 14649 - }, - { - "epoch": 0.38, - "learning_rate": 1.9528830993689245e-06, - "loss": 0.665, - "step": 14650 - }, - { - "epoch": 0.38, - "learning_rate": 1.9528747055105284e-06, - "loss": 0.7725, - "step": 14651 - }, - { - "epoch": 0.38, - "learning_rate": 1.95286631092256e-06, - "loss": 0.8193, - "step": 14652 - }, - { - "epoch": 0.38, - "learning_rate": 1.9528579156050253e-06, - "loss": 0.874, - "step": 14653 - }, - { - "epoch": 0.38, - "learning_rate": 1.9528495195579316e-06, - "loss": 0.8906, - "step": 14654 - }, - { - "epoch": 0.38, - "learning_rate": 1.9528411227812846e-06, - "loss": 0.7988, - "step": 14655 - }, - { - "epoch": 0.38, - "learning_rate": 1.952832725275091e-06, - "loss": 0.8223, - "step": 14656 - }, - { - "epoch": 0.38, - "learning_rate": 1.9528243270393574e-06, - "loss": 1.0674, - "step": 14657 - }, - { - "epoch": 0.38, - "learning_rate": 1.9528159280740895e-06, - "loss": 0.7593, - "step": 14658 - }, - { - "epoch": 0.38, - "learning_rate": 1.952807528379295e-06, - "loss": 0.9844, - "step": 14659 - }, - { - "epoch": 0.38, - "learning_rate": 1.952799127954979e-06, - "loss": 0.8418, - "step": 14660 - }, - { - "epoch": 0.38, - "learning_rate": 1.9527907268011485e-06, - "loss": 0.8545, - "step": 14661 - }, - { - "epoch": 0.38, - "learning_rate": 1.95278232491781e-06, - "loss": 0.8066, - "step": 14662 - }, - { - "epoch": 0.38, - "learning_rate": 1.95277392230497e-06, - "loss": 0.8379, - "step": 14663 - }, - { - "epoch": 0.38, - "learning_rate": 1.952765518962635e-06, - "loss": 0.7432, - "step": 14664 - }, - { - "epoch": 0.38, - "learning_rate": 1.9527571148908112e-06, - "loss": 1.0254, - "step": 14665 - }, - { - "epoch": 0.38, - "learning_rate": 1.952748710089505e-06, - "loss": 1.1367, - "step": 14666 - }, - { - "epoch": 0.38, - "learning_rate": 1.952740304558723e-06, - "loss": 1.0166, - "step": 14667 - }, - { - "epoch": 0.38, - "learning_rate": 1.9527318982984714e-06, - "loss": 1.1436, - "step": 14668 - }, - { - "epoch": 0.38, - "learning_rate": 1.9527234913087568e-06, - "loss": 1.1729, - "step": 14669 - }, - { - "epoch": 0.38, - "learning_rate": 1.9527150835895855e-06, - "loss": 0.9453, - "step": 14670 - }, - { - "epoch": 0.38, - "learning_rate": 1.9527066751409646e-06, - "loss": 1.0752, - "step": 14671 - }, - { - "epoch": 0.38, - "learning_rate": 1.9526982659628993e-06, - "loss": 0.9551, - "step": 14672 - }, - { - "epoch": 0.38, - "learning_rate": 1.9526898560553972e-06, - "loss": 0.9805, - "step": 14673 - }, - { - "epoch": 0.38, - "learning_rate": 1.9526814454184642e-06, - "loss": 0.8828, - "step": 14674 - }, - { - "epoch": 0.38, - "learning_rate": 1.9526730340521067e-06, - "loss": 0.9355, - "step": 14675 - }, - { - "epoch": 0.38, - "learning_rate": 1.9526646219563314e-06, - "loss": 1.1162, - "step": 14676 - }, - { - "epoch": 0.38, - "learning_rate": 1.9526562091311447e-06, - "loss": 0.9697, - "step": 14677 - }, - { - "epoch": 0.38, - "learning_rate": 1.9526477955765525e-06, - "loss": 0.9297, - "step": 14678 - }, - { - "epoch": 0.38, - "learning_rate": 1.952639381292562e-06, - "loss": 0.7864, - "step": 14679 - }, - { - "epoch": 0.38, - "learning_rate": 1.952630966279179e-06, - "loss": 0.9941, - "step": 14680 - }, - { - "epoch": 0.38, - "learning_rate": 1.9526225505364107e-06, - "loss": 0.7202, - "step": 14681 - }, - { - "epoch": 0.38, - "learning_rate": 1.952614134064263e-06, - "loss": 0.856, - "step": 14682 - }, - { - "epoch": 0.38, - "learning_rate": 1.9526057168627426e-06, - "loss": 0.9785, - "step": 14683 - }, - { - "epoch": 0.38, - "learning_rate": 1.952597298931856e-06, - "loss": 0.8311, - "step": 14684 - }, - { - "epoch": 0.38, - "learning_rate": 1.9525888802716092e-06, - "loss": 0.8984, - "step": 14685 - }, - { - "epoch": 0.38, - "learning_rate": 1.9525804608820086e-06, - "loss": 0.834, - "step": 14686 - }, - { - "epoch": 0.38, - "learning_rate": 1.9525720407630614e-06, - "loss": 0.821, - "step": 14687 - }, - { - "epoch": 0.38, - "learning_rate": 1.952563619914773e-06, - "loss": 1.0322, - "step": 14688 - }, - { - "epoch": 0.38, - "learning_rate": 1.952555198337151e-06, - "loss": 1.0137, - "step": 14689 - }, - { - "epoch": 0.38, - "learning_rate": 1.952546776030201e-06, - "loss": 0.7893, - "step": 14690 - }, - { - "epoch": 0.38, - "learning_rate": 1.9525383529939298e-06, - "loss": 0.7959, - "step": 14691 - }, - { - "epoch": 0.38, - "learning_rate": 1.9525299292283435e-06, - "loss": 1.0381, - "step": 14692 - }, - { - "epoch": 0.38, - "learning_rate": 1.9525215047334492e-06, - "loss": 0.6711, - "step": 14693 - }, - { - "epoch": 0.38, - "learning_rate": 1.952513079509253e-06, - "loss": 0.8242, - "step": 14694 - }, - { - "epoch": 0.38, - "learning_rate": 1.9525046535557614e-06, - "loss": 0.8848, - "step": 14695 - }, - { - "epoch": 0.38, - "learning_rate": 1.9524962268729805e-06, - "loss": 0.9424, - "step": 14696 - }, - { - "epoch": 0.38, - "learning_rate": 1.952487799460917e-06, - "loss": 0.8662, - "step": 14697 - }, - { - "epoch": 0.38, - "learning_rate": 1.9524793713195777e-06, - "loss": 0.7368, - "step": 14698 - }, - { - "epoch": 0.38, - "learning_rate": 1.9524709424489683e-06, - "loss": 1.0107, - "step": 14699 - }, - { - "epoch": 0.38, - "learning_rate": 1.9524625128490962e-06, - "loss": 0.9004, - "step": 14700 - }, - { - "epoch": 0.38, - "learning_rate": 1.9524540825199673e-06, - "loss": 0.7053, - "step": 14701 - }, - { - "epoch": 0.38, - "learning_rate": 1.952445651461588e-06, - "loss": 0.9121, - "step": 14702 - }, - { - "epoch": 0.38, - "learning_rate": 1.9524372196739644e-06, - "loss": 0.709, - "step": 14703 - }, - { - "epoch": 0.38, - "learning_rate": 1.952428787157104e-06, - "loss": 0.8125, - "step": 14704 - }, - { - "epoch": 0.38, - "learning_rate": 1.9524203539110125e-06, - "loss": 0.833, - "step": 14705 - }, - { - "epoch": 0.38, - "learning_rate": 1.9524119199356964e-06, - "loss": 0.7949, - "step": 14706 - }, - { - "epoch": 0.38, - "learning_rate": 1.9524034852311625e-06, - "loss": 0.9697, - "step": 14707 - }, - { - "epoch": 0.38, - "learning_rate": 1.952395049797417e-06, - "loss": 0.9209, - "step": 14708 - }, - { - "epoch": 0.38, - "learning_rate": 1.9523866136344664e-06, - "loss": 0.832, - "step": 14709 - }, - { - "epoch": 0.38, - "learning_rate": 1.952378176742317e-06, - "loss": 0.8457, - "step": 14710 - }, - { - "epoch": 0.38, - "learning_rate": 1.9523697391209755e-06, - "loss": 1.0225, - "step": 14711 - }, - { - "epoch": 0.38, - "learning_rate": 1.9523613007704484e-06, - "loss": 1.1191, - "step": 14712 - }, - { - "epoch": 0.38, - "learning_rate": 1.952352861690742e-06, - "loss": 0.9268, - "step": 14713 - }, - { - "epoch": 0.38, - "learning_rate": 1.9523444218818625e-06, - "loss": 0.7979, - "step": 14714 - }, - { - "epoch": 0.38, - "learning_rate": 1.952335981343817e-06, - "loss": 1.04, - "step": 14715 - }, - { - "epoch": 0.38, - "learning_rate": 1.952327540076612e-06, - "loss": 0.9814, - "step": 14716 - }, - { - "epoch": 0.38, - "learning_rate": 1.9523190980802525e-06, - "loss": 0.7432, - "step": 14717 - }, - { - "epoch": 0.38, - "learning_rate": 1.952310655354747e-06, - "loss": 0.665, - "step": 14718 - }, - { - "epoch": 0.38, - "learning_rate": 1.9523022119001004e-06, - "loss": 0.8975, - "step": 14719 - }, - { - "epoch": 0.38, - "learning_rate": 1.9522937677163204e-06, - "loss": 0.9707, - "step": 14720 - }, - { - "epoch": 0.38, - "learning_rate": 1.9522853228034123e-06, - "loss": 0.5, - "step": 14721 - }, - { - "epoch": 0.38, - "learning_rate": 1.9522768771613833e-06, - "loss": 0.8643, - "step": 14722 - }, - { - "epoch": 0.38, - "learning_rate": 1.9522684307902398e-06, - "loss": 0.7581, - "step": 14723 - }, - { - "epoch": 0.38, - "learning_rate": 1.952259983689988e-06, - "loss": 0.9209, - "step": 14724 - }, - { - "epoch": 0.38, - "learning_rate": 1.952251535860635e-06, - "loss": 1.0703, - "step": 14725 - }, - { - "epoch": 0.38, - "learning_rate": 1.952243087302186e-06, - "loss": 0.877, - "step": 14726 - }, - { - "epoch": 0.38, - "learning_rate": 1.952234638014649e-06, - "loss": 0.8662, - "step": 14727 - }, - { - "epoch": 0.38, - "learning_rate": 1.9522261879980292e-06, - "loss": 0.9434, - "step": 14728 - }, - { - "epoch": 0.38, - "learning_rate": 1.9522177372523336e-06, - "loss": 0.8174, - "step": 14729 - }, - { - "epoch": 0.38, - "learning_rate": 1.952209285777569e-06, - "loss": 1.0859, - "step": 14730 - }, - { - "epoch": 0.38, - "learning_rate": 1.9522008335737412e-06, - "loss": 0.9893, - "step": 14731 - }, - { - "epoch": 0.38, - "learning_rate": 1.9521923806408575e-06, - "loss": 0.8457, - "step": 14732 - }, - { - "epoch": 0.38, - "learning_rate": 1.9521839269789232e-06, - "loss": 0.8232, - "step": 14733 - }, - { - "epoch": 0.38, - "learning_rate": 1.952175472587946e-06, - "loss": 1.1807, - "step": 14734 - }, - { - "epoch": 0.38, - "learning_rate": 1.9521670174679317e-06, - "loss": 1.0039, - "step": 14735 - }, - { - "epoch": 0.38, - "learning_rate": 1.952158561618887e-06, - "loss": 0.8223, - "step": 14736 - }, - { - "epoch": 0.38, - "learning_rate": 1.952150105040818e-06, - "loss": 0.9385, - "step": 14737 - }, - { - "epoch": 0.38, - "learning_rate": 1.952141647733731e-06, - "loss": 0.8901, - "step": 14738 - }, - { - "epoch": 0.38, - "learning_rate": 1.952133189697634e-06, - "loss": 1.0342, - "step": 14739 - }, - { - "epoch": 0.38, - "learning_rate": 1.9521247309325317e-06, - "loss": 0.8789, - "step": 14740 - }, - { - "epoch": 0.38, - "learning_rate": 1.952116271438431e-06, - "loss": 0.9229, - "step": 14741 - }, - { - "epoch": 0.38, - "learning_rate": 1.9521078112153395e-06, - "loss": 0.8105, - "step": 14742 - }, - { - "epoch": 0.38, - "learning_rate": 1.9520993502632624e-06, - "loss": 0.8901, - "step": 14743 - }, - { - "epoch": 0.38, - "learning_rate": 1.9520908885822063e-06, - "loss": 0.5857, - "step": 14744 - }, - { - "epoch": 0.38, - "learning_rate": 1.9520824261721784e-06, - "loss": 0.792, - "step": 14745 - }, - { - "epoch": 0.38, - "learning_rate": 1.9520739630331846e-06, - "loss": 0.9209, - "step": 14746 - }, - { - "epoch": 0.38, - "learning_rate": 1.952065499165232e-06, - "loss": 0.8027, - "step": 14747 - }, - { - "epoch": 0.38, - "learning_rate": 1.9520570345683258e-06, - "loss": 0.7686, - "step": 14748 - }, - { - "epoch": 0.38, - "learning_rate": 1.9520485692424738e-06, - "loss": 0.7422, - "step": 14749 - }, - { - "epoch": 0.38, - "learning_rate": 1.952040103187682e-06, - "loss": 0.6636, - "step": 14750 - }, - { - "epoch": 0.38, - "learning_rate": 1.952031636403957e-06, - "loss": 0.7358, - "step": 14751 - }, - { - "epoch": 0.38, - "learning_rate": 1.9520231688913043e-06, - "loss": 0.9609, - "step": 14752 - }, - { - "epoch": 0.38, - "learning_rate": 1.952014700649732e-06, - "loss": 0.8301, - "step": 14753 - }, - { - "epoch": 0.38, - "learning_rate": 1.952006231679246e-06, - "loss": 0.8726, - "step": 14754 - }, - { - "epoch": 0.38, - "learning_rate": 1.951997761979852e-06, - "loss": 0.8906, - "step": 14755 - }, - { - "epoch": 0.38, - "learning_rate": 1.9519892915515577e-06, - "loss": 0.5164, - "step": 14756 - }, - { - "epoch": 0.38, - "learning_rate": 1.951980820394369e-06, - "loss": 0.8164, - "step": 14757 - }, - { - "epoch": 0.38, - "learning_rate": 1.9519723485082915e-06, - "loss": 0.8389, - "step": 14758 - }, - { - "epoch": 0.38, - "learning_rate": 1.951963875893333e-06, - "loss": 1.001, - "step": 14759 - }, - { - "epoch": 0.38, - "learning_rate": 1.9519554025495e-06, - "loss": 0.6865, - "step": 14760 - }, - { - "epoch": 0.38, - "learning_rate": 1.9519469284767977e-06, - "loss": 0.9414, - "step": 14761 - }, - { - "epoch": 0.38, - "learning_rate": 1.951938453675234e-06, - "loss": 0.7153, - "step": 14762 - }, - { - "epoch": 0.38, - "learning_rate": 1.9519299781448143e-06, - "loss": 0.8037, - "step": 14763 - }, - { - "epoch": 0.38, - "learning_rate": 1.951921501885546e-06, - "loss": 0.8809, - "step": 14764 - }, - { - "epoch": 0.38, - "learning_rate": 1.9519130248974353e-06, - "loss": 1.0215, - "step": 14765 - }, - { - "epoch": 0.38, - "learning_rate": 1.9519045471804883e-06, - "loss": 0.6323, - "step": 14766 - }, - { - "epoch": 0.38, - "learning_rate": 1.9518960687347118e-06, - "loss": 0.9326, - "step": 14767 - }, - { - "epoch": 0.38, - "learning_rate": 1.951887589560112e-06, - "loss": 0.792, - "step": 14768 - }, - { - "epoch": 0.38, - "learning_rate": 1.951879109656696e-06, - "loss": 1.0996, - "step": 14769 - }, - { - "epoch": 0.38, - "learning_rate": 1.95187062902447e-06, - "loss": 0.9785, - "step": 14770 - }, - { - "epoch": 0.38, - "learning_rate": 1.95186214766344e-06, - "loss": 0.9453, - "step": 14771 - }, - { - "epoch": 0.38, - "learning_rate": 1.951853665573613e-06, - "loss": 0.875, - "step": 14772 - }, - { - "epoch": 0.38, - "learning_rate": 1.951845182754996e-06, - "loss": 0.7202, - "step": 14773 - }, - { - "epoch": 0.38, - "learning_rate": 1.951836699207594e-06, - "loss": 0.8701, - "step": 14774 - }, - { - "epoch": 0.38, - "learning_rate": 1.951828214931415e-06, - "loss": 0.9082, - "step": 14775 - }, - { - "epoch": 0.38, - "learning_rate": 1.9518197299264647e-06, - "loss": 0.9141, - "step": 14776 - }, - { - "epoch": 0.38, - "learning_rate": 1.95181124419275e-06, - "loss": 0.9902, - "step": 14777 - }, - { - "epoch": 0.38, - "learning_rate": 1.9518027577302773e-06, - "loss": 0.7681, - "step": 14778 - }, - { - "epoch": 0.38, - "learning_rate": 1.951794270539053e-06, - "loss": 0.9019, - "step": 14779 - }, - { - "epoch": 0.38, - "learning_rate": 1.9517857826190832e-06, - "loss": 1.0205, - "step": 14780 - }, - { - "epoch": 0.38, - "learning_rate": 1.951777293970375e-06, - "loss": 0.7881, - "step": 14781 - }, - { - "epoch": 0.38, - "learning_rate": 1.951768804592935e-06, - "loss": 0.9238, - "step": 14782 - }, - { - "epoch": 0.38, - "learning_rate": 1.9517603144867686e-06, - "loss": 0.9775, - "step": 14783 - }, - { - "epoch": 0.38, - "learning_rate": 1.9517518236518837e-06, - "loss": 0.7222, - "step": 14784 - }, - { - "epoch": 0.38, - "learning_rate": 1.951743332088286e-06, - "loss": 0.9072, - "step": 14785 - }, - { - "epoch": 0.38, - "learning_rate": 1.9517348397959824e-06, - "loss": 0.8418, - "step": 14786 - }, - { - "epoch": 0.38, - "learning_rate": 1.9517263467749788e-06, - "loss": 0.8965, - "step": 14787 - }, - { - "epoch": 0.38, - "learning_rate": 1.9517178530252824e-06, - "loss": 0.9551, - "step": 14788 - }, - { - "epoch": 0.38, - "learning_rate": 1.9517093585468993e-06, - "loss": 0.9678, - "step": 14789 - }, - { - "epoch": 0.38, - "learning_rate": 1.951700863339836e-06, - "loss": 0.8428, - "step": 14790 - }, - { - "epoch": 0.38, - "learning_rate": 1.9516923674040993e-06, - "loss": 1.0508, - "step": 14791 - }, - { - "epoch": 0.38, - "learning_rate": 1.9516838707396953e-06, - "loss": 1.0459, - "step": 14792 - }, - { - "epoch": 0.38, - "learning_rate": 1.951675373346631e-06, - "loss": 0.9932, - "step": 14793 - }, - { - "epoch": 0.38, - "learning_rate": 1.9516668752249128e-06, - "loss": 0.8828, - "step": 14794 - }, - { - "epoch": 0.38, - "learning_rate": 1.9516583763745466e-06, - "loss": 1.0459, - "step": 14795 - }, - { - "epoch": 0.38, - "learning_rate": 1.9516498767955394e-06, - "loss": 0.7529, - "step": 14796 - }, - { - "epoch": 0.38, - "learning_rate": 1.9516413764878976e-06, - "loss": 0.8496, - "step": 14797 - }, - { - "epoch": 0.38, - "learning_rate": 1.951632875451628e-06, - "loss": 1.0498, - "step": 14798 - }, - { - "epoch": 0.38, - "learning_rate": 1.951624373686737e-06, - "loss": 0.7871, - "step": 14799 - }, - { - "epoch": 0.38, - "learning_rate": 1.9516158711932304e-06, - "loss": 0.7949, - "step": 14800 - }, - { - "epoch": 0.38, - "learning_rate": 1.951607367971116e-06, - "loss": 0.9619, - "step": 14801 - }, - { - "epoch": 0.38, - "learning_rate": 1.951598864020399e-06, - "loss": 1.1123, - "step": 14802 - }, - { - "epoch": 0.38, - "learning_rate": 1.9515903593410866e-06, - "loss": 0.9648, - "step": 14803 - }, - { - "epoch": 0.38, - "learning_rate": 1.9515818539331853e-06, - "loss": 0.9912, - "step": 14804 - }, - { - "epoch": 0.38, - "learning_rate": 1.9515733477967015e-06, - "loss": 1.0244, - "step": 14805 - }, - { - "epoch": 0.38, - "learning_rate": 1.951564840931642e-06, - "loss": 0.9312, - "step": 14806 - }, - { - "epoch": 0.38, - "learning_rate": 1.9515563333380127e-06, - "loss": 1.0938, - "step": 14807 - }, - { - "epoch": 0.38, - "learning_rate": 1.9515478250158205e-06, - "loss": 0.9277, - "step": 14808 - }, - { - "epoch": 0.38, - "learning_rate": 1.9515393159650724e-06, - "loss": 1.0, - "step": 14809 - }, - { - "epoch": 0.38, - "learning_rate": 1.9515308061857734e-06, - "loss": 0.7227, - "step": 14810 - }, - { - "epoch": 0.38, - "learning_rate": 1.9515222956779317e-06, - "loss": 0.6064, - "step": 14811 - }, - { - "epoch": 0.38, - "learning_rate": 1.951513784441553e-06, - "loss": 0.8223, - "step": 14812 - }, - { - "epoch": 0.38, - "learning_rate": 1.9515052724766444e-06, - "loss": 0.7153, - "step": 14813 - }, - { - "epoch": 0.38, - "learning_rate": 1.9514967597832116e-06, - "loss": 0.9102, - "step": 14814 - }, - { - "epoch": 0.38, - "learning_rate": 1.951488246361261e-06, - "loss": 0.647, - "step": 14815 - }, - { - "epoch": 0.38, - "learning_rate": 1.9514797322108003e-06, - "loss": 0.9629, - "step": 14816 - }, - { - "epoch": 0.38, - "learning_rate": 1.951471217331835e-06, - "loss": 0.9834, - "step": 14817 - }, - { - "epoch": 0.38, - "learning_rate": 1.951462701724372e-06, - "loss": 0.7793, - "step": 14818 - }, - { - "epoch": 0.38, - "learning_rate": 1.9514541853884176e-06, - "loss": 0.7998, - "step": 14819 - }, - { - "epoch": 0.38, - "learning_rate": 1.951445668323979e-06, - "loss": 0.7891, - "step": 14820 - }, - { - "epoch": 0.38, - "learning_rate": 1.9514371505310616e-06, - "loss": 0.9492, - "step": 14821 - }, - { - "epoch": 0.38, - "learning_rate": 1.951428632009673e-06, - "loss": 1.0, - "step": 14822 - }, - { - "epoch": 0.38, - "learning_rate": 1.951420112759819e-06, - "loss": 0.7642, - "step": 14823 - }, - { - "epoch": 0.38, - "learning_rate": 1.951411592781506e-06, - "loss": 0.9346, - "step": 14824 - }, - { - "epoch": 0.38, - "learning_rate": 1.951403072074741e-06, - "loss": 1.1318, - "step": 14825 - }, - { - "epoch": 0.38, - "learning_rate": 1.951394550639531e-06, - "loss": 1.0186, - "step": 14826 - }, - { - "epoch": 0.38, - "learning_rate": 1.9513860284758815e-06, - "loss": 0.8477, - "step": 14827 - }, - { - "epoch": 0.38, - "learning_rate": 1.9513775055837993e-06, - "loss": 1.04, - "step": 14828 - }, - { - "epoch": 0.38, - "learning_rate": 1.9513689819632917e-06, - "loss": 0.7764, - "step": 14829 - }, - { - "epoch": 0.38, - "learning_rate": 1.951360457614364e-06, - "loss": 0.8467, - "step": 14830 - }, - { - "epoch": 0.38, - "learning_rate": 1.9513519325370237e-06, - "loss": 0.7661, - "step": 14831 - }, - { - "epoch": 0.38, - "learning_rate": 1.951343406731277e-06, - "loss": 0.9346, - "step": 14832 - }, - { - "epoch": 0.38, - "learning_rate": 1.95133488019713e-06, - "loss": 0.9404, - "step": 14833 - }, - { - "epoch": 0.38, - "learning_rate": 1.95132635293459e-06, - "loss": 1.0391, - "step": 14834 - }, - { - "epoch": 0.38, - "learning_rate": 1.9513178249436634e-06, - "loss": 0.6942, - "step": 14835 - }, - { - "epoch": 0.38, - "learning_rate": 1.951309296224356e-06, - "loss": 0.8413, - "step": 14836 - }, - { - "epoch": 0.38, - "learning_rate": 1.951300766776675e-06, - "loss": 0.835, - "step": 14837 - }, - { - "epoch": 0.38, - "learning_rate": 1.9512922366006265e-06, - "loss": 0.7529, - "step": 14838 - }, - { - "epoch": 0.38, - "learning_rate": 1.951283705696218e-06, - "loss": 0.8643, - "step": 14839 - }, - { - "epoch": 0.38, - "learning_rate": 1.9512751740634544e-06, - "loss": 0.7148, - "step": 14840 - }, - { - "epoch": 0.38, - "learning_rate": 1.9512666417023435e-06, - "loss": 0.7979, - "step": 14841 - }, - { - "epoch": 0.38, - "learning_rate": 1.951258108612892e-06, - "loss": 0.9102, - "step": 14842 - }, - { - "epoch": 0.38, - "learning_rate": 1.951249574795105e-06, - "loss": 0.999, - "step": 14843 - }, - { - "epoch": 0.38, - "learning_rate": 1.9512410402489903e-06, - "loss": 0.9355, - "step": 14844 - }, - { - "epoch": 0.38, - "learning_rate": 1.951232504974554e-06, - "loss": 0.7096, - "step": 14845 - }, - { - "epoch": 0.38, - "learning_rate": 1.951223968971803e-06, - "loss": 0.8291, - "step": 14846 - }, - { - "epoch": 0.38, - "learning_rate": 1.9512154322407434e-06, - "loss": 1.043, - "step": 14847 - }, - { - "epoch": 0.38, - "learning_rate": 1.951206894781382e-06, - "loss": 1.0605, - "step": 14848 - }, - { - "epoch": 0.38, - "learning_rate": 1.951198356593725e-06, - "loss": 0.8154, - "step": 14849 - }, - { - "epoch": 0.38, - "learning_rate": 1.951189817677779e-06, - "loss": 0.7202, - "step": 14850 - }, - { - "epoch": 0.38, - "learning_rate": 1.951181278033551e-06, - "loss": 0.9512, - "step": 14851 - }, - { - "epoch": 0.38, - "learning_rate": 1.9511727376610475e-06, - "loss": 0.9102, - "step": 14852 - }, - { - "epoch": 0.38, - "learning_rate": 1.951164196560274e-06, - "loss": 0.9297, - "step": 14853 - }, - { - "epoch": 0.38, - "learning_rate": 1.9511556547312384e-06, - "loss": 0.9883, - "step": 14854 - }, - { - "epoch": 0.38, - "learning_rate": 1.9511471121739467e-06, - "loss": 1.0127, - "step": 14855 - }, - { - "epoch": 0.38, - "learning_rate": 1.951138568888405e-06, - "loss": 0.5039, - "step": 14856 - }, - { - "epoch": 0.38, - "learning_rate": 1.9511300248746207e-06, - "loss": 0.8369, - "step": 14857 - }, - { - "epoch": 0.38, - "learning_rate": 1.9511214801325994e-06, - "loss": 1.0898, - "step": 14858 - }, - { - "epoch": 0.38, - "learning_rate": 1.9511129346623484e-06, - "loss": 0.7891, - "step": 14859 - }, - { - "epoch": 0.38, - "learning_rate": 1.951104388463874e-06, - "loss": 1.1074, - "step": 14860 - }, - { - "epoch": 0.38, - "learning_rate": 1.9510958415371823e-06, - "loss": 0.8721, - "step": 14861 - }, - { - "epoch": 0.38, - "learning_rate": 1.9510872938822803e-06, - "loss": 0.7822, - "step": 14862 - }, - { - "epoch": 0.38, - "learning_rate": 1.951078745499175e-06, - "loss": 1.0723, - "step": 14863 - }, - { - "epoch": 0.38, - "learning_rate": 1.951070196387872e-06, - "loss": 0.8818, - "step": 14864 - }, - { - "epoch": 0.38, - "learning_rate": 1.9510616465483783e-06, - "loss": 0.7783, - "step": 14865 - }, - { - "epoch": 0.38, - "learning_rate": 1.9510530959807007e-06, - "loss": 1.0938, - "step": 14866 - }, - { - "epoch": 0.38, - "learning_rate": 1.9510445446848455e-06, - "loss": 1.002, - "step": 14867 - }, - { - "epoch": 0.38, - "learning_rate": 1.951035992660819e-06, - "loss": 0.9258, - "step": 14868 - }, - { - "epoch": 0.38, - "learning_rate": 1.951027439908628e-06, - "loss": 0.8535, - "step": 14869 - }, - { - "epoch": 0.38, - "learning_rate": 1.951018886428279e-06, - "loss": 0.9111, - "step": 14870 - }, - { - "epoch": 0.38, - "learning_rate": 1.951010332219778e-06, - "loss": 0.9326, - "step": 14871 - }, - { - "epoch": 0.38, - "learning_rate": 1.9510017772831335e-06, - "loss": 1.04, - "step": 14872 - }, - { - "epoch": 0.38, - "learning_rate": 1.9509932216183496e-06, - "loss": 0.9941, - "step": 14873 - }, - { - "epoch": 0.38, - "learning_rate": 1.9509846652254342e-06, - "loss": 0.8701, - "step": 14874 - }, - { - "epoch": 0.38, - "learning_rate": 1.9509761081043936e-06, - "loss": 0.9043, - "step": 14875 - }, - { - "epoch": 0.38, - "learning_rate": 1.950967550255234e-06, - "loss": 0.9844, - "step": 14876 - }, - { - "epoch": 0.38, - "learning_rate": 1.950958991677963e-06, - "loss": 0.833, - "step": 14877 - }, - { - "epoch": 0.38, - "learning_rate": 1.950950432372586e-06, - "loss": 0.9072, - "step": 14878 - }, - { - "epoch": 0.38, - "learning_rate": 1.95094187233911e-06, - "loss": 1.0713, - "step": 14879 - }, - { - "epoch": 0.38, - "learning_rate": 1.9509333115775414e-06, - "loss": 0.9326, - "step": 14880 - }, - { - "epoch": 0.38, - "learning_rate": 1.950924750087887e-06, - "loss": 1.1201, - "step": 14881 - }, - { - "epoch": 0.38, - "learning_rate": 1.9509161878701533e-06, - "loss": 0.8672, - "step": 14882 - }, - { - "epoch": 0.38, - "learning_rate": 1.9509076249243467e-06, - "loss": 0.7246, - "step": 14883 - }, - { - "epoch": 0.38, - "learning_rate": 1.9508990612504737e-06, - "loss": 1.0107, - "step": 14884 - }, - { - "epoch": 0.38, - "learning_rate": 1.950890496848541e-06, - "loss": 0.8438, - "step": 14885 - }, - { - "epoch": 0.38, - "learning_rate": 1.950881931718556e-06, - "loss": 1.0332, - "step": 14886 - }, - { - "epoch": 0.38, - "learning_rate": 1.9508733658605237e-06, - "loss": 0.9854, - "step": 14887 - }, - { - "epoch": 0.38, - "learning_rate": 1.9508647992744515e-06, - "loss": 0.7495, - "step": 14888 - }, - { - "epoch": 0.38, - "learning_rate": 1.9508562319603456e-06, - "loss": 0.9805, - "step": 14889 - }, - { - "epoch": 0.38, - "learning_rate": 1.950847663918213e-06, - "loss": 1.1348, - "step": 14890 - }, - { - "epoch": 0.38, - "learning_rate": 1.95083909514806e-06, - "loss": 1.0352, - "step": 14891 - }, - { - "epoch": 0.38, - "learning_rate": 1.9508305256498938e-06, - "loss": 1.1123, - "step": 14892 - }, - { - "epoch": 0.38, - "learning_rate": 1.95082195542372e-06, - "loss": 0.8086, - "step": 14893 - }, - { - "epoch": 0.38, - "learning_rate": 1.950813384469545e-06, - "loss": 0.957, - "step": 14894 - }, - { - "epoch": 0.38, - "learning_rate": 1.9508048127873765e-06, - "loss": 0.998, - "step": 14895 - }, - { - "epoch": 0.38, - "learning_rate": 1.9507962403772206e-06, - "loss": 0.8604, - "step": 14896 - }, - { - "epoch": 0.38, - "learning_rate": 1.9507876672390834e-06, - "loss": 0.668, - "step": 14897 - }, - { - "epoch": 0.38, - "learning_rate": 1.950779093372972e-06, - "loss": 0.9404, - "step": 14898 - }, - { - "epoch": 0.38, - "learning_rate": 1.9507705187788926e-06, - "loss": 0.7058, - "step": 14899 - }, - { - "epoch": 0.38, - "learning_rate": 1.950761943456852e-06, - "loss": 0.916, - "step": 14900 - }, - { - "epoch": 0.38, - "learning_rate": 1.9507533674068566e-06, - "loss": 0.916, - "step": 14901 - }, - { - "epoch": 0.38, - "learning_rate": 1.9507447906289134e-06, - "loss": 0.9707, - "step": 14902 - }, - { - "epoch": 0.38, - "learning_rate": 1.950736213123028e-06, - "loss": 0.9092, - "step": 14903 - }, - { - "epoch": 0.38, - "learning_rate": 1.9507276348892083e-06, - "loss": 1.0098, - "step": 14904 - }, - { - "epoch": 0.38, - "learning_rate": 1.9507190559274596e-06, - "loss": 0.6934, - "step": 14905 - }, - { - "epoch": 0.38, - "learning_rate": 1.9507104762377894e-06, - "loss": 0.9697, - "step": 14906 - }, - { - "epoch": 0.38, - "learning_rate": 1.9507018958202036e-06, - "loss": 0.9365, - "step": 14907 - }, - { - "epoch": 0.38, - "learning_rate": 1.9506933146747095e-06, - "loss": 0.9932, - "step": 14908 - }, - { - "epoch": 0.38, - "learning_rate": 1.9506847328013126e-06, - "loss": 0.792, - "step": 14909 - }, - { - "epoch": 0.38, - "learning_rate": 1.950676150200021e-06, - "loss": 1.0039, - "step": 14910 - }, - { - "epoch": 0.38, - "learning_rate": 1.9506675668708398e-06, - "loss": 0.7622, - "step": 14911 - }, - { - "epoch": 0.38, - "learning_rate": 1.950658982813776e-06, - "loss": 0.7446, - "step": 14912 - }, - { - "epoch": 0.38, - "learning_rate": 1.950650398028837e-06, - "loss": 0.854, - "step": 14913 - }, - { - "epoch": 0.38, - "learning_rate": 1.950641812516028e-06, - "loss": 1.0361, - "step": 14914 - }, - { - "epoch": 0.38, - "learning_rate": 1.9506332262753565e-06, - "loss": 0.9287, - "step": 14915 - }, - { - "epoch": 0.38, - "learning_rate": 1.950624639306829e-06, - "loss": 0.7578, - "step": 14916 - }, - { - "epoch": 0.38, - "learning_rate": 1.950616051610452e-06, - "loss": 0.6323, - "step": 14917 - }, - { - "epoch": 0.38, - "learning_rate": 1.9506074631862317e-06, - "loss": 0.9277, - "step": 14918 - }, - { - "epoch": 0.38, - "learning_rate": 1.950598874034175e-06, - "loss": 1.0391, - "step": 14919 - }, - { - "epoch": 0.38, - "learning_rate": 1.9505902841542887e-06, - "loss": 0.8462, - "step": 14920 - }, - { - "epoch": 0.38, - "learning_rate": 1.950581693546579e-06, - "loss": 0.7578, - "step": 14921 - }, - { - "epoch": 0.38, - "learning_rate": 1.9505731022110523e-06, - "loss": 0.8525, - "step": 14922 - }, - { - "epoch": 0.38, - "learning_rate": 1.950564510147716e-06, - "loss": 0.9971, - "step": 14923 - }, - { - "epoch": 0.38, - "learning_rate": 1.950555917356576e-06, - "loss": 0.7471, - "step": 14924 - }, - { - "epoch": 0.38, - "learning_rate": 1.950547323837639e-06, - "loss": 0.9346, - "step": 14925 - }, - { - "epoch": 0.38, - "learning_rate": 1.9505387295909113e-06, - "loss": 0.9111, - "step": 14926 - }, - { - "epoch": 0.38, - "learning_rate": 1.9505301346164003e-06, - "loss": 1.168, - "step": 14927 - }, - { - "epoch": 0.38, - "learning_rate": 1.950521538914112e-06, - "loss": 0.7529, - "step": 14928 - }, - { - "epoch": 0.38, - "learning_rate": 1.9505129424840526e-06, - "loss": 0.9746, - "step": 14929 - }, - { - "epoch": 0.38, - "learning_rate": 1.95050434532623e-06, - "loss": 0.75, - "step": 14930 - }, - { - "epoch": 0.38, - "learning_rate": 1.950495747440649e-06, - "loss": 0.9414, - "step": 14931 - }, - { - "epoch": 0.38, - "learning_rate": 1.9504871488273176e-06, - "loss": 1.0391, - "step": 14932 - }, - { - "epoch": 0.38, - "learning_rate": 1.950478549486242e-06, - "loss": 0.8262, - "step": 14933 - }, - { - "epoch": 0.38, - "learning_rate": 1.950469949417429e-06, - "loss": 0.8516, - "step": 14934 - }, - { - "epoch": 0.38, - "learning_rate": 1.950461348620884e-06, - "loss": 0.8613, - "step": 14935 - }, - { - "epoch": 0.38, - "learning_rate": 1.9504527470966147e-06, - "loss": 0.813, - "step": 14936 - }, - { - "epoch": 0.38, - "learning_rate": 1.9504441448446274e-06, - "loss": 0.9863, - "step": 14937 - }, - { - "epoch": 0.38, - "learning_rate": 1.950435541864929e-06, - "loss": 0.8389, - "step": 14938 - }, - { - "epoch": 0.38, - "learning_rate": 1.9504269381575258e-06, - "loss": 0.8081, - "step": 14939 - }, - { - "epoch": 0.38, - "learning_rate": 1.950418333722424e-06, - "loss": 0.7905, - "step": 14940 - }, - { - "epoch": 0.38, - "learning_rate": 1.950409728559631e-06, - "loss": 0.8086, - "step": 14941 - }, - { - "epoch": 0.38, - "learning_rate": 1.9504011226691527e-06, - "loss": 0.873, - "step": 14942 - }, - { - "epoch": 0.38, - "learning_rate": 1.9503925160509964e-06, - "loss": 1.0518, - "step": 14943 - }, - { - "epoch": 0.38, - "learning_rate": 1.9503839087051677e-06, - "loss": 0.9043, - "step": 14944 - }, - { - "epoch": 0.38, - "learning_rate": 1.950375300631674e-06, - "loss": 0.9844, - "step": 14945 - }, - { - "epoch": 0.38, - "learning_rate": 1.9503666918305217e-06, - "loss": 0.6616, - "step": 14946 - }, - { - "epoch": 0.38, - "learning_rate": 1.9503580823017176e-06, - "loss": 0.7207, - "step": 14947 - }, - { - "epoch": 0.38, - "learning_rate": 1.9503494720452672e-06, - "loss": 0.8428, - "step": 14948 - }, - { - "epoch": 0.38, - "learning_rate": 1.9503408610611783e-06, - "loss": 0.7021, - "step": 14949 - }, - { - "epoch": 0.38, - "learning_rate": 1.9503322493494576e-06, - "loss": 1.0117, - "step": 14950 - }, - { - "epoch": 0.38, - "learning_rate": 1.9503236369101106e-06, - "loss": 0.7461, - "step": 14951 - }, - { - "epoch": 0.38, - "learning_rate": 1.9503150237431445e-06, - "loss": 1.1777, - "step": 14952 - }, - { - "epoch": 0.38, - "learning_rate": 1.950306409848566e-06, - "loss": 0.8135, - "step": 14953 - }, - { - "epoch": 0.38, - "learning_rate": 1.9502977952263818e-06, - "loss": 0.8525, - "step": 14954 - }, - { - "epoch": 0.38, - "learning_rate": 1.9502891798765982e-06, - "loss": 1.0781, - "step": 14955 - }, - { - "epoch": 0.38, - "learning_rate": 1.950280563799222e-06, - "loss": 0.8242, - "step": 14956 - }, - { - "epoch": 0.38, - "learning_rate": 1.950271946994259e-06, - "loss": 0.8447, - "step": 14957 - }, - { - "epoch": 0.38, - "learning_rate": 1.950263329461717e-06, - "loss": 0.7969, - "step": 14958 - }, - { - "epoch": 0.38, - "learning_rate": 1.950254711201602e-06, - "loss": 1.1465, - "step": 14959 - }, - { - "epoch": 0.38, - "learning_rate": 1.9502460922139206e-06, - "loss": 1.001, - "step": 14960 - }, - { - "epoch": 0.38, - "learning_rate": 1.9502374724986796e-06, - "loss": 1.0371, - "step": 14961 - }, - { - "epoch": 0.38, - "learning_rate": 1.950228852055885e-06, - "loss": 0.8096, - "step": 14962 - }, - { - "epoch": 0.38, - "learning_rate": 1.950220230885544e-06, - "loss": 0.8936, - "step": 14963 - }, - { - "epoch": 0.38, - "learning_rate": 1.950211608987664e-06, - "loss": 0.6895, - "step": 14964 - }, - { - "epoch": 0.38, - "learning_rate": 1.9502029863622497e-06, - "loss": 0.6921, - "step": 14965 - }, - { - "epoch": 0.38, - "learning_rate": 1.950194363009309e-06, - "loss": 0.9307, - "step": 14966 - }, - { - "epoch": 0.38, - "learning_rate": 1.9501857389288476e-06, - "loss": 0.8906, - "step": 14967 - }, - { - "epoch": 0.38, - "learning_rate": 1.950177114120873e-06, - "loss": 0.8232, - "step": 14968 - }, - { - "epoch": 0.38, - "learning_rate": 1.9501684885853917e-06, - "loss": 0.7705, - "step": 14969 - }, - { - "epoch": 0.38, - "learning_rate": 1.9501598623224102e-06, - "loss": 0.8774, - "step": 14970 - }, - { - "epoch": 0.38, - "learning_rate": 1.9501512353319346e-06, - "loss": 0.665, - "step": 14971 - }, - { - "epoch": 0.38, - "learning_rate": 1.950142607613972e-06, - "loss": 1.0752, - "step": 14972 - }, - { - "epoch": 0.38, - "learning_rate": 1.950133979168529e-06, - "loss": 0.8125, - "step": 14973 - }, - { - "epoch": 0.38, - "learning_rate": 1.9501253499956124e-06, - "loss": 1.0879, - "step": 14974 - }, - { - "epoch": 0.38, - "learning_rate": 1.950116720095228e-06, - "loss": 0.8892, - "step": 14975 - }, - { - "epoch": 0.38, - "learning_rate": 1.950108089467383e-06, - "loss": 0.9531, - "step": 14976 - }, - { - "epoch": 0.38, - "learning_rate": 1.950099458112084e-06, - "loss": 0.7651, - "step": 14977 - }, - { - "epoch": 0.38, - "learning_rate": 1.9500908260293376e-06, - "loss": 1.1084, - "step": 14978 - }, - { - "epoch": 0.38, - "learning_rate": 1.95008219321915e-06, - "loss": 0.9209, - "step": 14979 - }, - { - "epoch": 0.38, - "learning_rate": 1.9500735596815287e-06, - "loss": 0.8896, - "step": 14980 - }, - { - "epoch": 0.38, - "learning_rate": 1.9500649254164792e-06, - "loss": 0.5532, - "step": 14981 - }, - { - "epoch": 0.38, - "learning_rate": 1.950056290424009e-06, - "loss": 0.7515, - "step": 14982 - }, - { - "epoch": 0.38, - "learning_rate": 1.9500476547041243e-06, - "loss": 0.792, - "step": 14983 - }, - { - "epoch": 0.38, - "learning_rate": 1.9500390182568317e-06, - "loss": 0.8574, - "step": 14984 - }, - { - "epoch": 0.38, - "learning_rate": 1.950030381082138e-06, - "loss": 0.9902, - "step": 14985 - }, - { - "epoch": 0.38, - "learning_rate": 1.9500217431800497e-06, - "loss": 0.7969, - "step": 14986 - }, - { - "epoch": 0.38, - "learning_rate": 1.9500131045505736e-06, - "loss": 1.1299, - "step": 14987 - }, - { - "epoch": 0.38, - "learning_rate": 1.9500044651937164e-06, - "loss": 0.8223, - "step": 14988 - }, - { - "epoch": 0.38, - "learning_rate": 1.949995825109484e-06, - "loss": 0.8398, - "step": 14989 - }, - { - "epoch": 0.38, - "learning_rate": 1.9499871842978833e-06, - "loss": 0.9766, - "step": 14990 - }, - { - "epoch": 0.38, - "learning_rate": 1.9499785427589215e-06, - "loss": 0.8975, - "step": 14991 - }, - { - "epoch": 0.38, - "learning_rate": 1.9499699004926048e-06, - "loss": 0.7871, - "step": 14992 - }, - { - "epoch": 0.38, - "learning_rate": 1.9499612574989396e-06, - "loss": 0.8857, - "step": 14993 - }, - { - "epoch": 0.38, - "learning_rate": 1.9499526137779328e-06, - "loss": 0.6968, - "step": 14994 - }, - { - "epoch": 0.38, - "learning_rate": 1.949943969329591e-06, - "loss": 0.9951, - "step": 14995 - }, - { - "epoch": 0.38, - "learning_rate": 1.949935324153921e-06, - "loss": 0.9111, - "step": 14996 - }, - { - "epoch": 0.38, - "learning_rate": 1.9499266782509286e-06, - "loss": 0.9482, - "step": 14997 - }, - { - "epoch": 0.38, - "learning_rate": 1.949918031620622e-06, - "loss": 0.7896, - "step": 14998 - }, - { - "epoch": 0.38, - "learning_rate": 1.949909384263006e-06, - "loss": 1.0625, - "step": 14999 - }, - { - "epoch": 0.38, - "learning_rate": 1.949900736178088e-06, - "loss": 0.6641, - "step": 15000 - }, - { - "epoch": 0.38, - "learning_rate": 1.9498920873658754e-06, - "loss": 0.7715, - "step": 15001 - }, - { - "epoch": 0.38, - "learning_rate": 1.9498834378263735e-06, - "loss": 0.9194, - "step": 15002 - }, - { - "epoch": 0.38, - "learning_rate": 1.9498747875595896e-06, - "loss": 0.959, - "step": 15003 - }, - { - "epoch": 0.38, - "learning_rate": 1.9498661365655306e-06, - "loss": 0.8848, - "step": 15004 - }, - { - "epoch": 0.38, - "learning_rate": 1.9498574848442027e-06, - "loss": 0.876, - "step": 15005 - }, - { - "epoch": 0.38, - "learning_rate": 1.9498488323956123e-06, - "loss": 0.8379, - "step": 15006 - }, - { - "epoch": 0.38, - "learning_rate": 1.9498401792197666e-06, - "loss": 0.9629, - "step": 15007 - }, - { - "epoch": 0.38, - "learning_rate": 1.949831525316672e-06, - "loss": 0.8789, - "step": 15008 - }, - { - "epoch": 0.38, - "learning_rate": 1.949822870686335e-06, - "loss": 0.96, - "step": 15009 - }, - { - "epoch": 0.38, - "learning_rate": 1.949814215328762e-06, - "loss": 1.0303, - "step": 15010 - }, - { - "epoch": 0.38, - "learning_rate": 1.9498055592439598e-06, - "loss": 1.0127, - "step": 15011 - }, - { - "epoch": 0.38, - "learning_rate": 1.949796902431936e-06, - "loss": 1.04, - "step": 15012 - }, - { - "epoch": 0.38, - "learning_rate": 1.9497882448926957e-06, - "loss": 0.7842, - "step": 15013 - }, - { - "epoch": 0.38, - "learning_rate": 1.9497795866262464e-06, - "loss": 1.0, - "step": 15014 - }, - { - "epoch": 0.38, - "learning_rate": 1.9497709276325947e-06, - "loss": 0.6388, - "step": 15015 - }, - { - "epoch": 0.38, - "learning_rate": 1.9497622679117467e-06, - "loss": 1.0127, - "step": 15016 - }, - { - "epoch": 0.38, - "learning_rate": 1.9497536074637098e-06, - "loss": 0.7578, - "step": 15017 - }, - { - "epoch": 0.38, - "learning_rate": 1.94974494628849e-06, - "loss": 0.834, - "step": 15018 - }, - { - "epoch": 0.38, - "learning_rate": 1.949736284386094e-06, - "loss": 1.0869, - "step": 15019 - }, - { - "epoch": 0.38, - "learning_rate": 1.949727621756529e-06, - "loss": 1.0049, - "step": 15020 - }, - { - "epoch": 0.38, - "learning_rate": 1.949718958399801e-06, - "loss": 0.9844, - "step": 15021 - }, - { - "epoch": 0.39, - "learning_rate": 1.949710294315917e-06, - "loss": 0.8174, - "step": 15022 - }, - { - "epoch": 0.39, - "learning_rate": 1.9497016295048833e-06, - "loss": 1.0859, - "step": 15023 - }, - { - "epoch": 0.39, - "learning_rate": 1.949692963966707e-06, - "loss": 0.9297, - "step": 15024 - }, - { - "epoch": 0.39, - "learning_rate": 1.949684297701394e-06, - "loss": 0.9717, - "step": 15025 - }, - { - "epoch": 0.39, - "learning_rate": 1.949675630708952e-06, - "loss": 0.9932, - "step": 15026 - }, - { - "epoch": 0.39, - "learning_rate": 1.9496669629893865e-06, - "loss": 0.7422, - "step": 15027 - }, - { - "epoch": 0.39, - "learning_rate": 1.9496582945427053e-06, - "loss": 0.8008, - "step": 15028 - }, - { - "epoch": 0.39, - "learning_rate": 1.949649625368914e-06, - "loss": 0.6816, - "step": 15029 - }, - { - "epoch": 0.39, - "learning_rate": 1.949640955468019e-06, - "loss": 1.1562, - "step": 15030 - }, - { - "epoch": 0.39, - "learning_rate": 1.9496322848400286e-06, - "loss": 0.665, - "step": 15031 - }, - { - "epoch": 0.39, - "learning_rate": 1.9496236134849483e-06, - "loss": 0.96, - "step": 15032 - }, - { - "epoch": 0.39, - "learning_rate": 1.9496149414027843e-06, - "loss": 0.752, - "step": 15033 - }, - { - "epoch": 0.39, - "learning_rate": 1.9496062685935446e-06, - "loss": 0.7603, - "step": 15034 - }, - { - "epoch": 0.39, - "learning_rate": 1.9495975950572342e-06, - "loss": 1.0352, - "step": 15035 - }, - { - "epoch": 0.39, - "learning_rate": 1.9495889207938613e-06, - "loss": 0.9043, - "step": 15036 - }, - { - "epoch": 0.39, - "learning_rate": 1.9495802458034312e-06, - "loss": 1.1465, - "step": 15037 - }, - { - "epoch": 0.39, - "learning_rate": 1.9495715700859518e-06, - "loss": 0.9727, - "step": 15038 - }, - { - "epoch": 0.39, - "learning_rate": 1.9495628936414287e-06, - "loss": 0.8008, - "step": 15039 - }, - { - "epoch": 0.39, - "learning_rate": 1.949554216469869e-06, - "loss": 0.8799, - "step": 15040 - }, - { - "epoch": 0.39, - "learning_rate": 1.949545538571279e-06, - "loss": 1.0703, - "step": 15041 - }, - { - "epoch": 0.39, - "learning_rate": 1.9495368599456662e-06, - "loss": 0.8887, - "step": 15042 - }, - { - "epoch": 0.39, - "learning_rate": 1.9495281805930364e-06, - "loss": 0.8223, - "step": 15043 - }, - { - "epoch": 0.39, - "learning_rate": 1.949519500513397e-06, - "loss": 0.8574, - "step": 15044 - }, - { - "epoch": 0.39, - "learning_rate": 1.9495108197067534e-06, - "loss": 1.1406, - "step": 15045 - }, - { - "epoch": 0.39, - "learning_rate": 1.9495021381731137e-06, - "loss": 0.9316, - "step": 15046 - }, - { - "epoch": 0.39, - "learning_rate": 1.9494934559124834e-06, - "loss": 0.9688, - "step": 15047 - }, - { - "epoch": 0.39, - "learning_rate": 1.9494847729248697e-06, - "loss": 0.9404, - "step": 15048 - }, - { - "epoch": 0.39, - "learning_rate": 1.9494760892102794e-06, - "loss": 0.957, - "step": 15049 - }, - { - "epoch": 0.39, - "learning_rate": 1.949467404768719e-06, - "loss": 0.7949, - "step": 15050 - }, - { - "epoch": 0.39, - "learning_rate": 1.9494587196001944e-06, - "loss": 0.8506, - "step": 15051 - }, - { - "epoch": 0.39, - "learning_rate": 1.9494500337047137e-06, - "loss": 0.7251, - "step": 15052 - }, - { - "epoch": 0.39, - "learning_rate": 1.9494413470822826e-06, - "loss": 0.9297, - "step": 15053 - }, - { - "epoch": 0.39, - "learning_rate": 1.9494326597329075e-06, - "loss": 0.9932, - "step": 15054 - }, - { - "epoch": 0.39, - "learning_rate": 1.9494239716565955e-06, - "loss": 0.8994, - "step": 15055 - }, - { - "epoch": 0.39, - "learning_rate": 1.9494152828533536e-06, - "loss": 0.8779, - "step": 15056 - }, - { - "epoch": 0.39, - "learning_rate": 1.949406593323188e-06, - "loss": 0.6516, - "step": 15057 - }, - { - "epoch": 0.39, - "learning_rate": 1.949397903066105e-06, - "loss": 0.9395, - "step": 15058 - }, - { - "epoch": 0.39, - "learning_rate": 1.9493892120821124e-06, - "loss": 0.7803, - "step": 15059 - }, - { - "epoch": 0.39, - "learning_rate": 1.9493805203712156e-06, - "loss": 0.9971, - "step": 15060 - }, - { - "epoch": 0.39, - "learning_rate": 1.9493718279334217e-06, - "loss": 0.9111, - "step": 15061 - }, - { - "epoch": 0.39, - "learning_rate": 1.9493631347687377e-06, - "loss": 0.8701, - "step": 15062 - }, - { - "epoch": 0.39, - "learning_rate": 1.94935444087717e-06, - "loss": 1.1641, - "step": 15063 - }, - { - "epoch": 0.39, - "learning_rate": 1.9493457462587256e-06, - "loss": 0.834, - "step": 15064 - }, - { - "epoch": 0.39, - "learning_rate": 1.9493370509134103e-06, - "loss": 0.9121, - "step": 15065 - }, - { - "epoch": 0.39, - "learning_rate": 1.9493283548412315e-06, - "loss": 0.9409, - "step": 15066 - }, - { - "epoch": 0.39, - "learning_rate": 1.9493196580421954e-06, - "loss": 0.833, - "step": 15067 - }, - { - "epoch": 0.39, - "learning_rate": 1.949310960516309e-06, - "loss": 0.8857, - "step": 15068 - }, - { - "epoch": 0.39, - "learning_rate": 1.949302262263579e-06, - "loss": 0.957, - "step": 15069 - }, - { - "epoch": 0.39, - "learning_rate": 1.9492935632840116e-06, - "loss": 0.9355, - "step": 15070 - }, - { - "epoch": 0.39, - "learning_rate": 1.949284863577614e-06, - "loss": 0.7227, - "step": 15071 - }, - { - "epoch": 0.39, - "learning_rate": 1.9492761631443926e-06, - "loss": 0.9551, - "step": 15072 - }, - { - "epoch": 0.39, - "learning_rate": 1.9492674619843545e-06, - "loss": 0.8242, - "step": 15073 - }, - { - "epoch": 0.39, - "learning_rate": 1.9492587600975054e-06, - "loss": 0.8606, - "step": 15074 - }, - { - "epoch": 0.39, - "learning_rate": 1.9492500574838524e-06, - "loss": 0.7559, - "step": 15075 - }, - { - "epoch": 0.39, - "learning_rate": 1.949241354143403e-06, - "loss": 0.6704, - "step": 15076 - }, - { - "epoch": 0.39, - "learning_rate": 1.9492326500761626e-06, - "loss": 1.0264, - "step": 15077 - }, - { - "epoch": 0.39, - "learning_rate": 1.949223945282138e-06, - "loss": 0.8643, - "step": 15078 - }, - { - "epoch": 0.39, - "learning_rate": 1.949215239761337e-06, - "loss": 0.8291, - "step": 15079 - }, - { - "epoch": 0.39, - "learning_rate": 1.9492065335137655e-06, - "loss": 0.8052, - "step": 15080 - }, - { - "epoch": 0.39, - "learning_rate": 1.94919782653943e-06, - "loss": 0.9727, - "step": 15081 - }, - { - "epoch": 0.39, - "learning_rate": 1.9491891188383373e-06, - "loss": 0.9473, - "step": 15082 - }, - { - "epoch": 0.39, - "learning_rate": 1.949180410410494e-06, - "loss": 1.0566, - "step": 15083 - }, - { - "epoch": 0.39, - "learning_rate": 1.9491717012559073e-06, - "loss": 0.731, - "step": 15084 - }, - { - "epoch": 0.39, - "learning_rate": 1.949162991374583e-06, - "loss": 0.7068, - "step": 15085 - }, - { - "epoch": 0.39, - "learning_rate": 1.9491542807665285e-06, - "loss": 0.8555, - "step": 15086 - }, - { - "epoch": 0.39, - "learning_rate": 1.9491455694317506e-06, - "loss": 1.0195, - "step": 15087 - }, - { - "epoch": 0.39, - "learning_rate": 1.949136857370255e-06, - "loss": 1.0439, - "step": 15088 - }, - { - "epoch": 0.39, - "learning_rate": 1.9491281445820494e-06, - "loss": 0.8008, - "step": 15089 - }, - { - "epoch": 0.39, - "learning_rate": 1.9491194310671396e-06, - "loss": 0.7739, - "step": 15090 - }, - { - "epoch": 0.39, - "learning_rate": 1.9491107168255327e-06, - "loss": 0.7041, - "step": 15091 - }, - { - "epoch": 0.39, - "learning_rate": 1.9491020018572355e-06, - "loss": 0.9131, - "step": 15092 - }, - { - "epoch": 0.39, - "learning_rate": 1.9490932861622548e-06, - "loss": 1.0664, - "step": 15093 - }, - { - "epoch": 0.39, - "learning_rate": 1.949084569740597e-06, - "loss": 0.8086, - "step": 15094 - }, - { - "epoch": 0.39, - "learning_rate": 1.9490758525922685e-06, - "loss": 0.833, - "step": 15095 - }, - { - "epoch": 0.39, - "learning_rate": 1.949067134717276e-06, - "loss": 1.1113, - "step": 15096 - }, - { - "epoch": 0.39, - "learning_rate": 1.949058416115627e-06, - "loss": 0.7432, - "step": 15097 - }, - { - "epoch": 0.39, - "learning_rate": 1.9490496967873275e-06, - "loss": 0.9277, - "step": 15098 - }, - { - "epoch": 0.39, - "learning_rate": 1.949040976732384e-06, - "loss": 0.9102, - "step": 15099 - }, - { - "epoch": 0.39, - "learning_rate": 1.9490322559508035e-06, - "loss": 0.9512, - "step": 15100 - }, - { - "epoch": 0.39, - "learning_rate": 1.949023534442593e-06, - "loss": 0.9932, - "step": 15101 - }, - { - "epoch": 0.39, - "learning_rate": 1.9490148122077584e-06, - "loss": 0.834, - "step": 15102 - }, - { - "epoch": 0.39, - "learning_rate": 1.949006089246307e-06, - "loss": 0.998, - "step": 15103 - }, - { - "epoch": 0.39, - "learning_rate": 1.948997365558245e-06, - "loss": 0.7744, - "step": 15104 - }, - { - "epoch": 0.39, - "learning_rate": 1.94898864114358e-06, - "loss": 0.8975, - "step": 15105 - }, - { - "epoch": 0.39, - "learning_rate": 1.9489799160023174e-06, - "loss": 0.731, - "step": 15106 - }, - { - "epoch": 0.39, - "learning_rate": 1.948971190134465e-06, - "loss": 0.9805, - "step": 15107 - }, - { - "epoch": 0.39, - "learning_rate": 1.9489624635400286e-06, - "loss": 1.043, - "step": 15108 - }, - { - "epoch": 0.39, - "learning_rate": 1.9489537362190154e-06, - "loss": 0.9941, - "step": 15109 - }, - { - "epoch": 0.39, - "learning_rate": 1.948945008171432e-06, - "loss": 0.8662, - "step": 15110 - }, - { - "epoch": 0.39, - "learning_rate": 1.948936279397285e-06, - "loss": 0.8994, - "step": 15111 - }, - { - "epoch": 0.39, - "learning_rate": 1.9489275498965814e-06, - "loss": 0.5786, - "step": 15112 - }, - { - "epoch": 0.39, - "learning_rate": 1.9489188196693274e-06, - "loss": 0.7783, - "step": 15113 - }, - { - "epoch": 0.39, - "learning_rate": 1.9489100887155297e-06, - "loss": 0.9814, - "step": 15114 - }, - { - "epoch": 0.39, - "learning_rate": 1.9489013570351953e-06, - "loss": 0.9238, - "step": 15115 - }, - { - "epoch": 0.39, - "learning_rate": 1.9488926246283308e-06, - "loss": 1.002, - "step": 15116 - }, - { - "epoch": 0.39, - "learning_rate": 1.9488838914949427e-06, - "loss": 1.0039, - "step": 15117 - }, - { - "epoch": 0.39, - "learning_rate": 1.948875157635038e-06, - "loss": 0.8066, - "step": 15118 - }, - { - "epoch": 0.39, - "learning_rate": 1.9488664230486235e-06, - "loss": 0.8621, - "step": 15119 - }, - { - "epoch": 0.39, - "learning_rate": 1.948857687735705e-06, - "loss": 1.1016, - "step": 15120 - }, - { - "epoch": 0.39, - "learning_rate": 1.94884895169629e-06, - "loss": 0.8721, - "step": 15121 - }, - { - "epoch": 0.39, - "learning_rate": 1.9488402149303855e-06, - "loss": 0.9863, - "step": 15122 - }, - { - "epoch": 0.39, - "learning_rate": 1.948831477437997e-06, - "loss": 0.793, - "step": 15123 - }, - { - "epoch": 0.39, - "learning_rate": 1.948822739219132e-06, - "loss": 0.9375, - "step": 15124 - }, - { - "epoch": 0.39, - "learning_rate": 1.9488140002737973e-06, - "loss": 0.6099, - "step": 15125 - }, - { - "epoch": 0.39, - "learning_rate": 1.948805260601999e-06, - "loss": 1.041, - "step": 15126 - }, - { - "epoch": 0.39, - "learning_rate": 1.948796520203745e-06, - "loss": 0.9062, - "step": 15127 - }, - { - "epoch": 0.39, - "learning_rate": 1.94878777907904e-06, - "loss": 1.0107, - "step": 15128 - }, - { - "epoch": 0.39, - "learning_rate": 1.9487790372278925e-06, - "loss": 0.6575, - "step": 15129 - }, - { - "epoch": 0.39, - "learning_rate": 1.948770294650308e-06, - "loss": 0.7402, - "step": 15130 - }, - { - "epoch": 0.39, - "learning_rate": 1.9487615513462944e-06, - "loss": 0.9307, - "step": 15131 - }, - { - "epoch": 0.39, - "learning_rate": 1.9487528073158576e-06, - "loss": 0.6731, - "step": 15132 - }, - { - "epoch": 0.39, - "learning_rate": 1.948744062559004e-06, - "loss": 0.7405, - "step": 15133 - }, - { - "epoch": 0.39, - "learning_rate": 1.9487353170757406e-06, - "loss": 1.0537, - "step": 15134 - }, - { - "epoch": 0.39, - "learning_rate": 1.9487265708660744e-06, - "loss": 1.0332, - "step": 15135 - }, - { - "epoch": 0.39, - "learning_rate": 1.948717823930012e-06, - "loss": 0.9238, - "step": 15136 - }, - { - "epoch": 0.39, - "learning_rate": 1.9487090762675603e-06, - "loss": 0.959, - "step": 15137 - }, - { - "epoch": 0.39, - "learning_rate": 1.948700327878725e-06, - "loss": 0.6528, - "step": 15138 - }, - { - "epoch": 0.39, - "learning_rate": 1.948691578763514e-06, - "loss": 0.7705, - "step": 15139 - }, - { - "epoch": 0.39, - "learning_rate": 1.948682828921933e-06, - "loss": 1.1992, - "step": 15140 - }, - { - "epoch": 0.39, - "learning_rate": 1.9486740783539893e-06, - "loss": 0.8164, - "step": 15141 - }, - { - "epoch": 0.39, - "learning_rate": 1.94866532705969e-06, - "loss": 0.7725, - "step": 15142 - }, - { - "epoch": 0.39, - "learning_rate": 1.948656575039041e-06, - "loss": 0.9355, - "step": 15143 - }, - { - "epoch": 0.39, - "learning_rate": 1.948647822292049e-06, - "loss": 0.8145, - "step": 15144 - }, - { - "epoch": 0.39, - "learning_rate": 1.9486390688187214e-06, - "loss": 0.8252, - "step": 15145 - }, - { - "epoch": 0.39, - "learning_rate": 1.948630314619064e-06, - "loss": 0.8652, - "step": 15146 - }, - { - "epoch": 0.39, - "learning_rate": 1.9486215596930845e-06, - "loss": 0.8032, - "step": 15147 - }, - { - "epoch": 0.39, - "learning_rate": 1.9486128040407886e-06, - "loss": 0.7983, - "step": 15148 - }, - { - "epoch": 0.39, - "learning_rate": 1.9486040476621835e-06, - "loss": 0.8324, - "step": 15149 - }, - { - "epoch": 0.39, - "learning_rate": 1.9485952905572765e-06, - "loss": 0.9443, - "step": 15150 - }, - { - "epoch": 0.39, - "learning_rate": 1.948586532726073e-06, - "loss": 0.8994, - "step": 15151 - }, - { - "epoch": 0.39, - "learning_rate": 1.948577774168581e-06, - "loss": 0.9434, - "step": 15152 - }, - { - "epoch": 0.39, - "learning_rate": 1.9485690148848063e-06, - "loss": 0.877, - "step": 15153 - }, - { - "epoch": 0.39, - "learning_rate": 1.948560254874756e-06, - "loss": 0.9336, - "step": 15154 - }, - { - "epoch": 0.39, - "learning_rate": 1.948551494138437e-06, - "loss": 0.7676, - "step": 15155 - }, - { - "epoch": 0.39, - "learning_rate": 1.9485427326758553e-06, - "loss": 0.8828, - "step": 15156 - }, - { - "epoch": 0.39, - "learning_rate": 1.948533970487018e-06, - "loss": 0.6597, - "step": 15157 - }, - { - "epoch": 0.39, - "learning_rate": 1.948525207571932e-06, - "loss": 0.8828, - "step": 15158 - }, - { - "epoch": 0.39, - "learning_rate": 1.948516443930604e-06, - "loss": 0.7397, - "step": 15159 - }, - { - "epoch": 0.39, - "learning_rate": 1.9485076795630402e-06, - "loss": 0.9746, - "step": 15160 - }, - { - "epoch": 0.39, - "learning_rate": 1.948498914469248e-06, - "loss": 1.1885, - "step": 15161 - }, - { - "epoch": 0.39, - "learning_rate": 1.9484901486492337e-06, - "loss": 0.8066, - "step": 15162 - }, - { - "epoch": 0.39, - "learning_rate": 1.9484813821030044e-06, - "loss": 1.0527, - "step": 15163 - }, - { - "epoch": 0.39, - "learning_rate": 1.9484726148305662e-06, - "loss": 1.1641, - "step": 15164 - }, - { - "epoch": 0.39, - "learning_rate": 1.948463846831926e-06, - "loss": 1.084, - "step": 15165 - }, - { - "epoch": 0.39, - "learning_rate": 1.948455078107091e-06, - "loss": 0.8359, - "step": 15166 - }, - { - "epoch": 0.39, - "learning_rate": 1.9484463086560674e-06, - "loss": 0.999, - "step": 15167 - }, - { - "epoch": 0.39, - "learning_rate": 1.948437538478862e-06, - "loss": 0.7568, - "step": 15168 - }, - { - "epoch": 0.39, - "learning_rate": 1.948428767575482e-06, - "loss": 0.8965, - "step": 15169 - }, - { - "epoch": 0.39, - "learning_rate": 1.948419995945933e-06, - "loss": 1.1582, - "step": 15170 - }, - { - "epoch": 0.39, - "learning_rate": 1.948411223590223e-06, - "loss": 0.7036, - "step": 15171 - }, - { - "epoch": 0.39, - "learning_rate": 1.948402450508358e-06, - "loss": 0.9863, - "step": 15172 - }, - { - "epoch": 0.39, - "learning_rate": 1.948393676700345e-06, - "loss": 0.8691, - "step": 15173 - }, - { - "epoch": 0.39, - "learning_rate": 1.94838490216619e-06, - "loss": 0.7544, - "step": 15174 - }, - { - "epoch": 0.39, - "learning_rate": 1.9483761269059007e-06, - "loss": 0.8584, - "step": 15175 - }, - { - "epoch": 0.39, - "learning_rate": 1.9483673509194833e-06, - "loss": 1.0557, - "step": 15176 - }, - { - "epoch": 0.39, - "learning_rate": 1.9483585742069447e-06, - "loss": 0.9834, - "step": 15177 - }, - { - "epoch": 0.39, - "learning_rate": 1.9483497967682918e-06, - "loss": 0.8203, - "step": 15178 - }, - { - "epoch": 0.39, - "learning_rate": 1.9483410186035304e-06, - "loss": 0.8086, - "step": 15179 - }, - { - "epoch": 0.39, - "learning_rate": 1.9483322397126683e-06, - "loss": 0.7236, - "step": 15180 - }, - { - "epoch": 0.39, - "learning_rate": 1.9483234600957118e-06, - "loss": 0.9043, - "step": 15181 - }, - { - "epoch": 0.39, - "learning_rate": 1.9483146797526676e-06, - "loss": 0.8389, - "step": 15182 - }, - { - "epoch": 0.39, - "learning_rate": 1.9483058986835425e-06, - "loss": 0.9141, - "step": 15183 - }, - { - "epoch": 0.39, - "learning_rate": 1.948297116888343e-06, - "loss": 0.8242, - "step": 15184 - }, - { - "epoch": 0.39, - "learning_rate": 1.9482883343670764e-06, - "loss": 0.9326, - "step": 15185 - }, - { - "epoch": 0.39, - "learning_rate": 1.9482795511197485e-06, - "loss": 0.918, - "step": 15186 - }, - { - "epoch": 0.39, - "learning_rate": 1.948270767146367e-06, - "loss": 0.8887, - "step": 15187 - }, - { - "epoch": 0.39, - "learning_rate": 1.9482619824469378e-06, - "loss": 0.7798, - "step": 15188 - }, - { - "epoch": 0.39, - "learning_rate": 1.9482531970214685e-06, - "loss": 0.6792, - "step": 15189 - }, - { - "epoch": 0.39, - "learning_rate": 1.948244410869965e-06, - "loss": 0.8525, - "step": 15190 - }, - { - "epoch": 0.39, - "learning_rate": 1.948235623992434e-06, - "loss": 1.083, - "step": 15191 - }, - { - "epoch": 0.39, - "learning_rate": 1.9482268363888836e-06, - "loss": 1.0234, - "step": 15192 - }, - { - "epoch": 0.39, - "learning_rate": 1.9482180480593186e-06, - "loss": 1.0264, - "step": 15193 - }, - { - "epoch": 0.39, - "learning_rate": 1.948209259003747e-06, - "loss": 0.9575, - "step": 15194 - }, - { - "epoch": 0.39, - "learning_rate": 1.9482004692221748e-06, - "loss": 0.915, - "step": 15195 - }, - { - "epoch": 0.39, - "learning_rate": 1.9481916787146094e-06, - "loss": 0.9082, - "step": 15196 - }, - { - "epoch": 0.39, - "learning_rate": 1.9481828874810577e-06, - "loss": 0.77, - "step": 15197 - }, - { - "epoch": 0.39, - "learning_rate": 1.948174095521525e-06, - "loss": 0.9883, - "step": 15198 - }, - { - "epoch": 0.39, - "learning_rate": 1.9481653028360198e-06, - "loss": 0.957, - "step": 15199 - }, - { - "epoch": 0.39, - "learning_rate": 1.9481565094245472e-06, - "loss": 0.9111, - "step": 15200 - }, - { - "epoch": 0.39, - "learning_rate": 1.9481477152871154e-06, - "loss": 0.8867, - "step": 15201 - }, - { - "epoch": 0.39, - "learning_rate": 1.9481389204237305e-06, - "loss": 0.9287, - "step": 15202 - }, - { - "epoch": 0.39, - "learning_rate": 1.948130124834399e-06, - "loss": 0.7271, - "step": 15203 - }, - { - "epoch": 0.39, - "learning_rate": 1.948121328519128e-06, - "loss": 0.792, - "step": 15204 - }, - { - "epoch": 0.39, - "learning_rate": 1.9481125314779242e-06, - "loss": 0.8555, - "step": 15205 - }, - { - "epoch": 0.39, - "learning_rate": 1.948103733710794e-06, - "loss": 1.0518, - "step": 15206 - }, - { - "epoch": 0.39, - "learning_rate": 1.948094935217744e-06, - "loss": 0.9053, - "step": 15207 - }, - { - "epoch": 0.39, - "learning_rate": 1.948086135998782e-06, - "loss": 0.7646, - "step": 15208 - }, - { - "epoch": 0.39, - "learning_rate": 1.948077336053914e-06, - "loss": 0.636, - "step": 15209 - }, - { - "epoch": 0.39, - "learning_rate": 1.9480685353831464e-06, - "loss": 1.0479, - "step": 15210 - }, - { - "epoch": 0.39, - "learning_rate": 1.9480597339864863e-06, - "loss": 0.5646, - "step": 15211 - }, - { - "epoch": 0.39, - "learning_rate": 1.948050931863941e-06, - "loss": 0.8662, - "step": 15212 - }, - { - "epoch": 0.39, - "learning_rate": 1.948042129015516e-06, - "loss": 0.7456, - "step": 15213 - }, - { - "epoch": 0.39, - "learning_rate": 1.948033325441219e-06, - "loss": 0.8047, - "step": 15214 - }, - { - "epoch": 0.39, - "learning_rate": 1.9480245211410565e-06, - "loss": 0.6025, - "step": 15215 - }, - { - "epoch": 0.39, - "learning_rate": 1.9480157161150356e-06, - "loss": 0.8203, - "step": 15216 - }, - { - "epoch": 0.39, - "learning_rate": 1.948006910363162e-06, - "loss": 0.833, - "step": 15217 - }, - { - "epoch": 0.39, - "learning_rate": 1.9479981038854436e-06, - "loss": 0.668, - "step": 15218 - }, - { - "epoch": 0.39, - "learning_rate": 1.9479892966818865e-06, - "loss": 0.7578, - "step": 15219 - }, - { - "epoch": 0.39, - "learning_rate": 1.9479804887524975e-06, - "loss": 0.5891, - "step": 15220 - }, - { - "epoch": 0.39, - "learning_rate": 1.947971680097283e-06, - "loss": 0.9697, - "step": 15221 - }, - { - "epoch": 0.39, - "learning_rate": 1.947962870716251e-06, - "loss": 0.6172, - "step": 15222 - }, - { - "epoch": 0.39, - "learning_rate": 1.9479540606094068e-06, - "loss": 0.7588, - "step": 15223 - }, - { - "epoch": 0.39, - "learning_rate": 1.947945249776758e-06, - "loss": 0.771, - "step": 15224 - }, - { - "epoch": 0.39, - "learning_rate": 1.947936438218311e-06, - "loss": 0.6958, - "step": 15225 - }, - { - "epoch": 0.39, - "learning_rate": 1.947927625934073e-06, - "loss": 0.6865, - "step": 15226 - }, - { - "epoch": 0.39, - "learning_rate": 1.9479188129240503e-06, - "loss": 0.9336, - "step": 15227 - }, - { - "epoch": 0.39, - "learning_rate": 1.9479099991882497e-06, - "loss": 0.7871, - "step": 15228 - }, - { - "epoch": 0.39, - "learning_rate": 1.9479011847266777e-06, - "loss": 0.8047, - "step": 15229 - }, - { - "epoch": 0.39, - "learning_rate": 1.9478923695393416e-06, - "loss": 1.0996, - "step": 15230 - }, - { - "epoch": 0.39, - "learning_rate": 1.947883553626248e-06, - "loss": 0.7734, - "step": 15231 - }, - { - "epoch": 0.39, - "learning_rate": 1.947874736987403e-06, - "loss": 0.9102, - "step": 15232 - }, - { - "epoch": 0.39, - "learning_rate": 1.9478659196228146e-06, - "loss": 0.9106, - "step": 15233 - }, - { - "epoch": 0.39, - "learning_rate": 1.9478571015324887e-06, - "loss": 0.9766, - "step": 15234 - }, - { - "epoch": 0.39, - "learning_rate": 1.947848282716432e-06, - "loss": 0.9209, - "step": 15235 - }, - { - "epoch": 0.39, - "learning_rate": 1.9478394631746513e-06, - "loss": 0.9453, - "step": 15236 - }, - { - "epoch": 0.39, - "learning_rate": 1.947830642907154e-06, - "loss": 1.0303, - "step": 15237 - }, - { - "epoch": 0.39, - "learning_rate": 1.947821821913946e-06, - "loss": 1.0635, - "step": 15238 - }, - { - "epoch": 0.39, - "learning_rate": 1.947813000195035e-06, - "loss": 0.7134, - "step": 15239 - }, - { - "epoch": 0.39, - "learning_rate": 1.9478041777504263e-06, - "loss": 0.9717, - "step": 15240 - }, - { - "epoch": 0.39, - "learning_rate": 1.947795354580128e-06, - "loss": 0.7051, - "step": 15241 - }, - { - "epoch": 0.39, - "learning_rate": 1.9477865306841462e-06, - "loss": 0.958, - "step": 15242 - }, - { - "epoch": 0.39, - "learning_rate": 1.9477777060624878e-06, - "loss": 1.0254, - "step": 15243 - }, - { - "epoch": 0.39, - "learning_rate": 1.9477688807151596e-06, - "loss": 0.9062, - "step": 15244 - }, - { - "epoch": 0.39, - "learning_rate": 1.9477600546421682e-06, - "loss": 0.6465, - "step": 15245 - }, - { - "epoch": 0.39, - "learning_rate": 1.947751227843521e-06, - "loss": 1.2373, - "step": 15246 - }, - { - "epoch": 0.39, - "learning_rate": 1.947742400319224e-06, - "loss": 0.9512, - "step": 15247 - }, - { - "epoch": 0.39, - "learning_rate": 1.947733572069284e-06, - "loss": 0.7734, - "step": 15248 - }, - { - "epoch": 0.39, - "learning_rate": 1.947724743093708e-06, - "loss": 0.8113, - "step": 15249 - }, - { - "epoch": 0.39, - "learning_rate": 1.9477159133925032e-06, - "loss": 0.8418, - "step": 15250 - }, - { - "epoch": 0.39, - "learning_rate": 1.947707082965676e-06, - "loss": 0.8418, - "step": 15251 - }, - { - "epoch": 0.39, - "learning_rate": 1.9476982518132326e-06, - "loss": 0.8215, - "step": 15252 - }, - { - "epoch": 0.39, - "learning_rate": 1.94768941993518e-06, - "loss": 0.6362, - "step": 15253 - }, - { - "epoch": 0.39, - "learning_rate": 1.9476805873315257e-06, - "loss": 0.9248, - "step": 15254 - }, - { - "epoch": 0.39, - "learning_rate": 1.947671754002276e-06, - "loss": 0.7959, - "step": 15255 - }, - { - "epoch": 0.39, - "learning_rate": 1.947662919947437e-06, - "loss": 0.7656, - "step": 15256 - }, - { - "epoch": 0.39, - "learning_rate": 1.9476540851670165e-06, - "loss": 0.8789, - "step": 15257 - }, - { - "epoch": 0.39, - "learning_rate": 1.947645249661021e-06, - "loss": 0.9971, - "step": 15258 - }, - { - "epoch": 0.39, - "learning_rate": 1.9476364134294568e-06, - "loss": 0.7402, - "step": 15259 - }, - { - "epoch": 0.39, - "learning_rate": 1.9476275764723313e-06, - "loss": 0.9089, - "step": 15260 - }, - { - "epoch": 0.39, - "learning_rate": 1.9476187387896505e-06, - "loss": 0.9346, - "step": 15261 - }, - { - "epoch": 0.39, - "learning_rate": 1.947609900381422e-06, - "loss": 1.1113, - "step": 15262 - }, - { - "epoch": 0.39, - "learning_rate": 1.947601061247652e-06, - "loss": 1.0674, - "step": 15263 - }, - { - "epoch": 0.39, - "learning_rate": 1.9475922213883475e-06, - "loss": 0.9199, - "step": 15264 - }, - { - "epoch": 0.39, - "learning_rate": 1.947583380803515e-06, - "loss": 0.9014, - "step": 15265 - }, - { - "epoch": 0.39, - "learning_rate": 1.947574539493162e-06, - "loss": 0.8799, - "step": 15266 - }, - { - "epoch": 0.39, - "learning_rate": 1.9475656974572942e-06, - "loss": 0.8262, - "step": 15267 - }, - { - "epoch": 0.39, - "learning_rate": 1.947556854695919e-06, - "loss": 0.4395, - "step": 15268 - }, - { - "epoch": 0.39, - "learning_rate": 1.9475480112090433e-06, - "loss": 0.8535, - "step": 15269 - }, - { - "epoch": 0.39, - "learning_rate": 1.9475391669966736e-06, - "loss": 0.6367, - "step": 15270 - }, - { - "epoch": 0.39, - "learning_rate": 1.9475303220588164e-06, - "loss": 0.7363, - "step": 15271 - }, - { - "epoch": 0.39, - "learning_rate": 1.9475214763954792e-06, - "loss": 0.8682, - "step": 15272 - }, - { - "epoch": 0.39, - "learning_rate": 1.947512630006668e-06, - "loss": 0.8252, - "step": 15273 - }, - { - "epoch": 0.39, - "learning_rate": 1.9475037828923902e-06, - "loss": 0.9766, - "step": 15274 - }, - { - "epoch": 0.39, - "learning_rate": 1.9474949350526523e-06, - "loss": 1.0195, - "step": 15275 - }, - { - "epoch": 0.39, - "learning_rate": 1.9474860864874612e-06, - "loss": 1.0889, - "step": 15276 - }, - { - "epoch": 0.39, - "learning_rate": 1.9474772371968237e-06, - "loss": 0.7812, - "step": 15277 - }, - { - "epoch": 0.39, - "learning_rate": 1.947468387180746e-06, - "loss": 0.7632, - "step": 15278 - }, - { - "epoch": 0.39, - "learning_rate": 1.9474595364392355e-06, - "loss": 0.9746, - "step": 15279 - }, - { - "epoch": 0.39, - "learning_rate": 1.9474506849722988e-06, - "loss": 0.9404, - "step": 15280 - }, - { - "epoch": 0.39, - "learning_rate": 1.9474418327799428e-06, - "loss": 0.9873, - "step": 15281 - }, - { - "epoch": 0.39, - "learning_rate": 1.947432979862174e-06, - "loss": 0.9785, - "step": 15282 - }, - { - "epoch": 0.39, - "learning_rate": 1.9474241262189994e-06, - "loss": 0.8325, - "step": 15283 - }, - { - "epoch": 0.39, - "learning_rate": 1.947415271850426e-06, - "loss": 1.2422, - "step": 15284 - }, - { - "epoch": 0.39, - "learning_rate": 1.9474064167564595e-06, - "loss": 0.8052, - "step": 15285 - }, - { - "epoch": 0.39, - "learning_rate": 1.9473975609371084e-06, - "loss": 0.9395, - "step": 15286 - }, - { - "epoch": 0.39, - "learning_rate": 1.9473887043923777e-06, - "loss": 0.7393, - "step": 15287 - }, - { - "epoch": 0.39, - "learning_rate": 1.9473798471222756e-06, - "loss": 0.9014, - "step": 15288 - }, - { - "epoch": 0.39, - "learning_rate": 1.9473709891268083e-06, - "loss": 0.8174, - "step": 15289 - }, - { - "epoch": 0.39, - "learning_rate": 1.9473621304059823e-06, - "loss": 0.7212, - "step": 15290 - }, - { - "epoch": 0.39, - "learning_rate": 1.9473532709598047e-06, - "loss": 0.792, - "step": 15291 - }, - { - "epoch": 0.39, - "learning_rate": 1.9473444107882827e-06, - "loss": 0.8262, - "step": 15292 - }, - { - "epoch": 0.39, - "learning_rate": 1.947335549891422e-06, - "loss": 0.9199, - "step": 15293 - }, - { - "epoch": 0.39, - "learning_rate": 1.9473266882692305e-06, - "loss": 0.9736, - "step": 15294 - }, - { - "epoch": 0.39, - "learning_rate": 1.9473178259217143e-06, - "loss": 0.7554, - "step": 15295 - }, - { - "epoch": 0.39, - "learning_rate": 1.9473089628488804e-06, - "loss": 0.7949, - "step": 15296 - }, - { - "epoch": 0.39, - "learning_rate": 1.9473000990507356e-06, - "loss": 0.7256, - "step": 15297 - }, - { - "epoch": 0.39, - "learning_rate": 1.947291234527287e-06, - "loss": 1.0098, - "step": 15298 - }, - { - "epoch": 0.39, - "learning_rate": 1.947282369278541e-06, - "loss": 0.9609, - "step": 15299 - }, - { - "epoch": 0.39, - "learning_rate": 1.947273503304504e-06, - "loss": 0.8018, - "step": 15300 - }, - { - "epoch": 0.39, - "learning_rate": 1.9472646366051835e-06, - "loss": 0.9434, - "step": 15301 - }, - { - "epoch": 0.39, - "learning_rate": 1.947255769180586e-06, - "loss": 0.9072, - "step": 15302 - }, - { - "epoch": 0.39, - "learning_rate": 1.947246901030718e-06, - "loss": 0.9561, - "step": 15303 - }, - { - "epoch": 0.39, - "learning_rate": 1.9472380321555873e-06, - "loss": 0.7139, - "step": 15304 - }, - { - "epoch": 0.39, - "learning_rate": 1.9472291625551995e-06, - "loss": 0.6367, - "step": 15305 - }, - { - "epoch": 0.39, - "learning_rate": 1.947220292229562e-06, - "loss": 0.8311, - "step": 15306 - }, - { - "epoch": 0.39, - "learning_rate": 1.9472114211786816e-06, - "loss": 0.7368, - "step": 15307 - }, - { - "epoch": 0.39, - "learning_rate": 1.9472025494025647e-06, - "loss": 0.8359, - "step": 15308 - }, - { - "epoch": 0.39, - "learning_rate": 1.9471936769012186e-06, - "loss": 0.8164, - "step": 15309 - }, - { - "epoch": 0.39, - "learning_rate": 1.9471848036746497e-06, - "loss": 0.7393, - "step": 15310 - }, - { - "epoch": 0.39, - "learning_rate": 1.947175929722865e-06, - "loss": 0.9766, - "step": 15311 - }, - { - "epoch": 0.39, - "learning_rate": 1.9471670550458713e-06, - "loss": 0.7329, - "step": 15312 - }, - { - "epoch": 0.39, - "learning_rate": 1.9471581796436754e-06, - "loss": 0.9717, - "step": 15313 - }, - { - "epoch": 0.39, - "learning_rate": 1.9471493035162837e-06, - "loss": 0.8042, - "step": 15314 - }, - { - "epoch": 0.39, - "learning_rate": 1.9471404266637035e-06, - "loss": 0.7202, - "step": 15315 - }, - { - "epoch": 0.39, - "learning_rate": 1.9471315490859416e-06, - "loss": 0.9863, - "step": 15316 - }, - { - "epoch": 0.39, - "learning_rate": 1.9471226707830043e-06, - "loss": 0.8477, - "step": 15317 - }, - { - "epoch": 0.39, - "learning_rate": 1.947113791754899e-06, - "loss": 0.7087, - "step": 15318 - }, - { - "epoch": 0.39, - "learning_rate": 1.9471049120016322e-06, - "loss": 0.9346, - "step": 15319 - }, - { - "epoch": 0.39, - "learning_rate": 1.9470960315232106e-06, - "loss": 0.876, - "step": 15320 - }, - { - "epoch": 0.39, - "learning_rate": 1.947087150319641e-06, - "loss": 0.9688, - "step": 15321 - }, - { - "epoch": 0.39, - "learning_rate": 1.947078268390931e-06, - "loss": 0.8535, - "step": 15322 - }, - { - "epoch": 0.39, - "learning_rate": 1.947069385737086e-06, - "loss": 0.7881, - "step": 15323 - }, - { - "epoch": 0.39, - "learning_rate": 1.9470605023581137e-06, - "loss": 0.6729, - "step": 15324 - }, - { - "epoch": 0.39, - "learning_rate": 1.947051618254021e-06, - "loss": 0.7822, - "step": 15325 - }, - { - "epoch": 0.39, - "learning_rate": 1.9470427334248138e-06, - "loss": 1.0996, - "step": 15326 - }, - { - "epoch": 0.39, - "learning_rate": 1.9470338478705002e-06, - "loss": 0.7212, - "step": 15327 - }, - { - "epoch": 0.39, - "learning_rate": 1.947024961591086e-06, - "loss": 1.0645, - "step": 15328 - }, - { - "epoch": 0.39, - "learning_rate": 1.947016074586578e-06, - "loss": 0.7808, - "step": 15329 - }, - { - "epoch": 0.39, - "learning_rate": 1.947007186856984e-06, - "loss": 0.873, - "step": 15330 - }, - { - "epoch": 0.39, - "learning_rate": 1.94699829840231e-06, - "loss": 0.9336, - "step": 15331 - }, - { - "epoch": 0.39, - "learning_rate": 1.9469894092225623e-06, - "loss": 0.8359, - "step": 15332 - }, - { - "epoch": 0.39, - "learning_rate": 1.946980519317749e-06, - "loss": 0.8799, - "step": 15333 - }, - { - "epoch": 0.39, - "learning_rate": 1.946971628687876e-06, - "loss": 0.8525, - "step": 15334 - }, - { - "epoch": 0.39, - "learning_rate": 1.946962737332951e-06, - "loss": 0.9736, - "step": 15335 - }, - { - "epoch": 0.39, - "learning_rate": 1.9469538452529794e-06, - "loss": 0.9736, - "step": 15336 - }, - { - "epoch": 0.39, - "learning_rate": 1.946944952447969e-06, - "loss": 0.6934, - "step": 15337 - }, - { - "epoch": 0.39, - "learning_rate": 1.9469360589179263e-06, - "loss": 1.0762, - "step": 15338 - }, - { - "epoch": 0.39, - "learning_rate": 1.9469271646628586e-06, - "loss": 0.8799, - "step": 15339 - }, - { - "epoch": 0.39, - "learning_rate": 1.9469182696827717e-06, - "loss": 0.9922, - "step": 15340 - }, - { - "epoch": 0.39, - "learning_rate": 1.9469093739776733e-06, - "loss": 0.8105, - "step": 15341 - }, - { - "epoch": 0.39, - "learning_rate": 1.9469004775475703e-06, - "loss": 0.8477, - "step": 15342 - }, - { - "epoch": 0.39, - "learning_rate": 1.946891580392469e-06, - "loss": 0.8018, - "step": 15343 - }, - { - "epoch": 0.39, - "learning_rate": 1.9468826825123758e-06, - "loss": 1.0713, - "step": 15344 - }, - { - "epoch": 0.39, - "learning_rate": 1.9468737839072983e-06, - "loss": 0.8926, - "step": 15345 - }, - { - "epoch": 0.39, - "learning_rate": 1.9468648845772433e-06, - "loss": 0.7812, - "step": 15346 - }, - { - "epoch": 0.39, - "learning_rate": 1.9468559845222174e-06, - "loss": 0.9795, - "step": 15347 - }, - { - "epoch": 0.39, - "learning_rate": 1.9468470837422274e-06, - "loss": 1.0918, - "step": 15348 - }, - { - "epoch": 0.39, - "learning_rate": 1.9468381822372797e-06, - "loss": 0.9131, - "step": 15349 - }, - { - "epoch": 0.39, - "learning_rate": 1.9468292800073824e-06, - "loss": 0.7461, - "step": 15350 - }, - { - "epoch": 0.39, - "learning_rate": 1.9468203770525405e-06, - "loss": 0.7373, - "step": 15351 - }, - { - "epoch": 0.39, - "learning_rate": 1.9468114733727624e-06, - "loss": 0.6304, - "step": 15352 - }, - { - "epoch": 0.39, - "learning_rate": 1.946802568968054e-06, - "loss": 1.0469, - "step": 15353 - }, - { - "epoch": 0.39, - "learning_rate": 1.946793663838423e-06, - "loss": 0.6978, - "step": 15354 - }, - { - "epoch": 0.39, - "learning_rate": 1.9467847579838747e-06, - "loss": 0.9883, - "step": 15355 - }, - { - "epoch": 0.39, - "learning_rate": 1.946775851404417e-06, - "loss": 0.8105, - "step": 15356 - }, - { - "epoch": 0.39, - "learning_rate": 1.9467669441000576e-06, - "loss": 0.8223, - "step": 15357 - }, - { - "epoch": 0.39, - "learning_rate": 1.9467580360708013e-06, - "loss": 0.8672, - "step": 15358 - }, - { - "epoch": 0.39, - "learning_rate": 1.946749127316656e-06, - "loss": 0.8149, - "step": 15359 - }, - { - "epoch": 0.39, - "learning_rate": 1.9467402178376288e-06, - "loss": 0.9365, - "step": 15360 - }, - { - "epoch": 0.39, - "learning_rate": 1.9467313076337256e-06, - "loss": 0.5806, - "step": 15361 - }, - { - "epoch": 0.39, - "learning_rate": 1.946722396704954e-06, - "loss": 0.6924, - "step": 15362 - }, - { - "epoch": 0.39, - "learning_rate": 1.946713485051321e-06, - "loss": 0.9727, - "step": 15363 - }, - { - "epoch": 0.39, - "learning_rate": 1.9467045726728326e-06, - "loss": 0.9136, - "step": 15364 - }, - { - "epoch": 0.39, - "learning_rate": 1.946695659569496e-06, - "loss": 1.1055, - "step": 15365 - }, - { - "epoch": 0.39, - "learning_rate": 1.9466867457413186e-06, - "loss": 0.9629, - "step": 15366 - }, - { - "epoch": 0.39, - "learning_rate": 1.946677831188306e-06, - "loss": 0.8374, - "step": 15367 - }, - { - "epoch": 0.39, - "learning_rate": 1.946668915910466e-06, - "loss": 0.8408, - "step": 15368 - }, - { - "epoch": 0.39, - "learning_rate": 1.9466599999078052e-06, - "loss": 0.8643, - "step": 15369 - }, - { - "epoch": 0.39, - "learning_rate": 1.9466510831803304e-06, - "loss": 0.9678, - "step": 15370 - }, - { - "epoch": 0.39, - "learning_rate": 1.946642165728048e-06, - "loss": 0.9746, - "step": 15371 - }, - { - "epoch": 0.39, - "learning_rate": 1.946633247550966e-06, - "loss": 0.9844, - "step": 15372 - }, - { - "epoch": 0.39, - "learning_rate": 1.9466243286490897e-06, - "loss": 0.8726, - "step": 15373 - }, - { - "epoch": 0.39, - "learning_rate": 1.946615409022427e-06, - "loss": 0.9263, - "step": 15374 - }, - { - "epoch": 0.39, - "learning_rate": 1.9466064886709847e-06, - "loss": 1.041, - "step": 15375 - }, - { - "epoch": 0.39, - "learning_rate": 1.9465975675947686e-06, - "loss": 0.6592, - "step": 15376 - }, - { - "epoch": 0.39, - "learning_rate": 1.9465886457937867e-06, - "loss": 0.8164, - "step": 15377 - }, - { - "epoch": 0.39, - "learning_rate": 1.9465797232680452e-06, - "loss": 0.7266, - "step": 15378 - }, - { - "epoch": 0.39, - "learning_rate": 1.9465708000175515e-06, - "loss": 0.8291, - "step": 15379 - }, - { - "epoch": 0.39, - "learning_rate": 1.9465618760423117e-06, - "loss": 0.8877, - "step": 15380 - }, - { - "epoch": 0.39, - "learning_rate": 1.9465529513423333e-06, - "loss": 0.7766, - "step": 15381 - }, - { - "epoch": 0.39, - "learning_rate": 1.946544025917623e-06, - "loss": 0.9414, - "step": 15382 - }, - { - "epoch": 0.39, - "learning_rate": 1.9465350997681867e-06, - "loss": 1.0518, - "step": 15383 - }, - { - "epoch": 0.39, - "learning_rate": 1.9465261728940327e-06, - "loss": 0.9775, - "step": 15384 - }, - { - "epoch": 0.39, - "learning_rate": 1.946517245295167e-06, - "loss": 0.8623, - "step": 15385 - }, - { - "epoch": 0.39, - "learning_rate": 1.946508316971596e-06, - "loss": 0.9062, - "step": 15386 - }, - { - "epoch": 0.39, - "learning_rate": 1.9464993879233277e-06, - "loss": 0.8086, - "step": 15387 - }, - { - "epoch": 0.39, - "learning_rate": 1.946490458150368e-06, - "loss": 0.876, - "step": 15388 - }, - { - "epoch": 0.39, - "learning_rate": 1.9464815276527244e-06, - "loss": 0.8984, - "step": 15389 - }, - { - "epoch": 0.39, - "learning_rate": 1.9464725964304037e-06, - "loss": 0.8125, - "step": 15390 - }, - { - "epoch": 0.39, - "learning_rate": 1.9464636644834117e-06, - "loss": 0.8945, - "step": 15391 - }, - { - "epoch": 0.39, - "learning_rate": 1.9464547318117567e-06, - "loss": 0.7053, - "step": 15392 - }, - { - "epoch": 0.39, - "learning_rate": 1.9464457984154443e-06, - "loss": 0.5552, - "step": 15393 - }, - { - "epoch": 0.39, - "learning_rate": 1.946436864294482e-06, - "loss": 0.8975, - "step": 15394 - }, - { - "epoch": 0.39, - "learning_rate": 1.9464279294488763e-06, - "loss": 0.9756, - "step": 15395 - }, - { - "epoch": 0.39, - "learning_rate": 1.9464189938786348e-06, - "loss": 0.9629, - "step": 15396 - }, - { - "epoch": 0.39, - "learning_rate": 1.9464100575837633e-06, - "loss": 1.0918, - "step": 15397 - }, - { - "epoch": 0.39, - "learning_rate": 1.9464011205642696e-06, - "loss": 0.7812, - "step": 15398 - }, - { - "epoch": 0.39, - "learning_rate": 1.94639218282016e-06, - "loss": 0.9404, - "step": 15399 - }, - { - "epoch": 0.39, - "learning_rate": 1.9463832443514406e-06, - "loss": 0.7891, - "step": 15400 - }, - { - "epoch": 0.39, - "learning_rate": 1.94637430515812e-06, - "loss": 0.8633, - "step": 15401 - }, - { - "epoch": 0.39, - "learning_rate": 1.946365365240204e-06, - "loss": 0.9795, - "step": 15402 - }, - { - "epoch": 0.39, - "learning_rate": 1.946356424597699e-06, - "loss": 1.0762, - "step": 15403 - }, - { - "epoch": 0.39, - "learning_rate": 1.9463474832306126e-06, - "loss": 1.168, - "step": 15404 - }, - { - "epoch": 0.39, - "learning_rate": 1.9463385411389518e-06, - "loss": 0.7524, - "step": 15405 - }, - { - "epoch": 0.39, - "learning_rate": 1.946329598322723e-06, - "loss": 0.8794, - "step": 15406 - }, - { - "epoch": 0.39, - "learning_rate": 1.946320654781933e-06, - "loss": 0.8125, - "step": 15407 - }, - { - "epoch": 0.39, - "learning_rate": 1.9463117105165887e-06, - "loss": 0.646, - "step": 15408 - }, - { - "epoch": 0.39, - "learning_rate": 1.9463027655266975e-06, - "loss": 0.9121, - "step": 15409 - }, - { - "epoch": 0.39, - "learning_rate": 1.9462938198122652e-06, - "loss": 0.7637, - "step": 15410 - }, - { - "epoch": 0.39, - "learning_rate": 1.9462848733732993e-06, - "loss": 0.5579, - "step": 15411 - }, - { - "epoch": 0.4, - "learning_rate": 1.946275926209807e-06, - "loss": 0.8721, - "step": 15412 - }, - { - "epoch": 0.4, - "learning_rate": 1.9462669783217943e-06, - "loss": 0.8706, - "step": 15413 - }, - { - "epoch": 0.4, - "learning_rate": 1.946258029709269e-06, - "loss": 0.8457, - "step": 15414 - }, - { - "epoch": 0.4, - "learning_rate": 1.946249080372237e-06, - "loss": 0.8857, - "step": 15415 - }, - { - "epoch": 0.4, - "learning_rate": 1.946240130310706e-06, - "loss": 0.9814, - "step": 15416 - }, - { - "epoch": 0.4, - "learning_rate": 1.9462311795246817e-06, - "loss": 0.6885, - "step": 15417 - }, - { - "epoch": 0.4, - "learning_rate": 1.946222228014172e-06, - "loss": 0.6357, - "step": 15418 - }, - { - "epoch": 0.4, - "learning_rate": 1.9462132757791836e-06, - "loss": 0.8076, - "step": 15419 - }, - { - "epoch": 0.4, - "learning_rate": 1.9462043228197232e-06, - "loss": 0.7837, - "step": 15420 - }, - { - "epoch": 0.4, - "learning_rate": 1.9461953691357977e-06, - "loss": 0.875, - "step": 15421 - }, - { - "epoch": 0.4, - "learning_rate": 1.9461864147274143e-06, - "loss": 0.8105, - "step": 15422 - }, - { - "epoch": 0.4, - "learning_rate": 1.9461774595945788e-06, - "loss": 1.1113, - "step": 15423 - }, - { - "epoch": 0.4, - "learning_rate": 1.946168503737299e-06, - "loss": 0.9346, - "step": 15424 - }, - { - "epoch": 0.4, - "learning_rate": 1.9461595471555813e-06, - "loss": 0.8252, - "step": 15425 - }, - { - "epoch": 0.4, - "learning_rate": 1.946150589849433e-06, - "loss": 0.9111, - "step": 15426 - }, - { - "epoch": 0.4, - "learning_rate": 1.9461416318188604e-06, - "loss": 0.834, - "step": 15427 - }, - { - "epoch": 0.4, - "learning_rate": 1.9461326730638707e-06, - "loss": 0.7588, - "step": 15428 - }, - { - "epoch": 0.4, - "learning_rate": 1.946123713584471e-06, - "loss": 0.5347, - "step": 15429 - }, - { - "epoch": 0.4, - "learning_rate": 1.9461147533806675e-06, - "loss": 0.5898, - "step": 15430 - }, - { - "epoch": 0.4, - "learning_rate": 1.9461057924524678e-06, - "loss": 0.7627, - "step": 15431 - }, - { - "epoch": 0.4, - "learning_rate": 1.9460968307998782e-06, - "loss": 1.0605, - "step": 15432 - }, - { - "epoch": 0.4, - "learning_rate": 1.9460878684229057e-06, - "loss": 0.9082, - "step": 15433 - }, - { - "epoch": 0.4, - "learning_rate": 1.9460789053215578e-06, - "loss": 0.8584, - "step": 15434 - }, - { - "epoch": 0.4, - "learning_rate": 1.94606994149584e-06, - "loss": 0.752, - "step": 15435 - }, - { - "epoch": 0.4, - "learning_rate": 1.9460609769457603e-06, - "loss": 0.7383, - "step": 15436 - }, - { - "epoch": 0.4, - "learning_rate": 1.9460520116713253e-06, - "loss": 1.0879, - "step": 15437 - }, - { - "epoch": 0.4, - "learning_rate": 1.9460430456725415e-06, - "loss": 0.8633, - "step": 15438 - }, - { - "epoch": 0.4, - "learning_rate": 1.946034078949416e-06, - "loss": 0.8965, - "step": 15439 - }, - { - "epoch": 0.4, - "learning_rate": 1.946025111501956e-06, - "loss": 0.7461, - "step": 15440 - }, - { - "epoch": 0.4, - "learning_rate": 1.9460161433301682e-06, - "loss": 0.8037, - "step": 15441 - }, - { - "epoch": 0.4, - "learning_rate": 1.946007174434059e-06, - "loss": 1.0107, - "step": 15442 - }, - { - "epoch": 0.4, - "learning_rate": 1.945998204813636e-06, - "loss": 1.002, - "step": 15443 - }, - { - "epoch": 0.4, - "learning_rate": 1.9459892344689054e-06, - "loss": 0.7998, - "step": 15444 - }, - { - "epoch": 0.4, - "learning_rate": 1.9459802633998743e-06, - "loss": 0.9707, - "step": 15445 - }, - { - "epoch": 0.4, - "learning_rate": 1.9459712916065495e-06, - "loss": 0.8232, - "step": 15446 - }, - { - "epoch": 0.4, - "learning_rate": 1.945962319088938e-06, - "loss": 0.9229, - "step": 15447 - }, - { - "epoch": 0.4, - "learning_rate": 1.945953345847047e-06, - "loss": 1.1006, - "step": 15448 - }, - { - "epoch": 0.4, - "learning_rate": 1.945944371880883e-06, - "loss": 0.7773, - "step": 15449 - }, - { - "epoch": 0.4, - "learning_rate": 1.9459353971904522e-06, - "loss": 0.6992, - "step": 15450 - }, - { - "epoch": 0.4, - "learning_rate": 1.9459264217757626e-06, - "loss": 0.8423, - "step": 15451 - }, - { - "epoch": 0.4, - "learning_rate": 1.945917445636821e-06, - "loss": 0.8066, - "step": 15452 - }, - { - "epoch": 0.4, - "learning_rate": 1.9459084687736334e-06, - "loss": 1.0498, - "step": 15453 - }, - { - "epoch": 0.4, - "learning_rate": 1.9458994911862073e-06, - "loss": 1.0215, - "step": 15454 - }, - { - "epoch": 0.4, - "learning_rate": 1.94589051287455e-06, - "loss": 0.8408, - "step": 15455 - }, - { - "epoch": 0.4, - "learning_rate": 1.945881533838667e-06, - "loss": 1.002, - "step": 15456 - }, - { - "epoch": 0.4, - "learning_rate": 1.9458725540785666e-06, - "loss": 0.9902, - "step": 15457 - }, - { - "epoch": 0.4, - "learning_rate": 1.9458635735942544e-06, - "loss": 1.0273, - "step": 15458 - }, - { - "epoch": 0.4, - "learning_rate": 1.9458545923857387e-06, - "loss": 0.7871, - "step": 15459 - }, - { - "epoch": 0.4, - "learning_rate": 1.945845610453025e-06, - "loss": 0.9209, - "step": 15460 - }, - { - "epoch": 0.4, - "learning_rate": 1.9458366277961212e-06, - "loss": 1.0029, - "step": 15461 - }, - { - "epoch": 0.4, - "learning_rate": 1.945827644415034e-06, - "loss": 0.8994, - "step": 15462 - }, - { - "epoch": 0.4, - "learning_rate": 1.9458186603097697e-06, - "loss": 0.9229, - "step": 15463 - }, - { - "epoch": 0.4, - "learning_rate": 1.9458096754803356e-06, - "loss": 0.8105, - "step": 15464 - }, - { - "epoch": 0.4, - "learning_rate": 1.9458006899267387e-06, - "loss": 1.0703, - "step": 15465 - }, - { - "epoch": 0.4, - "learning_rate": 1.9457917036489854e-06, - "loss": 0.7358, - "step": 15466 - }, - { - "epoch": 0.4, - "learning_rate": 1.945782716647083e-06, - "loss": 0.8857, - "step": 15467 - }, - { - "epoch": 0.4, - "learning_rate": 1.9457737289210383e-06, - "loss": 0.9932, - "step": 15468 - }, - { - "epoch": 0.4, - "learning_rate": 1.945764740470858e-06, - "loss": 0.7898, - "step": 15469 - }, - { - "epoch": 0.4, - "learning_rate": 1.945755751296549e-06, - "loss": 0.7793, - "step": 15470 - }, - { - "epoch": 0.4, - "learning_rate": 1.9457467613981186e-06, - "loss": 0.5791, - "step": 15471 - }, - { - "epoch": 0.4, - "learning_rate": 1.9457377707755733e-06, - "loss": 0.9307, - "step": 15472 - }, - { - "epoch": 0.4, - "learning_rate": 1.9457287794289203e-06, - "loss": 0.6963, - "step": 15473 - }, - { - "epoch": 0.4, - "learning_rate": 1.945719787358166e-06, - "loss": 0.896, - "step": 15474 - }, - { - "epoch": 0.4, - "learning_rate": 1.945710794563318e-06, - "loss": 0.8379, - "step": 15475 - }, - { - "epoch": 0.4, - "learning_rate": 1.945701801044382e-06, - "loss": 0.9395, - "step": 15476 - }, - { - "epoch": 0.4, - "learning_rate": 1.945692806801366e-06, - "loss": 0.9731, - "step": 15477 - }, - { - "epoch": 0.4, - "learning_rate": 1.9456838118342763e-06, - "loss": 0.8057, - "step": 15478 - }, - { - "epoch": 0.4, - "learning_rate": 1.94567481614312e-06, - "loss": 0.624, - "step": 15479 - }, - { - "epoch": 0.4, - "learning_rate": 1.9456658197279046e-06, - "loss": 0.6934, - "step": 15480 - }, - { - "epoch": 0.4, - "learning_rate": 1.945656822588636e-06, - "loss": 0.9082, - "step": 15481 - }, - { - "epoch": 0.4, - "learning_rate": 1.945647824725321e-06, - "loss": 0.769, - "step": 15482 - }, - { - "epoch": 0.4, - "learning_rate": 1.9456388261379673e-06, - "loss": 0.8999, - "step": 15483 - }, - { - "epoch": 0.4, - "learning_rate": 1.945629826826582e-06, - "loss": 0.8682, - "step": 15484 - }, - { - "epoch": 0.4, - "learning_rate": 1.9456208267911703e-06, - "loss": 0.582, - "step": 15485 - }, - { - "epoch": 0.4, - "learning_rate": 1.945611826031741e-06, - "loss": 0.834, - "step": 15486 - }, - { - "epoch": 0.4, - "learning_rate": 1.9456028245483e-06, - "loss": 0.8184, - "step": 15487 - }, - { - "epoch": 0.4, - "learning_rate": 1.945593822340854e-06, - "loss": 0.7554, - "step": 15488 - }, - { - "epoch": 0.4, - "learning_rate": 1.9455848194094106e-06, - "loss": 0.9346, - "step": 15489 - }, - { - "epoch": 0.4, - "learning_rate": 1.9455758157539767e-06, - "loss": 1.0176, - "step": 15490 - }, - { - "epoch": 0.4, - "learning_rate": 1.9455668113745584e-06, - "loss": 0.9004, - "step": 15491 - }, - { - "epoch": 0.4, - "learning_rate": 1.9455578062711633e-06, - "loss": 0.7734, - "step": 15492 - }, - { - "epoch": 0.4, - "learning_rate": 1.945548800443798e-06, - "loss": 0.8975, - "step": 15493 - }, - { - "epoch": 0.4, - "learning_rate": 1.9455397938924696e-06, - "loss": 0.9375, - "step": 15494 - }, - { - "epoch": 0.4, - "learning_rate": 1.945530786617185e-06, - "loss": 0.8721, - "step": 15495 - }, - { - "epoch": 0.4, - "learning_rate": 1.9455217786179506e-06, - "loss": 1.1074, - "step": 15496 - }, - { - "epoch": 0.4, - "learning_rate": 1.9455127698947737e-06, - "loss": 0.9111, - "step": 15497 - }, - { - "epoch": 0.4, - "learning_rate": 1.945503760447661e-06, - "loss": 0.9375, - "step": 15498 - }, - { - "epoch": 0.4, - "learning_rate": 1.94549475027662e-06, - "loss": 0.9043, - "step": 15499 - }, - { - "epoch": 0.4, - "learning_rate": 1.945485739381657e-06, - "loss": 0.7769, - "step": 15500 - }, - { - "epoch": 0.4, - "learning_rate": 1.945476727762779e-06, - "loss": 0.9233, - "step": 15501 - }, - { - "epoch": 0.4, - "learning_rate": 1.945467715419993e-06, - "loss": 1.0146, - "step": 15502 - }, - { - "epoch": 0.4, - "learning_rate": 1.9454587023533057e-06, - "loss": 0.8271, - "step": 15503 - }, - { - "epoch": 0.4, - "learning_rate": 1.945449688562724e-06, - "loss": 0.9395, - "step": 15504 - }, - { - "epoch": 0.4, - "learning_rate": 1.945440674048255e-06, - "loss": 0.7815, - "step": 15505 - }, - { - "epoch": 0.4, - "learning_rate": 1.9454316588099057e-06, - "loss": 0.8223, - "step": 15506 - }, - { - "epoch": 0.4, - "learning_rate": 1.945422642847683e-06, - "loss": 0.8467, - "step": 15507 - }, - { - "epoch": 0.4, - "learning_rate": 1.9454136261615933e-06, - "loss": 1.0479, - "step": 15508 - }, - { - "epoch": 0.4, - "learning_rate": 1.945404608751644e-06, - "loss": 0.9268, - "step": 15509 - }, - { - "epoch": 0.4, - "learning_rate": 1.9453955906178423e-06, - "loss": 0.8223, - "step": 15510 - }, - { - "epoch": 0.4, - "learning_rate": 1.945386571760194e-06, - "loss": 0.9551, - "step": 15511 - }, - { - "epoch": 0.4, - "learning_rate": 1.945377552178707e-06, - "loss": 1.0439, - "step": 15512 - }, - { - "epoch": 0.4, - "learning_rate": 1.945368531873388e-06, - "loss": 0.9092, - "step": 15513 - }, - { - "epoch": 0.4, - "learning_rate": 1.945359510844243e-06, - "loss": 0.8667, - "step": 15514 - }, - { - "epoch": 0.4, - "learning_rate": 1.945350489091281e-06, - "loss": 0.7786, - "step": 15515 - }, - { - "epoch": 0.4, - "learning_rate": 1.9453414666145064e-06, - "loss": 0.9893, - "step": 15516 - }, - { - "epoch": 0.4, - "learning_rate": 1.945332443413928e-06, - "loss": 0.9473, - "step": 15517 - }, - { - "epoch": 0.4, - "learning_rate": 1.9453234194895518e-06, - "loss": 0.8164, - "step": 15518 - }, - { - "epoch": 0.4, - "learning_rate": 1.9453143948413847e-06, - "loss": 0.7979, - "step": 15519 - }, - { - "epoch": 0.4, - "learning_rate": 1.9453053694694343e-06, - "loss": 1.1133, - "step": 15520 - }, - { - "epoch": 0.4, - "learning_rate": 1.9452963433737065e-06, - "loss": 0.7046, - "step": 15521 - }, - { - "epoch": 0.4, - "learning_rate": 1.9452873165542094e-06, - "loss": 0.7944, - "step": 15522 - }, - { - "epoch": 0.4, - "learning_rate": 1.945278289010949e-06, - "loss": 1.1455, - "step": 15523 - }, - { - "epoch": 0.4, - "learning_rate": 1.9452692607439322e-06, - "loss": 0.7554, - "step": 15524 - }, - { - "epoch": 0.4, - "learning_rate": 1.9452602317531665e-06, - "loss": 0.7207, - "step": 15525 - }, - { - "epoch": 0.4, - "learning_rate": 1.9452512020386586e-06, - "loss": 0.9912, - "step": 15526 - }, - { - "epoch": 0.4, - "learning_rate": 1.945242171600415e-06, - "loss": 0.635, - "step": 15527 - }, - { - "epoch": 0.4, - "learning_rate": 1.945233140438443e-06, - "loss": 0.8477, - "step": 15528 - }, - { - "epoch": 0.4, - "learning_rate": 1.9452241085527494e-06, - "loss": 0.7271, - "step": 15529 - }, - { - "epoch": 0.4, - "learning_rate": 1.9452150759433416e-06, - "loss": 0.835, - "step": 15530 - }, - { - "epoch": 0.4, - "learning_rate": 1.9452060426102255e-06, - "loss": 0.9453, - "step": 15531 - }, - { - "epoch": 0.4, - "learning_rate": 1.9451970085534087e-06, - "loss": 1.0703, - "step": 15532 - }, - { - "epoch": 0.4, - "learning_rate": 1.9451879737728984e-06, - "loss": 0.7192, - "step": 15533 - }, - { - "epoch": 0.4, - "learning_rate": 1.945178938268701e-06, - "loss": 0.7305, - "step": 15534 - }, - { - "epoch": 0.4, - "learning_rate": 1.945169902040823e-06, - "loss": 0.8867, - "step": 15535 - }, - { - "epoch": 0.4, - "learning_rate": 1.9451608650892725e-06, - "loss": 0.7563, - "step": 15536 - }, - { - "epoch": 0.4, - "learning_rate": 1.945151827414056e-06, - "loss": 0.8984, - "step": 15537 - }, - { - "epoch": 0.4, - "learning_rate": 1.9451427890151796e-06, - "loss": 0.8267, - "step": 15538 - }, - { - "epoch": 0.4, - "learning_rate": 1.945133749892651e-06, - "loss": 1.0854, - "step": 15539 - }, - { - "epoch": 0.4, - "learning_rate": 1.945124710046477e-06, - "loss": 0.8887, - "step": 15540 - }, - { - "epoch": 0.4, - "learning_rate": 1.945115669476664e-06, - "loss": 0.9277, - "step": 15541 - }, - { - "epoch": 0.4, - "learning_rate": 1.94510662818322e-06, - "loss": 0.9473, - "step": 15542 - }, - { - "epoch": 0.4, - "learning_rate": 1.945097586166151e-06, - "loss": 0.9121, - "step": 15543 - }, - { - "epoch": 0.4, - "learning_rate": 1.9450885434254645e-06, - "loss": 0.9443, - "step": 15544 - }, - { - "epoch": 0.4, - "learning_rate": 1.9450794999611673e-06, - "loss": 0.6836, - "step": 15545 - }, - { - "epoch": 0.4, - "learning_rate": 1.945070455773266e-06, - "loss": 0.8203, - "step": 15546 - }, - { - "epoch": 0.4, - "learning_rate": 1.9450614108617677e-06, - "loss": 0.7598, - "step": 15547 - }, - { - "epoch": 0.4, - "learning_rate": 1.945052365226679e-06, - "loss": 1.0254, - "step": 15548 - }, - { - "epoch": 0.4, - "learning_rate": 1.9450433188680074e-06, - "loss": 0.7637, - "step": 15549 - }, - { - "epoch": 0.4, - "learning_rate": 1.9450342717857598e-06, - "loss": 1.2168, - "step": 15550 - }, - { - "epoch": 0.4, - "learning_rate": 1.9450252239799427e-06, - "loss": 0.75, - "step": 15551 - }, - { - "epoch": 0.4, - "learning_rate": 1.945016175450563e-06, - "loss": 0.9336, - "step": 15552 - }, - { - "epoch": 0.4, - "learning_rate": 1.9450071261976283e-06, - "loss": 0.9414, - "step": 15553 - }, - { - "epoch": 0.4, - "learning_rate": 1.944998076221145e-06, - "loss": 0.9736, - "step": 15554 - }, - { - "epoch": 0.4, - "learning_rate": 1.94498902552112e-06, - "loss": 0.9414, - "step": 15555 - }, - { - "epoch": 0.4, - "learning_rate": 1.9449799740975604e-06, - "loss": 0.917, - "step": 15556 - }, - { - "epoch": 0.4, - "learning_rate": 1.944970921950473e-06, - "loss": 1.0303, - "step": 15557 - }, - { - "epoch": 0.4, - "learning_rate": 1.9449618690798647e-06, - "loss": 0.9302, - "step": 15558 - }, - { - "epoch": 0.4, - "learning_rate": 1.944952815485743e-06, - "loss": 0.8438, - "step": 15559 - }, - { - "epoch": 0.4, - "learning_rate": 1.944943761168114e-06, - "loss": 0.8975, - "step": 15560 - }, - { - "epoch": 0.4, - "learning_rate": 1.944934706126985e-06, - "loss": 0.9727, - "step": 15561 - }, - { - "epoch": 0.4, - "learning_rate": 1.944925650362363e-06, - "loss": 0.7446, - "step": 15562 - }, - { - "epoch": 0.4, - "learning_rate": 1.944916593874255e-06, - "loss": 0.9375, - "step": 15563 - }, - { - "epoch": 0.4, - "learning_rate": 1.9449075366626678e-06, - "loss": 1.1777, - "step": 15564 - }, - { - "epoch": 0.4, - "learning_rate": 1.9448984787276085e-06, - "loss": 0.7188, - "step": 15565 - }, - { - "epoch": 0.4, - "learning_rate": 1.9448894200690835e-06, - "loss": 0.9365, - "step": 15566 - }, - { - "epoch": 0.4, - "learning_rate": 1.9448803606871005e-06, - "loss": 0.6409, - "step": 15567 - }, - { - "epoch": 0.4, - "learning_rate": 1.944871300581666e-06, - "loss": 1.0112, - "step": 15568 - }, - { - "epoch": 0.4, - "learning_rate": 1.9448622397527867e-06, - "loss": 0.813, - "step": 15569 - }, - { - "epoch": 0.4, - "learning_rate": 1.94485317820047e-06, - "loss": 1.0107, - "step": 15570 - }, - { - "epoch": 0.4, - "learning_rate": 1.944844115924723e-06, - "loss": 0.8716, - "step": 15571 - }, - { - "epoch": 0.4, - "learning_rate": 1.9448350529255517e-06, - "loss": 0.7354, - "step": 15572 - }, - { - "epoch": 0.4, - "learning_rate": 1.9448259892029636e-06, - "loss": 1.0762, - "step": 15573 - }, - { - "epoch": 0.4, - "learning_rate": 1.9448169247569662e-06, - "loss": 0.7896, - "step": 15574 - }, - { - "epoch": 0.4, - "learning_rate": 1.944807859587566e-06, - "loss": 0.9863, - "step": 15575 - }, - { - "epoch": 0.4, - "learning_rate": 1.944798793694769e-06, - "loss": 1.1055, - "step": 15576 - }, - { - "epoch": 0.4, - "learning_rate": 1.944789727078584e-06, - "loss": 0.9141, - "step": 15577 - }, - { - "epoch": 0.4, - "learning_rate": 1.9447806597390166e-06, - "loss": 0.874, - "step": 15578 - }, - { - "epoch": 0.4, - "learning_rate": 1.944771591676074e-06, - "loss": 0.6313, - "step": 15579 - }, - { - "epoch": 0.4, - "learning_rate": 1.9447625228897634e-06, - "loss": 0.9316, - "step": 15580 - }, - { - "epoch": 0.4, - "learning_rate": 1.9447534533800912e-06, - "loss": 0.8691, - "step": 15581 - }, - { - "epoch": 0.4, - "learning_rate": 1.944744383147065e-06, - "loss": 1.082, - "step": 15582 - }, - { - "epoch": 0.4, - "learning_rate": 1.9447353121906917e-06, - "loss": 0.9199, - "step": 15583 - }, - { - "epoch": 0.4, - "learning_rate": 1.9447262405109774e-06, - "loss": 0.8037, - "step": 15584 - }, - { - "epoch": 0.4, - "learning_rate": 1.94471716810793e-06, - "loss": 0.8564, - "step": 15585 - }, - { - "epoch": 0.4, - "learning_rate": 1.9447080949815563e-06, - "loss": 0.8042, - "step": 15586 - }, - { - "epoch": 0.4, - "learning_rate": 1.9446990211318626e-06, - "loss": 0.6787, - "step": 15587 - }, - { - "epoch": 0.4, - "learning_rate": 1.9446899465588566e-06, - "loss": 0.7529, - "step": 15588 - }, - { - "epoch": 0.4, - "learning_rate": 1.944680871262545e-06, - "loss": 0.9746, - "step": 15589 - }, - { - "epoch": 0.4, - "learning_rate": 1.9446717952429346e-06, - "loss": 1.0723, - "step": 15590 - }, - { - "epoch": 0.4, - "learning_rate": 1.944662718500032e-06, - "loss": 0.8223, - "step": 15591 - }, - { - "epoch": 0.4, - "learning_rate": 1.9446536410338454e-06, - "loss": 0.9824, - "step": 15592 - }, - { - "epoch": 0.4, - "learning_rate": 1.9446445628443805e-06, - "loss": 0.8066, - "step": 15593 - }, - { - "epoch": 0.4, - "learning_rate": 1.944635483931645e-06, - "loss": 0.9619, - "step": 15594 - }, - { - "epoch": 0.4, - "learning_rate": 1.9446264042956455e-06, - "loss": 1.0195, - "step": 15595 - }, - { - "epoch": 0.4, - "learning_rate": 1.9446173239363884e-06, - "loss": 0.9248, - "step": 15596 - }, - { - "epoch": 0.4, - "learning_rate": 1.9446082428538817e-06, - "loss": 0.7744, - "step": 15597 - }, - { - "epoch": 0.4, - "learning_rate": 1.944599161048132e-06, - "loss": 1.0742, - "step": 15598 - }, - { - "epoch": 0.4, - "learning_rate": 1.944590078519146e-06, - "loss": 1.0654, - "step": 15599 - }, - { - "epoch": 0.4, - "learning_rate": 1.9445809952669308e-06, - "loss": 0.7529, - "step": 15600 - }, - { - "epoch": 0.4, - "learning_rate": 1.944571911291493e-06, - "loss": 0.8198, - "step": 15601 - }, - { - "epoch": 0.4, - "learning_rate": 1.9445628265928405e-06, - "loss": 1.1104, - "step": 15602 - }, - { - "epoch": 0.4, - "learning_rate": 1.9445537411709797e-06, - "loss": 0.8984, - "step": 15603 - }, - { - "epoch": 0.4, - "learning_rate": 1.944544655025917e-06, - "loss": 0.8389, - "step": 15604 - }, - { - "epoch": 0.4, - "learning_rate": 1.9445355681576604e-06, - "loss": 0.9893, - "step": 15605 - }, - { - "epoch": 0.4, - "learning_rate": 1.9445264805662162e-06, - "loss": 0.728, - "step": 15606 - }, - { - "epoch": 0.4, - "learning_rate": 1.9445173922515914e-06, - "loss": 0.9482, - "step": 15607 - }, - { - "epoch": 0.4, - "learning_rate": 1.944508303213793e-06, - "loss": 1.1494, - "step": 15608 - }, - { - "epoch": 0.4, - "learning_rate": 1.9444992134528282e-06, - "loss": 0.6475, - "step": 15609 - }, - { - "epoch": 0.4, - "learning_rate": 1.944490122968704e-06, - "loss": 0.6953, - "step": 15610 - }, - { - "epoch": 0.4, - "learning_rate": 1.944481031761427e-06, - "loss": 0.8213, - "step": 15611 - }, - { - "epoch": 0.4, - "learning_rate": 1.944471939831004e-06, - "loss": 1.085, - "step": 15612 - }, - { - "epoch": 0.4, - "learning_rate": 1.944462847177442e-06, - "loss": 0.9062, - "step": 15613 - }, - { - "epoch": 0.4, - "learning_rate": 1.944453753800749e-06, - "loss": 0.8252, - "step": 15614 - }, - { - "epoch": 0.4, - "learning_rate": 1.9444446597009306e-06, - "loss": 0.7773, - "step": 15615 - }, - { - "epoch": 0.4, - "learning_rate": 1.9444355648779948e-06, - "loss": 0.7178, - "step": 15616 - }, - { - "epoch": 0.4, - "learning_rate": 1.9444264693319477e-06, - "loss": 0.7988, - "step": 15617 - }, - { - "epoch": 0.4, - "learning_rate": 1.944417373062797e-06, - "loss": 0.6338, - "step": 15618 - }, - { - "epoch": 0.4, - "learning_rate": 1.9444082760705493e-06, - "loss": 0.9922, - "step": 15619 - }, - { - "epoch": 0.4, - "learning_rate": 1.9443991783552115e-06, - "loss": 0.9434, - "step": 15620 - }, - { - "epoch": 0.4, - "learning_rate": 1.944390079916791e-06, - "loss": 0.9395, - "step": 15621 - }, - { - "epoch": 0.4, - "learning_rate": 1.944380980755294e-06, - "loss": 1.0, - "step": 15622 - }, - { - "epoch": 0.4, - "learning_rate": 1.9443718808707283e-06, - "loss": 1.0352, - "step": 15623 - }, - { - "epoch": 0.4, - "learning_rate": 1.9443627802631e-06, - "loss": 0.9971, - "step": 15624 - }, - { - "epoch": 0.4, - "learning_rate": 1.9443536789324167e-06, - "loss": 1.1025, - "step": 15625 - }, - { - "epoch": 0.4, - "learning_rate": 1.9443445768786854e-06, - "loss": 0.832, - "step": 15626 - }, - { - "epoch": 0.4, - "learning_rate": 1.9443354741019128e-06, - "loss": 0.627, - "step": 15627 - }, - { - "epoch": 0.4, - "learning_rate": 1.9443263706021056e-06, - "loss": 0.6809, - "step": 15628 - }, - { - "epoch": 0.4, - "learning_rate": 1.9443172663792716e-06, - "loss": 0.8237, - "step": 15629 - }, - { - "epoch": 0.4, - "learning_rate": 1.944308161433417e-06, - "loss": 0.8828, - "step": 15630 - }, - { - "epoch": 0.4, - "learning_rate": 1.9442990557645495e-06, - "loss": 0.918, - "step": 15631 - }, - { - "epoch": 0.4, - "learning_rate": 1.944289949372675e-06, - "loss": 0.7671, - "step": 15632 - }, - { - "epoch": 0.4, - "learning_rate": 1.9442808422578016e-06, - "loss": 0.9424, - "step": 15633 - }, - { - "epoch": 0.4, - "learning_rate": 1.9442717344199356e-06, - "loss": 0.8066, - "step": 15634 - }, - { - "epoch": 0.4, - "learning_rate": 1.944262625859084e-06, - "loss": 1.0293, - "step": 15635 - }, - { - "epoch": 0.4, - "learning_rate": 1.944253516575254e-06, - "loss": 1.0293, - "step": 15636 - }, - { - "epoch": 0.4, - "learning_rate": 1.944244406568453e-06, - "loss": 0.8193, - "step": 15637 - }, - { - "epoch": 0.4, - "learning_rate": 1.944235295838687e-06, - "loss": 1.2891, - "step": 15638 - }, - { - "epoch": 0.4, - "learning_rate": 1.9442261843859633e-06, - "loss": 1.0586, - "step": 15639 - }, - { - "epoch": 0.4, - "learning_rate": 1.944217072210289e-06, - "loss": 0.8789, - "step": 15640 - }, - { - "epoch": 0.4, - "learning_rate": 1.9442079593116714e-06, - "loss": 0.8657, - "step": 15641 - }, - { - "epoch": 0.4, - "learning_rate": 1.9441988456901174e-06, - "loss": 1.0181, - "step": 15642 - }, - { - "epoch": 0.4, - "learning_rate": 1.9441897313456336e-06, - "loss": 0.8135, - "step": 15643 - }, - { - "epoch": 0.4, - "learning_rate": 1.944180616278227e-06, - "loss": 0.6782, - "step": 15644 - }, - { - "epoch": 0.4, - "learning_rate": 1.944171500487905e-06, - "loss": 0.5464, - "step": 15645 - }, - { - "epoch": 0.4, - "learning_rate": 1.9441623839746736e-06, - "loss": 0.8232, - "step": 15646 - }, - { - "epoch": 0.4, - "learning_rate": 1.9441532667385408e-06, - "loss": 0.8594, - "step": 15647 - }, - { - "epoch": 0.4, - "learning_rate": 1.9441441487795136e-06, - "loss": 1.0186, - "step": 15648 - }, - { - "epoch": 0.4, - "learning_rate": 1.944135030097598e-06, - "loss": 0.6798, - "step": 15649 - }, - { - "epoch": 0.4, - "learning_rate": 1.944125910692802e-06, - "loss": 0.9375, - "step": 15650 - }, - { - "epoch": 0.4, - "learning_rate": 1.9441167905651326e-06, - "loss": 0.8926, - "step": 15651 - }, - { - "epoch": 0.4, - "learning_rate": 1.944107669714596e-06, - "loss": 1.0273, - "step": 15652 - }, - { - "epoch": 0.4, - "learning_rate": 1.9440985481411995e-06, - "loss": 1.0762, - "step": 15653 - }, - { - "epoch": 0.4, - "learning_rate": 1.9440894258449503e-06, - "loss": 1.0537, - "step": 15654 - }, - { - "epoch": 0.4, - "learning_rate": 1.944080302825855e-06, - "loss": 0.9648, - "step": 15655 - }, - { - "epoch": 0.4, - "learning_rate": 1.944071179083921e-06, - "loss": 0.9766, - "step": 15656 - }, - { - "epoch": 0.4, - "learning_rate": 1.944062054619155e-06, - "loss": 0.7568, - "step": 15657 - }, - { - "epoch": 0.4, - "learning_rate": 1.9440529294315645e-06, - "loss": 0.7715, - "step": 15658 - }, - { - "epoch": 0.4, - "learning_rate": 1.9440438035211554e-06, - "loss": 0.9131, - "step": 15659 - }, - { - "epoch": 0.4, - "learning_rate": 1.944034676887936e-06, - "loss": 0.873, - "step": 15660 - }, - { - "epoch": 0.4, - "learning_rate": 1.9440255495319123e-06, - "loss": 0.7188, - "step": 15661 - }, - { - "epoch": 0.4, - "learning_rate": 1.944016421453092e-06, - "loss": 0.8792, - "step": 15662 - }, - { - "epoch": 0.4, - "learning_rate": 1.944007292651481e-06, - "loss": 1.0039, - "step": 15663 - }, - { - "epoch": 0.4, - "learning_rate": 1.9439981631270877e-06, - "loss": 0.8359, - "step": 15664 - }, - { - "epoch": 0.4, - "learning_rate": 1.943989032879918e-06, - "loss": 0.8662, - "step": 15665 - }, - { - "epoch": 0.4, - "learning_rate": 1.9439799019099795e-06, - "loss": 0.7275, - "step": 15666 - }, - { - "epoch": 0.4, - "learning_rate": 1.943970770217279e-06, - "loss": 0.9971, - "step": 15667 - }, - { - "epoch": 0.4, - "learning_rate": 1.943961637801824e-06, - "loss": 0.8916, - "step": 15668 - }, - { - "epoch": 0.4, - "learning_rate": 1.9439525046636203e-06, - "loss": 1.0527, - "step": 15669 - }, - { - "epoch": 0.4, - "learning_rate": 1.9439433708026757e-06, - "loss": 0.7026, - "step": 15670 - }, - { - "epoch": 0.4, - "learning_rate": 1.9439342362189972e-06, - "loss": 0.7725, - "step": 15671 - }, - { - "epoch": 0.4, - "learning_rate": 1.9439251009125913e-06, - "loss": 0.918, - "step": 15672 - }, - { - "epoch": 0.4, - "learning_rate": 1.9439159648834656e-06, - "loss": 0.9272, - "step": 15673 - }, - { - "epoch": 0.4, - "learning_rate": 1.943906828131627e-06, - "loss": 1.0605, - "step": 15674 - }, - { - "epoch": 0.4, - "learning_rate": 1.9438976906570824e-06, - "loss": 0.9004, - "step": 15675 - }, - { - "epoch": 0.4, - "learning_rate": 1.9438885524598386e-06, - "loss": 0.7461, - "step": 15676 - }, - { - "epoch": 0.4, - "learning_rate": 1.9438794135399025e-06, - "loss": 1.0127, - "step": 15677 - }, - { - "epoch": 0.4, - "learning_rate": 1.9438702738972817e-06, - "loss": 1.0586, - "step": 15678 - }, - { - "epoch": 0.4, - "learning_rate": 1.9438611335319825e-06, - "loss": 0.7065, - "step": 15679 - }, - { - "epoch": 0.4, - "learning_rate": 1.943851992444012e-06, - "loss": 1.1084, - "step": 15680 - }, - { - "epoch": 0.4, - "learning_rate": 1.9438428506333783e-06, - "loss": 0.8193, - "step": 15681 - }, - { - "epoch": 0.4, - "learning_rate": 1.943833708100087e-06, - "loss": 1.1104, - "step": 15682 - }, - { - "epoch": 0.4, - "learning_rate": 1.9438245648441455e-06, - "loss": 0.8789, - "step": 15683 - }, - { - "epoch": 0.4, - "learning_rate": 1.9438154208655613e-06, - "loss": 0.9619, - "step": 15684 - }, - { - "epoch": 0.4, - "learning_rate": 1.9438062761643407e-06, - "loss": 1.0459, - "step": 15685 - }, - { - "epoch": 0.4, - "learning_rate": 1.9437971307404913e-06, - "loss": 0.77, - "step": 15686 - }, - { - "epoch": 0.4, - "learning_rate": 1.9437879845940195e-06, - "loss": 0.9346, - "step": 15687 - }, - { - "epoch": 0.4, - "learning_rate": 1.943778837724933e-06, - "loss": 0.8457, - "step": 15688 - }, - { - "epoch": 0.4, - "learning_rate": 1.943769690133238e-06, - "loss": 0.8828, - "step": 15689 - }, - { - "epoch": 0.4, - "learning_rate": 1.943760541818942e-06, - "loss": 0.8467, - "step": 15690 - }, - { - "epoch": 0.4, - "learning_rate": 1.943751392782052e-06, - "loss": 0.7925, - "step": 15691 - }, - { - "epoch": 0.4, - "learning_rate": 1.9437422430225757e-06, - "loss": 0.9639, - "step": 15692 - }, - { - "epoch": 0.4, - "learning_rate": 1.9437330925405187e-06, - "loss": 0.9131, - "step": 15693 - }, - { - "epoch": 0.4, - "learning_rate": 1.9437239413358884e-06, - "loss": 0.7598, - "step": 15694 - }, - { - "epoch": 0.4, - "learning_rate": 1.943714789408693e-06, - "loss": 1.2236, - "step": 15695 - }, - { - "epoch": 0.4, - "learning_rate": 1.9437056367589375e-06, - "loss": 1.0303, - "step": 15696 - }, - { - "epoch": 0.4, - "learning_rate": 1.943696483386631e-06, - "loss": 0.8867, - "step": 15697 - }, - { - "epoch": 0.4, - "learning_rate": 1.943687329291779e-06, - "loss": 0.8223, - "step": 15698 - }, - { - "epoch": 0.4, - "learning_rate": 1.9436781744743888e-06, - "loss": 0.9922, - "step": 15699 - }, - { - "epoch": 0.4, - "learning_rate": 1.9436690189344677e-06, - "loss": 1.0244, - "step": 15700 - }, - { - "epoch": 0.4, - "learning_rate": 1.943659862672023e-06, - "loss": 1.0137, - "step": 15701 - }, - { - "epoch": 0.4, - "learning_rate": 1.9436507056870605e-06, - "loss": 0.9912, - "step": 15702 - }, - { - "epoch": 0.4, - "learning_rate": 1.9436415479795885e-06, - "loss": 1.0, - "step": 15703 - }, - { - "epoch": 0.4, - "learning_rate": 1.943632389549614e-06, - "loss": 0.8711, - "step": 15704 - }, - { - "epoch": 0.4, - "learning_rate": 1.9436232303971434e-06, - "loss": 0.6914, - "step": 15705 - }, - { - "epoch": 0.4, - "learning_rate": 1.9436140705221834e-06, - "loss": 1.0127, - "step": 15706 - }, - { - "epoch": 0.4, - "learning_rate": 1.9436049099247417e-06, - "loss": 0.9678, - "step": 15707 - }, - { - "epoch": 0.4, - "learning_rate": 1.9435957486048253e-06, - "loss": 0.9106, - "step": 15708 - }, - { - "epoch": 0.4, - "learning_rate": 1.943586586562441e-06, - "loss": 0.9131, - "step": 15709 - }, - { - "epoch": 0.4, - "learning_rate": 1.9435774237975957e-06, - "loss": 0.6873, - "step": 15710 - }, - { - "epoch": 0.4, - "learning_rate": 1.9435682603102965e-06, - "loss": 0.6729, - "step": 15711 - }, - { - "epoch": 0.4, - "learning_rate": 1.9435590961005506e-06, - "loss": 0.8574, - "step": 15712 - }, - { - "epoch": 0.4, - "learning_rate": 1.943549931168365e-06, - "loss": 0.8672, - "step": 15713 - }, - { - "epoch": 0.4, - "learning_rate": 1.9435407655137463e-06, - "loss": 0.8623, - "step": 15714 - }, - { - "epoch": 0.4, - "learning_rate": 1.943531599136702e-06, - "loss": 0.9434, - "step": 15715 - }, - { - "epoch": 0.4, - "learning_rate": 1.943522432037239e-06, - "loss": 0.8345, - "step": 15716 - }, - { - "epoch": 0.4, - "learning_rate": 1.943513264215364e-06, - "loss": 0.8223, - "step": 15717 - }, - { - "epoch": 0.4, - "learning_rate": 1.9435040956710845e-06, - "loss": 0.8447, - "step": 15718 - }, - { - "epoch": 0.4, - "learning_rate": 1.9434949264044075e-06, - "loss": 1.0137, - "step": 15719 - }, - { - "epoch": 0.4, - "learning_rate": 1.9434857564153393e-06, - "loss": 0.9131, - "step": 15720 - }, - { - "epoch": 0.4, - "learning_rate": 1.943476585703888e-06, - "loss": 0.8369, - "step": 15721 - }, - { - "epoch": 0.4, - "learning_rate": 1.94346741427006e-06, - "loss": 0.9258, - "step": 15722 - }, - { - "epoch": 0.4, - "learning_rate": 1.943458242113862e-06, - "loss": 0.9326, - "step": 15723 - }, - { - "epoch": 0.4, - "learning_rate": 1.9434490692353014e-06, - "loss": 0.8589, - "step": 15724 - }, - { - "epoch": 0.4, - "learning_rate": 1.943439895634385e-06, - "loss": 0.9102, - "step": 15725 - }, - { - "epoch": 0.4, - "learning_rate": 1.9434307213111205e-06, - "loss": 1.0879, - "step": 15726 - }, - { - "epoch": 0.4, - "learning_rate": 1.9434215462655147e-06, - "loss": 0.7686, - "step": 15727 - }, - { - "epoch": 0.4, - "learning_rate": 1.9434123704975743e-06, - "loss": 0.9678, - "step": 15728 - }, - { - "epoch": 0.4, - "learning_rate": 1.943403194007306e-06, - "loss": 0.9639, - "step": 15729 - }, - { - "epoch": 0.4, - "learning_rate": 1.9433940167947174e-06, - "loss": 0.8027, - "step": 15730 - }, - { - "epoch": 0.4, - "learning_rate": 1.9433848388598157e-06, - "loss": 0.7129, - "step": 15731 - }, - { - "epoch": 0.4, - "learning_rate": 1.943375660202608e-06, - "loss": 1.0898, - "step": 15732 - }, - { - "epoch": 0.4, - "learning_rate": 1.9433664808231e-06, - "loss": 0.8076, - "step": 15733 - }, - { - "epoch": 0.4, - "learning_rate": 1.9433573007213e-06, - "loss": 0.8828, - "step": 15734 - }, - { - "epoch": 0.4, - "learning_rate": 1.9433481198972144e-06, - "loss": 0.8203, - "step": 15735 - }, - { - "epoch": 0.4, - "learning_rate": 1.943338938350851e-06, - "loss": 1.001, - "step": 15736 - }, - { - "epoch": 0.4, - "learning_rate": 1.943329756082216e-06, - "loss": 1.0078, - "step": 15737 - }, - { - "epoch": 0.4, - "learning_rate": 1.943320573091317e-06, - "loss": 0.8301, - "step": 15738 - }, - { - "epoch": 0.4, - "learning_rate": 1.9433113893781606e-06, - "loss": 0.9854, - "step": 15739 - }, - { - "epoch": 0.4, - "learning_rate": 1.9433022049427545e-06, - "loss": 0.9014, - "step": 15740 - }, - { - "epoch": 0.4, - "learning_rate": 1.9432930197851045e-06, - "loss": 0.8516, - "step": 15741 - }, - { - "epoch": 0.4, - "learning_rate": 1.9432838339052192e-06, - "loss": 0.8315, - "step": 15742 - }, - { - "epoch": 0.4, - "learning_rate": 1.9432746473031045e-06, - "loss": 1.0273, - "step": 15743 - }, - { - "epoch": 0.4, - "learning_rate": 1.943265459978768e-06, - "loss": 0.9561, - "step": 15744 - }, - { - "epoch": 0.4, - "learning_rate": 1.943256271932216e-06, - "loss": 0.8179, - "step": 15745 - }, - { - "epoch": 0.4, - "learning_rate": 1.9432470831634563e-06, - "loss": 1.0996, - "step": 15746 - }, - { - "epoch": 0.4, - "learning_rate": 1.943237893672496e-06, - "loss": 0.8623, - "step": 15747 - }, - { - "epoch": 0.4, - "learning_rate": 1.9432287034593412e-06, - "loss": 1.0469, - "step": 15748 - }, - { - "epoch": 0.4, - "learning_rate": 1.943219512524e-06, - "loss": 1.041, - "step": 15749 - }, - { - "epoch": 0.4, - "learning_rate": 1.943210320866479e-06, - "loss": 0.8672, - "step": 15750 - }, - { - "epoch": 0.4, - "learning_rate": 1.9432011284867853e-06, - "loss": 0.8765, - "step": 15751 - }, - { - "epoch": 0.4, - "learning_rate": 1.9431919353849256e-06, - "loss": 0.7246, - "step": 15752 - }, - { - "epoch": 0.4, - "learning_rate": 1.943182741560907e-06, - "loss": 0.9375, - "step": 15753 - }, - { - "epoch": 0.4, - "learning_rate": 1.9431735470147373e-06, - "loss": 1.2764, - "step": 15754 - }, - { - "epoch": 0.4, - "learning_rate": 1.9431643517464226e-06, - "loss": 0.8994, - "step": 15755 - }, - { - "epoch": 0.4, - "learning_rate": 1.9431551557559705e-06, - "loss": 0.9863, - "step": 15756 - }, - { - "epoch": 0.4, - "learning_rate": 1.943145959043388e-06, - "loss": 0.9531, - "step": 15757 - }, - { - "epoch": 0.4, - "learning_rate": 1.9431367616086816e-06, - "loss": 1.0088, - "step": 15758 - }, - { - "epoch": 0.4, - "learning_rate": 1.943127563451859e-06, - "loss": 0.9092, - "step": 15759 - }, - { - "epoch": 0.4, - "learning_rate": 1.943118364572927e-06, - "loss": 0.7861, - "step": 15760 - }, - { - "epoch": 0.4, - "learning_rate": 1.9431091649718927e-06, - "loss": 1.0029, - "step": 15761 - }, - { - "epoch": 0.4, - "learning_rate": 1.943099964648763e-06, - "loss": 0.8008, - "step": 15762 - }, - { - "epoch": 0.4, - "learning_rate": 1.9430907636035446e-06, - "loss": 0.8579, - "step": 15763 - }, - { - "epoch": 0.4, - "learning_rate": 1.9430815618362456e-06, - "loss": 0.7593, - "step": 15764 - }, - { - "epoch": 0.4, - "learning_rate": 1.943072359346872e-06, - "loss": 0.959, - "step": 15765 - }, - { - "epoch": 0.4, - "learning_rate": 1.9430631561354315e-06, - "loss": 1.0254, - "step": 15766 - }, - { - "epoch": 0.4, - "learning_rate": 1.943053952201931e-06, - "loss": 0.9209, - "step": 15767 - }, - { - "epoch": 0.4, - "learning_rate": 1.943044747546377e-06, - "loss": 0.7715, - "step": 15768 - }, - { - "epoch": 0.4, - "learning_rate": 1.9430355421687775e-06, - "loss": 0.8262, - "step": 15769 - }, - { - "epoch": 0.4, - "learning_rate": 1.9430263360691387e-06, - "loss": 0.8887, - "step": 15770 - }, - { - "epoch": 0.4, - "learning_rate": 1.943017129247468e-06, - "loss": 0.8418, - "step": 15771 - }, - { - "epoch": 0.4, - "learning_rate": 1.9430079217037727e-06, - "loss": 0.9746, - "step": 15772 - }, - { - "epoch": 0.4, - "learning_rate": 1.9429987134380594e-06, - "loss": 0.6787, - "step": 15773 - }, - { - "epoch": 0.4, - "learning_rate": 1.9429895044503356e-06, - "loss": 0.915, - "step": 15774 - }, - { - "epoch": 0.4, - "learning_rate": 1.9429802947406077e-06, - "loss": 0.6875, - "step": 15775 - }, - { - "epoch": 0.4, - "learning_rate": 1.9429710843088833e-06, - "loss": 0.8372, - "step": 15776 - }, - { - "epoch": 0.4, - "learning_rate": 1.942961873155169e-06, - "loss": 0.79, - "step": 15777 - }, - { - "epoch": 0.4, - "learning_rate": 1.942952661279473e-06, - "loss": 0.9399, - "step": 15778 - }, - { - "epoch": 0.4, - "learning_rate": 1.9429434486818007e-06, - "loss": 1.1074, - "step": 15779 - }, - { - "epoch": 0.4, - "learning_rate": 1.9429342353621606e-06, - "loss": 1.0137, - "step": 15780 - }, - { - "epoch": 0.4, - "learning_rate": 1.9429250213205584e-06, - "loss": 0.7744, - "step": 15781 - }, - { - "epoch": 0.4, - "learning_rate": 1.9429158065570025e-06, - "loss": 0.7559, - "step": 15782 - }, - { - "epoch": 0.4, - "learning_rate": 1.942906591071499e-06, - "loss": 1.0449, - "step": 15783 - }, - { - "epoch": 0.4, - "learning_rate": 1.9428973748640554e-06, - "loss": 0.6694, - "step": 15784 - }, - { - "epoch": 0.4, - "learning_rate": 1.9428881579346786e-06, - "loss": 0.7764, - "step": 15785 - }, - { - "epoch": 0.4, - "learning_rate": 1.9428789402833756e-06, - "loss": 0.8311, - "step": 15786 - }, - { - "epoch": 0.4, - "learning_rate": 1.9428697219101537e-06, - "loss": 1.1172, - "step": 15787 - }, - { - "epoch": 0.4, - "learning_rate": 1.94286050281502e-06, - "loss": 1.0322, - "step": 15788 - }, - { - "epoch": 0.4, - "learning_rate": 1.9428512829979807e-06, - "loss": 1.0225, - "step": 15789 - }, - { - "epoch": 0.4, - "learning_rate": 1.9428420624590437e-06, - "loss": 1.0342, - "step": 15790 - }, - { - "epoch": 0.4, - "learning_rate": 1.9428328411982166e-06, - "loss": 1.0273, - "step": 15791 - }, - { - "epoch": 0.4, - "learning_rate": 1.942823619215505e-06, - "loss": 0.9434, - "step": 15792 - }, - { - "epoch": 0.4, - "learning_rate": 1.942814396510917e-06, - "loss": 0.96, - "step": 15793 - }, - { - "epoch": 0.4, - "learning_rate": 1.9428051730844596e-06, - "loss": 1.0254, - "step": 15794 - }, - { - "epoch": 0.4, - "learning_rate": 1.942795948936139e-06, - "loss": 0.7549, - "step": 15795 - }, - { - "epoch": 0.4, - "learning_rate": 1.9427867240659635e-06, - "loss": 0.5181, - "step": 15796 - }, - { - "epoch": 0.4, - "learning_rate": 1.9427774984739392e-06, - "loss": 1.0654, - "step": 15797 - }, - { - "epoch": 0.4, - "learning_rate": 1.9427682721600735e-06, - "loss": 0.9775, - "step": 15798 - }, - { - "epoch": 0.4, - "learning_rate": 1.9427590451243735e-06, - "loss": 0.9961, - "step": 15799 - }, - { - "epoch": 0.4, - "learning_rate": 1.942749817366847e-06, - "loss": 0.6433, - "step": 15800 - }, - { - "epoch": 0.4, - "learning_rate": 1.9427405888874994e-06, - "loss": 0.8296, - "step": 15801 - }, - { - "epoch": 0.41, - "learning_rate": 1.942731359686339e-06, - "loss": 0.8074, - "step": 15802 - }, - { - "epoch": 0.41, - "learning_rate": 1.942722129763372e-06, - "loss": 1.0371, - "step": 15803 - }, - { - "epoch": 0.41, - "learning_rate": 1.942712899118607e-06, - "loss": 0.7964, - "step": 15804 - }, - { - "epoch": 0.41, - "learning_rate": 1.9427036677520495e-06, - "loss": 0.9141, - "step": 15805 - }, - { - "epoch": 0.41, - "learning_rate": 1.9426944356637074e-06, - "loss": 1.1602, - "step": 15806 - }, - { - "epoch": 0.41, - "learning_rate": 1.9426852028535872e-06, - "loss": 0.479, - "step": 15807 - }, - { - "epoch": 0.41, - "learning_rate": 1.9426759693216964e-06, - "loss": 0.9961, - "step": 15808 - }, - { - "epoch": 0.41, - "learning_rate": 1.942666735068042e-06, - "loss": 0.8857, - "step": 15809 - }, - { - "epoch": 0.41, - "learning_rate": 1.9426575000926307e-06, - "loss": 1.2109, - "step": 15810 - }, - { - "epoch": 0.41, - "learning_rate": 1.9426482643954704e-06, - "loss": 0.9316, - "step": 15811 - }, - { - "epoch": 0.41, - "learning_rate": 1.9426390279765676e-06, - "loss": 0.835, - "step": 15812 - }, - { - "epoch": 0.41, - "learning_rate": 1.9426297908359293e-06, - "loss": 1.043, - "step": 15813 - }, - { - "epoch": 0.41, - "learning_rate": 1.9426205529735626e-06, - "loss": 0.9482, - "step": 15814 - }, - { - "epoch": 0.41, - "learning_rate": 1.942611314389475e-06, - "loss": 0.9131, - "step": 15815 - }, - { - "epoch": 0.41, - "learning_rate": 1.9426020750836727e-06, - "loss": 0.8711, - "step": 15816 - }, - { - "epoch": 0.41, - "learning_rate": 1.942592835056164e-06, - "loss": 0.6587, - "step": 15817 - }, - { - "epoch": 0.41, - "learning_rate": 1.9425835943069552e-06, - "loss": 0.9209, - "step": 15818 - }, - { - "epoch": 0.41, - "learning_rate": 1.9425743528360533e-06, - "loss": 0.7646, - "step": 15819 - }, - { - "epoch": 0.41, - "learning_rate": 1.9425651106434656e-06, - "loss": 1.0137, - "step": 15820 - }, - { - "epoch": 0.41, - "learning_rate": 1.942555867729199e-06, - "loss": 1.0566, - "step": 15821 - }, - { - "epoch": 0.41, - "learning_rate": 1.9425466240932606e-06, - "loss": 0.7783, - "step": 15822 - }, - { - "epoch": 0.41, - "learning_rate": 1.942537379735658e-06, - "loss": 0.8506, - "step": 15823 - }, - { - "epoch": 0.41, - "learning_rate": 1.942528134656398e-06, - "loss": 0.9824, - "step": 15824 - }, - { - "epoch": 0.41, - "learning_rate": 1.9425188888554867e-06, - "loss": 0.8408, - "step": 15825 - }, - { - "epoch": 0.41, - "learning_rate": 1.9425096423329327e-06, - "loss": 0.7744, - "step": 15826 - }, - { - "epoch": 0.41, - "learning_rate": 1.9425003950887423e-06, - "loss": 0.7642, - "step": 15827 - }, - { - "epoch": 0.41, - "learning_rate": 1.9424911471229225e-06, - "loss": 0.9038, - "step": 15828 - }, - { - "epoch": 0.41, - "learning_rate": 1.942481898435481e-06, - "loss": 1.0098, - "step": 15829 - }, - { - "epoch": 0.41, - "learning_rate": 1.942472649026424e-06, - "loss": 0.9805, - "step": 15830 - }, - { - "epoch": 0.41, - "learning_rate": 1.942463398895759e-06, - "loss": 1.0244, - "step": 15831 - }, - { - "epoch": 0.41, - "learning_rate": 1.9424541480434936e-06, - "loss": 0.8545, - "step": 15832 - }, - { - "epoch": 0.41, - "learning_rate": 1.942444896469634e-06, - "loss": 0.8164, - "step": 15833 - }, - { - "epoch": 0.41, - "learning_rate": 1.9424356441741876e-06, - "loss": 0.79, - "step": 15834 - }, - { - "epoch": 0.41, - "learning_rate": 1.942426391157162e-06, - "loss": 1.0205, - "step": 15835 - }, - { - "epoch": 0.41, - "learning_rate": 1.9424171374185635e-06, - "loss": 0.9072, - "step": 15836 - }, - { - "epoch": 0.41, - "learning_rate": 1.9424078829583994e-06, - "loss": 1.0029, - "step": 15837 - }, - { - "epoch": 0.41, - "learning_rate": 1.942398627776677e-06, - "loss": 0.8906, - "step": 15838 - }, - { - "epoch": 0.41, - "learning_rate": 1.9423893718734035e-06, - "loss": 1.0479, - "step": 15839 - }, - { - "epoch": 0.41, - "learning_rate": 1.9423801152485857e-06, - "loss": 0.9346, - "step": 15840 - }, - { - "epoch": 0.41, - "learning_rate": 1.942370857902231e-06, - "loss": 0.8062, - "step": 15841 - }, - { - "epoch": 0.41, - "learning_rate": 1.942361599834346e-06, - "loss": 0.9346, - "step": 15842 - }, - { - "epoch": 0.41, - "learning_rate": 1.942352341044938e-06, - "loss": 0.7378, - "step": 15843 - }, - { - "epoch": 0.41, - "learning_rate": 1.9423430815340144e-06, - "loss": 0.8633, - "step": 15844 - }, - { - "epoch": 0.41, - "learning_rate": 1.942333821301582e-06, - "loss": 0.8535, - "step": 15845 - }, - { - "epoch": 0.41, - "learning_rate": 1.9423245603476475e-06, - "loss": 0.9531, - "step": 15846 - }, - { - "epoch": 0.41, - "learning_rate": 1.9423152986722187e-06, - "loss": 0.9932, - "step": 15847 - }, - { - "epoch": 0.41, - "learning_rate": 1.9423060362753025e-06, - "loss": 0.9443, - "step": 15848 - }, - { - "epoch": 0.41, - "learning_rate": 1.9422967731569057e-06, - "loss": 0.9316, - "step": 15849 - }, - { - "epoch": 0.41, - "learning_rate": 1.942287509317036e-06, - "loss": 0.7705, - "step": 15850 - }, - { - "epoch": 0.41, - "learning_rate": 1.9422782447556994e-06, - "loss": 0.9185, - "step": 15851 - }, - { - "epoch": 0.41, - "learning_rate": 1.9422689794729043e-06, - "loss": 0.9395, - "step": 15852 - }, - { - "epoch": 0.41, - "learning_rate": 1.942259713468657e-06, - "loss": 0.874, - "step": 15853 - }, - { - "epoch": 0.41, - "learning_rate": 1.9422504467429644e-06, - "loss": 0.7092, - "step": 15854 - }, - { - "epoch": 0.41, - "learning_rate": 1.9422411792958345e-06, - "loss": 0.998, - "step": 15855 - }, - { - "epoch": 0.41, - "learning_rate": 1.9422319111272735e-06, - "loss": 0.957, - "step": 15856 - }, - { - "epoch": 0.41, - "learning_rate": 1.942222642237289e-06, - "loss": 0.7422, - "step": 15857 - }, - { - "epoch": 0.41, - "learning_rate": 1.942213372625888e-06, - "loss": 1.0225, - "step": 15858 - }, - { - "epoch": 0.41, - "learning_rate": 1.9422041022930773e-06, - "loss": 1.002, - "step": 15859 - }, - { - "epoch": 0.41, - "learning_rate": 1.9421948312388644e-06, - "loss": 1.1025, - "step": 15860 - }, - { - "epoch": 0.41, - "learning_rate": 1.9421855594632563e-06, - "loss": 0.8408, - "step": 15861 - }, - { - "epoch": 0.41, - "learning_rate": 1.94217628696626e-06, - "loss": 0.9355, - "step": 15862 - }, - { - "epoch": 0.41, - "learning_rate": 1.9421670137478825e-06, - "loss": 0.6538, - "step": 15863 - }, - { - "epoch": 0.41, - "learning_rate": 1.942157739808131e-06, - "loss": 1.0576, - "step": 15864 - }, - { - "epoch": 0.41, - "learning_rate": 1.942148465147013e-06, - "loss": 0.8398, - "step": 15865 - }, - { - "epoch": 0.41, - "learning_rate": 1.942139189764535e-06, - "loss": 0.8447, - "step": 15866 - }, - { - "epoch": 0.41, - "learning_rate": 1.9421299136607043e-06, - "loss": 0.8677, - "step": 15867 - }, - { - "epoch": 0.41, - "learning_rate": 1.9421206368355284e-06, - "loss": 0.6885, - "step": 15868 - }, - { - "epoch": 0.41, - "learning_rate": 1.942111359289014e-06, - "loss": 0.9844, - "step": 15869 - }, - { - "epoch": 0.41, - "learning_rate": 1.9421020810211676e-06, - "loss": 1.1738, - "step": 15870 - }, - { - "epoch": 0.41, - "learning_rate": 1.9420928020319975e-06, - "loss": 0.9268, - "step": 15871 - }, - { - "epoch": 0.41, - "learning_rate": 1.94208352232151e-06, - "loss": 0.8867, - "step": 15872 - }, - { - "epoch": 0.41, - "learning_rate": 1.942074241889713e-06, - "loss": 0.8999, - "step": 15873 - }, - { - "epoch": 0.41, - "learning_rate": 1.9420649607366124e-06, - "loss": 1.0186, - "step": 15874 - }, - { - "epoch": 0.41, - "learning_rate": 1.9420556788622164e-06, - "loss": 0.9688, - "step": 15875 - }, - { - "epoch": 0.41, - "learning_rate": 1.9420463962665316e-06, - "loss": 0.9893, - "step": 15876 - }, - { - "epoch": 0.41, - "learning_rate": 1.9420371129495647e-06, - "loss": 0.7832, - "step": 15877 - }, - { - "epoch": 0.41, - "learning_rate": 1.942027828911324e-06, - "loss": 1.0195, - "step": 15878 - }, - { - "epoch": 0.41, - "learning_rate": 1.9420185441518155e-06, - "loss": 0.8672, - "step": 15879 - }, - { - "epoch": 0.41, - "learning_rate": 1.9420092586710467e-06, - "loss": 0.9932, - "step": 15880 - }, - { - "epoch": 0.41, - "learning_rate": 1.941999972469025e-06, - "loss": 0.6602, - "step": 15881 - }, - { - "epoch": 0.41, - "learning_rate": 1.941990685545757e-06, - "loss": 0.7383, - "step": 15882 - }, - { - "epoch": 0.41, - "learning_rate": 1.9419813979012502e-06, - "loss": 0.6841, - "step": 15883 - }, - { - "epoch": 0.41, - "learning_rate": 1.9419721095355113e-06, - "loss": 0.8887, - "step": 15884 - }, - { - "epoch": 0.41, - "learning_rate": 1.9419628204485484e-06, - "loss": 1.0098, - "step": 15885 - }, - { - "epoch": 0.41, - "learning_rate": 1.941953530640367e-06, - "loss": 0.8418, - "step": 15886 - }, - { - "epoch": 0.41, - "learning_rate": 1.9419442401109757e-06, - "loss": 0.9365, - "step": 15887 - }, - { - "epoch": 0.41, - "learning_rate": 1.9419349488603806e-06, - "loss": 0.791, - "step": 15888 - }, - { - "epoch": 0.41, - "learning_rate": 1.9419256568885895e-06, - "loss": 0.6582, - "step": 15889 - }, - { - "epoch": 0.41, - "learning_rate": 1.941916364195609e-06, - "loss": 0.8691, - "step": 15890 - }, - { - "epoch": 0.41, - "learning_rate": 1.9419070707814468e-06, - "loss": 1.0146, - "step": 15891 - }, - { - "epoch": 0.41, - "learning_rate": 1.9418977766461095e-06, - "loss": 0.7944, - "step": 15892 - }, - { - "epoch": 0.41, - "learning_rate": 1.941888481789604e-06, - "loss": 1.0752, - "step": 15893 - }, - { - "epoch": 0.41, - "learning_rate": 1.9418791862119383e-06, - "loss": 0.7793, - "step": 15894 - }, - { - "epoch": 0.41, - "learning_rate": 1.941869889913119e-06, - "loss": 0.8574, - "step": 15895 - }, - { - "epoch": 0.41, - "learning_rate": 1.941860592893153e-06, - "loss": 1.0527, - "step": 15896 - }, - { - "epoch": 0.41, - "learning_rate": 1.9418512951520475e-06, - "loss": 0.5747, - "step": 15897 - }, - { - "epoch": 0.41, - "learning_rate": 1.9418419966898097e-06, - "loss": 0.8926, - "step": 15898 - }, - { - "epoch": 0.41, - "learning_rate": 1.9418326975064475e-06, - "loss": 0.9863, - "step": 15899 - }, - { - "epoch": 0.41, - "learning_rate": 1.9418233976019667e-06, - "loss": 0.8701, - "step": 15900 - }, - { - "epoch": 0.41, - "learning_rate": 1.9418140969763754e-06, - "loss": 0.9336, - "step": 15901 - }, - { - "epoch": 0.41, - "learning_rate": 1.94180479562968e-06, - "loss": 0.9365, - "step": 15902 - }, - { - "epoch": 0.41, - "learning_rate": 1.941795493561888e-06, - "loss": 0.9199, - "step": 15903 - }, - { - "epoch": 0.41, - "learning_rate": 1.941786190773007e-06, - "loss": 0.9619, - "step": 15904 - }, - { - "epoch": 0.41, - "learning_rate": 1.941776887263043e-06, - "loss": 0.8745, - "step": 15905 - }, - { - "epoch": 0.41, - "learning_rate": 1.941767583032004e-06, - "loss": 0.6875, - "step": 15906 - }, - { - "epoch": 0.41, - "learning_rate": 1.941758278079897e-06, - "loss": 0.8604, - "step": 15907 - }, - { - "epoch": 0.41, - "learning_rate": 1.941748972406729e-06, - "loss": 0.9141, - "step": 15908 - }, - { - "epoch": 0.41, - "learning_rate": 1.941739666012507e-06, - "loss": 0.8765, - "step": 15909 - }, - { - "epoch": 0.41, - "learning_rate": 1.941730358897238e-06, - "loss": 0.7559, - "step": 15910 - }, - { - "epoch": 0.41, - "learning_rate": 1.9417210510609294e-06, - "loss": 1.2432, - "step": 15911 - }, - { - "epoch": 0.41, - "learning_rate": 1.9417117425035886e-06, - "loss": 0.9268, - "step": 15912 - }, - { - "epoch": 0.41, - "learning_rate": 1.9417024332252225e-06, - "loss": 0.7402, - "step": 15913 - }, - { - "epoch": 0.41, - "learning_rate": 1.9416931232258377e-06, - "loss": 1.0859, - "step": 15914 - }, - { - "epoch": 0.41, - "learning_rate": 1.941683812505442e-06, - "loss": 0.8438, - "step": 15915 - }, - { - "epoch": 0.41, - "learning_rate": 1.9416745010640426e-06, - "loss": 0.9678, - "step": 15916 - }, - { - "epoch": 0.41, - "learning_rate": 1.9416651889016457e-06, - "loss": 0.8408, - "step": 15917 - }, - { - "epoch": 0.41, - "learning_rate": 1.9416558760182595e-06, - "loss": 1.0801, - "step": 15918 - }, - { - "epoch": 0.41, - "learning_rate": 1.9416465624138907e-06, - "loss": 0.9844, - "step": 15919 - }, - { - "epoch": 0.41, - "learning_rate": 1.941637248088546e-06, - "loss": 0.9072, - "step": 15920 - }, - { - "epoch": 0.41, - "learning_rate": 1.9416279330422337e-06, - "loss": 0.7446, - "step": 15921 - }, - { - "epoch": 0.41, - "learning_rate": 1.9416186172749594e-06, - "loss": 0.8447, - "step": 15922 - }, - { - "epoch": 0.41, - "learning_rate": 1.9416093007867314e-06, - "loss": 0.918, - "step": 15923 - }, - { - "epoch": 0.41, - "learning_rate": 1.941599983577557e-06, - "loss": 0.7695, - "step": 15924 - }, - { - "epoch": 0.41, - "learning_rate": 1.941590665647442e-06, - "loss": 0.8767, - "step": 15925 - }, - { - "epoch": 0.41, - "learning_rate": 1.9415813469963946e-06, - "loss": 0.9053, - "step": 15926 - }, - { - "epoch": 0.41, - "learning_rate": 1.9415720276244217e-06, - "loss": 0.9102, - "step": 15927 - }, - { - "epoch": 0.41, - "learning_rate": 1.9415627075315302e-06, - "loss": 0.8462, - "step": 15928 - }, - { - "epoch": 0.41, - "learning_rate": 1.9415533867177273e-06, - "loss": 0.8403, - "step": 15929 - }, - { - "epoch": 0.41, - "learning_rate": 1.9415440651830206e-06, - "loss": 0.7432, - "step": 15930 - }, - { - "epoch": 0.41, - "learning_rate": 1.941534742927417e-06, - "loss": 0.8311, - "step": 15931 - }, - { - "epoch": 0.41, - "learning_rate": 1.941525419950923e-06, - "loss": 0.7993, - "step": 15932 - }, - { - "epoch": 0.41, - "learning_rate": 1.941516096253547e-06, - "loss": 1.0088, - "step": 15933 - }, - { - "epoch": 0.41, - "learning_rate": 1.9415067718352953e-06, - "loss": 0.8364, - "step": 15934 - }, - { - "epoch": 0.41, - "learning_rate": 1.9414974466961745e-06, - "loss": 0.7275, - "step": 15935 - }, - { - "epoch": 0.41, - "learning_rate": 1.9414881208361927e-06, - "loss": 0.9268, - "step": 15936 - }, - { - "epoch": 0.41, - "learning_rate": 1.941478794255357e-06, - "loss": 0.9043, - "step": 15937 - }, - { - "epoch": 0.41, - "learning_rate": 1.941469466953674e-06, - "loss": 1.0176, - "step": 15938 - }, - { - "epoch": 0.41, - "learning_rate": 1.9414601389311514e-06, - "loss": 0.7666, - "step": 15939 - }, - { - "epoch": 0.41, - "learning_rate": 1.9414508101877957e-06, - "loss": 0.9326, - "step": 15940 - }, - { - "epoch": 0.41, - "learning_rate": 1.9414414807236146e-06, - "loss": 1.043, - "step": 15941 - }, - { - "epoch": 0.41, - "learning_rate": 1.9414321505386152e-06, - "loss": 0.7437, - "step": 15942 - }, - { - "epoch": 0.41, - "learning_rate": 1.9414228196328044e-06, - "loss": 0.8555, - "step": 15943 - }, - { - "epoch": 0.41, - "learning_rate": 1.9414134880061892e-06, - "loss": 0.7119, - "step": 15944 - }, - { - "epoch": 0.41, - "learning_rate": 1.9414041556587774e-06, - "loss": 0.8857, - "step": 15945 - }, - { - "epoch": 0.41, - "learning_rate": 1.9413948225905753e-06, - "loss": 0.7412, - "step": 15946 - }, - { - "epoch": 0.41, - "learning_rate": 1.9413854888015905e-06, - "loss": 0.814, - "step": 15947 - }, - { - "epoch": 0.41, - "learning_rate": 1.9413761542918302e-06, - "loss": 0.8691, - "step": 15948 - }, - { - "epoch": 0.41, - "learning_rate": 1.9413668190613017e-06, - "loss": 0.7754, - "step": 15949 - }, - { - "epoch": 0.41, - "learning_rate": 1.941357483110012e-06, - "loss": 0.7749, - "step": 15950 - }, - { - "epoch": 0.41, - "learning_rate": 1.9413481464379676e-06, - "loss": 0.8477, - "step": 15951 - }, - { - "epoch": 0.41, - "learning_rate": 1.9413388090451765e-06, - "loss": 0.8223, - "step": 15952 - }, - { - "epoch": 0.41, - "learning_rate": 1.9413294709316455e-06, - "loss": 0.8057, - "step": 15953 - }, - { - "epoch": 0.41, - "learning_rate": 1.941320132097382e-06, - "loss": 0.8477, - "step": 15954 - }, - { - "epoch": 0.41, - "learning_rate": 1.941310792542393e-06, - "loss": 0.8525, - "step": 15955 - }, - { - "epoch": 0.41, - "learning_rate": 1.9413014522666855e-06, - "loss": 0.6921, - "step": 15956 - }, - { - "epoch": 0.41, - "learning_rate": 1.9412921112702664e-06, - "loss": 0.6348, - "step": 15957 - }, - { - "epoch": 0.41, - "learning_rate": 1.9412827695531434e-06, - "loss": 1.1006, - "step": 15958 - }, - { - "epoch": 0.41, - "learning_rate": 1.9412734271153238e-06, - "loss": 1.0205, - "step": 15959 - }, - { - "epoch": 0.41, - "learning_rate": 1.941264083956814e-06, - "loss": 0.9092, - "step": 15960 - }, - { - "epoch": 0.41, - "learning_rate": 1.941254740077622e-06, - "loss": 0.7095, - "step": 15961 - }, - { - "epoch": 0.41, - "learning_rate": 1.9412453954777543e-06, - "loss": 0.8555, - "step": 15962 - }, - { - "epoch": 0.41, - "learning_rate": 1.941236050157218e-06, - "loss": 0.7358, - "step": 15963 - }, - { - "epoch": 0.41, - "learning_rate": 1.941226704116021e-06, - "loss": 1.082, - "step": 15964 - }, - { - "epoch": 0.41, - "learning_rate": 1.94121735735417e-06, - "loss": 0.6201, - "step": 15965 - }, - { - "epoch": 0.41, - "learning_rate": 1.9412080098716717e-06, - "loss": 0.873, - "step": 15966 - }, - { - "epoch": 0.41, - "learning_rate": 1.941198661668534e-06, - "loss": 0.9258, - "step": 15967 - }, - { - "epoch": 0.41, - "learning_rate": 1.941189312744764e-06, - "loss": 0.9834, - "step": 15968 - }, - { - "epoch": 0.41, - "learning_rate": 1.941179963100368e-06, - "loss": 0.8467, - "step": 15969 - }, - { - "epoch": 0.41, - "learning_rate": 1.941170612735354e-06, - "loss": 0.9736, - "step": 15970 - }, - { - "epoch": 0.41, - "learning_rate": 1.9411612616497295e-06, - "loss": 0.6465, - "step": 15971 - }, - { - "epoch": 0.41, - "learning_rate": 1.9411519098435005e-06, - "loss": 0.9385, - "step": 15972 - }, - { - "epoch": 0.41, - "learning_rate": 1.9411425573166747e-06, - "loss": 0.8203, - "step": 15973 - }, - { - "epoch": 0.41, - "learning_rate": 1.9411332040692594e-06, - "loss": 1.001, - "step": 15974 - }, - { - "epoch": 0.41, - "learning_rate": 1.9411238501012618e-06, - "loss": 0.6553, - "step": 15975 - }, - { - "epoch": 0.41, - "learning_rate": 1.9411144954126894e-06, - "loss": 0.8867, - "step": 15976 - }, - { - "epoch": 0.41, - "learning_rate": 1.941105140003548e-06, - "loss": 0.7239, - "step": 15977 - }, - { - "epoch": 0.41, - "learning_rate": 1.9410957838738466e-06, - "loss": 0.8101, - "step": 15978 - }, - { - "epoch": 0.41, - "learning_rate": 1.9410864270235906e-06, - "loss": 1.0049, - "step": 15979 - }, - { - "epoch": 0.41, - "learning_rate": 1.9410770694527883e-06, - "loss": 0.9004, - "step": 15980 - }, - { - "epoch": 0.41, - "learning_rate": 1.941067711161447e-06, - "loss": 0.7715, - "step": 15981 - }, - { - "epoch": 0.41, - "learning_rate": 1.941058352149573e-06, - "loss": 1.0332, - "step": 15982 - }, - { - "epoch": 0.41, - "learning_rate": 1.9410489924171734e-06, - "loss": 0.8516, - "step": 15983 - }, - { - "epoch": 0.41, - "learning_rate": 1.941039631964257e-06, - "loss": 0.9111, - "step": 15984 - }, - { - "epoch": 0.41, - "learning_rate": 1.941030270790829e-06, - "loss": 0.8394, - "step": 15985 - }, - { - "epoch": 0.41, - "learning_rate": 1.9410209088968975e-06, - "loss": 0.5701, - "step": 15986 - }, - { - "epoch": 0.41, - "learning_rate": 1.9410115462824697e-06, - "loss": 0.9204, - "step": 15987 - }, - { - "epoch": 0.41, - "learning_rate": 1.9410021829475527e-06, - "loss": 0.791, - "step": 15988 - }, - { - "epoch": 0.41, - "learning_rate": 1.9409928188921533e-06, - "loss": 1.0283, - "step": 15989 - }, - { - "epoch": 0.41, - "learning_rate": 1.9409834541162795e-06, - "loss": 0.8682, - "step": 15990 - }, - { - "epoch": 0.41, - "learning_rate": 1.9409740886199372e-06, - "loss": 0.7988, - "step": 15991 - }, - { - "epoch": 0.41, - "learning_rate": 1.9409647224031346e-06, - "loss": 0.8604, - "step": 15992 - }, - { - "epoch": 0.41, - "learning_rate": 1.9409553554658788e-06, - "loss": 0.7778, - "step": 15993 - }, - { - "epoch": 0.41, - "learning_rate": 1.9409459878081766e-06, - "loss": 0.8867, - "step": 15994 - }, - { - "epoch": 0.41, - "learning_rate": 1.9409366194300355e-06, - "loss": 0.8281, - "step": 15995 - }, - { - "epoch": 0.41, - "learning_rate": 1.940927250331462e-06, - "loss": 0.9492, - "step": 15996 - }, - { - "epoch": 0.41, - "learning_rate": 1.9409178805124642e-06, - "loss": 0.6938, - "step": 15997 - }, - { - "epoch": 0.41, - "learning_rate": 1.9409085099730488e-06, - "loss": 1.0127, - "step": 15998 - }, - { - "epoch": 0.41, - "learning_rate": 1.940899138713223e-06, - "loss": 0.667, - "step": 15999 - }, - { - "epoch": 0.41, - "learning_rate": 1.9408897667329938e-06, - "loss": 0.9248, - "step": 16000 - }, - { - "epoch": 0.41, - "learning_rate": 1.9408803940323687e-06, - "loss": 0.8945, - "step": 16001 - }, - { - "epoch": 0.41, - "learning_rate": 1.940871020611355e-06, - "loss": 0.7178, - "step": 16002 - }, - { - "epoch": 0.41, - "learning_rate": 1.940861646469959e-06, - "loss": 0.8789, - "step": 16003 - }, - { - "epoch": 0.41, - "learning_rate": 1.9408522716081892e-06, - "loss": 0.7471, - "step": 16004 - }, - { - "epoch": 0.41, - "learning_rate": 1.940842896026052e-06, - "loss": 0.8623, - "step": 16005 - }, - { - "epoch": 0.41, - "learning_rate": 1.9408335197235544e-06, - "loss": 0.9746, - "step": 16006 - }, - { - "epoch": 0.41, - "learning_rate": 1.9408241427007036e-06, - "loss": 0.7969, - "step": 16007 - }, - { - "epoch": 0.41, - "learning_rate": 1.9408147649575075e-06, - "loss": 0.9385, - "step": 16008 - }, - { - "epoch": 0.41, - "learning_rate": 1.9408053864939722e-06, - "loss": 1.1387, - "step": 16009 - }, - { - "epoch": 0.41, - "learning_rate": 1.940796007310106e-06, - "loss": 0.8618, - "step": 16010 - }, - { - "epoch": 0.41, - "learning_rate": 1.9407866274059155e-06, - "loss": 0.9961, - "step": 16011 - }, - { - "epoch": 0.41, - "learning_rate": 1.9407772467814078e-06, - "loss": 0.8838, - "step": 16012 - }, - { - "epoch": 0.41, - "learning_rate": 1.9407678654365903e-06, - "loss": 0.8896, - "step": 16013 - }, - { - "epoch": 0.41, - "learning_rate": 1.94075848337147e-06, - "loss": 0.7031, - "step": 16014 - }, - { - "epoch": 0.41, - "learning_rate": 1.940749100586054e-06, - "loss": 0.7949, - "step": 16015 - }, - { - "epoch": 0.41, - "learning_rate": 1.9407397170803503e-06, - "loss": 0.9316, - "step": 16016 - }, - { - "epoch": 0.41, - "learning_rate": 1.940730332854365e-06, - "loss": 0.8711, - "step": 16017 - }, - { - "epoch": 0.41, - "learning_rate": 1.940720947908106e-06, - "loss": 0.6396, - "step": 16018 - }, - { - "epoch": 0.41, - "learning_rate": 1.94071156224158e-06, - "loss": 0.9912, - "step": 16019 - }, - { - "epoch": 0.41, - "learning_rate": 1.940702175854794e-06, - "loss": 1.0635, - "step": 16020 - }, - { - "epoch": 0.41, - "learning_rate": 1.940692788747756e-06, - "loss": 0.8984, - "step": 16021 - }, - { - "epoch": 0.41, - "learning_rate": 1.940683400920473e-06, - "loss": 0.7559, - "step": 16022 - }, - { - "epoch": 0.41, - "learning_rate": 1.940674012372952e-06, - "loss": 0.9717, - "step": 16023 - }, - { - "epoch": 0.41, - "learning_rate": 1.9406646231052e-06, - "loss": 0.8066, - "step": 16024 - }, - { - "epoch": 0.41, - "learning_rate": 1.9406552331172243e-06, - "loss": 0.6724, - "step": 16025 - }, - { - "epoch": 0.41, - "learning_rate": 1.9406458424090324e-06, - "loss": 0.9727, - "step": 16026 - }, - { - "epoch": 0.41, - "learning_rate": 1.9406364509806308e-06, - "loss": 0.8408, - "step": 16027 - }, - { - "epoch": 0.41, - "learning_rate": 1.940627058832027e-06, - "loss": 0.8027, - "step": 16028 - }, - { - "epoch": 0.41, - "learning_rate": 1.940617665963229e-06, - "loss": 0.5767, - "step": 16029 - }, - { - "epoch": 0.41, - "learning_rate": 1.940608272374243e-06, - "loss": 0.959, - "step": 16030 - }, - { - "epoch": 0.41, - "learning_rate": 1.9405988780650763e-06, - "loss": 0.876, - "step": 16031 - }, - { - "epoch": 0.41, - "learning_rate": 1.9405894830357365e-06, - "loss": 0.7454, - "step": 16032 - }, - { - "epoch": 0.41, - "learning_rate": 1.94058008728623e-06, - "loss": 0.9565, - "step": 16033 - }, - { - "epoch": 0.41, - "learning_rate": 1.9405706908165655e-06, - "loss": 0.9141, - "step": 16034 - }, - { - "epoch": 0.41, - "learning_rate": 1.9405612936267487e-06, - "loss": 0.8418, - "step": 16035 - }, - { - "epoch": 0.41, - "learning_rate": 1.940551895716788e-06, - "loss": 0.9785, - "step": 16036 - }, - { - "epoch": 0.41, - "learning_rate": 1.9405424970866894e-06, - "loss": 0.6899, - "step": 16037 - }, - { - "epoch": 0.41, - "learning_rate": 1.9405330977364604e-06, - "loss": 0.7812, - "step": 16038 - }, - { - "epoch": 0.41, - "learning_rate": 1.9405236976661086e-06, - "loss": 0.6511, - "step": 16039 - }, - { - "epoch": 0.41, - "learning_rate": 1.9405142968756416e-06, - "loss": 0.8428, - "step": 16040 - }, - { - "epoch": 0.41, - "learning_rate": 1.9405048953650657e-06, - "loss": 0.959, - "step": 16041 - }, - { - "epoch": 0.41, - "learning_rate": 1.940495493134388e-06, - "loss": 0.8613, - "step": 16042 - }, - { - "epoch": 0.41, - "learning_rate": 1.940486090183617e-06, - "loss": 1.0166, - "step": 16043 - }, - { - "epoch": 0.41, - "learning_rate": 1.9404766865127584e-06, - "loss": 0.7598, - "step": 16044 - }, - { - "epoch": 0.41, - "learning_rate": 1.9404672821218203e-06, - "loss": 0.7666, - "step": 16045 - }, - { - "epoch": 0.41, - "learning_rate": 1.9404578770108097e-06, - "loss": 0.7749, - "step": 16046 - }, - { - "epoch": 0.41, - "learning_rate": 1.940448471179734e-06, - "loss": 0.8994, - "step": 16047 - }, - { - "epoch": 0.41, - "learning_rate": 1.940439064628599e-06, - "loss": 0.9346, - "step": 16048 - }, - { - "epoch": 0.41, - "learning_rate": 1.940429657357414e-06, - "loss": 0.7847, - "step": 16049 - }, - { - "epoch": 0.41, - "learning_rate": 1.9404202493661852e-06, - "loss": 0.7871, - "step": 16050 - }, - { - "epoch": 0.41, - "learning_rate": 1.94041084065492e-06, - "loss": 0.8281, - "step": 16051 - }, - { - "epoch": 0.41, - "learning_rate": 1.940401431223625e-06, - "loss": 1.1279, - "step": 16052 - }, - { - "epoch": 0.41, - "learning_rate": 1.9403920210723085e-06, - "loss": 0.9258, - "step": 16053 - }, - { - "epoch": 0.41, - "learning_rate": 1.9403826102009763e-06, - "loss": 1.0078, - "step": 16054 - }, - { - "epoch": 0.41, - "learning_rate": 1.9403731986096368e-06, - "loss": 0.8491, - "step": 16055 - }, - { - "epoch": 0.41, - "learning_rate": 1.940363786298297e-06, - "loss": 0.8867, - "step": 16056 - }, - { - "epoch": 0.41, - "learning_rate": 1.9403543732669637e-06, - "loss": 1.0566, - "step": 16057 - }, - { - "epoch": 0.41, - "learning_rate": 1.9403449595156436e-06, - "loss": 1.167, - "step": 16058 - }, - { - "epoch": 0.41, - "learning_rate": 1.9403355450443455e-06, - "loss": 0.7607, - "step": 16059 - }, - { - "epoch": 0.41, - "learning_rate": 1.9403261298530754e-06, - "loss": 0.6968, - "step": 16060 - }, - { - "epoch": 0.41, - "learning_rate": 1.9403167139418408e-06, - "loss": 0.8799, - "step": 16061 - }, - { - "epoch": 0.41, - "learning_rate": 1.9403072973106493e-06, - "loss": 0.939, - "step": 16062 - }, - { - "epoch": 0.41, - "learning_rate": 1.940297879959507e-06, - "loss": 0.8447, - "step": 16063 - }, - { - "epoch": 0.41, - "learning_rate": 1.940288461888422e-06, - "loss": 1.0381, - "step": 16064 - }, - { - "epoch": 0.41, - "learning_rate": 1.940279043097402e-06, - "loss": 0.7891, - "step": 16065 - }, - { - "epoch": 0.41, - "learning_rate": 1.9402696235864533e-06, - "loss": 0.8066, - "step": 16066 - }, - { - "epoch": 0.41, - "learning_rate": 1.940260203355583e-06, - "loss": 0.9258, - "step": 16067 - }, - { - "epoch": 0.41, - "learning_rate": 1.9402507824047994e-06, - "loss": 0.8301, - "step": 16068 - }, - { - "epoch": 0.41, - "learning_rate": 1.9402413607341084e-06, - "loss": 1.1016, - "step": 16069 - }, - { - "epoch": 0.41, - "learning_rate": 1.940231938343518e-06, - "loss": 0.8584, - "step": 16070 - }, - { - "epoch": 0.41, - "learning_rate": 1.940222515233035e-06, - "loss": 0.7275, - "step": 16071 - }, - { - "epoch": 0.41, - "learning_rate": 1.9402130914026674e-06, - "loss": 0.8516, - "step": 16072 - }, - { - "epoch": 0.41, - "learning_rate": 1.9402036668524214e-06, - "loss": 0.8096, - "step": 16073 - }, - { - "epoch": 0.41, - "learning_rate": 1.940194241582305e-06, - "loss": 0.9688, - "step": 16074 - }, - { - "epoch": 0.41, - "learning_rate": 1.9401848155923252e-06, - "loss": 0.9648, - "step": 16075 - }, - { - "epoch": 0.41, - "learning_rate": 1.9401753888824886e-06, - "loss": 1.0215, - "step": 16076 - }, - { - "epoch": 0.41, - "learning_rate": 1.9401659614528032e-06, - "loss": 0.6963, - "step": 16077 - }, - { - "epoch": 0.41, - "learning_rate": 1.9401565333032758e-06, - "loss": 0.7368, - "step": 16078 - }, - { - "epoch": 0.41, - "learning_rate": 1.940147104433914e-06, - "loss": 0.833, - "step": 16079 - }, - { - "epoch": 0.41, - "learning_rate": 1.9401376748447247e-06, - "loss": 0.9004, - "step": 16080 - }, - { - "epoch": 0.41, - "learning_rate": 1.940128244535715e-06, - "loss": 0.6582, - "step": 16081 - }, - { - "epoch": 0.41, - "learning_rate": 1.9401188135068927e-06, - "loss": 0.6382, - "step": 16082 - }, - { - "epoch": 0.41, - "learning_rate": 1.9401093817582646e-06, - "loss": 0.7256, - "step": 16083 - }, - { - "epoch": 0.41, - "learning_rate": 1.9400999492898377e-06, - "loss": 0.7998, - "step": 16084 - }, - { - "epoch": 0.41, - "learning_rate": 1.94009051610162e-06, - "loss": 0.8086, - "step": 16085 - }, - { - "epoch": 0.41, - "learning_rate": 1.940081082193618e-06, - "loss": 0.7749, - "step": 16086 - }, - { - "epoch": 0.41, - "learning_rate": 1.9400716475658388e-06, - "loss": 0.8809, - "step": 16087 - }, - { - "epoch": 0.41, - "learning_rate": 1.94006221221829e-06, - "loss": 0.8975, - "step": 16088 - }, - { - "epoch": 0.41, - "learning_rate": 1.9400527761509795e-06, - "loss": 0.9805, - "step": 16089 - }, - { - "epoch": 0.41, - "learning_rate": 1.940043339363913e-06, - "loss": 0.8669, - "step": 16090 - }, - { - "epoch": 0.41, - "learning_rate": 1.9400339018570988e-06, - "loss": 0.8271, - "step": 16091 - }, - { - "epoch": 0.41, - "learning_rate": 1.940024463630544e-06, - "loss": 0.9805, - "step": 16092 - }, - { - "epoch": 0.41, - "learning_rate": 1.9400150246842556e-06, - "loss": 0.6475, - "step": 16093 - }, - { - "epoch": 0.41, - "learning_rate": 1.940005585018241e-06, - "loss": 0.9355, - "step": 16094 - }, - { - "epoch": 0.41, - "learning_rate": 1.939996144632507e-06, - "loss": 0.8428, - "step": 16095 - }, - { - "epoch": 0.41, - "learning_rate": 1.939986703527062e-06, - "loss": 0.9668, - "step": 16096 - }, - { - "epoch": 0.41, - "learning_rate": 1.9399772617019113e-06, - "loss": 0.9424, - "step": 16097 - }, - { - "epoch": 0.41, - "learning_rate": 1.939967819157064e-06, - "loss": 0.8037, - "step": 16098 - }, - { - "epoch": 0.41, - "learning_rate": 1.939958375892526e-06, - "loss": 1.0498, - "step": 16099 - }, - { - "epoch": 0.41, - "learning_rate": 1.9399489319083056e-06, - "loss": 0.9912, - "step": 16100 - }, - { - "epoch": 0.41, - "learning_rate": 1.9399394872044094e-06, - "loss": 0.9907, - "step": 16101 - }, - { - "epoch": 0.41, - "learning_rate": 1.939930041780845e-06, - "loss": 0.9341, - "step": 16102 - }, - { - "epoch": 0.41, - "learning_rate": 1.939920595637619e-06, - "loss": 0.9883, - "step": 16103 - }, - { - "epoch": 0.41, - "learning_rate": 1.939911148774739e-06, - "loss": 0.8462, - "step": 16104 - }, - { - "epoch": 0.41, - "learning_rate": 1.9399017011922125e-06, - "loss": 0.8047, - "step": 16105 - }, - { - "epoch": 0.41, - "learning_rate": 1.9398922528900462e-06, - "loss": 0.9678, - "step": 16106 - }, - { - "epoch": 0.41, - "learning_rate": 1.9398828038682476e-06, - "loss": 0.9902, - "step": 16107 - }, - { - "epoch": 0.41, - "learning_rate": 1.939873354126824e-06, - "loss": 1.1211, - "step": 16108 - }, - { - "epoch": 0.41, - "learning_rate": 1.939863903665783e-06, - "loss": 0.834, - "step": 16109 - }, - { - "epoch": 0.41, - "learning_rate": 1.939854452485131e-06, - "loss": 0.9434, - "step": 16110 - }, - { - "epoch": 0.41, - "learning_rate": 1.939845000584876e-06, - "loss": 0.9814, - "step": 16111 - }, - { - "epoch": 0.41, - "learning_rate": 1.939835547965025e-06, - "loss": 0.9502, - "step": 16112 - }, - { - "epoch": 0.41, - "learning_rate": 1.9398260946255847e-06, - "loss": 0.7705, - "step": 16113 - }, - { - "epoch": 0.41, - "learning_rate": 1.939816640566563e-06, - "loss": 0.7773, - "step": 16114 - }, - { - "epoch": 0.41, - "learning_rate": 1.9398071857879665e-06, - "loss": 0.915, - "step": 16115 - }, - { - "epoch": 0.41, - "learning_rate": 1.939797730289803e-06, - "loss": 0.9521, - "step": 16116 - }, - { - "epoch": 0.41, - "learning_rate": 1.93978827407208e-06, - "loss": 0.7598, - "step": 16117 - }, - { - "epoch": 0.41, - "learning_rate": 1.939778817134804e-06, - "loss": 0.8193, - "step": 16118 - }, - { - "epoch": 0.41, - "learning_rate": 1.9397693594779828e-06, - "loss": 1.0156, - "step": 16119 - }, - { - "epoch": 0.41, - "learning_rate": 1.9397599011016234e-06, - "loss": 0.8711, - "step": 16120 - }, - { - "epoch": 0.41, - "learning_rate": 1.9397504420057328e-06, - "loss": 0.8164, - "step": 16121 - }, - { - "epoch": 0.41, - "learning_rate": 1.9397409821903186e-06, - "loss": 0.6506, - "step": 16122 - }, - { - "epoch": 0.41, - "learning_rate": 1.9397315216553876e-06, - "loss": 0.709, - "step": 16123 - }, - { - "epoch": 0.41, - "learning_rate": 1.939722060400948e-06, - "loss": 0.8623, - "step": 16124 - }, - { - "epoch": 0.41, - "learning_rate": 1.9397125984270062e-06, - "loss": 1.0518, - "step": 16125 - }, - { - "epoch": 0.41, - "learning_rate": 1.93970313573357e-06, - "loss": 0.9268, - "step": 16126 - }, - { - "epoch": 0.41, - "learning_rate": 1.9396936723206458e-06, - "loss": 0.8311, - "step": 16127 - }, - { - "epoch": 0.41, - "learning_rate": 1.9396842081882414e-06, - "loss": 0.6217, - "step": 16128 - }, - { - "epoch": 0.41, - "learning_rate": 1.939674743336364e-06, - "loss": 1.082, - "step": 16129 - }, - { - "epoch": 0.41, - "learning_rate": 1.9396652777650215e-06, - "loss": 1.0273, - "step": 16130 - }, - { - "epoch": 0.41, - "learning_rate": 1.9396558114742196e-06, - "loss": 1.002, - "step": 16131 - }, - { - "epoch": 0.41, - "learning_rate": 1.939646344463967e-06, - "loss": 1.1289, - "step": 16132 - }, - { - "epoch": 0.41, - "learning_rate": 1.93963687673427e-06, - "loss": 0.8643, - "step": 16133 - }, - { - "epoch": 0.41, - "learning_rate": 1.9396274082851366e-06, - "loss": 0.8779, - "step": 16134 - }, - { - "epoch": 0.41, - "learning_rate": 1.9396179391165737e-06, - "loss": 1.041, - "step": 16135 - }, - { - "epoch": 0.41, - "learning_rate": 1.9396084692285885e-06, - "loss": 0.8564, - "step": 16136 - }, - { - "epoch": 0.41, - "learning_rate": 1.939598998621188e-06, - "loss": 1.0273, - "step": 16137 - }, - { - "epoch": 0.41, - "learning_rate": 1.93958952729438e-06, - "loss": 0.9316, - "step": 16138 - }, - { - "epoch": 0.41, - "learning_rate": 1.9395800552481715e-06, - "loss": 1.0762, - "step": 16139 - }, - { - "epoch": 0.41, - "learning_rate": 1.9395705824825697e-06, - "loss": 0.8662, - "step": 16140 - }, - { - "epoch": 0.41, - "learning_rate": 1.9395611089975824e-06, - "loss": 0.7734, - "step": 16141 - }, - { - "epoch": 0.41, - "learning_rate": 1.939551634793216e-06, - "loss": 0.8135, - "step": 16142 - }, - { - "epoch": 0.41, - "learning_rate": 1.939542159869478e-06, - "loss": 0.9824, - "step": 16143 - }, - { - "epoch": 0.41, - "learning_rate": 1.9395326842263757e-06, - "loss": 0.9629, - "step": 16144 - }, - { - "epoch": 0.41, - "learning_rate": 1.9395232078639167e-06, - "loss": 0.5957, - "step": 16145 - }, - { - "epoch": 0.41, - "learning_rate": 1.9395137307821073e-06, - "loss": 0.958, - "step": 16146 - }, - { - "epoch": 0.41, - "learning_rate": 1.939504252980956e-06, - "loss": 0.7803, - "step": 16147 - }, - { - "epoch": 0.41, - "learning_rate": 1.9394947744604697e-06, - "loss": 0.8447, - "step": 16148 - }, - { - "epoch": 0.41, - "learning_rate": 1.9394852952206554e-06, - "loss": 0.7744, - "step": 16149 - }, - { - "epoch": 0.41, - "learning_rate": 1.93947581526152e-06, - "loss": 1.1143, - "step": 16150 - }, - { - "epoch": 0.41, - "learning_rate": 1.939466334583071e-06, - "loss": 0.9238, - "step": 16151 - }, - { - "epoch": 0.41, - "learning_rate": 1.9394568531853167e-06, - "loss": 0.6982, - "step": 16152 - }, - { - "epoch": 0.41, - "learning_rate": 1.939447371068263e-06, - "loss": 0.751, - "step": 16153 - }, - { - "epoch": 0.41, - "learning_rate": 1.9394378882319174e-06, - "loss": 0.7041, - "step": 16154 - }, - { - "epoch": 0.41, - "learning_rate": 1.9394284046762878e-06, - "loss": 0.8594, - "step": 16155 - }, - { - "epoch": 0.41, - "learning_rate": 1.9394189204013806e-06, - "loss": 0.7983, - "step": 16156 - }, - { - "epoch": 0.41, - "learning_rate": 1.939409435407204e-06, - "loss": 0.8896, - "step": 16157 - }, - { - "epoch": 0.41, - "learning_rate": 1.9393999496937646e-06, - "loss": 0.7983, - "step": 16158 - }, - { - "epoch": 0.41, - "learning_rate": 1.9393904632610698e-06, - "loss": 1.0566, - "step": 16159 - }, - { - "epoch": 0.41, - "learning_rate": 1.939380976109127e-06, - "loss": 0.9214, - "step": 16160 - }, - { - "epoch": 0.41, - "learning_rate": 1.9393714882379433e-06, - "loss": 1.0518, - "step": 16161 - }, - { - "epoch": 0.41, - "learning_rate": 1.9393619996475265e-06, - "loss": 0.9424, - "step": 16162 - }, - { - "epoch": 0.41, - "learning_rate": 1.939352510337883e-06, - "loss": 0.9629, - "step": 16163 - }, - { - "epoch": 0.41, - "learning_rate": 1.93934302030902e-06, - "loss": 0.9688, - "step": 16164 - }, - { - "epoch": 0.41, - "learning_rate": 1.939333529560946e-06, - "loss": 0.9922, - "step": 16165 - }, - { - "epoch": 0.41, - "learning_rate": 1.9393240380936674e-06, - "loss": 0.7039, - "step": 16166 - }, - { - "epoch": 0.41, - "learning_rate": 1.9393145459071913e-06, - "loss": 0.9502, - "step": 16167 - }, - { - "epoch": 0.41, - "learning_rate": 1.9393050530015253e-06, - "loss": 0.9775, - "step": 16168 - }, - { - "epoch": 0.41, - "learning_rate": 1.9392955593766767e-06, - "loss": 0.8335, - "step": 16169 - }, - { - "epoch": 0.41, - "learning_rate": 1.9392860650326527e-06, - "loss": 0.8428, - "step": 16170 - }, - { - "epoch": 0.41, - "learning_rate": 1.9392765699694604e-06, - "loss": 0.7979, - "step": 16171 - }, - { - "epoch": 0.41, - "learning_rate": 1.9392670741871075e-06, - "loss": 0.9248, - "step": 16172 - }, - { - "epoch": 0.41, - "learning_rate": 1.9392575776856007e-06, - "loss": 1.1045, - "step": 16173 - }, - { - "epoch": 0.41, - "learning_rate": 1.9392480804649477e-06, - "loss": 0.9209, - "step": 16174 - }, - { - "epoch": 0.41, - "learning_rate": 1.9392385825251558e-06, - "loss": 0.9424, - "step": 16175 - }, - { - "epoch": 0.41, - "learning_rate": 1.939229083866232e-06, - "loss": 0.8369, - "step": 16176 - }, - { - "epoch": 0.41, - "learning_rate": 1.9392195844881835e-06, - "loss": 0.9111, - "step": 16177 - }, - { - "epoch": 0.41, - "learning_rate": 1.9392100843910177e-06, - "loss": 0.9746, - "step": 16178 - }, - { - "epoch": 0.41, - "learning_rate": 1.9392005835747425e-06, - "loss": 0.9629, - "step": 16179 - }, - { - "epoch": 0.41, - "learning_rate": 1.9391910820393638e-06, - "loss": 0.7764, - "step": 16180 - }, - { - "epoch": 0.41, - "learning_rate": 1.93918157978489e-06, - "loss": 0.626, - "step": 16181 - }, - { - "epoch": 0.41, - "learning_rate": 1.939172076811328e-06, - "loss": 1.0127, - "step": 16182 - }, - { - "epoch": 0.41, - "learning_rate": 1.9391625731186855e-06, - "loss": 0.9727, - "step": 16183 - }, - { - "epoch": 0.41, - "learning_rate": 1.939153068706969e-06, - "loss": 0.9424, - "step": 16184 - }, - { - "epoch": 0.41, - "learning_rate": 1.939143563576186e-06, - "loss": 0.9326, - "step": 16185 - }, - { - "epoch": 0.41, - "learning_rate": 1.9391340577263447e-06, - "loss": 0.9736, - "step": 16186 - }, - { - "epoch": 0.41, - "learning_rate": 1.939124551157451e-06, - "loss": 1.0088, - "step": 16187 - }, - { - "epoch": 0.41, - "learning_rate": 1.939115043869513e-06, - "loss": 0.9629, - "step": 16188 - }, - { - "epoch": 0.41, - "learning_rate": 1.939105535862538e-06, - "loss": 0.8926, - "step": 16189 - }, - { - "epoch": 0.41, - "learning_rate": 1.9390960271365327e-06, - "loss": 0.7881, - "step": 16190 - }, - { - "epoch": 0.41, - "learning_rate": 1.939086517691505e-06, - "loss": 1.0293, - "step": 16191 - }, - { - "epoch": 0.42, - "learning_rate": 1.9390770075274617e-06, - "loss": 0.8477, - "step": 16192 - }, - { - "epoch": 0.42, - "learning_rate": 1.9390674966444104e-06, - "loss": 1.0215, - "step": 16193 - }, - { - "epoch": 0.42, - "learning_rate": 1.939057985042358e-06, - "loss": 0.8506, - "step": 16194 - }, - { - "epoch": 0.42, - "learning_rate": 1.939048472721313e-06, - "loss": 0.6309, - "step": 16195 - }, - { - "epoch": 0.42, - "learning_rate": 1.9390389596812813e-06, - "loss": 0.9678, - "step": 16196 - }, - { - "epoch": 0.42, - "learning_rate": 1.93902944592227e-06, - "loss": 0.9971, - "step": 16197 - }, - { - "epoch": 0.42, - "learning_rate": 1.939019931444288e-06, - "loss": 0.8672, - "step": 16198 - }, - { - "epoch": 0.42, - "learning_rate": 1.939010416247341e-06, - "loss": 0.7041, - "step": 16199 - }, - { - "epoch": 0.42, - "learning_rate": 1.9390009003314375e-06, - "loss": 0.96, - "step": 16200 - }, - { - "epoch": 0.42, - "learning_rate": 1.9389913836965836e-06, - "loss": 1.0322, - "step": 16201 - }, - { - "epoch": 0.42, - "learning_rate": 1.938981866342787e-06, - "loss": 1.2598, - "step": 16202 - }, - { - "epoch": 0.42, - "learning_rate": 1.9389723482700558e-06, - "loss": 1.1055, - "step": 16203 - }, - { - "epoch": 0.42, - "learning_rate": 1.9389628294783963e-06, - "loss": 0.6641, - "step": 16204 - }, - { - "epoch": 0.42, - "learning_rate": 1.9389533099678164e-06, - "loss": 0.7363, - "step": 16205 - }, - { - "epoch": 0.42, - "learning_rate": 1.9389437897383227e-06, - "loss": 0.8721, - "step": 16206 - }, - { - "epoch": 0.42, - "learning_rate": 1.9389342687899234e-06, - "loss": 0.7832, - "step": 16207 - }, - { - "epoch": 0.42, - "learning_rate": 1.938924747122625e-06, - "loss": 0.9209, - "step": 16208 - }, - { - "epoch": 0.42, - "learning_rate": 1.938915224736435e-06, - "loss": 0.7065, - "step": 16209 - }, - { - "epoch": 0.42, - "learning_rate": 1.938905701631361e-06, - "loss": 0.8691, - "step": 16210 - }, - { - "epoch": 0.42, - "learning_rate": 1.9388961778074098e-06, - "loss": 0.9092, - "step": 16211 - }, - { - "epoch": 0.42, - "learning_rate": 1.9388866532645893e-06, - "loss": 0.8491, - "step": 16212 - }, - { - "epoch": 0.42, - "learning_rate": 1.9388771280029064e-06, - "loss": 0.9111, - "step": 16213 - }, - { - "epoch": 0.42, - "learning_rate": 1.9388676020223686e-06, - "loss": 0.7959, - "step": 16214 - }, - { - "epoch": 0.42, - "learning_rate": 1.938858075322983e-06, - "loss": 0.8779, - "step": 16215 - }, - { - "epoch": 0.42, - "learning_rate": 1.938848547904756e-06, - "loss": 0.8994, - "step": 16216 - }, - { - "epoch": 0.42, - "learning_rate": 1.938839019767697e-06, - "loss": 0.9492, - "step": 16217 - }, - { - "epoch": 0.42, - "learning_rate": 1.9388294909118115e-06, - "loss": 0.9365, - "step": 16218 - }, - { - "epoch": 0.42, - "learning_rate": 1.938819961337108e-06, - "loss": 1.2539, - "step": 16219 - }, - { - "epoch": 0.42, - "learning_rate": 1.9388104310435928e-06, - "loss": 0.8896, - "step": 16220 - }, - { - "epoch": 0.42, - "learning_rate": 1.9388009000312736e-06, - "loss": 0.7383, - "step": 16221 - }, - { - "epoch": 0.42, - "learning_rate": 1.938791368300158e-06, - "loss": 0.7891, - "step": 16222 - }, - { - "epoch": 0.42, - "learning_rate": 1.9387818358502528e-06, - "loss": 0.8701, - "step": 16223 - }, - { - "epoch": 0.42, - "learning_rate": 1.9387723026815656e-06, - "loss": 0.7666, - "step": 16224 - }, - { - "epoch": 0.42, - "learning_rate": 1.9387627687941036e-06, - "loss": 0.5518, - "step": 16225 - }, - { - "epoch": 0.42, - "learning_rate": 1.938753234187874e-06, - "loss": 1.0078, - "step": 16226 - }, - { - "epoch": 0.42, - "learning_rate": 1.9387436988628844e-06, - "loss": 0.7971, - "step": 16227 - }, - { - "epoch": 0.42, - "learning_rate": 1.9387341628191416e-06, - "loss": 0.8535, - "step": 16228 - }, - { - "epoch": 0.42, - "learning_rate": 1.9387246260566537e-06, - "loss": 0.8564, - "step": 16229 - }, - { - "epoch": 0.42, - "learning_rate": 1.938715088575427e-06, - "loss": 1.0996, - "step": 16230 - }, - { - "epoch": 0.42, - "learning_rate": 1.9387055503754696e-06, - "loss": 0.9229, - "step": 16231 - }, - { - "epoch": 0.42, - "learning_rate": 1.9386960114567886e-06, - "loss": 0.8379, - "step": 16232 - }, - { - "epoch": 0.42, - "learning_rate": 1.938686471819391e-06, - "loss": 0.8281, - "step": 16233 - }, - { - "epoch": 0.42, - "learning_rate": 1.9386769314632847e-06, - "loss": 0.8789, - "step": 16234 - }, - { - "epoch": 0.42, - "learning_rate": 1.9386673903884762e-06, - "loss": 0.6362, - "step": 16235 - }, - { - "epoch": 0.42, - "learning_rate": 1.9386578485949735e-06, - "loss": 0.9609, - "step": 16236 - }, - { - "epoch": 0.42, - "learning_rate": 1.9386483060827836e-06, - "loss": 0.8965, - "step": 16237 - }, - { - "epoch": 0.42, - "learning_rate": 1.9386387628519137e-06, - "loss": 0.7354, - "step": 16238 - }, - { - "epoch": 0.42, - "learning_rate": 1.9386292189023716e-06, - "loss": 0.791, - "step": 16239 - }, - { - "epoch": 0.42, - "learning_rate": 1.938619674234164e-06, - "loss": 0.9248, - "step": 16240 - }, - { - "epoch": 0.42, - "learning_rate": 1.9386101288472983e-06, - "loss": 1.0518, - "step": 16241 - }, - { - "epoch": 0.42, - "learning_rate": 1.9386005827417825e-06, - "loss": 1.0527, - "step": 16242 - }, - { - "epoch": 0.42, - "learning_rate": 1.938591035917623e-06, - "loss": 0.9258, - "step": 16243 - }, - { - "epoch": 0.42, - "learning_rate": 1.9385814883748275e-06, - "loss": 1.0596, - "step": 16244 - }, - { - "epoch": 0.42, - "learning_rate": 1.9385719401134035e-06, - "loss": 0.7979, - "step": 16245 - }, - { - "epoch": 0.42, - "learning_rate": 1.938562391133358e-06, - "loss": 0.9038, - "step": 16246 - }, - { - "epoch": 0.42, - "learning_rate": 1.9385528414346985e-06, - "loss": 0.5918, - "step": 16247 - }, - { - "epoch": 0.42, - "learning_rate": 1.938543291017432e-06, - "loss": 0.8662, - "step": 16248 - }, - { - "epoch": 0.42, - "learning_rate": 1.9385337398815663e-06, - "loss": 0.7078, - "step": 16249 - }, - { - "epoch": 0.42, - "learning_rate": 1.9385241880271087e-06, - "loss": 0.9561, - "step": 16250 - }, - { - "epoch": 0.42, - "learning_rate": 1.938514635454066e-06, - "loss": 0.7456, - "step": 16251 - }, - { - "epoch": 0.42, - "learning_rate": 1.938505082162446e-06, - "loss": 0.7188, - "step": 16252 - }, - { - "epoch": 0.42, - "learning_rate": 1.938495528152255e-06, - "loss": 1.0332, - "step": 16253 - }, - { - "epoch": 0.42, - "learning_rate": 1.938485973423502e-06, - "loss": 0.8013, - "step": 16254 - }, - { - "epoch": 0.42, - "learning_rate": 1.9384764179761932e-06, - "loss": 0.9355, - "step": 16255 - }, - { - "epoch": 0.42, - "learning_rate": 1.9384668618103362e-06, - "loss": 0.4963, - "step": 16256 - }, - { - "epoch": 0.42, - "learning_rate": 1.938457304925938e-06, - "loss": 0.8853, - "step": 16257 - }, - { - "epoch": 0.42, - "learning_rate": 1.9384477473230067e-06, - "loss": 0.7139, - "step": 16258 - }, - { - "epoch": 0.42, - "learning_rate": 1.9384381890015487e-06, - "loss": 0.9805, - "step": 16259 - }, - { - "epoch": 0.42, - "learning_rate": 1.938428629961572e-06, - "loss": 0.8584, - "step": 16260 - }, - { - "epoch": 0.42, - "learning_rate": 1.9384190702030836e-06, - "loss": 0.7246, - "step": 16261 - }, - { - "epoch": 0.42, - "learning_rate": 1.9384095097260906e-06, - "loss": 0.8486, - "step": 16262 - }, - { - "epoch": 0.42, - "learning_rate": 1.938399948530601e-06, - "loss": 0.7969, - "step": 16263 - }, - { - "epoch": 0.42, - "learning_rate": 1.9383903866166214e-06, - "loss": 0.8105, - "step": 16264 - }, - { - "epoch": 0.42, - "learning_rate": 1.9383808239841595e-06, - "loss": 1.0781, - "step": 16265 - }, - { - "epoch": 0.42, - "learning_rate": 1.9383712606332226e-06, - "loss": 0.9727, - "step": 16266 - }, - { - "epoch": 0.42, - "learning_rate": 1.938361696563818e-06, - "loss": 0.9219, - "step": 16267 - }, - { - "epoch": 0.42, - "learning_rate": 1.938352131775953e-06, - "loss": 0.7642, - "step": 16268 - }, - { - "epoch": 0.42, - "learning_rate": 1.9383425662696345e-06, - "loss": 0.6172, - "step": 16269 - }, - { - "epoch": 0.42, - "learning_rate": 1.9383330000448707e-06, - "loss": 1.0244, - "step": 16270 - }, - { - "epoch": 0.42, - "learning_rate": 1.9383234331016684e-06, - "loss": 0.8877, - "step": 16271 - }, - { - "epoch": 0.42, - "learning_rate": 1.9383138654400352e-06, - "loss": 0.7549, - "step": 16272 - }, - { - "epoch": 0.42, - "learning_rate": 1.938304297059978e-06, - "loss": 1.0107, - "step": 16273 - }, - { - "epoch": 0.42, - "learning_rate": 1.938294727961504e-06, - "loss": 0.9307, - "step": 16274 - }, - { - "epoch": 0.42, - "learning_rate": 1.9382851581446214e-06, - "loss": 0.7065, - "step": 16275 - }, - { - "epoch": 0.42, - "learning_rate": 1.9382755876093367e-06, - "loss": 0.7327, - "step": 16276 - }, - { - "epoch": 0.42, - "learning_rate": 1.938266016355658e-06, - "loss": 1.0459, - "step": 16277 - }, - { - "epoch": 0.42, - "learning_rate": 1.9382564443835913e-06, - "loss": 0.9297, - "step": 16278 - }, - { - "epoch": 0.42, - "learning_rate": 1.9382468716931455e-06, - "loss": 1.0977, - "step": 16279 - }, - { - "epoch": 0.42, - "learning_rate": 1.938237298284327e-06, - "loss": 0.7852, - "step": 16280 - }, - { - "epoch": 0.42, - "learning_rate": 1.938227724157143e-06, - "loss": 0.9277, - "step": 16281 - }, - { - "epoch": 0.42, - "learning_rate": 1.938218149311602e-06, - "loss": 0.9072, - "step": 16282 - }, - { - "epoch": 0.42, - "learning_rate": 1.9382085737477094e-06, - "loss": 1.0801, - "step": 16283 - }, - { - "epoch": 0.42, - "learning_rate": 1.9381989974654742e-06, - "loss": 1.0674, - "step": 16284 - }, - { - "epoch": 0.42, - "learning_rate": 1.938189420464903e-06, - "loss": 0.7109, - "step": 16285 - }, - { - "epoch": 0.42, - "learning_rate": 1.938179842746004e-06, - "loss": 0.8359, - "step": 16286 - }, - { - "epoch": 0.42, - "learning_rate": 1.9381702643087834e-06, - "loss": 1.2227, - "step": 16287 - }, - { - "epoch": 0.42, - "learning_rate": 1.9381606851532485e-06, - "loss": 0.9307, - "step": 16288 - }, - { - "epoch": 0.42, - "learning_rate": 1.9381511052794077e-06, - "loss": 0.8936, - "step": 16289 - }, - { - "epoch": 0.42, - "learning_rate": 1.9381415246872673e-06, - "loss": 0.7271, - "step": 16290 - }, - { - "epoch": 0.42, - "learning_rate": 1.9381319433768357e-06, - "loss": 0.9961, - "step": 16291 - }, - { - "epoch": 0.42, - "learning_rate": 1.938122361348119e-06, - "loss": 0.7822, - "step": 16292 - }, - { - "epoch": 0.42, - "learning_rate": 1.938112778601125e-06, - "loss": 0.8945, - "step": 16293 - }, - { - "epoch": 0.42, - "learning_rate": 1.938103195135862e-06, - "loss": 0.833, - "step": 16294 - }, - { - "epoch": 0.42, - "learning_rate": 1.9380936109523357e-06, - "loss": 1.0117, - "step": 16295 - }, - { - "epoch": 0.42, - "learning_rate": 1.9380840260505547e-06, - "loss": 0.8408, - "step": 16296 - }, - { - "epoch": 0.42, - "learning_rate": 1.938074440430526e-06, - "loss": 1.001, - "step": 16297 - }, - { - "epoch": 0.42, - "learning_rate": 1.938064854092256e-06, - "loss": 0.9971, - "step": 16298 - }, - { - "epoch": 0.42, - "learning_rate": 1.938055267035754e-06, - "loss": 0.8872, - "step": 16299 - }, - { - "epoch": 0.42, - "learning_rate": 1.9380456792610256e-06, - "loss": 0.9482, - "step": 16300 - }, - { - "epoch": 0.42, - "learning_rate": 1.938036090768079e-06, - "loss": 0.7734, - "step": 16301 - }, - { - "epoch": 0.42, - "learning_rate": 1.938026501556921e-06, - "loss": 0.9033, - "step": 16302 - }, - { - "epoch": 0.42, - "learning_rate": 1.9380169116275595e-06, - "loss": 0.9062, - "step": 16303 - }, - { - "epoch": 0.42, - "learning_rate": 1.9380073209800012e-06, - "loss": 0.8809, - "step": 16304 - }, - { - "epoch": 0.42, - "learning_rate": 1.9379977296142544e-06, - "loss": 0.8047, - "step": 16305 - }, - { - "epoch": 0.42, - "learning_rate": 1.9379881375303256e-06, - "loss": 0.4932, - "step": 16306 - }, - { - "epoch": 0.42, - "learning_rate": 1.937978544728222e-06, - "loss": 0.8438, - "step": 16307 - }, - { - "epoch": 0.42, - "learning_rate": 1.937968951207952e-06, - "loss": 0.8813, - "step": 16308 - }, - { - "epoch": 0.42, - "learning_rate": 1.9379593569695222e-06, - "loss": 0.7427, - "step": 16309 - }, - { - "epoch": 0.42, - "learning_rate": 1.93794976201294e-06, - "loss": 0.873, - "step": 16310 - }, - { - "epoch": 0.42, - "learning_rate": 1.9379401663382125e-06, - "loss": 0.8857, - "step": 16311 - }, - { - "epoch": 0.42, - "learning_rate": 1.9379305699453476e-06, - "loss": 0.9922, - "step": 16312 - }, - { - "epoch": 0.42, - "learning_rate": 1.9379209728343524e-06, - "loss": 0.9473, - "step": 16313 - }, - { - "epoch": 0.42, - "learning_rate": 1.9379113750052342e-06, - "loss": 0.918, - "step": 16314 - }, - { - "epoch": 0.42, - "learning_rate": 1.9379017764580002e-06, - "loss": 1.0127, - "step": 16315 - }, - { - "epoch": 0.42, - "learning_rate": 1.937892177192658e-06, - "loss": 1.0918, - "step": 16316 - }, - { - "epoch": 0.42, - "learning_rate": 1.937882577209215e-06, - "loss": 0.6914, - "step": 16317 - }, - { - "epoch": 0.42, - "learning_rate": 1.937872976507679e-06, - "loss": 0.9219, - "step": 16318 - }, - { - "epoch": 0.42, - "learning_rate": 1.9378633750880558e-06, - "loss": 0.9385, - "step": 16319 - }, - { - "epoch": 0.42, - "learning_rate": 1.937853772950354e-06, - "loss": 0.7764, - "step": 16320 - }, - { - "epoch": 0.42, - "learning_rate": 1.937844170094581e-06, - "loss": 0.8286, - "step": 16321 - }, - { - "epoch": 0.42, - "learning_rate": 1.9378345665207437e-06, - "loss": 0.8086, - "step": 16322 - }, - { - "epoch": 0.42, - "learning_rate": 1.9378249622288493e-06, - "loss": 0.9023, - "step": 16323 - }, - { - "epoch": 0.42, - "learning_rate": 1.937815357218906e-06, - "loss": 0.9248, - "step": 16324 - }, - { - "epoch": 0.42, - "learning_rate": 1.93780575149092e-06, - "loss": 0.9316, - "step": 16325 - }, - { - "epoch": 0.42, - "learning_rate": 1.9377961450448997e-06, - "loss": 0.6943, - "step": 16326 - }, - { - "epoch": 0.42, - "learning_rate": 1.937786537880852e-06, - "loss": 0.8252, - "step": 16327 - }, - { - "epoch": 0.42, - "learning_rate": 1.937776929998784e-06, - "loss": 0.8975, - "step": 16328 - }, - { - "epoch": 0.42, - "learning_rate": 1.9377673213987037e-06, - "loss": 0.8877, - "step": 16329 - }, - { - "epoch": 0.42, - "learning_rate": 1.937757712080618e-06, - "loss": 0.9414, - "step": 16330 - }, - { - "epoch": 0.42, - "learning_rate": 1.937748102044534e-06, - "loss": 0.8066, - "step": 16331 - }, - { - "epoch": 0.42, - "learning_rate": 1.93773849129046e-06, - "loss": 0.917, - "step": 16332 - }, - { - "epoch": 0.42, - "learning_rate": 1.937728879818402e-06, - "loss": 0.9688, - "step": 16333 - }, - { - "epoch": 0.42, - "learning_rate": 1.9377192676283686e-06, - "loss": 0.7866, - "step": 16334 - }, - { - "epoch": 0.42, - "learning_rate": 1.9377096547203665e-06, - "loss": 0.9512, - "step": 16335 - }, - { - "epoch": 0.42, - "learning_rate": 1.9377000410944032e-06, - "loss": 1.0742, - "step": 16336 - }, - { - "epoch": 0.42, - "learning_rate": 1.937690426750486e-06, - "loss": 0.9736, - "step": 16337 - }, - { - "epoch": 0.42, - "learning_rate": 1.9376808116886226e-06, - "loss": 0.543, - "step": 16338 - }, - { - "epoch": 0.42, - "learning_rate": 1.93767119590882e-06, - "loss": 0.8428, - "step": 16339 - }, - { - "epoch": 0.42, - "learning_rate": 1.9376615794110856e-06, - "loss": 0.8369, - "step": 16340 - }, - { - "epoch": 0.42, - "learning_rate": 1.937651962195427e-06, - "loss": 0.8369, - "step": 16341 - }, - { - "epoch": 0.42, - "learning_rate": 1.9376423442618515e-06, - "loss": 0.855, - "step": 16342 - }, - { - "epoch": 0.42, - "learning_rate": 1.9376327256103663e-06, - "loss": 0.709, - "step": 16343 - }, - { - "epoch": 0.42, - "learning_rate": 1.937623106240979e-06, - "loss": 0.8467, - "step": 16344 - }, - { - "epoch": 0.42, - "learning_rate": 1.9376134861536966e-06, - "loss": 1.0439, - "step": 16345 - }, - { - "epoch": 0.42, - "learning_rate": 1.9376038653485263e-06, - "loss": 0.9551, - "step": 16346 - }, - { - "epoch": 0.42, - "learning_rate": 1.9375942438254762e-06, - "loss": 1.0254, - "step": 16347 - }, - { - "epoch": 0.42, - "learning_rate": 1.9375846215845534e-06, - "loss": 0.9004, - "step": 16348 - }, - { - "epoch": 0.42, - "learning_rate": 1.937574998625765e-06, - "loss": 0.874, - "step": 16349 - }, - { - "epoch": 0.42, - "learning_rate": 1.9375653749491185e-06, - "loss": 0.874, - "step": 16350 - }, - { - "epoch": 0.42, - "learning_rate": 1.9375557505546216e-06, - "loss": 0.5724, - "step": 16351 - }, - { - "epoch": 0.42, - "learning_rate": 1.9375461254422812e-06, - "loss": 0.8584, - "step": 16352 - }, - { - "epoch": 0.42, - "learning_rate": 1.9375364996121046e-06, - "loss": 0.9053, - "step": 16353 - }, - { - "epoch": 0.42, - "learning_rate": 1.9375268730640997e-06, - "loss": 0.7891, - "step": 16354 - }, - { - "epoch": 0.42, - "learning_rate": 1.9375172457982733e-06, - "loss": 0.8408, - "step": 16355 - }, - { - "epoch": 0.42, - "learning_rate": 1.9375076178146336e-06, - "loss": 1.3535, - "step": 16356 - }, - { - "epoch": 0.42, - "learning_rate": 1.9374979891131868e-06, - "loss": 0.8872, - "step": 16357 - }, - { - "epoch": 0.42, - "learning_rate": 1.9374883596939414e-06, - "loss": 0.9697, - "step": 16358 - }, - { - "epoch": 0.42, - "learning_rate": 1.937478729556904e-06, - "loss": 1.0674, - "step": 16359 - }, - { - "epoch": 0.42, - "learning_rate": 1.937469098702082e-06, - "loss": 0.8516, - "step": 16360 - }, - { - "epoch": 0.42, - "learning_rate": 1.9374594671294835e-06, - "loss": 0.9521, - "step": 16361 - }, - { - "epoch": 0.42, - "learning_rate": 1.937449834839115e-06, - "loss": 0.9092, - "step": 16362 - }, - { - "epoch": 0.42, - "learning_rate": 1.937440201830985e-06, - "loss": 1.0449, - "step": 16363 - }, - { - "epoch": 0.42, - "learning_rate": 1.9374305681050992e-06, - "loss": 0.7446, - "step": 16364 - }, - { - "epoch": 0.42, - "learning_rate": 1.937420933661466e-06, - "loss": 1.0947, - "step": 16365 - }, - { - "epoch": 0.42, - "learning_rate": 1.9374112985000933e-06, - "loss": 0.7822, - "step": 16366 - }, - { - "epoch": 0.42, - "learning_rate": 1.9374016626209876e-06, - "loss": 0.9541, - "step": 16367 - }, - { - "epoch": 0.42, - "learning_rate": 1.9373920260241565e-06, - "loss": 0.8633, - "step": 16368 - }, - { - "epoch": 0.42, - "learning_rate": 1.9373823887096073e-06, - "loss": 0.7285, - "step": 16369 - }, - { - "epoch": 0.42, - "learning_rate": 1.937372750677348e-06, - "loss": 0.8652, - "step": 16370 - }, - { - "epoch": 0.42, - "learning_rate": 1.937363111927385e-06, - "loss": 0.7041, - "step": 16371 - }, - { - "epoch": 0.42, - "learning_rate": 1.9373534724597264e-06, - "loss": 0.8584, - "step": 16372 - }, - { - "epoch": 0.42, - "learning_rate": 1.937343832274379e-06, - "loss": 0.9004, - "step": 16373 - }, - { - "epoch": 0.42, - "learning_rate": 1.9373341913713512e-06, - "loss": 0.792, - "step": 16374 - }, - { - "epoch": 0.42, - "learning_rate": 1.937324549750649e-06, - "loss": 1.0029, - "step": 16375 - }, - { - "epoch": 0.42, - "learning_rate": 1.937314907412281e-06, - "loss": 0.7939, - "step": 16376 - }, - { - "epoch": 0.42, - "learning_rate": 1.937305264356254e-06, - "loss": 0.8076, - "step": 16377 - }, - { - "epoch": 0.42, - "learning_rate": 1.937295620582575e-06, - "loss": 0.7949, - "step": 16378 - }, - { - "epoch": 0.42, - "learning_rate": 1.937285976091252e-06, - "loss": 0.9609, - "step": 16379 - }, - { - "epoch": 0.42, - "learning_rate": 1.9372763308822928e-06, - "loss": 0.9375, - "step": 16380 - }, - { - "epoch": 0.42, - "learning_rate": 1.937266684955704e-06, - "loss": 0.9609, - "step": 16381 - }, - { - "epoch": 0.42, - "learning_rate": 1.937257038311493e-06, - "loss": 0.9844, - "step": 16382 - }, - { - "epoch": 0.42, - "learning_rate": 1.937247390949667e-06, - "loss": 0.9443, - "step": 16383 - }, - { - "epoch": 0.42, - "learning_rate": 1.937237742870234e-06, - "loss": 0.6528, - "step": 16384 - }, - { - "epoch": 0.42, - "learning_rate": 1.9372280940732013e-06, - "loss": 0.8223, - "step": 16385 - }, - { - "epoch": 0.42, - "learning_rate": 1.9372184445585766e-06, - "loss": 0.6265, - "step": 16386 - }, - { - "epoch": 0.42, - "learning_rate": 1.9372087943263662e-06, - "loss": 0.8867, - "step": 16387 - }, - { - "epoch": 0.42, - "learning_rate": 1.9371991433765784e-06, - "loss": 1.0742, - "step": 16388 - }, - { - "epoch": 0.42, - "learning_rate": 1.93718949170922e-06, - "loss": 1.0146, - "step": 16389 - }, - { - "epoch": 0.42, - "learning_rate": 1.937179839324299e-06, - "loss": 0.7471, - "step": 16390 - }, - { - "epoch": 0.42, - "learning_rate": 1.937170186221822e-06, - "loss": 0.7603, - "step": 16391 - }, - { - "epoch": 0.42, - "learning_rate": 1.9371605324017975e-06, - "loss": 0.959, - "step": 16392 - }, - { - "epoch": 0.42, - "learning_rate": 1.9371508778642322e-06, - "loss": 0.8438, - "step": 16393 - }, - { - "epoch": 0.42, - "learning_rate": 1.9371412226091335e-06, - "loss": 0.8818, - "step": 16394 - }, - { - "epoch": 0.42, - "learning_rate": 1.937131566636509e-06, - "loss": 1.2051, - "step": 16395 - }, - { - "epoch": 0.42, - "learning_rate": 1.9371219099463656e-06, - "loss": 1.0674, - "step": 16396 - }, - { - "epoch": 0.42, - "learning_rate": 1.9371122525387113e-06, - "loss": 0.8477, - "step": 16397 - }, - { - "epoch": 0.42, - "learning_rate": 1.9371025944135528e-06, - "loss": 0.9883, - "step": 16398 - }, - { - "epoch": 0.42, - "learning_rate": 1.9370929355708985e-06, - "loss": 0.9668, - "step": 16399 - }, - { - "epoch": 0.42, - "learning_rate": 1.937083276010755e-06, - "loss": 0.6943, - "step": 16400 - }, - { - "epoch": 0.42, - "learning_rate": 1.9370736157331296e-06, - "loss": 1.0137, - "step": 16401 - }, - { - "epoch": 0.42, - "learning_rate": 1.9370639547380303e-06, - "loss": 0.8032, - "step": 16402 - }, - { - "epoch": 0.42, - "learning_rate": 1.937054293025464e-06, - "loss": 1.0381, - "step": 16403 - }, - { - "epoch": 0.42, - "learning_rate": 1.937044630595439e-06, - "loss": 0.9902, - "step": 16404 - }, - { - "epoch": 0.42, - "learning_rate": 1.937034967447961e-06, - "loss": 1.0859, - "step": 16405 - }, - { - "epoch": 0.42, - "learning_rate": 1.9370253035830393e-06, - "loss": 1.0586, - "step": 16406 - }, - { - "epoch": 0.42, - "learning_rate": 1.93701563900068e-06, - "loss": 0.9326, - "step": 16407 - }, - { - "epoch": 0.42, - "learning_rate": 1.937005973700891e-06, - "loss": 0.917, - "step": 16408 - }, - { - "epoch": 0.42, - "learning_rate": 1.9369963076836798e-06, - "loss": 0.9111, - "step": 16409 - }, - { - "epoch": 0.42, - "learning_rate": 1.9369866409490535e-06, - "loss": 0.9248, - "step": 16410 - }, - { - "epoch": 0.42, - "learning_rate": 1.9369769734970195e-06, - "loss": 0.8047, - "step": 16411 - }, - { - "epoch": 0.42, - "learning_rate": 1.936967305327585e-06, - "loss": 0.9014, - "step": 16412 - }, - { - "epoch": 0.42, - "learning_rate": 1.936957636440758e-06, - "loss": 0.9565, - "step": 16413 - }, - { - "epoch": 0.42, - "learning_rate": 1.936947966836546e-06, - "loss": 0.8826, - "step": 16414 - }, - { - "epoch": 0.42, - "learning_rate": 1.936938296514956e-06, - "loss": 0.8105, - "step": 16415 - }, - { - "epoch": 0.42, - "learning_rate": 1.936928625475995e-06, - "loss": 0.9473, - "step": 16416 - }, - { - "epoch": 0.42, - "learning_rate": 1.9369189537196706e-06, - "loss": 0.7529, - "step": 16417 - }, - { - "epoch": 0.42, - "learning_rate": 1.936909281245991e-06, - "loss": 0.9678, - "step": 16418 - }, - { - "epoch": 0.42, - "learning_rate": 1.9368996080549626e-06, - "loss": 1.0078, - "step": 16419 - }, - { - "epoch": 0.42, - "learning_rate": 1.9368899341465936e-06, - "loss": 0.6216, - "step": 16420 - }, - { - "epoch": 0.42, - "learning_rate": 1.936880259520891e-06, - "loss": 0.8506, - "step": 16421 - }, - { - "epoch": 0.42, - "learning_rate": 1.936870584177862e-06, - "loss": 0.9131, - "step": 16422 - }, - { - "epoch": 0.42, - "learning_rate": 1.9368609081175145e-06, - "loss": 0.8926, - "step": 16423 - }, - { - "epoch": 0.42, - "learning_rate": 1.936851231339856e-06, - "loss": 0.9062, - "step": 16424 - }, - { - "epoch": 0.42, - "learning_rate": 1.936841553844893e-06, - "loss": 0.833, - "step": 16425 - }, - { - "epoch": 0.42, - "learning_rate": 1.936831875632634e-06, - "loss": 0.877, - "step": 16426 - }, - { - "epoch": 0.42, - "learning_rate": 1.9368221967030855e-06, - "loss": 0.9307, - "step": 16427 - }, - { - "epoch": 0.42, - "learning_rate": 1.9368125170562555e-06, - "loss": 0.8438, - "step": 16428 - }, - { - "epoch": 0.42, - "learning_rate": 1.9368028366921512e-06, - "loss": 0.8623, - "step": 16429 - }, - { - "epoch": 0.42, - "learning_rate": 1.93679315561078e-06, - "loss": 1.0645, - "step": 16430 - }, - { - "epoch": 0.42, - "learning_rate": 1.9367834738121495e-06, - "loss": 0.7607, - "step": 16431 - }, - { - "epoch": 0.42, - "learning_rate": 1.936773791296267e-06, - "loss": 0.772, - "step": 16432 - }, - { - "epoch": 0.42, - "learning_rate": 1.93676410806314e-06, - "loss": 0.9062, - "step": 16433 - }, - { - "epoch": 0.42, - "learning_rate": 1.9367544241127753e-06, - "loss": 1.0889, - "step": 16434 - }, - { - "epoch": 0.42, - "learning_rate": 1.936744739445181e-06, - "loss": 0.6614, - "step": 16435 - }, - { - "epoch": 0.42, - "learning_rate": 1.9367350540603646e-06, - "loss": 1.0059, - "step": 16436 - }, - { - "epoch": 0.42, - "learning_rate": 1.936725367958333e-06, - "loss": 0.8516, - "step": 16437 - }, - { - "epoch": 0.42, - "learning_rate": 1.936715681139094e-06, - "loss": 0.689, - "step": 16438 - }, - { - "epoch": 0.42, - "learning_rate": 1.9367059936026547e-06, - "loss": 0.7466, - "step": 16439 - }, - { - "epoch": 0.42, - "learning_rate": 1.9366963053490225e-06, - "loss": 0.7026, - "step": 16440 - }, - { - "epoch": 0.42, - "learning_rate": 1.936686616378205e-06, - "loss": 0.9014, - "step": 16441 - }, - { - "epoch": 0.42, - "learning_rate": 1.9366769266902103e-06, - "loss": 0.7166, - "step": 16442 - }, - { - "epoch": 0.42, - "learning_rate": 1.9366672362850446e-06, - "loss": 0.8594, - "step": 16443 - }, - { - "epoch": 0.42, - "learning_rate": 1.936657545162716e-06, - "loss": 0.7812, - "step": 16444 - }, - { - "epoch": 0.42, - "learning_rate": 1.9366478533232317e-06, - "loss": 0.7522, - "step": 16445 - }, - { - "epoch": 0.42, - "learning_rate": 1.9366381607665993e-06, - "loss": 1.0508, - "step": 16446 - }, - { - "epoch": 0.42, - "learning_rate": 1.9366284674928265e-06, - "loss": 0.6899, - "step": 16447 - }, - { - "epoch": 0.42, - "learning_rate": 1.93661877350192e-06, - "loss": 0.7905, - "step": 16448 - }, - { - "epoch": 0.42, - "learning_rate": 1.9366090787938875e-06, - "loss": 1.0215, - "step": 16449 - }, - { - "epoch": 0.42, - "learning_rate": 1.9365993833687365e-06, - "loss": 0.9336, - "step": 16450 - }, - { - "epoch": 0.42, - "learning_rate": 1.9365896872264744e-06, - "loss": 0.8623, - "step": 16451 - }, - { - "epoch": 0.42, - "learning_rate": 1.9365799903671086e-06, - "loss": 0.5508, - "step": 16452 - }, - { - "epoch": 0.42, - "learning_rate": 1.936570292790647e-06, - "loss": 0.6494, - "step": 16453 - }, - { - "epoch": 0.42, - "learning_rate": 1.936560594497096e-06, - "loss": 1.0215, - "step": 16454 - }, - { - "epoch": 0.42, - "learning_rate": 1.936550895486464e-06, - "loss": 0.7808, - "step": 16455 - }, - { - "epoch": 0.42, - "learning_rate": 1.9365411957587578e-06, - "loss": 1.0625, - "step": 16456 - }, - { - "epoch": 0.42, - "learning_rate": 1.9365314953139854e-06, - "loss": 0.7656, - "step": 16457 - }, - { - "epoch": 0.42, - "learning_rate": 1.9365217941521535e-06, - "loss": 0.9258, - "step": 16458 - }, - { - "epoch": 0.42, - "learning_rate": 1.9365120922732704e-06, - "loss": 0.9062, - "step": 16459 - }, - { - "epoch": 0.42, - "learning_rate": 1.9365023896773423e-06, - "loss": 1.1445, - "step": 16460 - }, - { - "epoch": 0.42, - "learning_rate": 1.936492686364378e-06, - "loss": 0.9873, - "step": 16461 - }, - { - "epoch": 0.42, - "learning_rate": 1.9364829823343844e-06, - "loss": 0.8953, - "step": 16462 - }, - { - "epoch": 0.42, - "learning_rate": 1.9364732775873686e-06, - "loss": 0.8447, - "step": 16463 - }, - { - "epoch": 0.42, - "learning_rate": 1.936463572123338e-06, - "loss": 0.7354, - "step": 16464 - }, - { - "epoch": 0.42, - "learning_rate": 1.9364538659423007e-06, - "loss": 1.0283, - "step": 16465 - }, - { - "epoch": 0.42, - "learning_rate": 1.936444159044264e-06, - "loss": 0.9268, - "step": 16466 - }, - { - "epoch": 0.42, - "learning_rate": 1.9364344514292343e-06, - "loss": 1.001, - "step": 16467 - }, - { - "epoch": 0.42, - "learning_rate": 1.93642474309722e-06, - "loss": 0.855, - "step": 16468 - }, - { - "epoch": 0.42, - "learning_rate": 1.9364150340482287e-06, - "loss": 0.9287, - "step": 16469 - }, - { - "epoch": 0.42, - "learning_rate": 1.9364053242822674e-06, - "loss": 0.9707, - "step": 16470 - }, - { - "epoch": 0.42, - "learning_rate": 1.936395613799343e-06, - "loss": 0.8564, - "step": 16471 - }, - { - "epoch": 0.42, - "learning_rate": 1.9363859025994644e-06, - "loss": 0.7812, - "step": 16472 - }, - { - "epoch": 0.42, - "learning_rate": 1.936376190682638e-06, - "loss": 0.9541, - "step": 16473 - }, - { - "epoch": 0.42, - "learning_rate": 1.9363664780488708e-06, - "loss": 1.0176, - "step": 16474 - }, - { - "epoch": 0.42, - "learning_rate": 1.9363567646981712e-06, - "loss": 1.0654, - "step": 16475 - }, - { - "epoch": 0.42, - "learning_rate": 1.9363470506305464e-06, - "loss": 0.6038, - "step": 16476 - }, - { - "epoch": 0.42, - "learning_rate": 1.936337335846004e-06, - "loss": 0.9775, - "step": 16477 - }, - { - "epoch": 0.42, - "learning_rate": 1.9363276203445504e-06, - "loss": 0.7283, - "step": 16478 - }, - { - "epoch": 0.42, - "learning_rate": 1.936317904126194e-06, - "loss": 1.041, - "step": 16479 - }, - { - "epoch": 0.42, - "learning_rate": 1.9363081871909426e-06, - "loss": 0.8672, - "step": 16480 - }, - { - "epoch": 0.42, - "learning_rate": 1.9362984695388026e-06, - "loss": 0.4771, - "step": 16481 - }, - { - "epoch": 0.42, - "learning_rate": 1.936288751169782e-06, - "loss": 0.6973, - "step": 16482 - }, - { - "epoch": 0.42, - "learning_rate": 1.936279032083888e-06, - "loss": 0.7026, - "step": 16483 - }, - { - "epoch": 0.42, - "learning_rate": 1.9362693122811286e-06, - "loss": 0.9727, - "step": 16484 - }, - { - "epoch": 0.42, - "learning_rate": 1.9362595917615106e-06, - "loss": 0.833, - "step": 16485 - }, - { - "epoch": 0.42, - "learning_rate": 1.9362498705250415e-06, - "loss": 0.7842, - "step": 16486 - }, - { - "epoch": 0.42, - "learning_rate": 1.936240148571729e-06, - "loss": 1.0107, - "step": 16487 - }, - { - "epoch": 0.42, - "learning_rate": 1.9362304259015805e-06, - "loss": 0.8877, - "step": 16488 - }, - { - "epoch": 0.42, - "learning_rate": 1.936220702514604e-06, - "loss": 0.6582, - "step": 16489 - }, - { - "epoch": 0.42, - "learning_rate": 1.9362109784108055e-06, - "loss": 0.9805, - "step": 16490 - }, - { - "epoch": 0.42, - "learning_rate": 1.936201253590194e-06, - "loss": 1.0225, - "step": 16491 - }, - { - "epoch": 0.42, - "learning_rate": 1.9361915280527756e-06, - "loss": 0.8818, - "step": 16492 - }, - { - "epoch": 0.42, - "learning_rate": 1.9361818017985587e-06, - "loss": 0.9951, - "step": 16493 - }, - { - "epoch": 0.42, - "learning_rate": 1.9361720748275502e-06, - "loss": 0.9487, - "step": 16494 - }, - { - "epoch": 0.42, - "learning_rate": 1.936162347139758e-06, - "loss": 0.998, - "step": 16495 - }, - { - "epoch": 0.42, - "learning_rate": 1.9361526187351895e-06, - "loss": 0.7607, - "step": 16496 - }, - { - "epoch": 0.42, - "learning_rate": 1.9361428896138516e-06, - "loss": 0.8945, - "step": 16497 - }, - { - "epoch": 0.42, - "learning_rate": 1.9361331597757523e-06, - "loss": 0.8408, - "step": 16498 - }, - { - "epoch": 0.42, - "learning_rate": 1.936123429220899e-06, - "loss": 0.7988, - "step": 16499 - }, - { - "epoch": 0.42, - "learning_rate": 1.9361136979492995e-06, - "loss": 0.625, - "step": 16500 - }, - { - "epoch": 0.42, - "learning_rate": 1.93610396596096e-06, - "loss": 1.0742, - "step": 16501 - }, - { - "epoch": 0.42, - "learning_rate": 1.9360942332558888e-06, - "loss": 0.9414, - "step": 16502 - }, - { - "epoch": 0.42, - "learning_rate": 1.936084499834094e-06, - "loss": 0.9404, - "step": 16503 - }, - { - "epoch": 0.42, - "learning_rate": 1.9360747656955816e-06, - "loss": 0.8428, - "step": 16504 - }, - { - "epoch": 0.42, - "learning_rate": 1.93606503084036e-06, - "loss": 0.9048, - "step": 16505 - }, - { - "epoch": 0.42, - "learning_rate": 1.9360552952684363e-06, - "loss": 0.5779, - "step": 16506 - }, - { - "epoch": 0.42, - "learning_rate": 1.9360455589798186e-06, - "loss": 1.0225, - "step": 16507 - }, - { - "epoch": 0.42, - "learning_rate": 1.936035821974513e-06, - "loss": 1.0059, - "step": 16508 - }, - { - "epoch": 0.42, - "learning_rate": 1.936026084252529e-06, - "loss": 0.9785, - "step": 16509 - }, - { - "epoch": 0.42, - "learning_rate": 1.9360163458138717e-06, - "loss": 0.6973, - "step": 16510 - }, - { - "epoch": 0.42, - "learning_rate": 1.93600660665855e-06, - "loss": 1.043, - "step": 16511 - }, - { - "epoch": 0.42, - "learning_rate": 1.9359968667865718e-06, - "loss": 0.6514, - "step": 16512 - }, - { - "epoch": 0.42, - "learning_rate": 1.9359871261979434e-06, - "loss": 0.9688, - "step": 16513 - }, - { - "epoch": 0.42, - "learning_rate": 1.9359773848926727e-06, - "loss": 0.8076, - "step": 16514 - }, - { - "epoch": 0.42, - "learning_rate": 1.935967642870767e-06, - "loss": 0.9961, - "step": 16515 - }, - { - "epoch": 0.42, - "learning_rate": 1.935957900132234e-06, - "loss": 0.7422, - "step": 16516 - }, - { - "epoch": 0.42, - "learning_rate": 1.935948156677081e-06, - "loss": 0.9678, - "step": 16517 - }, - { - "epoch": 0.42, - "learning_rate": 1.9359384125053157e-06, - "loss": 1.1016, - "step": 16518 - }, - { - "epoch": 0.42, - "learning_rate": 1.9359286676169452e-06, - "loss": 0.7578, - "step": 16519 - }, - { - "epoch": 0.42, - "learning_rate": 1.9359189220119773e-06, - "loss": 0.9609, - "step": 16520 - }, - { - "epoch": 0.42, - "learning_rate": 1.935909175690419e-06, - "loss": 1.0068, - "step": 16521 - }, - { - "epoch": 0.42, - "learning_rate": 1.9358994286522785e-06, - "loss": 1.0703, - "step": 16522 - }, - { - "epoch": 0.42, - "learning_rate": 1.9358896808975625e-06, - "loss": 0.9951, - "step": 16523 - }, - { - "epoch": 0.42, - "learning_rate": 1.9358799324262795e-06, - "loss": 0.708, - "step": 16524 - }, - { - "epoch": 0.42, - "learning_rate": 1.9358701832384354e-06, - "loss": 0.7051, - "step": 16525 - }, - { - "epoch": 0.42, - "learning_rate": 1.935860433334039e-06, - "loss": 0.9463, - "step": 16526 - }, - { - "epoch": 0.42, - "learning_rate": 1.9358506827130976e-06, - "loss": 0.6235, - "step": 16527 - }, - { - "epoch": 0.42, - "learning_rate": 1.9358409313756177e-06, - "loss": 0.6914, - "step": 16528 - }, - { - "epoch": 0.42, - "learning_rate": 1.9358311793216077e-06, - "loss": 0.7695, - "step": 16529 - }, - { - "epoch": 0.42, - "learning_rate": 1.9358214265510747e-06, - "loss": 0.8701, - "step": 16530 - }, - { - "epoch": 0.42, - "learning_rate": 1.9358116730640264e-06, - "loss": 0.8193, - "step": 16531 - }, - { - "epoch": 0.42, - "learning_rate": 1.93580191886047e-06, - "loss": 0.8994, - "step": 16532 - }, - { - "epoch": 0.42, - "learning_rate": 1.9357921639404135e-06, - "loss": 1.0352, - "step": 16533 - }, - { - "epoch": 0.42, - "learning_rate": 1.935782408303863e-06, - "loss": 0.9639, - "step": 16534 - }, - { - "epoch": 0.42, - "learning_rate": 1.935772651950828e-06, - "loss": 1.0996, - "step": 16535 - }, - { - "epoch": 0.42, - "learning_rate": 1.9357628948813145e-06, - "loss": 0.8291, - "step": 16536 - }, - { - "epoch": 0.42, - "learning_rate": 1.9357531370953305e-06, - "loss": 0.7441, - "step": 16537 - }, - { - "epoch": 0.42, - "learning_rate": 1.9357433785928832e-06, - "loss": 0.9351, - "step": 16538 - }, - { - "epoch": 0.42, - "learning_rate": 1.9357336193739803e-06, - "loss": 0.8301, - "step": 16539 - }, - { - "epoch": 0.42, - "learning_rate": 1.935723859438629e-06, - "loss": 1.0156, - "step": 16540 - }, - { - "epoch": 0.42, - "learning_rate": 1.9357140987868373e-06, - "loss": 1.0518, - "step": 16541 - }, - { - "epoch": 0.42, - "learning_rate": 1.935704337418612e-06, - "loss": 0.9854, - "step": 16542 - }, - { - "epoch": 0.42, - "learning_rate": 1.9356945753339612e-06, - "loss": 0.7656, - "step": 16543 - }, - { - "epoch": 0.42, - "learning_rate": 1.9356848125328916e-06, - "loss": 0.8379, - "step": 16544 - }, - { - "epoch": 0.42, - "learning_rate": 1.9356750490154117e-06, - "loss": 0.8457, - "step": 16545 - }, - { - "epoch": 0.42, - "learning_rate": 1.9356652847815283e-06, - "loss": 0.9902, - "step": 16546 - }, - { - "epoch": 0.42, - "learning_rate": 1.935655519831249e-06, - "loss": 0.9023, - "step": 16547 - }, - { - "epoch": 0.42, - "learning_rate": 1.9356457541645814e-06, - "loss": 0.9072, - "step": 16548 - }, - { - "epoch": 0.42, - "learning_rate": 1.9356359877815327e-06, - "loss": 0.9463, - "step": 16549 - }, - { - "epoch": 0.42, - "learning_rate": 1.9356262206821105e-06, - "loss": 0.7178, - "step": 16550 - }, - { - "epoch": 0.42, - "learning_rate": 1.9356164528663225e-06, - "loss": 0.7656, - "step": 16551 - }, - { - "epoch": 0.42, - "learning_rate": 1.935606684334176e-06, - "loss": 0.8018, - "step": 16552 - }, - { - "epoch": 0.42, - "learning_rate": 1.9355969150856783e-06, - "loss": 0.8818, - "step": 16553 - }, - { - "epoch": 0.42, - "learning_rate": 1.935587145120837e-06, - "loss": 0.957, - "step": 16554 - }, - { - "epoch": 0.42, - "learning_rate": 1.93557737443966e-06, - "loss": 0.6724, - "step": 16555 - }, - { - "epoch": 0.42, - "learning_rate": 1.9355676030421543e-06, - "loss": 0.9883, - "step": 16556 - }, - { - "epoch": 0.42, - "learning_rate": 1.9355578309283272e-06, - "loss": 0.6719, - "step": 16557 - }, - { - "epoch": 0.42, - "learning_rate": 1.9355480580981868e-06, - "loss": 0.6857, - "step": 16558 - }, - { - "epoch": 0.42, - "learning_rate": 1.9355382845517402e-06, - "loss": 0.8174, - "step": 16559 - }, - { - "epoch": 0.42, - "learning_rate": 1.9355285102889947e-06, - "loss": 0.917, - "step": 16560 - }, - { - "epoch": 0.42, - "learning_rate": 1.9355187353099584e-06, - "loss": 1.0342, - "step": 16561 - }, - { - "epoch": 0.42, - "learning_rate": 1.9355089596146384e-06, - "loss": 0.9463, - "step": 16562 - }, - { - "epoch": 0.42, - "learning_rate": 1.935499183203042e-06, - "loss": 1.0166, - "step": 16563 - }, - { - "epoch": 0.42, - "learning_rate": 1.935489406075177e-06, - "loss": 0.8369, - "step": 16564 - }, - { - "epoch": 0.42, - "learning_rate": 1.9354796282310504e-06, - "loss": 1.0371, - "step": 16565 - }, - { - "epoch": 0.42, - "learning_rate": 1.9354698496706707e-06, - "loss": 0.8877, - "step": 16566 - }, - { - "epoch": 0.42, - "learning_rate": 1.9354600703940445e-06, - "loss": 0.7339, - "step": 16567 - }, - { - "epoch": 0.42, - "learning_rate": 1.935450290401179e-06, - "loss": 0.8701, - "step": 16568 - }, - { - "epoch": 0.42, - "learning_rate": 1.9354405096920835e-06, - "loss": 0.731, - "step": 16569 - }, - { - "epoch": 0.42, - "learning_rate": 1.935430728266763e-06, - "loss": 0.8501, - "step": 16570 - }, - { - "epoch": 0.42, - "learning_rate": 1.9354209461252267e-06, - "loss": 0.7695, - "step": 16571 - }, - { - "epoch": 0.42, - "learning_rate": 1.9354111632674817e-06, - "loss": 0.8242, - "step": 16572 - }, - { - "epoch": 0.42, - "learning_rate": 1.9354013796935355e-06, - "loss": 0.7939, - "step": 16573 - }, - { - "epoch": 0.42, - "learning_rate": 1.935391595403395e-06, - "loss": 0.7573, - "step": 16574 - }, - { - "epoch": 0.42, - "learning_rate": 1.9353818103970683e-06, - "loss": 0.874, - "step": 16575 - }, - { - "epoch": 0.42, - "learning_rate": 1.935372024674563e-06, - "loss": 0.8408, - "step": 16576 - }, - { - "epoch": 0.42, - "learning_rate": 1.935362238235886e-06, - "loss": 0.8218, - "step": 16577 - }, - { - "epoch": 0.42, - "learning_rate": 1.935352451081045e-06, - "loss": 1.1855, - "step": 16578 - }, - { - "epoch": 0.42, - "learning_rate": 1.9353426632100483e-06, - "loss": 0.8848, - "step": 16579 - }, - { - "epoch": 0.42, - "learning_rate": 1.9353328746229025e-06, - "loss": 0.9668, - "step": 16580 - }, - { - "epoch": 0.42, - "learning_rate": 1.9353230853196153e-06, - "loss": 0.9185, - "step": 16581 - }, - { - "epoch": 0.43, - "learning_rate": 1.935313295300194e-06, - "loss": 0.9375, - "step": 16582 - }, - { - "epoch": 0.43, - "learning_rate": 1.9353035045646465e-06, - "loss": 0.9092, - "step": 16583 - }, - { - "epoch": 0.43, - "learning_rate": 1.9352937131129797e-06, - "loss": 0.8418, - "step": 16584 - }, - { - "epoch": 0.43, - "learning_rate": 1.935283920945202e-06, - "loss": 0.8301, - "step": 16585 - }, - { - "epoch": 0.43, - "learning_rate": 1.93527412806132e-06, - "loss": 0.958, - "step": 16586 - }, - { - "epoch": 0.43, - "learning_rate": 1.9352643344613423e-06, - "loss": 0.7646, - "step": 16587 - }, - { - "epoch": 0.43, - "learning_rate": 1.9352545401452752e-06, - "loss": 1.083, - "step": 16588 - }, - { - "epoch": 0.43, - "learning_rate": 1.935244745113127e-06, - "loss": 0.8018, - "step": 16589 - }, - { - "epoch": 0.43, - "learning_rate": 1.935234949364905e-06, - "loss": 0.8271, - "step": 16590 - }, - { - "epoch": 0.43, - "learning_rate": 1.9352251529006157e-06, - "loss": 0.7031, - "step": 16591 - }, - { - "epoch": 0.43, - "learning_rate": 1.935215355720268e-06, - "loss": 0.5654, - "step": 16592 - }, - { - "epoch": 0.43, - "learning_rate": 1.9352055578238694e-06, - "loss": 0.6812, - "step": 16593 - }, - { - "epoch": 0.43, - "learning_rate": 1.9351957592114263e-06, - "loss": 0.8037, - "step": 16594 - }, - { - "epoch": 0.43, - "learning_rate": 1.935185959882947e-06, - "loss": 0.9395, - "step": 16595 - }, - { - "epoch": 0.43, - "learning_rate": 1.935176159838439e-06, - "loss": 0.9219, - "step": 16596 - }, - { - "epoch": 0.43, - "learning_rate": 1.9351663590779094e-06, - "loss": 0.6602, - "step": 16597 - }, - { - "epoch": 0.43, - "learning_rate": 1.935156557601366e-06, - "loss": 1.0957, - "step": 16598 - }, - { - "epoch": 0.43, - "learning_rate": 1.935146755408816e-06, - "loss": 0.7827, - "step": 16599 - }, - { - "epoch": 0.43, - "learning_rate": 1.9351369525002675e-06, - "loss": 1.0215, - "step": 16600 - }, - { - "epoch": 0.43, - "learning_rate": 1.9351271488757276e-06, - "loss": 1.0059, - "step": 16601 - }, - { - "epoch": 0.43, - "learning_rate": 1.9351173445352034e-06, - "loss": 1.0049, - "step": 16602 - }, - { - "epoch": 0.43, - "learning_rate": 1.9351075394787035e-06, - "loss": 0.8496, - "step": 16603 - }, - { - "epoch": 0.43, - "learning_rate": 1.935097733706234e-06, - "loss": 0.9912, - "step": 16604 - }, - { - "epoch": 0.43, - "learning_rate": 1.9350879272178038e-06, - "loss": 0.5889, - "step": 16605 - }, - { - "epoch": 0.43, - "learning_rate": 1.9350781200134193e-06, - "loss": 0.8486, - "step": 16606 - }, - { - "epoch": 0.43, - "learning_rate": 1.9350683120930886e-06, - "loss": 0.5991, - "step": 16607 - }, - { - "epoch": 0.43, - "learning_rate": 1.9350585034568195e-06, - "loss": 1.0703, - "step": 16608 - }, - { - "epoch": 0.43, - "learning_rate": 1.9350486941046187e-06, - "loss": 0.8604, - "step": 16609 - }, - { - "epoch": 0.43, - "learning_rate": 1.935038884036494e-06, - "loss": 1.0078, - "step": 16610 - }, - { - "epoch": 0.43, - "learning_rate": 1.9350290732524535e-06, - "loss": 0.8223, - "step": 16611 - }, - { - "epoch": 0.43, - "learning_rate": 1.935019261752504e-06, - "loss": 0.9023, - "step": 16612 - }, - { - "epoch": 0.43, - "learning_rate": 1.935009449536653e-06, - "loss": 1.0361, - "step": 16613 - }, - { - "epoch": 0.43, - "learning_rate": 1.9349996366049086e-06, - "loss": 0.8867, - "step": 16614 - }, - { - "epoch": 0.43, - "learning_rate": 1.934989822957278e-06, - "loss": 1.0771, - "step": 16615 - }, - { - "epoch": 0.43, - "learning_rate": 1.9349800085937684e-06, - "loss": 1.0488, - "step": 16616 - }, - { - "epoch": 0.43, - "learning_rate": 1.9349701935143877e-06, - "loss": 0.8096, - "step": 16617 - }, - { - "epoch": 0.43, - "learning_rate": 1.934960377719143e-06, - "loss": 1.0664, - "step": 16618 - }, - { - "epoch": 0.43, - "learning_rate": 1.934950561208043e-06, - "loss": 0.5962, - "step": 16619 - }, - { - "epoch": 0.43, - "learning_rate": 1.9349407439810937e-06, - "loss": 0.8955, - "step": 16620 - }, - { - "epoch": 0.43, - "learning_rate": 1.9349309260383033e-06, - "loss": 0.6782, - "step": 16621 - }, - { - "epoch": 0.43, - "learning_rate": 1.9349211073796795e-06, - "loss": 0.8926, - "step": 16622 - }, - { - "epoch": 0.43, - "learning_rate": 1.9349112880052293e-06, - "loss": 1.0303, - "step": 16623 - }, - { - "epoch": 0.43, - "learning_rate": 1.9349014679149606e-06, - "loss": 1.0918, - "step": 16624 - }, - { - "epoch": 0.43, - "learning_rate": 1.9348916471088808e-06, - "loss": 0.8369, - "step": 16625 - }, - { - "epoch": 0.43, - "learning_rate": 1.9348818255869976e-06, - "loss": 1.0371, - "step": 16626 - }, - { - "epoch": 0.43, - "learning_rate": 1.9348720033493186e-06, - "loss": 0.7842, - "step": 16627 - }, - { - "epoch": 0.43, - "learning_rate": 1.9348621803958506e-06, - "loss": 0.9688, - "step": 16628 - }, - { - "epoch": 0.43, - "learning_rate": 1.9348523567266017e-06, - "loss": 0.8584, - "step": 16629 - }, - { - "epoch": 0.43, - "learning_rate": 1.9348425323415794e-06, - "loss": 0.9766, - "step": 16630 - }, - { - "epoch": 0.43, - "learning_rate": 1.9348327072407914e-06, - "loss": 0.7969, - "step": 16631 - }, - { - "epoch": 0.43, - "learning_rate": 1.9348228814242445e-06, - "loss": 0.6121, - "step": 16632 - }, - { - "epoch": 0.43, - "learning_rate": 1.934813054891947e-06, - "loss": 0.8599, - "step": 16633 - }, - { - "epoch": 0.43, - "learning_rate": 1.9348032276439064e-06, - "loss": 0.7969, - "step": 16634 - }, - { - "epoch": 0.43, - "learning_rate": 1.9347933996801297e-06, - "loss": 0.9023, - "step": 16635 - }, - { - "epoch": 0.43, - "learning_rate": 1.9347835710006246e-06, - "loss": 0.979, - "step": 16636 - }, - { - "epoch": 0.43, - "learning_rate": 1.934773741605399e-06, - "loss": 1.083, - "step": 16637 - }, - { - "epoch": 0.43, - "learning_rate": 1.9347639114944594e-06, - "loss": 1.0244, - "step": 16638 - }, - { - "epoch": 0.43, - "learning_rate": 1.9347540806678147e-06, - "loss": 0.9004, - "step": 16639 - }, - { - "epoch": 0.43, - "learning_rate": 1.9347442491254716e-06, - "loss": 0.7734, - "step": 16640 - }, - { - "epoch": 0.43, - "learning_rate": 1.934734416867438e-06, - "loss": 0.9473, - "step": 16641 - }, - { - "epoch": 0.43, - "learning_rate": 1.9347245838937208e-06, - "loss": 0.8604, - "step": 16642 - }, - { - "epoch": 0.43, - "learning_rate": 1.9347147502043283e-06, - "loss": 1.1182, - "step": 16643 - }, - { - "epoch": 0.43, - "learning_rate": 1.934704915799268e-06, - "loss": 0.8418, - "step": 16644 - }, - { - "epoch": 0.43, - "learning_rate": 1.9346950806785465e-06, - "loss": 1.0498, - "step": 16645 - }, - { - "epoch": 0.43, - "learning_rate": 1.9346852448421724e-06, - "loss": 0.8188, - "step": 16646 - }, - { - "epoch": 0.43, - "learning_rate": 1.9346754082901524e-06, - "loss": 1.0283, - "step": 16647 - }, - { - "epoch": 0.43, - "learning_rate": 1.9346655710224947e-06, - "loss": 0.9434, - "step": 16648 - }, - { - "epoch": 0.43, - "learning_rate": 1.9346557330392067e-06, - "loss": 0.8115, - "step": 16649 - }, - { - "epoch": 0.43, - "learning_rate": 1.9346458943402954e-06, - "loss": 0.9263, - "step": 16650 - }, - { - "epoch": 0.43, - "learning_rate": 1.934636054925769e-06, - "loss": 1.1309, - "step": 16651 - }, - { - "epoch": 0.43, - "learning_rate": 1.9346262147956347e-06, - "loss": 1.0342, - "step": 16652 - }, - { - "epoch": 0.43, - "learning_rate": 1.9346163739498997e-06, - "loss": 0.7534, - "step": 16653 - }, - { - "epoch": 0.43, - "learning_rate": 1.934606532388572e-06, - "loss": 0.9512, - "step": 16654 - }, - { - "epoch": 0.43, - "learning_rate": 1.9345966901116594e-06, - "loss": 1.0039, - "step": 16655 - }, - { - "epoch": 0.43, - "learning_rate": 1.934586847119169e-06, - "loss": 0.9863, - "step": 16656 - }, - { - "epoch": 0.43, - "learning_rate": 1.9345770034111085e-06, - "loss": 0.9229, - "step": 16657 - }, - { - "epoch": 0.43, - "learning_rate": 1.934567158987485e-06, - "loss": 0.7798, - "step": 16658 - }, - { - "epoch": 0.43, - "learning_rate": 1.934557313848307e-06, - "loss": 0.7656, - "step": 16659 - }, - { - "epoch": 0.43, - "learning_rate": 1.934547467993581e-06, - "loss": 0.8623, - "step": 16660 - }, - { - "epoch": 0.43, - "learning_rate": 1.934537621423315e-06, - "loss": 0.8867, - "step": 16661 - }, - { - "epoch": 0.43, - "learning_rate": 1.9345277741375167e-06, - "loss": 0.9678, - "step": 16662 - }, - { - "epoch": 0.43, - "learning_rate": 1.934517926136193e-06, - "loss": 0.7412, - "step": 16663 - }, - { - "epoch": 0.43, - "learning_rate": 1.9345080774193523e-06, - "loss": 0.7896, - "step": 16664 - }, - { - "epoch": 0.43, - "learning_rate": 1.9344982279870016e-06, - "loss": 1.0264, - "step": 16665 - }, - { - "epoch": 0.43, - "learning_rate": 1.9344883778391487e-06, - "loss": 1.0938, - "step": 16666 - }, - { - "epoch": 0.43, - "learning_rate": 1.934478526975801e-06, - "loss": 0.959, - "step": 16667 - }, - { - "epoch": 0.43, - "learning_rate": 1.934468675396966e-06, - "loss": 0.9209, - "step": 16668 - }, - { - "epoch": 0.43, - "learning_rate": 1.934458823102651e-06, - "loss": 0.7969, - "step": 16669 - }, - { - "epoch": 0.43, - "learning_rate": 1.9344489700928645e-06, - "loss": 0.9062, - "step": 16670 - }, - { - "epoch": 0.43, - "learning_rate": 1.9344391163676132e-06, - "loss": 1.0, - "step": 16671 - }, - { - "epoch": 0.43, - "learning_rate": 1.9344292619269046e-06, - "loss": 0.7837, - "step": 16672 - }, - { - "epoch": 0.43, - "learning_rate": 1.9344194067707466e-06, - "loss": 1.0381, - "step": 16673 - }, - { - "epoch": 0.43, - "learning_rate": 1.9344095508991464e-06, - "loss": 0.9375, - "step": 16674 - }, - { - "epoch": 0.43, - "learning_rate": 1.9343996943121117e-06, - "loss": 0.7979, - "step": 16675 - }, - { - "epoch": 0.43, - "learning_rate": 1.9343898370096506e-06, - "loss": 0.874, - "step": 16676 - }, - { - "epoch": 0.43, - "learning_rate": 1.93437997899177e-06, - "loss": 0.6763, - "step": 16677 - }, - { - "epoch": 0.43, - "learning_rate": 1.9343701202584777e-06, - "loss": 0.8081, - "step": 16678 - }, - { - "epoch": 0.43, - "learning_rate": 1.9343602608097808e-06, - "loss": 0.7754, - "step": 16679 - }, - { - "epoch": 0.43, - "learning_rate": 1.9343504006456874e-06, - "loss": 0.8096, - "step": 16680 - }, - { - "epoch": 0.43, - "learning_rate": 1.9343405397662053e-06, - "loss": 0.8032, - "step": 16681 - }, - { - "epoch": 0.43, - "learning_rate": 1.9343306781713407e-06, - "loss": 0.8398, - "step": 16682 - }, - { - "epoch": 0.43, - "learning_rate": 1.9343208158611027e-06, - "loss": 0.9648, - "step": 16683 - }, - { - "epoch": 0.43, - "learning_rate": 1.9343109528354982e-06, - "loss": 0.7969, - "step": 16684 - }, - { - "epoch": 0.43, - "learning_rate": 1.9343010890945347e-06, - "loss": 0.8672, - "step": 16685 - }, - { - "epoch": 0.43, - "learning_rate": 1.9342912246382196e-06, - "loss": 0.7881, - "step": 16686 - }, - { - "epoch": 0.43, - "learning_rate": 1.9342813594665607e-06, - "loss": 0.9844, - "step": 16687 - }, - { - "epoch": 0.43, - "learning_rate": 1.934271493579566e-06, - "loss": 0.9248, - "step": 16688 - }, - { - "epoch": 0.43, - "learning_rate": 1.934261626977242e-06, - "loss": 0.9941, - "step": 16689 - }, - { - "epoch": 0.43, - "learning_rate": 1.934251759659597e-06, - "loss": 0.8369, - "step": 16690 - }, - { - "epoch": 0.43, - "learning_rate": 1.9342418916266384e-06, - "loss": 0.8975, - "step": 16691 - }, - { - "epoch": 0.43, - "learning_rate": 1.934232022878374e-06, - "loss": 0.7949, - "step": 16692 - }, - { - "epoch": 0.43, - "learning_rate": 1.9342221534148105e-06, - "loss": 0.7939, - "step": 16693 - }, - { - "epoch": 0.43, - "learning_rate": 1.934212283235957e-06, - "loss": 0.9512, - "step": 16694 - }, - { - "epoch": 0.43, - "learning_rate": 1.934202412341819e-06, - "loss": 0.9561, - "step": 16695 - }, - { - "epoch": 0.43, - "learning_rate": 1.934192540732406e-06, - "loss": 0.8496, - "step": 16696 - }, - { - "epoch": 0.43, - "learning_rate": 1.9341826684077247e-06, - "loss": 1.0391, - "step": 16697 - }, - { - "epoch": 0.43, - "learning_rate": 1.934172795367782e-06, - "loss": 0.958, - "step": 16698 - }, - { - "epoch": 0.43, - "learning_rate": 1.9341629216125866e-06, - "loss": 0.9561, - "step": 16699 - }, - { - "epoch": 0.43, - "learning_rate": 1.9341530471421458e-06, - "loss": 0.9893, - "step": 16700 - }, - { - "epoch": 0.43, - "learning_rate": 1.9341431719564665e-06, - "loss": 0.918, - "step": 16701 - }, - { - "epoch": 0.43, - "learning_rate": 1.934133296055557e-06, - "loss": 0.9434, - "step": 16702 - }, - { - "epoch": 0.43, - "learning_rate": 1.9341234194394244e-06, - "loss": 0.606, - "step": 16703 - }, - { - "epoch": 0.43, - "learning_rate": 1.9341135421080768e-06, - "loss": 0.8691, - "step": 16704 - }, - { - "epoch": 0.43, - "learning_rate": 1.9341036640615213e-06, - "loss": 0.8965, - "step": 16705 - }, - { - "epoch": 0.43, - "learning_rate": 1.9340937852997654e-06, - "loss": 0.8887, - "step": 16706 - }, - { - "epoch": 0.43, - "learning_rate": 1.934083905822817e-06, - "loss": 0.9648, - "step": 16707 - }, - { - "epoch": 0.43, - "learning_rate": 1.9340740256306837e-06, - "loss": 0.811, - "step": 16708 - }, - { - "epoch": 0.43, - "learning_rate": 1.9340641447233723e-06, - "loss": 0.8916, - "step": 16709 - }, - { - "epoch": 0.43, - "learning_rate": 1.9340542631008914e-06, - "loss": 0.7686, - "step": 16710 - }, - { - "epoch": 0.43, - "learning_rate": 1.934044380763248e-06, - "loss": 0.7722, - "step": 16711 - }, - { - "epoch": 0.43, - "learning_rate": 1.9340344977104494e-06, - "loss": 1.0273, - "step": 16712 - }, - { - "epoch": 0.43, - "learning_rate": 1.934024613942504e-06, - "loss": 1.001, - "step": 16713 - }, - { - "epoch": 0.43, - "learning_rate": 1.934014729459419e-06, - "loss": 1.0967, - "step": 16714 - }, - { - "epoch": 0.43, - "learning_rate": 1.934004844261201e-06, - "loss": 0.8164, - "step": 16715 - }, - { - "epoch": 0.43, - "learning_rate": 1.9339949583478592e-06, - "loss": 0.7412, - "step": 16716 - }, - { - "epoch": 0.43, - "learning_rate": 1.9339850717194005e-06, - "loss": 1.0371, - "step": 16717 - }, - { - "epoch": 0.43, - "learning_rate": 1.933975184375832e-06, - "loss": 0.8591, - "step": 16718 - }, - { - "epoch": 0.43, - "learning_rate": 1.9339652963171617e-06, - "loss": 0.7979, - "step": 16719 - }, - { - "epoch": 0.43, - "learning_rate": 1.933955407543397e-06, - "loss": 0.9912, - "step": 16720 - }, - { - "epoch": 0.43, - "learning_rate": 1.933945518054546e-06, - "loss": 1.0176, - "step": 16721 - }, - { - "epoch": 0.43, - "learning_rate": 1.933935627850616e-06, - "loss": 0.8896, - "step": 16722 - }, - { - "epoch": 0.43, - "learning_rate": 1.933925736931614e-06, - "loss": 0.8916, - "step": 16723 - }, - { - "epoch": 0.43, - "learning_rate": 1.933915845297548e-06, - "loss": 0.668, - "step": 16724 - }, - { - "epoch": 0.43, - "learning_rate": 1.9339059529484256e-06, - "loss": 0.5071, - "step": 16725 - }, - { - "epoch": 0.43, - "learning_rate": 1.933896059884254e-06, - "loss": 0.8672, - "step": 16726 - }, - { - "epoch": 0.43, - "learning_rate": 1.9338861661050416e-06, - "loss": 1.0977, - "step": 16727 - }, - { - "epoch": 0.43, - "learning_rate": 1.9338762716107957e-06, - "loss": 0.7861, - "step": 16728 - }, - { - "epoch": 0.43, - "learning_rate": 1.933866376401523e-06, - "loss": 1.1006, - "step": 16729 - }, - { - "epoch": 0.43, - "learning_rate": 1.9338564804772327e-06, - "loss": 0.8174, - "step": 16730 - }, - { - "epoch": 0.43, - "learning_rate": 1.933846583837931e-06, - "loss": 0.8848, - "step": 16731 - }, - { - "epoch": 0.43, - "learning_rate": 1.9338366864836256e-06, - "loss": 1.0127, - "step": 16732 - }, - { - "epoch": 0.43, - "learning_rate": 1.9338267884143247e-06, - "loss": 1.0371, - "step": 16733 - }, - { - "epoch": 0.43, - "learning_rate": 1.9338168896300356e-06, - "loss": 1.0566, - "step": 16734 - }, - { - "epoch": 0.43, - "learning_rate": 1.9338069901307655e-06, - "loss": 0.6345, - "step": 16735 - }, - { - "epoch": 0.43, - "learning_rate": 1.9337970899165226e-06, - "loss": 0.9883, - "step": 16736 - }, - { - "epoch": 0.43, - "learning_rate": 1.9337871889873144e-06, - "loss": 0.873, - "step": 16737 - }, - { - "epoch": 0.43, - "learning_rate": 1.9337772873431478e-06, - "loss": 1.0, - "step": 16738 - }, - { - "epoch": 0.43, - "learning_rate": 1.933767384984031e-06, - "loss": 0.9287, - "step": 16739 - }, - { - "epoch": 0.43, - "learning_rate": 1.933757481909972e-06, - "loss": 0.7241, - "step": 16740 - }, - { - "epoch": 0.43, - "learning_rate": 1.9337475781209773e-06, - "loss": 0.8818, - "step": 16741 - }, - { - "epoch": 0.43, - "learning_rate": 1.9337376736170546e-06, - "loss": 0.8125, - "step": 16742 - }, - { - "epoch": 0.43, - "learning_rate": 1.933727768398213e-06, - "loss": 1.04, - "step": 16743 - }, - { - "epoch": 0.43, - "learning_rate": 1.9337178624644582e-06, - "loss": 0.9023, - "step": 16744 - }, - { - "epoch": 0.43, - "learning_rate": 1.9337079558157986e-06, - "loss": 0.8027, - "step": 16745 - }, - { - "epoch": 0.43, - "learning_rate": 1.933698048452242e-06, - "loss": 0.9795, - "step": 16746 - }, - { - "epoch": 0.43, - "learning_rate": 1.9336881403737956e-06, - "loss": 0.7725, - "step": 16747 - }, - { - "epoch": 0.43, - "learning_rate": 1.933678231580467e-06, - "loss": 0.8169, - "step": 16748 - }, - { - "epoch": 0.43, - "learning_rate": 1.933668322072264e-06, - "loss": 0.8926, - "step": 16749 - }, - { - "epoch": 0.43, - "learning_rate": 1.9336584118491944e-06, - "loss": 0.9131, - "step": 16750 - }, - { - "epoch": 0.43, - "learning_rate": 1.933648500911265e-06, - "loss": 0.8516, - "step": 16751 - }, - { - "epoch": 0.43, - "learning_rate": 1.9336385892584845e-06, - "loss": 0.79, - "step": 16752 - }, - { - "epoch": 0.43, - "learning_rate": 1.9336286768908595e-06, - "loss": 0.8052, - "step": 16753 - }, - { - "epoch": 0.43, - "learning_rate": 1.9336187638083976e-06, - "loss": 1.0439, - "step": 16754 - }, - { - "epoch": 0.43, - "learning_rate": 1.9336088500111073e-06, - "loss": 0.7739, - "step": 16755 - }, - { - "epoch": 0.43, - "learning_rate": 1.9335989354989956e-06, - "loss": 0.9414, - "step": 16756 - }, - { - "epoch": 0.43, - "learning_rate": 1.9335890202720695e-06, - "loss": 0.8926, - "step": 16757 - }, - { - "epoch": 0.43, - "learning_rate": 1.9335791043303378e-06, - "loss": 0.8457, - "step": 16758 - }, - { - "epoch": 0.43, - "learning_rate": 1.9335691876738072e-06, - "loss": 0.8701, - "step": 16759 - }, - { - "epoch": 0.43, - "learning_rate": 1.933559270302486e-06, - "loss": 0.8159, - "step": 16760 - }, - { - "epoch": 0.43, - "learning_rate": 1.933549352216381e-06, - "loss": 0.7393, - "step": 16761 - }, - { - "epoch": 0.43, - "learning_rate": 1.9335394334155006e-06, - "loss": 0.7266, - "step": 16762 - }, - { - "epoch": 0.43, - "learning_rate": 1.9335295138998514e-06, - "loss": 0.7705, - "step": 16763 - }, - { - "epoch": 0.43, - "learning_rate": 1.933519593669442e-06, - "loss": 1.0137, - "step": 16764 - }, - { - "epoch": 0.43, - "learning_rate": 1.9335096727242794e-06, - "loss": 1.0049, - "step": 16765 - }, - { - "epoch": 0.43, - "learning_rate": 1.9334997510643714e-06, - "loss": 0.7734, - "step": 16766 - }, - { - "epoch": 0.43, - "learning_rate": 1.9334898286897255e-06, - "loss": 0.9668, - "step": 16767 - }, - { - "epoch": 0.43, - "learning_rate": 1.9334799056003495e-06, - "loss": 0.6597, - "step": 16768 - }, - { - "epoch": 0.43, - "learning_rate": 1.933469981796251e-06, - "loss": 0.793, - "step": 16769 - }, - { - "epoch": 0.43, - "learning_rate": 1.9334600572774372e-06, - "loss": 0.8174, - "step": 16770 - }, - { - "epoch": 0.43, - "learning_rate": 1.933450132043916e-06, - "loss": 0.8818, - "step": 16771 - }, - { - "epoch": 0.43, - "learning_rate": 1.933440206095695e-06, - "loss": 1.0225, - "step": 16772 - }, - { - "epoch": 0.43, - "learning_rate": 1.9334302794327816e-06, - "loss": 0.7686, - "step": 16773 - }, - { - "epoch": 0.43, - "learning_rate": 1.933420352055184e-06, - "loss": 0.9805, - "step": 16774 - }, - { - "epoch": 0.43, - "learning_rate": 1.933410423962909e-06, - "loss": 0.9629, - "step": 16775 - }, - { - "epoch": 0.43, - "learning_rate": 1.9334004951559644e-06, - "loss": 1.0713, - "step": 16776 - }, - { - "epoch": 0.43, - "learning_rate": 1.933390565634358e-06, - "loss": 0.9307, - "step": 16777 - }, - { - "epoch": 0.43, - "learning_rate": 1.9333806353980976e-06, - "loss": 1.125, - "step": 16778 - }, - { - "epoch": 0.43, - "learning_rate": 1.9333707044471906e-06, - "loss": 0.7988, - "step": 16779 - }, - { - "epoch": 0.43, - "learning_rate": 1.9333607727816445e-06, - "loss": 0.7773, - "step": 16780 - }, - { - "epoch": 0.43, - "learning_rate": 1.933350840401467e-06, - "loss": 0.8496, - "step": 16781 - }, - { - "epoch": 0.43, - "learning_rate": 1.9333409073066653e-06, - "loss": 0.9688, - "step": 16782 - }, - { - "epoch": 0.43, - "learning_rate": 1.933330973497248e-06, - "loss": 0.9092, - "step": 16783 - }, - { - "epoch": 0.43, - "learning_rate": 1.933321038973222e-06, - "loss": 0.8652, - "step": 16784 - }, - { - "epoch": 0.43, - "learning_rate": 1.9333111037345947e-06, - "loss": 1.0088, - "step": 16785 - }, - { - "epoch": 0.43, - "learning_rate": 1.933301167781374e-06, - "loss": 0.8975, - "step": 16786 - }, - { - "epoch": 0.43, - "learning_rate": 1.9332912311135675e-06, - "loss": 0.8721, - "step": 16787 - }, - { - "epoch": 0.43, - "learning_rate": 1.933281293731183e-06, - "loss": 1.0254, - "step": 16788 - }, - { - "epoch": 0.43, - "learning_rate": 1.933271355634228e-06, - "loss": 0.7539, - "step": 16789 - }, - { - "epoch": 0.43, - "learning_rate": 1.9332614168227095e-06, - "loss": 1.0195, - "step": 16790 - }, - { - "epoch": 0.43, - "learning_rate": 1.9332514772966363e-06, - "loss": 0.9287, - "step": 16791 - }, - { - "epoch": 0.43, - "learning_rate": 1.933241537056015e-06, - "loss": 0.9766, - "step": 16792 - }, - { - "epoch": 0.43, - "learning_rate": 1.9332315961008535e-06, - "loss": 0.6392, - "step": 16793 - }, - { - "epoch": 0.43, - "learning_rate": 1.93322165443116e-06, - "loss": 0.9365, - "step": 16794 - }, - { - "epoch": 0.43, - "learning_rate": 1.933211712046941e-06, - "loss": 0.8096, - "step": 16795 - }, - { - "epoch": 0.43, - "learning_rate": 1.933201768948205e-06, - "loss": 0.9541, - "step": 16796 - }, - { - "epoch": 0.43, - "learning_rate": 1.9331918251349593e-06, - "loss": 0.7488, - "step": 16797 - }, - { - "epoch": 0.43, - "learning_rate": 1.933181880607211e-06, - "loss": 1.0156, - "step": 16798 - }, - { - "epoch": 0.43, - "learning_rate": 1.933171935364969e-06, - "loss": 0.8818, - "step": 16799 - }, - { - "epoch": 0.43, - "learning_rate": 1.93316198940824e-06, - "loss": 0.8252, - "step": 16800 - }, - { - "epoch": 0.43, - "learning_rate": 1.933152042737031e-06, - "loss": 1.0869, - "step": 16801 - }, - { - "epoch": 0.43, - "learning_rate": 1.9331420953513515e-06, - "loss": 0.9814, - "step": 16802 - }, - { - "epoch": 0.43, - "learning_rate": 1.9331321472512075e-06, - "loss": 0.915, - "step": 16803 - }, - { - "epoch": 0.43, - "learning_rate": 1.933122198436607e-06, - "loss": 0.8447, - "step": 16804 - }, - { - "epoch": 0.43, - "learning_rate": 1.933112248907558e-06, - "loss": 0.8984, - "step": 16805 - }, - { - "epoch": 0.43, - "learning_rate": 1.9331022986640677e-06, - "loss": 1.0244, - "step": 16806 - }, - { - "epoch": 0.43, - "learning_rate": 1.933092347706144e-06, - "loss": 0.7778, - "step": 16807 - }, - { - "epoch": 0.43, - "learning_rate": 1.9330823960337943e-06, - "loss": 0.4589, - "step": 16808 - }, - { - "epoch": 0.43, - "learning_rate": 1.9330724436470263e-06, - "loss": 0.8887, - "step": 16809 - }, - { - "epoch": 0.43, - "learning_rate": 1.9330624905458478e-06, - "loss": 0.7627, - "step": 16810 - }, - { - "epoch": 0.43, - "learning_rate": 1.933052536730266e-06, - "loss": 0.9941, - "step": 16811 - }, - { - "epoch": 0.43, - "learning_rate": 1.933042582200289e-06, - "loss": 1.0283, - "step": 16812 - }, - { - "epoch": 0.43, - "learning_rate": 1.933032626955924e-06, - "loss": 0.8931, - "step": 16813 - }, - { - "epoch": 0.43, - "learning_rate": 1.9330226709971787e-06, - "loss": 1.1104, - "step": 16814 - }, - { - "epoch": 0.43, - "learning_rate": 1.9330127143240614e-06, - "loss": 0.6362, - "step": 16815 - }, - { - "epoch": 0.43, - "learning_rate": 1.933002756936579e-06, - "loss": 0.7676, - "step": 16816 - }, - { - "epoch": 0.43, - "learning_rate": 1.9329927988347386e-06, - "loss": 0.916, - "step": 16817 - }, - { - "epoch": 0.43, - "learning_rate": 1.932982840018549e-06, - "loss": 1.0859, - "step": 16818 - }, - { - "epoch": 0.43, - "learning_rate": 1.9329728804880174e-06, - "loss": 0.7324, - "step": 16819 - }, - { - "epoch": 0.43, - "learning_rate": 1.9329629202431515e-06, - "loss": 0.8135, - "step": 16820 - }, - { - "epoch": 0.43, - "learning_rate": 1.9329529592839586e-06, - "loss": 0.8701, - "step": 16821 - }, - { - "epoch": 0.43, - "learning_rate": 1.9329429976104467e-06, - "loss": 0.853, - "step": 16822 - }, - { - "epoch": 0.43, - "learning_rate": 1.932933035222623e-06, - "loss": 0.9092, - "step": 16823 - }, - { - "epoch": 0.43, - "learning_rate": 1.9329230721204955e-06, - "loss": 0.8535, - "step": 16824 - }, - { - "epoch": 0.43, - "learning_rate": 1.9329131083040716e-06, - "loss": 1.0098, - "step": 16825 - }, - { - "epoch": 0.43, - "learning_rate": 1.932903143773359e-06, - "loss": 0.7993, - "step": 16826 - }, - { - "epoch": 0.43, - "learning_rate": 1.9328931785283654e-06, - "loss": 0.8555, - "step": 16827 - }, - { - "epoch": 0.43, - "learning_rate": 1.9328832125690984e-06, - "loss": 0.9512, - "step": 16828 - }, - { - "epoch": 0.43, - "learning_rate": 1.932873245895566e-06, - "loss": 0.9541, - "step": 16829 - }, - { - "epoch": 0.43, - "learning_rate": 1.932863278507775e-06, - "loss": 0.9424, - "step": 16830 - }, - { - "epoch": 0.43, - "learning_rate": 1.932853310405733e-06, - "loss": 0.9404, - "step": 16831 - }, - { - "epoch": 0.43, - "learning_rate": 1.9328433415894493e-06, - "loss": 1.0859, - "step": 16832 - }, - { - "epoch": 0.43, - "learning_rate": 1.9328333720589292e-06, - "loss": 0.8867, - "step": 16833 - }, - { - "epoch": 0.43, - "learning_rate": 1.932823401814182e-06, - "loss": 0.9893, - "step": 16834 - }, - { - "epoch": 0.43, - "learning_rate": 1.932813430855215e-06, - "loss": 1.0176, - "step": 16835 - }, - { - "epoch": 0.43, - "learning_rate": 1.9328034591820357e-06, - "loss": 0.7114, - "step": 16836 - }, - { - "epoch": 0.43, - "learning_rate": 1.9327934867946514e-06, - "loss": 0.9639, - "step": 16837 - }, - { - "epoch": 0.43, - "learning_rate": 1.93278351369307e-06, - "loss": 0.7275, - "step": 16838 - }, - { - "epoch": 0.43, - "learning_rate": 1.9327735398772993e-06, - "loss": 0.9092, - "step": 16839 - }, - { - "epoch": 0.43, - "learning_rate": 1.932763565347347e-06, - "loss": 0.8936, - "step": 16840 - }, - { - "epoch": 0.43, - "learning_rate": 1.93275359010322e-06, - "loss": 0.9248, - "step": 16841 - }, - { - "epoch": 0.43, - "learning_rate": 1.9327436141449267e-06, - "loss": 0.8433, - "step": 16842 - }, - { - "epoch": 0.43, - "learning_rate": 1.9327336374724746e-06, - "loss": 0.8711, - "step": 16843 - }, - { - "epoch": 0.43, - "learning_rate": 1.932723660085871e-06, - "loss": 0.7786, - "step": 16844 - }, - { - "epoch": 0.43, - "learning_rate": 1.932713681985124e-06, - "loss": 0.751, - "step": 16845 - }, - { - "epoch": 0.43, - "learning_rate": 1.932703703170241e-06, - "loss": 0.7148, - "step": 16846 - }, - { - "epoch": 0.43, - "learning_rate": 1.9326937236412297e-06, - "loss": 1.0098, - "step": 16847 - }, - { - "epoch": 0.43, - "learning_rate": 1.9326837433980976e-06, - "loss": 0.9658, - "step": 16848 - }, - { - "epoch": 0.43, - "learning_rate": 1.9326737624408523e-06, - "loss": 0.7959, - "step": 16849 - }, - { - "epoch": 0.43, - "learning_rate": 1.932663780769502e-06, - "loss": 0.7754, - "step": 16850 - }, - { - "epoch": 0.43, - "learning_rate": 1.9326537983840537e-06, - "loss": 0.8994, - "step": 16851 - }, - { - "epoch": 0.43, - "learning_rate": 1.932643815284515e-06, - "loss": 0.9473, - "step": 16852 - }, - { - "epoch": 0.43, - "learning_rate": 1.932633831470894e-06, - "loss": 0.8213, - "step": 16853 - }, - { - "epoch": 0.43, - "learning_rate": 1.9326238469431985e-06, - "loss": 0.8115, - "step": 16854 - }, - { - "epoch": 0.43, - "learning_rate": 1.9326138617014353e-06, - "loss": 1.0918, - "step": 16855 - }, - { - "epoch": 0.43, - "learning_rate": 1.9326038757456127e-06, - "loss": 0.7129, - "step": 16856 - }, - { - "epoch": 0.43, - "learning_rate": 1.9325938890757384e-06, - "loss": 0.6763, - "step": 16857 - }, - { - "epoch": 0.43, - "learning_rate": 1.9325839016918195e-06, - "loss": 1.0137, - "step": 16858 - }, - { - "epoch": 0.43, - "learning_rate": 1.9325739135938646e-06, - "loss": 0.6396, - "step": 16859 - }, - { - "epoch": 0.43, - "learning_rate": 1.9325639247818804e-06, - "loss": 0.7236, - "step": 16860 - }, - { - "epoch": 0.43, - "learning_rate": 1.9325539352558745e-06, - "loss": 1.0732, - "step": 16861 - }, - { - "epoch": 0.43, - "learning_rate": 1.9325439450158554e-06, - "loss": 0.8535, - "step": 16862 - }, - { - "epoch": 0.43, - "learning_rate": 1.9325339540618303e-06, - "loss": 0.9248, - "step": 16863 - }, - { - "epoch": 0.43, - "learning_rate": 1.9325239623938064e-06, - "loss": 0.9092, - "step": 16864 - }, - { - "epoch": 0.43, - "learning_rate": 1.932513970011792e-06, - "loss": 1.0752, - "step": 16865 - }, - { - "epoch": 0.43, - "learning_rate": 1.932503976915795e-06, - "loss": 0.8047, - "step": 16866 - }, - { - "epoch": 0.43, - "learning_rate": 1.932493983105822e-06, - "loss": 0.6582, - "step": 16867 - }, - { - "epoch": 0.43, - "learning_rate": 1.9324839885818812e-06, - "loss": 0.5222, - "step": 16868 - }, - { - "epoch": 0.43, - "learning_rate": 1.9324739933439806e-06, - "loss": 0.9238, - "step": 16869 - }, - { - "epoch": 0.43, - "learning_rate": 1.9324639973921274e-06, - "loss": 0.7861, - "step": 16870 - }, - { - "epoch": 0.43, - "learning_rate": 1.9324540007263296e-06, - "loss": 0.9854, - "step": 16871 - }, - { - "epoch": 0.43, - "learning_rate": 1.9324440033465944e-06, - "loss": 0.7539, - "step": 16872 - }, - { - "epoch": 0.43, - "learning_rate": 1.9324340052529295e-06, - "loss": 1.0029, - "step": 16873 - }, - { - "epoch": 0.43, - "learning_rate": 1.9324240064453428e-06, - "loss": 0.728, - "step": 16874 - }, - { - "epoch": 0.43, - "learning_rate": 1.9324140069238424e-06, - "loss": 0.9258, - "step": 16875 - }, - { - "epoch": 0.43, - "learning_rate": 1.932404006688435e-06, - "loss": 0.8721, - "step": 16876 - }, - { - "epoch": 0.43, - "learning_rate": 1.932394005739129e-06, - "loss": 0.6309, - "step": 16877 - }, - { - "epoch": 0.43, - "learning_rate": 1.9323840040759318e-06, - "loss": 0.9248, - "step": 16878 - }, - { - "epoch": 0.43, - "learning_rate": 1.932374001698851e-06, - "loss": 0.8623, - "step": 16879 - }, - { - "epoch": 0.43, - "learning_rate": 1.9323639986078943e-06, - "loss": 0.8799, - "step": 16880 - }, - { - "epoch": 0.43, - "learning_rate": 1.932353994803069e-06, - "loss": 0.8115, - "step": 16881 - }, - { - "epoch": 0.43, - "learning_rate": 1.9323439902843835e-06, - "loss": 1.0352, - "step": 16882 - }, - { - "epoch": 0.43, - "learning_rate": 1.9323339850518452e-06, - "loss": 0.8887, - "step": 16883 - }, - { - "epoch": 0.43, - "learning_rate": 1.9323239791054615e-06, - "loss": 1.0586, - "step": 16884 - }, - { - "epoch": 0.43, - "learning_rate": 1.93231397244524e-06, - "loss": 0.896, - "step": 16885 - }, - { - "epoch": 0.43, - "learning_rate": 1.932303965071189e-06, - "loss": 0.957, - "step": 16886 - }, - { - "epoch": 0.43, - "learning_rate": 1.9322939569833153e-06, - "loss": 0.8799, - "step": 16887 - }, - { - "epoch": 0.43, - "learning_rate": 1.932283948181627e-06, - "loss": 0.8682, - "step": 16888 - }, - { - "epoch": 0.43, - "learning_rate": 1.932273938666132e-06, - "loss": 0.8345, - "step": 16889 - }, - { - "epoch": 0.43, - "learning_rate": 1.9322639284368375e-06, - "loss": 0.9844, - "step": 16890 - }, - { - "epoch": 0.43, - "learning_rate": 1.9322539174937513e-06, - "loss": 1.042, - "step": 16891 - }, - { - "epoch": 0.43, - "learning_rate": 1.9322439058368815e-06, - "loss": 0.8071, - "step": 16892 - }, - { - "epoch": 0.43, - "learning_rate": 1.932233893466235e-06, - "loss": 0.8296, - "step": 16893 - }, - { - "epoch": 0.43, - "learning_rate": 1.93222388038182e-06, - "loss": 1.0576, - "step": 16894 - }, - { - "epoch": 0.43, - "learning_rate": 1.9322138665836443e-06, - "loss": 0.5908, - "step": 16895 - }, - { - "epoch": 0.43, - "learning_rate": 1.9322038520717148e-06, - "loss": 0.8628, - "step": 16896 - }, - { - "epoch": 0.43, - "learning_rate": 1.93219383684604e-06, - "loss": 0.8584, - "step": 16897 - }, - { - "epoch": 0.43, - "learning_rate": 1.9321838209066273e-06, - "loss": 0.7998, - "step": 16898 - }, - { - "epoch": 0.43, - "learning_rate": 1.9321738042534845e-06, - "loss": 0.9697, - "step": 16899 - }, - { - "epoch": 0.43, - "learning_rate": 1.9321637868866186e-06, - "loss": 0.9639, - "step": 16900 - }, - { - "epoch": 0.43, - "learning_rate": 1.9321537688060377e-06, - "loss": 0.8457, - "step": 16901 - }, - { - "epoch": 0.43, - "learning_rate": 1.93214375001175e-06, - "loss": 0.8848, - "step": 16902 - }, - { - "epoch": 0.43, - "learning_rate": 1.9321337305037625e-06, - "loss": 1.0186, - "step": 16903 - }, - { - "epoch": 0.43, - "learning_rate": 1.932123710282083e-06, - "loss": 0.9023, - "step": 16904 - }, - { - "epoch": 0.43, - "learning_rate": 1.9321136893467195e-06, - "loss": 0.9092, - "step": 16905 - }, - { - "epoch": 0.43, - "learning_rate": 1.932103667697679e-06, - "loss": 0.9941, - "step": 16906 - }, - { - "epoch": 0.43, - "learning_rate": 1.93209364533497e-06, - "loss": 1.0273, - "step": 16907 - }, - { - "epoch": 0.43, - "learning_rate": 1.9320836222585994e-06, - "loss": 0.8672, - "step": 16908 - }, - { - "epoch": 0.43, - "learning_rate": 1.9320735984685755e-06, - "loss": 0.7969, - "step": 16909 - }, - { - "epoch": 0.43, - "learning_rate": 1.932063573964905e-06, - "loss": 0.9912, - "step": 16910 - }, - { - "epoch": 0.43, - "learning_rate": 1.9320535487475974e-06, - "loss": 0.9229, - "step": 16911 - }, - { - "epoch": 0.43, - "learning_rate": 1.9320435228166583e-06, - "loss": 0.6309, - "step": 16912 - }, - { - "epoch": 0.43, - "learning_rate": 1.9320334961720966e-06, - "loss": 0.9238, - "step": 16913 - }, - { - "epoch": 0.43, - "learning_rate": 1.93202346881392e-06, - "loss": 0.6692, - "step": 16914 - }, - { - "epoch": 0.43, - "learning_rate": 1.932013440742136e-06, - "loss": 0.9355, - "step": 16915 - }, - { - "epoch": 0.43, - "learning_rate": 1.9320034119567517e-06, - "loss": 0.9834, - "step": 16916 - }, - { - "epoch": 0.43, - "learning_rate": 1.9319933824577754e-06, - "loss": 1.1289, - "step": 16917 - }, - { - "epoch": 0.43, - "learning_rate": 1.9319833522452144e-06, - "loss": 1.0781, - "step": 16918 - }, - { - "epoch": 0.43, - "learning_rate": 1.9319733213190773e-06, - "loss": 0.8486, - "step": 16919 - }, - { - "epoch": 0.43, - "learning_rate": 1.9319632896793704e-06, - "loss": 0.9854, - "step": 16920 - }, - { - "epoch": 0.43, - "learning_rate": 1.9319532573261022e-06, - "loss": 0.7588, - "step": 16921 - }, - { - "epoch": 0.43, - "learning_rate": 1.9319432242592804e-06, - "loss": 0.8623, - "step": 16922 - }, - { - "epoch": 0.43, - "learning_rate": 1.9319331904789124e-06, - "loss": 0.8896, - "step": 16923 - }, - { - "epoch": 0.43, - "learning_rate": 1.931923155985006e-06, - "loss": 0.6887, - "step": 16924 - }, - { - "epoch": 0.43, - "learning_rate": 1.931913120777569e-06, - "loss": 0.9121, - "step": 16925 - }, - { - "epoch": 0.43, - "learning_rate": 1.931903084856609e-06, - "loss": 0.8027, - "step": 16926 - }, - { - "epoch": 0.43, - "learning_rate": 1.9318930482221334e-06, - "loss": 0.6973, - "step": 16927 - }, - { - "epoch": 0.43, - "learning_rate": 1.9318830108741504e-06, - "loss": 1.1602, - "step": 16928 - }, - { - "epoch": 0.43, - "learning_rate": 1.9318729728126674e-06, - "loss": 0.5845, - "step": 16929 - }, - { - "epoch": 0.43, - "learning_rate": 1.9318629340376922e-06, - "loss": 1.1162, - "step": 16930 - }, - { - "epoch": 0.43, - "learning_rate": 1.931852894549232e-06, - "loss": 1.0459, - "step": 16931 - }, - { - "epoch": 0.43, - "learning_rate": 1.931842854347295e-06, - "loss": 0.9551, - "step": 16932 - }, - { - "epoch": 0.43, - "learning_rate": 1.931832813431889e-06, - "loss": 0.9404, - "step": 16933 - }, - { - "epoch": 0.43, - "learning_rate": 1.9318227718030215e-06, - "loss": 0.8906, - "step": 16934 - }, - { - "epoch": 0.43, - "learning_rate": 1.9318127294607e-06, - "loss": 0.748, - "step": 16935 - }, - { - "epoch": 0.43, - "learning_rate": 1.9318026864049327e-06, - "loss": 0.7979, - "step": 16936 - }, - { - "epoch": 0.43, - "learning_rate": 1.9317926426357267e-06, - "loss": 1.0098, - "step": 16937 - }, - { - "epoch": 0.43, - "learning_rate": 1.9317825981530894e-06, - "loss": 0.9492, - "step": 16938 - }, - { - "epoch": 0.43, - "learning_rate": 1.9317725529570293e-06, - "loss": 0.9604, - "step": 16939 - }, - { - "epoch": 0.43, - "learning_rate": 1.931762507047554e-06, - "loss": 0.8081, - "step": 16940 - }, - { - "epoch": 0.43, - "learning_rate": 1.931752460424671e-06, - "loss": 0.8726, - "step": 16941 - }, - { - "epoch": 0.43, - "learning_rate": 1.931742413088388e-06, - "loss": 0.8975, - "step": 16942 - }, - { - "epoch": 0.43, - "learning_rate": 1.9317323650387124e-06, - "loss": 0.8643, - "step": 16943 - }, - { - "epoch": 0.43, - "learning_rate": 1.9317223162756526e-06, - "loss": 0.7998, - "step": 16944 - }, - { - "epoch": 0.43, - "learning_rate": 1.9317122667992157e-06, - "loss": 0.9941, - "step": 16945 - }, - { - "epoch": 0.43, - "learning_rate": 1.9317022166094094e-06, - "loss": 0.875, - "step": 16946 - }, - { - "epoch": 0.43, - "learning_rate": 1.9316921657062416e-06, - "loss": 0.7656, - "step": 16947 - }, - { - "epoch": 0.43, - "learning_rate": 1.93168211408972e-06, - "loss": 1.0215, - "step": 16948 - }, - { - "epoch": 0.43, - "learning_rate": 1.931672061759852e-06, - "loss": 0.8779, - "step": 16949 - }, - { - "epoch": 0.43, - "learning_rate": 1.9316620087166457e-06, - "loss": 0.9385, - "step": 16950 - }, - { - "epoch": 0.43, - "learning_rate": 1.931651954960109e-06, - "loss": 0.9727, - "step": 16951 - }, - { - "epoch": 0.43, - "learning_rate": 1.931641900490249e-06, - "loss": 0.8135, - "step": 16952 - }, - { - "epoch": 0.43, - "learning_rate": 1.9316318453070737e-06, - "loss": 0.8115, - "step": 16953 - }, - { - "epoch": 0.43, - "learning_rate": 1.9316217894105903e-06, - "loss": 0.8057, - "step": 16954 - }, - { - "epoch": 0.43, - "learning_rate": 1.9316117328008075e-06, - "loss": 1.0371, - "step": 16955 - }, - { - "epoch": 0.43, - "learning_rate": 1.931601675477732e-06, - "loss": 0.9385, - "step": 16956 - }, - { - "epoch": 0.43, - "learning_rate": 1.931591617441372e-06, - "loss": 0.6235, - "step": 16957 - }, - { - "epoch": 0.43, - "learning_rate": 1.9315815586917355e-06, - "loss": 0.894, - "step": 16958 - }, - { - "epoch": 0.43, - "learning_rate": 1.9315714992288292e-06, - "loss": 0.9043, - "step": 16959 - }, - { - "epoch": 0.43, - "learning_rate": 1.931561439052662e-06, - "loss": 0.96, - "step": 16960 - }, - { - "epoch": 0.43, - "learning_rate": 1.931551378163241e-06, - "loss": 1.0381, - "step": 16961 - }, - { - "epoch": 0.43, - "learning_rate": 1.9315413165605736e-06, - "loss": 0.877, - "step": 16962 - }, - { - "epoch": 0.43, - "learning_rate": 1.931531254244668e-06, - "loss": 0.8301, - "step": 16963 - }, - { - "epoch": 0.43, - "learning_rate": 1.9315211912155317e-06, - "loss": 1.1504, - "step": 16964 - }, - { - "epoch": 0.43, - "learning_rate": 1.931511127473173e-06, - "loss": 0.9609, - "step": 16965 - }, - { - "epoch": 0.43, - "learning_rate": 1.9315010630175986e-06, - "loss": 0.6978, - "step": 16966 - }, - { - "epoch": 0.43, - "learning_rate": 1.9314909978488167e-06, - "loss": 1.0273, - "step": 16967 - }, - { - "epoch": 0.43, - "learning_rate": 1.9314809319668348e-06, - "loss": 1.1406, - "step": 16968 - }, - { - "epoch": 0.43, - "learning_rate": 1.931470865371661e-06, - "loss": 0.9277, - "step": 16969 - }, - { - "epoch": 0.43, - "learning_rate": 1.9314607980633025e-06, - "loss": 0.6992, - "step": 16970 - }, - { - "epoch": 0.43, - "learning_rate": 1.931450730041768e-06, - "loss": 0.9658, - "step": 16971 - }, - { - "epoch": 0.44, - "learning_rate": 1.9314406613070637e-06, - "loss": 0.8506, - "step": 16972 - }, - { - "epoch": 0.44, - "learning_rate": 1.9314305918591984e-06, - "loss": 0.8955, - "step": 16973 - }, - { - "epoch": 0.44, - "learning_rate": 1.9314205216981792e-06, - "loss": 0.9336, - "step": 16974 - }, - { - "epoch": 0.44, - "learning_rate": 1.9314104508240147e-06, - "loss": 1.082, - "step": 16975 - }, - { - "epoch": 0.44, - "learning_rate": 1.931400379236712e-06, - "loss": 0.9414, - "step": 16976 - }, - { - "epoch": 0.44, - "learning_rate": 1.9313903069362785e-06, - "loss": 0.7764, - "step": 16977 - }, - { - "epoch": 0.44, - "learning_rate": 1.9313802339227226e-06, - "loss": 0.7744, - "step": 16978 - }, - { - "epoch": 0.44, - "learning_rate": 1.9313701601960517e-06, - "loss": 0.6758, - "step": 16979 - }, - { - "epoch": 0.44, - "learning_rate": 1.931360085756273e-06, - "loss": 1.0762, - "step": 16980 - }, - { - "epoch": 0.44, - "learning_rate": 1.9313500106033953e-06, - "loss": 0.9375, - "step": 16981 - }, - { - "epoch": 0.44, - "learning_rate": 1.9313399347374255e-06, - "loss": 0.8135, - "step": 16982 - }, - { - "epoch": 0.44, - "learning_rate": 1.9313298581583716e-06, - "loss": 0.9072, - "step": 16983 - }, - { - "epoch": 0.44, - "learning_rate": 1.9313197808662413e-06, - "loss": 0.7412, - "step": 16984 - }, - { - "epoch": 0.44, - "learning_rate": 1.931309702861042e-06, - "loss": 1.0791, - "step": 16985 - }, - { - "epoch": 0.44, - "learning_rate": 1.9312996241427818e-06, - "loss": 0.8433, - "step": 16986 - }, - { - "epoch": 0.44, - "learning_rate": 1.9312895447114685e-06, - "loss": 0.9375, - "step": 16987 - }, - { - "epoch": 0.44, - "learning_rate": 1.931279464567109e-06, - "loss": 0.7368, - "step": 16988 - }, - { - "epoch": 0.44, - "learning_rate": 1.9312693837097124e-06, - "loss": 0.9102, - "step": 16989 - }, - { - "epoch": 0.44, - "learning_rate": 1.9312593021392853e-06, - "loss": 1.1357, - "step": 16990 - }, - { - "epoch": 0.44, - "learning_rate": 1.9312492198558355e-06, - "loss": 0.6958, - "step": 16991 - }, - { - "epoch": 0.44, - "learning_rate": 1.9312391368593716e-06, - "loss": 0.8027, - "step": 16992 - }, - { - "epoch": 0.44, - "learning_rate": 1.9312290531499e-06, - "loss": 1.0059, - "step": 16993 - }, - { - "epoch": 0.44, - "learning_rate": 1.93121896872743e-06, - "loss": 0.6221, - "step": 16994 - }, - { - "epoch": 0.44, - "learning_rate": 1.9312088835919676e-06, - "loss": 1.1162, - "step": 16995 - }, - { - "epoch": 0.44, - "learning_rate": 1.931198797743522e-06, - "loss": 0.8721, - "step": 16996 - }, - { - "epoch": 0.44, - "learning_rate": 1.9311887111821e-06, - "loss": 1.0762, - "step": 16997 - }, - { - "epoch": 0.44, - "learning_rate": 1.9311786239077096e-06, - "loss": 0.749, - "step": 16998 - }, - { - "epoch": 0.44, - "learning_rate": 1.9311685359203586e-06, - "loss": 1.1719, - "step": 16999 - }, - { - "epoch": 0.44, - "learning_rate": 1.9311584472200545e-06, - "loss": 1.0654, - "step": 17000 - }, - { - "epoch": 0.44, - "learning_rate": 1.9311483578068057e-06, - "loss": 0.8389, - "step": 17001 - }, - { - "epoch": 0.44, - "learning_rate": 1.931138267680619e-06, - "loss": 0.8965, - "step": 17002 - }, - { - "epoch": 0.44, - "learning_rate": 1.931128176841503e-06, - "loss": 0.9355, - "step": 17003 - }, - { - "epoch": 0.44, - "learning_rate": 1.9311180852894645e-06, - "loss": 0.8994, - "step": 17004 - }, - { - "epoch": 0.44, - "learning_rate": 1.9311079930245116e-06, - "loss": 0.8047, - "step": 17005 - }, - { - "epoch": 0.44, - "learning_rate": 1.9310979000466525e-06, - "loss": 0.9326, - "step": 17006 - }, - { - "epoch": 0.44, - "learning_rate": 1.931087806355894e-06, - "loss": 0.8643, - "step": 17007 - }, - { - "epoch": 0.44, - "learning_rate": 1.931077711952245e-06, - "loss": 1.001, - "step": 17008 - }, - { - "epoch": 0.44, - "learning_rate": 1.9310676168357122e-06, - "loss": 0.877, - "step": 17009 - }, - { - "epoch": 0.44, - "learning_rate": 1.931057521006304e-06, - "loss": 0.9004, - "step": 17010 - }, - { - "epoch": 0.44, - "learning_rate": 1.931047424464028e-06, - "loss": 1.1299, - "step": 17011 - }, - { - "epoch": 0.44, - "learning_rate": 1.9310373272088912e-06, - "loss": 0.7422, - "step": 17012 - }, - { - "epoch": 0.44, - "learning_rate": 1.9310272292409023e-06, - "loss": 0.7871, - "step": 17013 - }, - { - "epoch": 0.44, - "learning_rate": 1.9310171305600687e-06, - "loss": 1.1357, - "step": 17014 - }, - { - "epoch": 0.44, - "learning_rate": 1.9310070311663984e-06, - "loss": 0.7959, - "step": 17015 - }, - { - "epoch": 0.44, - "learning_rate": 1.930996931059898e-06, - "loss": 0.9443, - "step": 17016 - }, - { - "epoch": 0.44, - "learning_rate": 1.930986830240577e-06, - "loss": 0.7207, - "step": 17017 - }, - { - "epoch": 0.44, - "learning_rate": 1.930976728708442e-06, - "loss": 0.9062, - "step": 17018 - }, - { - "epoch": 0.44, - "learning_rate": 1.9309666264635003e-06, - "loss": 0.772, - "step": 17019 - }, - { - "epoch": 0.44, - "learning_rate": 1.9309565235057606e-06, - "loss": 0.8477, - "step": 17020 - }, - { - "epoch": 0.44, - "learning_rate": 1.9309464198352303e-06, - "loss": 0.8521, - "step": 17021 - }, - { - "epoch": 0.44, - "learning_rate": 1.930936315451917e-06, - "loss": 1.0352, - "step": 17022 - }, - { - "epoch": 0.44, - "learning_rate": 1.930926210355829e-06, - "loss": 0.877, - "step": 17023 - }, - { - "epoch": 0.44, - "learning_rate": 1.930916104546973e-06, - "loss": 0.8164, - "step": 17024 - }, - { - "epoch": 0.44, - "learning_rate": 1.930905998025358e-06, - "loss": 0.8076, - "step": 17025 - }, - { - "epoch": 0.44, - "learning_rate": 1.930895890790991e-06, - "loss": 1.123, - "step": 17026 - }, - { - "epoch": 0.44, - "learning_rate": 1.9308857828438793e-06, - "loss": 0.8262, - "step": 17027 - }, - { - "epoch": 0.44, - "learning_rate": 1.930875674184031e-06, - "loss": 0.7061, - "step": 17028 - }, - { - "epoch": 0.44, - "learning_rate": 1.9308655648114546e-06, - "loss": 0.8877, - "step": 17029 - }, - { - "epoch": 0.44, - "learning_rate": 1.930855454726157e-06, - "loss": 0.4663, - "step": 17030 - }, - { - "epoch": 0.44, - "learning_rate": 1.9308453439281466e-06, - "loss": 0.8965, - "step": 17031 - }, - { - "epoch": 0.44, - "learning_rate": 1.9308352324174302e-06, - "loss": 0.9106, - "step": 17032 - }, - { - "epoch": 0.44, - "learning_rate": 1.930825120194016e-06, - "loss": 0.9727, - "step": 17033 - }, - { - "epoch": 0.44, - "learning_rate": 1.9308150072579123e-06, - "loss": 0.8203, - "step": 17034 - }, - { - "epoch": 0.44, - "learning_rate": 1.930804893609126e-06, - "loss": 0.9014, - "step": 17035 - }, - { - "epoch": 0.44, - "learning_rate": 1.9307947792476653e-06, - "loss": 0.8857, - "step": 17036 - }, - { - "epoch": 0.44, - "learning_rate": 1.930784664173538e-06, - "loss": 0.8228, - "step": 17037 - }, - { - "epoch": 0.44, - "learning_rate": 1.9307745483867516e-06, - "loss": 0.9717, - "step": 17038 - }, - { - "epoch": 0.44, - "learning_rate": 1.9307644318873136e-06, - "loss": 0.6655, - "step": 17039 - }, - { - "epoch": 0.44, - "learning_rate": 1.9307543146752325e-06, - "loss": 1.0527, - "step": 17040 - }, - { - "epoch": 0.44, - "learning_rate": 1.930744196750515e-06, - "loss": 0.8931, - "step": 17041 - }, - { - "epoch": 0.44, - "learning_rate": 1.93073407811317e-06, - "loss": 1.0156, - "step": 17042 - }, - { - "epoch": 0.44, - "learning_rate": 1.9307239587632045e-06, - "loss": 0.8711, - "step": 17043 - }, - { - "epoch": 0.44, - "learning_rate": 1.9307138387006267e-06, - "loss": 0.8545, - "step": 17044 - }, - { - "epoch": 0.44, - "learning_rate": 1.930703717925444e-06, - "loss": 0.689, - "step": 17045 - }, - { - "epoch": 0.44, - "learning_rate": 1.930693596437664e-06, - "loss": 1.0098, - "step": 17046 - }, - { - "epoch": 0.44, - "learning_rate": 1.9306834742372954e-06, - "loss": 0.7808, - "step": 17047 - }, - { - "epoch": 0.44, - "learning_rate": 1.9306733513243446e-06, - "loss": 1.0234, - "step": 17048 - }, - { - "epoch": 0.44, - "learning_rate": 1.93066322769882e-06, - "loss": 0.8066, - "step": 17049 - }, - { - "epoch": 0.44, - "learning_rate": 1.9306531033607295e-06, - "loss": 0.8467, - "step": 17050 - }, - { - "epoch": 0.44, - "learning_rate": 1.930642978310081e-06, - "loss": 0.7642, - "step": 17051 - }, - { - "epoch": 0.44, - "learning_rate": 1.9306328525468817e-06, - "loss": 0.8857, - "step": 17052 - }, - { - "epoch": 0.44, - "learning_rate": 1.9306227260711396e-06, - "loss": 1.0547, - "step": 17053 - }, - { - "epoch": 0.44, - "learning_rate": 1.9306125988828624e-06, - "loss": 0.8965, - "step": 17054 - }, - { - "epoch": 0.44, - "learning_rate": 1.930602470982058e-06, - "loss": 0.8091, - "step": 17055 - }, - { - "epoch": 0.44, - "learning_rate": 1.9305923423687344e-06, - "loss": 0.8809, - "step": 17056 - }, - { - "epoch": 0.44, - "learning_rate": 1.9305822130428988e-06, - "loss": 0.8848, - "step": 17057 - }, - { - "epoch": 0.44, - "learning_rate": 1.930572083004559e-06, - "loss": 0.7427, - "step": 17058 - }, - { - "epoch": 0.44, - "learning_rate": 1.930561952253723e-06, - "loss": 0.9814, - "step": 17059 - }, - { - "epoch": 0.44, - "learning_rate": 1.9305518207903985e-06, - "loss": 0.7959, - "step": 17060 - }, - { - "epoch": 0.44, - "learning_rate": 1.9305416886145936e-06, - "loss": 0.8623, - "step": 17061 - }, - { - "epoch": 0.44, - "learning_rate": 1.9305315557263153e-06, - "loss": 1.0127, - "step": 17062 - }, - { - "epoch": 0.44, - "learning_rate": 1.9305214221255718e-06, - "loss": 0.7251, - "step": 17063 - }, - { - "epoch": 0.44, - "learning_rate": 1.930511287812371e-06, - "loss": 1.0225, - "step": 17064 - }, - { - "epoch": 0.44, - "learning_rate": 1.9305011527867207e-06, - "loss": 0.71, - "step": 17065 - }, - { - "epoch": 0.44, - "learning_rate": 1.930491017048628e-06, - "loss": 0.9473, - "step": 17066 - }, - { - "epoch": 0.44, - "learning_rate": 1.9304808805981015e-06, - "loss": 1.0205, - "step": 17067 - }, - { - "epoch": 0.44, - "learning_rate": 1.930470743435148e-06, - "loss": 0.9619, - "step": 17068 - }, - { - "epoch": 0.44, - "learning_rate": 1.9304606055597767e-06, - "loss": 1.1094, - "step": 17069 - }, - { - "epoch": 0.44, - "learning_rate": 1.9304504669719937e-06, - "loss": 0.8643, - "step": 17070 - }, - { - "epoch": 0.44, - "learning_rate": 1.930440327671808e-06, - "loss": 0.7844, - "step": 17071 - }, - { - "epoch": 0.44, - "learning_rate": 1.9304301876592272e-06, - "loss": 1.0283, - "step": 17072 - }, - { - "epoch": 0.44, - "learning_rate": 1.930420046934258e-06, - "loss": 0.635, - "step": 17073 - }, - { - "epoch": 0.44, - "learning_rate": 1.9304099054969093e-06, - "loss": 0.9326, - "step": 17074 - }, - { - "epoch": 0.44, - "learning_rate": 1.9303997633471885e-06, - "loss": 0.8672, - "step": 17075 - }, - { - "epoch": 0.44, - "learning_rate": 1.9303896204851036e-06, - "loss": 0.9453, - "step": 17076 - }, - { - "epoch": 0.44, - "learning_rate": 1.930379476910662e-06, - "loss": 0.8867, - "step": 17077 - }, - { - "epoch": 0.44, - "learning_rate": 1.930369332623872e-06, - "loss": 0.9395, - "step": 17078 - }, - { - "epoch": 0.44, - "learning_rate": 1.9303591876247402e-06, - "loss": 0.9268, - "step": 17079 - }, - { - "epoch": 0.44, - "learning_rate": 1.9303490419132755e-06, - "loss": 0.8291, - "step": 17080 - }, - { - "epoch": 0.44, - "learning_rate": 1.9303388954894857e-06, - "loss": 0.9326, - "step": 17081 - }, - { - "epoch": 0.44, - "learning_rate": 1.9303287483533776e-06, - "loss": 1.0186, - "step": 17082 - }, - { - "epoch": 0.44, - "learning_rate": 1.93031860050496e-06, - "loss": 0.9551, - "step": 17083 - }, - { - "epoch": 0.44, - "learning_rate": 1.93030845194424e-06, - "loss": 1.0146, - "step": 17084 - }, - { - "epoch": 0.44, - "learning_rate": 1.9302983026712257e-06, - "loss": 1.0889, - "step": 17085 - }, - { - "epoch": 0.44, - "learning_rate": 1.9302881526859245e-06, - "loss": 0.8174, - "step": 17086 - }, - { - "epoch": 0.44, - "learning_rate": 1.930278001988345e-06, - "loss": 0.8535, - "step": 17087 - }, - { - "epoch": 0.44, - "learning_rate": 1.930267850578494e-06, - "loss": 0.9668, - "step": 17088 - }, - { - "epoch": 0.44, - "learning_rate": 1.9302576984563793e-06, - "loss": 0.9189, - "step": 17089 - }, - { - "epoch": 0.44, - "learning_rate": 1.93024754562201e-06, - "loss": 1.04, - "step": 17090 - }, - { - "epoch": 0.44, - "learning_rate": 1.930237392075392e-06, - "loss": 0.9443, - "step": 17091 - }, - { - "epoch": 0.44, - "learning_rate": 1.9302272378165344e-06, - "loss": 0.708, - "step": 17092 - }, - { - "epoch": 0.44, - "learning_rate": 1.930217082845445e-06, - "loss": 0.96, - "step": 17093 - }, - { - "epoch": 0.44, - "learning_rate": 1.9302069271621306e-06, - "loss": 0.75, - "step": 17094 - }, - { - "epoch": 0.44, - "learning_rate": 1.9301967707665992e-06, - "loss": 0.834, - "step": 17095 - }, - { - "epoch": 0.44, - "learning_rate": 1.9301866136588597e-06, - "loss": 1.0449, - "step": 17096 - }, - { - "epoch": 0.44, - "learning_rate": 1.930176455838919e-06, - "loss": 0.6401, - "step": 17097 - }, - { - "epoch": 0.44, - "learning_rate": 1.930166297306784e-06, - "loss": 0.7295, - "step": 17098 - }, - { - "epoch": 0.44, - "learning_rate": 1.9301561380624645e-06, - "loss": 0.9121, - "step": 17099 - }, - { - "epoch": 0.44, - "learning_rate": 1.930145978105967e-06, - "loss": 0.833, - "step": 17100 - }, - { - "epoch": 0.44, - "learning_rate": 1.930135817437299e-06, - "loss": 0.8174, - "step": 17101 - }, - { - "epoch": 0.44, - "learning_rate": 1.9301256560564694e-06, - "loss": 0.9717, - "step": 17102 - }, - { - "epoch": 0.44, - "learning_rate": 1.930115493963485e-06, - "loss": 0.9941, - "step": 17103 - }, - { - "epoch": 0.44, - "learning_rate": 1.930105331158354e-06, - "loss": 0.917, - "step": 17104 - }, - { - "epoch": 0.44, - "learning_rate": 1.930095167641084e-06, - "loss": 0.8496, - "step": 17105 - }, - { - "epoch": 0.44, - "learning_rate": 1.9300850034116833e-06, - "loss": 1.0684, - "step": 17106 - }, - { - "epoch": 0.44, - "learning_rate": 1.9300748384701587e-06, - "loss": 0.9023, - "step": 17107 - }, - { - "epoch": 0.44, - "learning_rate": 1.930064672816519e-06, - "loss": 0.8896, - "step": 17108 - }, - { - "epoch": 0.44, - "learning_rate": 1.9300545064507718e-06, - "loss": 0.7646, - "step": 17109 - }, - { - "epoch": 0.44, - "learning_rate": 1.9300443393729238e-06, - "loss": 0.7236, - "step": 17110 - }, - { - "epoch": 0.44, - "learning_rate": 1.930034171582984e-06, - "loss": 0.8037, - "step": 17111 - }, - { - "epoch": 0.44, - "learning_rate": 1.93002400308096e-06, - "loss": 0.5022, - "step": 17112 - }, - { - "epoch": 0.44, - "learning_rate": 1.9300138338668593e-06, - "loss": 0.7695, - "step": 17113 - }, - { - "epoch": 0.44, - "learning_rate": 1.9300036639406894e-06, - "loss": 1.0049, - "step": 17114 - }, - { - "epoch": 0.44, - "learning_rate": 1.929993493302459e-06, - "loss": 1.0439, - "step": 17115 - }, - { - "epoch": 0.44, - "learning_rate": 1.9299833219521753e-06, - "loss": 0.749, - "step": 17116 - }, - { - "epoch": 0.44, - "learning_rate": 1.929973149889846e-06, - "loss": 0.8867, - "step": 17117 - }, - { - "epoch": 0.44, - "learning_rate": 1.929962977115479e-06, - "loss": 0.9502, - "step": 17118 - }, - { - "epoch": 0.44, - "learning_rate": 1.9299528036290818e-06, - "loss": 0.9375, - "step": 17119 - }, - { - "epoch": 0.44, - "learning_rate": 1.9299426294306628e-06, - "loss": 0.5723, - "step": 17120 - }, - { - "epoch": 0.44, - "learning_rate": 1.9299324545202296e-06, - "loss": 0.9512, - "step": 17121 - }, - { - "epoch": 0.44, - "learning_rate": 1.9299222788977898e-06, - "loss": 0.9502, - "step": 17122 - }, - { - "epoch": 0.44, - "learning_rate": 1.929912102563351e-06, - "loss": 0.9033, - "step": 17123 - }, - { - "epoch": 0.44, - "learning_rate": 1.9299019255169214e-06, - "loss": 0.7441, - "step": 17124 - }, - { - "epoch": 0.44, - "learning_rate": 1.929891747758509e-06, - "loss": 0.9072, - "step": 17125 - }, - { - "epoch": 0.44, - "learning_rate": 1.929881569288121e-06, - "loss": 1.0771, - "step": 17126 - }, - { - "epoch": 0.44, - "learning_rate": 1.9298713901057653e-06, - "loss": 1.0225, - "step": 17127 - }, - { - "epoch": 0.44, - "learning_rate": 1.92986121021145e-06, - "loss": 0.8271, - "step": 17128 - }, - { - "epoch": 0.44, - "learning_rate": 1.9298510296051822e-06, - "loss": 0.8594, - "step": 17129 - }, - { - "epoch": 0.44, - "learning_rate": 1.929840848286971e-06, - "loss": 0.8945, - "step": 17130 - }, - { - "epoch": 0.44, - "learning_rate": 1.929830666256823e-06, - "loss": 0.8301, - "step": 17131 - }, - { - "epoch": 0.44, - "learning_rate": 1.9298204835147466e-06, - "loss": 0.9092, - "step": 17132 - }, - { - "epoch": 0.44, - "learning_rate": 1.9298103000607494e-06, - "loss": 0.8579, - "step": 17133 - }, - { - "epoch": 0.44, - "learning_rate": 1.9298001158948393e-06, - "loss": 0.8213, - "step": 17134 - }, - { - "epoch": 0.44, - "learning_rate": 1.929789931017024e-06, - "loss": 0.8721, - "step": 17135 - }, - { - "epoch": 0.44, - "learning_rate": 1.929779745427311e-06, - "loss": 0.8213, - "step": 17136 - }, - { - "epoch": 0.44, - "learning_rate": 1.9297695591257085e-06, - "loss": 0.9082, - "step": 17137 - }, - { - "epoch": 0.44, - "learning_rate": 1.9297593721122244e-06, - "loss": 0.603, - "step": 17138 - }, - { - "epoch": 0.44, - "learning_rate": 1.929749184386866e-06, - "loss": 0.8682, - "step": 17139 - }, - { - "epoch": 0.44, - "learning_rate": 1.9297389959496417e-06, - "loss": 0.8174, - "step": 17140 - }, - { - "epoch": 0.44, - "learning_rate": 1.929728806800559e-06, - "loss": 0.7939, - "step": 17141 - }, - { - "epoch": 0.44, - "learning_rate": 1.929718616939625e-06, - "loss": 0.8721, - "step": 17142 - }, - { - "epoch": 0.44, - "learning_rate": 1.929708426366849e-06, - "loss": 0.9326, - "step": 17143 - }, - { - "epoch": 0.44, - "learning_rate": 1.9296982350822376e-06, - "loss": 0.9746, - "step": 17144 - }, - { - "epoch": 0.44, - "learning_rate": 1.929688043085799e-06, - "loss": 0.7764, - "step": 17145 - }, - { - "epoch": 0.44, - "learning_rate": 1.9296778503775415e-06, - "loss": 1.1104, - "step": 17146 - }, - { - "epoch": 0.44, - "learning_rate": 1.929667656957472e-06, - "loss": 1.0303, - "step": 17147 - }, - { - "epoch": 0.44, - "learning_rate": 1.9296574628255988e-06, - "loss": 0.8213, - "step": 17148 - }, - { - "epoch": 0.44, - "learning_rate": 1.92964726798193e-06, - "loss": 0.6948, - "step": 17149 - }, - { - "epoch": 0.44, - "learning_rate": 1.9296370724264725e-06, - "loss": 0.9072, - "step": 17150 - }, - { - "epoch": 0.44, - "learning_rate": 1.9296268761592348e-06, - "loss": 1.1182, - "step": 17151 - }, - { - "epoch": 0.44, - "learning_rate": 1.9296166791802246e-06, - "loss": 0.9277, - "step": 17152 - }, - { - "epoch": 0.44, - "learning_rate": 1.9296064814894498e-06, - "loss": 0.9355, - "step": 17153 - }, - { - "epoch": 0.44, - "learning_rate": 1.9295962830869177e-06, - "loss": 0.9233, - "step": 17154 - }, - { - "epoch": 0.44, - "learning_rate": 1.9295860839726366e-06, - "loss": 1.0039, - "step": 17155 - }, - { - "epoch": 0.44, - "learning_rate": 1.9295758841466145e-06, - "loss": 0.7549, - "step": 17156 - }, - { - "epoch": 0.44, - "learning_rate": 1.9295656836088586e-06, - "loss": 0.9795, - "step": 17157 - }, - { - "epoch": 0.44, - "learning_rate": 1.929555482359377e-06, - "loss": 0.835, - "step": 17158 - }, - { - "epoch": 0.44, - "learning_rate": 1.9295452803981777e-06, - "loss": 0.8779, - "step": 17159 - }, - { - "epoch": 0.44, - "learning_rate": 1.9295350777252677e-06, - "loss": 0.9316, - "step": 17160 - }, - { - "epoch": 0.44, - "learning_rate": 1.929524874340656e-06, - "loss": 0.6655, - "step": 17161 - }, - { - "epoch": 0.44, - "learning_rate": 1.92951467024435e-06, - "loss": 0.7358, - "step": 17162 - }, - { - "epoch": 0.44, - "learning_rate": 1.929504465436357e-06, - "loss": 0.9629, - "step": 17163 - }, - { - "epoch": 0.44, - "learning_rate": 1.9294942599166853e-06, - "loss": 0.7866, - "step": 17164 - }, - { - "epoch": 0.44, - "learning_rate": 1.9294840536853424e-06, - "loss": 0.9766, - "step": 17165 - }, - { - "epoch": 0.44, - "learning_rate": 1.9294738467423364e-06, - "loss": 0.9229, - "step": 17166 - }, - { - "epoch": 0.44, - "learning_rate": 1.9294636390876754e-06, - "loss": 0.7656, - "step": 17167 - }, - { - "epoch": 0.44, - "learning_rate": 1.929453430721366e-06, - "loss": 0.7822, - "step": 17168 - }, - { - "epoch": 0.44, - "learning_rate": 1.9294432216434177e-06, - "loss": 0.749, - "step": 17169 - }, - { - "epoch": 0.44, - "learning_rate": 1.929433011853837e-06, - "loss": 0.7366, - "step": 17170 - }, - { - "epoch": 0.44, - "learning_rate": 1.9294228013526322e-06, - "loss": 0.999, - "step": 17171 - }, - { - "epoch": 0.44, - "learning_rate": 1.929412590139811e-06, - "loss": 0.8984, - "step": 17172 - }, - { - "epoch": 0.44, - "learning_rate": 1.9294023782153815e-06, - "loss": 0.834, - "step": 17173 - }, - { - "epoch": 0.44, - "learning_rate": 1.9293921655793514e-06, - "loss": 0.7378, - "step": 17174 - }, - { - "epoch": 0.44, - "learning_rate": 1.9293819522317286e-06, - "loss": 0.7656, - "step": 17175 - }, - { - "epoch": 0.44, - "learning_rate": 1.9293717381725206e-06, - "loss": 0.9062, - "step": 17176 - }, - { - "epoch": 0.44, - "learning_rate": 1.9293615234017354e-06, - "loss": 0.7676, - "step": 17177 - }, - { - "epoch": 0.44, - "learning_rate": 1.9293513079193808e-06, - "loss": 0.7148, - "step": 17178 - }, - { - "epoch": 0.44, - "learning_rate": 1.9293410917254646e-06, - "loss": 0.9824, - "step": 17179 - }, - { - "epoch": 0.44, - "learning_rate": 1.9293308748199943e-06, - "loss": 0.8574, - "step": 17180 - }, - { - "epoch": 0.44, - "learning_rate": 1.9293206572029785e-06, - "loss": 0.8335, - "step": 17181 - }, - { - "epoch": 0.44, - "learning_rate": 1.9293104388744246e-06, - "loss": 1.0127, - "step": 17182 - }, - { - "epoch": 0.44, - "learning_rate": 1.9293002198343405e-06, - "loss": 1.0039, - "step": 17183 - }, - { - "epoch": 0.44, - "learning_rate": 1.9292900000827336e-06, - "loss": 0.71, - "step": 17184 - }, - { - "epoch": 0.44, - "learning_rate": 1.9292797796196126e-06, - "loss": 1.0195, - "step": 17185 - }, - { - "epoch": 0.44, - "learning_rate": 1.9292695584449843e-06, - "loss": 0.8154, - "step": 17186 - }, - { - "epoch": 0.44, - "learning_rate": 1.9292593365588573e-06, - "loss": 0.6489, - "step": 17187 - }, - { - "epoch": 0.44, - "learning_rate": 1.929249113961239e-06, - "loss": 0.8633, - "step": 17188 - }, - { - "epoch": 0.44, - "learning_rate": 1.9292388906521374e-06, - "loss": 0.8853, - "step": 17189 - }, - { - "epoch": 0.44, - "learning_rate": 1.9292286666315606e-06, - "loss": 0.8398, - "step": 17190 - }, - { - "epoch": 0.44, - "learning_rate": 1.9292184418995155e-06, - "loss": 0.8281, - "step": 17191 - }, - { - "epoch": 0.44, - "learning_rate": 1.9292082164560115e-06, - "loss": 0.8506, - "step": 17192 - }, - { - "epoch": 0.44, - "learning_rate": 1.9291979903010548e-06, - "loss": 0.9307, - "step": 17193 - }, - { - "epoch": 0.44, - "learning_rate": 1.929187763434654e-06, - "loss": 0.9844, - "step": 17194 - }, - { - "epoch": 0.44, - "learning_rate": 1.929177535856817e-06, - "loss": 0.7324, - "step": 17195 - }, - { - "epoch": 0.44, - "learning_rate": 1.9291673075675512e-06, - "loss": 0.626, - "step": 17196 - }, - { - "epoch": 0.44, - "learning_rate": 1.929157078566865e-06, - "loss": 0.6699, - "step": 17197 - }, - { - "epoch": 0.44, - "learning_rate": 1.929146848854766e-06, - "loss": 0.686, - "step": 17198 - }, - { - "epoch": 0.44, - "learning_rate": 1.9291366184312617e-06, - "loss": 0.9609, - "step": 17199 - }, - { - "epoch": 0.44, - "learning_rate": 1.9291263872963607e-06, - "loss": 0.8242, - "step": 17200 - }, - { - "epoch": 0.44, - "learning_rate": 1.92911615545007e-06, - "loss": 0.9619, - "step": 17201 - }, - { - "epoch": 0.44, - "learning_rate": 1.929105922892398e-06, - "loss": 0.9639, - "step": 17202 - }, - { - "epoch": 0.44, - "learning_rate": 1.929095689623352e-06, - "loss": 0.7842, - "step": 17203 - }, - { - "epoch": 0.44, - "learning_rate": 1.9290854556429405e-06, - "loss": 0.8389, - "step": 17204 - }, - { - "epoch": 0.44, - "learning_rate": 1.9290752209511703e-06, - "loss": 0.8564, - "step": 17205 - }, - { - "epoch": 0.44, - "learning_rate": 1.9290649855480505e-06, - "loss": 0.9541, - "step": 17206 - }, - { - "epoch": 0.44, - "learning_rate": 1.929054749433588e-06, - "loss": 0.9141, - "step": 17207 - }, - { - "epoch": 0.44, - "learning_rate": 1.9290445126077916e-06, - "loss": 0.749, - "step": 17208 - }, - { - "epoch": 0.44, - "learning_rate": 1.929034275070668e-06, - "loss": 1.1035, - "step": 17209 - }, - { - "epoch": 0.44, - "learning_rate": 1.929024036822226e-06, - "loss": 0.8633, - "step": 17210 - }, - { - "epoch": 0.44, - "learning_rate": 1.9290137978624727e-06, - "loss": 0.8604, - "step": 17211 - }, - { - "epoch": 0.44, - "learning_rate": 1.9290035581914164e-06, - "loss": 0.8799, - "step": 17212 - }, - { - "epoch": 0.44, - "learning_rate": 1.9289933178090646e-06, - "loss": 0.7109, - "step": 17213 - }, - { - "epoch": 0.44, - "learning_rate": 1.9289830767154257e-06, - "loss": 1.0645, - "step": 17214 - }, - { - "epoch": 0.44, - "learning_rate": 1.9289728349105066e-06, - "loss": 0.7734, - "step": 17215 - }, - { - "epoch": 0.44, - "learning_rate": 1.928962592394316e-06, - "loss": 1.0469, - "step": 17216 - }, - { - "epoch": 0.44, - "learning_rate": 1.9289523491668616e-06, - "loss": 0.875, - "step": 17217 - }, - { - "epoch": 0.44, - "learning_rate": 1.9289421052281513e-06, - "loss": 0.8477, - "step": 17218 - }, - { - "epoch": 0.44, - "learning_rate": 1.928931860578192e-06, - "loss": 0.8408, - "step": 17219 - }, - { - "epoch": 0.44, - "learning_rate": 1.9289216152169933e-06, - "loss": 0.7876, - "step": 17220 - }, - { - "epoch": 0.44, - "learning_rate": 1.9289113691445613e-06, - "loss": 0.959, - "step": 17221 - }, - { - "epoch": 0.44, - "learning_rate": 1.9289011223609046e-06, - "loss": 1.1064, - "step": 17222 - }, - { - "epoch": 0.44, - "learning_rate": 1.928890874866031e-06, - "loss": 0.7715, - "step": 17223 - }, - { - "epoch": 0.44, - "learning_rate": 1.9288806266599485e-06, - "loss": 0.4993, - "step": 17224 - }, - { - "epoch": 0.44, - "learning_rate": 1.928870377742665e-06, - "loss": 0.9873, - "step": 17225 - }, - { - "epoch": 0.44, - "learning_rate": 1.928860128114188e-06, - "loss": 0.7759, - "step": 17226 - }, - { - "epoch": 0.44, - "learning_rate": 1.9288498777745253e-06, - "loss": 0.5688, - "step": 17227 - }, - { - "epoch": 0.44, - "learning_rate": 1.9288396267236855e-06, - "loss": 0.9287, - "step": 17228 - }, - { - "epoch": 0.44, - "learning_rate": 1.9288293749616756e-06, - "loss": 1.0371, - "step": 17229 - }, - { - "epoch": 0.44, - "learning_rate": 1.9288191224885036e-06, - "loss": 1.0254, - "step": 17230 - }, - { - "epoch": 0.44, - "learning_rate": 1.928808869304178e-06, - "loss": 1.0977, - "step": 17231 - }, - { - "epoch": 0.44, - "learning_rate": 1.928798615408706e-06, - "loss": 0.6235, - "step": 17232 - }, - { - "epoch": 0.44, - "learning_rate": 1.928788360802095e-06, - "loss": 0.8691, - "step": 17233 - }, - { - "epoch": 0.44, - "learning_rate": 1.928778105484354e-06, - "loss": 0.9912, - "step": 17234 - }, - { - "epoch": 0.44, - "learning_rate": 1.92876784945549e-06, - "loss": 0.957, - "step": 17235 - }, - { - "epoch": 0.44, - "learning_rate": 1.928757592715511e-06, - "loss": 0.9805, - "step": 17236 - }, - { - "epoch": 0.44, - "learning_rate": 1.928747335264426e-06, - "loss": 0.873, - "step": 17237 - }, - { - "epoch": 0.44, - "learning_rate": 1.9287370771022407e-06, - "loss": 0.668, - "step": 17238 - }, - { - "epoch": 0.44, - "learning_rate": 1.9287268182289652e-06, - "loss": 0.8213, - "step": 17239 - }, - { - "epoch": 0.44, - "learning_rate": 1.9287165586446056e-06, - "loss": 0.8516, - "step": 17240 - }, - { - "epoch": 0.44, - "learning_rate": 1.9287062983491707e-06, - "loss": 0.7429, - "step": 17241 - }, - { - "epoch": 0.44, - "learning_rate": 1.928696037342668e-06, - "loss": 0.8101, - "step": 17242 - }, - { - "epoch": 0.44, - "learning_rate": 1.9286857756251053e-06, - "loss": 0.7139, - "step": 17243 - }, - { - "epoch": 0.44, - "learning_rate": 1.9286755131964907e-06, - "loss": 0.9688, - "step": 17244 - }, - { - "epoch": 0.44, - "learning_rate": 1.928665250056832e-06, - "loss": 0.8379, - "step": 17245 - }, - { - "epoch": 0.44, - "learning_rate": 1.928654986206137e-06, - "loss": 0.9629, - "step": 17246 - }, - { - "epoch": 0.44, - "learning_rate": 1.9286447216444133e-06, - "loss": 0.8506, - "step": 17247 - }, - { - "epoch": 0.44, - "learning_rate": 1.9286344563716693e-06, - "loss": 0.8008, - "step": 17248 - }, - { - "epoch": 0.44, - "learning_rate": 1.9286241903879126e-06, - "loss": 0.7725, - "step": 17249 - }, - { - "epoch": 0.44, - "learning_rate": 1.928613923693151e-06, - "loss": 0.875, - "step": 17250 - }, - { - "epoch": 0.44, - "learning_rate": 1.9286036562873925e-06, - "loss": 0.9473, - "step": 17251 - }, - { - "epoch": 0.44, - "learning_rate": 1.928593388170645e-06, - "loss": 0.9209, - "step": 17252 - }, - { - "epoch": 0.44, - "learning_rate": 1.928583119342916e-06, - "loss": 0.6387, - "step": 17253 - }, - { - "epoch": 0.44, - "learning_rate": 1.928572849804214e-06, - "loss": 0.8594, - "step": 17254 - }, - { - "epoch": 0.44, - "learning_rate": 1.928562579554546e-06, - "loss": 0.8281, - "step": 17255 - }, - { - "epoch": 0.44, - "learning_rate": 1.9285523085939203e-06, - "loss": 0.813, - "step": 17256 - }, - { - "epoch": 0.44, - "learning_rate": 1.9285420369223455e-06, - "loss": 1.0049, - "step": 17257 - }, - { - "epoch": 0.44, - "learning_rate": 1.928531764539828e-06, - "loss": 0.8262, - "step": 17258 - }, - { - "epoch": 0.44, - "learning_rate": 1.9285214914463766e-06, - "loss": 0.7114, - "step": 17259 - }, - { - "epoch": 0.44, - "learning_rate": 1.928511217641999e-06, - "loss": 0.9565, - "step": 17260 - }, - { - "epoch": 0.44, - "learning_rate": 1.9285009431267034e-06, - "loss": 1.0908, - "step": 17261 - }, - { - "epoch": 0.44, - "learning_rate": 1.9284906679004968e-06, - "loss": 0.9268, - "step": 17262 - }, - { - "epoch": 0.44, - "learning_rate": 1.9284803919633877e-06, - "loss": 1.0703, - "step": 17263 - }, - { - "epoch": 0.44, - "learning_rate": 1.928470115315384e-06, - "loss": 0.9619, - "step": 17264 - }, - { - "epoch": 0.44, - "learning_rate": 1.9284598379564935e-06, - "loss": 0.9043, - "step": 17265 - }, - { - "epoch": 0.44, - "learning_rate": 1.928449559886724e-06, - "loss": 1.0225, - "step": 17266 - }, - { - "epoch": 0.44, - "learning_rate": 1.9284392811060834e-06, - "loss": 0.8315, - "step": 17267 - }, - { - "epoch": 0.44, - "learning_rate": 1.9284290016145793e-06, - "loss": 0.877, - "step": 17268 - }, - { - "epoch": 0.44, - "learning_rate": 1.9284187214122197e-06, - "loss": 0.9658, - "step": 17269 - }, - { - "epoch": 0.44, - "learning_rate": 1.9284084404990127e-06, - "loss": 0.8584, - "step": 17270 - }, - { - "epoch": 0.44, - "learning_rate": 1.9283981588749663e-06, - "loss": 1.0537, - "step": 17271 - }, - { - "epoch": 0.44, - "learning_rate": 1.9283878765400882e-06, - "loss": 0.9453, - "step": 17272 - }, - { - "epoch": 0.44, - "learning_rate": 1.928377593494386e-06, - "loss": 0.7153, - "step": 17273 - }, - { - "epoch": 0.44, - "learning_rate": 1.9283673097378673e-06, - "loss": 0.8711, - "step": 17274 - }, - { - "epoch": 0.44, - "learning_rate": 1.928357025270541e-06, - "loss": 0.9971, - "step": 17275 - }, - { - "epoch": 0.44, - "learning_rate": 1.9283467400924142e-06, - "loss": 0.8271, - "step": 17276 - }, - { - "epoch": 0.44, - "learning_rate": 1.928336454203495e-06, - "loss": 0.9458, - "step": 17277 - }, - { - "epoch": 0.44, - "learning_rate": 1.9283261676037913e-06, - "loss": 0.8232, - "step": 17278 - }, - { - "epoch": 0.44, - "learning_rate": 1.9283158802933112e-06, - "loss": 0.667, - "step": 17279 - }, - { - "epoch": 0.44, - "learning_rate": 1.928305592272062e-06, - "loss": 0.8418, - "step": 17280 - }, - { - "epoch": 0.44, - "learning_rate": 1.928295303540052e-06, - "loss": 0.9385, - "step": 17281 - }, - { - "epoch": 0.44, - "learning_rate": 1.928285014097289e-06, - "loss": 0.6704, - "step": 17282 - }, - { - "epoch": 0.44, - "learning_rate": 1.9282747239437803e-06, - "loss": 1.2158, - "step": 17283 - }, - { - "epoch": 0.44, - "learning_rate": 1.928264433079535e-06, - "loss": 0.8799, - "step": 17284 - }, - { - "epoch": 0.44, - "learning_rate": 1.92825414150456e-06, - "loss": 0.7402, - "step": 17285 - }, - { - "epoch": 0.44, - "learning_rate": 1.9282438492188637e-06, - "loss": 0.875, - "step": 17286 - }, - { - "epoch": 0.44, - "learning_rate": 1.9282335562224535e-06, - "loss": 0.6475, - "step": 17287 - }, - { - "epoch": 0.44, - "learning_rate": 1.9282232625153377e-06, - "loss": 0.9619, - "step": 17288 - }, - { - "epoch": 0.44, - "learning_rate": 1.928212968097524e-06, - "loss": 0.9277, - "step": 17289 - }, - { - "epoch": 0.44, - "learning_rate": 1.9282026729690205e-06, - "loss": 0.8125, - "step": 17290 - }, - { - "epoch": 0.44, - "learning_rate": 1.9281923771298347e-06, - "loss": 1.0215, - "step": 17291 - }, - { - "epoch": 0.44, - "learning_rate": 1.9281820805799747e-06, - "loss": 0.7891, - "step": 17292 - }, - { - "epoch": 0.44, - "learning_rate": 1.9281717833194486e-06, - "loss": 0.8042, - "step": 17293 - }, - { - "epoch": 0.44, - "learning_rate": 1.9281614853482635e-06, - "loss": 0.9302, - "step": 17294 - }, - { - "epoch": 0.44, - "learning_rate": 1.9281511866664283e-06, - "loss": 0.9473, - "step": 17295 - }, - { - "epoch": 0.44, - "learning_rate": 1.9281408872739504e-06, - "loss": 0.9297, - "step": 17296 - }, - { - "epoch": 0.44, - "learning_rate": 1.928130587170837e-06, - "loss": 0.9365, - "step": 17297 - }, - { - "epoch": 0.44, - "learning_rate": 1.9281202863570976e-06, - "loss": 0.7278, - "step": 17298 - }, - { - "epoch": 0.44, - "learning_rate": 1.928109984832739e-06, - "loss": 0.9082, - "step": 17299 - }, - { - "epoch": 0.44, - "learning_rate": 1.928099682597769e-06, - "loss": 0.8408, - "step": 17300 - }, - { - "epoch": 0.44, - "learning_rate": 1.928089379652196e-06, - "loss": 0.5466, - "step": 17301 - }, - { - "epoch": 0.44, - "learning_rate": 1.928079075996027e-06, - "loss": 0.8242, - "step": 17302 - }, - { - "epoch": 0.44, - "learning_rate": 1.928068771629271e-06, - "loss": 0.9053, - "step": 17303 - }, - { - "epoch": 0.44, - "learning_rate": 1.9280584665519357e-06, - "loss": 0.7129, - "step": 17304 - }, - { - "epoch": 0.44, - "learning_rate": 1.928048160764028e-06, - "loss": 0.9414, - "step": 17305 - }, - { - "epoch": 0.44, - "learning_rate": 1.928037854265557e-06, - "loss": 0.9756, - "step": 17306 - }, - { - "epoch": 0.44, - "learning_rate": 1.9280275470565302e-06, - "loss": 1.0684, - "step": 17307 - }, - { - "epoch": 0.44, - "learning_rate": 1.928017239136955e-06, - "loss": 0.8652, - "step": 17308 - }, - { - "epoch": 0.44, - "learning_rate": 1.92800693050684e-06, - "loss": 1.1523, - "step": 17309 - }, - { - "epoch": 0.44, - "learning_rate": 1.9279966211661924e-06, - "loss": 0.916, - "step": 17310 - }, - { - "epoch": 0.44, - "learning_rate": 1.9279863111150207e-06, - "loss": 0.7305, - "step": 17311 - }, - { - "epoch": 0.44, - "learning_rate": 1.9279760003533324e-06, - "loss": 0.7236, - "step": 17312 - }, - { - "epoch": 0.44, - "learning_rate": 1.927965688881136e-06, - "loss": 0.8203, - "step": 17313 - }, - { - "epoch": 0.44, - "learning_rate": 1.9279553766984383e-06, - "loss": 0.8975, - "step": 17314 - }, - { - "epoch": 0.44, - "learning_rate": 1.9279450638052483e-06, - "loss": 1.0801, - "step": 17315 - }, - { - "epoch": 0.44, - "learning_rate": 1.9279347502015734e-06, - "loss": 0.9922, - "step": 17316 - }, - { - "epoch": 0.44, - "learning_rate": 1.927924435887421e-06, - "loss": 1.2061, - "step": 17317 - }, - { - "epoch": 0.44, - "learning_rate": 1.9279141208628002e-06, - "loss": 0.8652, - "step": 17318 - }, - { - "epoch": 0.44, - "learning_rate": 1.9279038051277177e-06, - "loss": 0.9648, - "step": 17319 - }, - { - "epoch": 0.44, - "learning_rate": 1.9278934886821824e-06, - "loss": 0.793, - "step": 17320 - }, - { - "epoch": 0.44, - "learning_rate": 1.9278831715262017e-06, - "loss": 0.9414, - "step": 17321 - }, - { - "epoch": 0.44, - "learning_rate": 1.927872853659783e-06, - "loss": 1.1816, - "step": 17322 - }, - { - "epoch": 0.44, - "learning_rate": 1.927862535082935e-06, - "loss": 0.8984, - "step": 17323 - }, - { - "epoch": 0.44, - "learning_rate": 1.9278522157956653e-06, - "loss": 0.9189, - "step": 17324 - }, - { - "epoch": 0.44, - "learning_rate": 1.927841895797982e-06, - "loss": 1.0068, - "step": 17325 - }, - { - "epoch": 0.44, - "learning_rate": 1.927831575089893e-06, - "loss": 0.8257, - "step": 17326 - }, - { - "epoch": 0.44, - "learning_rate": 1.9278212536714052e-06, - "loss": 0.6934, - "step": 17327 - }, - { - "epoch": 0.44, - "learning_rate": 1.9278109315425284e-06, - "loss": 1.0469, - "step": 17328 - }, - { - "epoch": 0.44, - "learning_rate": 1.9278006087032687e-06, - "loss": 0.9561, - "step": 17329 - }, - { - "epoch": 0.44, - "learning_rate": 1.9277902851536346e-06, - "loss": 0.7773, - "step": 17330 - }, - { - "epoch": 0.44, - "learning_rate": 1.9277799608936347e-06, - "loss": 0.916, - "step": 17331 - }, - { - "epoch": 0.44, - "learning_rate": 1.927769635923276e-06, - "loss": 0.9082, - "step": 17332 - }, - { - "epoch": 0.44, - "learning_rate": 1.927759310242567e-06, - "loss": 0.7424, - "step": 17333 - }, - { - "epoch": 0.44, - "learning_rate": 1.927748983851515e-06, - "loss": 0.9863, - "step": 17334 - }, - { - "epoch": 0.44, - "learning_rate": 1.9277386567501284e-06, - "loss": 0.9971, - "step": 17335 - }, - { - "epoch": 0.44, - "learning_rate": 1.927728328938415e-06, - "loss": 0.7686, - "step": 17336 - }, - { - "epoch": 0.44, - "learning_rate": 1.927718000416383e-06, - "loss": 1.1221, - "step": 17337 - }, - { - "epoch": 0.44, - "learning_rate": 1.9277076711840397e-06, - "loss": 0.7632, - "step": 17338 - }, - { - "epoch": 0.44, - "learning_rate": 1.927697341241393e-06, - "loss": 0.9922, - "step": 17339 - }, - { - "epoch": 0.44, - "learning_rate": 1.927687010588452e-06, - "loss": 0.8569, - "step": 17340 - }, - { - "epoch": 0.44, - "learning_rate": 1.9276766792252227e-06, - "loss": 0.6296, - "step": 17341 - }, - { - "epoch": 0.44, - "learning_rate": 1.9276663471517144e-06, - "loss": 0.8081, - "step": 17342 - }, - { - "epoch": 0.44, - "learning_rate": 1.9276560143679347e-06, - "loss": 0.9023, - "step": 17343 - }, - { - "epoch": 0.44, - "learning_rate": 1.9276456808738916e-06, - "loss": 0.8652, - "step": 17344 - }, - { - "epoch": 0.44, - "learning_rate": 1.9276353466695923e-06, - "loss": 0.8857, - "step": 17345 - }, - { - "epoch": 0.44, - "learning_rate": 1.9276250117550458e-06, - "loss": 0.916, - "step": 17346 - }, - { - "epoch": 0.44, - "learning_rate": 1.9276146761302595e-06, - "loss": 0.7988, - "step": 17347 - }, - { - "epoch": 0.44, - "learning_rate": 1.9276043397952413e-06, - "loss": 1.126, - "step": 17348 - }, - { - "epoch": 0.44, - "learning_rate": 1.9275940027499986e-06, - "loss": 1.0518, - "step": 17349 - }, - { - "epoch": 0.44, - "learning_rate": 1.92758366499454e-06, - "loss": 0.9141, - "step": 17350 - }, - { - "epoch": 0.44, - "learning_rate": 1.927573326528874e-06, - "loss": 0.8398, - "step": 17351 - }, - { - "epoch": 0.44, - "learning_rate": 1.927562987353007e-06, - "loss": 0.687, - "step": 17352 - }, - { - "epoch": 0.44, - "learning_rate": 1.9275526474669475e-06, - "loss": 0.7695, - "step": 17353 - }, - { - "epoch": 0.44, - "learning_rate": 1.927542306870704e-06, - "loss": 0.873, - "step": 17354 - }, - { - "epoch": 0.44, - "learning_rate": 1.927531965564284e-06, - "loss": 0.9541, - "step": 17355 - }, - { - "epoch": 0.44, - "learning_rate": 1.9275216235476953e-06, - "loss": 0.8857, - "step": 17356 - }, - { - "epoch": 0.44, - "learning_rate": 1.927511280820946e-06, - "loss": 0.9307, - "step": 17357 - }, - { - "epoch": 0.44, - "learning_rate": 1.927500937384044e-06, - "loss": 0.7703, - "step": 17358 - }, - { - "epoch": 0.44, - "learning_rate": 1.927490593236997e-06, - "loss": 0.8633, - "step": 17359 - }, - { - "epoch": 0.44, - "learning_rate": 1.927480248379813e-06, - "loss": 0.7305, - "step": 17360 - }, - { - "epoch": 0.44, - "learning_rate": 1.9274699028125003e-06, - "loss": 0.7646, - "step": 17361 - }, - { - "epoch": 0.44, - "learning_rate": 1.9274595565350665e-06, - "loss": 0.8037, - "step": 17362 - }, - { - "epoch": 0.45, - "learning_rate": 1.9274492095475196e-06, - "loss": 0.8936, - "step": 17363 - }, - { - "epoch": 0.45, - "learning_rate": 1.9274388618498673e-06, - "loss": 0.8359, - "step": 17364 - }, - { - "epoch": 0.45, - "learning_rate": 1.927428513442118e-06, - "loss": 0.6323, - "step": 17365 - }, - { - "epoch": 0.45, - "learning_rate": 1.927418164324279e-06, - "loss": 1.1875, - "step": 17366 - }, - { - "epoch": 0.45, - "learning_rate": 1.927407814496359e-06, - "loss": 0.8994, - "step": 17367 - }, - { - "epoch": 0.45, - "learning_rate": 1.927397463958365e-06, - "loss": 0.6221, - "step": 17368 - }, - { - "epoch": 0.45, - "learning_rate": 1.9273871127103055e-06, - "loss": 1.0635, - "step": 17369 - }, - { - "epoch": 0.45, - "learning_rate": 1.9273767607521885e-06, - "loss": 1.123, - "step": 17370 - }, - { - "epoch": 0.45, - "learning_rate": 1.927366408084022e-06, - "loss": 0.8252, - "step": 17371 - }, - { - "epoch": 0.45, - "learning_rate": 1.927356054705813e-06, - "loss": 0.8535, - "step": 17372 - }, - { - "epoch": 0.45, - "learning_rate": 1.9273457006175704e-06, - "loss": 0.6111, - "step": 17373 - }, - { - "epoch": 0.45, - "learning_rate": 1.927335345819302e-06, - "loss": 0.9268, - "step": 17374 - }, - { - "epoch": 0.45, - "learning_rate": 1.9273249903110152e-06, - "loss": 0.7969, - "step": 17375 - }, - { - "epoch": 0.45, - "learning_rate": 1.927314634092719e-06, - "loss": 0.5889, - "step": 17376 - }, - { - "epoch": 0.45, - "learning_rate": 1.92730427716442e-06, - "loss": 0.5977, - "step": 17377 - }, - { - "epoch": 0.45, - "learning_rate": 1.9272939195261267e-06, - "loss": 0.9336, - "step": 17378 - }, - { - "epoch": 0.45, - "learning_rate": 1.927283561177848e-06, - "loss": 1.0439, - "step": 17379 - }, - { - "epoch": 0.45, - "learning_rate": 1.9272732021195898e-06, - "loss": 0.8174, - "step": 17380 - }, - { - "epoch": 0.45, - "learning_rate": 1.927262842351362e-06, - "loss": 0.9229, - "step": 17381 - }, - { - "epoch": 0.45, - "learning_rate": 1.927252481873171e-06, - "loss": 0.959, - "step": 17382 - }, - { - "epoch": 0.45, - "learning_rate": 1.9272421206850255e-06, - "loss": 0.9014, - "step": 17383 - }, - { - "epoch": 0.45, - "learning_rate": 1.9272317587869336e-06, - "loss": 0.9648, - "step": 17384 - }, - { - "epoch": 0.45, - "learning_rate": 1.927221396178903e-06, - "loss": 0.999, - "step": 17385 - }, - { - "epoch": 0.45, - "learning_rate": 1.927211032860942e-06, - "loss": 0.9795, - "step": 17386 - }, - { - "epoch": 0.45, - "learning_rate": 1.927200668833057e-06, - "loss": 0.9473, - "step": 17387 - }, - { - "epoch": 0.45, - "learning_rate": 1.927190304095258e-06, - "loss": 0.9922, - "step": 17388 - }, - { - "epoch": 0.45, - "learning_rate": 1.927179938647552e-06, - "loss": 0.8652, - "step": 17389 - }, - { - "epoch": 0.45, - "learning_rate": 1.9271695724899464e-06, - "loss": 0.9326, - "step": 17390 - }, - { - "epoch": 0.45, - "learning_rate": 1.9271592056224503e-06, - "loss": 0.7485, - "step": 17391 - }, - { - "epoch": 0.45, - "learning_rate": 1.9271488380450703e-06, - "loss": 0.7236, - "step": 17392 - }, - { - "epoch": 0.45, - "learning_rate": 1.9271384697578156e-06, - "loss": 0.9629, - "step": 17393 - }, - { - "epoch": 0.45, - "learning_rate": 1.9271281007606936e-06, - "loss": 1.0312, - "step": 17394 - }, - { - "epoch": 0.45, - "learning_rate": 1.9271177310537123e-06, - "loss": 0.7749, - "step": 17395 - }, - { - "epoch": 0.45, - "learning_rate": 1.927107360636879e-06, - "loss": 0.9717, - "step": 17396 - }, - { - "epoch": 0.45, - "learning_rate": 1.927096989510203e-06, - "loss": 0.6982, - "step": 17397 - }, - { - "epoch": 0.45, - "learning_rate": 1.9270866176736912e-06, - "loss": 0.8721, - "step": 17398 - }, - { - "epoch": 0.45, - "learning_rate": 1.9270762451273517e-06, - "loss": 0.8047, - "step": 17399 - }, - { - "epoch": 0.45, - "learning_rate": 1.9270658718711926e-06, - "loss": 1.2021, - "step": 17400 - }, - { - "epoch": 0.45, - "learning_rate": 1.9270554979052215e-06, - "loss": 0.958, - "step": 17401 - }, - { - "epoch": 0.45, - "learning_rate": 1.927045123229447e-06, - "loss": 0.9541, - "step": 17402 - }, - { - "epoch": 0.45, - "learning_rate": 1.9270347478438768e-06, - "loss": 0.821, - "step": 17403 - }, - { - "epoch": 0.45, - "learning_rate": 1.9270243717485183e-06, - "loss": 0.8496, - "step": 17404 - }, - { - "epoch": 0.45, - "learning_rate": 1.92701399494338e-06, - "loss": 0.8965, - "step": 17405 - }, - { - "epoch": 0.45, - "learning_rate": 1.9270036174284697e-06, - "loss": 0.8955, - "step": 17406 - }, - { - "epoch": 0.45, - "learning_rate": 1.9269932392037954e-06, - "loss": 0.9883, - "step": 17407 - }, - { - "epoch": 0.45, - "learning_rate": 1.9269828602693654e-06, - "loss": 0.9453, - "step": 17408 - }, - { - "epoch": 0.45, - "learning_rate": 1.9269724806251866e-06, - "loss": 0.8237, - "step": 17409 - }, - { - "epoch": 0.45, - "learning_rate": 1.926962100271268e-06, - "loss": 0.9033, - "step": 17410 - }, - { - "epoch": 0.45, - "learning_rate": 1.926951719207617e-06, - "loss": 0.8467, - "step": 17411 - }, - { - "epoch": 0.45, - "learning_rate": 1.9269413374342417e-06, - "loss": 0.8281, - "step": 17412 - }, - { - "epoch": 0.45, - "learning_rate": 1.9269309549511502e-06, - "loss": 0.7471, - "step": 17413 - }, - { - "epoch": 0.45, - "learning_rate": 1.9269205717583498e-06, - "loss": 0.8379, - "step": 17414 - }, - { - "epoch": 0.45, - "learning_rate": 1.9269101878558492e-06, - "loss": 0.9302, - "step": 17415 - }, - { - "epoch": 0.45, - "learning_rate": 1.926899803243656e-06, - "loss": 0.6943, - "step": 17416 - }, - { - "epoch": 0.45, - "learning_rate": 1.9268894179217787e-06, - "loss": 0.9595, - "step": 17417 - }, - { - "epoch": 0.45, - "learning_rate": 1.9268790318902244e-06, - "loss": 0.9307, - "step": 17418 - }, - { - "epoch": 0.45, - "learning_rate": 1.9268686451490014e-06, - "loss": 0.8115, - "step": 17419 - }, - { - "epoch": 0.45, - "learning_rate": 1.926858257698118e-06, - "loss": 1.0283, - "step": 17420 - }, - { - "epoch": 0.45, - "learning_rate": 1.926847869537582e-06, - "loss": 1.1543, - "step": 17421 - }, - { - "epoch": 0.45, - "learning_rate": 1.926837480667401e-06, - "loss": 0.7842, - "step": 17422 - }, - { - "epoch": 0.45, - "learning_rate": 1.9268270910875824e-06, - "loss": 0.8701, - "step": 17423 - }, - { - "epoch": 0.45, - "learning_rate": 1.9268167007981358e-06, - "loss": 0.8706, - "step": 17424 - }, - { - "epoch": 0.45, - "learning_rate": 1.9268063097990683e-06, - "loss": 0.9346, - "step": 17425 - }, - { - "epoch": 0.45, - "learning_rate": 1.9267959180903875e-06, - "loss": 1.0957, - "step": 17426 - }, - { - "epoch": 0.45, - "learning_rate": 1.9267855256721014e-06, - "loss": 0.9219, - "step": 17427 - }, - { - "epoch": 0.45, - "learning_rate": 1.9267751325442186e-06, - "loss": 0.8237, - "step": 17428 - }, - { - "epoch": 0.45, - "learning_rate": 1.9267647387067466e-06, - "loss": 0.7334, - "step": 17429 - }, - { - "epoch": 0.45, - "learning_rate": 1.926754344159694e-06, - "loss": 0.9199, - "step": 17430 - }, - { - "epoch": 0.45, - "learning_rate": 1.9267439489030674e-06, - "loss": 0.8457, - "step": 17431 - }, - { - "epoch": 0.45, - "learning_rate": 1.926733552936876e-06, - "loss": 0.8838, - "step": 17432 - }, - { - "epoch": 0.45, - "learning_rate": 1.926723156261127e-06, - "loss": 1.1074, - "step": 17433 - }, - { - "epoch": 0.45, - "learning_rate": 1.926712758875829e-06, - "loss": 0.8574, - "step": 17434 - }, - { - "epoch": 0.45, - "learning_rate": 1.9267023607809896e-06, - "loss": 1.0186, - "step": 17435 - }, - { - "epoch": 0.45, - "learning_rate": 1.9266919619766168e-06, - "loss": 0.9121, - "step": 17436 - }, - { - "epoch": 0.45, - "learning_rate": 1.926681562462719e-06, - "loss": 1.1318, - "step": 17437 - }, - { - "epoch": 0.45, - "learning_rate": 1.9266711622393032e-06, - "loss": 0.8286, - "step": 17438 - }, - { - "epoch": 0.45, - "learning_rate": 1.9266607613063777e-06, - "loss": 0.8789, - "step": 17439 - }, - { - "epoch": 0.45, - "learning_rate": 1.926650359663951e-06, - "loss": 0.7979, - "step": 17440 - }, - { - "epoch": 0.45, - "learning_rate": 1.9266399573120307e-06, - "loss": 0.8506, - "step": 17441 - }, - { - "epoch": 0.45, - "learning_rate": 1.926629554250625e-06, - "loss": 0.9795, - "step": 17442 - }, - { - "epoch": 0.45, - "learning_rate": 1.926619150479741e-06, - "loss": 0.7939, - "step": 17443 - }, - { - "epoch": 0.45, - "learning_rate": 1.9266087459993877e-06, - "loss": 0.8613, - "step": 17444 - }, - { - "epoch": 0.45, - "learning_rate": 1.926598340809573e-06, - "loss": 0.6875, - "step": 17445 - }, - { - "epoch": 0.45, - "learning_rate": 1.926587934910304e-06, - "loss": 0.8408, - "step": 17446 - }, - { - "epoch": 0.45, - "learning_rate": 1.92657752830159e-06, - "loss": 0.9355, - "step": 17447 - }, - { - "epoch": 0.45, - "learning_rate": 1.926567120983438e-06, - "loss": 0.9541, - "step": 17448 - }, - { - "epoch": 0.45, - "learning_rate": 1.9265567129558555e-06, - "loss": 0.958, - "step": 17449 - }, - { - "epoch": 0.45, - "learning_rate": 1.9265463042188517e-06, - "loss": 0.7168, - "step": 17450 - }, - { - "epoch": 0.45, - "learning_rate": 1.9265358947724336e-06, - "loss": 1.1436, - "step": 17451 - }, - { - "epoch": 0.45, - "learning_rate": 1.9265254846166097e-06, - "loss": 0.8154, - "step": 17452 - }, - { - "epoch": 0.45, - "learning_rate": 1.926515073751388e-06, - "loss": 1.0859, - "step": 17453 - }, - { - "epoch": 0.45, - "learning_rate": 1.926504662176776e-06, - "loss": 0.9062, - "step": 17454 - }, - { - "epoch": 0.45, - "learning_rate": 1.9264942498927824e-06, - "loss": 0.9639, - "step": 17455 - }, - { - "epoch": 0.45, - "learning_rate": 1.9264838368994147e-06, - "loss": 0.9678, - "step": 17456 - }, - { - "epoch": 0.45, - "learning_rate": 1.926473423196681e-06, - "loss": 1.0098, - "step": 17457 - }, - { - "epoch": 0.45, - "learning_rate": 1.9264630087845886e-06, - "loss": 0.9014, - "step": 17458 - }, - { - "epoch": 0.45, - "learning_rate": 1.9264525936631467e-06, - "loss": 0.9141, - "step": 17459 - }, - { - "epoch": 0.45, - "learning_rate": 1.9264421778323622e-06, - "loss": 0.8662, - "step": 17460 - }, - { - "epoch": 0.45, - "learning_rate": 1.926431761292244e-06, - "loss": 0.8525, - "step": 17461 - }, - { - "epoch": 0.45, - "learning_rate": 1.926421344042799e-06, - "loss": 0.6724, - "step": 17462 - }, - { - "epoch": 0.45, - "learning_rate": 1.926410926084036e-06, - "loss": 0.9658, - "step": 17463 - }, - { - "epoch": 0.45, - "learning_rate": 1.926400507415963e-06, - "loss": 0.9922, - "step": 17464 - }, - { - "epoch": 0.45, - "learning_rate": 1.9263900880385878e-06, - "loss": 0.8359, - "step": 17465 - }, - { - "epoch": 0.45, - "learning_rate": 1.926379667951918e-06, - "loss": 0.8369, - "step": 17466 - }, - { - "epoch": 0.45, - "learning_rate": 1.926369247155962e-06, - "loss": 0.8452, - "step": 17467 - }, - { - "epoch": 0.45, - "learning_rate": 1.926358825650728e-06, - "loss": 1.0254, - "step": 17468 - }, - { - "epoch": 0.45, - "learning_rate": 1.926348403436223e-06, - "loss": 1.125, - "step": 17469 - }, - { - "epoch": 0.45, - "learning_rate": 1.926337980512456e-06, - "loss": 0.8882, - "step": 17470 - }, - { - "epoch": 0.45, - "learning_rate": 1.9263275568794346e-06, - "loss": 0.8379, - "step": 17471 - }, - { - "epoch": 0.45, - "learning_rate": 1.9263171325371667e-06, - "loss": 0.7891, - "step": 17472 - }, - { - "epoch": 0.45, - "learning_rate": 1.9263067074856603e-06, - "loss": 0.8623, - "step": 17473 - }, - { - "epoch": 0.45, - "learning_rate": 1.9262962817249235e-06, - "loss": 1.0898, - "step": 17474 - }, - { - "epoch": 0.45, - "learning_rate": 1.9262858552549642e-06, - "loss": 0.998, - "step": 17475 - }, - { - "epoch": 0.45, - "learning_rate": 1.9262754280757903e-06, - "loss": 0.7954, - "step": 17476 - }, - { - "epoch": 0.45, - "learning_rate": 1.9262650001874105e-06, - "loss": 0.9561, - "step": 17477 - }, - { - "epoch": 0.45, - "learning_rate": 1.9262545715898315e-06, - "loss": 0.9961, - "step": 17478 - }, - { - "epoch": 0.45, - "learning_rate": 1.926244142283062e-06, - "loss": 1.0625, - "step": 17479 - }, - { - "epoch": 0.45, - "learning_rate": 1.9262337122671103e-06, - "loss": 1.0391, - "step": 17480 - }, - { - "epoch": 0.45, - "learning_rate": 1.9262232815419837e-06, - "loss": 0.8159, - "step": 17481 - }, - { - "epoch": 0.45, - "learning_rate": 1.926212850107691e-06, - "loss": 0.5723, - "step": 17482 - }, - { - "epoch": 0.45, - "learning_rate": 1.9262024179642395e-06, - "loss": 0.9482, - "step": 17483 - }, - { - "epoch": 0.45, - "learning_rate": 1.926191985111637e-06, - "loss": 0.5923, - "step": 17484 - }, - { - "epoch": 0.45, - "learning_rate": 1.926181551549892e-06, - "loss": 0.8848, - "step": 17485 - }, - { - "epoch": 0.45, - "learning_rate": 1.9261711172790127e-06, - "loss": 0.8682, - "step": 17486 - }, - { - "epoch": 0.45, - "learning_rate": 1.926160682299007e-06, - "loss": 0.5776, - "step": 17487 - }, - { - "epoch": 0.45, - "learning_rate": 1.926150246609882e-06, - "loss": 0.8242, - "step": 17488 - }, - { - "epoch": 0.45, - "learning_rate": 1.9261398102116467e-06, - "loss": 0.9058, - "step": 17489 - }, - { - "epoch": 0.45, - "learning_rate": 1.9261293731043085e-06, - "loss": 0.96, - "step": 17490 - }, - { - "epoch": 0.45, - "learning_rate": 1.926118935287876e-06, - "loss": 0.8096, - "step": 17491 - }, - { - "epoch": 0.45, - "learning_rate": 1.9261084967623567e-06, - "loss": 0.9531, - "step": 17492 - }, - { - "epoch": 0.45, - "learning_rate": 1.9260980575277584e-06, - "loss": 0.9014, - "step": 17493 - }, - { - "epoch": 0.45, - "learning_rate": 1.9260876175840893e-06, - "loss": 0.9355, - "step": 17494 - }, - { - "epoch": 0.45, - "learning_rate": 1.9260771769313583e-06, - "loss": 0.7842, - "step": 17495 - }, - { - "epoch": 0.45, - "learning_rate": 1.926066735569572e-06, - "loss": 0.9199, - "step": 17496 - }, - { - "epoch": 0.45, - "learning_rate": 1.926056293498739e-06, - "loss": 0.8418, - "step": 17497 - }, - { - "epoch": 0.45, - "learning_rate": 1.926045850718867e-06, - "loss": 1.0186, - "step": 17498 - }, - { - "epoch": 0.45, - "learning_rate": 1.926035407229965e-06, - "loss": 0.8291, - "step": 17499 - }, - { - "epoch": 0.45, - "learning_rate": 1.9260249630320398e-06, - "loss": 0.8213, - "step": 17500 - }, - { - "epoch": 0.45, - "learning_rate": 1.9260145181250998e-06, - "loss": 0.9141, - "step": 17501 - }, - { - "epoch": 0.45, - "learning_rate": 1.9260040725091534e-06, - "loss": 0.9502, - "step": 17502 - }, - { - "epoch": 0.45, - "learning_rate": 1.925993626184208e-06, - "loss": 0.7783, - "step": 17503 - }, - { - "epoch": 0.45, - "learning_rate": 1.925983179150272e-06, - "loss": 1.0176, - "step": 17504 - }, - { - "epoch": 0.45, - "learning_rate": 1.925972731407353e-06, - "loss": 0.75, - "step": 17505 - }, - { - "epoch": 0.45, - "learning_rate": 1.9259622829554596e-06, - "loss": 0.9893, - "step": 17506 - }, - { - "epoch": 0.45, - "learning_rate": 1.9259518337945994e-06, - "loss": 0.6455, - "step": 17507 - }, - { - "epoch": 0.45, - "learning_rate": 1.9259413839247803e-06, - "loss": 0.8584, - "step": 17508 - }, - { - "epoch": 0.45, - "learning_rate": 1.9259309333460103e-06, - "loss": 0.8906, - "step": 17509 - }, - { - "epoch": 0.45, - "learning_rate": 1.925920482058298e-06, - "loss": 1.127, - "step": 17510 - }, - { - "epoch": 0.45, - "learning_rate": 1.9259100300616507e-06, - "loss": 0.6641, - "step": 17511 - }, - { - "epoch": 0.45, - "learning_rate": 1.9258995773560767e-06, - "loss": 0.833, - "step": 17512 - }, - { - "epoch": 0.45, - "learning_rate": 1.925889123941584e-06, - "loss": 0.9971, - "step": 17513 - }, - { - "epoch": 0.45, - "learning_rate": 1.9258786698181805e-06, - "loss": 1.0859, - "step": 17514 - }, - { - "epoch": 0.45, - "learning_rate": 1.925868214985874e-06, - "loss": 0.8149, - "step": 17515 - }, - { - "epoch": 0.45, - "learning_rate": 1.9258577594446735e-06, - "loss": 0.7324, - "step": 17516 - }, - { - "epoch": 0.45, - "learning_rate": 1.925847303194586e-06, - "loss": 1.1777, - "step": 17517 - }, - { - "epoch": 0.45, - "learning_rate": 1.9258368462356195e-06, - "loss": 0.9121, - "step": 17518 - }, - { - "epoch": 0.45, - "learning_rate": 1.9258263885677825e-06, - "loss": 1.0811, - "step": 17519 - }, - { - "epoch": 0.45, - "learning_rate": 1.925815930191083e-06, - "loss": 0.915, - "step": 17520 - }, - { - "epoch": 0.45, - "learning_rate": 1.9258054711055283e-06, - "loss": 0.6503, - "step": 17521 - }, - { - "epoch": 0.45, - "learning_rate": 1.925795011311127e-06, - "loss": 0.8594, - "step": 17522 - }, - { - "epoch": 0.45, - "learning_rate": 1.9257845508078872e-06, - "loss": 0.9404, - "step": 17523 - }, - { - "epoch": 0.45, - "learning_rate": 1.925774089595817e-06, - "loss": 0.689, - "step": 17524 - }, - { - "epoch": 0.45, - "learning_rate": 1.925763627674924e-06, - "loss": 0.8906, - "step": 17525 - }, - { - "epoch": 0.45, - "learning_rate": 1.9257531650452164e-06, - "loss": 0.8545, - "step": 17526 - }, - { - "epoch": 0.45, - "learning_rate": 1.925742701706702e-06, - "loss": 1.0137, - "step": 17527 - }, - { - "epoch": 0.45, - "learning_rate": 1.925732237659389e-06, - "loss": 0.9004, - "step": 17528 - }, - { - "epoch": 0.45, - "learning_rate": 1.9257217729032855e-06, - "loss": 0.832, - "step": 17529 - }, - { - "epoch": 0.45, - "learning_rate": 1.9257113074383994e-06, - "loss": 1.1055, - "step": 17530 - }, - { - "epoch": 0.45, - "learning_rate": 1.9257008412647385e-06, - "loss": 0.7822, - "step": 17531 - }, - { - "epoch": 0.45, - "learning_rate": 1.9256903743823114e-06, - "loss": 0.8145, - "step": 17532 - }, - { - "epoch": 0.45, - "learning_rate": 1.925679906791125e-06, - "loss": 0.8418, - "step": 17533 - }, - { - "epoch": 0.45, - "learning_rate": 1.925669438491189e-06, - "loss": 0.9668, - "step": 17534 - }, - { - "epoch": 0.45, - "learning_rate": 1.92565896948251e-06, - "loss": 0.9453, - "step": 17535 - }, - { - "epoch": 0.45, - "learning_rate": 1.925648499765096e-06, - "loss": 0.9756, - "step": 17536 - }, - { - "epoch": 0.45, - "learning_rate": 1.9256380293389564e-06, - "loss": 1.0352, - "step": 17537 - }, - { - "epoch": 0.45, - "learning_rate": 1.925627558204098e-06, - "loss": 0.9316, - "step": 17538 - }, - { - "epoch": 0.45, - "learning_rate": 1.925617086360529e-06, - "loss": 0.8838, - "step": 17539 - }, - { - "epoch": 0.45, - "learning_rate": 1.925606613808258e-06, - "loss": 0.8604, - "step": 17540 - }, - { - "epoch": 0.45, - "learning_rate": 1.925596140547292e-06, - "loss": 1.0664, - "step": 17541 - }, - { - "epoch": 0.45, - "learning_rate": 1.92558566657764e-06, - "loss": 1.0879, - "step": 17542 - }, - { - "epoch": 0.45, - "learning_rate": 1.9255751918993094e-06, - "loss": 0.6094, - "step": 17543 - }, - { - "epoch": 0.45, - "learning_rate": 1.9255647165123086e-06, - "loss": 0.9062, - "step": 17544 - }, - { - "epoch": 0.45, - "learning_rate": 1.925554240416645e-06, - "loss": 0.8428, - "step": 17545 - }, - { - "epoch": 0.45, - "learning_rate": 1.925543763612328e-06, - "loss": 1.04, - "step": 17546 - }, - { - "epoch": 0.45, - "learning_rate": 1.925533286099364e-06, - "loss": 1.0117, - "step": 17547 - }, - { - "epoch": 0.45, - "learning_rate": 1.9255228078777615e-06, - "loss": 0.8535, - "step": 17548 - }, - { - "epoch": 0.45, - "learning_rate": 1.9255123289475295e-06, - "loss": 0.793, - "step": 17549 - }, - { - "epoch": 0.45, - "learning_rate": 1.9255018493086743e-06, - "loss": 0.7549, - "step": 17550 - }, - { - "epoch": 0.45, - "learning_rate": 1.9254913689612054e-06, - "loss": 0.998, - "step": 17551 - }, - { - "epoch": 0.45, - "learning_rate": 1.9254808879051304e-06, - "loss": 0.8088, - "step": 17552 - }, - { - "epoch": 0.45, - "learning_rate": 1.9254704061404576e-06, - "loss": 1.0361, - "step": 17553 - }, - { - "epoch": 0.45, - "learning_rate": 1.9254599236671943e-06, - "loss": 0.916, - "step": 17554 - }, - { - "epoch": 0.45, - "learning_rate": 1.9254494404853486e-06, - "loss": 0.7676, - "step": 17555 - }, - { - "epoch": 0.45, - "learning_rate": 1.9254389565949294e-06, - "loss": 0.8301, - "step": 17556 - }, - { - "epoch": 0.45, - "learning_rate": 1.9254284719959433e-06, - "loss": 0.9375, - "step": 17557 - }, - { - "epoch": 0.45, - "learning_rate": 1.9254179866884e-06, - "loss": 0.9902, - "step": 17558 - }, - { - "epoch": 0.45, - "learning_rate": 1.9254075006723065e-06, - "loss": 0.8271, - "step": 17559 - }, - { - "epoch": 0.45, - "learning_rate": 1.925397013947671e-06, - "loss": 0.7075, - "step": 17560 - }, - { - "epoch": 0.45, - "learning_rate": 1.9253865265145012e-06, - "loss": 0.8135, - "step": 17561 - }, - { - "epoch": 0.45, - "learning_rate": 1.925376038372806e-06, - "loss": 0.8604, - "step": 17562 - }, - { - "epoch": 0.45, - "learning_rate": 1.9253655495225923e-06, - "loss": 0.6406, - "step": 17563 - }, - { - "epoch": 0.45, - "learning_rate": 1.9253550599638692e-06, - "loss": 0.9697, - "step": 17564 - }, - { - "epoch": 0.45, - "learning_rate": 1.925344569696644e-06, - "loss": 0.9717, - "step": 17565 - }, - { - "epoch": 0.45, - "learning_rate": 1.925334078720925e-06, - "loss": 0.9541, - "step": 17566 - }, - { - "epoch": 0.45, - "learning_rate": 1.9253235870367207e-06, - "loss": 0.8447, - "step": 17567 - }, - { - "epoch": 0.45, - "learning_rate": 1.9253130946440384e-06, - "loss": 0.8467, - "step": 17568 - }, - { - "epoch": 0.45, - "learning_rate": 1.9253026015428867e-06, - "loss": 0.877, - "step": 17569 - }, - { - "epoch": 0.45, - "learning_rate": 1.925292107733273e-06, - "loss": 0.6162, - "step": 17570 - }, - { - "epoch": 0.45, - "learning_rate": 1.9252816132152058e-06, - "loss": 1.0244, - "step": 17571 - }, - { - "epoch": 0.45, - "learning_rate": 1.925271117988693e-06, - "loss": 0.834, - "step": 17572 - }, - { - "epoch": 0.45, - "learning_rate": 1.9252606220537427e-06, - "loss": 0.7178, - "step": 17573 - }, - { - "epoch": 0.45, - "learning_rate": 1.9252501254103627e-06, - "loss": 1.0195, - "step": 17574 - }, - { - "epoch": 0.45, - "learning_rate": 1.9252396280585613e-06, - "loss": 0.7617, - "step": 17575 - }, - { - "epoch": 0.45, - "learning_rate": 1.9252291299983464e-06, - "loss": 0.9375, - "step": 17576 - }, - { - "epoch": 0.45, - "learning_rate": 1.925218631229726e-06, - "loss": 0.8198, - "step": 17577 - }, - { - "epoch": 0.45, - "learning_rate": 1.925208131752709e-06, - "loss": 1.0215, - "step": 17578 - }, - { - "epoch": 0.45, - "learning_rate": 1.925197631567302e-06, - "loss": 0.6733, - "step": 17579 - }, - { - "epoch": 0.45, - "learning_rate": 1.9251871306735135e-06, - "loss": 0.499, - "step": 17580 - }, - { - "epoch": 0.45, - "learning_rate": 1.9251766290713524e-06, - "loss": 0.7075, - "step": 17581 - }, - { - "epoch": 0.45, - "learning_rate": 1.9251661267608257e-06, - "loss": 0.8179, - "step": 17582 - }, - { - "epoch": 0.45, - "learning_rate": 1.925155623741942e-06, - "loss": 0.7056, - "step": 17583 - }, - { - "epoch": 0.45, - "learning_rate": 1.925145120014709e-06, - "loss": 0.9316, - "step": 17584 - }, - { - "epoch": 0.45, - "learning_rate": 1.925134615579135e-06, - "loss": 0.7954, - "step": 17585 - }, - { - "epoch": 0.45, - "learning_rate": 1.925124110435228e-06, - "loss": 0.9873, - "step": 17586 - }, - { - "epoch": 0.45, - "learning_rate": 1.925113604582996e-06, - "loss": 0.9639, - "step": 17587 - }, - { - "epoch": 0.45, - "learning_rate": 1.925103098022447e-06, - "loss": 0.8525, - "step": 17588 - }, - { - "epoch": 0.45, - "learning_rate": 1.925092590753589e-06, - "loss": 0.8516, - "step": 17589 - }, - { - "epoch": 0.45, - "learning_rate": 1.9250820827764302e-06, - "loss": 0.8384, - "step": 17590 - }, - { - "epoch": 0.45, - "learning_rate": 1.9250715740909785e-06, - "loss": 1.0146, - "step": 17591 - }, - { - "epoch": 0.45, - "learning_rate": 1.9250610646972426e-06, - "loss": 0.7783, - "step": 17592 - }, - { - "epoch": 0.45, - "learning_rate": 1.9250505545952295e-06, - "loss": 0.9795, - "step": 17593 - }, - { - "epoch": 0.45, - "learning_rate": 1.925040043784948e-06, - "loss": 0.7332, - "step": 17594 - }, - { - "epoch": 0.45, - "learning_rate": 1.9250295322664056e-06, - "loss": 0.9863, - "step": 17595 - }, - { - "epoch": 0.45, - "learning_rate": 1.9250190200396104e-06, - "loss": 1.001, - "step": 17596 - }, - { - "epoch": 0.45, - "learning_rate": 1.925008507104571e-06, - "loss": 0.8281, - "step": 17597 - }, - { - "epoch": 0.45, - "learning_rate": 1.924997993461295e-06, - "loss": 0.751, - "step": 17598 - }, - { - "epoch": 0.45, - "learning_rate": 1.9249874791097905e-06, - "loss": 0.6821, - "step": 17599 - }, - { - "epoch": 0.45, - "learning_rate": 1.924976964050066e-06, - "loss": 0.8701, - "step": 17600 - }, - { - "epoch": 0.45, - "learning_rate": 1.924966448282129e-06, - "loss": 0.7134, - "step": 17601 - }, - { - "epoch": 0.45, - "learning_rate": 1.9249559318059875e-06, - "loss": 0.9863, - "step": 17602 - }, - { - "epoch": 0.45, - "learning_rate": 1.92494541462165e-06, - "loss": 0.9492, - "step": 17603 - }, - { - "epoch": 0.45, - "learning_rate": 1.924934896729124e-06, - "loss": 0.8774, - "step": 17604 - }, - { - "epoch": 0.45, - "learning_rate": 1.9249243781284188e-06, - "loss": 0.9629, - "step": 17605 - }, - { - "epoch": 0.45, - "learning_rate": 1.9249138588195404e-06, - "loss": 0.9414, - "step": 17606 - }, - { - "epoch": 0.45, - "learning_rate": 1.9249033388024985e-06, - "loss": 0.6062, - "step": 17607 - }, - { - "epoch": 0.45, - "learning_rate": 1.9248928180773006e-06, - "loss": 0.6953, - "step": 17608 - }, - { - "epoch": 0.45, - "learning_rate": 1.924882296643955e-06, - "loss": 0.9248, - "step": 17609 - }, - { - "epoch": 0.45, - "learning_rate": 1.924871774502469e-06, - "loss": 1.1074, - "step": 17610 - }, - { - "epoch": 0.45, - "learning_rate": 1.9248612516528516e-06, - "loss": 0.9219, - "step": 17611 - }, - { - "epoch": 0.45, - "learning_rate": 1.9248507280951103e-06, - "loss": 0.8281, - "step": 17612 - }, - { - "epoch": 0.45, - "learning_rate": 1.9248402038292533e-06, - "loss": 0.6689, - "step": 17613 - }, - { - "epoch": 0.45, - "learning_rate": 1.924829678855289e-06, - "loss": 0.7861, - "step": 17614 - }, - { - "epoch": 0.45, - "learning_rate": 1.924819153173225e-06, - "loss": 0.9199, - "step": 17615 - }, - { - "epoch": 0.45, - "learning_rate": 1.9248086267830696e-06, - "loss": 0.8252, - "step": 17616 - }, - { - "epoch": 0.45, - "learning_rate": 1.9247980996848305e-06, - "loss": 0.8994, - "step": 17617 - }, - { - "epoch": 0.45, - "learning_rate": 1.9247875718785164e-06, - "loss": 0.9062, - "step": 17618 - }, - { - "epoch": 0.45, - "learning_rate": 1.9247770433641344e-06, - "loss": 0.8833, - "step": 17619 - }, - { - "epoch": 0.45, - "learning_rate": 1.9247665141416934e-06, - "loss": 0.9004, - "step": 17620 - }, - { - "epoch": 0.45, - "learning_rate": 1.9247559842112015e-06, - "loss": 0.8936, - "step": 17621 - }, - { - "epoch": 0.45, - "learning_rate": 1.9247454535726663e-06, - "loss": 1.0049, - "step": 17622 - }, - { - "epoch": 0.45, - "learning_rate": 1.9247349222260958e-06, - "loss": 1.0469, - "step": 17623 - }, - { - "epoch": 0.45, - "learning_rate": 1.9247243901714985e-06, - "loss": 1.0312, - "step": 17624 - }, - { - "epoch": 0.45, - "learning_rate": 1.924713857408882e-06, - "loss": 0.9541, - "step": 17625 - }, - { - "epoch": 0.45, - "learning_rate": 1.924703323938255e-06, - "loss": 0.9971, - "step": 17626 - }, - { - "epoch": 0.45, - "learning_rate": 1.924692789759625e-06, - "loss": 0.9062, - "step": 17627 - }, - { - "epoch": 0.45, - "learning_rate": 1.924682254873e-06, - "loss": 0.8037, - "step": 17628 - }, - { - "epoch": 0.45, - "learning_rate": 1.924671719278389e-06, - "loss": 0.9619, - "step": 17629 - }, - { - "epoch": 0.45, - "learning_rate": 1.924661182975799e-06, - "loss": 0.7881, - "step": 17630 - }, - { - "epoch": 0.45, - "learning_rate": 1.924650645965238e-06, - "loss": 0.8623, - "step": 17631 - }, - { - "epoch": 0.45, - "learning_rate": 1.9246401082467153e-06, - "loss": 0.9004, - "step": 17632 - }, - { - "epoch": 0.45, - "learning_rate": 1.9246295698202377e-06, - "loss": 0.7297, - "step": 17633 - }, - { - "epoch": 0.45, - "learning_rate": 1.9246190306858137e-06, - "loss": 0.5986, - "step": 17634 - }, - { - "epoch": 0.45, - "learning_rate": 1.9246084908434515e-06, - "loss": 1.0986, - "step": 17635 - }, - { - "epoch": 0.45, - "learning_rate": 1.924597950293159e-06, - "loss": 0.8428, - "step": 17636 - }, - { - "epoch": 0.45, - "learning_rate": 1.924587409034945e-06, - "loss": 0.6895, - "step": 17637 - }, - { - "epoch": 0.45, - "learning_rate": 1.924576867068816e-06, - "loss": 0.9189, - "step": 17638 - }, - { - "epoch": 0.45, - "learning_rate": 1.9245663243947817e-06, - "loss": 0.7451, - "step": 17639 - }, - { - "epoch": 0.45, - "learning_rate": 1.9245557810128492e-06, - "loss": 0.79, - "step": 17640 - }, - { - "epoch": 0.45, - "learning_rate": 1.924545236923027e-06, - "loss": 0.7119, - "step": 17641 - }, - { - "epoch": 0.45, - "learning_rate": 1.9245346921253228e-06, - "loss": 0.8931, - "step": 17642 - }, - { - "epoch": 0.45, - "learning_rate": 1.924524146619745e-06, - "loss": 1.0254, - "step": 17643 - }, - { - "epoch": 0.45, - "learning_rate": 1.9245136004063015e-06, - "loss": 0.7949, - "step": 17644 - }, - { - "epoch": 0.45, - "learning_rate": 1.924503053485001e-06, - "loss": 1.0488, - "step": 17645 - }, - { - "epoch": 0.45, - "learning_rate": 1.9244925058558503e-06, - "loss": 1.1836, - "step": 17646 - }, - { - "epoch": 0.45, - "learning_rate": 1.9244819575188585e-06, - "loss": 0.8438, - "step": 17647 - }, - { - "epoch": 0.45, - "learning_rate": 1.924471408474033e-06, - "loss": 1.0137, - "step": 17648 - }, - { - "epoch": 0.45, - "learning_rate": 1.924460858721383e-06, - "loss": 0.915, - "step": 17649 - }, - { - "epoch": 0.45, - "learning_rate": 1.924450308260915e-06, - "loss": 1.127, - "step": 17650 - }, - { - "epoch": 0.45, - "learning_rate": 1.9244397570926386e-06, - "loss": 0.8071, - "step": 17651 - }, - { - "epoch": 0.45, - "learning_rate": 1.924429205216561e-06, - "loss": 0.917, - "step": 17652 - }, - { - "epoch": 0.45, - "learning_rate": 1.92441865263269e-06, - "loss": 0.7197, - "step": 17653 - }, - { - "epoch": 0.45, - "learning_rate": 1.924408099341035e-06, - "loss": 0.9482, - "step": 17654 - }, - { - "epoch": 0.45, - "learning_rate": 1.9243975453416025e-06, - "loss": 0.9941, - "step": 17655 - }, - { - "epoch": 0.45, - "learning_rate": 1.9243869906344016e-06, - "loss": 0.9873, - "step": 17656 - }, - { - "epoch": 0.45, - "learning_rate": 1.92437643521944e-06, - "loss": 0.8354, - "step": 17657 - }, - { - "epoch": 0.45, - "learning_rate": 1.924365879096726e-06, - "loss": 0.8984, - "step": 17658 - }, - { - "epoch": 0.45, - "learning_rate": 1.924355322266267e-06, - "loss": 0.7446, - "step": 17659 - }, - { - "epoch": 0.45, - "learning_rate": 1.9243447647280724e-06, - "loss": 0.7876, - "step": 17660 - }, - { - "epoch": 0.45, - "learning_rate": 1.924334206482149e-06, - "loss": 0.8027, - "step": 17661 - }, - { - "epoch": 0.45, - "learning_rate": 1.9243236475285056e-06, - "loss": 0.9668, - "step": 17662 - }, - { - "epoch": 0.45, - "learning_rate": 1.92431308786715e-06, - "loss": 0.7949, - "step": 17663 - }, - { - "epoch": 0.45, - "learning_rate": 1.924302527498091e-06, - "loss": 0.8164, - "step": 17664 - }, - { - "epoch": 0.45, - "learning_rate": 1.924291966421335e-06, - "loss": 1.0557, - "step": 17665 - }, - { - "epoch": 0.45, - "learning_rate": 1.924281404636892e-06, - "loss": 0.5422, - "step": 17666 - }, - { - "epoch": 0.45, - "learning_rate": 1.9242708421447688e-06, - "loss": 0.9434, - "step": 17667 - }, - { - "epoch": 0.45, - "learning_rate": 1.9242602789449737e-06, - "loss": 0.7939, - "step": 17668 - }, - { - "epoch": 0.45, - "learning_rate": 1.9242497150375153e-06, - "loss": 0.7773, - "step": 17669 - }, - { - "epoch": 0.45, - "learning_rate": 1.9242391504224014e-06, - "loss": 0.9629, - "step": 17670 - }, - { - "epoch": 0.45, - "learning_rate": 1.92422858509964e-06, - "loss": 1.0723, - "step": 17671 - }, - { - "epoch": 0.45, - "learning_rate": 1.9242180190692394e-06, - "loss": 0.7261, - "step": 17672 - }, - { - "epoch": 0.45, - "learning_rate": 1.9242074523312073e-06, - "loss": 0.9746, - "step": 17673 - }, - { - "epoch": 0.45, - "learning_rate": 1.9241968848855525e-06, - "loss": 0.8828, - "step": 17674 - }, - { - "epoch": 0.45, - "learning_rate": 1.924186316732282e-06, - "loss": 0.7178, - "step": 17675 - }, - { - "epoch": 0.45, - "learning_rate": 1.924175747871405e-06, - "loss": 0.7227, - "step": 17676 - }, - { - "epoch": 0.45, - "learning_rate": 1.9241651783029293e-06, - "loss": 1.0332, - "step": 17677 - }, - { - "epoch": 0.45, - "learning_rate": 1.9241546080268626e-06, - "loss": 1.0088, - "step": 17678 - }, - { - "epoch": 0.45, - "learning_rate": 1.924144037043213e-06, - "loss": 0.7251, - "step": 17679 - }, - { - "epoch": 0.45, - "learning_rate": 1.9241334653519893e-06, - "loss": 0.957, - "step": 17680 - }, - { - "epoch": 0.45, - "learning_rate": 1.9241228929531983e-06, - "loss": 0.6973, - "step": 17681 - }, - { - "epoch": 0.45, - "learning_rate": 1.92411231984685e-06, - "loss": 0.6899, - "step": 17682 - }, - { - "epoch": 0.45, - "learning_rate": 1.92410174603295e-06, - "loss": 0.8477, - "step": 17683 - }, - { - "epoch": 0.45, - "learning_rate": 1.924091171511509e-06, - "loss": 0.9082, - "step": 17684 - }, - { - "epoch": 0.45, - "learning_rate": 1.924080596282533e-06, - "loss": 0.8936, - "step": 17685 - }, - { - "epoch": 0.45, - "learning_rate": 1.924070020346032e-06, - "loss": 0.7759, - "step": 17686 - }, - { - "epoch": 0.45, - "learning_rate": 1.9240594437020123e-06, - "loss": 0.8364, - "step": 17687 - }, - { - "epoch": 0.45, - "learning_rate": 1.924048866350483e-06, - "loss": 1.0234, - "step": 17688 - }, - { - "epoch": 0.45, - "learning_rate": 1.924038288291452e-06, - "loss": 0.834, - "step": 17689 - }, - { - "epoch": 0.45, - "learning_rate": 1.924027709524927e-06, - "loss": 0.7129, - "step": 17690 - }, - { - "epoch": 0.45, - "learning_rate": 1.9240171300509166e-06, - "loss": 0.8584, - "step": 17691 - }, - { - "epoch": 0.45, - "learning_rate": 1.924006549869429e-06, - "loss": 1.082, - "step": 17692 - }, - { - "epoch": 0.45, - "learning_rate": 1.923995968980472e-06, - "loss": 0.9102, - "step": 17693 - }, - { - "epoch": 0.45, - "learning_rate": 1.923985387384054e-06, - "loss": 0.9199, - "step": 17694 - }, - { - "epoch": 0.45, - "learning_rate": 1.9239748050801824e-06, - "loss": 0.7842, - "step": 17695 - }, - { - "epoch": 0.45, - "learning_rate": 1.923964222068866e-06, - "loss": 1.1025, - "step": 17696 - }, - { - "epoch": 0.45, - "learning_rate": 1.923953638350113e-06, - "loss": 0.8809, - "step": 17697 - }, - { - "epoch": 0.45, - "learning_rate": 1.9239430539239305e-06, - "loss": 0.79, - "step": 17698 - }, - { - "epoch": 0.45, - "learning_rate": 1.923932468790328e-06, - "loss": 0.8799, - "step": 17699 - }, - { - "epoch": 0.45, - "learning_rate": 1.923921882949312e-06, - "loss": 0.9551, - "step": 17700 - }, - { - "epoch": 0.45, - "learning_rate": 1.9239112964008925e-06, - "loss": 0.9336, - "step": 17701 - }, - { - "epoch": 0.45, - "learning_rate": 1.9239007091450762e-06, - "loss": 0.8389, - "step": 17702 - }, - { - "epoch": 0.45, - "learning_rate": 1.9238901211818715e-06, - "loss": 0.8887, - "step": 17703 - }, - { - "epoch": 0.45, - "learning_rate": 1.9238795325112867e-06, - "loss": 0.6611, - "step": 17704 - }, - { - "epoch": 0.45, - "learning_rate": 1.9238689431333298e-06, - "loss": 0.9443, - "step": 17705 - }, - { - "epoch": 0.45, - "learning_rate": 1.923858353048009e-06, - "loss": 0.8298, - "step": 17706 - }, - { - "epoch": 0.45, - "learning_rate": 1.923847762255332e-06, - "loss": 0.9326, - "step": 17707 - }, - { - "epoch": 0.45, - "learning_rate": 1.923837170755308e-06, - "loss": 0.9395, - "step": 17708 - }, - { - "epoch": 0.45, - "learning_rate": 1.9238265785479437e-06, - "loss": 0.8516, - "step": 17709 - }, - { - "epoch": 0.45, - "learning_rate": 1.923815985633248e-06, - "loss": 0.8984, - "step": 17710 - }, - { - "epoch": 0.45, - "learning_rate": 1.923805392011229e-06, - "loss": 0.9336, - "step": 17711 - }, - { - "epoch": 0.45, - "learning_rate": 1.9237947976818947e-06, - "loss": 0.7393, - "step": 17712 - }, - { - "epoch": 0.45, - "learning_rate": 1.923784202645253e-06, - "loss": 0.9932, - "step": 17713 - }, - { - "epoch": 0.45, - "learning_rate": 1.9237736069013124e-06, - "loss": 0.9336, - "step": 17714 - }, - { - "epoch": 0.45, - "learning_rate": 1.9237630104500807e-06, - "loss": 1.0449, - "step": 17715 - }, - { - "epoch": 0.45, - "learning_rate": 1.9237524132915663e-06, - "loss": 0.8394, - "step": 17716 - }, - { - "epoch": 0.45, - "learning_rate": 1.923741815425777e-06, - "loss": 0.8613, - "step": 17717 - }, - { - "epoch": 0.45, - "learning_rate": 1.9237312168527212e-06, - "loss": 0.686, - "step": 17718 - }, - { - "epoch": 0.45, - "learning_rate": 1.9237206175724067e-06, - "loss": 0.8964, - "step": 17719 - }, - { - "epoch": 0.45, - "learning_rate": 1.9237100175848416e-06, - "loss": 0.958, - "step": 17720 - }, - { - "epoch": 0.45, - "learning_rate": 1.9236994168900346e-06, - "loss": 0.9727, - "step": 17721 - }, - { - "epoch": 0.45, - "learning_rate": 1.923688815487993e-06, - "loss": 0.8696, - "step": 17722 - }, - { - "epoch": 0.45, - "learning_rate": 1.923678213378726e-06, - "loss": 0.5708, - "step": 17723 - }, - { - "epoch": 0.45, - "learning_rate": 1.923667610562241e-06, - "loss": 0.9463, - "step": 17724 - }, - { - "epoch": 0.45, - "learning_rate": 1.923657007038546e-06, - "loss": 0.7698, - "step": 17725 - }, - { - "epoch": 0.45, - "learning_rate": 1.923646402807649e-06, - "loss": 0.9131, - "step": 17726 - }, - { - "epoch": 0.45, - "learning_rate": 1.9236357978695588e-06, - "loss": 0.9199, - "step": 17727 - }, - { - "epoch": 0.45, - "learning_rate": 1.923625192224283e-06, - "loss": 0.79, - "step": 17728 - }, - { - "epoch": 0.45, - "learning_rate": 1.92361458587183e-06, - "loss": 0.9302, - "step": 17729 - }, - { - "epoch": 0.45, - "learning_rate": 1.9236039788122075e-06, - "loss": 1.0088, - "step": 17730 - }, - { - "epoch": 0.45, - "learning_rate": 1.923593371045424e-06, - "loss": 0.8535, - "step": 17731 - }, - { - "epoch": 0.45, - "learning_rate": 1.9235827625714872e-06, - "loss": 0.7158, - "step": 17732 - }, - { - "epoch": 0.45, - "learning_rate": 1.923572153390406e-06, - "loss": 0.7861, - "step": 17733 - }, - { - "epoch": 0.45, - "learning_rate": 1.923561543502188e-06, - "loss": 0.8545, - "step": 17734 - }, - { - "epoch": 0.45, - "learning_rate": 1.9235509329068415e-06, - "loss": 0.9131, - "step": 17735 - }, - { - "epoch": 0.45, - "learning_rate": 1.9235403216043744e-06, - "loss": 0.7969, - "step": 17736 - }, - { - "epoch": 0.45, - "learning_rate": 1.923529709594795e-06, - "loss": 0.8691, - "step": 17737 - }, - { - "epoch": 0.45, - "learning_rate": 1.923519096878111e-06, - "loss": 0.8916, - "step": 17738 - }, - { - "epoch": 0.45, - "learning_rate": 1.9235084834543314e-06, - "loss": 0.6855, - "step": 17739 - }, - { - "epoch": 0.45, - "learning_rate": 1.9234978693234638e-06, - "loss": 0.9248, - "step": 17740 - }, - { - "epoch": 0.45, - "learning_rate": 1.923487254485516e-06, - "loss": 0.7871, - "step": 17741 - }, - { - "epoch": 0.45, - "learning_rate": 1.9234766389404963e-06, - "loss": 0.9727, - "step": 17742 - }, - { - "epoch": 0.45, - "learning_rate": 1.923466022688414e-06, - "loss": 0.8643, - "step": 17743 - }, - { - "epoch": 0.45, - "learning_rate": 1.9234554057292753e-06, - "loss": 0.8252, - "step": 17744 - }, - { - "epoch": 0.45, - "learning_rate": 1.9234447880630895e-06, - "loss": 0.875, - "step": 17745 - }, - { - "epoch": 0.45, - "learning_rate": 1.923434169689864e-06, - "loss": 0.9639, - "step": 17746 - }, - { - "epoch": 0.45, - "learning_rate": 1.923423550609608e-06, - "loss": 0.7656, - "step": 17747 - }, - { - "epoch": 0.45, - "learning_rate": 1.9234129308223294e-06, - "loss": 0.8018, - "step": 17748 - }, - { - "epoch": 0.45, - "learning_rate": 1.9234023103280353e-06, - "loss": 0.9385, - "step": 17749 - }, - { - "epoch": 0.45, - "learning_rate": 1.9233916891267347e-06, - "loss": 0.8174, - "step": 17750 - }, - { - "epoch": 0.45, - "learning_rate": 1.9233810672184355e-06, - "loss": 0.7285, - "step": 17751 - }, - { - "epoch": 0.45, - "learning_rate": 1.923370444603146e-06, - "loss": 1.0752, - "step": 17752 - }, - { - "epoch": 0.46, - "learning_rate": 1.9233598212808743e-06, - "loss": 0.5693, - "step": 17753 - }, - { - "epoch": 0.46, - "learning_rate": 1.9233491972516284e-06, - "loss": 0.8916, - "step": 17754 - }, - { - "epoch": 0.46, - "learning_rate": 1.923338572515416e-06, - "loss": 0.918, - "step": 17755 - }, - { - "epoch": 0.46, - "learning_rate": 1.9233279470722465e-06, - "loss": 0.8652, - "step": 17756 - }, - { - "epoch": 0.46, - "learning_rate": 1.9233173209221267e-06, - "loss": 0.8584, - "step": 17757 - }, - { - "epoch": 0.46, - "learning_rate": 1.9233066940650655e-06, - "loss": 0.8496, - "step": 17758 - }, - { - "epoch": 0.46, - "learning_rate": 1.9232960665010706e-06, - "loss": 0.9912, - "step": 17759 - }, - { - "epoch": 0.46, - "learning_rate": 1.9232854382301505e-06, - "loss": 0.9668, - "step": 17760 - }, - { - "epoch": 0.46, - "learning_rate": 1.923274809252313e-06, - "loss": 0.9854, - "step": 17761 - }, - { - "epoch": 0.46, - "learning_rate": 1.9232641795675668e-06, - "loss": 0.7837, - "step": 17762 - }, - { - "epoch": 0.46, - "learning_rate": 1.9232535491759197e-06, - "loss": 0.9136, - "step": 17763 - }, - { - "epoch": 0.46, - "learning_rate": 1.9232429180773795e-06, - "loss": 0.8203, - "step": 17764 - }, - { - "epoch": 0.46, - "learning_rate": 1.9232322862719544e-06, - "loss": 0.9092, - "step": 17765 - }, - { - "epoch": 0.46, - "learning_rate": 1.9232216537596536e-06, - "loss": 0.9248, - "step": 17766 - }, - { - "epoch": 0.46, - "learning_rate": 1.9232110205404835e-06, - "loss": 0.8037, - "step": 17767 - }, - { - "epoch": 0.46, - "learning_rate": 1.923200386614454e-06, - "loss": 0.7695, - "step": 17768 - }, - { - "epoch": 0.46, - "learning_rate": 1.923189751981572e-06, - "loss": 1.0049, - "step": 17769 - }, - { - "epoch": 0.46, - "learning_rate": 1.923179116641846e-06, - "loss": 0.7212, - "step": 17770 - }, - { - "epoch": 0.46, - "learning_rate": 1.9231684805952842e-06, - "loss": 0.9292, - "step": 17771 - }, - { - "epoch": 0.46, - "learning_rate": 1.923157843841895e-06, - "loss": 0.9312, - "step": 17772 - }, - { - "epoch": 0.46, - "learning_rate": 1.9231472063816864e-06, - "loss": 1.0293, - "step": 17773 - }, - { - "epoch": 0.46, - "learning_rate": 1.923136568214666e-06, - "loss": 0.7754, - "step": 17774 - }, - { - "epoch": 0.46, - "learning_rate": 1.9231259293408425e-06, - "loss": 1.0098, - "step": 17775 - }, - { - "epoch": 0.46, - "learning_rate": 1.923115289760224e-06, - "loss": 0.9482, - "step": 17776 - }, - { - "epoch": 0.46, - "learning_rate": 1.9231046494728185e-06, - "loss": 1.0264, - "step": 17777 - }, - { - "epoch": 0.46, - "learning_rate": 1.9230940084786343e-06, - "loss": 1.0088, - "step": 17778 - }, - { - "epoch": 0.46, - "learning_rate": 1.9230833667776794e-06, - "loss": 0.8027, - "step": 17779 - }, - { - "epoch": 0.46, - "learning_rate": 1.923072724369962e-06, - "loss": 0.7998, - "step": 17780 - }, - { - "epoch": 0.46, - "learning_rate": 1.9230620812554904e-06, - "loss": 0.668, - "step": 17781 - }, - { - "epoch": 0.46, - "learning_rate": 1.9230514374342727e-06, - "loss": 0.9355, - "step": 17782 - }, - { - "epoch": 0.46, - "learning_rate": 1.923040792906317e-06, - "loss": 0.9297, - "step": 17783 - }, - { - "epoch": 0.46, - "learning_rate": 1.923030147671631e-06, - "loss": 0.9062, - "step": 17784 - }, - { - "epoch": 0.46, - "learning_rate": 1.9230195017302233e-06, - "loss": 0.8389, - "step": 17785 - }, - { - "epoch": 0.46, - "learning_rate": 1.923008855082102e-06, - "loss": 0.9326, - "step": 17786 - }, - { - "epoch": 0.46, - "learning_rate": 1.9229982077272756e-06, - "loss": 0.9727, - "step": 17787 - }, - { - "epoch": 0.46, - "learning_rate": 1.9229875596657513e-06, - "loss": 0.8242, - "step": 17788 - }, - { - "epoch": 0.46, - "learning_rate": 1.9229769108975385e-06, - "loss": 0.917, - "step": 17789 - }, - { - "epoch": 0.46, - "learning_rate": 1.9229662614226444e-06, - "loss": 0.8613, - "step": 17790 - }, - { - "epoch": 0.46, - "learning_rate": 1.9229556112410775e-06, - "loss": 0.999, - "step": 17791 - }, - { - "epoch": 0.46, - "learning_rate": 1.9229449603528463e-06, - "loss": 0.8711, - "step": 17792 - }, - { - "epoch": 0.46, - "learning_rate": 1.9229343087579583e-06, - "loss": 0.8276, - "step": 17793 - }, - { - "epoch": 0.46, - "learning_rate": 1.9229236564564217e-06, - "loss": 0.6455, - "step": 17794 - }, - { - "epoch": 0.46, - "learning_rate": 1.9229130034482453e-06, - "loss": 0.5942, - "step": 17795 - }, - { - "epoch": 0.46, - "learning_rate": 1.9229023497334363e-06, - "loss": 0.9453, - "step": 17796 - }, - { - "epoch": 0.46, - "learning_rate": 1.922891695312004e-06, - "loss": 0.9189, - "step": 17797 - }, - { - "epoch": 0.46, - "learning_rate": 1.9228810401839557e-06, - "loss": 0.9258, - "step": 17798 - }, - { - "epoch": 0.46, - "learning_rate": 1.9228703843493e-06, - "loss": 0.7012, - "step": 17799 - }, - { - "epoch": 0.46, - "learning_rate": 1.922859727808045e-06, - "loss": 1.1055, - "step": 17800 - }, - { - "epoch": 0.46, - "learning_rate": 1.922849070560198e-06, - "loss": 0.8975, - "step": 17801 - }, - { - "epoch": 0.46, - "learning_rate": 1.9228384126057684e-06, - "loss": 0.813, - "step": 17802 - }, - { - "epoch": 0.46, - "learning_rate": 1.922827753944764e-06, - "loss": 0.7598, - "step": 17803 - }, - { - "epoch": 0.46, - "learning_rate": 1.9228170945771924e-06, - "loss": 1.0078, - "step": 17804 - }, - { - "epoch": 0.46, - "learning_rate": 1.9228064345030625e-06, - "loss": 1.0459, - "step": 17805 - }, - { - "epoch": 0.46, - "learning_rate": 1.922795773722382e-06, - "loss": 0.6577, - "step": 17806 - }, - { - "epoch": 0.46, - "learning_rate": 1.9227851122351595e-06, - "loss": 1.0068, - "step": 17807 - }, - { - "epoch": 0.46, - "learning_rate": 1.922774450041403e-06, - "loss": 0.7637, - "step": 17808 - }, - { - "epoch": 0.46, - "learning_rate": 1.92276378714112e-06, - "loss": 0.9229, - "step": 17809 - }, - { - "epoch": 0.46, - "learning_rate": 1.9227531235343193e-06, - "loss": 0.7461, - "step": 17810 - }, - { - "epoch": 0.46, - "learning_rate": 1.922742459221009e-06, - "loss": 0.9609, - "step": 17811 - }, - { - "epoch": 0.46, - "learning_rate": 1.922731794201197e-06, - "loss": 1.0889, - "step": 17812 - }, - { - "epoch": 0.46, - "learning_rate": 1.9227211284748922e-06, - "loss": 0.6934, - "step": 17813 - }, - { - "epoch": 0.46, - "learning_rate": 1.922710462042102e-06, - "loss": 0.9971, - "step": 17814 - }, - { - "epoch": 0.46, - "learning_rate": 1.9226997949028348e-06, - "loss": 0.7412, - "step": 17815 - }, - { - "epoch": 0.46, - "learning_rate": 1.922689127057099e-06, - "loss": 0.5884, - "step": 17816 - }, - { - "epoch": 0.46, - "learning_rate": 1.922678458504902e-06, - "loss": 1.1123, - "step": 17817 - }, - { - "epoch": 0.46, - "learning_rate": 1.9226677892462534e-06, - "loss": 0.7178, - "step": 17818 - }, - { - "epoch": 0.46, - "learning_rate": 1.92265711928116e-06, - "loss": 0.8604, - "step": 17819 - }, - { - "epoch": 0.46, - "learning_rate": 1.9226464486096307e-06, - "loss": 0.6394, - "step": 17820 - }, - { - "epoch": 0.46, - "learning_rate": 1.922635777231673e-06, - "loss": 0.9512, - "step": 17821 - }, - { - "epoch": 0.46, - "learning_rate": 1.9226251051472956e-06, - "loss": 1.1592, - "step": 17822 - }, - { - "epoch": 0.46, - "learning_rate": 1.922614432356507e-06, - "loss": 0.9663, - "step": 17823 - }, - { - "epoch": 0.46, - "learning_rate": 1.922603758859315e-06, - "loss": 1.0156, - "step": 17824 - }, - { - "epoch": 0.46, - "learning_rate": 1.922593084655727e-06, - "loss": 0.6768, - "step": 17825 - }, - { - "epoch": 0.46, - "learning_rate": 1.9225824097457524e-06, - "loss": 0.8057, - "step": 17826 - }, - { - "epoch": 0.46, - "learning_rate": 1.922571734129399e-06, - "loss": 0.8633, - "step": 17827 - }, - { - "epoch": 0.46, - "learning_rate": 1.9225610578066745e-06, - "loss": 1.041, - "step": 17828 - }, - { - "epoch": 0.46, - "learning_rate": 1.9225503807775873e-06, - "loss": 0.7227, - "step": 17829 - }, - { - "epoch": 0.46, - "learning_rate": 1.922539703042146e-06, - "loss": 1.0713, - "step": 17830 - }, - { - "epoch": 0.46, - "learning_rate": 1.9225290246003584e-06, - "loss": 0.9883, - "step": 17831 - }, - { - "epoch": 0.46, - "learning_rate": 1.9225183454522328e-06, - "loss": 0.9287, - "step": 17832 - }, - { - "epoch": 0.46, - "learning_rate": 1.9225076655977774e-06, - "loss": 0.917, - "step": 17833 - }, - { - "epoch": 0.46, - "learning_rate": 1.9224969850370003e-06, - "loss": 0.8418, - "step": 17834 - }, - { - "epoch": 0.46, - "learning_rate": 1.922486303769909e-06, - "loss": 0.8623, - "step": 17835 - }, - { - "epoch": 0.46, - "learning_rate": 1.922475621796513e-06, - "loss": 0.9395, - "step": 17836 - }, - { - "epoch": 0.46, - "learning_rate": 1.92246493911682e-06, - "loss": 0.7476, - "step": 17837 - }, - { - "epoch": 0.46, - "learning_rate": 1.922454255730838e-06, - "loss": 0.7148, - "step": 17838 - }, - { - "epoch": 0.46, - "learning_rate": 1.9224435716385745e-06, - "loss": 0.9131, - "step": 17839 - }, - { - "epoch": 0.46, - "learning_rate": 1.922432886840039e-06, - "loss": 0.8428, - "step": 17840 - }, - { - "epoch": 0.46, - "learning_rate": 1.922422201335239e-06, - "loss": 0.8682, - "step": 17841 - }, - { - "epoch": 0.46, - "learning_rate": 1.9224115151241826e-06, - "loss": 0.9141, - "step": 17842 - }, - { - "epoch": 0.46, - "learning_rate": 1.922400828206878e-06, - "loss": 0.7334, - "step": 17843 - }, - { - "epoch": 0.46, - "learning_rate": 1.9223901405833336e-06, - "loss": 0.5674, - "step": 17844 - }, - { - "epoch": 0.46, - "learning_rate": 1.9223794522535576e-06, - "loss": 0.8926, - "step": 17845 - }, - { - "epoch": 0.46, - "learning_rate": 1.922368763217558e-06, - "loss": 0.8359, - "step": 17846 - }, - { - "epoch": 0.46, - "learning_rate": 1.922358073475343e-06, - "loss": 0.804, - "step": 17847 - }, - { - "epoch": 0.46, - "learning_rate": 1.9223473830269207e-06, - "loss": 0.8457, - "step": 17848 - }, - { - "epoch": 0.46, - "learning_rate": 1.9223366918722995e-06, - "loss": 0.894, - "step": 17849 - }, - { - "epoch": 0.46, - "learning_rate": 1.922326000011488e-06, - "loss": 0.4868, - "step": 17850 - }, - { - "epoch": 0.46, - "learning_rate": 1.922315307444493e-06, - "loss": 0.9277, - "step": 17851 - }, - { - "epoch": 0.46, - "learning_rate": 1.9223046141713245e-06, - "loss": 0.8381, - "step": 17852 - }, - { - "epoch": 0.46, - "learning_rate": 1.922293920191989e-06, - "loss": 0.8291, - "step": 17853 - }, - { - "epoch": 0.46, - "learning_rate": 1.922283225506496e-06, - "loss": 0.7998, - "step": 17854 - }, - { - "epoch": 0.46, - "learning_rate": 1.922272530114853e-06, - "loss": 0.4839, - "step": 17855 - }, - { - "epoch": 0.46, - "learning_rate": 1.922261834017068e-06, - "loss": 0.6177, - "step": 17856 - }, - { - "epoch": 0.46, - "learning_rate": 1.92225113721315e-06, - "loss": 0.8164, - "step": 17857 - }, - { - "epoch": 0.46, - "learning_rate": 1.922240439703106e-06, - "loss": 0.9302, - "step": 17858 - }, - { - "epoch": 0.46, - "learning_rate": 1.922229741486946e-06, - "loss": 0.9531, - "step": 17859 - }, - { - "epoch": 0.46, - "learning_rate": 1.922219042564676e-06, - "loss": 0.8076, - "step": 17860 - }, - { - "epoch": 0.46, - "learning_rate": 1.922208342936306e-06, - "loss": 0.7603, - "step": 17861 - }, - { - "epoch": 0.46, - "learning_rate": 1.922197642601843e-06, - "loss": 0.7583, - "step": 17862 - }, - { - "epoch": 0.46, - "learning_rate": 1.922186941561296e-06, - "loss": 0.9961, - "step": 17863 - }, - { - "epoch": 0.46, - "learning_rate": 1.9221762398146728e-06, - "loss": 0.6353, - "step": 17864 - }, - { - "epoch": 0.46, - "learning_rate": 1.9221655373619815e-06, - "loss": 0.7529, - "step": 17865 - }, - { - "epoch": 0.46, - "learning_rate": 1.9221548342032306e-06, - "loss": 0.874, - "step": 17866 - }, - { - "epoch": 0.46, - "learning_rate": 1.922144130338428e-06, - "loss": 1.0264, - "step": 17867 - }, - { - "epoch": 0.46, - "learning_rate": 1.922133425767582e-06, - "loss": 0.873, - "step": 17868 - }, - { - "epoch": 0.46, - "learning_rate": 1.922122720490701e-06, - "loss": 0.9092, - "step": 17869 - }, - { - "epoch": 0.46, - "learning_rate": 1.9221120145077932e-06, - "loss": 0.7852, - "step": 17870 - }, - { - "epoch": 0.46, - "learning_rate": 1.9221013078188665e-06, - "loss": 0.9854, - "step": 17871 - }, - { - "epoch": 0.46, - "learning_rate": 1.922090600423929e-06, - "loss": 0.9375, - "step": 17872 - }, - { - "epoch": 0.46, - "learning_rate": 1.9220798923229894e-06, - "loss": 0.6914, - "step": 17873 - }, - { - "epoch": 0.46, - "learning_rate": 1.9220691835160556e-06, - "loss": 0.7988, - "step": 17874 - }, - { - "epoch": 0.46, - "learning_rate": 1.9220584740031354e-06, - "loss": 0.8716, - "step": 17875 - }, - { - "epoch": 0.46, - "learning_rate": 1.922047763784238e-06, - "loss": 0.6807, - "step": 17876 - }, - { - "epoch": 0.46, - "learning_rate": 1.922037052859371e-06, - "loss": 0.8428, - "step": 17877 - }, - { - "epoch": 0.46, - "learning_rate": 1.9220263412285423e-06, - "loss": 0.8789, - "step": 17878 - }, - { - "epoch": 0.46, - "learning_rate": 1.9220156288917604e-06, - "loss": 0.5867, - "step": 17879 - }, - { - "epoch": 0.46, - "learning_rate": 1.9220049158490338e-06, - "loss": 1.2812, - "step": 17880 - }, - { - "epoch": 0.46, - "learning_rate": 1.9219942021003704e-06, - "loss": 0.7129, - "step": 17881 - }, - { - "epoch": 0.46, - "learning_rate": 1.9219834876457782e-06, - "loss": 0.835, - "step": 17882 - }, - { - "epoch": 0.46, - "learning_rate": 1.9219727724852655e-06, - "loss": 0.8784, - "step": 17883 - }, - { - "epoch": 0.46, - "learning_rate": 1.9219620566188414e-06, - "loss": 0.9946, - "step": 17884 - }, - { - "epoch": 0.46, - "learning_rate": 1.9219513400465128e-06, - "loss": 0.832, - "step": 17885 - }, - { - "epoch": 0.46, - "learning_rate": 1.9219406227682885e-06, - "loss": 0.8672, - "step": 17886 - }, - { - "epoch": 0.46, - "learning_rate": 1.9219299047841766e-06, - "loss": 1.0283, - "step": 17887 - }, - { - "epoch": 0.46, - "learning_rate": 1.9219191860941855e-06, - "loss": 1.0391, - "step": 17888 - }, - { - "epoch": 0.46, - "learning_rate": 1.9219084666983234e-06, - "loss": 0.7241, - "step": 17889 - }, - { - "epoch": 0.46, - "learning_rate": 1.9218977465965978e-06, - "loss": 0.6748, - "step": 17890 - }, - { - "epoch": 0.46, - "learning_rate": 1.921887025789018e-06, - "loss": 0.8057, - "step": 17891 - }, - { - "epoch": 0.46, - "learning_rate": 1.9218763042755913e-06, - "loss": 0.8784, - "step": 17892 - }, - { - "epoch": 0.46, - "learning_rate": 1.921865582056327e-06, - "loss": 0.9736, - "step": 17893 - }, - { - "epoch": 0.46, - "learning_rate": 1.921854859131232e-06, - "loss": 0.7461, - "step": 17894 - }, - { - "epoch": 0.46, - "learning_rate": 1.9218441355003153e-06, - "loss": 0.9473, - "step": 17895 - }, - { - "epoch": 0.46, - "learning_rate": 1.9218334111635847e-06, - "loss": 0.8496, - "step": 17896 - }, - { - "epoch": 0.46, - "learning_rate": 1.921822686121049e-06, - "loss": 0.7612, - "step": 17897 - }, - { - "epoch": 0.46, - "learning_rate": 1.9218119603727162e-06, - "loss": 1.0234, - "step": 17898 - }, - { - "epoch": 0.46, - "learning_rate": 1.921801233918594e-06, - "loss": 0.7891, - "step": 17899 - }, - { - "epoch": 0.46, - "learning_rate": 1.921790506758691e-06, - "loss": 0.7344, - "step": 17900 - }, - { - "epoch": 0.46, - "learning_rate": 1.9217797788930155e-06, - "loss": 0.8232, - "step": 17901 - }, - { - "epoch": 0.46, - "learning_rate": 1.9217690503215753e-06, - "loss": 0.8193, - "step": 17902 - }, - { - "epoch": 0.46, - "learning_rate": 1.9217583210443793e-06, - "loss": 0.9199, - "step": 17903 - }, - { - "epoch": 0.46, - "learning_rate": 1.9217475910614354e-06, - "loss": 0.9092, - "step": 17904 - }, - { - "epoch": 0.46, - "learning_rate": 1.9217368603727517e-06, - "loss": 0.7812, - "step": 17905 - }, - { - "epoch": 0.46, - "learning_rate": 1.9217261289783363e-06, - "loss": 0.9688, - "step": 17906 - }, - { - "epoch": 0.46, - "learning_rate": 1.9217153968781975e-06, - "loss": 1.0146, - "step": 17907 - }, - { - "epoch": 0.46, - "learning_rate": 1.921704664072344e-06, - "loss": 0.9336, - "step": 17908 - }, - { - "epoch": 0.46, - "learning_rate": 1.921693930560783e-06, - "loss": 0.9316, - "step": 17909 - }, - { - "epoch": 0.46, - "learning_rate": 1.921683196343524e-06, - "loss": 0.6094, - "step": 17910 - }, - { - "epoch": 0.46, - "learning_rate": 1.921672461420574e-06, - "loss": 0.6768, - "step": 17911 - }, - { - "epoch": 0.46, - "learning_rate": 1.9216617257919425e-06, - "loss": 1.0186, - "step": 17912 - }, - { - "epoch": 0.46, - "learning_rate": 1.9216509894576364e-06, - "loss": 0.7778, - "step": 17913 - }, - { - "epoch": 0.46, - "learning_rate": 1.9216402524176646e-06, - "loss": 0.9268, - "step": 17914 - }, - { - "epoch": 0.46, - "learning_rate": 1.9216295146720356e-06, - "loss": 0.7803, - "step": 17915 - }, - { - "epoch": 0.46, - "learning_rate": 1.9216187762207566e-06, - "loss": 0.7578, - "step": 17916 - }, - { - "epoch": 0.46, - "learning_rate": 1.921608037063837e-06, - "loss": 0.8315, - "step": 17917 - }, - { - "epoch": 0.46, - "learning_rate": 1.921597297201284e-06, - "loss": 0.9023, - "step": 17918 - }, - { - "epoch": 0.46, - "learning_rate": 1.921586556633107e-06, - "loss": 0.8799, - "step": 17919 - }, - { - "epoch": 0.46, - "learning_rate": 1.921575815359313e-06, - "loss": 0.9307, - "step": 17920 - }, - { - "epoch": 0.46, - "learning_rate": 1.921565073379911e-06, - "loss": 0.7178, - "step": 17921 - }, - { - "epoch": 0.46, - "learning_rate": 1.9215543306949093e-06, - "loss": 0.7329, - "step": 17922 - }, - { - "epoch": 0.46, - "learning_rate": 1.921543587304315e-06, - "loss": 0.9219, - "step": 17923 - }, - { - "epoch": 0.46, - "learning_rate": 1.921532843208138e-06, - "loss": 0.7529, - "step": 17924 - }, - { - "epoch": 0.46, - "learning_rate": 1.9215220984063853e-06, - "loss": 1.1182, - "step": 17925 - }, - { - "epoch": 0.46, - "learning_rate": 1.9215113528990656e-06, - "loss": 1.0303, - "step": 17926 - }, - { - "epoch": 0.46, - "learning_rate": 1.921500606686187e-06, - "loss": 0.9229, - "step": 17927 - }, - { - "epoch": 0.46, - "learning_rate": 1.9214898597677578e-06, - "loss": 1.0068, - "step": 17928 - }, - { - "epoch": 0.46, - "learning_rate": 1.9214791121437857e-06, - "loss": 1.1543, - "step": 17929 - }, - { - "epoch": 0.46, - "learning_rate": 1.9214683638142797e-06, - "loss": 0.7188, - "step": 17930 - }, - { - "epoch": 0.46, - "learning_rate": 1.921457614779248e-06, - "loss": 0.9385, - "step": 17931 - }, - { - "epoch": 0.46, - "learning_rate": 1.9214468650386984e-06, - "loss": 0.7773, - "step": 17932 - }, - { - "epoch": 0.46, - "learning_rate": 1.9214361145926396e-06, - "loss": 0.8721, - "step": 17933 - }, - { - "epoch": 0.46, - "learning_rate": 1.921425363441079e-06, - "loss": 1.0264, - "step": 17934 - }, - { - "epoch": 0.46, - "learning_rate": 1.921414611584026e-06, - "loss": 0.9775, - "step": 17935 - }, - { - "epoch": 0.46, - "learning_rate": 1.9214038590214876e-06, - "loss": 0.8486, - "step": 17936 - }, - { - "epoch": 0.46, - "learning_rate": 1.921393105753473e-06, - "loss": 0.96, - "step": 17937 - }, - { - "epoch": 0.46, - "learning_rate": 1.92138235177999e-06, - "loss": 1.0889, - "step": 17938 - }, - { - "epoch": 0.46, - "learning_rate": 1.9213715971010465e-06, - "loss": 0.896, - "step": 17939 - }, - { - "epoch": 0.46, - "learning_rate": 1.9213608417166518e-06, - "loss": 0.9111, - "step": 17940 - }, - { - "epoch": 0.46, - "learning_rate": 1.921350085626813e-06, - "loss": 0.8076, - "step": 17941 - }, - { - "epoch": 0.46, - "learning_rate": 1.921339328831539e-06, - "loss": 0.6953, - "step": 17942 - }, - { - "epoch": 0.46, - "learning_rate": 1.9213285713308376e-06, - "loss": 0.9531, - "step": 17943 - }, - { - "epoch": 0.46, - "learning_rate": 1.921317813124718e-06, - "loss": 0.7686, - "step": 17944 - }, - { - "epoch": 0.46, - "learning_rate": 1.921307054213187e-06, - "loss": 0.8135, - "step": 17945 - }, - { - "epoch": 0.46, - "learning_rate": 1.921296294596253e-06, - "loss": 1.0635, - "step": 17946 - }, - { - "epoch": 0.46, - "learning_rate": 1.921285534273926e-06, - "loss": 0.707, - "step": 17947 - }, - { - "epoch": 0.46, - "learning_rate": 1.9212747732462126e-06, - "loss": 0.7666, - "step": 17948 - }, - { - "epoch": 0.46, - "learning_rate": 1.9212640115131213e-06, - "loss": 0.8721, - "step": 17949 - }, - { - "epoch": 0.46, - "learning_rate": 1.9212532490746607e-06, - "loss": 0.8267, - "step": 17950 - }, - { - "epoch": 0.46, - "learning_rate": 1.9212424859308386e-06, - "loss": 0.9121, - "step": 17951 - }, - { - "epoch": 0.46, - "learning_rate": 1.9212317220816637e-06, - "loss": 0.7871, - "step": 17952 - }, - { - "epoch": 0.46, - "learning_rate": 1.921220957527144e-06, - "loss": 0.7812, - "step": 17953 - }, - { - "epoch": 0.46, - "learning_rate": 1.921210192267288e-06, - "loss": 1.0391, - "step": 17954 - }, - { - "epoch": 0.46, - "learning_rate": 1.9211994263021034e-06, - "loss": 1.0596, - "step": 17955 - }, - { - "epoch": 0.46, - "learning_rate": 1.9211886596315986e-06, - "loss": 0.9922, - "step": 17956 - }, - { - "epoch": 0.46, - "learning_rate": 1.9211778922557825e-06, - "loss": 1.1035, - "step": 17957 - }, - { - "epoch": 0.46, - "learning_rate": 1.9211671241746625e-06, - "loss": 0.9482, - "step": 17958 - }, - { - "epoch": 0.46, - "learning_rate": 1.921156355388247e-06, - "loss": 0.7764, - "step": 17959 - }, - { - "epoch": 0.46, - "learning_rate": 1.921145585896545e-06, - "loss": 0.9512, - "step": 17960 - }, - { - "epoch": 0.46, - "learning_rate": 1.9211348156995636e-06, - "loss": 0.8555, - "step": 17961 - }, - { - "epoch": 0.46, - "learning_rate": 1.921124044797312e-06, - "loss": 0.917, - "step": 17962 - }, - { - "epoch": 0.46, - "learning_rate": 1.921113273189798e-06, - "loss": 1.0039, - "step": 17963 - }, - { - "epoch": 0.46, - "learning_rate": 1.9211025008770296e-06, - "loss": 0.9365, - "step": 17964 - }, - { - "epoch": 0.46, - "learning_rate": 1.921091727859016e-06, - "loss": 1.04, - "step": 17965 - }, - { - "epoch": 0.46, - "learning_rate": 1.9210809541357644e-06, - "loss": 0.6895, - "step": 17966 - }, - { - "epoch": 0.46, - "learning_rate": 1.9210701797072836e-06, - "loss": 0.9336, - "step": 17967 - }, - { - "epoch": 0.46, - "learning_rate": 1.9210594045735817e-06, - "loss": 0.9414, - "step": 17968 - }, - { - "epoch": 0.46, - "learning_rate": 1.921048628734667e-06, - "loss": 0.6982, - "step": 17969 - }, - { - "epoch": 0.46, - "learning_rate": 1.9210378521905477e-06, - "loss": 0.8975, - "step": 17970 - }, - { - "epoch": 0.46, - "learning_rate": 1.921027074941232e-06, - "loss": 0.9062, - "step": 17971 - }, - { - "epoch": 0.46, - "learning_rate": 1.9210162969867283e-06, - "loss": 0.9941, - "step": 17972 - }, - { - "epoch": 0.46, - "learning_rate": 1.9210055183270447e-06, - "loss": 0.8828, - "step": 17973 - }, - { - "epoch": 0.46, - "learning_rate": 1.9209947389621893e-06, - "loss": 0.9824, - "step": 17974 - }, - { - "epoch": 0.46, - "learning_rate": 1.920983958892171e-06, - "loss": 1.0752, - "step": 17975 - }, - { - "epoch": 0.46, - "learning_rate": 1.9209731781169975e-06, - "loss": 0.9727, - "step": 17976 - }, - { - "epoch": 0.46, - "learning_rate": 1.920962396636677e-06, - "loss": 0.9805, - "step": 17977 - }, - { - "epoch": 0.46, - "learning_rate": 1.9209516144512178e-06, - "loss": 0.918, - "step": 17978 - }, - { - "epoch": 0.46, - "learning_rate": 1.9209408315606288e-06, - "loss": 1.0508, - "step": 17979 - }, - { - "epoch": 0.46, - "learning_rate": 1.9209300479649174e-06, - "loss": 0.9424, - "step": 17980 - }, - { - "epoch": 0.46, - "learning_rate": 1.9209192636640923e-06, - "loss": 0.8354, - "step": 17981 - }, - { - "epoch": 0.46, - "learning_rate": 1.9209084786581617e-06, - "loss": 1.168, - "step": 17982 - }, - { - "epoch": 0.46, - "learning_rate": 1.920897692947134e-06, - "loss": 0.9453, - "step": 17983 - }, - { - "epoch": 0.46, - "learning_rate": 1.920886906531017e-06, - "loss": 0.9307, - "step": 17984 - }, - { - "epoch": 0.46, - "learning_rate": 1.9208761194098195e-06, - "loss": 0.9746, - "step": 17985 - }, - { - "epoch": 0.46, - "learning_rate": 1.920865331583549e-06, - "loss": 0.9443, - "step": 17986 - }, - { - "epoch": 0.46, - "learning_rate": 1.9208545430522146e-06, - "loss": 0.8438, - "step": 17987 - }, - { - "epoch": 0.46, - "learning_rate": 1.9208437538158245e-06, - "loss": 0.6436, - "step": 17988 - }, - { - "epoch": 0.46, - "learning_rate": 1.9208329638743863e-06, - "loss": 0.8501, - "step": 17989 - }, - { - "epoch": 0.46, - "learning_rate": 1.9208221732279088e-06, - "loss": 0.7871, - "step": 17990 - }, - { - "epoch": 0.46, - "learning_rate": 1.9208113818764e-06, - "loss": 0.7715, - "step": 17991 - }, - { - "epoch": 0.46, - "learning_rate": 1.920800589819868e-06, - "loss": 0.877, - "step": 17992 - }, - { - "epoch": 0.46, - "learning_rate": 1.9207897970583216e-06, - "loss": 0.6084, - "step": 17993 - }, - { - "epoch": 0.46, - "learning_rate": 1.9207790035917686e-06, - "loss": 0.9912, - "step": 17994 - }, - { - "epoch": 0.46, - "learning_rate": 1.920768209420218e-06, - "loss": 0.8799, - "step": 17995 - }, - { - "epoch": 0.46, - "learning_rate": 1.920757414543677e-06, - "loss": 1.0625, - "step": 17996 - }, - { - "epoch": 0.46, - "learning_rate": 1.9207466189621545e-06, - "loss": 0.918, - "step": 17997 - }, - { - "epoch": 0.46, - "learning_rate": 1.920735822675659e-06, - "loss": 0.8604, - "step": 17998 - }, - { - "epoch": 0.46, - "learning_rate": 1.920725025684198e-06, - "loss": 1.0801, - "step": 17999 - }, - { - "epoch": 0.46, - "learning_rate": 1.9207142279877803e-06, - "loss": 0.8091, - "step": 18000 - }, - { - "epoch": 0.46, - "learning_rate": 1.9207034295864138e-06, - "loss": 0.9189, - "step": 18001 - }, - { - "epoch": 0.46, - "learning_rate": 1.9206926304801074e-06, - "loss": 1.0498, - "step": 18002 - }, - { - "epoch": 0.46, - "learning_rate": 1.920681830668869e-06, - "loss": 0.957, - "step": 18003 - }, - { - "epoch": 0.46, - "learning_rate": 1.9206710301527067e-06, - "loss": 0.9541, - "step": 18004 - }, - { - "epoch": 0.46, - "learning_rate": 1.920660228931629e-06, - "loss": 0.957, - "step": 18005 - }, - { - "epoch": 0.46, - "learning_rate": 1.9206494270056443e-06, - "loss": 0.8755, - "step": 18006 - }, - { - "epoch": 0.46, - "learning_rate": 1.92063862437476e-06, - "loss": 0.8989, - "step": 18007 - }, - { - "epoch": 0.46, - "learning_rate": 1.920627821038986e-06, - "loss": 0.791, - "step": 18008 - }, - { - "epoch": 0.46, - "learning_rate": 1.9206170169983285e-06, - "loss": 0.8965, - "step": 18009 - }, - { - "epoch": 0.46, - "learning_rate": 1.920606212252798e-06, - "loss": 0.8052, - "step": 18010 - }, - { - "epoch": 0.46, - "learning_rate": 1.9205954068024006e-06, - "loss": 0.9561, - "step": 18011 - }, - { - "epoch": 0.46, - "learning_rate": 1.9205846006471466e-06, - "loss": 0.8145, - "step": 18012 - }, - { - "epoch": 0.46, - "learning_rate": 1.9205737937870427e-06, - "loss": 0.8086, - "step": 18013 - }, - { - "epoch": 0.46, - "learning_rate": 1.9205629862220976e-06, - "loss": 1.0625, - "step": 18014 - }, - { - "epoch": 0.46, - "learning_rate": 1.9205521779523203e-06, - "loss": 0.8167, - "step": 18015 - }, - { - "epoch": 0.46, - "learning_rate": 1.920541368977718e-06, - "loss": 0.9424, - "step": 18016 - }, - { - "epoch": 0.46, - "learning_rate": 1.9205305592982997e-06, - "loss": 0.8125, - "step": 18017 - }, - { - "epoch": 0.46, - "learning_rate": 1.920519748914074e-06, - "loss": 1.1064, - "step": 18018 - }, - { - "epoch": 0.46, - "learning_rate": 1.920508937825048e-06, - "loss": 1.0264, - "step": 18019 - }, - { - "epoch": 0.46, - "learning_rate": 1.920498126031231e-06, - "loss": 0.9482, - "step": 18020 - }, - { - "epoch": 0.46, - "learning_rate": 1.9204873135326305e-06, - "loss": 0.8828, - "step": 18021 - }, - { - "epoch": 0.46, - "learning_rate": 1.9204765003292556e-06, - "loss": 0.6924, - "step": 18022 - }, - { - "epoch": 0.46, - "learning_rate": 1.9204656864211138e-06, - "loss": 0.8149, - "step": 18023 - }, - { - "epoch": 0.46, - "learning_rate": 1.9204548718082142e-06, - "loss": 0.8389, - "step": 18024 - }, - { - "epoch": 0.46, - "learning_rate": 1.9204440564905642e-06, - "loss": 0.9204, - "step": 18025 - }, - { - "epoch": 0.46, - "learning_rate": 1.920433240468173e-06, - "loss": 0.8403, - "step": 18026 - }, - { - "epoch": 0.46, - "learning_rate": 1.920422423741048e-06, - "loss": 0.6968, - "step": 18027 - }, - { - "epoch": 0.46, - "learning_rate": 1.9204116063091978e-06, - "loss": 0.8701, - "step": 18028 - }, - { - "epoch": 0.46, - "learning_rate": 1.920400788172631e-06, - "loss": 0.7432, - "step": 18029 - }, - { - "epoch": 0.46, - "learning_rate": 1.9203899693313557e-06, - "loss": 0.7373, - "step": 18030 - }, - { - "epoch": 0.46, - "learning_rate": 1.9203791497853795e-06, - "loss": 0.8232, - "step": 18031 - }, - { - "epoch": 0.46, - "learning_rate": 1.920368329534712e-06, - "loss": 1.0059, - "step": 18032 - }, - { - "epoch": 0.46, - "learning_rate": 1.9203575085793607e-06, - "loss": 0.8667, - "step": 18033 - }, - { - "epoch": 0.46, - "learning_rate": 1.9203466869193338e-06, - "loss": 0.9941, - "step": 18034 - }, - { - "epoch": 0.46, - "learning_rate": 1.92033586455464e-06, - "loss": 0.8628, - "step": 18035 - }, - { - "epoch": 0.46, - "learning_rate": 1.920325041485287e-06, - "loss": 0.8604, - "step": 18036 - }, - { - "epoch": 0.46, - "learning_rate": 1.9203142177112835e-06, - "loss": 0.8555, - "step": 18037 - }, - { - "epoch": 0.46, - "learning_rate": 1.9203033932326376e-06, - "loss": 0.8936, - "step": 18038 - }, - { - "epoch": 0.46, - "learning_rate": 1.920292568049358e-06, - "loss": 1.0781, - "step": 18039 - }, - { - "epoch": 0.46, - "learning_rate": 1.9202817421614526e-06, - "loss": 0.6851, - "step": 18040 - }, - { - "epoch": 0.46, - "learning_rate": 1.9202709155689297e-06, - "loss": 0.9004, - "step": 18041 - }, - { - "epoch": 0.46, - "learning_rate": 1.920260088271798e-06, - "loss": 0.7998, - "step": 18042 - }, - { - "epoch": 0.46, - "learning_rate": 1.9202492602700653e-06, - "loss": 0.6418, - "step": 18043 - }, - { - "epoch": 0.46, - "learning_rate": 1.92023843156374e-06, - "loss": 1.0059, - "step": 18044 - }, - { - "epoch": 0.46, - "learning_rate": 1.9202276021528304e-06, - "loss": 0.9004, - "step": 18045 - }, - { - "epoch": 0.46, - "learning_rate": 1.920216772037345e-06, - "loss": 0.8545, - "step": 18046 - }, - { - "epoch": 0.46, - "learning_rate": 1.9202059412172916e-06, - "loss": 0.8008, - "step": 18047 - }, - { - "epoch": 0.46, - "learning_rate": 1.9201951096926788e-06, - "loss": 0.9258, - "step": 18048 - }, - { - "epoch": 0.46, - "learning_rate": 1.9201842774635154e-06, - "loss": 0.9922, - "step": 18049 - }, - { - "epoch": 0.46, - "learning_rate": 1.920173444529809e-06, - "loss": 0.9492, - "step": 18050 - }, - { - "epoch": 0.46, - "learning_rate": 1.9201626108915678e-06, - "loss": 0.8604, - "step": 18051 - }, - { - "epoch": 0.46, - "learning_rate": 1.920151776548801e-06, - "loss": 0.7856, - "step": 18052 - }, - { - "epoch": 0.46, - "learning_rate": 1.9201409415015157e-06, - "loss": 0.7314, - "step": 18053 - }, - { - "epoch": 0.46, - "learning_rate": 1.920130105749721e-06, - "loss": 1.1504, - "step": 18054 - }, - { - "epoch": 0.46, - "learning_rate": 1.9201192692934253e-06, - "loss": 0.9648, - "step": 18055 - }, - { - "epoch": 0.46, - "learning_rate": 1.920108432132636e-06, - "loss": 1.0, - "step": 18056 - }, - { - "epoch": 0.46, - "learning_rate": 1.9200975942673626e-06, - "loss": 1.0254, - "step": 18057 - }, - { - "epoch": 0.46, - "learning_rate": 1.9200867556976125e-06, - "loss": 0.7715, - "step": 18058 - }, - { - "epoch": 0.46, - "learning_rate": 1.920075916423394e-06, - "loss": 0.9912, - "step": 18059 - }, - { - "epoch": 0.46, - "learning_rate": 1.920065076444716e-06, - "loss": 0.8345, - "step": 18060 - }, - { - "epoch": 0.46, - "learning_rate": 1.9200542357615865e-06, - "loss": 0.998, - "step": 18061 - }, - { - "epoch": 0.46, - "learning_rate": 1.9200433943740137e-06, - "loss": 0.7622, - "step": 18062 - }, - { - "epoch": 0.46, - "learning_rate": 1.920032552282006e-06, - "loss": 1.0889, - "step": 18063 - }, - { - "epoch": 0.46, - "learning_rate": 1.9200217094855715e-06, - "loss": 0.9834, - "step": 18064 - }, - { - "epoch": 0.46, - "learning_rate": 1.9200108659847187e-06, - "loss": 0.7939, - "step": 18065 - }, - { - "epoch": 0.46, - "learning_rate": 1.9200000217794565e-06, - "loss": 0.8271, - "step": 18066 - }, - { - "epoch": 0.46, - "learning_rate": 1.919989176869792e-06, - "loss": 0.8965, - "step": 18067 - }, - { - "epoch": 0.46, - "learning_rate": 1.9199783312557338e-06, - "loss": 0.7998, - "step": 18068 - }, - { - "epoch": 0.46, - "learning_rate": 1.9199674849372907e-06, - "loss": 0.77, - "step": 18069 - }, - { - "epoch": 0.46, - "learning_rate": 1.9199566379144716e-06, - "loss": 0.8633, - "step": 18070 - }, - { - "epoch": 0.46, - "learning_rate": 1.9199457901872827e-06, - "loss": 0.751, - "step": 18071 - }, - { - "epoch": 0.46, - "learning_rate": 1.9199349417557347e-06, - "loss": 0.9814, - "step": 18072 - }, - { - "epoch": 0.46, - "learning_rate": 1.9199240926198343e-06, - "loss": 1.0352, - "step": 18073 - }, - { - "epoch": 0.46, - "learning_rate": 1.9199132427795905e-06, - "loss": 0.8232, - "step": 18074 - }, - { - "epoch": 0.46, - "learning_rate": 1.9199023922350112e-06, - "loss": 0.7676, - "step": 18075 - }, - { - "epoch": 0.46, - "learning_rate": 1.919891540986105e-06, - "loss": 0.9458, - "step": 18076 - }, - { - "epoch": 0.46, - "learning_rate": 1.9198806890328803e-06, - "loss": 0.8086, - "step": 18077 - }, - { - "epoch": 0.46, - "learning_rate": 1.919869836375345e-06, - "loss": 0.7266, - "step": 18078 - }, - { - "epoch": 0.46, - "learning_rate": 1.919858983013508e-06, - "loss": 0.7803, - "step": 18079 - }, - { - "epoch": 0.46, - "learning_rate": 1.919848128947377e-06, - "loss": 0.9336, - "step": 18080 - }, - { - "epoch": 0.46, - "learning_rate": 1.919837274176961e-06, - "loss": 0.8052, - "step": 18081 - }, - { - "epoch": 0.46, - "learning_rate": 1.9198264187022675e-06, - "loss": 0.8896, - "step": 18082 - }, - { - "epoch": 0.46, - "learning_rate": 1.9198155625233056e-06, - "loss": 0.9385, - "step": 18083 - }, - { - "epoch": 0.46, - "learning_rate": 1.9198047056400827e-06, - "loss": 0.4043, - "step": 18084 - }, - { - "epoch": 0.46, - "learning_rate": 1.919793848052608e-06, - "loss": 0.9785, - "step": 18085 - }, - { - "epoch": 0.46, - "learning_rate": 1.919782989760889e-06, - "loss": 0.8672, - "step": 18086 - }, - { - "epoch": 0.46, - "learning_rate": 1.919772130764935e-06, - "loss": 0.9609, - "step": 18087 - }, - { - "epoch": 0.46, - "learning_rate": 1.9197612710647536e-06, - "loss": 0.8154, - "step": 18088 - }, - { - "epoch": 0.46, - "learning_rate": 1.919750410660353e-06, - "loss": 0.7236, - "step": 18089 - }, - { - "epoch": 0.46, - "learning_rate": 1.9197395495517422e-06, - "loss": 0.9736, - "step": 18090 - }, - { - "epoch": 0.46, - "learning_rate": 1.9197286877389287e-06, - "loss": 1.0605, - "step": 18091 - }, - { - "epoch": 0.46, - "learning_rate": 1.9197178252219216e-06, - "loss": 0.9023, - "step": 18092 - }, - { - "epoch": 0.46, - "learning_rate": 1.9197069620007285e-06, - "loss": 0.8926, - "step": 18093 - }, - { - "epoch": 0.46, - "learning_rate": 1.9196960980753585e-06, - "loss": 1.0498, - "step": 18094 - }, - { - "epoch": 0.46, - "learning_rate": 1.919685233445819e-06, - "loss": 0.9795, - "step": 18095 - }, - { - "epoch": 0.46, - "learning_rate": 1.9196743681121194e-06, - "loss": 0.835, - "step": 18096 - }, - { - "epoch": 0.46, - "learning_rate": 1.919663502074267e-06, - "loss": 0.7163, - "step": 18097 - }, - { - "epoch": 0.46, - "learning_rate": 1.9196526353322705e-06, - "loss": 0.8447, - "step": 18098 - }, - { - "epoch": 0.46, - "learning_rate": 1.9196417678861386e-06, - "loss": 0.7607, - "step": 18099 - }, - { - "epoch": 0.46, - "learning_rate": 1.9196308997358787e-06, - "loss": 0.9038, - "step": 18100 - }, - { - "epoch": 0.46, - "learning_rate": 1.9196200308815007e-06, - "loss": 0.748, - "step": 18101 - }, - { - "epoch": 0.46, - "learning_rate": 1.919609161323011e-06, - "loss": 0.8188, - "step": 18102 - }, - { - "epoch": 0.46, - "learning_rate": 1.9195982910604193e-06, - "loss": 0.7031, - "step": 18103 - }, - { - "epoch": 0.46, - "learning_rate": 1.919587420093733e-06, - "loss": 1.1514, - "step": 18104 - }, - { - "epoch": 0.46, - "learning_rate": 1.9195765484229615e-06, - "loss": 0.9282, - "step": 18105 - }, - { - "epoch": 0.46, - "learning_rate": 1.919565676048112e-06, - "loss": 1.0361, - "step": 18106 - }, - { - "epoch": 0.46, - "learning_rate": 1.919554802969194e-06, - "loss": 0.8818, - "step": 18107 - }, - { - "epoch": 0.46, - "learning_rate": 1.9195439291862147e-06, - "loss": 0.6851, - "step": 18108 - }, - { - "epoch": 0.46, - "learning_rate": 1.9195330546991828e-06, - "loss": 0.8242, - "step": 18109 - }, - { - "epoch": 0.46, - "learning_rate": 1.9195221795081068e-06, - "loss": 0.9336, - "step": 18110 - }, - { - "epoch": 0.46, - "learning_rate": 1.9195113036129952e-06, - "loss": 1.0312, - "step": 18111 - }, - { - "epoch": 0.46, - "learning_rate": 1.919500427013856e-06, - "loss": 0.8721, - "step": 18112 - }, - { - "epoch": 0.46, - "learning_rate": 1.919489549710697e-06, - "loss": 0.8877, - "step": 18113 - }, - { - "epoch": 0.46, - "learning_rate": 1.919478671703528e-06, - "loss": 0.8887, - "step": 18114 - }, - { - "epoch": 0.46, - "learning_rate": 1.9194677929923563e-06, - "loss": 0.9502, - "step": 18115 - }, - { - "epoch": 0.46, - "learning_rate": 1.91945691357719e-06, - "loss": 1.0898, - "step": 18116 - }, - { - "epoch": 0.46, - "learning_rate": 1.9194460334580384e-06, - "loss": 1.125, - "step": 18117 - }, - { - "epoch": 0.46, - "learning_rate": 1.9194351526349086e-06, - "loss": 0.6616, - "step": 18118 - }, - { - "epoch": 0.46, - "learning_rate": 1.9194242711078098e-06, - "loss": 0.6797, - "step": 18119 - }, - { - "epoch": 0.46, - "learning_rate": 1.9194133888767503e-06, - "loss": 0.7881, - "step": 18120 - }, - { - "epoch": 0.46, - "learning_rate": 1.919402505941738e-06, - "loss": 0.7861, - "step": 18121 - }, - { - "epoch": 0.46, - "learning_rate": 1.9193916223027813e-06, - "loss": 0.7588, - "step": 18122 - }, - { - "epoch": 0.46, - "learning_rate": 1.919380737959889e-06, - "loss": 0.6318, - "step": 18123 - }, - { - "epoch": 0.46, - "learning_rate": 1.9193698529130694e-06, - "loss": 0.7764, - "step": 18124 - }, - { - "epoch": 0.46, - "learning_rate": 1.91935896716233e-06, - "loss": 0.8623, - "step": 18125 - }, - { - "epoch": 0.46, - "learning_rate": 1.9193480807076803e-06, - "loss": 0.7891, - "step": 18126 - }, - { - "epoch": 0.46, - "learning_rate": 1.9193371935491278e-06, - "loss": 0.8447, - "step": 18127 - }, - { - "epoch": 0.46, - "learning_rate": 1.919326305686681e-06, - "loss": 0.8281, - "step": 18128 - }, - { - "epoch": 0.46, - "learning_rate": 1.9193154171203485e-06, - "loss": 0.9473, - "step": 18129 - }, - { - "epoch": 0.46, - "learning_rate": 1.919304527850138e-06, - "loss": 0.8945, - "step": 18130 - }, - { - "epoch": 0.46, - "learning_rate": 1.9192936378760587e-06, - "loss": 0.8037, - "step": 18131 - }, - { - "epoch": 0.46, - "learning_rate": 1.9192827471981187e-06, - "loss": 0.7783, - "step": 18132 - }, - { - "epoch": 0.46, - "learning_rate": 1.919271855816326e-06, - "loss": 0.832, - "step": 18133 - }, - { - "epoch": 0.46, - "learning_rate": 1.919260963730689e-06, - "loss": 0.7368, - "step": 18134 - }, - { - "epoch": 0.46, - "learning_rate": 1.919250070941216e-06, - "loss": 1.042, - "step": 18135 - }, - { - "epoch": 0.46, - "learning_rate": 1.9192391774479156e-06, - "loss": 0.791, - "step": 18136 - }, - { - "epoch": 0.46, - "learning_rate": 1.9192282832507963e-06, - "loss": 0.6897, - "step": 18137 - }, - { - "epoch": 0.46, - "learning_rate": 1.919217388349866e-06, - "loss": 1.0176, - "step": 18138 - }, - { - "epoch": 0.46, - "learning_rate": 1.9192064927451332e-06, - "loss": 0.8208, - "step": 18139 - }, - { - "epoch": 0.46, - "learning_rate": 1.919195596436606e-06, - "loss": 0.918, - "step": 18140 - }, - { - "epoch": 0.46, - "learning_rate": 1.9191846994242935e-06, - "loss": 0.9482, - "step": 18141 - }, - { - "epoch": 0.46, - "learning_rate": 1.919173801708203e-06, - "loss": 0.8218, - "step": 18142 - }, - { - "epoch": 0.47, - "learning_rate": 1.9191629032883436e-06, - "loss": 0.9453, - "step": 18143 - }, - { - "epoch": 0.47, - "learning_rate": 1.9191520041647235e-06, - "loss": 0.8311, - "step": 18144 - }, - { - "epoch": 0.47, - "learning_rate": 1.919141104337351e-06, - "loss": 0.834, - "step": 18145 - }, - { - "epoch": 0.47, - "learning_rate": 1.9191302038062343e-06, - "loss": 0.8672, - "step": 18146 - }, - { - "epoch": 0.47, - "learning_rate": 1.919119302571382e-06, - "loss": 0.9219, - "step": 18147 - }, - { - "epoch": 0.47, - "learning_rate": 1.9191084006328026e-06, - "loss": 0.7891, - "step": 18148 - }, - { - "epoch": 0.47, - "learning_rate": 1.9190974979905035e-06, - "loss": 0.7021, - "step": 18149 - }, - { - "epoch": 0.47, - "learning_rate": 1.919086594644494e-06, - "loss": 0.7549, - "step": 18150 - }, - { - "epoch": 0.47, - "learning_rate": 1.9190756905947824e-06, - "loss": 0.9395, - "step": 18151 - }, - { - "epoch": 0.47, - "learning_rate": 1.9190647858413765e-06, - "loss": 0.8975, - "step": 18152 - }, - { - "epoch": 0.47, - "learning_rate": 1.9190538803842853e-06, - "loss": 1.0527, - "step": 18153 - }, - { - "epoch": 0.47, - "learning_rate": 1.9190429742235163e-06, - "loss": 0.4824, - "step": 18154 - }, - { - "epoch": 0.47, - "learning_rate": 1.9190320673590786e-06, - "loss": 0.9023, - "step": 18155 - }, - { - "epoch": 0.47, - "learning_rate": 1.91902115979098e-06, - "loss": 0.9893, - "step": 18156 - }, - { - "epoch": 0.47, - "learning_rate": 1.9190102515192297e-06, - "loss": 1.0586, - "step": 18157 - }, - { - "epoch": 0.47, - "learning_rate": 1.9189993425438355e-06, - "loss": 0.5879, - "step": 18158 - }, - { - "epoch": 0.47, - "learning_rate": 1.9189884328648055e-06, - "loss": 0.9062, - "step": 18159 - }, - { - "epoch": 0.47, - "learning_rate": 1.9189775224821483e-06, - "loss": 0.7522, - "step": 18160 - }, - { - "epoch": 0.47, - "learning_rate": 1.918966611395872e-06, - "loss": 1.0088, - "step": 18161 - }, - { - "epoch": 0.47, - "learning_rate": 1.9189556996059857e-06, - "loss": 0.7607, - "step": 18162 - }, - { - "epoch": 0.47, - "learning_rate": 1.918944787112497e-06, - "loss": 0.7812, - "step": 18163 - }, - { - "epoch": 0.47, - "learning_rate": 1.9189338739154147e-06, - "loss": 1.0391, - "step": 18164 - }, - { - "epoch": 0.47, - "learning_rate": 1.918922960014747e-06, - "loss": 1.0859, - "step": 18165 - }, - { - "epoch": 0.47, - "learning_rate": 1.918912045410502e-06, - "loss": 0.9688, - "step": 18166 - }, - { - "epoch": 0.47, - "learning_rate": 1.9189011301026884e-06, - "loss": 0.9014, - "step": 18167 - }, - { - "epoch": 0.47, - "learning_rate": 1.9188902140913146e-06, - "loss": 0.832, - "step": 18168 - }, - { - "epoch": 0.47, - "learning_rate": 1.918879297376389e-06, - "loss": 0.6787, - "step": 18169 - }, - { - "epoch": 0.47, - "learning_rate": 1.9188683799579194e-06, - "loss": 0.9648, - "step": 18170 - }, - { - "epoch": 0.47, - "learning_rate": 1.9188574618359145e-06, - "loss": 0.9229, - "step": 18171 - }, - { - "epoch": 0.47, - "learning_rate": 1.918846543010383e-06, - "loss": 0.8262, - "step": 18172 - }, - { - "epoch": 0.47, - "learning_rate": 1.9188356234813327e-06, - "loss": 0.8457, - "step": 18173 - }, - { - "epoch": 0.47, - "learning_rate": 1.9188247032487724e-06, - "loss": 0.9258, - "step": 18174 - }, - { - "epoch": 0.47, - "learning_rate": 1.91881378231271e-06, - "loss": 1.0322, - "step": 18175 - }, - { - "epoch": 0.47, - "learning_rate": 1.9188028606731544e-06, - "loss": 0.9023, - "step": 18176 - }, - { - "epoch": 0.47, - "learning_rate": 1.9187919383301137e-06, - "loss": 0.7905, - "step": 18177 - }, - { - "epoch": 0.47, - "learning_rate": 1.918781015283596e-06, - "loss": 1.0752, - "step": 18178 - }, - { - "epoch": 0.47, - "learning_rate": 1.91877009153361e-06, - "loss": 0.7725, - "step": 18179 - }, - { - "epoch": 0.47, - "learning_rate": 1.918759167080164e-06, - "loss": 0.8281, - "step": 18180 - }, - { - "epoch": 0.47, - "learning_rate": 1.9187482419232667e-06, - "loss": 0.9053, - "step": 18181 - }, - { - "epoch": 0.47, - "learning_rate": 1.918737316062926e-06, - "loss": 0.8877, - "step": 18182 - }, - { - "epoch": 0.47, - "learning_rate": 1.91872638949915e-06, - "loss": 0.9473, - "step": 18183 - }, - { - "epoch": 0.47, - "learning_rate": 1.9187154622319476e-06, - "loss": 0.748, - "step": 18184 - }, - { - "epoch": 0.47, - "learning_rate": 1.918704534261327e-06, - "loss": 0.8975, - "step": 18185 - }, - { - "epoch": 0.47, - "learning_rate": 1.918693605587297e-06, - "loss": 0.8555, - "step": 18186 - }, - { - "epoch": 0.47, - "learning_rate": 1.918682676209865e-06, - "loss": 0.8643, - "step": 18187 - }, - { - "epoch": 0.47, - "learning_rate": 1.91867174612904e-06, - "loss": 0.7354, - "step": 18188 - }, - { - "epoch": 0.47, - "learning_rate": 1.9186608153448303e-06, - "loss": 0.9561, - "step": 18189 - }, - { - "epoch": 0.47, - "learning_rate": 1.9186498838572443e-06, - "loss": 0.9951, - "step": 18190 - }, - { - "epoch": 0.47, - "learning_rate": 1.9186389516662906e-06, - "loss": 0.791, - "step": 18191 - }, - { - "epoch": 0.47, - "learning_rate": 1.9186280187719773e-06, - "loss": 0.8477, - "step": 18192 - }, - { - "epoch": 0.47, - "learning_rate": 1.9186170851743124e-06, - "loss": 1.0078, - "step": 18193 - }, - { - "epoch": 0.47, - "learning_rate": 1.9186061508733047e-06, - "loss": 0.8887, - "step": 18194 - }, - { - "epoch": 0.47, - "learning_rate": 1.9185952158689625e-06, - "loss": 1.0752, - "step": 18195 - }, - { - "epoch": 0.47, - "learning_rate": 1.9185842801612944e-06, - "loss": 0.8555, - "step": 18196 - }, - { - "epoch": 0.47, - "learning_rate": 1.9185733437503083e-06, - "loss": 0.6528, - "step": 18197 - }, - { - "epoch": 0.47, - "learning_rate": 1.9185624066360133e-06, - "loss": 1.0703, - "step": 18198 - }, - { - "epoch": 0.47, - "learning_rate": 1.9185514688184166e-06, - "loss": 0.6582, - "step": 18199 - }, - { - "epoch": 0.47, - "learning_rate": 1.9185405302975277e-06, - "loss": 1.127, - "step": 18200 - }, - { - "epoch": 0.47, - "learning_rate": 1.9185295910733545e-06, - "loss": 0.707, - "step": 18201 - }, - { - "epoch": 0.47, - "learning_rate": 1.9185186511459056e-06, - "loss": 0.8916, - "step": 18202 - }, - { - "epoch": 0.47, - "learning_rate": 1.918507710515189e-06, - "loss": 0.9395, - "step": 18203 - }, - { - "epoch": 0.47, - "learning_rate": 1.9184967691812133e-06, - "loss": 0.957, - "step": 18204 - }, - { - "epoch": 0.47, - "learning_rate": 1.918485827143987e-06, - "loss": 0.895, - "step": 18205 - }, - { - "epoch": 0.47, - "learning_rate": 1.9184748844035183e-06, - "loss": 0.8906, - "step": 18206 - }, - { - "epoch": 0.47, - "learning_rate": 1.9184639409598154e-06, - "loss": 0.7041, - "step": 18207 - }, - { - "epoch": 0.47, - "learning_rate": 1.918452996812887e-06, - "loss": 0.9873, - "step": 18208 - }, - { - "epoch": 0.47, - "learning_rate": 1.9184420519627413e-06, - "loss": 0.8545, - "step": 18209 - }, - { - "epoch": 0.47, - "learning_rate": 1.918431106409387e-06, - "loss": 0.8887, - "step": 18210 - }, - { - "epoch": 0.47, - "learning_rate": 1.918420160152832e-06, - "loss": 0.7197, - "step": 18211 - }, - { - "epoch": 0.47, - "learning_rate": 1.918409213193085e-06, - "loss": 0.7139, - "step": 18212 - }, - { - "epoch": 0.47, - "learning_rate": 1.918398265530154e-06, - "loss": 0.9209, - "step": 18213 - }, - { - "epoch": 0.47, - "learning_rate": 1.918387317164048e-06, - "loss": 0.9512, - "step": 18214 - }, - { - "epoch": 0.47, - "learning_rate": 1.918376368094775e-06, - "loss": 0.813, - "step": 18215 - }, - { - "epoch": 0.47, - "learning_rate": 1.9183654183223433e-06, - "loss": 0.9395, - "step": 18216 - }, - { - "epoch": 0.47, - "learning_rate": 1.9183544678467617e-06, - "loss": 0.915, - "step": 18217 - }, - { - "epoch": 0.47, - "learning_rate": 1.918343516668038e-06, - "loss": 0.8438, - "step": 18218 - }, - { - "epoch": 0.47, - "learning_rate": 1.918332564786181e-06, - "loss": 0.8008, - "step": 18219 - }, - { - "epoch": 0.47, - "learning_rate": 1.9183216122011995e-06, - "loss": 0.8877, - "step": 18220 - }, - { - "epoch": 0.47, - "learning_rate": 1.918310658913101e-06, - "loss": 0.8018, - "step": 18221 - }, - { - "epoch": 0.47, - "learning_rate": 1.918299704921894e-06, - "loss": 0.8457, - "step": 18222 - }, - { - "epoch": 0.47, - "learning_rate": 1.918288750227587e-06, - "loss": 0.7559, - "step": 18223 - }, - { - "epoch": 0.47, - "learning_rate": 1.9182777948301893e-06, - "loss": 0.9258, - "step": 18224 - }, - { - "epoch": 0.47, - "learning_rate": 1.918266838729708e-06, - "loss": 0.8047, - "step": 18225 - }, - { - "epoch": 0.47, - "learning_rate": 1.918255881926152e-06, - "loss": 0.9141, - "step": 18226 - }, - { - "epoch": 0.47, - "learning_rate": 1.91824492441953e-06, - "loss": 0.8594, - "step": 18227 - }, - { - "epoch": 0.47, - "learning_rate": 1.9182339662098497e-06, - "loss": 0.9932, - "step": 18228 - }, - { - "epoch": 0.47, - "learning_rate": 1.91822300729712e-06, - "loss": 1.0078, - "step": 18229 - }, - { - "epoch": 0.47, - "learning_rate": 1.918212047681349e-06, - "loss": 0.8721, - "step": 18230 - }, - { - "epoch": 0.47, - "learning_rate": 1.9182010873625453e-06, - "loss": 0.7783, - "step": 18231 - }, - { - "epoch": 0.47, - "learning_rate": 1.918190126340718e-06, - "loss": 0.9238, - "step": 18232 - }, - { - "epoch": 0.47, - "learning_rate": 1.9181791646158738e-06, - "loss": 1.0703, - "step": 18233 - }, - { - "epoch": 0.47, - "learning_rate": 1.9181682021880224e-06, - "loss": 0.9102, - "step": 18234 - }, - { - "epoch": 0.47, - "learning_rate": 1.9181572390571715e-06, - "loss": 0.9448, - "step": 18235 - }, - { - "epoch": 0.47, - "learning_rate": 1.9181462752233306e-06, - "loss": 0.8643, - "step": 18236 - }, - { - "epoch": 0.47, - "learning_rate": 1.9181353106865065e-06, - "loss": 0.7012, - "step": 18237 - }, - { - "epoch": 0.47, - "learning_rate": 1.9181243454467087e-06, - "loss": 0.8809, - "step": 18238 - }, - { - "epoch": 0.47, - "learning_rate": 1.9181133795039455e-06, - "loss": 0.7749, - "step": 18239 - }, - { - "epoch": 0.47, - "learning_rate": 1.918102412858225e-06, - "loss": 0.8975, - "step": 18240 - }, - { - "epoch": 0.47, - "learning_rate": 1.9180914455095552e-06, - "loss": 0.8857, - "step": 18241 - }, - { - "epoch": 0.47, - "learning_rate": 1.918080477457946e-06, - "loss": 0.9453, - "step": 18242 - }, - { - "epoch": 0.47, - "learning_rate": 1.918069508703404e-06, - "loss": 0.9902, - "step": 18243 - }, - { - "epoch": 0.47, - "learning_rate": 1.9180585392459385e-06, - "loss": 1.0195, - "step": 18244 - }, - { - "epoch": 0.47, - "learning_rate": 1.9180475690855577e-06, - "loss": 0.7627, - "step": 18245 - }, - { - "epoch": 0.47, - "learning_rate": 1.9180365982222704e-06, - "loss": 0.5989, - "step": 18246 - }, - { - "epoch": 0.47, - "learning_rate": 1.9180256266560847e-06, - "loss": 1.0635, - "step": 18247 - }, - { - "epoch": 0.47, - "learning_rate": 1.9180146543870086e-06, - "loss": 0.8486, - "step": 18248 - }, - { - "epoch": 0.47, - "learning_rate": 1.9180036814150514e-06, - "loss": 0.7759, - "step": 18249 - }, - { - "epoch": 0.47, - "learning_rate": 1.917992707740221e-06, - "loss": 0.6924, - "step": 18250 - }, - { - "epoch": 0.47, - "learning_rate": 1.9179817333625252e-06, - "loss": 0.8198, - "step": 18251 - }, - { - "epoch": 0.47, - "learning_rate": 1.9179707582819736e-06, - "loss": 0.832, - "step": 18252 - }, - { - "epoch": 0.47, - "learning_rate": 1.9179597824985734e-06, - "loss": 0.7046, - "step": 18253 - }, - { - "epoch": 0.47, - "learning_rate": 1.917948806012334e-06, - "loss": 0.8818, - "step": 18254 - }, - { - "epoch": 0.47, - "learning_rate": 1.9179378288232634e-06, - "loss": 0.8875, - "step": 18255 - }, - { - "epoch": 0.47, - "learning_rate": 1.91792685093137e-06, - "loss": 0.7412, - "step": 18256 - }, - { - "epoch": 0.47, - "learning_rate": 1.917915872336662e-06, - "loss": 0.9194, - "step": 18257 - }, - { - "epoch": 0.47, - "learning_rate": 1.9179048930391483e-06, - "loss": 0.9668, - "step": 18258 - }, - { - "epoch": 0.47, - "learning_rate": 1.917893913038837e-06, - "loss": 0.7241, - "step": 18259 - }, - { - "epoch": 0.47, - "learning_rate": 1.9178829323357366e-06, - "loss": 0.8408, - "step": 18260 - }, - { - "epoch": 0.47, - "learning_rate": 1.9178719509298554e-06, - "loss": 0.9531, - "step": 18261 - }, - { - "epoch": 0.47, - "learning_rate": 1.9178609688212016e-06, - "loss": 0.9082, - "step": 18262 - }, - { - "epoch": 0.47, - "learning_rate": 1.917849986009784e-06, - "loss": 0.6118, - "step": 18263 - }, - { - "epoch": 0.47, - "learning_rate": 1.917839002495611e-06, - "loss": 0.7261, - "step": 18264 - }, - { - "epoch": 0.47, - "learning_rate": 1.9178280182786906e-06, - "loss": 0.8516, - "step": 18265 - }, - { - "epoch": 0.47, - "learning_rate": 1.917817033359032e-06, - "loss": 1.0205, - "step": 18266 - }, - { - "epoch": 0.47, - "learning_rate": 1.9178060477366426e-06, - "loss": 1.0137, - "step": 18267 - }, - { - "epoch": 0.47, - "learning_rate": 1.9177950614115317e-06, - "loss": 0.8281, - "step": 18268 - }, - { - "epoch": 0.47, - "learning_rate": 1.917784074383707e-06, - "loss": 1.0088, - "step": 18269 - }, - { - "epoch": 0.47, - "learning_rate": 1.9177730866531773e-06, - "loss": 0.7236, - "step": 18270 - }, - { - "epoch": 0.47, - "learning_rate": 1.9177620982199508e-06, - "loss": 0.9336, - "step": 18271 - }, - { - "epoch": 0.47, - "learning_rate": 1.9177511090840363e-06, - "loss": 0.9209, - "step": 18272 - }, - { - "epoch": 0.47, - "learning_rate": 1.917740119245442e-06, - "loss": 0.7881, - "step": 18273 - }, - { - "epoch": 0.47, - "learning_rate": 1.9177291287041763e-06, - "loss": 0.5996, - "step": 18274 - }, - { - "epoch": 0.47, - "learning_rate": 1.9177181374602475e-06, - "loss": 0.9824, - "step": 18275 - }, - { - "epoch": 0.47, - "learning_rate": 1.9177071455136643e-06, - "loss": 0.8223, - "step": 18276 - }, - { - "epoch": 0.47, - "learning_rate": 1.9176961528644347e-06, - "loss": 0.7891, - "step": 18277 - }, - { - "epoch": 0.47, - "learning_rate": 1.9176851595125675e-06, - "loss": 0.8389, - "step": 18278 - }, - { - "epoch": 0.47, - "learning_rate": 1.9176741654580704e-06, - "loss": 0.8105, - "step": 18279 - }, - { - "epoch": 0.47, - "learning_rate": 1.917663170700953e-06, - "loss": 1.0615, - "step": 18280 - }, - { - "epoch": 0.47, - "learning_rate": 1.9176521752412233e-06, - "loss": 0.8994, - "step": 18281 - }, - { - "epoch": 0.47, - "learning_rate": 1.9176411790788893e-06, - "loss": 0.6304, - "step": 18282 - }, - { - "epoch": 0.47, - "learning_rate": 1.9176301822139593e-06, - "loss": 0.918, - "step": 18283 - }, - { - "epoch": 0.47, - "learning_rate": 1.9176191846464426e-06, - "loss": 1.0049, - "step": 18284 - }, - { - "epoch": 0.47, - "learning_rate": 1.917608186376347e-06, - "loss": 0.832, - "step": 18285 - }, - { - "epoch": 0.47, - "learning_rate": 1.9175971874036804e-06, - "loss": 1.0684, - "step": 18286 - }, - { - "epoch": 0.47, - "learning_rate": 1.917586187728452e-06, - "loss": 0.8428, - "step": 18287 - }, - { - "epoch": 0.47, - "learning_rate": 1.9175751873506703e-06, - "loss": 1.1221, - "step": 18288 - }, - { - "epoch": 0.47, - "learning_rate": 1.9175641862703437e-06, - "loss": 0.9453, - "step": 18289 - }, - { - "epoch": 0.47, - "learning_rate": 1.9175531844874802e-06, - "loss": 0.9834, - "step": 18290 - }, - { - "epoch": 0.47, - "learning_rate": 1.917542182002088e-06, - "loss": 0.8271, - "step": 18291 - }, - { - "epoch": 0.47, - "learning_rate": 1.9175311788141766e-06, - "loss": 0.7607, - "step": 18292 - }, - { - "epoch": 0.47, - "learning_rate": 1.9175201749237534e-06, - "loss": 1.1338, - "step": 18293 - }, - { - "epoch": 0.47, - "learning_rate": 1.9175091703308272e-06, - "loss": 0.8271, - "step": 18294 - }, - { - "epoch": 0.47, - "learning_rate": 1.9174981650354067e-06, - "loss": 0.6045, - "step": 18295 - }, - { - "epoch": 0.47, - "learning_rate": 1.9174871590375e-06, - "loss": 0.96, - "step": 18296 - }, - { - "epoch": 0.47, - "learning_rate": 1.917476152337115e-06, - "loss": 0.7715, - "step": 18297 - }, - { - "epoch": 0.47, - "learning_rate": 1.9174651449342613e-06, - "loss": 1.0791, - "step": 18298 - }, - { - "epoch": 0.47, - "learning_rate": 1.9174541368289466e-06, - "loss": 0.9277, - "step": 18299 - }, - { - "epoch": 0.47, - "learning_rate": 1.917443128021179e-06, - "loss": 0.915, - "step": 18300 - }, - { - "epoch": 0.47, - "learning_rate": 1.917432118510968e-06, - "loss": 0.9189, - "step": 18301 - }, - { - "epoch": 0.47, - "learning_rate": 1.9174211082983207e-06, - "loss": 0.9443, - "step": 18302 - }, - { - "epoch": 0.47, - "learning_rate": 1.917410097383247e-06, - "loss": 0.8896, - "step": 18303 - }, - { - "epoch": 0.47, - "learning_rate": 1.9173990857657546e-06, - "loss": 0.9722, - "step": 18304 - }, - { - "epoch": 0.47, - "learning_rate": 1.9173880734458513e-06, - "loss": 0.8701, - "step": 18305 - }, - { - "epoch": 0.47, - "learning_rate": 1.9173770604235464e-06, - "loss": 0.7178, - "step": 18306 - }, - { - "epoch": 0.47, - "learning_rate": 1.9173660466988483e-06, - "loss": 0.8496, - "step": 18307 - }, - { - "epoch": 0.47, - "learning_rate": 1.917355032271765e-06, - "loss": 0.6343, - "step": 18308 - }, - { - "epoch": 0.47, - "learning_rate": 1.9173440171423047e-06, - "loss": 0.7979, - "step": 18309 - }, - { - "epoch": 0.47, - "learning_rate": 1.9173330013104765e-06, - "loss": 0.8418, - "step": 18310 - }, - { - "epoch": 0.47, - "learning_rate": 1.917321984776289e-06, - "loss": 0.8027, - "step": 18311 - }, - { - "epoch": 0.47, - "learning_rate": 1.91731096753975e-06, - "loss": 0.999, - "step": 18312 - }, - { - "epoch": 0.47, - "learning_rate": 1.917299949600868e-06, - "loss": 1.0898, - "step": 18313 - }, - { - "epoch": 0.47, - "learning_rate": 1.917288930959652e-06, - "loss": 0.8311, - "step": 18314 - }, - { - "epoch": 0.47, - "learning_rate": 1.91727791161611e-06, - "loss": 0.7666, - "step": 18315 - }, - { - "epoch": 0.47, - "learning_rate": 1.9172668915702502e-06, - "loss": 0.8877, - "step": 18316 - }, - { - "epoch": 0.47, - "learning_rate": 1.9172558708220815e-06, - "loss": 1.0215, - "step": 18317 - }, - { - "epoch": 0.47, - "learning_rate": 1.917244849371612e-06, - "loss": 0.9414, - "step": 18318 - }, - { - "epoch": 0.47, - "learning_rate": 1.9172338272188505e-06, - "loss": 0.8413, - "step": 18319 - }, - { - "epoch": 0.47, - "learning_rate": 1.917222804363805e-06, - "loss": 0.8623, - "step": 18320 - }, - { - "epoch": 0.47, - "learning_rate": 1.917211780806484e-06, - "loss": 1.0068, - "step": 18321 - }, - { - "epoch": 0.47, - "learning_rate": 1.917200756546897e-06, - "loss": 0.748, - "step": 18322 - }, - { - "epoch": 0.47, - "learning_rate": 1.917189731585051e-06, - "loss": 0.8574, - "step": 18323 - }, - { - "epoch": 0.47, - "learning_rate": 1.917178705920955e-06, - "loss": 0.833, - "step": 18324 - }, - { - "epoch": 0.47, - "learning_rate": 1.917167679554617e-06, - "loss": 1.0381, - "step": 18325 - }, - { - "epoch": 0.47, - "learning_rate": 1.9171566524860465e-06, - "loss": 0.6084, - "step": 18326 - }, - { - "epoch": 0.47, - "learning_rate": 1.917145624715251e-06, - "loss": 0.8613, - "step": 18327 - }, - { - "epoch": 0.47, - "learning_rate": 1.9171345962422395e-06, - "loss": 0.7539, - "step": 18328 - }, - { - "epoch": 0.47, - "learning_rate": 1.9171235670670197e-06, - "loss": 0.8018, - "step": 18329 - }, - { - "epoch": 0.47, - "learning_rate": 1.917112537189601e-06, - "loss": 0.7998, - "step": 18330 - }, - { - "epoch": 0.47, - "learning_rate": 1.917101506609991e-06, - "loss": 0.7056, - "step": 18331 - }, - { - "epoch": 0.47, - "learning_rate": 1.9170904753281995e-06, - "loss": 1.1045, - "step": 18332 - }, - { - "epoch": 0.47, - "learning_rate": 1.917079443344233e-06, - "loss": 0.9004, - "step": 18333 - }, - { - "epoch": 0.47, - "learning_rate": 1.9170684106581016e-06, - "loss": 0.873, - "step": 18334 - }, - { - "epoch": 0.47, - "learning_rate": 1.9170573772698127e-06, - "loss": 0.8779, - "step": 18335 - }, - { - "epoch": 0.47, - "learning_rate": 1.917046343179375e-06, - "loss": 0.7969, - "step": 18336 - }, - { - "epoch": 0.47, - "learning_rate": 1.917035308386798e-06, - "loss": 0.6304, - "step": 18337 - }, - { - "epoch": 0.47, - "learning_rate": 1.917024272892088e-06, - "loss": 1.0537, - "step": 18338 - }, - { - "epoch": 0.47, - "learning_rate": 1.917013236695255e-06, - "loss": 0.8828, - "step": 18339 - }, - { - "epoch": 0.47, - "learning_rate": 1.9170021997963076e-06, - "loss": 0.7715, - "step": 18340 - }, - { - "epoch": 0.47, - "learning_rate": 1.9169911621952533e-06, - "loss": 0.8291, - "step": 18341 - }, - { - "epoch": 0.47, - "learning_rate": 1.9169801238921015e-06, - "loss": 0.9688, - "step": 18342 - }, - { - "epoch": 0.47, - "learning_rate": 1.91696908488686e-06, - "loss": 0.9834, - "step": 18343 - }, - { - "epoch": 0.47, - "learning_rate": 1.9169580451795373e-06, - "loss": 0.6355, - "step": 18344 - }, - { - "epoch": 0.47, - "learning_rate": 1.916947004770142e-06, - "loss": 0.9521, - "step": 18345 - }, - { - "epoch": 0.47, - "learning_rate": 1.9169359636586824e-06, - "loss": 0.7444, - "step": 18346 - }, - { - "epoch": 0.47, - "learning_rate": 1.9169249218451677e-06, - "loss": 0.7544, - "step": 18347 - }, - { - "epoch": 0.47, - "learning_rate": 1.916913879329605e-06, - "loss": 0.9014, - "step": 18348 - }, - { - "epoch": 0.47, - "learning_rate": 1.916902836112004e-06, - "loss": 0.793, - "step": 18349 - }, - { - "epoch": 0.47, - "learning_rate": 1.9168917921923727e-06, - "loss": 0.8613, - "step": 18350 - }, - { - "epoch": 0.47, - "learning_rate": 1.9168807475707193e-06, - "loss": 0.8936, - "step": 18351 - }, - { - "epoch": 0.47, - "learning_rate": 1.916869702247052e-06, - "loss": 0.7529, - "step": 18352 - }, - { - "epoch": 0.47, - "learning_rate": 1.9168586562213807e-06, - "loss": 1.0586, - "step": 18353 - }, - { - "epoch": 0.47, - "learning_rate": 1.9168476094937124e-06, - "loss": 0.6865, - "step": 18354 - }, - { - "epoch": 0.47, - "learning_rate": 1.916836562064056e-06, - "loss": 0.8066, - "step": 18355 - }, - { - "epoch": 0.47, - "learning_rate": 1.91682551393242e-06, - "loss": 0.8818, - "step": 18356 - }, - { - "epoch": 0.47, - "learning_rate": 1.916814465098813e-06, - "loss": 0.8955, - "step": 18357 - }, - { - "epoch": 0.47, - "learning_rate": 1.9168034155632433e-06, - "loss": 0.9648, - "step": 18358 - }, - { - "epoch": 0.47, - "learning_rate": 1.916792365325719e-06, - "loss": 1.0938, - "step": 18359 - }, - { - "epoch": 0.47, - "learning_rate": 1.9167813143862493e-06, - "loss": 0.8975, - "step": 18360 - }, - { - "epoch": 0.47, - "learning_rate": 1.916770262744842e-06, - "loss": 0.7256, - "step": 18361 - }, - { - "epoch": 0.47, - "learning_rate": 1.916759210401507e-06, - "loss": 0.8848, - "step": 18362 - }, - { - "epoch": 0.47, - "learning_rate": 1.91674815735625e-06, - "loss": 0.8252, - "step": 18363 - }, - { - "epoch": 0.47, - "learning_rate": 1.916737103609082e-06, - "loss": 0.7397, - "step": 18364 - }, - { - "epoch": 0.47, - "learning_rate": 1.9167260491600106e-06, - "loss": 0.4846, - "step": 18365 - }, - { - "epoch": 0.47, - "learning_rate": 1.916714994009044e-06, - "loss": 0.8184, - "step": 18366 - }, - { - "epoch": 0.47, - "learning_rate": 1.916703938156191e-06, - "loss": 0.7773, - "step": 18367 - }, - { - "epoch": 0.47, - "learning_rate": 1.9166928816014596e-06, - "loss": 0.8887, - "step": 18368 - }, - { - "epoch": 0.47, - "learning_rate": 1.9166818243448592e-06, - "loss": 0.7031, - "step": 18369 - }, - { - "epoch": 0.47, - "learning_rate": 1.916670766386397e-06, - "loss": 0.8242, - "step": 18370 - }, - { - "epoch": 0.47, - "learning_rate": 1.916659707726083e-06, - "loss": 0.7512, - "step": 18371 - }, - { - "epoch": 0.47, - "learning_rate": 1.9166486483639238e-06, - "loss": 1.1182, - "step": 18372 - }, - { - "epoch": 0.47, - "learning_rate": 1.9166375882999293e-06, - "loss": 0.6543, - "step": 18373 - }, - { - "epoch": 0.47, - "learning_rate": 1.9166265275341074e-06, - "loss": 1.0303, - "step": 18374 - }, - { - "epoch": 0.47, - "learning_rate": 1.916615466066467e-06, - "loss": 0.9922, - "step": 18375 - }, - { - "epoch": 0.47, - "learning_rate": 1.9166044038970163e-06, - "loss": 0.8862, - "step": 18376 - }, - { - "epoch": 0.47, - "learning_rate": 1.9165933410257637e-06, - "loss": 0.5947, - "step": 18377 - }, - { - "epoch": 0.47, - "learning_rate": 1.9165822774527175e-06, - "loss": 0.8623, - "step": 18378 - }, - { - "epoch": 0.47, - "learning_rate": 1.9165712131778867e-06, - "loss": 0.7822, - "step": 18379 - }, - { - "epoch": 0.47, - "learning_rate": 1.9165601482012794e-06, - "loss": 0.7744, - "step": 18380 - }, - { - "epoch": 0.47, - "learning_rate": 1.916549082522904e-06, - "loss": 0.9883, - "step": 18381 - }, - { - "epoch": 0.47, - "learning_rate": 1.916538016142769e-06, - "loss": 0.7925, - "step": 18382 - }, - { - "epoch": 0.47, - "learning_rate": 1.9165269490608835e-06, - "loss": 0.7545, - "step": 18383 - }, - { - "epoch": 0.47, - "learning_rate": 1.916515881277255e-06, - "loss": 0.877, - "step": 18384 - }, - { - "epoch": 0.47, - "learning_rate": 1.9165048127918927e-06, - "loss": 1.0137, - "step": 18385 - }, - { - "epoch": 0.47, - "learning_rate": 1.916493743604805e-06, - "loss": 0.877, - "step": 18386 - }, - { - "epoch": 0.47, - "learning_rate": 1.9164826737159994e-06, - "loss": 0.7773, - "step": 18387 - }, - { - "epoch": 0.47, - "learning_rate": 1.9164716031254856e-06, - "loss": 1.0703, - "step": 18388 - }, - { - "epoch": 0.47, - "learning_rate": 1.916460531833272e-06, - "loss": 0.7209, - "step": 18389 - }, - { - "epoch": 0.47, - "learning_rate": 1.916449459839366e-06, - "loss": 0.6943, - "step": 18390 - }, - { - "epoch": 0.47, - "learning_rate": 1.916438387143777e-06, - "loss": 0.9951, - "step": 18391 - }, - { - "epoch": 0.47, - "learning_rate": 1.9164273137465137e-06, - "loss": 1.043, - "step": 18392 - }, - { - "epoch": 0.47, - "learning_rate": 1.916416239647584e-06, - "loss": 0.8071, - "step": 18393 - }, - { - "epoch": 0.47, - "learning_rate": 1.916405164846996e-06, - "loss": 0.6309, - "step": 18394 - }, - { - "epoch": 0.47, - "learning_rate": 1.9163940893447594e-06, - "loss": 0.9268, - "step": 18395 - }, - { - "epoch": 0.47, - "learning_rate": 1.9163830131408816e-06, - "loss": 0.9033, - "step": 18396 - }, - { - "epoch": 0.47, - "learning_rate": 1.9163719362353716e-06, - "loss": 0.8584, - "step": 18397 - }, - { - "epoch": 0.47, - "learning_rate": 1.9163608586282376e-06, - "loss": 0.9082, - "step": 18398 - }, - { - "epoch": 0.47, - "learning_rate": 1.9163497803194885e-06, - "loss": 0.9648, - "step": 18399 - }, - { - "epoch": 0.47, - "learning_rate": 1.916338701309132e-06, - "loss": 0.9775, - "step": 18400 - }, - { - "epoch": 0.47, - "learning_rate": 1.9163276215971776e-06, - "loss": 0.7578, - "step": 18401 - }, - { - "epoch": 0.47, - "learning_rate": 1.916316541183633e-06, - "loss": 0.8623, - "step": 18402 - }, - { - "epoch": 0.47, - "learning_rate": 1.9163054600685073e-06, - "loss": 0.7085, - "step": 18403 - }, - { - "epoch": 0.47, - "learning_rate": 1.916294378251808e-06, - "loss": 0.7866, - "step": 18404 - }, - { - "epoch": 0.47, - "learning_rate": 1.9162832957335448e-06, - "loss": 1.0146, - "step": 18405 - }, - { - "epoch": 0.47, - "learning_rate": 1.9162722125137252e-06, - "loss": 1.0166, - "step": 18406 - }, - { - "epoch": 0.47, - "learning_rate": 1.9162611285923583e-06, - "loss": 0.6899, - "step": 18407 - }, - { - "epoch": 0.47, - "learning_rate": 1.916250043969453e-06, - "loss": 0.8418, - "step": 18408 - }, - { - "epoch": 0.47, - "learning_rate": 1.916238958645016e-06, - "loss": 1.0195, - "step": 18409 - }, - { - "epoch": 0.47, - "learning_rate": 1.9162278726190577e-06, - "loss": 0.8291, - "step": 18410 - }, - { - "epoch": 0.47, - "learning_rate": 1.916216785891586e-06, - "loss": 0.8564, - "step": 18411 - }, - { - "epoch": 0.47, - "learning_rate": 1.9162056984626084e-06, - "loss": 0.8252, - "step": 18412 - }, - { - "epoch": 0.47, - "learning_rate": 1.916194610332135e-06, - "loss": 0.8262, - "step": 18413 - }, - { - "epoch": 0.47, - "learning_rate": 1.916183521500173e-06, - "loss": 0.8545, - "step": 18414 - }, - { - "epoch": 0.47, - "learning_rate": 1.9161724319667314e-06, - "loss": 0.8105, - "step": 18415 - }, - { - "epoch": 0.47, - "learning_rate": 1.9161613417318193e-06, - "loss": 0.9561, - "step": 18416 - }, - { - "epoch": 0.47, - "learning_rate": 1.9161502507954445e-06, - "loss": 0.8223, - "step": 18417 - }, - { - "epoch": 0.47, - "learning_rate": 1.916139159157615e-06, - "loss": 0.856, - "step": 18418 - }, - { - "epoch": 0.47, - "learning_rate": 1.9161280668183403e-06, - "loss": 0.7061, - "step": 18419 - }, - { - "epoch": 0.47, - "learning_rate": 1.9161169737776286e-06, - "loss": 1.084, - "step": 18420 - }, - { - "epoch": 0.47, - "learning_rate": 1.9161058800354876e-06, - "loss": 0.7622, - "step": 18421 - }, - { - "epoch": 0.47, - "learning_rate": 1.9160947855919267e-06, - "loss": 0.9111, - "step": 18422 - }, - { - "epoch": 0.47, - "learning_rate": 1.916083690446955e-06, - "loss": 0.8145, - "step": 18423 - }, - { - "epoch": 0.47, - "learning_rate": 1.916072594600579e-06, - "loss": 0.8896, - "step": 18424 - }, - { - "epoch": 0.47, - "learning_rate": 1.9160614980528087e-06, - "loss": 0.7217, - "step": 18425 - }, - { - "epoch": 0.47, - "learning_rate": 1.9160504008036524e-06, - "loss": 1.0117, - "step": 18426 - }, - { - "epoch": 0.47, - "learning_rate": 1.9160393028531185e-06, - "loss": 1.0254, - "step": 18427 - }, - { - "epoch": 0.47, - "learning_rate": 1.9160282042012154e-06, - "loss": 0.7686, - "step": 18428 - }, - { - "epoch": 0.47, - "learning_rate": 1.9160171048479513e-06, - "loss": 0.9766, - "step": 18429 - }, - { - "epoch": 0.47, - "learning_rate": 1.9160060047933354e-06, - "loss": 1.0918, - "step": 18430 - }, - { - "epoch": 0.47, - "learning_rate": 1.9159949040373754e-06, - "loss": 0.7432, - "step": 18431 - }, - { - "epoch": 0.47, - "learning_rate": 1.91598380258008e-06, - "loss": 0.8545, - "step": 18432 - }, - { - "epoch": 0.47, - "learning_rate": 1.915972700421459e-06, - "loss": 0.772, - "step": 18433 - }, - { - "epoch": 0.47, - "learning_rate": 1.915961597561519e-06, - "loss": 1.0703, - "step": 18434 - }, - { - "epoch": 0.47, - "learning_rate": 1.9159504940002695e-06, - "loss": 0.9146, - "step": 18435 - }, - { - "epoch": 0.47, - "learning_rate": 1.915939389737719e-06, - "loss": 1.041, - "step": 18436 - }, - { - "epoch": 0.47, - "learning_rate": 1.9159282847738754e-06, - "loss": 0.71, - "step": 18437 - }, - { - "epoch": 0.47, - "learning_rate": 1.915917179108748e-06, - "loss": 0.7832, - "step": 18438 - }, - { - "epoch": 0.47, - "learning_rate": 1.915906072742345e-06, - "loss": 0.8535, - "step": 18439 - }, - { - "epoch": 0.47, - "learning_rate": 1.9158949656746744e-06, - "loss": 0.8882, - "step": 18440 - }, - { - "epoch": 0.47, - "learning_rate": 1.9158838579057454e-06, - "loss": 0.6997, - "step": 18441 - }, - { - "epoch": 0.47, - "learning_rate": 1.9158727494355662e-06, - "loss": 0.9854, - "step": 18442 - }, - { - "epoch": 0.47, - "learning_rate": 1.9158616402641454e-06, - "loss": 1.0645, - "step": 18443 - }, - { - "epoch": 0.47, - "learning_rate": 1.915850530391492e-06, - "loss": 0.9189, - "step": 18444 - }, - { - "epoch": 0.47, - "learning_rate": 1.9158394198176133e-06, - "loss": 0.9033, - "step": 18445 - }, - { - "epoch": 0.47, - "learning_rate": 1.9158283085425184e-06, - "loss": 1.1152, - "step": 18446 - }, - { - "epoch": 0.47, - "learning_rate": 1.915817196566216e-06, - "loss": 0.918, - "step": 18447 - }, - { - "epoch": 0.47, - "learning_rate": 1.9158060838887143e-06, - "loss": 0.8799, - "step": 18448 - }, - { - "epoch": 0.47, - "learning_rate": 1.9157949705100224e-06, - "loss": 0.9922, - "step": 18449 - }, - { - "epoch": 0.47, - "learning_rate": 1.915783856430148e-06, - "loss": 0.5969, - "step": 18450 - }, - { - "epoch": 0.47, - "learning_rate": 1.9157727416491005e-06, - "loss": 0.9512, - "step": 18451 - }, - { - "epoch": 0.47, - "learning_rate": 1.915761626166888e-06, - "loss": 1.0742, - "step": 18452 - }, - { - "epoch": 0.47, - "learning_rate": 1.915750509983518e-06, - "loss": 0.8584, - "step": 18453 - }, - { - "epoch": 0.47, - "learning_rate": 1.9157393930990006e-06, - "loss": 0.9141, - "step": 18454 - }, - { - "epoch": 0.47, - "learning_rate": 1.915728275513344e-06, - "loss": 0.9697, - "step": 18455 - }, - { - "epoch": 0.47, - "learning_rate": 1.9157171572265555e-06, - "loss": 0.7827, - "step": 18456 - }, - { - "epoch": 0.47, - "learning_rate": 1.915706038238645e-06, - "loss": 0.7109, - "step": 18457 - }, - { - "epoch": 0.47, - "learning_rate": 1.9156949185496203e-06, - "loss": 0.875, - "step": 18458 - }, - { - "epoch": 0.47, - "learning_rate": 1.9156837981594904e-06, - "loss": 0.9885, - "step": 18459 - }, - { - "epoch": 0.47, - "learning_rate": 1.9156726770682633e-06, - "loss": 0.8301, - "step": 18460 - }, - { - "epoch": 0.47, - "learning_rate": 1.915661555275948e-06, - "loss": 0.7314, - "step": 18461 - }, - { - "epoch": 0.47, - "learning_rate": 1.9156504327825525e-06, - "loss": 0.9521, - "step": 18462 - }, - { - "epoch": 0.47, - "learning_rate": 1.9156393095880858e-06, - "loss": 0.8457, - "step": 18463 - }, - { - "epoch": 0.47, - "learning_rate": 1.9156281856925557e-06, - "loss": 0.6265, - "step": 18464 - }, - { - "epoch": 0.47, - "learning_rate": 1.9156170610959712e-06, - "loss": 0.791, - "step": 18465 - }, - { - "epoch": 0.47, - "learning_rate": 1.9156059357983412e-06, - "loss": 0.8087, - "step": 18466 - }, - { - "epoch": 0.47, - "learning_rate": 1.915594809799674e-06, - "loss": 1.0029, - "step": 18467 - }, - { - "epoch": 0.47, - "learning_rate": 1.9155836830999775e-06, - "loss": 0.8433, - "step": 18468 - }, - { - "epoch": 0.47, - "learning_rate": 1.915572555699261e-06, - "loss": 0.9463, - "step": 18469 - }, - { - "epoch": 0.47, - "learning_rate": 1.915561427597533e-06, - "loss": 1.002, - "step": 18470 - }, - { - "epoch": 0.47, - "learning_rate": 1.915550298794801e-06, - "loss": 0.8965, - "step": 18471 - }, - { - "epoch": 0.47, - "learning_rate": 1.915539169291074e-06, - "loss": 0.9961, - "step": 18472 - }, - { - "epoch": 0.47, - "learning_rate": 1.9155280390863617e-06, - "loss": 0.9678, - "step": 18473 - }, - { - "epoch": 0.47, - "learning_rate": 1.9155169081806713e-06, - "loss": 0.7725, - "step": 18474 - }, - { - "epoch": 0.47, - "learning_rate": 1.9155057765740113e-06, - "loss": 0.873, - "step": 18475 - }, - { - "epoch": 0.47, - "learning_rate": 1.915494644266391e-06, - "loss": 0.7384, - "step": 18476 - }, - { - "epoch": 0.47, - "learning_rate": 1.9154835112578188e-06, - "loss": 0.7969, - "step": 18477 - }, - { - "epoch": 0.47, - "learning_rate": 1.9154723775483024e-06, - "loss": 0.8486, - "step": 18478 - }, - { - "epoch": 0.47, - "learning_rate": 1.915461243137851e-06, - "loss": 0.8047, - "step": 18479 - }, - { - "epoch": 0.47, - "learning_rate": 1.915450108026473e-06, - "loss": 0.9404, - "step": 18480 - }, - { - "epoch": 0.47, - "learning_rate": 1.9154389722141776e-06, - "loss": 0.8789, - "step": 18481 - }, - { - "epoch": 0.47, - "learning_rate": 1.915427835700972e-06, - "loss": 0.9082, - "step": 18482 - }, - { - "epoch": 0.47, - "learning_rate": 1.9154166984868658e-06, - "loss": 0.9814, - "step": 18483 - }, - { - "epoch": 0.47, - "learning_rate": 1.915405560571867e-06, - "loss": 1.041, - "step": 18484 - }, - { - "epoch": 0.47, - "learning_rate": 1.915394421955984e-06, - "loss": 0.623, - "step": 18485 - }, - { - "epoch": 0.47, - "learning_rate": 1.915383282639226e-06, - "loss": 0.9775, - "step": 18486 - }, - { - "epoch": 0.47, - "learning_rate": 1.915372142621601e-06, - "loss": 1.0361, - "step": 18487 - }, - { - "epoch": 0.47, - "learning_rate": 1.9153610019031173e-06, - "loss": 0.8555, - "step": 18488 - }, - { - "epoch": 0.47, - "learning_rate": 1.9153498604837843e-06, - "loss": 0.8535, - "step": 18489 - }, - { - "epoch": 0.47, - "learning_rate": 1.9153387183636094e-06, - "loss": 0.9277, - "step": 18490 - }, - { - "epoch": 0.47, - "learning_rate": 1.915327575542602e-06, - "loss": 0.7509, - "step": 18491 - }, - { - "epoch": 0.47, - "learning_rate": 1.9153164320207705e-06, - "loss": 1.1562, - "step": 18492 - }, - { - "epoch": 0.47, - "learning_rate": 1.915305287798123e-06, - "loss": 0.8711, - "step": 18493 - }, - { - "epoch": 0.47, - "learning_rate": 1.9152941428746685e-06, - "loss": 1.1064, - "step": 18494 - }, - { - "epoch": 0.47, - "learning_rate": 1.9152829972504153e-06, - "loss": 0.8057, - "step": 18495 - }, - { - "epoch": 0.47, - "learning_rate": 1.9152718509253723e-06, - "loss": 1.0684, - "step": 18496 - }, - { - "epoch": 0.47, - "learning_rate": 1.9152607038995473e-06, - "loss": 1.0449, - "step": 18497 - }, - { - "epoch": 0.47, - "learning_rate": 1.9152495561729494e-06, - "loss": 0.6912, - "step": 18498 - }, - { - "epoch": 0.47, - "learning_rate": 1.915238407745587e-06, - "loss": 0.8643, - "step": 18499 - }, - { - "epoch": 0.47, - "learning_rate": 1.915227258617469e-06, - "loss": 0.8027, - "step": 18500 - }, - { - "epoch": 0.47, - "learning_rate": 1.9152161087886032e-06, - "loss": 0.6064, - "step": 18501 - }, - { - "epoch": 0.47, - "learning_rate": 1.9152049582589984e-06, - "loss": 0.7278, - "step": 18502 - }, - { - "epoch": 0.47, - "learning_rate": 1.9151938070286636e-06, - "loss": 0.9258, - "step": 18503 - }, - { - "epoch": 0.47, - "learning_rate": 1.9151826550976068e-06, - "loss": 0.7715, - "step": 18504 - }, - { - "epoch": 0.47, - "learning_rate": 1.9151715024658364e-06, - "loss": 0.9922, - "step": 18505 - }, - { - "epoch": 0.47, - "learning_rate": 1.915160349133362e-06, - "loss": 0.7764, - "step": 18506 - }, - { - "epoch": 0.47, - "learning_rate": 1.915149195100191e-06, - "loss": 0.9902, - "step": 18507 - }, - { - "epoch": 0.47, - "learning_rate": 1.915138040366332e-06, - "loss": 0.9414, - "step": 18508 - }, - { - "epoch": 0.47, - "learning_rate": 1.9151268849317945e-06, - "loss": 0.8896, - "step": 18509 - }, - { - "epoch": 0.47, - "learning_rate": 1.915115728796586e-06, - "loss": 0.7656, - "step": 18510 - }, - { - "epoch": 0.47, - "learning_rate": 1.9151045719607156e-06, - "loss": 0.9033, - "step": 18511 - }, - { - "epoch": 0.47, - "learning_rate": 1.9150934144241917e-06, - "loss": 0.9229, - "step": 18512 - }, - { - "epoch": 0.47, - "learning_rate": 1.915082256187023e-06, - "loss": 0.7285, - "step": 18513 - }, - { - "epoch": 0.47, - "learning_rate": 1.9150710972492176e-06, - "loss": 0.8389, - "step": 18514 - }, - { - "epoch": 0.47, - "learning_rate": 1.9150599376107844e-06, - "loss": 1.0049, - "step": 18515 - }, - { - "epoch": 0.47, - "learning_rate": 1.915048777271732e-06, - "loss": 0.6914, - "step": 18516 - }, - { - "epoch": 0.47, - "learning_rate": 1.9150376162320688e-06, - "loss": 1.0254, - "step": 18517 - }, - { - "epoch": 0.47, - "learning_rate": 1.9150264544918033e-06, - "loss": 0.8604, - "step": 18518 - }, - { - "epoch": 0.47, - "learning_rate": 1.9150152920509442e-06, - "loss": 0.6895, - "step": 18519 - }, - { - "epoch": 0.47, - "learning_rate": 1.9150041289095e-06, - "loss": 0.9092, - "step": 18520 - }, - { - "epoch": 0.47, - "learning_rate": 1.9149929650674794e-06, - "loss": 1.082, - "step": 18521 - }, - { - "epoch": 0.47, - "learning_rate": 1.91498180052489e-06, - "loss": 0.8447, - "step": 18522 - }, - { - "epoch": 0.47, - "learning_rate": 1.914970635281742e-06, - "loss": 0.8994, - "step": 18523 - }, - { - "epoch": 0.47, - "learning_rate": 1.9149594693380425e-06, - "loss": 0.9082, - "step": 18524 - }, - { - "epoch": 0.47, - "learning_rate": 1.914948302693801e-06, - "loss": 0.8447, - "step": 18525 - }, - { - "epoch": 0.47, - "learning_rate": 1.9149371353490252e-06, - "loss": 1.207, - "step": 18526 - }, - { - "epoch": 0.47, - "learning_rate": 1.9149259673037244e-06, - "loss": 0.8975, - "step": 18527 - }, - { - "epoch": 0.47, - "learning_rate": 1.914914798557907e-06, - "loss": 0.9033, - "step": 18528 - }, - { - "epoch": 0.47, - "learning_rate": 1.914903629111581e-06, - "loss": 0.875, - "step": 18529 - }, - { - "epoch": 0.47, - "learning_rate": 1.9148924589647553e-06, - "loss": 1.0234, - "step": 18530 - }, - { - "epoch": 0.47, - "learning_rate": 1.914881288117439e-06, - "loss": 0.7871, - "step": 18531 - }, - { - "epoch": 0.47, - "learning_rate": 1.9148701165696403e-06, - "loss": 0.9736, - "step": 18532 - }, - { - "epoch": 0.48, - "learning_rate": 1.914858944321367e-06, - "loss": 0.8066, - "step": 18533 - }, - { - "epoch": 0.48, - "learning_rate": 1.9148477713726285e-06, - "loss": 0.916, - "step": 18534 - }, - { - "epoch": 0.48, - "learning_rate": 1.914836597723433e-06, - "loss": 0.8789, - "step": 18535 - }, - { - "epoch": 0.48, - "learning_rate": 1.9148254233737896e-06, - "loss": 0.9932, - "step": 18536 - }, - { - "epoch": 0.48, - "learning_rate": 1.9148142483237062e-06, - "loss": 0.8706, - "step": 18537 - }, - { - "epoch": 0.48, - "learning_rate": 1.9148030725731914e-06, - "loss": 0.6719, - "step": 18538 - }, - { - "epoch": 0.48, - "learning_rate": 1.914791896122254e-06, - "loss": 0.9873, - "step": 18539 - }, - { - "epoch": 0.48, - "learning_rate": 1.914780718970903e-06, - "loss": 0.9219, - "step": 18540 - }, - { - "epoch": 0.48, - "learning_rate": 1.914769541119146e-06, - "loss": 1.0244, - "step": 18541 - }, - { - "epoch": 0.48, - "learning_rate": 1.9147583625669922e-06, - "loss": 0.8994, - "step": 18542 - }, - { - "epoch": 0.48, - "learning_rate": 1.9147471833144498e-06, - "loss": 0.7495, - "step": 18543 - }, - { - "epoch": 0.48, - "learning_rate": 1.9147360033615275e-06, - "loss": 1.0391, - "step": 18544 - }, - { - "epoch": 0.48, - "learning_rate": 1.914724822708234e-06, - "loss": 0.7695, - "step": 18545 - }, - { - "epoch": 0.48, - "learning_rate": 1.914713641354578e-06, - "loss": 0.8564, - "step": 18546 - }, - { - "epoch": 0.48, - "learning_rate": 1.9147024593005677e-06, - "loss": 1.1162, - "step": 18547 - }, - { - "epoch": 0.48, - "learning_rate": 1.9146912765462115e-06, - "loss": 0.6855, - "step": 18548 - }, - { - "epoch": 0.48, - "learning_rate": 1.9146800930915187e-06, - "loss": 1.0352, - "step": 18549 - }, - { - "epoch": 0.48, - "learning_rate": 1.9146689089364973e-06, - "loss": 1.0146, - "step": 18550 - }, - { - "epoch": 0.48, - "learning_rate": 1.914657724081156e-06, - "loss": 0.9531, - "step": 18551 - }, - { - "epoch": 0.48, - "learning_rate": 1.914646538525503e-06, - "loss": 0.9512, - "step": 18552 - }, - { - "epoch": 0.48, - "learning_rate": 1.9146353522695472e-06, - "loss": 0.8047, - "step": 18553 - }, - { - "epoch": 0.48, - "learning_rate": 1.9146241653132973e-06, - "loss": 0.8857, - "step": 18554 - }, - { - "epoch": 0.48, - "learning_rate": 1.914612977656762e-06, - "loss": 0.9863, - "step": 18555 - }, - { - "epoch": 0.48, - "learning_rate": 1.9146017892999495e-06, - "loss": 0.7979, - "step": 18556 - }, - { - "epoch": 0.48, - "learning_rate": 1.914590600242868e-06, - "loss": 0.5752, - "step": 18557 - }, - { - "epoch": 0.48, - "learning_rate": 1.9145794104855272e-06, - "loss": 1.0088, - "step": 18558 - }, - { - "epoch": 0.48, - "learning_rate": 1.9145682200279345e-06, - "loss": 0.8232, - "step": 18559 - }, - { - "epoch": 0.48, - "learning_rate": 1.9145570288700996e-06, - "loss": 0.8198, - "step": 18560 - }, - { - "epoch": 0.48, - "learning_rate": 1.9145458370120298e-06, - "loss": 0.7754, - "step": 18561 - }, - { - "epoch": 0.48, - "learning_rate": 1.9145346444537343e-06, - "loss": 0.8975, - "step": 18562 - }, - { - "epoch": 0.48, - "learning_rate": 1.914523451195222e-06, - "loss": 0.9717, - "step": 18563 - }, - { - "epoch": 0.48, - "learning_rate": 1.9145122572365013e-06, - "loss": 0.7749, - "step": 18564 - }, - { - "epoch": 0.48, - "learning_rate": 1.9145010625775798e-06, - "loss": 1.1016, - "step": 18565 - }, - { - "epoch": 0.48, - "learning_rate": 1.914489867218468e-06, - "loss": 0.9209, - "step": 18566 - }, - { - "epoch": 0.48, - "learning_rate": 1.9144786711591726e-06, - "loss": 0.8975, - "step": 18567 - }, - { - "epoch": 0.48, - "learning_rate": 1.914467474399703e-06, - "loss": 0.832, - "step": 18568 - }, - { - "epoch": 0.48, - "learning_rate": 1.9144562769400675e-06, - "loss": 0.8486, - "step": 18569 - }, - { - "epoch": 0.48, - "learning_rate": 1.9144450787802754e-06, - "loss": 0.9272, - "step": 18570 - }, - { - "epoch": 0.48, - "learning_rate": 1.9144338799203348e-06, - "loss": 0.7231, - "step": 18571 - }, - { - "epoch": 0.48, - "learning_rate": 1.914422680360254e-06, - "loss": 0.7842, - "step": 18572 - }, - { - "epoch": 0.48, - "learning_rate": 1.9144114801000413e-06, - "loss": 0.7939, - "step": 18573 - }, - { - "epoch": 0.48, - "learning_rate": 1.9144002791397063e-06, - "loss": 0.9834, - "step": 18574 - }, - { - "epoch": 0.48, - "learning_rate": 1.914389077479257e-06, - "loss": 0.7974, - "step": 18575 - }, - { - "epoch": 0.48, - "learning_rate": 1.9143778751187025e-06, - "loss": 0.8904, - "step": 18576 - }, - { - "epoch": 0.48, - "learning_rate": 1.91436667205805e-06, - "loss": 0.7754, - "step": 18577 - }, - { - "epoch": 0.48, - "learning_rate": 1.9143554682973095e-06, - "loss": 1.0195, - "step": 18578 - }, - { - "epoch": 0.48, - "learning_rate": 1.914344263836489e-06, - "loss": 0.7041, - "step": 18579 - }, - { - "epoch": 0.48, - "learning_rate": 1.914333058675597e-06, - "loss": 0.9932, - "step": 18580 - }, - { - "epoch": 0.48, - "learning_rate": 1.9143218528146425e-06, - "loss": 0.7227, - "step": 18581 - }, - { - "epoch": 0.48, - "learning_rate": 1.9143106462536338e-06, - "loss": 0.7415, - "step": 18582 - }, - { - "epoch": 0.48, - "learning_rate": 1.914299438992579e-06, - "loss": 0.8887, - "step": 18583 - }, - { - "epoch": 0.48, - "learning_rate": 1.914288231031488e-06, - "loss": 0.8979, - "step": 18584 - }, - { - "epoch": 0.48, - "learning_rate": 1.9142770223703676e-06, - "loss": 0.9492, - "step": 18585 - }, - { - "epoch": 0.48, - "learning_rate": 1.9142658130092276e-06, - "loss": 0.7427, - "step": 18586 - }, - { - "epoch": 0.48, - "learning_rate": 1.9142546029480762e-06, - "loss": 0.6846, - "step": 18587 - }, - { - "epoch": 0.48, - "learning_rate": 1.914243392186923e-06, - "loss": 0.959, - "step": 18588 - }, - { - "epoch": 0.48, - "learning_rate": 1.9142321807257748e-06, - "loss": 0.9902, - "step": 18589 - }, - { - "epoch": 0.48, - "learning_rate": 1.914220968564641e-06, - "loss": 0.7, - "step": 18590 - }, - { - "epoch": 0.48, - "learning_rate": 1.9142097557035305e-06, - "loss": 0.6807, - "step": 18591 - }, - { - "epoch": 0.48, - "learning_rate": 1.9141985421424517e-06, - "loss": 0.7812, - "step": 18592 - }, - { - "epoch": 0.48, - "learning_rate": 1.9141873278814133e-06, - "loss": 0.7598, - "step": 18593 - }, - { - "epoch": 0.48, - "learning_rate": 1.914176112920423e-06, - "loss": 0.8145, - "step": 18594 - }, - { - "epoch": 0.48, - "learning_rate": 1.9141648972594905e-06, - "loss": 0.7495, - "step": 18595 - }, - { - "epoch": 0.48, - "learning_rate": 1.9141536808986244e-06, - "loss": 1.001, - "step": 18596 - }, - { - "epoch": 0.48, - "learning_rate": 1.914142463837832e-06, - "loss": 0.9111, - "step": 18597 - }, - { - "epoch": 0.48, - "learning_rate": 1.9141312460771233e-06, - "loss": 0.9189, - "step": 18598 - }, - { - "epoch": 0.48, - "learning_rate": 1.9141200276165065e-06, - "loss": 0.7695, - "step": 18599 - }, - { - "epoch": 0.48, - "learning_rate": 1.91410880845599e-06, - "loss": 0.8743, - "step": 18600 - }, - { - "epoch": 0.48, - "learning_rate": 1.914097588595582e-06, - "loss": 0.8838, - "step": 18601 - }, - { - "epoch": 0.48, - "learning_rate": 1.9140863680352917e-06, - "loss": 0.7871, - "step": 18602 - }, - { - "epoch": 0.48, - "learning_rate": 1.9140751467751273e-06, - "loss": 0.9043, - "step": 18603 - }, - { - "epoch": 0.48, - "learning_rate": 1.9140639248150977e-06, - "loss": 0.875, - "step": 18604 - }, - { - "epoch": 0.48, - "learning_rate": 1.9140527021552113e-06, - "loss": 0.8574, - "step": 18605 - }, - { - "epoch": 0.48, - "learning_rate": 1.914041478795477e-06, - "loss": 0.7837, - "step": 18606 - }, - { - "epoch": 0.48, - "learning_rate": 1.914030254735903e-06, - "loss": 0.8257, - "step": 18607 - }, - { - "epoch": 0.48, - "learning_rate": 1.9140190299764982e-06, - "loss": 0.8848, - "step": 18608 - }, - { - "epoch": 0.48, - "learning_rate": 1.9140078045172713e-06, - "loss": 0.8652, - "step": 18609 - }, - { - "epoch": 0.48, - "learning_rate": 1.9139965783582304e-06, - "loss": 0.9902, - "step": 18610 - }, - { - "epoch": 0.48, - "learning_rate": 1.9139853514993845e-06, - "loss": 0.9131, - "step": 18611 - }, - { - "epoch": 0.48, - "learning_rate": 1.9139741239407415e-06, - "loss": 0.6648, - "step": 18612 - }, - { - "epoch": 0.48, - "learning_rate": 1.913962895682311e-06, - "loss": 0.8496, - "step": 18613 - }, - { - "epoch": 0.48, - "learning_rate": 1.913951666724101e-06, - "loss": 0.7676, - "step": 18614 - }, - { - "epoch": 0.48, - "learning_rate": 1.9139404370661203e-06, - "loss": 0.7749, - "step": 18615 - }, - { - "epoch": 0.48, - "learning_rate": 1.9139292067083773e-06, - "loss": 0.7656, - "step": 18616 - }, - { - "epoch": 0.48, - "learning_rate": 1.913917975650881e-06, - "loss": 0.9136, - "step": 18617 - }, - { - "epoch": 0.48, - "learning_rate": 1.9139067438936397e-06, - "loss": 0.8237, - "step": 18618 - }, - { - "epoch": 0.48, - "learning_rate": 1.913895511436662e-06, - "loss": 0.793, - "step": 18619 - }, - { - "epoch": 0.48, - "learning_rate": 1.913884278279956e-06, - "loss": 0.8984, - "step": 18620 - }, - { - "epoch": 0.48, - "learning_rate": 1.9138730444235318e-06, - "loss": 0.7861, - "step": 18621 - }, - { - "epoch": 0.48, - "learning_rate": 1.913861809867396e-06, - "loss": 0.8564, - "step": 18622 - }, - { - "epoch": 0.48, - "learning_rate": 1.9138505746115587e-06, - "loss": 0.7432, - "step": 18623 - }, - { - "epoch": 0.48, - "learning_rate": 1.9138393386560283e-06, - "loss": 0.8535, - "step": 18624 - }, - { - "epoch": 0.48, - "learning_rate": 1.9138281020008126e-06, - "loss": 0.6357, - "step": 18625 - }, - { - "epoch": 0.48, - "learning_rate": 1.913816864645921e-06, - "loss": 0.8447, - "step": 18626 - }, - { - "epoch": 0.48, - "learning_rate": 1.913805626591362e-06, - "loss": 1.0283, - "step": 18627 - }, - { - "epoch": 0.48, - "learning_rate": 1.9137943878371437e-06, - "loss": 0.5125, - "step": 18628 - }, - { - "epoch": 0.48, - "learning_rate": 1.9137831483832757e-06, - "loss": 0.8936, - "step": 18629 - }, - { - "epoch": 0.48, - "learning_rate": 1.9137719082297653e-06, - "loss": 1.0381, - "step": 18630 - }, - { - "epoch": 0.48, - "learning_rate": 1.913760667376622e-06, - "loss": 0.8711, - "step": 18631 - }, - { - "epoch": 0.48, - "learning_rate": 1.9137494258238543e-06, - "loss": 0.9609, - "step": 18632 - }, - { - "epoch": 0.48, - "learning_rate": 1.9137381835714704e-06, - "loss": 0.9023, - "step": 18633 - }, - { - "epoch": 0.48, - "learning_rate": 1.9137269406194795e-06, - "loss": 0.6729, - "step": 18634 - }, - { - "epoch": 0.48, - "learning_rate": 1.91371569696789e-06, - "loss": 0.7881, - "step": 18635 - }, - { - "epoch": 0.48, - "learning_rate": 1.91370445261671e-06, - "loss": 0.7783, - "step": 18636 - }, - { - "epoch": 0.48, - "learning_rate": 1.9136932075659485e-06, - "loss": 0.8281, - "step": 18637 - }, - { - "epoch": 0.48, - "learning_rate": 1.9136819618156145e-06, - "loss": 0.9277, - "step": 18638 - }, - { - "epoch": 0.48, - "learning_rate": 1.913670715365716e-06, - "loss": 0.9814, - "step": 18639 - }, - { - "epoch": 0.48, - "learning_rate": 1.913659468216262e-06, - "loss": 0.6953, - "step": 18640 - }, - { - "epoch": 0.48, - "learning_rate": 1.9136482203672606e-06, - "loss": 0.7012, - "step": 18641 - }, - { - "epoch": 0.48, - "learning_rate": 1.913636971818721e-06, - "loss": 0.9189, - "step": 18642 - }, - { - "epoch": 0.48, - "learning_rate": 1.9136257225706513e-06, - "loss": 0.8896, - "step": 18643 - }, - { - "epoch": 0.48, - "learning_rate": 1.913614472623061e-06, - "loss": 0.8086, - "step": 18644 - }, - { - "epoch": 0.48, - "learning_rate": 1.9136032219759576e-06, - "loss": 1.0244, - "step": 18645 - }, - { - "epoch": 0.48, - "learning_rate": 1.9135919706293502e-06, - "loss": 0.8672, - "step": 18646 - }, - { - "epoch": 0.48, - "learning_rate": 1.913580718583248e-06, - "loss": 0.8477, - "step": 18647 - }, - { - "epoch": 0.48, - "learning_rate": 1.9135694658376583e-06, - "loss": 0.8135, - "step": 18648 - }, - { - "epoch": 0.48, - "learning_rate": 1.913558212392591e-06, - "loss": 1.0752, - "step": 18649 - }, - { - "epoch": 0.48, - "learning_rate": 1.9135469582480543e-06, - "loss": 0.834, - "step": 18650 - }, - { - "epoch": 0.48, - "learning_rate": 1.9135357034040563e-06, - "loss": 0.8809, - "step": 18651 - }, - { - "epoch": 0.48, - "learning_rate": 1.913524447860606e-06, - "loss": 0.8496, - "step": 18652 - }, - { - "epoch": 0.48, - "learning_rate": 1.9135131916177124e-06, - "loss": 0.7046, - "step": 18653 - }, - { - "epoch": 0.48, - "learning_rate": 1.9135019346753834e-06, - "loss": 0.7627, - "step": 18654 - }, - { - "epoch": 0.48, - "learning_rate": 1.913490677033628e-06, - "loss": 0.7395, - "step": 18655 - }, - { - "epoch": 0.48, - "learning_rate": 1.913479418692455e-06, - "loss": 0.8076, - "step": 18656 - }, - { - "epoch": 0.48, - "learning_rate": 1.9134681596518725e-06, - "loss": 0.791, - "step": 18657 - }, - { - "epoch": 0.48, - "learning_rate": 1.91345689991189e-06, - "loss": 0.7627, - "step": 18658 - }, - { - "epoch": 0.48, - "learning_rate": 1.913445639472515e-06, - "loss": 0.7864, - "step": 18659 - }, - { - "epoch": 0.48, - "learning_rate": 1.9134343783337566e-06, - "loss": 0.7646, - "step": 18660 - }, - { - "epoch": 0.48, - "learning_rate": 1.913423116495624e-06, - "loss": 1.126, - "step": 18661 - }, - { - "epoch": 0.48, - "learning_rate": 1.913411853958125e-06, - "loss": 0.9014, - "step": 18662 - }, - { - "epoch": 0.48, - "learning_rate": 1.913400590721269e-06, - "loss": 0.9336, - "step": 18663 - }, - { - "epoch": 0.48, - "learning_rate": 1.913389326785064e-06, - "loss": 0.7666, - "step": 18664 - }, - { - "epoch": 0.48, - "learning_rate": 1.9133780621495183e-06, - "loss": 0.9248, - "step": 18665 - }, - { - "epoch": 0.48, - "learning_rate": 1.913366796814641e-06, - "loss": 0.7397, - "step": 18666 - }, - { - "epoch": 0.48, - "learning_rate": 1.9133555307804413e-06, - "loss": 0.8691, - "step": 18667 - }, - { - "epoch": 0.48, - "learning_rate": 1.913344264046927e-06, - "loss": 0.9404, - "step": 18668 - }, - { - "epoch": 0.48, - "learning_rate": 1.913332996614107e-06, - "loss": 1.0146, - "step": 18669 - }, - { - "epoch": 0.48, - "learning_rate": 1.91332172848199e-06, - "loss": 0.8506, - "step": 18670 - }, - { - "epoch": 0.48, - "learning_rate": 1.9133104596505843e-06, - "loss": 0.7466, - "step": 18671 - }, - { - "epoch": 0.48, - "learning_rate": 1.913299190119899e-06, - "loss": 1.0088, - "step": 18672 - }, - { - "epoch": 0.48, - "learning_rate": 1.9132879198899427e-06, - "loss": 0.8994, - "step": 18673 - }, - { - "epoch": 0.48, - "learning_rate": 1.9132766489607234e-06, - "loss": 0.8438, - "step": 18674 - }, - { - "epoch": 0.48, - "learning_rate": 1.9132653773322504e-06, - "loss": 1.0957, - "step": 18675 - }, - { - "epoch": 0.48, - "learning_rate": 1.913254105004532e-06, - "loss": 1.0566, - "step": 18676 - }, - { - "epoch": 0.48, - "learning_rate": 1.913242831977577e-06, - "loss": 0.8738, - "step": 18677 - }, - { - "epoch": 0.48, - "learning_rate": 1.913231558251394e-06, - "loss": 0.665, - "step": 18678 - }, - { - "epoch": 0.48, - "learning_rate": 1.9132202838259915e-06, - "loss": 0.7197, - "step": 18679 - }, - { - "epoch": 0.48, - "learning_rate": 1.9132090087013782e-06, - "loss": 0.7546, - "step": 18680 - }, - { - "epoch": 0.48, - "learning_rate": 1.913197732877563e-06, - "loss": 0.7471, - "step": 18681 - }, - { - "epoch": 0.48, - "learning_rate": 1.9131864563545538e-06, - "loss": 1.1338, - "step": 18682 - }, - { - "epoch": 0.48, - "learning_rate": 1.91317517913236e-06, - "loss": 0.79, - "step": 18683 - }, - { - "epoch": 0.48, - "learning_rate": 1.91316390121099e-06, - "loss": 0.999, - "step": 18684 - }, - { - "epoch": 0.48, - "learning_rate": 1.9131526225904523e-06, - "loss": 0.7129, - "step": 18685 - }, - { - "epoch": 0.48, - "learning_rate": 1.913141343270756e-06, - "loss": 0.9863, - "step": 18686 - }, - { - "epoch": 0.48, - "learning_rate": 1.9131300632519087e-06, - "loss": 0.8389, - "step": 18687 - }, - { - "epoch": 0.48, - "learning_rate": 1.91311878253392e-06, - "loss": 0.668, - "step": 18688 - }, - { - "epoch": 0.48, - "learning_rate": 1.913107501116798e-06, - "loss": 0.7104, - "step": 18689 - }, - { - "epoch": 0.48, - "learning_rate": 1.913096219000552e-06, - "loss": 0.8135, - "step": 18690 - }, - { - "epoch": 0.48, - "learning_rate": 1.91308493618519e-06, - "loss": 0.9902, - "step": 18691 - }, - { - "epoch": 0.48, - "learning_rate": 1.913073652670721e-06, - "loss": 0.8857, - "step": 18692 - }, - { - "epoch": 0.48, - "learning_rate": 1.9130623684571532e-06, - "loss": 1.0986, - "step": 18693 - }, - { - "epoch": 0.48, - "learning_rate": 1.913051083544496e-06, - "loss": 0.998, - "step": 18694 - }, - { - "epoch": 0.48, - "learning_rate": 1.913039797932757e-06, - "loss": 0.7339, - "step": 18695 - }, - { - "epoch": 0.48, - "learning_rate": 1.9130285116219457e-06, - "loss": 0.9756, - "step": 18696 - }, - { - "epoch": 0.48, - "learning_rate": 1.9130172246120706e-06, - "loss": 1.0439, - "step": 18697 - }, - { - "epoch": 0.48, - "learning_rate": 1.91300593690314e-06, - "loss": 0.6514, - "step": 18698 - }, - { - "epoch": 0.48, - "learning_rate": 1.9129946484951625e-06, - "loss": 0.8496, - "step": 18699 - }, - { - "epoch": 0.48, - "learning_rate": 1.912983359388148e-06, - "loss": 0.8237, - "step": 18700 - }, - { - "epoch": 0.48, - "learning_rate": 1.912972069582103e-06, - "loss": 0.8955, - "step": 18701 - }, - { - "epoch": 0.48, - "learning_rate": 1.9129607790770375e-06, - "loss": 1.0093, - "step": 18702 - }, - { - "epoch": 0.48, - "learning_rate": 1.9129494878729598e-06, - "loss": 0.9248, - "step": 18703 - }, - { - "epoch": 0.48, - "learning_rate": 1.912938195969879e-06, - "loss": 1.0205, - "step": 18704 - }, - { - "epoch": 0.48, - "learning_rate": 1.9129269033678035e-06, - "loss": 0.9131, - "step": 18705 - }, - { - "epoch": 0.48, - "learning_rate": 1.9129156100667416e-06, - "loss": 1.0381, - "step": 18706 - }, - { - "epoch": 0.48, - "learning_rate": 1.912904316066702e-06, - "loss": 0.8838, - "step": 18707 - }, - { - "epoch": 0.48, - "learning_rate": 1.912893021367694e-06, - "loss": 0.8516, - "step": 18708 - }, - { - "epoch": 0.48, - "learning_rate": 1.9128817259697257e-06, - "loss": 0.8701, - "step": 18709 - }, - { - "epoch": 0.48, - "learning_rate": 1.9128704298728057e-06, - "loss": 0.875, - "step": 18710 - }, - { - "epoch": 0.48, - "learning_rate": 1.9128591330769426e-06, - "loss": 0.9062, - "step": 18711 - }, - { - "epoch": 0.48, - "learning_rate": 1.9128478355821455e-06, - "loss": 0.8271, - "step": 18712 - }, - { - "epoch": 0.48, - "learning_rate": 1.9128365373884226e-06, - "loss": 1.0703, - "step": 18713 - }, - { - "epoch": 0.48, - "learning_rate": 1.9128252384957828e-06, - "loss": 0.5413, - "step": 18714 - }, - { - "epoch": 0.48, - "learning_rate": 1.912813938904235e-06, - "loss": 1.0029, - "step": 18715 - }, - { - "epoch": 0.48, - "learning_rate": 1.9128026386137874e-06, - "loss": 0.8467, - "step": 18716 - }, - { - "epoch": 0.48, - "learning_rate": 1.9127913376244483e-06, - "loss": 0.7163, - "step": 18717 - }, - { - "epoch": 0.48, - "learning_rate": 1.9127800359362274e-06, - "loss": 0.915, - "step": 18718 - }, - { - "epoch": 0.48, - "learning_rate": 1.912768733549133e-06, - "loss": 0.7114, - "step": 18719 - }, - { - "epoch": 0.48, - "learning_rate": 1.9127574304631725e-06, - "loss": 0.8516, - "step": 18720 - }, - { - "epoch": 0.48, - "learning_rate": 1.9127461266783562e-06, - "loss": 0.7788, - "step": 18721 - }, - { - "epoch": 0.48, - "learning_rate": 1.9127348221946925e-06, - "loss": 0.8379, - "step": 18722 - }, - { - "epoch": 0.48, - "learning_rate": 1.9127235170121896e-06, - "loss": 1.0762, - "step": 18723 - }, - { - "epoch": 0.48, - "learning_rate": 1.912712211130856e-06, - "loss": 0.7607, - "step": 18724 - }, - { - "epoch": 0.48, - "learning_rate": 1.912700904550701e-06, - "loss": 0.8584, - "step": 18725 - }, - { - "epoch": 0.48, - "learning_rate": 1.912689597271732e-06, - "loss": 0.9453, - "step": 18726 - }, - { - "epoch": 0.48, - "learning_rate": 1.9126782892939596e-06, - "loss": 1.0312, - "step": 18727 - }, - { - "epoch": 0.48, - "learning_rate": 1.912666980617391e-06, - "loss": 0.8018, - "step": 18728 - }, - { - "epoch": 0.48, - "learning_rate": 1.912655671242035e-06, - "loss": 0.9707, - "step": 18729 - }, - { - "epoch": 0.48, - "learning_rate": 1.912644361167901e-06, - "loss": 0.7178, - "step": 18730 - }, - { - "epoch": 0.48, - "learning_rate": 1.912633050394997e-06, - "loss": 1.0156, - "step": 18731 - }, - { - "epoch": 0.48, - "learning_rate": 1.9126217389233315e-06, - "loss": 1.0029, - "step": 18732 - }, - { - "epoch": 0.48, - "learning_rate": 1.9126104267529136e-06, - "loss": 0.8115, - "step": 18733 - }, - { - "epoch": 0.48, - "learning_rate": 1.9125991138837524e-06, - "loss": 0.8867, - "step": 18734 - }, - { - "epoch": 0.48, - "learning_rate": 1.9125878003158555e-06, - "loss": 1.0439, - "step": 18735 - }, - { - "epoch": 0.48, - "learning_rate": 1.9125764860492323e-06, - "loss": 1.0547, - "step": 18736 - }, - { - "epoch": 0.48, - "learning_rate": 1.912565171083891e-06, - "loss": 0.957, - "step": 18737 - }, - { - "epoch": 0.48, - "learning_rate": 1.9125538554198405e-06, - "loss": 0.9844, - "step": 18738 - }, - { - "epoch": 0.48, - "learning_rate": 1.9125425390570898e-06, - "loss": 1.3428, - "step": 18739 - }, - { - "epoch": 0.48, - "learning_rate": 1.912531221995647e-06, - "loss": 0.9883, - "step": 18740 - }, - { - "epoch": 0.48, - "learning_rate": 1.912519904235521e-06, - "loss": 0.8223, - "step": 18741 - }, - { - "epoch": 0.48, - "learning_rate": 1.9125085857767208e-06, - "loss": 0.7373, - "step": 18742 - }, - { - "epoch": 0.48, - "learning_rate": 1.9124972666192543e-06, - "loss": 0.9092, - "step": 18743 - }, - { - "epoch": 0.48, - "learning_rate": 1.912485946763131e-06, - "loss": 0.7686, - "step": 18744 - }, - { - "epoch": 0.48, - "learning_rate": 1.912474626208359e-06, - "loss": 0.9746, - "step": 18745 - }, - { - "epoch": 0.48, - "learning_rate": 1.912463304954947e-06, - "loss": 0.8916, - "step": 18746 - }, - { - "epoch": 0.48, - "learning_rate": 1.912451983002904e-06, - "loss": 0.7417, - "step": 18747 - }, - { - "epoch": 0.48, - "learning_rate": 1.9124406603522384e-06, - "loss": 0.7856, - "step": 18748 - }, - { - "epoch": 0.48, - "learning_rate": 1.912429337002959e-06, - "loss": 0.7988, - "step": 18749 - }, - { - "epoch": 0.48, - "learning_rate": 1.912418012955074e-06, - "loss": 0.8496, - "step": 18750 - }, - { - "epoch": 0.48, - "learning_rate": 1.912406688208593e-06, - "loss": 0.7546, - "step": 18751 - }, - { - "epoch": 0.48, - "learning_rate": 1.912395362763524e-06, - "loss": 0.8789, - "step": 18752 - }, - { - "epoch": 0.48, - "learning_rate": 1.912384036619876e-06, - "loss": 0.9736, - "step": 18753 - }, - { - "epoch": 0.48, - "learning_rate": 1.912372709777657e-06, - "loss": 0.9551, - "step": 18754 - }, - { - "epoch": 0.48, - "learning_rate": 1.9123613822368766e-06, - "loss": 0.7705, - "step": 18755 - }, - { - "epoch": 0.48, - "learning_rate": 1.9123500539975427e-06, - "loss": 1.1191, - "step": 18756 - }, - { - "epoch": 0.48, - "learning_rate": 1.9123387250596642e-06, - "loss": 0.5759, - "step": 18757 - }, - { - "epoch": 0.48, - "learning_rate": 1.9123273954232503e-06, - "loss": 0.9072, - "step": 18758 - }, - { - "epoch": 0.48, - "learning_rate": 1.912316065088309e-06, - "loss": 0.8232, - "step": 18759 - }, - { - "epoch": 0.48, - "learning_rate": 1.9123047340548495e-06, - "loss": 1.1133, - "step": 18760 - }, - { - "epoch": 0.48, - "learning_rate": 1.9122934023228804e-06, - "loss": 1.0049, - "step": 18761 - }, - { - "epoch": 0.48, - "learning_rate": 1.9122820698924097e-06, - "loss": 0.9058, - "step": 18762 - }, - { - "epoch": 0.48, - "learning_rate": 1.912270736763447e-06, - "loss": 0.8516, - "step": 18763 - }, - { - "epoch": 0.48, - "learning_rate": 1.912259402936e-06, - "loss": 0.7358, - "step": 18764 - }, - { - "epoch": 0.48, - "learning_rate": 1.9122480684100783e-06, - "loss": 0.918, - "step": 18765 - }, - { - "epoch": 0.48, - "learning_rate": 1.91223673318569e-06, - "loss": 0.8389, - "step": 18766 - }, - { - "epoch": 0.48, - "learning_rate": 1.9122253972628443e-06, - "loss": 0.8081, - "step": 18767 - }, - { - "epoch": 0.48, - "learning_rate": 1.9122140606415494e-06, - "loss": 0.7456, - "step": 18768 - }, - { - "epoch": 0.48, - "learning_rate": 1.912202723321814e-06, - "loss": 0.9414, - "step": 18769 - }, - { - "epoch": 0.48, - "learning_rate": 1.912191385303647e-06, - "loss": 0.5496, - "step": 18770 - }, - { - "epoch": 0.48, - "learning_rate": 1.912180046587057e-06, - "loss": 1.1289, - "step": 18771 - }, - { - "epoch": 0.48, - "learning_rate": 1.912168707172053e-06, - "loss": 0.8789, - "step": 18772 - }, - { - "epoch": 0.48, - "learning_rate": 1.9121573670586428e-06, - "loss": 0.9727, - "step": 18773 - }, - { - "epoch": 0.48, - "learning_rate": 1.912146026246836e-06, - "loss": 0.8604, - "step": 18774 - }, - { - "epoch": 0.48, - "learning_rate": 1.9121346847366407e-06, - "loss": 0.9111, - "step": 18775 - }, - { - "epoch": 0.48, - "learning_rate": 1.9121233425280662e-06, - "loss": 0.9648, - "step": 18776 - }, - { - "epoch": 0.48, - "learning_rate": 1.9121119996211202e-06, - "loss": 0.6445, - "step": 18777 - }, - { - "epoch": 0.48, - "learning_rate": 1.9121006560158125e-06, - "loss": 0.8794, - "step": 18778 - }, - { - "epoch": 0.48, - "learning_rate": 1.912089311712151e-06, - "loss": 0.9561, - "step": 18779 - }, - { - "epoch": 0.48, - "learning_rate": 1.912077966710145e-06, - "loss": 0.9268, - "step": 18780 - }, - { - "epoch": 0.48, - "learning_rate": 1.9120666210098025e-06, - "loss": 0.8262, - "step": 18781 - }, - { - "epoch": 0.48, - "learning_rate": 1.9120552746111326e-06, - "loss": 0.877, - "step": 18782 - }, - { - "epoch": 0.48, - "learning_rate": 1.912043927514144e-06, - "loss": 0.7747, - "step": 18783 - }, - { - "epoch": 0.48, - "learning_rate": 1.9120325797188453e-06, - "loss": 0.8906, - "step": 18784 - }, - { - "epoch": 0.48, - "learning_rate": 1.9120212312252452e-06, - "loss": 0.9443, - "step": 18785 - }, - { - "epoch": 0.48, - "learning_rate": 1.912009882033352e-06, - "loss": 0.9272, - "step": 18786 - }, - { - "epoch": 0.48, - "learning_rate": 1.9119985321431755e-06, - "loss": 0.793, - "step": 18787 - }, - { - "epoch": 0.48, - "learning_rate": 1.911987181554723e-06, - "loss": 1.1172, - "step": 18788 - }, - { - "epoch": 0.48, - "learning_rate": 1.911975830268004e-06, - "loss": 0.7695, - "step": 18789 - }, - { - "epoch": 0.48, - "learning_rate": 1.911964478283027e-06, - "loss": 0.8145, - "step": 18790 - }, - { - "epoch": 0.48, - "learning_rate": 1.911953125599801e-06, - "loss": 1.0713, - "step": 18791 - }, - { - "epoch": 0.48, - "learning_rate": 1.9119417722183344e-06, - "loss": 0.5718, - "step": 18792 - }, - { - "epoch": 0.48, - "learning_rate": 1.9119304181386354e-06, - "loss": 0.8096, - "step": 18793 - }, - { - "epoch": 0.48, - "learning_rate": 1.911919063360714e-06, - "loss": 0.8774, - "step": 18794 - }, - { - "epoch": 0.48, - "learning_rate": 1.9119077078845776e-06, - "loss": 0.7681, - "step": 18795 - }, - { - "epoch": 0.48, - "learning_rate": 1.9118963517102357e-06, - "loss": 1.0273, - "step": 18796 - }, - { - "epoch": 0.48, - "learning_rate": 1.9118849948376964e-06, - "loss": 0.8535, - "step": 18797 - }, - { - "epoch": 0.48, - "learning_rate": 1.911873637266969e-06, - "loss": 1.0234, - "step": 18798 - }, - { - "epoch": 0.48, - "learning_rate": 1.9118622789980615e-06, - "loss": 1.0557, - "step": 18799 - }, - { - "epoch": 0.48, - "learning_rate": 1.9118509200309833e-06, - "loss": 0.9375, - "step": 18800 - }, - { - "epoch": 0.48, - "learning_rate": 1.911839560365742e-06, - "loss": 0.9307, - "step": 18801 - }, - { - "epoch": 0.48, - "learning_rate": 1.9118282000023483e-06, - "loss": 0.8008, - "step": 18802 - }, - { - "epoch": 0.48, - "learning_rate": 1.9118168389408088e-06, - "loss": 0.8057, - "step": 18803 - }, - { - "epoch": 0.48, - "learning_rate": 1.9118054771811333e-06, - "loss": 0.5098, - "step": 18804 - }, - { - "epoch": 0.48, - "learning_rate": 1.9117941147233307e-06, - "loss": 0.7627, - "step": 18805 - }, - { - "epoch": 0.48, - "learning_rate": 1.9117827515674086e-06, - "loss": 1.0361, - "step": 18806 - }, - { - "epoch": 0.48, - "learning_rate": 1.9117713877133768e-06, - "loss": 0.917, - "step": 18807 - }, - { - "epoch": 0.48, - "learning_rate": 1.9117600231612433e-06, - "loss": 0.9111, - "step": 18808 - }, - { - "epoch": 0.48, - "learning_rate": 1.9117486579110174e-06, - "loss": 0.7056, - "step": 18809 - }, - { - "epoch": 0.48, - "learning_rate": 1.9117372919627073e-06, - "loss": 0.9551, - "step": 18810 - }, - { - "epoch": 0.48, - "learning_rate": 1.9117259253163217e-06, - "loss": 0.9336, - "step": 18811 - }, - { - "epoch": 0.48, - "learning_rate": 1.91171455797187e-06, - "loss": 0.7031, - "step": 18812 - }, - { - "epoch": 0.48, - "learning_rate": 1.9117031899293598e-06, - "loss": 0.8386, - "step": 18813 - }, - { - "epoch": 0.48, - "learning_rate": 1.911691821188801e-06, - "loss": 0.8325, - "step": 18814 - }, - { - "epoch": 0.48, - "learning_rate": 1.911680451750201e-06, - "loss": 1.0732, - "step": 18815 - }, - { - "epoch": 0.48, - "learning_rate": 1.9116690816135693e-06, - "loss": 1.041, - "step": 18816 - }, - { - "epoch": 0.48, - "learning_rate": 1.911657710778915e-06, - "loss": 0.749, - "step": 18817 - }, - { - "epoch": 0.48, - "learning_rate": 1.9116463392462457e-06, - "loss": 0.8298, - "step": 18818 - }, - { - "epoch": 0.48, - "learning_rate": 1.9116349670155714e-06, - "loss": 0.7749, - "step": 18819 - }, - { - "epoch": 0.48, - "learning_rate": 1.9116235940868995e-06, - "loss": 0.7607, - "step": 18820 - }, - { - "epoch": 0.48, - "learning_rate": 1.91161222046024e-06, - "loss": 0.7573, - "step": 18821 - }, - { - "epoch": 0.48, - "learning_rate": 1.9116008461356e-06, - "loss": 0.9014, - "step": 18822 - }, - { - "epoch": 0.48, - "learning_rate": 1.91158947111299e-06, - "loss": 1.001, - "step": 18823 - }, - { - "epoch": 0.48, - "learning_rate": 1.9115780953924175e-06, - "loss": 0.9072, - "step": 18824 - }, - { - "epoch": 0.48, - "learning_rate": 1.9115667189738916e-06, - "loss": 0.9102, - "step": 18825 - }, - { - "epoch": 0.48, - "learning_rate": 1.911555341857421e-06, - "loss": 0.7891, - "step": 18826 - }, - { - "epoch": 0.48, - "learning_rate": 1.9115439640430145e-06, - "loss": 0.9365, - "step": 18827 - }, - { - "epoch": 0.48, - "learning_rate": 1.9115325855306807e-06, - "loss": 1.1006, - "step": 18828 - }, - { - "epoch": 0.48, - "learning_rate": 1.911521206320428e-06, - "loss": 0.916, - "step": 18829 - }, - { - "epoch": 0.48, - "learning_rate": 1.911509826412266e-06, - "loss": 0.9575, - "step": 18830 - }, - { - "epoch": 0.48, - "learning_rate": 1.911498445806202e-06, - "loss": 0.9932, - "step": 18831 - }, - { - "epoch": 0.48, - "learning_rate": 1.9114870645022464e-06, - "loss": 0.8877, - "step": 18832 - }, - { - "epoch": 0.48, - "learning_rate": 1.9114756825004067e-06, - "loss": 0.918, - "step": 18833 - }, - { - "epoch": 0.48, - "learning_rate": 1.911464299800692e-06, - "loss": 0.8291, - "step": 18834 - }, - { - "epoch": 0.48, - "learning_rate": 1.9114529164031107e-06, - "loss": 0.8564, - "step": 18835 - }, - { - "epoch": 0.48, - "learning_rate": 1.911441532307672e-06, - "loss": 0.7432, - "step": 18836 - }, - { - "epoch": 0.48, - "learning_rate": 1.9114301475143847e-06, - "loss": 0.9639, - "step": 18837 - }, - { - "epoch": 0.48, - "learning_rate": 1.911418762023257e-06, - "loss": 0.8867, - "step": 18838 - }, - { - "epoch": 0.48, - "learning_rate": 1.911407375834298e-06, - "loss": 0.834, - "step": 18839 - }, - { - "epoch": 0.48, - "learning_rate": 1.911395988947516e-06, - "loss": 0.8555, - "step": 18840 - }, - { - "epoch": 0.48, - "learning_rate": 1.91138460136292e-06, - "loss": 0.8242, - "step": 18841 - }, - { - "epoch": 0.48, - "learning_rate": 1.911373213080519e-06, - "loss": 1.0586, - "step": 18842 - }, - { - "epoch": 0.48, - "learning_rate": 1.9113618241003213e-06, - "loss": 0.8223, - "step": 18843 - }, - { - "epoch": 0.48, - "learning_rate": 1.9113504344223357e-06, - "loss": 0.9395, - "step": 18844 - }, - { - "epoch": 0.48, - "learning_rate": 1.9113390440465716e-06, - "loss": 0.8342, - "step": 18845 - }, - { - "epoch": 0.48, - "learning_rate": 1.9113276529730365e-06, - "loss": 0.8857, - "step": 18846 - }, - { - "epoch": 0.48, - "learning_rate": 1.9113162612017394e-06, - "loss": 0.9277, - "step": 18847 - }, - { - "epoch": 0.48, - "learning_rate": 1.91130486873269e-06, - "loss": 0.6919, - "step": 18848 - }, - { - "epoch": 0.48, - "learning_rate": 1.911293475565896e-06, - "loss": 0.7686, - "step": 18849 - }, - { - "epoch": 0.48, - "learning_rate": 1.911282081701367e-06, - "loss": 0.9395, - "step": 18850 - }, - { - "epoch": 0.48, - "learning_rate": 1.9112706871391106e-06, - "loss": 0.8633, - "step": 18851 - }, - { - "epoch": 0.48, - "learning_rate": 1.911259291879136e-06, - "loss": 0.9033, - "step": 18852 - }, - { - "epoch": 0.48, - "learning_rate": 1.9112478959214526e-06, - "loss": 0.9531, - "step": 18853 - }, - { - "epoch": 0.48, - "learning_rate": 1.9112364992660687e-06, - "loss": 0.6416, - "step": 18854 - }, - { - "epoch": 0.48, - "learning_rate": 1.911225101912992e-06, - "loss": 0.9668, - "step": 18855 - }, - { - "epoch": 0.48, - "learning_rate": 1.911213703862233e-06, - "loss": 0.9297, - "step": 18856 - }, - { - "epoch": 0.48, - "learning_rate": 1.9112023051137995e-06, - "loss": 0.7705, - "step": 18857 - }, - { - "epoch": 0.48, - "learning_rate": 1.9111909056677e-06, - "loss": 0.8413, - "step": 18858 - }, - { - "epoch": 0.48, - "learning_rate": 1.9111795055239438e-06, - "loss": 0.8711, - "step": 18859 - }, - { - "epoch": 0.48, - "learning_rate": 1.911168104682539e-06, - "loss": 0.9141, - "step": 18860 - }, - { - "epoch": 0.48, - "learning_rate": 1.9111567031434948e-06, - "loss": 0.8164, - "step": 18861 - }, - { - "epoch": 0.48, - "learning_rate": 1.9111453009068197e-06, - "loss": 1.0781, - "step": 18862 - }, - { - "epoch": 0.48, - "learning_rate": 1.911133897972523e-06, - "loss": 0.918, - "step": 18863 - }, - { - "epoch": 0.48, - "learning_rate": 1.9111224943406126e-06, - "loss": 0.7939, - "step": 18864 - }, - { - "epoch": 0.48, - "learning_rate": 1.9111110900110974e-06, - "loss": 1.0547, - "step": 18865 - }, - { - "epoch": 0.48, - "learning_rate": 1.9110996849839867e-06, - "loss": 1.0264, - "step": 18866 - }, - { - "epoch": 0.48, - "learning_rate": 1.911088279259289e-06, - "loss": 0.8594, - "step": 18867 - }, - { - "epoch": 0.48, - "learning_rate": 1.9110768728370123e-06, - "loss": 0.7861, - "step": 18868 - }, - { - "epoch": 0.48, - "learning_rate": 1.9110654657171665e-06, - "loss": 0.9336, - "step": 18869 - }, - { - "epoch": 0.48, - "learning_rate": 1.91105405789976e-06, - "loss": 0.9473, - "step": 18870 - }, - { - "epoch": 0.48, - "learning_rate": 1.9110426493848003e-06, - "loss": 0.9189, - "step": 18871 - }, - { - "epoch": 0.48, - "learning_rate": 1.9110312401722978e-06, - "loss": 1.0234, - "step": 18872 - }, - { - "epoch": 0.48, - "learning_rate": 1.91101983026226e-06, - "loss": 1.0791, - "step": 18873 - }, - { - "epoch": 0.48, - "learning_rate": 1.911008419654697e-06, - "loss": 0.9053, - "step": 18874 - }, - { - "epoch": 0.48, - "learning_rate": 1.9109970083496164e-06, - "loss": 0.9229, - "step": 18875 - }, - { - "epoch": 0.48, - "learning_rate": 1.9109855963470275e-06, - "loss": 0.8223, - "step": 18876 - }, - { - "epoch": 0.48, - "learning_rate": 1.9109741836469384e-06, - "loss": 0.7705, - "step": 18877 - }, - { - "epoch": 0.48, - "learning_rate": 1.9109627702493583e-06, - "loss": 0.6611, - "step": 18878 - }, - { - "epoch": 0.48, - "learning_rate": 1.910951356154296e-06, - "loss": 0.6152, - "step": 18879 - }, - { - "epoch": 0.48, - "learning_rate": 1.9109399413617603e-06, - "loss": 0.8491, - "step": 18880 - }, - { - "epoch": 0.48, - "learning_rate": 1.9109285258717598e-06, - "loss": 0.999, - "step": 18881 - }, - { - "epoch": 0.48, - "learning_rate": 1.910917109684303e-06, - "loss": 0.8662, - "step": 18882 - }, - { - "epoch": 0.48, - "learning_rate": 1.910905692799399e-06, - "loss": 0.9033, - "step": 18883 - }, - { - "epoch": 0.48, - "learning_rate": 1.9108942752170563e-06, - "loss": 0.834, - "step": 18884 - }, - { - "epoch": 0.48, - "learning_rate": 1.9108828569372837e-06, - "loss": 0.9609, - "step": 18885 - }, - { - "epoch": 0.48, - "learning_rate": 1.91087143796009e-06, - "loss": 0.9131, - "step": 18886 - }, - { - "epoch": 0.48, - "learning_rate": 1.910860018285484e-06, - "loss": 0.9111, - "step": 18887 - }, - { - "epoch": 0.48, - "learning_rate": 1.910848597913474e-06, - "loss": 0.7954, - "step": 18888 - }, - { - "epoch": 0.48, - "learning_rate": 1.9108371768440698e-06, - "loss": 0.8018, - "step": 18889 - }, - { - "epoch": 0.48, - "learning_rate": 1.910825755077279e-06, - "loss": 0.9082, - "step": 18890 - }, - { - "epoch": 0.48, - "learning_rate": 1.910814332613111e-06, - "loss": 0.8584, - "step": 18891 - }, - { - "epoch": 0.48, - "learning_rate": 1.9108029094515743e-06, - "loss": 0.8643, - "step": 18892 - }, - { - "epoch": 0.48, - "learning_rate": 1.9107914855926778e-06, - "loss": 0.863, - "step": 18893 - }, - { - "epoch": 0.48, - "learning_rate": 1.9107800610364296e-06, - "loss": 0.8296, - "step": 18894 - }, - { - "epoch": 0.48, - "learning_rate": 1.9107686357828395e-06, - "loss": 0.7471, - "step": 18895 - }, - { - "epoch": 0.48, - "learning_rate": 1.9107572098319156e-06, - "loss": 0.7612, - "step": 18896 - }, - { - "epoch": 0.48, - "learning_rate": 1.9107457831836667e-06, - "loss": 0.7012, - "step": 18897 - }, - { - "epoch": 0.48, - "learning_rate": 1.910734355838102e-06, - "loss": 0.8174, - "step": 18898 - }, - { - "epoch": 0.48, - "learning_rate": 1.9107229277952293e-06, - "loss": 0.8525, - "step": 18899 - }, - { - "epoch": 0.48, - "learning_rate": 1.910711499055058e-06, - "loss": 0.7773, - "step": 18900 - }, - { - "epoch": 0.48, - "learning_rate": 1.910700069617597e-06, - "loss": 0.8755, - "step": 18901 - }, - { - "epoch": 0.48, - "learning_rate": 1.910688639482855e-06, - "loss": 0.9238, - "step": 18902 - }, - { - "epoch": 0.48, - "learning_rate": 1.9106772086508403e-06, - "loss": 0.9307, - "step": 18903 - }, - { - "epoch": 0.48, - "learning_rate": 1.9106657771215624e-06, - "loss": 0.7627, - "step": 18904 - }, - { - "epoch": 0.48, - "learning_rate": 1.910654344895029e-06, - "loss": 0.8831, - "step": 18905 - }, - { - "epoch": 0.48, - "learning_rate": 1.9106429119712498e-06, - "loss": 0.9766, - "step": 18906 - }, - { - "epoch": 0.48, - "learning_rate": 1.910631478350233e-06, - "loss": 0.9238, - "step": 18907 - }, - { - "epoch": 0.48, - "learning_rate": 1.9106200440319876e-06, - "loss": 0.8252, - "step": 18908 - }, - { - "epoch": 0.48, - "learning_rate": 1.9106086090165224e-06, - "loss": 0.916, - "step": 18909 - }, - { - "epoch": 0.48, - "learning_rate": 1.910597173303846e-06, - "loss": 0.7441, - "step": 18910 - }, - { - "epoch": 0.48, - "learning_rate": 1.910585736893967e-06, - "loss": 0.7578, - "step": 18911 - }, - { - "epoch": 0.48, - "learning_rate": 1.9105742997868945e-06, - "loss": 0.582, - "step": 18912 - }, - { - "epoch": 0.48, - "learning_rate": 1.9105628619826372e-06, - "loss": 1.0342, - "step": 18913 - }, - { - "epoch": 0.48, - "learning_rate": 1.9105514234812037e-06, - "loss": 1.0234, - "step": 18914 - }, - { - "epoch": 0.48, - "learning_rate": 1.910539984282603e-06, - "loss": 1.1836, - "step": 18915 - }, - { - "epoch": 0.48, - "learning_rate": 1.9105285443868437e-06, - "loss": 1.0732, - "step": 18916 - }, - { - "epoch": 0.48, - "learning_rate": 1.9105171037939346e-06, - "loss": 1.0557, - "step": 18917 - }, - { - "epoch": 0.48, - "learning_rate": 1.9105056625038844e-06, - "loss": 0.7793, - "step": 18918 - }, - { - "epoch": 0.48, - "learning_rate": 1.9104942205167015e-06, - "loss": 0.8369, - "step": 18919 - }, - { - "epoch": 0.48, - "learning_rate": 1.9104827778323952e-06, - "loss": 0.9844, - "step": 18920 - }, - { - "epoch": 0.48, - "learning_rate": 1.9104713344509745e-06, - "loss": 1.0293, - "step": 18921 - }, - { - "epoch": 0.48, - "learning_rate": 1.9104598903724473e-06, - "loss": 0.8066, - "step": 18922 - }, - { - "epoch": 0.49, - "learning_rate": 1.910448445596823e-06, - "loss": 1.0068, - "step": 18923 - }, - { - "epoch": 0.49, - "learning_rate": 1.91043700012411e-06, - "loss": 0.9214, - "step": 18924 - }, - { - "epoch": 0.49, - "learning_rate": 1.910425553954318e-06, - "loss": 0.5898, - "step": 18925 - }, - { - "epoch": 0.49, - "learning_rate": 1.910414107087454e-06, - "loss": 0.9375, - "step": 18926 - }, - { - "epoch": 0.49, - "learning_rate": 1.9104026595235286e-06, - "loss": 0.9639, - "step": 18927 - }, - { - "epoch": 0.49, - "learning_rate": 1.9103912112625492e-06, - "loss": 0.6084, - "step": 18928 - }, - { - "epoch": 0.49, - "learning_rate": 1.9103797623045253e-06, - "loss": 0.9365, - "step": 18929 - }, - { - "epoch": 0.49, - "learning_rate": 1.9103683126494657e-06, - "loss": 0.8877, - "step": 18930 - }, - { - "epoch": 0.49, - "learning_rate": 1.9103568622973784e-06, - "loss": 0.7109, - "step": 18931 - }, - { - "epoch": 0.49, - "learning_rate": 1.9103454112482732e-06, - "loss": 0.666, - "step": 18932 - }, - { - "epoch": 0.49, - "learning_rate": 1.910333959502158e-06, - "loss": 0.8096, - "step": 18933 - }, - { - "epoch": 0.49, - "learning_rate": 1.9103225070590426e-06, - "loss": 0.8379, - "step": 18934 - }, - { - "epoch": 0.49, - "learning_rate": 1.9103110539189345e-06, - "loss": 0.7578, - "step": 18935 - }, - { - "epoch": 0.49, - "learning_rate": 1.9102996000818433e-06, - "loss": 0.8301, - "step": 18936 - }, - { - "epoch": 0.49, - "learning_rate": 1.9102881455477773e-06, - "loss": 0.7485, - "step": 18937 - }, - { - "epoch": 0.49, - "learning_rate": 1.910276690316746e-06, - "loss": 0.8789, - "step": 18938 - }, - { - "epoch": 0.49, - "learning_rate": 1.9102652343887572e-06, - "loss": 0.9326, - "step": 18939 - }, - { - "epoch": 0.49, - "learning_rate": 1.9102537777638205e-06, - "loss": 1.0068, - "step": 18940 - }, - { - "epoch": 0.49, - "learning_rate": 1.9102423204419442e-06, - "loss": 1.0615, - "step": 18941 - }, - { - "epoch": 0.49, - "learning_rate": 1.9102308624231373e-06, - "loss": 0.7554, - "step": 18942 - }, - { - "epoch": 0.49, - "learning_rate": 1.9102194037074086e-06, - "loss": 0.7153, - "step": 18943 - }, - { - "epoch": 0.49, - "learning_rate": 1.9102079442947666e-06, - "loss": 0.8188, - "step": 18944 - }, - { - "epoch": 0.49, - "learning_rate": 1.9101964841852197e-06, - "loss": 0.8516, - "step": 18945 - }, - { - "epoch": 0.49, - "learning_rate": 1.910185023378778e-06, - "loss": 0.6978, - "step": 18946 - }, - { - "epoch": 0.49, - "learning_rate": 1.9101735618754493e-06, - "loss": 0.8682, - "step": 18947 - }, - { - "epoch": 0.49, - "learning_rate": 1.910162099675242e-06, - "loss": 0.9834, - "step": 18948 - }, - { - "epoch": 0.49, - "learning_rate": 1.9101506367781662e-06, - "loss": 0.7412, - "step": 18949 - }, - { - "epoch": 0.49, - "learning_rate": 1.9101391731842295e-06, - "loss": 0.7363, - "step": 18950 - }, - { - "epoch": 0.49, - "learning_rate": 1.9101277088934413e-06, - "loss": 0.9023, - "step": 18951 - }, - { - "epoch": 0.49, - "learning_rate": 1.91011624390581e-06, - "loss": 0.873, - "step": 18952 - }, - { - "epoch": 0.49, - "learning_rate": 1.9101047782213444e-06, - "loss": 0.9541, - "step": 18953 - }, - { - "epoch": 0.49, - "learning_rate": 1.910093311840054e-06, - "loss": 0.7651, - "step": 18954 - }, - { - "epoch": 0.49, - "learning_rate": 1.9100818447619463e-06, - "loss": 0.7061, - "step": 18955 - }, - { - "epoch": 0.49, - "learning_rate": 1.910070376987031e-06, - "loss": 0.9092, - "step": 18956 - }, - { - "epoch": 0.49, - "learning_rate": 1.910058908515317e-06, - "loss": 0.6379, - "step": 18957 - }, - { - "epoch": 0.49, - "learning_rate": 1.9100474393468123e-06, - "loss": 0.7197, - "step": 18958 - }, - { - "epoch": 0.49, - "learning_rate": 1.9100359694815262e-06, - "loss": 0.8945, - "step": 18959 - }, - { - "epoch": 0.49, - "learning_rate": 1.9100244989194675e-06, - "loss": 0.8018, - "step": 18960 - }, - { - "epoch": 0.49, - "learning_rate": 1.910013027660645e-06, - "loss": 0.958, - "step": 18961 - }, - { - "epoch": 0.49, - "learning_rate": 1.910001555705067e-06, - "loss": 0.8154, - "step": 18962 - }, - { - "epoch": 0.49, - "learning_rate": 1.909990083052743e-06, - "loss": 0.8701, - "step": 18963 - }, - { - "epoch": 0.49, - "learning_rate": 1.9099786097036812e-06, - "loss": 0.7734, - "step": 18964 - }, - { - "epoch": 0.49, - "learning_rate": 1.909967135657891e-06, - "loss": 1.0186, - "step": 18965 - }, - { - "epoch": 0.49, - "learning_rate": 1.9099556609153805e-06, - "loss": 0.9482, - "step": 18966 - }, - { - "epoch": 0.49, - "learning_rate": 1.909944185476159e-06, - "loss": 0.79, - "step": 18967 - }, - { - "epoch": 0.49, - "learning_rate": 1.909932709340235e-06, - "loss": 1.1006, - "step": 18968 - }, - { - "epoch": 0.49, - "learning_rate": 1.909921232507617e-06, - "loss": 0.8184, - "step": 18969 - }, - { - "epoch": 0.49, - "learning_rate": 1.9099097549783143e-06, - "loss": 0.8184, - "step": 18970 - }, - { - "epoch": 0.49, - "learning_rate": 1.9098982767523357e-06, - "loss": 0.9551, - "step": 18971 - }, - { - "epoch": 0.49, - "learning_rate": 1.90988679782969e-06, - "loss": 0.5981, - "step": 18972 - }, - { - "epoch": 0.49, - "learning_rate": 1.9098753182103854e-06, - "loss": 0.7539, - "step": 18973 - }, - { - "epoch": 0.49, - "learning_rate": 1.9098638378944318e-06, - "loss": 0.6606, - "step": 18974 - }, - { - "epoch": 0.49, - "learning_rate": 1.9098523568818364e-06, - "loss": 0.7139, - "step": 18975 - }, - { - "epoch": 0.49, - "learning_rate": 1.9098408751726093e-06, - "loss": 1.0352, - "step": 18976 - }, - { - "epoch": 0.49, - "learning_rate": 1.909829392766759e-06, - "loss": 0.9658, - "step": 18977 - }, - { - "epoch": 0.49, - "learning_rate": 1.909817909664294e-06, - "loss": 0.8691, - "step": 18978 - }, - { - "epoch": 0.49, - "learning_rate": 1.9098064258652236e-06, - "loss": 0.7505, - "step": 18979 - }, - { - "epoch": 0.49, - "learning_rate": 1.909794941369556e-06, - "loss": 1.0, - "step": 18980 - }, - { - "epoch": 0.49, - "learning_rate": 1.9097834561772997e-06, - "loss": 0.9727, - "step": 18981 - }, - { - "epoch": 0.49, - "learning_rate": 1.9097719702884648e-06, - "loss": 1.0352, - "step": 18982 - }, - { - "epoch": 0.49, - "learning_rate": 1.909760483703059e-06, - "loss": 0.5967, - "step": 18983 - }, - { - "epoch": 0.49, - "learning_rate": 1.909748996421092e-06, - "loss": 0.6865, - "step": 18984 - }, - { - "epoch": 0.49, - "learning_rate": 1.909737508442571e-06, - "loss": 0.8809, - "step": 18985 - }, - { - "epoch": 0.49, - "learning_rate": 1.909726019767507e-06, - "loss": 0.6765, - "step": 18986 - }, - { - "epoch": 0.49, - "learning_rate": 1.9097145303959067e-06, - "loss": 0.8291, - "step": 18987 - }, - { - "epoch": 0.49, - "learning_rate": 1.90970304032778e-06, - "loss": 0.9756, - "step": 18988 - }, - { - "epoch": 0.49, - "learning_rate": 1.9096915495631357e-06, - "loss": 0.7417, - "step": 18989 - }, - { - "epoch": 0.49, - "learning_rate": 1.909680058101982e-06, - "loss": 0.8438, - "step": 18990 - }, - { - "epoch": 0.49, - "learning_rate": 1.9096685659443286e-06, - "loss": 0.8877, - "step": 18991 - }, - { - "epoch": 0.49, - "learning_rate": 1.9096570730901837e-06, - "loss": 0.7832, - "step": 18992 - }, - { - "epoch": 0.49, - "learning_rate": 1.909645579539556e-06, - "loss": 1.0156, - "step": 18993 - }, - { - "epoch": 0.49, - "learning_rate": 1.909634085292455e-06, - "loss": 0.7305, - "step": 18994 - }, - { - "epoch": 0.49, - "learning_rate": 1.9096225903488885e-06, - "loss": 0.8945, - "step": 18995 - }, - { - "epoch": 0.49, - "learning_rate": 1.909611094708866e-06, - "loss": 0.6953, - "step": 18996 - }, - { - "epoch": 0.49, - "learning_rate": 1.909599598372396e-06, - "loss": 0.624, - "step": 18997 - }, - { - "epoch": 0.49, - "learning_rate": 1.9095881013394872e-06, - "loss": 0.9453, - "step": 18998 - }, - { - "epoch": 0.49, - "learning_rate": 1.909576603610149e-06, - "loss": 1.0283, - "step": 18999 - }, - { - "epoch": 0.49, - "learning_rate": 1.9095651051843896e-06, - "loss": 0.8208, - "step": 19000 - }, - { - "epoch": 0.49, - "learning_rate": 1.9095536060622183e-06, - "loss": 0.96, - "step": 19001 - }, - { - "epoch": 0.49, - "learning_rate": 1.9095421062436437e-06, - "loss": 0.9697, - "step": 19002 - }, - { - "epoch": 0.49, - "learning_rate": 1.909530605728674e-06, - "loss": 0.917, - "step": 19003 - }, - { - "epoch": 0.49, - "learning_rate": 1.909519104517319e-06, - "loss": 0.7065, - "step": 19004 - }, - { - "epoch": 0.49, - "learning_rate": 1.9095076026095867e-06, - "loss": 0.9336, - "step": 19005 - }, - { - "epoch": 0.49, - "learning_rate": 1.9094961000054866e-06, - "loss": 1.0146, - "step": 19006 - }, - { - "epoch": 0.49, - "learning_rate": 1.909484596705027e-06, - "loss": 0.8516, - "step": 19007 - }, - { - "epoch": 0.49, - "learning_rate": 1.909473092708217e-06, - "loss": 0.9307, - "step": 19008 - }, - { - "epoch": 0.49, - "learning_rate": 1.909461588015065e-06, - "loss": 1.0415, - "step": 19009 - }, - { - "epoch": 0.49, - "learning_rate": 1.90945008262558e-06, - "loss": 0.9707, - "step": 19010 - }, - { - "epoch": 0.49, - "learning_rate": 1.909438576539771e-06, - "loss": 0.6504, - "step": 19011 - }, - { - "epoch": 0.49, - "learning_rate": 1.909427069757647e-06, - "loss": 0.5615, - "step": 19012 - }, - { - "epoch": 0.49, - "learning_rate": 1.909415562279216e-06, - "loss": 0.6519, - "step": 19013 - }, - { - "epoch": 0.49, - "learning_rate": 1.909404054104488e-06, - "loss": 1.1152, - "step": 19014 - }, - { - "epoch": 0.49, - "learning_rate": 1.909392545233471e-06, - "loss": 0.7817, - "step": 19015 - }, - { - "epoch": 0.49, - "learning_rate": 1.9093810356661734e-06, - "loss": 0.9785, - "step": 19016 - }, - { - "epoch": 0.49, - "learning_rate": 1.9093695254026047e-06, - "loss": 0.9463, - "step": 19017 - }, - { - "epoch": 0.49, - "learning_rate": 1.9093580144427736e-06, - "loss": 0.5476, - "step": 19018 - }, - { - "epoch": 0.49, - "learning_rate": 1.909346502786689e-06, - "loss": 0.8438, - "step": 19019 - }, - { - "epoch": 0.49, - "learning_rate": 1.9093349904343595e-06, - "loss": 0.8506, - "step": 19020 - }, - { - "epoch": 0.49, - "learning_rate": 1.9093234773857943e-06, - "loss": 0.8564, - "step": 19021 - }, - { - "epoch": 0.49, - "learning_rate": 1.909311963641002e-06, - "loss": 0.9023, - "step": 19022 - }, - { - "epoch": 0.49, - "learning_rate": 1.9093004491999907e-06, - "loss": 0.6699, - "step": 19023 - }, - { - "epoch": 0.49, - "learning_rate": 1.90928893406277e-06, - "loss": 0.9971, - "step": 19024 - }, - { - "epoch": 0.49, - "learning_rate": 1.909277418229349e-06, - "loss": 0.7578, - "step": 19025 - }, - { - "epoch": 0.49, - "learning_rate": 1.909265901699736e-06, - "loss": 0.9434, - "step": 19026 - }, - { - "epoch": 0.49, - "learning_rate": 1.9092543844739397e-06, - "loss": 0.8232, - "step": 19027 - }, - { - "epoch": 0.49, - "learning_rate": 1.909242866551969e-06, - "loss": 0.876, - "step": 19028 - }, - { - "epoch": 0.49, - "learning_rate": 1.9092313479338333e-06, - "loss": 0.8438, - "step": 19029 - }, - { - "epoch": 0.49, - "learning_rate": 1.909219828619541e-06, - "loss": 0.875, - "step": 19030 - }, - { - "epoch": 0.49, - "learning_rate": 1.9092083086091005e-06, - "loss": 0.9102, - "step": 19031 - }, - { - "epoch": 0.49, - "learning_rate": 1.909196787902521e-06, - "loss": 0.8169, - "step": 19032 - }, - { - "epoch": 0.49, - "learning_rate": 1.9091852664998113e-06, - "loss": 0.7197, - "step": 19033 - }, - { - "epoch": 0.49, - "learning_rate": 1.9091737444009807e-06, - "loss": 0.7241, - "step": 19034 - }, - { - "epoch": 0.49, - "learning_rate": 1.909162221606037e-06, - "loss": 0.8467, - "step": 19035 - }, - { - "epoch": 0.49, - "learning_rate": 1.90915069811499e-06, - "loss": 0.8247, - "step": 19036 - }, - { - "epoch": 0.49, - "learning_rate": 1.9091391739278477e-06, - "loss": 1.0205, - "step": 19037 - }, - { - "epoch": 0.49, - "learning_rate": 1.90912764904462e-06, - "loss": 0.9297, - "step": 19038 - }, - { - "epoch": 0.49, - "learning_rate": 1.9091161234653144e-06, - "loss": 0.999, - "step": 19039 - }, - { - "epoch": 0.49, - "learning_rate": 1.9091045971899405e-06, - "loss": 0.6704, - "step": 19040 - }, - { - "epoch": 0.49, - "learning_rate": 1.909093070218507e-06, - "loss": 0.6658, - "step": 19041 - }, - { - "epoch": 0.49, - "learning_rate": 1.909081542551023e-06, - "loss": 0.8213, - "step": 19042 - }, - { - "epoch": 0.49, - "learning_rate": 1.909070014187497e-06, - "loss": 0.8008, - "step": 19043 - }, - { - "epoch": 0.49, - "learning_rate": 1.909058485127938e-06, - "loss": 1.1797, - "step": 19044 - }, - { - "epoch": 0.49, - "learning_rate": 1.9090469553723544e-06, - "loss": 0.8467, - "step": 19045 - }, - { - "epoch": 0.49, - "learning_rate": 1.9090354249207558e-06, - "loss": 0.793, - "step": 19046 - }, - { - "epoch": 0.49, - "learning_rate": 1.90902389377315e-06, - "loss": 0.7646, - "step": 19047 - }, - { - "epoch": 0.49, - "learning_rate": 1.9090123619295468e-06, - "loss": 0.9424, - "step": 19048 - }, - { - "epoch": 0.49, - "learning_rate": 1.9090008293899547e-06, - "loss": 0.9863, - "step": 19049 - }, - { - "epoch": 0.49, - "learning_rate": 1.9089892961543823e-06, - "loss": 0.916, - "step": 19050 - }, - { - "epoch": 0.49, - "learning_rate": 1.9089777622228386e-06, - "loss": 0.7183, - "step": 19051 - }, - { - "epoch": 0.49, - "learning_rate": 1.9089662275953323e-06, - "loss": 0.9316, - "step": 19052 - }, - { - "epoch": 0.49, - "learning_rate": 1.9089546922718724e-06, - "loss": 1.0205, - "step": 19053 - }, - { - "epoch": 0.49, - "learning_rate": 1.908943156252468e-06, - "loss": 0.9893, - "step": 19054 - }, - { - "epoch": 0.49, - "learning_rate": 1.9089316195371274e-06, - "loss": 0.7266, - "step": 19055 - }, - { - "epoch": 0.49, - "learning_rate": 1.9089200821258596e-06, - "loss": 0.7456, - "step": 19056 - }, - { - "epoch": 0.49, - "learning_rate": 1.9089085440186734e-06, - "loss": 0.8389, - "step": 19057 - }, - { - "epoch": 0.49, - "learning_rate": 1.9088970052155776e-06, - "loss": 0.8828, - "step": 19058 - }, - { - "epoch": 0.49, - "learning_rate": 1.9088854657165816e-06, - "loss": 0.9014, - "step": 19059 - }, - { - "epoch": 0.49, - "learning_rate": 1.9088739255216933e-06, - "loss": 0.6753, - "step": 19060 - }, - { - "epoch": 0.49, - "learning_rate": 1.9088623846309226e-06, - "loss": 0.9131, - "step": 19061 - }, - { - "epoch": 0.49, - "learning_rate": 1.9088508430442775e-06, - "loss": 0.5737, - "step": 19062 - }, - { - "epoch": 0.49, - "learning_rate": 1.908839300761767e-06, - "loss": 0.8887, - "step": 19063 - }, - { - "epoch": 0.49, - "learning_rate": 1.9088277577834e-06, - "loss": 1.0283, - "step": 19064 - }, - { - "epoch": 0.49, - "learning_rate": 1.9088162141091855e-06, - "loss": 0.9473, - "step": 19065 - }, - { - "epoch": 0.49, - "learning_rate": 1.908804669739132e-06, - "loss": 0.8604, - "step": 19066 - }, - { - "epoch": 0.49, - "learning_rate": 1.9087931246732488e-06, - "loss": 0.7219, - "step": 19067 - }, - { - "epoch": 0.49, - "learning_rate": 1.9087815789115444e-06, - "loss": 0.9248, - "step": 19068 - }, - { - "epoch": 0.49, - "learning_rate": 1.908770032454028e-06, - "loss": 1.0869, - "step": 19069 - }, - { - "epoch": 0.49, - "learning_rate": 1.9087584853007076e-06, - "loss": 0.7002, - "step": 19070 - }, - { - "epoch": 0.49, - "learning_rate": 1.908746937451593e-06, - "loss": 0.8389, - "step": 19071 - }, - { - "epoch": 0.49, - "learning_rate": 1.9087353889066925e-06, - "loss": 0.8369, - "step": 19072 - }, - { - "epoch": 0.49, - "learning_rate": 1.9087238396660155e-06, - "loss": 0.8691, - "step": 19073 - }, - { - "epoch": 0.49, - "learning_rate": 1.90871228972957e-06, - "loss": 0.7314, - "step": 19074 - }, - { - "epoch": 0.49, - "learning_rate": 1.9087007390973655e-06, - "loss": 0.9814, - "step": 19075 - }, - { - "epoch": 0.49, - "learning_rate": 1.9086891877694103e-06, - "loss": 0.6797, - "step": 19076 - }, - { - "epoch": 0.49, - "learning_rate": 1.908677635745714e-06, - "loss": 0.9326, - "step": 19077 - }, - { - "epoch": 0.49, - "learning_rate": 1.908666083026285e-06, - "loss": 0.9531, - "step": 19078 - }, - { - "epoch": 0.49, - "learning_rate": 1.908654529611132e-06, - "loss": 0.9927, - "step": 19079 - }, - { - "epoch": 0.49, - "learning_rate": 1.908642975500264e-06, - "loss": 0.8672, - "step": 19080 - }, - { - "epoch": 0.49, - "learning_rate": 1.9086314206936898e-06, - "loss": 1.041, - "step": 19081 - }, - { - "epoch": 0.49, - "learning_rate": 1.908619865191418e-06, - "loss": 0.6426, - "step": 19082 - }, - { - "epoch": 0.49, - "learning_rate": 1.9086083089934586e-06, - "loss": 0.7861, - "step": 19083 - }, - { - "epoch": 0.49, - "learning_rate": 1.908596752099819e-06, - "loss": 0.9629, - "step": 19084 - }, - { - "epoch": 0.49, - "learning_rate": 1.9085851945105086e-06, - "loss": 0.918, - "step": 19085 - }, - { - "epoch": 0.49, - "learning_rate": 1.908573636225537e-06, - "loss": 1.0469, - "step": 19086 - }, - { - "epoch": 0.49, - "learning_rate": 1.9085620772449113e-06, - "loss": 0.8818, - "step": 19087 - }, - { - "epoch": 0.49, - "learning_rate": 1.908550517568642e-06, - "loss": 1.1279, - "step": 19088 - }, - { - "epoch": 0.49, - "learning_rate": 1.908538957196737e-06, - "loss": 0.8711, - "step": 19089 - }, - { - "epoch": 0.49, - "learning_rate": 1.908527396129206e-06, - "loss": 0.8838, - "step": 19090 - }, - { - "epoch": 0.49, - "learning_rate": 1.908515834366057e-06, - "loss": 0.8965, - "step": 19091 - }, - { - "epoch": 0.49, - "learning_rate": 1.9085042719072993e-06, - "loss": 0.7944, - "step": 19092 - }, - { - "epoch": 0.49, - "learning_rate": 1.9084927087529414e-06, - "loss": 0.5669, - "step": 19093 - }, - { - "epoch": 0.49, - "learning_rate": 1.908481144902993e-06, - "loss": 0.832, - "step": 19094 - }, - { - "epoch": 0.49, - "learning_rate": 1.9084695803574617e-06, - "loss": 0.999, - "step": 19095 - }, - { - "epoch": 0.49, - "learning_rate": 1.908458015116357e-06, - "loss": 0.9639, - "step": 19096 - }, - { - "epoch": 0.49, - "learning_rate": 1.9084464491796884e-06, - "loss": 0.8394, - "step": 19097 - }, - { - "epoch": 0.49, - "learning_rate": 1.9084348825474636e-06, - "loss": 0.8545, - "step": 19098 - }, - { - "epoch": 0.49, - "learning_rate": 1.9084233152196926e-06, - "loss": 0.8584, - "step": 19099 - }, - { - "epoch": 0.49, - "learning_rate": 1.908411747196383e-06, - "loss": 0.8406, - "step": 19100 - }, - { - "epoch": 0.49, - "learning_rate": 1.9084001784775447e-06, - "loss": 0.9854, - "step": 19101 - }, - { - "epoch": 0.49, - "learning_rate": 1.9083886090631856e-06, - "loss": 0.959, - "step": 19102 - }, - { - "epoch": 0.49, - "learning_rate": 1.908377038953316e-06, - "loss": 0.9072, - "step": 19103 - }, - { - "epoch": 0.49, - "learning_rate": 1.908365468147943e-06, - "loss": 0.9971, - "step": 19104 - }, - { - "epoch": 0.49, - "learning_rate": 1.9083538966470767e-06, - "loss": 0.9219, - "step": 19105 - }, - { - "epoch": 0.49, - "learning_rate": 1.9083423244507255e-06, - "loss": 0.8867, - "step": 19106 - }, - { - "epoch": 0.49, - "learning_rate": 1.9083307515588985e-06, - "loss": 0.8652, - "step": 19107 - }, - { - "epoch": 0.49, - "learning_rate": 1.9083191779716044e-06, - "loss": 0.8516, - "step": 19108 - }, - { - "epoch": 0.49, - "learning_rate": 1.908307603688852e-06, - "loss": 0.7354, - "step": 19109 - }, - { - "epoch": 0.49, - "learning_rate": 1.90829602871065e-06, - "loss": 0.8779, - "step": 19110 - }, - { - "epoch": 0.49, - "learning_rate": 1.908284453037008e-06, - "loss": 0.8564, - "step": 19111 - }, - { - "epoch": 0.49, - "learning_rate": 1.908272876667934e-06, - "loss": 0.8652, - "step": 19112 - }, - { - "epoch": 0.49, - "learning_rate": 1.908261299603437e-06, - "loss": 0.9072, - "step": 19113 - }, - { - "epoch": 0.49, - "learning_rate": 1.9082497218435267e-06, - "loss": 0.9385, - "step": 19114 - }, - { - "epoch": 0.49, - "learning_rate": 1.908238143388211e-06, - "loss": 0.8789, - "step": 19115 - }, - { - "epoch": 0.49, - "learning_rate": 1.908226564237499e-06, - "loss": 0.8848, - "step": 19116 - }, - { - "epoch": 0.49, - "learning_rate": 1.9082149843914e-06, - "loss": 0.7754, - "step": 19117 - }, - { - "epoch": 0.49, - "learning_rate": 1.9082034038499226e-06, - "loss": 1.1348, - "step": 19118 - }, - { - "epoch": 0.49, - "learning_rate": 1.9081918226130752e-06, - "loss": 1.0439, - "step": 19119 - }, - { - "epoch": 0.49, - "learning_rate": 1.9081802406808672e-06, - "loss": 0.9092, - "step": 19120 - }, - { - "epoch": 0.49, - "learning_rate": 1.908168658053308e-06, - "loss": 0.9141, - "step": 19121 - }, - { - "epoch": 0.49, - "learning_rate": 1.9081570747304047e-06, - "loss": 1.0645, - "step": 19122 - }, - { - "epoch": 0.49, - "learning_rate": 1.908145490712168e-06, - "loss": 0.8564, - "step": 19123 - }, - { - "epoch": 0.49, - "learning_rate": 1.9081339059986057e-06, - "loss": 0.9326, - "step": 19124 - }, - { - "epoch": 0.49, - "learning_rate": 1.9081223205897273e-06, - "loss": 0.8467, - "step": 19125 - }, - { - "epoch": 0.49, - "learning_rate": 1.9081107344855415e-06, - "loss": 0.8721, - "step": 19126 - }, - { - "epoch": 0.49, - "learning_rate": 1.9080991476860564e-06, - "loss": 0.5618, - "step": 19127 - }, - { - "epoch": 0.49, - "learning_rate": 1.9080875601912822e-06, - "loss": 0.5938, - "step": 19128 - }, - { - "epoch": 0.49, - "learning_rate": 1.908075972001227e-06, - "loss": 0.9248, - "step": 19129 - }, - { - "epoch": 0.49, - "learning_rate": 1.9080643831158996e-06, - "loss": 0.8608, - "step": 19130 - }, - { - "epoch": 0.49, - "learning_rate": 1.9080527935353093e-06, - "loss": 0.958, - "step": 19131 - }, - { - "epoch": 0.49, - "learning_rate": 1.9080412032594647e-06, - "loss": 0.8428, - "step": 19132 - }, - { - "epoch": 0.49, - "learning_rate": 1.9080296122883745e-06, - "loss": 0.6025, - "step": 19133 - }, - { - "epoch": 0.49, - "learning_rate": 1.9080180206220478e-06, - "loss": 0.7876, - "step": 19134 - }, - { - "epoch": 0.49, - "learning_rate": 1.9080064282604933e-06, - "loss": 0.7627, - "step": 19135 - }, - { - "epoch": 0.49, - "learning_rate": 1.907994835203721e-06, - "loss": 0.7939, - "step": 19136 - }, - { - "epoch": 0.49, - "learning_rate": 1.9079832414517378e-06, - "loss": 0.8359, - "step": 19137 - }, - { - "epoch": 0.49, - "learning_rate": 1.9079716470045536e-06, - "loss": 0.9658, - "step": 19138 - }, - { - "epoch": 0.49, - "learning_rate": 1.9079600518621777e-06, - "loss": 0.6279, - "step": 19139 - }, - { - "epoch": 0.49, - "learning_rate": 1.907948456024618e-06, - "loss": 0.7427, - "step": 19140 - }, - { - "epoch": 0.49, - "learning_rate": 1.9079368594918847e-06, - "loss": 1.0049, - "step": 19141 - }, - { - "epoch": 0.49, - "learning_rate": 1.9079252622639854e-06, - "loss": 0.9424, - "step": 19142 - }, - { - "epoch": 0.49, - "learning_rate": 1.9079136643409295e-06, - "loss": 0.9072, - "step": 19143 - }, - { - "epoch": 0.49, - "learning_rate": 1.907902065722726e-06, - "loss": 0.8564, - "step": 19144 - }, - { - "epoch": 0.49, - "learning_rate": 1.9078904664093832e-06, - "loss": 0.8701, - "step": 19145 - }, - { - "epoch": 0.49, - "learning_rate": 1.9078788664009106e-06, - "loss": 0.9639, - "step": 19146 - }, - { - "epoch": 0.49, - "learning_rate": 1.907867265697317e-06, - "loss": 0.917, - "step": 19147 - }, - { - "epoch": 0.49, - "learning_rate": 1.9078556642986114e-06, - "loss": 0.8213, - "step": 19148 - }, - { - "epoch": 0.49, - "learning_rate": 1.9078440622048025e-06, - "loss": 0.7246, - "step": 19149 - }, - { - "epoch": 0.49, - "learning_rate": 1.9078324594158986e-06, - "loss": 0.8232, - "step": 19150 - }, - { - "epoch": 0.49, - "learning_rate": 1.9078208559319096e-06, - "loss": 1.1035, - "step": 19151 - }, - { - "epoch": 0.49, - "learning_rate": 1.9078092517528437e-06, - "loss": 0.7334, - "step": 19152 - }, - { - "epoch": 0.49, - "learning_rate": 1.90779764687871e-06, - "loss": 0.8572, - "step": 19153 - }, - { - "epoch": 0.49, - "learning_rate": 1.9077860413095175e-06, - "loss": 0.8828, - "step": 19154 - }, - { - "epoch": 0.49, - "learning_rate": 1.907774435045275e-06, - "loss": 0.666, - "step": 19155 - }, - { - "epoch": 0.49, - "learning_rate": 1.9077628280859912e-06, - "loss": 0.8174, - "step": 19156 - }, - { - "epoch": 0.49, - "learning_rate": 1.9077512204316754e-06, - "loss": 0.8096, - "step": 19157 - }, - { - "epoch": 0.49, - "learning_rate": 1.9077396120823355e-06, - "loss": 1.0215, - "step": 19158 - }, - { - "epoch": 0.49, - "learning_rate": 1.907728003037982e-06, - "loss": 0.9653, - "step": 19159 - }, - { - "epoch": 0.49, - "learning_rate": 1.9077163932986228e-06, - "loss": 0.5488, - "step": 19160 - }, - { - "epoch": 0.49, - "learning_rate": 1.9077047828642664e-06, - "loss": 0.8721, - "step": 19161 - }, - { - "epoch": 0.49, - "learning_rate": 1.907693171734922e-06, - "loss": 0.9434, - "step": 19162 - }, - { - "epoch": 0.49, - "learning_rate": 1.9076815599105995e-06, - "loss": 0.9258, - "step": 19163 - }, - { - "epoch": 0.49, - "learning_rate": 1.9076699473913067e-06, - "loss": 0.9814, - "step": 19164 - }, - { - "epoch": 0.49, - "learning_rate": 1.9076583341770526e-06, - "loss": 0.7434, - "step": 19165 - }, - { - "epoch": 0.49, - "learning_rate": 1.9076467202678465e-06, - "loss": 0.9102, - "step": 19166 - }, - { - "epoch": 0.49, - "learning_rate": 1.9076351056636964e-06, - "loss": 0.7935, - "step": 19167 - }, - { - "epoch": 0.49, - "learning_rate": 1.9076234903646126e-06, - "loss": 0.9131, - "step": 19168 - }, - { - "epoch": 0.49, - "learning_rate": 1.9076118743706026e-06, - "loss": 0.6802, - "step": 19169 - }, - { - "epoch": 0.49, - "learning_rate": 1.907600257681676e-06, - "loss": 0.832, - "step": 19170 - }, - { - "epoch": 0.49, - "learning_rate": 1.9075886402978422e-06, - "loss": 0.9346, - "step": 19171 - }, - { - "epoch": 0.49, - "learning_rate": 1.907577022219109e-06, - "loss": 0.7646, - "step": 19172 - }, - { - "epoch": 0.49, - "learning_rate": 1.907565403445486e-06, - "loss": 0.6392, - "step": 19173 - }, - { - "epoch": 0.49, - "learning_rate": 1.907553783976982e-06, - "loss": 0.7061, - "step": 19174 - }, - { - "epoch": 0.49, - "learning_rate": 1.9075421638136057e-06, - "loss": 0.73, - "step": 19175 - }, - { - "epoch": 0.49, - "learning_rate": 1.907530542955366e-06, - "loss": 0.8462, - "step": 19176 - }, - { - "epoch": 0.49, - "learning_rate": 1.907518921402272e-06, - "loss": 0.8574, - "step": 19177 - }, - { - "epoch": 0.49, - "learning_rate": 1.9075072991543322e-06, - "loss": 0.7319, - "step": 19178 - }, - { - "epoch": 0.49, - "learning_rate": 1.9074956762115557e-06, - "loss": 0.9854, - "step": 19179 - }, - { - "epoch": 0.49, - "learning_rate": 1.907484052573952e-06, - "loss": 0.7065, - "step": 19180 - }, - { - "epoch": 0.49, - "learning_rate": 1.9074724282415296e-06, - "loss": 0.6934, - "step": 19181 - }, - { - "epoch": 0.49, - "learning_rate": 1.9074608032142965e-06, - "loss": 0.8535, - "step": 19182 - }, - { - "epoch": 0.49, - "learning_rate": 1.907449177492263e-06, - "loss": 0.7734, - "step": 19183 - }, - { - "epoch": 0.49, - "learning_rate": 1.9074375510754373e-06, - "loss": 0.6445, - "step": 19184 - }, - { - "epoch": 0.49, - "learning_rate": 1.9074259239638285e-06, - "loss": 0.9683, - "step": 19185 - }, - { - "epoch": 0.49, - "learning_rate": 1.907414296157445e-06, - "loss": 0.6155, - "step": 19186 - }, - { - "epoch": 0.49, - "learning_rate": 1.9074026676562966e-06, - "loss": 0.7612, - "step": 19187 - }, - { - "epoch": 0.49, - "learning_rate": 1.9073910384603912e-06, - "loss": 0.9639, - "step": 19188 - }, - { - "epoch": 0.49, - "learning_rate": 1.9073794085697385e-06, - "loss": 1.0752, - "step": 19189 - }, - { - "epoch": 0.49, - "learning_rate": 1.907367777984347e-06, - "loss": 0.9375, - "step": 19190 - }, - { - "epoch": 0.49, - "learning_rate": 1.9073561467042263e-06, - "loss": 0.9922, - "step": 19191 - }, - { - "epoch": 0.49, - "learning_rate": 1.907344514729384e-06, - "loss": 0.9199, - "step": 19192 - }, - { - "epoch": 0.49, - "learning_rate": 1.9073328820598297e-06, - "loss": 0.9961, - "step": 19193 - }, - { - "epoch": 0.49, - "learning_rate": 1.9073212486955726e-06, - "loss": 0.8936, - "step": 19194 - }, - { - "epoch": 0.49, - "learning_rate": 1.9073096146366211e-06, - "loss": 0.7656, - "step": 19195 - }, - { - "epoch": 0.49, - "learning_rate": 1.9072979798829847e-06, - "loss": 1.0508, - "step": 19196 - }, - { - "epoch": 0.49, - "learning_rate": 1.9072863444346718e-06, - "loss": 0.9302, - "step": 19197 - }, - { - "epoch": 0.49, - "learning_rate": 1.9072747082916916e-06, - "loss": 0.7549, - "step": 19198 - }, - { - "epoch": 0.49, - "learning_rate": 1.9072630714540526e-06, - "loss": 0.9863, - "step": 19199 - }, - { - "epoch": 0.49, - "learning_rate": 1.907251433921764e-06, - "loss": 0.918, - "step": 19200 - }, - { - "epoch": 0.49, - "learning_rate": 1.9072397956948349e-06, - "loss": 0.8506, - "step": 19201 - }, - { - "epoch": 0.49, - "learning_rate": 1.9072281567732737e-06, - "loss": 0.8164, - "step": 19202 - }, - { - "epoch": 0.49, - "learning_rate": 1.90721651715709e-06, - "loss": 0.5186, - "step": 19203 - }, - { - "epoch": 0.49, - "learning_rate": 1.907204876846292e-06, - "loss": 1.0117, - "step": 19204 - }, - { - "epoch": 0.49, - "learning_rate": 1.9071932358408893e-06, - "loss": 0.9062, - "step": 19205 - }, - { - "epoch": 0.49, - "learning_rate": 1.9071815941408902e-06, - "loss": 0.8809, - "step": 19206 - }, - { - "epoch": 0.49, - "learning_rate": 1.907169951746304e-06, - "loss": 0.6943, - "step": 19207 - }, - { - "epoch": 0.49, - "learning_rate": 1.9071583086571393e-06, - "loss": 1.002, - "step": 19208 - }, - { - "epoch": 0.49, - "learning_rate": 1.907146664873405e-06, - "loss": 0.8335, - "step": 19209 - }, - { - "epoch": 0.49, - "learning_rate": 1.9071350203951107e-06, - "loss": 0.8926, - "step": 19210 - }, - { - "epoch": 0.49, - "learning_rate": 1.9071233752222647e-06, - "loss": 0.6572, - "step": 19211 - }, - { - "epoch": 0.49, - "learning_rate": 1.907111729354876e-06, - "loss": 0.6885, - "step": 19212 - }, - { - "epoch": 0.49, - "learning_rate": 1.9071000827929535e-06, - "loss": 0.8721, - "step": 19213 - }, - { - "epoch": 0.49, - "learning_rate": 1.9070884355365062e-06, - "loss": 0.6587, - "step": 19214 - }, - { - "epoch": 0.49, - "learning_rate": 1.907076787585543e-06, - "loss": 0.9023, - "step": 19215 - }, - { - "epoch": 0.49, - "learning_rate": 1.9070651389400728e-06, - "loss": 0.8301, - "step": 19216 - }, - { - "epoch": 0.49, - "learning_rate": 1.9070534896001045e-06, - "loss": 0.6978, - "step": 19217 - }, - { - "epoch": 0.49, - "learning_rate": 1.907041839565647e-06, - "loss": 0.999, - "step": 19218 - }, - { - "epoch": 0.49, - "learning_rate": 1.9070301888367095e-06, - "loss": 0.7236, - "step": 19219 - }, - { - "epoch": 0.49, - "learning_rate": 1.9070185374133005e-06, - "loss": 0.8652, - "step": 19220 - }, - { - "epoch": 0.49, - "learning_rate": 1.9070068852954292e-06, - "loss": 0.7319, - "step": 19221 - }, - { - "epoch": 0.49, - "learning_rate": 1.9069952324831044e-06, - "loss": 0.8857, - "step": 19222 - }, - { - "epoch": 0.49, - "learning_rate": 1.9069835789763351e-06, - "loss": 0.9219, - "step": 19223 - }, - { - "epoch": 0.49, - "learning_rate": 1.9069719247751301e-06, - "loss": 0.9014, - "step": 19224 - }, - { - "epoch": 0.49, - "learning_rate": 1.9069602698794983e-06, - "loss": 0.916, - "step": 19225 - }, - { - "epoch": 0.49, - "learning_rate": 1.9069486142894488e-06, - "loss": 0.9492, - "step": 19226 - }, - { - "epoch": 0.49, - "learning_rate": 1.9069369580049909e-06, - "loss": 0.9062, - "step": 19227 - }, - { - "epoch": 0.49, - "learning_rate": 1.9069253010261325e-06, - "loss": 0.8193, - "step": 19228 - }, - { - "epoch": 0.49, - "learning_rate": 1.9069136433528832e-06, - "loss": 0.791, - "step": 19229 - }, - { - "epoch": 0.49, - "learning_rate": 1.906901984985252e-06, - "loss": 0.79, - "step": 19230 - }, - { - "epoch": 0.49, - "learning_rate": 1.9068903259232473e-06, - "loss": 0.981, - "step": 19231 - }, - { - "epoch": 0.49, - "learning_rate": 1.9068786661668788e-06, - "loss": 0.8682, - "step": 19232 - }, - { - "epoch": 0.49, - "learning_rate": 1.9068670057161547e-06, - "loss": 0.7008, - "step": 19233 - }, - { - "epoch": 0.49, - "learning_rate": 1.9068553445710843e-06, - "loss": 0.8848, - "step": 19234 - }, - { - "epoch": 0.49, - "learning_rate": 1.9068436827316768e-06, - "loss": 0.7646, - "step": 19235 - }, - { - "epoch": 0.49, - "learning_rate": 1.9068320201979404e-06, - "loss": 1.0469, - "step": 19236 - }, - { - "epoch": 0.49, - "learning_rate": 1.9068203569698843e-06, - "loss": 0.7715, - "step": 19237 - }, - { - "epoch": 0.49, - "learning_rate": 1.9068086930475181e-06, - "loss": 0.6606, - "step": 19238 - }, - { - "epoch": 0.49, - "learning_rate": 1.9067970284308496e-06, - "loss": 0.9805, - "step": 19239 - }, - { - "epoch": 0.49, - "learning_rate": 1.9067853631198887e-06, - "loss": 0.9814, - "step": 19240 - }, - { - "epoch": 0.49, - "learning_rate": 1.9067736971146439e-06, - "loss": 0.9248, - "step": 19241 - }, - { - "epoch": 0.49, - "learning_rate": 1.906762030415124e-06, - "loss": 0.9678, - "step": 19242 - }, - { - "epoch": 0.49, - "learning_rate": 1.9067503630213384e-06, - "loss": 0.9629, - "step": 19243 - }, - { - "epoch": 0.49, - "learning_rate": 1.9067386949332955e-06, - "loss": 0.7695, - "step": 19244 - }, - { - "epoch": 0.49, - "learning_rate": 1.9067270261510045e-06, - "loss": 0.8857, - "step": 19245 - }, - { - "epoch": 0.49, - "learning_rate": 1.9067153566744742e-06, - "loss": 0.8896, - "step": 19246 - }, - { - "epoch": 0.49, - "learning_rate": 1.9067036865037137e-06, - "loss": 1.0635, - "step": 19247 - }, - { - "epoch": 0.49, - "learning_rate": 1.9066920156387321e-06, - "loss": 0.7319, - "step": 19248 - }, - { - "epoch": 0.49, - "learning_rate": 1.9066803440795378e-06, - "loss": 0.9697, - "step": 19249 - }, - { - "epoch": 0.49, - "learning_rate": 1.9066686718261403e-06, - "loss": 1.1133, - "step": 19250 - }, - { - "epoch": 0.49, - "learning_rate": 1.906656998878548e-06, - "loss": 0.8594, - "step": 19251 - }, - { - "epoch": 0.49, - "learning_rate": 1.9066453252367706e-06, - "loss": 0.875, - "step": 19252 - }, - { - "epoch": 0.49, - "learning_rate": 1.9066336509008161e-06, - "loss": 1.0635, - "step": 19253 - }, - { - "epoch": 0.49, - "learning_rate": 1.9066219758706943e-06, - "loss": 0.7249, - "step": 19254 - }, - { - "epoch": 0.49, - "learning_rate": 1.9066103001464134e-06, - "loss": 1.0459, - "step": 19255 - }, - { - "epoch": 0.49, - "learning_rate": 1.9065986237279828e-06, - "loss": 0.7944, - "step": 19256 - }, - { - "epoch": 0.49, - "learning_rate": 1.9065869466154111e-06, - "loss": 0.8408, - "step": 19257 - }, - { - "epoch": 0.49, - "learning_rate": 1.9065752688087078e-06, - "loss": 0.6777, - "step": 19258 - }, - { - "epoch": 0.49, - "learning_rate": 1.9065635903078814e-06, - "loss": 0.9268, - "step": 19259 - }, - { - "epoch": 0.49, - "learning_rate": 1.9065519111129409e-06, - "loss": 0.5706, - "step": 19260 - }, - { - "epoch": 0.49, - "learning_rate": 1.9065402312238954e-06, - "loss": 0.6423, - "step": 19261 - }, - { - "epoch": 0.49, - "learning_rate": 1.9065285506407536e-06, - "loss": 1.1104, - "step": 19262 - }, - { - "epoch": 0.49, - "learning_rate": 1.9065168693635247e-06, - "loss": 0.8682, - "step": 19263 - }, - { - "epoch": 0.49, - "learning_rate": 1.9065051873922173e-06, - "loss": 0.6914, - "step": 19264 - }, - { - "epoch": 0.49, - "learning_rate": 1.906493504726841e-06, - "loss": 0.9785, - "step": 19265 - }, - { - "epoch": 0.49, - "learning_rate": 1.9064818213674038e-06, - "loss": 1.0049, - "step": 19266 - }, - { - "epoch": 0.49, - "learning_rate": 1.9064701373139154e-06, - "loss": 0.8398, - "step": 19267 - }, - { - "epoch": 0.49, - "learning_rate": 1.9064584525663844e-06, - "loss": 0.96, - "step": 19268 - }, - { - "epoch": 0.49, - "learning_rate": 1.9064467671248198e-06, - "loss": 0.6514, - "step": 19269 - }, - { - "epoch": 0.49, - "learning_rate": 1.906435080989231e-06, - "loss": 1.1357, - "step": 19270 - }, - { - "epoch": 0.49, - "learning_rate": 1.906423394159626e-06, - "loss": 1.0156, - "step": 19271 - }, - { - "epoch": 0.49, - "learning_rate": 1.9064117066360146e-06, - "loss": 0.8613, - "step": 19272 - }, - { - "epoch": 0.49, - "learning_rate": 1.9064000184184052e-06, - "loss": 1.0205, - "step": 19273 - }, - { - "epoch": 0.49, - "learning_rate": 1.9063883295068073e-06, - "loss": 0.7671, - "step": 19274 - }, - { - "epoch": 0.49, - "learning_rate": 1.9063766399012292e-06, - "loss": 0.9736, - "step": 19275 - }, - { - "epoch": 0.49, - "learning_rate": 1.9063649496016802e-06, - "loss": 0.7466, - "step": 19276 - }, - { - "epoch": 0.49, - "learning_rate": 1.9063532586081696e-06, - "loss": 1.0117, - "step": 19277 - }, - { - "epoch": 0.49, - "learning_rate": 1.9063415669207056e-06, - "loss": 0.5664, - "step": 19278 - }, - { - "epoch": 0.49, - "learning_rate": 1.9063298745392976e-06, - "loss": 0.6865, - "step": 19279 - }, - { - "epoch": 0.49, - "learning_rate": 1.906318181463955e-06, - "loss": 0.9502, - "step": 19280 - }, - { - "epoch": 0.49, - "learning_rate": 1.9063064876946858e-06, - "loss": 0.7378, - "step": 19281 - }, - { - "epoch": 0.49, - "learning_rate": 1.9062947932314993e-06, - "loss": 1.2812, - "step": 19282 - }, - { - "epoch": 0.49, - "learning_rate": 1.9062830980744046e-06, - "loss": 0.9287, - "step": 19283 - }, - { - "epoch": 0.49, - "learning_rate": 1.9062714022234107e-06, - "loss": 0.877, - "step": 19284 - }, - { - "epoch": 0.49, - "learning_rate": 1.9062597056785267e-06, - "loss": 0.959, - "step": 19285 - }, - { - "epoch": 0.49, - "learning_rate": 1.9062480084397608e-06, - "loss": 0.9668, - "step": 19286 - }, - { - "epoch": 0.49, - "learning_rate": 1.9062363105071227e-06, - "loss": 0.8379, - "step": 19287 - }, - { - "epoch": 0.49, - "learning_rate": 1.906224611880621e-06, - "loss": 0.8677, - "step": 19288 - }, - { - "epoch": 0.49, - "learning_rate": 1.906212912560265e-06, - "loss": 0.9365, - "step": 19289 - }, - { - "epoch": 0.49, - "learning_rate": 1.9062012125460635e-06, - "loss": 0.9736, - "step": 19290 - }, - { - "epoch": 0.49, - "learning_rate": 1.9061895118380252e-06, - "loss": 1.0771, - "step": 19291 - }, - { - "epoch": 0.49, - "learning_rate": 1.9061778104361595e-06, - "loss": 1.2012, - "step": 19292 - }, - { - "epoch": 0.49, - "learning_rate": 1.9061661083404748e-06, - "loss": 0.7017, - "step": 19293 - }, - { - "epoch": 0.49, - "learning_rate": 1.9061544055509807e-06, - "loss": 0.8857, - "step": 19294 - }, - { - "epoch": 0.49, - "learning_rate": 1.9061427020676855e-06, - "loss": 0.8135, - "step": 19295 - }, - { - "epoch": 0.49, - "learning_rate": 1.9061309978905986e-06, - "loss": 0.7913, - "step": 19296 - }, - { - "epoch": 0.49, - "learning_rate": 1.906119293019729e-06, - "loss": 0.8677, - "step": 19297 - }, - { - "epoch": 0.49, - "learning_rate": 1.9061075874550853e-06, - "loss": 0.9668, - "step": 19298 - }, - { - "epoch": 0.49, - "learning_rate": 1.906095881196677e-06, - "loss": 1.0557, - "step": 19299 - }, - { - "epoch": 0.49, - "learning_rate": 1.9060841742445124e-06, - "loss": 1.0127, - "step": 19300 - }, - { - "epoch": 0.49, - "learning_rate": 1.906072466598601e-06, - "loss": 0.7363, - "step": 19301 - }, - { - "epoch": 0.49, - "learning_rate": 1.9060607582589515e-06, - "loss": 0.9014, - "step": 19302 - }, - { - "epoch": 0.49, - "learning_rate": 1.9060490492255731e-06, - "loss": 0.8525, - "step": 19303 - }, - { - "epoch": 0.49, - "learning_rate": 1.9060373394984745e-06, - "loss": 0.5879, - "step": 19304 - }, - { - "epoch": 0.49, - "learning_rate": 1.9060256290776646e-06, - "loss": 0.8896, - "step": 19305 - }, - { - "epoch": 0.49, - "learning_rate": 1.906013917963153e-06, - "loss": 0.7754, - "step": 19306 - }, - { - "epoch": 0.49, - "learning_rate": 1.9060022061549477e-06, - "loss": 0.7373, - "step": 19307 - }, - { - "epoch": 0.49, - "learning_rate": 1.9059904936530584e-06, - "loss": 0.6445, - "step": 19308 - }, - { - "epoch": 0.49, - "learning_rate": 1.9059787804574939e-06, - "loss": 1.0361, - "step": 19309 - }, - { - "epoch": 0.49, - "learning_rate": 1.905967066568263e-06, - "loss": 0.9189, - "step": 19310 - }, - { - "epoch": 0.49, - "learning_rate": 1.9059553519853748e-06, - "loss": 0.8057, - "step": 19311 - }, - { - "epoch": 0.49, - "learning_rate": 1.9059436367088382e-06, - "loss": 1.0391, - "step": 19312 - }, - { - "epoch": 0.5, - "learning_rate": 1.9059319207386623e-06, - "loss": 0.8184, - "step": 19313 - }, - { - "epoch": 0.5, - "learning_rate": 1.9059202040748562e-06, - "loss": 1.1543, - "step": 19314 - }, - { - "epoch": 0.5, - "learning_rate": 1.9059084867174281e-06, - "loss": 0.7529, - "step": 19315 - }, - { - "epoch": 0.5, - "learning_rate": 1.9058967686663879e-06, - "loss": 0.9717, - "step": 19316 - }, - { - "epoch": 0.5, - "learning_rate": 1.9058850499217441e-06, - "loss": 0.8274, - "step": 19317 - }, - { - "epoch": 0.5, - "learning_rate": 1.9058733304835057e-06, - "loss": 0.9443, - "step": 19318 - }, - { - "epoch": 0.5, - "learning_rate": 1.9058616103516818e-06, - "loss": 0.8193, - "step": 19319 - }, - { - "epoch": 0.5, - "learning_rate": 1.9058498895262813e-06, - "loss": 0.916, - "step": 19320 - }, - { - "epoch": 0.5, - "learning_rate": 1.9058381680073135e-06, - "loss": 1.0117, - "step": 19321 - }, - { - "epoch": 0.5, - "learning_rate": 1.9058264457947866e-06, - "loss": 0.8135, - "step": 19322 - }, - { - "epoch": 0.5, - "learning_rate": 1.9058147228887104e-06, - "loss": 0.585, - "step": 19323 - }, - { - "epoch": 0.5, - "learning_rate": 1.9058029992890932e-06, - "loss": 1.124, - "step": 19324 - }, - { - "epoch": 0.5, - "learning_rate": 1.9057912749959447e-06, - "loss": 0.7998, - "step": 19325 - }, - { - "epoch": 0.5, - "learning_rate": 1.905779550009273e-06, - "loss": 1.0547, - "step": 19326 - }, - { - "epoch": 0.5, - "learning_rate": 1.905767824329088e-06, - "loss": 0.7217, - "step": 19327 - }, - { - "epoch": 0.5, - "learning_rate": 1.905756097955398e-06, - "loss": 1.0059, - "step": 19328 - }, - { - "epoch": 0.5, - "learning_rate": 1.905744370888212e-06, - "loss": 0.8325, - "step": 19329 - }, - { - "epoch": 0.5, - "learning_rate": 1.9057326431275396e-06, - "loss": 1.0469, - "step": 19330 - }, - { - "epoch": 0.5, - "learning_rate": 1.905720914673389e-06, - "loss": 0.8809, - "step": 19331 - }, - { - "epoch": 0.5, - "learning_rate": 1.9057091855257696e-06, - "loss": 0.8921, - "step": 19332 - }, - { - "epoch": 0.5, - "learning_rate": 1.9056974556846906e-06, - "loss": 0.8638, - "step": 19333 - }, - { - "epoch": 0.5, - "learning_rate": 1.9056857251501603e-06, - "loss": 1.0078, - "step": 19334 - }, - { - "epoch": 0.5, - "learning_rate": 1.9056739939221887e-06, - "loss": 1.0283, - "step": 19335 - }, - { - "epoch": 0.5, - "learning_rate": 1.9056622620007836e-06, - "loss": 0.7715, - "step": 19336 - }, - { - "epoch": 0.5, - "learning_rate": 1.9056505293859546e-06, - "loss": 0.7822, - "step": 19337 - }, - { - "epoch": 0.5, - "learning_rate": 1.905638796077711e-06, - "loss": 0.7939, - "step": 19338 - }, - { - "epoch": 0.5, - "learning_rate": 1.9056270620760612e-06, - "loss": 0.7617, - "step": 19339 - }, - { - "epoch": 0.5, - "learning_rate": 1.9056153273810143e-06, - "loss": 0.6411, - "step": 19340 - }, - { - "epoch": 0.5, - "learning_rate": 1.9056035919925793e-06, - "loss": 0.958, - "step": 19341 - }, - { - "epoch": 0.5, - "learning_rate": 1.9055918559107656e-06, - "loss": 1.0537, - "step": 19342 - }, - { - "epoch": 0.5, - "learning_rate": 1.9055801191355814e-06, - "loss": 1.0605, - "step": 19343 - }, - { - "epoch": 0.5, - "learning_rate": 1.9055683816670365e-06, - "loss": 0.8262, - "step": 19344 - }, - { - "epoch": 0.5, - "learning_rate": 1.9055566435051395e-06, - "loss": 0.75, - "step": 19345 - }, - { - "epoch": 0.5, - "learning_rate": 1.9055449046498992e-06, - "loss": 1.0039, - "step": 19346 - }, - { - "epoch": 0.5, - "learning_rate": 1.9055331651013252e-06, - "loss": 0.9014, - "step": 19347 - }, - { - "epoch": 0.5, - "learning_rate": 1.905521424859426e-06, - "loss": 0.7402, - "step": 19348 - }, - { - "epoch": 0.5, - "learning_rate": 1.9055096839242104e-06, - "loss": 0.7939, - "step": 19349 - }, - { - "epoch": 0.5, - "learning_rate": 1.9054979422956875e-06, - "loss": 1.1572, - "step": 19350 - }, - { - "epoch": 0.5, - "learning_rate": 1.905486199973867e-06, - "loss": 0.9863, - "step": 19351 - }, - { - "epoch": 0.5, - "learning_rate": 1.9054744569587573e-06, - "loss": 0.6938, - "step": 19352 - }, - { - "epoch": 0.5, - "learning_rate": 1.905462713250367e-06, - "loss": 0.8682, - "step": 19353 - }, - { - "epoch": 0.5, - "learning_rate": 1.9054509688487059e-06, - "loss": 0.6558, - "step": 19354 - }, - { - "epoch": 0.5, - "learning_rate": 1.9054392237537825e-06, - "loss": 0.7793, - "step": 19355 - }, - { - "epoch": 0.5, - "learning_rate": 1.9054274779656062e-06, - "loss": 1.0449, - "step": 19356 - }, - { - "epoch": 0.5, - "learning_rate": 1.9054157314841852e-06, - "loss": 0.8867, - "step": 19357 - }, - { - "epoch": 0.5, - "learning_rate": 1.9054039843095296e-06, - "loss": 1.0303, - "step": 19358 - }, - { - "epoch": 0.5, - "learning_rate": 1.9053922364416472e-06, - "loss": 0.8984, - "step": 19359 - }, - { - "epoch": 0.5, - "learning_rate": 1.905380487880548e-06, - "loss": 0.9932, - "step": 19360 - }, - { - "epoch": 0.5, - "learning_rate": 1.9053687386262406e-06, - "loss": 0.9424, - "step": 19361 - }, - { - "epoch": 0.5, - "learning_rate": 1.9053569886787337e-06, - "loss": 0.9688, - "step": 19362 - }, - { - "epoch": 0.5, - "learning_rate": 1.9053452380380368e-06, - "loss": 1.084, - "step": 19363 - }, - { - "epoch": 0.5, - "learning_rate": 1.9053334867041583e-06, - "loss": 1.1182, - "step": 19364 - }, - { - "epoch": 0.5, - "learning_rate": 1.9053217346771082e-06, - "loss": 0.8838, - "step": 19365 - }, - { - "epoch": 0.5, - "learning_rate": 1.9053099819568945e-06, - "loss": 0.959, - "step": 19366 - }, - { - "epoch": 0.5, - "learning_rate": 1.9052982285435266e-06, - "loss": 0.9126, - "step": 19367 - }, - { - "epoch": 0.5, - "learning_rate": 1.9052864744370134e-06, - "loss": 1.04, - "step": 19368 - }, - { - "epoch": 0.5, - "learning_rate": 1.9052747196373642e-06, - "loss": 0.7891, - "step": 19369 - }, - { - "epoch": 0.5, - "learning_rate": 1.9052629641445876e-06, - "loss": 0.8867, - "step": 19370 - }, - { - "epoch": 0.5, - "learning_rate": 1.9052512079586932e-06, - "loss": 0.812, - "step": 19371 - }, - { - "epoch": 0.5, - "learning_rate": 1.905239451079689e-06, - "loss": 0.749, - "step": 19372 - }, - { - "epoch": 0.5, - "learning_rate": 1.9052276935075847e-06, - "loss": 1.0654, - "step": 19373 - }, - { - "epoch": 0.5, - "learning_rate": 1.9052159352423894e-06, - "loss": 0.9805, - "step": 19374 - }, - { - "epoch": 0.5, - "learning_rate": 1.9052041762841115e-06, - "loss": 0.9146, - "step": 19375 - }, - { - "epoch": 0.5, - "learning_rate": 1.9051924166327607e-06, - "loss": 0.8516, - "step": 19376 - }, - { - "epoch": 0.5, - "learning_rate": 1.9051806562883456e-06, - "loss": 0.9414, - "step": 19377 - }, - { - "epoch": 0.5, - "learning_rate": 1.9051688952508754e-06, - "loss": 1.0078, - "step": 19378 - }, - { - "epoch": 0.5, - "learning_rate": 1.9051571335203588e-06, - "loss": 0.8145, - "step": 19379 - }, - { - "epoch": 0.5, - "learning_rate": 1.9051453710968052e-06, - "loss": 0.6458, - "step": 19380 - }, - { - "epoch": 0.5, - "learning_rate": 1.9051336079802234e-06, - "loss": 0.9043, - "step": 19381 - }, - { - "epoch": 0.5, - "learning_rate": 1.9051218441706223e-06, - "loss": 0.8237, - "step": 19382 - }, - { - "epoch": 0.5, - "learning_rate": 1.905110079668011e-06, - "loss": 0.7871, - "step": 19383 - }, - { - "epoch": 0.5, - "learning_rate": 1.9050983144723987e-06, - "loss": 0.918, - "step": 19384 - }, - { - "epoch": 0.5, - "learning_rate": 1.905086548583794e-06, - "loss": 0.8662, - "step": 19385 - }, - { - "epoch": 0.5, - "learning_rate": 1.9050747820022063e-06, - "loss": 0.8555, - "step": 19386 - }, - { - "epoch": 0.5, - "learning_rate": 1.9050630147276446e-06, - "loss": 0.8818, - "step": 19387 - }, - { - "epoch": 0.5, - "learning_rate": 1.9050512467601174e-06, - "loss": 1.0117, - "step": 19388 - }, - { - "epoch": 0.5, - "learning_rate": 1.9050394780996344e-06, - "loss": 0.7549, - "step": 19389 - }, - { - "epoch": 0.5, - "learning_rate": 1.9050277087462042e-06, - "loss": 1.1318, - "step": 19390 - }, - { - "epoch": 0.5, - "learning_rate": 1.9050159386998358e-06, - "loss": 0.7656, - "step": 19391 - }, - { - "epoch": 0.5, - "learning_rate": 1.9050041679605383e-06, - "loss": 0.8193, - "step": 19392 - }, - { - "epoch": 0.5, - "learning_rate": 1.9049923965283208e-06, - "loss": 0.7969, - "step": 19393 - }, - { - "epoch": 0.5, - "learning_rate": 1.9049806244031923e-06, - "loss": 0.8252, - "step": 19394 - }, - { - "epoch": 0.5, - "learning_rate": 1.9049688515851617e-06, - "loss": 0.7939, - "step": 19395 - }, - { - "epoch": 0.5, - "learning_rate": 1.904957078074238e-06, - "loss": 0.8643, - "step": 19396 - }, - { - "epoch": 0.5, - "learning_rate": 1.9049453038704302e-06, - "loss": 0.9043, - "step": 19397 - }, - { - "epoch": 0.5, - "learning_rate": 1.9049335289737476e-06, - "loss": 0.8057, - "step": 19398 - }, - { - "epoch": 0.5, - "learning_rate": 1.9049217533841989e-06, - "loss": 0.959, - "step": 19399 - }, - { - "epoch": 0.5, - "learning_rate": 1.904909977101793e-06, - "loss": 0.8877, - "step": 19400 - }, - { - "epoch": 0.5, - "learning_rate": 1.9048982001265395e-06, - "loss": 0.8896, - "step": 19401 - }, - { - "epoch": 0.5, - "learning_rate": 1.9048864224584469e-06, - "loss": 0.8037, - "step": 19402 - }, - { - "epoch": 0.5, - "learning_rate": 1.9048746440975245e-06, - "loss": 0.7642, - "step": 19403 - }, - { - "epoch": 0.5, - "learning_rate": 1.904862865043781e-06, - "loss": 0.7241, - "step": 19404 - }, - { - "epoch": 0.5, - "learning_rate": 1.9048510852972256e-06, - "loss": 0.8359, - "step": 19405 - }, - { - "epoch": 0.5, - "learning_rate": 1.9048393048578676e-06, - "loss": 1.0957, - "step": 19406 - }, - { - "epoch": 0.5, - "learning_rate": 1.9048275237257155e-06, - "loss": 0.9502, - "step": 19407 - }, - { - "epoch": 0.5, - "learning_rate": 1.9048157419007787e-06, - "loss": 0.7432, - "step": 19408 - }, - { - "epoch": 0.5, - "learning_rate": 1.904803959383066e-06, - "loss": 0.8506, - "step": 19409 - }, - { - "epoch": 0.5, - "learning_rate": 1.9047921761725867e-06, - "loss": 0.7783, - "step": 19410 - }, - { - "epoch": 0.5, - "learning_rate": 1.9047803922693495e-06, - "loss": 0.9854, - "step": 19411 - }, - { - "epoch": 0.5, - "learning_rate": 1.9047686076733634e-06, - "loss": 0.9023, - "step": 19412 - }, - { - "epoch": 0.5, - "learning_rate": 1.9047568223846377e-06, - "loss": 1.0684, - "step": 19413 - }, - { - "epoch": 0.5, - "learning_rate": 1.9047450364031814e-06, - "loss": 0.8672, - "step": 19414 - }, - { - "epoch": 0.5, - "learning_rate": 1.9047332497290033e-06, - "loss": 0.9668, - "step": 19415 - }, - { - "epoch": 0.5, - "learning_rate": 1.9047214623621126e-06, - "loss": 0.7114, - "step": 19416 - }, - { - "epoch": 0.5, - "learning_rate": 1.9047096743025181e-06, - "loss": 0.729, - "step": 19417 - }, - { - "epoch": 0.5, - "learning_rate": 1.9046978855502294e-06, - "loss": 0.8135, - "step": 19418 - }, - { - "epoch": 0.5, - "learning_rate": 1.904686096105255e-06, - "loss": 0.8643, - "step": 19419 - }, - { - "epoch": 0.5, - "learning_rate": 1.9046743059676039e-06, - "loss": 0.748, - "step": 19420 - }, - { - "epoch": 0.5, - "learning_rate": 1.9046625151372852e-06, - "loss": 0.8643, - "step": 19421 - }, - { - "epoch": 0.5, - "learning_rate": 1.9046507236143081e-06, - "loss": 1.0186, - "step": 19422 - }, - { - "epoch": 0.5, - "learning_rate": 1.9046389313986817e-06, - "loss": 0.8721, - "step": 19423 - }, - { - "epoch": 0.5, - "learning_rate": 1.9046271384904146e-06, - "loss": 0.7588, - "step": 19424 - }, - { - "epoch": 0.5, - "learning_rate": 1.9046153448895166e-06, - "loss": 0.6716, - "step": 19425 - }, - { - "epoch": 0.5, - "learning_rate": 1.9046035505959956e-06, - "loss": 0.8164, - "step": 19426 - }, - { - "epoch": 0.5, - "learning_rate": 1.9045917556098616e-06, - "loss": 0.915, - "step": 19427 - }, - { - "epoch": 0.5, - "learning_rate": 1.9045799599311234e-06, - "loss": 0.8115, - "step": 19428 - }, - { - "epoch": 0.5, - "learning_rate": 1.9045681635597896e-06, - "loss": 1.04, - "step": 19429 - }, - { - "epoch": 0.5, - "learning_rate": 1.9045563664958699e-06, - "loss": 0.7725, - "step": 19430 - }, - { - "epoch": 0.5, - "learning_rate": 1.9045445687393726e-06, - "loss": 0.9307, - "step": 19431 - }, - { - "epoch": 0.5, - "learning_rate": 1.9045327702903074e-06, - "loss": 1.0098, - "step": 19432 - }, - { - "epoch": 0.5, - "learning_rate": 1.904520971148683e-06, - "loss": 0.9668, - "step": 19433 - }, - { - "epoch": 0.5, - "learning_rate": 1.9045091713145083e-06, - "loss": 0.8506, - "step": 19434 - }, - { - "epoch": 0.5, - "learning_rate": 1.9044973707877927e-06, - "loss": 0.7939, - "step": 19435 - }, - { - "epoch": 0.5, - "learning_rate": 1.9044855695685448e-06, - "loss": 0.8896, - "step": 19436 - }, - { - "epoch": 0.5, - "learning_rate": 1.9044737676567743e-06, - "loss": 0.9365, - "step": 19437 - }, - { - "epoch": 0.5, - "learning_rate": 1.9044619650524895e-06, - "loss": 0.9385, - "step": 19438 - }, - { - "epoch": 0.5, - "learning_rate": 1.9044501617557e-06, - "loss": 0.8462, - "step": 19439 - }, - { - "epoch": 0.5, - "learning_rate": 1.9044383577664145e-06, - "loss": 1.0605, - "step": 19440 - }, - { - "epoch": 0.5, - "learning_rate": 1.9044265530846419e-06, - "loss": 1.1279, - "step": 19441 - }, - { - "epoch": 0.5, - "learning_rate": 1.9044147477103919e-06, - "loss": 0.7949, - "step": 19442 - }, - { - "epoch": 0.5, - "learning_rate": 1.904402941643673e-06, - "loss": 0.8379, - "step": 19443 - }, - { - "epoch": 0.5, - "learning_rate": 1.9043911348844942e-06, - "loss": 0.6538, - "step": 19444 - }, - { - "epoch": 0.5, - "learning_rate": 1.9043793274328645e-06, - "loss": 0.959, - "step": 19445 - }, - { - "epoch": 0.5, - "learning_rate": 1.9043675192887933e-06, - "loss": 0.8232, - "step": 19446 - }, - { - "epoch": 0.5, - "learning_rate": 1.9043557104522895e-06, - "loss": 0.8496, - "step": 19447 - }, - { - "epoch": 0.5, - "learning_rate": 1.9043439009233624e-06, - "loss": 0.8047, - "step": 19448 - }, - { - "epoch": 0.5, - "learning_rate": 1.9043320907020206e-06, - "loss": 0.7998, - "step": 19449 - }, - { - "epoch": 0.5, - "learning_rate": 1.9043202797882731e-06, - "loss": 0.8164, - "step": 19450 - }, - { - "epoch": 0.5, - "learning_rate": 1.9043084681821294e-06, - "loss": 0.877, - "step": 19451 - }, - { - "epoch": 0.5, - "learning_rate": 1.904296655883598e-06, - "loss": 0.8701, - "step": 19452 - }, - { - "epoch": 0.5, - "learning_rate": 1.9042848428926884e-06, - "loss": 0.9248, - "step": 19453 - }, - { - "epoch": 0.5, - "learning_rate": 1.9042730292094094e-06, - "loss": 0.8486, - "step": 19454 - }, - { - "epoch": 0.5, - "learning_rate": 1.9042612148337701e-06, - "loss": 0.9248, - "step": 19455 - }, - { - "epoch": 0.5, - "learning_rate": 1.90424939976578e-06, - "loss": 0.8286, - "step": 19456 - }, - { - "epoch": 0.5, - "learning_rate": 1.9042375840054471e-06, - "loss": 1.0615, - "step": 19457 - }, - { - "epoch": 0.5, - "learning_rate": 1.9042257675527814e-06, - "loss": 1.04, - "step": 19458 - }, - { - "epoch": 0.5, - "learning_rate": 1.9042139504077914e-06, - "loss": 0.8604, - "step": 19459 - }, - { - "epoch": 0.5, - "learning_rate": 1.9042021325704867e-06, - "loss": 0.8828, - "step": 19460 - }, - { - "epoch": 0.5, - "learning_rate": 1.9041903140408756e-06, - "loss": 0.9961, - "step": 19461 - }, - { - "epoch": 0.5, - "learning_rate": 1.9041784948189678e-06, - "loss": 1.0947, - "step": 19462 - }, - { - "epoch": 0.5, - "learning_rate": 1.904166674904772e-06, - "loss": 0.6515, - "step": 19463 - }, - { - "epoch": 0.5, - "learning_rate": 1.9041548542982975e-06, - "loss": 1.0566, - "step": 19464 - }, - { - "epoch": 0.5, - "learning_rate": 1.9041430329995532e-06, - "loss": 0.8281, - "step": 19465 - }, - { - "epoch": 0.5, - "learning_rate": 1.904131211008548e-06, - "loss": 0.7354, - "step": 19466 - }, - { - "epoch": 0.5, - "learning_rate": 1.904119388325291e-06, - "loss": 0.8135, - "step": 19467 - }, - { - "epoch": 0.5, - "learning_rate": 1.9041075649497916e-06, - "loss": 0.833, - "step": 19468 - }, - { - "epoch": 0.5, - "learning_rate": 1.9040957408820585e-06, - "loss": 0.6465, - "step": 19469 - }, - { - "epoch": 0.5, - "learning_rate": 1.9040839161221009e-06, - "loss": 0.7185, - "step": 19470 - }, - { - "epoch": 0.5, - "learning_rate": 1.904072090669928e-06, - "loss": 1.04, - "step": 19471 - }, - { - "epoch": 0.5, - "learning_rate": 1.9040602645255483e-06, - "loss": 0.9326, - "step": 19472 - }, - { - "epoch": 0.5, - "learning_rate": 1.9040484376889715e-06, - "loss": 1.0615, - "step": 19473 - }, - { - "epoch": 0.5, - "learning_rate": 1.9040366101602063e-06, - "loss": 0.8242, - "step": 19474 - }, - { - "epoch": 0.5, - "learning_rate": 1.9040247819392618e-06, - "loss": 0.9443, - "step": 19475 - }, - { - "epoch": 0.5, - "learning_rate": 1.904012953026147e-06, - "loss": 0.9619, - "step": 19476 - }, - { - "epoch": 0.5, - "learning_rate": 1.9040011234208712e-06, - "loss": 0.7832, - "step": 19477 - }, - { - "epoch": 0.5, - "learning_rate": 1.9039892931234433e-06, - "loss": 0.9395, - "step": 19478 - }, - { - "epoch": 0.5, - "learning_rate": 1.9039774621338722e-06, - "loss": 0.623, - "step": 19479 - }, - { - "epoch": 0.5, - "learning_rate": 1.903965630452167e-06, - "loss": 0.9028, - "step": 19480 - }, - { - "epoch": 0.5, - "learning_rate": 1.9039537980783376e-06, - "loss": 0.8921, - "step": 19481 - }, - { - "epoch": 0.5, - "learning_rate": 1.9039419650123918e-06, - "loss": 0.8105, - "step": 19482 - }, - { - "epoch": 0.5, - "learning_rate": 1.9039301312543392e-06, - "loss": 0.8887, - "step": 19483 - }, - { - "epoch": 0.5, - "learning_rate": 1.903918296804189e-06, - "loss": 0.9189, - "step": 19484 - }, - { - "epoch": 0.5, - "learning_rate": 1.90390646166195e-06, - "loss": 0.8496, - "step": 19485 - }, - { - "epoch": 0.5, - "learning_rate": 1.9038946258276316e-06, - "loss": 0.6211, - "step": 19486 - }, - { - "epoch": 0.5, - "learning_rate": 1.9038827893012424e-06, - "loss": 0.5706, - "step": 19487 - }, - { - "epoch": 0.5, - "learning_rate": 1.9038709520827917e-06, - "loss": 1.0625, - "step": 19488 - }, - { - "epoch": 0.5, - "learning_rate": 1.9038591141722886e-06, - "loss": 0.9512, - "step": 19489 - }, - { - "epoch": 0.5, - "learning_rate": 1.9038472755697423e-06, - "loss": 0.7988, - "step": 19490 - }, - { - "epoch": 0.5, - "learning_rate": 1.9038354362751617e-06, - "loss": 0.7939, - "step": 19491 - }, - { - "epoch": 0.5, - "learning_rate": 1.9038235962885559e-06, - "loss": 1.0513, - "step": 19492 - }, - { - "epoch": 0.5, - "learning_rate": 1.9038117556099339e-06, - "loss": 0.8574, - "step": 19493 - }, - { - "epoch": 0.5, - "learning_rate": 1.9037999142393044e-06, - "loss": 0.9629, - "step": 19494 - }, - { - "epoch": 0.5, - "learning_rate": 1.9037880721766773e-06, - "loss": 0.7666, - "step": 19495 - }, - { - "epoch": 0.5, - "learning_rate": 1.903776229422061e-06, - "loss": 0.6855, - "step": 19496 - }, - { - "epoch": 0.5, - "learning_rate": 1.9037643859754651e-06, - "loss": 0.792, - "step": 19497 - }, - { - "epoch": 0.5, - "learning_rate": 1.903752541836898e-06, - "loss": 0.6787, - "step": 19498 - }, - { - "epoch": 0.5, - "learning_rate": 1.9037406970063695e-06, - "loss": 0.8848, - "step": 19499 - }, - { - "epoch": 0.5, - "learning_rate": 1.903728851483888e-06, - "loss": 0.8643, - "step": 19500 - }, - { - "epoch": 0.5, - "learning_rate": 1.9037170052694628e-06, - "loss": 0.8652, - "step": 19501 - }, - { - "epoch": 0.5, - "learning_rate": 1.9037051583631035e-06, - "loss": 0.8257, - "step": 19502 - }, - { - "epoch": 0.5, - "learning_rate": 1.9036933107648184e-06, - "loss": 0.9756, - "step": 19503 - }, - { - "epoch": 0.5, - "learning_rate": 1.9036814624746169e-06, - "loss": 1.1123, - "step": 19504 - }, - { - "epoch": 0.5, - "learning_rate": 1.903669613492508e-06, - "loss": 0.7036, - "step": 19505 - }, - { - "epoch": 0.5, - "learning_rate": 1.9036577638185007e-06, - "loss": 0.958, - "step": 19506 - }, - { - "epoch": 0.5, - "learning_rate": 1.9036459134526045e-06, - "loss": 0.916, - "step": 19507 - }, - { - "epoch": 0.5, - "learning_rate": 1.903634062394828e-06, - "loss": 0.9043, - "step": 19508 - }, - { - "epoch": 0.5, - "learning_rate": 1.9036222106451807e-06, - "loss": 0.9082, - "step": 19509 - }, - { - "epoch": 0.5, - "learning_rate": 1.9036103582036711e-06, - "loss": 1.0879, - "step": 19510 - }, - { - "epoch": 0.5, - "learning_rate": 1.9035985050703087e-06, - "loss": 0.9893, - "step": 19511 - }, - { - "epoch": 0.5, - "learning_rate": 1.9035866512451028e-06, - "loss": 0.8662, - "step": 19512 - }, - { - "epoch": 0.5, - "learning_rate": 1.9035747967280618e-06, - "loss": 1.1162, - "step": 19513 - }, - { - "epoch": 0.5, - "learning_rate": 1.9035629415191952e-06, - "loss": 0.8638, - "step": 19514 - }, - { - "epoch": 0.5, - "learning_rate": 1.903551085618512e-06, - "loss": 0.9766, - "step": 19515 - }, - { - "epoch": 0.5, - "learning_rate": 1.9035392290260212e-06, - "loss": 0.7402, - "step": 19516 - }, - { - "epoch": 0.5, - "learning_rate": 1.9035273717417319e-06, - "loss": 0.7788, - "step": 19517 - }, - { - "epoch": 0.5, - "learning_rate": 1.9035155137656535e-06, - "loss": 0.7261, - "step": 19518 - }, - { - "epoch": 0.5, - "learning_rate": 1.9035036550977947e-06, - "loss": 0.8691, - "step": 19519 - }, - { - "epoch": 0.5, - "learning_rate": 1.903491795738165e-06, - "loss": 0.9746, - "step": 19520 - }, - { - "epoch": 0.5, - "learning_rate": 1.9034799356867726e-06, - "loss": 0.8887, - "step": 19521 - }, - { - "epoch": 0.5, - "learning_rate": 1.9034680749436274e-06, - "loss": 0.9912, - "step": 19522 - }, - { - "epoch": 0.5, - "learning_rate": 1.9034562135087385e-06, - "loss": 1.0684, - "step": 19523 - }, - { - "epoch": 0.5, - "learning_rate": 1.9034443513821143e-06, - "loss": 0.751, - "step": 19524 - }, - { - "epoch": 0.5, - "learning_rate": 1.9034324885637646e-06, - "loss": 0.9199, - "step": 19525 - }, - { - "epoch": 0.5, - "learning_rate": 1.9034206250536979e-06, - "loss": 0.8906, - "step": 19526 - }, - { - "epoch": 0.5, - "learning_rate": 1.9034087608519238e-06, - "loss": 0.9678, - "step": 19527 - }, - { - "epoch": 0.5, - "learning_rate": 1.903396895958451e-06, - "loss": 0.7217, - "step": 19528 - }, - { - "epoch": 0.5, - "learning_rate": 1.9033850303732889e-06, - "loss": 0.5991, - "step": 19529 - }, - { - "epoch": 0.5, - "learning_rate": 1.9033731640964463e-06, - "loss": 0.8584, - "step": 19530 - }, - { - "epoch": 0.5, - "learning_rate": 1.9033612971279322e-06, - "loss": 1.248, - "step": 19531 - }, - { - "epoch": 0.5, - "learning_rate": 1.9033494294677563e-06, - "loss": 0.7061, - "step": 19532 - }, - { - "epoch": 0.5, - "learning_rate": 1.903337561115927e-06, - "loss": 0.792, - "step": 19533 - }, - { - "epoch": 0.5, - "learning_rate": 1.903325692072454e-06, - "loss": 0.9355, - "step": 19534 - }, - { - "epoch": 0.5, - "learning_rate": 1.903313822337346e-06, - "loss": 1.0244, - "step": 19535 - }, - { - "epoch": 0.5, - "learning_rate": 1.903301951910612e-06, - "loss": 0.7202, - "step": 19536 - }, - { - "epoch": 0.5, - "learning_rate": 1.903290080792261e-06, - "loss": 1.0625, - "step": 19537 - }, - { - "epoch": 0.5, - "learning_rate": 1.9032782089823026e-06, - "loss": 0.8555, - "step": 19538 - }, - { - "epoch": 0.5, - "learning_rate": 1.9032663364807453e-06, - "loss": 0.8398, - "step": 19539 - }, - { - "epoch": 0.5, - "learning_rate": 1.903254463287599e-06, - "loss": 0.7246, - "step": 19540 - }, - { - "epoch": 0.5, - "learning_rate": 1.9032425894028718e-06, - "loss": 0.7969, - "step": 19541 - }, - { - "epoch": 0.5, - "learning_rate": 1.9032307148265736e-06, - "loss": 0.9092, - "step": 19542 - }, - { - "epoch": 0.5, - "learning_rate": 1.903218839558713e-06, - "loss": 0.7166, - "step": 19543 - }, - { - "epoch": 0.5, - "learning_rate": 1.9032069635992993e-06, - "loss": 1.0049, - "step": 19544 - }, - { - "epoch": 0.5, - "learning_rate": 1.9031950869483417e-06, - "loss": 0.9209, - "step": 19545 - }, - { - "epoch": 0.5, - "learning_rate": 1.903183209605849e-06, - "loss": 0.917, - "step": 19546 - }, - { - "epoch": 0.5, - "learning_rate": 1.9031713315718308e-06, - "loss": 0.8325, - "step": 19547 - }, - { - "epoch": 0.5, - "learning_rate": 1.9031594528462955e-06, - "loss": 0.8354, - "step": 19548 - }, - { - "epoch": 0.5, - "learning_rate": 1.9031475734292525e-06, - "loss": 0.8457, - "step": 19549 - }, - { - "epoch": 0.5, - "learning_rate": 1.903135693320711e-06, - "loss": 0.9062, - "step": 19550 - }, - { - "epoch": 0.5, - "learning_rate": 1.9031238125206799e-06, - "loss": 1.127, - "step": 19551 - }, - { - "epoch": 0.5, - "learning_rate": 1.9031119310291689e-06, - "loss": 0.9111, - "step": 19552 - }, - { - "epoch": 0.5, - "learning_rate": 1.903100048846186e-06, - "loss": 0.7202, - "step": 19553 - }, - { - "epoch": 0.5, - "learning_rate": 1.9030881659717412e-06, - "loss": 0.645, - "step": 19554 - }, - { - "epoch": 0.5, - "learning_rate": 1.9030762824058435e-06, - "loss": 0.8369, - "step": 19555 - }, - { - "epoch": 0.5, - "learning_rate": 1.9030643981485015e-06, - "loss": 0.8159, - "step": 19556 - }, - { - "epoch": 0.5, - "learning_rate": 1.9030525131997247e-06, - "loss": 0.8711, - "step": 19557 - }, - { - "epoch": 0.5, - "learning_rate": 1.9030406275595224e-06, - "loss": 0.8621, - "step": 19558 - }, - { - "epoch": 0.5, - "learning_rate": 1.903028741227903e-06, - "loss": 0.7725, - "step": 19559 - }, - { - "epoch": 0.5, - "learning_rate": 1.903016854204876e-06, - "loss": 1.0, - "step": 19560 - }, - { - "epoch": 0.5, - "learning_rate": 1.9030049664904508e-06, - "loss": 0.8618, - "step": 19561 - }, - { - "epoch": 0.5, - "learning_rate": 1.902993078084636e-06, - "loss": 0.6665, - "step": 19562 - }, - { - "epoch": 0.5, - "learning_rate": 1.9029811889874411e-06, - "loss": 1.1064, - "step": 19563 - }, - { - "epoch": 0.5, - "learning_rate": 1.902969299198875e-06, - "loss": 1.0195, - "step": 19564 - }, - { - "epoch": 0.5, - "learning_rate": 1.9029574087189469e-06, - "loss": 0.7344, - "step": 19565 - }, - { - "epoch": 0.5, - "learning_rate": 1.902945517547666e-06, - "loss": 0.7571, - "step": 19566 - }, - { - "epoch": 0.5, - "learning_rate": 1.9029336256850406e-06, - "loss": 0.7686, - "step": 19567 - }, - { - "epoch": 0.5, - "learning_rate": 1.9029217331310807e-06, - "loss": 0.6494, - "step": 19568 - }, - { - "epoch": 0.5, - "learning_rate": 1.9029098398857955e-06, - "loss": 0.9268, - "step": 19569 - }, - { - "epoch": 0.5, - "learning_rate": 1.9028979459491935e-06, - "loss": 0.9736, - "step": 19570 - }, - { - "epoch": 0.5, - "learning_rate": 1.9028860513212842e-06, - "loss": 1.0273, - "step": 19571 - }, - { - "epoch": 0.5, - "learning_rate": 1.9028741560020762e-06, - "loss": 0.9824, - "step": 19572 - }, - { - "epoch": 0.5, - "learning_rate": 1.9028622599915791e-06, - "loss": 0.8354, - "step": 19573 - }, - { - "epoch": 0.5, - "learning_rate": 1.902850363289802e-06, - "loss": 0.876, - "step": 19574 - }, - { - "epoch": 0.5, - "learning_rate": 1.902838465896754e-06, - "loss": 1.0811, - "step": 19575 - }, - { - "epoch": 0.5, - "learning_rate": 1.9028265678124439e-06, - "loss": 0.8506, - "step": 19576 - }, - { - "epoch": 0.5, - "learning_rate": 1.902814669036881e-06, - "loss": 0.7559, - "step": 19577 - }, - { - "epoch": 0.5, - "learning_rate": 1.9028027695700746e-06, - "loss": 1.0723, - "step": 19578 - }, - { - "epoch": 0.5, - "learning_rate": 1.9027908694120335e-06, - "loss": 0.8115, - "step": 19579 - }, - { - "epoch": 0.5, - "learning_rate": 1.9027789685627672e-06, - "loss": 0.8086, - "step": 19580 - }, - { - "epoch": 0.5, - "learning_rate": 1.9027670670222843e-06, - "loss": 0.9785, - "step": 19581 - }, - { - "epoch": 0.5, - "learning_rate": 1.902755164790594e-06, - "loss": 0.918, - "step": 19582 - }, - { - "epoch": 0.5, - "learning_rate": 1.9027432618677058e-06, - "loss": 0.6802, - "step": 19583 - }, - { - "epoch": 0.5, - "learning_rate": 1.9027313582536286e-06, - "loss": 0.8506, - "step": 19584 - }, - { - "epoch": 0.5, - "learning_rate": 1.9027194539483715e-06, - "loss": 0.8633, - "step": 19585 - }, - { - "epoch": 0.5, - "learning_rate": 1.9027075489519438e-06, - "loss": 0.9463, - "step": 19586 - }, - { - "epoch": 0.5, - "learning_rate": 1.902695643264354e-06, - "loss": 0.6621, - "step": 19587 - }, - { - "epoch": 0.5, - "learning_rate": 1.9026837368856122e-06, - "loss": 0.8066, - "step": 19588 - }, - { - "epoch": 0.5, - "learning_rate": 1.9026718298157264e-06, - "loss": 0.8506, - "step": 19589 - }, - { - "epoch": 0.5, - "learning_rate": 1.9026599220547066e-06, - "loss": 0.834, - "step": 19590 - }, - { - "epoch": 0.5, - "learning_rate": 1.9026480136025615e-06, - "loss": 0.7461, - "step": 19591 - }, - { - "epoch": 0.5, - "learning_rate": 1.9026361044593005e-06, - "loss": 0.7705, - "step": 19592 - }, - { - "epoch": 0.5, - "learning_rate": 1.9026241946249323e-06, - "loss": 0.8975, - "step": 19593 - }, - { - "epoch": 0.5, - "learning_rate": 1.9026122840994665e-06, - "loss": 0.7617, - "step": 19594 - }, - { - "epoch": 0.5, - "learning_rate": 1.9026003728829117e-06, - "loss": 0.9902, - "step": 19595 - }, - { - "epoch": 0.5, - "learning_rate": 1.9025884609752776e-06, - "loss": 0.9482, - "step": 19596 - }, - { - "epoch": 0.5, - "learning_rate": 1.9025765483765727e-06, - "loss": 0.958, - "step": 19597 - }, - { - "epoch": 0.5, - "learning_rate": 1.9025646350868066e-06, - "loss": 1.0967, - "step": 19598 - }, - { - "epoch": 0.5, - "learning_rate": 1.902552721105988e-06, - "loss": 0.8721, - "step": 19599 - }, - { - "epoch": 0.5, - "learning_rate": 1.9025408064341268e-06, - "loss": 0.7822, - "step": 19600 - }, - { - "epoch": 0.5, - "learning_rate": 1.9025288910712313e-06, - "loss": 1.043, - "step": 19601 - }, - { - "epoch": 0.5, - "learning_rate": 1.902516975017311e-06, - "loss": 0.8379, - "step": 19602 - }, - { - "epoch": 0.5, - "learning_rate": 1.902505058272375e-06, - "loss": 0.8281, - "step": 19603 - }, - { - "epoch": 0.5, - "learning_rate": 1.9024931408364324e-06, - "loss": 1.0, - "step": 19604 - }, - { - "epoch": 0.5, - "learning_rate": 1.9024812227094922e-06, - "loss": 0.7642, - "step": 19605 - }, - { - "epoch": 0.5, - "learning_rate": 1.9024693038915635e-06, - "loss": 0.8457, - "step": 19606 - }, - { - "epoch": 0.5, - "learning_rate": 1.9024573843826556e-06, - "loss": 0.9854, - "step": 19607 - }, - { - "epoch": 0.5, - "learning_rate": 1.9024454641827776e-06, - "loss": 0.958, - "step": 19608 - }, - { - "epoch": 0.5, - "learning_rate": 1.9024335432919388e-06, - "loss": 1.0898, - "step": 19609 - }, - { - "epoch": 0.5, - "learning_rate": 1.9024216217101481e-06, - "loss": 0.75, - "step": 19610 - }, - { - "epoch": 0.5, - "learning_rate": 1.9024096994374145e-06, - "loss": 1.0713, - "step": 19611 - }, - { - "epoch": 0.5, - "learning_rate": 1.9023977764737474e-06, - "loss": 0.9023, - "step": 19612 - }, - { - "epoch": 0.5, - "learning_rate": 1.9023858528191557e-06, - "loss": 0.8564, - "step": 19613 - }, - { - "epoch": 0.5, - "learning_rate": 1.9023739284736486e-06, - "loss": 0.9053, - "step": 19614 - }, - { - "epoch": 0.5, - "learning_rate": 1.9023620034372353e-06, - "loss": 0.7607, - "step": 19615 - }, - { - "epoch": 0.5, - "learning_rate": 1.902350077709925e-06, - "loss": 1.002, - "step": 19616 - }, - { - "epoch": 0.5, - "learning_rate": 1.9023381512917268e-06, - "loss": 0.7197, - "step": 19617 - }, - { - "epoch": 0.5, - "learning_rate": 1.9023262241826496e-06, - "loss": 0.7227, - "step": 19618 - }, - { - "epoch": 0.5, - "learning_rate": 1.9023142963827028e-06, - "loss": 1.0479, - "step": 19619 - }, - { - "epoch": 0.5, - "learning_rate": 1.9023023678918954e-06, - "loss": 0.7656, - "step": 19620 - }, - { - "epoch": 0.5, - "learning_rate": 1.9022904387102367e-06, - "loss": 0.6504, - "step": 19621 - }, - { - "epoch": 0.5, - "learning_rate": 1.9022785088377356e-06, - "loss": 0.9546, - "step": 19622 - }, - { - "epoch": 0.5, - "learning_rate": 1.9022665782744013e-06, - "loss": 1.0117, - "step": 19623 - }, - { - "epoch": 0.5, - "learning_rate": 1.902254647020243e-06, - "loss": 0.9814, - "step": 19624 - }, - { - "epoch": 0.5, - "learning_rate": 1.9022427150752697e-06, - "loss": 0.7441, - "step": 19625 - }, - { - "epoch": 0.5, - "learning_rate": 1.9022307824394907e-06, - "loss": 0.752, - "step": 19626 - }, - { - "epoch": 0.5, - "learning_rate": 1.9022188491129153e-06, - "loss": 1.1211, - "step": 19627 - }, - { - "epoch": 0.5, - "learning_rate": 1.9022069150955523e-06, - "loss": 0.9951, - "step": 19628 - }, - { - "epoch": 0.5, - "learning_rate": 1.9021949803874106e-06, - "loss": 0.8848, - "step": 19629 - }, - { - "epoch": 0.5, - "learning_rate": 1.9021830449884998e-06, - "loss": 0.8623, - "step": 19630 - }, - { - "epoch": 0.5, - "learning_rate": 1.9021711088988292e-06, - "loss": 0.96, - "step": 19631 - }, - { - "epoch": 0.5, - "learning_rate": 1.9021591721184077e-06, - "loss": 1.0469, - "step": 19632 - }, - { - "epoch": 0.5, - "learning_rate": 1.9021472346472441e-06, - "loss": 0.9229, - "step": 19633 - }, - { - "epoch": 0.5, - "learning_rate": 1.902135296485348e-06, - "loss": 0.9395, - "step": 19634 - }, - { - "epoch": 0.5, - "learning_rate": 1.9021233576327282e-06, - "loss": 0.6885, - "step": 19635 - }, - { - "epoch": 0.5, - "learning_rate": 1.9021114180893943e-06, - "loss": 0.7764, - "step": 19636 - }, - { - "epoch": 0.5, - "learning_rate": 1.9020994778553551e-06, - "loss": 0.9834, - "step": 19637 - }, - { - "epoch": 0.5, - "learning_rate": 1.9020875369306197e-06, - "loss": 0.918, - "step": 19638 - }, - { - "epoch": 0.5, - "learning_rate": 1.9020755953151975e-06, - "loss": 1.167, - "step": 19639 - }, - { - "epoch": 0.5, - "learning_rate": 1.9020636530090975e-06, - "loss": 1.042, - "step": 19640 - }, - { - "epoch": 0.5, - "learning_rate": 1.9020517100123287e-06, - "loss": 0.9312, - "step": 19641 - }, - { - "epoch": 0.5, - "learning_rate": 1.9020397663249007e-06, - "loss": 1.0674, - "step": 19642 - }, - { - "epoch": 0.5, - "learning_rate": 1.902027821946822e-06, - "loss": 0.6543, - "step": 19643 - }, - { - "epoch": 0.5, - "learning_rate": 1.902015876878102e-06, - "loss": 0.7314, - "step": 19644 - }, - { - "epoch": 0.5, - "learning_rate": 1.9020039311187501e-06, - "loss": 0.7412, - "step": 19645 - }, - { - "epoch": 0.5, - "learning_rate": 1.9019919846687752e-06, - "loss": 0.9243, - "step": 19646 - }, - { - "epoch": 0.5, - "learning_rate": 1.9019800375281867e-06, - "loss": 1.0693, - "step": 19647 - }, - { - "epoch": 0.5, - "learning_rate": 1.9019680896969935e-06, - "loss": 0.6919, - "step": 19648 - }, - { - "epoch": 0.5, - "learning_rate": 1.9019561411752045e-06, - "loss": 0.666, - "step": 19649 - }, - { - "epoch": 0.5, - "learning_rate": 1.9019441919628294e-06, - "loss": 0.8652, - "step": 19650 - }, - { - "epoch": 0.5, - "learning_rate": 1.901932242059877e-06, - "loss": 0.8335, - "step": 19651 - }, - { - "epoch": 0.5, - "learning_rate": 1.9019202914663566e-06, - "loss": 1.0127, - "step": 19652 - }, - { - "epoch": 0.5, - "learning_rate": 1.9019083401822774e-06, - "loss": 0.665, - "step": 19653 - }, - { - "epoch": 0.5, - "learning_rate": 1.9018963882076484e-06, - "loss": 0.8994, - "step": 19654 - }, - { - "epoch": 0.5, - "learning_rate": 1.9018844355424788e-06, - "loss": 0.9521, - "step": 19655 - }, - { - "epoch": 0.5, - "learning_rate": 1.9018724821867776e-06, - "loss": 0.9785, - "step": 19656 - }, - { - "epoch": 0.5, - "learning_rate": 1.9018605281405544e-06, - "loss": 0.9297, - "step": 19657 - }, - { - "epoch": 0.5, - "learning_rate": 1.901848573403818e-06, - "loss": 0.957, - "step": 19658 - }, - { - "epoch": 0.5, - "learning_rate": 1.9018366179765772e-06, - "loss": 0.7139, - "step": 19659 - }, - { - "epoch": 0.5, - "learning_rate": 1.901824661858842e-06, - "loss": 0.9824, - "step": 19660 - }, - { - "epoch": 0.5, - "learning_rate": 1.901812705050621e-06, - "loss": 0.9541, - "step": 19661 - }, - { - "epoch": 0.5, - "learning_rate": 1.9018007475519235e-06, - "loss": 1.0059, - "step": 19662 - }, - { - "epoch": 0.5, - "learning_rate": 1.9017887893627588e-06, - "loss": 1.0264, - "step": 19663 - }, - { - "epoch": 0.5, - "learning_rate": 1.9017768304831357e-06, - "loss": 0.7031, - "step": 19664 - }, - { - "epoch": 0.5, - "learning_rate": 1.9017648709130634e-06, - "loss": 0.9658, - "step": 19665 - }, - { - "epoch": 0.5, - "learning_rate": 1.9017529106525517e-06, - "loss": 0.7822, - "step": 19666 - }, - { - "epoch": 0.5, - "learning_rate": 1.9017409497016085e-06, - "loss": 1.0674, - "step": 19667 - }, - { - "epoch": 0.5, - "learning_rate": 1.9017289880602444e-06, - "loss": 0.8945, - "step": 19668 - }, - { - "epoch": 0.5, - "learning_rate": 1.9017170257284676e-06, - "loss": 0.9141, - "step": 19669 - }, - { - "epoch": 0.5, - "learning_rate": 1.9017050627062877e-06, - "loss": 0.7949, - "step": 19670 - }, - { - "epoch": 0.5, - "learning_rate": 1.9016930989937135e-06, - "loss": 0.9033, - "step": 19671 - }, - { - "epoch": 0.5, - "learning_rate": 1.9016811345907543e-06, - "loss": 0.8247, - "step": 19672 - }, - { - "epoch": 0.5, - "learning_rate": 1.9016691694974197e-06, - "loss": 0.9619, - "step": 19673 - }, - { - "epoch": 0.5, - "learning_rate": 1.901657203713718e-06, - "loss": 0.9062, - "step": 19674 - }, - { - "epoch": 0.5, - "learning_rate": 1.901645237239659e-06, - "loss": 1.0586, - "step": 19675 - }, - { - "epoch": 0.5, - "learning_rate": 1.9016332700752518e-06, - "loss": 0.6936, - "step": 19676 - }, - { - "epoch": 0.5, - "learning_rate": 1.9016213022205055e-06, - "loss": 0.958, - "step": 19677 - }, - { - "epoch": 0.5, - "learning_rate": 1.9016093336754292e-06, - "loss": 0.8828, - "step": 19678 - }, - { - "epoch": 0.5, - "learning_rate": 1.9015973644400318e-06, - "loss": 0.8457, - "step": 19679 - }, - { - "epoch": 0.5, - "learning_rate": 1.9015853945143232e-06, - "loss": 0.7563, - "step": 19680 - }, - { - "epoch": 0.5, - "learning_rate": 1.9015734238983119e-06, - "loss": 0.7524, - "step": 19681 - }, - { - "epoch": 0.5, - "learning_rate": 1.9015614525920073e-06, - "loss": 0.8545, - "step": 19682 - }, - { - "epoch": 0.5, - "learning_rate": 1.9015494805954183e-06, - "loss": 0.6509, - "step": 19683 - }, - { - "epoch": 0.5, - "learning_rate": 1.9015375079085546e-06, - "loss": 0.876, - "step": 19684 - }, - { - "epoch": 0.5, - "learning_rate": 1.901525534531425e-06, - "loss": 0.9766, - "step": 19685 - }, - { - "epoch": 0.5, - "learning_rate": 1.901513560464039e-06, - "loss": 0.8326, - "step": 19686 - }, - { - "epoch": 0.5, - "learning_rate": 1.9015015857064052e-06, - "loss": 0.6709, - "step": 19687 - }, - { - "epoch": 0.5, - "learning_rate": 1.9014896102585332e-06, - "loss": 0.6846, - "step": 19688 - }, - { - "epoch": 0.5, - "learning_rate": 1.9014776341204319e-06, - "loss": 0.729, - "step": 19689 - }, - { - "epoch": 0.5, - "learning_rate": 1.901465657292111e-06, - "loss": 0.7009, - "step": 19690 - }, - { - "epoch": 0.5, - "learning_rate": 1.901453679773579e-06, - "loss": 0.9678, - "step": 19691 - }, - { - "epoch": 0.5, - "learning_rate": 1.9014417015648455e-06, - "loss": 0.8403, - "step": 19692 - }, - { - "epoch": 0.5, - "learning_rate": 1.9014297226659192e-06, - "loss": 0.9141, - "step": 19693 - }, - { - "epoch": 0.5, - "learning_rate": 1.9014177430768102e-06, - "loss": 0.9111, - "step": 19694 - }, - { - "epoch": 0.5, - "learning_rate": 1.9014057627975267e-06, - "loss": 0.8281, - "step": 19695 - }, - { - "epoch": 0.5, - "learning_rate": 1.9013937818280784e-06, - "loss": 0.6279, - "step": 19696 - }, - { - "epoch": 0.5, - "learning_rate": 1.9013818001684742e-06, - "loss": 0.8281, - "step": 19697 - }, - { - "epoch": 0.5, - "learning_rate": 1.9013698178187234e-06, - "loss": 0.9272, - "step": 19698 - }, - { - "epoch": 0.5, - "learning_rate": 1.9013578347788352e-06, - "loss": 0.8887, - "step": 19699 - }, - { - "epoch": 0.5, - "learning_rate": 1.9013458510488188e-06, - "loss": 1.0498, - "step": 19700 - }, - { - "epoch": 0.5, - "learning_rate": 1.9013338666286832e-06, - "loss": 1.0898, - "step": 19701 - }, - { - "epoch": 0.5, - "learning_rate": 1.901321881518438e-06, - "loss": 0.7559, - "step": 19702 - }, - { - "epoch": 0.5, - "learning_rate": 1.901309895718092e-06, - "loss": 0.9893, - "step": 19703 - }, - { - "epoch": 0.51, - "learning_rate": 1.9012979092276541e-06, - "loss": 0.9033, - "step": 19704 - }, - { - "epoch": 0.51, - "learning_rate": 1.9012859220471343e-06, - "loss": 0.6655, - "step": 19705 - }, - { - "epoch": 0.51, - "learning_rate": 1.9012739341765412e-06, - "loss": 0.689, - "step": 19706 - }, - { - "epoch": 0.51, - "learning_rate": 1.9012619456158836e-06, - "loss": 0.8135, - "step": 19707 - }, - { - "epoch": 0.51, - "learning_rate": 1.9012499563651718e-06, - "loss": 0.8105, - "step": 19708 - }, - { - "epoch": 0.51, - "learning_rate": 1.901237966424414e-06, - "loss": 0.8438, - "step": 19709 - }, - { - "epoch": 0.51, - "learning_rate": 1.9012259757936197e-06, - "loss": 0.7505, - "step": 19710 - }, - { - "epoch": 0.51, - "learning_rate": 1.9012139844727986e-06, - "loss": 0.7891, - "step": 19711 - }, - { - "epoch": 0.51, - "learning_rate": 1.901201992461959e-06, - "loss": 0.8994, - "step": 19712 - }, - { - "epoch": 0.51, - "learning_rate": 1.9011899997611103e-06, - "loss": 0.9922, - "step": 19713 - }, - { - "epoch": 0.51, - "learning_rate": 1.9011780063702622e-06, - "loss": 0.9229, - "step": 19714 - }, - { - "epoch": 0.51, - "learning_rate": 1.9011660122894234e-06, - "loss": 0.9766, - "step": 19715 - }, - { - "epoch": 0.51, - "learning_rate": 1.9011540175186032e-06, - "loss": 0.9834, - "step": 19716 - }, - { - "epoch": 0.51, - "learning_rate": 1.9011420220578107e-06, - "loss": 0.9814, - "step": 19717 - }, - { - "epoch": 0.51, - "learning_rate": 1.9011300259070553e-06, - "loss": 0.8154, - "step": 19718 - }, - { - "epoch": 0.51, - "learning_rate": 1.9011180290663461e-06, - "loss": 1.0098, - "step": 19719 - }, - { - "epoch": 0.51, - "learning_rate": 1.9011060315356923e-06, - "loss": 0.8984, - "step": 19720 - }, - { - "epoch": 0.51, - "learning_rate": 1.9010940333151032e-06, - "loss": 1.0605, - "step": 19721 - }, - { - "epoch": 0.51, - "learning_rate": 1.9010820344045876e-06, - "loss": 1.0127, - "step": 19722 - }, - { - "epoch": 0.51, - "learning_rate": 1.901070034804155e-06, - "loss": 0.8564, - "step": 19723 - }, - { - "epoch": 0.51, - "learning_rate": 1.9010580345138143e-06, - "loss": 0.917, - "step": 19724 - }, - { - "epoch": 0.51, - "learning_rate": 1.901046033533575e-06, - "loss": 0.751, - "step": 19725 - }, - { - "epoch": 0.51, - "learning_rate": 1.901034031863446e-06, - "loss": 0.9395, - "step": 19726 - }, - { - "epoch": 0.51, - "learning_rate": 1.901022029503437e-06, - "loss": 1.1064, - "step": 19727 - }, - { - "epoch": 0.51, - "learning_rate": 1.901010026453557e-06, - "loss": 0.7085, - "step": 19728 - }, - { - "epoch": 0.51, - "learning_rate": 1.9009980227138147e-06, - "loss": 0.813, - "step": 19729 - }, - { - "epoch": 0.51, - "learning_rate": 1.90098601828422e-06, - "loss": 0.9448, - "step": 19730 - }, - { - "epoch": 0.51, - "learning_rate": 1.9009740131647813e-06, - "loss": 0.9233, - "step": 19731 - }, - { - "epoch": 0.51, - "learning_rate": 1.9009620073555084e-06, - "loss": 0.8555, - "step": 19732 - }, - { - "epoch": 0.51, - "learning_rate": 1.9009500008564104e-06, - "loss": 0.9062, - "step": 19733 - }, - { - "epoch": 0.51, - "learning_rate": 1.9009379936674962e-06, - "loss": 0.8784, - "step": 19734 - }, - { - "epoch": 0.51, - "learning_rate": 1.9009259857887753e-06, - "loss": 0.7026, - "step": 19735 - }, - { - "epoch": 0.51, - "learning_rate": 1.9009139772202572e-06, - "loss": 1.0039, - "step": 19736 - }, - { - "epoch": 0.51, - "learning_rate": 1.9009019679619502e-06, - "loss": 0.8604, - "step": 19737 - }, - { - "epoch": 0.51, - "learning_rate": 1.900889958013864e-06, - "loss": 0.9521, - "step": 19738 - }, - { - "epoch": 0.51, - "learning_rate": 1.9008779473760081e-06, - "loss": 0.8525, - "step": 19739 - }, - { - "epoch": 0.51, - "learning_rate": 1.9008659360483912e-06, - "loss": 0.8096, - "step": 19740 - }, - { - "epoch": 0.51, - "learning_rate": 1.9008539240310226e-06, - "loss": 0.9443, - "step": 19741 - }, - { - "epoch": 0.51, - "learning_rate": 1.9008419113239115e-06, - "loss": 0.8301, - "step": 19742 - }, - { - "epoch": 0.51, - "learning_rate": 1.9008298979270676e-06, - "loss": 0.8848, - "step": 19743 - }, - { - "epoch": 0.51, - "learning_rate": 1.9008178838404994e-06, - "loss": 1.0625, - "step": 19744 - }, - { - "epoch": 0.51, - "learning_rate": 1.9008058690642162e-06, - "loss": 0.8408, - "step": 19745 - }, - { - "epoch": 0.51, - "learning_rate": 1.9007938535982275e-06, - "loss": 0.6865, - "step": 19746 - }, - { - "epoch": 0.51, - "learning_rate": 1.9007818374425425e-06, - "loss": 0.8296, - "step": 19747 - }, - { - "epoch": 0.51, - "learning_rate": 1.90076982059717e-06, - "loss": 0.958, - "step": 19748 - }, - { - "epoch": 0.51, - "learning_rate": 1.90075780306212e-06, - "loss": 0.9297, - "step": 19749 - }, - { - "epoch": 0.51, - "learning_rate": 1.9007457848374004e-06, - "loss": 0.8359, - "step": 19750 - }, - { - "epoch": 0.51, - "learning_rate": 1.9007337659230216e-06, - "loss": 0.874, - "step": 19751 - }, - { - "epoch": 0.51, - "learning_rate": 1.9007217463189922e-06, - "loss": 0.8486, - "step": 19752 - }, - { - "epoch": 0.51, - "learning_rate": 1.900709726025322e-06, - "loss": 1.1445, - "step": 19753 - }, - { - "epoch": 0.51, - "learning_rate": 1.9006977050420195e-06, - "loss": 0.833, - "step": 19754 - }, - { - "epoch": 0.51, - "learning_rate": 1.9006856833690939e-06, - "loss": 0.7256, - "step": 19755 - }, - { - "epoch": 0.51, - "learning_rate": 1.9006736610065551e-06, - "loss": 1.1074, - "step": 19756 - }, - { - "epoch": 0.51, - "learning_rate": 1.9006616379544119e-06, - "loss": 0.7324, - "step": 19757 - }, - { - "epoch": 0.51, - "learning_rate": 1.900649614212673e-06, - "loss": 0.7705, - "step": 19758 - }, - { - "epoch": 0.51, - "learning_rate": 1.9006375897813487e-06, - "loss": 0.8955, - "step": 19759 - }, - { - "epoch": 0.51, - "learning_rate": 1.9006255646604473e-06, - "loss": 1.084, - "step": 19760 - }, - { - "epoch": 0.51, - "learning_rate": 1.9006135388499781e-06, - "loss": 0.9902, - "step": 19761 - }, - { - "epoch": 0.51, - "learning_rate": 1.900601512349951e-06, - "loss": 0.8838, - "step": 19762 - }, - { - "epoch": 0.51, - "learning_rate": 1.9005894851603746e-06, - "loss": 0.8091, - "step": 19763 - }, - { - "epoch": 0.51, - "learning_rate": 1.900577457281258e-06, - "loss": 0.9395, - "step": 19764 - }, - { - "epoch": 0.51, - "learning_rate": 1.900565428712611e-06, - "loss": 0.8936, - "step": 19765 - }, - { - "epoch": 0.51, - "learning_rate": 1.9005533994544422e-06, - "loss": 1.0068, - "step": 19766 - }, - { - "epoch": 0.51, - "learning_rate": 1.900541369506761e-06, - "loss": 0.9668, - "step": 19767 - }, - { - "epoch": 0.51, - "learning_rate": 1.900529338869577e-06, - "loss": 1.1406, - "step": 19768 - }, - { - "epoch": 0.51, - "learning_rate": 1.9005173075428988e-06, - "loss": 0.7744, - "step": 19769 - }, - { - "epoch": 0.51, - "learning_rate": 1.9005052755267361e-06, - "loss": 0.9355, - "step": 19770 - }, - { - "epoch": 0.51, - "learning_rate": 1.9004932428210978e-06, - "loss": 0.8467, - "step": 19771 - }, - { - "epoch": 0.51, - "learning_rate": 1.9004812094259934e-06, - "loss": 0.9102, - "step": 19772 - }, - { - "epoch": 0.51, - "learning_rate": 1.9004691753414317e-06, - "loss": 1.0947, - "step": 19773 - }, - { - "epoch": 0.51, - "learning_rate": 1.9004571405674223e-06, - "loss": 0.7256, - "step": 19774 - }, - { - "epoch": 0.51, - "learning_rate": 1.9004451051039742e-06, - "loss": 0.6963, - "step": 19775 - }, - { - "epoch": 0.51, - "learning_rate": 1.9004330689510968e-06, - "loss": 0.8223, - "step": 19776 - }, - { - "epoch": 0.51, - "learning_rate": 1.9004210321087992e-06, - "loss": 0.7456, - "step": 19777 - }, - { - "epoch": 0.51, - "learning_rate": 1.9004089945770904e-06, - "loss": 0.8857, - "step": 19778 - }, - { - "epoch": 0.51, - "learning_rate": 1.90039695635598e-06, - "loss": 0.96, - "step": 19779 - }, - { - "epoch": 0.51, - "learning_rate": 1.9003849174454771e-06, - "loss": 0.8555, - "step": 19780 - }, - { - "epoch": 0.51, - "learning_rate": 1.9003728778455907e-06, - "loss": 0.8906, - "step": 19781 - }, - { - "epoch": 0.51, - "learning_rate": 1.9003608375563306e-06, - "loss": 0.8779, - "step": 19782 - }, - { - "epoch": 0.51, - "learning_rate": 1.9003487965777053e-06, - "loss": 0.7559, - "step": 19783 - }, - { - "epoch": 0.51, - "learning_rate": 1.9003367549097241e-06, - "loss": 0.8071, - "step": 19784 - }, - { - "epoch": 0.51, - "learning_rate": 1.9003247125523969e-06, - "loss": 0.7319, - "step": 19785 - }, - { - "epoch": 0.51, - "learning_rate": 1.9003126695057322e-06, - "loss": 1.0225, - "step": 19786 - }, - { - "epoch": 0.51, - "learning_rate": 1.9003006257697394e-06, - "loss": 0.9434, - "step": 19787 - }, - { - "epoch": 0.51, - "learning_rate": 1.9002885813444278e-06, - "loss": 0.5122, - "step": 19788 - }, - { - "epoch": 0.51, - "learning_rate": 1.900276536229807e-06, - "loss": 0.6187, - "step": 19789 - }, - { - "epoch": 0.51, - "learning_rate": 1.9002644904258856e-06, - "loss": 0.959, - "step": 19790 - }, - { - "epoch": 0.51, - "learning_rate": 1.900252443932673e-06, - "loss": 1.083, - "step": 19791 - }, - { - "epoch": 0.51, - "learning_rate": 1.9002403967501786e-06, - "loss": 0.7556, - "step": 19792 - }, - { - "epoch": 0.51, - "learning_rate": 1.9002283488784117e-06, - "loss": 0.8887, - "step": 19793 - }, - { - "epoch": 0.51, - "learning_rate": 1.900216300317381e-06, - "loss": 0.7729, - "step": 19794 - }, - { - "epoch": 0.51, - "learning_rate": 1.9002042510670963e-06, - "loss": 0.9541, - "step": 19795 - }, - { - "epoch": 0.51, - "learning_rate": 1.9001922011275664e-06, - "loss": 0.9443, - "step": 19796 - }, - { - "epoch": 0.51, - "learning_rate": 1.9001801504988008e-06, - "loss": 0.9834, - "step": 19797 - }, - { - "epoch": 0.51, - "learning_rate": 1.9001680991808088e-06, - "loss": 0.7705, - "step": 19798 - }, - { - "epoch": 0.51, - "learning_rate": 1.9001560471735993e-06, - "loss": 0.7988, - "step": 19799 - }, - { - "epoch": 0.51, - "learning_rate": 1.9001439944771817e-06, - "loss": 1.083, - "step": 19800 - }, - { - "epoch": 0.51, - "learning_rate": 1.9001319410915655e-06, - "loss": 0.9717, - "step": 19801 - }, - { - "epoch": 0.51, - "learning_rate": 1.9001198870167595e-06, - "loss": 0.7744, - "step": 19802 - }, - { - "epoch": 0.51, - "learning_rate": 1.9001078322527731e-06, - "loss": 0.8994, - "step": 19803 - }, - { - "epoch": 0.51, - "learning_rate": 1.9000957767996156e-06, - "loss": 0.9971, - "step": 19804 - }, - { - "epoch": 0.51, - "learning_rate": 1.900083720657296e-06, - "loss": 0.6011, - "step": 19805 - }, - { - "epoch": 0.51, - "learning_rate": 1.9000716638258237e-06, - "loss": 0.8203, - "step": 19806 - }, - { - "epoch": 0.51, - "learning_rate": 1.9000596063052078e-06, - "loss": 0.7744, - "step": 19807 - }, - { - "epoch": 0.51, - "learning_rate": 1.9000475480954576e-06, - "loss": 0.9756, - "step": 19808 - }, - { - "epoch": 0.51, - "learning_rate": 1.9000354891965827e-06, - "loss": 0.8027, - "step": 19809 - }, - { - "epoch": 0.51, - "learning_rate": 1.9000234296085917e-06, - "loss": 0.8281, - "step": 19810 - }, - { - "epoch": 0.51, - "learning_rate": 1.9000113693314945e-06, - "loss": 1.0088, - "step": 19811 - }, - { - "epoch": 0.51, - "learning_rate": 1.8999993083653e-06, - "loss": 0.8799, - "step": 19812 - }, - { - "epoch": 0.51, - "learning_rate": 1.899987246710017e-06, - "loss": 0.9746, - "step": 19813 - }, - { - "epoch": 0.51, - "learning_rate": 1.8999751843656554e-06, - "loss": 0.6807, - "step": 19814 - }, - { - "epoch": 0.51, - "learning_rate": 1.8999631213322243e-06, - "loss": 1.0205, - "step": 19815 - }, - { - "epoch": 0.51, - "learning_rate": 1.8999510576097327e-06, - "loss": 1.0713, - "step": 19816 - }, - { - "epoch": 0.51, - "learning_rate": 1.8999389931981897e-06, - "loss": 0.9014, - "step": 19817 - }, - { - "epoch": 0.51, - "learning_rate": 1.8999269280976052e-06, - "loss": 0.8926, - "step": 19818 - }, - { - "epoch": 0.51, - "learning_rate": 1.8999148623079875e-06, - "loss": 0.8506, - "step": 19819 - }, - { - "epoch": 0.51, - "learning_rate": 1.8999027958293468e-06, - "loss": 0.9492, - "step": 19820 - }, - { - "epoch": 0.51, - "learning_rate": 1.8998907286616918e-06, - "loss": 0.7583, - "step": 19821 - }, - { - "epoch": 0.51, - "learning_rate": 1.8998786608050319e-06, - "loss": 0.8643, - "step": 19822 - }, - { - "epoch": 0.51, - "learning_rate": 1.8998665922593765e-06, - "loss": 0.7891, - "step": 19823 - }, - { - "epoch": 0.51, - "learning_rate": 1.8998545230247341e-06, - "loss": 0.7734, - "step": 19824 - }, - { - "epoch": 0.51, - "learning_rate": 1.8998424531011147e-06, - "loss": 0.7329, - "step": 19825 - }, - { - "epoch": 0.51, - "learning_rate": 1.8998303824885276e-06, - "loss": 0.9482, - "step": 19826 - }, - { - "epoch": 0.51, - "learning_rate": 1.8998183111869813e-06, - "loss": 0.7275, - "step": 19827 - }, - { - "epoch": 0.51, - "learning_rate": 1.8998062391964857e-06, - "loss": 0.8271, - "step": 19828 - }, - { - "epoch": 0.51, - "learning_rate": 1.8997941665170499e-06, - "loss": 0.8252, - "step": 19829 - }, - { - "epoch": 0.51, - "learning_rate": 1.899782093148683e-06, - "loss": 0.7383, - "step": 19830 - }, - { - "epoch": 0.51, - "learning_rate": 1.8997700190913944e-06, - "loss": 0.8877, - "step": 19831 - }, - { - "epoch": 0.51, - "learning_rate": 1.8997579443451932e-06, - "loss": 0.8105, - "step": 19832 - }, - { - "epoch": 0.51, - "learning_rate": 1.8997458689100886e-06, - "loss": 0.8379, - "step": 19833 - }, - { - "epoch": 0.51, - "learning_rate": 1.8997337927860902e-06, - "loss": 0.6055, - "step": 19834 - }, - { - "epoch": 0.51, - "learning_rate": 1.8997217159732069e-06, - "loss": 0.9736, - "step": 19835 - }, - { - "epoch": 0.51, - "learning_rate": 1.899709638471448e-06, - "loss": 0.5518, - "step": 19836 - }, - { - "epoch": 0.51, - "learning_rate": 1.8996975602808228e-06, - "loss": 0.8408, - "step": 19837 - }, - { - "epoch": 0.51, - "learning_rate": 1.8996854814013405e-06, - "loss": 0.8301, - "step": 19838 - }, - { - "epoch": 0.51, - "learning_rate": 1.8996734018330107e-06, - "loss": 1.1445, - "step": 19839 - }, - { - "epoch": 0.51, - "learning_rate": 1.899661321575842e-06, - "loss": 0.8232, - "step": 19840 - }, - { - "epoch": 0.51, - "learning_rate": 1.899649240629844e-06, - "loss": 0.9453, - "step": 19841 - }, - { - "epoch": 0.51, - "learning_rate": 1.8996371589950262e-06, - "loss": 1.0146, - "step": 19842 - }, - { - "epoch": 0.51, - "learning_rate": 1.8996250766713974e-06, - "loss": 0.8564, - "step": 19843 - }, - { - "epoch": 0.51, - "learning_rate": 1.899612993658967e-06, - "loss": 0.7793, - "step": 19844 - }, - { - "epoch": 0.51, - "learning_rate": 1.8996009099577446e-06, - "loss": 0.7861, - "step": 19845 - }, - { - "epoch": 0.51, - "learning_rate": 1.899588825567739e-06, - "loss": 1.0117, - "step": 19846 - }, - { - "epoch": 0.51, - "learning_rate": 1.8995767404889596e-06, - "loss": 0.9766, - "step": 19847 - }, - { - "epoch": 0.51, - "learning_rate": 1.8995646547214155e-06, - "loss": 0.7881, - "step": 19848 - }, - { - "epoch": 0.51, - "learning_rate": 1.8995525682651161e-06, - "loss": 0.7812, - "step": 19849 - }, - { - "epoch": 0.51, - "learning_rate": 1.899540481120071e-06, - "loss": 0.9697, - "step": 19850 - }, - { - "epoch": 0.51, - "learning_rate": 1.8995283932862886e-06, - "loss": 0.8652, - "step": 19851 - }, - { - "epoch": 0.51, - "learning_rate": 1.8995163047637792e-06, - "loss": 0.8184, - "step": 19852 - }, - { - "epoch": 0.51, - "learning_rate": 1.899504215552551e-06, - "loss": 0.9277, - "step": 19853 - }, - { - "epoch": 0.51, - "learning_rate": 1.8994921256526142e-06, - "loss": 0.8428, - "step": 19854 - }, - { - "epoch": 0.51, - "learning_rate": 1.8994800350639775e-06, - "loss": 0.8379, - "step": 19855 - }, - { - "epoch": 0.51, - "learning_rate": 1.8994679437866504e-06, - "loss": 0.8008, - "step": 19856 - }, - { - "epoch": 0.51, - "learning_rate": 1.8994558518206418e-06, - "loss": 0.7822, - "step": 19857 - }, - { - "epoch": 0.51, - "learning_rate": 1.8994437591659613e-06, - "loss": 0.7646, - "step": 19858 - }, - { - "epoch": 0.51, - "learning_rate": 1.8994316658226182e-06, - "loss": 0.8525, - "step": 19859 - }, - { - "epoch": 0.51, - "learning_rate": 1.8994195717906215e-06, - "loss": 0.8828, - "step": 19860 - }, - { - "epoch": 0.51, - "learning_rate": 1.899407477069981e-06, - "loss": 0.8516, - "step": 19861 - }, - { - "epoch": 0.51, - "learning_rate": 1.8993953816607048e-06, - "loss": 0.9873, - "step": 19862 - }, - { - "epoch": 0.51, - "learning_rate": 1.8993832855628034e-06, - "loss": 0.9355, - "step": 19863 - }, - { - "epoch": 0.51, - "learning_rate": 1.8993711887762856e-06, - "loss": 0.9814, - "step": 19864 - }, - { - "epoch": 0.51, - "learning_rate": 1.8993590913011604e-06, - "loss": 1.1123, - "step": 19865 - }, - { - "epoch": 0.51, - "learning_rate": 1.8993469931374375e-06, - "loss": 0.6426, - "step": 19866 - }, - { - "epoch": 0.51, - "learning_rate": 1.899334894285126e-06, - "loss": 0.7759, - "step": 19867 - }, - { - "epoch": 0.51, - "learning_rate": 1.899322794744235e-06, - "loss": 0.8457, - "step": 19868 - }, - { - "epoch": 0.51, - "learning_rate": 1.899310694514774e-06, - "loss": 0.9736, - "step": 19869 - }, - { - "epoch": 0.51, - "learning_rate": 1.899298593596752e-06, - "loss": 1.0049, - "step": 19870 - }, - { - "epoch": 0.51, - "learning_rate": 1.8992864919901783e-06, - "loss": 0.7983, - "step": 19871 - }, - { - "epoch": 0.51, - "learning_rate": 1.8992743896950625e-06, - "loss": 0.9268, - "step": 19872 - }, - { - "epoch": 0.51, - "learning_rate": 1.8992622867114136e-06, - "loss": 0.8965, - "step": 19873 - }, - { - "epoch": 0.51, - "learning_rate": 1.899250183039241e-06, - "loss": 0.8936, - "step": 19874 - }, - { - "epoch": 0.51, - "learning_rate": 1.8992380786785539e-06, - "loss": 0.7397, - "step": 19875 - }, - { - "epoch": 0.51, - "learning_rate": 1.8992259736293614e-06, - "loss": 0.9248, - "step": 19876 - }, - { - "epoch": 0.51, - "learning_rate": 1.8992138678916726e-06, - "loss": 0.873, - "step": 19877 - }, - { - "epoch": 0.51, - "learning_rate": 1.8992017614654979e-06, - "loss": 0.8521, - "step": 19878 - }, - { - "epoch": 0.51, - "learning_rate": 1.8991896543508452e-06, - "loss": 0.8467, - "step": 19879 - }, - { - "epoch": 0.51, - "learning_rate": 1.8991775465477241e-06, - "loss": 0.6895, - "step": 19880 - }, - { - "epoch": 0.51, - "learning_rate": 1.8991654380561447e-06, - "loss": 0.8467, - "step": 19881 - }, - { - "epoch": 0.51, - "learning_rate": 1.8991533288761155e-06, - "loss": 0.8125, - "step": 19882 - }, - { - "epoch": 0.51, - "learning_rate": 1.8991412190076458e-06, - "loss": 0.5681, - "step": 19883 - }, - { - "epoch": 0.51, - "learning_rate": 1.899129108450745e-06, - "loss": 0.8711, - "step": 19884 - }, - { - "epoch": 0.51, - "learning_rate": 1.8991169972054223e-06, - "loss": 0.8994, - "step": 19885 - }, - { - "epoch": 0.51, - "learning_rate": 1.8991048852716873e-06, - "loss": 0.918, - "step": 19886 - }, - { - "epoch": 0.51, - "learning_rate": 1.8990927726495491e-06, - "loss": 0.7832, - "step": 19887 - }, - { - "epoch": 0.51, - "learning_rate": 1.8990806593390167e-06, - "loss": 0.6689, - "step": 19888 - }, - { - "epoch": 0.51, - "learning_rate": 1.8990685453400995e-06, - "loss": 0.6709, - "step": 19889 - }, - { - "epoch": 0.51, - "learning_rate": 1.899056430652807e-06, - "loss": 0.9912, - "step": 19890 - }, - { - "epoch": 0.51, - "learning_rate": 1.8990443152771482e-06, - "loss": 0.8047, - "step": 19891 - }, - { - "epoch": 0.51, - "learning_rate": 1.8990321992131327e-06, - "loss": 0.751, - "step": 19892 - }, - { - "epoch": 0.51, - "learning_rate": 1.8990200824607696e-06, - "loss": 0.665, - "step": 19893 - }, - { - "epoch": 0.51, - "learning_rate": 1.8990079650200678e-06, - "loss": 0.7578, - "step": 19894 - }, - { - "epoch": 0.51, - "learning_rate": 1.8989958468910375e-06, - "loss": 1.0244, - "step": 19895 - }, - { - "epoch": 0.51, - "learning_rate": 1.898983728073687e-06, - "loss": 0.7427, - "step": 19896 - }, - { - "epoch": 0.51, - "learning_rate": 1.898971608568026e-06, - "loss": 0.9229, - "step": 19897 - }, - { - "epoch": 0.51, - "learning_rate": 1.898959488374064e-06, - "loss": 0.8535, - "step": 19898 - }, - { - "epoch": 0.51, - "learning_rate": 1.89894736749181e-06, - "loss": 0.9893, - "step": 19899 - }, - { - "epoch": 0.51, - "learning_rate": 1.8989352459212733e-06, - "loss": 0.8037, - "step": 19900 - }, - { - "epoch": 0.51, - "learning_rate": 1.8989231236624633e-06, - "loss": 1.0527, - "step": 19901 - }, - { - "epoch": 0.51, - "learning_rate": 1.898911000715389e-06, - "loss": 0.9531, - "step": 19902 - }, - { - "epoch": 0.51, - "learning_rate": 1.89889887708006e-06, - "loss": 1.0176, - "step": 19903 - }, - { - "epoch": 0.51, - "learning_rate": 1.8988867527564853e-06, - "loss": 0.9141, - "step": 19904 - }, - { - "epoch": 0.51, - "learning_rate": 1.8988746277446746e-06, - "loss": 0.7354, - "step": 19905 - }, - { - "epoch": 0.51, - "learning_rate": 1.8988625020446368e-06, - "loss": 0.6763, - "step": 19906 - }, - { - "epoch": 0.51, - "learning_rate": 1.8988503756563813e-06, - "loss": 0.834, - "step": 19907 - }, - { - "epoch": 0.51, - "learning_rate": 1.8988382485799175e-06, - "loss": 0.8018, - "step": 19908 - }, - { - "epoch": 0.51, - "learning_rate": 1.8988261208152542e-06, - "loss": 1.0625, - "step": 19909 - }, - { - "epoch": 0.51, - "learning_rate": 1.8988139923624016e-06, - "loss": 0.832, - "step": 19910 - }, - { - "epoch": 0.51, - "learning_rate": 1.8988018632213683e-06, - "loss": 0.8652, - "step": 19911 - }, - { - "epoch": 0.51, - "learning_rate": 1.8987897333921636e-06, - "loss": 0.8865, - "step": 19912 - }, - { - "epoch": 0.51, - "learning_rate": 1.898777602874797e-06, - "loss": 0.8477, - "step": 19913 - }, - { - "epoch": 0.51, - "learning_rate": 1.8987654716692775e-06, - "loss": 0.9775, - "step": 19914 - }, - { - "epoch": 0.51, - "learning_rate": 1.898753339775615e-06, - "loss": 0.7153, - "step": 19915 - }, - { - "epoch": 0.51, - "learning_rate": 1.8987412071938183e-06, - "loss": 0.6531, - "step": 19916 - }, - { - "epoch": 0.51, - "learning_rate": 1.8987290739238966e-06, - "loss": 0.823, - "step": 19917 - }, - { - "epoch": 0.51, - "learning_rate": 1.8987169399658595e-06, - "loss": 0.8555, - "step": 19918 - }, - { - "epoch": 0.51, - "learning_rate": 1.898704805319716e-06, - "loss": 1.0811, - "step": 19919 - }, - { - "epoch": 0.51, - "learning_rate": 1.8986926699854757e-06, - "loss": 0.8613, - "step": 19920 - }, - { - "epoch": 0.51, - "learning_rate": 1.8986805339631478e-06, - "loss": 0.6919, - "step": 19921 - }, - { - "epoch": 0.51, - "learning_rate": 1.8986683972527415e-06, - "loss": 0.9199, - "step": 19922 - }, - { - "epoch": 0.51, - "learning_rate": 1.898656259854266e-06, - "loss": 0.791, - "step": 19923 - }, - { - "epoch": 0.51, - "learning_rate": 1.898644121767731e-06, - "loss": 0.8955, - "step": 19924 - }, - { - "epoch": 0.51, - "learning_rate": 1.898631982993145e-06, - "loss": 0.9189, - "step": 19925 - }, - { - "epoch": 0.51, - "learning_rate": 1.8986198435305183e-06, - "loss": 1.0938, - "step": 19926 - }, - { - "epoch": 0.51, - "learning_rate": 1.8986077033798596e-06, - "loss": 0.8799, - "step": 19927 - }, - { - "epoch": 0.51, - "learning_rate": 1.8985955625411782e-06, - "loss": 0.7744, - "step": 19928 - }, - { - "epoch": 0.51, - "learning_rate": 1.8985834210144836e-06, - "loss": 0.8262, - "step": 19929 - }, - { - "epoch": 0.51, - "learning_rate": 1.898571278799785e-06, - "loss": 0.8613, - "step": 19930 - }, - { - "epoch": 0.51, - "learning_rate": 1.8985591358970913e-06, - "loss": 0.8447, - "step": 19931 - }, - { - "epoch": 0.51, - "learning_rate": 1.8985469923064126e-06, - "loss": 0.8184, - "step": 19932 - }, - { - "epoch": 0.51, - "learning_rate": 1.8985348480277578e-06, - "loss": 0.8887, - "step": 19933 - }, - { - "epoch": 0.51, - "learning_rate": 1.898522703061136e-06, - "loss": 0.8408, - "step": 19934 - }, - { - "epoch": 0.51, - "learning_rate": 1.8985105574065567e-06, - "loss": 1.0234, - "step": 19935 - }, - { - "epoch": 0.51, - "learning_rate": 1.8984984110640295e-06, - "loss": 0.7588, - "step": 19936 - }, - { - "epoch": 0.51, - "learning_rate": 1.898486264033563e-06, - "loss": 0.9688, - "step": 19937 - }, - { - "epoch": 0.51, - "learning_rate": 1.898474116315167e-06, - "loss": 0.7534, - "step": 19938 - }, - { - "epoch": 0.51, - "learning_rate": 1.8984619679088508e-06, - "loss": 0.7725, - "step": 19939 - }, - { - "epoch": 0.51, - "learning_rate": 1.8984498188146233e-06, - "loss": 0.916, - "step": 19940 - }, - { - "epoch": 0.51, - "learning_rate": 1.8984376690324944e-06, - "loss": 0.7188, - "step": 19941 - }, - { - "epoch": 0.51, - "learning_rate": 1.898425518562473e-06, - "loss": 0.8447, - "step": 19942 - }, - { - "epoch": 0.51, - "learning_rate": 1.8984133674045683e-06, - "loss": 0.7773, - "step": 19943 - }, - { - "epoch": 0.51, - "learning_rate": 1.8984012155587901e-06, - "loss": 0.7656, - "step": 19944 - }, - { - "epoch": 0.51, - "learning_rate": 1.898389063025147e-06, - "loss": 0.6611, - "step": 19945 - }, - { - "epoch": 0.51, - "learning_rate": 1.898376909803649e-06, - "loss": 0.7339, - "step": 19946 - }, - { - "epoch": 0.51, - "learning_rate": 1.898364755894305e-06, - "loss": 0.7026, - "step": 19947 - }, - { - "epoch": 0.51, - "learning_rate": 1.8983526012971246e-06, - "loss": 0.8447, - "step": 19948 - }, - { - "epoch": 0.51, - "learning_rate": 1.8983404460121167e-06, - "loss": 0.8984, - "step": 19949 - }, - { - "epoch": 0.51, - "learning_rate": 1.898328290039291e-06, - "loss": 0.6226, - "step": 19950 - }, - { - "epoch": 0.51, - "learning_rate": 1.8983161333786564e-06, - "loss": 0.6196, - "step": 19951 - }, - { - "epoch": 0.51, - "learning_rate": 1.8983039760302227e-06, - "loss": 0.8809, - "step": 19952 - }, - { - "epoch": 0.51, - "learning_rate": 1.8982918179939986e-06, - "loss": 0.832, - "step": 19953 - }, - { - "epoch": 0.51, - "learning_rate": 1.8982796592699942e-06, - "loss": 0.7349, - "step": 19954 - }, - { - "epoch": 0.51, - "learning_rate": 1.898267499858218e-06, - "loss": 0.8486, - "step": 19955 - }, - { - "epoch": 0.51, - "learning_rate": 1.89825533975868e-06, - "loss": 0.9951, - "step": 19956 - }, - { - "epoch": 0.51, - "learning_rate": 1.898243178971389e-06, - "loss": 0.8662, - "step": 19957 - }, - { - "epoch": 0.51, - "learning_rate": 1.8982310174963546e-06, - "loss": 1.0605, - "step": 19958 - }, - { - "epoch": 0.51, - "learning_rate": 1.898218855333586e-06, - "loss": 0.8125, - "step": 19959 - }, - { - "epoch": 0.51, - "learning_rate": 1.8982066924830921e-06, - "loss": 0.8545, - "step": 19960 - }, - { - "epoch": 0.51, - "learning_rate": 1.898194528944883e-06, - "loss": 0.709, - "step": 19961 - }, - { - "epoch": 0.51, - "learning_rate": 1.8981823647189676e-06, - "loss": 0.7036, - "step": 19962 - }, - { - "epoch": 0.51, - "learning_rate": 1.8981701998053556e-06, - "loss": 0.9121, - "step": 19963 - }, - { - "epoch": 0.51, - "learning_rate": 1.8981580342040554e-06, - "loss": 0.8271, - "step": 19964 - }, - { - "epoch": 0.51, - "learning_rate": 1.8981458679150776e-06, - "loss": 0.9902, - "step": 19965 - }, - { - "epoch": 0.51, - "learning_rate": 1.89813370093843e-06, - "loss": 0.9873, - "step": 19966 - }, - { - "epoch": 0.51, - "learning_rate": 1.8981215332741231e-06, - "loss": 0.8496, - "step": 19967 - }, - { - "epoch": 0.51, - "learning_rate": 1.898109364922166e-06, - "loss": 1.0869, - "step": 19968 - }, - { - "epoch": 0.51, - "learning_rate": 1.8980971958825679e-06, - "loss": 0.7637, - "step": 19969 - }, - { - "epoch": 0.51, - "learning_rate": 1.8980850261553378e-06, - "loss": 0.9346, - "step": 19970 - }, - { - "epoch": 0.51, - "learning_rate": 1.8980728557404853e-06, - "loss": 0.7275, - "step": 19971 - }, - { - "epoch": 0.51, - "learning_rate": 1.8980606846380195e-06, - "loss": 1.1094, - "step": 19972 - }, - { - "epoch": 0.51, - "learning_rate": 1.8980485128479504e-06, - "loss": 0.6514, - "step": 19973 - }, - { - "epoch": 0.51, - "learning_rate": 1.8980363403702868e-06, - "loss": 0.7949, - "step": 19974 - }, - { - "epoch": 0.51, - "learning_rate": 1.8980241672050376e-06, - "loss": 0.9551, - "step": 19975 - }, - { - "epoch": 0.51, - "learning_rate": 1.898011993352213e-06, - "loss": 0.7461, - "step": 19976 - }, - { - "epoch": 0.51, - "learning_rate": 1.8979998188118218e-06, - "loss": 1.2812, - "step": 19977 - }, - { - "epoch": 0.51, - "learning_rate": 1.8979876435838738e-06, - "loss": 1.0479, - "step": 19978 - }, - { - "epoch": 0.51, - "learning_rate": 1.8979754676683775e-06, - "loss": 0.9922, - "step": 19979 - }, - { - "epoch": 0.51, - "learning_rate": 1.8979632910653427e-06, - "loss": 0.9268, - "step": 19980 - }, - { - "epoch": 0.51, - "learning_rate": 1.8979511137747788e-06, - "loss": 0.7837, - "step": 19981 - }, - { - "epoch": 0.51, - "learning_rate": 1.8979389357966948e-06, - "loss": 1.0332, - "step": 19982 - }, - { - "epoch": 0.51, - "learning_rate": 1.8979267571311004e-06, - "loss": 0.7559, - "step": 19983 - }, - { - "epoch": 0.51, - "learning_rate": 1.897914577778005e-06, - "loss": 0.916, - "step": 19984 - }, - { - "epoch": 0.51, - "learning_rate": 1.8979023977374173e-06, - "loss": 0.999, - "step": 19985 - }, - { - "epoch": 0.51, - "learning_rate": 1.8978902170093473e-06, - "loss": 0.8105, - "step": 19986 - }, - { - "epoch": 0.51, - "learning_rate": 1.8978780355938039e-06, - "loss": 0.8105, - "step": 19987 - }, - { - "epoch": 0.51, - "learning_rate": 1.8978658534907967e-06, - "loss": 0.835, - "step": 19988 - }, - { - "epoch": 0.51, - "learning_rate": 1.8978536707003348e-06, - "loss": 0.8926, - "step": 19989 - }, - { - "epoch": 0.51, - "learning_rate": 1.8978414872224278e-06, - "loss": 0.8921, - "step": 19990 - }, - { - "epoch": 0.51, - "learning_rate": 1.8978293030570847e-06, - "loss": 1.1992, - "step": 19991 - }, - { - "epoch": 0.51, - "learning_rate": 1.897817118204315e-06, - "loss": 0.7827, - "step": 19992 - }, - { - "epoch": 0.51, - "learning_rate": 1.8978049326641278e-06, - "loss": 0.9873, - "step": 19993 - }, - { - "epoch": 0.51, - "learning_rate": 1.897792746436533e-06, - "loss": 0.8467, - "step": 19994 - }, - { - "epoch": 0.51, - "learning_rate": 1.8977805595215395e-06, - "loss": 0.8555, - "step": 19995 - }, - { - "epoch": 0.51, - "learning_rate": 1.8977683719191567e-06, - "loss": 0.5861, - "step": 19996 - }, - { - "epoch": 0.51, - "learning_rate": 1.897756183629394e-06, - "loss": 0.6868, - "step": 19997 - }, - { - "epoch": 0.51, - "learning_rate": 1.8977439946522605e-06, - "loss": 0.9434, - "step": 19998 - }, - { - "epoch": 0.51, - "learning_rate": 1.8977318049877658e-06, - "loss": 0.9844, - "step": 19999 - }, - { - "epoch": 0.51, - "learning_rate": 1.897719614635919e-06, - "loss": 0.8027, - "step": 20000 - }, - { - "epoch": 0.51, - "learning_rate": 1.8977074235967296e-06, - "loss": 0.8154, - "step": 20001 - }, - { - "epoch": 0.51, - "learning_rate": 1.8976952318702072e-06, - "loss": 0.6533, - "step": 20002 - }, - { - "epoch": 0.51, - "learning_rate": 1.8976830394563606e-06, - "loss": 0.605, - "step": 20003 - }, - { - "epoch": 0.51, - "learning_rate": 1.8976708463551994e-06, - "loss": 0.7998, - "step": 20004 - }, - { - "epoch": 0.51, - "learning_rate": 1.8976586525667328e-06, - "loss": 0.9082, - "step": 20005 - }, - { - "epoch": 0.51, - "learning_rate": 1.8976464580909703e-06, - "loss": 0.9551, - "step": 20006 - }, - { - "epoch": 0.51, - "learning_rate": 1.8976342629279212e-06, - "loss": 0.9365, - "step": 20007 - }, - { - "epoch": 0.51, - "learning_rate": 1.897622067077595e-06, - "loss": 0.8857, - "step": 20008 - }, - { - "epoch": 0.51, - "learning_rate": 1.8976098705400005e-06, - "loss": 0.9668, - "step": 20009 - }, - { - "epoch": 0.51, - "learning_rate": 1.8975976733151477e-06, - "loss": 0.6353, - "step": 20010 - }, - { - "epoch": 0.51, - "learning_rate": 1.8975854754030456e-06, - "loss": 0.999, - "step": 20011 - }, - { - "epoch": 0.51, - "learning_rate": 1.8975732768037033e-06, - "loss": 0.9863, - "step": 20012 - }, - { - "epoch": 0.51, - "learning_rate": 1.8975610775171308e-06, - "loss": 0.8193, - "step": 20013 - }, - { - "epoch": 0.51, - "learning_rate": 1.8975488775433367e-06, - "loss": 0.8691, - "step": 20014 - }, - { - "epoch": 0.51, - "learning_rate": 1.8975366768823308e-06, - "loss": 0.7695, - "step": 20015 - }, - { - "epoch": 0.51, - "learning_rate": 1.8975244755341225e-06, - "loss": 0.917, - "step": 20016 - }, - { - "epoch": 0.51, - "learning_rate": 1.8975122734987207e-06, - "loss": 0.6836, - "step": 20017 - }, - { - "epoch": 0.51, - "learning_rate": 1.8975000707761355e-06, - "loss": 0.8076, - "step": 20018 - }, - { - "epoch": 0.51, - "learning_rate": 1.8974878673663754e-06, - "loss": 0.7068, - "step": 20019 - }, - { - "epoch": 0.51, - "learning_rate": 1.89747566326945e-06, - "loss": 0.9436, - "step": 20020 - }, - { - "epoch": 0.51, - "learning_rate": 1.897463458485369e-06, - "loss": 0.9131, - "step": 20021 - }, - { - "epoch": 0.51, - "learning_rate": 1.8974512530141414e-06, - "loss": 0.8389, - "step": 20022 - }, - { - "epoch": 0.51, - "learning_rate": 1.8974390468557769e-06, - "loss": 0.6782, - "step": 20023 - }, - { - "epoch": 0.51, - "learning_rate": 1.8974268400102842e-06, - "loss": 0.7725, - "step": 20024 - }, - { - "epoch": 0.51, - "learning_rate": 1.8974146324776732e-06, - "loss": 0.8896, - "step": 20025 - }, - { - "epoch": 0.51, - "learning_rate": 1.897402424257953e-06, - "loss": 0.6895, - "step": 20026 - }, - { - "epoch": 0.51, - "learning_rate": 1.897390215351133e-06, - "loss": 0.8789, - "step": 20027 - }, - { - "epoch": 0.51, - "learning_rate": 1.8973780057572229e-06, - "loss": 0.874, - "step": 20028 - }, - { - "epoch": 0.51, - "learning_rate": 1.8973657954762313e-06, - "loss": 0.8896, - "step": 20029 - }, - { - "epoch": 0.51, - "learning_rate": 1.8973535845081683e-06, - "loss": 0.6989, - "step": 20030 - }, - { - "epoch": 0.51, - "learning_rate": 1.8973413728530426e-06, - "loss": 0.8555, - "step": 20031 - }, - { - "epoch": 0.51, - "learning_rate": 1.8973291605108641e-06, - "loss": 0.751, - "step": 20032 - }, - { - "epoch": 0.51, - "learning_rate": 1.897316947481642e-06, - "loss": 1.0449, - "step": 20033 - }, - { - "epoch": 0.51, - "learning_rate": 1.8973047337653853e-06, - "loss": 0.876, - "step": 20034 - }, - { - "epoch": 0.51, - "learning_rate": 1.8972925193621037e-06, - "loss": 0.8301, - "step": 20035 - }, - { - "epoch": 0.51, - "learning_rate": 1.8972803042718067e-06, - "loss": 0.9463, - "step": 20036 - }, - { - "epoch": 0.51, - "learning_rate": 1.8972680884945032e-06, - "loss": 0.9883, - "step": 20037 - }, - { - "epoch": 0.51, - "learning_rate": 1.897255872030203e-06, - "loss": 0.9863, - "step": 20038 - }, - { - "epoch": 0.51, - "learning_rate": 1.897243654878915e-06, - "loss": 0.7764, - "step": 20039 - }, - { - "epoch": 0.51, - "learning_rate": 1.897231437040649e-06, - "loss": 1.0479, - "step": 20040 - }, - { - "epoch": 0.51, - "learning_rate": 1.897219218515414e-06, - "loss": 1.0176, - "step": 20041 - }, - { - "epoch": 0.51, - "learning_rate": 1.8972069993032193e-06, - "loss": 0.7524, - "step": 20042 - }, - { - "epoch": 0.51, - "learning_rate": 1.8971947794040748e-06, - "loss": 0.6997, - "step": 20043 - }, - { - "epoch": 0.51, - "learning_rate": 1.8971825588179895e-06, - "loss": 0.9697, - "step": 20044 - }, - { - "epoch": 0.51, - "learning_rate": 1.8971703375449726e-06, - "loss": 0.8896, - "step": 20045 - }, - { - "epoch": 0.51, - "learning_rate": 1.8971581155850336e-06, - "loss": 0.8574, - "step": 20046 - }, - { - "epoch": 0.51, - "learning_rate": 1.897145892938182e-06, - "loss": 0.7617, - "step": 20047 - }, - { - "epoch": 0.51, - "learning_rate": 1.8971336696044271e-06, - "loss": 0.843, - "step": 20048 - }, - { - "epoch": 0.51, - "learning_rate": 1.897121445583778e-06, - "loss": 0.959, - "step": 20049 - }, - { - "epoch": 0.51, - "learning_rate": 1.8971092208762446e-06, - "loss": 0.9287, - "step": 20050 - }, - { - "epoch": 0.51, - "learning_rate": 1.8970969954818353e-06, - "loss": 0.8271, - "step": 20051 - }, - { - "epoch": 0.51, - "learning_rate": 1.8970847694005607e-06, - "loss": 0.8325, - "step": 20052 - }, - { - "epoch": 0.51, - "learning_rate": 1.8970725426324293e-06, - "loss": 0.7544, - "step": 20053 - }, - { - "epoch": 0.51, - "learning_rate": 1.8970603151774506e-06, - "loss": 0.7891, - "step": 20054 - }, - { - "epoch": 0.51, - "learning_rate": 1.8970480870356345e-06, - "loss": 0.8682, - "step": 20055 - }, - { - "epoch": 0.51, - "learning_rate": 1.8970358582069895e-06, - "loss": 0.8584, - "step": 20056 - }, - { - "epoch": 0.51, - "learning_rate": 1.8970236286915253e-06, - "loss": 0.7705, - "step": 20057 - }, - { - "epoch": 0.51, - "learning_rate": 1.8970113984892518e-06, - "loss": 0.7861, - "step": 20058 - }, - { - "epoch": 0.51, - "learning_rate": 1.8969991676001775e-06, - "loss": 0.8408, - "step": 20059 - }, - { - "epoch": 0.51, - "learning_rate": 1.8969869360243122e-06, - "loss": 0.6069, - "step": 20060 - }, - { - "epoch": 0.51, - "learning_rate": 1.8969747037616654e-06, - "loss": 1.165, - "step": 20061 - }, - { - "epoch": 0.51, - "learning_rate": 1.8969624708122464e-06, - "loss": 0.8291, - "step": 20062 - }, - { - "epoch": 0.51, - "learning_rate": 1.8969502371760645e-06, - "loss": 0.8389, - "step": 20063 - }, - { - "epoch": 0.51, - "learning_rate": 1.896938002853129e-06, - "loss": 0.8975, - "step": 20064 - }, - { - "epoch": 0.51, - "learning_rate": 1.8969257678434491e-06, - "loss": 1.0566, - "step": 20065 - }, - { - "epoch": 0.51, - "learning_rate": 1.8969135321470347e-06, - "loss": 1.0889, - "step": 20066 - }, - { - "epoch": 0.51, - "learning_rate": 1.8969012957638945e-06, - "loss": 0.7451, - "step": 20067 - }, - { - "epoch": 0.51, - "learning_rate": 1.8968890586940386e-06, - "loss": 0.707, - "step": 20068 - }, - { - "epoch": 0.51, - "learning_rate": 1.8968768209374757e-06, - "loss": 1.0703, - "step": 20069 - }, - { - "epoch": 0.51, - "learning_rate": 1.8968645824942156e-06, - "loss": 0.9087, - "step": 20070 - }, - { - "epoch": 0.51, - "learning_rate": 1.8968523433642676e-06, - "loss": 0.874, - "step": 20071 - }, - { - "epoch": 0.51, - "learning_rate": 1.8968401035476408e-06, - "loss": 1.1104, - "step": 20072 - }, - { - "epoch": 0.51, - "learning_rate": 1.8968278630443449e-06, - "loss": 0.6699, - "step": 20073 - }, - { - "epoch": 0.51, - "learning_rate": 1.896815621854389e-06, - "loss": 0.9561, - "step": 20074 - }, - { - "epoch": 0.51, - "learning_rate": 1.8968033799777827e-06, - "loss": 1.1758, - "step": 20075 - }, - { - "epoch": 0.51, - "learning_rate": 1.896791137414535e-06, - "loss": 0.8525, - "step": 20076 - }, - { - "epoch": 0.51, - "learning_rate": 1.896778894164656e-06, - "loss": 0.9805, - "step": 20077 - }, - { - "epoch": 0.51, - "learning_rate": 1.8967666502281548e-06, - "loss": 0.7178, - "step": 20078 - }, - { - "epoch": 0.51, - "learning_rate": 1.8967544056050402e-06, - "loss": 0.8462, - "step": 20079 - }, - { - "epoch": 0.51, - "learning_rate": 1.8967421602953219e-06, - "loss": 0.7153, - "step": 20080 - }, - { - "epoch": 0.51, - "learning_rate": 1.8967299142990097e-06, - "loss": 0.8623, - "step": 20081 - }, - { - "epoch": 0.51, - "learning_rate": 1.8967176676161123e-06, - "loss": 1.1016, - "step": 20082 - }, - { - "epoch": 0.51, - "learning_rate": 1.8967054202466396e-06, - "loss": 1.0195, - "step": 20083 - }, - { - "epoch": 0.51, - "learning_rate": 1.8966931721906008e-06, - "loss": 0.873, - "step": 20084 - }, - { - "epoch": 0.51, - "learning_rate": 1.8966809234480054e-06, - "loss": 0.9014, - "step": 20085 - }, - { - "epoch": 0.51, - "learning_rate": 1.8966686740188624e-06, - "loss": 0.6331, - "step": 20086 - }, - { - "epoch": 0.51, - "learning_rate": 1.8966564239031815e-06, - "loss": 0.9512, - "step": 20087 - }, - { - "epoch": 0.51, - "learning_rate": 1.896644173100972e-06, - "loss": 0.8877, - "step": 20088 - }, - { - "epoch": 0.51, - "learning_rate": 1.8966319216122435e-06, - "loss": 0.9971, - "step": 20089 - }, - { - "epoch": 0.51, - "learning_rate": 1.896619669437005e-06, - "loss": 0.8301, - "step": 20090 - }, - { - "epoch": 0.51, - "learning_rate": 1.896607416575266e-06, - "loss": 0.9844, - "step": 20091 - }, - { - "epoch": 0.51, - "learning_rate": 1.896595163027036e-06, - "loss": 0.9736, - "step": 20092 - }, - { - "epoch": 0.51, - "learning_rate": 1.8965829087923242e-06, - "loss": 1.0, - "step": 20093 - }, - { - "epoch": 0.52, - "learning_rate": 1.89657065387114e-06, - "loss": 0.772, - "step": 20094 - }, - { - "epoch": 0.52, - "learning_rate": 1.8965583982634932e-06, - "loss": 0.8994, - "step": 20095 - }, - { - "epoch": 0.52, - "learning_rate": 1.8965461419693927e-06, - "loss": 0.8545, - "step": 20096 - }, - { - "epoch": 0.52, - "learning_rate": 1.8965338849888481e-06, - "loss": 0.8906, - "step": 20097 - }, - { - "epoch": 0.52, - "learning_rate": 1.8965216273218685e-06, - "loss": 1.0498, - "step": 20098 - }, - { - "epoch": 0.52, - "learning_rate": 1.8965093689684637e-06, - "loss": 0.9326, - "step": 20099 - }, - { - "epoch": 0.52, - "learning_rate": 1.896497109928643e-06, - "loss": 0.7324, - "step": 20100 - }, - { - "epoch": 0.52, - "learning_rate": 1.8964848502024155e-06, - "loss": 0.8516, - "step": 20101 - }, - { - "epoch": 0.52, - "learning_rate": 1.8964725897897908e-06, - "loss": 0.7061, - "step": 20102 - }, - { - "epoch": 0.52, - "learning_rate": 1.8964603286907783e-06, - "loss": 0.9346, - "step": 20103 - }, - { - "epoch": 0.52, - "learning_rate": 1.8964480669053872e-06, - "loss": 0.8652, - "step": 20104 - }, - { - "epoch": 0.52, - "learning_rate": 1.8964358044336275e-06, - "loss": 0.7993, - "step": 20105 - }, - { - "epoch": 0.52, - "learning_rate": 1.8964235412755078e-06, - "loss": 0.9912, - "step": 20106 - }, - { - "epoch": 0.52, - "learning_rate": 1.8964112774310376e-06, - "loss": 0.9717, - "step": 20107 - }, - { - "epoch": 0.52, - "learning_rate": 1.8963990129002268e-06, - "loss": 0.833, - "step": 20108 - }, - { - "epoch": 0.52, - "learning_rate": 1.8963867476830843e-06, - "loss": 0.5178, - "step": 20109 - }, - { - "epoch": 0.52, - "learning_rate": 1.89637448177962e-06, - "loss": 0.8643, - "step": 20110 - }, - { - "epoch": 0.52, - "learning_rate": 1.8963622151898425e-06, - "loss": 0.9854, - "step": 20111 - }, - { - "epoch": 0.52, - "learning_rate": 1.8963499479137622e-06, - "loss": 0.8416, - "step": 20112 - }, - { - "epoch": 0.52, - "learning_rate": 1.8963376799513878e-06, - "loss": 0.8389, - "step": 20113 - }, - { - "epoch": 0.52, - "learning_rate": 1.8963254113027286e-06, - "loss": 0.6963, - "step": 20114 - }, - { - "epoch": 0.52, - "learning_rate": 1.8963131419677945e-06, - "loss": 0.9736, - "step": 20115 - }, - { - "epoch": 0.52, - "learning_rate": 1.8963008719465945e-06, - "loss": 1.001, - "step": 20116 - }, - { - "epoch": 0.52, - "learning_rate": 1.8962886012391382e-06, - "loss": 0.96, - "step": 20117 - }, - { - "epoch": 0.52, - "learning_rate": 1.896276329845435e-06, - "loss": 0.793, - "step": 20118 - }, - { - "epoch": 0.52, - "learning_rate": 1.896264057765494e-06, - "loss": 1.0107, - "step": 20119 - }, - { - "epoch": 0.52, - "learning_rate": 1.896251784999325e-06, - "loss": 0.856, - "step": 20120 - }, - { - "epoch": 0.52, - "learning_rate": 1.8962395115469372e-06, - "loss": 0.9131, - "step": 20121 - }, - { - "epoch": 0.52, - "learning_rate": 1.89622723740834e-06, - "loss": 0.6365, - "step": 20122 - }, - { - "epoch": 0.52, - "learning_rate": 1.8962149625835426e-06, - "loss": 0.6987, - "step": 20123 - }, - { - "epoch": 0.52, - "learning_rate": 1.896202687072555e-06, - "loss": 0.8223, - "step": 20124 - }, - { - "epoch": 0.52, - "learning_rate": 1.896190410875386e-06, - "loss": 0.6948, - "step": 20125 - }, - { - "epoch": 0.52, - "learning_rate": 1.8961781339920453e-06, - "loss": 0.7305, - "step": 20126 - }, - { - "epoch": 0.52, - "learning_rate": 1.896165856422542e-06, - "loss": 0.8857, - "step": 20127 - }, - { - "epoch": 0.52, - "learning_rate": 1.8961535781668857e-06, - "loss": 0.8545, - "step": 20128 - }, - { - "epoch": 0.52, - "learning_rate": 1.8961412992250862e-06, - "loss": 0.7744, - "step": 20129 - }, - { - "epoch": 0.52, - "learning_rate": 1.8961290195971524e-06, - "loss": 0.7686, - "step": 20130 - }, - { - "epoch": 0.52, - "learning_rate": 1.8961167392830934e-06, - "loss": 0.9736, - "step": 20131 - }, - { - "epoch": 0.52, - "learning_rate": 1.8961044582829196e-06, - "loss": 0.8145, - "step": 20132 - }, - { - "epoch": 0.52, - "learning_rate": 1.8960921765966394e-06, - "loss": 0.9912, - "step": 20133 - }, - { - "epoch": 0.52, - "learning_rate": 1.8960798942242628e-06, - "loss": 0.6943, - "step": 20134 - }, - { - "epoch": 0.52, - "learning_rate": 1.8960676111657992e-06, - "loss": 1.1729, - "step": 20135 - }, - { - "epoch": 0.52, - "learning_rate": 1.8960553274212574e-06, - "loss": 0.9834, - "step": 20136 - }, - { - "epoch": 0.52, - "learning_rate": 1.8960430429906476e-06, - "loss": 0.9336, - "step": 20137 - }, - { - "epoch": 0.52, - "learning_rate": 1.8960307578739788e-06, - "loss": 0.7827, - "step": 20138 - }, - { - "epoch": 0.52, - "learning_rate": 1.89601847207126e-06, - "loss": 0.9648, - "step": 20139 - }, - { - "epoch": 0.52, - "learning_rate": 1.8960061855825016e-06, - "loss": 0.8066, - "step": 20140 - }, - { - "epoch": 0.52, - "learning_rate": 1.8959938984077121e-06, - "loss": 0.8271, - "step": 20141 - }, - { - "epoch": 0.52, - "learning_rate": 1.8959816105469016e-06, - "loss": 0.8457, - "step": 20142 - }, - { - "epoch": 0.52, - "learning_rate": 1.895969322000079e-06, - "loss": 0.9541, - "step": 20143 - }, - { - "epoch": 0.52, - "learning_rate": 1.8959570327672538e-06, - "loss": 0.9854, - "step": 20144 - }, - { - "epoch": 0.52, - "learning_rate": 1.8959447428484357e-06, - "loss": 0.9209, - "step": 20145 - }, - { - "epoch": 0.52, - "learning_rate": 1.8959324522436337e-06, - "loss": 0.9365, - "step": 20146 - }, - { - "epoch": 0.52, - "learning_rate": 1.8959201609528576e-06, - "loss": 0.7178, - "step": 20147 - }, - { - "epoch": 0.52, - "learning_rate": 1.8959078689761166e-06, - "loss": 0.9053, - "step": 20148 - }, - { - "epoch": 0.52, - "learning_rate": 1.8958955763134202e-06, - "loss": 0.6382, - "step": 20149 - }, - { - "epoch": 0.52, - "learning_rate": 1.8958832829647776e-06, - "loss": 0.9707, - "step": 20150 - }, - { - "epoch": 0.52, - "learning_rate": 1.8958709889301984e-06, - "loss": 1.0264, - "step": 20151 - }, - { - "epoch": 0.52, - "learning_rate": 1.895858694209692e-06, - "loss": 0.9902, - "step": 20152 - }, - { - "epoch": 0.52, - "learning_rate": 1.895846398803268e-06, - "loss": 0.9102, - "step": 20153 - }, - { - "epoch": 0.52, - "learning_rate": 1.895834102710935e-06, - "loss": 0.9053, - "step": 20154 - }, - { - "epoch": 0.52, - "learning_rate": 1.8958218059327035e-06, - "loss": 0.7617, - "step": 20155 - }, - { - "epoch": 0.52, - "learning_rate": 1.8958095084685823e-06, - "loss": 0.9102, - "step": 20156 - }, - { - "epoch": 0.52, - "learning_rate": 1.8957972103185811e-06, - "loss": 1.0195, - "step": 20157 - }, - { - "epoch": 0.52, - "learning_rate": 1.8957849114827092e-06, - "loss": 0.8262, - "step": 20158 - }, - { - "epoch": 0.52, - "learning_rate": 1.8957726119609756e-06, - "loss": 0.9639, - "step": 20159 - }, - { - "epoch": 0.52, - "learning_rate": 1.8957603117533903e-06, - "loss": 0.6511, - "step": 20160 - }, - { - "epoch": 0.52, - "learning_rate": 1.8957480108599627e-06, - "loss": 0.7217, - "step": 20161 - }, - { - "epoch": 0.52, - "learning_rate": 1.8957357092807018e-06, - "loss": 1.1113, - "step": 20162 - }, - { - "epoch": 0.52, - "learning_rate": 1.8957234070156174e-06, - "loss": 0.8096, - "step": 20163 - }, - { - "epoch": 0.52, - "learning_rate": 1.8957111040647188e-06, - "loss": 0.8477, - "step": 20164 - }, - { - "epoch": 0.52, - "learning_rate": 1.8956988004280153e-06, - "loss": 0.8896, - "step": 20165 - }, - { - "epoch": 0.52, - "learning_rate": 1.8956864961055164e-06, - "loss": 0.8809, - "step": 20166 - }, - { - "epoch": 0.52, - "learning_rate": 1.8956741910972313e-06, - "loss": 0.8271, - "step": 20167 - }, - { - "epoch": 0.52, - "learning_rate": 1.8956618854031701e-06, - "loss": 0.915, - "step": 20168 - }, - { - "epoch": 0.52, - "learning_rate": 1.8956495790233415e-06, - "loss": 0.8672, - "step": 20169 - }, - { - "epoch": 0.52, - "learning_rate": 1.8956372719577553e-06, - "loss": 0.8984, - "step": 20170 - }, - { - "epoch": 0.52, - "learning_rate": 1.8956249642064211e-06, - "loss": 0.9678, - "step": 20171 - }, - { - "epoch": 0.52, - "learning_rate": 1.8956126557693475e-06, - "loss": 0.7847, - "step": 20172 - }, - { - "epoch": 0.52, - "learning_rate": 1.8956003466465446e-06, - "loss": 0.875, - "step": 20173 - }, - { - "epoch": 0.52, - "learning_rate": 1.895588036838022e-06, - "loss": 0.6167, - "step": 20174 - }, - { - "epoch": 0.52, - "learning_rate": 1.8955757263437886e-06, - "loss": 0.8857, - "step": 20175 - }, - { - "epoch": 0.52, - "learning_rate": 1.8955634151638541e-06, - "loss": 0.9658, - "step": 20176 - }, - { - "epoch": 0.52, - "learning_rate": 1.8955511032982279e-06, - "loss": 0.6895, - "step": 20177 - }, - { - "epoch": 0.52, - "learning_rate": 1.8955387907469194e-06, - "loss": 1.0791, - "step": 20178 - }, - { - "epoch": 0.52, - "learning_rate": 1.895526477509938e-06, - "loss": 0.6855, - "step": 20179 - }, - { - "epoch": 0.52, - "learning_rate": 1.8955141635872932e-06, - "loss": 0.8691, - "step": 20180 - }, - { - "epoch": 0.52, - "learning_rate": 1.8955018489789941e-06, - "loss": 0.6688, - "step": 20181 - }, - { - "epoch": 0.52, - "learning_rate": 1.8954895336850507e-06, - "loss": 1.0527, - "step": 20182 - }, - { - "epoch": 0.52, - "learning_rate": 1.8954772177054723e-06, - "loss": 0.7251, - "step": 20183 - }, - { - "epoch": 0.52, - "learning_rate": 1.8954649010402677e-06, - "loss": 0.7473, - "step": 20184 - }, - { - "epoch": 0.52, - "learning_rate": 1.895452583689447e-06, - "loss": 0.7646, - "step": 20185 - }, - { - "epoch": 0.52, - "learning_rate": 1.8954402656530198e-06, - "loss": 0.8584, - "step": 20186 - }, - { - "epoch": 0.52, - "learning_rate": 1.8954279469309947e-06, - "loss": 0.7471, - "step": 20187 - }, - { - "epoch": 0.52, - "learning_rate": 1.8954156275233816e-06, - "loss": 0.9531, - "step": 20188 - }, - { - "epoch": 0.52, - "learning_rate": 1.89540330743019e-06, - "loss": 0.606, - "step": 20189 - }, - { - "epoch": 0.52, - "learning_rate": 1.8953909866514295e-06, - "loss": 0.8691, - "step": 20190 - }, - { - "epoch": 0.52, - "learning_rate": 1.895378665187109e-06, - "loss": 0.6387, - "step": 20191 - }, - { - "epoch": 0.52, - "learning_rate": 1.8953663430372386e-06, - "loss": 0.8398, - "step": 20192 - }, - { - "epoch": 0.52, - "learning_rate": 1.895354020201827e-06, - "loss": 0.8867, - "step": 20193 - }, - { - "epoch": 0.52, - "learning_rate": 1.8953416966808842e-06, - "loss": 0.7227, - "step": 20194 - }, - { - "epoch": 0.52, - "learning_rate": 1.8953293724744193e-06, - "loss": 0.7305, - "step": 20195 - }, - { - "epoch": 0.52, - "learning_rate": 1.8953170475824419e-06, - "loss": 1.0215, - "step": 20196 - }, - { - "epoch": 0.52, - "learning_rate": 1.8953047220049614e-06, - "loss": 0.7432, - "step": 20197 - }, - { - "epoch": 0.52, - "learning_rate": 1.895292395741987e-06, - "loss": 0.6797, - "step": 20198 - }, - { - "epoch": 0.52, - "learning_rate": 1.8952800687935286e-06, - "loss": 0.7812, - "step": 20199 - }, - { - "epoch": 0.52, - "learning_rate": 1.8952677411595957e-06, - "loss": 1.0938, - "step": 20200 - }, - { - "epoch": 0.52, - "learning_rate": 1.895255412840197e-06, - "loss": 1.0254, - "step": 20201 - }, - { - "epoch": 0.52, - "learning_rate": 1.8952430838353428e-06, - "loss": 0.6963, - "step": 20202 - }, - { - "epoch": 0.52, - "learning_rate": 1.895230754145042e-06, - "loss": 0.792, - "step": 20203 - }, - { - "epoch": 0.52, - "learning_rate": 1.8952184237693038e-06, - "loss": 0.7959, - "step": 20204 - }, - { - "epoch": 0.52, - "learning_rate": 1.8952060927081383e-06, - "loss": 1.0117, - "step": 20205 - }, - { - "epoch": 0.52, - "learning_rate": 1.8951937609615549e-06, - "loss": 0.748, - "step": 20206 - }, - { - "epoch": 0.52, - "learning_rate": 1.8951814285295625e-06, - "loss": 0.8389, - "step": 20207 - }, - { - "epoch": 0.52, - "learning_rate": 1.895169095412171e-06, - "loss": 0.8579, - "step": 20208 - }, - { - "epoch": 0.52, - "learning_rate": 1.8951567616093896e-06, - "loss": 0.5725, - "step": 20209 - }, - { - "epoch": 0.52, - "learning_rate": 1.8951444271212278e-06, - "loss": 1.1738, - "step": 20210 - }, - { - "epoch": 0.52, - "learning_rate": 1.8951320919476949e-06, - "loss": 0.8945, - "step": 20211 - }, - { - "epoch": 0.52, - "learning_rate": 1.8951197560888008e-06, - "loss": 0.8076, - "step": 20212 - }, - { - "epoch": 0.52, - "learning_rate": 1.8951074195445547e-06, - "loss": 0.8164, - "step": 20213 - }, - { - "epoch": 0.52, - "learning_rate": 1.8950950823149658e-06, - "loss": 0.7229, - "step": 20214 - }, - { - "epoch": 0.52, - "learning_rate": 1.8950827444000439e-06, - "loss": 0.8853, - "step": 20215 - }, - { - "epoch": 0.52, - "learning_rate": 1.8950704057997981e-06, - "loss": 0.7622, - "step": 20216 - }, - { - "epoch": 0.52, - "learning_rate": 1.8950580665142382e-06, - "loss": 0.686, - "step": 20217 - }, - { - "epoch": 0.52, - "learning_rate": 1.8950457265433735e-06, - "loss": 0.8325, - "step": 20218 - }, - { - "epoch": 0.52, - "learning_rate": 1.8950333858872134e-06, - "loss": 0.9893, - "step": 20219 - }, - { - "epoch": 0.52, - "learning_rate": 1.8950210445457674e-06, - "loss": 0.6885, - "step": 20220 - }, - { - "epoch": 0.52, - "learning_rate": 1.895008702519045e-06, - "loss": 0.9824, - "step": 20221 - }, - { - "epoch": 0.52, - "learning_rate": 1.8949963598070556e-06, - "loss": 0.7559, - "step": 20222 - }, - { - "epoch": 0.52, - "learning_rate": 1.8949840164098086e-06, - "loss": 0.9131, - "step": 20223 - }, - { - "epoch": 0.52, - "learning_rate": 1.8949716723273134e-06, - "loss": 1.0078, - "step": 20224 - }, - { - "epoch": 0.52, - "learning_rate": 1.8949593275595796e-06, - "loss": 0.8799, - "step": 20225 - }, - { - "epoch": 0.52, - "learning_rate": 1.8949469821066167e-06, - "loss": 0.8022, - "step": 20226 - }, - { - "epoch": 0.52, - "learning_rate": 1.894934635968434e-06, - "loss": 0.8096, - "step": 20227 - }, - { - "epoch": 0.52, - "learning_rate": 1.894922289145041e-06, - "loss": 0.8467, - "step": 20228 - }, - { - "epoch": 0.52, - "learning_rate": 1.8949099416364472e-06, - "loss": 1.0117, - "step": 20229 - }, - { - "epoch": 0.52, - "learning_rate": 1.8948975934426619e-06, - "loss": 0.9727, - "step": 20230 - }, - { - "epoch": 0.52, - "learning_rate": 1.8948852445636944e-06, - "loss": 0.9082, - "step": 20231 - }, - { - "epoch": 0.52, - "learning_rate": 1.8948728949995548e-06, - "loss": 0.4658, - "step": 20232 - }, - { - "epoch": 0.52, - "learning_rate": 1.8948605447502519e-06, - "loss": 0.7393, - "step": 20233 - }, - { - "epoch": 0.52, - "learning_rate": 1.894848193815796e-06, - "loss": 0.957, - "step": 20234 - }, - { - "epoch": 0.52, - "learning_rate": 1.8948358421961953e-06, - "loss": 0.6929, - "step": 20235 - }, - { - "epoch": 0.52, - "learning_rate": 1.8948234898914603e-06, - "loss": 1.0703, - "step": 20236 - }, - { - "epoch": 0.52, - "learning_rate": 1.8948111369016e-06, - "loss": 0.9058, - "step": 20237 - }, - { - "epoch": 0.52, - "learning_rate": 1.8947987832266239e-06, - "loss": 0.8267, - "step": 20238 - }, - { - "epoch": 0.52, - "learning_rate": 1.8947864288665415e-06, - "loss": 0.8071, - "step": 20239 - }, - { - "epoch": 0.52, - "learning_rate": 1.8947740738213625e-06, - "loss": 0.7646, - "step": 20240 - }, - { - "epoch": 0.52, - "learning_rate": 1.894761718091096e-06, - "loss": 0.8877, - "step": 20241 - }, - { - "epoch": 0.52, - "learning_rate": 1.8947493616757515e-06, - "loss": 0.7402, - "step": 20242 - }, - { - "epoch": 0.52, - "learning_rate": 1.8947370045753389e-06, - "loss": 0.7993, - "step": 20243 - }, - { - "epoch": 0.52, - "learning_rate": 1.894724646789867e-06, - "loss": 0.9658, - "step": 20244 - }, - { - "epoch": 0.52, - "learning_rate": 1.8947122883193455e-06, - "loss": 0.7046, - "step": 20245 - }, - { - "epoch": 0.52, - "learning_rate": 1.894699929163784e-06, - "loss": 0.915, - "step": 20246 - }, - { - "epoch": 0.52, - "learning_rate": 1.8946875693231924e-06, - "loss": 0.959, - "step": 20247 - }, - { - "epoch": 0.52, - "learning_rate": 1.894675208797579e-06, - "loss": 0.7695, - "step": 20248 - }, - { - "epoch": 0.52, - "learning_rate": 1.894662847586954e-06, - "loss": 0.9688, - "step": 20249 - }, - { - "epoch": 0.52, - "learning_rate": 1.894650485691327e-06, - "loss": 0.918, - "step": 20250 - }, - { - "epoch": 0.52, - "learning_rate": 1.8946381231107074e-06, - "loss": 0.9023, - "step": 20251 - }, - { - "epoch": 0.52, - "learning_rate": 1.8946257598451042e-06, - "loss": 0.7153, - "step": 20252 - }, - { - "epoch": 0.52, - "learning_rate": 1.8946133958945274e-06, - "loss": 0.7939, - "step": 20253 - }, - { - "epoch": 0.52, - "learning_rate": 1.8946010312589861e-06, - "loss": 1.1436, - "step": 20254 - }, - { - "epoch": 0.52, - "learning_rate": 1.8945886659384902e-06, - "loss": 0.9434, - "step": 20255 - }, - { - "epoch": 0.52, - "learning_rate": 1.8945762999330489e-06, - "loss": 0.8369, - "step": 20256 - }, - { - "epoch": 0.52, - "learning_rate": 1.8945639332426713e-06, - "loss": 1.0312, - "step": 20257 - }, - { - "epoch": 0.52, - "learning_rate": 1.8945515658673674e-06, - "loss": 0.7734, - "step": 20258 - }, - { - "epoch": 0.52, - "learning_rate": 1.8945391978071466e-06, - "loss": 0.8682, - "step": 20259 - }, - { - "epoch": 0.52, - "learning_rate": 1.8945268290620183e-06, - "loss": 0.7275, - "step": 20260 - }, - { - "epoch": 0.52, - "learning_rate": 1.8945144596319917e-06, - "loss": 0.842, - "step": 20261 - }, - { - "epoch": 0.52, - "learning_rate": 1.8945020895170769e-06, - "loss": 0.8301, - "step": 20262 - }, - { - "epoch": 0.52, - "learning_rate": 1.8944897187172825e-06, - "loss": 0.9463, - "step": 20263 - }, - { - "epoch": 0.52, - "learning_rate": 1.8944773472326187e-06, - "loss": 1.0732, - "step": 20264 - }, - { - "epoch": 0.52, - "learning_rate": 1.8944649750630948e-06, - "loss": 0.792, - "step": 20265 - }, - { - "epoch": 0.52, - "learning_rate": 1.89445260220872e-06, - "loss": 0.8965, - "step": 20266 - }, - { - "epoch": 0.52, - "learning_rate": 1.894440228669504e-06, - "loss": 0.6323, - "step": 20267 - }, - { - "epoch": 0.52, - "learning_rate": 1.8944278544454564e-06, - "loss": 0.7603, - "step": 20268 - }, - { - "epoch": 0.52, - "learning_rate": 1.8944154795365862e-06, - "loss": 0.6909, - "step": 20269 - }, - { - "epoch": 0.52, - "learning_rate": 1.8944031039429037e-06, - "loss": 0.8516, - "step": 20270 - }, - { - "epoch": 0.52, - "learning_rate": 1.8943907276644175e-06, - "loss": 0.9346, - "step": 20271 - }, - { - "epoch": 0.52, - "learning_rate": 1.8943783507011375e-06, - "loss": 1.0449, - "step": 20272 - }, - { - "epoch": 0.52, - "learning_rate": 1.8943659730530731e-06, - "loss": 0.6333, - "step": 20273 - }, - { - "epoch": 0.52, - "learning_rate": 1.894353594720234e-06, - "loss": 0.9961, - "step": 20274 - }, - { - "epoch": 0.52, - "learning_rate": 1.8943412157026292e-06, - "loss": 0.8555, - "step": 20275 - }, - { - "epoch": 0.52, - "learning_rate": 1.8943288360002687e-06, - "loss": 0.8105, - "step": 20276 - }, - { - "epoch": 0.52, - "learning_rate": 1.8943164556131617e-06, - "loss": 0.8389, - "step": 20277 - }, - { - "epoch": 0.52, - "learning_rate": 1.8943040745413176e-06, - "loss": 0.832, - "step": 20278 - }, - { - "epoch": 0.52, - "learning_rate": 1.894291692784746e-06, - "loss": 0.832, - "step": 20279 - }, - { - "epoch": 0.52, - "learning_rate": 1.8942793103434563e-06, - "loss": 1.0244, - "step": 20280 - }, - { - "epoch": 0.52, - "learning_rate": 1.8942669272174583e-06, - "loss": 0.7744, - "step": 20281 - }, - { - "epoch": 0.52, - "learning_rate": 1.8942545434067609e-06, - "loss": 1.1143, - "step": 20282 - }, - { - "epoch": 0.52, - "learning_rate": 1.8942421589113743e-06, - "loss": 0.9736, - "step": 20283 - }, - { - "epoch": 0.52, - "learning_rate": 1.8942297737313072e-06, - "loss": 0.9258, - "step": 20284 - }, - { - "epoch": 0.52, - "learning_rate": 1.8942173878665696e-06, - "loss": 0.8989, - "step": 20285 - }, - { - "epoch": 0.52, - "learning_rate": 1.8942050013171711e-06, - "loss": 0.749, - "step": 20286 - }, - { - "epoch": 0.52, - "learning_rate": 1.8941926140831205e-06, - "loss": 0.729, - "step": 20287 - }, - { - "epoch": 0.52, - "learning_rate": 1.8941802261644284e-06, - "loss": 0.9199, - "step": 20288 - }, - { - "epoch": 0.52, - "learning_rate": 1.894167837561103e-06, - "loss": 0.8477, - "step": 20289 - }, - { - "epoch": 0.52, - "learning_rate": 1.8941554482731548e-06, - "loss": 0.6738, - "step": 20290 - }, - { - "epoch": 0.52, - "learning_rate": 1.8941430583005926e-06, - "loss": 0.7339, - "step": 20291 - }, - { - "epoch": 0.52, - "learning_rate": 1.8941306676434263e-06, - "loss": 0.8157, - "step": 20292 - }, - { - "epoch": 0.52, - "learning_rate": 1.8941182763016653e-06, - "loss": 0.9219, - "step": 20293 - }, - { - "epoch": 0.52, - "learning_rate": 1.8941058842753191e-06, - "loss": 0.8916, - "step": 20294 - }, - { - "epoch": 0.52, - "learning_rate": 1.894093491564397e-06, - "loss": 0.7676, - "step": 20295 - }, - { - "epoch": 0.52, - "learning_rate": 1.8940810981689086e-06, - "loss": 0.9736, - "step": 20296 - }, - { - "epoch": 0.52, - "learning_rate": 1.8940687040888635e-06, - "loss": 1.0898, - "step": 20297 - }, - { - "epoch": 0.52, - "learning_rate": 1.894056309324271e-06, - "loss": 0.8491, - "step": 20298 - }, - { - "epoch": 0.52, - "learning_rate": 1.8940439138751408e-06, - "loss": 0.7695, - "step": 20299 - }, - { - "epoch": 0.52, - "learning_rate": 1.8940315177414823e-06, - "loss": 0.6924, - "step": 20300 - }, - { - "epoch": 0.52, - "learning_rate": 1.8940191209233048e-06, - "loss": 0.8457, - "step": 20301 - }, - { - "epoch": 0.52, - "learning_rate": 1.894006723420618e-06, - "loss": 1.0225, - "step": 20302 - }, - { - "epoch": 0.52, - "learning_rate": 1.8939943252334317e-06, - "loss": 0.8506, - "step": 20303 - }, - { - "epoch": 0.52, - "learning_rate": 1.893981926361755e-06, - "loss": 0.793, - "step": 20304 - }, - { - "epoch": 0.52, - "learning_rate": 1.8939695268055971e-06, - "loss": 0.8701, - "step": 20305 - }, - { - "epoch": 0.52, - "learning_rate": 1.8939571265649681e-06, - "loss": 0.6436, - "step": 20306 - }, - { - "epoch": 0.52, - "learning_rate": 1.8939447256398768e-06, - "loss": 0.877, - "step": 20307 - }, - { - "epoch": 0.52, - "learning_rate": 1.8939323240303334e-06, - "loss": 0.8799, - "step": 20308 - }, - { - "epoch": 0.52, - "learning_rate": 1.8939199217363475e-06, - "loss": 0.8799, - "step": 20309 - }, - { - "epoch": 0.52, - "learning_rate": 1.8939075187579276e-06, - "loss": 0.9795, - "step": 20310 - }, - { - "epoch": 0.52, - "learning_rate": 1.893895115095084e-06, - "loss": 1.0752, - "step": 20311 - }, - { - "epoch": 0.52, - "learning_rate": 1.8938827107478263e-06, - "loss": 0.8867, - "step": 20312 - }, - { - "epoch": 0.52, - "learning_rate": 1.8938703057161635e-06, - "loss": 0.9873, - "step": 20313 - }, - { - "epoch": 0.52, - "learning_rate": 1.8938579000001056e-06, - "loss": 0.9629, - "step": 20314 - }, - { - "epoch": 0.52, - "learning_rate": 1.8938454935996616e-06, - "loss": 1.0137, - "step": 20315 - }, - { - "epoch": 0.52, - "learning_rate": 1.8938330865148412e-06, - "loss": 0.9414, - "step": 20316 - }, - { - "epoch": 0.52, - "learning_rate": 1.8938206787456537e-06, - "loss": 0.917, - "step": 20317 - }, - { - "epoch": 0.52, - "learning_rate": 1.893808270292109e-06, - "loss": 0.9883, - "step": 20318 - }, - { - "epoch": 0.52, - "learning_rate": 1.8937958611542164e-06, - "loss": 0.9971, - "step": 20319 - }, - { - "epoch": 0.52, - "learning_rate": 1.8937834513319854e-06, - "loss": 1.0029, - "step": 20320 - }, - { - "epoch": 0.52, - "learning_rate": 1.8937710408254255e-06, - "loss": 0.5774, - "step": 20321 - }, - { - "epoch": 0.52, - "learning_rate": 1.8937586296345462e-06, - "loss": 0.8486, - "step": 20322 - }, - { - "epoch": 0.52, - "learning_rate": 1.8937462177593568e-06, - "loss": 1.248, - "step": 20323 - }, - { - "epoch": 0.52, - "learning_rate": 1.8937338051998675e-06, - "loss": 0.8701, - "step": 20324 - }, - { - "epoch": 0.52, - "learning_rate": 1.893721391956087e-06, - "loss": 1.1572, - "step": 20325 - }, - { - "epoch": 0.52, - "learning_rate": 1.893708978028025e-06, - "loss": 0.8125, - "step": 20326 - }, - { - "epoch": 0.52, - "learning_rate": 1.8936965634156917e-06, - "loss": 0.7163, - "step": 20327 - }, - { - "epoch": 0.52, - "learning_rate": 1.8936841481190954e-06, - "loss": 0.9121, - "step": 20328 - }, - { - "epoch": 0.52, - "learning_rate": 1.8936717321382465e-06, - "loss": 1.084, - "step": 20329 - }, - { - "epoch": 0.52, - "learning_rate": 1.8936593154731542e-06, - "loss": 0.686, - "step": 20330 - }, - { - "epoch": 0.52, - "learning_rate": 1.893646898123828e-06, - "loss": 0.834, - "step": 20331 - }, - { - "epoch": 0.52, - "learning_rate": 1.8936344800902777e-06, - "loss": 0.8535, - "step": 20332 - }, - { - "epoch": 0.52, - "learning_rate": 1.8936220613725124e-06, - "loss": 0.7881, - "step": 20333 - }, - { - "epoch": 0.52, - "learning_rate": 1.8936096419705417e-06, - "loss": 0.6045, - "step": 20334 - }, - { - "epoch": 0.52, - "learning_rate": 1.8935972218843754e-06, - "loss": 0.9795, - "step": 20335 - }, - { - "epoch": 0.52, - "learning_rate": 1.8935848011140227e-06, - "loss": 0.8965, - "step": 20336 - }, - { - "epoch": 0.52, - "learning_rate": 1.8935723796594931e-06, - "loss": 0.812, - "step": 20337 - }, - { - "epoch": 0.52, - "learning_rate": 1.8935599575207962e-06, - "loss": 0.7939, - "step": 20338 - }, - { - "epoch": 0.52, - "learning_rate": 1.8935475346979416e-06, - "loss": 0.959, - "step": 20339 - }, - { - "epoch": 0.52, - "learning_rate": 1.893535111190939e-06, - "loss": 0.7456, - "step": 20340 - }, - { - "epoch": 0.52, - "learning_rate": 1.8935226869997973e-06, - "loss": 0.9707, - "step": 20341 - }, - { - "epoch": 0.52, - "learning_rate": 1.8935102621245265e-06, - "loss": 1.1318, - "step": 20342 - }, - { - "epoch": 0.52, - "learning_rate": 1.8934978365651359e-06, - "loss": 0.8506, - "step": 20343 - }, - { - "epoch": 0.52, - "learning_rate": 1.8934854103216353e-06, - "loss": 0.8193, - "step": 20344 - }, - { - "epoch": 0.52, - "learning_rate": 1.8934729833940337e-06, - "loss": 0.7188, - "step": 20345 - }, - { - "epoch": 0.52, - "learning_rate": 1.8934605557823411e-06, - "loss": 1.0215, - "step": 20346 - }, - { - "epoch": 0.52, - "learning_rate": 1.8934481274865668e-06, - "loss": 0.9062, - "step": 20347 - }, - { - "epoch": 0.52, - "learning_rate": 1.8934356985067204e-06, - "loss": 0.9346, - "step": 20348 - }, - { - "epoch": 0.52, - "learning_rate": 1.8934232688428114e-06, - "loss": 1.0039, - "step": 20349 - }, - { - "epoch": 0.52, - "learning_rate": 1.893410838494849e-06, - "loss": 0.6313, - "step": 20350 - }, - { - "epoch": 0.52, - "learning_rate": 1.8933984074628434e-06, - "loss": 0.917, - "step": 20351 - }, - { - "epoch": 0.52, - "learning_rate": 1.8933859757468033e-06, - "loss": 0.9229, - "step": 20352 - }, - { - "epoch": 0.52, - "learning_rate": 1.893373543346739e-06, - "loss": 0.9492, - "step": 20353 - }, - { - "epoch": 0.52, - "learning_rate": 1.8933611102626595e-06, - "loss": 0.6069, - "step": 20354 - }, - { - "epoch": 0.52, - "learning_rate": 1.8933486764945746e-06, - "loss": 0.7773, - "step": 20355 - }, - { - "epoch": 0.52, - "learning_rate": 1.8933362420424934e-06, - "loss": 0.6558, - "step": 20356 - }, - { - "epoch": 0.52, - "learning_rate": 1.8933238069064262e-06, - "loss": 1.0557, - "step": 20357 - }, - { - "epoch": 0.52, - "learning_rate": 1.8933113710863815e-06, - "loss": 0.9111, - "step": 20358 - }, - { - "epoch": 0.52, - "learning_rate": 1.8932989345823698e-06, - "loss": 0.8516, - "step": 20359 - }, - { - "epoch": 0.52, - "learning_rate": 1.8932864973944e-06, - "loss": 0.832, - "step": 20360 - }, - { - "epoch": 0.52, - "learning_rate": 1.8932740595224814e-06, - "loss": 1.0264, - "step": 20361 - }, - { - "epoch": 0.52, - "learning_rate": 1.8932616209666245e-06, - "loss": 0.7485, - "step": 20362 - }, - { - "epoch": 0.52, - "learning_rate": 1.893249181726838e-06, - "loss": 1.0146, - "step": 20363 - }, - { - "epoch": 0.52, - "learning_rate": 1.8932367418031318e-06, - "loss": 0.8132, - "step": 20364 - }, - { - "epoch": 0.52, - "learning_rate": 1.8932243011955152e-06, - "loss": 1.0127, - "step": 20365 - }, - { - "epoch": 0.52, - "learning_rate": 1.8932118599039979e-06, - "loss": 0.7288, - "step": 20366 - }, - { - "epoch": 0.52, - "learning_rate": 1.8931994179285893e-06, - "loss": 0.8076, - "step": 20367 - }, - { - "epoch": 0.52, - "learning_rate": 1.893186975269299e-06, - "loss": 0.7334, - "step": 20368 - }, - { - "epoch": 0.52, - "learning_rate": 1.8931745319261365e-06, - "loss": 0.8076, - "step": 20369 - }, - { - "epoch": 0.52, - "learning_rate": 1.8931620878991112e-06, - "loss": 1.1562, - "step": 20370 - }, - { - "epoch": 0.52, - "learning_rate": 1.893149643188233e-06, - "loss": 0.8633, - "step": 20371 - }, - { - "epoch": 0.52, - "learning_rate": 1.8931371977935111e-06, - "loss": 0.7827, - "step": 20372 - }, - { - "epoch": 0.52, - "learning_rate": 1.893124751714955e-06, - "loss": 0.646, - "step": 20373 - }, - { - "epoch": 0.52, - "learning_rate": 1.8931123049525746e-06, - "loss": 0.9229, - "step": 20374 - }, - { - "epoch": 0.52, - "learning_rate": 1.893099857506379e-06, - "loss": 0.9775, - "step": 20375 - }, - { - "epoch": 0.52, - "learning_rate": 1.8930874093763777e-06, - "loss": 0.9844, - "step": 20376 - }, - { - "epoch": 0.52, - "learning_rate": 1.8930749605625806e-06, - "loss": 1.0488, - "step": 20377 - }, - { - "epoch": 0.52, - "learning_rate": 1.893062511064997e-06, - "loss": 0.7754, - "step": 20378 - }, - { - "epoch": 0.52, - "learning_rate": 1.8930500608836369e-06, - "loss": 0.7002, - "step": 20379 - }, - { - "epoch": 0.52, - "learning_rate": 1.8930376100185091e-06, - "loss": 1.0684, - "step": 20380 - }, - { - "epoch": 0.52, - "learning_rate": 1.8930251584696234e-06, - "loss": 0.7959, - "step": 20381 - }, - { - "epoch": 0.52, - "learning_rate": 1.8930127062369897e-06, - "loss": 0.8887, - "step": 20382 - }, - { - "epoch": 0.52, - "learning_rate": 1.8930002533206169e-06, - "loss": 0.7881, - "step": 20383 - }, - { - "epoch": 0.52, - "learning_rate": 1.892987799720515e-06, - "loss": 0.8838, - "step": 20384 - }, - { - "epoch": 0.52, - "learning_rate": 1.8929753454366933e-06, - "loss": 0.8994, - "step": 20385 - }, - { - "epoch": 0.52, - "learning_rate": 1.8929628904691618e-06, - "loss": 0.6499, - "step": 20386 - }, - { - "epoch": 0.52, - "learning_rate": 1.8929504348179292e-06, - "loss": 0.8132, - "step": 20387 - }, - { - "epoch": 0.52, - "learning_rate": 1.8929379784830057e-06, - "loss": 0.8242, - "step": 20388 - }, - { - "epoch": 0.52, - "learning_rate": 1.892925521464401e-06, - "loss": 0.8135, - "step": 20389 - }, - { - "epoch": 0.52, - "learning_rate": 1.8929130637621236e-06, - "loss": 0.752, - "step": 20390 - }, - { - "epoch": 0.52, - "learning_rate": 1.8929006053761842e-06, - "loss": 1.1318, - "step": 20391 - }, - { - "epoch": 0.52, - "learning_rate": 1.8928881463065917e-06, - "loss": 0.6074, - "step": 20392 - }, - { - "epoch": 0.52, - "learning_rate": 1.8928756865533558e-06, - "loss": 0.9512, - "step": 20393 - }, - { - "epoch": 0.52, - "learning_rate": 1.892863226116486e-06, - "loss": 0.8916, - "step": 20394 - }, - { - "epoch": 0.52, - "learning_rate": 1.8928507649959922e-06, - "loss": 0.8965, - "step": 20395 - }, - { - "epoch": 0.52, - "learning_rate": 1.8928383031918833e-06, - "loss": 0.748, - "step": 20396 - }, - { - "epoch": 0.52, - "learning_rate": 1.8928258407041692e-06, - "loss": 0.9146, - "step": 20397 - }, - { - "epoch": 0.52, - "learning_rate": 1.8928133775328596e-06, - "loss": 1.0605, - "step": 20398 - }, - { - "epoch": 0.52, - "learning_rate": 1.8928009136779636e-06, - "loss": 0.6804, - "step": 20399 - }, - { - "epoch": 0.52, - "learning_rate": 1.8927884491394911e-06, - "loss": 0.835, - "step": 20400 - }, - { - "epoch": 0.52, - "learning_rate": 1.8927759839174518e-06, - "loss": 0.9824, - "step": 20401 - }, - { - "epoch": 0.52, - "learning_rate": 1.8927635180118546e-06, - "loss": 0.8506, - "step": 20402 - }, - { - "epoch": 0.52, - "learning_rate": 1.8927510514227096e-06, - "loss": 0.8604, - "step": 20403 - }, - { - "epoch": 0.52, - "learning_rate": 1.8927385841500261e-06, - "loss": 1.1318, - "step": 20404 - }, - { - "epoch": 0.52, - "learning_rate": 1.8927261161938138e-06, - "loss": 0.8164, - "step": 20405 - }, - { - "epoch": 0.52, - "learning_rate": 1.892713647554082e-06, - "loss": 0.7637, - "step": 20406 - }, - { - "epoch": 0.52, - "learning_rate": 1.8927011782308403e-06, - "loss": 0.9746, - "step": 20407 - }, - { - "epoch": 0.52, - "learning_rate": 1.8926887082240987e-06, - "loss": 0.689, - "step": 20408 - }, - { - "epoch": 0.52, - "learning_rate": 1.8926762375338664e-06, - "loss": 0.8809, - "step": 20409 - }, - { - "epoch": 0.52, - "learning_rate": 1.8926637661601527e-06, - "loss": 0.9678, - "step": 20410 - }, - { - "epoch": 0.52, - "learning_rate": 1.8926512941029675e-06, - "loss": 0.6665, - "step": 20411 - }, - { - "epoch": 0.52, - "learning_rate": 1.8926388213623202e-06, - "loss": 0.8916, - "step": 20412 - }, - { - "epoch": 0.52, - "learning_rate": 1.8926263479382208e-06, - "loss": 1.083, - "step": 20413 - }, - { - "epoch": 0.52, - "learning_rate": 1.892613873830678e-06, - "loss": 0.8945, - "step": 20414 - }, - { - "epoch": 0.52, - "learning_rate": 1.892601399039702e-06, - "loss": 0.7275, - "step": 20415 - }, - { - "epoch": 0.52, - "learning_rate": 1.8925889235653018e-06, - "loss": 0.7505, - "step": 20416 - }, - { - "epoch": 0.52, - "learning_rate": 1.8925764474074878e-06, - "loss": 0.8975, - "step": 20417 - }, - { - "epoch": 0.52, - "learning_rate": 1.8925639705662687e-06, - "loss": 0.7075, - "step": 20418 - }, - { - "epoch": 0.52, - "learning_rate": 1.8925514930416545e-06, - "loss": 0.9102, - "step": 20419 - }, - { - "epoch": 0.52, - "learning_rate": 1.8925390148336549e-06, - "loss": 0.9062, - "step": 20420 - }, - { - "epoch": 0.52, - "learning_rate": 1.892526535942279e-06, - "loss": 0.9824, - "step": 20421 - }, - { - "epoch": 0.52, - "learning_rate": 1.8925140563675365e-06, - "loss": 0.8984, - "step": 20422 - }, - { - "epoch": 0.52, - "learning_rate": 1.8925015761094372e-06, - "loss": 0.9287, - "step": 20423 - }, - { - "epoch": 0.52, - "learning_rate": 1.8924890951679902e-06, - "loss": 1.0029, - "step": 20424 - }, - { - "epoch": 0.52, - "learning_rate": 1.8924766135432057e-06, - "loss": 0.8213, - "step": 20425 - }, - { - "epoch": 0.52, - "learning_rate": 1.8924641312350926e-06, - "loss": 0.7041, - "step": 20426 - }, - { - "epoch": 0.52, - "learning_rate": 1.8924516482436607e-06, - "loss": 0.9229, - "step": 20427 - }, - { - "epoch": 0.52, - "learning_rate": 1.89243916456892e-06, - "loss": 0.7549, - "step": 20428 - }, - { - "epoch": 0.52, - "learning_rate": 1.8924266802108795e-06, - "loss": 0.916, - "step": 20429 - }, - { - "epoch": 0.52, - "learning_rate": 1.892414195169549e-06, - "loss": 0.8252, - "step": 20430 - }, - { - "epoch": 0.52, - "learning_rate": 1.8924017094449378e-06, - "loss": 0.8125, - "step": 20431 - }, - { - "epoch": 0.52, - "learning_rate": 1.8923892230370554e-06, - "loss": 0.9883, - "step": 20432 - }, - { - "epoch": 0.52, - "learning_rate": 1.8923767359459123e-06, - "loss": 0.8057, - "step": 20433 - }, - { - "epoch": 0.52, - "learning_rate": 1.8923642481715168e-06, - "loss": 0.8809, - "step": 20434 - }, - { - "epoch": 0.52, - "learning_rate": 1.8923517597138793e-06, - "loss": 1.0029, - "step": 20435 - }, - { - "epoch": 0.52, - "learning_rate": 1.8923392705730091e-06, - "loss": 0.8682, - "step": 20436 - }, - { - "epoch": 0.52, - "learning_rate": 1.8923267807489154e-06, - "loss": 0.9922, - "step": 20437 - }, - { - "epoch": 0.52, - "learning_rate": 1.8923142902416083e-06, - "loss": 0.9072, - "step": 20438 - }, - { - "epoch": 0.52, - "learning_rate": 1.8923017990510974e-06, - "loss": 0.8413, - "step": 20439 - }, - { - "epoch": 0.52, - "learning_rate": 1.8922893071773917e-06, - "loss": 0.7559, - "step": 20440 - }, - { - "epoch": 0.52, - "learning_rate": 1.8922768146205014e-06, - "loss": 0.6235, - "step": 20441 - }, - { - "epoch": 0.52, - "learning_rate": 1.8922643213804357e-06, - "loss": 0.7842, - "step": 20442 - }, - { - "epoch": 0.52, - "learning_rate": 1.8922518274572042e-06, - "loss": 0.9424, - "step": 20443 - }, - { - "epoch": 0.52, - "learning_rate": 1.8922393328508167e-06, - "loss": 0.9717, - "step": 20444 - }, - { - "epoch": 0.52, - "learning_rate": 1.892226837561282e-06, - "loss": 0.9404, - "step": 20445 - }, - { - "epoch": 0.52, - "learning_rate": 1.8922143415886107e-06, - "loss": 0.9648, - "step": 20446 - }, - { - "epoch": 0.52, - "learning_rate": 1.8922018449328117e-06, - "loss": 0.9209, - "step": 20447 - }, - { - "epoch": 0.52, - "learning_rate": 1.892189347593895e-06, - "loss": 0.8516, - "step": 20448 - }, - { - "epoch": 0.52, - "learning_rate": 1.8921768495718697e-06, - "loss": 0.8018, - "step": 20449 - }, - { - "epoch": 0.52, - "learning_rate": 1.892164350866746e-06, - "loss": 0.9385, - "step": 20450 - }, - { - "epoch": 0.52, - "learning_rate": 1.8921518514785325e-06, - "loss": 0.8916, - "step": 20451 - }, - { - "epoch": 0.52, - "learning_rate": 1.8921393514072399e-06, - "loss": 0.73, - "step": 20452 - }, - { - "epoch": 0.52, - "learning_rate": 1.892126850652877e-06, - "loss": 0.8589, - "step": 20453 - }, - { - "epoch": 0.52, - "learning_rate": 1.8921143492154533e-06, - "loss": 1.0352, - "step": 20454 - }, - { - "epoch": 0.52, - "learning_rate": 1.8921018470949792e-06, - "loss": 0.9551, - "step": 20455 - }, - { - "epoch": 0.52, - "learning_rate": 1.8920893442914633e-06, - "loss": 1.002, - "step": 20456 - }, - { - "epoch": 0.52, - "learning_rate": 1.8920768408049156e-06, - "loss": 0.7627, - "step": 20457 - }, - { - "epoch": 0.52, - "learning_rate": 1.8920643366353461e-06, - "loss": 1.0283, - "step": 20458 - }, - { - "epoch": 0.52, - "learning_rate": 1.8920518317827638e-06, - "loss": 0.7734, - "step": 20459 - }, - { - "epoch": 0.52, - "learning_rate": 1.8920393262471782e-06, - "loss": 1.0254, - "step": 20460 - }, - { - "epoch": 0.52, - "learning_rate": 1.8920268200285992e-06, - "loss": 0.9375, - "step": 20461 - }, - { - "epoch": 0.52, - "learning_rate": 1.8920143131270363e-06, - "loss": 0.8613, - "step": 20462 - }, - { - "epoch": 0.52, - "learning_rate": 1.8920018055424993e-06, - "loss": 0.8008, - "step": 20463 - }, - { - "epoch": 0.52, - "learning_rate": 1.8919892972749972e-06, - "loss": 0.9307, - "step": 20464 - }, - { - "epoch": 0.52, - "learning_rate": 1.89197678832454e-06, - "loss": 0.9951, - "step": 20465 - }, - { - "epoch": 0.52, - "learning_rate": 1.8919642786911374e-06, - "loss": 1.0703, - "step": 20466 - }, - { - "epoch": 0.52, - "learning_rate": 1.8919517683747985e-06, - "loss": 0.793, - "step": 20467 - }, - { - "epoch": 0.52, - "learning_rate": 1.8919392573755332e-06, - "loss": 0.9165, - "step": 20468 - }, - { - "epoch": 0.52, - "learning_rate": 1.891926745693351e-06, - "loss": 0.8965, - "step": 20469 - }, - { - "epoch": 0.52, - "learning_rate": 1.8919142333282614e-06, - "loss": 0.7783, - "step": 20470 - }, - { - "epoch": 0.52, - "learning_rate": 1.8919017202802742e-06, - "loss": 0.8848, - "step": 20471 - }, - { - "epoch": 0.52, - "learning_rate": 1.8918892065493992e-06, - "loss": 0.877, - "step": 20472 - }, - { - "epoch": 0.52, - "learning_rate": 1.8918766921356451e-06, - "loss": 0.8496, - "step": 20473 - }, - { - "epoch": 0.52, - "learning_rate": 1.8918641770390224e-06, - "loss": 0.7954, - "step": 20474 - }, - { - "epoch": 0.52, - "learning_rate": 1.8918516612595404e-06, - "loss": 0.7974, - "step": 20475 - }, - { - "epoch": 0.52, - "learning_rate": 1.891839144797208e-06, - "loss": 0.6758, - "step": 20476 - }, - { - "epoch": 0.52, - "learning_rate": 1.8918266276520358e-06, - "loss": 0.8418, - "step": 20477 - }, - { - "epoch": 0.52, - "learning_rate": 1.891814109824033e-06, - "loss": 0.9756, - "step": 20478 - }, - { - "epoch": 0.52, - "learning_rate": 1.891801591313209e-06, - "loss": 0.9385, - "step": 20479 - }, - { - "epoch": 0.52, - "learning_rate": 1.8917890721195735e-06, - "loss": 0.6494, - "step": 20480 - }, - { - "epoch": 0.52, - "learning_rate": 1.891776552243136e-06, - "loss": 0.6934, - "step": 20481 - }, - { - "epoch": 0.52, - "learning_rate": 1.8917640316839068e-06, - "loss": 0.8379, - "step": 20482 - }, - { - "epoch": 0.52, - "learning_rate": 1.8917515104418942e-06, - "loss": 0.7603, - "step": 20483 - }, - { - "epoch": 0.53, - "learning_rate": 1.891738988517109e-06, - "loss": 0.7085, - "step": 20484 - }, - { - "epoch": 0.53, - "learning_rate": 1.89172646590956e-06, - "loss": 0.9141, - "step": 20485 - }, - { - "epoch": 0.53, - "learning_rate": 1.8917139426192569e-06, - "loss": 0.9521, - "step": 20486 - }, - { - "epoch": 0.53, - "learning_rate": 1.8917014186462094e-06, - "loss": 1.0254, - "step": 20487 - }, - { - "epoch": 0.53, - "learning_rate": 1.8916888939904277e-06, - "loss": 1.0146, - "step": 20488 - }, - { - "epoch": 0.53, - "learning_rate": 1.8916763686519205e-06, - "loss": 0.4692, - "step": 20489 - }, - { - "epoch": 0.53, - "learning_rate": 1.8916638426306975e-06, - "loss": 0.9272, - "step": 20490 - }, - { - "epoch": 0.53, - "learning_rate": 1.8916513159267685e-06, - "loss": 0.7969, - "step": 20491 - }, - { - "epoch": 0.53, - "learning_rate": 1.8916387885401433e-06, - "loss": 0.8799, - "step": 20492 - }, - { - "epoch": 0.53, - "learning_rate": 1.891626260470831e-06, - "loss": 0.8711, - "step": 20493 - }, - { - "epoch": 0.53, - "learning_rate": 1.8916137317188419e-06, - "loss": 0.8066, - "step": 20494 - }, - { - "epoch": 0.53, - "learning_rate": 1.8916012022841848e-06, - "loss": 0.7036, - "step": 20495 - }, - { - "epoch": 0.53, - "learning_rate": 1.8915886721668697e-06, - "loss": 0.9873, - "step": 20496 - }, - { - "epoch": 0.53, - "learning_rate": 1.8915761413669063e-06, - "loss": 0.8096, - "step": 20497 - }, - { - "epoch": 0.53, - "learning_rate": 1.891563609884304e-06, - "loss": 0.6763, - "step": 20498 - }, - { - "epoch": 0.53, - "learning_rate": 1.8915510777190722e-06, - "loss": 0.9131, - "step": 20499 - }, - { - "epoch": 0.53, - "learning_rate": 1.8915385448712211e-06, - "loss": 0.9277, - "step": 20500 - }, - { - "epoch": 0.53, - "learning_rate": 1.8915260113407597e-06, - "loss": 0.8037, - "step": 20501 - }, - { - "epoch": 0.53, - "learning_rate": 1.891513477127698e-06, - "loss": 0.8682, - "step": 20502 - }, - { - "epoch": 0.53, - "learning_rate": 1.8915009422320454e-06, - "loss": 0.7529, - "step": 20503 - }, - { - "epoch": 0.53, - "learning_rate": 1.8914884066538113e-06, - "loss": 0.8701, - "step": 20504 - }, - { - "epoch": 0.53, - "learning_rate": 1.8914758703930059e-06, - "loss": 0.7627, - "step": 20505 - }, - { - "epoch": 0.53, - "learning_rate": 1.891463333449638e-06, - "loss": 0.8086, - "step": 20506 - }, - { - "epoch": 0.53, - "learning_rate": 1.8914507958237179e-06, - "loss": 0.8779, - "step": 20507 - }, - { - "epoch": 0.53, - "learning_rate": 1.8914382575152548e-06, - "loss": 0.8281, - "step": 20508 - }, - { - "epoch": 0.53, - "learning_rate": 1.8914257185242585e-06, - "loss": 0.7334, - "step": 20509 - }, - { - "epoch": 0.53, - "learning_rate": 1.8914131788507382e-06, - "loss": 0.9922, - "step": 20510 - }, - { - "epoch": 0.53, - "learning_rate": 1.891400638494704e-06, - "loss": 0.7666, - "step": 20511 - }, - { - "epoch": 0.53, - "learning_rate": 1.8913880974561655e-06, - "loss": 0.7266, - "step": 20512 - }, - { - "epoch": 0.53, - "learning_rate": 1.891375555735132e-06, - "loss": 0.7935, - "step": 20513 - }, - { - "epoch": 0.53, - "learning_rate": 1.8913630133316132e-06, - "loss": 0.6172, - "step": 20514 - }, - { - "epoch": 0.53, - "learning_rate": 1.891350470245619e-06, - "loss": 0.7764, - "step": 20515 - }, - { - "epoch": 0.53, - "learning_rate": 1.8913379264771584e-06, - "loss": 0.8604, - "step": 20516 - }, - { - "epoch": 0.53, - "learning_rate": 1.8913253820262415e-06, - "loss": 1.0059, - "step": 20517 - }, - { - "epoch": 0.53, - "learning_rate": 1.8913128368928775e-06, - "loss": 0.959, - "step": 20518 - }, - { - "epoch": 0.53, - "learning_rate": 1.8913002910770763e-06, - "loss": 1.0811, - "step": 20519 - }, - { - "epoch": 0.53, - "learning_rate": 1.8912877445788475e-06, - "loss": 0.8818, - "step": 20520 - }, - { - "epoch": 0.53, - "learning_rate": 1.891275197398201e-06, - "loss": 0.7725, - "step": 20521 - }, - { - "epoch": 0.53, - "learning_rate": 1.8912626495351456e-06, - "loss": 0.9297, - "step": 20522 - }, - { - "epoch": 0.53, - "learning_rate": 1.8912501009896915e-06, - "loss": 0.8857, - "step": 20523 - }, - { - "epoch": 0.53, - "learning_rate": 1.8912375517618485e-06, - "loss": 0.8047, - "step": 20524 - }, - { - "epoch": 0.53, - "learning_rate": 1.8912250018516253e-06, - "loss": 1.0527, - "step": 20525 - }, - { - "epoch": 0.53, - "learning_rate": 1.8912124512590326e-06, - "loss": 0.9229, - "step": 20526 - }, - { - "epoch": 0.53, - "learning_rate": 1.8911998999840792e-06, - "loss": 0.873, - "step": 20527 - }, - { - "epoch": 0.53, - "learning_rate": 1.8911873480267752e-06, - "loss": 0.668, - "step": 20528 - }, - { - "epoch": 0.53, - "learning_rate": 1.8911747953871298e-06, - "loss": 0.9551, - "step": 20529 - }, - { - "epoch": 0.53, - "learning_rate": 1.8911622420651532e-06, - "loss": 0.8594, - "step": 20530 - }, - { - "epoch": 0.53, - "learning_rate": 1.8911496880608545e-06, - "loss": 0.9697, - "step": 20531 - }, - { - "epoch": 0.53, - "learning_rate": 1.8911371333742432e-06, - "loss": 0.958, - "step": 20532 - }, - { - "epoch": 0.53, - "learning_rate": 1.8911245780053293e-06, - "loss": 1.0117, - "step": 20533 - }, - { - "epoch": 0.53, - "learning_rate": 1.8911120219541226e-06, - "loss": 0.7812, - "step": 20534 - }, - { - "epoch": 0.53, - "learning_rate": 1.8910994652206318e-06, - "loss": 0.8574, - "step": 20535 - }, - { - "epoch": 0.53, - "learning_rate": 1.8910869078048677e-06, - "loss": 0.5759, - "step": 20536 - }, - { - "epoch": 0.53, - "learning_rate": 1.891074349706839e-06, - "loss": 0.8818, - "step": 20537 - }, - { - "epoch": 0.53, - "learning_rate": 1.8910617909265559e-06, - "loss": 0.9424, - "step": 20538 - }, - { - "epoch": 0.53, - "learning_rate": 1.8910492314640277e-06, - "loss": 1.0264, - "step": 20539 - }, - { - "epoch": 0.53, - "learning_rate": 1.8910366713192638e-06, - "loss": 0.8477, - "step": 20540 - }, - { - "epoch": 0.53, - "learning_rate": 1.8910241104922741e-06, - "loss": 0.7612, - "step": 20541 - }, - { - "epoch": 0.53, - "learning_rate": 1.8910115489830685e-06, - "loss": 0.9766, - "step": 20542 - }, - { - "epoch": 0.53, - "learning_rate": 1.890998986791656e-06, - "loss": 0.7939, - "step": 20543 - }, - { - "epoch": 0.53, - "learning_rate": 1.8909864239180469e-06, - "loss": 0.8271, - "step": 20544 - }, - { - "epoch": 0.53, - "learning_rate": 1.8909738603622502e-06, - "loss": 1.1289, - "step": 20545 - }, - { - "epoch": 0.53, - "learning_rate": 1.890961296124276e-06, - "loss": 1.0078, - "step": 20546 - }, - { - "epoch": 0.53, - "learning_rate": 1.8909487312041335e-06, - "loss": 0.8184, - "step": 20547 - }, - { - "epoch": 0.53, - "learning_rate": 1.8909361656018326e-06, - "loss": 0.9526, - "step": 20548 - }, - { - "epoch": 0.53, - "learning_rate": 1.8909235993173832e-06, - "loss": 0.9385, - "step": 20549 - }, - { - "epoch": 0.53, - "learning_rate": 1.890911032350794e-06, - "loss": 0.8262, - "step": 20550 - }, - { - "epoch": 0.53, - "learning_rate": 1.8908984647020754e-06, - "loss": 0.7524, - "step": 20551 - }, - { - "epoch": 0.53, - "learning_rate": 1.8908858963712368e-06, - "loss": 0.7075, - "step": 20552 - }, - { - "epoch": 0.53, - "learning_rate": 1.890873327358288e-06, - "loss": 0.7249, - "step": 20553 - }, - { - "epoch": 0.53, - "learning_rate": 1.8908607576632383e-06, - "loss": 0.8008, - "step": 20554 - }, - { - "epoch": 0.53, - "learning_rate": 1.8908481872860972e-06, - "loss": 0.8555, - "step": 20555 - }, - { - "epoch": 0.53, - "learning_rate": 1.890835616226875e-06, - "loss": 0.8701, - "step": 20556 - }, - { - "epoch": 0.53, - "learning_rate": 1.890823044485581e-06, - "loss": 0.7224, - "step": 20557 - }, - { - "epoch": 0.53, - "learning_rate": 1.8908104720622244e-06, - "loss": 0.9229, - "step": 20558 - }, - { - "epoch": 0.53, - "learning_rate": 1.8907978989568156e-06, - "loss": 0.8252, - "step": 20559 - }, - { - "epoch": 0.53, - "learning_rate": 1.8907853251693636e-06, - "loss": 0.7661, - "step": 20560 - }, - { - "epoch": 0.53, - "learning_rate": 1.8907727506998781e-06, - "loss": 0.9502, - "step": 20561 - }, - { - "epoch": 0.53, - "learning_rate": 1.890760175548369e-06, - "loss": 1.0684, - "step": 20562 - }, - { - "epoch": 0.53, - "learning_rate": 1.8907475997148456e-06, - "loss": 0.9189, - "step": 20563 - }, - { - "epoch": 0.53, - "learning_rate": 1.890735023199318e-06, - "loss": 0.7754, - "step": 20564 - }, - { - "epoch": 0.53, - "learning_rate": 1.8907224460017954e-06, - "loss": 0.9014, - "step": 20565 - }, - { - "epoch": 0.53, - "learning_rate": 1.8907098681222876e-06, - "loss": 0.8291, - "step": 20566 - }, - { - "epoch": 0.53, - "learning_rate": 1.8906972895608042e-06, - "loss": 0.8125, - "step": 20567 - }, - { - "epoch": 0.53, - "learning_rate": 1.8906847103173548e-06, - "loss": 0.6978, - "step": 20568 - }, - { - "epoch": 0.53, - "learning_rate": 1.8906721303919493e-06, - "loss": 1.0898, - "step": 20569 - }, - { - "epoch": 0.53, - "learning_rate": 1.8906595497845967e-06, - "loss": 0.7046, - "step": 20570 - }, - { - "epoch": 0.53, - "learning_rate": 1.8906469684953075e-06, - "loss": 0.9814, - "step": 20571 - }, - { - "epoch": 0.53, - "learning_rate": 1.8906343865240908e-06, - "loss": 1.0107, - "step": 20572 - }, - { - "epoch": 0.53, - "learning_rate": 1.8906218038709559e-06, - "loss": 1.1104, - "step": 20573 - }, - { - "epoch": 0.53, - "learning_rate": 1.8906092205359132e-06, - "loss": 0.9395, - "step": 20574 - }, - { - "epoch": 0.53, - "learning_rate": 1.8905966365189718e-06, - "loss": 0.8096, - "step": 20575 - }, - { - "epoch": 0.53, - "learning_rate": 1.8905840518201416e-06, - "loss": 0.9102, - "step": 20576 - }, - { - "epoch": 0.53, - "learning_rate": 1.890571466439432e-06, - "loss": 0.8428, - "step": 20577 - }, - { - "epoch": 0.53, - "learning_rate": 1.890558880376853e-06, - "loss": 1.0098, - "step": 20578 - }, - { - "epoch": 0.53, - "learning_rate": 1.890546293632414e-06, - "loss": 0.7959, - "step": 20579 - }, - { - "epoch": 0.53, - "learning_rate": 1.8905337062061244e-06, - "loss": 0.9053, - "step": 20580 - }, - { - "epoch": 0.53, - "learning_rate": 1.8905211180979944e-06, - "loss": 0.9785, - "step": 20581 - }, - { - "epoch": 0.53, - "learning_rate": 1.890508529308033e-06, - "loss": 0.957, - "step": 20582 - }, - { - "epoch": 0.53, - "learning_rate": 1.8904959398362506e-06, - "loss": 0.6851, - "step": 20583 - }, - { - "epoch": 0.53, - "learning_rate": 1.890483349682656e-06, - "loss": 0.9258, - "step": 20584 - }, - { - "epoch": 0.53, - "learning_rate": 1.8904707588472593e-06, - "loss": 0.9365, - "step": 20585 - }, - { - "epoch": 0.53, - "learning_rate": 1.8904581673300704e-06, - "loss": 0.9639, - "step": 20586 - }, - { - "epoch": 0.53, - "learning_rate": 1.8904455751310982e-06, - "loss": 0.8306, - "step": 20587 - }, - { - "epoch": 0.53, - "learning_rate": 1.890432982250353e-06, - "loss": 0.9058, - "step": 20588 - }, - { - "epoch": 0.53, - "learning_rate": 1.8904203886878443e-06, - "loss": 1.0225, - "step": 20589 - }, - { - "epoch": 0.53, - "learning_rate": 1.8904077944435812e-06, - "loss": 0.9531, - "step": 20590 - }, - { - "epoch": 0.53, - "learning_rate": 1.8903951995175742e-06, - "loss": 0.6475, - "step": 20591 - }, - { - "epoch": 0.53, - "learning_rate": 1.8903826039098324e-06, - "loss": 0.6904, - "step": 20592 - }, - { - "epoch": 0.53, - "learning_rate": 1.890370007620366e-06, - "loss": 0.8867, - "step": 20593 - }, - { - "epoch": 0.53, - "learning_rate": 1.8903574106491836e-06, - "loss": 0.9766, - "step": 20594 - }, - { - "epoch": 0.53, - "learning_rate": 1.8903448129962957e-06, - "loss": 0.9336, - "step": 20595 - }, - { - "epoch": 0.53, - "learning_rate": 1.8903322146617118e-06, - "loss": 0.8467, - "step": 20596 - }, - { - "epoch": 0.53, - "learning_rate": 1.8903196156454415e-06, - "loss": 1.0703, - "step": 20597 - }, - { - "epoch": 0.53, - "learning_rate": 1.8903070159474943e-06, - "loss": 0.9443, - "step": 20598 - }, - { - "epoch": 0.53, - "learning_rate": 1.89029441556788e-06, - "loss": 0.9893, - "step": 20599 - }, - { - "epoch": 0.53, - "learning_rate": 1.890281814506608e-06, - "loss": 0.8232, - "step": 20600 - }, - { - "epoch": 0.53, - "learning_rate": 1.8902692127636883e-06, - "loss": 0.7246, - "step": 20601 - }, - { - "epoch": 0.53, - "learning_rate": 1.8902566103391305e-06, - "loss": 0.9951, - "step": 20602 - }, - { - "epoch": 0.53, - "learning_rate": 1.890244007232944e-06, - "loss": 0.8594, - "step": 20603 - }, - { - "epoch": 0.53, - "learning_rate": 1.8902314034451387e-06, - "loss": 0.521, - "step": 20604 - }, - { - "epoch": 0.53, - "learning_rate": 1.890218798975724e-06, - "loss": 0.9775, - "step": 20605 - }, - { - "epoch": 0.53, - "learning_rate": 1.89020619382471e-06, - "loss": 0.7139, - "step": 20606 - }, - { - "epoch": 0.53, - "learning_rate": 1.8901935879921058e-06, - "loss": 0.8745, - "step": 20607 - }, - { - "epoch": 0.53, - "learning_rate": 1.8901809814779215e-06, - "loss": 0.7573, - "step": 20608 - }, - { - "epoch": 0.53, - "learning_rate": 1.8901683742821663e-06, - "loss": 0.9072, - "step": 20609 - }, - { - "epoch": 0.53, - "learning_rate": 1.8901557664048502e-06, - "loss": 0.688, - "step": 20610 - }, - { - "epoch": 0.53, - "learning_rate": 1.8901431578459827e-06, - "loss": 0.814, - "step": 20611 - }, - { - "epoch": 0.53, - "learning_rate": 1.890130548605574e-06, - "loss": 0.5884, - "step": 20612 - }, - { - "epoch": 0.53, - "learning_rate": 1.8901179386836326e-06, - "loss": 0.9512, - "step": 20613 - }, - { - "epoch": 0.53, - "learning_rate": 1.890105328080169e-06, - "loss": 0.8486, - "step": 20614 - }, - { - "epoch": 0.53, - "learning_rate": 1.890092716795193e-06, - "loss": 0.792, - "step": 20615 - }, - { - "epoch": 0.53, - "learning_rate": 1.8900801048287137e-06, - "loss": 0.7002, - "step": 20616 - }, - { - "epoch": 0.53, - "learning_rate": 1.8900674921807409e-06, - "loss": 0.9375, - "step": 20617 - }, - { - "epoch": 0.53, - "learning_rate": 1.8900548788512845e-06, - "loss": 0.7466, - "step": 20618 - }, - { - "epoch": 0.53, - "learning_rate": 1.8900422648403538e-06, - "loss": 0.8271, - "step": 20619 - }, - { - "epoch": 0.53, - "learning_rate": 1.890029650147959e-06, - "loss": 0.7744, - "step": 20620 - }, - { - "epoch": 0.53, - "learning_rate": 1.8900170347741092e-06, - "loss": 0.8799, - "step": 20621 - }, - { - "epoch": 0.53, - "learning_rate": 1.8900044187188142e-06, - "loss": 0.6836, - "step": 20622 - }, - { - "epoch": 0.53, - "learning_rate": 1.889991801982084e-06, - "loss": 0.8613, - "step": 20623 - }, - { - "epoch": 0.53, - "learning_rate": 1.8899791845639276e-06, - "loss": 0.9736, - "step": 20624 - }, - { - "epoch": 0.53, - "learning_rate": 1.8899665664643555e-06, - "loss": 0.7808, - "step": 20625 - }, - { - "epoch": 0.53, - "learning_rate": 1.889953947683377e-06, - "loss": 1.0254, - "step": 20626 - }, - { - "epoch": 0.53, - "learning_rate": 1.8899413282210014e-06, - "loss": 0.9258, - "step": 20627 - }, - { - "epoch": 0.53, - "learning_rate": 1.8899287080772385e-06, - "loss": 0.7354, - "step": 20628 - }, - { - "epoch": 0.53, - "learning_rate": 1.8899160872520983e-06, - "loss": 0.7227, - "step": 20629 - }, - { - "epoch": 0.53, - "learning_rate": 1.88990346574559e-06, - "loss": 0.7959, - "step": 20630 - }, - { - "epoch": 0.53, - "learning_rate": 1.8898908435577238e-06, - "loss": 1.0405, - "step": 20631 - }, - { - "epoch": 0.53, - "learning_rate": 1.8898782206885091e-06, - "loss": 0.627, - "step": 20632 - }, - { - "epoch": 0.53, - "learning_rate": 1.8898655971379558e-06, - "loss": 0.9932, - "step": 20633 - }, - { - "epoch": 0.53, - "learning_rate": 1.8898529729060728e-06, - "loss": 0.6885, - "step": 20634 - }, - { - "epoch": 0.53, - "learning_rate": 1.8898403479928707e-06, - "loss": 0.8799, - "step": 20635 - }, - { - "epoch": 0.53, - "learning_rate": 1.8898277223983588e-06, - "loss": 0.9434, - "step": 20636 - }, - { - "epoch": 0.53, - "learning_rate": 1.8898150961225462e-06, - "loss": 0.8799, - "step": 20637 - }, - { - "epoch": 0.53, - "learning_rate": 1.8898024691654438e-06, - "loss": 0.7305, - "step": 20638 - }, - { - "epoch": 0.53, - "learning_rate": 1.8897898415270599e-06, - "loss": 0.8691, - "step": 20639 - }, - { - "epoch": 0.53, - "learning_rate": 1.8897772132074053e-06, - "loss": 0.605, - "step": 20640 - }, - { - "epoch": 0.53, - "learning_rate": 1.889764584206489e-06, - "loss": 0.7773, - "step": 20641 - }, - { - "epoch": 0.53, - "learning_rate": 1.8897519545243207e-06, - "loss": 1.0371, - "step": 20642 - }, - { - "epoch": 0.53, - "learning_rate": 1.8897393241609107e-06, - "loss": 0.8672, - "step": 20643 - }, - { - "epoch": 0.53, - "learning_rate": 1.8897266931162678e-06, - "loss": 0.9062, - "step": 20644 - }, - { - "epoch": 0.53, - "learning_rate": 1.8897140613904025e-06, - "loss": 0.8896, - "step": 20645 - }, - { - "epoch": 0.53, - "learning_rate": 1.8897014289833237e-06, - "loss": 0.594, - "step": 20646 - }, - { - "epoch": 0.53, - "learning_rate": 1.8896887958950415e-06, - "loss": 0.9375, - "step": 20647 - }, - { - "epoch": 0.53, - "learning_rate": 1.8896761621255657e-06, - "loss": 0.8813, - "step": 20648 - }, - { - "epoch": 0.53, - "learning_rate": 1.8896635276749055e-06, - "loss": 0.9297, - "step": 20649 - }, - { - "epoch": 0.53, - "learning_rate": 1.889650892543071e-06, - "loss": 0.75, - "step": 20650 - }, - { - "epoch": 0.53, - "learning_rate": 1.8896382567300714e-06, - "loss": 0.8799, - "step": 20651 - }, - { - "epoch": 0.53, - "learning_rate": 1.8896256202359174e-06, - "loss": 0.7959, - "step": 20652 - }, - { - "epoch": 0.53, - "learning_rate": 1.8896129830606173e-06, - "loss": 0.6172, - "step": 20653 - }, - { - "epoch": 0.53, - "learning_rate": 1.8896003452041817e-06, - "loss": 0.7036, - "step": 20654 - }, - { - "epoch": 0.53, - "learning_rate": 1.88958770666662e-06, - "loss": 0.6692, - "step": 20655 - }, - { - "epoch": 0.53, - "learning_rate": 1.8895750674479421e-06, - "loss": 0.8506, - "step": 20656 - }, - { - "epoch": 0.53, - "learning_rate": 1.889562427548157e-06, - "loss": 0.8667, - "step": 20657 - }, - { - "epoch": 0.53, - "learning_rate": 1.8895497869672753e-06, - "loss": 0.6235, - "step": 20658 - }, - { - "epoch": 0.53, - "learning_rate": 1.8895371457053057e-06, - "loss": 1.1338, - "step": 20659 - }, - { - "epoch": 0.53, - "learning_rate": 1.8895245037622588e-06, - "loss": 0.8809, - "step": 20660 - }, - { - "epoch": 0.53, - "learning_rate": 1.8895118611381439e-06, - "loss": 0.4785, - "step": 20661 - }, - { - "epoch": 0.53, - "learning_rate": 1.8894992178329708e-06, - "loss": 1.0625, - "step": 20662 - }, - { - "epoch": 0.53, - "learning_rate": 1.889486573846749e-06, - "loss": 0.4858, - "step": 20663 - }, - { - "epoch": 0.53, - "learning_rate": 1.8894739291794878e-06, - "loss": 0.8281, - "step": 20664 - }, - { - "epoch": 0.53, - "learning_rate": 1.8894612838311978e-06, - "loss": 0.7134, - "step": 20665 - }, - { - "epoch": 0.53, - "learning_rate": 1.889448637801888e-06, - "loss": 0.6733, - "step": 20666 - }, - { - "epoch": 0.53, - "learning_rate": 1.889435991091568e-06, - "loss": 0.8213, - "step": 20667 - }, - { - "epoch": 0.53, - "learning_rate": 1.8894233437002482e-06, - "loss": 0.6479, - "step": 20668 - }, - { - "epoch": 0.53, - "learning_rate": 1.8894106956279377e-06, - "loss": 0.8701, - "step": 20669 - }, - { - "epoch": 0.53, - "learning_rate": 1.8893980468746462e-06, - "loss": 0.875, - "step": 20670 - }, - { - "epoch": 0.53, - "learning_rate": 1.8893853974403838e-06, - "loss": 0.7949, - "step": 20671 - }, - { - "epoch": 0.53, - "learning_rate": 1.8893727473251596e-06, - "loss": 1.0381, - "step": 20672 - }, - { - "epoch": 0.53, - "learning_rate": 1.8893600965289837e-06, - "loss": 1.0645, - "step": 20673 - }, - { - "epoch": 0.53, - "learning_rate": 1.8893474450518658e-06, - "loss": 0.9033, - "step": 20674 - }, - { - "epoch": 0.53, - "learning_rate": 1.8893347928938153e-06, - "loss": 0.8525, - "step": 20675 - }, - { - "epoch": 0.53, - "learning_rate": 1.889322140054842e-06, - "loss": 0.9609, - "step": 20676 - }, - { - "epoch": 0.53, - "learning_rate": 1.8893094865349557e-06, - "loss": 0.9961, - "step": 20677 - }, - { - "epoch": 0.53, - "learning_rate": 1.8892968323341657e-06, - "loss": 0.874, - "step": 20678 - }, - { - "epoch": 0.53, - "learning_rate": 1.8892841774524824e-06, - "loss": 0.9131, - "step": 20679 - }, - { - "epoch": 0.53, - "learning_rate": 1.889271521889915e-06, - "loss": 1.1064, - "step": 20680 - }, - { - "epoch": 0.53, - "learning_rate": 1.8892588656464734e-06, - "loss": 0.6509, - "step": 20681 - }, - { - "epoch": 0.53, - "learning_rate": 1.889246208722167e-06, - "loss": 0.9893, - "step": 20682 - }, - { - "epoch": 0.53, - "learning_rate": 1.8892335511170058e-06, - "loss": 0.7959, - "step": 20683 - }, - { - "epoch": 0.53, - "learning_rate": 1.889220892830999e-06, - "loss": 0.835, - "step": 20684 - }, - { - "epoch": 0.53, - "learning_rate": 1.8892082338641574e-06, - "loss": 1.0527, - "step": 20685 - }, - { - "epoch": 0.53, - "learning_rate": 1.8891955742164894e-06, - "loss": 0.7959, - "step": 20686 - }, - { - "epoch": 0.53, - "learning_rate": 1.8891829138880054e-06, - "loss": 0.79, - "step": 20687 - }, - { - "epoch": 0.53, - "learning_rate": 1.8891702528787149e-06, - "loss": 0.9648, - "step": 20688 - }, - { - "epoch": 0.53, - "learning_rate": 1.8891575911886273e-06, - "loss": 1.04, - "step": 20689 - }, - { - "epoch": 0.53, - "learning_rate": 1.8891449288177531e-06, - "loss": 0.9453, - "step": 20690 - }, - { - "epoch": 0.53, - "learning_rate": 1.8891322657661012e-06, - "loss": 0.9404, - "step": 20691 - }, - { - "epoch": 0.53, - "learning_rate": 1.8891196020336816e-06, - "loss": 0.8516, - "step": 20692 - }, - { - "epoch": 0.53, - "learning_rate": 1.8891069376205043e-06, - "loss": 0.8716, - "step": 20693 - }, - { - "epoch": 0.53, - "learning_rate": 1.8890942725265784e-06, - "loss": 0.8252, - "step": 20694 - }, - { - "epoch": 0.53, - "learning_rate": 1.889081606751914e-06, - "loss": 0.8228, - "step": 20695 - }, - { - "epoch": 0.53, - "learning_rate": 1.8890689402965209e-06, - "loss": 0.9727, - "step": 20696 - }, - { - "epoch": 0.53, - "learning_rate": 1.889056273160408e-06, - "loss": 0.9756, - "step": 20697 - }, - { - "epoch": 0.53, - "learning_rate": 1.8890436053435863e-06, - "loss": 0.8428, - "step": 20698 - }, - { - "epoch": 0.53, - "learning_rate": 1.8890309368460644e-06, - "loss": 0.8857, - "step": 20699 - }, - { - "epoch": 0.53, - "learning_rate": 1.8890182676678524e-06, - "loss": 0.9385, - "step": 20700 - }, - { - "epoch": 0.53, - "learning_rate": 1.88900559780896e-06, - "loss": 1.084, - "step": 20701 - }, - { - "epoch": 0.53, - "learning_rate": 1.8889929272693972e-06, - "loss": 0.6943, - "step": 20702 - }, - { - "epoch": 0.53, - "learning_rate": 1.888980256049173e-06, - "loss": 0.8115, - "step": 20703 - }, - { - "epoch": 0.53, - "learning_rate": 1.8889675841482977e-06, - "loss": 0.7305, - "step": 20704 - }, - { - "epoch": 0.53, - "learning_rate": 1.8889549115667807e-06, - "loss": 0.8496, - "step": 20705 - }, - { - "epoch": 0.53, - "learning_rate": 1.8889422383046317e-06, - "loss": 1.0195, - "step": 20706 - }, - { - "epoch": 0.53, - "learning_rate": 1.8889295643618609e-06, - "loss": 0.9189, - "step": 20707 - }, - { - "epoch": 0.53, - "learning_rate": 1.888916889738477e-06, - "loss": 0.8574, - "step": 20708 - }, - { - "epoch": 0.53, - "learning_rate": 1.888904214434491e-06, - "loss": 0.7896, - "step": 20709 - }, - { - "epoch": 0.53, - "learning_rate": 1.8888915384499113e-06, - "loss": 0.8423, - "step": 20710 - }, - { - "epoch": 0.53, - "learning_rate": 1.8888788617847484e-06, - "loss": 0.9521, - "step": 20711 - }, - { - "epoch": 0.53, - "learning_rate": 1.888866184439012e-06, - "loss": 0.8877, - "step": 20712 - }, - { - "epoch": 0.53, - "learning_rate": 1.8888535064127119e-06, - "loss": 0.832, - "step": 20713 - }, - { - "epoch": 0.53, - "learning_rate": 1.888840827705857e-06, - "loss": 0.8926, - "step": 20714 - }, - { - "epoch": 0.53, - "learning_rate": 1.8888281483184576e-06, - "loss": 0.9443, - "step": 20715 - }, - { - "epoch": 0.53, - "learning_rate": 1.8888154682505238e-06, - "loss": 0.8633, - "step": 20716 - }, - { - "epoch": 0.53, - "learning_rate": 1.8888027875020645e-06, - "loss": 0.822, - "step": 20717 - }, - { - "epoch": 0.53, - "learning_rate": 1.8887901060730898e-06, - "loss": 1.0078, - "step": 20718 - }, - { - "epoch": 0.53, - "learning_rate": 1.8887774239636092e-06, - "loss": 0.8711, - "step": 20719 - }, - { - "epoch": 0.53, - "learning_rate": 1.888764741173633e-06, - "loss": 0.9727, - "step": 20720 - }, - { - "epoch": 0.53, - "learning_rate": 1.8887520577031704e-06, - "loss": 0.9121, - "step": 20721 - }, - { - "epoch": 0.53, - "learning_rate": 1.888739373552231e-06, - "loss": 0.8403, - "step": 20722 - }, - { - "epoch": 0.53, - "learning_rate": 1.8887266887208249e-06, - "loss": 0.9785, - "step": 20723 - }, - { - "epoch": 0.53, - "learning_rate": 1.8887140032089614e-06, - "loss": 0.959, - "step": 20724 - }, - { - "epoch": 0.53, - "learning_rate": 1.8887013170166508e-06, - "loss": 1.1475, - "step": 20725 - }, - { - "epoch": 0.53, - "learning_rate": 1.8886886301439023e-06, - "loss": 0.7412, - "step": 20726 - }, - { - "epoch": 0.53, - "learning_rate": 1.8886759425907256e-06, - "loss": 1.0068, - "step": 20727 - }, - { - "epoch": 0.53, - "learning_rate": 1.888663254357131e-06, - "loss": 0.8955, - "step": 20728 - }, - { - "epoch": 0.53, - "learning_rate": 1.8886505654431276e-06, - "loss": 0.7101, - "step": 20729 - }, - { - "epoch": 0.53, - "learning_rate": 1.8886378758487252e-06, - "loss": 0.8877, - "step": 20730 - }, - { - "epoch": 0.53, - "learning_rate": 1.8886251855739336e-06, - "loss": 0.6079, - "step": 20731 - }, - { - "epoch": 0.53, - "learning_rate": 1.8886124946187629e-06, - "loss": 0.9092, - "step": 20732 - }, - { - "epoch": 0.53, - "learning_rate": 1.8885998029832222e-06, - "loss": 0.9424, - "step": 20733 - }, - { - "epoch": 0.53, - "learning_rate": 1.8885871106673216e-06, - "loss": 0.9785, - "step": 20734 - }, - { - "epoch": 0.53, - "learning_rate": 1.8885744176710708e-06, - "loss": 0.9854, - "step": 20735 - }, - { - "epoch": 0.53, - "learning_rate": 1.8885617239944793e-06, - "loss": 0.9678, - "step": 20736 - }, - { - "epoch": 0.53, - "learning_rate": 1.8885490296375571e-06, - "loss": 0.8984, - "step": 20737 - }, - { - "epoch": 0.53, - "learning_rate": 1.8885363346003133e-06, - "loss": 0.6499, - "step": 20738 - }, - { - "epoch": 0.53, - "learning_rate": 1.8885236388827587e-06, - "loss": 0.7158, - "step": 20739 - }, - { - "epoch": 0.53, - "learning_rate": 1.888510942484902e-06, - "loss": 0.8452, - "step": 20740 - }, - { - "epoch": 0.53, - "learning_rate": 1.8884982454067534e-06, - "loss": 0.8237, - "step": 20741 - }, - { - "epoch": 0.53, - "learning_rate": 1.8884855476483226e-06, - "loss": 1.1162, - "step": 20742 - }, - { - "epoch": 0.53, - "learning_rate": 1.8884728492096191e-06, - "loss": 0.998, - "step": 20743 - }, - { - "epoch": 0.53, - "learning_rate": 1.888460150090653e-06, - "loss": 0.9697, - "step": 20744 - }, - { - "epoch": 0.53, - "learning_rate": 1.8884474502914337e-06, - "loss": 0.9043, - "step": 20745 - }, - { - "epoch": 0.53, - "learning_rate": 1.8884347498119712e-06, - "loss": 1.0244, - "step": 20746 - }, - { - "epoch": 0.53, - "learning_rate": 1.8884220486522748e-06, - "loss": 0.8594, - "step": 20747 - }, - { - "epoch": 0.53, - "learning_rate": 1.888409346812355e-06, - "loss": 0.8867, - "step": 20748 - }, - { - "epoch": 0.53, - "learning_rate": 1.8883966442922205e-06, - "loss": 0.7334, - "step": 20749 - }, - { - "epoch": 0.53, - "learning_rate": 1.8883839410918818e-06, - "loss": 0.8232, - "step": 20750 - }, - { - "epoch": 0.53, - "learning_rate": 1.888371237211348e-06, - "loss": 0.6279, - "step": 20751 - }, - { - "epoch": 0.53, - "learning_rate": 1.8883585326506294e-06, - "loss": 0.7246, - "step": 20752 - }, - { - "epoch": 0.53, - "learning_rate": 1.888345827409736e-06, - "loss": 0.8428, - "step": 20753 - }, - { - "epoch": 0.53, - "learning_rate": 1.8883331214886764e-06, - "loss": 1.0576, - "step": 20754 - }, - { - "epoch": 0.53, - "learning_rate": 1.8883204148874613e-06, - "loss": 0.9102, - "step": 20755 - }, - { - "epoch": 0.53, - "learning_rate": 1.8883077076061e-06, - "loss": 0.7744, - "step": 20756 - }, - { - "epoch": 0.53, - "learning_rate": 1.8882949996446022e-06, - "loss": 0.6914, - "step": 20757 - }, - { - "epoch": 0.53, - "learning_rate": 1.8882822910029778e-06, - "loss": 0.7539, - "step": 20758 - }, - { - "epoch": 0.53, - "learning_rate": 1.8882695816812367e-06, - "loss": 0.9307, - "step": 20759 - }, - { - "epoch": 0.53, - "learning_rate": 1.8882568716793883e-06, - "loss": 0.8682, - "step": 20760 - }, - { - "epoch": 0.53, - "learning_rate": 1.8882441609974426e-06, - "loss": 0.8105, - "step": 20761 - }, - { - "epoch": 0.53, - "learning_rate": 1.888231449635409e-06, - "loss": 0.7563, - "step": 20762 - }, - { - "epoch": 0.53, - "learning_rate": 1.8882187375932977e-06, - "loss": 0.5674, - "step": 20763 - }, - { - "epoch": 0.53, - "learning_rate": 1.8882060248711177e-06, - "loss": 0.7832, - "step": 20764 - }, - { - "epoch": 0.53, - "learning_rate": 1.8881933114688795e-06, - "loss": 0.8486, - "step": 20765 - }, - { - "epoch": 0.53, - "learning_rate": 1.8881805973865926e-06, - "loss": 0.7026, - "step": 20766 - }, - { - "epoch": 0.53, - "learning_rate": 1.8881678826242664e-06, - "loss": 0.7117, - "step": 20767 - }, - { - "epoch": 0.53, - "learning_rate": 1.8881551671819112e-06, - "loss": 0.7461, - "step": 20768 - }, - { - "epoch": 0.53, - "learning_rate": 1.8881424510595362e-06, - "loss": 0.8701, - "step": 20769 - }, - { - "epoch": 0.53, - "learning_rate": 1.8881297342571512e-06, - "loss": 0.9795, - "step": 20770 - }, - { - "epoch": 0.53, - "learning_rate": 1.8881170167747663e-06, - "loss": 0.7715, - "step": 20771 - }, - { - "epoch": 0.53, - "learning_rate": 1.888104298612391e-06, - "loss": 0.8379, - "step": 20772 - }, - { - "epoch": 0.53, - "learning_rate": 1.8880915797700351e-06, - "loss": 0.9248, - "step": 20773 - }, - { - "epoch": 0.53, - "learning_rate": 1.8880788602477082e-06, - "loss": 1.0547, - "step": 20774 - }, - { - "epoch": 0.53, - "learning_rate": 1.8880661400454204e-06, - "loss": 1.0127, - "step": 20775 - }, - { - "epoch": 0.53, - "learning_rate": 1.8880534191631812e-06, - "loss": 0.8228, - "step": 20776 - }, - { - "epoch": 0.53, - "learning_rate": 1.888040697601e-06, - "loss": 0.749, - "step": 20777 - }, - { - "epoch": 0.53, - "learning_rate": 1.8880279753588871e-06, - "loss": 0.8857, - "step": 20778 - }, - { - "epoch": 0.53, - "learning_rate": 1.888015252436852e-06, - "loss": 0.9258, - "step": 20779 - }, - { - "epoch": 0.53, - "learning_rate": 1.8880025288349043e-06, - "loss": 0.8555, - "step": 20780 - }, - { - "epoch": 0.53, - "learning_rate": 1.8879898045530541e-06, - "loss": 0.9346, - "step": 20781 - }, - { - "epoch": 0.53, - "learning_rate": 1.8879770795913109e-06, - "loss": 1.0801, - "step": 20782 - }, - { - "epoch": 0.53, - "learning_rate": 1.8879643539496844e-06, - "loss": 0.876, - "step": 20783 - }, - { - "epoch": 0.53, - "learning_rate": 1.8879516276281846e-06, - "loss": 0.8535, - "step": 20784 - }, - { - "epoch": 0.53, - "learning_rate": 1.8879389006268207e-06, - "loss": 0.7334, - "step": 20785 - }, - { - "epoch": 0.53, - "learning_rate": 1.887926172945603e-06, - "loss": 0.7646, - "step": 20786 - }, - { - "epoch": 0.53, - "learning_rate": 1.8879134445845413e-06, - "loss": 0.708, - "step": 20787 - }, - { - "epoch": 0.53, - "learning_rate": 1.887900715543645e-06, - "loss": 0.6958, - "step": 20788 - }, - { - "epoch": 0.53, - "learning_rate": 1.8878879858229237e-06, - "loss": 0.8125, - "step": 20789 - }, - { - "epoch": 0.53, - "learning_rate": 1.8878752554223875e-06, - "loss": 1.1426, - "step": 20790 - }, - { - "epoch": 0.53, - "learning_rate": 1.887862524342046e-06, - "loss": 0.9355, - "step": 20791 - }, - { - "epoch": 0.53, - "learning_rate": 1.887849792581909e-06, - "loss": 0.8887, - "step": 20792 - }, - { - "epoch": 0.53, - "learning_rate": 1.8878370601419866e-06, - "loss": 0.6104, - "step": 20793 - }, - { - "epoch": 0.53, - "learning_rate": 1.8878243270222878e-06, - "loss": 0.8994, - "step": 20794 - }, - { - "epoch": 0.53, - "learning_rate": 1.887811593222823e-06, - "loss": 0.8315, - "step": 20795 - }, - { - "epoch": 0.53, - "learning_rate": 1.8877988587436014e-06, - "loss": 0.5879, - "step": 20796 - }, - { - "epoch": 0.53, - "learning_rate": 1.887786123584633e-06, - "loss": 0.9678, - "step": 20797 - }, - { - "epoch": 0.53, - "learning_rate": 1.8877733877459278e-06, - "loss": 0.9604, - "step": 20798 - }, - { - "epoch": 0.53, - "learning_rate": 1.8877606512274955e-06, - "loss": 0.7473, - "step": 20799 - }, - { - "epoch": 0.53, - "learning_rate": 1.8877479140293454e-06, - "loss": 1.0176, - "step": 20800 - }, - { - "epoch": 0.53, - "learning_rate": 1.8877351761514875e-06, - "loss": 0.8623, - "step": 20801 - }, - { - "epoch": 0.53, - "learning_rate": 1.8877224375939318e-06, - "loss": 1.1006, - "step": 20802 - }, - { - "epoch": 0.53, - "learning_rate": 1.8877096983566877e-06, - "loss": 0.8208, - "step": 20803 - }, - { - "epoch": 0.53, - "learning_rate": 1.8876969584397652e-06, - "loss": 0.7671, - "step": 20804 - }, - { - "epoch": 0.53, - "learning_rate": 1.8876842178431738e-06, - "loss": 1.0713, - "step": 20805 - }, - { - "epoch": 0.53, - "learning_rate": 1.8876714765669236e-06, - "loss": 0.9717, - "step": 20806 - }, - { - "epoch": 0.53, - "learning_rate": 1.887658734611024e-06, - "loss": 0.5967, - "step": 20807 - }, - { - "epoch": 0.53, - "learning_rate": 1.8876459919754853e-06, - "loss": 1.0049, - "step": 20808 - }, - { - "epoch": 0.53, - "learning_rate": 1.8876332486603164e-06, - "loss": 0.7153, - "step": 20809 - }, - { - "epoch": 0.53, - "learning_rate": 1.8876205046655277e-06, - "loss": 0.8628, - "step": 20810 - }, - { - "epoch": 0.53, - "learning_rate": 1.887607759991129e-06, - "loss": 0.9062, - "step": 20811 - }, - { - "epoch": 0.53, - "learning_rate": 1.8875950146371296e-06, - "loss": 0.8125, - "step": 20812 - }, - { - "epoch": 0.53, - "learning_rate": 1.8875822686035393e-06, - "loss": 1.1094, - "step": 20813 - }, - { - "epoch": 0.53, - "learning_rate": 1.8875695218903687e-06, - "loss": 0.9893, - "step": 20814 - }, - { - "epoch": 0.53, - "learning_rate": 1.8875567744976264e-06, - "loss": 0.7197, - "step": 20815 - }, - { - "epoch": 0.53, - "learning_rate": 1.887544026425323e-06, - "loss": 1.1982, - "step": 20816 - }, - { - "epoch": 0.53, - "learning_rate": 1.8875312776734678e-06, - "loss": 0.9961, - "step": 20817 - }, - { - "epoch": 0.53, - "learning_rate": 1.8875185282420706e-06, - "loss": 0.9736, - "step": 20818 - }, - { - "epoch": 0.53, - "learning_rate": 1.8875057781311416e-06, - "loss": 1.001, - "step": 20819 - }, - { - "epoch": 0.53, - "learning_rate": 1.88749302734069e-06, - "loss": 0.6958, - "step": 20820 - }, - { - "epoch": 0.53, - "learning_rate": 1.8874802758707258e-06, - "loss": 0.833, - "step": 20821 - }, - { - "epoch": 0.53, - "learning_rate": 1.8874675237212587e-06, - "loss": 1.0625, - "step": 20822 - }, - { - "epoch": 0.53, - "learning_rate": 1.8874547708922988e-06, - "loss": 0.9385, - "step": 20823 - }, - { - "epoch": 0.53, - "learning_rate": 1.8874420173838552e-06, - "loss": 0.8516, - "step": 20824 - }, - { - "epoch": 0.53, - "learning_rate": 1.8874292631959383e-06, - "loss": 0.5698, - "step": 20825 - }, - { - "epoch": 0.53, - "learning_rate": 1.8874165083285578e-06, - "loss": 0.7705, - "step": 20826 - }, - { - "epoch": 0.53, - "learning_rate": 1.887403752781723e-06, - "loss": 0.9512, - "step": 20827 - }, - { - "epoch": 0.53, - "learning_rate": 1.887390996555444e-06, - "loss": 0.9902, - "step": 20828 - }, - { - "epoch": 0.53, - "learning_rate": 1.8873782396497305e-06, - "loss": 0.8828, - "step": 20829 - }, - { - "epoch": 0.53, - "learning_rate": 1.8873654820645923e-06, - "loss": 0.8975, - "step": 20830 - }, - { - "epoch": 0.53, - "learning_rate": 1.8873527238000392e-06, - "loss": 0.9863, - "step": 20831 - }, - { - "epoch": 0.53, - "learning_rate": 1.8873399648560808e-06, - "loss": 0.8896, - "step": 20832 - }, - { - "epoch": 0.53, - "learning_rate": 1.8873272052327272e-06, - "loss": 0.8652, - "step": 20833 - }, - { - "epoch": 0.53, - "learning_rate": 1.8873144449299878e-06, - "loss": 0.9629, - "step": 20834 - }, - { - "epoch": 0.53, - "learning_rate": 1.8873016839478724e-06, - "loss": 0.8809, - "step": 20835 - }, - { - "epoch": 0.53, - "learning_rate": 1.8872889222863911e-06, - "loss": 0.8379, - "step": 20836 - }, - { - "epoch": 0.53, - "learning_rate": 1.8872761599455536e-06, - "loss": 0.6436, - "step": 20837 - }, - { - "epoch": 0.53, - "learning_rate": 1.8872633969253692e-06, - "loss": 0.7651, - "step": 20838 - }, - { - "epoch": 0.53, - "learning_rate": 1.8872506332258485e-06, - "loss": 0.7939, - "step": 20839 - }, - { - "epoch": 0.53, - "learning_rate": 1.8872378688470004e-06, - "loss": 0.8477, - "step": 20840 - }, - { - "epoch": 0.53, - "learning_rate": 1.8872251037888352e-06, - "loss": 0.6851, - "step": 20841 - }, - { - "epoch": 0.53, - "learning_rate": 1.8872123380513624e-06, - "loss": 1.0781, - "step": 20842 - }, - { - "epoch": 0.53, - "learning_rate": 1.887199571634592e-06, - "loss": 0.9277, - "step": 20843 - }, - { - "epoch": 0.53, - "learning_rate": 1.8871868045385335e-06, - "loss": 1.0449, - "step": 20844 - }, - { - "epoch": 0.53, - "learning_rate": 1.8871740367631972e-06, - "loss": 0.8457, - "step": 20845 - }, - { - "epoch": 0.53, - "learning_rate": 1.8871612683085923e-06, - "loss": 0.7395, - "step": 20846 - }, - { - "epoch": 0.53, - "learning_rate": 1.8871484991747289e-06, - "loss": 0.7156, - "step": 20847 - }, - { - "epoch": 0.53, - "learning_rate": 1.8871357293616166e-06, - "loss": 0.8271, - "step": 20848 - }, - { - "epoch": 0.53, - "learning_rate": 1.8871229588692654e-06, - "loss": 0.9766, - "step": 20849 - }, - { - "epoch": 0.53, - "learning_rate": 1.8871101876976846e-06, - "loss": 1.0391, - "step": 20850 - }, - { - "epoch": 0.53, - "learning_rate": 1.8870974158468847e-06, - "loss": 0.873, - "step": 20851 - }, - { - "epoch": 0.53, - "learning_rate": 1.887084643316875e-06, - "loss": 1.0391, - "step": 20852 - }, - { - "epoch": 0.53, - "learning_rate": 1.8870718701076654e-06, - "loss": 0.8672, - "step": 20853 - }, - { - "epoch": 0.53, - "learning_rate": 1.8870590962192657e-06, - "loss": 0.7539, - "step": 20854 - }, - { - "epoch": 0.53, - "learning_rate": 1.8870463216516854e-06, - "loss": 0.8535, - "step": 20855 - }, - { - "epoch": 0.53, - "learning_rate": 1.8870335464049347e-06, - "loss": 0.9141, - "step": 20856 - }, - { - "epoch": 0.53, - "learning_rate": 1.8870207704790232e-06, - "loss": 0.9092, - "step": 20857 - }, - { - "epoch": 0.53, - "learning_rate": 1.8870079938739605e-06, - "loss": 1.0459, - "step": 20858 - }, - { - "epoch": 0.53, - "learning_rate": 1.886995216589757e-06, - "loss": 0.6069, - "step": 20859 - }, - { - "epoch": 0.53, - "learning_rate": 1.8869824386264214e-06, - "loss": 0.9707, - "step": 20860 - }, - { - "epoch": 0.53, - "learning_rate": 1.8869696599839648e-06, - "loss": 0.7627, - "step": 20861 - }, - { - "epoch": 0.53, - "learning_rate": 1.8869568806623958e-06, - "loss": 0.999, - "step": 20862 - }, - { - "epoch": 0.53, - "learning_rate": 1.886944100661725e-06, - "loss": 0.7314, - "step": 20863 - }, - { - "epoch": 0.53, - "learning_rate": 1.8869313199819618e-06, - "loss": 0.9502, - "step": 20864 - }, - { - "epoch": 0.53, - "learning_rate": 1.8869185386231162e-06, - "loss": 1.0547, - "step": 20865 - }, - { - "epoch": 0.53, - "learning_rate": 1.8869057565851975e-06, - "loss": 0.8374, - "step": 20866 - }, - { - "epoch": 0.53, - "learning_rate": 1.8868929738682163e-06, - "loss": 0.8779, - "step": 20867 - }, - { - "epoch": 0.53, - "learning_rate": 1.8868801904721817e-06, - "loss": 0.8525, - "step": 20868 - }, - { - "epoch": 0.53, - "learning_rate": 1.8868674063971035e-06, - "loss": 0.9761, - "step": 20869 - }, - { - "epoch": 0.53, - "learning_rate": 1.8868546216429922e-06, - "loss": 0.8994, - "step": 20870 - }, - { - "epoch": 0.53, - "learning_rate": 1.8868418362098567e-06, - "loss": 0.9102, - "step": 20871 - }, - { - "epoch": 0.53, - "learning_rate": 1.8868290500977074e-06, - "loss": 0.8252, - "step": 20872 - }, - { - "epoch": 0.53, - "learning_rate": 1.8868162633065536e-06, - "loss": 0.8101, - "step": 20873 - }, - { - "epoch": 0.54, - "learning_rate": 1.8868034758364055e-06, - "loss": 0.834, - "step": 20874 - }, - { - "epoch": 0.54, - "learning_rate": 1.8867906876872729e-06, - "loss": 1.0625, - "step": 20875 - }, - { - "epoch": 0.54, - "learning_rate": 1.8867778988591652e-06, - "loss": 0.7192, - "step": 20876 - }, - { - "epoch": 0.54, - "learning_rate": 1.8867651093520926e-06, - "loss": 0.8521, - "step": 20877 - }, - { - "epoch": 0.54, - "learning_rate": 1.8867523191660646e-06, - "loss": 0.752, - "step": 20878 - }, - { - "epoch": 0.54, - "learning_rate": 1.8867395283010913e-06, - "loss": 0.8291, - "step": 20879 - }, - { - "epoch": 0.54, - "learning_rate": 1.886726736757182e-06, - "loss": 0.876, - "step": 20880 - }, - { - "epoch": 0.54, - "learning_rate": 1.8867139445343474e-06, - "loss": 0.749, - "step": 20881 - }, - { - "epoch": 0.54, - "learning_rate": 1.8867011516325963e-06, - "loss": 0.9424, - "step": 20882 - }, - { - "epoch": 0.54, - "learning_rate": 1.886688358051939e-06, - "loss": 1.0254, - "step": 20883 - }, - { - "epoch": 0.54, - "learning_rate": 1.886675563792385e-06, - "loss": 0.8799, - "step": 20884 - }, - { - "epoch": 0.54, - "learning_rate": 1.8866627688539446e-06, - "loss": 0.5381, - "step": 20885 - }, - { - "epoch": 0.54, - "learning_rate": 1.886649973236627e-06, - "loss": 0.9297, - "step": 20886 - }, - { - "epoch": 0.54, - "learning_rate": 1.8866371769404425e-06, - "loss": 0.9019, - "step": 20887 - }, - { - "epoch": 0.54, - "learning_rate": 1.8866243799654006e-06, - "loss": 0.7104, - "step": 20888 - }, - { - "epoch": 0.54, - "learning_rate": 1.8866115823115111e-06, - "loss": 0.5493, - "step": 20889 - }, - { - "epoch": 0.54, - "learning_rate": 1.8865987839787843e-06, - "loss": 0.6924, - "step": 20890 - }, - { - "epoch": 0.54, - "learning_rate": 1.8865859849672289e-06, - "loss": 1.1152, - "step": 20891 - }, - { - "epoch": 0.54, - "learning_rate": 1.8865731852768558e-06, - "loss": 0.8994, - "step": 20892 - }, - { - "epoch": 0.54, - "learning_rate": 1.8865603849076743e-06, - "loss": 0.9072, - "step": 20893 - }, - { - "epoch": 0.54, - "learning_rate": 1.8865475838596942e-06, - "loss": 0.8682, - "step": 20894 - }, - { - "epoch": 0.54, - "learning_rate": 1.8865347821329255e-06, - "loss": 0.9854, - "step": 20895 - }, - { - "epoch": 0.54, - "learning_rate": 1.886521979727378e-06, - "loss": 0.9375, - "step": 20896 - }, - { - "epoch": 0.54, - "learning_rate": 1.8865091766430612e-06, - "loss": 0.7891, - "step": 20897 - }, - { - "epoch": 0.54, - "learning_rate": 1.886496372879985e-06, - "loss": 0.9434, - "step": 20898 - }, - { - "epoch": 0.54, - "learning_rate": 1.8864835684381595e-06, - "loss": 1.0557, - "step": 20899 - }, - { - "epoch": 0.54, - "learning_rate": 1.886470763317594e-06, - "loss": 0.8408, - "step": 20900 - }, - { - "epoch": 0.54, - "learning_rate": 1.8864579575182987e-06, - "loss": 1.0117, - "step": 20901 - }, - { - "epoch": 0.54, - "learning_rate": 1.8864451510402835e-06, - "loss": 0.8965, - "step": 20902 - }, - { - "epoch": 0.54, - "learning_rate": 1.886432343883558e-06, - "loss": 0.8857, - "step": 20903 - }, - { - "epoch": 0.54, - "learning_rate": 1.8864195360481318e-06, - "loss": 0.8066, - "step": 20904 - }, - { - "epoch": 0.54, - "learning_rate": 1.886406727534015e-06, - "loss": 0.793, - "step": 20905 - }, - { - "epoch": 0.54, - "learning_rate": 1.8863939183412175e-06, - "loss": 0.731, - "step": 20906 - }, - { - "epoch": 0.54, - "learning_rate": 1.8863811084697487e-06, - "loss": 0.9326, - "step": 20907 - }, - { - "epoch": 0.54, - "learning_rate": 1.8863682979196187e-06, - "loss": 0.7109, - "step": 20908 - }, - { - "epoch": 0.54, - "learning_rate": 1.8863554866908373e-06, - "loss": 0.8135, - "step": 20909 - }, - { - "epoch": 0.54, - "learning_rate": 1.8863426747834143e-06, - "loss": 0.9072, - "step": 20910 - }, - { - "epoch": 0.54, - "learning_rate": 1.8863298621973595e-06, - "loss": 0.7339, - "step": 20911 - }, - { - "epoch": 0.54, - "learning_rate": 1.8863170489326824e-06, - "loss": 0.9316, - "step": 20912 - }, - { - "epoch": 0.54, - "learning_rate": 1.8863042349893933e-06, - "loss": 0.9111, - "step": 20913 - }, - { - "epoch": 0.54, - "learning_rate": 1.886291420367502e-06, - "loss": 0.6521, - "step": 20914 - }, - { - "epoch": 0.54, - "learning_rate": 1.8862786050670177e-06, - "loss": 0.874, - "step": 20915 - }, - { - "epoch": 0.54, - "learning_rate": 1.8862657890879508e-06, - "loss": 1.0205, - "step": 20916 - }, - { - "epoch": 0.54, - "learning_rate": 1.886252972430311e-06, - "loss": 0.8506, - "step": 20917 - }, - { - "epoch": 0.54, - "learning_rate": 1.886240155094108e-06, - "loss": 0.7695, - "step": 20918 - }, - { - "epoch": 0.54, - "learning_rate": 1.8862273370793517e-06, - "loss": 0.7549, - "step": 20919 - }, - { - "epoch": 0.54, - "learning_rate": 1.8862145183860518e-06, - "loss": 0.8057, - "step": 20920 - }, - { - "epoch": 0.54, - "learning_rate": 1.8862016990142183e-06, - "loss": 0.7361, - "step": 20921 - }, - { - "epoch": 0.54, - "learning_rate": 1.886188878963861e-06, - "loss": 0.8662, - "step": 20922 - }, - { - "epoch": 0.54, - "learning_rate": 1.8861760582349892e-06, - "loss": 1.0508, - "step": 20923 - }, - { - "epoch": 0.54, - "learning_rate": 1.8861632368276135e-06, - "loss": 0.8721, - "step": 20924 - }, - { - "epoch": 0.54, - "learning_rate": 1.8861504147417433e-06, - "loss": 0.7222, - "step": 20925 - }, - { - "epoch": 0.54, - "learning_rate": 1.8861375919773885e-06, - "loss": 0.7041, - "step": 20926 - }, - { - "epoch": 0.54, - "learning_rate": 1.8861247685345588e-06, - "loss": 0.7861, - "step": 20927 - }, - { - "epoch": 0.54, - "learning_rate": 1.8861119444132641e-06, - "loss": 0.9609, - "step": 20928 - }, - { - "epoch": 0.54, - "learning_rate": 1.8860991196135143e-06, - "loss": 0.9248, - "step": 20929 - }, - { - "epoch": 0.54, - "learning_rate": 1.886086294135319e-06, - "loss": 1.0195, - "step": 20930 - }, - { - "epoch": 0.54, - "learning_rate": 1.8860734679786884e-06, - "loss": 0.821, - "step": 20931 - }, - { - "epoch": 0.54, - "learning_rate": 1.8860606411436319e-06, - "loss": 0.9814, - "step": 20932 - }, - { - "epoch": 0.54, - "learning_rate": 1.8860478136301596e-06, - "loss": 0.8984, - "step": 20933 - }, - { - "epoch": 0.54, - "learning_rate": 1.886034985438281e-06, - "loss": 0.9092, - "step": 20934 - }, - { - "epoch": 0.54, - "learning_rate": 1.8860221565680065e-06, - "loss": 1.0605, - "step": 20935 - }, - { - "epoch": 0.54, - "learning_rate": 1.8860093270193453e-06, - "loss": 0.9316, - "step": 20936 - }, - { - "epoch": 0.54, - "learning_rate": 1.8859964967923079e-06, - "loss": 0.8975, - "step": 20937 - }, - { - "epoch": 0.54, - "learning_rate": 1.8859836658869032e-06, - "loss": 0.8779, - "step": 20938 - }, - { - "epoch": 0.54, - "learning_rate": 1.885970834303142e-06, - "loss": 0.8711, - "step": 20939 - }, - { - "epoch": 0.54, - "learning_rate": 1.8859580020410336e-06, - "loss": 0.9902, - "step": 20940 - }, - { - "epoch": 0.54, - "learning_rate": 1.8859451691005876e-06, - "loss": 0.7231, - "step": 20941 - }, - { - "epoch": 0.54, - "learning_rate": 1.8859323354818145e-06, - "loss": 0.7969, - "step": 20942 - }, - { - "epoch": 0.54, - "learning_rate": 1.8859195011847234e-06, - "loss": 1.0596, - "step": 20943 - }, - { - "epoch": 0.54, - "learning_rate": 1.8859066662093246e-06, - "loss": 0.6553, - "step": 20944 - }, - { - "epoch": 0.54, - "learning_rate": 1.8858938305556279e-06, - "loss": 0.6865, - "step": 20945 - }, - { - "epoch": 0.54, - "learning_rate": 1.8858809942236429e-06, - "loss": 0.7466, - "step": 20946 - }, - { - "epoch": 0.54, - "learning_rate": 1.8858681572133795e-06, - "loss": 0.8486, - "step": 20947 - }, - { - "epoch": 0.54, - "learning_rate": 1.8858553195248477e-06, - "loss": 0.9502, - "step": 20948 - }, - { - "epoch": 0.54, - "learning_rate": 1.885842481158057e-06, - "loss": 0.7354, - "step": 20949 - }, - { - "epoch": 0.54, - "learning_rate": 1.8858296421130179e-06, - "loss": 0.8994, - "step": 20950 - }, - { - "epoch": 0.54, - "learning_rate": 1.8858168023897395e-06, - "loss": 0.8911, - "step": 20951 - }, - { - "epoch": 0.54, - "learning_rate": 1.8858039619882317e-06, - "loss": 1.0059, - "step": 20952 - }, - { - "epoch": 0.54, - "learning_rate": 1.885791120908505e-06, - "loss": 0.9932, - "step": 20953 - }, - { - "epoch": 0.54, - "learning_rate": 1.8857782791505685e-06, - "loss": 0.6992, - "step": 20954 - }, - { - "epoch": 0.54, - "learning_rate": 1.8857654367144323e-06, - "loss": 0.834, - "step": 20955 - }, - { - "epoch": 0.54, - "learning_rate": 1.8857525936001064e-06, - "loss": 0.8926, - "step": 20956 - }, - { - "epoch": 0.54, - "learning_rate": 1.8857397498076003e-06, - "loss": 0.9795, - "step": 20957 - }, - { - "epoch": 0.54, - "learning_rate": 1.885726905336924e-06, - "loss": 0.9648, - "step": 20958 - }, - { - "epoch": 0.54, - "learning_rate": 1.8857140601880875e-06, - "loss": 0.8716, - "step": 20959 - }, - { - "epoch": 0.54, - "learning_rate": 1.8857012143611003e-06, - "loss": 0.9121, - "step": 20960 - }, - { - "epoch": 0.54, - "learning_rate": 1.8856883678559724e-06, - "loss": 0.835, - "step": 20961 - }, - { - "epoch": 0.54, - "learning_rate": 1.8856755206727137e-06, - "loss": 0.7031, - "step": 20962 - }, - { - "epoch": 0.54, - "learning_rate": 1.8856626728113338e-06, - "loss": 0.7812, - "step": 20963 - }, - { - "epoch": 0.54, - "learning_rate": 1.885649824271843e-06, - "loss": 0.8354, - "step": 20964 - }, - { - "epoch": 0.54, - "learning_rate": 1.8856369750542507e-06, - "loss": 0.8647, - "step": 20965 - }, - { - "epoch": 0.54, - "learning_rate": 1.8856241251585668e-06, - "loss": 0.7339, - "step": 20966 - }, - { - "epoch": 0.54, - "learning_rate": 1.8856112745848013e-06, - "loss": 1.0273, - "step": 20967 - }, - { - "epoch": 0.54, - "learning_rate": 1.885598423332964e-06, - "loss": 0.7178, - "step": 20968 - }, - { - "epoch": 0.54, - "learning_rate": 1.885585571403065e-06, - "loss": 0.9648, - "step": 20969 - }, - { - "epoch": 0.54, - "learning_rate": 1.8855727187951134e-06, - "loss": 0.9473, - "step": 20970 - }, - { - "epoch": 0.54, - "learning_rate": 1.8855598655091195e-06, - "loss": 0.9619, - "step": 20971 - }, - { - "epoch": 0.54, - "learning_rate": 1.8855470115450936e-06, - "loss": 1.0039, - "step": 20972 - }, - { - "epoch": 0.54, - "learning_rate": 1.8855341569030445e-06, - "loss": 0.6333, - "step": 20973 - }, - { - "epoch": 0.54, - "learning_rate": 1.885521301582983e-06, - "loss": 0.6953, - "step": 20974 - }, - { - "epoch": 0.54, - "learning_rate": 1.8855084455849184e-06, - "loss": 0.9697, - "step": 20975 - }, - { - "epoch": 0.54, - "learning_rate": 1.885495588908861e-06, - "loss": 0.9834, - "step": 20976 - }, - { - "epoch": 0.54, - "learning_rate": 1.8854827315548198e-06, - "loss": 0.9941, - "step": 20977 - }, - { - "epoch": 0.54, - "learning_rate": 1.8854698735228055e-06, - "loss": 0.9658, - "step": 20978 - }, - { - "epoch": 0.54, - "learning_rate": 1.8854570148128276e-06, - "loss": 0.8379, - "step": 20979 - }, - { - "epoch": 0.54, - "learning_rate": 1.885444155424896e-06, - "loss": 0.7451, - "step": 20980 - }, - { - "epoch": 0.54, - "learning_rate": 1.8854312953590203e-06, - "loss": 0.7695, - "step": 20981 - }, - { - "epoch": 0.54, - "learning_rate": 1.885418434615211e-06, - "loss": 0.7461, - "step": 20982 - }, - { - "epoch": 0.54, - "learning_rate": 1.8854055731934773e-06, - "loss": 0.646, - "step": 20983 - }, - { - "epoch": 0.54, - "learning_rate": 1.8853927110938293e-06, - "loss": 0.9634, - "step": 20984 - }, - { - "epoch": 0.54, - "learning_rate": 1.8853798483162765e-06, - "loss": 0.9121, - "step": 20985 - }, - { - "epoch": 0.54, - "learning_rate": 1.8853669848608295e-06, - "loss": 0.8389, - "step": 20986 - }, - { - "epoch": 0.54, - "learning_rate": 1.8853541207274977e-06, - "loss": 0.8047, - "step": 20987 - }, - { - "epoch": 0.54, - "learning_rate": 1.8853412559162906e-06, - "loss": 0.8818, - "step": 20988 - }, - { - "epoch": 0.54, - "learning_rate": 1.885328390427219e-06, - "loss": 1.0039, - "step": 20989 - }, - { - "epoch": 0.54, - "learning_rate": 1.8853155242602915e-06, - "loss": 0.9629, - "step": 20990 - }, - { - "epoch": 0.54, - "learning_rate": 1.8853026574155186e-06, - "loss": 0.5752, - "step": 20991 - }, - { - "epoch": 0.54, - "learning_rate": 1.8852897898929107e-06, - "loss": 0.9053, - "step": 20992 - }, - { - "epoch": 0.54, - "learning_rate": 1.8852769216924768e-06, - "loss": 1.2109, - "step": 20993 - }, - { - "epoch": 0.54, - "learning_rate": 1.885264052814227e-06, - "loss": 0.9307, - "step": 20994 - }, - { - "epoch": 0.54, - "learning_rate": 1.8852511832581714e-06, - "loss": 1.0078, - "step": 20995 - }, - { - "epoch": 0.54, - "learning_rate": 1.8852383130243197e-06, - "loss": 0.8494, - "step": 20996 - }, - { - "epoch": 0.54, - "learning_rate": 1.8852254421126816e-06, - "loss": 0.6162, - "step": 20997 - }, - { - "epoch": 0.54, - "learning_rate": 1.8852125705232671e-06, - "loss": 0.9805, - "step": 20998 - }, - { - "epoch": 0.54, - "learning_rate": 1.885199698256086e-06, - "loss": 0.7529, - "step": 20999 - }, - { - "epoch": 0.54, - "learning_rate": 1.8851868253111482e-06, - "loss": 0.707, - "step": 21000 - }, - { - "epoch": 0.54, - "learning_rate": 1.885173951688464e-06, - "loss": 0.811, - "step": 21001 - }, - { - "epoch": 0.54, - "learning_rate": 1.8851610773880422e-06, - "loss": 0.8701, - "step": 21002 - }, - { - "epoch": 0.54, - "learning_rate": 1.8851482024098935e-06, - "loss": 0.8428, - "step": 21003 - }, - { - "epoch": 0.54, - "learning_rate": 1.8851353267540272e-06, - "loss": 0.7598, - "step": 21004 - }, - { - "epoch": 0.54, - "learning_rate": 1.8851224504204541e-06, - "loss": 0.8232, - "step": 21005 - }, - { - "epoch": 0.54, - "learning_rate": 1.885109573409183e-06, - "loss": 0.9072, - "step": 21006 - }, - { - "epoch": 0.54, - "learning_rate": 1.8850966957202244e-06, - "loss": 0.5154, - "step": 21007 - }, - { - "epoch": 0.54, - "learning_rate": 1.885083817353588e-06, - "loss": 0.8423, - "step": 21008 - }, - { - "epoch": 0.54, - "learning_rate": 1.8850709383092833e-06, - "loss": 0.9116, - "step": 21009 - }, - { - "epoch": 0.54, - "learning_rate": 1.8850580585873206e-06, - "loss": 0.8267, - "step": 21010 - }, - { - "epoch": 0.54, - "learning_rate": 1.8850451781877096e-06, - "loss": 0.8984, - "step": 21011 - }, - { - "epoch": 0.54, - "learning_rate": 1.8850322971104604e-06, - "loss": 1.0732, - "step": 21012 - }, - { - "epoch": 0.54, - "learning_rate": 1.8850194153555827e-06, - "loss": 0.8545, - "step": 21013 - }, - { - "epoch": 0.54, - "learning_rate": 1.8850065329230863e-06, - "loss": 0.79, - "step": 21014 - }, - { - "epoch": 0.54, - "learning_rate": 1.8849936498129808e-06, - "loss": 0.639, - "step": 21015 - }, - { - "epoch": 0.54, - "learning_rate": 1.8849807660252766e-06, - "loss": 0.8677, - "step": 21016 - }, - { - "epoch": 0.54, - "learning_rate": 1.8849678815599834e-06, - "loss": 0.6743, - "step": 21017 - }, - { - "epoch": 0.54, - "learning_rate": 1.884954996417111e-06, - "loss": 0.8779, - "step": 21018 - }, - { - "epoch": 0.54, - "learning_rate": 1.8849421105966689e-06, - "loss": 0.832, - "step": 21019 - }, - { - "epoch": 0.54, - "learning_rate": 1.8849292240986676e-06, - "loss": 0.9395, - "step": 21020 - }, - { - "epoch": 0.54, - "learning_rate": 1.8849163369231165e-06, - "loss": 0.9902, - "step": 21021 - }, - { - "epoch": 0.54, - "learning_rate": 1.884903449070026e-06, - "loss": 1.0234, - "step": 21022 - }, - { - "epoch": 0.54, - "learning_rate": 1.8848905605394052e-06, - "loss": 1.0732, - "step": 21023 - }, - { - "epoch": 0.54, - "learning_rate": 1.8848776713312646e-06, - "loss": 0.7969, - "step": 21024 - }, - { - "epoch": 0.54, - "learning_rate": 1.8848647814456139e-06, - "loss": 0.9258, - "step": 21025 - }, - { - "epoch": 0.54, - "learning_rate": 1.8848518908824626e-06, - "loss": 0.8838, - "step": 21026 - }, - { - "epoch": 0.54, - "learning_rate": 1.8848389996418213e-06, - "loss": 0.8394, - "step": 21027 - }, - { - "epoch": 0.54, - "learning_rate": 1.8848261077236993e-06, - "loss": 0.8623, - "step": 21028 - }, - { - "epoch": 0.54, - "learning_rate": 1.8848132151281067e-06, - "loss": 0.8896, - "step": 21029 - }, - { - "epoch": 0.54, - "learning_rate": 1.8848003218550532e-06, - "loss": 0.8027, - "step": 21030 - }, - { - "epoch": 0.54, - "learning_rate": 1.8847874279045488e-06, - "loss": 0.7314, - "step": 21031 - }, - { - "epoch": 0.54, - "learning_rate": 1.8847745332766035e-06, - "loss": 0.8301, - "step": 21032 - }, - { - "epoch": 0.54, - "learning_rate": 1.8847616379712268e-06, - "loss": 1.0654, - "step": 21033 - }, - { - "epoch": 0.54, - "learning_rate": 1.884748741988429e-06, - "loss": 1.0508, - "step": 21034 - }, - { - "epoch": 0.54, - "learning_rate": 1.8847358453282194e-06, - "loss": 0.7295, - "step": 21035 - }, - { - "epoch": 0.54, - "learning_rate": 1.8847229479906087e-06, - "loss": 0.9854, - "step": 21036 - }, - { - "epoch": 0.54, - "learning_rate": 1.8847100499756058e-06, - "loss": 0.7236, - "step": 21037 - }, - { - "epoch": 0.54, - "learning_rate": 1.8846971512832214e-06, - "loss": 0.752, - "step": 21038 - }, - { - "epoch": 0.54, - "learning_rate": 1.8846842519134654e-06, - "loss": 0.7656, - "step": 21039 - }, - { - "epoch": 0.54, - "learning_rate": 1.884671351866347e-06, - "loss": 0.8447, - "step": 21040 - }, - { - "epoch": 0.54, - "learning_rate": 1.8846584511418764e-06, - "loss": 1.0801, - "step": 21041 - }, - { - "epoch": 0.54, - "learning_rate": 1.8846455497400636e-06, - "loss": 1.2051, - "step": 21042 - }, - { - "epoch": 0.54, - "learning_rate": 1.8846326476609185e-06, - "loss": 0.9849, - "step": 21043 - }, - { - "epoch": 0.54, - "learning_rate": 1.8846197449044505e-06, - "loss": 0.9785, - "step": 21044 - }, - { - "epoch": 0.54, - "learning_rate": 1.8846068414706702e-06, - "loss": 0.9131, - "step": 21045 - }, - { - "epoch": 0.54, - "learning_rate": 1.884593937359587e-06, - "loss": 0.7949, - "step": 21046 - }, - { - "epoch": 0.54, - "learning_rate": 1.8845810325712108e-06, - "loss": 0.8076, - "step": 21047 - }, - { - "epoch": 0.54, - "learning_rate": 1.8845681271055516e-06, - "loss": 0.7598, - "step": 21048 - }, - { - "epoch": 0.54, - "learning_rate": 1.8845552209626192e-06, - "loss": 0.7979, - "step": 21049 - }, - { - "epoch": 0.54, - "learning_rate": 1.8845423141424236e-06, - "loss": 0.7935, - "step": 21050 - }, - { - "epoch": 0.54, - "learning_rate": 1.8845294066449746e-06, - "loss": 1.0078, - "step": 21051 - }, - { - "epoch": 0.54, - "learning_rate": 1.884516498470282e-06, - "loss": 0.8643, - "step": 21052 - }, - { - "epoch": 0.54, - "learning_rate": 1.8845035896183562e-06, - "loss": 0.7637, - "step": 21053 - }, - { - "epoch": 0.54, - "learning_rate": 1.8844906800892063e-06, - "loss": 0.9092, - "step": 21054 - }, - { - "epoch": 0.54, - "learning_rate": 1.8844777698828426e-06, - "loss": 0.8779, - "step": 21055 - }, - { - "epoch": 0.54, - "learning_rate": 1.8844648589992752e-06, - "loss": 0.9912, - "step": 21056 - }, - { - "epoch": 0.54, - "learning_rate": 1.8844519474385134e-06, - "loss": 0.6749, - "step": 21057 - }, - { - "epoch": 0.54, - "learning_rate": 1.8844390352005676e-06, - "loss": 0.8037, - "step": 21058 - }, - { - "epoch": 0.54, - "learning_rate": 1.8844261222854474e-06, - "loss": 0.8818, - "step": 21059 - }, - { - "epoch": 0.54, - "learning_rate": 1.884413208693163e-06, - "loss": 0.7979, - "step": 21060 - }, - { - "epoch": 0.54, - "learning_rate": 1.884400294423724e-06, - "loss": 0.8359, - "step": 21061 - }, - { - "epoch": 0.54, - "learning_rate": 1.8843873794771402e-06, - "loss": 1.0127, - "step": 21062 - }, - { - "epoch": 0.54, - "learning_rate": 1.8843744638534216e-06, - "loss": 0.7314, - "step": 21063 - }, - { - "epoch": 0.54, - "learning_rate": 1.8843615475525783e-06, - "loss": 0.7178, - "step": 21064 - }, - { - "epoch": 0.54, - "learning_rate": 1.8843486305746199e-06, - "loss": 0.9307, - "step": 21065 - }, - { - "epoch": 0.54, - "learning_rate": 1.8843357129195566e-06, - "loss": 0.9927, - "step": 21066 - }, - { - "epoch": 0.54, - "learning_rate": 1.884322794587398e-06, - "loss": 0.9941, - "step": 21067 - }, - { - "epoch": 0.54, - "learning_rate": 1.8843098755781538e-06, - "loss": 0.9766, - "step": 21068 - }, - { - "epoch": 0.54, - "learning_rate": 1.8842969558918346e-06, - "loss": 0.752, - "step": 21069 - }, - { - "epoch": 0.54, - "learning_rate": 1.88428403552845e-06, - "loss": 0.9131, - "step": 21070 - }, - { - "epoch": 0.54, - "learning_rate": 1.8842711144880093e-06, - "loss": 0.9287, - "step": 21071 - }, - { - "epoch": 0.54, - "learning_rate": 1.8842581927705233e-06, - "loss": 0.9102, - "step": 21072 - }, - { - "epoch": 0.54, - "learning_rate": 1.8842452703760013e-06, - "loss": 0.8438, - "step": 21073 - }, - { - "epoch": 0.54, - "learning_rate": 1.8842323473044533e-06, - "loss": 0.8467, - "step": 21074 - }, - { - "epoch": 0.54, - "learning_rate": 1.8842194235558892e-06, - "loss": 0.918, - "step": 21075 - }, - { - "epoch": 0.54, - "learning_rate": 1.884206499130319e-06, - "loss": 1.0273, - "step": 21076 - }, - { - "epoch": 0.54, - "learning_rate": 1.8841935740277525e-06, - "loss": 0.9189, - "step": 21077 - }, - { - "epoch": 0.54, - "learning_rate": 1.8841806482481997e-06, - "loss": 0.7627, - "step": 21078 - }, - { - "epoch": 0.54, - "learning_rate": 1.8841677217916705e-06, - "loss": 0.7686, - "step": 21079 - }, - { - "epoch": 0.54, - "learning_rate": 1.884154794658175e-06, - "loss": 1.0596, - "step": 21080 - }, - { - "epoch": 0.54, - "learning_rate": 1.884141866847722e-06, - "loss": 0.915, - "step": 21081 - }, - { - "epoch": 0.54, - "learning_rate": 1.884128938360323e-06, - "loss": 1.0566, - "step": 21082 - }, - { - "epoch": 0.54, - "learning_rate": 1.8841160091959867e-06, - "loss": 0.8633, - "step": 21083 - }, - { - "epoch": 0.54, - "learning_rate": 1.8841030793547238e-06, - "loss": 0.8538, - "step": 21084 - }, - { - "epoch": 0.54, - "learning_rate": 1.8840901488365434e-06, - "loss": 0.7842, - "step": 21085 - }, - { - "epoch": 0.54, - "learning_rate": 1.884077217641456e-06, - "loss": 0.9971, - "step": 21086 - }, - { - "epoch": 0.54, - "learning_rate": 1.8840642857694714e-06, - "loss": 0.7026, - "step": 21087 - }, - { - "epoch": 0.54, - "learning_rate": 1.8840513532205993e-06, - "loss": 0.8174, - "step": 21088 - }, - { - "epoch": 0.54, - "learning_rate": 1.8840384199948497e-06, - "loss": 0.876, - "step": 21089 - }, - { - "epoch": 0.54, - "learning_rate": 1.8840254860922328e-06, - "loss": 0.8394, - "step": 21090 - }, - { - "epoch": 0.54, - "learning_rate": 1.8840125515127582e-06, - "loss": 0.9209, - "step": 21091 - }, - { - "epoch": 0.54, - "learning_rate": 1.8839996162564356e-06, - "loss": 0.8555, - "step": 21092 - }, - { - "epoch": 0.54, - "learning_rate": 1.883986680323275e-06, - "loss": 0.7397, - "step": 21093 - }, - { - "epoch": 0.54, - "learning_rate": 1.883973743713287e-06, - "loss": 0.9023, - "step": 21094 - }, - { - "epoch": 0.54, - "learning_rate": 1.8839608064264807e-06, - "loss": 1.1543, - "step": 21095 - }, - { - "epoch": 0.54, - "learning_rate": 1.883947868462866e-06, - "loss": 0.915, - "step": 21096 - }, - { - "epoch": 0.54, - "learning_rate": 1.8839349298224534e-06, - "loss": 0.8193, - "step": 21097 - }, - { - "epoch": 0.54, - "learning_rate": 1.8839219905052524e-06, - "loss": 0.7959, - "step": 21098 - }, - { - "epoch": 0.54, - "learning_rate": 1.883909050511273e-06, - "loss": 0.7815, - "step": 21099 - }, - { - "epoch": 0.54, - "learning_rate": 1.8838961098405246e-06, - "loss": 0.7979, - "step": 21100 - }, - { - "epoch": 0.54, - "learning_rate": 1.883883168493018e-06, - "loss": 0.8965, - "step": 21101 - }, - { - "epoch": 0.54, - "learning_rate": 1.8838702264687627e-06, - "loss": 1.1367, - "step": 21102 - }, - { - "epoch": 0.54, - "learning_rate": 1.8838572837677687e-06, - "loss": 0.9658, - "step": 21103 - }, - { - "epoch": 0.54, - "learning_rate": 1.8838443403900457e-06, - "loss": 0.9531, - "step": 21104 - }, - { - "epoch": 0.54, - "learning_rate": 1.8838313963356036e-06, - "loss": 0.9434, - "step": 21105 - }, - { - "epoch": 0.54, - "learning_rate": 1.8838184516044526e-06, - "loss": 0.8818, - "step": 21106 - }, - { - "epoch": 0.54, - "learning_rate": 1.8838055061966024e-06, - "loss": 1.0, - "step": 21107 - }, - { - "epoch": 0.54, - "learning_rate": 1.883792560112063e-06, - "loss": 0.7998, - "step": 21108 - }, - { - "epoch": 0.54, - "learning_rate": 1.8837796133508444e-06, - "loss": 0.9238, - "step": 21109 - }, - { - "epoch": 0.54, - "learning_rate": 1.8837666659129562e-06, - "loss": 0.7949, - "step": 21110 - }, - { - "epoch": 0.54, - "learning_rate": 1.8837537177984086e-06, - "loss": 0.5693, - "step": 21111 - }, - { - "epoch": 0.54, - "learning_rate": 1.8837407690072113e-06, - "loss": 1.1689, - "step": 21112 - }, - { - "epoch": 0.54, - "learning_rate": 1.8837278195393744e-06, - "loss": 0.8662, - "step": 21113 - }, - { - "epoch": 0.54, - "learning_rate": 1.8837148693949078e-06, - "loss": 0.8623, - "step": 21114 - }, - { - "epoch": 0.54, - "learning_rate": 1.8837019185738212e-06, - "loss": 0.9971, - "step": 21115 - }, - { - "epoch": 0.54, - "learning_rate": 1.8836889670761247e-06, - "loss": 0.7468, - "step": 21116 - }, - { - "epoch": 0.54, - "learning_rate": 1.8836760149018284e-06, - "loss": 0.8843, - "step": 21117 - }, - { - "epoch": 0.54, - "learning_rate": 1.883663062050942e-06, - "loss": 0.8877, - "step": 21118 - }, - { - "epoch": 0.54, - "learning_rate": 1.8836501085234752e-06, - "loss": 0.9521, - "step": 21119 - }, - { - "epoch": 0.54, - "learning_rate": 1.8836371543194383e-06, - "loss": 1.0156, - "step": 21120 - }, - { - "epoch": 0.54, - "learning_rate": 1.8836241994388408e-06, - "loss": 0.636, - "step": 21121 - }, - { - "epoch": 0.54, - "learning_rate": 1.8836112438816932e-06, - "loss": 0.915, - "step": 21122 - }, - { - "epoch": 0.54, - "learning_rate": 1.883598287648005e-06, - "loss": 1.0479, - "step": 21123 - }, - { - "epoch": 0.54, - "learning_rate": 1.883585330737786e-06, - "loss": 0.959, - "step": 21124 - }, - { - "epoch": 0.54, - "learning_rate": 1.8835723731510466e-06, - "loss": 0.7803, - "step": 21125 - }, - { - "epoch": 0.54, - "learning_rate": 1.8835594148877964e-06, - "loss": 0.7927, - "step": 21126 - }, - { - "epoch": 0.54, - "learning_rate": 1.8835464559480453e-06, - "loss": 0.8447, - "step": 21127 - }, - { - "epoch": 0.54, - "learning_rate": 1.8835334963318036e-06, - "loss": 0.9121, - "step": 21128 - }, - { - "epoch": 0.54, - "learning_rate": 1.8835205360390806e-06, - "loss": 0.9932, - "step": 21129 - }, - { - "epoch": 0.54, - "learning_rate": 1.8835075750698867e-06, - "loss": 0.8633, - "step": 21130 - }, - { - "epoch": 0.54, - "learning_rate": 1.8834946134242315e-06, - "loss": 0.76, - "step": 21131 - }, - { - "epoch": 0.54, - "learning_rate": 1.8834816511021254e-06, - "loss": 0.876, - "step": 21132 - }, - { - "epoch": 0.54, - "learning_rate": 1.8834686881035777e-06, - "loss": 1.04, - "step": 21133 - }, - { - "epoch": 0.54, - "learning_rate": 1.8834557244285988e-06, - "loss": 0.7852, - "step": 21134 - }, - { - "epoch": 0.54, - "learning_rate": 1.8834427600771987e-06, - "loss": 1.0117, - "step": 21135 - }, - { - "epoch": 0.54, - "learning_rate": 1.8834297950493867e-06, - "loss": 0.9258, - "step": 21136 - }, - { - "epoch": 0.54, - "learning_rate": 1.8834168293451733e-06, - "loss": 0.8862, - "step": 21137 - }, - { - "epoch": 0.54, - "learning_rate": 1.8834038629645686e-06, - "loss": 0.7856, - "step": 21138 - }, - { - "epoch": 0.54, - "learning_rate": 1.8833908959075818e-06, - "loss": 0.8267, - "step": 21139 - }, - { - "epoch": 0.54, - "learning_rate": 1.883377928174223e-06, - "loss": 0.7354, - "step": 21140 - }, - { - "epoch": 0.54, - "learning_rate": 1.8833649597645028e-06, - "loss": 1.1777, - "step": 21141 - }, - { - "epoch": 0.54, - "learning_rate": 1.8833519906784306e-06, - "loss": 0.6221, - "step": 21142 - }, - { - "epoch": 0.54, - "learning_rate": 1.883339020916016e-06, - "loss": 0.9082, - "step": 21143 - }, - { - "epoch": 0.54, - "learning_rate": 1.8833260504772697e-06, - "loss": 0.7354, - "step": 21144 - }, - { - "epoch": 0.54, - "learning_rate": 1.8833130793622012e-06, - "loss": 0.8174, - "step": 21145 - }, - { - "epoch": 0.54, - "learning_rate": 1.8833001075708203e-06, - "loss": 0.7417, - "step": 21146 - }, - { - "epoch": 0.54, - "learning_rate": 1.8832871351031373e-06, - "loss": 0.9922, - "step": 21147 - }, - { - "epoch": 0.54, - "learning_rate": 1.8832741619591621e-06, - "loss": 0.9707, - "step": 21148 - }, - { - "epoch": 0.54, - "learning_rate": 1.8832611881389042e-06, - "loss": 0.8604, - "step": 21149 - }, - { - "epoch": 0.54, - "learning_rate": 1.883248213642374e-06, - "loss": 0.7148, - "step": 21150 - }, - { - "epoch": 0.54, - "learning_rate": 1.883235238469581e-06, - "loss": 0.9443, - "step": 21151 - }, - { - "epoch": 0.54, - "learning_rate": 1.8832222626205358e-06, - "loss": 0.7656, - "step": 21152 - }, - { - "epoch": 0.54, - "learning_rate": 1.8832092860952478e-06, - "loss": 0.9131, - "step": 21153 - }, - { - "epoch": 0.54, - "learning_rate": 1.8831963088937269e-06, - "loss": 0.8398, - "step": 21154 - }, - { - "epoch": 0.54, - "learning_rate": 1.8831833310159833e-06, - "loss": 0.8652, - "step": 21155 - }, - { - "epoch": 0.54, - "learning_rate": 1.8831703524620267e-06, - "loss": 0.7002, - "step": 21156 - }, - { - "epoch": 0.54, - "learning_rate": 1.8831573732318673e-06, - "loss": 0.9932, - "step": 21157 - }, - { - "epoch": 0.54, - "learning_rate": 1.883144393325515e-06, - "loss": 1.0244, - "step": 21158 - }, - { - "epoch": 0.54, - "learning_rate": 1.8831314127429794e-06, - "loss": 0.6333, - "step": 21159 - }, - { - "epoch": 0.54, - "learning_rate": 1.8831184314842708e-06, - "loss": 0.9214, - "step": 21160 - }, - { - "epoch": 0.54, - "learning_rate": 1.883105449549399e-06, - "loss": 0.8398, - "step": 21161 - }, - { - "epoch": 0.54, - "learning_rate": 1.883092466938374e-06, - "loss": 1.001, - "step": 21162 - }, - { - "epoch": 0.54, - "learning_rate": 1.8830794836512055e-06, - "loss": 0.9951, - "step": 21163 - }, - { - "epoch": 0.54, - "learning_rate": 1.883066499687904e-06, - "loss": 0.8315, - "step": 21164 - }, - { - "epoch": 0.54, - "learning_rate": 1.8830535150484787e-06, - "loss": 0.9131, - "step": 21165 - }, - { - "epoch": 0.54, - "learning_rate": 1.8830405297329403e-06, - "loss": 0.9883, - "step": 21166 - }, - { - "epoch": 0.54, - "learning_rate": 1.8830275437412983e-06, - "loss": 0.8174, - "step": 21167 - }, - { - "epoch": 0.54, - "learning_rate": 1.8830145570735625e-06, - "loss": 0.9629, - "step": 21168 - }, - { - "epoch": 0.54, - "learning_rate": 1.8830015697297435e-06, - "loss": 0.8877, - "step": 21169 - }, - { - "epoch": 0.54, - "learning_rate": 1.8829885817098502e-06, - "loss": 0.7832, - "step": 21170 - }, - { - "epoch": 0.54, - "learning_rate": 1.8829755930138936e-06, - "loss": 0.8887, - "step": 21171 - }, - { - "epoch": 0.54, - "learning_rate": 1.882962603641883e-06, - "loss": 0.6777, - "step": 21172 - }, - { - "epoch": 0.54, - "learning_rate": 1.8829496135938286e-06, - "loss": 0.9717, - "step": 21173 - }, - { - "epoch": 0.54, - "learning_rate": 1.88293662286974e-06, - "loss": 0.874, - "step": 21174 - }, - { - "epoch": 0.54, - "learning_rate": 1.882923631469628e-06, - "loss": 0.915, - "step": 21175 - }, - { - "epoch": 0.54, - "learning_rate": 1.8829106393935014e-06, - "loss": 0.8799, - "step": 21176 - }, - { - "epoch": 0.54, - "learning_rate": 1.8828976466413712e-06, - "loss": 0.8906, - "step": 21177 - }, - { - "epoch": 0.54, - "learning_rate": 1.8828846532132464e-06, - "loss": 0.9678, - "step": 21178 - }, - { - "epoch": 0.54, - "learning_rate": 1.8828716591091377e-06, - "loss": 1.0889, - "step": 21179 - }, - { - "epoch": 0.54, - "learning_rate": 1.8828586643290547e-06, - "loss": 0.9092, - "step": 21180 - }, - { - "epoch": 0.54, - "learning_rate": 1.8828456688730075e-06, - "loss": 0.8906, - "step": 21181 - }, - { - "epoch": 0.54, - "learning_rate": 1.8828326727410057e-06, - "loss": 0.8418, - "step": 21182 - }, - { - "epoch": 0.54, - "learning_rate": 1.8828196759330596e-06, - "loss": 0.8037, - "step": 21183 - }, - { - "epoch": 0.54, - "learning_rate": 1.8828066784491793e-06, - "loss": 0.54, - "step": 21184 - }, - { - "epoch": 0.54, - "learning_rate": 1.8827936802893746e-06, - "loss": 0.8574, - "step": 21185 - }, - { - "epoch": 0.54, - "learning_rate": 1.882780681453655e-06, - "loss": 0.9678, - "step": 21186 - }, - { - "epoch": 0.54, - "learning_rate": 1.882767681942031e-06, - "loss": 1.0215, - "step": 21187 - }, - { - "epoch": 0.54, - "learning_rate": 1.8827546817545124e-06, - "loss": 1.0332, - "step": 21188 - }, - { - "epoch": 0.54, - "learning_rate": 1.882741680891109e-06, - "loss": 1.1895, - "step": 21189 - }, - { - "epoch": 0.54, - "learning_rate": 1.8827286793518312e-06, - "loss": 0.9512, - "step": 21190 - }, - { - "epoch": 0.54, - "learning_rate": 1.8827156771366882e-06, - "loss": 0.8838, - "step": 21191 - }, - { - "epoch": 0.54, - "learning_rate": 1.8827026742456907e-06, - "loss": 0.8721, - "step": 21192 - }, - { - "epoch": 0.54, - "learning_rate": 1.8826896706788482e-06, - "loss": 0.8081, - "step": 21193 - }, - { - "epoch": 0.54, - "learning_rate": 1.882676666436171e-06, - "loss": 1.1143, - "step": 21194 - }, - { - "epoch": 0.54, - "learning_rate": 1.8826636615176686e-06, - "loss": 1.0342, - "step": 21195 - }, - { - "epoch": 0.54, - "learning_rate": 1.8826506559233515e-06, - "loss": 0.7495, - "step": 21196 - }, - { - "epoch": 0.54, - "learning_rate": 1.8826376496532293e-06, - "loss": 0.6631, - "step": 21197 - }, - { - "epoch": 0.54, - "learning_rate": 1.882624642707312e-06, - "loss": 0.9023, - "step": 21198 - }, - { - "epoch": 0.54, - "learning_rate": 1.8826116350856094e-06, - "loss": 0.7153, - "step": 21199 - }, - { - "epoch": 0.54, - "learning_rate": 1.8825986267881318e-06, - "loss": 0.8184, - "step": 21200 - }, - { - "epoch": 0.54, - "learning_rate": 1.8825856178148891e-06, - "loss": 0.7197, - "step": 21201 - }, - { - "epoch": 0.54, - "learning_rate": 1.8825726081658911e-06, - "loss": 0.7654, - "step": 21202 - }, - { - "epoch": 0.54, - "learning_rate": 1.8825595978411476e-06, - "loss": 0.9053, - "step": 21203 - }, - { - "epoch": 0.54, - "learning_rate": 1.8825465868406694e-06, - "loss": 0.9375, - "step": 21204 - }, - { - "epoch": 0.54, - "learning_rate": 1.8825335751644653e-06, - "loss": 0.7271, - "step": 21205 - }, - { - "epoch": 0.54, - "learning_rate": 1.8825205628125462e-06, - "loss": 0.8633, - "step": 21206 - }, - { - "epoch": 0.54, - "learning_rate": 1.8825075497849214e-06, - "loss": 0.6221, - "step": 21207 - }, - { - "epoch": 0.54, - "learning_rate": 1.882494536081601e-06, - "loss": 0.9824, - "step": 21208 - }, - { - "epoch": 0.54, - "learning_rate": 1.8824815217025956e-06, - "loss": 1.0039, - "step": 21209 - }, - { - "epoch": 0.54, - "learning_rate": 1.8824685066479144e-06, - "loss": 1.0137, - "step": 21210 - }, - { - "epoch": 0.54, - "learning_rate": 1.8824554909175676e-06, - "loss": 0.8857, - "step": 21211 - }, - { - "epoch": 0.54, - "learning_rate": 1.8824424745115652e-06, - "loss": 0.7197, - "step": 21212 - }, - { - "epoch": 0.54, - "learning_rate": 1.8824294574299175e-06, - "loss": 0.916, - "step": 21213 - }, - { - "epoch": 0.54, - "learning_rate": 1.882416439672634e-06, - "loss": 0.9736, - "step": 21214 - }, - { - "epoch": 0.54, - "learning_rate": 1.8824034212397245e-06, - "loss": 0.7915, - "step": 21215 - }, - { - "epoch": 0.54, - "learning_rate": 1.8823904021311996e-06, - "loss": 0.8779, - "step": 21216 - }, - { - "epoch": 0.54, - "learning_rate": 1.8823773823470689e-06, - "loss": 0.7332, - "step": 21217 - }, - { - "epoch": 0.54, - "learning_rate": 1.8823643618873422e-06, - "loss": 0.8516, - "step": 21218 - }, - { - "epoch": 0.54, - "learning_rate": 1.88235134075203e-06, - "loss": 0.918, - "step": 21219 - }, - { - "epoch": 0.54, - "learning_rate": 1.8823383189411417e-06, - "loss": 0.7891, - "step": 21220 - }, - { - "epoch": 0.54, - "learning_rate": 1.8823252964546875e-06, - "loss": 1.0625, - "step": 21221 - }, - { - "epoch": 0.54, - "learning_rate": 1.8823122732926775e-06, - "loss": 0.7461, - "step": 21222 - }, - { - "epoch": 0.54, - "learning_rate": 1.8822992494551215e-06, - "loss": 0.7715, - "step": 21223 - }, - { - "epoch": 0.54, - "learning_rate": 1.8822862249420296e-06, - "loss": 0.7295, - "step": 21224 - }, - { - "epoch": 0.54, - "learning_rate": 1.8822731997534115e-06, - "loss": 1.0518, - "step": 21225 - }, - { - "epoch": 0.54, - "learning_rate": 1.8822601738892777e-06, - "loss": 0.8721, - "step": 21226 - }, - { - "epoch": 0.54, - "learning_rate": 1.8822471473496378e-06, - "loss": 0.8906, - "step": 21227 - }, - { - "epoch": 0.54, - "learning_rate": 1.8822341201345015e-06, - "loss": 0.957, - "step": 21228 - }, - { - "epoch": 0.54, - "learning_rate": 1.8822210922438794e-06, - "loss": 1.0156, - "step": 21229 - }, - { - "epoch": 0.54, - "learning_rate": 1.882208063677781e-06, - "loss": 0.7754, - "step": 21230 - }, - { - "epoch": 0.54, - "learning_rate": 1.8821950344362168e-06, - "loss": 0.79, - "step": 21231 - }, - { - "epoch": 0.54, - "learning_rate": 1.8821820045191964e-06, - "loss": 0.9668, - "step": 21232 - }, - { - "epoch": 0.54, - "learning_rate": 1.8821689739267294e-06, - "loss": 0.8369, - "step": 21233 - }, - { - "epoch": 0.54, - "learning_rate": 1.8821559426588265e-06, - "loss": 1.0752, - "step": 21234 - }, - { - "epoch": 0.54, - "learning_rate": 1.8821429107154972e-06, - "loss": 0.9844, - "step": 21235 - }, - { - "epoch": 0.54, - "learning_rate": 1.8821298780967516e-06, - "loss": 0.9678, - "step": 21236 - }, - { - "epoch": 0.54, - "learning_rate": 1.8821168448025998e-06, - "loss": 0.9893, - "step": 21237 - }, - { - "epoch": 0.54, - "learning_rate": 1.8821038108330516e-06, - "loss": 0.6631, - "step": 21238 - }, - { - "epoch": 0.54, - "learning_rate": 1.882090776188117e-06, - "loss": 0.7195, - "step": 21239 - }, - { - "epoch": 0.54, - "learning_rate": 1.8820777408678063e-06, - "loss": 0.8799, - "step": 21240 - }, - { - "epoch": 0.54, - "learning_rate": 1.8820647048721293e-06, - "loss": 0.708, - "step": 21241 - }, - { - "epoch": 0.54, - "learning_rate": 1.8820516682010953e-06, - "loss": 0.7676, - "step": 21242 - }, - { - "epoch": 0.54, - "learning_rate": 1.8820386308547156e-06, - "loss": 1.0459, - "step": 21243 - }, - { - "epoch": 0.54, - "learning_rate": 1.8820255928329991e-06, - "loss": 0.8633, - "step": 21244 - }, - { - "epoch": 0.54, - "learning_rate": 1.8820125541359564e-06, - "loss": 0.71, - "step": 21245 - }, - { - "epoch": 0.54, - "learning_rate": 1.881999514763597e-06, - "loss": 1.041, - "step": 21246 - }, - { - "epoch": 0.54, - "learning_rate": 1.8819864747159313e-06, - "loss": 0.7725, - "step": 21247 - }, - { - "epoch": 0.54, - "learning_rate": 1.8819734339929691e-06, - "loss": 0.8613, - "step": 21248 - }, - { - "epoch": 0.54, - "learning_rate": 1.8819603925947205e-06, - "loss": 0.8301, - "step": 21249 - }, - { - "epoch": 0.54, - "learning_rate": 1.8819473505211952e-06, - "loss": 0.7129, - "step": 21250 - }, - { - "epoch": 0.54, - "learning_rate": 1.8819343077724032e-06, - "loss": 0.9287, - "step": 21251 - }, - { - "epoch": 0.54, - "learning_rate": 1.8819212643483548e-06, - "loss": 0.8062, - "step": 21252 - }, - { - "epoch": 0.54, - "learning_rate": 1.88190822024906e-06, - "loss": 0.8728, - "step": 21253 - }, - { - "epoch": 0.54, - "learning_rate": 1.8818951754745287e-06, - "loss": 0.9238, - "step": 21254 - }, - { - "epoch": 0.54, - "learning_rate": 1.8818821300247705e-06, - "loss": 0.7461, - "step": 21255 - }, - { - "epoch": 0.54, - "learning_rate": 1.881869083899796e-06, - "loss": 0.8564, - "step": 21256 - }, - { - "epoch": 0.54, - "learning_rate": 1.8818560370996147e-06, - "loss": 0.9033, - "step": 21257 - }, - { - "epoch": 0.54, - "learning_rate": 1.8818429896242367e-06, - "loss": 0.8066, - "step": 21258 - }, - { - "epoch": 0.54, - "learning_rate": 1.881829941473672e-06, - "loss": 0.7114, - "step": 21259 - }, - { - "epoch": 0.54, - "learning_rate": 1.881816892647931e-06, - "loss": 0.5854, - "step": 21260 - }, - { - "epoch": 0.54, - "learning_rate": 1.8818038431470233e-06, - "loss": 1.0107, - "step": 21261 - }, - { - "epoch": 0.54, - "learning_rate": 1.8817907929709587e-06, - "loss": 0.7344, - "step": 21262 - }, - { - "epoch": 0.54, - "learning_rate": 1.8817777421197477e-06, - "loss": 0.7275, - "step": 21263 - }, - { - "epoch": 0.55, - "learning_rate": 1.8817646905933997e-06, - "loss": 0.8994, - "step": 21264 - }, - { - "epoch": 0.55, - "learning_rate": 1.8817516383919254e-06, - "loss": 0.8545, - "step": 21265 - }, - { - "epoch": 0.55, - "learning_rate": 1.8817385855153342e-06, - "loss": 0.9424, - "step": 21266 - }, - { - "epoch": 0.55, - "learning_rate": 1.8817255319636364e-06, - "loss": 0.7998, - "step": 21267 - }, - { - "epoch": 0.55, - "learning_rate": 1.8817124777368418e-06, - "loss": 0.9648, - "step": 21268 - }, - { - "epoch": 0.55, - "learning_rate": 1.8816994228349605e-06, - "loss": 0.9688, - "step": 21269 - }, - { - "epoch": 0.55, - "learning_rate": 1.8816863672580025e-06, - "loss": 1.291, - "step": 21270 - }, - { - "epoch": 0.55, - "learning_rate": 1.881673311005978e-06, - "loss": 0.7075, - "step": 21271 - }, - { - "epoch": 0.55, - "learning_rate": 1.8816602540788966e-06, - "loss": 0.9258, - "step": 21272 - }, - { - "epoch": 0.55, - "learning_rate": 1.8816471964767684e-06, - "loss": 0.8896, - "step": 21273 - }, - { - "epoch": 0.55, - "learning_rate": 1.8816341381996036e-06, - "loss": 0.9502, - "step": 21274 - }, - { - "epoch": 0.55, - "learning_rate": 1.881621079247412e-06, - "loss": 0.9492, - "step": 21275 - }, - { - "epoch": 0.55, - "learning_rate": 1.881608019620204e-06, - "loss": 1.0664, - "step": 21276 - }, - { - "epoch": 0.55, - "learning_rate": 1.8815949593179888e-06, - "loss": 0.9248, - "step": 21277 - }, - { - "epoch": 0.55, - "learning_rate": 1.881581898340777e-06, - "loss": 0.8059, - "step": 21278 - }, - { - "epoch": 0.55, - "learning_rate": 1.8815688366885786e-06, - "loss": 0.8496, - "step": 21279 - }, - { - "epoch": 0.55, - "learning_rate": 1.8815557743614035e-06, - "loss": 0.8105, - "step": 21280 - }, - { - "epoch": 0.55, - "learning_rate": 1.8815427113592618e-06, - "loss": 0.7021, - "step": 21281 - }, - { - "epoch": 0.55, - "learning_rate": 1.8815296476821628e-06, - "loss": 0.7588, - "step": 21282 - }, - { - "epoch": 0.55, - "learning_rate": 1.8815165833301178e-06, - "loss": 0.6934, - "step": 21283 - }, - { - "epoch": 0.55, - "learning_rate": 1.881503518303136e-06, - "loss": 0.749, - "step": 21284 - }, - { - "epoch": 0.55, - "learning_rate": 1.881490452601227e-06, - "loss": 0.8242, - "step": 21285 - }, - { - "epoch": 0.55, - "learning_rate": 1.8814773862244015e-06, - "loss": 0.7192, - "step": 21286 - }, - { - "epoch": 0.55, - "learning_rate": 1.8814643191726693e-06, - "loss": 0.8735, - "step": 21287 - }, - { - "epoch": 0.55, - "learning_rate": 1.8814512514460405e-06, - "loss": 1.0781, - "step": 21288 - }, - { - "epoch": 0.55, - "learning_rate": 1.881438183044525e-06, - "loss": 0.7952, - "step": 21289 - }, - { - "epoch": 0.55, - "learning_rate": 1.8814251139681327e-06, - "loss": 0.9058, - "step": 21290 - }, - { - "epoch": 0.55, - "learning_rate": 1.8814120442168736e-06, - "loss": 0.8643, - "step": 21291 - }, - { - "epoch": 0.55, - "learning_rate": 1.8813989737907583e-06, - "loss": 1.0264, - "step": 21292 - }, - { - "epoch": 0.55, - "learning_rate": 1.881385902689796e-06, - "loss": 0.855, - "step": 21293 - }, - { - "epoch": 0.55, - "learning_rate": 1.881372830913997e-06, - "loss": 0.8154, - "step": 21294 - }, - { - "epoch": 0.55, - "learning_rate": 1.8813597584633715e-06, - "loss": 0.6113, - "step": 21295 - }, - { - "epoch": 0.55, - "learning_rate": 1.8813466853379294e-06, - "loss": 0.9414, - "step": 21296 - }, - { - "epoch": 0.55, - "learning_rate": 1.8813336115376806e-06, - "loss": 0.8511, - "step": 21297 - }, - { - "epoch": 0.55, - "learning_rate": 1.881320537062635e-06, - "loss": 0.9844, - "step": 21298 - }, - { - "epoch": 0.55, - "learning_rate": 1.881307461912803e-06, - "loss": 0.8271, - "step": 21299 - }, - { - "epoch": 0.55, - "learning_rate": 1.8812943860881942e-06, - "loss": 0.7499, - "step": 21300 - }, - { - "epoch": 0.55, - "learning_rate": 1.8812813095888191e-06, - "loss": 0.8428, - "step": 21301 - }, - { - "epoch": 0.55, - "learning_rate": 1.8812682324146873e-06, - "loss": 1.0186, - "step": 21302 - }, - { - "epoch": 0.55, - "learning_rate": 1.881255154565809e-06, - "loss": 0.6311, - "step": 21303 - }, - { - "epoch": 0.55, - "learning_rate": 1.8812420760421941e-06, - "loss": 0.7451, - "step": 21304 - }, - { - "epoch": 0.55, - "learning_rate": 1.8812289968438524e-06, - "loss": 0.752, - "step": 21305 - }, - { - "epoch": 0.55, - "learning_rate": 1.8812159169707944e-06, - "loss": 0.7549, - "step": 21306 - }, - { - "epoch": 0.55, - "learning_rate": 1.8812028364230299e-06, - "loss": 0.9658, - "step": 21307 - }, - { - "epoch": 0.55, - "learning_rate": 1.8811897552005688e-06, - "loss": 0.8291, - "step": 21308 - }, - { - "epoch": 0.55, - "learning_rate": 1.8811766733034212e-06, - "loss": 0.6006, - "step": 21309 - }, - { - "epoch": 0.55, - "learning_rate": 1.8811635907315975e-06, - "loss": 0.8105, - "step": 21310 - }, - { - "epoch": 0.55, - "learning_rate": 1.881150507485107e-06, - "loss": 0.9375, - "step": 21311 - }, - { - "epoch": 0.55, - "learning_rate": 1.8811374235639602e-06, - "loss": 0.8169, - "step": 21312 - }, - { - "epoch": 0.55, - "learning_rate": 1.881124338968167e-06, - "loss": 1.0898, - "step": 21313 - }, - { - "epoch": 0.55, - "learning_rate": 1.8811112536977376e-06, - "loss": 0.7861, - "step": 21314 - }, - { - "epoch": 0.55, - "learning_rate": 1.8810981677526816e-06, - "loss": 0.959, - "step": 21315 - }, - { - "epoch": 0.55, - "learning_rate": 1.8810850811330092e-06, - "loss": 0.9736, - "step": 21316 - }, - { - "epoch": 0.55, - "learning_rate": 1.8810719938387306e-06, - "loss": 0.8281, - "step": 21317 - }, - { - "epoch": 0.55, - "learning_rate": 1.8810589058698554e-06, - "loss": 0.8926, - "step": 21318 - }, - { - "epoch": 0.55, - "learning_rate": 1.8810458172263943e-06, - "loss": 0.8545, - "step": 21319 - }, - { - "epoch": 0.55, - "learning_rate": 1.8810327279083568e-06, - "loss": 0.6904, - "step": 21320 - }, - { - "epoch": 0.55, - "learning_rate": 1.8810196379157528e-06, - "loss": 0.7324, - "step": 21321 - }, - { - "epoch": 0.55, - "learning_rate": 1.8810065472485927e-06, - "loss": 0.8677, - "step": 21322 - }, - { - "epoch": 0.55, - "learning_rate": 1.8809934559068866e-06, - "loss": 0.8608, - "step": 21323 - }, - { - "epoch": 0.55, - "learning_rate": 1.8809803638906442e-06, - "loss": 0.9404, - "step": 21324 - }, - { - "epoch": 0.55, - "learning_rate": 1.8809672711998757e-06, - "loss": 0.8896, - "step": 21325 - }, - { - "epoch": 0.55, - "learning_rate": 1.880954177834591e-06, - "loss": 1.0156, - "step": 21326 - }, - { - "epoch": 0.55, - "learning_rate": 1.8809410837948001e-06, - "loss": 1.001, - "step": 21327 - }, - { - "epoch": 0.55, - "learning_rate": 1.8809279890805133e-06, - "loss": 0.9424, - "step": 21328 - }, - { - "epoch": 0.55, - "learning_rate": 1.8809148936917402e-06, - "loss": 0.9746, - "step": 21329 - }, - { - "epoch": 0.55, - "learning_rate": 1.8809017976284914e-06, - "loss": 1.1758, - "step": 21330 - }, - { - "epoch": 0.55, - "learning_rate": 1.8808887008907766e-06, - "loss": 0.9336, - "step": 21331 - }, - { - "epoch": 0.55, - "learning_rate": 1.8808756034786054e-06, - "loss": 0.8496, - "step": 21332 - }, - { - "epoch": 0.55, - "learning_rate": 1.8808625053919887e-06, - "loss": 1.1094, - "step": 21333 - }, - { - "epoch": 0.55, - "learning_rate": 1.8808494066309357e-06, - "loss": 0.6802, - "step": 21334 - }, - { - "epoch": 0.55, - "learning_rate": 1.880836307195457e-06, - "loss": 0.8701, - "step": 21335 - }, - { - "epoch": 0.55, - "learning_rate": 1.8808232070855625e-06, - "loss": 0.998, - "step": 21336 - }, - { - "epoch": 0.55, - "learning_rate": 1.8808101063012622e-06, - "loss": 1.0059, - "step": 21337 - }, - { - "epoch": 0.55, - "learning_rate": 1.8807970048425661e-06, - "loss": 0.8135, - "step": 21338 - }, - { - "epoch": 0.55, - "learning_rate": 1.880783902709484e-06, - "loss": 0.7734, - "step": 21339 - }, - { - "epoch": 0.55, - "learning_rate": 1.8807707999020263e-06, - "loss": 1.001, - "step": 21340 - }, - { - "epoch": 0.55, - "learning_rate": 1.880757696420203e-06, - "loss": 0.793, - "step": 21341 - }, - { - "epoch": 0.55, - "learning_rate": 1.880744592264024e-06, - "loss": 0.7891, - "step": 21342 - }, - { - "epoch": 0.55, - "learning_rate": 1.8807314874334992e-06, - "loss": 0.5264, - "step": 21343 - }, - { - "epoch": 0.55, - "learning_rate": 1.880718381928639e-06, - "loss": 0.998, - "step": 21344 - }, - { - "epoch": 0.55, - "learning_rate": 1.880705275749453e-06, - "loss": 1.1162, - "step": 21345 - }, - { - "epoch": 0.55, - "learning_rate": 1.8806921688959517e-06, - "loss": 0.9297, - "step": 21346 - }, - { - "epoch": 0.55, - "learning_rate": 1.8806790613681449e-06, - "loss": 1.0127, - "step": 21347 - }, - { - "epoch": 0.55, - "learning_rate": 1.8806659531660425e-06, - "loss": 0.8242, - "step": 21348 - }, - { - "epoch": 0.55, - "learning_rate": 1.8806528442896544e-06, - "loss": 0.9546, - "step": 21349 - }, - { - "epoch": 0.55, - "learning_rate": 1.8806397347389913e-06, - "loss": 0.8506, - "step": 21350 - }, - { - "epoch": 0.55, - "learning_rate": 1.8806266245140629e-06, - "loss": 0.8506, - "step": 21351 - }, - { - "epoch": 0.55, - "learning_rate": 1.880613513614879e-06, - "loss": 0.8809, - "step": 21352 - }, - { - "epoch": 0.55, - "learning_rate": 1.88060040204145e-06, - "loss": 1.0859, - "step": 21353 - }, - { - "epoch": 0.55, - "learning_rate": 1.8805872897937855e-06, - "loss": 0.8359, - "step": 21354 - }, - { - "epoch": 0.55, - "learning_rate": 1.880574176871896e-06, - "loss": 0.7192, - "step": 21355 - }, - { - "epoch": 0.55, - "learning_rate": 1.8805610632757913e-06, - "loss": 0.6909, - "step": 21356 - }, - { - "epoch": 0.55, - "learning_rate": 1.8805479490054816e-06, - "loss": 0.7988, - "step": 21357 - }, - { - "epoch": 0.55, - "learning_rate": 1.8805348340609766e-06, - "loss": 1.0713, - "step": 21358 - }, - { - "epoch": 0.55, - "learning_rate": 1.8805217184422868e-06, - "loss": 0.8564, - "step": 21359 - }, - { - "epoch": 0.55, - "learning_rate": 1.8805086021494216e-06, - "loss": 0.9004, - "step": 21360 - }, - { - "epoch": 0.55, - "learning_rate": 1.8804954851823919e-06, - "loss": 0.8369, - "step": 21361 - }, - { - "epoch": 0.55, - "learning_rate": 1.8804823675412072e-06, - "loss": 0.7988, - "step": 21362 - }, - { - "epoch": 0.55, - "learning_rate": 1.8804692492258776e-06, - "loss": 0.5842, - "step": 21363 - }, - { - "epoch": 0.55, - "learning_rate": 1.880456130236413e-06, - "loss": 0.8389, - "step": 21364 - }, - { - "epoch": 0.55, - "learning_rate": 1.880443010572824e-06, - "loss": 0.7324, - "step": 21365 - }, - { - "epoch": 0.55, - "learning_rate": 1.8804298902351199e-06, - "loss": 0.7881, - "step": 21366 - }, - { - "epoch": 0.55, - "learning_rate": 1.8804167692233113e-06, - "loss": 0.8672, - "step": 21367 - }, - { - "epoch": 0.55, - "learning_rate": 1.880403647537408e-06, - "loss": 0.8711, - "step": 21368 - }, - { - "epoch": 0.55, - "learning_rate": 1.88039052517742e-06, - "loss": 0.9824, - "step": 21369 - }, - { - "epoch": 0.55, - "learning_rate": 1.8803774021433576e-06, - "loss": 1.0771, - "step": 21370 - }, - { - "epoch": 0.55, - "learning_rate": 1.8803642784352308e-06, - "loss": 0.8682, - "step": 21371 - }, - { - "epoch": 0.55, - "learning_rate": 1.8803511540530495e-06, - "loss": 0.6193, - "step": 21372 - }, - { - "epoch": 0.55, - "learning_rate": 1.8803380289968236e-06, - "loss": 0.8193, - "step": 21373 - }, - { - "epoch": 0.55, - "learning_rate": 1.8803249032665636e-06, - "loss": 0.8848, - "step": 21374 - }, - { - "epoch": 0.55, - "learning_rate": 1.880311776862279e-06, - "loss": 0.4575, - "step": 21375 - }, - { - "epoch": 0.55, - "learning_rate": 1.8802986497839805e-06, - "loss": 0.7949, - "step": 21376 - }, - { - "epoch": 0.55, - "learning_rate": 1.8802855220316776e-06, - "loss": 0.791, - "step": 21377 - }, - { - "epoch": 0.55, - "learning_rate": 1.8802723936053805e-06, - "loss": 0.686, - "step": 21378 - }, - { - "epoch": 0.55, - "learning_rate": 1.8802592645050994e-06, - "loss": 0.9033, - "step": 21379 - }, - { - "epoch": 0.55, - "learning_rate": 1.8802461347308442e-06, - "loss": 0.5811, - "step": 21380 - }, - { - "epoch": 0.55, - "learning_rate": 1.8802330042826251e-06, - "loss": 1.0059, - "step": 21381 - }, - { - "epoch": 0.55, - "learning_rate": 1.8802198731604522e-06, - "loss": 0.7803, - "step": 21382 - }, - { - "epoch": 0.55, - "learning_rate": 1.880206741364335e-06, - "loss": 1.0781, - "step": 21383 - }, - { - "epoch": 0.55, - "learning_rate": 1.8801936088942842e-06, - "loss": 0.918, - "step": 21384 - }, - { - "epoch": 0.55, - "learning_rate": 1.8801804757503096e-06, - "loss": 0.8477, - "step": 21385 - }, - { - "epoch": 0.55, - "learning_rate": 1.8801673419324215e-06, - "loss": 0.791, - "step": 21386 - }, - { - "epoch": 0.55, - "learning_rate": 1.8801542074406295e-06, - "loss": 0.8496, - "step": 21387 - }, - { - "epoch": 0.55, - "learning_rate": 1.880141072274944e-06, - "loss": 0.8975, - "step": 21388 - }, - { - "epoch": 0.55, - "learning_rate": 1.8801279364353748e-06, - "loss": 0.8037, - "step": 21389 - }, - { - "epoch": 0.55, - "learning_rate": 1.8801147999219323e-06, - "loss": 0.8867, - "step": 21390 - }, - { - "epoch": 0.55, - "learning_rate": 1.8801016627346263e-06, - "loss": 0.7461, - "step": 21391 - }, - { - "epoch": 0.55, - "learning_rate": 1.8800885248734668e-06, - "loss": 0.7891, - "step": 21392 - }, - { - "epoch": 0.55, - "learning_rate": 1.8800753863384643e-06, - "loss": 0.8872, - "step": 21393 - }, - { - "epoch": 0.55, - "learning_rate": 1.8800622471296282e-06, - "loss": 0.875, - "step": 21394 - }, - { - "epoch": 0.55, - "learning_rate": 1.8800491072469691e-06, - "loss": 0.9258, - "step": 21395 - }, - { - "epoch": 0.55, - "learning_rate": 1.8800359666904968e-06, - "loss": 0.9355, - "step": 21396 - }, - { - "epoch": 0.55, - "learning_rate": 1.8800228254602213e-06, - "loss": 0.834, - "step": 21397 - }, - { - "epoch": 0.55, - "learning_rate": 1.880009683556153e-06, - "loss": 0.5356, - "step": 21398 - }, - { - "epoch": 0.55, - "learning_rate": 1.8799965409783016e-06, - "loss": 1.1377, - "step": 21399 - }, - { - "epoch": 0.55, - "learning_rate": 1.8799833977266774e-06, - "loss": 0.8245, - "step": 21400 - }, - { - "epoch": 0.55, - "learning_rate": 1.8799702538012902e-06, - "loss": 1.0557, - "step": 21401 - }, - { - "epoch": 0.55, - "learning_rate": 1.8799571092021505e-06, - "loss": 0.6626, - "step": 21402 - }, - { - "epoch": 0.55, - "learning_rate": 1.8799439639292681e-06, - "loss": 0.9844, - "step": 21403 - }, - { - "epoch": 0.55, - "learning_rate": 1.879930817982653e-06, - "loss": 0.5867, - "step": 21404 - }, - { - "epoch": 0.55, - "learning_rate": 1.879917671362315e-06, - "loss": 0.6943, - "step": 21405 - }, - { - "epoch": 0.55, - "learning_rate": 1.879904524068265e-06, - "loss": 0.813, - "step": 21406 - }, - { - "epoch": 0.55, - "learning_rate": 1.8798913761005122e-06, - "loss": 0.7407, - "step": 21407 - }, - { - "epoch": 0.55, - "learning_rate": 1.8798782274590672e-06, - "loss": 0.7725, - "step": 21408 - }, - { - "epoch": 0.55, - "learning_rate": 1.8798650781439399e-06, - "loss": 0.6289, - "step": 21409 - }, - { - "epoch": 0.55, - "learning_rate": 1.8798519281551403e-06, - "loss": 0.7217, - "step": 21410 - }, - { - "epoch": 0.55, - "learning_rate": 1.8798387774926786e-06, - "loss": 0.9385, - "step": 21411 - }, - { - "epoch": 0.55, - "learning_rate": 1.879825626156565e-06, - "loss": 1.0762, - "step": 21412 - }, - { - "epoch": 0.55, - "learning_rate": 1.8798124741468092e-06, - "loss": 0.8569, - "step": 21413 - }, - { - "epoch": 0.55, - "learning_rate": 1.8797993214634212e-06, - "loss": 0.7627, - "step": 21414 - }, - { - "epoch": 0.55, - "learning_rate": 1.8797861681064115e-06, - "loss": 0.8789, - "step": 21415 - }, - { - "epoch": 0.55, - "learning_rate": 1.8797730140757899e-06, - "loss": 0.9854, - "step": 21416 - }, - { - "epoch": 0.55, - "learning_rate": 1.8797598593715666e-06, - "loss": 0.6821, - "step": 21417 - }, - { - "epoch": 0.55, - "learning_rate": 1.879746703993752e-06, - "loss": 0.8674, - "step": 21418 - }, - { - "epoch": 0.55, - "learning_rate": 1.8797335479423553e-06, - "loss": 0.9248, - "step": 21419 - }, - { - "epoch": 0.55, - "learning_rate": 1.8797203912173871e-06, - "loss": 0.5591, - "step": 21420 - }, - { - "epoch": 0.55, - "learning_rate": 1.8797072338188577e-06, - "loss": 0.7734, - "step": 21421 - }, - { - "epoch": 0.55, - "learning_rate": 1.879694075746777e-06, - "loss": 0.9648, - "step": 21422 - }, - { - "epoch": 0.55, - "learning_rate": 1.879680917001155e-06, - "loss": 0.9634, - "step": 21423 - }, - { - "epoch": 0.55, - "learning_rate": 1.8796677575820014e-06, - "loss": 0.7656, - "step": 21424 - }, - { - "epoch": 0.55, - "learning_rate": 1.8796545974893268e-06, - "loss": 0.8936, - "step": 21425 - }, - { - "epoch": 0.55, - "learning_rate": 1.879641436723141e-06, - "loss": 0.835, - "step": 21426 - }, - { - "epoch": 0.55, - "learning_rate": 1.8796282752834544e-06, - "loss": 0.6777, - "step": 21427 - }, - { - "epoch": 0.55, - "learning_rate": 1.879615113170277e-06, - "loss": 1.0039, - "step": 21428 - }, - { - "epoch": 0.55, - "learning_rate": 1.8796019503836185e-06, - "loss": 0.7095, - "step": 21429 - }, - { - "epoch": 0.55, - "learning_rate": 1.8795887869234895e-06, - "loss": 0.689, - "step": 21430 - }, - { - "epoch": 0.55, - "learning_rate": 1.8795756227898996e-06, - "loss": 0.7251, - "step": 21431 - }, - { - "epoch": 0.55, - "learning_rate": 1.879562457982859e-06, - "loss": 0.9092, - "step": 21432 - }, - { - "epoch": 0.55, - "learning_rate": 1.8795492925023783e-06, - "loss": 0.75, - "step": 21433 - }, - { - "epoch": 0.55, - "learning_rate": 1.8795361263484665e-06, - "loss": 0.7646, - "step": 21434 - }, - { - "epoch": 0.55, - "learning_rate": 1.8795229595211346e-06, - "loss": 0.8682, - "step": 21435 - }, - { - "epoch": 0.55, - "learning_rate": 1.8795097920203926e-06, - "loss": 0.8774, - "step": 21436 - }, - { - "epoch": 0.55, - "learning_rate": 1.8794966238462502e-06, - "loss": 0.9775, - "step": 21437 - }, - { - "epoch": 0.55, - "learning_rate": 1.8794834549987178e-06, - "loss": 0.8594, - "step": 21438 - }, - { - "epoch": 0.55, - "learning_rate": 1.8794702854778052e-06, - "loss": 1.0537, - "step": 21439 - }, - { - "epoch": 0.55, - "learning_rate": 1.879457115283523e-06, - "loss": 0.8235, - "step": 21440 - }, - { - "epoch": 0.55, - "learning_rate": 1.8794439444158808e-06, - "loss": 1.0303, - "step": 21441 - }, - { - "epoch": 0.55, - "learning_rate": 1.8794307728748887e-06, - "loss": 0.8398, - "step": 21442 - }, - { - "epoch": 0.55, - "learning_rate": 1.8794176006605566e-06, - "loss": 1.1494, - "step": 21443 - }, - { - "epoch": 0.55, - "learning_rate": 1.8794044277728954e-06, - "loss": 0.874, - "step": 21444 - }, - { - "epoch": 0.55, - "learning_rate": 1.879391254211914e-06, - "loss": 0.7822, - "step": 21445 - }, - { - "epoch": 0.55, - "learning_rate": 1.879378079977624e-06, - "loss": 0.438, - "step": 21446 - }, - { - "epoch": 0.55, - "learning_rate": 1.8793649050700342e-06, - "loss": 1.1133, - "step": 21447 - }, - { - "epoch": 0.55, - "learning_rate": 1.879351729489155e-06, - "loss": 0.8042, - "step": 21448 - }, - { - "epoch": 0.55, - "learning_rate": 1.8793385532349967e-06, - "loss": 0.8579, - "step": 21449 - }, - { - "epoch": 0.55, - "learning_rate": 1.8793253763075694e-06, - "loss": 0.9844, - "step": 21450 - }, - { - "epoch": 0.55, - "learning_rate": 1.879312198706883e-06, - "loss": 0.9521, - "step": 21451 - }, - { - "epoch": 0.55, - "learning_rate": 1.8792990204329478e-06, - "loss": 0.73, - "step": 21452 - }, - { - "epoch": 0.55, - "learning_rate": 1.8792858414857738e-06, - "loss": 0.8652, - "step": 21453 - }, - { - "epoch": 0.55, - "learning_rate": 1.879272661865371e-06, - "loss": 1.0205, - "step": 21454 - }, - { - "epoch": 0.55, - "learning_rate": 1.8792594815717494e-06, - "loss": 0.8525, - "step": 21455 - }, - { - "epoch": 0.55, - "learning_rate": 1.8792463006049193e-06, - "loss": 0.8645, - "step": 21456 - }, - { - "epoch": 0.55, - "learning_rate": 1.8792331189648908e-06, - "loss": 0.8359, - "step": 21457 - }, - { - "epoch": 0.55, - "learning_rate": 1.879219936651674e-06, - "loss": 0.6123, - "step": 21458 - }, - { - "epoch": 0.55, - "learning_rate": 1.879206753665279e-06, - "loss": 0.9639, - "step": 21459 - }, - { - "epoch": 0.55, - "learning_rate": 1.8791935700057155e-06, - "loss": 0.9932, - "step": 21460 - }, - { - "epoch": 0.55, - "learning_rate": 1.8791803856729942e-06, - "loss": 0.5791, - "step": 21461 - }, - { - "epoch": 0.55, - "learning_rate": 1.8791672006671248e-06, - "loss": 0.7979, - "step": 21462 - }, - { - "epoch": 0.55, - "learning_rate": 1.8791540149881175e-06, - "loss": 0.8643, - "step": 21463 - }, - { - "epoch": 0.55, - "learning_rate": 1.8791408286359824e-06, - "loss": 0.9678, - "step": 21464 - }, - { - "epoch": 0.55, - "learning_rate": 1.8791276416107293e-06, - "loss": 0.7998, - "step": 21465 - }, - { - "epoch": 0.55, - "learning_rate": 1.879114453912369e-06, - "loss": 0.8164, - "step": 21466 - }, - { - "epoch": 0.55, - "learning_rate": 1.8791012655409112e-06, - "loss": 0.7817, - "step": 21467 - }, - { - "epoch": 0.55, - "learning_rate": 1.8790880764963656e-06, - "loss": 0.9619, - "step": 21468 - }, - { - "epoch": 0.55, - "learning_rate": 1.879074886778743e-06, - "loss": 0.8965, - "step": 21469 - }, - { - "epoch": 0.55, - "learning_rate": 1.879061696388053e-06, - "loss": 0.8955, - "step": 21470 - }, - { - "epoch": 0.55, - "learning_rate": 1.8790485053243058e-06, - "loss": 0.6982, - "step": 21471 - }, - { - "epoch": 0.55, - "learning_rate": 1.8790353135875118e-06, - "loss": 1.1104, - "step": 21472 - }, - { - "epoch": 0.55, - "learning_rate": 1.879022121177681e-06, - "loss": 0.6553, - "step": 21473 - }, - { - "epoch": 0.55, - "learning_rate": 1.8790089280948233e-06, - "loss": 0.9512, - "step": 21474 - }, - { - "epoch": 0.55, - "learning_rate": 1.8789957343389488e-06, - "loss": 0.9336, - "step": 21475 - }, - { - "epoch": 0.55, - "learning_rate": 1.8789825399100677e-06, - "loss": 0.9307, - "step": 21476 - }, - { - "epoch": 0.55, - "learning_rate": 1.87896934480819e-06, - "loss": 0.6567, - "step": 21477 - }, - { - "epoch": 0.55, - "learning_rate": 1.8789561490333259e-06, - "loss": 0.8276, - "step": 21478 - }, - { - "epoch": 0.55, - "learning_rate": 1.8789429525854853e-06, - "loss": 0.8105, - "step": 21479 - }, - { - "epoch": 0.55, - "learning_rate": 1.878929755464679e-06, - "loss": 0.9375, - "step": 21480 - }, - { - "epoch": 0.55, - "learning_rate": 1.8789165576709163e-06, - "loss": 1.0205, - "step": 21481 - }, - { - "epoch": 0.55, - "learning_rate": 1.8789033592042077e-06, - "loss": 0.6372, - "step": 21482 - }, - { - "epoch": 0.55, - "learning_rate": 1.878890160064563e-06, - "loss": 0.9277, - "step": 21483 - }, - { - "epoch": 0.55, - "learning_rate": 1.8788769602519927e-06, - "loss": 0.8145, - "step": 21484 - }, - { - "epoch": 0.55, - "learning_rate": 1.8788637597665069e-06, - "loss": 0.8643, - "step": 21485 - }, - { - "epoch": 0.55, - "learning_rate": 1.8788505586081152e-06, - "loss": 0.9663, - "step": 21486 - }, - { - "epoch": 0.55, - "learning_rate": 1.878837356776828e-06, - "loss": 0.9019, - "step": 21487 - }, - { - "epoch": 0.55, - "learning_rate": 1.8788241542726557e-06, - "loss": 0.6646, - "step": 21488 - }, - { - "epoch": 0.55, - "learning_rate": 1.8788109510956081e-06, - "loss": 1.0518, - "step": 21489 - }, - { - "epoch": 0.55, - "learning_rate": 1.8787977472456956e-06, - "loss": 0.8062, - "step": 21490 - }, - { - "epoch": 0.55, - "learning_rate": 1.8787845427229273e-06, - "loss": 0.7441, - "step": 21491 - }, - { - "epoch": 0.55, - "learning_rate": 1.8787713375273149e-06, - "loss": 0.832, - "step": 21492 - }, - { - "epoch": 0.55, - "learning_rate": 1.8787581316588673e-06, - "loss": 0.7427, - "step": 21493 - }, - { - "epoch": 0.55, - "learning_rate": 1.878744925117595e-06, - "loss": 0.9131, - "step": 21494 - }, - { - "epoch": 0.55, - "learning_rate": 1.8787317179035083e-06, - "loss": 0.9258, - "step": 21495 - }, - { - "epoch": 0.55, - "learning_rate": 1.878718510016617e-06, - "loss": 1.1328, - "step": 21496 - }, - { - "epoch": 0.55, - "learning_rate": 1.8787053014569315e-06, - "loss": 1.002, - "step": 21497 - }, - { - "epoch": 0.55, - "learning_rate": 1.8786920922244614e-06, - "loss": 0.8994, - "step": 21498 - }, - { - "epoch": 0.55, - "learning_rate": 1.8786788823192174e-06, - "loss": 0.7729, - "step": 21499 - }, - { - "epoch": 0.55, - "learning_rate": 1.8786656717412095e-06, - "loss": 1.1328, - "step": 21500 - }, - { - "epoch": 0.55, - "learning_rate": 1.8786524604904478e-06, - "loss": 0.9932, - "step": 21501 - }, - { - "epoch": 0.55, - "learning_rate": 1.8786392485669418e-06, - "loss": 0.8225, - "step": 21502 - }, - { - "epoch": 0.55, - "learning_rate": 1.8786260359707025e-06, - "loss": 0.8486, - "step": 21503 - }, - { - "epoch": 0.55, - "learning_rate": 1.8786128227017395e-06, - "loss": 0.6436, - "step": 21504 - }, - { - "epoch": 0.55, - "learning_rate": 1.8785996087600632e-06, - "loss": 0.8457, - "step": 21505 - }, - { - "epoch": 0.55, - "learning_rate": 1.8785863941456834e-06, - "loss": 0.9971, - "step": 21506 - }, - { - "epoch": 0.55, - "learning_rate": 1.8785731788586104e-06, - "loss": 0.8096, - "step": 21507 - }, - { - "epoch": 0.55, - "learning_rate": 1.8785599628988543e-06, - "loss": 0.9922, - "step": 21508 - }, - { - "epoch": 0.55, - "learning_rate": 1.8785467462664256e-06, - "loss": 0.7295, - "step": 21509 - }, - { - "epoch": 0.55, - "learning_rate": 1.8785335289613339e-06, - "loss": 0.6871, - "step": 21510 - }, - { - "epoch": 0.55, - "learning_rate": 1.8785203109835891e-06, - "loss": 0.7505, - "step": 21511 - }, - { - "epoch": 0.55, - "learning_rate": 1.878507092333202e-06, - "loss": 0.5776, - "step": 21512 - }, - { - "epoch": 0.55, - "learning_rate": 1.8784938730101824e-06, - "loss": 0.8281, - "step": 21513 - }, - { - "epoch": 0.55, - "learning_rate": 1.8784806530145403e-06, - "loss": 0.8926, - "step": 21514 - }, - { - "epoch": 0.55, - "learning_rate": 1.8784674323462862e-06, - "loss": 0.7246, - "step": 21515 - }, - { - "epoch": 0.55, - "learning_rate": 1.8784542110054298e-06, - "loss": 0.9766, - "step": 21516 - }, - { - "epoch": 0.55, - "learning_rate": 1.8784409889919814e-06, - "loss": 0.8589, - "step": 21517 - }, - { - "epoch": 0.55, - "learning_rate": 1.8784277663059513e-06, - "loss": 0.9043, - "step": 21518 - }, - { - "epoch": 0.55, - "learning_rate": 1.8784145429473493e-06, - "loss": 0.7734, - "step": 21519 - }, - { - "epoch": 0.55, - "learning_rate": 1.8784013189161856e-06, - "loss": 0.7822, - "step": 21520 - }, - { - "epoch": 0.55, - "learning_rate": 1.8783880942124705e-06, - "loss": 0.8232, - "step": 21521 - }, - { - "epoch": 0.55, - "learning_rate": 1.878374868836214e-06, - "loss": 0.9131, - "step": 21522 - }, - { - "epoch": 0.55, - "learning_rate": 1.8783616427874263e-06, - "loss": 0.9268, - "step": 21523 - }, - { - "epoch": 0.55, - "learning_rate": 1.8783484160661174e-06, - "loss": 0.6699, - "step": 21524 - }, - { - "epoch": 0.55, - "learning_rate": 1.8783351886722975e-06, - "loss": 0.7969, - "step": 21525 - }, - { - "epoch": 0.55, - "learning_rate": 1.878321960605977e-06, - "loss": 1.0283, - "step": 21526 - }, - { - "epoch": 0.55, - "learning_rate": 1.8783087318671655e-06, - "loss": 0.998, - "step": 21527 - }, - { - "epoch": 0.55, - "learning_rate": 1.8782955024558736e-06, - "loss": 0.792, - "step": 21528 - }, - { - "epoch": 0.55, - "learning_rate": 1.878282272372111e-06, - "loss": 0.8535, - "step": 21529 - }, - { - "epoch": 0.55, - "learning_rate": 1.878269041615888e-06, - "loss": 0.5858, - "step": 21530 - }, - { - "epoch": 0.55, - "learning_rate": 1.8782558101872151e-06, - "loss": 0.5835, - "step": 21531 - }, - { - "epoch": 0.55, - "learning_rate": 1.8782425780861017e-06, - "loss": 0.7378, - "step": 21532 - }, - { - "epoch": 0.55, - "learning_rate": 1.8782293453125587e-06, - "loss": 0.8418, - "step": 21533 - }, - { - "epoch": 0.55, - "learning_rate": 1.8782161118665956e-06, - "loss": 0.8027, - "step": 21534 - }, - { - "epoch": 0.55, - "learning_rate": 1.8782028777482228e-06, - "loss": 0.791, - "step": 21535 - }, - { - "epoch": 0.55, - "learning_rate": 1.8781896429574507e-06, - "loss": 0.8271, - "step": 21536 - }, - { - "epoch": 0.55, - "learning_rate": 1.8781764074942892e-06, - "loss": 0.8799, - "step": 21537 - }, - { - "epoch": 0.55, - "learning_rate": 1.878163171358748e-06, - "loss": 0.9814, - "step": 21538 - }, - { - "epoch": 0.55, - "learning_rate": 1.878149934550838e-06, - "loss": 0.7822, - "step": 21539 - }, - { - "epoch": 0.55, - "learning_rate": 1.8781366970705687e-06, - "loss": 0.9004, - "step": 21540 - }, - { - "epoch": 0.55, - "learning_rate": 1.8781234589179506e-06, - "loss": 0.8477, - "step": 21541 - }, - { - "epoch": 0.55, - "learning_rate": 1.878110220092994e-06, - "loss": 0.9434, - "step": 21542 - }, - { - "epoch": 0.55, - "learning_rate": 1.8780969805957084e-06, - "loss": 0.731, - "step": 21543 - }, - { - "epoch": 0.55, - "learning_rate": 1.8780837404261045e-06, - "loss": 0.8506, - "step": 21544 - }, - { - "epoch": 0.55, - "learning_rate": 1.8780704995841924e-06, - "loss": 0.9766, - "step": 21545 - }, - { - "epoch": 0.55, - "learning_rate": 1.8780572580699819e-06, - "loss": 0.8867, - "step": 21546 - }, - { - "epoch": 0.55, - "learning_rate": 1.8780440158834835e-06, - "loss": 0.8501, - "step": 21547 - }, - { - "epoch": 0.55, - "learning_rate": 1.8780307730247069e-06, - "loss": 0.8926, - "step": 21548 - }, - { - "epoch": 0.55, - "learning_rate": 1.8780175294936627e-06, - "loss": 0.8301, - "step": 21549 - }, - { - "epoch": 0.55, - "learning_rate": 1.8780042852903608e-06, - "loss": 0.9902, - "step": 21550 - }, - { - "epoch": 0.55, - "learning_rate": 1.8779910404148115e-06, - "loss": 0.8145, - "step": 21551 - }, - { - "epoch": 0.55, - "learning_rate": 1.8779777948670246e-06, - "loss": 0.8438, - "step": 21552 - }, - { - "epoch": 0.55, - "learning_rate": 1.8779645486470106e-06, - "loss": 0.8169, - "step": 21553 - }, - { - "epoch": 0.55, - "learning_rate": 1.8779513017547797e-06, - "loss": 0.877, - "step": 21554 - }, - { - "epoch": 0.55, - "learning_rate": 1.8779380541903417e-06, - "loss": 0.6377, - "step": 21555 - }, - { - "epoch": 0.55, - "learning_rate": 1.8779248059537067e-06, - "loss": 1.0098, - "step": 21556 - }, - { - "epoch": 0.55, - "learning_rate": 1.877911557044885e-06, - "loss": 0.8086, - "step": 21557 - }, - { - "epoch": 0.55, - "learning_rate": 1.8778983074638873e-06, - "loss": 0.8379, - "step": 21558 - }, - { - "epoch": 0.55, - "learning_rate": 1.8778850572107227e-06, - "loss": 1.0615, - "step": 21559 - }, - { - "epoch": 0.55, - "learning_rate": 1.8778718062854023e-06, - "loss": 1.0752, - "step": 21560 - }, - { - "epoch": 0.55, - "learning_rate": 1.8778585546879357e-06, - "loss": 0.6113, - "step": 21561 - }, - { - "epoch": 0.55, - "learning_rate": 1.877845302418333e-06, - "loss": 1.0605, - "step": 21562 - }, - { - "epoch": 0.55, - "learning_rate": 1.8778320494766046e-06, - "loss": 1.0146, - "step": 21563 - }, - { - "epoch": 0.55, - "learning_rate": 1.8778187958627606e-06, - "loss": 0.7148, - "step": 21564 - }, - { - "epoch": 0.55, - "learning_rate": 1.8778055415768114e-06, - "loss": 0.8525, - "step": 21565 - }, - { - "epoch": 0.55, - "learning_rate": 1.8777922866187663e-06, - "loss": 1.0117, - "step": 21566 - }, - { - "epoch": 0.55, - "learning_rate": 1.8777790309886363e-06, - "loss": 0.814, - "step": 21567 - }, - { - "epoch": 0.55, - "learning_rate": 1.877765774686431e-06, - "loss": 0.6577, - "step": 21568 - }, - { - "epoch": 0.55, - "learning_rate": 1.8777525177121612e-06, - "loss": 0.8462, - "step": 21569 - }, - { - "epoch": 0.55, - "learning_rate": 1.8777392600658364e-06, - "loss": 0.7549, - "step": 21570 - }, - { - "epoch": 0.55, - "learning_rate": 1.8777260017474672e-06, - "loss": 0.7959, - "step": 21571 - }, - { - "epoch": 0.55, - "learning_rate": 1.8777127427570635e-06, - "loss": 1.1377, - "step": 21572 - }, - { - "epoch": 0.55, - "learning_rate": 1.8776994830946356e-06, - "loss": 0.6826, - "step": 21573 - }, - { - "epoch": 0.55, - "learning_rate": 1.8776862227601933e-06, - "loss": 0.9092, - "step": 21574 - }, - { - "epoch": 0.55, - "learning_rate": 1.8776729617537472e-06, - "loss": 1.0176, - "step": 21575 - }, - { - "epoch": 0.55, - "learning_rate": 1.8776597000753071e-06, - "loss": 0.8115, - "step": 21576 - }, - { - "epoch": 0.55, - "learning_rate": 1.8776464377248832e-06, - "loss": 0.7939, - "step": 21577 - }, - { - "epoch": 0.55, - "learning_rate": 1.8776331747024862e-06, - "loss": 0.8579, - "step": 21578 - }, - { - "epoch": 0.55, - "learning_rate": 1.877619911008126e-06, - "loss": 0.8047, - "step": 21579 - }, - { - "epoch": 0.55, - "learning_rate": 1.8776066466418121e-06, - "loss": 0.5913, - "step": 21580 - }, - { - "epoch": 0.55, - "learning_rate": 1.8775933816035553e-06, - "loss": 0.75, - "step": 21581 - }, - { - "epoch": 0.55, - "learning_rate": 1.8775801158933654e-06, - "loss": 0.8306, - "step": 21582 - }, - { - "epoch": 0.55, - "learning_rate": 1.8775668495112532e-06, - "loss": 0.8955, - "step": 21583 - }, - { - "epoch": 0.55, - "learning_rate": 1.877553582457228e-06, - "loss": 0.8799, - "step": 21584 - }, - { - "epoch": 0.55, - "learning_rate": 1.8775403147313004e-06, - "loss": 0.9658, - "step": 21585 - }, - { - "epoch": 0.55, - "learning_rate": 1.8775270463334808e-06, - "loss": 1.0303, - "step": 21586 - }, - { - "epoch": 0.55, - "learning_rate": 1.8775137772637791e-06, - "loss": 0.9385, - "step": 21587 - }, - { - "epoch": 0.55, - "learning_rate": 1.877500507522205e-06, - "loss": 0.8457, - "step": 21588 - }, - { - "epoch": 0.55, - "learning_rate": 1.8774872371087696e-06, - "loss": 0.7109, - "step": 21589 - }, - { - "epoch": 0.55, - "learning_rate": 1.8774739660234821e-06, - "loss": 1.0469, - "step": 21590 - }, - { - "epoch": 0.55, - "learning_rate": 1.8774606942663537e-06, - "loss": 0.9463, - "step": 21591 - }, - { - "epoch": 0.55, - "learning_rate": 1.8774474218373935e-06, - "loss": 0.8223, - "step": 21592 - }, - { - "epoch": 0.55, - "learning_rate": 1.8774341487366125e-06, - "loss": 0.9082, - "step": 21593 - }, - { - "epoch": 0.55, - "learning_rate": 1.8774208749640204e-06, - "loss": 0.7109, - "step": 21594 - }, - { - "epoch": 0.55, - "learning_rate": 1.8774076005196275e-06, - "loss": 0.8818, - "step": 21595 - }, - { - "epoch": 0.55, - "learning_rate": 1.877394325403444e-06, - "loss": 0.9688, - "step": 21596 - }, - { - "epoch": 0.55, - "learning_rate": 1.8773810496154797e-06, - "loss": 0.9814, - "step": 21597 - }, - { - "epoch": 0.55, - "learning_rate": 1.8773677731557453e-06, - "loss": 0.959, - "step": 21598 - }, - { - "epoch": 0.55, - "learning_rate": 1.8773544960242509e-06, - "loss": 1.0332, - "step": 21599 - }, - { - "epoch": 0.55, - "learning_rate": 1.8773412182210062e-06, - "loss": 0.645, - "step": 21600 - }, - { - "epoch": 0.55, - "learning_rate": 1.8773279397460218e-06, - "loss": 0.6868, - "step": 21601 - }, - { - "epoch": 0.55, - "learning_rate": 1.8773146605993078e-06, - "loss": 0.7573, - "step": 21602 - }, - { - "epoch": 0.55, - "learning_rate": 1.877301380780874e-06, - "loss": 0.6492, - "step": 21603 - }, - { - "epoch": 0.55, - "learning_rate": 1.8772881002907312e-06, - "loss": 0.9775, - "step": 21604 - }, - { - "epoch": 0.55, - "learning_rate": 1.8772748191288894e-06, - "loss": 1.1836, - "step": 21605 - }, - { - "epoch": 0.55, - "learning_rate": 1.8772615372953582e-06, - "loss": 0.9463, - "step": 21606 - }, - { - "epoch": 0.55, - "learning_rate": 1.8772482547901483e-06, - "loss": 0.9204, - "step": 21607 - }, - { - "epoch": 0.55, - "learning_rate": 1.8772349716132698e-06, - "loss": 1.0615, - "step": 21608 - }, - { - "epoch": 0.55, - "learning_rate": 1.877221687764733e-06, - "loss": 0.7446, - "step": 21609 - }, - { - "epoch": 0.55, - "learning_rate": 1.8772084032445474e-06, - "loss": 1.0576, - "step": 21610 - }, - { - "epoch": 0.55, - "learning_rate": 1.877195118052724e-06, - "loss": 0.7539, - "step": 21611 - }, - { - "epoch": 0.55, - "learning_rate": 1.8771818321892726e-06, - "loss": 0.9385, - "step": 21612 - }, - { - "epoch": 0.55, - "learning_rate": 1.8771685456542037e-06, - "loss": 0.9648, - "step": 21613 - }, - { - "epoch": 0.55, - "learning_rate": 1.8771552584475266e-06, - "loss": 0.8745, - "step": 21614 - }, - { - "epoch": 0.55, - "learning_rate": 1.8771419705692523e-06, - "loss": 1.209, - "step": 21615 - }, - { - "epoch": 0.55, - "learning_rate": 1.877128682019391e-06, - "loss": 0.918, - "step": 21616 - }, - { - "epoch": 0.55, - "learning_rate": 1.8771153927979522e-06, - "loss": 1.0605, - "step": 21617 - }, - { - "epoch": 0.55, - "learning_rate": 1.8771021029049465e-06, - "loss": 1.0557, - "step": 21618 - }, - { - "epoch": 0.55, - "learning_rate": 1.8770888123403843e-06, - "loss": 0.8125, - "step": 21619 - }, - { - "epoch": 0.55, - "learning_rate": 1.8770755211042755e-06, - "loss": 0.9102, - "step": 21620 - }, - { - "epoch": 0.55, - "learning_rate": 1.8770622291966301e-06, - "loss": 0.7568, - "step": 21621 - }, - { - "epoch": 0.55, - "learning_rate": 1.8770489366174587e-06, - "loss": 0.9248, - "step": 21622 - }, - { - "epoch": 0.55, - "learning_rate": 1.8770356433667712e-06, - "loss": 0.6138, - "step": 21623 - }, - { - "epoch": 0.55, - "learning_rate": 1.8770223494445776e-06, - "loss": 0.9648, - "step": 21624 - }, - { - "epoch": 0.55, - "learning_rate": 1.8770090548508886e-06, - "loss": 0.9512, - "step": 21625 - }, - { - "epoch": 0.55, - "learning_rate": 1.8769957595857137e-06, - "loss": 1.0186, - "step": 21626 - }, - { - "epoch": 0.55, - "learning_rate": 1.8769824636490638e-06, - "loss": 0.8672, - "step": 21627 - }, - { - "epoch": 0.55, - "learning_rate": 1.8769691670409488e-06, - "loss": 1.041, - "step": 21628 - }, - { - "epoch": 0.55, - "learning_rate": 1.8769558697613787e-06, - "loss": 0.8379, - "step": 21629 - }, - { - "epoch": 0.55, - "learning_rate": 1.876942571810364e-06, - "loss": 0.9668, - "step": 21630 - }, - { - "epoch": 0.55, - "learning_rate": 1.8769292731879144e-06, - "loss": 0.8398, - "step": 21631 - }, - { - "epoch": 0.55, - "learning_rate": 1.8769159738940407e-06, - "loss": 0.8877, - "step": 21632 - }, - { - "epoch": 0.55, - "learning_rate": 1.8769026739287526e-06, - "loss": 0.7036, - "step": 21633 - }, - { - "epoch": 0.55, - "learning_rate": 1.8768893732920604e-06, - "loss": 0.751, - "step": 21634 - }, - { - "epoch": 0.55, - "learning_rate": 1.8768760719839746e-06, - "loss": 0.9248, - "step": 21635 - }, - { - "epoch": 0.55, - "learning_rate": 1.8768627700045045e-06, - "loss": 0.7134, - "step": 21636 - }, - { - "epoch": 0.55, - "learning_rate": 1.8768494673536614e-06, - "loss": 1.0068, - "step": 21637 - }, - { - "epoch": 0.55, - "learning_rate": 1.8768361640314549e-06, - "loss": 1.042, - "step": 21638 - }, - { - "epoch": 0.55, - "learning_rate": 1.8768228600378953e-06, - "loss": 0.835, - "step": 21639 - }, - { - "epoch": 0.55, - "learning_rate": 1.8768095553729927e-06, - "loss": 0.7949, - "step": 21640 - }, - { - "epoch": 0.55, - "learning_rate": 1.8767962500367571e-06, - "loss": 0.8472, - "step": 21641 - }, - { - "epoch": 0.55, - "learning_rate": 1.876782944029199e-06, - "loss": 0.9199, - "step": 21642 - }, - { - "epoch": 0.55, - "learning_rate": 1.8767696373503289e-06, - "loss": 0.6956, - "step": 21643 - }, - { - "epoch": 0.55, - "learning_rate": 1.8767563300001562e-06, - "loss": 0.8369, - "step": 21644 - }, - { - "epoch": 0.55, - "learning_rate": 1.8767430219786918e-06, - "loss": 0.8809, - "step": 21645 - }, - { - "epoch": 0.55, - "learning_rate": 1.8767297132859455e-06, - "loss": 0.8184, - "step": 21646 - }, - { - "epoch": 0.55, - "learning_rate": 1.8767164039219275e-06, - "loss": 0.7427, - "step": 21647 - }, - { - "epoch": 0.55, - "learning_rate": 1.8767030938866477e-06, - "loss": 0.9551, - "step": 21648 - }, - { - "epoch": 0.55, - "learning_rate": 1.8766897831801172e-06, - "loss": 1.0088, - "step": 21649 - }, - { - "epoch": 0.55, - "learning_rate": 1.8766764718023452e-06, - "loss": 0.8333, - "step": 21650 - }, - { - "epoch": 0.55, - "learning_rate": 1.8766631597533429e-06, - "loss": 0.9014, - "step": 21651 - }, - { - "epoch": 0.55, - "learning_rate": 1.8766498470331197e-06, - "loss": 0.9395, - "step": 21652 - }, - { - "epoch": 0.55, - "learning_rate": 1.876636533641686e-06, - "loss": 0.624, - "step": 21653 - }, - { - "epoch": 0.56, - "learning_rate": 1.8766232195790516e-06, - "loss": 0.9619, - "step": 21654 - }, - { - "epoch": 0.56, - "learning_rate": 1.8766099048452278e-06, - "loss": 0.9453, - "step": 21655 - }, - { - "epoch": 0.56, - "learning_rate": 1.8765965894402235e-06, - "loss": 0.9043, - "step": 21656 - }, - { - "epoch": 0.56, - "learning_rate": 1.87658327336405e-06, - "loss": 0.8086, - "step": 21657 - }, - { - "epoch": 0.56, - "learning_rate": 1.8765699566167169e-06, - "loss": 0.5215, - "step": 21658 - }, - { - "epoch": 0.56, - "learning_rate": 1.8765566391982342e-06, - "loss": 0.8574, - "step": 21659 - }, - { - "epoch": 0.56, - "learning_rate": 1.8765433211086124e-06, - "loss": 1.1191, - "step": 21660 - }, - { - "epoch": 0.56, - "learning_rate": 1.8765300023478618e-06, - "loss": 0.8232, - "step": 21661 - }, - { - "epoch": 0.56, - "learning_rate": 1.8765166829159926e-06, - "loss": 1.0342, - "step": 21662 - }, - { - "epoch": 0.56, - "learning_rate": 1.8765033628130147e-06, - "loss": 0.9912, - "step": 21663 - }, - { - "epoch": 0.56, - "learning_rate": 1.8764900420389388e-06, - "loss": 0.7598, - "step": 21664 - }, - { - "epoch": 0.56, - "learning_rate": 1.8764767205937743e-06, - "loss": 0.9121, - "step": 21665 - }, - { - "epoch": 0.56, - "learning_rate": 1.8764633984775321e-06, - "loss": 0.7979, - "step": 21666 - }, - { - "epoch": 0.56, - "learning_rate": 1.8764500756902222e-06, - "loss": 0.7559, - "step": 21667 - }, - { - "epoch": 0.56, - "learning_rate": 1.876436752231855e-06, - "loss": 0.6274, - "step": 21668 - }, - { - "epoch": 0.56, - "learning_rate": 1.87642342810244e-06, - "loss": 0.8135, - "step": 21669 - }, - { - "epoch": 0.56, - "learning_rate": 1.876410103301988e-06, - "loss": 0.7661, - "step": 21670 - }, - { - "epoch": 0.56, - "learning_rate": 1.8763967778305095e-06, - "loss": 0.8428, - "step": 21671 - }, - { - "epoch": 0.56, - "learning_rate": 1.8763834516880139e-06, - "loss": 0.9521, - "step": 21672 - }, - { - "epoch": 0.56, - "learning_rate": 1.8763701248745122e-06, - "loss": 0.9199, - "step": 21673 - }, - { - "epoch": 0.56, - "learning_rate": 1.8763567973900136e-06, - "loss": 1.0752, - "step": 21674 - }, - { - "epoch": 0.56, - "learning_rate": 1.8763434692345292e-06, - "loss": 0.8896, - "step": 21675 - }, - { - "epoch": 0.56, - "learning_rate": 1.876330140408069e-06, - "loss": 0.7637, - "step": 21676 - }, - { - "epoch": 0.56, - "learning_rate": 1.876316810910643e-06, - "loss": 0.9678, - "step": 21677 - }, - { - "epoch": 0.56, - "learning_rate": 1.8763034807422616e-06, - "loss": 0.9736, - "step": 21678 - }, - { - "epoch": 0.56, - "learning_rate": 1.8762901499029345e-06, - "loss": 0.9961, - "step": 21679 - }, - { - "epoch": 0.56, - "learning_rate": 1.8762768183926727e-06, - "loss": 0.8877, - "step": 21680 - }, - { - "epoch": 0.56, - "learning_rate": 1.876263486211486e-06, - "loss": 0.6826, - "step": 21681 - }, - { - "epoch": 0.56, - "learning_rate": 1.8762501533593847e-06, - "loss": 0.8418, - "step": 21682 - }, - { - "epoch": 0.56, - "learning_rate": 1.8762368198363787e-06, - "loss": 1.0303, - "step": 21683 - }, - { - "epoch": 0.56, - "learning_rate": 1.8762234856424786e-06, - "loss": 0.8652, - "step": 21684 - }, - { - "epoch": 0.56, - "learning_rate": 1.8762101507776945e-06, - "loss": 0.8564, - "step": 21685 - }, - { - "epoch": 0.56, - "learning_rate": 1.8761968152420366e-06, - "loss": 0.7959, - "step": 21686 - }, - { - "epoch": 0.56, - "learning_rate": 1.8761834790355149e-06, - "loss": 0.7959, - "step": 21687 - }, - { - "epoch": 0.56, - "learning_rate": 1.87617014215814e-06, - "loss": 0.8223, - "step": 21688 - }, - { - "epoch": 0.56, - "learning_rate": 1.876156804609922e-06, - "loss": 1.0059, - "step": 21689 - }, - { - "epoch": 0.56, - "learning_rate": 1.8761434663908708e-06, - "loss": 0.8184, - "step": 21690 - }, - { - "epoch": 0.56, - "learning_rate": 1.876130127500997e-06, - "loss": 0.7988, - "step": 21691 - }, - { - "epoch": 0.56, - "learning_rate": 1.8761167879403103e-06, - "loss": 0.8252, - "step": 21692 - }, - { - "epoch": 0.56, - "learning_rate": 1.8761034477088216e-06, - "loss": 0.8682, - "step": 21693 - }, - { - "epoch": 0.56, - "learning_rate": 1.876090106806541e-06, - "loss": 0.7639, - "step": 21694 - }, - { - "epoch": 0.56, - "learning_rate": 1.876076765233478e-06, - "loss": 0.8359, - "step": 21695 - }, - { - "epoch": 0.56, - "learning_rate": 1.8760634229896434e-06, - "loss": 0.6909, - "step": 21696 - }, - { - "epoch": 0.56, - "learning_rate": 1.8760500800750476e-06, - "loss": 0.9463, - "step": 21697 - }, - { - "epoch": 0.56, - "learning_rate": 1.8760367364897002e-06, - "loss": 0.9424, - "step": 21698 - }, - { - "epoch": 0.56, - "learning_rate": 1.8760233922336117e-06, - "loss": 0.9795, - "step": 21699 - }, - { - "epoch": 0.56, - "learning_rate": 1.8760100473067928e-06, - "loss": 0.7959, - "step": 21700 - }, - { - "epoch": 0.56, - "learning_rate": 1.875996701709253e-06, - "loss": 1.1387, - "step": 21701 - }, - { - "epoch": 0.56, - "learning_rate": 1.875983355441003e-06, - "loss": 0.8311, - "step": 21702 - }, - { - "epoch": 0.56, - "learning_rate": 1.8759700085020525e-06, - "loss": 0.8491, - "step": 21703 - }, - { - "epoch": 0.56, - "learning_rate": 1.8759566608924121e-06, - "loss": 0.833, - "step": 21704 - }, - { - "epoch": 0.56, - "learning_rate": 1.8759433126120924e-06, - "loss": 0.6279, - "step": 21705 - }, - { - "epoch": 0.56, - "learning_rate": 1.8759299636611025e-06, - "loss": 0.7222, - "step": 21706 - }, - { - "epoch": 0.56, - "learning_rate": 1.875916614039454e-06, - "loss": 0.8877, - "step": 21707 - }, - { - "epoch": 0.56, - "learning_rate": 1.8759032637471559e-06, - "loss": 0.9854, - "step": 21708 - }, - { - "epoch": 0.56, - "learning_rate": 1.8758899127842193e-06, - "loss": 0.8867, - "step": 21709 - }, - { - "epoch": 0.56, - "learning_rate": 1.8758765611506538e-06, - "loss": 0.8496, - "step": 21710 - }, - { - "epoch": 0.56, - "learning_rate": 1.8758632088464702e-06, - "loss": 0.7158, - "step": 21711 - }, - { - "epoch": 0.56, - "learning_rate": 1.875849855871678e-06, - "loss": 0.6504, - "step": 21712 - }, - { - "epoch": 0.56, - "learning_rate": 1.875836502226288e-06, - "loss": 1.0166, - "step": 21713 - }, - { - "epoch": 0.56, - "learning_rate": 1.8758231479103102e-06, - "loss": 0.7002, - "step": 21714 - }, - { - "epoch": 0.56, - "learning_rate": 1.8758097929237551e-06, - "loss": 0.7446, - "step": 21715 - }, - { - "epoch": 0.56, - "learning_rate": 1.8757964372666326e-06, - "loss": 0.7471, - "step": 21716 - }, - { - "epoch": 0.56, - "learning_rate": 1.8757830809389529e-06, - "loss": 0.7871, - "step": 21717 - }, - { - "epoch": 0.56, - "learning_rate": 1.875769723940727e-06, - "loss": 0.7334, - "step": 21718 - }, - { - "epoch": 0.56, - "learning_rate": 1.8757563662719639e-06, - "loss": 0.9102, - "step": 21719 - }, - { - "epoch": 0.56, - "learning_rate": 1.8757430079326743e-06, - "loss": 0.9209, - "step": 21720 - }, - { - "epoch": 0.56, - "learning_rate": 1.875729648922869e-06, - "loss": 0.8564, - "step": 21721 - }, - { - "epoch": 0.56, - "learning_rate": 1.8757162892425574e-06, - "loss": 0.7959, - "step": 21722 - }, - { - "epoch": 0.56, - "learning_rate": 1.87570292889175e-06, - "loss": 0.7959, - "step": 21723 - }, - { - "epoch": 0.56, - "learning_rate": 1.8756895678704577e-06, - "loss": 0.79, - "step": 21724 - }, - { - "epoch": 0.56, - "learning_rate": 1.8756762061786896e-06, - "loss": 0.7646, - "step": 21725 - }, - { - "epoch": 0.56, - "learning_rate": 1.8756628438164568e-06, - "loss": 0.9121, - "step": 21726 - }, - { - "epoch": 0.56, - "learning_rate": 1.8756494807837693e-06, - "loss": 0.9272, - "step": 21727 - }, - { - "epoch": 0.56, - "learning_rate": 1.8756361170806372e-06, - "loss": 0.8252, - "step": 21728 - }, - { - "epoch": 0.56, - "learning_rate": 1.8756227527070705e-06, - "loss": 0.9863, - "step": 21729 - }, - { - "epoch": 0.56, - "learning_rate": 1.87560938766308e-06, - "loss": 0.9756, - "step": 21730 - }, - { - "epoch": 0.56, - "learning_rate": 1.8755960219486756e-06, - "loss": 0.7808, - "step": 21731 - }, - { - "epoch": 0.56, - "learning_rate": 1.8755826555638677e-06, - "loss": 0.7935, - "step": 21732 - }, - { - "epoch": 0.56, - "learning_rate": 1.875569288508666e-06, - "loss": 0.9531, - "step": 21733 - }, - { - "epoch": 0.56, - "learning_rate": 1.8755559207830816e-06, - "loss": 0.8379, - "step": 21734 - }, - { - "epoch": 0.56, - "learning_rate": 1.875542552387124e-06, - "loss": 0.9028, - "step": 21735 - }, - { - "epoch": 0.56, - "learning_rate": 1.875529183320804e-06, - "loss": 0.7847, - "step": 21736 - }, - { - "epoch": 0.56, - "learning_rate": 1.8755158135841315e-06, - "loss": 0.9043, - "step": 21737 - }, - { - "epoch": 0.56, - "learning_rate": 1.8755024431771167e-06, - "loss": 0.9248, - "step": 21738 - }, - { - "epoch": 0.56, - "learning_rate": 1.8754890720997697e-06, - "loss": 0.9082, - "step": 21739 - }, - { - "epoch": 0.56, - "learning_rate": 1.8754757003521012e-06, - "loss": 1.042, - "step": 21740 - }, - { - "epoch": 0.56, - "learning_rate": 1.8754623279341214e-06, - "loss": 0.8164, - "step": 21741 - }, - { - "epoch": 0.56, - "learning_rate": 1.87544895484584e-06, - "loss": 0.6768, - "step": 21742 - }, - { - "epoch": 0.56, - "learning_rate": 1.875435581087268e-06, - "loss": 0.9033, - "step": 21743 - }, - { - "epoch": 0.56, - "learning_rate": 1.8754222066584152e-06, - "loss": 0.9668, - "step": 21744 - }, - { - "epoch": 0.56, - "learning_rate": 1.8754088315592912e-06, - "loss": 0.9521, - "step": 21745 - }, - { - "epoch": 0.56, - "learning_rate": 1.8753954557899076e-06, - "loss": 0.897, - "step": 21746 - }, - { - "epoch": 0.56, - "learning_rate": 1.875382079350274e-06, - "loss": 0.6782, - "step": 21747 - }, - { - "epoch": 0.56, - "learning_rate": 1.8753687022404e-06, - "loss": 1.0049, - "step": 21748 - }, - { - "epoch": 0.56, - "learning_rate": 1.8753553244602968e-06, - "loss": 0.6343, - "step": 21749 - }, - { - "epoch": 0.56, - "learning_rate": 1.8753419460099744e-06, - "loss": 0.9561, - "step": 21750 - }, - { - "epoch": 0.56, - "learning_rate": 1.8753285668894428e-06, - "loss": 1.0439, - "step": 21751 - }, - { - "epoch": 0.56, - "learning_rate": 1.8753151870987124e-06, - "loss": 0.9238, - "step": 21752 - }, - { - "epoch": 0.56, - "learning_rate": 1.8753018066377932e-06, - "loss": 0.7559, - "step": 21753 - }, - { - "epoch": 0.56, - "learning_rate": 1.8752884255066959e-06, - "loss": 0.8516, - "step": 21754 - }, - { - "epoch": 0.56, - "learning_rate": 1.87527504370543e-06, - "loss": 0.707, - "step": 21755 - }, - { - "epoch": 0.56, - "learning_rate": 1.8752616612340068e-06, - "loss": 0.7368, - "step": 21756 - }, - { - "epoch": 0.56, - "learning_rate": 1.875248278092436e-06, - "loss": 0.6753, - "step": 21757 - }, - { - "epoch": 0.56, - "learning_rate": 1.8752348942807275e-06, - "loss": 0.5911, - "step": 21758 - }, - { - "epoch": 0.56, - "learning_rate": 1.875221509798892e-06, - "loss": 0.9795, - "step": 21759 - }, - { - "epoch": 0.56, - "learning_rate": 1.87520812464694e-06, - "loss": 0.9658, - "step": 21760 - }, - { - "epoch": 0.56, - "learning_rate": 1.8751947388248807e-06, - "loss": 0.7905, - "step": 21761 - }, - { - "epoch": 0.56, - "learning_rate": 1.8751813523327255e-06, - "loss": 0.8203, - "step": 21762 - }, - { - "epoch": 0.56, - "learning_rate": 1.8751679651704842e-06, - "loss": 0.5347, - "step": 21763 - }, - { - "epoch": 0.56, - "learning_rate": 1.875154577338167e-06, - "loss": 0.688, - "step": 21764 - }, - { - "epoch": 0.56, - "learning_rate": 1.8751411888357839e-06, - "loss": 0.8584, - "step": 21765 - }, - { - "epoch": 0.56, - "learning_rate": 1.8751277996633456e-06, - "loss": 0.7324, - "step": 21766 - }, - { - "epoch": 0.56, - "learning_rate": 1.8751144098208625e-06, - "loss": 0.9941, - "step": 21767 - }, - { - "epoch": 0.56, - "learning_rate": 1.8751010193083442e-06, - "loss": 0.874, - "step": 21768 - }, - { - "epoch": 0.56, - "learning_rate": 1.8750876281258012e-06, - "loss": 1.0684, - "step": 21769 - }, - { - "epoch": 0.56, - "learning_rate": 1.8750742362732441e-06, - "loss": 0.8022, - "step": 21770 - }, - { - "epoch": 0.56, - "learning_rate": 1.8750608437506827e-06, - "loss": 0.9463, - "step": 21771 - }, - { - "epoch": 0.56, - "learning_rate": 1.8750474505581276e-06, - "loss": 0.8555, - "step": 21772 - }, - { - "epoch": 0.56, - "learning_rate": 1.8750340566955889e-06, - "loss": 0.9023, - "step": 21773 - }, - { - "epoch": 0.56, - "learning_rate": 1.8750206621630765e-06, - "loss": 0.8955, - "step": 21774 - }, - { - "epoch": 0.56, - "learning_rate": 1.8750072669606014e-06, - "loss": 0.7666, - "step": 21775 - }, - { - "epoch": 0.56, - "learning_rate": 1.8749938710881733e-06, - "loss": 0.7463, - "step": 21776 - }, - { - "epoch": 0.56, - "learning_rate": 1.8749804745458028e-06, - "loss": 0.9541, - "step": 21777 - }, - { - "epoch": 0.56, - "learning_rate": 1.8749670773334997e-06, - "loss": 0.9268, - "step": 21778 - }, - { - "epoch": 0.56, - "learning_rate": 1.8749536794512749e-06, - "loss": 0.7129, - "step": 21779 - }, - { - "epoch": 0.56, - "learning_rate": 1.8749402808991382e-06, - "loss": 1.0439, - "step": 21780 - }, - { - "epoch": 0.56, - "learning_rate": 1.8749268816770995e-06, - "loss": 0.8643, - "step": 21781 - }, - { - "epoch": 0.56, - "learning_rate": 1.8749134817851702e-06, - "loss": 0.7402, - "step": 21782 - }, - { - "epoch": 0.56, - "learning_rate": 1.8749000812233592e-06, - "loss": 0.8203, - "step": 21783 - }, - { - "epoch": 0.56, - "learning_rate": 1.8748866799916781e-06, - "loss": 0.9102, - "step": 21784 - }, - { - "epoch": 0.56, - "learning_rate": 1.8748732780901363e-06, - "loss": 0.7747, - "step": 21785 - }, - { - "epoch": 0.56, - "learning_rate": 1.874859875518744e-06, - "loss": 0.8713, - "step": 21786 - }, - { - "epoch": 0.56, - "learning_rate": 1.874846472277512e-06, - "loss": 0.8906, - "step": 21787 - }, - { - "epoch": 0.56, - "learning_rate": 1.8748330683664499e-06, - "loss": 0.9756, - "step": 21788 - }, - { - "epoch": 0.56, - "learning_rate": 1.8748196637855687e-06, - "loss": 0.9414, - "step": 21789 - }, - { - "epoch": 0.56, - "learning_rate": 1.8748062585348783e-06, - "loss": 0.8955, - "step": 21790 - }, - { - "epoch": 0.56, - "learning_rate": 1.8747928526143887e-06, - "loss": 0.7876, - "step": 21791 - }, - { - "epoch": 0.56, - "learning_rate": 1.8747794460241106e-06, - "loss": 0.8652, - "step": 21792 - }, - { - "epoch": 0.56, - "learning_rate": 1.8747660387640543e-06, - "loss": 0.8193, - "step": 21793 - }, - { - "epoch": 0.56, - "learning_rate": 1.8747526308342296e-06, - "loss": 0.6855, - "step": 21794 - }, - { - "epoch": 0.56, - "learning_rate": 1.8747392222346472e-06, - "loss": 0.9785, - "step": 21795 - }, - { - "epoch": 0.56, - "learning_rate": 1.8747258129653171e-06, - "loss": 1.0693, - "step": 21796 - }, - { - "epoch": 0.56, - "learning_rate": 1.8747124030262498e-06, - "loss": 0.8535, - "step": 21797 - }, - { - "epoch": 0.56, - "learning_rate": 1.8746989924174553e-06, - "loss": 0.6416, - "step": 21798 - }, - { - "epoch": 0.56, - "learning_rate": 1.874685581138944e-06, - "loss": 0.9736, - "step": 21799 - }, - { - "epoch": 0.56, - "learning_rate": 1.8746721691907262e-06, - "loss": 0.7104, - "step": 21800 - }, - { - "epoch": 0.56, - "learning_rate": 1.874658756572812e-06, - "loss": 0.7036, - "step": 21801 - }, - { - "epoch": 0.56, - "learning_rate": 1.8746453432852122e-06, - "loss": 1.0107, - "step": 21802 - }, - { - "epoch": 0.56, - "learning_rate": 1.8746319293279363e-06, - "loss": 0.8096, - "step": 21803 - }, - { - "epoch": 0.56, - "learning_rate": 1.874618514700995e-06, - "loss": 0.9297, - "step": 21804 - }, - { - "epoch": 0.56, - "learning_rate": 1.8746050994043987e-06, - "loss": 0.8535, - "step": 21805 - }, - { - "epoch": 0.56, - "learning_rate": 1.8745916834381572e-06, - "loss": 0.6509, - "step": 21806 - }, - { - "epoch": 0.56, - "learning_rate": 1.8745782668022812e-06, - "loss": 0.8589, - "step": 21807 - }, - { - "epoch": 0.56, - "learning_rate": 1.8745648494967809e-06, - "loss": 0.9404, - "step": 21808 - }, - { - "epoch": 0.56, - "learning_rate": 1.8745514315216665e-06, - "loss": 0.7031, - "step": 21809 - }, - { - "epoch": 0.56, - "learning_rate": 1.8745380128769483e-06, - "loss": 0.8643, - "step": 21810 - }, - { - "epoch": 0.56, - "learning_rate": 1.8745245935626363e-06, - "loss": 0.7468, - "step": 21811 - }, - { - "epoch": 0.56, - "learning_rate": 1.8745111735787416e-06, - "loss": 0.9185, - "step": 21812 - }, - { - "epoch": 0.56, - "learning_rate": 1.8744977529252735e-06, - "loss": 1.001, - "step": 21813 - }, - { - "epoch": 0.56, - "learning_rate": 1.8744843316022428e-06, - "loss": 0.9277, - "step": 21814 - }, - { - "epoch": 0.56, - "learning_rate": 1.8744709096096596e-06, - "loss": 0.9521, - "step": 21815 - }, - { - "epoch": 0.56, - "learning_rate": 1.8744574869475342e-06, - "loss": 0.7705, - "step": 21816 - }, - { - "epoch": 0.56, - "learning_rate": 1.8744440636158769e-06, - "loss": 0.8892, - "step": 21817 - }, - { - "epoch": 0.56, - "learning_rate": 1.8744306396146978e-06, - "loss": 0.8281, - "step": 21818 - }, - { - "epoch": 0.56, - "learning_rate": 1.8744172149440076e-06, - "loss": 0.9395, - "step": 21819 - }, - { - "epoch": 0.56, - "learning_rate": 1.8744037896038164e-06, - "loss": 0.7339, - "step": 21820 - }, - { - "epoch": 0.56, - "learning_rate": 1.8743903635941344e-06, - "loss": 0.9414, - "step": 21821 - }, - { - "epoch": 0.56, - "learning_rate": 1.874376936914972e-06, - "loss": 0.8257, - "step": 21822 - }, - { - "epoch": 0.56, - "learning_rate": 1.874363509566339e-06, - "loss": 0.8672, - "step": 21823 - }, - { - "epoch": 0.56, - "learning_rate": 1.8743500815482464e-06, - "loss": 0.8174, - "step": 21824 - }, - { - "epoch": 0.56, - "learning_rate": 1.874336652860704e-06, - "loss": 1.0908, - "step": 21825 - }, - { - "epoch": 0.56, - "learning_rate": 1.8743232235037225e-06, - "loss": 0.7246, - "step": 21826 - }, - { - "epoch": 0.56, - "learning_rate": 1.8743097934773116e-06, - "loss": 0.8906, - "step": 21827 - }, - { - "epoch": 0.56, - "learning_rate": 1.874296362781482e-06, - "loss": 0.7573, - "step": 21828 - }, - { - "epoch": 0.56, - "learning_rate": 1.874282931416244e-06, - "loss": 0.9746, - "step": 21829 - }, - { - "epoch": 0.56, - "learning_rate": 1.8742694993816074e-06, - "loss": 0.8701, - "step": 21830 - }, - { - "epoch": 0.56, - "learning_rate": 1.8742560666775832e-06, - "loss": 1.0352, - "step": 21831 - }, - { - "epoch": 0.56, - "learning_rate": 1.8742426333041811e-06, - "loss": 1.0654, - "step": 21832 - }, - { - "epoch": 0.56, - "learning_rate": 1.8742291992614119e-06, - "loss": 0.8428, - "step": 21833 - }, - { - "epoch": 0.56, - "learning_rate": 1.8742157645492854e-06, - "loss": 0.7871, - "step": 21834 - }, - { - "epoch": 0.56, - "learning_rate": 1.874202329167812e-06, - "loss": 0.6426, - "step": 21835 - }, - { - "epoch": 0.56, - "learning_rate": 1.8741888931170022e-06, - "loss": 0.9688, - "step": 21836 - }, - { - "epoch": 0.56, - "learning_rate": 1.8741754563968662e-06, - "loss": 0.7607, - "step": 21837 - }, - { - "epoch": 0.56, - "learning_rate": 1.874162019007414e-06, - "loss": 0.7798, - "step": 21838 - }, - { - "epoch": 0.56, - "learning_rate": 1.8741485809486566e-06, - "loss": 0.9727, - "step": 21839 - }, - { - "epoch": 0.56, - "learning_rate": 1.8741351422206036e-06, - "loss": 0.7705, - "step": 21840 - }, - { - "epoch": 0.56, - "learning_rate": 1.8741217028232653e-06, - "loss": 1.1035, - "step": 21841 - }, - { - "epoch": 0.56, - "learning_rate": 1.8741082627566525e-06, - "loss": 0.7744, - "step": 21842 - }, - { - "epoch": 0.56, - "learning_rate": 1.8740948220207748e-06, - "loss": 1.1445, - "step": 21843 - }, - { - "epoch": 0.56, - "learning_rate": 1.8740813806156432e-06, - "loss": 0.853, - "step": 21844 - }, - { - "epoch": 0.56, - "learning_rate": 1.8740679385412677e-06, - "loss": 0.8228, - "step": 21845 - }, - { - "epoch": 0.56, - "learning_rate": 1.8740544957976585e-06, - "loss": 0.8154, - "step": 21846 - }, - { - "epoch": 0.56, - "learning_rate": 1.874041052384826e-06, - "loss": 1.0098, - "step": 21847 - }, - { - "epoch": 0.56, - "learning_rate": 1.8740276083027804e-06, - "loss": 0.8877, - "step": 21848 - }, - { - "epoch": 0.56, - "learning_rate": 1.8740141635515322e-06, - "loss": 0.9023, - "step": 21849 - }, - { - "epoch": 0.56, - "learning_rate": 1.8740007181310913e-06, - "loss": 0.8203, - "step": 21850 - }, - { - "epoch": 0.56, - "learning_rate": 1.8739872720414684e-06, - "loss": 1.001, - "step": 21851 - }, - { - "epoch": 0.56, - "learning_rate": 1.8739738252826735e-06, - "loss": 0.9277, - "step": 21852 - }, - { - "epoch": 0.56, - "learning_rate": 1.8739603778547171e-06, - "loss": 0.7656, - "step": 21853 - }, - { - "epoch": 0.56, - "learning_rate": 1.8739469297576096e-06, - "loss": 0.7334, - "step": 21854 - }, - { - "epoch": 0.56, - "learning_rate": 1.8739334809913609e-06, - "loss": 0.7251, - "step": 21855 - }, - { - "epoch": 0.56, - "learning_rate": 1.8739200315559813e-06, - "loss": 1.0234, - "step": 21856 - }, - { - "epoch": 0.56, - "learning_rate": 1.873906581451482e-06, - "loss": 1.0459, - "step": 21857 - }, - { - "epoch": 0.56, - "learning_rate": 1.873893130677872e-06, - "loss": 0.8848, - "step": 21858 - }, - { - "epoch": 0.56, - "learning_rate": 1.8738796792351622e-06, - "loss": 0.8008, - "step": 21859 - }, - { - "epoch": 0.56, - "learning_rate": 1.873866227123363e-06, - "loss": 0.8652, - "step": 21860 - }, - { - "epoch": 0.56, - "learning_rate": 1.873852774342485e-06, - "loss": 0.8477, - "step": 21861 - }, - { - "epoch": 0.56, - "learning_rate": 1.873839320892538e-06, - "loss": 0.8481, - "step": 21862 - }, - { - "epoch": 0.56, - "learning_rate": 1.873825866773532e-06, - "loss": 1.0488, - "step": 21863 - }, - { - "epoch": 0.56, - "learning_rate": 1.8738124119854781e-06, - "loss": 0.8184, - "step": 21864 - }, - { - "epoch": 0.56, - "learning_rate": 1.8737989565283861e-06, - "loss": 1.0703, - "step": 21865 - }, - { - "epoch": 0.56, - "learning_rate": 1.8737855004022664e-06, - "loss": 1.0859, - "step": 21866 - }, - { - "epoch": 0.56, - "learning_rate": 1.8737720436071294e-06, - "loss": 0.9346, - "step": 21867 - }, - { - "epoch": 0.56, - "learning_rate": 1.8737585861429852e-06, - "loss": 1.0479, - "step": 21868 - }, - { - "epoch": 0.56, - "learning_rate": 1.8737451280098444e-06, - "loss": 0.6582, - "step": 21869 - }, - { - "epoch": 0.56, - "learning_rate": 1.873731669207717e-06, - "loss": 0.8135, - "step": 21870 - }, - { - "epoch": 0.56, - "learning_rate": 1.8737182097366133e-06, - "loss": 0.9102, - "step": 21871 - }, - { - "epoch": 0.56, - "learning_rate": 1.8737047495965438e-06, - "loss": 0.9336, - "step": 21872 - }, - { - "epoch": 0.56, - "learning_rate": 1.8736912887875188e-06, - "loss": 0.9053, - "step": 21873 - }, - { - "epoch": 0.56, - "learning_rate": 1.873677827309549e-06, - "loss": 0.9395, - "step": 21874 - }, - { - "epoch": 0.56, - "learning_rate": 1.8736643651626436e-06, - "loss": 0.8398, - "step": 21875 - }, - { - "epoch": 0.56, - "learning_rate": 1.8736509023468138e-06, - "loss": 1.0361, - "step": 21876 - }, - { - "epoch": 0.56, - "learning_rate": 1.8736374388620697e-06, - "loss": 0.8145, - "step": 21877 - }, - { - "epoch": 0.56, - "learning_rate": 1.8736239747084218e-06, - "loss": 0.7725, - "step": 21878 - }, - { - "epoch": 0.56, - "learning_rate": 1.8736105098858798e-06, - "loss": 0.9502, - "step": 21879 - }, - { - "epoch": 0.56, - "learning_rate": 1.8735970443944544e-06, - "loss": 0.865, - "step": 21880 - }, - { - "epoch": 0.56, - "learning_rate": 1.8735835782341562e-06, - "loss": 0.7324, - "step": 21881 - }, - { - "epoch": 0.56, - "learning_rate": 1.8735701114049953e-06, - "loss": 0.7397, - "step": 21882 - }, - { - "epoch": 0.56, - "learning_rate": 1.8735566439069816e-06, - "loss": 0.7925, - "step": 21883 - }, - { - "epoch": 0.56, - "learning_rate": 1.873543175740126e-06, - "loss": 0.8584, - "step": 21884 - }, - { - "epoch": 0.56, - "learning_rate": 1.8735297069044384e-06, - "loss": 0.853, - "step": 21885 - }, - { - "epoch": 0.56, - "learning_rate": 1.8735162373999294e-06, - "loss": 0.876, - "step": 21886 - }, - { - "epoch": 0.56, - "learning_rate": 1.873502767226609e-06, - "loss": 0.665, - "step": 21887 - }, - { - "epoch": 0.56, - "learning_rate": 1.8734892963844878e-06, - "loss": 1.0098, - "step": 21888 - }, - { - "epoch": 0.56, - "learning_rate": 1.8734758248735761e-06, - "loss": 0.7856, - "step": 21889 - }, - { - "epoch": 0.56, - "learning_rate": 1.8734623526938838e-06, - "loss": 0.9043, - "step": 21890 - }, - { - "epoch": 0.56, - "learning_rate": 1.8734488798454218e-06, - "loss": 0.6648, - "step": 21891 - }, - { - "epoch": 0.56, - "learning_rate": 1.8734354063282e-06, - "loss": 0.9844, - "step": 21892 - }, - { - "epoch": 0.56, - "learning_rate": 1.8734219321422292e-06, - "loss": 0.7812, - "step": 21893 - }, - { - "epoch": 0.56, - "learning_rate": 1.873408457287519e-06, - "loss": 0.8154, - "step": 21894 - }, - { - "epoch": 0.56, - "learning_rate": 1.8733949817640803e-06, - "loss": 0.9248, - "step": 21895 - }, - { - "epoch": 0.56, - "learning_rate": 1.873381505571923e-06, - "loss": 0.9863, - "step": 21896 - }, - { - "epoch": 0.56, - "learning_rate": 1.873368028711058e-06, - "loss": 0.8252, - "step": 21897 - }, - { - "epoch": 0.56, - "learning_rate": 1.8733545511814951e-06, - "loss": 0.9941, - "step": 21898 - }, - { - "epoch": 0.56, - "learning_rate": 1.873341072983245e-06, - "loss": 0.7036, - "step": 21899 - }, - { - "epoch": 0.56, - "learning_rate": 1.8733275941163176e-06, - "loss": 0.6963, - "step": 21900 - }, - { - "epoch": 0.56, - "learning_rate": 1.8733141145807231e-06, - "loss": 0.7026, - "step": 21901 - }, - { - "epoch": 0.56, - "learning_rate": 1.8733006343764726e-06, - "loss": 0.6218, - "step": 21902 - }, - { - "epoch": 0.56, - "learning_rate": 1.873287153503576e-06, - "loss": 0.6689, - "step": 21903 - }, - { - "epoch": 0.56, - "learning_rate": 1.8732736719620433e-06, - "loss": 0.8091, - "step": 21904 - }, - { - "epoch": 0.56, - "learning_rate": 1.873260189751885e-06, - "loss": 0.5986, - "step": 21905 - }, - { - "epoch": 0.56, - "learning_rate": 1.873246706873112e-06, - "loss": 0.9902, - "step": 21906 - }, - { - "epoch": 0.56, - "learning_rate": 1.8732332233257338e-06, - "loss": 0.7305, - "step": 21907 - }, - { - "epoch": 0.56, - "learning_rate": 1.8732197391097611e-06, - "loss": 0.8721, - "step": 21908 - }, - { - "epoch": 0.56, - "learning_rate": 1.873206254225204e-06, - "loss": 0.8857, - "step": 21909 - }, - { - "epoch": 0.56, - "learning_rate": 1.8731927686720734e-06, - "loss": 0.7979, - "step": 21910 - }, - { - "epoch": 0.56, - "learning_rate": 1.873179282450379e-06, - "loss": 0.8916, - "step": 21911 - }, - { - "epoch": 0.56, - "learning_rate": 1.8731657955601315e-06, - "loss": 0.9048, - "step": 21912 - }, - { - "epoch": 0.56, - "learning_rate": 1.873152308001341e-06, - "loss": 0.7129, - "step": 21913 - }, - { - "epoch": 0.56, - "learning_rate": 1.873138819774018e-06, - "loss": 0.6841, - "step": 21914 - }, - { - "epoch": 0.56, - "learning_rate": 1.8731253308781727e-06, - "loss": 0.7896, - "step": 21915 - }, - { - "epoch": 0.56, - "learning_rate": 1.8731118413138155e-06, - "loss": 0.9531, - "step": 21916 - }, - { - "epoch": 0.56, - "learning_rate": 1.8730983510809568e-06, - "loss": 1.1533, - "step": 21917 - }, - { - "epoch": 0.56, - "learning_rate": 1.873084860179607e-06, - "loss": 0.9199, - "step": 21918 - }, - { - "epoch": 0.56, - "learning_rate": 1.8730713686097759e-06, - "loss": 0.8164, - "step": 21919 - }, - { - "epoch": 0.56, - "learning_rate": 1.8730578763714743e-06, - "loss": 0.8213, - "step": 21920 - }, - { - "epoch": 0.56, - "learning_rate": 1.8730443834647124e-06, - "loss": 0.9521, - "step": 21921 - }, - { - "epoch": 0.56, - "learning_rate": 1.8730308898895007e-06, - "loss": 0.8301, - "step": 21922 - }, - { - "epoch": 0.56, - "learning_rate": 1.8730173956458493e-06, - "loss": 0.9717, - "step": 21923 - }, - { - "epoch": 0.56, - "learning_rate": 1.8730039007337688e-06, - "loss": 0.8389, - "step": 21924 - }, - { - "epoch": 0.56, - "learning_rate": 1.8729904051532693e-06, - "loss": 0.8447, - "step": 21925 - }, - { - "epoch": 0.56, - "learning_rate": 1.872976908904361e-06, - "loss": 0.918, - "step": 21926 - }, - { - "epoch": 0.56, - "learning_rate": 1.8729634119870545e-06, - "loss": 0.8062, - "step": 21927 - }, - { - "epoch": 0.56, - "learning_rate": 1.8729499144013601e-06, - "loss": 0.9365, - "step": 21928 - }, - { - "epoch": 0.56, - "learning_rate": 1.8729364161472879e-06, - "loss": 0.8613, - "step": 21929 - }, - { - "epoch": 0.56, - "learning_rate": 1.8729229172248486e-06, - "loss": 0.9189, - "step": 21930 - }, - { - "epoch": 0.56, - "learning_rate": 1.8729094176340523e-06, - "loss": 0.8682, - "step": 21931 - }, - { - "epoch": 0.56, - "learning_rate": 1.8728959173749095e-06, - "loss": 0.8867, - "step": 21932 - }, - { - "epoch": 0.56, - "learning_rate": 1.8728824164474304e-06, - "loss": 0.7217, - "step": 21933 - }, - { - "epoch": 0.56, - "learning_rate": 1.8728689148516256e-06, - "loss": 0.7026, - "step": 21934 - }, - { - "epoch": 0.56, - "learning_rate": 1.8728554125875047e-06, - "loss": 0.7588, - "step": 21935 - }, - { - "epoch": 0.56, - "learning_rate": 1.8728419096550787e-06, - "loss": 0.8149, - "step": 21936 - }, - { - "epoch": 0.56, - "learning_rate": 1.8728284060543577e-06, - "loss": 1.0078, - "step": 21937 - }, - { - "epoch": 0.56, - "learning_rate": 1.8728149017853525e-06, - "loss": 0.7783, - "step": 21938 - }, - { - "epoch": 0.56, - "learning_rate": 1.872801396848073e-06, - "loss": 0.7637, - "step": 21939 - }, - { - "epoch": 0.56, - "learning_rate": 1.8727878912425291e-06, - "loss": 1.0117, - "step": 21940 - }, - { - "epoch": 0.56, - "learning_rate": 1.8727743849687322e-06, - "loss": 1.0352, - "step": 21941 - }, - { - "epoch": 0.56, - "learning_rate": 1.872760878026692e-06, - "loss": 0.5376, - "step": 21942 - }, - { - "epoch": 0.56, - "learning_rate": 1.8727473704164187e-06, - "loss": 0.9297, - "step": 21943 - }, - { - "epoch": 0.56, - "learning_rate": 1.872733862137923e-06, - "loss": 0.959, - "step": 21944 - }, - { - "epoch": 0.56, - "learning_rate": 1.872720353191215e-06, - "loss": 0.8818, - "step": 21945 - }, - { - "epoch": 0.56, - "learning_rate": 1.8727068435763056e-06, - "loss": 1.0898, - "step": 21946 - }, - { - "epoch": 0.56, - "learning_rate": 1.8726933332932042e-06, - "loss": 0.9082, - "step": 21947 - }, - { - "epoch": 0.56, - "learning_rate": 1.8726798223419217e-06, - "loss": 0.9922, - "step": 21948 - }, - { - "epoch": 0.56, - "learning_rate": 1.8726663107224688e-06, - "loss": 0.7046, - "step": 21949 - }, - { - "epoch": 0.56, - "learning_rate": 1.872652798434855e-06, - "loss": 0.8535, - "step": 21950 - }, - { - "epoch": 0.56, - "learning_rate": 1.8726392854790911e-06, - "loss": 0.9531, - "step": 21951 - }, - { - "epoch": 0.56, - "learning_rate": 1.8726257718551874e-06, - "loss": 0.686, - "step": 21952 - }, - { - "epoch": 0.56, - "learning_rate": 1.8726122575631545e-06, - "loss": 0.8086, - "step": 21953 - }, - { - "epoch": 0.56, - "learning_rate": 1.8725987426030023e-06, - "loss": 0.9136, - "step": 21954 - }, - { - "epoch": 0.56, - "learning_rate": 1.8725852269747414e-06, - "loss": 0.7715, - "step": 21955 - }, - { - "epoch": 0.56, - "learning_rate": 1.8725717106783823e-06, - "loss": 0.8711, - "step": 21956 - }, - { - "epoch": 0.56, - "learning_rate": 1.872558193713935e-06, - "loss": 0.8623, - "step": 21957 - }, - { - "epoch": 0.56, - "learning_rate": 1.8725446760814102e-06, - "loss": 1.0107, - "step": 21958 - }, - { - "epoch": 0.56, - "learning_rate": 1.8725311577808177e-06, - "loss": 0.7178, - "step": 21959 - }, - { - "epoch": 0.56, - "learning_rate": 1.8725176388121685e-06, - "loss": 0.9463, - "step": 21960 - }, - { - "epoch": 0.56, - "learning_rate": 1.8725041191754727e-06, - "loss": 0.7515, - "step": 21961 - }, - { - "epoch": 0.56, - "learning_rate": 1.8724905988707404e-06, - "loss": 0.9155, - "step": 21962 - }, - { - "epoch": 0.56, - "learning_rate": 1.8724770778979824e-06, - "loss": 0.9316, - "step": 21963 - }, - { - "epoch": 0.56, - "learning_rate": 1.8724635562572086e-06, - "loss": 1.0107, - "step": 21964 - }, - { - "epoch": 0.56, - "learning_rate": 1.8724500339484298e-06, - "loss": 0.8066, - "step": 21965 - }, - { - "epoch": 0.56, - "learning_rate": 1.872436510971656e-06, - "loss": 0.7227, - "step": 21966 - }, - { - "epoch": 0.56, - "learning_rate": 1.8724229873268977e-06, - "loss": 0.8105, - "step": 21967 - }, - { - "epoch": 0.56, - "learning_rate": 1.8724094630141651e-06, - "loss": 0.8438, - "step": 21968 - }, - { - "epoch": 0.56, - "learning_rate": 1.8723959380334688e-06, - "loss": 0.9834, - "step": 21969 - }, - { - "epoch": 0.56, - "learning_rate": 1.8723824123848191e-06, - "loss": 0.8174, - "step": 21970 - }, - { - "epoch": 0.56, - "learning_rate": 1.872368886068226e-06, - "loss": 0.6421, - "step": 21971 - }, - { - "epoch": 0.56, - "learning_rate": 1.8723553590837006e-06, - "loss": 0.8633, - "step": 21972 - }, - { - "epoch": 0.56, - "learning_rate": 1.8723418314312527e-06, - "loss": 0.9385, - "step": 21973 - }, - { - "epoch": 0.56, - "learning_rate": 1.8723283031108928e-06, - "loss": 1.0205, - "step": 21974 - }, - { - "epoch": 0.56, - "learning_rate": 1.8723147741226308e-06, - "loss": 0.7114, - "step": 21975 - }, - { - "epoch": 0.56, - "learning_rate": 1.872301244466478e-06, - "loss": 0.9854, - "step": 21976 - }, - { - "epoch": 0.56, - "learning_rate": 1.8722877141424438e-06, - "loss": 0.9746, - "step": 21977 - }, - { - "epoch": 0.56, - "learning_rate": 1.8722741831505395e-06, - "loss": 0.8306, - "step": 21978 - }, - { - "epoch": 0.56, - "learning_rate": 1.8722606514907746e-06, - "loss": 0.7222, - "step": 21979 - }, - { - "epoch": 0.56, - "learning_rate": 1.87224711916316e-06, - "loss": 0.8906, - "step": 21980 - }, - { - "epoch": 0.56, - "learning_rate": 1.8722335861677059e-06, - "loss": 0.7104, - "step": 21981 - }, - { - "epoch": 0.56, - "learning_rate": 1.8722200525044225e-06, - "loss": 0.7979, - "step": 21982 - }, - { - "epoch": 0.56, - "learning_rate": 1.8722065181733205e-06, - "loss": 0.8916, - "step": 21983 - }, - { - "epoch": 0.56, - "learning_rate": 1.87219298317441e-06, - "loss": 0.8643, - "step": 21984 - }, - { - "epoch": 0.56, - "learning_rate": 1.872179447507701e-06, - "loss": 0.8916, - "step": 21985 - }, - { - "epoch": 0.56, - "learning_rate": 1.8721659111732048e-06, - "loss": 0.8066, - "step": 21986 - }, - { - "epoch": 0.56, - "learning_rate": 1.8721523741709313e-06, - "loss": 0.8643, - "step": 21987 - }, - { - "epoch": 0.56, - "learning_rate": 1.8721388365008907e-06, - "loss": 0.8623, - "step": 21988 - }, - { - "epoch": 0.56, - "learning_rate": 1.8721252981630936e-06, - "loss": 0.8916, - "step": 21989 - }, - { - "epoch": 0.56, - "learning_rate": 1.8721117591575499e-06, - "loss": 0.9102, - "step": 21990 - }, - { - "epoch": 0.56, - "learning_rate": 1.8720982194842708e-06, - "loss": 1.0254, - "step": 21991 - }, - { - "epoch": 0.56, - "learning_rate": 1.8720846791432661e-06, - "loss": 0.6924, - "step": 21992 - }, - { - "epoch": 0.56, - "learning_rate": 1.872071138134546e-06, - "loss": 0.9307, - "step": 21993 - }, - { - "epoch": 0.56, - "learning_rate": 1.8720575964581213e-06, - "loss": 0.7432, - "step": 21994 - }, - { - "epoch": 0.56, - "learning_rate": 1.872044054114002e-06, - "loss": 0.8452, - "step": 21995 - }, - { - "epoch": 0.56, - "learning_rate": 1.8720305111021988e-06, - "loss": 0.9365, - "step": 21996 - }, - { - "epoch": 0.56, - "learning_rate": 1.8720169674227222e-06, - "loss": 0.6768, - "step": 21997 - }, - { - "epoch": 0.56, - "learning_rate": 1.8720034230755819e-06, - "loss": 0.9512, - "step": 21998 - }, - { - "epoch": 0.56, - "learning_rate": 1.8719898780607888e-06, - "loss": 0.7295, - "step": 21999 - }, - { - "epoch": 0.56, - "learning_rate": 1.8719763323783533e-06, - "loss": 0.918, - "step": 22000 - }, - { - "epoch": 0.56, - "learning_rate": 1.8719627860282853e-06, - "loss": 0.7349, - "step": 22001 - }, - { - "epoch": 0.56, - "learning_rate": 1.8719492390105958e-06, - "loss": 0.7168, - "step": 22002 - }, - { - "epoch": 0.56, - "learning_rate": 1.8719356913252947e-06, - "loss": 0.8135, - "step": 22003 - }, - { - "epoch": 0.56, - "learning_rate": 1.8719221429723926e-06, - "loss": 1.0957, - "step": 22004 - }, - { - "epoch": 0.56, - "learning_rate": 1.8719085939518998e-06, - "loss": 0.8223, - "step": 22005 - }, - { - "epoch": 0.56, - "learning_rate": 1.8718950442638267e-06, - "loss": 0.8721, - "step": 22006 - }, - { - "epoch": 0.56, - "learning_rate": 1.8718814939081838e-06, - "loss": 0.7334, - "step": 22007 - }, - { - "epoch": 0.56, - "learning_rate": 1.871867942884981e-06, - "loss": 1.1416, - "step": 22008 - }, - { - "epoch": 0.56, - "learning_rate": 1.8718543911942292e-06, - "loss": 0.9043, - "step": 22009 - }, - { - "epoch": 0.56, - "learning_rate": 1.8718408388359386e-06, - "loss": 0.8086, - "step": 22010 - }, - { - "epoch": 0.56, - "learning_rate": 1.8718272858101197e-06, - "loss": 0.916, - "step": 22011 - }, - { - "epoch": 0.56, - "learning_rate": 1.8718137321167822e-06, - "loss": 0.7222, - "step": 22012 - }, - { - "epoch": 0.56, - "learning_rate": 1.8718001777559374e-06, - "loss": 0.9092, - "step": 22013 - }, - { - "epoch": 0.56, - "learning_rate": 1.8717866227275954e-06, - "loss": 1.001, - "step": 22014 - }, - { - "epoch": 0.56, - "learning_rate": 1.8717730670317661e-06, - "loss": 0.8887, - "step": 22015 - }, - { - "epoch": 0.56, - "learning_rate": 1.8717595106684607e-06, - "loss": 0.9512, - "step": 22016 - }, - { - "epoch": 0.56, - "learning_rate": 1.8717459536376887e-06, - "loss": 0.8945, - "step": 22017 - }, - { - "epoch": 0.56, - "learning_rate": 1.871732395939461e-06, - "loss": 0.9131, - "step": 22018 - }, - { - "epoch": 0.56, - "learning_rate": 1.871718837573788e-06, - "loss": 0.9004, - "step": 22019 - }, - { - "epoch": 0.56, - "learning_rate": 1.87170527854068e-06, - "loss": 0.9697, - "step": 22020 - }, - { - "epoch": 0.56, - "learning_rate": 1.8716917188401472e-06, - "loss": 0.7529, - "step": 22021 - }, - { - "epoch": 0.56, - "learning_rate": 1.8716781584722003e-06, - "loss": 0.8564, - "step": 22022 - }, - { - "epoch": 0.56, - "learning_rate": 1.8716645974368496e-06, - "loss": 1.0176, - "step": 22023 - }, - { - "epoch": 0.56, - "learning_rate": 1.8716510357341054e-06, - "loss": 0.9297, - "step": 22024 - }, - { - "epoch": 0.56, - "learning_rate": 1.8716374733639778e-06, - "loss": 0.9336, - "step": 22025 - }, - { - "epoch": 0.56, - "learning_rate": 1.8716239103264775e-06, - "loss": 0.8994, - "step": 22026 - }, - { - "epoch": 0.56, - "learning_rate": 1.8716103466216149e-06, - "loss": 0.8623, - "step": 22027 - }, - { - "epoch": 0.56, - "learning_rate": 1.8715967822494006e-06, - "loss": 0.9473, - "step": 22028 - }, - { - "epoch": 0.56, - "learning_rate": 1.8715832172098444e-06, - "loss": 0.812, - "step": 22029 - }, - { - "epoch": 0.56, - "learning_rate": 1.8715696515029569e-06, - "loss": 1.1758, - "step": 22030 - }, - { - "epoch": 0.56, - "learning_rate": 1.8715560851287488e-06, - "loss": 0.8369, - "step": 22031 - }, - { - "epoch": 0.56, - "learning_rate": 1.8715425180872305e-06, - "loss": 0.8486, - "step": 22032 - }, - { - "epoch": 0.56, - "learning_rate": 1.871528950378412e-06, - "loss": 0.9531, - "step": 22033 - }, - { - "epoch": 0.56, - "learning_rate": 1.8715153820023038e-06, - "loss": 0.7598, - "step": 22034 - }, - { - "epoch": 0.56, - "learning_rate": 1.8715018129589163e-06, - "loss": 0.9414, - "step": 22035 - }, - { - "epoch": 0.56, - "learning_rate": 1.8714882432482599e-06, - "loss": 1.0293, - "step": 22036 - }, - { - "epoch": 0.56, - "learning_rate": 1.8714746728703452e-06, - "loss": 0.5029, - "step": 22037 - }, - { - "epoch": 0.56, - "learning_rate": 1.8714611018251823e-06, - "loss": 0.8906, - "step": 22038 - }, - { - "epoch": 0.56, - "learning_rate": 1.8714475301127816e-06, - "loss": 1.002, - "step": 22039 - }, - { - "epoch": 0.56, - "learning_rate": 1.8714339577331536e-06, - "loss": 1.0703, - "step": 22040 - }, - { - "epoch": 0.56, - "learning_rate": 1.8714203846863091e-06, - "loss": 0.4277, - "step": 22041 - }, - { - "epoch": 0.56, - "learning_rate": 1.8714068109722576e-06, - "loss": 0.7593, - "step": 22042 - }, - { - "epoch": 0.56, - "learning_rate": 1.8713932365910103e-06, - "loss": 1.1074, - "step": 22043 - }, - { - "epoch": 0.56, - "learning_rate": 1.8713796615425771e-06, - "loss": 1.0469, - "step": 22044 - }, - { - "epoch": 0.57, - "learning_rate": 1.8713660858269687e-06, - "loss": 0.9258, - "step": 22045 - }, - { - "epoch": 0.57, - "learning_rate": 1.871352509444195e-06, - "loss": 1.0449, - "step": 22046 - }, - { - "epoch": 0.57, - "learning_rate": 1.8713389323942671e-06, - "loss": 0.832, - "step": 22047 - }, - { - "epoch": 0.57, - "learning_rate": 1.871325354677195e-06, - "loss": 0.7603, - "step": 22048 - }, - { - "epoch": 0.57, - "learning_rate": 1.871311776292989e-06, - "loss": 0.8867, - "step": 22049 - }, - { - "epoch": 0.57, - "learning_rate": 1.8712981972416597e-06, - "loss": 0.801, - "step": 22050 - }, - { - "epoch": 0.57, - "learning_rate": 1.8712846175232175e-06, - "loss": 0.6467, - "step": 22051 - }, - { - "epoch": 0.57, - "learning_rate": 1.8712710371376728e-06, - "loss": 0.9678, - "step": 22052 - }, - { - "epoch": 0.57, - "learning_rate": 1.8712574560850358e-06, - "loss": 0.8604, - "step": 22053 - }, - { - "epoch": 0.57, - "learning_rate": 1.8712438743653171e-06, - "loss": 0.8887, - "step": 22054 - }, - { - "epoch": 0.57, - "learning_rate": 1.8712302919785268e-06, - "loss": 1.0322, - "step": 22055 - }, - { - "epoch": 0.57, - "learning_rate": 1.8712167089246758e-06, - "loss": 0.7305, - "step": 22056 - }, - { - "epoch": 0.57, - "learning_rate": 1.871203125203774e-06, - "loss": 0.9746, - "step": 22057 - }, - { - "epoch": 0.57, - "learning_rate": 1.8711895408158322e-06, - "loss": 0.9097, - "step": 22058 - }, - { - "epoch": 0.57, - "learning_rate": 1.8711759557608606e-06, - "loss": 0.8862, - "step": 22059 - }, - { - "epoch": 0.57, - "learning_rate": 1.8711623700388698e-06, - "loss": 0.9014, - "step": 22060 - }, - { - "epoch": 0.57, - "learning_rate": 1.8711487836498695e-06, - "loss": 0.8369, - "step": 22061 - }, - { - "epoch": 0.57, - "learning_rate": 1.871135196593871e-06, - "loss": 0.9951, - "step": 22062 - }, - { - "epoch": 0.57, - "learning_rate": 1.8711216088708843e-06, - "loss": 0.687, - "step": 22063 - }, - { - "epoch": 0.57, - "learning_rate": 1.87110802048092e-06, - "loss": 1.1035, - "step": 22064 - }, - { - "epoch": 0.57, - "learning_rate": 1.8710944314239883e-06, - "loss": 0.9561, - "step": 22065 - }, - { - "epoch": 0.57, - "learning_rate": 1.8710808417000994e-06, - "loss": 0.6362, - "step": 22066 - }, - { - "epoch": 0.57, - "learning_rate": 1.871067251309264e-06, - "loss": 1.0127, - "step": 22067 - }, - { - "epoch": 0.57, - "learning_rate": 1.8710536602514926e-06, - "loss": 0.7266, - "step": 22068 - }, - { - "epoch": 0.57, - "learning_rate": 1.8710400685267955e-06, - "loss": 0.9541, - "step": 22069 - }, - { - "epoch": 0.57, - "learning_rate": 1.871026476135183e-06, - "loss": 0.7617, - "step": 22070 - }, - { - "epoch": 0.57, - "learning_rate": 1.8710128830766654e-06, - "loss": 0.876, - "step": 22071 - }, - { - "epoch": 0.57, - "learning_rate": 1.8709992893512534e-06, - "loss": 0.8779, - "step": 22072 - }, - { - "epoch": 0.57, - "learning_rate": 1.8709856949589575e-06, - "loss": 1.0625, - "step": 22073 - }, - { - "epoch": 0.57, - "learning_rate": 1.8709720998997875e-06, - "loss": 0.9219, - "step": 22074 - }, - { - "epoch": 0.57, - "learning_rate": 1.8709585041737546e-06, - "loss": 0.8672, - "step": 22075 - }, - { - "epoch": 0.57, - "learning_rate": 1.8709449077808688e-06, - "loss": 0.7842, - "step": 22076 - }, - { - "epoch": 0.57, - "learning_rate": 1.8709313107211404e-06, - "loss": 0.9648, - "step": 22077 - }, - { - "epoch": 0.57, - "learning_rate": 1.8709177129945798e-06, - "loss": 0.8457, - "step": 22078 - }, - { - "epoch": 0.57, - "learning_rate": 1.8709041146011978e-06, - "loss": 0.8174, - "step": 22079 - }, - { - "epoch": 0.57, - "learning_rate": 1.8708905155410041e-06, - "loss": 0.7178, - "step": 22080 - }, - { - "epoch": 0.57, - "learning_rate": 1.8708769158140103e-06, - "loss": 0.7578, - "step": 22081 - }, - { - "epoch": 0.57, - "learning_rate": 1.8708633154202255e-06, - "loss": 0.8271, - "step": 22082 - }, - { - "epoch": 0.57, - "learning_rate": 1.870849714359661e-06, - "loss": 0.958, - "step": 22083 - }, - { - "epoch": 0.57, - "learning_rate": 1.870836112632327e-06, - "loss": 0.7837, - "step": 22084 - }, - { - "epoch": 0.57, - "learning_rate": 1.8708225102382336e-06, - "loss": 0.8662, - "step": 22085 - }, - { - "epoch": 0.57, - "learning_rate": 1.8708089071773915e-06, - "loss": 0.7705, - "step": 22086 - }, - { - "epoch": 0.57, - "learning_rate": 1.870795303449811e-06, - "loss": 0.9795, - "step": 22087 - }, - { - "epoch": 0.57, - "learning_rate": 1.8707816990555028e-06, - "loss": 0.7676, - "step": 22088 - }, - { - "epoch": 0.57, - "learning_rate": 1.870768093994477e-06, - "loss": 0.8203, - "step": 22089 - }, - { - "epoch": 0.57, - "learning_rate": 1.870754488266744e-06, - "loss": 0.7705, - "step": 22090 - }, - { - "epoch": 0.57, - "learning_rate": 1.8707408818723142e-06, - "loss": 0.5649, - "step": 22091 - }, - { - "epoch": 0.57, - "learning_rate": 1.8707272748111984e-06, - "loss": 0.8105, - "step": 22092 - }, - { - "epoch": 0.57, - "learning_rate": 1.8707136670834068e-06, - "loss": 0.6445, - "step": 22093 - }, - { - "epoch": 0.57, - "learning_rate": 1.8707000586889496e-06, - "loss": 0.9785, - "step": 22094 - }, - { - "epoch": 0.57, - "learning_rate": 1.8706864496278376e-06, - "loss": 0.9648, - "step": 22095 - }, - { - "epoch": 0.57, - "learning_rate": 1.870672839900081e-06, - "loss": 0.4937, - "step": 22096 - }, - { - "epoch": 0.57, - "learning_rate": 1.8706592295056898e-06, - "loss": 0.9648, - "step": 22097 - }, - { - "epoch": 0.57, - "learning_rate": 1.8706456184446756e-06, - "loss": 0.8506, - "step": 22098 - }, - { - "epoch": 0.57, - "learning_rate": 1.8706320067170473e-06, - "loss": 0.792, - "step": 22099 - }, - { - "epoch": 0.57, - "learning_rate": 1.8706183943228167e-06, - "loss": 1.0508, - "step": 22100 - }, - { - "epoch": 0.57, - "learning_rate": 1.8706047812619934e-06, - "loss": 0.7983, - "step": 22101 - }, - { - "epoch": 0.57, - "learning_rate": 1.870591167534588e-06, - "loss": 0.8364, - "step": 22102 - }, - { - "epoch": 0.57, - "learning_rate": 1.870577553140611e-06, - "loss": 0.9121, - "step": 22103 - }, - { - "epoch": 0.57, - "learning_rate": 1.8705639380800728e-06, - "loss": 0.8633, - "step": 22104 - }, - { - "epoch": 0.57, - "learning_rate": 1.870550322352984e-06, - "loss": 0.9531, - "step": 22105 - }, - { - "epoch": 0.57, - "learning_rate": 1.8705367059593546e-06, - "loss": 1.1504, - "step": 22106 - }, - { - "epoch": 0.57, - "learning_rate": 1.8705230888991954e-06, - "loss": 0.8506, - "step": 22107 - }, - { - "epoch": 0.57, - "learning_rate": 1.8705094711725168e-06, - "loss": 0.9951, - "step": 22108 - }, - { - "epoch": 0.57, - "learning_rate": 1.8704958527793289e-06, - "loss": 0.8975, - "step": 22109 - }, - { - "epoch": 0.57, - "learning_rate": 1.8704822337196427e-06, - "loss": 0.6763, - "step": 22110 - }, - { - "epoch": 0.57, - "learning_rate": 1.8704686139934677e-06, - "loss": 0.6992, - "step": 22111 - }, - { - "epoch": 0.57, - "learning_rate": 1.8704549936008153e-06, - "loss": 0.8613, - "step": 22112 - }, - { - "epoch": 0.57, - "learning_rate": 1.8704413725416956e-06, - "loss": 0.834, - "step": 22113 - }, - { - "epoch": 0.57, - "learning_rate": 1.8704277508161188e-06, - "loss": 1.0703, - "step": 22114 - }, - { - "epoch": 0.57, - "learning_rate": 1.8704141284240955e-06, - "loss": 1.3975, - "step": 22115 - }, - { - "epoch": 0.57, - "learning_rate": 1.8704005053656361e-06, - "loss": 0.9287, - "step": 22116 - }, - { - "epoch": 0.57, - "learning_rate": 1.8703868816407513e-06, - "loss": 0.9141, - "step": 22117 - }, - { - "epoch": 0.57, - "learning_rate": 1.870373257249451e-06, - "loss": 0.8389, - "step": 22118 - }, - { - "epoch": 0.57, - "learning_rate": 1.870359632191746e-06, - "loss": 0.6875, - "step": 22119 - }, - { - "epoch": 0.57, - "learning_rate": 1.8703460064676468e-06, - "loss": 0.7388, - "step": 22120 - }, - { - "epoch": 0.57, - "learning_rate": 1.8703323800771633e-06, - "loss": 0.8848, - "step": 22121 - }, - { - "epoch": 0.57, - "learning_rate": 1.8703187530203066e-06, - "loss": 0.8086, - "step": 22122 - }, - { - "epoch": 0.57, - "learning_rate": 1.870305125297087e-06, - "loss": 0.916, - "step": 22123 - }, - { - "epoch": 0.57, - "learning_rate": 1.8702914969075145e-06, - "loss": 0.748, - "step": 22124 - }, - { - "epoch": 0.57, - "learning_rate": 1.8702778678516e-06, - "loss": 1.0303, - "step": 22125 - }, - { - "epoch": 0.57, - "learning_rate": 1.8702642381293536e-06, - "loss": 1.0557, - "step": 22126 - }, - { - "epoch": 0.57, - "learning_rate": 1.870250607740786e-06, - "loss": 0.7402, - "step": 22127 - }, - { - "epoch": 0.57, - "learning_rate": 1.8702369766859074e-06, - "loss": 0.8062, - "step": 22128 - }, - { - "epoch": 0.57, - "learning_rate": 1.8702233449647285e-06, - "loss": 0.8394, - "step": 22129 - }, - { - "epoch": 0.57, - "learning_rate": 1.8702097125772595e-06, - "loss": 0.6333, - "step": 22130 - }, - { - "epoch": 0.57, - "learning_rate": 1.8701960795235112e-06, - "loss": 0.8267, - "step": 22131 - }, - { - "epoch": 0.57, - "learning_rate": 1.8701824458034934e-06, - "loss": 0.8218, - "step": 22132 - }, - { - "epoch": 0.57, - "learning_rate": 1.870168811417217e-06, - "loss": 0.7402, - "step": 22133 - }, - { - "epoch": 0.57, - "learning_rate": 1.8701551763646925e-06, - "loss": 0.8721, - "step": 22134 - }, - { - "epoch": 0.57, - "learning_rate": 1.87014154064593e-06, - "loss": 0.8164, - "step": 22135 - }, - { - "epoch": 0.57, - "learning_rate": 1.8701279042609405e-06, - "loss": 0.8301, - "step": 22136 - }, - { - "epoch": 0.57, - "learning_rate": 1.8701142672097337e-06, - "loss": 0.9375, - "step": 22137 - }, - { - "epoch": 0.57, - "learning_rate": 1.8701006294923205e-06, - "loss": 0.7888, - "step": 22138 - }, - { - "epoch": 0.57, - "learning_rate": 1.8700869911087114e-06, - "loss": 0.4663, - "step": 22139 - }, - { - "epoch": 0.57, - "learning_rate": 1.8700733520589164e-06, - "loss": 0.8584, - "step": 22140 - }, - { - "epoch": 0.57, - "learning_rate": 1.8700597123429468e-06, - "loss": 0.957, - "step": 22141 - }, - { - "epoch": 0.57, - "learning_rate": 1.8700460719608117e-06, - "loss": 0.9258, - "step": 22142 - }, - { - "epoch": 0.57, - "learning_rate": 1.870032430912523e-06, - "loss": 0.8955, - "step": 22143 - }, - { - "epoch": 0.57, - "learning_rate": 1.8700187891980903e-06, - "loss": 0.9062, - "step": 22144 - }, - { - "epoch": 0.57, - "learning_rate": 1.870005146817524e-06, - "loss": 0.7949, - "step": 22145 - }, - { - "epoch": 0.57, - "learning_rate": 1.869991503770835e-06, - "loss": 0.9121, - "step": 22146 - }, - { - "epoch": 0.57, - "learning_rate": 1.8699778600580332e-06, - "loss": 0.8223, - "step": 22147 - }, - { - "epoch": 0.57, - "learning_rate": 1.8699642156791296e-06, - "loss": 0.9756, - "step": 22148 - }, - { - "epoch": 0.57, - "learning_rate": 1.8699505706341343e-06, - "loss": 1.1455, - "step": 22149 - }, - { - "epoch": 0.57, - "learning_rate": 1.8699369249230582e-06, - "loss": 0.8823, - "step": 22150 - }, - { - "epoch": 0.57, - "learning_rate": 1.8699232785459109e-06, - "loss": 0.8525, - "step": 22151 - }, - { - "epoch": 0.57, - "learning_rate": 1.8699096315027037e-06, - "loss": 0.916, - "step": 22152 - }, - { - "epoch": 0.57, - "learning_rate": 1.8698959837934465e-06, - "loss": 1.084, - "step": 22153 - }, - { - "epoch": 0.57, - "learning_rate": 1.8698823354181502e-06, - "loss": 0.877, - "step": 22154 - }, - { - "epoch": 0.57, - "learning_rate": 1.8698686863768244e-06, - "loss": 0.8721, - "step": 22155 - }, - { - "epoch": 0.57, - "learning_rate": 1.8698550366694805e-06, - "loss": 0.7842, - "step": 22156 - }, - { - "epoch": 0.57, - "learning_rate": 1.869841386296129e-06, - "loss": 0.709, - "step": 22157 - }, - { - "epoch": 0.57, - "learning_rate": 1.8698277352567793e-06, - "loss": 1.0615, - "step": 22158 - }, - { - "epoch": 0.57, - "learning_rate": 1.8698140835514428e-06, - "loss": 0.7578, - "step": 22159 - }, - { - "epoch": 0.57, - "learning_rate": 1.8698004311801297e-06, - "loss": 0.9551, - "step": 22160 - }, - { - "epoch": 0.57, - "learning_rate": 1.8697867781428504e-06, - "loss": 0.6816, - "step": 22161 - }, - { - "epoch": 0.57, - "learning_rate": 1.8697731244396154e-06, - "loss": 0.9521, - "step": 22162 - }, - { - "epoch": 0.57, - "learning_rate": 1.8697594700704346e-06, - "loss": 0.9863, - "step": 22163 - }, - { - "epoch": 0.57, - "learning_rate": 1.8697458150353195e-06, - "loss": 0.8574, - "step": 22164 - }, - { - "epoch": 0.57, - "learning_rate": 1.8697321593342798e-06, - "loss": 0.9854, - "step": 22165 - }, - { - "epoch": 0.57, - "learning_rate": 1.8697185029673265e-06, - "loss": 0.8252, - "step": 22166 - }, - { - "epoch": 0.57, - "learning_rate": 1.8697048459344696e-06, - "loss": 1.0146, - "step": 22167 - }, - { - "epoch": 0.57, - "learning_rate": 1.8696911882357194e-06, - "loss": 0.8525, - "step": 22168 - }, - { - "epoch": 0.57, - "learning_rate": 1.8696775298710868e-06, - "loss": 0.8652, - "step": 22169 - }, - { - "epoch": 0.57, - "learning_rate": 1.8696638708405822e-06, - "loss": 0.834, - "step": 22170 - }, - { - "epoch": 0.57, - "learning_rate": 1.8696502111442158e-06, - "loss": 1.0049, - "step": 22171 - }, - { - "epoch": 0.57, - "learning_rate": 1.8696365507819985e-06, - "loss": 0.9863, - "step": 22172 - }, - { - "epoch": 0.57, - "learning_rate": 1.8696228897539404e-06, - "loss": 0.7861, - "step": 22173 - }, - { - "epoch": 0.57, - "learning_rate": 1.8696092280600518e-06, - "loss": 1.082, - "step": 22174 - }, - { - "epoch": 0.57, - "learning_rate": 1.8695955657003435e-06, - "loss": 0.8867, - "step": 22175 - }, - { - "epoch": 0.57, - "learning_rate": 1.8695819026748261e-06, - "loss": 0.9004, - "step": 22176 - }, - { - "epoch": 0.57, - "learning_rate": 1.8695682389835095e-06, - "loss": 1.0156, - "step": 22177 - }, - { - "epoch": 0.57, - "learning_rate": 1.8695545746264046e-06, - "loss": 0.8447, - "step": 22178 - }, - { - "epoch": 0.57, - "learning_rate": 1.8695409096035215e-06, - "loss": 0.8188, - "step": 22179 - }, - { - "epoch": 0.57, - "learning_rate": 1.8695272439148715e-06, - "loss": 1.0205, - "step": 22180 - }, - { - "epoch": 0.57, - "learning_rate": 1.869513577560464e-06, - "loss": 0.8887, - "step": 22181 - }, - { - "epoch": 0.57, - "learning_rate": 1.86949991054031e-06, - "loss": 0.853, - "step": 22182 - }, - { - "epoch": 0.57, - "learning_rate": 1.86948624285442e-06, - "loss": 0.7422, - "step": 22183 - }, - { - "epoch": 0.57, - "learning_rate": 1.8694725745028044e-06, - "loss": 0.79, - "step": 22184 - }, - { - "epoch": 0.57, - "learning_rate": 1.8694589054854735e-06, - "loss": 0.605, - "step": 22185 - }, - { - "epoch": 0.57, - "learning_rate": 1.8694452358024379e-06, - "loss": 0.7756, - "step": 22186 - }, - { - "epoch": 0.57, - "learning_rate": 1.8694315654537082e-06, - "loss": 1.0908, - "step": 22187 - }, - { - "epoch": 0.57, - "learning_rate": 1.8694178944392947e-06, - "loss": 0.6997, - "step": 22188 - }, - { - "epoch": 0.57, - "learning_rate": 1.8694042227592078e-06, - "loss": 0.918, - "step": 22189 - }, - { - "epoch": 0.57, - "learning_rate": 1.869390550413458e-06, - "loss": 1.0176, - "step": 22190 - }, - { - "epoch": 0.57, - "learning_rate": 1.869376877402056e-06, - "loss": 1.0771, - "step": 22191 - }, - { - "epoch": 0.57, - "learning_rate": 1.869363203725012e-06, - "loss": 0.8291, - "step": 22192 - }, - { - "epoch": 0.57, - "learning_rate": 1.8693495293823367e-06, - "loss": 0.8535, - "step": 22193 - }, - { - "epoch": 0.57, - "learning_rate": 1.8693358543740403e-06, - "loss": 0.7896, - "step": 22194 - }, - { - "epoch": 0.57, - "learning_rate": 1.8693221787001333e-06, - "loss": 0.7046, - "step": 22195 - }, - { - "epoch": 0.57, - "learning_rate": 1.8693085023606266e-06, - "loss": 1.209, - "step": 22196 - }, - { - "epoch": 0.57, - "learning_rate": 1.86929482535553e-06, - "loss": 0.7656, - "step": 22197 - }, - { - "epoch": 0.57, - "learning_rate": 1.8692811476848547e-06, - "loss": 0.8467, - "step": 22198 - }, - { - "epoch": 0.57, - "learning_rate": 1.8692674693486105e-06, - "loss": 0.8594, - "step": 22199 - }, - { - "epoch": 0.57, - "learning_rate": 1.8692537903468085e-06, - "loss": 0.7354, - "step": 22200 - }, - { - "epoch": 0.57, - "learning_rate": 1.8692401106794583e-06, - "loss": 1.0645, - "step": 22201 - }, - { - "epoch": 0.57, - "learning_rate": 1.8692264303465716e-06, - "loss": 0.792, - "step": 22202 - }, - { - "epoch": 0.57, - "learning_rate": 1.8692127493481574e-06, - "loss": 0.957, - "step": 22203 - }, - { - "epoch": 0.57, - "learning_rate": 1.8691990676842274e-06, - "loss": 0.8291, - "step": 22204 - }, - { - "epoch": 0.57, - "learning_rate": 1.8691853853547919e-06, - "loss": 0.959, - "step": 22205 - }, - { - "epoch": 0.57, - "learning_rate": 1.8691717023598606e-06, - "loss": 0.8677, - "step": 22206 - }, - { - "epoch": 0.57, - "learning_rate": 1.8691580186994447e-06, - "loss": 0.707, - "step": 22207 - }, - { - "epoch": 0.57, - "learning_rate": 1.8691443343735546e-06, - "loss": 0.7495, - "step": 22208 - }, - { - "epoch": 0.57, - "learning_rate": 1.8691306493822005e-06, - "loss": 0.8384, - "step": 22209 - }, - { - "epoch": 0.57, - "learning_rate": 1.8691169637253931e-06, - "loss": 0.8369, - "step": 22210 - }, - { - "epoch": 0.57, - "learning_rate": 1.869103277403143e-06, - "loss": 0.7026, - "step": 22211 - }, - { - "epoch": 0.57, - "learning_rate": 1.8690895904154603e-06, - "loss": 1.0254, - "step": 22212 - }, - { - "epoch": 0.57, - "learning_rate": 1.8690759027623556e-06, - "loss": 1.0137, - "step": 22213 - }, - { - "epoch": 0.57, - "learning_rate": 1.8690622144438393e-06, - "loss": 0.9258, - "step": 22214 - }, - { - "epoch": 0.57, - "learning_rate": 1.8690485254599221e-06, - "loss": 0.8086, - "step": 22215 - }, - { - "epoch": 0.57, - "learning_rate": 1.8690348358106144e-06, - "loss": 1.002, - "step": 22216 - }, - { - "epoch": 0.57, - "learning_rate": 1.8690211454959267e-06, - "loss": 0.9805, - "step": 22217 - }, - { - "epoch": 0.57, - "learning_rate": 1.86900745451587e-06, - "loss": 0.9814, - "step": 22218 - }, - { - "epoch": 0.57, - "learning_rate": 1.8689937628704535e-06, - "loss": 0.707, - "step": 22219 - }, - { - "epoch": 0.57, - "learning_rate": 1.8689800705596888e-06, - "loss": 0.6347, - "step": 22220 - }, - { - "epoch": 0.57, - "learning_rate": 1.868966377583586e-06, - "loss": 0.8252, - "step": 22221 - }, - { - "epoch": 0.57, - "learning_rate": 1.8689526839421554e-06, - "loss": 0.7168, - "step": 22222 - }, - { - "epoch": 0.57, - "learning_rate": 1.868938989635408e-06, - "loss": 0.9141, - "step": 22223 - }, - { - "epoch": 0.57, - "learning_rate": 1.8689252946633537e-06, - "loss": 0.7876, - "step": 22224 - }, - { - "epoch": 0.57, - "learning_rate": 1.8689115990260035e-06, - "loss": 0.9502, - "step": 22225 - }, - { - "epoch": 0.57, - "learning_rate": 1.8688979027233676e-06, - "loss": 1.0801, - "step": 22226 - }, - { - "epoch": 0.57, - "learning_rate": 1.8688842057554562e-06, - "loss": 0.9053, - "step": 22227 - }, - { - "epoch": 0.57, - "learning_rate": 1.8688705081222804e-06, - "loss": 0.7822, - "step": 22228 - }, - { - "epoch": 0.57, - "learning_rate": 1.8688568098238504e-06, - "loss": 1.0898, - "step": 22229 - }, - { - "epoch": 0.57, - "learning_rate": 1.8688431108601765e-06, - "loss": 0.8838, - "step": 22230 - }, - { - "epoch": 0.57, - "learning_rate": 1.8688294112312697e-06, - "loss": 0.9697, - "step": 22231 - }, - { - "epoch": 0.57, - "learning_rate": 1.86881571093714e-06, - "loss": 0.9365, - "step": 22232 - }, - { - "epoch": 0.57, - "learning_rate": 1.868802009977798e-06, - "loss": 0.8447, - "step": 22233 - }, - { - "epoch": 0.57, - "learning_rate": 1.8687883083532544e-06, - "loss": 0.9004, - "step": 22234 - }, - { - "epoch": 0.57, - "learning_rate": 1.8687746060635194e-06, - "loss": 0.8379, - "step": 22235 - }, - { - "epoch": 0.57, - "learning_rate": 1.8687609031086038e-06, - "loss": 1.0518, - "step": 22236 - }, - { - "epoch": 0.57, - "learning_rate": 1.8687471994885176e-06, - "loss": 0.8467, - "step": 22237 - }, - { - "epoch": 0.57, - "learning_rate": 1.8687334952032719e-06, - "loss": 0.9463, - "step": 22238 - }, - { - "epoch": 0.57, - "learning_rate": 1.8687197902528768e-06, - "loss": 0.8007, - "step": 22239 - }, - { - "epoch": 0.57, - "learning_rate": 1.8687060846373428e-06, - "loss": 0.7715, - "step": 22240 - }, - { - "epoch": 0.57, - "learning_rate": 1.8686923783566808e-06, - "loss": 0.9619, - "step": 22241 - }, - { - "epoch": 0.57, - "learning_rate": 1.8686786714109006e-06, - "loss": 0.8252, - "step": 22242 - }, - { - "epoch": 0.57, - "learning_rate": 1.8686649638000134e-06, - "loss": 0.7122, - "step": 22243 - }, - { - "epoch": 0.57, - "learning_rate": 1.8686512555240293e-06, - "loss": 0.9326, - "step": 22244 - }, - { - "epoch": 0.57, - "learning_rate": 1.8686375465829588e-06, - "loss": 0.769, - "step": 22245 - }, - { - "epoch": 0.57, - "learning_rate": 1.8686238369768126e-06, - "loss": 0.8853, - "step": 22246 - }, - { - "epoch": 0.57, - "learning_rate": 1.868610126705601e-06, - "loss": 0.4326, - "step": 22247 - }, - { - "epoch": 0.57, - "learning_rate": 1.8685964157693346e-06, - "loss": 0.8311, - "step": 22248 - }, - { - "epoch": 0.57, - "learning_rate": 1.8685827041680237e-06, - "loss": 1.0361, - "step": 22249 - }, - { - "epoch": 0.57, - "learning_rate": 1.8685689919016791e-06, - "loss": 0.9814, - "step": 22250 - }, - { - "epoch": 0.57, - "learning_rate": 1.868555278970311e-06, - "loss": 1.0371, - "step": 22251 - }, - { - "epoch": 0.57, - "learning_rate": 1.8685415653739302e-06, - "loss": 0.9307, - "step": 22252 - }, - { - "epoch": 0.57, - "learning_rate": 1.8685278511125473e-06, - "loss": 0.8936, - "step": 22253 - }, - { - "epoch": 0.57, - "learning_rate": 1.8685141361861724e-06, - "loss": 0.9062, - "step": 22254 - }, - { - "epoch": 0.57, - "learning_rate": 1.8685004205948158e-06, - "loss": 0.7637, - "step": 22255 - }, - { - "epoch": 0.57, - "learning_rate": 1.8684867043384886e-06, - "loss": 0.8096, - "step": 22256 - }, - { - "epoch": 0.57, - "learning_rate": 1.8684729874172011e-06, - "loss": 0.8081, - "step": 22257 - }, - { - "epoch": 0.57, - "learning_rate": 1.8684592698309638e-06, - "loss": 0.876, - "step": 22258 - }, - { - "epoch": 0.57, - "learning_rate": 1.8684455515797872e-06, - "loss": 0.9004, - "step": 22259 - }, - { - "epoch": 0.57, - "learning_rate": 1.8684318326636817e-06, - "loss": 0.8818, - "step": 22260 - }, - { - "epoch": 0.57, - "learning_rate": 1.8684181130826579e-06, - "loss": 0.6812, - "step": 22261 - }, - { - "epoch": 0.57, - "learning_rate": 1.8684043928367263e-06, - "loss": 0.8438, - "step": 22262 - }, - { - "epoch": 0.57, - "learning_rate": 1.8683906719258973e-06, - "loss": 1.0732, - "step": 22263 - }, - { - "epoch": 0.57, - "learning_rate": 1.8683769503501816e-06, - "loss": 0.749, - "step": 22264 - }, - { - "epoch": 0.57, - "learning_rate": 1.8683632281095895e-06, - "loss": 0.6318, - "step": 22265 - }, - { - "epoch": 0.57, - "learning_rate": 1.8683495052041318e-06, - "loss": 0.7822, - "step": 22266 - }, - { - "epoch": 0.57, - "learning_rate": 1.8683357816338185e-06, - "loss": 1.0137, - "step": 22267 - }, - { - "epoch": 0.57, - "learning_rate": 1.8683220573986608e-06, - "loss": 0.8359, - "step": 22268 - }, - { - "epoch": 0.57, - "learning_rate": 1.8683083324986683e-06, - "loss": 0.9863, - "step": 22269 - }, - { - "epoch": 0.57, - "learning_rate": 1.8682946069338526e-06, - "loss": 1.043, - "step": 22270 - }, - { - "epoch": 0.57, - "learning_rate": 1.8682808807042233e-06, - "loss": 1.0605, - "step": 22271 - }, - { - "epoch": 0.57, - "learning_rate": 1.8682671538097914e-06, - "loss": 0.7422, - "step": 22272 - }, - { - "epoch": 0.57, - "learning_rate": 1.8682534262505674e-06, - "loss": 0.8115, - "step": 22273 - }, - { - "epoch": 0.57, - "learning_rate": 1.8682396980265614e-06, - "loss": 0.6792, - "step": 22274 - }, - { - "epoch": 0.57, - "learning_rate": 1.8682259691377841e-06, - "loss": 0.8564, - "step": 22275 - }, - { - "epoch": 0.57, - "learning_rate": 1.8682122395842463e-06, - "loss": 0.7734, - "step": 22276 - }, - { - "epoch": 0.57, - "learning_rate": 1.8681985093659582e-06, - "loss": 0.8252, - "step": 22277 - }, - { - "epoch": 0.57, - "learning_rate": 1.8681847784829308e-06, - "loss": 0.9263, - "step": 22278 - }, - { - "epoch": 0.57, - "learning_rate": 1.8681710469351737e-06, - "loss": 0.8145, - "step": 22279 - }, - { - "epoch": 0.57, - "learning_rate": 1.8681573147226984e-06, - "loss": 0.8013, - "step": 22280 - }, - { - "epoch": 0.57, - "learning_rate": 1.8681435818455146e-06, - "loss": 0.8486, - "step": 22281 - }, - { - "epoch": 0.57, - "learning_rate": 1.8681298483036332e-06, - "loss": 0.8945, - "step": 22282 - }, - { - "epoch": 0.57, - "learning_rate": 1.868116114097065e-06, - "loss": 0.8057, - "step": 22283 - }, - { - "epoch": 0.57, - "learning_rate": 1.8681023792258198e-06, - "loss": 0.6941, - "step": 22284 - }, - { - "epoch": 0.57, - "learning_rate": 1.8680886436899091e-06, - "loss": 0.9072, - "step": 22285 - }, - { - "epoch": 0.57, - "learning_rate": 1.8680749074893422e-06, - "loss": 0.6508, - "step": 22286 - }, - { - "epoch": 0.57, - "learning_rate": 1.8680611706241306e-06, - "loss": 1.1074, - "step": 22287 - }, - { - "epoch": 0.57, - "learning_rate": 1.8680474330942847e-06, - "loss": 0.7295, - "step": 22288 - }, - { - "epoch": 0.57, - "learning_rate": 1.8680336948998145e-06, - "loss": 0.8101, - "step": 22289 - }, - { - "epoch": 0.57, - "learning_rate": 1.8680199560407308e-06, - "loss": 0.9521, - "step": 22290 - }, - { - "epoch": 0.57, - "learning_rate": 1.868006216517044e-06, - "loss": 0.9062, - "step": 22291 - }, - { - "epoch": 0.57, - "learning_rate": 1.8679924763287648e-06, - "loss": 0.6934, - "step": 22292 - }, - { - "epoch": 0.57, - "learning_rate": 1.867978735475904e-06, - "loss": 0.9346, - "step": 22293 - }, - { - "epoch": 0.57, - "learning_rate": 1.8679649939584717e-06, - "loss": 0.7607, - "step": 22294 - }, - { - "epoch": 0.57, - "learning_rate": 1.8679512517764783e-06, - "loss": 0.9062, - "step": 22295 - }, - { - "epoch": 0.57, - "learning_rate": 1.8679375089299344e-06, - "loss": 0.9287, - "step": 22296 - }, - { - "epoch": 0.57, - "learning_rate": 1.867923765418851e-06, - "loss": 0.8838, - "step": 22297 - }, - { - "epoch": 0.57, - "learning_rate": 1.8679100212432384e-06, - "loss": 1.0, - "step": 22298 - }, - { - "epoch": 0.57, - "learning_rate": 1.8678962764031066e-06, - "loss": 1.0088, - "step": 22299 - }, - { - "epoch": 0.57, - "learning_rate": 1.8678825308984668e-06, - "loss": 0.9375, - "step": 22300 - }, - { - "epoch": 0.57, - "learning_rate": 1.867868784729329e-06, - "loss": 0.7549, - "step": 22301 - }, - { - "epoch": 0.57, - "learning_rate": 1.8678550378957043e-06, - "loss": 1.002, - "step": 22302 - }, - { - "epoch": 0.57, - "learning_rate": 1.8678412903976026e-06, - "loss": 0.6218, - "step": 22303 - }, - { - "epoch": 0.57, - "learning_rate": 1.8678275422350352e-06, - "loss": 0.8169, - "step": 22304 - }, - { - "epoch": 0.57, - "learning_rate": 1.8678137934080116e-06, - "loss": 1.0117, - "step": 22305 - }, - { - "epoch": 0.57, - "learning_rate": 1.8678000439165432e-06, - "loss": 0.7666, - "step": 22306 - }, - { - "epoch": 0.57, - "learning_rate": 1.86778629376064e-06, - "loss": 0.9238, - "step": 22307 - }, - { - "epoch": 0.57, - "learning_rate": 1.8677725429403132e-06, - "loss": 0.6807, - "step": 22308 - }, - { - "epoch": 0.57, - "learning_rate": 1.8677587914555723e-06, - "loss": 0.8086, - "step": 22309 - }, - { - "epoch": 0.57, - "learning_rate": 1.8677450393064285e-06, - "loss": 0.8228, - "step": 22310 - }, - { - "epoch": 0.57, - "learning_rate": 1.8677312864928924e-06, - "loss": 0.7852, - "step": 22311 - }, - { - "epoch": 0.57, - "learning_rate": 1.8677175330149742e-06, - "loss": 0.8721, - "step": 22312 - }, - { - "epoch": 0.57, - "learning_rate": 1.8677037788726846e-06, - "loss": 0.6538, - "step": 22313 - }, - { - "epoch": 0.57, - "learning_rate": 1.8676900240660342e-06, - "loss": 0.8838, - "step": 22314 - }, - { - "epoch": 0.57, - "learning_rate": 1.8676762685950337e-06, - "loss": 0.9834, - "step": 22315 - }, - { - "epoch": 0.57, - "learning_rate": 1.867662512459693e-06, - "loss": 0.7749, - "step": 22316 - }, - { - "epoch": 0.57, - "learning_rate": 1.867648755660023e-06, - "loss": 0.8613, - "step": 22317 - }, - { - "epoch": 0.57, - "learning_rate": 1.8676349981960344e-06, - "loss": 0.8418, - "step": 22318 - }, - { - "epoch": 0.57, - "learning_rate": 1.8676212400677375e-06, - "loss": 0.7998, - "step": 22319 - }, - { - "epoch": 0.57, - "learning_rate": 1.867607481275143e-06, - "loss": 0.6826, - "step": 22320 - }, - { - "epoch": 0.57, - "learning_rate": 1.8675937218182613e-06, - "loss": 1.0381, - "step": 22321 - }, - { - "epoch": 0.57, - "learning_rate": 1.8675799616971028e-06, - "loss": 1.0518, - "step": 22322 - }, - { - "epoch": 0.57, - "learning_rate": 1.8675662009116786e-06, - "loss": 0.999, - "step": 22323 - }, - { - "epoch": 0.57, - "learning_rate": 1.8675524394619985e-06, - "loss": 0.7363, - "step": 22324 - }, - { - "epoch": 0.57, - "learning_rate": 1.8675386773480737e-06, - "loss": 1.0156, - "step": 22325 - }, - { - "epoch": 0.57, - "learning_rate": 1.8675249145699143e-06, - "loss": 0.8804, - "step": 22326 - }, - { - "epoch": 0.57, - "learning_rate": 1.8675111511275308e-06, - "loss": 0.9766, - "step": 22327 - }, - { - "epoch": 0.57, - "learning_rate": 1.867497387020934e-06, - "loss": 0.7251, - "step": 22328 - }, - { - "epoch": 0.57, - "learning_rate": 1.8674836222501345e-06, - "loss": 1.1387, - "step": 22329 - }, - { - "epoch": 0.57, - "learning_rate": 1.8674698568151426e-06, - "loss": 0.9365, - "step": 22330 - }, - { - "epoch": 0.57, - "learning_rate": 1.8674560907159687e-06, - "loss": 1.0049, - "step": 22331 - }, - { - "epoch": 0.57, - "learning_rate": 1.8674423239526239e-06, - "loss": 0.96, - "step": 22332 - }, - { - "epoch": 0.57, - "learning_rate": 1.8674285565251182e-06, - "loss": 0.6721, - "step": 22333 - }, - { - "epoch": 0.57, - "learning_rate": 1.867414788433462e-06, - "loss": 0.9688, - "step": 22334 - }, - { - "epoch": 0.57, - "learning_rate": 1.8674010196776667e-06, - "loss": 1.0078, - "step": 22335 - }, - { - "epoch": 0.57, - "learning_rate": 1.8673872502577424e-06, - "loss": 0.8604, - "step": 22336 - }, - { - "epoch": 0.57, - "learning_rate": 1.8673734801736992e-06, - "loss": 0.6338, - "step": 22337 - }, - { - "epoch": 0.57, - "learning_rate": 1.867359709425548e-06, - "loss": 0.6416, - "step": 22338 - }, - { - "epoch": 0.57, - "learning_rate": 1.8673459380132996e-06, - "loss": 0.9053, - "step": 22339 - }, - { - "epoch": 0.57, - "learning_rate": 1.8673321659369643e-06, - "loss": 0.877, - "step": 22340 - }, - { - "epoch": 0.57, - "learning_rate": 1.8673183931965523e-06, - "loss": 0.8262, - "step": 22341 - }, - { - "epoch": 0.57, - "learning_rate": 1.8673046197920747e-06, - "loss": 0.9727, - "step": 22342 - }, - { - "epoch": 0.57, - "learning_rate": 1.867290845723542e-06, - "loss": 0.7891, - "step": 22343 - }, - { - "epoch": 0.57, - "learning_rate": 1.8672770709909641e-06, - "loss": 1.0625, - "step": 22344 - }, - { - "epoch": 0.57, - "learning_rate": 1.8672632955943525e-06, - "loss": 0.7334, - "step": 22345 - }, - { - "epoch": 0.57, - "learning_rate": 1.8672495195337172e-06, - "loss": 0.9023, - "step": 22346 - }, - { - "epoch": 0.57, - "learning_rate": 1.8672357428090689e-06, - "loss": 0.8672, - "step": 22347 - }, - { - "epoch": 0.57, - "learning_rate": 1.8672219654204179e-06, - "loss": 0.9355, - "step": 22348 - }, - { - "epoch": 0.57, - "learning_rate": 1.8672081873677748e-06, - "loss": 0.8379, - "step": 22349 - }, - { - "epoch": 0.57, - "learning_rate": 1.8671944086511504e-06, - "loss": 1.0908, - "step": 22350 - }, - { - "epoch": 0.57, - "learning_rate": 1.867180629270555e-06, - "loss": 0.8701, - "step": 22351 - }, - { - "epoch": 0.57, - "learning_rate": 1.8671668492259994e-06, - "loss": 0.7773, - "step": 22352 - }, - { - "epoch": 0.57, - "learning_rate": 1.867153068517494e-06, - "loss": 1.0391, - "step": 22353 - }, - { - "epoch": 0.57, - "learning_rate": 1.8671392871450493e-06, - "loss": 0.8066, - "step": 22354 - }, - { - "epoch": 0.57, - "learning_rate": 1.8671255051086762e-06, - "loss": 0.644, - "step": 22355 - }, - { - "epoch": 0.57, - "learning_rate": 1.8671117224083845e-06, - "loss": 0.8594, - "step": 22356 - }, - { - "epoch": 0.57, - "learning_rate": 1.8670979390441856e-06, - "loss": 0.7949, - "step": 22357 - }, - { - "epoch": 0.57, - "learning_rate": 1.8670841550160895e-06, - "loss": 0.7969, - "step": 22358 - }, - { - "epoch": 0.57, - "learning_rate": 1.867070370324107e-06, - "loss": 0.6465, - "step": 22359 - }, - { - "epoch": 0.57, - "learning_rate": 1.8670565849682486e-06, - "loss": 0.9736, - "step": 22360 - }, - { - "epoch": 0.57, - "learning_rate": 1.8670427989485248e-06, - "loss": 0.8877, - "step": 22361 - }, - { - "epoch": 0.57, - "learning_rate": 1.8670290122649463e-06, - "loss": 0.8496, - "step": 22362 - }, - { - "epoch": 0.57, - "learning_rate": 1.8670152249175235e-06, - "loss": 0.7363, - "step": 22363 - }, - { - "epoch": 0.57, - "learning_rate": 1.8670014369062668e-06, - "loss": 0.7646, - "step": 22364 - }, - { - "epoch": 0.57, - "learning_rate": 1.8669876482311872e-06, - "loss": 0.79, - "step": 22365 - }, - { - "epoch": 0.57, - "learning_rate": 1.866973858892295e-06, - "loss": 0.6689, - "step": 22366 - }, - { - "epoch": 0.57, - "learning_rate": 1.8669600688896009e-06, - "loss": 0.8057, - "step": 22367 - }, - { - "epoch": 0.57, - "learning_rate": 1.866946278223115e-06, - "loss": 0.8594, - "step": 22368 - }, - { - "epoch": 0.57, - "learning_rate": 1.8669324868928485e-06, - "loss": 1.0283, - "step": 22369 - }, - { - "epoch": 0.57, - "learning_rate": 1.8669186948988113e-06, - "loss": 1.0205, - "step": 22370 - }, - { - "epoch": 0.57, - "learning_rate": 1.8669049022410146e-06, - "loss": 0.8081, - "step": 22371 - }, - { - "epoch": 0.57, - "learning_rate": 1.8668911089194687e-06, - "loss": 0.9482, - "step": 22372 - }, - { - "epoch": 0.57, - "learning_rate": 1.8668773149341841e-06, - "loss": 0.8091, - "step": 22373 - }, - { - "epoch": 0.57, - "learning_rate": 1.8668635202851713e-06, - "loss": 0.9922, - "step": 22374 - }, - { - "epoch": 0.57, - "learning_rate": 1.866849724972441e-06, - "loss": 0.9473, - "step": 22375 - }, - { - "epoch": 0.57, - "learning_rate": 1.8668359289960038e-06, - "loss": 0.9736, - "step": 22376 - }, - { - "epoch": 0.57, - "learning_rate": 1.8668221323558702e-06, - "loss": 0.8105, - "step": 22377 - }, - { - "epoch": 0.57, - "learning_rate": 1.8668083350520507e-06, - "loss": 0.9111, - "step": 22378 - }, - { - "epoch": 0.57, - "learning_rate": 1.866794537084556e-06, - "loss": 0.8418, - "step": 22379 - }, - { - "epoch": 0.57, - "learning_rate": 1.8667807384533965e-06, - "loss": 0.9551, - "step": 22380 - }, - { - "epoch": 0.57, - "learning_rate": 1.8667669391585825e-06, - "loss": 0.8799, - "step": 22381 - }, - { - "epoch": 0.57, - "learning_rate": 1.8667531392001255e-06, - "loss": 0.8716, - "step": 22382 - }, - { - "epoch": 0.57, - "learning_rate": 1.8667393385780352e-06, - "loss": 0.9648, - "step": 22383 - }, - { - "epoch": 0.57, - "learning_rate": 1.8667255372923223e-06, - "loss": 0.9502, - "step": 22384 - }, - { - "epoch": 0.57, - "learning_rate": 1.8667117353429977e-06, - "loss": 1.1357, - "step": 22385 - }, - { - "epoch": 0.57, - "learning_rate": 1.8666979327300719e-06, - "loss": 0.8262, - "step": 22386 - }, - { - "epoch": 0.57, - "learning_rate": 1.8666841294535552e-06, - "loss": 0.9219, - "step": 22387 - }, - { - "epoch": 0.57, - "learning_rate": 1.8666703255134581e-06, - "loss": 0.9834, - "step": 22388 - }, - { - "epoch": 0.57, - "learning_rate": 1.8666565209097916e-06, - "loss": 0.8984, - "step": 22389 - }, - { - "epoch": 0.57, - "learning_rate": 1.866642715642566e-06, - "loss": 0.874, - "step": 22390 - }, - { - "epoch": 0.57, - "learning_rate": 1.866628909711792e-06, - "loss": 1.042, - "step": 22391 - }, - { - "epoch": 0.57, - "learning_rate": 1.8666151031174802e-06, - "loss": 0.9033, - "step": 22392 - }, - { - "epoch": 0.57, - "learning_rate": 1.8666012958596408e-06, - "loss": 0.8438, - "step": 22393 - }, - { - "epoch": 0.57, - "learning_rate": 1.8665874879382847e-06, - "loss": 0.9248, - "step": 22394 - }, - { - "epoch": 0.57, - "learning_rate": 1.8665736793534226e-06, - "loss": 0.9834, - "step": 22395 - }, - { - "epoch": 0.57, - "learning_rate": 1.8665598701050647e-06, - "loss": 0.8574, - "step": 22396 - }, - { - "epoch": 0.57, - "learning_rate": 1.8665460601932218e-06, - "loss": 0.9707, - "step": 22397 - }, - { - "epoch": 0.57, - "learning_rate": 1.8665322496179044e-06, - "loss": 0.7207, - "step": 22398 - }, - { - "epoch": 0.57, - "learning_rate": 1.866518438379123e-06, - "loss": 0.918, - "step": 22399 - }, - { - "epoch": 0.57, - "learning_rate": 1.8665046264768885e-06, - "loss": 0.9814, - "step": 22400 - }, - { - "epoch": 0.57, - "learning_rate": 1.866490813911211e-06, - "loss": 0.4138, - "step": 22401 - }, - { - "epoch": 0.57, - "learning_rate": 1.8664770006821015e-06, - "loss": 1.0068, - "step": 22402 - }, - { - "epoch": 0.57, - "learning_rate": 1.8664631867895704e-06, - "loss": 0.7598, - "step": 22403 - }, - { - "epoch": 0.57, - "learning_rate": 1.8664493722336284e-06, - "loss": 0.9893, - "step": 22404 - }, - { - "epoch": 0.57, - "learning_rate": 1.8664355570142858e-06, - "loss": 0.998, - "step": 22405 - }, - { - "epoch": 0.57, - "learning_rate": 1.8664217411315533e-06, - "loss": 0.7764, - "step": 22406 - }, - { - "epoch": 0.57, - "learning_rate": 1.8664079245854416e-06, - "loss": 0.6892, - "step": 22407 - }, - { - "epoch": 0.57, - "learning_rate": 1.866394107375961e-06, - "loss": 0.8623, - "step": 22408 - }, - { - "epoch": 0.57, - "learning_rate": 1.8663802895031223e-06, - "loss": 0.9746, - "step": 22409 - }, - { - "epoch": 0.57, - "learning_rate": 1.8663664709669361e-06, - "loss": 0.8105, - "step": 22410 - }, - { - "epoch": 0.57, - "learning_rate": 1.8663526517674132e-06, - "loss": 0.772, - "step": 22411 - }, - { - "epoch": 0.57, - "learning_rate": 1.8663388319045636e-06, - "loss": 0.7852, - "step": 22412 - }, - { - "epoch": 0.57, - "learning_rate": 1.8663250113783984e-06, - "loss": 0.6189, - "step": 22413 - }, - { - "epoch": 0.57, - "learning_rate": 1.866311190188928e-06, - "loss": 0.7456, - "step": 22414 - }, - { - "epoch": 0.57, - "learning_rate": 1.8662973683361626e-06, - "loss": 0.8374, - "step": 22415 - }, - { - "epoch": 0.57, - "learning_rate": 1.8662835458201136e-06, - "loss": 0.6641, - "step": 22416 - }, - { - "epoch": 0.57, - "learning_rate": 1.8662697226407907e-06, - "loss": 0.7842, - "step": 22417 - }, - { - "epoch": 0.57, - "learning_rate": 1.866255898798205e-06, - "loss": 0.9336, - "step": 22418 - }, - { - "epoch": 0.57, - "learning_rate": 1.8662420742923672e-06, - "loss": 0.8936, - "step": 22419 - }, - { - "epoch": 0.57, - "learning_rate": 1.8662282491232877e-06, - "loss": 0.7969, - "step": 22420 - }, - { - "epoch": 0.57, - "learning_rate": 1.8662144232909767e-06, - "loss": 1.103, - "step": 22421 - }, - { - "epoch": 0.57, - "learning_rate": 1.8662005967954455e-06, - "loss": 0.8018, - "step": 22422 - }, - { - "epoch": 0.57, - "learning_rate": 1.8661867696367043e-06, - "loss": 0.8926, - "step": 22423 - }, - { - "epoch": 0.57, - "learning_rate": 1.8661729418147635e-06, - "loss": 0.7803, - "step": 22424 - }, - { - "epoch": 0.57, - "learning_rate": 1.866159113329634e-06, - "loss": 0.875, - "step": 22425 - }, - { - "epoch": 0.57, - "learning_rate": 1.8661452841813264e-06, - "loss": 0.7554, - "step": 22426 - }, - { - "epoch": 0.57, - "learning_rate": 1.866131454369851e-06, - "loss": 0.6938, - "step": 22427 - }, - { - "epoch": 0.57, - "learning_rate": 1.8661176238952186e-06, - "loss": 0.7451, - "step": 22428 - }, - { - "epoch": 0.57, - "learning_rate": 1.86610379275744e-06, - "loss": 0.9541, - "step": 22429 - }, - { - "epoch": 0.57, - "learning_rate": 1.866089960956525e-06, - "loss": 0.8623, - "step": 22430 - }, - { - "epoch": 0.57, - "learning_rate": 1.8660761284924853e-06, - "loss": 0.749, - "step": 22431 - }, - { - "epoch": 0.57, - "learning_rate": 1.8660622953653307e-06, - "loss": 0.9756, - "step": 22432 - }, - { - "epoch": 0.57, - "learning_rate": 1.866048461575072e-06, - "loss": 0.8604, - "step": 22433 - }, - { - "epoch": 0.57, - "learning_rate": 1.86603462712172e-06, - "loss": 0.9805, - "step": 22434 - }, - { - "epoch": 0.58, - "learning_rate": 1.866020792005285e-06, - "loss": 0.9131, - "step": 22435 - }, - { - "epoch": 0.58, - "learning_rate": 1.8660069562257777e-06, - "loss": 0.4907, - "step": 22436 - }, - { - "epoch": 0.58, - "learning_rate": 1.8659931197832085e-06, - "loss": 0.7881, - "step": 22437 - }, - { - "epoch": 0.58, - "learning_rate": 1.8659792826775887e-06, - "loss": 1.0127, - "step": 22438 - }, - { - "epoch": 0.58, - "learning_rate": 1.865965444908928e-06, - "loss": 0.7852, - "step": 22439 - }, - { - "epoch": 0.58, - "learning_rate": 1.8659516064772374e-06, - "loss": 0.5471, - "step": 22440 - }, - { - "epoch": 0.58, - "learning_rate": 1.8659377673825274e-06, - "loss": 0.7437, - "step": 22441 - }, - { - "epoch": 0.58, - "learning_rate": 1.8659239276248089e-06, - "loss": 0.6433, - "step": 22442 - }, - { - "epoch": 0.58, - "learning_rate": 1.865910087204092e-06, - "loss": 1.0371, - "step": 22443 - }, - { - "epoch": 0.58, - "learning_rate": 1.8658962461203877e-06, - "loss": 0.9043, - "step": 22444 - }, - { - "epoch": 0.58, - "learning_rate": 1.8658824043737064e-06, - "loss": 0.8662, - "step": 22445 - }, - { - "epoch": 0.58, - "learning_rate": 1.865868561964059e-06, - "loss": 0.8247, - "step": 22446 - }, - { - "epoch": 0.58, - "learning_rate": 1.8658547188914557e-06, - "loss": 0.9854, - "step": 22447 - }, - { - "epoch": 0.58, - "learning_rate": 1.8658408751559071e-06, - "loss": 0.7336, - "step": 22448 - }, - { - "epoch": 0.58, - "learning_rate": 1.865827030757424e-06, - "loss": 0.9629, - "step": 22449 - }, - { - "epoch": 0.58, - "learning_rate": 1.865813185696017e-06, - "loss": 0.8564, - "step": 22450 - }, - { - "epoch": 0.58, - "learning_rate": 1.865799339971697e-06, - "loss": 0.8906, - "step": 22451 - }, - { - "epoch": 0.58, - "learning_rate": 1.865785493584474e-06, - "loss": 0.7065, - "step": 22452 - }, - { - "epoch": 0.58, - "learning_rate": 1.8657716465343584e-06, - "loss": 1.0625, - "step": 22453 - }, - { - "epoch": 0.58, - "learning_rate": 1.8657577988213617e-06, - "loss": 0.7666, - "step": 22454 - }, - { - "epoch": 0.58, - "learning_rate": 1.8657439504454942e-06, - "loss": 0.7949, - "step": 22455 - }, - { - "epoch": 0.58, - "learning_rate": 1.8657301014067662e-06, - "loss": 1.0684, - "step": 22456 - }, - { - "epoch": 0.58, - "learning_rate": 1.8657162517051886e-06, - "loss": 0.6709, - "step": 22457 - }, - { - "epoch": 0.58, - "learning_rate": 1.8657024013407714e-06, - "loss": 0.9395, - "step": 22458 - }, - { - "epoch": 0.58, - "learning_rate": 1.8656885503135262e-06, - "loss": 0.8755, - "step": 22459 - }, - { - "epoch": 0.58, - "learning_rate": 1.8656746986234627e-06, - "loss": 0.7344, - "step": 22460 - }, - { - "epoch": 0.58, - "learning_rate": 1.8656608462705923e-06, - "loss": 0.9087, - "step": 22461 - }, - { - "epoch": 0.58, - "learning_rate": 1.8656469932549248e-06, - "loss": 1.0586, - "step": 22462 - }, - { - "epoch": 0.58, - "learning_rate": 1.8656331395764716e-06, - "loss": 0.9287, - "step": 22463 - }, - { - "epoch": 0.58, - "learning_rate": 1.8656192852352426e-06, - "loss": 1.0195, - "step": 22464 - }, - { - "epoch": 0.58, - "learning_rate": 1.8656054302312487e-06, - "loss": 0.9746, - "step": 22465 - }, - { - "epoch": 0.58, - "learning_rate": 1.8655915745645006e-06, - "loss": 0.9385, - "step": 22466 - }, - { - "epoch": 0.58, - "learning_rate": 1.865577718235009e-06, - "loss": 0.7803, - "step": 22467 - }, - { - "epoch": 0.58, - "learning_rate": 1.8655638612427843e-06, - "loss": 0.7979, - "step": 22468 - }, - { - "epoch": 0.58, - "learning_rate": 1.8655500035878368e-06, - "loss": 0.9893, - "step": 22469 - }, - { - "epoch": 0.58, - "learning_rate": 1.8655361452701776e-06, - "loss": 0.9531, - "step": 22470 - }, - { - "epoch": 0.58, - "learning_rate": 1.8655222862898175e-06, - "loss": 0.9014, - "step": 22471 - }, - { - "epoch": 0.58, - "learning_rate": 1.8655084266467664e-06, - "loss": 0.8438, - "step": 22472 - }, - { - "epoch": 0.58, - "learning_rate": 1.8654945663410355e-06, - "loss": 0.5171, - "step": 22473 - }, - { - "epoch": 0.58, - "learning_rate": 1.8654807053726352e-06, - "loss": 1.0586, - "step": 22474 - }, - { - "epoch": 0.58, - "learning_rate": 1.8654668437415762e-06, - "loss": 1.1445, - "step": 22475 - }, - { - "epoch": 0.58, - "learning_rate": 1.8654529814478689e-06, - "loss": 1.0381, - "step": 22476 - }, - { - "epoch": 0.58, - "learning_rate": 1.8654391184915239e-06, - "loss": 1.2275, - "step": 22477 - }, - { - "epoch": 0.58, - "learning_rate": 1.8654252548725522e-06, - "loss": 0.9316, - "step": 22478 - }, - { - "epoch": 0.58, - "learning_rate": 1.865411390590964e-06, - "loss": 0.6797, - "step": 22479 - }, - { - "epoch": 0.58, - "learning_rate": 1.8653975256467702e-06, - "loss": 0.8584, - "step": 22480 - }, - { - "epoch": 0.58, - "learning_rate": 1.8653836600399812e-06, - "loss": 0.6362, - "step": 22481 - }, - { - "epoch": 0.58, - "learning_rate": 1.865369793770608e-06, - "loss": 0.7998, - "step": 22482 - }, - { - "epoch": 0.58, - "learning_rate": 1.865355926838661e-06, - "loss": 0.8115, - "step": 22483 - }, - { - "epoch": 0.58, - "learning_rate": 1.8653420592441504e-06, - "loss": 0.9854, - "step": 22484 - }, - { - "epoch": 0.58, - "learning_rate": 1.8653281909870872e-06, - "loss": 0.7041, - "step": 22485 - }, - { - "epoch": 0.58, - "learning_rate": 1.865314322067482e-06, - "loss": 0.7676, - "step": 22486 - }, - { - "epoch": 0.58, - "learning_rate": 1.8653004524853455e-06, - "loss": 0.6011, - "step": 22487 - }, - { - "epoch": 0.58, - "learning_rate": 1.8652865822406882e-06, - "loss": 0.8574, - "step": 22488 - }, - { - "epoch": 0.58, - "learning_rate": 1.8652727113335209e-06, - "loss": 0.8271, - "step": 22489 - }, - { - "epoch": 0.58, - "learning_rate": 1.8652588397638537e-06, - "loss": 0.7734, - "step": 22490 - }, - { - "epoch": 0.58, - "learning_rate": 1.8652449675316982e-06, - "loss": 0.6787, - "step": 22491 - }, - { - "epoch": 0.58, - "learning_rate": 1.865231094637064e-06, - "loss": 0.6409, - "step": 22492 - }, - { - "epoch": 0.58, - "learning_rate": 1.865217221079962e-06, - "loss": 0.8828, - "step": 22493 - }, - { - "epoch": 0.58, - "learning_rate": 1.8652033468604032e-06, - "loss": 0.9346, - "step": 22494 - }, - { - "epoch": 0.58, - "learning_rate": 1.865189471978398e-06, - "loss": 0.9287, - "step": 22495 - }, - { - "epoch": 0.58, - "learning_rate": 1.8651755964339571e-06, - "loss": 0.6641, - "step": 22496 - }, - { - "epoch": 0.58, - "learning_rate": 1.8651617202270908e-06, - "loss": 0.6897, - "step": 22497 - }, - { - "epoch": 0.58, - "learning_rate": 1.86514784335781e-06, - "loss": 0.9404, - "step": 22498 - }, - { - "epoch": 0.58, - "learning_rate": 1.8651339658261252e-06, - "loss": 0.9141, - "step": 22499 - }, - { - "epoch": 0.58, - "learning_rate": 1.8651200876320472e-06, - "loss": 0.7891, - "step": 22500 - }, - { - "epoch": 0.58, - "learning_rate": 1.8651062087755864e-06, - "loss": 0.9561, - "step": 22501 - }, - { - "epoch": 0.58, - "learning_rate": 1.865092329256754e-06, - "loss": 0.8223, - "step": 22502 - }, - { - "epoch": 0.58, - "learning_rate": 1.8650784490755598e-06, - "loss": 0.9131, - "step": 22503 - }, - { - "epoch": 0.58, - "learning_rate": 1.8650645682320146e-06, - "loss": 0.9639, - "step": 22504 - }, - { - "epoch": 0.58, - "learning_rate": 1.8650506867261298e-06, - "loss": 1.0117, - "step": 22505 - }, - { - "epoch": 0.58, - "learning_rate": 1.865036804557915e-06, - "loss": 0.9346, - "step": 22506 - }, - { - "epoch": 0.58, - "learning_rate": 1.8650229217273817e-06, - "loss": 0.8311, - "step": 22507 - }, - { - "epoch": 0.58, - "learning_rate": 1.8650090382345395e-06, - "loss": 0.9717, - "step": 22508 - }, - { - "epoch": 0.58, - "learning_rate": 1.8649951540794002e-06, - "loss": 0.9355, - "step": 22509 - }, - { - "epoch": 0.58, - "learning_rate": 1.8649812692619738e-06, - "loss": 0.9492, - "step": 22510 - }, - { - "epoch": 0.58, - "learning_rate": 1.8649673837822708e-06, - "loss": 0.875, - "step": 22511 - }, - { - "epoch": 0.58, - "learning_rate": 1.864953497640302e-06, - "loss": 0.9502, - "step": 22512 - }, - { - "epoch": 0.58, - "learning_rate": 1.8649396108360787e-06, - "loss": 1.0479, - "step": 22513 - }, - { - "epoch": 0.58, - "learning_rate": 1.8649257233696102e-06, - "loss": 0.8193, - "step": 22514 - }, - { - "epoch": 0.58, - "learning_rate": 1.8649118352409082e-06, - "loss": 0.8623, - "step": 22515 - }, - { - "epoch": 0.58, - "learning_rate": 1.8648979464499827e-06, - "loss": 0.8076, - "step": 22516 - }, - { - "epoch": 0.58, - "learning_rate": 1.864884056996845e-06, - "loss": 0.9453, - "step": 22517 - }, - { - "epoch": 0.58, - "learning_rate": 1.8648701668815052e-06, - "loss": 0.8584, - "step": 22518 - }, - { - "epoch": 0.58, - "learning_rate": 1.8648562761039739e-06, - "loss": 0.7803, - "step": 22519 - }, - { - "epoch": 0.58, - "learning_rate": 1.864842384664262e-06, - "loss": 1.0146, - "step": 22520 - }, - { - "epoch": 0.58, - "learning_rate": 1.8648284925623803e-06, - "loss": 0.7256, - "step": 22521 - }, - { - "epoch": 0.58, - "learning_rate": 1.864814599798339e-06, - "loss": 0.5488, - "step": 22522 - }, - { - "epoch": 0.58, - "learning_rate": 1.864800706372149e-06, - "loss": 0.7671, - "step": 22523 - }, - { - "epoch": 0.58, - "learning_rate": 1.8647868122838206e-06, - "loss": 0.9238, - "step": 22524 - }, - { - "epoch": 0.58, - "learning_rate": 1.8647729175333648e-06, - "loss": 0.8696, - "step": 22525 - }, - { - "epoch": 0.58, - "learning_rate": 1.8647590221207923e-06, - "loss": 0.9307, - "step": 22526 - }, - { - "epoch": 0.58, - "learning_rate": 1.8647451260461137e-06, - "loss": 0.8105, - "step": 22527 - }, - { - "epoch": 0.58, - "learning_rate": 1.8647312293093392e-06, - "loss": 0.6636, - "step": 22528 - }, - { - "epoch": 0.58, - "learning_rate": 1.86471733191048e-06, - "loss": 0.7358, - "step": 22529 - }, - { - "epoch": 0.58, - "learning_rate": 1.8647034338495463e-06, - "loss": 0.8311, - "step": 22530 - }, - { - "epoch": 0.58, - "learning_rate": 1.864689535126549e-06, - "loss": 0.9834, - "step": 22531 - }, - { - "epoch": 0.58, - "learning_rate": 1.8646756357414985e-06, - "loss": 0.6426, - "step": 22532 - }, - { - "epoch": 0.58, - "learning_rate": 1.8646617356944058e-06, - "loss": 0.9199, - "step": 22533 - }, - { - "epoch": 0.58, - "learning_rate": 1.8646478349852814e-06, - "loss": 0.8467, - "step": 22534 - }, - { - "epoch": 0.58, - "learning_rate": 1.8646339336141362e-06, - "loss": 0.8623, - "step": 22535 - }, - { - "epoch": 0.58, - "learning_rate": 1.8646200315809801e-06, - "loss": 0.958, - "step": 22536 - }, - { - "epoch": 0.58, - "learning_rate": 1.8646061288858244e-06, - "loss": 0.873, - "step": 22537 - }, - { - "epoch": 0.58, - "learning_rate": 1.8645922255286794e-06, - "loss": 0.9014, - "step": 22538 - }, - { - "epoch": 0.58, - "learning_rate": 1.864578321509556e-06, - "loss": 1.0195, - "step": 22539 - }, - { - "epoch": 0.58, - "learning_rate": 1.8645644168284647e-06, - "loss": 0.9971, - "step": 22540 - }, - { - "epoch": 0.58, - "learning_rate": 1.864550511485416e-06, - "loss": 0.8525, - "step": 22541 - }, - { - "epoch": 0.58, - "learning_rate": 1.864536605480421e-06, - "loss": 0.9648, - "step": 22542 - }, - { - "epoch": 0.58, - "learning_rate": 1.86452269881349e-06, - "loss": 1.0527, - "step": 22543 - }, - { - "epoch": 0.58, - "learning_rate": 1.864508791484634e-06, - "loss": 0.958, - "step": 22544 - }, - { - "epoch": 0.58, - "learning_rate": 1.864494883493863e-06, - "loss": 0.9375, - "step": 22545 - }, - { - "epoch": 0.58, - "learning_rate": 1.8644809748411881e-06, - "loss": 0.793, - "step": 22546 - }, - { - "epoch": 0.58, - "learning_rate": 1.8644670655266198e-06, - "loss": 0.9248, - "step": 22547 - }, - { - "epoch": 0.58, - "learning_rate": 1.8644531555501688e-06, - "loss": 0.7646, - "step": 22548 - }, - { - "epoch": 0.58, - "learning_rate": 1.864439244911846e-06, - "loss": 1.0898, - "step": 22549 - }, - { - "epoch": 0.58, - "learning_rate": 1.8644253336116617e-06, - "loss": 0.8828, - "step": 22550 - }, - { - "epoch": 0.58, - "learning_rate": 1.8644114216496268e-06, - "loss": 0.6279, - "step": 22551 - }, - { - "epoch": 0.58, - "learning_rate": 1.8643975090257516e-06, - "loss": 0.7881, - "step": 22552 - }, - { - "epoch": 0.58, - "learning_rate": 1.8643835957400472e-06, - "loss": 0.8555, - "step": 22553 - }, - { - "epoch": 0.58, - "learning_rate": 1.8643696817925235e-06, - "loss": 0.8447, - "step": 22554 - }, - { - "epoch": 0.58, - "learning_rate": 1.8643557671831923e-06, - "loss": 0.6514, - "step": 22555 - }, - { - "epoch": 0.58, - "learning_rate": 1.8643418519120632e-06, - "loss": 0.7563, - "step": 22556 - }, - { - "epoch": 0.58, - "learning_rate": 1.8643279359791475e-06, - "loss": 0.8809, - "step": 22557 - }, - { - "epoch": 0.58, - "learning_rate": 1.8643140193844556e-06, - "loss": 0.8013, - "step": 22558 - }, - { - "epoch": 0.58, - "learning_rate": 1.8643001021279984e-06, - "loss": 0.8848, - "step": 22559 - }, - { - "epoch": 0.58, - "learning_rate": 1.8642861842097859e-06, - "loss": 0.7324, - "step": 22560 - }, - { - "epoch": 0.58, - "learning_rate": 1.8642722656298295e-06, - "loss": 0.7656, - "step": 22561 - }, - { - "epoch": 0.58, - "learning_rate": 1.8642583463881397e-06, - "loss": 0.9258, - "step": 22562 - }, - { - "epoch": 0.58, - "learning_rate": 1.8642444264847268e-06, - "loss": 1.002, - "step": 22563 - }, - { - "epoch": 0.58, - "learning_rate": 1.8642305059196017e-06, - "loss": 0.9229, - "step": 22564 - }, - { - "epoch": 0.58, - "learning_rate": 1.864216584692775e-06, - "loss": 0.9023, - "step": 22565 - }, - { - "epoch": 0.58, - "learning_rate": 1.8642026628042578e-06, - "loss": 0.9609, - "step": 22566 - }, - { - "epoch": 0.58, - "learning_rate": 1.86418874025406e-06, - "loss": 0.9639, - "step": 22567 - }, - { - "epoch": 0.58, - "learning_rate": 1.8641748170421925e-06, - "loss": 1.1895, - "step": 22568 - }, - { - "epoch": 0.58, - "learning_rate": 1.8641608931686663e-06, - "loss": 1.0381, - "step": 22569 - }, - { - "epoch": 0.58, - "learning_rate": 1.864146968633492e-06, - "loss": 0.7427, - "step": 22570 - }, - { - "epoch": 0.58, - "learning_rate": 1.8641330434366798e-06, - "loss": 0.5322, - "step": 22571 - }, - { - "epoch": 0.58, - "learning_rate": 1.8641191175782405e-06, - "loss": 0.8579, - "step": 22572 - }, - { - "epoch": 0.58, - "learning_rate": 1.8641051910581852e-06, - "loss": 0.8965, - "step": 22573 - }, - { - "epoch": 0.58, - "learning_rate": 1.8640912638765243e-06, - "loss": 0.999, - "step": 22574 - }, - { - "epoch": 0.58, - "learning_rate": 1.8640773360332685e-06, - "loss": 1.0684, - "step": 22575 - }, - { - "epoch": 0.58, - "learning_rate": 1.864063407528428e-06, - "loss": 0.8408, - "step": 22576 - }, - { - "epoch": 0.58, - "learning_rate": 1.8640494783620144e-06, - "loss": 0.9258, - "step": 22577 - }, - { - "epoch": 0.58, - "learning_rate": 1.8640355485340376e-06, - "loss": 1.0166, - "step": 22578 - }, - { - "epoch": 0.58, - "learning_rate": 1.8640216180445085e-06, - "loss": 0.9521, - "step": 22579 - }, - { - "epoch": 0.58, - "learning_rate": 1.864007686893438e-06, - "loss": 0.9165, - "step": 22580 - }, - { - "epoch": 0.58, - "learning_rate": 1.8639937550808361e-06, - "loss": 0.8237, - "step": 22581 - }, - { - "epoch": 0.58, - "learning_rate": 1.8639798226067142e-06, - "loss": 0.7471, - "step": 22582 - }, - { - "epoch": 0.58, - "learning_rate": 1.8639658894710828e-06, - "loss": 0.8867, - "step": 22583 - }, - { - "epoch": 0.58, - "learning_rate": 1.8639519556739525e-06, - "loss": 0.7373, - "step": 22584 - }, - { - "epoch": 0.58, - "learning_rate": 1.8639380212153336e-06, - "loss": 0.7705, - "step": 22585 - }, - { - "epoch": 0.58, - "learning_rate": 1.863924086095237e-06, - "loss": 1.1221, - "step": 22586 - }, - { - "epoch": 0.58, - "learning_rate": 1.863910150313674e-06, - "loss": 1.0547, - "step": 22587 - }, - { - "epoch": 0.58, - "learning_rate": 1.8638962138706541e-06, - "loss": 0.6602, - "step": 22588 - }, - { - "epoch": 0.58, - "learning_rate": 1.8638822767661889e-06, - "loss": 0.6733, - "step": 22589 - }, - { - "epoch": 0.58, - "learning_rate": 1.8638683390002887e-06, - "loss": 0.9824, - "step": 22590 - }, - { - "epoch": 0.58, - "learning_rate": 1.8638544005729645e-06, - "loss": 0.9141, - "step": 22591 - }, - { - "epoch": 0.58, - "learning_rate": 1.8638404614842265e-06, - "loss": 1.0566, - "step": 22592 - }, - { - "epoch": 0.58, - "learning_rate": 1.8638265217340854e-06, - "loss": 1.0225, - "step": 22593 - }, - { - "epoch": 0.58, - "learning_rate": 1.8638125813225521e-06, - "loss": 0.9961, - "step": 22594 - }, - { - "epoch": 0.58, - "learning_rate": 1.8637986402496373e-06, - "loss": 0.6484, - "step": 22595 - }, - { - "epoch": 0.58, - "learning_rate": 1.8637846985153516e-06, - "loss": 0.9307, - "step": 22596 - }, - { - "epoch": 0.58, - "learning_rate": 1.8637707561197057e-06, - "loss": 0.6343, - "step": 22597 - }, - { - "epoch": 0.58, - "learning_rate": 1.8637568130627103e-06, - "loss": 0.917, - "step": 22598 - }, - { - "epoch": 0.58, - "learning_rate": 1.863742869344376e-06, - "loss": 0.6523, - "step": 22599 - }, - { - "epoch": 0.58, - "learning_rate": 1.8637289249647137e-06, - "loss": 0.9346, - "step": 22600 - }, - { - "epoch": 0.58, - "learning_rate": 1.8637149799237335e-06, - "loss": 0.9746, - "step": 22601 - }, - { - "epoch": 0.58, - "learning_rate": 1.8637010342214466e-06, - "loss": 0.7397, - "step": 22602 - }, - { - "epoch": 0.58, - "learning_rate": 1.8636870878578636e-06, - "loss": 0.6698, - "step": 22603 - }, - { - "epoch": 0.58, - "learning_rate": 1.8636731408329949e-06, - "loss": 0.8306, - "step": 22604 - }, - { - "epoch": 0.58, - "learning_rate": 1.8636591931468515e-06, - "loss": 0.8594, - "step": 22605 - }, - { - "epoch": 0.58, - "learning_rate": 1.8636452447994441e-06, - "loss": 1.0771, - "step": 22606 - }, - { - "epoch": 0.58, - "learning_rate": 1.8636312957907831e-06, - "loss": 0.7781, - "step": 22607 - }, - { - "epoch": 0.58, - "learning_rate": 1.8636173461208795e-06, - "loss": 0.8828, - "step": 22608 - }, - { - "epoch": 0.58, - "learning_rate": 1.8636033957897434e-06, - "loss": 0.7021, - "step": 22609 - }, - { - "epoch": 0.58, - "learning_rate": 1.8635894447973863e-06, - "loss": 0.7715, - "step": 22610 - }, - { - "epoch": 0.58, - "learning_rate": 1.8635754931438183e-06, - "loss": 0.8057, - "step": 22611 - }, - { - "epoch": 0.58, - "learning_rate": 1.8635615408290503e-06, - "loss": 0.8875, - "step": 22612 - }, - { - "epoch": 0.58, - "learning_rate": 1.863547587853093e-06, - "loss": 0.7139, - "step": 22613 - }, - { - "epoch": 0.58, - "learning_rate": 1.8635336342159568e-06, - "loss": 1.0371, - "step": 22614 - }, - { - "epoch": 0.58, - "learning_rate": 1.863519679917653e-06, - "loss": 0.792, - "step": 22615 - }, - { - "epoch": 0.58, - "learning_rate": 1.8635057249581917e-06, - "loss": 0.7739, - "step": 22616 - }, - { - "epoch": 0.58, - "learning_rate": 1.8634917693375836e-06, - "loss": 0.9062, - "step": 22617 - }, - { - "epoch": 0.58, - "learning_rate": 1.8634778130558397e-06, - "loss": 0.7666, - "step": 22618 - }, - { - "epoch": 0.58, - "learning_rate": 1.8634638561129705e-06, - "loss": 1.0566, - "step": 22619 - }, - { - "epoch": 0.58, - "learning_rate": 1.8634498985089867e-06, - "loss": 0.957, - "step": 22620 - }, - { - "epoch": 0.58, - "learning_rate": 1.863435940243899e-06, - "loss": 0.6963, - "step": 22621 - }, - { - "epoch": 0.58, - "learning_rate": 1.8634219813177183e-06, - "loss": 0.873, - "step": 22622 - }, - { - "epoch": 0.58, - "learning_rate": 1.863408021730455e-06, - "loss": 0.9316, - "step": 22623 - }, - { - "epoch": 0.58, - "learning_rate": 1.8633940614821197e-06, - "loss": 0.9072, - "step": 22624 - }, - { - "epoch": 0.58, - "learning_rate": 1.8633801005727235e-06, - "loss": 0.8291, - "step": 22625 - }, - { - "epoch": 0.58, - "learning_rate": 1.8633661390022767e-06, - "loss": 1.0459, - "step": 22626 - }, - { - "epoch": 0.58, - "learning_rate": 1.8633521767707902e-06, - "loss": 0.7603, - "step": 22627 - }, - { - "epoch": 0.58, - "learning_rate": 1.8633382138782747e-06, - "loss": 0.7007, - "step": 22628 - }, - { - "epoch": 0.58, - "learning_rate": 1.8633242503247409e-06, - "loss": 0.96, - "step": 22629 - }, - { - "epoch": 0.58, - "learning_rate": 1.863310286110199e-06, - "loss": 1.0293, - "step": 22630 - }, - { - "epoch": 0.58, - "learning_rate": 1.8632963212346604e-06, - "loss": 0.9053, - "step": 22631 - }, - { - "epoch": 0.58, - "learning_rate": 1.8632823556981356e-06, - "loss": 0.9434, - "step": 22632 - }, - { - "epoch": 0.58, - "learning_rate": 1.8632683895006348e-06, - "loss": 0.7729, - "step": 22633 - }, - { - "epoch": 0.58, - "learning_rate": 1.8632544226421696e-06, - "loss": 0.8965, - "step": 22634 - }, - { - "epoch": 0.58, - "learning_rate": 1.8632404551227498e-06, - "loss": 1.0459, - "step": 22635 - }, - { - "epoch": 0.58, - "learning_rate": 1.8632264869423868e-06, - "loss": 0.9219, - "step": 22636 - }, - { - "epoch": 0.58, - "learning_rate": 1.8632125181010907e-06, - "loss": 0.8184, - "step": 22637 - }, - { - "epoch": 0.58, - "learning_rate": 1.8631985485988727e-06, - "loss": 1.0283, - "step": 22638 - }, - { - "epoch": 0.58, - "learning_rate": 1.8631845784357432e-06, - "loss": 1.0674, - "step": 22639 - }, - { - "epoch": 0.58, - "learning_rate": 1.8631706076117128e-06, - "loss": 0.915, - "step": 22640 - }, - { - "epoch": 0.58, - "learning_rate": 1.8631566361267926e-06, - "loss": 0.9062, - "step": 22641 - }, - { - "epoch": 0.58, - "learning_rate": 1.8631426639809928e-06, - "loss": 0.7949, - "step": 22642 - }, - { - "epoch": 0.58, - "learning_rate": 1.8631286911743245e-06, - "loss": 0.7578, - "step": 22643 - }, - { - "epoch": 0.58, - "learning_rate": 1.8631147177067983e-06, - "loss": 0.7715, - "step": 22644 - }, - { - "epoch": 0.58, - "learning_rate": 1.8631007435784247e-06, - "loss": 0.9189, - "step": 22645 - }, - { - "epoch": 0.58, - "learning_rate": 1.8630867687892145e-06, - "loss": 0.8203, - "step": 22646 - }, - { - "epoch": 0.58, - "learning_rate": 1.8630727933391786e-06, - "loss": 0.7202, - "step": 22647 - }, - { - "epoch": 0.58, - "learning_rate": 1.8630588172283275e-06, - "loss": 0.8467, - "step": 22648 - }, - { - "epoch": 0.58, - "learning_rate": 1.863044840456672e-06, - "loss": 0.769, - "step": 22649 - }, - { - "epoch": 0.58, - "learning_rate": 1.8630308630242224e-06, - "loss": 0.8706, - "step": 22650 - }, - { - "epoch": 0.58, - "learning_rate": 1.8630168849309903e-06, - "loss": 0.8643, - "step": 22651 - }, - { - "epoch": 0.58, - "learning_rate": 1.8630029061769854e-06, - "loss": 0.9482, - "step": 22652 - }, - { - "epoch": 0.58, - "learning_rate": 1.862988926762219e-06, - "loss": 1.0322, - "step": 22653 - }, - { - "epoch": 0.58, - "learning_rate": 1.8629749466867018e-06, - "loss": 0.7402, - "step": 22654 - }, - { - "epoch": 0.58, - "learning_rate": 1.8629609659504442e-06, - "loss": 0.9111, - "step": 22655 - }, - { - "epoch": 0.58, - "learning_rate": 1.8629469845534574e-06, - "loss": 0.9697, - "step": 22656 - }, - { - "epoch": 0.58, - "learning_rate": 1.8629330024957515e-06, - "loss": 0.8799, - "step": 22657 - }, - { - "epoch": 0.58, - "learning_rate": 1.8629190197773372e-06, - "loss": 0.7725, - "step": 22658 - }, - { - "epoch": 0.58, - "learning_rate": 1.862905036398226e-06, - "loss": 0.6572, - "step": 22659 - }, - { - "epoch": 0.58, - "learning_rate": 1.8628910523584278e-06, - "loss": 0.9482, - "step": 22660 - }, - { - "epoch": 0.58, - "learning_rate": 1.8628770676579537e-06, - "loss": 0.5835, - "step": 22661 - }, - { - "epoch": 0.58, - "learning_rate": 1.862863082296814e-06, - "loss": 0.8857, - "step": 22662 - }, - { - "epoch": 0.58, - "learning_rate": 1.8628490962750201e-06, - "loss": 0.9531, - "step": 22663 - }, - { - "epoch": 0.58, - "learning_rate": 1.8628351095925825e-06, - "loss": 1.0977, - "step": 22664 - }, - { - "epoch": 0.58, - "learning_rate": 1.862821122249511e-06, - "loss": 0.7144, - "step": 22665 - }, - { - "epoch": 0.58, - "learning_rate": 1.8628071342458179e-06, - "loss": 0.7793, - "step": 22666 - }, - { - "epoch": 0.58, - "learning_rate": 1.8627931455815125e-06, - "loss": 0.8125, - "step": 22667 - }, - { - "epoch": 0.58, - "learning_rate": 1.8627791562566063e-06, - "loss": 0.8394, - "step": 22668 - }, - { - "epoch": 0.58, - "learning_rate": 1.8627651662711094e-06, - "loss": 1.0801, - "step": 22669 - }, - { - "epoch": 0.58, - "learning_rate": 1.8627511756250334e-06, - "loss": 0.9785, - "step": 22670 - }, - { - "epoch": 0.58, - "learning_rate": 1.8627371843183882e-06, - "loss": 0.8086, - "step": 22671 - }, - { - "epoch": 0.58, - "learning_rate": 1.8627231923511845e-06, - "loss": 0.9121, - "step": 22672 - }, - { - "epoch": 0.58, - "learning_rate": 1.8627091997234339e-06, - "loss": 0.8613, - "step": 22673 - }, - { - "epoch": 0.58, - "learning_rate": 1.8626952064351462e-06, - "loss": 0.7048, - "step": 22674 - }, - { - "epoch": 0.58, - "learning_rate": 1.8626812124863327e-06, - "loss": 0.9697, - "step": 22675 - }, - { - "epoch": 0.58, - "learning_rate": 1.8626672178770035e-06, - "loss": 1.0293, - "step": 22676 - }, - { - "epoch": 0.58, - "learning_rate": 1.86265322260717e-06, - "loss": 0.8379, - "step": 22677 - }, - { - "epoch": 0.58, - "learning_rate": 1.8626392266768424e-06, - "loss": 0.9004, - "step": 22678 - }, - { - "epoch": 0.58, - "learning_rate": 1.8626252300860319e-06, - "loss": 0.7383, - "step": 22679 - }, - { - "epoch": 0.58, - "learning_rate": 1.8626112328347485e-06, - "loss": 0.8281, - "step": 22680 - }, - { - "epoch": 0.58, - "learning_rate": 1.8625972349230036e-06, - "loss": 0.7178, - "step": 22681 - }, - { - "epoch": 0.58, - "learning_rate": 1.8625832363508075e-06, - "loss": 0.8232, - "step": 22682 - }, - { - "epoch": 0.58, - "learning_rate": 1.8625692371181713e-06, - "loss": 0.791, - "step": 22683 - }, - { - "epoch": 0.58, - "learning_rate": 1.8625552372251057e-06, - "loss": 0.9248, - "step": 22684 - }, - { - "epoch": 0.58, - "learning_rate": 1.8625412366716207e-06, - "loss": 0.7627, - "step": 22685 - }, - { - "epoch": 0.58, - "learning_rate": 1.8625272354577279e-06, - "loss": 1.0791, - "step": 22686 - }, - { - "epoch": 0.58, - "learning_rate": 1.8625132335834376e-06, - "loss": 0.918, - "step": 22687 - }, - { - "epoch": 0.58, - "learning_rate": 1.8624992310487601e-06, - "loss": 0.7725, - "step": 22688 - }, - { - "epoch": 0.58, - "learning_rate": 1.8624852278537074e-06, - "loss": 0.8359, - "step": 22689 - }, - { - "epoch": 0.58, - "learning_rate": 1.862471223998289e-06, - "loss": 0.8027, - "step": 22690 - }, - { - "epoch": 0.58, - "learning_rate": 1.8624572194825156e-06, - "loss": 0.9541, - "step": 22691 - }, - { - "epoch": 0.58, - "learning_rate": 1.8624432143063991e-06, - "loss": 0.7383, - "step": 22692 - }, - { - "epoch": 0.58, - "learning_rate": 1.8624292084699491e-06, - "loss": 1.0918, - "step": 22693 - }, - { - "epoch": 0.58, - "learning_rate": 1.8624152019731766e-06, - "loss": 0.8789, - "step": 22694 - }, - { - "epoch": 0.58, - "learning_rate": 1.8624011948160928e-06, - "loss": 0.8018, - "step": 22695 - }, - { - "epoch": 0.58, - "learning_rate": 1.862387186998708e-06, - "loss": 0.9102, - "step": 22696 - }, - { - "epoch": 0.58, - "learning_rate": 1.862373178521033e-06, - "loss": 1.1152, - "step": 22697 - }, - { - "epoch": 0.58, - "learning_rate": 1.8623591693830782e-06, - "loss": 0.6367, - "step": 22698 - }, - { - "epoch": 0.58, - "learning_rate": 1.862345159584855e-06, - "loss": 0.812, - "step": 22699 - }, - { - "epoch": 0.58, - "learning_rate": 1.8623311491263735e-06, - "loss": 0.8398, - "step": 22700 - }, - { - "epoch": 0.58, - "learning_rate": 1.8623171380076447e-06, - "loss": 0.8, - "step": 22701 - }, - { - "epoch": 0.58, - "learning_rate": 1.8623031262286795e-06, - "loss": 0.9082, - "step": 22702 - }, - { - "epoch": 0.58, - "learning_rate": 1.8622891137894882e-06, - "loss": 0.8838, - "step": 22703 - }, - { - "epoch": 0.58, - "learning_rate": 1.8622751006900818e-06, - "loss": 0.7891, - "step": 22704 - }, - { - "epoch": 0.58, - "learning_rate": 1.8622610869304714e-06, - "loss": 0.7954, - "step": 22705 - }, - { - "epoch": 0.58, - "learning_rate": 1.862247072510667e-06, - "loss": 0.7715, - "step": 22706 - }, - { - "epoch": 0.58, - "learning_rate": 1.8622330574306797e-06, - "loss": 0.7944, - "step": 22707 - }, - { - "epoch": 0.58, - "learning_rate": 1.8622190416905204e-06, - "loss": 0.8213, - "step": 22708 - }, - { - "epoch": 0.58, - "learning_rate": 1.8622050252901993e-06, - "loss": 0.75, - "step": 22709 - }, - { - "epoch": 0.58, - "learning_rate": 1.8621910082297275e-06, - "loss": 1.0059, - "step": 22710 - }, - { - "epoch": 0.58, - "learning_rate": 1.8621769905091158e-06, - "loss": 1.1211, - "step": 22711 - }, - { - "epoch": 0.58, - "learning_rate": 1.8621629721283747e-06, - "loss": 1.0488, - "step": 22712 - }, - { - "epoch": 0.58, - "learning_rate": 1.8621489530875154e-06, - "loss": 0.8477, - "step": 22713 - }, - { - "epoch": 0.58, - "learning_rate": 1.8621349333865478e-06, - "loss": 0.7832, - "step": 22714 - }, - { - "epoch": 0.58, - "learning_rate": 1.8621209130254835e-06, - "loss": 1.0068, - "step": 22715 - }, - { - "epoch": 0.58, - "learning_rate": 1.8621068920043327e-06, - "loss": 0.916, - "step": 22716 - }, - { - "epoch": 0.58, - "learning_rate": 1.8620928703231065e-06, - "loss": 0.7227, - "step": 22717 - }, - { - "epoch": 0.58, - "learning_rate": 1.8620788479818153e-06, - "loss": 0.8271, - "step": 22718 - }, - { - "epoch": 0.58, - "learning_rate": 1.8620648249804699e-06, - "loss": 0.7578, - "step": 22719 - }, - { - "epoch": 0.58, - "learning_rate": 1.862050801319081e-06, - "loss": 1.0068, - "step": 22720 - }, - { - "epoch": 0.58, - "learning_rate": 1.8620367769976597e-06, - "loss": 0.8564, - "step": 22721 - }, - { - "epoch": 0.58, - "learning_rate": 1.862022752016216e-06, - "loss": 0.7485, - "step": 22722 - }, - { - "epoch": 0.58, - "learning_rate": 1.8620087263747617e-06, - "loss": 0.9893, - "step": 22723 - }, - { - "epoch": 0.58, - "learning_rate": 1.8619947000733066e-06, - "loss": 0.8838, - "step": 22724 - }, - { - "epoch": 0.58, - "learning_rate": 1.8619806731118621e-06, - "loss": 0.9688, - "step": 22725 - }, - { - "epoch": 0.58, - "learning_rate": 1.8619666454904384e-06, - "loss": 0.8418, - "step": 22726 - }, - { - "epoch": 0.58, - "learning_rate": 1.8619526172090466e-06, - "loss": 0.9023, - "step": 22727 - }, - { - "epoch": 0.58, - "learning_rate": 1.861938588267697e-06, - "loss": 0.5967, - "step": 22728 - }, - { - "epoch": 0.58, - "learning_rate": 1.861924558666401e-06, - "loss": 0.8425, - "step": 22729 - }, - { - "epoch": 0.58, - "learning_rate": 1.8619105284051689e-06, - "loss": 0.6704, - "step": 22730 - }, - { - "epoch": 0.58, - "learning_rate": 1.8618964974840114e-06, - "loss": 0.9092, - "step": 22731 - }, - { - "epoch": 0.58, - "learning_rate": 1.8618824659029398e-06, - "loss": 0.7568, - "step": 22732 - }, - { - "epoch": 0.58, - "learning_rate": 1.861868433661964e-06, - "loss": 0.8022, - "step": 22733 - }, - { - "epoch": 0.58, - "learning_rate": 1.8618544007610952e-06, - "loss": 0.9062, - "step": 22734 - }, - { - "epoch": 0.58, - "learning_rate": 1.8618403672003442e-06, - "loss": 1.0234, - "step": 22735 - }, - { - "epoch": 0.58, - "learning_rate": 1.8618263329797216e-06, - "loss": 1.0117, - "step": 22736 - }, - { - "epoch": 0.58, - "learning_rate": 1.8618122980992384e-06, - "loss": 0.8037, - "step": 22737 - }, - { - "epoch": 0.58, - "learning_rate": 1.8617982625589051e-06, - "loss": 0.75, - "step": 22738 - }, - { - "epoch": 0.58, - "learning_rate": 1.8617842263587323e-06, - "loss": 0.875, - "step": 22739 - }, - { - "epoch": 0.58, - "learning_rate": 1.8617701894987312e-06, - "loss": 1.0498, - "step": 22740 - }, - { - "epoch": 0.58, - "learning_rate": 1.8617561519789121e-06, - "loss": 0.832, - "step": 22741 - }, - { - "epoch": 0.58, - "learning_rate": 1.861742113799286e-06, - "loss": 0.9082, - "step": 22742 - }, - { - "epoch": 0.58, - "learning_rate": 1.8617280749598633e-06, - "loss": 0.8848, - "step": 22743 - }, - { - "epoch": 0.58, - "learning_rate": 1.8617140354606558e-06, - "loss": 0.9619, - "step": 22744 - }, - { - "epoch": 0.58, - "learning_rate": 1.8616999953016727e-06, - "loss": 0.9033, - "step": 22745 - }, - { - "epoch": 0.58, - "learning_rate": 1.861685954482926e-06, - "loss": 0.8389, - "step": 22746 - }, - { - "epoch": 0.58, - "learning_rate": 1.861671913004426e-06, - "loss": 0.9033, - "step": 22747 - }, - { - "epoch": 0.58, - "learning_rate": 1.861657870866183e-06, - "loss": 0.9902, - "step": 22748 - }, - { - "epoch": 0.58, - "learning_rate": 1.8616438280682084e-06, - "loss": 0.8809, - "step": 22749 - }, - { - "epoch": 0.58, - "learning_rate": 1.861629784610513e-06, - "loss": 0.7412, - "step": 22750 - }, - { - "epoch": 0.58, - "learning_rate": 1.861615740493107e-06, - "loss": 0.877, - "step": 22751 - }, - { - "epoch": 0.58, - "learning_rate": 1.8616016957160014e-06, - "loss": 0.8506, - "step": 22752 - }, - { - "epoch": 0.58, - "learning_rate": 1.8615876502792075e-06, - "loss": 0.9512, - "step": 22753 - }, - { - "epoch": 0.58, - "learning_rate": 1.861573604182735e-06, - "loss": 0.9805, - "step": 22754 - }, - { - "epoch": 0.58, - "learning_rate": 1.8615595574265953e-06, - "loss": 0.8955, - "step": 22755 - }, - { - "epoch": 0.58, - "learning_rate": 1.8615455100107993e-06, - "loss": 0.7588, - "step": 22756 - }, - { - "epoch": 0.58, - "learning_rate": 1.8615314619353573e-06, - "loss": 0.6196, - "step": 22757 - }, - { - "epoch": 0.58, - "learning_rate": 1.8615174132002801e-06, - "loss": 0.6995, - "step": 22758 - }, - { - "epoch": 0.58, - "learning_rate": 1.8615033638055793e-06, - "loss": 0.8193, - "step": 22759 - }, - { - "epoch": 0.58, - "learning_rate": 1.8614893137512644e-06, - "loss": 0.8892, - "step": 22760 - }, - { - "epoch": 0.58, - "learning_rate": 1.861475263037347e-06, - "loss": 0.6191, - "step": 22761 - }, - { - "epoch": 0.58, - "learning_rate": 1.8614612116638374e-06, - "loss": 0.6011, - "step": 22762 - }, - { - "epoch": 0.58, - "learning_rate": 1.8614471596307466e-06, - "loss": 0.8496, - "step": 22763 - }, - { - "epoch": 0.58, - "learning_rate": 1.8614331069380855e-06, - "loss": 0.8418, - "step": 22764 - }, - { - "epoch": 0.58, - "learning_rate": 1.8614190535858648e-06, - "loss": 0.7656, - "step": 22765 - }, - { - "epoch": 0.58, - "learning_rate": 1.861404999574095e-06, - "loss": 0.9761, - "step": 22766 - }, - { - "epoch": 0.58, - "learning_rate": 1.8613909449027866e-06, - "loss": 0.7822, - "step": 22767 - }, - { - "epoch": 0.58, - "learning_rate": 1.861376889571951e-06, - "loss": 0.7383, - "step": 22768 - }, - { - "epoch": 0.58, - "learning_rate": 1.861362833581599e-06, - "loss": 0.8945, - "step": 22769 - }, - { - "epoch": 0.58, - "learning_rate": 1.8613487769317407e-06, - "loss": 0.6841, - "step": 22770 - }, - { - "epoch": 0.58, - "learning_rate": 1.8613347196223877e-06, - "loss": 0.9678, - "step": 22771 - }, - { - "epoch": 0.58, - "learning_rate": 1.8613206616535498e-06, - "loss": 0.8662, - "step": 22772 - }, - { - "epoch": 0.58, - "learning_rate": 1.8613066030252384e-06, - "loss": 0.8652, - "step": 22773 - }, - { - "epoch": 0.58, - "learning_rate": 1.8612925437374644e-06, - "loss": 0.8198, - "step": 22774 - }, - { - "epoch": 0.58, - "learning_rate": 1.8612784837902382e-06, - "loss": 0.6934, - "step": 22775 - }, - { - "epoch": 0.58, - "learning_rate": 1.8612644231835706e-06, - "loss": 1.0205, - "step": 22776 - }, - { - "epoch": 0.58, - "learning_rate": 1.8612503619174723e-06, - "loss": 0.877, - "step": 22777 - }, - { - "epoch": 0.58, - "learning_rate": 1.8612362999919547e-06, - "loss": 0.8652, - "step": 22778 - }, - { - "epoch": 0.58, - "learning_rate": 1.8612222374070274e-06, - "loss": 0.9971, - "step": 22779 - }, - { - "epoch": 0.58, - "learning_rate": 1.8612081741627024e-06, - "loss": 0.8467, - "step": 22780 - }, - { - "epoch": 0.58, - "learning_rate": 1.8611941102589897e-06, - "loss": 1.082, - "step": 22781 - }, - { - "epoch": 0.58, - "learning_rate": 1.8611800456958998e-06, - "loss": 0.8362, - "step": 22782 - }, - { - "epoch": 0.58, - "learning_rate": 1.8611659804734447e-06, - "loss": 0.8066, - "step": 22783 - }, - { - "epoch": 0.58, - "learning_rate": 1.8611519145916338e-06, - "loss": 0.8994, - "step": 22784 - }, - { - "epoch": 0.58, - "learning_rate": 1.8611378480504789e-06, - "loss": 0.6802, - "step": 22785 - }, - { - "epoch": 0.58, - "learning_rate": 1.8611237808499903e-06, - "loss": 1.0205, - "step": 22786 - }, - { - "epoch": 0.58, - "learning_rate": 1.8611097129901787e-06, - "loss": 0.9648, - "step": 22787 - }, - { - "epoch": 0.58, - "learning_rate": 1.8610956444710549e-06, - "loss": 0.8955, - "step": 22788 - }, - { - "epoch": 0.58, - "learning_rate": 1.8610815752926298e-06, - "loss": 1.0342, - "step": 22789 - }, - { - "epoch": 0.58, - "learning_rate": 1.8610675054549143e-06, - "loss": 0.7158, - "step": 22790 - }, - { - "epoch": 0.58, - "learning_rate": 1.861053434957919e-06, - "loss": 1.042, - "step": 22791 - }, - { - "epoch": 0.58, - "learning_rate": 1.8610393638016544e-06, - "loss": 0.8418, - "step": 22792 - }, - { - "epoch": 0.58, - "learning_rate": 1.8610252919861319e-06, - "loss": 1.0967, - "step": 22793 - }, - { - "epoch": 0.58, - "learning_rate": 1.8610112195113616e-06, - "loss": 0.8965, - "step": 22794 - }, - { - "epoch": 0.58, - "learning_rate": 1.8609971463773547e-06, - "loss": 0.8359, - "step": 22795 - }, - { - "epoch": 0.58, - "learning_rate": 1.860983072584122e-06, - "loss": 0.9229, - "step": 22796 - }, - { - "epoch": 0.58, - "learning_rate": 1.860968998131674e-06, - "loss": 0.7832, - "step": 22797 - }, - { - "epoch": 0.58, - "learning_rate": 1.8609549230200217e-06, - "loss": 1.0293, - "step": 22798 - }, - { - "epoch": 0.58, - "learning_rate": 1.8609408472491758e-06, - "loss": 0.9746, - "step": 22799 - }, - { - "epoch": 0.58, - "learning_rate": 1.860926770819147e-06, - "loss": 0.8184, - "step": 22800 - }, - { - "epoch": 0.58, - "learning_rate": 1.8609126937299463e-06, - "loss": 0.7227, - "step": 22801 - }, - { - "epoch": 0.58, - "learning_rate": 1.8608986159815846e-06, - "loss": 1.0479, - "step": 22802 - }, - { - "epoch": 0.58, - "learning_rate": 1.8608845375740719e-06, - "loss": 0.8203, - "step": 22803 - }, - { - "epoch": 0.58, - "learning_rate": 1.8608704585074196e-06, - "loss": 0.7214, - "step": 22804 - }, - { - "epoch": 0.58, - "learning_rate": 1.8608563787816384e-06, - "loss": 0.71, - "step": 22805 - }, - { - "epoch": 0.58, - "learning_rate": 1.8608422983967392e-06, - "loss": 0.8379, - "step": 22806 - }, - { - "epoch": 0.58, - "learning_rate": 1.8608282173527323e-06, - "loss": 0.9326, - "step": 22807 - }, - { - "epoch": 0.58, - "learning_rate": 1.8608141356496291e-06, - "loss": 1.0254, - "step": 22808 - }, - { - "epoch": 0.58, - "learning_rate": 1.8608000532874401e-06, - "loss": 0.9814, - "step": 22809 - }, - { - "epoch": 0.58, - "learning_rate": 1.860785970266176e-06, - "loss": 0.8359, - "step": 22810 - }, - { - "epoch": 0.58, - "learning_rate": 1.860771886585848e-06, - "loss": 0.7842, - "step": 22811 - }, - { - "epoch": 0.58, - "learning_rate": 1.8607578022464661e-06, - "loss": 0.8594, - "step": 22812 - }, - { - "epoch": 0.58, - "learning_rate": 1.8607437172480416e-06, - "loss": 0.6685, - "step": 22813 - }, - { - "epoch": 0.58, - "learning_rate": 1.8607296315905853e-06, - "loss": 0.8682, - "step": 22814 - }, - { - "epoch": 0.58, - "learning_rate": 1.860715545274108e-06, - "loss": 0.9326, - "step": 22815 - }, - { - "epoch": 0.58, - "learning_rate": 1.8607014582986202e-06, - "loss": 0.7705, - "step": 22816 - }, - { - "epoch": 0.58, - "learning_rate": 1.860687370664133e-06, - "loss": 0.8154, - "step": 22817 - }, - { - "epoch": 0.58, - "learning_rate": 1.860673282370657e-06, - "loss": 0.8975, - "step": 22818 - }, - { - "epoch": 0.58, - "learning_rate": 1.860659193418203e-06, - "loss": 0.6465, - "step": 22819 - }, - { - "epoch": 0.58, - "learning_rate": 1.8606451038067818e-06, - "loss": 0.9141, - "step": 22820 - }, - { - "epoch": 0.58, - "learning_rate": 1.8606310135364046e-06, - "loss": 0.9209, - "step": 22821 - }, - { - "epoch": 0.58, - "learning_rate": 1.8606169226070812e-06, - "loss": 0.8154, - "step": 22822 - }, - { - "epoch": 0.58, - "learning_rate": 1.8606028310188232e-06, - "loss": 1.1621, - "step": 22823 - }, - { - "epoch": 0.58, - "learning_rate": 1.8605887387716416e-06, - "loss": 0.981, - "step": 22824 - }, - { - "epoch": 0.59, - "learning_rate": 1.8605746458655462e-06, - "loss": 0.8926, - "step": 22825 - }, - { - "epoch": 0.59, - "learning_rate": 1.8605605523005488e-06, - "loss": 0.9824, - "step": 22826 - }, - { - "epoch": 0.59, - "learning_rate": 1.8605464580766594e-06, - "loss": 0.8945, - "step": 22827 - }, - { - "epoch": 0.59, - "learning_rate": 1.8605323631938892e-06, - "loss": 0.9121, - "step": 22828 - }, - { - "epoch": 0.59, - "learning_rate": 1.8605182676522491e-06, - "loss": 0.877, - "step": 22829 - }, - { - "epoch": 0.59, - "learning_rate": 1.8605041714517498e-06, - "loss": 0.8057, - "step": 22830 - }, - { - "epoch": 0.59, - "learning_rate": 1.860490074592402e-06, - "loss": 0.9326, - "step": 22831 - }, - { - "epoch": 0.59, - "learning_rate": 1.8604759770742162e-06, - "loss": 1.1182, - "step": 22832 - }, - { - "epoch": 0.59, - "learning_rate": 1.8604618788972038e-06, - "loss": 0.8821, - "step": 22833 - }, - { - "epoch": 0.59, - "learning_rate": 1.860447780061375e-06, - "loss": 0.7881, - "step": 22834 - }, - { - "epoch": 0.59, - "learning_rate": 1.8604336805667413e-06, - "loss": 0.8032, - "step": 22835 - }, - { - "epoch": 0.59, - "learning_rate": 1.860419580413313e-06, - "loss": 0.8516, - "step": 22836 - }, - { - "epoch": 0.59, - "learning_rate": 1.8604054796011008e-06, - "loss": 0.9844, - "step": 22837 - }, - { - "epoch": 0.59, - "learning_rate": 1.860391378130116e-06, - "loss": 1.0479, - "step": 22838 - }, - { - "epoch": 0.59, - "learning_rate": 1.8603772760003688e-06, - "loss": 0.9873, - "step": 22839 - }, - { - "epoch": 0.59, - "learning_rate": 1.8603631732118704e-06, - "loss": 0.6646, - "step": 22840 - }, - { - "epoch": 0.59, - "learning_rate": 1.8603490697646313e-06, - "loss": 0.8135, - "step": 22841 - }, - { - "epoch": 0.59, - "learning_rate": 1.8603349656586627e-06, - "loss": 1.0781, - "step": 22842 - }, - { - "epoch": 0.59, - "learning_rate": 1.8603208608939752e-06, - "loss": 1.0156, - "step": 22843 - }, - { - "epoch": 0.59, - "learning_rate": 1.8603067554705794e-06, - "loss": 0.7871, - "step": 22844 - }, - { - "epoch": 0.59, - "learning_rate": 1.8602926493884863e-06, - "loss": 0.8535, - "step": 22845 - }, - { - "epoch": 0.59, - "learning_rate": 1.8602785426477067e-06, - "loss": 0.8428, - "step": 22846 - }, - { - "epoch": 0.59, - "learning_rate": 1.8602644352482514e-06, - "loss": 0.8701, - "step": 22847 - }, - { - "epoch": 0.59, - "learning_rate": 1.860250327190131e-06, - "loss": 0.6709, - "step": 22848 - }, - { - "epoch": 0.59, - "learning_rate": 1.8602362184733566e-06, - "loss": 0.7236, - "step": 22849 - }, - { - "epoch": 0.59, - "learning_rate": 1.860222109097939e-06, - "loss": 0.8457, - "step": 22850 - }, - { - "epoch": 0.59, - "learning_rate": 1.860207999063889e-06, - "loss": 1.1279, - "step": 22851 - }, - { - "epoch": 0.59, - "learning_rate": 1.8601938883712171e-06, - "loss": 0.8315, - "step": 22852 - }, - { - "epoch": 0.59, - "learning_rate": 1.8601797770199343e-06, - "loss": 0.7271, - "step": 22853 - }, - { - "epoch": 0.59, - "learning_rate": 1.8601656650100512e-06, - "loss": 0.7314, - "step": 22854 - }, - { - "epoch": 0.59, - "learning_rate": 1.8601515523415792e-06, - "loss": 0.8462, - "step": 22855 - }, - { - "epoch": 0.59, - "learning_rate": 1.8601374390145285e-06, - "loss": 0.6802, - "step": 22856 - }, - { - "epoch": 0.59, - "learning_rate": 1.86012332502891e-06, - "loss": 1.1279, - "step": 22857 - }, - { - "epoch": 0.59, - "learning_rate": 1.8601092103847348e-06, - "loss": 0.9619, - "step": 22858 - }, - { - "epoch": 0.59, - "learning_rate": 1.8600950950820136e-06, - "loss": 0.8369, - "step": 22859 - }, - { - "epoch": 0.59, - "learning_rate": 1.8600809791207567e-06, - "loss": 0.9346, - "step": 22860 - }, - { - "epoch": 0.59, - "learning_rate": 1.8600668625009758e-06, - "loss": 1.0029, - "step": 22861 - }, - { - "epoch": 0.59, - "learning_rate": 1.8600527452226813e-06, - "loss": 1.1152, - "step": 22862 - }, - { - "epoch": 0.59, - "learning_rate": 1.8600386272858836e-06, - "loss": 0.9658, - "step": 22863 - }, - { - "epoch": 0.59, - "learning_rate": 1.8600245086905942e-06, - "loss": 0.7476, - "step": 22864 - }, - { - "epoch": 0.59, - "learning_rate": 1.8600103894368232e-06, - "loss": 0.9092, - "step": 22865 - }, - { - "epoch": 0.59, - "learning_rate": 1.859996269524582e-06, - "loss": 0.9707, - "step": 22866 - }, - { - "epoch": 0.59, - "learning_rate": 1.859982148953881e-06, - "loss": 0.9248, - "step": 22867 - }, - { - "epoch": 0.59, - "learning_rate": 1.8599680277247317e-06, - "loss": 0.8369, - "step": 22868 - }, - { - "epoch": 0.59, - "learning_rate": 1.8599539058371442e-06, - "loss": 0.7217, - "step": 22869 - }, - { - "epoch": 0.59, - "learning_rate": 1.8599397832911294e-06, - "loss": 1.0244, - "step": 22870 - }, - { - "epoch": 0.59, - "learning_rate": 1.8599256600866981e-06, - "loss": 0.8076, - "step": 22871 - }, - { - "epoch": 0.59, - "learning_rate": 1.8599115362238616e-06, - "loss": 0.8286, - "step": 22872 - }, - { - "epoch": 0.59, - "learning_rate": 1.8598974117026304e-06, - "loss": 1.0137, - "step": 22873 - }, - { - "epoch": 0.59, - "learning_rate": 1.859883286523015e-06, - "loss": 1.0098, - "step": 22874 - }, - { - "epoch": 0.59, - "learning_rate": 1.8598691606850268e-06, - "loss": 0.8613, - "step": 22875 - }, - { - "epoch": 0.59, - "learning_rate": 1.859855034188676e-06, - "loss": 1.124, - "step": 22876 - }, - { - "epoch": 0.59, - "learning_rate": 1.859840907033974e-06, - "loss": 0.8066, - "step": 22877 - }, - { - "epoch": 0.59, - "learning_rate": 1.8598267792209312e-06, - "loss": 0.9668, - "step": 22878 - }, - { - "epoch": 0.59, - "learning_rate": 1.8598126507495586e-06, - "loss": 0.9629, - "step": 22879 - }, - { - "epoch": 0.59, - "learning_rate": 1.859798521619867e-06, - "loss": 1.042, - "step": 22880 - }, - { - "epoch": 0.59, - "learning_rate": 1.8597843918318672e-06, - "loss": 0.7881, - "step": 22881 - }, - { - "epoch": 0.59, - "learning_rate": 1.8597702613855702e-06, - "loss": 0.9131, - "step": 22882 - }, - { - "epoch": 0.59, - "learning_rate": 1.8597561302809865e-06, - "loss": 0.9023, - "step": 22883 - }, - { - "epoch": 0.59, - "learning_rate": 1.8597419985181271e-06, - "loss": 0.9092, - "step": 22884 - }, - { - "epoch": 0.59, - "learning_rate": 1.8597278660970029e-06, - "loss": 0.791, - "step": 22885 - }, - { - "epoch": 0.59, - "learning_rate": 1.8597137330176243e-06, - "loss": 0.6963, - "step": 22886 - }, - { - "epoch": 0.59, - "learning_rate": 1.8596995992800025e-06, - "loss": 0.7522, - "step": 22887 - }, - { - "epoch": 0.59, - "learning_rate": 1.8596854648841482e-06, - "loss": 1.1123, - "step": 22888 - }, - { - "epoch": 0.59, - "learning_rate": 1.8596713298300726e-06, - "loss": 0.8379, - "step": 22889 - }, - { - "epoch": 0.59, - "learning_rate": 1.859657194117786e-06, - "loss": 0.6836, - "step": 22890 - }, - { - "epoch": 0.59, - "learning_rate": 1.8596430577472994e-06, - "loss": 1.2021, - "step": 22891 - }, - { - "epoch": 0.59, - "learning_rate": 1.8596289207186236e-06, - "loss": 0.9121, - "step": 22892 - }, - { - "epoch": 0.59, - "learning_rate": 1.8596147830317693e-06, - "loss": 0.9795, - "step": 22893 - }, - { - "epoch": 0.59, - "learning_rate": 1.8596006446867478e-06, - "loss": 0.9678, - "step": 22894 - }, - { - "epoch": 0.59, - "learning_rate": 1.8595865056835694e-06, - "loss": 0.9893, - "step": 22895 - }, - { - "epoch": 0.59, - "learning_rate": 1.8595723660222453e-06, - "loss": 0.9092, - "step": 22896 - }, - { - "epoch": 0.59, - "learning_rate": 1.859558225702786e-06, - "loss": 0.9014, - "step": 22897 - }, - { - "epoch": 0.59, - "learning_rate": 1.859544084725203e-06, - "loss": 0.791, - "step": 22898 - }, - { - "epoch": 0.59, - "learning_rate": 1.859529943089506e-06, - "loss": 0.9111, - "step": 22899 - }, - { - "epoch": 0.59, - "learning_rate": 1.8595158007957066e-06, - "loss": 0.9121, - "step": 22900 - }, - { - "epoch": 0.59, - "learning_rate": 1.8595016578438156e-06, - "loss": 1.0156, - "step": 22901 - }, - { - "epoch": 0.59, - "learning_rate": 1.8594875142338435e-06, - "loss": 0.7881, - "step": 22902 - }, - { - "epoch": 0.59, - "learning_rate": 1.8594733699658014e-06, - "loss": 0.6758, - "step": 22903 - }, - { - "epoch": 0.59, - "learning_rate": 1.8594592250397004e-06, - "loss": 0.7949, - "step": 22904 - }, - { - "epoch": 0.59, - "learning_rate": 1.8594450794555505e-06, - "loss": 0.8027, - "step": 22905 - }, - { - "epoch": 0.59, - "learning_rate": 1.8594309332133632e-06, - "loss": 0.8853, - "step": 22906 - }, - { - "epoch": 0.59, - "learning_rate": 1.8594167863131492e-06, - "loss": 0.917, - "step": 22907 - }, - { - "epoch": 0.59, - "learning_rate": 1.8594026387549194e-06, - "loss": 1.0391, - "step": 22908 - }, - { - "epoch": 0.59, - "learning_rate": 1.8593884905386843e-06, - "loss": 0.9541, - "step": 22909 - }, - { - "epoch": 0.59, - "learning_rate": 1.859374341664455e-06, - "loss": 0.6118, - "step": 22910 - }, - { - "epoch": 0.59, - "learning_rate": 1.8593601921322421e-06, - "loss": 0.7056, - "step": 22911 - }, - { - "epoch": 0.59, - "learning_rate": 1.859346041942057e-06, - "loss": 0.8813, - "step": 22912 - }, - { - "epoch": 0.59, - "learning_rate": 1.8593318910939098e-06, - "loss": 0.7695, - "step": 22913 - }, - { - "epoch": 0.59, - "learning_rate": 1.859317739587812e-06, - "loss": 0.8691, - "step": 22914 - }, - { - "epoch": 0.59, - "learning_rate": 1.8593035874237739e-06, - "loss": 0.7773, - "step": 22915 - }, - { - "epoch": 0.59, - "learning_rate": 1.8592894346018067e-06, - "loss": 0.8325, - "step": 22916 - }, - { - "epoch": 0.59, - "learning_rate": 1.859275281121921e-06, - "loss": 0.9062, - "step": 22917 - }, - { - "epoch": 0.59, - "learning_rate": 1.8592611269841277e-06, - "loss": 1.0859, - "step": 22918 - }, - { - "epoch": 0.59, - "learning_rate": 1.8592469721884378e-06, - "loss": 0.7725, - "step": 22919 - }, - { - "epoch": 0.59, - "learning_rate": 1.8592328167348618e-06, - "loss": 0.7632, - "step": 22920 - }, - { - "epoch": 0.59, - "learning_rate": 1.8592186606234108e-06, - "loss": 0.9883, - "step": 22921 - }, - { - "epoch": 0.59, - "learning_rate": 1.8592045038540958e-06, - "loss": 1.0332, - "step": 22922 - }, - { - "epoch": 0.59, - "learning_rate": 1.8591903464269273e-06, - "loss": 0.8066, - "step": 22923 - }, - { - "epoch": 0.59, - "learning_rate": 1.8591761883419162e-06, - "loss": 0.8652, - "step": 22924 - }, - { - "epoch": 0.59, - "learning_rate": 1.8591620295990733e-06, - "loss": 0.9883, - "step": 22925 - }, - { - "epoch": 0.59, - "learning_rate": 1.8591478701984098e-06, - "loss": 0.8613, - "step": 22926 - }, - { - "epoch": 0.59, - "learning_rate": 1.859133710139936e-06, - "loss": 0.7407, - "step": 22927 - }, - { - "epoch": 0.59, - "learning_rate": 1.8591195494236632e-06, - "loss": 0.7124, - "step": 22928 - }, - { - "epoch": 0.59, - "learning_rate": 1.8591053880496022e-06, - "loss": 0.6921, - "step": 22929 - }, - { - "epoch": 0.59, - "learning_rate": 1.8590912260177634e-06, - "loss": 0.6821, - "step": 22930 - }, - { - "epoch": 0.59, - "learning_rate": 1.859077063328158e-06, - "loss": 0.7617, - "step": 22931 - }, - { - "epoch": 0.59, - "learning_rate": 1.859062899980797e-06, - "loss": 0.876, - "step": 22932 - }, - { - "epoch": 0.59, - "learning_rate": 1.8590487359756909e-06, - "loss": 0.8682, - "step": 22933 - }, - { - "epoch": 0.59, - "learning_rate": 1.8590345713128506e-06, - "loss": 0.8813, - "step": 22934 - }, - { - "epoch": 0.59, - "learning_rate": 1.859020405992287e-06, - "loss": 0.875, - "step": 22935 - }, - { - "epoch": 0.59, - "learning_rate": 1.8590062400140113e-06, - "loss": 0.8564, - "step": 22936 - }, - { - "epoch": 0.59, - "learning_rate": 1.8589920733780338e-06, - "loss": 0.8213, - "step": 22937 - }, - { - "epoch": 0.59, - "learning_rate": 1.8589779060843656e-06, - "loss": 0.877, - "step": 22938 - }, - { - "epoch": 0.59, - "learning_rate": 1.8589637381330175e-06, - "loss": 0.8301, - "step": 22939 - }, - { - "epoch": 0.59, - "learning_rate": 1.8589495695240002e-06, - "loss": 0.5767, - "step": 22940 - }, - { - "epoch": 0.59, - "learning_rate": 1.8589354002573248e-06, - "loss": 0.8096, - "step": 22941 - }, - { - "epoch": 0.59, - "learning_rate": 1.8589212303330021e-06, - "loss": 0.8408, - "step": 22942 - }, - { - "epoch": 0.59, - "learning_rate": 1.858907059751043e-06, - "loss": 0.8135, - "step": 22943 - }, - { - "epoch": 0.59, - "learning_rate": 1.8588928885114581e-06, - "loss": 0.9854, - "step": 22944 - }, - { - "epoch": 0.59, - "learning_rate": 1.8588787166142587e-06, - "loss": 0.7891, - "step": 22945 - }, - { - "epoch": 0.59, - "learning_rate": 1.8588645440594552e-06, - "loss": 1.0781, - "step": 22946 - }, - { - "epoch": 0.59, - "learning_rate": 1.8588503708470584e-06, - "loss": 0.7791, - "step": 22947 - }, - { - "epoch": 0.59, - "learning_rate": 1.8588361969770795e-06, - "loss": 0.8721, - "step": 22948 - }, - { - "epoch": 0.59, - "learning_rate": 1.8588220224495292e-06, - "loss": 0.9717, - "step": 22949 - }, - { - "epoch": 0.59, - "learning_rate": 1.8588078472644186e-06, - "loss": 0.8132, - "step": 22950 - }, - { - "epoch": 0.59, - "learning_rate": 1.858793671421758e-06, - "loss": 0.793, - "step": 22951 - }, - { - "epoch": 0.59, - "learning_rate": 1.858779494921559e-06, - "loss": 0.8491, - "step": 22952 - }, - { - "epoch": 0.59, - "learning_rate": 1.8587653177638316e-06, - "loss": 1.0293, - "step": 22953 - }, - { - "epoch": 0.59, - "learning_rate": 1.8587511399485871e-06, - "loss": 0.8877, - "step": 22954 - }, - { - "epoch": 0.59, - "learning_rate": 1.8587369614758367e-06, - "loss": 0.8096, - "step": 22955 - }, - { - "epoch": 0.59, - "learning_rate": 1.8587227823455904e-06, - "loss": 1.0264, - "step": 22956 - }, - { - "epoch": 0.59, - "learning_rate": 1.85870860255786e-06, - "loss": 0.9307, - "step": 22957 - }, - { - "epoch": 0.59, - "learning_rate": 1.8586944221126558e-06, - "loss": 0.8555, - "step": 22958 - }, - { - "epoch": 0.59, - "learning_rate": 1.8586802410099885e-06, - "loss": 0.7012, - "step": 22959 - }, - { - "epoch": 0.59, - "learning_rate": 1.8586660592498693e-06, - "loss": 0.8613, - "step": 22960 - }, - { - "epoch": 0.59, - "learning_rate": 1.858651876832309e-06, - "loss": 0.894, - "step": 22961 - }, - { - "epoch": 0.59, - "learning_rate": 1.8586376937573185e-06, - "loss": 0.8916, - "step": 22962 - }, - { - "epoch": 0.59, - "learning_rate": 1.8586235100249085e-06, - "loss": 0.7871, - "step": 22963 - }, - { - "epoch": 0.59, - "learning_rate": 1.8586093256350904e-06, - "loss": 0.9893, - "step": 22964 - }, - { - "epoch": 0.59, - "learning_rate": 1.8585951405878744e-06, - "loss": 0.8779, - "step": 22965 - }, - { - "epoch": 0.59, - "learning_rate": 1.8585809548832714e-06, - "loss": 0.7402, - "step": 22966 - }, - { - "epoch": 0.59, - "learning_rate": 1.8585667685212925e-06, - "loss": 0.9766, - "step": 22967 - }, - { - "epoch": 0.59, - "learning_rate": 1.8585525815019483e-06, - "loss": 0.8018, - "step": 22968 - }, - { - "epoch": 0.59, - "learning_rate": 1.8585383938252503e-06, - "loss": 0.7178, - "step": 22969 - }, - { - "epoch": 0.59, - "learning_rate": 1.8585242054912087e-06, - "loss": 0.8291, - "step": 22970 - }, - { - "epoch": 0.59, - "learning_rate": 1.8585100164998346e-06, - "loss": 0.8535, - "step": 22971 - }, - { - "epoch": 0.59, - "learning_rate": 1.858495826851139e-06, - "loss": 0.8496, - "step": 22972 - }, - { - "epoch": 0.59, - "learning_rate": 1.8584816365451324e-06, - "loss": 0.9258, - "step": 22973 - }, - { - "epoch": 0.59, - "learning_rate": 1.858467445581826e-06, - "loss": 0.7476, - "step": 22974 - }, - { - "epoch": 0.59, - "learning_rate": 1.8584532539612306e-06, - "loss": 0.9229, - "step": 22975 - }, - { - "epoch": 0.59, - "learning_rate": 1.8584390616833567e-06, - "loss": 0.9014, - "step": 22976 - }, - { - "epoch": 0.59, - "learning_rate": 1.8584248687482158e-06, - "loss": 0.7639, - "step": 22977 - }, - { - "epoch": 0.59, - "learning_rate": 1.8584106751558184e-06, - "loss": 0.6694, - "step": 22978 - }, - { - "epoch": 0.59, - "learning_rate": 1.8583964809061751e-06, - "loss": 0.8643, - "step": 22979 - }, - { - "epoch": 0.59, - "learning_rate": 1.8583822859992976e-06, - "loss": 0.8535, - "step": 22980 - }, - { - "epoch": 0.59, - "learning_rate": 1.858368090435196e-06, - "loss": 0.9668, - "step": 22981 - }, - { - "epoch": 0.59, - "learning_rate": 1.8583538942138812e-06, - "loss": 0.8242, - "step": 22982 - }, - { - "epoch": 0.59, - "learning_rate": 1.8583396973353647e-06, - "loss": 0.7949, - "step": 22983 - }, - { - "epoch": 0.59, - "learning_rate": 1.8583254997996568e-06, - "loss": 0.8008, - "step": 22984 - }, - { - "epoch": 0.59, - "learning_rate": 1.8583113016067683e-06, - "loss": 0.7793, - "step": 22985 - }, - { - "epoch": 0.59, - "learning_rate": 1.8582971027567108e-06, - "loss": 0.6836, - "step": 22986 - }, - { - "epoch": 0.59, - "learning_rate": 1.8582829032494942e-06, - "loss": 0.9541, - "step": 22987 - }, - { - "epoch": 0.59, - "learning_rate": 1.8582687030851303e-06, - "loss": 0.792, - "step": 22988 - }, - { - "epoch": 0.59, - "learning_rate": 1.858254502263629e-06, - "loss": 0.8994, - "step": 22989 - }, - { - "epoch": 0.59, - "learning_rate": 1.858240300785002e-06, - "loss": 0.7129, - "step": 22990 - }, - { - "epoch": 0.59, - "learning_rate": 1.85822609864926e-06, - "loss": 0.7295, - "step": 22991 - }, - { - "epoch": 0.59, - "learning_rate": 1.8582118958564135e-06, - "loss": 0.7666, - "step": 22992 - }, - { - "epoch": 0.59, - "learning_rate": 1.8581976924064737e-06, - "loss": 0.8916, - "step": 22993 - }, - { - "epoch": 0.59, - "learning_rate": 1.8581834882994514e-06, - "loss": 0.8652, - "step": 22994 - }, - { - "epoch": 0.59, - "learning_rate": 1.8581692835353576e-06, - "loss": 0.6829, - "step": 22995 - }, - { - "epoch": 0.59, - "learning_rate": 1.8581550781142026e-06, - "loss": 0.9355, - "step": 22996 - }, - { - "epoch": 0.59, - "learning_rate": 1.8581408720359981e-06, - "loss": 0.7217, - "step": 22997 - }, - { - "epoch": 0.59, - "learning_rate": 1.8581266653007544e-06, - "loss": 0.9395, - "step": 22998 - }, - { - "epoch": 0.59, - "learning_rate": 1.8581124579084827e-06, - "loss": 0.8633, - "step": 22999 - }, - { - "epoch": 0.59, - "learning_rate": 1.8580982498591937e-06, - "loss": 0.813, - "step": 23000 - }, - { - "epoch": 0.59, - "learning_rate": 1.8580840411528982e-06, - "loss": 0.96, - "step": 23001 - }, - { - "epoch": 0.59, - "learning_rate": 1.8580698317896073e-06, - "loss": 1.0879, - "step": 23002 - }, - { - "epoch": 0.59, - "learning_rate": 1.8580556217693318e-06, - "loss": 1.0977, - "step": 23003 - }, - { - "epoch": 0.59, - "learning_rate": 1.8580414110920827e-06, - "loss": 0.8652, - "step": 23004 - }, - { - "epoch": 0.59, - "learning_rate": 1.8580271997578706e-06, - "loss": 1.0967, - "step": 23005 - }, - { - "epoch": 0.59, - "learning_rate": 1.8580129877667065e-06, - "loss": 0.8242, - "step": 23006 - }, - { - "epoch": 0.59, - "learning_rate": 1.8579987751186013e-06, - "loss": 0.8691, - "step": 23007 - }, - { - "epoch": 0.59, - "learning_rate": 1.8579845618135659e-06, - "loss": 0.8906, - "step": 23008 - }, - { - "epoch": 0.59, - "learning_rate": 1.8579703478516113e-06, - "loss": 0.9023, - "step": 23009 - }, - { - "epoch": 0.59, - "learning_rate": 1.857956133232748e-06, - "loss": 1.1748, - "step": 23010 - }, - { - "epoch": 0.59, - "learning_rate": 1.8579419179569875e-06, - "loss": 0.9043, - "step": 23011 - }, - { - "epoch": 0.59, - "learning_rate": 1.85792770202434e-06, - "loss": 0.6423, - "step": 23012 - }, - { - "epoch": 0.59, - "learning_rate": 1.857913485434817e-06, - "loss": 0.8486, - "step": 23013 - }, - { - "epoch": 0.59, - "learning_rate": 1.857899268188429e-06, - "loss": 0.678, - "step": 23014 - }, - { - "epoch": 0.59, - "learning_rate": 1.857885050285187e-06, - "loss": 0.7349, - "step": 23015 - }, - { - "epoch": 0.59, - "learning_rate": 1.8578708317251015e-06, - "loss": 0.8887, - "step": 23016 - }, - { - "epoch": 0.59, - "learning_rate": 1.857856612508184e-06, - "loss": 0.8789, - "step": 23017 - }, - { - "epoch": 0.59, - "learning_rate": 1.8578423926344451e-06, - "loss": 0.7686, - "step": 23018 - }, - { - "epoch": 0.59, - "learning_rate": 1.857828172103896e-06, - "loss": 0.793, - "step": 23019 - }, - { - "epoch": 0.59, - "learning_rate": 1.8578139509165468e-06, - "loss": 0.5762, - "step": 23020 - }, - { - "epoch": 0.59, - "learning_rate": 1.8577997290724095e-06, - "loss": 0.8809, - "step": 23021 - }, - { - "epoch": 0.59, - "learning_rate": 1.8577855065714937e-06, - "loss": 1.0342, - "step": 23022 - }, - { - "epoch": 0.59, - "learning_rate": 1.8577712834138115e-06, - "loss": 0.8511, - "step": 23023 - }, - { - "epoch": 0.59, - "learning_rate": 1.8577570595993732e-06, - "loss": 0.9678, - "step": 23024 - }, - { - "epoch": 0.59, - "learning_rate": 1.8577428351281896e-06, - "loss": 0.8887, - "step": 23025 - }, - { - "epoch": 0.59, - "learning_rate": 1.857728610000272e-06, - "loss": 0.6992, - "step": 23026 - }, - { - "epoch": 0.59, - "learning_rate": 1.857714384215631e-06, - "loss": 0.8086, - "step": 23027 - }, - { - "epoch": 0.59, - "learning_rate": 1.8577001577742773e-06, - "loss": 0.9541, - "step": 23028 - }, - { - "epoch": 0.59, - "learning_rate": 1.8576859306762222e-06, - "loss": 0.665, - "step": 23029 - }, - { - "epoch": 0.59, - "learning_rate": 1.8576717029214764e-06, - "loss": 0.7759, - "step": 23030 - }, - { - "epoch": 0.59, - "learning_rate": 1.8576574745100508e-06, - "loss": 0.9531, - "step": 23031 - }, - { - "epoch": 0.59, - "learning_rate": 1.8576432454419562e-06, - "loss": 0.6509, - "step": 23032 - }, - { - "epoch": 0.59, - "learning_rate": 1.8576290157172037e-06, - "loss": 0.9521, - "step": 23033 - }, - { - "epoch": 0.59, - "learning_rate": 1.8576147853358043e-06, - "loss": 0.7515, - "step": 23034 - }, - { - "epoch": 0.59, - "learning_rate": 1.8576005542977682e-06, - "loss": 0.9961, - "step": 23035 - }, - { - "epoch": 0.59, - "learning_rate": 1.8575863226031073e-06, - "loss": 0.7007, - "step": 23036 - }, - { - "epoch": 0.59, - "learning_rate": 1.8575720902518316e-06, - "loss": 1.0703, - "step": 23037 - }, - { - "epoch": 0.59, - "learning_rate": 1.8575578572439526e-06, - "loss": 1.2432, - "step": 23038 - }, - { - "epoch": 0.59, - "learning_rate": 1.857543623579481e-06, - "loss": 1.0059, - "step": 23039 - }, - { - "epoch": 0.59, - "learning_rate": 1.8575293892584276e-06, - "loss": 0.8926, - "step": 23040 - }, - { - "epoch": 0.59, - "learning_rate": 1.8575151542808034e-06, - "loss": 0.9443, - "step": 23041 - }, - { - "epoch": 0.59, - "learning_rate": 1.857500918646619e-06, - "loss": 0.6099, - "step": 23042 - }, - { - "epoch": 0.59, - "learning_rate": 1.8574866823558862e-06, - "loss": 0.9404, - "step": 23043 - }, - { - "epoch": 0.59, - "learning_rate": 1.8574724454086147e-06, - "loss": 0.7817, - "step": 23044 - }, - { - "epoch": 0.59, - "learning_rate": 1.8574582078048163e-06, - "loss": 0.7617, - "step": 23045 - }, - { - "epoch": 0.59, - "learning_rate": 1.8574439695445015e-06, - "loss": 0.8174, - "step": 23046 - }, - { - "epoch": 0.59, - "learning_rate": 1.8574297306276811e-06, - "loss": 0.7275, - "step": 23047 - }, - { - "epoch": 0.59, - "learning_rate": 1.8574154910543661e-06, - "loss": 1.0068, - "step": 23048 - }, - { - "epoch": 0.59, - "learning_rate": 1.857401250824568e-06, - "loss": 0.8057, - "step": 23049 - }, - { - "epoch": 0.59, - "learning_rate": 1.857387009938297e-06, - "loss": 0.9258, - "step": 23050 - }, - { - "epoch": 0.59, - "learning_rate": 1.8573727683955639e-06, - "loss": 0.9658, - "step": 23051 - }, - { - "epoch": 0.59, - "learning_rate": 1.85735852619638e-06, - "loss": 0.7979, - "step": 23052 - }, - { - "epoch": 0.59, - "learning_rate": 1.8573442833407563e-06, - "loss": 0.918, - "step": 23053 - }, - { - "epoch": 0.59, - "learning_rate": 1.8573300398287032e-06, - "loss": 0.7559, - "step": 23054 - }, - { - "epoch": 0.59, - "learning_rate": 1.8573157956602321e-06, - "loss": 0.8623, - "step": 23055 - }, - { - "epoch": 0.59, - "learning_rate": 1.8573015508353537e-06, - "loss": 0.7109, - "step": 23056 - }, - { - "epoch": 0.59, - "learning_rate": 1.857287305354079e-06, - "loss": 0.793, - "step": 23057 - }, - { - "epoch": 0.59, - "learning_rate": 1.8572730592164188e-06, - "loss": 0.8984, - "step": 23058 - }, - { - "epoch": 0.59, - "learning_rate": 1.8572588124223839e-06, - "loss": 0.8975, - "step": 23059 - }, - { - "epoch": 0.59, - "learning_rate": 1.8572445649719854e-06, - "loss": 0.9424, - "step": 23060 - }, - { - "epoch": 0.59, - "learning_rate": 1.8572303168652343e-06, - "loss": 0.8267, - "step": 23061 - }, - { - "epoch": 0.59, - "learning_rate": 1.8572160681021412e-06, - "loss": 0.8652, - "step": 23062 - }, - { - "epoch": 0.59, - "learning_rate": 1.8572018186827172e-06, - "loss": 0.8652, - "step": 23063 - }, - { - "epoch": 0.59, - "learning_rate": 1.8571875686069732e-06, - "loss": 0.9932, - "step": 23064 - }, - { - "epoch": 0.59, - "learning_rate": 1.85717331787492e-06, - "loss": 0.8467, - "step": 23065 - }, - { - "epoch": 0.59, - "learning_rate": 1.857159066486569e-06, - "loss": 0.8999, - "step": 23066 - }, - { - "epoch": 0.59, - "learning_rate": 1.8571448144419302e-06, - "loss": 0.8711, - "step": 23067 - }, - { - "epoch": 0.59, - "learning_rate": 1.8571305617410153e-06, - "loss": 0.9326, - "step": 23068 - }, - { - "epoch": 0.59, - "learning_rate": 1.8571163083838347e-06, - "loss": 0.715, - "step": 23069 - }, - { - "epoch": 0.59, - "learning_rate": 1.8571020543704e-06, - "loss": 0.9277, - "step": 23070 - }, - { - "epoch": 0.59, - "learning_rate": 1.8570877997007212e-06, - "loss": 0.7886, - "step": 23071 - }, - { - "epoch": 0.59, - "learning_rate": 1.85707354437481e-06, - "loss": 0.6389, - "step": 23072 - }, - { - "epoch": 0.59, - "learning_rate": 1.8570592883926767e-06, - "loss": 0.9883, - "step": 23073 - }, - { - "epoch": 0.59, - "learning_rate": 1.857045031754333e-06, - "loss": 0.9473, - "step": 23074 - }, - { - "epoch": 0.59, - "learning_rate": 1.857030774459789e-06, - "loss": 0.8418, - "step": 23075 - }, - { - "epoch": 0.59, - "learning_rate": 1.857016516509056e-06, - "loss": 1.1289, - "step": 23076 - }, - { - "epoch": 0.59, - "learning_rate": 1.8570022579021447e-06, - "loss": 0.894, - "step": 23077 - }, - { - "epoch": 0.59, - "learning_rate": 1.8569879986390663e-06, - "loss": 1.0049, - "step": 23078 - }, - { - "epoch": 0.59, - "learning_rate": 1.8569737387198317e-06, - "loss": 0.9434, - "step": 23079 - }, - { - "epoch": 0.59, - "learning_rate": 1.8569594781444514e-06, - "loss": 0.8506, - "step": 23080 - }, - { - "epoch": 0.59, - "learning_rate": 1.8569452169129368e-06, - "loss": 0.9941, - "step": 23081 - }, - { - "epoch": 0.59, - "learning_rate": 1.8569309550252989e-06, - "loss": 0.7163, - "step": 23082 - }, - { - "epoch": 0.59, - "learning_rate": 1.8569166924815481e-06, - "loss": 0.8701, - "step": 23083 - }, - { - "epoch": 0.59, - "learning_rate": 1.8569024292816956e-06, - "loss": 0.8413, - "step": 23084 - }, - { - "epoch": 0.59, - "learning_rate": 1.8568881654257528e-06, - "loss": 0.7661, - "step": 23085 - }, - { - "epoch": 0.59, - "learning_rate": 1.8568739009137295e-06, - "loss": 0.8481, - "step": 23086 - }, - { - "epoch": 0.59, - "learning_rate": 1.8568596357456374e-06, - "loss": 0.8213, - "step": 23087 - }, - { - "epoch": 0.59, - "learning_rate": 1.8568453699214875e-06, - "loss": 0.6665, - "step": 23088 - }, - { - "epoch": 0.59, - "learning_rate": 1.8568311034412902e-06, - "loss": 0.6992, - "step": 23089 - }, - { - "epoch": 0.59, - "learning_rate": 1.8568168363050568e-06, - "loss": 0.7656, - "step": 23090 - }, - { - "epoch": 0.59, - "learning_rate": 1.8568025685127981e-06, - "loss": 0.9453, - "step": 23091 - }, - { - "epoch": 0.59, - "learning_rate": 1.8567883000645253e-06, - "loss": 0.9219, - "step": 23092 - }, - { - "epoch": 0.59, - "learning_rate": 1.8567740309602488e-06, - "loss": 0.7979, - "step": 23093 - }, - { - "epoch": 0.59, - "learning_rate": 1.85675976119998e-06, - "loss": 0.7798, - "step": 23094 - }, - { - "epoch": 0.59, - "learning_rate": 1.8567454907837297e-06, - "loss": 0.8994, - "step": 23095 - }, - { - "epoch": 0.59, - "learning_rate": 1.8567312197115087e-06, - "loss": 0.8389, - "step": 23096 - }, - { - "epoch": 0.59, - "learning_rate": 1.856716947983328e-06, - "loss": 0.5874, - "step": 23097 - }, - { - "epoch": 0.59, - "learning_rate": 1.8567026755991985e-06, - "loss": 0.8838, - "step": 23098 - }, - { - "epoch": 0.59, - "learning_rate": 1.8566884025591313e-06, - "loss": 0.9561, - "step": 23099 - }, - { - "epoch": 0.59, - "learning_rate": 1.8566741288631369e-06, - "loss": 0.6821, - "step": 23100 - }, - { - "epoch": 0.59, - "learning_rate": 1.8566598545112267e-06, - "loss": 0.9609, - "step": 23101 - }, - { - "epoch": 0.59, - "learning_rate": 1.8566455795034116e-06, - "loss": 1.0264, - "step": 23102 - }, - { - "epoch": 0.59, - "learning_rate": 1.8566313038397022e-06, - "loss": 0.7949, - "step": 23103 - }, - { - "epoch": 0.59, - "learning_rate": 1.8566170275201093e-06, - "loss": 0.7998, - "step": 23104 - }, - { - "epoch": 0.59, - "learning_rate": 1.8566027505446447e-06, - "loss": 0.7583, - "step": 23105 - }, - { - "epoch": 0.59, - "learning_rate": 1.8565884729133184e-06, - "loss": 0.9658, - "step": 23106 - }, - { - "epoch": 0.59, - "learning_rate": 1.8565741946261417e-06, - "loss": 0.7227, - "step": 23107 - }, - { - "epoch": 0.59, - "learning_rate": 1.8565599156831256e-06, - "loss": 0.7998, - "step": 23108 - }, - { - "epoch": 0.59, - "learning_rate": 1.856545636084281e-06, - "loss": 0.8828, - "step": 23109 - }, - { - "epoch": 0.59, - "learning_rate": 1.8565313558296186e-06, - "loss": 0.8848, - "step": 23110 - }, - { - "epoch": 0.59, - "learning_rate": 1.8565170749191496e-06, - "loss": 0.6885, - "step": 23111 - }, - { - "epoch": 0.59, - "learning_rate": 1.8565027933528852e-06, - "loss": 0.5383, - "step": 23112 - }, - { - "epoch": 0.59, - "learning_rate": 1.8564885111308357e-06, - "loss": 0.9863, - "step": 23113 - }, - { - "epoch": 0.59, - "learning_rate": 1.8564742282530124e-06, - "loss": 1.1865, - "step": 23114 - }, - { - "epoch": 0.59, - "learning_rate": 1.856459944719426e-06, - "loss": 1.0459, - "step": 23115 - }, - { - "epoch": 0.59, - "learning_rate": 1.8564456605300878e-06, - "loss": 0.9473, - "step": 23116 - }, - { - "epoch": 0.59, - "learning_rate": 1.8564313756850086e-06, - "loss": 0.7998, - "step": 23117 - }, - { - "epoch": 0.59, - "learning_rate": 1.8564170901841988e-06, - "loss": 0.8154, - "step": 23118 - }, - { - "epoch": 0.59, - "learning_rate": 1.8564028040276702e-06, - "loss": 1.2607, - "step": 23119 - }, - { - "epoch": 0.59, - "learning_rate": 1.8563885172154334e-06, - "loss": 0.9258, - "step": 23120 - }, - { - "epoch": 0.59, - "learning_rate": 1.856374229747499e-06, - "loss": 0.918, - "step": 23121 - }, - { - "epoch": 0.59, - "learning_rate": 1.8563599416238787e-06, - "loss": 0.7744, - "step": 23122 - }, - { - "epoch": 0.59, - "learning_rate": 1.8563456528445824e-06, - "loss": 0.8906, - "step": 23123 - }, - { - "epoch": 0.59, - "learning_rate": 1.856331363409622e-06, - "loss": 0.8066, - "step": 23124 - }, - { - "epoch": 0.59, - "learning_rate": 1.856317073319008e-06, - "loss": 0.9473, - "step": 23125 - }, - { - "epoch": 0.59, - "learning_rate": 1.8563027825727512e-06, - "loss": 0.8398, - "step": 23126 - }, - { - "epoch": 0.59, - "learning_rate": 1.856288491170863e-06, - "loss": 0.8281, - "step": 23127 - }, - { - "epoch": 0.59, - "learning_rate": 1.856274199113354e-06, - "loss": 1.0381, - "step": 23128 - }, - { - "epoch": 0.59, - "learning_rate": 1.856259906400235e-06, - "loss": 0.7236, - "step": 23129 - }, - { - "epoch": 0.59, - "learning_rate": 1.8562456130315173e-06, - "loss": 0.8105, - "step": 23130 - }, - { - "epoch": 0.59, - "learning_rate": 1.8562313190072118e-06, - "loss": 1.0234, - "step": 23131 - }, - { - "epoch": 0.59, - "learning_rate": 1.8562170243273294e-06, - "loss": 0.8135, - "step": 23132 - }, - { - "epoch": 0.59, - "learning_rate": 1.8562027289918807e-06, - "loss": 0.7744, - "step": 23133 - }, - { - "epoch": 0.59, - "learning_rate": 1.8561884330008773e-06, - "loss": 0.9785, - "step": 23134 - }, - { - "epoch": 0.59, - "learning_rate": 1.8561741363543294e-06, - "loss": 0.9375, - "step": 23135 - }, - { - "epoch": 0.59, - "learning_rate": 1.8561598390522486e-06, - "loss": 0.6208, - "step": 23136 - }, - { - "epoch": 0.59, - "learning_rate": 1.8561455410946456e-06, - "loss": 0.7256, - "step": 23137 - }, - { - "epoch": 0.59, - "learning_rate": 1.8561312424815312e-06, - "loss": 0.959, - "step": 23138 - }, - { - "epoch": 0.59, - "learning_rate": 1.8561169432129164e-06, - "loss": 1.0479, - "step": 23139 - }, - { - "epoch": 0.59, - "learning_rate": 1.8561026432888123e-06, - "loss": 0.9805, - "step": 23140 - }, - { - "epoch": 0.59, - "learning_rate": 1.85608834270923e-06, - "loss": 0.8955, - "step": 23141 - }, - { - "epoch": 0.59, - "learning_rate": 1.85607404147418e-06, - "loss": 0.8145, - "step": 23142 - }, - { - "epoch": 0.59, - "learning_rate": 1.8560597395836735e-06, - "loss": 0.7808, - "step": 23143 - }, - { - "epoch": 0.59, - "learning_rate": 1.8560454370377214e-06, - "loss": 0.874, - "step": 23144 - }, - { - "epoch": 0.59, - "learning_rate": 1.8560311338363346e-06, - "loss": 0.8457, - "step": 23145 - }, - { - "epoch": 0.59, - "learning_rate": 1.856016829979524e-06, - "loss": 0.8643, - "step": 23146 - }, - { - "epoch": 0.59, - "learning_rate": 1.8560025254673011e-06, - "loss": 0.9355, - "step": 23147 - }, - { - "epoch": 0.59, - "learning_rate": 1.8559882202996762e-06, - "loss": 1.1523, - "step": 23148 - }, - { - "epoch": 0.59, - "learning_rate": 1.8559739144766605e-06, - "loss": 0.7578, - "step": 23149 - }, - { - "epoch": 0.59, - "learning_rate": 1.855959607998265e-06, - "loss": 0.7773, - "step": 23150 - }, - { - "epoch": 0.59, - "learning_rate": 1.8559453008645006e-06, - "loss": 0.9155, - "step": 23151 - }, - { - "epoch": 0.59, - "learning_rate": 1.8559309930753779e-06, - "loss": 0.7031, - "step": 23152 - }, - { - "epoch": 0.59, - "learning_rate": 1.8559166846309085e-06, - "loss": 0.9912, - "step": 23153 - }, - { - "epoch": 0.59, - "learning_rate": 1.855902375531103e-06, - "loss": 0.66, - "step": 23154 - }, - { - "epoch": 0.59, - "learning_rate": 1.8558880657759723e-06, - "loss": 0.9893, - "step": 23155 - }, - { - "epoch": 0.59, - "learning_rate": 1.8558737553655276e-06, - "loss": 0.9629, - "step": 23156 - }, - { - "epoch": 0.59, - "learning_rate": 1.8558594442997797e-06, - "loss": 0.9033, - "step": 23157 - }, - { - "epoch": 0.59, - "learning_rate": 1.8558451325787394e-06, - "loss": 0.7891, - "step": 23158 - }, - { - "epoch": 0.59, - "learning_rate": 1.855830820202418e-06, - "loss": 0.8359, - "step": 23159 - }, - { - "epoch": 0.59, - "learning_rate": 1.8558165071708266e-06, - "loss": 1.0215, - "step": 23160 - }, - { - "epoch": 0.59, - "learning_rate": 1.8558021934839752e-06, - "loss": 0.9663, - "step": 23161 - }, - { - "epoch": 0.59, - "learning_rate": 1.855787879141876e-06, - "loss": 0.7061, - "step": 23162 - }, - { - "epoch": 0.59, - "learning_rate": 1.855773564144539e-06, - "loss": 0.8564, - "step": 23163 - }, - { - "epoch": 0.59, - "learning_rate": 1.8557592484919756e-06, - "loss": 0.8018, - "step": 23164 - }, - { - "epoch": 0.59, - "learning_rate": 1.8557449321841969e-06, - "loss": 0.8418, - "step": 23165 - }, - { - "epoch": 0.59, - "learning_rate": 1.8557306152212133e-06, - "loss": 0.8184, - "step": 23166 - }, - { - "epoch": 0.59, - "learning_rate": 1.8557162976030364e-06, - "loss": 0.8398, - "step": 23167 - }, - { - "epoch": 0.59, - "learning_rate": 1.8557019793296766e-06, - "loss": 0.9814, - "step": 23168 - }, - { - "epoch": 0.59, - "learning_rate": 1.8556876604011453e-06, - "loss": 0.7549, - "step": 23169 - }, - { - "epoch": 0.59, - "learning_rate": 1.8556733408174536e-06, - "loss": 0.9375, - "step": 23170 - }, - { - "epoch": 0.59, - "learning_rate": 1.8556590205786119e-06, - "loss": 0.4932, - "step": 23171 - }, - { - "epoch": 0.59, - "learning_rate": 1.8556446996846314e-06, - "loss": 0.9346, - "step": 23172 - }, - { - "epoch": 0.59, - "learning_rate": 1.8556303781355229e-06, - "loss": 0.833, - "step": 23173 - }, - { - "epoch": 0.59, - "learning_rate": 1.855616055931298e-06, - "loss": 0.8438, - "step": 23174 - }, - { - "epoch": 0.59, - "learning_rate": 1.855601733071967e-06, - "loss": 0.8896, - "step": 23175 - }, - { - "epoch": 0.59, - "learning_rate": 1.855587409557541e-06, - "loss": 1.0762, - "step": 23176 - }, - { - "epoch": 0.59, - "learning_rate": 1.8555730853880315e-06, - "loss": 0.6772, - "step": 23177 - }, - { - "epoch": 0.59, - "learning_rate": 1.8555587605634484e-06, - "loss": 0.7373, - "step": 23178 - }, - { - "epoch": 0.59, - "learning_rate": 1.8555444350838037e-06, - "loss": 1.1572, - "step": 23179 - }, - { - "epoch": 0.59, - "learning_rate": 1.8555301089491078e-06, - "loss": 0.9346, - "step": 23180 - }, - { - "epoch": 0.59, - "learning_rate": 1.855515782159372e-06, - "loss": 0.7852, - "step": 23181 - }, - { - "epoch": 0.59, - "learning_rate": 1.855501454714607e-06, - "loss": 0.8579, - "step": 23182 - }, - { - "epoch": 0.59, - "learning_rate": 1.8554871266148237e-06, - "loss": 0.8818, - "step": 23183 - }, - { - "epoch": 0.59, - "learning_rate": 1.8554727978600336e-06, - "loss": 0.9658, - "step": 23184 - }, - { - "epoch": 0.59, - "learning_rate": 1.8554584684502471e-06, - "loss": 0.7983, - "step": 23185 - }, - { - "epoch": 0.59, - "learning_rate": 1.8554441383854752e-06, - "loss": 1.1074, - "step": 23186 - }, - { - "epoch": 0.59, - "learning_rate": 1.8554298076657292e-06, - "loss": 0.853, - "step": 23187 - }, - { - "epoch": 0.59, - "learning_rate": 1.85541547629102e-06, - "loss": 0.8259, - "step": 23188 - }, - { - "epoch": 0.59, - "learning_rate": 1.8554011442613588e-06, - "loss": 0.9893, - "step": 23189 - }, - { - "epoch": 0.59, - "learning_rate": 1.855386811576756e-06, - "loss": 0.8174, - "step": 23190 - }, - { - "epoch": 0.59, - "learning_rate": 1.8553724782372225e-06, - "loss": 0.8818, - "step": 23191 - }, - { - "epoch": 0.59, - "learning_rate": 1.8553581442427703e-06, - "loss": 0.8916, - "step": 23192 - }, - { - "epoch": 0.59, - "learning_rate": 1.8553438095934093e-06, - "loss": 0.7759, - "step": 23193 - }, - { - "epoch": 0.59, - "learning_rate": 1.8553294742891508e-06, - "loss": 0.8652, - "step": 23194 - }, - { - "epoch": 0.59, - "learning_rate": 1.855315138330006e-06, - "loss": 0.9863, - "step": 23195 - }, - { - "epoch": 0.59, - "learning_rate": 1.8553008017159856e-06, - "loss": 0.7568, - "step": 23196 - }, - { - "epoch": 0.59, - "learning_rate": 1.8552864644471011e-06, - "loss": 0.9209, - "step": 23197 - }, - { - "epoch": 0.59, - "learning_rate": 1.8552721265233625e-06, - "loss": 0.8711, - "step": 23198 - }, - { - "epoch": 0.59, - "learning_rate": 1.855257787944782e-06, - "loss": 0.8574, - "step": 23199 - }, - { - "epoch": 0.59, - "learning_rate": 1.8552434487113695e-06, - "loss": 0.8877, - "step": 23200 - }, - { - "epoch": 0.59, - "learning_rate": 1.8552291088231366e-06, - "loss": 0.8135, - "step": 23201 - }, - { - "epoch": 0.59, - "learning_rate": 1.8552147682800937e-06, - "loss": 0.8062, - "step": 23202 - }, - { - "epoch": 0.59, - "learning_rate": 1.8552004270822528e-06, - "loss": 0.8691, - "step": 23203 - }, - { - "epoch": 0.59, - "learning_rate": 1.855186085229624e-06, - "loss": 0.8389, - "step": 23204 - }, - { - "epoch": 0.59, - "learning_rate": 1.8551717427222182e-06, - "loss": 0.9521, - "step": 23205 - }, - { - "epoch": 0.59, - "learning_rate": 1.855157399560047e-06, - "loss": 1.0137, - "step": 23206 - }, - { - "epoch": 0.59, - "learning_rate": 1.8551430557431211e-06, - "loss": 0.7124, - "step": 23207 - }, - { - "epoch": 0.59, - "learning_rate": 1.8551287112714515e-06, - "loss": 0.9492, - "step": 23208 - }, - { - "epoch": 0.59, - "learning_rate": 1.8551143661450492e-06, - "loss": 0.7354, - "step": 23209 - }, - { - "epoch": 0.59, - "learning_rate": 1.855100020363925e-06, - "loss": 1.0186, - "step": 23210 - }, - { - "epoch": 0.59, - "learning_rate": 1.8550856739280902e-06, - "loss": 0.7451, - "step": 23211 - }, - { - "epoch": 0.59, - "learning_rate": 1.8550713268375557e-06, - "loss": 1.0879, - "step": 23212 - }, - { - "epoch": 0.59, - "learning_rate": 1.8550569790923322e-06, - "loss": 0.8027, - "step": 23213 - }, - { - "epoch": 0.59, - "learning_rate": 1.8550426306924307e-06, - "loss": 0.7617, - "step": 23214 - }, - { - "epoch": 0.6, - "learning_rate": 1.8550282816378626e-06, - "loss": 0.8369, - "step": 23215 - }, - { - "epoch": 0.6, - "learning_rate": 1.855013931928639e-06, - "loss": 1.041, - "step": 23216 - }, - { - "epoch": 0.6, - "learning_rate": 1.8549995815647701e-06, - "loss": 0.8066, - "step": 23217 - }, - { - "epoch": 0.6, - "learning_rate": 1.8549852305462675e-06, - "loss": 0.9189, - "step": 23218 - }, - { - "epoch": 0.6, - "learning_rate": 1.854970878873142e-06, - "loss": 0.6304, - "step": 23219 - }, - { - "epoch": 0.6, - "learning_rate": 1.8549565265454046e-06, - "loss": 0.8975, - "step": 23220 - }, - { - "epoch": 0.6, - "learning_rate": 1.8549421735630662e-06, - "loss": 0.9736, - "step": 23221 - }, - { - "epoch": 0.6, - "learning_rate": 1.854927819926138e-06, - "loss": 0.9043, - "step": 23222 - }, - { - "epoch": 0.6, - "learning_rate": 1.8549134656346306e-06, - "loss": 0.9951, - "step": 23223 - }, - { - "epoch": 0.6, - "learning_rate": 1.8548991106885556e-06, - "loss": 0.8994, - "step": 23224 - }, - { - "epoch": 0.6, - "learning_rate": 1.8548847550879236e-06, - "loss": 0.9551, - "step": 23225 - }, - { - "epoch": 0.6, - "learning_rate": 1.8548703988327456e-06, - "loss": 0.8584, - "step": 23226 - }, - { - "epoch": 0.6, - "learning_rate": 1.8548560419230329e-06, - "loss": 0.8906, - "step": 23227 - }, - { - "epoch": 0.6, - "learning_rate": 1.8548416843587958e-06, - "loss": 0.9551, - "step": 23228 - }, - { - "epoch": 0.6, - "learning_rate": 1.854827326140046e-06, - "loss": 0.812, - "step": 23229 - }, - { - "epoch": 0.6, - "learning_rate": 1.8548129672667941e-06, - "loss": 0.8975, - "step": 23230 - }, - { - "epoch": 0.6, - "learning_rate": 1.8547986077390512e-06, - "loss": 1.0205, - "step": 23231 - }, - { - "epoch": 0.6, - "learning_rate": 1.8547842475568286e-06, - "loss": 0.9648, - "step": 23232 - }, - { - "epoch": 0.6, - "learning_rate": 1.8547698867201367e-06, - "loss": 0.8311, - "step": 23233 - }, - { - "epoch": 0.6, - "learning_rate": 1.8547555252289868e-06, - "loss": 0.9424, - "step": 23234 - }, - { - "epoch": 0.6, - "learning_rate": 1.8547411630833901e-06, - "loss": 1.0771, - "step": 23235 - }, - { - "epoch": 0.6, - "learning_rate": 1.8547268002833571e-06, - "loss": 0.9619, - "step": 23236 - }, - { - "epoch": 0.6, - "learning_rate": 1.8547124368288993e-06, - "loss": 0.8779, - "step": 23237 - }, - { - "epoch": 0.6, - "learning_rate": 1.8546980727200276e-06, - "loss": 0.9297, - "step": 23238 - }, - { - "epoch": 0.6, - "learning_rate": 1.8546837079567528e-06, - "loss": 0.5815, - "step": 23239 - }, - { - "epoch": 0.6, - "learning_rate": 1.8546693425390858e-06, - "loss": 0.9131, - "step": 23240 - }, - { - "epoch": 0.6, - "learning_rate": 1.8546549764670378e-06, - "loss": 0.8838, - "step": 23241 - }, - { - "epoch": 0.6, - "learning_rate": 1.85464060974062e-06, - "loss": 0.791, - "step": 23242 - }, - { - "epoch": 0.6, - "learning_rate": 1.8546262423598432e-06, - "loss": 0.8711, - "step": 23243 - }, - { - "epoch": 0.6, - "learning_rate": 1.8546118743247182e-06, - "loss": 1.0332, - "step": 23244 - }, - { - "epoch": 0.6, - "learning_rate": 1.8545975056352562e-06, - "loss": 0.7803, - "step": 23245 - }, - { - "epoch": 0.6, - "learning_rate": 1.854583136291468e-06, - "loss": 0.8018, - "step": 23246 - }, - { - "epoch": 0.6, - "learning_rate": 1.8545687662933654e-06, - "loss": 0.7939, - "step": 23247 - }, - { - "epoch": 0.6, - "learning_rate": 1.8545543956409584e-06, - "loss": 0.9131, - "step": 23248 - }, - { - "epoch": 0.6, - "learning_rate": 1.8545400243342582e-06, - "loss": 0.9512, - "step": 23249 - }, - { - "epoch": 0.6, - "learning_rate": 1.8545256523732765e-06, - "loss": 0.9932, - "step": 23250 - }, - { - "epoch": 0.6, - "learning_rate": 1.8545112797580233e-06, - "loss": 0.8008, - "step": 23251 - }, - { - "epoch": 0.6, - "learning_rate": 1.8544969064885104e-06, - "loss": 0.8203, - "step": 23252 - }, - { - "epoch": 0.6, - "learning_rate": 1.8544825325647481e-06, - "loss": 0.9092, - "step": 23253 - }, - { - "epoch": 0.6, - "learning_rate": 1.8544681579867483e-06, - "loss": 0.7158, - "step": 23254 - }, - { - "epoch": 0.6, - "learning_rate": 1.8544537827545215e-06, - "loss": 0.8984, - "step": 23255 - }, - { - "epoch": 0.6, - "learning_rate": 1.8544394068680785e-06, - "loss": 0.7705, - "step": 23256 - }, - { - "epoch": 0.6, - "learning_rate": 1.8544250303274307e-06, - "loss": 0.9531, - "step": 23257 - }, - { - "epoch": 0.6, - "learning_rate": 1.8544106531325888e-06, - "loss": 0.7969, - "step": 23258 - }, - { - "epoch": 0.6, - "learning_rate": 1.8543962752835639e-06, - "loss": 0.9648, - "step": 23259 - }, - { - "epoch": 0.6, - "learning_rate": 1.8543818967803672e-06, - "loss": 0.9795, - "step": 23260 - }, - { - "epoch": 0.6, - "learning_rate": 1.8543675176230097e-06, - "loss": 0.7715, - "step": 23261 - }, - { - "epoch": 0.6, - "learning_rate": 1.8543531378115017e-06, - "loss": 0.8076, - "step": 23262 - }, - { - "epoch": 0.6, - "learning_rate": 1.8543387573458555e-06, - "loss": 0.7085, - "step": 23263 - }, - { - "epoch": 0.6, - "learning_rate": 1.854324376226081e-06, - "loss": 1.041, - "step": 23264 - }, - { - "epoch": 0.6, - "learning_rate": 1.8543099944521896e-06, - "loss": 0.9854, - "step": 23265 - }, - { - "epoch": 0.6, - "learning_rate": 1.8542956120241927e-06, - "loss": 0.7939, - "step": 23266 - }, - { - "epoch": 0.6, - "learning_rate": 1.8542812289421006e-06, - "loss": 0.7793, - "step": 23267 - }, - { - "epoch": 0.6, - "learning_rate": 1.8542668452059246e-06, - "loss": 1.0225, - "step": 23268 - }, - { - "epoch": 0.6, - "learning_rate": 1.8542524608156757e-06, - "loss": 0.728, - "step": 23269 - }, - { - "epoch": 0.6, - "learning_rate": 1.854238075771365e-06, - "loss": 1.0117, - "step": 23270 - }, - { - "epoch": 0.6, - "learning_rate": 1.8542236900730038e-06, - "loss": 1.0371, - "step": 23271 - }, - { - "epoch": 0.6, - "learning_rate": 1.8542093037206026e-06, - "loss": 0.752, - "step": 23272 - }, - { - "epoch": 0.6, - "learning_rate": 1.8541949167141726e-06, - "loss": 0.7397, - "step": 23273 - }, - { - "epoch": 0.6, - "learning_rate": 1.8541805290537247e-06, - "loss": 0.8872, - "step": 23274 - }, - { - "epoch": 0.6, - "learning_rate": 1.8541661407392704e-06, - "loss": 0.8369, - "step": 23275 - }, - { - "epoch": 0.6, - "learning_rate": 1.85415175177082e-06, - "loss": 1.0049, - "step": 23276 - }, - { - "epoch": 0.6, - "learning_rate": 1.854137362148385e-06, - "loss": 0.7432, - "step": 23277 - }, - { - "epoch": 0.6, - "learning_rate": 1.8541229718719763e-06, - "loss": 0.7822, - "step": 23278 - }, - { - "epoch": 0.6, - "learning_rate": 1.854108580941605e-06, - "loss": 0.9727, - "step": 23279 - }, - { - "epoch": 0.6, - "learning_rate": 1.854094189357282e-06, - "loss": 0.8779, - "step": 23280 - }, - { - "epoch": 0.6, - "learning_rate": 1.8540797971190183e-06, - "loss": 0.9014, - "step": 23281 - }, - { - "epoch": 0.6, - "learning_rate": 1.854065404226825e-06, - "loss": 0.9307, - "step": 23282 - }, - { - "epoch": 0.6, - "learning_rate": 1.8540510106807133e-06, - "loss": 0.9121, - "step": 23283 - }, - { - "epoch": 0.6, - "learning_rate": 1.8540366164806937e-06, - "loss": 0.8701, - "step": 23284 - }, - { - "epoch": 0.6, - "learning_rate": 1.8540222216267775e-06, - "loss": 0.8096, - "step": 23285 - }, - { - "epoch": 0.6, - "learning_rate": 1.854007826118976e-06, - "loss": 0.9971, - "step": 23286 - }, - { - "epoch": 0.6, - "learning_rate": 1.8539934299572998e-06, - "loss": 0.5437, - "step": 23287 - }, - { - "epoch": 0.6, - "learning_rate": 1.85397903314176e-06, - "loss": 0.8906, - "step": 23288 - }, - { - "epoch": 0.6, - "learning_rate": 1.8539646356723679e-06, - "loss": 0.7759, - "step": 23289 - }, - { - "epoch": 0.6, - "learning_rate": 1.8539502375491344e-06, - "loss": 0.8135, - "step": 23290 - }, - { - "epoch": 0.6, - "learning_rate": 1.8539358387720705e-06, - "loss": 0.8467, - "step": 23291 - }, - { - "epoch": 0.6, - "learning_rate": 1.853921439341187e-06, - "loss": 0.8457, - "step": 23292 - }, - { - "epoch": 0.6, - "learning_rate": 1.8539070392564953e-06, - "loss": 0.876, - "step": 23293 - }, - { - "epoch": 0.6, - "learning_rate": 1.853892638518006e-06, - "loss": 0.6216, - "step": 23294 - }, - { - "epoch": 0.6, - "learning_rate": 1.8538782371257305e-06, - "loss": 1.0479, - "step": 23295 - }, - { - "epoch": 0.6, - "learning_rate": 1.85386383507968e-06, - "loss": 0.7129, - "step": 23296 - }, - { - "epoch": 0.6, - "learning_rate": 1.8538494323798645e-06, - "loss": 0.9541, - "step": 23297 - }, - { - "epoch": 0.6, - "learning_rate": 1.8538350290262966e-06, - "loss": 0.8818, - "step": 23298 - }, - { - "epoch": 0.6, - "learning_rate": 1.853820625018986e-06, - "loss": 1.0244, - "step": 23299 - }, - { - "epoch": 0.6, - "learning_rate": 1.8538062203579441e-06, - "loss": 0.7832, - "step": 23300 - }, - { - "epoch": 0.6, - "learning_rate": 1.8537918150431824e-06, - "loss": 0.6724, - "step": 23301 - }, - { - "epoch": 0.6, - "learning_rate": 1.8537774090747113e-06, - "loss": 0.7803, - "step": 23302 - }, - { - "epoch": 0.6, - "learning_rate": 1.8537630024525422e-06, - "loss": 0.8877, - "step": 23303 - }, - { - "epoch": 0.6, - "learning_rate": 1.8537485951766861e-06, - "loss": 0.7773, - "step": 23304 - }, - { - "epoch": 0.6, - "learning_rate": 1.8537341872471538e-06, - "loss": 0.8872, - "step": 23305 - }, - { - "epoch": 0.6, - "learning_rate": 1.8537197786639562e-06, - "loss": 0.7227, - "step": 23306 - }, - { - "epoch": 0.6, - "learning_rate": 1.8537053694271052e-06, - "loss": 0.876, - "step": 23307 - }, - { - "epoch": 0.6, - "learning_rate": 1.8536909595366109e-06, - "loss": 1.0, - "step": 23308 - }, - { - "epoch": 0.6, - "learning_rate": 1.8536765489924848e-06, - "loss": 1.0669, - "step": 23309 - }, - { - "epoch": 0.6, - "learning_rate": 1.8536621377947379e-06, - "loss": 0.7432, - "step": 23310 - }, - { - "epoch": 0.6, - "learning_rate": 1.853647725943381e-06, - "loss": 1.0391, - "step": 23311 - }, - { - "epoch": 0.6, - "learning_rate": 1.8536333134384255e-06, - "loss": 0.9717, - "step": 23312 - }, - { - "epoch": 0.6, - "learning_rate": 1.853618900279882e-06, - "loss": 1.0039, - "step": 23313 - }, - { - "epoch": 0.6, - "learning_rate": 1.8536044864677618e-06, - "loss": 0.686, - "step": 23314 - }, - { - "epoch": 0.6, - "learning_rate": 1.8535900720020758e-06, - "loss": 1.0176, - "step": 23315 - }, - { - "epoch": 0.6, - "learning_rate": 1.8535756568828353e-06, - "loss": 0.834, - "step": 23316 - }, - { - "epoch": 0.6, - "learning_rate": 1.8535612411100514e-06, - "loss": 1.085, - "step": 23317 - }, - { - "epoch": 0.6, - "learning_rate": 1.8535468246837345e-06, - "loss": 0.8408, - "step": 23318 - }, - { - "epoch": 0.6, - "learning_rate": 1.8535324076038962e-06, - "loss": 0.708, - "step": 23319 - }, - { - "epoch": 0.6, - "learning_rate": 1.8535179898705473e-06, - "loss": 0.6953, - "step": 23320 - }, - { - "epoch": 0.6, - "learning_rate": 1.853503571483699e-06, - "loss": 0.875, - "step": 23321 - }, - { - "epoch": 0.6, - "learning_rate": 1.8534891524433624e-06, - "loss": 0.7148, - "step": 23322 - }, - { - "epoch": 0.6, - "learning_rate": 1.853474732749548e-06, - "loss": 0.8135, - "step": 23323 - }, - { - "epoch": 0.6, - "learning_rate": 1.8534603124022675e-06, - "loss": 0.8057, - "step": 23324 - }, - { - "epoch": 0.6, - "learning_rate": 1.8534458914015318e-06, - "loss": 0.9268, - "step": 23325 - }, - { - "epoch": 0.6, - "learning_rate": 1.8534314697473516e-06, - "loss": 1.0596, - "step": 23326 - }, - { - "epoch": 0.6, - "learning_rate": 1.8534170474397384e-06, - "loss": 0.7988, - "step": 23327 - }, - { - "epoch": 0.6, - "learning_rate": 1.853402624478703e-06, - "loss": 0.7837, - "step": 23328 - }, - { - "epoch": 0.6, - "learning_rate": 1.853388200864256e-06, - "loss": 0.9854, - "step": 23329 - }, - { - "epoch": 0.6, - "learning_rate": 1.8533737765964093e-06, - "loss": 0.7456, - "step": 23330 - }, - { - "epoch": 0.6, - "learning_rate": 1.8533593516751735e-06, - "loss": 0.9258, - "step": 23331 - }, - { - "epoch": 0.6, - "learning_rate": 1.8533449261005596e-06, - "loss": 0.6421, - "step": 23332 - }, - { - "epoch": 0.6, - "learning_rate": 1.853330499872579e-06, - "loss": 0.7612, - "step": 23333 - }, - { - "epoch": 0.6, - "learning_rate": 1.853316072991242e-06, - "loss": 0.71, - "step": 23334 - }, - { - "epoch": 0.6, - "learning_rate": 1.8533016454565603e-06, - "loss": 0.9375, - "step": 23335 - }, - { - "epoch": 0.6, - "learning_rate": 1.853287217268545e-06, - "loss": 0.9106, - "step": 23336 - }, - { - "epoch": 0.6, - "learning_rate": 1.8532727884272067e-06, - "loss": 1.0967, - "step": 23337 - }, - { - "epoch": 0.6, - "learning_rate": 1.8532583589325568e-06, - "loss": 0.8394, - "step": 23338 - }, - { - "epoch": 0.6, - "learning_rate": 1.853243928784606e-06, - "loss": 0.8633, - "step": 23339 - }, - { - "epoch": 0.6, - "learning_rate": 1.8532294979833655e-06, - "loss": 1.1152, - "step": 23340 - }, - { - "epoch": 0.6, - "learning_rate": 1.8532150665288466e-06, - "loss": 0.8467, - "step": 23341 - }, - { - "epoch": 0.6, - "learning_rate": 1.8532006344210602e-06, - "loss": 0.9043, - "step": 23342 - }, - { - "epoch": 0.6, - "learning_rate": 1.853186201660017e-06, - "loss": 0.8379, - "step": 23343 - }, - { - "epoch": 0.6, - "learning_rate": 1.8531717682457289e-06, - "loss": 1.0, - "step": 23344 - }, - { - "epoch": 0.6, - "learning_rate": 1.853157334178206e-06, - "loss": 1.0312, - "step": 23345 - }, - { - "epoch": 0.6, - "learning_rate": 1.8531428994574598e-06, - "loss": 0.8926, - "step": 23346 - }, - { - "epoch": 0.6, - "learning_rate": 1.8531284640835014e-06, - "loss": 1.0088, - "step": 23347 - }, - { - "epoch": 0.6, - "learning_rate": 1.8531140280563418e-06, - "loss": 0.998, - "step": 23348 - }, - { - "epoch": 0.6, - "learning_rate": 1.853099591375992e-06, - "loss": 0.7383, - "step": 23349 - }, - { - "epoch": 0.6, - "learning_rate": 1.8530851540424628e-06, - "loss": 0.7139, - "step": 23350 - }, - { - "epoch": 0.6, - "learning_rate": 1.8530707160557659e-06, - "loss": 0.6792, - "step": 23351 - }, - { - "epoch": 0.6, - "learning_rate": 1.8530562774159118e-06, - "loss": 0.7686, - "step": 23352 - }, - { - "epoch": 0.6, - "learning_rate": 1.8530418381229115e-06, - "loss": 0.8291, - "step": 23353 - }, - { - "epoch": 0.6, - "learning_rate": 1.8530273981767768e-06, - "loss": 1.0049, - "step": 23354 - }, - { - "epoch": 0.6, - "learning_rate": 1.8530129575775178e-06, - "loss": 0.6597, - "step": 23355 - }, - { - "epoch": 0.6, - "learning_rate": 1.8529985163251463e-06, - "loss": 0.916, - "step": 23356 - }, - { - "epoch": 0.6, - "learning_rate": 1.8529840744196728e-06, - "loss": 0.8311, - "step": 23357 - }, - { - "epoch": 0.6, - "learning_rate": 1.8529696318611089e-06, - "loss": 0.8887, - "step": 23358 - }, - { - "epoch": 0.6, - "learning_rate": 1.8529551886494652e-06, - "loss": 0.5752, - "step": 23359 - }, - { - "epoch": 0.6, - "learning_rate": 1.852940744784753e-06, - "loss": 0.7783, - "step": 23360 - }, - { - "epoch": 0.6, - "learning_rate": 1.8529263002669833e-06, - "loss": 0.5933, - "step": 23361 - }, - { - "epoch": 0.6, - "learning_rate": 1.8529118550961668e-06, - "loss": 0.8242, - "step": 23362 - }, - { - "epoch": 0.6, - "learning_rate": 1.8528974092723153e-06, - "loss": 0.8438, - "step": 23363 - }, - { - "epoch": 0.6, - "learning_rate": 1.8528829627954394e-06, - "loss": 0.9414, - "step": 23364 - }, - { - "epoch": 0.6, - "learning_rate": 1.8528685156655501e-06, - "loss": 0.7637, - "step": 23365 - }, - { - "epoch": 0.6, - "learning_rate": 1.8528540678826587e-06, - "loss": 0.7324, - "step": 23366 - }, - { - "epoch": 0.6, - "learning_rate": 1.8528396194467763e-06, - "loss": 0.9805, - "step": 23367 - }, - { - "epoch": 0.6, - "learning_rate": 1.8528251703579137e-06, - "loss": 0.9521, - "step": 23368 - }, - { - "epoch": 0.6, - "learning_rate": 1.8528107206160822e-06, - "loss": 0.6919, - "step": 23369 - }, - { - "epoch": 0.6, - "learning_rate": 1.8527962702212925e-06, - "loss": 0.8867, - "step": 23370 - }, - { - "epoch": 0.6, - "learning_rate": 1.8527818191735559e-06, - "loss": 0.8447, - "step": 23371 - }, - { - "epoch": 0.6, - "learning_rate": 1.8527673674728836e-06, - "loss": 0.96, - "step": 23372 - }, - { - "epoch": 0.6, - "learning_rate": 1.8527529151192866e-06, - "loss": 0.8916, - "step": 23373 - }, - { - "epoch": 0.6, - "learning_rate": 1.8527384621127757e-06, - "loss": 0.9619, - "step": 23374 - }, - { - "epoch": 0.6, - "learning_rate": 1.8527240084533622e-06, - "loss": 0.7432, - "step": 23375 - }, - { - "epoch": 0.6, - "learning_rate": 1.8527095541410572e-06, - "loss": 0.9375, - "step": 23376 - }, - { - "epoch": 0.6, - "learning_rate": 1.8526950991758722e-06, - "loss": 0.9141, - "step": 23377 - }, - { - "epoch": 0.6, - "learning_rate": 1.852680643557817e-06, - "loss": 0.8047, - "step": 23378 - }, - { - "epoch": 0.6, - "learning_rate": 1.8526661872869037e-06, - "loss": 0.8926, - "step": 23379 - }, - { - "epoch": 0.6, - "learning_rate": 1.8526517303631432e-06, - "loss": 0.7012, - "step": 23380 - }, - { - "epoch": 0.6, - "learning_rate": 1.8526372727865465e-06, - "loss": 0.8164, - "step": 23381 - }, - { - "epoch": 0.6, - "learning_rate": 1.8526228145571245e-06, - "loss": 0.8848, - "step": 23382 - }, - { - "epoch": 0.6, - "learning_rate": 1.8526083556748885e-06, - "loss": 0.8516, - "step": 23383 - }, - { - "epoch": 0.6, - "learning_rate": 1.8525938961398495e-06, - "loss": 0.8916, - "step": 23384 - }, - { - "epoch": 0.6, - "learning_rate": 1.8525794359520183e-06, - "loss": 0.5647, - "step": 23385 - }, - { - "epoch": 0.6, - "learning_rate": 1.8525649751114068e-06, - "loss": 0.876, - "step": 23386 - }, - { - "epoch": 0.6, - "learning_rate": 1.852550513618025e-06, - "loss": 0.5786, - "step": 23387 - }, - { - "epoch": 0.6, - "learning_rate": 1.8525360514718847e-06, - "loss": 0.5396, - "step": 23388 - }, - { - "epoch": 0.6, - "learning_rate": 1.8525215886729965e-06, - "loss": 0.8018, - "step": 23389 - }, - { - "epoch": 0.6, - "learning_rate": 1.852507125221372e-06, - "loss": 0.9375, - "step": 23390 - }, - { - "epoch": 0.6, - "learning_rate": 1.8524926611170218e-06, - "loss": 0.7988, - "step": 23391 - }, - { - "epoch": 0.6, - "learning_rate": 1.8524781963599574e-06, - "loss": 0.7705, - "step": 23392 - }, - { - "epoch": 0.6, - "learning_rate": 1.8524637309501895e-06, - "loss": 0.7627, - "step": 23393 - }, - { - "epoch": 0.6, - "learning_rate": 1.8524492648877293e-06, - "loss": 0.7754, - "step": 23394 - }, - { - "epoch": 0.6, - "learning_rate": 1.852434798172588e-06, - "loss": 0.9434, - "step": 23395 - }, - { - "epoch": 0.6, - "learning_rate": 1.8524203308047763e-06, - "loss": 1.0547, - "step": 23396 - }, - { - "epoch": 0.6, - "learning_rate": 1.8524058627843058e-06, - "loss": 0.603, - "step": 23397 - }, - { - "epoch": 0.6, - "learning_rate": 1.8523913941111872e-06, - "loss": 0.875, - "step": 23398 - }, - { - "epoch": 0.6, - "learning_rate": 1.8523769247854318e-06, - "loss": 0.7681, - "step": 23399 - }, - { - "epoch": 0.6, - "learning_rate": 1.8523624548070505e-06, - "loss": 0.9727, - "step": 23400 - }, - { - "epoch": 0.6, - "learning_rate": 1.8523479841760548e-06, - "loss": 0.9424, - "step": 23401 - }, - { - "epoch": 0.6, - "learning_rate": 1.852333512892455e-06, - "loss": 0.6812, - "step": 23402 - }, - { - "epoch": 0.6, - "learning_rate": 1.8523190409562628e-06, - "loss": 0.6714, - "step": 23403 - }, - { - "epoch": 0.6, - "learning_rate": 1.852304568367489e-06, - "loss": 0.6383, - "step": 23404 - }, - { - "epoch": 0.6, - "learning_rate": 1.8522900951261448e-06, - "loss": 0.7168, - "step": 23405 - }, - { - "epoch": 0.6, - "learning_rate": 1.8522756212322412e-06, - "loss": 0.8867, - "step": 23406 - }, - { - "epoch": 0.6, - "learning_rate": 1.8522611466857896e-06, - "loss": 0.7593, - "step": 23407 - }, - { - "epoch": 0.6, - "learning_rate": 1.8522466714868007e-06, - "loss": 1.0234, - "step": 23408 - }, - { - "epoch": 0.6, - "learning_rate": 1.8522321956352855e-06, - "loss": 0.8584, - "step": 23409 - }, - { - "epoch": 0.6, - "learning_rate": 1.8522177191312556e-06, - "loss": 0.7842, - "step": 23410 - }, - { - "epoch": 0.6, - "learning_rate": 1.8522032419747217e-06, - "loss": 0.9473, - "step": 23411 - }, - { - "epoch": 0.6, - "learning_rate": 1.852188764165695e-06, - "loss": 0.7811, - "step": 23412 - }, - { - "epoch": 0.6, - "learning_rate": 1.8521742857041864e-06, - "loss": 0.8916, - "step": 23413 - }, - { - "epoch": 0.6, - "learning_rate": 1.8521598065902074e-06, - "loss": 0.7466, - "step": 23414 - }, - { - "epoch": 0.6, - "learning_rate": 1.8521453268237685e-06, - "loss": 0.9199, - "step": 23415 - }, - { - "epoch": 0.6, - "learning_rate": 1.8521308464048812e-06, - "loss": 0.8955, - "step": 23416 - }, - { - "epoch": 0.6, - "learning_rate": 1.8521163653335565e-06, - "loss": 0.9111, - "step": 23417 - }, - { - "epoch": 0.6, - "learning_rate": 1.8521018836098055e-06, - "loss": 0.835, - "step": 23418 - }, - { - "epoch": 0.6, - "learning_rate": 1.8520874012336394e-06, - "loss": 0.9912, - "step": 23419 - }, - { - "epoch": 0.6, - "learning_rate": 1.852072918205069e-06, - "loss": 0.9336, - "step": 23420 - }, - { - "epoch": 0.6, - "learning_rate": 1.8520584345241055e-06, - "loss": 0.7236, - "step": 23421 - }, - { - "epoch": 0.6, - "learning_rate": 1.8520439501907603e-06, - "loss": 0.8877, - "step": 23422 - }, - { - "epoch": 0.6, - "learning_rate": 1.8520294652050439e-06, - "loss": 0.7002, - "step": 23423 - }, - { - "epoch": 0.6, - "learning_rate": 1.8520149795669679e-06, - "loss": 1.0801, - "step": 23424 - }, - { - "epoch": 0.6, - "learning_rate": 1.8520004932765431e-06, - "loss": 0.7583, - "step": 23425 - }, - { - "epoch": 0.6, - "learning_rate": 1.8519860063337806e-06, - "loss": 0.9248, - "step": 23426 - }, - { - "epoch": 0.6, - "learning_rate": 1.8519715187386922e-06, - "loss": 0.8154, - "step": 23427 - }, - { - "epoch": 0.6, - "learning_rate": 1.8519570304912878e-06, - "loss": 0.8726, - "step": 23428 - }, - { - "epoch": 0.6, - "learning_rate": 1.8519425415915793e-06, - "loss": 0.7148, - "step": 23429 - }, - { - "epoch": 0.6, - "learning_rate": 1.8519280520395773e-06, - "loss": 0.8281, - "step": 23430 - }, - { - "epoch": 0.6, - "learning_rate": 1.8519135618352935e-06, - "loss": 0.8018, - "step": 23431 - }, - { - "epoch": 0.6, - "learning_rate": 1.8518990709787383e-06, - "loss": 0.8271, - "step": 23432 - }, - { - "epoch": 0.6, - "learning_rate": 1.8518845794699234e-06, - "loss": 0.9844, - "step": 23433 - }, - { - "epoch": 0.6, - "learning_rate": 1.8518700873088596e-06, - "loss": 0.9131, - "step": 23434 - }, - { - "epoch": 0.6, - "learning_rate": 1.851855594495558e-06, - "loss": 0.9609, - "step": 23435 - }, - { - "epoch": 0.6, - "learning_rate": 1.85184110103003e-06, - "loss": 0.8848, - "step": 23436 - }, - { - "epoch": 0.6, - "learning_rate": 1.8518266069122862e-06, - "loss": 0.8447, - "step": 23437 - }, - { - "epoch": 0.6, - "learning_rate": 1.8518121121423378e-06, - "loss": 0.8379, - "step": 23438 - }, - { - "epoch": 0.6, - "learning_rate": 1.8517976167201964e-06, - "loss": 1.2822, - "step": 23439 - }, - { - "epoch": 0.6, - "learning_rate": 1.8517831206458725e-06, - "loss": 0.4434, - "step": 23440 - }, - { - "epoch": 0.6, - "learning_rate": 1.8517686239193772e-06, - "loss": 0.7192, - "step": 23441 - }, - { - "epoch": 0.6, - "learning_rate": 1.8517541265407224e-06, - "loss": 0.9014, - "step": 23442 - }, - { - "epoch": 0.6, - "learning_rate": 1.851739628509918e-06, - "loss": 1.1426, - "step": 23443 - }, - { - "epoch": 0.6, - "learning_rate": 1.8517251298269763e-06, - "loss": 0.7417, - "step": 23444 - }, - { - "epoch": 0.6, - "learning_rate": 1.8517106304919074e-06, - "loss": 0.9824, - "step": 23445 - }, - { - "epoch": 0.6, - "learning_rate": 1.8516961305047231e-06, - "loss": 0.8242, - "step": 23446 - }, - { - "epoch": 0.6, - "learning_rate": 1.851681629865434e-06, - "loss": 0.8525, - "step": 23447 - }, - { - "epoch": 0.6, - "learning_rate": 1.8516671285740518e-06, - "loss": 0.8936, - "step": 23448 - }, - { - "epoch": 0.6, - "learning_rate": 1.851652626630587e-06, - "loss": 0.8232, - "step": 23449 - }, - { - "epoch": 0.6, - "learning_rate": 1.8516381240350509e-06, - "loss": 0.96, - "step": 23450 - }, - { - "epoch": 0.6, - "learning_rate": 1.8516236207874547e-06, - "loss": 0.8936, - "step": 23451 - }, - { - "epoch": 0.6, - "learning_rate": 1.8516091168878093e-06, - "loss": 0.9639, - "step": 23452 - }, - { - "epoch": 0.6, - "learning_rate": 1.8515946123361263e-06, - "loss": 0.9844, - "step": 23453 - }, - { - "epoch": 0.6, - "learning_rate": 1.8515801071324164e-06, - "loss": 1.0225, - "step": 23454 - }, - { - "epoch": 0.6, - "learning_rate": 1.8515656012766905e-06, - "loss": 0.7959, - "step": 23455 - }, - { - "epoch": 0.6, - "learning_rate": 1.8515510947689603e-06, - "loss": 0.9854, - "step": 23456 - }, - { - "epoch": 0.6, - "learning_rate": 1.8515365876092363e-06, - "loss": 0.79, - "step": 23457 - }, - { - "epoch": 0.6, - "learning_rate": 1.85152207979753e-06, - "loss": 1.1094, - "step": 23458 - }, - { - "epoch": 0.6, - "learning_rate": 1.8515075713338523e-06, - "loss": 0.7466, - "step": 23459 - }, - { - "epoch": 0.6, - "learning_rate": 1.8514930622182145e-06, - "loss": 0.8848, - "step": 23460 - }, - { - "epoch": 0.6, - "learning_rate": 1.8514785524506278e-06, - "loss": 0.7676, - "step": 23461 - }, - { - "epoch": 0.6, - "learning_rate": 1.851464042031103e-06, - "loss": 1.0771, - "step": 23462 - }, - { - "epoch": 0.6, - "learning_rate": 1.8514495309596511e-06, - "loss": 0.9424, - "step": 23463 - }, - { - "epoch": 0.6, - "learning_rate": 1.8514350192362837e-06, - "loss": 0.7578, - "step": 23464 - }, - { - "epoch": 0.6, - "learning_rate": 1.8514205068610116e-06, - "loss": 0.8516, - "step": 23465 - }, - { - "epoch": 0.6, - "learning_rate": 1.851405993833846e-06, - "loss": 0.7563, - "step": 23466 - }, - { - "epoch": 0.6, - "learning_rate": 1.851391480154798e-06, - "loss": 0.8691, - "step": 23467 - }, - { - "epoch": 0.6, - "learning_rate": 1.8513769658238784e-06, - "loss": 1.0146, - "step": 23468 - }, - { - "epoch": 0.6, - "learning_rate": 1.851362450841099e-06, - "loss": 0.8789, - "step": 23469 - }, - { - "epoch": 0.6, - "learning_rate": 1.8513479352064703e-06, - "loss": 0.5679, - "step": 23470 - }, - { - "epoch": 0.6, - "learning_rate": 1.8513334189200038e-06, - "loss": 0.8306, - "step": 23471 - }, - { - "epoch": 0.6, - "learning_rate": 1.8513189019817101e-06, - "loss": 1.0195, - "step": 23472 - }, - { - "epoch": 0.6, - "learning_rate": 1.8513043843916009e-06, - "loss": 0.7324, - "step": 23473 - }, - { - "epoch": 0.6, - "learning_rate": 1.8512898661496873e-06, - "loss": 0.915, - "step": 23474 - }, - { - "epoch": 0.6, - "learning_rate": 1.8512753472559797e-06, - "loss": 1.041, - "step": 23475 - }, - { - "epoch": 0.6, - "learning_rate": 1.8512608277104902e-06, - "loss": 0.8457, - "step": 23476 - }, - { - "epoch": 0.6, - "learning_rate": 1.8512463075132292e-06, - "loss": 0.7471, - "step": 23477 - }, - { - "epoch": 0.6, - "learning_rate": 1.8512317866642077e-06, - "loss": 0.8408, - "step": 23478 - }, - { - "epoch": 0.6, - "learning_rate": 1.8512172651634378e-06, - "loss": 0.8203, - "step": 23479 - }, - { - "epoch": 0.6, - "learning_rate": 1.8512027430109293e-06, - "loss": 0.7388, - "step": 23480 - }, - { - "epoch": 0.6, - "learning_rate": 1.8511882202066947e-06, - "loss": 0.9551, - "step": 23481 - }, - { - "epoch": 0.6, - "learning_rate": 1.8511736967507438e-06, - "loss": 1.1182, - "step": 23482 - }, - { - "epoch": 0.6, - "learning_rate": 1.8511591726430889e-06, - "loss": 0.9141, - "step": 23483 - }, - { - "epoch": 0.6, - "learning_rate": 1.8511446478837402e-06, - "loss": 0.8296, - "step": 23484 - }, - { - "epoch": 0.6, - "learning_rate": 1.8511301224727091e-06, - "loss": 0.7861, - "step": 23485 - }, - { - "epoch": 0.6, - "learning_rate": 1.8511155964100071e-06, - "loss": 0.8809, - "step": 23486 - }, - { - "epoch": 0.6, - "learning_rate": 1.851101069695645e-06, - "loss": 0.7725, - "step": 23487 - }, - { - "epoch": 0.6, - "learning_rate": 1.8510865423296337e-06, - "loss": 0.7738, - "step": 23488 - }, - { - "epoch": 0.6, - "learning_rate": 1.8510720143119848e-06, - "loss": 0.7245, - "step": 23489 - }, - { - "epoch": 0.6, - "learning_rate": 1.8510574856427091e-06, - "loss": 0.8979, - "step": 23490 - }, - { - "epoch": 0.6, - "learning_rate": 1.8510429563218178e-06, - "loss": 0.8516, - "step": 23491 - }, - { - "epoch": 0.6, - "learning_rate": 1.851028426349322e-06, - "loss": 0.7095, - "step": 23492 - }, - { - "epoch": 0.6, - "learning_rate": 1.851013895725233e-06, - "loss": 0.9131, - "step": 23493 - }, - { - "epoch": 0.6, - "learning_rate": 1.8509993644495619e-06, - "loss": 1.0332, - "step": 23494 - }, - { - "epoch": 0.6, - "learning_rate": 1.8509848325223195e-06, - "loss": 0.5791, - "step": 23495 - }, - { - "epoch": 0.6, - "learning_rate": 1.850970299943517e-06, - "loss": 0.6465, - "step": 23496 - }, - { - "epoch": 0.6, - "learning_rate": 1.8509557667131657e-06, - "loss": 1.001, - "step": 23497 - }, - { - "epoch": 0.6, - "learning_rate": 1.850941232831277e-06, - "loss": 0.7158, - "step": 23498 - }, - { - "epoch": 0.6, - "learning_rate": 1.8509266982978615e-06, - "loss": 0.8281, - "step": 23499 - }, - { - "epoch": 0.6, - "learning_rate": 1.8509121631129308e-06, - "loss": 0.856, - "step": 23500 - }, - { - "epoch": 0.6, - "learning_rate": 1.8508976272764954e-06, - "loss": 1.0039, - "step": 23501 - }, - { - "epoch": 0.6, - "learning_rate": 1.8508830907885671e-06, - "loss": 0.874, - "step": 23502 - }, - { - "epoch": 0.6, - "learning_rate": 1.8508685536491566e-06, - "loss": 0.8955, - "step": 23503 - }, - { - "epoch": 0.6, - "learning_rate": 1.8508540158582753e-06, - "loss": 1.0166, - "step": 23504 - }, - { - "epoch": 0.6, - "learning_rate": 1.850839477415934e-06, - "loss": 0.8076, - "step": 23505 - }, - { - "epoch": 0.6, - "learning_rate": 1.8508249383221442e-06, - "loss": 0.7266, - "step": 23506 - }, - { - "epoch": 0.6, - "learning_rate": 1.8508103985769168e-06, - "loss": 1.0215, - "step": 23507 - }, - { - "epoch": 0.6, - "learning_rate": 1.850795858180263e-06, - "loss": 0.958, - "step": 23508 - }, - { - "epoch": 0.6, - "learning_rate": 1.8507813171321941e-06, - "loss": 0.6426, - "step": 23509 - }, - { - "epoch": 0.6, - "learning_rate": 1.8507667754327208e-06, - "loss": 0.7305, - "step": 23510 - }, - { - "epoch": 0.6, - "learning_rate": 1.8507522330818547e-06, - "loss": 0.8906, - "step": 23511 - }, - { - "epoch": 0.6, - "learning_rate": 1.8507376900796067e-06, - "loss": 0.9453, - "step": 23512 - }, - { - "epoch": 0.6, - "learning_rate": 1.8507231464259881e-06, - "loss": 0.9424, - "step": 23513 - }, - { - "epoch": 0.6, - "learning_rate": 1.8507086021210097e-06, - "loss": 1.0186, - "step": 23514 - }, - { - "epoch": 0.6, - "learning_rate": 1.8506940571646827e-06, - "loss": 0.9648, - "step": 23515 - }, - { - "epoch": 0.6, - "learning_rate": 1.8506795115570186e-06, - "loss": 1.002, - "step": 23516 - }, - { - "epoch": 0.6, - "learning_rate": 1.8506649652980281e-06, - "loss": 1.0918, - "step": 23517 - }, - { - "epoch": 0.6, - "learning_rate": 1.850650418387723e-06, - "loss": 0.7051, - "step": 23518 - }, - { - "epoch": 0.6, - "learning_rate": 1.8506358708261136e-06, - "loss": 0.8564, - "step": 23519 - }, - { - "epoch": 0.6, - "learning_rate": 1.8506213226132114e-06, - "loss": 1.1924, - "step": 23520 - }, - { - "epoch": 0.6, - "learning_rate": 1.8506067737490279e-06, - "loss": 0.7539, - "step": 23521 - }, - { - "epoch": 0.6, - "learning_rate": 1.8505922242335736e-06, - "loss": 0.9736, - "step": 23522 - }, - { - "epoch": 0.6, - "learning_rate": 1.85057767406686e-06, - "loss": 0.8789, - "step": 23523 - }, - { - "epoch": 0.6, - "learning_rate": 1.8505631232488984e-06, - "loss": 0.9746, - "step": 23524 - }, - { - "epoch": 0.6, - "learning_rate": 1.8505485717796993e-06, - "loss": 1.0332, - "step": 23525 - }, - { - "epoch": 0.6, - "learning_rate": 1.8505340196592747e-06, - "loss": 0.8701, - "step": 23526 - }, - { - "epoch": 0.6, - "learning_rate": 1.8505194668876348e-06, - "loss": 0.7588, - "step": 23527 - }, - { - "epoch": 0.6, - "learning_rate": 1.8505049134647918e-06, - "loss": 0.9409, - "step": 23528 - }, - { - "epoch": 0.6, - "learning_rate": 1.8504903593907562e-06, - "loss": 0.6562, - "step": 23529 - }, - { - "epoch": 0.6, - "learning_rate": 1.850475804665539e-06, - "loss": 0.9395, - "step": 23530 - }, - { - "epoch": 0.6, - "learning_rate": 1.850461249289152e-06, - "loss": 0.7959, - "step": 23531 - }, - { - "epoch": 0.6, - "learning_rate": 1.8504466932616055e-06, - "loss": 0.8159, - "step": 23532 - }, - { - "epoch": 0.6, - "learning_rate": 1.8504321365829111e-06, - "loss": 0.7656, - "step": 23533 - }, - { - "epoch": 0.6, - "learning_rate": 1.8504175792530801e-06, - "loss": 0.9531, - "step": 23534 - }, - { - "epoch": 0.6, - "learning_rate": 1.8504030212721233e-06, - "loss": 0.7725, - "step": 23535 - }, - { - "epoch": 0.6, - "learning_rate": 1.8503884626400522e-06, - "loss": 0.9375, - "step": 23536 - }, - { - "epoch": 0.6, - "learning_rate": 1.8503739033568774e-06, - "loss": 0.8438, - "step": 23537 - }, - { - "epoch": 0.6, - "learning_rate": 1.850359343422611e-06, - "loss": 0.6885, - "step": 23538 - }, - { - "epoch": 0.6, - "learning_rate": 1.8503447828372632e-06, - "loss": 0.7786, - "step": 23539 - }, - { - "epoch": 0.6, - "learning_rate": 1.850330221600845e-06, - "loss": 0.7246, - "step": 23540 - }, - { - "epoch": 0.6, - "learning_rate": 1.8503156597133689e-06, - "loss": 0.8389, - "step": 23541 - }, - { - "epoch": 0.6, - "learning_rate": 1.850301097174845e-06, - "loss": 0.7529, - "step": 23542 - }, - { - "epoch": 0.6, - "learning_rate": 1.8502865339852842e-06, - "loss": 0.957, - "step": 23543 - }, - { - "epoch": 0.6, - "learning_rate": 1.8502719701446985e-06, - "loss": 0.6409, - "step": 23544 - }, - { - "epoch": 0.6, - "learning_rate": 1.8502574056530987e-06, - "loss": 0.7622, - "step": 23545 - }, - { - "epoch": 0.6, - "learning_rate": 1.8502428405104956e-06, - "loss": 0.8652, - "step": 23546 - }, - { - "epoch": 0.6, - "learning_rate": 1.8502282747169007e-06, - "loss": 0.7939, - "step": 23547 - }, - { - "epoch": 0.6, - "learning_rate": 1.8502137082723252e-06, - "loss": 0.8604, - "step": 23548 - }, - { - "epoch": 0.6, - "learning_rate": 1.8501991411767803e-06, - "loss": 0.5881, - "step": 23549 - }, - { - "epoch": 0.6, - "learning_rate": 1.8501845734302768e-06, - "loss": 0.7351, - "step": 23550 - }, - { - "epoch": 0.6, - "learning_rate": 1.8501700050328261e-06, - "loss": 0.7441, - "step": 23551 - }, - { - "epoch": 0.6, - "learning_rate": 1.8501554359844394e-06, - "loss": 0.873, - "step": 23552 - }, - { - "epoch": 0.6, - "learning_rate": 1.8501408662851277e-06, - "loss": 0.6919, - "step": 23553 - }, - { - "epoch": 0.6, - "learning_rate": 1.8501262959349023e-06, - "loss": 0.915, - "step": 23554 - }, - { - "epoch": 0.6, - "learning_rate": 1.8501117249337743e-06, - "loss": 0.8262, - "step": 23555 - }, - { - "epoch": 0.6, - "learning_rate": 1.8500971532817547e-06, - "loss": 0.873, - "step": 23556 - }, - { - "epoch": 0.6, - "learning_rate": 1.8500825809788548e-06, - "loss": 0.8447, - "step": 23557 - }, - { - "epoch": 0.6, - "learning_rate": 1.850068008025086e-06, - "loss": 0.9307, - "step": 23558 - }, - { - "epoch": 0.6, - "learning_rate": 1.850053434420459e-06, - "loss": 0.7559, - "step": 23559 - }, - { - "epoch": 0.6, - "learning_rate": 1.8500388601649853e-06, - "loss": 0.791, - "step": 23560 - }, - { - "epoch": 0.6, - "learning_rate": 1.8500242852586756e-06, - "loss": 0.8828, - "step": 23561 - }, - { - "epoch": 0.6, - "learning_rate": 1.850009709701542e-06, - "loss": 0.8604, - "step": 23562 - }, - { - "epoch": 0.6, - "learning_rate": 1.8499951334935946e-06, - "loss": 0.999, - "step": 23563 - }, - { - "epoch": 0.6, - "learning_rate": 1.849980556634845e-06, - "loss": 0.8271, - "step": 23564 - }, - { - "epoch": 0.6, - "learning_rate": 1.8499659791253044e-06, - "loss": 0.6973, - "step": 23565 - }, - { - "epoch": 0.6, - "learning_rate": 1.8499514009649842e-06, - "loss": 0.8584, - "step": 23566 - }, - { - "epoch": 0.6, - "learning_rate": 1.849936822153895e-06, - "loss": 0.9609, - "step": 23567 - }, - { - "epoch": 0.6, - "learning_rate": 1.8499222426920484e-06, - "loss": 0.96, - "step": 23568 - }, - { - "epoch": 0.6, - "learning_rate": 1.8499076625794551e-06, - "loss": 0.999, - "step": 23569 - }, - { - "epoch": 0.6, - "learning_rate": 1.849893081816127e-06, - "loss": 0.9404, - "step": 23570 - }, - { - "epoch": 0.6, - "learning_rate": 1.8498785004020747e-06, - "loss": 0.9229, - "step": 23571 - }, - { - "epoch": 0.6, - "learning_rate": 1.8498639183373095e-06, - "loss": 0.667, - "step": 23572 - }, - { - "epoch": 0.6, - "learning_rate": 1.8498493356218424e-06, - "loss": 0.8787, - "step": 23573 - }, - { - "epoch": 0.6, - "learning_rate": 1.8498347522556853e-06, - "loss": 0.4851, - "step": 23574 - }, - { - "epoch": 0.6, - "learning_rate": 1.8498201682388484e-06, - "loss": 0.8867, - "step": 23575 - }, - { - "epoch": 0.6, - "learning_rate": 1.849805583571343e-06, - "loss": 0.7739, - "step": 23576 - }, - { - "epoch": 0.6, - "learning_rate": 1.849790998253181e-06, - "loss": 0.9004, - "step": 23577 - }, - { - "epoch": 0.6, - "learning_rate": 1.8497764122843731e-06, - "loss": 0.9131, - "step": 23578 - }, - { - "epoch": 0.6, - "learning_rate": 1.8497618256649301e-06, - "loss": 0.6724, - "step": 23579 - }, - { - "epoch": 0.6, - "learning_rate": 1.849747238394864e-06, - "loss": 0.8125, - "step": 23580 - }, - { - "epoch": 0.6, - "learning_rate": 1.8497326504741853e-06, - "loss": 0.6045, - "step": 23581 - }, - { - "epoch": 0.6, - "learning_rate": 1.8497180619029052e-06, - "loss": 0.5042, - "step": 23582 - }, - { - "epoch": 0.6, - "learning_rate": 1.8497034726810352e-06, - "loss": 1.0215, - "step": 23583 - }, - { - "epoch": 0.6, - "learning_rate": 1.8496888828085863e-06, - "loss": 0.8457, - "step": 23584 - }, - { - "epoch": 0.6, - "learning_rate": 1.8496742922855697e-06, - "loss": 0.7725, - "step": 23585 - }, - { - "epoch": 0.6, - "learning_rate": 1.8496597011119967e-06, - "loss": 0.7949, - "step": 23586 - }, - { - "epoch": 0.6, - "learning_rate": 1.8496451092878782e-06, - "loss": 0.7876, - "step": 23587 - }, - { - "epoch": 0.6, - "learning_rate": 1.8496305168132255e-06, - "loss": 0.7812, - "step": 23588 - }, - { - "epoch": 0.6, - "learning_rate": 1.84961592368805e-06, - "loss": 0.7793, - "step": 23589 - }, - { - "epoch": 0.6, - "learning_rate": 1.8496013299123626e-06, - "loss": 0.8623, - "step": 23590 - }, - { - "epoch": 0.6, - "learning_rate": 1.8495867354861741e-06, - "loss": 1.0391, - "step": 23591 - }, - { - "epoch": 0.6, - "learning_rate": 1.8495721404094966e-06, - "loss": 0.9111, - "step": 23592 - }, - { - "epoch": 0.6, - "learning_rate": 1.8495575446823403e-06, - "loss": 1.0996, - "step": 23593 - }, - { - "epoch": 0.6, - "learning_rate": 1.8495429483047173e-06, - "loss": 1.0312, - "step": 23594 - }, - { - "epoch": 0.6, - "learning_rate": 1.8495283512766383e-06, - "loss": 1.0635, - "step": 23595 - }, - { - "epoch": 0.6, - "learning_rate": 1.8495137535981142e-06, - "loss": 0.7109, - "step": 23596 - }, - { - "epoch": 0.6, - "learning_rate": 1.8494991552691568e-06, - "loss": 0.8955, - "step": 23597 - }, - { - "epoch": 0.6, - "learning_rate": 1.8494845562897767e-06, - "loss": 0.7871, - "step": 23598 - }, - { - "epoch": 0.6, - "learning_rate": 1.8494699566599853e-06, - "loss": 0.8301, - "step": 23599 - }, - { - "epoch": 0.6, - "learning_rate": 1.849455356379794e-06, - "loss": 0.6226, - "step": 23600 - }, - { - "epoch": 0.6, - "learning_rate": 1.8494407554492137e-06, - "loss": 1.0127, - "step": 23601 - }, - { - "epoch": 0.6, - "learning_rate": 1.8494261538682557e-06, - "loss": 0.8994, - "step": 23602 - }, - { - "epoch": 0.6, - "learning_rate": 1.8494115516369314e-06, - "loss": 1.0068, - "step": 23603 - }, - { - "epoch": 0.6, - "learning_rate": 1.8493969487552512e-06, - "loss": 0.8574, - "step": 23604 - }, - { - "epoch": 0.61, - "learning_rate": 1.8493823452232271e-06, - "loss": 0.9287, - "step": 23605 - }, - { - "epoch": 0.61, - "learning_rate": 1.8493677410408702e-06, - "loss": 0.7642, - "step": 23606 - }, - { - "epoch": 0.61, - "learning_rate": 1.849353136208191e-06, - "loss": 0.8975, - "step": 23607 - }, - { - "epoch": 0.61, - "learning_rate": 1.8493385307252017e-06, - "loss": 0.8799, - "step": 23608 - }, - { - "epoch": 0.61, - "learning_rate": 1.8493239245919128e-06, - "loss": 0.9082, - "step": 23609 - }, - { - "epoch": 0.61, - "learning_rate": 1.8493093178083354e-06, - "loss": 0.7568, - "step": 23610 - }, - { - "epoch": 0.61, - "learning_rate": 1.849294710374481e-06, - "loss": 0.9043, - "step": 23611 - }, - { - "epoch": 0.61, - "learning_rate": 1.8492801022903606e-06, - "loss": 0.9775, - "step": 23612 - }, - { - "epoch": 0.61, - "learning_rate": 1.8492654935559858e-06, - "loss": 0.9414, - "step": 23613 - }, - { - "epoch": 0.61, - "learning_rate": 1.8492508841713672e-06, - "loss": 1.0332, - "step": 23614 - }, - { - "epoch": 0.61, - "learning_rate": 1.8492362741365162e-06, - "loss": 0.917, - "step": 23615 - }, - { - "epoch": 0.61, - "learning_rate": 1.849221663451444e-06, - "loss": 0.9033, - "step": 23616 - }, - { - "epoch": 0.61, - "learning_rate": 1.849207052116162e-06, - "loss": 0.8145, - "step": 23617 - }, - { - "epoch": 0.61, - "learning_rate": 1.849192440130681e-06, - "loss": 0.6821, - "step": 23618 - }, - { - "epoch": 0.61, - "learning_rate": 1.8491778274950128e-06, - "loss": 0.9727, - "step": 23619 - }, - { - "epoch": 0.61, - "learning_rate": 1.8491632142091678e-06, - "loss": 0.5784, - "step": 23620 - }, - { - "epoch": 0.61, - "learning_rate": 1.8491486002731579e-06, - "loss": 0.7568, - "step": 23621 - }, - { - "epoch": 0.61, - "learning_rate": 1.8491339856869936e-06, - "loss": 1.0098, - "step": 23622 - }, - { - "epoch": 0.61, - "learning_rate": 1.8491193704506867e-06, - "loss": 0.8799, - "step": 23623 - }, - { - "epoch": 0.61, - "learning_rate": 1.849104754564248e-06, - "loss": 0.9629, - "step": 23624 - }, - { - "epoch": 0.61, - "learning_rate": 1.8490901380276889e-06, - "loss": 0.8066, - "step": 23625 - }, - { - "epoch": 0.61, - "learning_rate": 1.8490755208410204e-06, - "loss": 0.9268, - "step": 23626 - }, - { - "epoch": 0.61, - "learning_rate": 1.8490609030042542e-06, - "loss": 0.9434, - "step": 23627 - }, - { - "epoch": 0.61, - "learning_rate": 1.8490462845174007e-06, - "loss": 1.0059, - "step": 23628 - }, - { - "epoch": 0.61, - "learning_rate": 1.8490316653804715e-06, - "loss": 0.9619, - "step": 23629 - }, - { - "epoch": 0.61, - "learning_rate": 1.849017045593478e-06, - "loss": 0.8555, - "step": 23630 - }, - { - "epoch": 0.61, - "learning_rate": 1.8490024251564311e-06, - "loss": 0.707, - "step": 23631 - }, - { - "epoch": 0.61, - "learning_rate": 1.8489878040693422e-06, - "loss": 0.9473, - "step": 23632 - }, - { - "epoch": 0.61, - "learning_rate": 1.8489731823322221e-06, - "loss": 1.0117, - "step": 23633 - }, - { - "epoch": 0.61, - "learning_rate": 1.8489585599450822e-06, - "loss": 0.8022, - "step": 23634 - }, - { - "epoch": 0.61, - "learning_rate": 1.8489439369079343e-06, - "loss": 0.7886, - "step": 23635 - }, - { - "epoch": 0.61, - "learning_rate": 1.8489293132207888e-06, - "loss": 0.8291, - "step": 23636 - }, - { - "epoch": 0.61, - "learning_rate": 1.848914688883657e-06, - "loss": 1.042, - "step": 23637 - }, - { - "epoch": 0.61, - "learning_rate": 1.8489000638965506e-06, - "loss": 0.8745, - "step": 23638 - }, - { - "epoch": 0.61, - "learning_rate": 1.84888543825948e-06, - "loss": 0.8945, - "step": 23639 - }, - { - "epoch": 0.61, - "learning_rate": 1.8488708119724572e-06, - "loss": 0.7852, - "step": 23640 - }, - { - "epoch": 0.61, - "learning_rate": 1.8488561850354932e-06, - "loss": 0.7354, - "step": 23641 - }, - { - "epoch": 0.61, - "learning_rate": 1.8488415574485985e-06, - "loss": 0.8164, - "step": 23642 - }, - { - "epoch": 0.61, - "learning_rate": 1.8488269292117853e-06, - "loss": 0.9941, - "step": 23643 - }, - { - "epoch": 0.61, - "learning_rate": 1.848812300325064e-06, - "loss": 0.8203, - "step": 23644 - }, - { - "epoch": 0.61, - "learning_rate": 1.8487976707884462e-06, - "loss": 0.7876, - "step": 23645 - }, - { - "epoch": 0.61, - "learning_rate": 1.8487830406019436e-06, - "loss": 1.0107, - "step": 23646 - }, - { - "epoch": 0.61, - "learning_rate": 1.8487684097655664e-06, - "loss": 0.8555, - "step": 23647 - }, - { - "epoch": 0.61, - "learning_rate": 1.848753778279326e-06, - "loss": 0.8809, - "step": 23648 - }, - { - "epoch": 0.61, - "learning_rate": 1.8487391461432344e-06, - "loss": 0.9229, - "step": 23649 - }, - { - "epoch": 0.61, - "learning_rate": 1.848724513357302e-06, - "loss": 0.7158, - "step": 23650 - }, - { - "epoch": 0.61, - "learning_rate": 1.8487098799215404e-06, - "loss": 0.9082, - "step": 23651 - }, - { - "epoch": 0.61, - "learning_rate": 1.8486952458359605e-06, - "loss": 0.6719, - "step": 23652 - }, - { - "epoch": 0.61, - "learning_rate": 1.8486806111005738e-06, - "loss": 0.877, - "step": 23653 - }, - { - "epoch": 0.61, - "learning_rate": 1.848665975715391e-06, - "loss": 0.5486, - "step": 23654 - }, - { - "epoch": 0.61, - "learning_rate": 1.8486513396804243e-06, - "loss": 0.9902, - "step": 23655 - }, - { - "epoch": 0.61, - "learning_rate": 1.848636702995684e-06, - "loss": 0.8398, - "step": 23656 - }, - { - "epoch": 0.61, - "learning_rate": 1.8486220656611815e-06, - "loss": 0.9023, - "step": 23657 - }, - { - "epoch": 0.61, - "learning_rate": 1.8486074276769283e-06, - "loss": 0.7949, - "step": 23658 - }, - { - "epoch": 0.61, - "learning_rate": 1.8485927890429354e-06, - "loss": 0.9775, - "step": 23659 - }, - { - "epoch": 0.61, - "learning_rate": 1.8485781497592136e-06, - "loss": 0.9473, - "step": 23660 - }, - { - "epoch": 0.61, - "learning_rate": 1.848563509825775e-06, - "loss": 0.8096, - "step": 23661 - }, - { - "epoch": 0.61, - "learning_rate": 1.8485488692426304e-06, - "loss": 0.8643, - "step": 23662 - }, - { - "epoch": 0.61, - "learning_rate": 1.8485342280097907e-06, - "loss": 0.8428, - "step": 23663 - }, - { - "epoch": 0.61, - "learning_rate": 1.8485195861272674e-06, - "loss": 1.0459, - "step": 23664 - }, - { - "epoch": 0.61, - "learning_rate": 1.8485049435950716e-06, - "loss": 0.8018, - "step": 23665 - }, - { - "epoch": 0.61, - "learning_rate": 1.8484903004132146e-06, - "loss": 0.8965, - "step": 23666 - }, - { - "epoch": 0.61, - "learning_rate": 1.8484756565817077e-06, - "loss": 1.0732, - "step": 23667 - }, - { - "epoch": 0.61, - "learning_rate": 1.8484610121005619e-06, - "loss": 0.8193, - "step": 23668 - }, - { - "epoch": 0.61, - "learning_rate": 1.8484463669697888e-06, - "loss": 0.8115, - "step": 23669 - }, - { - "epoch": 0.61, - "learning_rate": 1.848431721189399e-06, - "loss": 0.8672, - "step": 23670 - }, - { - "epoch": 0.61, - "learning_rate": 1.848417074759404e-06, - "loss": 0.9902, - "step": 23671 - }, - { - "epoch": 0.61, - "learning_rate": 1.848402427679815e-06, - "loss": 0.8711, - "step": 23672 - }, - { - "epoch": 0.61, - "learning_rate": 1.8483877799506437e-06, - "loss": 0.8735, - "step": 23673 - }, - { - "epoch": 0.61, - "learning_rate": 1.8483731315719008e-06, - "loss": 0.8682, - "step": 23674 - }, - { - "epoch": 0.61, - "learning_rate": 1.848358482543597e-06, - "loss": 0.9414, - "step": 23675 - }, - { - "epoch": 0.61, - "learning_rate": 1.848343832865745e-06, - "loss": 0.8304, - "step": 23676 - }, - { - "epoch": 0.61, - "learning_rate": 1.8483291825383546e-06, - "loss": 0.9106, - "step": 23677 - }, - { - "epoch": 0.61, - "learning_rate": 1.8483145315614376e-06, - "loss": 0.8164, - "step": 23678 - }, - { - "epoch": 0.61, - "learning_rate": 1.8482998799350052e-06, - "loss": 0.71, - "step": 23679 - }, - { - "epoch": 0.61, - "learning_rate": 1.8482852276590685e-06, - "loss": 0.5186, - "step": 23680 - }, - { - "epoch": 0.61, - "learning_rate": 1.848270574733639e-06, - "loss": 0.6631, - "step": 23681 - }, - { - "epoch": 0.61, - "learning_rate": 1.8482559211587279e-06, - "loss": 0.6753, - "step": 23682 - }, - { - "epoch": 0.61, - "learning_rate": 1.8482412669343459e-06, - "loss": 0.9746, - "step": 23683 - }, - { - "epoch": 0.61, - "learning_rate": 1.8482266120605047e-06, - "loss": 0.918, - "step": 23684 - }, - { - "epoch": 0.61, - "learning_rate": 1.848211956537215e-06, - "loss": 0.7949, - "step": 23685 - }, - { - "epoch": 0.61, - "learning_rate": 1.848197300364489e-06, - "loss": 0.7778, - "step": 23686 - }, - { - "epoch": 0.61, - "learning_rate": 1.8481826435423372e-06, - "loss": 0.668, - "step": 23687 - }, - { - "epoch": 0.61, - "learning_rate": 1.848167986070771e-06, - "loss": 0.8867, - "step": 23688 - }, - { - "epoch": 0.61, - "learning_rate": 1.8481533279498013e-06, - "loss": 0.9199, - "step": 23689 - }, - { - "epoch": 0.61, - "learning_rate": 1.8481386691794396e-06, - "loss": 0.9287, - "step": 23690 - }, - { - "epoch": 0.61, - "learning_rate": 1.8481240097596974e-06, - "loss": 0.7852, - "step": 23691 - }, - { - "epoch": 0.61, - "learning_rate": 1.8481093496905854e-06, - "loss": 0.7427, - "step": 23692 - }, - { - "epoch": 0.61, - "learning_rate": 1.8480946889721149e-06, - "loss": 0.79, - "step": 23693 - }, - { - "epoch": 0.61, - "learning_rate": 1.8480800276042977e-06, - "loss": 0.8975, - "step": 23694 - }, - { - "epoch": 0.61, - "learning_rate": 1.8480653655871444e-06, - "loss": 0.9287, - "step": 23695 - }, - { - "epoch": 0.61, - "learning_rate": 1.8480507029206664e-06, - "loss": 0.8306, - "step": 23696 - }, - { - "epoch": 0.61, - "learning_rate": 1.848036039604875e-06, - "loss": 0.9512, - "step": 23697 - }, - { - "epoch": 0.61, - "learning_rate": 1.8480213756397816e-06, - "loss": 0.8096, - "step": 23698 - }, - { - "epoch": 0.61, - "learning_rate": 1.848006711025397e-06, - "loss": 0.9707, - "step": 23699 - }, - { - "epoch": 0.61, - "learning_rate": 1.8479920457617329e-06, - "loss": 1.0312, - "step": 23700 - }, - { - "epoch": 0.61, - "learning_rate": 1.8479773798488e-06, - "loss": 0.864, - "step": 23701 - }, - { - "epoch": 0.61, - "learning_rate": 1.84796271328661e-06, - "loss": 0.6738, - "step": 23702 - }, - { - "epoch": 0.61, - "learning_rate": 1.8479480460751739e-06, - "loss": 1.0762, - "step": 23703 - }, - { - "epoch": 0.61, - "learning_rate": 1.847933378214503e-06, - "loss": 0.9609, - "step": 23704 - }, - { - "epoch": 0.61, - "learning_rate": 1.8479187097046083e-06, - "loss": 0.7285, - "step": 23705 - }, - { - "epoch": 0.61, - "learning_rate": 1.8479040405455012e-06, - "loss": 0.7227, - "step": 23706 - }, - { - "epoch": 0.61, - "learning_rate": 1.8478893707371932e-06, - "loss": 0.6631, - "step": 23707 - }, - { - "epoch": 0.61, - "learning_rate": 1.8478747002796954e-06, - "loss": 0.9395, - "step": 23708 - }, - { - "epoch": 0.61, - "learning_rate": 1.8478600291730188e-06, - "loss": 1.0039, - "step": 23709 - }, - { - "epoch": 0.61, - "learning_rate": 1.8478453574171747e-06, - "loss": 0.9717, - "step": 23710 - }, - { - "epoch": 0.61, - "learning_rate": 1.8478306850121746e-06, - "loss": 0.8203, - "step": 23711 - }, - { - "epoch": 0.61, - "learning_rate": 1.847816011958029e-06, - "loss": 1.0059, - "step": 23712 - }, - { - "epoch": 0.61, - "learning_rate": 1.8478013382547501e-06, - "loss": 0.9131, - "step": 23713 - }, - { - "epoch": 0.61, - "learning_rate": 1.8477866639023488e-06, - "loss": 0.9443, - "step": 23714 - }, - { - "epoch": 0.61, - "learning_rate": 1.847771988900836e-06, - "loss": 0.6748, - "step": 23715 - }, - { - "epoch": 0.61, - "learning_rate": 1.847757313250223e-06, - "loss": 0.7051, - "step": 23716 - }, - { - "epoch": 0.61, - "learning_rate": 1.8477426369505215e-06, - "loss": 0.7939, - "step": 23717 - }, - { - "epoch": 0.61, - "learning_rate": 1.8477279600017425e-06, - "loss": 0.876, - "step": 23718 - }, - { - "epoch": 0.61, - "learning_rate": 1.8477132824038969e-06, - "loss": 0.7461, - "step": 23719 - }, - { - "epoch": 0.61, - "learning_rate": 1.8476986041569964e-06, - "loss": 0.877, - "step": 23720 - }, - { - "epoch": 0.61, - "learning_rate": 1.847683925261052e-06, - "loss": 0.9668, - "step": 23721 - }, - { - "epoch": 0.61, - "learning_rate": 1.847669245716075e-06, - "loss": 0.9736, - "step": 23722 - }, - { - "epoch": 0.61, - "learning_rate": 1.8476545655220765e-06, - "loss": 0.752, - "step": 23723 - }, - { - "epoch": 0.61, - "learning_rate": 1.8476398846790682e-06, - "loss": 1.085, - "step": 23724 - }, - { - "epoch": 0.61, - "learning_rate": 1.847625203187061e-06, - "loss": 1.0195, - "step": 23725 - }, - { - "epoch": 0.61, - "learning_rate": 1.8476105210460657e-06, - "loss": 0.8535, - "step": 23726 - }, - { - "epoch": 0.61, - "learning_rate": 1.8475958382560943e-06, - "loss": 0.8086, - "step": 23727 - }, - { - "epoch": 0.61, - "learning_rate": 1.847581154817158e-06, - "loss": 0.7734, - "step": 23728 - }, - { - "epoch": 0.61, - "learning_rate": 1.8475664707292674e-06, - "loss": 0.8965, - "step": 23729 - }, - { - "epoch": 0.61, - "learning_rate": 1.8475517859924344e-06, - "loss": 1.0928, - "step": 23730 - }, - { - "epoch": 0.61, - "learning_rate": 1.8475371006066696e-06, - "loss": 0.9307, - "step": 23731 - }, - { - "epoch": 0.61, - "learning_rate": 1.8475224145719847e-06, - "loss": 0.6807, - "step": 23732 - }, - { - "epoch": 0.61, - "learning_rate": 1.8475077278883913e-06, - "loss": 0.8638, - "step": 23733 - }, - { - "epoch": 0.61, - "learning_rate": 1.8474930405559e-06, - "loss": 1.0117, - "step": 23734 - }, - { - "epoch": 0.61, - "learning_rate": 1.847478352574522e-06, - "loss": 0.9844, - "step": 23735 - }, - { - "epoch": 0.61, - "learning_rate": 1.8474636639442688e-06, - "loss": 0.8467, - "step": 23736 - }, - { - "epoch": 0.61, - "learning_rate": 1.8474489746651518e-06, - "loss": 0.9219, - "step": 23737 - }, - { - "epoch": 0.61, - "learning_rate": 1.847434284737182e-06, - "loss": 0.8584, - "step": 23738 - }, - { - "epoch": 0.61, - "learning_rate": 1.8474195941603709e-06, - "loss": 0.8237, - "step": 23739 - }, - { - "epoch": 0.61, - "learning_rate": 1.8474049029347293e-06, - "loss": 0.8203, - "step": 23740 - }, - { - "epoch": 0.61, - "learning_rate": 1.847390211060269e-06, - "loss": 0.834, - "step": 23741 - }, - { - "epoch": 0.61, - "learning_rate": 1.847375518537001e-06, - "loss": 0.6045, - "step": 23742 - }, - { - "epoch": 0.61, - "learning_rate": 1.8473608253649365e-06, - "loss": 0.6957, - "step": 23743 - }, - { - "epoch": 0.61, - "learning_rate": 1.8473461315440866e-06, - "loss": 0.9043, - "step": 23744 - }, - { - "epoch": 0.61, - "learning_rate": 1.8473314370744628e-06, - "loss": 0.8809, - "step": 23745 - }, - { - "epoch": 0.61, - "learning_rate": 1.8473167419560763e-06, - "loss": 0.7383, - "step": 23746 - }, - { - "epoch": 0.61, - "learning_rate": 1.8473020461889384e-06, - "loss": 0.9297, - "step": 23747 - }, - { - "epoch": 0.61, - "learning_rate": 1.8472873497730601e-06, - "loss": 0.9365, - "step": 23748 - }, - { - "epoch": 0.61, - "learning_rate": 1.8472726527084528e-06, - "loss": 0.7725, - "step": 23749 - }, - { - "epoch": 0.61, - "learning_rate": 1.8472579549951282e-06, - "loss": 0.7324, - "step": 23750 - }, - { - "epoch": 0.61, - "learning_rate": 1.8472432566330966e-06, - "loss": 0.9893, - "step": 23751 - }, - { - "epoch": 0.61, - "learning_rate": 1.8472285576223704e-06, - "loss": 0.8691, - "step": 23752 - }, - { - "epoch": 0.61, - "learning_rate": 1.8472138579629596e-06, - "loss": 0.7944, - "step": 23753 - }, - { - "epoch": 0.61, - "learning_rate": 1.8471991576548764e-06, - "loss": 0.8311, - "step": 23754 - }, - { - "epoch": 0.61, - "learning_rate": 1.847184456698132e-06, - "loss": 0.833, - "step": 23755 - }, - { - "epoch": 0.61, - "learning_rate": 1.8471697550927371e-06, - "loss": 0.8438, - "step": 23756 - }, - { - "epoch": 0.61, - "learning_rate": 1.8471550528387035e-06, - "loss": 0.8271, - "step": 23757 - }, - { - "epoch": 0.61, - "learning_rate": 1.8471403499360421e-06, - "loss": 0.7148, - "step": 23758 - }, - { - "epoch": 0.61, - "learning_rate": 1.8471256463847642e-06, - "loss": 0.5522, - "step": 23759 - }, - { - "epoch": 0.61, - "learning_rate": 1.8471109421848814e-06, - "loss": 0.9092, - "step": 23760 - }, - { - "epoch": 0.61, - "learning_rate": 1.8470962373364043e-06, - "loss": 0.8398, - "step": 23761 - }, - { - "epoch": 0.61, - "learning_rate": 1.847081531839345e-06, - "loss": 0.8652, - "step": 23762 - }, - { - "epoch": 0.61, - "learning_rate": 1.8470668256937142e-06, - "loss": 0.7222, - "step": 23763 - }, - { - "epoch": 0.61, - "learning_rate": 1.8470521188995232e-06, - "loss": 0.9053, - "step": 23764 - }, - { - "epoch": 0.61, - "learning_rate": 1.847037411456783e-06, - "loss": 0.5882, - "step": 23765 - }, - { - "epoch": 0.61, - "learning_rate": 1.8470227033655057e-06, - "loss": 0.9233, - "step": 23766 - }, - { - "epoch": 0.61, - "learning_rate": 1.8470079946257018e-06, - "loss": 0.959, - "step": 23767 - }, - { - "epoch": 0.61, - "learning_rate": 1.846993285237383e-06, - "loss": 1.0752, - "step": 23768 - }, - { - "epoch": 0.61, - "learning_rate": 1.8469785752005604e-06, - "loss": 0.8516, - "step": 23769 - }, - { - "epoch": 0.61, - "learning_rate": 1.8469638645152451e-06, - "loss": 0.7144, - "step": 23770 - }, - { - "epoch": 0.61, - "learning_rate": 1.8469491531814488e-06, - "loss": 0.915, - "step": 23771 - }, - { - "epoch": 0.61, - "learning_rate": 1.846934441199182e-06, - "loss": 0.9043, - "step": 23772 - }, - { - "epoch": 0.61, - "learning_rate": 1.8469197285684568e-06, - "loss": 1.1318, - "step": 23773 - }, - { - "epoch": 0.61, - "learning_rate": 1.846905015289284e-06, - "loss": 0.5453, - "step": 23774 - }, - { - "epoch": 0.61, - "learning_rate": 1.846890301361675e-06, - "loss": 0.5605, - "step": 23775 - }, - { - "epoch": 0.61, - "learning_rate": 1.846875586785641e-06, - "loss": 1.0322, - "step": 23776 - }, - { - "epoch": 0.61, - "learning_rate": 1.8468608715611933e-06, - "loss": 0.9209, - "step": 23777 - }, - { - "epoch": 0.61, - "learning_rate": 1.8468461556883433e-06, - "loss": 1.1152, - "step": 23778 - }, - { - "epoch": 0.61, - "learning_rate": 1.846831439167102e-06, - "loss": 0.8975, - "step": 23779 - }, - { - "epoch": 0.61, - "learning_rate": 1.8468167219974809e-06, - "loss": 0.9326, - "step": 23780 - }, - { - "epoch": 0.61, - "learning_rate": 1.8468020041794913e-06, - "loss": 0.8652, - "step": 23781 - }, - { - "epoch": 0.61, - "learning_rate": 1.846787285713144e-06, - "loss": 1.0117, - "step": 23782 - }, - { - "epoch": 0.61, - "learning_rate": 1.8467725665984509e-06, - "loss": 0.918, - "step": 23783 - }, - { - "epoch": 0.61, - "learning_rate": 1.8467578468354225e-06, - "loss": 0.9316, - "step": 23784 - }, - { - "epoch": 0.61, - "learning_rate": 1.8467431264240708e-06, - "loss": 1.1514, - "step": 23785 - }, - { - "epoch": 0.61, - "learning_rate": 1.846728405364407e-06, - "loss": 0.9863, - "step": 23786 - }, - { - "epoch": 0.61, - "learning_rate": 1.8467136836564423e-06, - "loss": 0.8779, - "step": 23787 - }, - { - "epoch": 0.61, - "learning_rate": 1.8466989613001876e-06, - "loss": 0.7451, - "step": 23788 - }, - { - "epoch": 0.61, - "learning_rate": 1.8466842382956543e-06, - "loss": 0.8535, - "step": 23789 - }, - { - "epoch": 0.61, - "learning_rate": 1.8466695146428544e-06, - "loss": 0.8467, - "step": 23790 - }, - { - "epoch": 0.61, - "learning_rate": 1.846654790341798e-06, - "loss": 0.5918, - "step": 23791 - }, - { - "epoch": 0.61, - "learning_rate": 1.8466400653924973e-06, - "loss": 0.8291, - "step": 23792 - }, - { - "epoch": 0.61, - "learning_rate": 1.8466253397949632e-06, - "loss": 0.7871, - "step": 23793 - }, - { - "epoch": 0.61, - "learning_rate": 1.8466106135492065e-06, - "loss": 1.0269, - "step": 23794 - }, - { - "epoch": 0.61, - "learning_rate": 1.8465958866552396e-06, - "loss": 0.75, - "step": 23795 - }, - { - "epoch": 0.61, - "learning_rate": 1.846581159113073e-06, - "loss": 0.9102, - "step": 23796 - }, - { - "epoch": 0.61, - "learning_rate": 1.8465664309227181e-06, - "loss": 0.8691, - "step": 23797 - }, - { - "epoch": 0.61, - "learning_rate": 1.8465517020841861e-06, - "loss": 0.7842, - "step": 23798 - }, - { - "epoch": 0.61, - "learning_rate": 1.8465369725974887e-06, - "loss": 0.5786, - "step": 23799 - }, - { - "epoch": 0.61, - "learning_rate": 1.8465222424626363e-06, - "loss": 1.002, - "step": 23800 - }, - { - "epoch": 0.61, - "learning_rate": 1.846507511679641e-06, - "loss": 0.7227, - "step": 23801 - }, - { - "epoch": 0.61, - "learning_rate": 1.8464927802485143e-06, - "loss": 0.717, - "step": 23802 - }, - { - "epoch": 0.61, - "learning_rate": 1.8464780481692666e-06, - "loss": 0.8877, - "step": 23803 - }, - { - "epoch": 0.61, - "learning_rate": 1.8464633154419094e-06, - "loss": 0.8418, - "step": 23804 - }, - { - "epoch": 0.61, - "learning_rate": 1.8464485820664545e-06, - "loss": 0.9502, - "step": 23805 - }, - { - "epoch": 0.61, - "learning_rate": 1.8464338480429124e-06, - "loss": 1.3145, - "step": 23806 - }, - { - "epoch": 0.61, - "learning_rate": 1.8464191133712952e-06, - "loss": 0.8652, - "step": 23807 - }, - { - "epoch": 0.61, - "learning_rate": 1.8464043780516135e-06, - "loss": 0.7224, - "step": 23808 - }, - { - "epoch": 0.61, - "learning_rate": 1.846389642083879e-06, - "loss": 0.957, - "step": 23809 - }, - { - "epoch": 0.61, - "learning_rate": 1.8463749054681032e-06, - "loss": 0.7505, - "step": 23810 - }, - { - "epoch": 0.61, - "learning_rate": 1.8463601682042969e-06, - "loss": 0.8711, - "step": 23811 - }, - { - "epoch": 0.61, - "learning_rate": 1.8463454302924714e-06, - "loss": 0.8408, - "step": 23812 - }, - { - "epoch": 0.61, - "learning_rate": 1.8463306917326382e-06, - "loss": 0.833, - "step": 23813 - }, - { - "epoch": 0.61, - "learning_rate": 1.8463159525248083e-06, - "loss": 0.7725, - "step": 23814 - }, - { - "epoch": 0.61, - "learning_rate": 1.8463012126689936e-06, - "loss": 0.9238, - "step": 23815 - }, - { - "epoch": 0.61, - "learning_rate": 1.8462864721652047e-06, - "loss": 1.1191, - "step": 23816 - }, - { - "epoch": 0.61, - "learning_rate": 1.8462717310134533e-06, - "loss": 0.79, - "step": 23817 - }, - { - "epoch": 0.61, - "learning_rate": 1.8462569892137502e-06, - "loss": 0.8936, - "step": 23818 - }, - { - "epoch": 0.61, - "learning_rate": 1.8462422467661076e-06, - "loss": 0.6787, - "step": 23819 - }, - { - "epoch": 0.61, - "learning_rate": 1.846227503670536e-06, - "loss": 1.0586, - "step": 23820 - }, - { - "epoch": 0.61, - "learning_rate": 1.8462127599270467e-06, - "loss": 0.9961, - "step": 23821 - }, - { - "epoch": 0.61, - "learning_rate": 1.846198015535651e-06, - "loss": 1.0156, - "step": 23822 - }, - { - "epoch": 0.61, - "learning_rate": 1.8461832704963612e-06, - "loss": 1.0215, - "step": 23823 - }, - { - "epoch": 0.61, - "learning_rate": 1.8461685248091873e-06, - "loss": 0.6826, - "step": 23824 - }, - { - "epoch": 0.61, - "learning_rate": 1.8461537784741407e-06, - "loss": 0.6343, - "step": 23825 - }, - { - "epoch": 0.61, - "learning_rate": 1.8461390314912336e-06, - "loss": 0.8877, - "step": 23826 - }, - { - "epoch": 0.61, - "learning_rate": 1.8461242838604765e-06, - "loss": 0.9219, - "step": 23827 - }, - { - "epoch": 0.61, - "learning_rate": 1.846109535581881e-06, - "loss": 0.8516, - "step": 23828 - }, - { - "epoch": 0.61, - "learning_rate": 1.8460947866554584e-06, - "loss": 0.8311, - "step": 23829 - }, - { - "epoch": 0.61, - "learning_rate": 1.84608003708122e-06, - "loss": 0.7764, - "step": 23830 - }, - { - "epoch": 0.61, - "learning_rate": 1.8460652868591767e-06, - "loss": 1.0098, - "step": 23831 - }, - { - "epoch": 0.61, - "learning_rate": 1.8460505359893404e-06, - "loss": 0.792, - "step": 23832 - }, - { - "epoch": 0.61, - "learning_rate": 1.8460357844717217e-06, - "loss": 0.8711, - "step": 23833 - }, - { - "epoch": 0.61, - "learning_rate": 1.846021032306333e-06, - "loss": 0.7627, - "step": 23834 - }, - { - "epoch": 0.61, - "learning_rate": 1.8460062794931845e-06, - "loss": 0.7886, - "step": 23835 - }, - { - "epoch": 0.61, - "learning_rate": 1.8459915260322878e-06, - "loss": 0.8828, - "step": 23836 - }, - { - "epoch": 0.61, - "learning_rate": 1.8459767719236546e-06, - "loss": 0.9746, - "step": 23837 - }, - { - "epoch": 0.61, - "learning_rate": 1.8459620171672955e-06, - "loss": 0.9297, - "step": 23838 - }, - { - "epoch": 0.61, - "learning_rate": 1.8459472617632224e-06, - "loss": 0.7842, - "step": 23839 - }, - { - "epoch": 0.61, - "learning_rate": 1.8459325057114463e-06, - "loss": 0.9883, - "step": 23840 - }, - { - "epoch": 0.61, - "learning_rate": 1.8459177490119786e-06, - "loss": 0.8701, - "step": 23841 - }, - { - "epoch": 0.61, - "learning_rate": 1.8459029916648308e-06, - "loss": 0.7266, - "step": 23842 - }, - { - "epoch": 0.61, - "learning_rate": 1.8458882336700134e-06, - "loss": 0.5732, - "step": 23843 - }, - { - "epoch": 0.61, - "learning_rate": 1.8458734750275387e-06, - "loss": 1.1016, - "step": 23844 - }, - { - "epoch": 0.61, - "learning_rate": 1.8458587157374174e-06, - "loss": 0.8789, - "step": 23845 - }, - { - "epoch": 0.61, - "learning_rate": 1.8458439557996612e-06, - "loss": 0.9346, - "step": 23846 - }, - { - "epoch": 0.61, - "learning_rate": 1.8458291952142812e-06, - "loss": 0.8647, - "step": 23847 - }, - { - "epoch": 0.61, - "learning_rate": 1.8458144339812884e-06, - "loss": 0.9258, - "step": 23848 - }, - { - "epoch": 0.61, - "learning_rate": 1.8457996721006945e-06, - "loss": 0.8057, - "step": 23849 - }, - { - "epoch": 0.61, - "learning_rate": 1.8457849095725108e-06, - "loss": 0.7014, - "step": 23850 - }, - { - "epoch": 0.61, - "learning_rate": 1.8457701463967484e-06, - "loss": 0.6836, - "step": 23851 - }, - { - "epoch": 0.61, - "learning_rate": 1.8457553825734188e-06, - "loss": 0.8359, - "step": 23852 - }, - { - "epoch": 0.61, - "learning_rate": 1.8457406181025328e-06, - "loss": 0.8125, - "step": 23853 - }, - { - "epoch": 0.61, - "learning_rate": 1.8457258529841025e-06, - "loss": 0.8887, - "step": 23854 - }, - { - "epoch": 0.61, - "learning_rate": 1.8457110872181386e-06, - "loss": 0.9561, - "step": 23855 - }, - { - "epoch": 0.61, - "learning_rate": 1.8456963208046527e-06, - "loss": 0.8447, - "step": 23856 - }, - { - "epoch": 0.61, - "learning_rate": 1.845681553743656e-06, - "loss": 0.8281, - "step": 23857 - }, - { - "epoch": 0.61, - "learning_rate": 1.8456667860351599e-06, - "loss": 0.9023, - "step": 23858 - }, - { - "epoch": 0.61, - "learning_rate": 1.8456520176791754e-06, - "loss": 0.5925, - "step": 23859 - }, - { - "epoch": 0.61, - "learning_rate": 1.8456372486757142e-06, - "loss": 0.7529, - "step": 23860 - }, - { - "epoch": 0.61, - "learning_rate": 1.8456224790247874e-06, - "loss": 0.9639, - "step": 23861 - }, - { - "epoch": 0.61, - "learning_rate": 1.8456077087264065e-06, - "loss": 0.6323, - "step": 23862 - }, - { - "epoch": 0.61, - "learning_rate": 1.8455929377805824e-06, - "loss": 0.9336, - "step": 23863 - }, - { - "epoch": 0.61, - "learning_rate": 1.8455781661873266e-06, - "loss": 1.0088, - "step": 23864 - }, - { - "epoch": 0.61, - "learning_rate": 1.845563393946651e-06, - "loss": 0.9824, - "step": 23865 - }, - { - "epoch": 0.61, - "learning_rate": 1.8455486210585658e-06, - "loss": 1.0205, - "step": 23866 - }, - { - "epoch": 0.61, - "learning_rate": 1.8455338475230833e-06, - "loss": 0.8877, - "step": 23867 - }, - { - "epoch": 0.61, - "learning_rate": 1.8455190733402142e-06, - "loss": 0.9355, - "step": 23868 - }, - { - "epoch": 0.61, - "learning_rate": 1.84550429850997e-06, - "loss": 0.76, - "step": 23869 - }, - { - "epoch": 0.61, - "learning_rate": 1.8454895230323623e-06, - "loss": 0.9033, - "step": 23870 - }, - { - "epoch": 0.61, - "learning_rate": 1.8454747469074019e-06, - "loss": 1.0049, - "step": 23871 - }, - { - "epoch": 0.61, - "learning_rate": 1.8454599701351005e-06, - "loss": 0.8418, - "step": 23872 - }, - { - "epoch": 0.61, - "learning_rate": 1.8454451927154692e-06, - "loss": 0.9229, - "step": 23873 - }, - { - "epoch": 0.61, - "learning_rate": 1.8454304146485193e-06, - "loss": 0.8892, - "step": 23874 - }, - { - "epoch": 0.61, - "learning_rate": 1.8454156359342625e-06, - "loss": 0.7451, - "step": 23875 - }, - { - "epoch": 0.61, - "learning_rate": 1.8454008565727098e-06, - "loss": 0.708, - "step": 23876 - }, - { - "epoch": 0.61, - "learning_rate": 1.845386076563872e-06, - "loss": 0.835, - "step": 23877 - }, - { - "epoch": 0.61, - "learning_rate": 1.8453712959077615e-06, - "loss": 0.9883, - "step": 23878 - }, - { - "epoch": 0.61, - "learning_rate": 1.8453565146043889e-06, - "loss": 1.0488, - "step": 23879 - }, - { - "epoch": 0.61, - "learning_rate": 1.8453417326537658e-06, - "loss": 0.9297, - "step": 23880 - }, - { - "epoch": 0.61, - "learning_rate": 1.8453269500559032e-06, - "loss": 0.7842, - "step": 23881 - }, - { - "epoch": 0.61, - "learning_rate": 1.8453121668108128e-06, - "loss": 1.1113, - "step": 23882 - }, - { - "epoch": 0.61, - "learning_rate": 1.8452973829185056e-06, - "loss": 0.8604, - "step": 23883 - }, - { - "epoch": 0.61, - "learning_rate": 1.845282598378993e-06, - "loss": 0.8506, - "step": 23884 - }, - { - "epoch": 0.61, - "learning_rate": 1.8452678131922866e-06, - "loss": 0.8965, - "step": 23885 - }, - { - "epoch": 0.61, - "learning_rate": 1.8452530273583973e-06, - "loss": 0.7324, - "step": 23886 - }, - { - "epoch": 0.61, - "learning_rate": 1.8452382408773368e-06, - "loss": 0.6506, - "step": 23887 - }, - { - "epoch": 0.61, - "learning_rate": 1.8452234537491163e-06, - "loss": 0.7578, - "step": 23888 - }, - { - "epoch": 0.61, - "learning_rate": 1.8452086659737467e-06, - "loss": 0.9561, - "step": 23889 - }, - { - "epoch": 0.61, - "learning_rate": 1.8451938775512402e-06, - "loss": 0.8848, - "step": 23890 - }, - { - "epoch": 0.61, - "learning_rate": 1.8451790884816071e-06, - "loss": 1.0361, - "step": 23891 - }, - { - "epoch": 0.61, - "learning_rate": 1.8451642987648595e-06, - "loss": 0.9297, - "step": 23892 - }, - { - "epoch": 0.61, - "learning_rate": 1.8451495084010084e-06, - "loss": 1.0078, - "step": 23893 - }, - { - "epoch": 0.61, - "learning_rate": 1.8451347173900652e-06, - "loss": 0.7969, - "step": 23894 - }, - { - "epoch": 0.61, - "learning_rate": 1.8451199257320411e-06, - "loss": 0.8193, - "step": 23895 - }, - { - "epoch": 0.61, - "learning_rate": 1.8451051334269478e-06, - "loss": 0.7451, - "step": 23896 - }, - { - "epoch": 0.61, - "learning_rate": 1.845090340474796e-06, - "loss": 1.0186, - "step": 23897 - }, - { - "epoch": 0.61, - "learning_rate": 1.8450755468755976e-06, - "loss": 0.8828, - "step": 23898 - }, - { - "epoch": 0.61, - "learning_rate": 1.8450607526293638e-06, - "loss": 0.7544, - "step": 23899 - }, - { - "epoch": 0.61, - "learning_rate": 1.8450459577361058e-06, - "loss": 1.0752, - "step": 23900 - }, - { - "epoch": 0.61, - "learning_rate": 1.8450311621958347e-06, - "loss": 0.7056, - "step": 23901 - }, - { - "epoch": 0.61, - "learning_rate": 1.8450163660085624e-06, - "loss": 0.9609, - "step": 23902 - }, - { - "epoch": 0.61, - "learning_rate": 1.8450015691742999e-06, - "loss": 0.8994, - "step": 23903 - }, - { - "epoch": 0.61, - "learning_rate": 1.8449867716930583e-06, - "loss": 0.9131, - "step": 23904 - }, - { - "epoch": 0.61, - "learning_rate": 1.8449719735648494e-06, - "loss": 0.9033, - "step": 23905 - }, - { - "epoch": 0.61, - "learning_rate": 1.8449571747896844e-06, - "loss": 0.8965, - "step": 23906 - }, - { - "epoch": 0.61, - "learning_rate": 1.8449423753675744e-06, - "loss": 1.0889, - "step": 23907 - }, - { - "epoch": 0.61, - "learning_rate": 1.8449275752985307e-06, - "loss": 0.6511, - "step": 23908 - }, - { - "epoch": 0.61, - "learning_rate": 1.844912774582565e-06, - "loss": 0.8271, - "step": 23909 - }, - { - "epoch": 0.61, - "learning_rate": 1.8448979732196884e-06, - "loss": 0.7524, - "step": 23910 - }, - { - "epoch": 0.61, - "learning_rate": 1.8448831712099125e-06, - "loss": 0.9307, - "step": 23911 - }, - { - "epoch": 0.61, - "learning_rate": 1.8448683685532482e-06, - "loss": 0.8525, - "step": 23912 - }, - { - "epoch": 0.61, - "learning_rate": 1.8448535652497071e-06, - "loss": 0.8652, - "step": 23913 - }, - { - "epoch": 0.61, - "learning_rate": 1.8448387612993002e-06, - "loss": 1.0264, - "step": 23914 - }, - { - "epoch": 0.61, - "learning_rate": 1.8448239567020395e-06, - "loss": 1.0273, - "step": 23915 - }, - { - "epoch": 0.61, - "learning_rate": 1.8448091514579356e-06, - "loss": 0.8594, - "step": 23916 - }, - { - "epoch": 0.61, - "learning_rate": 1.8447943455670005e-06, - "loss": 0.9785, - "step": 23917 - }, - { - "epoch": 0.61, - "learning_rate": 1.8447795390292452e-06, - "loss": 0.9814, - "step": 23918 - }, - { - "epoch": 0.61, - "learning_rate": 1.844764731844681e-06, - "loss": 0.7729, - "step": 23919 - }, - { - "epoch": 0.61, - "learning_rate": 1.8447499240133189e-06, - "loss": 0.7402, - "step": 23920 - }, - { - "epoch": 0.61, - "learning_rate": 1.844735115535171e-06, - "loss": 0.7166, - "step": 23921 - }, - { - "epoch": 0.61, - "learning_rate": 1.8447203064102482e-06, - "loss": 0.9902, - "step": 23922 - }, - { - "epoch": 0.61, - "learning_rate": 1.8447054966385618e-06, - "loss": 0.9766, - "step": 23923 - }, - { - "epoch": 0.61, - "learning_rate": 1.8446906862201233e-06, - "loss": 0.7832, - "step": 23924 - }, - { - "epoch": 0.61, - "learning_rate": 1.844675875154944e-06, - "loss": 0.832, - "step": 23925 - }, - { - "epoch": 0.61, - "learning_rate": 1.8446610634430353e-06, - "loss": 0.8438, - "step": 23926 - }, - { - "epoch": 0.61, - "learning_rate": 1.8446462510844084e-06, - "loss": 0.8118, - "step": 23927 - }, - { - "epoch": 0.61, - "learning_rate": 1.8446314380790748e-06, - "loss": 0.7998, - "step": 23928 - }, - { - "epoch": 0.61, - "learning_rate": 1.8446166244270455e-06, - "loss": 0.9883, - "step": 23929 - }, - { - "epoch": 0.61, - "learning_rate": 1.8446018101283324e-06, - "loss": 0.8584, - "step": 23930 - }, - { - "epoch": 0.61, - "learning_rate": 1.8445869951829462e-06, - "loss": 0.7891, - "step": 23931 - }, - { - "epoch": 0.61, - "learning_rate": 1.844572179590899e-06, - "loss": 1.083, - "step": 23932 - }, - { - "epoch": 0.61, - "learning_rate": 1.844557363352201e-06, - "loss": 0.8398, - "step": 23933 - }, - { - "epoch": 0.61, - "learning_rate": 1.844542546466865e-06, - "loss": 0.8965, - "step": 23934 - }, - { - "epoch": 0.61, - "learning_rate": 1.8445277289349013e-06, - "loss": 0.916, - "step": 23935 - }, - { - "epoch": 0.61, - "learning_rate": 1.8445129107563216e-06, - "loss": 0.8418, - "step": 23936 - }, - { - "epoch": 0.61, - "learning_rate": 1.844498091931137e-06, - "loss": 0.7827, - "step": 23937 - }, - { - "epoch": 0.61, - "learning_rate": 1.8444832724593593e-06, - "loss": 0.9971, - "step": 23938 - }, - { - "epoch": 0.61, - "learning_rate": 1.8444684523409994e-06, - "loss": 0.918, - "step": 23939 - }, - { - "epoch": 0.61, - "learning_rate": 1.8444536315760691e-06, - "loss": 0.8398, - "step": 23940 - }, - { - "epoch": 0.61, - "learning_rate": 1.8444388101645792e-06, - "loss": 0.874, - "step": 23941 - }, - { - "epoch": 0.61, - "learning_rate": 1.8444239881065416e-06, - "loss": 0.9502, - "step": 23942 - }, - { - "epoch": 0.61, - "learning_rate": 1.844409165401967e-06, - "loss": 0.8887, - "step": 23943 - }, - { - "epoch": 0.61, - "learning_rate": 1.8443943420508674e-06, - "loss": 1.0547, - "step": 23944 - }, - { - "epoch": 0.61, - "learning_rate": 1.844379518053254e-06, - "loss": 0.9551, - "step": 23945 - }, - { - "epoch": 0.61, - "learning_rate": 1.8443646934091377e-06, - "loss": 0.7285, - "step": 23946 - }, - { - "epoch": 0.61, - "learning_rate": 1.8443498681185305e-06, - "loss": 0.7427, - "step": 23947 - }, - { - "epoch": 0.61, - "learning_rate": 1.8443350421814433e-06, - "loss": 0.9395, - "step": 23948 - }, - { - "epoch": 0.61, - "learning_rate": 1.8443202155978873e-06, - "loss": 0.6846, - "step": 23949 - }, - { - "epoch": 0.61, - "learning_rate": 1.8443053883678746e-06, - "loss": 0.7588, - "step": 23950 - }, - { - "epoch": 0.61, - "learning_rate": 1.8442905604914158e-06, - "loss": 0.8252, - "step": 23951 - }, - { - "epoch": 0.61, - "learning_rate": 1.8442757319685227e-06, - "loss": 1.001, - "step": 23952 - }, - { - "epoch": 0.61, - "learning_rate": 1.8442609027992062e-06, - "loss": 0.7793, - "step": 23953 - }, - { - "epoch": 0.61, - "learning_rate": 1.8442460729834784e-06, - "loss": 0.79, - "step": 23954 - }, - { - "epoch": 0.61, - "learning_rate": 1.8442312425213497e-06, - "loss": 0.8535, - "step": 23955 - }, - { - "epoch": 0.61, - "learning_rate": 1.8442164114128324e-06, - "loss": 0.7402, - "step": 23956 - }, - { - "epoch": 0.61, - "learning_rate": 1.844201579657937e-06, - "loss": 0.915, - "step": 23957 - }, - { - "epoch": 0.61, - "learning_rate": 1.8441867472566757e-06, - "loss": 1.0098, - "step": 23958 - }, - { - "epoch": 0.61, - "learning_rate": 1.8441719142090592e-06, - "loss": 0.877, - "step": 23959 - }, - { - "epoch": 0.61, - "learning_rate": 1.844157080515099e-06, - "loss": 0.7163, - "step": 23960 - }, - { - "epoch": 0.61, - "learning_rate": 1.8441422461748068e-06, - "loss": 0.8779, - "step": 23961 - }, - { - "epoch": 0.61, - "learning_rate": 1.8441274111881934e-06, - "loss": 0.8848, - "step": 23962 - }, - { - "epoch": 0.61, - "learning_rate": 1.8441125755552706e-06, - "loss": 0.8359, - "step": 23963 - }, - { - "epoch": 0.61, - "learning_rate": 1.8440977392760497e-06, - "loss": 0.8223, - "step": 23964 - }, - { - "epoch": 0.61, - "learning_rate": 1.8440829023505417e-06, - "loss": 0.8389, - "step": 23965 - }, - { - "epoch": 0.61, - "learning_rate": 1.8440680647787583e-06, - "loss": 0.6802, - "step": 23966 - }, - { - "epoch": 0.61, - "learning_rate": 1.8440532265607112e-06, - "loss": 0.9756, - "step": 23967 - }, - { - "epoch": 0.61, - "learning_rate": 1.8440383876964109e-06, - "loss": 0.8452, - "step": 23968 - }, - { - "epoch": 0.61, - "learning_rate": 1.8440235481858694e-06, - "loss": 0.9629, - "step": 23969 - }, - { - "epoch": 0.61, - "learning_rate": 1.844008708029098e-06, - "loss": 0.8052, - "step": 23970 - }, - { - "epoch": 0.61, - "learning_rate": 1.8439938672261075e-06, - "loss": 0.8325, - "step": 23971 - }, - { - "epoch": 0.61, - "learning_rate": 1.8439790257769104e-06, - "loss": 0.8071, - "step": 23972 - }, - { - "epoch": 0.61, - "learning_rate": 1.8439641836815168e-06, - "loss": 0.7057, - "step": 23973 - }, - { - "epoch": 0.61, - "learning_rate": 1.8439493409399388e-06, - "loss": 0.9253, - "step": 23974 - }, - { - "epoch": 0.61, - "learning_rate": 1.8439344975521875e-06, - "loss": 0.6787, - "step": 23975 - }, - { - "epoch": 0.61, - "learning_rate": 1.8439196535182745e-06, - "loss": 0.9453, - "step": 23976 - }, - { - "epoch": 0.61, - "learning_rate": 1.843904808838211e-06, - "loss": 0.7402, - "step": 23977 - }, - { - "epoch": 0.61, - "learning_rate": 1.8438899635120083e-06, - "loss": 0.874, - "step": 23978 - }, - { - "epoch": 0.61, - "learning_rate": 1.843875117539678e-06, - "loss": 1.0215, - "step": 23979 - }, - { - "epoch": 0.61, - "learning_rate": 1.8438602709212313e-06, - "loss": 0.7959, - "step": 23980 - }, - { - "epoch": 0.61, - "learning_rate": 1.8438454236566794e-06, - "loss": 0.7446, - "step": 23981 - }, - { - "epoch": 0.61, - "learning_rate": 1.8438305757460339e-06, - "loss": 0.7256, - "step": 23982 - }, - { - "epoch": 0.61, - "learning_rate": 1.8438157271893064e-06, - "loss": 1.0508, - "step": 23983 - }, - { - "epoch": 0.61, - "learning_rate": 1.8438008779865077e-06, - "loss": 0.8672, - "step": 23984 - }, - { - "epoch": 0.61, - "learning_rate": 1.8437860281376496e-06, - "loss": 0.8223, - "step": 23985 - }, - { - "epoch": 0.61, - "learning_rate": 1.8437711776427434e-06, - "loss": 0.8721, - "step": 23986 - }, - { - "epoch": 0.61, - "learning_rate": 1.8437563265018003e-06, - "loss": 0.8438, - "step": 23987 - }, - { - "epoch": 0.61, - "learning_rate": 1.843741474714832e-06, - "loss": 0.8398, - "step": 23988 - }, - { - "epoch": 0.61, - "learning_rate": 1.8437266222818492e-06, - "loss": 0.833, - "step": 23989 - }, - { - "epoch": 0.61, - "learning_rate": 1.843711769202864e-06, - "loss": 0.8262, - "step": 23990 - }, - { - "epoch": 0.61, - "learning_rate": 1.8436969154778877e-06, - "loss": 0.8555, - "step": 23991 - }, - { - "epoch": 0.61, - "learning_rate": 1.8436820611069312e-06, - "loss": 0.8955, - "step": 23992 - }, - { - "epoch": 0.61, - "learning_rate": 1.8436672060900062e-06, - "loss": 0.876, - "step": 23993 - }, - { - "epoch": 0.61, - "learning_rate": 1.843652350427124e-06, - "loss": 0.876, - "step": 23994 - }, - { - "epoch": 0.62, - "learning_rate": 1.8436374941182959e-06, - "loss": 0.8857, - "step": 23995 - }, - { - "epoch": 0.62, - "learning_rate": 1.8436226371635336e-06, - "loss": 0.9883, - "step": 23996 - }, - { - "epoch": 0.62, - "learning_rate": 1.843607779562848e-06, - "loss": 0.9756, - "step": 23997 - }, - { - "epoch": 0.62, - "learning_rate": 1.8435929213162508e-06, - "loss": 0.7578, - "step": 23998 - }, - { - "epoch": 0.62, - "learning_rate": 1.843578062423753e-06, - "loss": 0.9893, - "step": 23999 - }, - { - "epoch": 0.62, - "learning_rate": 1.8435632028853666e-06, - "loss": 0.9102, - "step": 24000 - }, - { - "epoch": 0.62, - "learning_rate": 1.8435483427011028e-06, - "loss": 0.8403, - "step": 24001 - }, - { - "epoch": 0.62, - "learning_rate": 1.8435334818709727e-06, - "loss": 0.7024, - "step": 24002 - }, - { - "epoch": 0.62, - "learning_rate": 1.8435186203949878e-06, - "loss": 0.8369, - "step": 24003 - }, - { - "epoch": 0.62, - "learning_rate": 1.8435037582731593e-06, - "loss": 0.6826, - "step": 24004 - }, - { - "epoch": 0.62, - "learning_rate": 1.8434888955054987e-06, - "loss": 0.8657, - "step": 24005 - }, - { - "epoch": 0.62, - "learning_rate": 1.8434740320920177e-06, - "loss": 0.8218, - "step": 24006 - }, - { - "epoch": 0.62, - "learning_rate": 1.8434591680327274e-06, - "loss": 1.0127, - "step": 24007 - }, - { - "epoch": 0.62, - "learning_rate": 1.843444303327639e-06, - "loss": 0.8174, - "step": 24008 - }, - { - "epoch": 0.62, - "learning_rate": 1.843429437976764e-06, - "loss": 0.7793, - "step": 24009 - }, - { - "epoch": 0.62, - "learning_rate": 1.8434145719801141e-06, - "loss": 0.9443, - "step": 24010 - }, - { - "epoch": 0.62, - "learning_rate": 1.8433997053377005e-06, - "loss": 1.1689, - "step": 24011 - }, - { - "epoch": 0.62, - "learning_rate": 1.8433848380495345e-06, - "loss": 0.8906, - "step": 24012 - }, - { - "epoch": 0.62, - "learning_rate": 1.8433699701156273e-06, - "loss": 1.1309, - "step": 24013 - }, - { - "epoch": 0.62, - "learning_rate": 1.8433551015359907e-06, - "loss": 0.6279, - "step": 24014 - }, - { - "epoch": 0.62, - "learning_rate": 1.843340232310636e-06, - "loss": 0.6929, - "step": 24015 - }, - { - "epoch": 0.62, - "learning_rate": 1.843325362439574e-06, - "loss": 0.8418, - "step": 24016 - }, - { - "epoch": 0.62, - "learning_rate": 1.8433104919228168e-06, - "loss": 0.6382, - "step": 24017 - }, - { - "epoch": 0.62, - "learning_rate": 1.8432956207603755e-06, - "loss": 0.812, - "step": 24018 - }, - { - "epoch": 0.62, - "learning_rate": 1.8432807489522618e-06, - "loss": 0.7861, - "step": 24019 - }, - { - "epoch": 0.62, - "learning_rate": 1.8432658764984864e-06, - "loss": 0.7197, - "step": 24020 - }, - { - "epoch": 0.62, - "learning_rate": 1.8432510033990614e-06, - "loss": 0.8711, - "step": 24021 - }, - { - "epoch": 0.62, - "learning_rate": 1.8432361296539978e-06, - "loss": 0.8125, - "step": 24022 - }, - { - "epoch": 0.62, - "learning_rate": 1.8432212552633069e-06, - "loss": 0.8105, - "step": 24023 - }, - { - "epoch": 0.62, - "learning_rate": 1.8432063802270004e-06, - "loss": 0.9688, - "step": 24024 - }, - { - "epoch": 0.62, - "learning_rate": 1.8431915045450895e-06, - "loss": 0.8833, - "step": 24025 - }, - { - "epoch": 0.62, - "learning_rate": 1.8431766282175855e-06, - "loss": 0.7744, - "step": 24026 - }, - { - "epoch": 0.62, - "learning_rate": 1.8431617512445001e-06, - "loss": 0.7402, - "step": 24027 - }, - { - "epoch": 0.62, - "learning_rate": 1.8431468736258443e-06, - "loss": 0.5737, - "step": 24028 - }, - { - "epoch": 0.62, - "learning_rate": 1.84313199536163e-06, - "loss": 0.729, - "step": 24029 - }, - { - "epoch": 0.62, - "learning_rate": 1.8431171164518684e-06, - "loss": 1.0859, - "step": 24030 - }, - { - "epoch": 0.62, - "learning_rate": 1.8431022368965704e-06, - "loss": 1.0439, - "step": 24031 - }, - { - "epoch": 0.62, - "learning_rate": 1.843087356695748e-06, - "loss": 0.9062, - "step": 24032 - }, - { - "epoch": 0.62, - "learning_rate": 1.8430724758494125e-06, - "loss": 0.8467, - "step": 24033 - }, - { - "epoch": 0.62, - "learning_rate": 1.843057594357575e-06, - "loss": 0.7334, - "step": 24034 - }, - { - "epoch": 0.62, - "learning_rate": 1.8430427122202469e-06, - "loss": 0.9463, - "step": 24035 - }, - { - "epoch": 0.62, - "learning_rate": 1.8430278294374402e-06, - "loss": 0.6714, - "step": 24036 - }, - { - "epoch": 0.62, - "learning_rate": 1.8430129460091655e-06, - "loss": 0.8379, - "step": 24037 - }, - { - "epoch": 0.62, - "learning_rate": 1.8429980619354346e-06, - "loss": 0.9473, - "step": 24038 - }, - { - "epoch": 0.62, - "learning_rate": 1.842983177216259e-06, - "loss": 1.0244, - "step": 24039 - }, - { - "epoch": 0.62, - "learning_rate": 1.8429682918516497e-06, - "loss": 0.686, - "step": 24040 - }, - { - "epoch": 0.62, - "learning_rate": 1.8429534058416185e-06, - "loss": 0.8447, - "step": 24041 - }, - { - "epoch": 0.62, - "learning_rate": 1.8429385191861768e-06, - "loss": 0.6729, - "step": 24042 - }, - { - "epoch": 0.62, - "learning_rate": 1.8429236318853354e-06, - "loss": 0.6252, - "step": 24043 - }, - { - "epoch": 0.62, - "learning_rate": 1.8429087439391067e-06, - "loss": 0.8125, - "step": 24044 - }, - { - "epoch": 0.62, - "learning_rate": 1.842893855347501e-06, - "loss": 1.0156, - "step": 24045 - }, - { - "epoch": 0.62, - "learning_rate": 1.8428789661105305e-06, - "loss": 0.9463, - "step": 24046 - }, - { - "epoch": 0.62, - "learning_rate": 1.8428640762282064e-06, - "loss": 0.916, - "step": 24047 - }, - { - "epoch": 0.62, - "learning_rate": 1.8428491857005396e-06, - "loss": 0.751, - "step": 24048 - }, - { - "epoch": 0.62, - "learning_rate": 1.8428342945275426e-06, - "loss": 0.9941, - "step": 24049 - }, - { - "epoch": 0.62, - "learning_rate": 1.8428194027092256e-06, - "loss": 0.8389, - "step": 24050 - }, - { - "epoch": 0.62, - "learning_rate": 1.8428045102456006e-06, - "loss": 0.7915, - "step": 24051 - }, - { - "epoch": 0.62, - "learning_rate": 1.8427896171366792e-06, - "loss": 0.7461, - "step": 24052 - }, - { - "epoch": 0.62, - "learning_rate": 1.8427747233824725e-06, - "loss": 0.874, - "step": 24053 - }, - { - "epoch": 0.62, - "learning_rate": 1.8427598289829918e-06, - "loss": 0.8877, - "step": 24054 - }, - { - "epoch": 0.62, - "learning_rate": 1.8427449339382487e-06, - "loss": 0.8633, - "step": 24055 - }, - { - "epoch": 0.62, - "learning_rate": 1.8427300382482544e-06, - "loss": 0.8657, - "step": 24056 - }, - { - "epoch": 0.62, - "learning_rate": 1.8427151419130208e-06, - "loss": 1.1113, - "step": 24057 - }, - { - "epoch": 0.62, - "learning_rate": 1.8427002449325587e-06, - "loss": 0.9248, - "step": 24058 - }, - { - "epoch": 0.62, - "learning_rate": 1.8426853473068799e-06, - "loss": 0.76, - "step": 24059 - }, - { - "epoch": 0.62, - "learning_rate": 1.8426704490359955e-06, - "loss": 1.041, - "step": 24060 - }, - { - "epoch": 0.62, - "learning_rate": 1.8426555501199173e-06, - "loss": 0.6992, - "step": 24061 - }, - { - "epoch": 0.62, - "learning_rate": 1.8426406505586566e-06, - "loss": 0.9805, - "step": 24062 - }, - { - "epoch": 0.62, - "learning_rate": 1.8426257503522242e-06, - "loss": 0.8379, - "step": 24063 - }, - { - "epoch": 0.62, - "learning_rate": 1.8426108495006325e-06, - "loss": 0.6748, - "step": 24064 - }, - { - "epoch": 0.62, - "learning_rate": 1.842595948003892e-06, - "loss": 1.0693, - "step": 24065 - }, - { - "epoch": 0.62, - "learning_rate": 1.8425810458620147e-06, - "loss": 0.9453, - "step": 24066 - }, - { - "epoch": 0.62, - "learning_rate": 1.8425661430750118e-06, - "loss": 0.8809, - "step": 24067 - }, - { - "epoch": 0.62, - "learning_rate": 1.842551239642895e-06, - "loss": 0.8545, - "step": 24068 - }, - { - "epoch": 0.62, - "learning_rate": 1.8425363355656754e-06, - "loss": 0.8789, - "step": 24069 - }, - { - "epoch": 0.62, - "learning_rate": 1.8425214308433644e-06, - "loss": 0.7837, - "step": 24070 - }, - { - "epoch": 0.62, - "learning_rate": 1.8425065254759732e-06, - "loss": 0.6953, - "step": 24071 - }, - { - "epoch": 0.62, - "learning_rate": 1.842491619463514e-06, - "loss": 0.751, - "step": 24072 - }, - { - "epoch": 0.62, - "learning_rate": 1.8424767128059973e-06, - "loss": 0.5405, - "step": 24073 - }, - { - "epoch": 0.62, - "learning_rate": 1.842461805503435e-06, - "loss": 0.9873, - "step": 24074 - }, - { - "epoch": 0.62, - "learning_rate": 1.8424468975558386e-06, - "loss": 0.9502, - "step": 24075 - }, - { - "epoch": 0.62, - "learning_rate": 1.8424319889632191e-06, - "loss": 0.7937, - "step": 24076 - }, - { - "epoch": 0.62, - "learning_rate": 1.8424170797255885e-06, - "loss": 0.7959, - "step": 24077 - }, - { - "epoch": 0.62, - "learning_rate": 1.8424021698429575e-06, - "loss": 0.8672, - "step": 24078 - }, - { - "epoch": 0.62, - "learning_rate": 1.842387259315338e-06, - "loss": 0.7554, - "step": 24079 - }, - { - "epoch": 0.62, - "learning_rate": 1.8423723481427414e-06, - "loss": 0.9746, - "step": 24080 - }, - { - "epoch": 0.62, - "learning_rate": 1.842357436325179e-06, - "loss": 0.9092, - "step": 24081 - }, - { - "epoch": 0.62, - "learning_rate": 1.8423425238626625e-06, - "loss": 0.9785, - "step": 24082 - }, - { - "epoch": 0.62, - "learning_rate": 1.8423276107552026e-06, - "loss": 0.7988, - "step": 24083 - }, - { - "epoch": 0.62, - "learning_rate": 1.8423126970028116e-06, - "loss": 0.6211, - "step": 24084 - }, - { - "epoch": 0.62, - "learning_rate": 1.8422977826055002e-06, - "loss": 0.8711, - "step": 24085 - }, - { - "epoch": 0.62, - "learning_rate": 1.8422828675632802e-06, - "loss": 0.8955, - "step": 24086 - }, - { - "epoch": 0.62, - "learning_rate": 1.8422679518761629e-06, - "loss": 0.7393, - "step": 24087 - }, - { - "epoch": 0.62, - "learning_rate": 1.84225303554416e-06, - "loss": 1.1055, - "step": 24088 - }, - { - "epoch": 0.62, - "learning_rate": 1.8422381185672822e-06, - "loss": 0.9209, - "step": 24089 - }, - { - "epoch": 0.62, - "learning_rate": 1.8422232009455416e-06, - "loss": 0.8672, - "step": 24090 - }, - { - "epoch": 0.62, - "learning_rate": 1.8422082826789497e-06, - "loss": 0.8281, - "step": 24091 - }, - { - "epoch": 0.62, - "learning_rate": 1.8421933637675174e-06, - "loss": 0.4834, - "step": 24092 - }, - { - "epoch": 0.62, - "learning_rate": 1.8421784442112564e-06, - "loss": 0.9102, - "step": 24093 - }, - { - "epoch": 0.62, - "learning_rate": 1.842163524010178e-06, - "loss": 0.9043, - "step": 24094 - }, - { - "epoch": 0.62, - "learning_rate": 1.8421486031642938e-06, - "loss": 0.5576, - "step": 24095 - }, - { - "epoch": 0.62, - "learning_rate": 1.8421336816736152e-06, - "loss": 0.9326, - "step": 24096 - }, - { - "epoch": 0.62, - "learning_rate": 1.8421187595381536e-06, - "loss": 0.9316, - "step": 24097 - }, - { - "epoch": 0.62, - "learning_rate": 1.8421038367579205e-06, - "loss": 0.5676, - "step": 24098 - }, - { - "epoch": 0.62, - "learning_rate": 1.842088913332927e-06, - "loss": 0.8882, - "step": 24099 - }, - { - "epoch": 0.62, - "learning_rate": 1.8420739892631847e-06, - "loss": 0.7666, - "step": 24100 - }, - { - "epoch": 0.62, - "learning_rate": 1.8420590645487048e-06, - "loss": 0.7222, - "step": 24101 - }, - { - "epoch": 0.62, - "learning_rate": 1.8420441391894995e-06, - "loss": 0.7539, - "step": 24102 - }, - { - "epoch": 0.62, - "learning_rate": 1.8420292131855795e-06, - "loss": 1.1328, - "step": 24103 - }, - { - "epoch": 0.62, - "learning_rate": 1.8420142865369565e-06, - "loss": 0.8994, - "step": 24104 - }, - { - "epoch": 0.62, - "learning_rate": 1.8419993592436418e-06, - "loss": 0.957, - "step": 24105 - }, - { - "epoch": 0.62, - "learning_rate": 1.8419844313056472e-06, - "loss": 1.0518, - "step": 24106 - }, - { - "epoch": 0.62, - "learning_rate": 1.8419695027229833e-06, - "loss": 0.9678, - "step": 24107 - }, - { - "epoch": 0.62, - "learning_rate": 1.8419545734956625e-06, - "loss": 0.7451, - "step": 24108 - }, - { - "epoch": 0.62, - "learning_rate": 1.8419396436236956e-06, - "loss": 1.124, - "step": 24109 - }, - { - "epoch": 0.62, - "learning_rate": 1.8419247131070943e-06, - "loss": 0.7412, - "step": 24110 - }, - { - "epoch": 0.62, - "learning_rate": 1.84190978194587e-06, - "loss": 0.9541, - "step": 24111 - }, - { - "epoch": 0.62, - "learning_rate": 1.8418948501400343e-06, - "loss": 0.8447, - "step": 24112 - }, - { - "epoch": 0.62, - "learning_rate": 1.841879917689598e-06, - "loss": 0.8052, - "step": 24113 - }, - { - "epoch": 0.62, - "learning_rate": 1.841864984594573e-06, - "loss": 0.8506, - "step": 24114 - }, - { - "epoch": 0.62, - "learning_rate": 1.8418500508549709e-06, - "loss": 0.5151, - "step": 24115 - }, - { - "epoch": 0.62, - "learning_rate": 1.8418351164708027e-06, - "loss": 0.8428, - "step": 24116 - }, - { - "epoch": 0.62, - "learning_rate": 1.8418201814420804e-06, - "loss": 0.8428, - "step": 24117 - }, - { - "epoch": 0.62, - "learning_rate": 1.841805245768815e-06, - "loss": 0.9463, - "step": 24118 - }, - { - "epoch": 0.62, - "learning_rate": 1.841790309451018e-06, - "loss": 0.8809, - "step": 24119 - }, - { - "epoch": 0.62, - "learning_rate": 1.8417753724887006e-06, - "loss": 0.8252, - "step": 24120 - }, - { - "epoch": 0.62, - "learning_rate": 1.8417604348818747e-06, - "loss": 0.772, - "step": 24121 - }, - { - "epoch": 0.62, - "learning_rate": 1.8417454966305516e-06, - "loss": 0.8584, - "step": 24122 - }, - { - "epoch": 0.62, - "learning_rate": 1.8417305577347427e-06, - "loss": 0.7852, - "step": 24123 - }, - { - "epoch": 0.62, - "learning_rate": 1.8417156181944593e-06, - "loss": 0.8242, - "step": 24124 - }, - { - "epoch": 0.62, - "learning_rate": 1.8417006780097131e-06, - "loss": 0.958, - "step": 24125 - }, - { - "epoch": 0.62, - "learning_rate": 1.8416857371805151e-06, - "loss": 0.9766, - "step": 24126 - }, - { - "epoch": 0.62, - "learning_rate": 1.8416707957068773e-06, - "loss": 0.9219, - "step": 24127 - }, - { - "epoch": 0.62, - "learning_rate": 1.8416558535888106e-06, - "loss": 0.8311, - "step": 24128 - }, - { - "epoch": 0.62, - "learning_rate": 1.841640910826327e-06, - "loss": 0.9189, - "step": 24129 - }, - { - "epoch": 0.62, - "learning_rate": 1.8416259674194375e-06, - "loss": 1.0684, - "step": 24130 - }, - { - "epoch": 0.62, - "learning_rate": 1.841611023368154e-06, - "loss": 0.958, - "step": 24131 - }, - { - "epoch": 0.62, - "learning_rate": 1.841596078672487e-06, - "loss": 0.75, - "step": 24132 - }, - { - "epoch": 0.62, - "learning_rate": 1.8415811333324491e-06, - "loss": 0.9893, - "step": 24133 - }, - { - "epoch": 0.62, - "learning_rate": 1.8415661873480513e-06, - "loss": 0.9229, - "step": 24134 - }, - { - "epoch": 0.62, - "learning_rate": 1.8415512407193048e-06, - "loss": 0.7363, - "step": 24135 - }, - { - "epoch": 0.62, - "learning_rate": 1.841536293446221e-06, - "loss": 1.0088, - "step": 24136 - }, - { - "epoch": 0.62, - "learning_rate": 1.8415213455288119e-06, - "loss": 0.9648, - "step": 24137 - }, - { - "epoch": 0.62, - "learning_rate": 1.8415063969670884e-06, - "loss": 0.6465, - "step": 24138 - }, - { - "epoch": 0.62, - "learning_rate": 1.8414914477610621e-06, - "loss": 0.9082, - "step": 24139 - }, - { - "epoch": 0.62, - "learning_rate": 1.8414764979107447e-06, - "loss": 0.7881, - "step": 24140 - }, - { - "epoch": 0.62, - "learning_rate": 1.8414615474161473e-06, - "loss": 0.9111, - "step": 24141 - }, - { - "epoch": 0.62, - "learning_rate": 1.8414465962772812e-06, - "loss": 0.9854, - "step": 24142 - }, - { - "epoch": 0.62, - "learning_rate": 1.8414316444941585e-06, - "loss": 0.9932, - "step": 24143 - }, - { - "epoch": 0.62, - "learning_rate": 1.84141669206679e-06, - "loss": 1.0566, - "step": 24144 - }, - { - "epoch": 0.62, - "learning_rate": 1.841401738995188e-06, - "loss": 0.79, - "step": 24145 - }, - { - "epoch": 0.62, - "learning_rate": 1.8413867852793628e-06, - "loss": 0.9297, - "step": 24146 - }, - { - "epoch": 0.62, - "learning_rate": 1.8413718309193267e-06, - "loss": 0.9023, - "step": 24147 - }, - { - "epoch": 0.62, - "learning_rate": 1.8413568759150908e-06, - "loss": 0.9805, - "step": 24148 - }, - { - "epoch": 0.62, - "learning_rate": 1.8413419202666666e-06, - "loss": 1.0098, - "step": 24149 - }, - { - "epoch": 0.62, - "learning_rate": 1.8413269639740656e-06, - "loss": 0.9717, - "step": 24150 - }, - { - "epoch": 0.62, - "learning_rate": 1.8413120070372994e-06, - "loss": 0.8447, - "step": 24151 - }, - { - "epoch": 0.62, - "learning_rate": 1.8412970494563789e-06, - "loss": 1.0781, - "step": 24152 - }, - { - "epoch": 0.62, - "learning_rate": 1.8412820912313162e-06, - "loss": 1.0361, - "step": 24153 - }, - { - "epoch": 0.62, - "learning_rate": 1.8412671323621225e-06, - "loss": 0.9238, - "step": 24154 - }, - { - "epoch": 0.62, - "learning_rate": 1.8412521728488094e-06, - "loss": 0.8452, - "step": 24155 - }, - { - "epoch": 0.62, - "learning_rate": 1.8412372126913878e-06, - "loss": 0.8115, - "step": 24156 - }, - { - "epoch": 0.62, - "learning_rate": 1.8412222518898697e-06, - "loss": 0.9678, - "step": 24157 - }, - { - "epoch": 0.62, - "learning_rate": 1.8412072904442665e-06, - "loss": 0.7192, - "step": 24158 - }, - { - "epoch": 0.62, - "learning_rate": 1.8411923283545893e-06, - "loss": 0.8623, - "step": 24159 - }, - { - "epoch": 0.62, - "learning_rate": 1.84117736562085e-06, - "loss": 1.0059, - "step": 24160 - }, - { - "epoch": 0.62, - "learning_rate": 1.84116240224306e-06, - "loss": 0.9131, - "step": 24161 - }, - { - "epoch": 0.62, - "learning_rate": 1.8411474382212304e-06, - "loss": 0.9189, - "step": 24162 - }, - { - "epoch": 0.62, - "learning_rate": 1.841132473555373e-06, - "loss": 0.8096, - "step": 24163 - }, - { - "epoch": 0.62, - "learning_rate": 1.841117508245499e-06, - "loss": 1.0078, - "step": 24164 - }, - { - "epoch": 0.62, - "learning_rate": 1.8411025422916203e-06, - "loss": 0.7783, - "step": 24165 - }, - { - "epoch": 0.62, - "learning_rate": 1.8410875756937477e-06, - "loss": 0.9551, - "step": 24166 - }, - { - "epoch": 0.62, - "learning_rate": 1.8410726084518933e-06, - "loss": 0.6167, - "step": 24167 - }, - { - "epoch": 0.62, - "learning_rate": 1.841057640566068e-06, - "loss": 0.9062, - "step": 24168 - }, - { - "epoch": 0.62, - "learning_rate": 1.8410426720362837e-06, - "loss": 0.7661, - "step": 24169 - }, - { - "epoch": 0.62, - "learning_rate": 1.8410277028625516e-06, - "loss": 0.8916, - "step": 24170 - }, - { - "epoch": 0.62, - "learning_rate": 1.8410127330448834e-06, - "loss": 0.8809, - "step": 24171 - }, - { - "epoch": 0.62, - "learning_rate": 1.8409977625832904e-06, - "loss": 0.9604, - "step": 24172 - }, - { - "epoch": 0.62, - "learning_rate": 1.840982791477784e-06, - "loss": 0.8037, - "step": 24173 - }, - { - "epoch": 0.62, - "learning_rate": 1.840967819728376e-06, - "loss": 0.9131, - "step": 24174 - }, - { - "epoch": 0.62, - "learning_rate": 1.8409528473350773e-06, - "loss": 0.791, - "step": 24175 - }, - { - "epoch": 0.62, - "learning_rate": 1.8409378742979e-06, - "loss": 0.9844, - "step": 24176 - }, - { - "epoch": 0.62, - "learning_rate": 1.840922900616855e-06, - "loss": 0.6982, - "step": 24177 - }, - { - "epoch": 0.62, - "learning_rate": 1.8409079262919538e-06, - "loss": 1.0742, - "step": 24178 - }, - { - "epoch": 0.62, - "learning_rate": 1.8408929513232083e-06, - "loss": 0.6924, - "step": 24179 - }, - { - "epoch": 0.62, - "learning_rate": 1.8408779757106298e-06, - "loss": 0.6636, - "step": 24180 - }, - { - "epoch": 0.62, - "learning_rate": 1.8408629994542296e-06, - "loss": 0.4438, - "step": 24181 - }, - { - "epoch": 0.62, - "learning_rate": 1.8408480225540192e-06, - "loss": 0.8398, - "step": 24182 - }, - { - "epoch": 0.62, - "learning_rate": 1.8408330450100102e-06, - "loss": 1.0596, - "step": 24183 - }, - { - "epoch": 0.62, - "learning_rate": 1.8408180668222144e-06, - "loss": 0.8104, - "step": 24184 - }, - { - "epoch": 0.62, - "learning_rate": 1.8408030879906424e-06, - "loss": 0.6152, - "step": 24185 - }, - { - "epoch": 0.62, - "learning_rate": 1.8407881085153063e-06, - "loss": 1.1191, - "step": 24186 - }, - { - "epoch": 0.62, - "learning_rate": 1.8407731283962172e-06, - "loss": 0.7095, - "step": 24187 - }, - { - "epoch": 0.62, - "learning_rate": 1.8407581476333868e-06, - "loss": 0.9409, - "step": 24188 - }, - { - "epoch": 0.62, - "learning_rate": 1.8407431662268266e-06, - "loss": 0.8555, - "step": 24189 - }, - { - "epoch": 0.62, - "learning_rate": 1.840728184176548e-06, - "loss": 0.8867, - "step": 24190 - }, - { - "epoch": 0.62, - "learning_rate": 1.8407132014825629e-06, - "loss": 0.6929, - "step": 24191 - }, - { - "epoch": 0.62, - "learning_rate": 1.8406982181448817e-06, - "loss": 0.8223, - "step": 24192 - }, - { - "epoch": 0.62, - "learning_rate": 1.840683234163517e-06, - "loss": 0.7661, - "step": 24193 - }, - { - "epoch": 0.62, - "learning_rate": 1.8406682495384795e-06, - "loss": 0.915, - "step": 24194 - }, - { - "epoch": 0.62, - "learning_rate": 1.8406532642697811e-06, - "loss": 0.7559, - "step": 24195 - }, - { - "epoch": 0.62, - "learning_rate": 1.8406382783574334e-06, - "loss": 0.9512, - "step": 24196 - }, - { - "epoch": 0.62, - "learning_rate": 1.8406232918014472e-06, - "loss": 0.918, - "step": 24197 - }, - { - "epoch": 0.62, - "learning_rate": 1.8406083046018348e-06, - "loss": 0.79, - "step": 24198 - }, - { - "epoch": 0.62, - "learning_rate": 1.840593316758607e-06, - "loss": 0.8691, - "step": 24199 - }, - { - "epoch": 0.62, - "learning_rate": 1.8405783282717758e-06, - "loss": 0.9385, - "step": 24200 - }, - { - "epoch": 0.62, - "learning_rate": 1.8405633391413521e-06, - "loss": 0.7655, - "step": 24201 - }, - { - "epoch": 0.62, - "learning_rate": 1.840548349367348e-06, - "loss": 1.0654, - "step": 24202 - }, - { - "epoch": 0.62, - "learning_rate": 1.8405333589497745e-06, - "loss": 0.8125, - "step": 24203 - }, - { - "epoch": 0.62, - "learning_rate": 1.8405183678886433e-06, - "loss": 0.5774, - "step": 24204 - }, - { - "epoch": 0.62, - "learning_rate": 1.8405033761839658e-06, - "loss": 1.0391, - "step": 24205 - }, - { - "epoch": 0.62, - "learning_rate": 1.8404883838357535e-06, - "loss": 0.6519, - "step": 24206 - }, - { - "epoch": 0.62, - "learning_rate": 1.8404733908440178e-06, - "loss": 0.771, - "step": 24207 - }, - { - "epoch": 0.62, - "learning_rate": 1.8404583972087707e-06, - "loss": 0.9229, - "step": 24208 - }, - { - "epoch": 0.62, - "learning_rate": 1.8404434029300226e-06, - "loss": 0.7568, - "step": 24209 - }, - { - "epoch": 0.62, - "learning_rate": 1.8404284080077858e-06, - "loss": 0.5801, - "step": 24210 - }, - { - "epoch": 0.62, - "learning_rate": 1.8404134124420721e-06, - "loss": 0.7109, - "step": 24211 - }, - { - "epoch": 0.62, - "learning_rate": 1.840398416232892e-06, - "loss": 0.7705, - "step": 24212 - }, - { - "epoch": 0.62, - "learning_rate": 1.8403834193802577e-06, - "loss": 0.7959, - "step": 24213 - }, - { - "epoch": 0.62, - "learning_rate": 1.8403684218841805e-06, - "loss": 0.9922, - "step": 24214 - }, - { - "epoch": 0.62, - "learning_rate": 1.8403534237446717e-06, - "loss": 0.6833, - "step": 24215 - }, - { - "epoch": 0.62, - "learning_rate": 1.840338424961743e-06, - "loss": 0.9385, - "step": 24216 - }, - { - "epoch": 0.62, - "learning_rate": 1.8403234255354056e-06, - "loss": 0.7178, - "step": 24217 - }, - { - "epoch": 0.62, - "learning_rate": 1.8403084254656716e-06, - "loss": 0.8198, - "step": 24218 - }, - { - "epoch": 0.62, - "learning_rate": 1.8402934247525518e-06, - "loss": 0.9404, - "step": 24219 - }, - { - "epoch": 0.62, - "learning_rate": 1.840278423396058e-06, - "loss": 0.7266, - "step": 24220 - }, - { - "epoch": 0.62, - "learning_rate": 1.8402634213962015e-06, - "loss": 0.7329, - "step": 24221 - }, - { - "epoch": 0.62, - "learning_rate": 1.8402484187529944e-06, - "loss": 0.9844, - "step": 24222 - }, - { - "epoch": 0.62, - "learning_rate": 1.8402334154664474e-06, - "loss": 1.0137, - "step": 24223 - }, - { - "epoch": 0.62, - "learning_rate": 1.8402184115365725e-06, - "loss": 0.9287, - "step": 24224 - }, - { - "epoch": 0.62, - "learning_rate": 1.8402034069633806e-06, - "loss": 0.6816, - "step": 24225 - }, - { - "epoch": 0.62, - "learning_rate": 1.840188401746884e-06, - "loss": 0.8232, - "step": 24226 - }, - { - "epoch": 0.62, - "learning_rate": 1.8401733958870933e-06, - "loss": 0.7842, - "step": 24227 - }, - { - "epoch": 0.62, - "learning_rate": 1.8401583893840207e-06, - "loss": 0.7373, - "step": 24228 - }, - { - "epoch": 0.62, - "learning_rate": 1.8401433822376777e-06, - "loss": 0.7002, - "step": 24229 - }, - { - "epoch": 0.62, - "learning_rate": 1.8401283744480751e-06, - "loss": 1.043, - "step": 24230 - }, - { - "epoch": 0.62, - "learning_rate": 1.8401133660152252e-06, - "loss": 0.6255, - "step": 24231 - }, - { - "epoch": 0.62, - "learning_rate": 1.8400983569391388e-06, - "loss": 0.9053, - "step": 24232 - }, - { - "epoch": 0.62, - "learning_rate": 1.8400833472198284e-06, - "loss": 0.7271, - "step": 24233 - }, - { - "epoch": 0.62, - "learning_rate": 1.840068336857304e-06, - "loss": 0.8643, - "step": 24234 - }, - { - "epoch": 0.62, - "learning_rate": 1.8400533258515783e-06, - "loss": 0.7578, - "step": 24235 - }, - { - "epoch": 0.62, - "learning_rate": 1.8400383142026624e-06, - "loss": 0.9414, - "step": 24236 - }, - { - "epoch": 0.62, - "learning_rate": 1.8400233019105675e-06, - "loss": 0.9189, - "step": 24237 - }, - { - "epoch": 0.62, - "learning_rate": 1.8400082889753057e-06, - "loss": 0.7969, - "step": 24238 - }, - { - "epoch": 0.62, - "learning_rate": 1.8399932753968881e-06, - "loss": 0.875, - "step": 24239 - }, - { - "epoch": 0.62, - "learning_rate": 1.839978261175326e-06, - "loss": 1.1123, - "step": 24240 - }, - { - "epoch": 0.62, - "learning_rate": 1.8399632463106316e-06, - "loss": 0.8975, - "step": 24241 - }, - { - "epoch": 0.62, - "learning_rate": 1.8399482308028157e-06, - "loss": 1.0078, - "step": 24242 - }, - { - "epoch": 0.62, - "learning_rate": 1.8399332146518903e-06, - "loss": 0.6758, - "step": 24243 - }, - { - "epoch": 0.62, - "learning_rate": 1.8399181978578665e-06, - "loss": 0.6562, - "step": 24244 - }, - { - "epoch": 0.62, - "learning_rate": 1.8399031804207558e-06, - "loss": 0.7939, - "step": 24245 - }, - { - "epoch": 0.62, - "learning_rate": 1.83988816234057e-06, - "loss": 0.7441, - "step": 24246 - }, - { - "epoch": 0.62, - "learning_rate": 1.8398731436173204e-06, - "loss": 0.6924, - "step": 24247 - }, - { - "epoch": 0.62, - "learning_rate": 1.8398581242510187e-06, - "loss": 0.8579, - "step": 24248 - }, - { - "epoch": 0.62, - "learning_rate": 1.8398431042416763e-06, - "loss": 0.7178, - "step": 24249 - }, - { - "epoch": 0.62, - "learning_rate": 1.8398280835893046e-06, - "loss": 0.8896, - "step": 24250 - }, - { - "epoch": 0.62, - "learning_rate": 1.839813062293915e-06, - "loss": 0.7188, - "step": 24251 - }, - { - "epoch": 0.62, - "learning_rate": 1.8397980403555192e-06, - "loss": 1.1348, - "step": 24252 - }, - { - "epoch": 0.62, - "learning_rate": 1.8397830177741287e-06, - "loss": 0.9785, - "step": 24253 - }, - { - "epoch": 0.62, - "learning_rate": 1.8397679945497548e-06, - "loss": 1.0059, - "step": 24254 - }, - { - "epoch": 0.62, - "learning_rate": 1.8397529706824094e-06, - "loss": 0.8877, - "step": 24255 - }, - { - "epoch": 0.62, - "learning_rate": 1.8397379461721037e-06, - "loss": 0.811, - "step": 24256 - }, - { - "epoch": 0.62, - "learning_rate": 1.8397229210188492e-06, - "loss": 0.8047, - "step": 24257 - }, - { - "epoch": 0.62, - "learning_rate": 1.8397078952226575e-06, - "loss": 0.9102, - "step": 24258 - }, - { - "epoch": 0.62, - "learning_rate": 1.83969286878354e-06, - "loss": 0.9092, - "step": 24259 - }, - { - "epoch": 0.62, - "learning_rate": 1.8396778417015084e-06, - "loss": 0.9482, - "step": 24260 - }, - { - "epoch": 0.62, - "learning_rate": 1.8396628139765742e-06, - "loss": 1.0947, - "step": 24261 - }, - { - "epoch": 0.62, - "learning_rate": 1.8396477856087485e-06, - "loss": 0.6851, - "step": 24262 - }, - { - "epoch": 0.62, - "learning_rate": 1.8396327565980431e-06, - "loss": 0.8267, - "step": 24263 - }, - { - "epoch": 0.62, - "learning_rate": 1.8396177269444698e-06, - "loss": 0.8428, - "step": 24264 - }, - { - "epoch": 0.62, - "learning_rate": 1.8396026966480397e-06, - "loss": 0.9229, - "step": 24265 - }, - { - "epoch": 0.62, - "learning_rate": 1.8395876657087643e-06, - "loss": 0.7703, - "step": 24266 - }, - { - "epoch": 0.62, - "learning_rate": 1.8395726341266553e-06, - "loss": 0.8975, - "step": 24267 - }, - { - "epoch": 0.62, - "learning_rate": 1.8395576019017241e-06, - "loss": 1.1133, - "step": 24268 - }, - { - "epoch": 0.62, - "learning_rate": 1.8395425690339824e-06, - "loss": 0.8857, - "step": 24269 - }, - { - "epoch": 0.62, - "learning_rate": 1.8395275355234413e-06, - "loss": 0.8286, - "step": 24270 - }, - { - "epoch": 0.62, - "learning_rate": 1.839512501370113e-06, - "loss": 0.8232, - "step": 24271 - }, - { - "epoch": 0.62, - "learning_rate": 1.839497466574008e-06, - "loss": 0.7427, - "step": 24272 - }, - { - "epoch": 0.62, - "learning_rate": 1.8394824311351386e-06, - "loss": 1.0352, - "step": 24273 - }, - { - "epoch": 0.62, - "learning_rate": 1.8394673950535165e-06, - "loss": 0.8877, - "step": 24274 - }, - { - "epoch": 0.62, - "learning_rate": 1.8394523583291525e-06, - "loss": 0.8096, - "step": 24275 - }, - { - "epoch": 0.62, - "learning_rate": 1.8394373209620583e-06, - "loss": 0.8057, - "step": 24276 - }, - { - "epoch": 0.62, - "learning_rate": 1.8394222829522455e-06, - "loss": 0.665, - "step": 24277 - }, - { - "epoch": 0.62, - "learning_rate": 1.839407244299726e-06, - "loss": 0.7705, - "step": 24278 - }, - { - "epoch": 0.62, - "learning_rate": 1.8393922050045108e-06, - "loss": 0.7725, - "step": 24279 - }, - { - "epoch": 0.62, - "learning_rate": 1.8393771650666117e-06, - "loss": 0.7041, - "step": 24280 - }, - { - "epoch": 0.62, - "learning_rate": 1.8393621244860397e-06, - "loss": 0.9443, - "step": 24281 - }, - { - "epoch": 0.62, - "learning_rate": 1.8393470832628071e-06, - "loss": 0.8545, - "step": 24282 - }, - { - "epoch": 0.62, - "learning_rate": 1.8393320413969251e-06, - "loss": 0.9482, - "step": 24283 - }, - { - "epoch": 0.62, - "learning_rate": 1.839316998888405e-06, - "loss": 0.8281, - "step": 24284 - }, - { - "epoch": 0.62, - "learning_rate": 1.8393019557372582e-06, - "loss": 0.9824, - "step": 24285 - }, - { - "epoch": 0.62, - "learning_rate": 1.8392869119434968e-06, - "loss": 0.7573, - "step": 24286 - }, - { - "epoch": 0.62, - "learning_rate": 1.839271867507132e-06, - "loss": 0.7029, - "step": 24287 - }, - { - "epoch": 0.62, - "learning_rate": 1.8392568224281753e-06, - "loss": 0.8657, - "step": 24288 - }, - { - "epoch": 0.62, - "learning_rate": 1.8392417767066381e-06, - "loss": 1.0645, - "step": 24289 - }, - { - "epoch": 0.62, - "learning_rate": 1.8392267303425322e-06, - "loss": 0.6738, - "step": 24290 - }, - { - "epoch": 0.62, - "learning_rate": 1.839211683335869e-06, - "loss": 0.8975, - "step": 24291 - }, - { - "epoch": 0.62, - "learning_rate": 1.83919663568666e-06, - "loss": 0.9062, - "step": 24292 - }, - { - "epoch": 0.62, - "learning_rate": 1.8391815873949165e-06, - "loss": 1.1279, - "step": 24293 - }, - { - "epoch": 0.62, - "learning_rate": 1.8391665384606505e-06, - "loss": 0.8545, - "step": 24294 - }, - { - "epoch": 0.62, - "learning_rate": 1.839151488883873e-06, - "loss": 1.0117, - "step": 24295 - }, - { - "epoch": 0.62, - "learning_rate": 1.839136438664596e-06, - "loss": 0.9736, - "step": 24296 - }, - { - "epoch": 0.62, - "learning_rate": 1.8391213878028308e-06, - "loss": 0.8887, - "step": 24297 - }, - { - "epoch": 0.62, - "learning_rate": 1.839106336298589e-06, - "loss": 0.7725, - "step": 24298 - }, - { - "epoch": 0.62, - "learning_rate": 1.839091284151882e-06, - "loss": 1.0625, - "step": 24299 - }, - { - "epoch": 0.62, - "learning_rate": 1.8390762313627213e-06, - "loss": 0.7715, - "step": 24300 - }, - { - "epoch": 0.62, - "learning_rate": 1.8390611779311187e-06, - "loss": 0.9023, - "step": 24301 - }, - { - "epoch": 0.62, - "learning_rate": 1.8390461238570853e-06, - "loss": 0.9131, - "step": 24302 - }, - { - "epoch": 0.62, - "learning_rate": 1.839031069140633e-06, - "loss": 0.8418, - "step": 24303 - }, - { - "epoch": 0.62, - "learning_rate": 1.8390160137817731e-06, - "loss": 0.6846, - "step": 24304 - }, - { - "epoch": 0.62, - "learning_rate": 1.8390009577805174e-06, - "loss": 0.7598, - "step": 24305 - }, - { - "epoch": 0.62, - "learning_rate": 1.8389859011368772e-06, - "loss": 0.8154, - "step": 24306 - }, - { - "epoch": 0.62, - "learning_rate": 1.838970843850864e-06, - "loss": 0.8691, - "step": 24307 - }, - { - "epoch": 0.62, - "learning_rate": 1.8389557859224893e-06, - "loss": 0.9365, - "step": 24308 - }, - { - "epoch": 0.62, - "learning_rate": 1.838940727351765e-06, - "loss": 0.8896, - "step": 24309 - }, - { - "epoch": 0.62, - "learning_rate": 1.8389256681387019e-06, - "loss": 0.958, - "step": 24310 - }, - { - "epoch": 0.62, - "learning_rate": 1.8389106082833124e-06, - "loss": 1.0361, - "step": 24311 - }, - { - "epoch": 0.62, - "learning_rate": 1.8388955477856073e-06, - "loss": 0.6885, - "step": 24312 - }, - { - "epoch": 0.62, - "learning_rate": 1.838880486645599e-06, - "loss": 0.8887, - "step": 24313 - }, - { - "epoch": 0.62, - "learning_rate": 1.838865424863298e-06, - "loss": 0.9893, - "step": 24314 - }, - { - "epoch": 0.62, - "learning_rate": 1.8388503624387167e-06, - "loss": 0.8335, - "step": 24315 - }, - { - "epoch": 0.62, - "learning_rate": 1.8388352993718658e-06, - "loss": 0.7241, - "step": 24316 - }, - { - "epoch": 0.62, - "learning_rate": 1.8388202356627577e-06, - "loss": 0.8281, - "step": 24317 - }, - { - "epoch": 0.62, - "learning_rate": 1.8388051713114033e-06, - "loss": 0.7695, - "step": 24318 - }, - { - "epoch": 0.62, - "learning_rate": 1.8387901063178142e-06, - "loss": 0.7476, - "step": 24319 - }, - { - "epoch": 0.62, - "learning_rate": 1.838775040682002e-06, - "loss": 0.7271, - "step": 24320 - }, - { - "epoch": 0.62, - "learning_rate": 1.8387599744039788e-06, - "loss": 0.915, - "step": 24321 - }, - { - "epoch": 0.62, - "learning_rate": 1.8387449074837554e-06, - "loss": 0.9385, - "step": 24322 - }, - { - "epoch": 0.62, - "learning_rate": 1.8387298399213438e-06, - "loss": 0.9453, - "step": 24323 - }, - { - "epoch": 0.62, - "learning_rate": 1.8387147717167548e-06, - "loss": 0.8862, - "step": 24324 - }, - { - "epoch": 0.62, - "learning_rate": 1.838699702870001e-06, - "loss": 0.8428, - "step": 24325 - }, - { - "epoch": 0.62, - "learning_rate": 1.838684633381093e-06, - "loss": 0.8975, - "step": 24326 - }, - { - "epoch": 0.62, - "learning_rate": 1.8386695632500432e-06, - "loss": 0.8643, - "step": 24327 - }, - { - "epoch": 0.62, - "learning_rate": 1.8386544924768623e-06, - "loss": 0.7153, - "step": 24328 - }, - { - "epoch": 0.62, - "learning_rate": 1.8386394210615624e-06, - "loss": 0.5708, - "step": 24329 - }, - { - "epoch": 0.62, - "learning_rate": 1.8386243490041547e-06, - "loss": 0.8281, - "step": 24330 - }, - { - "epoch": 0.62, - "learning_rate": 1.8386092763046511e-06, - "loss": 0.9629, - "step": 24331 - }, - { - "epoch": 0.62, - "learning_rate": 1.8385942029630627e-06, - "loss": 0.9727, - "step": 24332 - }, - { - "epoch": 0.62, - "learning_rate": 1.8385791289794015e-06, - "loss": 0.9014, - "step": 24333 - }, - { - "epoch": 0.62, - "learning_rate": 1.8385640543536787e-06, - "loss": 0.9561, - "step": 24334 - }, - { - "epoch": 0.62, - "learning_rate": 1.8385489790859058e-06, - "loss": 0.9922, - "step": 24335 - }, - { - "epoch": 0.62, - "learning_rate": 1.8385339031760949e-06, - "loss": 0.8496, - "step": 24336 - }, - { - "epoch": 0.62, - "learning_rate": 1.838518826624257e-06, - "loss": 0.918, - "step": 24337 - }, - { - "epoch": 0.62, - "learning_rate": 1.8385037494304037e-06, - "loss": 1.0918, - "step": 24338 - }, - { - "epoch": 0.62, - "learning_rate": 1.8384886715945468e-06, - "loss": 0.9258, - "step": 24339 - }, - { - "epoch": 0.62, - "learning_rate": 1.8384735931166975e-06, - "loss": 0.6108, - "step": 24340 - }, - { - "epoch": 0.62, - "learning_rate": 1.8384585139968674e-06, - "loss": 0.8398, - "step": 24341 - }, - { - "epoch": 0.62, - "learning_rate": 1.8384434342350684e-06, - "loss": 0.8779, - "step": 24342 - }, - { - "epoch": 0.62, - "learning_rate": 1.8384283538313117e-06, - "loss": 0.8027, - "step": 24343 - }, - { - "epoch": 0.62, - "learning_rate": 1.838413272785609e-06, - "loss": 0.7549, - "step": 24344 - }, - { - "epoch": 0.62, - "learning_rate": 1.8383981910979718e-06, - "loss": 0.7129, - "step": 24345 - }, - { - "epoch": 0.62, - "learning_rate": 1.8383831087684117e-06, - "loss": 0.9736, - "step": 24346 - }, - { - "epoch": 0.62, - "learning_rate": 1.83836802579694e-06, - "loss": 0.751, - "step": 24347 - }, - { - "epoch": 0.62, - "learning_rate": 1.8383529421835688e-06, - "loss": 0.7532, - "step": 24348 - }, - { - "epoch": 0.62, - "learning_rate": 1.8383378579283094e-06, - "loss": 0.8701, - "step": 24349 - }, - { - "epoch": 0.62, - "learning_rate": 1.8383227730311725e-06, - "loss": 0.8564, - "step": 24350 - }, - { - "epoch": 0.62, - "learning_rate": 1.8383076874921711e-06, - "loss": 0.959, - "step": 24351 - }, - { - "epoch": 0.62, - "learning_rate": 1.8382926013113157e-06, - "loss": 0.7412, - "step": 24352 - }, - { - "epoch": 0.62, - "learning_rate": 1.8382775144886184e-06, - "loss": 0.876, - "step": 24353 - }, - { - "epoch": 0.62, - "learning_rate": 1.8382624270240905e-06, - "loss": 0.8555, - "step": 24354 - }, - { - "epoch": 0.62, - "learning_rate": 1.8382473389177435e-06, - "loss": 0.8682, - "step": 24355 - }, - { - "epoch": 0.62, - "learning_rate": 1.8382322501695895e-06, - "loss": 0.8965, - "step": 24356 - }, - { - "epoch": 0.62, - "learning_rate": 1.838217160779639e-06, - "loss": 0.9854, - "step": 24357 - }, - { - "epoch": 0.62, - "learning_rate": 1.8382020707479046e-06, - "loss": 0.7163, - "step": 24358 - }, - { - "epoch": 0.62, - "learning_rate": 1.838186980074397e-06, - "loss": 0.8311, - "step": 24359 - }, - { - "epoch": 0.62, - "learning_rate": 1.8381718887591284e-06, - "loss": 0.8203, - "step": 24360 - }, - { - "epoch": 0.62, - "learning_rate": 1.8381567968021104e-06, - "loss": 0.792, - "step": 24361 - }, - { - "epoch": 0.62, - "learning_rate": 1.838141704203354e-06, - "loss": 0.874, - "step": 24362 - }, - { - "epoch": 0.62, - "learning_rate": 1.8381266109628708e-06, - "loss": 0.8105, - "step": 24363 - }, - { - "epoch": 0.62, - "learning_rate": 1.8381115170806729e-06, - "loss": 0.7471, - "step": 24364 - }, - { - "epoch": 0.62, - "learning_rate": 1.8380964225567715e-06, - "loss": 0.9229, - "step": 24365 - }, - { - "epoch": 0.62, - "learning_rate": 1.8380813273911784e-06, - "loss": 1.0918, - "step": 24366 - }, - { - "epoch": 0.62, - "learning_rate": 1.8380662315839043e-06, - "loss": 0.9189, - "step": 24367 - }, - { - "epoch": 0.62, - "learning_rate": 1.8380511351349621e-06, - "loss": 0.876, - "step": 24368 - }, - { - "epoch": 0.62, - "learning_rate": 1.8380360380443624e-06, - "loss": 0.7051, - "step": 24369 - }, - { - "epoch": 0.62, - "learning_rate": 1.8380209403121172e-06, - "loss": 0.79, - "step": 24370 - }, - { - "epoch": 0.62, - "learning_rate": 1.8380058419382378e-06, - "loss": 0.8818, - "step": 24371 - }, - { - "epoch": 0.62, - "learning_rate": 1.8379907429227358e-06, - "loss": 0.9971, - "step": 24372 - }, - { - "epoch": 0.62, - "learning_rate": 1.837975643265623e-06, - "loss": 1.1055, - "step": 24373 - }, - { - "epoch": 0.62, - "learning_rate": 1.8379605429669108e-06, - "loss": 0.9844, - "step": 24374 - }, - { - "epoch": 0.62, - "learning_rate": 1.8379454420266103e-06, - "loss": 0.7383, - "step": 24375 - }, - { - "epoch": 0.62, - "learning_rate": 1.837930340444734e-06, - "loss": 0.7275, - "step": 24376 - }, - { - "epoch": 0.62, - "learning_rate": 1.8379152382212927e-06, - "loss": 0.8887, - "step": 24377 - }, - { - "epoch": 0.62, - "learning_rate": 1.8379001353562985e-06, - "loss": 0.8955, - "step": 24378 - }, - { - "epoch": 0.62, - "learning_rate": 1.8378850318497623e-06, - "loss": 0.6724, - "step": 24379 - }, - { - "epoch": 0.62, - "learning_rate": 1.8378699277016962e-06, - "loss": 0.6929, - "step": 24380 - }, - { - "epoch": 0.62, - "learning_rate": 1.8378548229121118e-06, - "loss": 0.8662, - "step": 24381 - }, - { - "epoch": 0.62, - "learning_rate": 1.8378397174810202e-06, - "loss": 0.8184, - "step": 24382 - }, - { - "epoch": 0.62, - "learning_rate": 1.8378246114084334e-06, - "loss": 0.8789, - "step": 24383 - }, - { - "epoch": 0.62, - "learning_rate": 1.8378095046943628e-06, - "loss": 0.8447, - "step": 24384 - }, - { - "epoch": 0.62, - "learning_rate": 1.83779439733882e-06, - "loss": 0.9795, - "step": 24385 - }, - { - "epoch": 0.63, - "learning_rate": 1.837779289341817e-06, - "loss": 0.8818, - "step": 24386 - }, - { - "epoch": 0.63, - "learning_rate": 1.8377641807033642e-06, - "loss": 0.7124, - "step": 24387 - }, - { - "epoch": 0.63, - "learning_rate": 1.8377490714234741e-06, - "loss": 0.9004, - "step": 24388 - }, - { - "epoch": 0.63, - "learning_rate": 1.8377339615021582e-06, - "loss": 0.7607, - "step": 24389 - }, - { - "epoch": 0.63, - "learning_rate": 1.837718850939428e-06, - "loss": 0.916, - "step": 24390 - }, - { - "epoch": 0.63, - "learning_rate": 1.8377037397352948e-06, - "loss": 0.9009, - "step": 24391 - }, - { - "epoch": 0.63, - "learning_rate": 1.8376886278897703e-06, - "loss": 0.7139, - "step": 24392 - }, - { - "epoch": 0.63, - "learning_rate": 1.8376735154028664e-06, - "loss": 0.7852, - "step": 24393 - }, - { - "epoch": 0.63, - "learning_rate": 1.8376584022745942e-06, - "loss": 0.7524, - "step": 24394 - }, - { - "epoch": 0.63, - "learning_rate": 1.8376432885049656e-06, - "loss": 1.0283, - "step": 24395 - }, - { - "epoch": 0.63, - "learning_rate": 1.837628174093992e-06, - "loss": 0.9658, - "step": 24396 - }, - { - "epoch": 0.63, - "learning_rate": 1.8376130590416849e-06, - "loss": 0.833, - "step": 24397 - }, - { - "epoch": 0.63, - "learning_rate": 1.8375979433480563e-06, - "loss": 0.792, - "step": 24398 - }, - { - "epoch": 0.63, - "learning_rate": 1.8375828270131172e-06, - "loss": 0.9746, - "step": 24399 - }, - { - "epoch": 0.63, - "learning_rate": 1.8375677100368794e-06, - "loss": 0.8584, - "step": 24400 - }, - { - "epoch": 0.63, - "learning_rate": 1.837552592419355e-06, - "loss": 0.9541, - "step": 24401 - }, - { - "epoch": 0.63, - "learning_rate": 1.8375374741605544e-06, - "loss": 0.8506, - "step": 24402 - }, - { - "epoch": 0.63, - "learning_rate": 1.8375223552604902e-06, - "loss": 0.8096, - "step": 24403 - }, - { - "epoch": 0.63, - "learning_rate": 1.8375072357191738e-06, - "loss": 0.7585, - "step": 24404 - }, - { - "epoch": 0.63, - "learning_rate": 1.8374921155366164e-06, - "loss": 0.9512, - "step": 24405 - }, - { - "epoch": 0.63, - "learning_rate": 1.8374769947128299e-06, - "loss": 0.9023, - "step": 24406 - }, - { - "epoch": 0.63, - "learning_rate": 1.8374618732478258e-06, - "loss": 1.0615, - "step": 24407 - }, - { - "epoch": 0.63, - "learning_rate": 1.8374467511416155e-06, - "loss": 1.0098, - "step": 24408 - }, - { - "epoch": 0.63, - "learning_rate": 1.8374316283942108e-06, - "loss": 0.7559, - "step": 24409 - }, - { - "epoch": 0.63, - "learning_rate": 1.8374165050056233e-06, - "loss": 1.0186, - "step": 24410 - }, - { - "epoch": 0.63, - "learning_rate": 1.8374013809758644e-06, - "loss": 0.8711, - "step": 24411 - }, - { - "epoch": 0.63, - "learning_rate": 1.8373862563049455e-06, - "loss": 0.751, - "step": 24412 - }, - { - "epoch": 0.63, - "learning_rate": 1.8373711309928788e-06, - "loss": 0.7466, - "step": 24413 - }, - { - "epoch": 0.63, - "learning_rate": 1.8373560050396754e-06, - "loss": 0.6603, - "step": 24414 - }, - { - "epoch": 0.63, - "learning_rate": 1.8373408784453473e-06, - "loss": 0.8198, - "step": 24415 - }, - { - "epoch": 0.63, - "learning_rate": 1.8373257512099055e-06, - "loss": 0.8486, - "step": 24416 - }, - { - "epoch": 0.63, - "learning_rate": 1.8373106233333617e-06, - "loss": 0.8193, - "step": 24417 - }, - { - "epoch": 0.63, - "learning_rate": 1.837295494815728e-06, - "loss": 0.7461, - "step": 24418 - }, - { - "epoch": 0.63, - "learning_rate": 1.8372803656570155e-06, - "loss": 1.1348, - "step": 24419 - }, - { - "epoch": 0.63, - "learning_rate": 1.837265235857236e-06, - "loss": 0.873, - "step": 24420 - }, - { - "epoch": 0.63, - "learning_rate": 1.837250105416401e-06, - "loss": 0.8398, - "step": 24421 - }, - { - "epoch": 0.63, - "learning_rate": 1.8372349743345219e-06, - "loss": 0.8086, - "step": 24422 - }, - { - "epoch": 0.63, - "learning_rate": 1.8372198426116109e-06, - "loss": 0.9346, - "step": 24423 - }, - { - "epoch": 0.63, - "learning_rate": 1.8372047102476787e-06, - "loss": 0.8496, - "step": 24424 - }, - { - "epoch": 0.63, - "learning_rate": 1.8371895772427376e-06, - "loss": 0.8994, - "step": 24425 - }, - { - "epoch": 0.63, - "learning_rate": 1.8371744435967988e-06, - "loss": 0.8623, - "step": 24426 - }, - { - "epoch": 0.63, - "learning_rate": 1.8371593093098744e-06, - "loss": 0.7686, - "step": 24427 - }, - { - "epoch": 0.63, - "learning_rate": 1.8371441743819751e-06, - "loss": 0.8379, - "step": 24428 - }, - { - "epoch": 0.63, - "learning_rate": 1.8371290388131131e-06, - "loss": 0.8076, - "step": 24429 - }, - { - "epoch": 0.63, - "learning_rate": 1.8371139026033e-06, - "loss": 0.8379, - "step": 24430 - }, - { - "epoch": 0.63, - "learning_rate": 1.837098765752547e-06, - "loss": 1.1357, - "step": 24431 - }, - { - "epoch": 0.63, - "learning_rate": 1.8370836282608665e-06, - "loss": 0.8306, - "step": 24432 - }, - { - "epoch": 0.63, - "learning_rate": 1.8370684901282694e-06, - "loss": 0.9199, - "step": 24433 - }, - { - "epoch": 0.63, - "learning_rate": 1.8370533513547673e-06, - "loss": 0.7065, - "step": 24434 - }, - { - "epoch": 0.63, - "learning_rate": 1.837038211940372e-06, - "loss": 1.0703, - "step": 24435 - }, - { - "epoch": 0.63, - "learning_rate": 1.8370230718850949e-06, - "loss": 0.5249, - "step": 24436 - }, - { - "epoch": 0.63, - "learning_rate": 1.8370079311889479e-06, - "loss": 0.9258, - "step": 24437 - }, - { - "epoch": 0.63, - "learning_rate": 1.8369927898519423e-06, - "loss": 0.7969, - "step": 24438 - }, - { - "epoch": 0.63, - "learning_rate": 1.83697764787409e-06, - "loss": 0.7007, - "step": 24439 - }, - { - "epoch": 0.63, - "learning_rate": 1.836962505255402e-06, - "loss": 0.9844, - "step": 24440 - }, - { - "epoch": 0.63, - "learning_rate": 1.8369473619958906e-06, - "loss": 0.8594, - "step": 24441 - }, - { - "epoch": 0.63, - "learning_rate": 1.8369322180955668e-06, - "loss": 0.9053, - "step": 24442 - }, - { - "epoch": 0.63, - "learning_rate": 1.8369170735544431e-06, - "loss": 0.9902, - "step": 24443 - }, - { - "epoch": 0.63, - "learning_rate": 1.83690192837253e-06, - "loss": 0.5806, - "step": 24444 - }, - { - "epoch": 0.63, - "learning_rate": 1.8368867825498398e-06, - "loss": 0.9307, - "step": 24445 - }, - { - "epoch": 0.63, - "learning_rate": 1.8368716360863833e-06, - "loss": 1.1504, - "step": 24446 - }, - { - "epoch": 0.63, - "learning_rate": 1.8368564889821733e-06, - "loss": 1.0879, - "step": 24447 - }, - { - "epoch": 0.63, - "learning_rate": 1.8368413412372205e-06, - "loss": 0.9316, - "step": 24448 - }, - { - "epoch": 0.63, - "learning_rate": 1.836826192851537e-06, - "loss": 1.1582, - "step": 24449 - }, - { - "epoch": 0.63, - "learning_rate": 1.836811043825134e-06, - "loss": 0.9033, - "step": 24450 - }, - { - "epoch": 0.63, - "learning_rate": 1.836795894158023e-06, - "loss": 0.6831, - "step": 24451 - }, - { - "epoch": 0.63, - "learning_rate": 1.8367807438502164e-06, - "loss": 0.8213, - "step": 24452 - }, - { - "epoch": 0.63, - "learning_rate": 1.8367655929017246e-06, - "loss": 0.8701, - "step": 24453 - }, - { - "epoch": 0.63, - "learning_rate": 1.8367504413125605e-06, - "loss": 0.8271, - "step": 24454 - }, - { - "epoch": 0.63, - "learning_rate": 1.8367352890827347e-06, - "loss": 0.9365, - "step": 24455 - }, - { - "epoch": 0.63, - "learning_rate": 1.8367201362122594e-06, - "loss": 0.9404, - "step": 24456 - }, - { - "epoch": 0.63, - "learning_rate": 1.836704982701146e-06, - "loss": 1.1289, - "step": 24457 - }, - { - "epoch": 0.63, - "learning_rate": 1.8366898285494058e-06, - "loss": 0.7646, - "step": 24458 - }, - { - "epoch": 0.63, - "learning_rate": 1.8366746737570506e-06, - "loss": 0.999, - "step": 24459 - }, - { - "epoch": 0.63, - "learning_rate": 1.8366595183240922e-06, - "loss": 0.8965, - "step": 24460 - }, - { - "epoch": 0.63, - "learning_rate": 1.836644362250542e-06, - "loss": 1.1172, - "step": 24461 - }, - { - "epoch": 0.63, - "learning_rate": 1.836629205536412e-06, - "loss": 0.8525, - "step": 24462 - }, - { - "epoch": 0.63, - "learning_rate": 1.8366140481817132e-06, - "loss": 0.9678, - "step": 24463 - }, - { - "epoch": 0.63, - "learning_rate": 1.8365988901864577e-06, - "loss": 0.6216, - "step": 24464 - }, - { - "epoch": 0.63, - "learning_rate": 1.8365837315506568e-06, - "loss": 1.0068, - "step": 24465 - }, - { - "epoch": 0.63, - "learning_rate": 1.8365685722743223e-06, - "loss": 0.7695, - "step": 24466 - }, - { - "epoch": 0.63, - "learning_rate": 1.8365534123574654e-06, - "loss": 0.9658, - "step": 24467 - }, - { - "epoch": 0.63, - "learning_rate": 1.8365382518000983e-06, - "loss": 1.1211, - "step": 24468 - }, - { - "epoch": 0.63, - "learning_rate": 1.8365230906022322e-06, - "loss": 0.9346, - "step": 24469 - }, - { - "epoch": 0.63, - "learning_rate": 1.8365079287638787e-06, - "loss": 0.998, - "step": 24470 - }, - { - "epoch": 0.63, - "learning_rate": 1.8364927662850498e-06, - "loss": 0.876, - "step": 24471 - }, - { - "epoch": 0.63, - "learning_rate": 1.8364776031657568e-06, - "loss": 0.8135, - "step": 24472 - }, - { - "epoch": 0.63, - "learning_rate": 1.8364624394060114e-06, - "loss": 0.8022, - "step": 24473 - }, - { - "epoch": 0.63, - "learning_rate": 1.836447275005825e-06, - "loss": 0.9229, - "step": 24474 - }, - { - "epoch": 0.63, - "learning_rate": 1.8364321099652095e-06, - "loss": 0.8896, - "step": 24475 - }, - { - "epoch": 0.63, - "learning_rate": 1.8364169442841763e-06, - "loss": 0.9004, - "step": 24476 - }, - { - "epoch": 0.63, - "learning_rate": 1.8364017779627371e-06, - "loss": 0.7637, - "step": 24477 - }, - { - "epoch": 0.63, - "learning_rate": 1.8363866110009037e-06, - "loss": 0.6924, - "step": 24478 - }, - { - "epoch": 0.63, - "learning_rate": 1.8363714433986874e-06, - "loss": 0.8418, - "step": 24479 - }, - { - "epoch": 0.63, - "learning_rate": 1.8363562751561e-06, - "loss": 0.8203, - "step": 24480 - }, - { - "epoch": 0.63, - "learning_rate": 1.836341106273153e-06, - "loss": 1.0342, - "step": 24481 - }, - { - "epoch": 0.63, - "learning_rate": 1.8363259367498581e-06, - "loss": 1.0283, - "step": 24482 - }, - { - "epoch": 0.63, - "learning_rate": 1.836310766586227e-06, - "loss": 0.9463, - "step": 24483 - }, - { - "epoch": 0.63, - "learning_rate": 1.836295595782271e-06, - "loss": 0.9541, - "step": 24484 - }, - { - "epoch": 0.63, - "learning_rate": 1.836280424338002e-06, - "loss": 0.6885, - "step": 24485 - }, - { - "epoch": 0.63, - "learning_rate": 1.8362652522534315e-06, - "loss": 1.1562, - "step": 24486 - }, - { - "epoch": 0.63, - "learning_rate": 1.8362500795285712e-06, - "loss": 0.8809, - "step": 24487 - }, - { - "epoch": 0.63, - "learning_rate": 1.8362349061634328e-06, - "loss": 0.7568, - "step": 24488 - }, - { - "epoch": 0.63, - "learning_rate": 1.8362197321580274e-06, - "loss": 0.5571, - "step": 24489 - }, - { - "epoch": 0.63, - "learning_rate": 1.8362045575123673e-06, - "loss": 0.8877, - "step": 24490 - }, - { - "epoch": 0.63, - "learning_rate": 1.8361893822264637e-06, - "loss": 0.7725, - "step": 24491 - }, - { - "epoch": 0.63, - "learning_rate": 1.8361742063003286e-06, - "loss": 0.8599, - "step": 24492 - }, - { - "epoch": 0.63, - "learning_rate": 1.8361590297339731e-06, - "loss": 1.0146, - "step": 24493 - }, - { - "epoch": 0.63, - "learning_rate": 1.8361438525274088e-06, - "loss": 0.9863, - "step": 24494 - }, - { - "epoch": 0.63, - "learning_rate": 1.836128674680648e-06, - "loss": 0.7666, - "step": 24495 - }, - { - "epoch": 0.63, - "learning_rate": 1.8361134961937022e-06, - "loss": 0.6621, - "step": 24496 - }, - { - "epoch": 0.63, - "learning_rate": 1.836098317066582e-06, - "loss": 0.959, - "step": 24497 - }, - { - "epoch": 0.63, - "learning_rate": 1.8360831372993002e-06, - "loss": 0.5742, - "step": 24498 - }, - { - "epoch": 0.63, - "learning_rate": 1.8360679568918682e-06, - "loss": 0.9238, - "step": 24499 - }, - { - "epoch": 0.63, - "learning_rate": 1.836052775844297e-06, - "loss": 0.9326, - "step": 24500 - }, - { - "epoch": 0.63, - "learning_rate": 1.8360375941565987e-06, - "loss": 0.7773, - "step": 24501 - }, - { - "epoch": 0.63, - "learning_rate": 1.836022411828785e-06, - "loss": 0.6582, - "step": 24502 - }, - { - "epoch": 0.63, - "learning_rate": 1.8360072288608674e-06, - "loss": 0.6377, - "step": 24503 - }, - { - "epoch": 0.63, - "learning_rate": 1.8359920452528575e-06, - "loss": 0.9482, - "step": 24504 - }, - { - "epoch": 0.63, - "learning_rate": 1.8359768610047666e-06, - "loss": 0.8037, - "step": 24505 - }, - { - "epoch": 0.63, - "learning_rate": 1.835961676116607e-06, - "loss": 0.8594, - "step": 24506 - }, - { - "epoch": 0.63, - "learning_rate": 1.83594649058839e-06, - "loss": 0.8408, - "step": 24507 - }, - { - "epoch": 0.63, - "learning_rate": 1.835931304420127e-06, - "loss": 1.0127, - "step": 24508 - }, - { - "epoch": 0.63, - "learning_rate": 1.8359161176118299e-06, - "loss": 0.9248, - "step": 24509 - }, - { - "epoch": 0.63, - "learning_rate": 1.8359009301635102e-06, - "loss": 0.8564, - "step": 24510 - }, - { - "epoch": 0.63, - "learning_rate": 1.8358857420751797e-06, - "loss": 0.7959, - "step": 24511 - }, - { - "epoch": 0.63, - "learning_rate": 1.83587055334685e-06, - "loss": 0.6982, - "step": 24512 - }, - { - "epoch": 0.63, - "learning_rate": 1.8358553639785325e-06, - "loss": 0.7842, - "step": 24513 - }, - { - "epoch": 0.63, - "learning_rate": 1.8358401739702392e-06, - "loss": 0.8789, - "step": 24514 - }, - { - "epoch": 0.63, - "learning_rate": 1.8358249833219813e-06, - "loss": 0.9678, - "step": 24515 - }, - { - "epoch": 0.63, - "learning_rate": 1.8358097920337708e-06, - "loss": 0.7842, - "step": 24516 - }, - { - "epoch": 0.63, - "learning_rate": 1.835794600105619e-06, - "loss": 0.7437, - "step": 24517 - }, - { - "epoch": 0.63, - "learning_rate": 1.835779407537538e-06, - "loss": 0.709, - "step": 24518 - }, - { - "epoch": 0.63, - "learning_rate": 1.8357642143295387e-06, - "loss": 0.6934, - "step": 24519 - }, - { - "epoch": 0.63, - "learning_rate": 1.8357490204816335e-06, - "loss": 0.7793, - "step": 24520 - }, - { - "epoch": 0.63, - "learning_rate": 1.8357338259938335e-06, - "loss": 0.7588, - "step": 24521 - }, - { - "epoch": 0.63, - "learning_rate": 1.8357186308661508e-06, - "loss": 0.877, - "step": 24522 - }, - { - "epoch": 0.63, - "learning_rate": 1.8357034350985962e-06, - "loss": 1.0264, - "step": 24523 - }, - { - "epoch": 0.63, - "learning_rate": 1.8356882386911824e-06, - "loss": 0.8457, - "step": 24524 - }, - { - "epoch": 0.63, - "learning_rate": 1.8356730416439206e-06, - "loss": 0.8784, - "step": 24525 - }, - { - "epoch": 0.63, - "learning_rate": 1.8356578439568223e-06, - "loss": 0.8711, - "step": 24526 - }, - { - "epoch": 0.63, - "learning_rate": 1.835642645629899e-06, - "loss": 0.8213, - "step": 24527 - }, - { - "epoch": 0.63, - "learning_rate": 1.8356274466631627e-06, - "loss": 1.0596, - "step": 24528 - }, - { - "epoch": 0.63, - "learning_rate": 1.835612247056625e-06, - "loss": 0.728, - "step": 24529 - }, - { - "epoch": 0.63, - "learning_rate": 1.8355970468102973e-06, - "loss": 0.7881, - "step": 24530 - }, - { - "epoch": 0.63, - "learning_rate": 1.8355818459241915e-06, - "loss": 0.6787, - "step": 24531 - }, - { - "epoch": 0.63, - "learning_rate": 1.8355666443983187e-06, - "loss": 0.7422, - "step": 24532 - }, - { - "epoch": 0.63, - "learning_rate": 1.8355514422326915e-06, - "loss": 0.8428, - "step": 24533 - }, - { - "epoch": 0.63, - "learning_rate": 1.8355362394273204e-06, - "loss": 0.7317, - "step": 24534 - }, - { - "epoch": 0.63, - "learning_rate": 1.835521035982218e-06, - "loss": 0.7075, - "step": 24535 - }, - { - "epoch": 0.63, - "learning_rate": 1.8355058318973955e-06, - "loss": 1.0566, - "step": 24536 - }, - { - "epoch": 0.63, - "learning_rate": 1.8354906271728644e-06, - "loss": 0.8281, - "step": 24537 - }, - { - "epoch": 0.63, - "learning_rate": 1.835475421808637e-06, - "loss": 0.7749, - "step": 24538 - }, - { - "epoch": 0.63, - "learning_rate": 1.8354602158047241e-06, - "loss": 0.9053, - "step": 24539 - }, - { - "epoch": 0.63, - "learning_rate": 1.835445009161138e-06, - "loss": 0.9121, - "step": 24540 - }, - { - "epoch": 0.63, - "learning_rate": 1.8354298018778898e-06, - "loss": 0.7871, - "step": 24541 - }, - { - "epoch": 0.63, - "learning_rate": 1.8354145939549915e-06, - "loss": 0.957, - "step": 24542 - }, - { - "epoch": 0.63, - "learning_rate": 1.8353993853924545e-06, - "loss": 0.9639, - "step": 24543 - }, - { - "epoch": 0.63, - "learning_rate": 1.835384176190291e-06, - "loss": 1.1055, - "step": 24544 - }, - { - "epoch": 0.63, - "learning_rate": 1.8353689663485118e-06, - "loss": 0.9082, - "step": 24545 - }, - { - "epoch": 0.63, - "learning_rate": 1.8353537558671293e-06, - "loss": 0.8564, - "step": 24546 - }, - { - "epoch": 0.63, - "learning_rate": 1.8353385447461548e-06, - "loss": 0.9785, - "step": 24547 - }, - { - "epoch": 0.63, - "learning_rate": 1.8353233329855999e-06, - "loss": 0.9648, - "step": 24548 - }, - { - "epoch": 0.63, - "learning_rate": 1.8353081205854766e-06, - "loss": 0.9229, - "step": 24549 - }, - { - "epoch": 0.63, - "learning_rate": 1.8352929075457959e-06, - "loss": 0.9873, - "step": 24550 - }, - { - "epoch": 0.63, - "learning_rate": 1.8352776938665699e-06, - "loss": 0.6741, - "step": 24551 - }, - { - "epoch": 0.63, - "learning_rate": 1.8352624795478105e-06, - "loss": 1.0361, - "step": 24552 - }, - { - "epoch": 0.63, - "learning_rate": 1.8352472645895287e-06, - "loss": 0.9434, - "step": 24553 - }, - { - "epoch": 0.63, - "learning_rate": 1.8352320489917365e-06, - "loss": 0.752, - "step": 24554 - }, - { - "epoch": 0.63, - "learning_rate": 1.8352168327544458e-06, - "loss": 0.9609, - "step": 24555 - }, - { - "epoch": 0.63, - "learning_rate": 1.8352016158776674e-06, - "loss": 0.6709, - "step": 24556 - }, - { - "epoch": 0.63, - "learning_rate": 1.8351863983614142e-06, - "loss": 0.9062, - "step": 24557 - }, - { - "epoch": 0.63, - "learning_rate": 1.8351711802056967e-06, - "loss": 0.6914, - "step": 24558 - }, - { - "epoch": 0.63, - "learning_rate": 1.8351559614105275e-06, - "loss": 0.8672, - "step": 24559 - }, - { - "epoch": 0.63, - "learning_rate": 1.8351407419759174e-06, - "loss": 0.9951, - "step": 24560 - }, - { - "epoch": 0.63, - "learning_rate": 1.8351255219018785e-06, - "loss": 0.9619, - "step": 24561 - }, - { - "epoch": 0.63, - "learning_rate": 1.8351103011884223e-06, - "loss": 0.9395, - "step": 24562 - }, - { - "epoch": 0.63, - "learning_rate": 1.8350950798355606e-06, - "loss": 1.0049, - "step": 24563 - }, - { - "epoch": 0.63, - "learning_rate": 1.835079857843305e-06, - "loss": 0.9111, - "step": 24564 - }, - { - "epoch": 0.63, - "learning_rate": 1.8350646352116671e-06, - "loss": 0.9297, - "step": 24565 - }, - { - "epoch": 0.63, - "learning_rate": 1.835049411940659e-06, - "loss": 0.9922, - "step": 24566 - }, - { - "epoch": 0.63, - "learning_rate": 1.8350341880302915e-06, - "loss": 0.6758, - "step": 24567 - }, - { - "epoch": 0.63, - "learning_rate": 1.835018963480577e-06, - "loss": 0.709, - "step": 24568 - }, - { - "epoch": 0.63, - "learning_rate": 1.8350037382915267e-06, - "loss": 1.2734, - "step": 24569 - }, - { - "epoch": 0.63, - "learning_rate": 1.8349885124631524e-06, - "loss": 0.7627, - "step": 24570 - }, - { - "epoch": 0.63, - "learning_rate": 1.8349732859954661e-06, - "loss": 0.6855, - "step": 24571 - }, - { - "epoch": 0.63, - "learning_rate": 1.8349580588884788e-06, - "loss": 0.8809, - "step": 24572 - }, - { - "epoch": 0.63, - "learning_rate": 1.8349428311422027e-06, - "loss": 0.8096, - "step": 24573 - }, - { - "epoch": 0.63, - "learning_rate": 1.834927602756649e-06, - "loss": 0.8228, - "step": 24574 - }, - { - "epoch": 0.63, - "learning_rate": 1.83491237373183e-06, - "loss": 0.7568, - "step": 24575 - }, - { - "epoch": 0.63, - "learning_rate": 1.8348971440677567e-06, - "loss": 0.915, - "step": 24576 - }, - { - "epoch": 0.63, - "learning_rate": 1.834881913764441e-06, - "loss": 0.9062, - "step": 24577 - }, - { - "epoch": 0.63, - "learning_rate": 1.8348666828218948e-06, - "loss": 0.9756, - "step": 24578 - }, - { - "epoch": 0.63, - "learning_rate": 1.8348514512401296e-06, - "loss": 0.8398, - "step": 24579 - }, - { - "epoch": 0.63, - "learning_rate": 1.8348362190191571e-06, - "loss": 0.958, - "step": 24580 - }, - { - "epoch": 0.63, - "learning_rate": 1.8348209861589888e-06, - "loss": 0.8364, - "step": 24581 - }, - { - "epoch": 0.63, - "learning_rate": 1.8348057526596365e-06, - "loss": 0.9131, - "step": 24582 - }, - { - "epoch": 0.63, - "learning_rate": 1.8347905185211117e-06, - "loss": 0.7383, - "step": 24583 - }, - { - "epoch": 0.63, - "learning_rate": 1.834775283743426e-06, - "loss": 0.5994, - "step": 24584 - }, - { - "epoch": 0.63, - "learning_rate": 1.8347600483265917e-06, - "loss": 0.999, - "step": 24585 - }, - { - "epoch": 0.63, - "learning_rate": 1.8347448122706197e-06, - "loss": 0.709, - "step": 24586 - }, - { - "epoch": 0.63, - "learning_rate": 1.834729575575522e-06, - "loss": 0.9131, - "step": 24587 - }, - { - "epoch": 0.63, - "learning_rate": 1.8347143382413105e-06, - "loss": 0.9521, - "step": 24588 - }, - { - "epoch": 0.63, - "learning_rate": 1.834699100267996e-06, - "loss": 1.0127, - "step": 24589 - }, - { - "epoch": 0.63, - "learning_rate": 1.8346838616555912e-06, - "loss": 0.5786, - "step": 24590 - }, - { - "epoch": 0.63, - "learning_rate": 1.8346686224041074e-06, - "loss": 1.0625, - "step": 24591 - }, - { - "epoch": 0.63, - "learning_rate": 1.8346533825135564e-06, - "loss": 0.7295, - "step": 24592 - }, - { - "epoch": 0.63, - "learning_rate": 1.8346381419839494e-06, - "loss": 0.9766, - "step": 24593 - }, - { - "epoch": 0.63, - "learning_rate": 1.8346229008152983e-06, - "loss": 0.5874, - "step": 24594 - }, - { - "epoch": 0.63, - "learning_rate": 1.8346076590076152e-06, - "loss": 0.917, - "step": 24595 - }, - { - "epoch": 0.63, - "learning_rate": 1.8345924165609107e-06, - "loss": 0.7759, - "step": 24596 - }, - { - "epoch": 0.63, - "learning_rate": 1.8345771734751978e-06, - "loss": 0.8711, - "step": 24597 - }, - { - "epoch": 0.63, - "learning_rate": 1.8345619297504873e-06, - "loss": 0.9023, - "step": 24598 - }, - { - "epoch": 0.63, - "learning_rate": 1.8345466853867913e-06, - "loss": 0.8853, - "step": 24599 - }, - { - "epoch": 0.63, - "learning_rate": 1.834531440384121e-06, - "loss": 0.7725, - "step": 24600 - }, - { - "epoch": 0.63, - "learning_rate": 1.8345161947424886e-06, - "loss": 0.5884, - "step": 24601 - }, - { - "epoch": 0.63, - "learning_rate": 1.834500948461905e-06, - "loss": 0.9824, - "step": 24602 - }, - { - "epoch": 0.63, - "learning_rate": 1.8344857015423828e-06, - "loss": 0.835, - "step": 24603 - }, - { - "epoch": 0.63, - "learning_rate": 1.8344704539839332e-06, - "loss": 0.7456, - "step": 24604 - }, - { - "epoch": 0.63, - "learning_rate": 1.8344552057865681e-06, - "loss": 0.8701, - "step": 24605 - }, - { - "epoch": 0.63, - "learning_rate": 1.8344399569502988e-06, - "loss": 0.7661, - "step": 24606 - }, - { - "epoch": 0.63, - "learning_rate": 1.8344247074751373e-06, - "loss": 0.7549, - "step": 24607 - }, - { - "epoch": 0.63, - "learning_rate": 1.834409457361095e-06, - "loss": 1.0137, - "step": 24608 - }, - { - "epoch": 0.63, - "learning_rate": 1.8343942066081842e-06, - "loss": 0.9658, - "step": 24609 - }, - { - "epoch": 0.63, - "learning_rate": 1.8343789552164158e-06, - "loss": 0.7319, - "step": 24610 - }, - { - "epoch": 0.63, - "learning_rate": 1.8343637031858017e-06, - "loss": 0.8623, - "step": 24611 - }, - { - "epoch": 0.63, - "learning_rate": 1.8343484505163538e-06, - "loss": 0.6284, - "step": 24612 - }, - { - "epoch": 0.63, - "learning_rate": 1.8343331972080836e-06, - "loss": 0.7847, - "step": 24613 - }, - { - "epoch": 0.63, - "learning_rate": 1.834317943261003e-06, - "loss": 0.9961, - "step": 24614 - }, - { - "epoch": 0.63, - "learning_rate": 1.8343026886751233e-06, - "loss": 0.7734, - "step": 24615 - }, - { - "epoch": 0.63, - "learning_rate": 1.8342874334504566e-06, - "loss": 0.8799, - "step": 24616 - }, - { - "epoch": 0.63, - "learning_rate": 1.8342721775870143e-06, - "loss": 0.8516, - "step": 24617 - }, - { - "epoch": 0.63, - "learning_rate": 1.834256921084808e-06, - "loss": 0.9688, - "step": 24618 - }, - { - "epoch": 0.63, - "learning_rate": 1.8342416639438496e-06, - "loss": 0.9395, - "step": 24619 - }, - { - "epoch": 0.63, - "learning_rate": 1.8342264061641508e-06, - "loss": 0.915, - "step": 24620 - }, - { - "epoch": 0.63, - "learning_rate": 1.8342111477457234e-06, - "loss": 0.5981, - "step": 24621 - }, - { - "epoch": 0.63, - "learning_rate": 1.8341958886885783e-06, - "loss": 0.8174, - "step": 24622 - }, - { - "epoch": 0.63, - "learning_rate": 1.8341806289927283e-06, - "loss": 0.9189, - "step": 24623 - }, - { - "epoch": 0.63, - "learning_rate": 1.8341653686581843e-06, - "loss": 0.8921, - "step": 24624 - }, - { - "epoch": 0.63, - "learning_rate": 1.8341501076849584e-06, - "loss": 0.8462, - "step": 24625 - }, - { - "epoch": 0.63, - "learning_rate": 1.8341348460730618e-06, - "loss": 0.8613, - "step": 24626 - }, - { - "epoch": 0.63, - "learning_rate": 1.834119583822507e-06, - "loss": 0.6748, - "step": 24627 - }, - { - "epoch": 0.63, - "learning_rate": 1.8341043209333049e-06, - "loss": 0.8926, - "step": 24628 - }, - { - "epoch": 0.63, - "learning_rate": 1.8340890574054674e-06, - "loss": 0.958, - "step": 24629 - }, - { - "epoch": 0.63, - "learning_rate": 1.8340737932390065e-06, - "loss": 0.8521, - "step": 24630 - }, - { - "epoch": 0.63, - "learning_rate": 1.8340585284339333e-06, - "loss": 1.0137, - "step": 24631 - }, - { - "epoch": 0.63, - "learning_rate": 1.83404326299026e-06, - "loss": 0.8057, - "step": 24632 - }, - { - "epoch": 0.63, - "learning_rate": 1.8340279969079982e-06, - "loss": 1.0244, - "step": 24633 - }, - { - "epoch": 0.63, - "learning_rate": 1.8340127301871595e-06, - "loss": 0.8232, - "step": 24634 - }, - { - "epoch": 0.63, - "learning_rate": 1.8339974628277558e-06, - "loss": 1.0371, - "step": 24635 - }, - { - "epoch": 0.63, - "learning_rate": 1.8339821948297983e-06, - "loss": 0.7197, - "step": 24636 - }, - { - "epoch": 0.63, - "learning_rate": 1.833966926193299e-06, - "loss": 0.873, - "step": 24637 - }, - { - "epoch": 0.63, - "learning_rate": 1.8339516569182694e-06, - "loss": 1.0132, - "step": 24638 - }, - { - "epoch": 0.63, - "learning_rate": 1.8339363870047215e-06, - "loss": 0.7944, - "step": 24639 - }, - { - "epoch": 0.63, - "learning_rate": 1.8339211164526672e-06, - "loss": 0.9512, - "step": 24640 - }, - { - "epoch": 0.63, - "learning_rate": 1.8339058452621174e-06, - "loss": 0.8301, - "step": 24641 - }, - { - "epoch": 0.63, - "learning_rate": 1.8338905734330845e-06, - "loss": 0.73, - "step": 24642 - }, - { - "epoch": 0.63, - "learning_rate": 1.8338753009655798e-06, - "loss": 0.7197, - "step": 24643 - }, - { - "epoch": 0.63, - "learning_rate": 1.8338600278596153e-06, - "loss": 0.7412, - "step": 24644 - }, - { - "epoch": 0.63, - "learning_rate": 1.8338447541152023e-06, - "loss": 0.8525, - "step": 24645 - }, - { - "epoch": 0.63, - "learning_rate": 1.8338294797323528e-06, - "loss": 0.7686, - "step": 24646 - }, - { - "epoch": 0.63, - "learning_rate": 1.8338142047110784e-06, - "loss": 0.8311, - "step": 24647 - }, - { - "epoch": 0.63, - "learning_rate": 1.833798929051391e-06, - "loss": 0.8379, - "step": 24648 - }, - { - "epoch": 0.63, - "learning_rate": 1.8337836527533017e-06, - "loss": 0.9756, - "step": 24649 - }, - { - "epoch": 0.63, - "learning_rate": 1.833768375816823e-06, - "loss": 0.9668, - "step": 24650 - }, - { - "epoch": 0.63, - "learning_rate": 1.8337530982419658e-06, - "loss": 0.8291, - "step": 24651 - }, - { - "epoch": 0.63, - "learning_rate": 1.8337378200287423e-06, - "loss": 0.9824, - "step": 24652 - }, - { - "epoch": 0.63, - "learning_rate": 1.8337225411771642e-06, - "loss": 0.7754, - "step": 24653 - }, - { - "epoch": 0.63, - "learning_rate": 1.8337072616872432e-06, - "loss": 0.8076, - "step": 24654 - }, - { - "epoch": 0.63, - "learning_rate": 1.8336919815589909e-06, - "loss": 0.9453, - "step": 24655 - }, - { - "epoch": 0.63, - "learning_rate": 1.8336767007924187e-06, - "loss": 0.8481, - "step": 24656 - }, - { - "epoch": 0.63, - "learning_rate": 1.8336614193875386e-06, - "loss": 0.7891, - "step": 24657 - }, - { - "epoch": 0.63, - "learning_rate": 1.8336461373443624e-06, - "loss": 0.8154, - "step": 24658 - }, - { - "epoch": 0.63, - "learning_rate": 1.8336308546629016e-06, - "loss": 0.7427, - "step": 24659 - }, - { - "epoch": 0.63, - "learning_rate": 1.8336155713431682e-06, - "loss": 0.8416, - "step": 24660 - }, - { - "epoch": 0.63, - "learning_rate": 1.8336002873851734e-06, - "loss": 0.9814, - "step": 24661 - }, - { - "epoch": 0.63, - "learning_rate": 1.8335850027889294e-06, - "loss": 0.7168, - "step": 24662 - }, - { - "epoch": 0.63, - "learning_rate": 1.8335697175544477e-06, - "loss": 0.9854, - "step": 24663 - }, - { - "epoch": 0.63, - "learning_rate": 1.8335544316817399e-06, - "loss": 0.7979, - "step": 24664 - }, - { - "epoch": 0.63, - "learning_rate": 1.833539145170818e-06, - "loss": 0.9688, - "step": 24665 - }, - { - "epoch": 0.63, - "learning_rate": 1.8335238580216932e-06, - "loss": 0.8193, - "step": 24666 - }, - { - "epoch": 0.63, - "learning_rate": 1.8335085702343775e-06, - "loss": 1.0049, - "step": 24667 - }, - { - "epoch": 0.63, - "learning_rate": 1.833493281808883e-06, - "loss": 0.9219, - "step": 24668 - }, - { - "epoch": 0.63, - "learning_rate": 1.833477992745221e-06, - "loss": 0.8174, - "step": 24669 - }, - { - "epoch": 0.63, - "learning_rate": 1.8334627030434028e-06, - "loss": 0.6846, - "step": 24670 - }, - { - "epoch": 0.63, - "learning_rate": 1.8334474127034407e-06, - "loss": 1.0156, - "step": 24671 - }, - { - "epoch": 0.63, - "learning_rate": 1.8334321217253463e-06, - "loss": 0.8965, - "step": 24672 - }, - { - "epoch": 0.63, - "learning_rate": 1.8334168301091313e-06, - "loss": 0.8975, - "step": 24673 - }, - { - "epoch": 0.63, - "learning_rate": 1.833401537854807e-06, - "loss": 0.9258, - "step": 24674 - }, - { - "epoch": 0.63, - "learning_rate": 1.8333862449623859e-06, - "loss": 0.7939, - "step": 24675 - }, - { - "epoch": 0.63, - "learning_rate": 1.833370951431879e-06, - "loss": 0.7954, - "step": 24676 - }, - { - "epoch": 0.63, - "learning_rate": 1.8333556572632984e-06, - "loss": 0.9482, - "step": 24677 - }, - { - "epoch": 0.63, - "learning_rate": 1.8333403624566558e-06, - "loss": 0.8652, - "step": 24678 - }, - { - "epoch": 0.63, - "learning_rate": 1.8333250670119627e-06, - "loss": 0.8193, - "step": 24679 - }, - { - "epoch": 0.63, - "learning_rate": 1.8333097709292309e-06, - "loss": 0.9863, - "step": 24680 - }, - { - "epoch": 0.63, - "learning_rate": 1.833294474208472e-06, - "loss": 0.5255, - "step": 24681 - }, - { - "epoch": 0.63, - "learning_rate": 1.833279176849698e-06, - "loss": 0.8965, - "step": 24682 - }, - { - "epoch": 0.63, - "learning_rate": 1.8332638788529204e-06, - "loss": 0.9746, - "step": 24683 - }, - { - "epoch": 0.63, - "learning_rate": 1.833248580218151e-06, - "loss": 0.7339, - "step": 24684 - }, - { - "epoch": 0.63, - "learning_rate": 1.8332332809454013e-06, - "loss": 0.9824, - "step": 24685 - }, - { - "epoch": 0.63, - "learning_rate": 1.8332179810346834e-06, - "loss": 1.0459, - "step": 24686 - }, - { - "epoch": 0.63, - "learning_rate": 1.8332026804860087e-06, - "loss": 0.7632, - "step": 24687 - }, - { - "epoch": 0.63, - "learning_rate": 1.8331873792993892e-06, - "loss": 0.5436, - "step": 24688 - }, - { - "epoch": 0.63, - "learning_rate": 1.8331720774748362e-06, - "loss": 0.8477, - "step": 24689 - }, - { - "epoch": 0.63, - "learning_rate": 1.833156775012362e-06, - "loss": 0.7949, - "step": 24690 - }, - { - "epoch": 0.63, - "learning_rate": 1.8331414719119776e-06, - "loss": 0.6436, - "step": 24691 - }, - { - "epoch": 0.63, - "learning_rate": 1.8331261681736955e-06, - "loss": 0.7739, - "step": 24692 - }, - { - "epoch": 0.63, - "learning_rate": 1.8331108637975264e-06, - "loss": 0.7827, - "step": 24693 - }, - { - "epoch": 0.63, - "learning_rate": 1.8330955587834829e-06, - "loss": 0.8135, - "step": 24694 - }, - { - "epoch": 0.63, - "learning_rate": 1.8330802531315765e-06, - "loss": 0.6802, - "step": 24695 - }, - { - "epoch": 0.63, - "learning_rate": 1.8330649468418188e-06, - "loss": 0.834, - "step": 24696 - }, - { - "epoch": 0.63, - "learning_rate": 1.8330496399142215e-06, - "loss": 0.7778, - "step": 24697 - }, - { - "epoch": 0.63, - "learning_rate": 1.8330343323487964e-06, - "loss": 0.9277, - "step": 24698 - }, - { - "epoch": 0.63, - "learning_rate": 1.8330190241455555e-06, - "loss": 0.8105, - "step": 24699 - }, - { - "epoch": 0.63, - "learning_rate": 1.83300371530451e-06, - "loss": 1.0176, - "step": 24700 - }, - { - "epoch": 0.63, - "learning_rate": 1.8329884058256719e-06, - "loss": 0.8604, - "step": 24701 - }, - { - "epoch": 0.63, - "learning_rate": 1.832973095709053e-06, - "loss": 0.9253, - "step": 24702 - }, - { - "epoch": 0.63, - "learning_rate": 1.8329577849546646e-06, - "loss": 0.5271, - "step": 24703 - }, - { - "epoch": 0.63, - "learning_rate": 1.8329424735625189e-06, - "loss": 1.2119, - "step": 24704 - }, - { - "epoch": 0.63, - "learning_rate": 1.8329271615326275e-06, - "loss": 0.7109, - "step": 24705 - }, - { - "epoch": 0.63, - "learning_rate": 1.832911848865002e-06, - "loss": 0.9609, - "step": 24706 - }, - { - "epoch": 0.63, - "learning_rate": 1.8328965355596542e-06, - "loss": 1.1348, - "step": 24707 - }, - { - "epoch": 0.63, - "learning_rate": 1.832881221616596e-06, - "loss": 0.7244, - "step": 24708 - }, - { - "epoch": 0.63, - "learning_rate": 1.8328659070358388e-06, - "loss": 0.7793, - "step": 24709 - }, - { - "epoch": 0.63, - "learning_rate": 1.8328505918173943e-06, - "loss": 0.9014, - "step": 24710 - }, - { - "epoch": 0.63, - "learning_rate": 1.8328352759612744e-06, - "loss": 1.2148, - "step": 24711 - }, - { - "epoch": 0.63, - "learning_rate": 1.8328199594674912e-06, - "loss": 0.9434, - "step": 24712 - }, - { - "epoch": 0.63, - "learning_rate": 1.8328046423360556e-06, - "loss": 1.0039, - "step": 24713 - }, - { - "epoch": 0.63, - "learning_rate": 1.83278932456698e-06, - "loss": 1.1074, - "step": 24714 - }, - { - "epoch": 0.63, - "learning_rate": 1.8327740061602762e-06, - "loss": 0.5813, - "step": 24715 - }, - { - "epoch": 0.63, - "learning_rate": 1.8327586871159552e-06, - "loss": 0.8018, - "step": 24716 - }, - { - "epoch": 0.63, - "learning_rate": 1.8327433674340293e-06, - "loss": 0.6177, - "step": 24717 - }, - { - "epoch": 0.63, - "learning_rate": 1.8327280471145102e-06, - "loss": 0.999, - "step": 24718 - }, - { - "epoch": 0.63, - "learning_rate": 1.8327127261574093e-06, - "loss": 0.7197, - "step": 24719 - }, - { - "epoch": 0.63, - "learning_rate": 1.8326974045627388e-06, - "loss": 0.5278, - "step": 24720 - }, - { - "epoch": 0.63, - "learning_rate": 1.83268208233051e-06, - "loss": 0.999, - "step": 24721 - }, - { - "epoch": 0.63, - "learning_rate": 1.8326667594607347e-06, - "loss": 0.8818, - "step": 24722 - }, - { - "epoch": 0.63, - "learning_rate": 1.8326514359534251e-06, - "loss": 0.873, - "step": 24723 - }, - { - "epoch": 0.63, - "learning_rate": 1.8326361118085925e-06, - "loss": 0.9746, - "step": 24724 - }, - { - "epoch": 0.63, - "learning_rate": 1.8326207870262484e-06, - "loss": 0.8789, - "step": 24725 - }, - { - "epoch": 0.63, - "learning_rate": 1.8326054616064051e-06, - "loss": 0.6001, - "step": 24726 - }, - { - "epoch": 0.63, - "learning_rate": 1.8325901355490742e-06, - "loss": 0.8022, - "step": 24727 - }, - { - "epoch": 0.63, - "learning_rate": 1.8325748088542672e-06, - "loss": 0.8408, - "step": 24728 - }, - { - "epoch": 0.63, - "learning_rate": 1.8325594815219958e-06, - "loss": 0.9736, - "step": 24729 - }, - { - "epoch": 0.63, - "learning_rate": 1.832544153552272e-06, - "loss": 1.0352, - "step": 24730 - }, - { - "epoch": 0.63, - "learning_rate": 1.8325288249451077e-06, - "loss": 1.0215, - "step": 24731 - }, - { - "epoch": 0.63, - "learning_rate": 1.832513495700514e-06, - "loss": 0.9502, - "step": 24732 - }, - { - "epoch": 0.63, - "learning_rate": 1.832498165818503e-06, - "loss": 0.4979, - "step": 24733 - }, - { - "epoch": 0.63, - "learning_rate": 1.8324828352990866e-06, - "loss": 1.1084, - "step": 24734 - }, - { - "epoch": 0.63, - "learning_rate": 1.8324675041422764e-06, - "loss": 0.8687, - "step": 24735 - }, - { - "epoch": 0.63, - "learning_rate": 1.832452172348084e-06, - "loss": 0.9473, - "step": 24736 - }, - { - "epoch": 0.63, - "learning_rate": 1.8324368399165211e-06, - "loss": 0.8711, - "step": 24737 - }, - { - "epoch": 0.63, - "learning_rate": 1.8324215068476e-06, - "loss": 0.8164, - "step": 24738 - }, - { - "epoch": 0.63, - "learning_rate": 1.8324061731413315e-06, - "loss": 1.0146, - "step": 24739 - }, - { - "epoch": 0.63, - "learning_rate": 1.8323908387977283e-06, - "loss": 0.9014, - "step": 24740 - }, - { - "epoch": 0.63, - "learning_rate": 1.8323755038168015e-06, - "loss": 0.8301, - "step": 24741 - }, - { - "epoch": 0.63, - "learning_rate": 1.832360168198563e-06, - "loss": 1.1113, - "step": 24742 - }, - { - "epoch": 0.63, - "learning_rate": 1.8323448319430248e-06, - "loss": 0.9492, - "step": 24743 - }, - { - "epoch": 0.63, - "learning_rate": 1.832329495050198e-06, - "loss": 0.8062, - "step": 24744 - }, - { - "epoch": 0.63, - "learning_rate": 1.8323141575200954e-06, - "loss": 1.0332, - "step": 24745 - }, - { - "epoch": 0.63, - "learning_rate": 1.8322988193527279e-06, - "loss": 0.8374, - "step": 24746 - }, - { - "epoch": 0.63, - "learning_rate": 1.8322834805481074e-06, - "loss": 1.0146, - "step": 24747 - }, - { - "epoch": 0.63, - "learning_rate": 1.8322681411062456e-06, - "loss": 0.678, - "step": 24748 - }, - { - "epoch": 0.63, - "learning_rate": 1.8322528010271546e-06, - "loss": 0.9219, - "step": 24749 - }, - { - "epoch": 0.63, - "learning_rate": 1.8322374603108458e-06, - "loss": 0.8496, - "step": 24750 - }, - { - "epoch": 0.63, - "learning_rate": 1.8322221189573308e-06, - "loss": 0.6663, - "step": 24751 - }, - { - "epoch": 0.63, - "learning_rate": 1.832206776966622e-06, - "loss": 0.8525, - "step": 24752 - }, - { - "epoch": 0.63, - "learning_rate": 1.8321914343387304e-06, - "loss": 0.7393, - "step": 24753 - }, - { - "epoch": 0.63, - "learning_rate": 1.8321760910736681e-06, - "loss": 0.9785, - "step": 24754 - }, - { - "epoch": 0.63, - "learning_rate": 1.832160747171447e-06, - "loss": 0.9072, - "step": 24755 - }, - { - "epoch": 0.63, - "learning_rate": 1.8321454026320786e-06, - "loss": 0.9502, - "step": 24756 - }, - { - "epoch": 0.63, - "learning_rate": 1.8321300574555746e-06, - "loss": 0.718, - "step": 24757 - }, - { - "epoch": 0.63, - "learning_rate": 1.8321147116419473e-06, - "loss": 0.8574, - "step": 24758 - }, - { - "epoch": 0.63, - "learning_rate": 1.8320993651912079e-06, - "loss": 0.8906, - "step": 24759 - }, - { - "epoch": 0.63, - "learning_rate": 1.832084018103368e-06, - "loss": 0.6675, - "step": 24760 - }, - { - "epoch": 0.63, - "learning_rate": 1.8320686703784396e-06, - "loss": 0.9639, - "step": 24761 - }, - { - "epoch": 0.63, - "learning_rate": 1.8320533220164346e-06, - "loss": 0.7661, - "step": 24762 - }, - { - "epoch": 0.63, - "learning_rate": 1.8320379730173648e-06, - "loss": 0.9873, - "step": 24763 - }, - { - "epoch": 0.63, - "learning_rate": 1.8320226233812417e-06, - "loss": 0.8877, - "step": 24764 - }, - { - "epoch": 0.63, - "learning_rate": 1.832007273108077e-06, - "loss": 0.6638, - "step": 24765 - }, - { - "epoch": 0.63, - "learning_rate": 1.8319919221978827e-06, - "loss": 0.8574, - "step": 24766 - }, - { - "epoch": 0.63, - "learning_rate": 1.8319765706506703e-06, - "loss": 0.9189, - "step": 24767 - }, - { - "epoch": 0.63, - "learning_rate": 1.8319612184664516e-06, - "loss": 0.9277, - "step": 24768 - }, - { - "epoch": 0.63, - "learning_rate": 1.8319458656452388e-06, - "loss": 0.8887, - "step": 24769 - }, - { - "epoch": 0.63, - "learning_rate": 1.8319305121870432e-06, - "loss": 0.7153, - "step": 24770 - }, - { - "epoch": 0.63, - "learning_rate": 1.8319151580918767e-06, - "loss": 0.6699, - "step": 24771 - }, - { - "epoch": 0.63, - "learning_rate": 1.831899803359751e-06, - "loss": 0.7148, - "step": 24772 - }, - { - "epoch": 0.63, - "learning_rate": 1.8318844479906779e-06, - "loss": 0.9023, - "step": 24773 - }, - { - "epoch": 0.63, - "learning_rate": 1.8318690919846688e-06, - "loss": 0.6768, - "step": 24774 - }, - { - "epoch": 0.63, - "learning_rate": 1.831853735341736e-06, - "loss": 0.7954, - "step": 24775 - }, - { - "epoch": 0.64, - "learning_rate": 1.831838378061891e-06, - "loss": 1.0459, - "step": 24776 - }, - { - "epoch": 0.64, - "learning_rate": 1.831823020145146e-06, - "loss": 0.9395, - "step": 24777 - }, - { - "epoch": 0.64, - "learning_rate": 1.8318076615915118e-06, - "loss": 0.644, - "step": 24778 - }, - { - "epoch": 0.64, - "learning_rate": 1.831792302401001e-06, - "loss": 0.7637, - "step": 24779 - }, - { - "epoch": 0.64, - "learning_rate": 1.8317769425736249e-06, - "loss": 0.9541, - "step": 24780 - }, - { - "epoch": 0.64, - "learning_rate": 1.8317615821093957e-06, - "loss": 0.6021, - "step": 24781 - }, - { - "epoch": 0.64, - "learning_rate": 1.8317462210083247e-06, - "loss": 0.9092, - "step": 24782 - }, - { - "epoch": 0.64, - "learning_rate": 1.831730859270424e-06, - "loss": 1.0137, - "step": 24783 - }, - { - "epoch": 0.64, - "learning_rate": 1.8317154968957054e-06, - "loss": 0.8789, - "step": 24784 - }, - { - "epoch": 0.64, - "learning_rate": 1.8317001338841801e-06, - "loss": 0.9111, - "step": 24785 - }, - { - "epoch": 0.64, - "learning_rate": 1.8316847702358603e-06, - "loss": 0.7637, - "step": 24786 - }, - { - "epoch": 0.64, - "learning_rate": 1.8316694059507581e-06, - "loss": 0.936, - "step": 24787 - }, - { - "epoch": 0.64, - "learning_rate": 1.8316540410288845e-06, - "loss": 0.709, - "step": 24788 - }, - { - "epoch": 0.64, - "learning_rate": 1.8316386754702515e-06, - "loss": 0.8137, - "step": 24789 - }, - { - "epoch": 0.64, - "learning_rate": 1.8316233092748714e-06, - "loss": 0.958, - "step": 24790 - }, - { - "epoch": 0.64, - "learning_rate": 1.8316079424427553e-06, - "loss": 0.8555, - "step": 24791 - }, - { - "epoch": 0.64, - "learning_rate": 1.8315925749739154e-06, - "loss": 0.998, - "step": 24792 - }, - { - "epoch": 0.64, - "learning_rate": 1.8315772068683632e-06, - "loss": 0.9023, - "step": 24793 - }, - { - "epoch": 0.64, - "learning_rate": 1.8315618381261107e-06, - "loss": 0.9585, - "step": 24794 - }, - { - "epoch": 0.64, - "learning_rate": 1.8315464687471694e-06, - "loss": 1.0166, - "step": 24795 - }, - { - "epoch": 0.64, - "learning_rate": 1.8315310987315513e-06, - "loss": 0.491, - "step": 24796 - }, - { - "epoch": 0.64, - "learning_rate": 1.831515728079268e-06, - "loss": 0.916, - "step": 24797 - }, - { - "epoch": 0.64, - "learning_rate": 1.8315003567903315e-06, - "loss": 0.8164, - "step": 24798 - }, - { - "epoch": 0.64, - "learning_rate": 1.8314849848647534e-06, - "loss": 1.0322, - "step": 24799 - }, - { - "epoch": 0.64, - "learning_rate": 1.8314696123025452e-06, - "loss": 0.6526, - "step": 24800 - }, - { - "epoch": 0.64, - "learning_rate": 1.831454239103719e-06, - "loss": 0.6172, - "step": 24801 - }, - { - "epoch": 0.64, - "learning_rate": 1.8314388652682867e-06, - "loss": 0.6885, - "step": 24802 - }, - { - "epoch": 0.64, - "learning_rate": 1.8314234907962597e-06, - "loss": 0.73, - "step": 24803 - }, - { - "epoch": 0.64, - "learning_rate": 1.8314081156876502e-06, - "loss": 0.9131, - "step": 24804 - }, - { - "epoch": 0.64, - "learning_rate": 1.8313927399424696e-06, - "loss": 0.7183, - "step": 24805 - }, - { - "epoch": 0.64, - "learning_rate": 1.83137736356073e-06, - "loss": 1.0713, - "step": 24806 - }, - { - "epoch": 0.64, - "learning_rate": 1.8313619865424428e-06, - "loss": 0.918, - "step": 24807 - }, - { - "epoch": 0.64, - "learning_rate": 1.83134660888762e-06, - "loss": 0.916, - "step": 24808 - }, - { - "epoch": 0.64, - "learning_rate": 1.8313312305962732e-06, - "loss": 0.9043, - "step": 24809 - }, - { - "epoch": 0.64, - "learning_rate": 1.8313158516684144e-06, - "loss": 0.8867, - "step": 24810 - }, - { - "epoch": 0.64, - "learning_rate": 1.8313004721040552e-06, - "loss": 0.9961, - "step": 24811 - }, - { - "epoch": 0.64, - "learning_rate": 1.8312850919032075e-06, - "loss": 0.9346, - "step": 24812 - }, - { - "epoch": 0.64, - "learning_rate": 1.8312697110658831e-06, - "loss": 0.7012, - "step": 24813 - }, - { - "epoch": 0.64, - "learning_rate": 1.8312543295920938e-06, - "loss": 1.0352, - "step": 24814 - }, - { - "epoch": 0.64, - "learning_rate": 1.831238947481851e-06, - "loss": 1.2207, - "step": 24815 - }, - { - "epoch": 0.64, - "learning_rate": 1.831223564735167e-06, - "loss": 0.9297, - "step": 24816 - }, - { - "epoch": 0.64, - "learning_rate": 1.831208181352053e-06, - "loss": 0.7246, - "step": 24817 - }, - { - "epoch": 0.64, - "learning_rate": 1.8311927973325214e-06, - "loss": 0.9175, - "step": 24818 - }, - { - "epoch": 0.64, - "learning_rate": 1.8311774126765838e-06, - "loss": 0.8457, - "step": 24819 - }, - { - "epoch": 0.64, - "learning_rate": 1.8311620273842516e-06, - "loss": 0.562, - "step": 24820 - }, - { - "epoch": 0.64, - "learning_rate": 1.8311466414555369e-06, - "loss": 0.8887, - "step": 24821 - }, - { - "epoch": 0.64, - "learning_rate": 1.8311312548904519e-06, - "loss": 0.9336, - "step": 24822 - }, - { - "epoch": 0.64, - "learning_rate": 1.8311158676890073e-06, - "loss": 0.9043, - "step": 24823 - }, - { - "epoch": 0.64, - "learning_rate": 1.8311004798512157e-06, - "loss": 0.9004, - "step": 24824 - }, - { - "epoch": 0.64, - "learning_rate": 1.8310850913770889e-06, - "loss": 0.9834, - "step": 24825 - }, - { - "epoch": 0.64, - "learning_rate": 1.8310697022666378e-06, - "loss": 0.9941, - "step": 24826 - }, - { - "epoch": 0.64, - "learning_rate": 1.8310543125198756e-06, - "loss": 0.7744, - "step": 24827 - }, - { - "epoch": 0.64, - "learning_rate": 1.831038922136813e-06, - "loss": 0.8398, - "step": 24828 - }, - { - "epoch": 0.64, - "learning_rate": 1.8310235311174621e-06, - "loss": 0.9873, - "step": 24829 - }, - { - "epoch": 0.64, - "learning_rate": 1.8310081394618349e-06, - "loss": 0.8867, - "step": 24830 - }, - { - "epoch": 0.64, - "learning_rate": 1.8309927471699427e-06, - "loss": 0.6353, - "step": 24831 - }, - { - "epoch": 0.64, - "learning_rate": 1.8309773542417978e-06, - "loss": 0.8916, - "step": 24832 - }, - { - "epoch": 0.64, - "learning_rate": 1.8309619606774116e-06, - "loss": 0.8228, - "step": 24833 - }, - { - "epoch": 0.64, - "learning_rate": 1.830946566476796e-06, - "loss": 0.8457, - "step": 24834 - }, - { - "epoch": 0.64, - "learning_rate": 1.8309311716399626e-06, - "loss": 1.1934, - "step": 24835 - }, - { - "epoch": 0.64, - "learning_rate": 1.830915776166924e-06, - "loss": 0.8789, - "step": 24836 - }, - { - "epoch": 0.64, - "learning_rate": 1.830900380057691e-06, - "loss": 0.8955, - "step": 24837 - }, - { - "epoch": 0.64, - "learning_rate": 1.8308849833122756e-06, - "loss": 0.9492, - "step": 24838 - }, - { - "epoch": 0.64, - "learning_rate": 1.8308695859306904e-06, - "loss": 0.6826, - "step": 24839 - }, - { - "epoch": 0.64, - "learning_rate": 1.830854187912946e-06, - "loss": 1.0273, - "step": 24840 - }, - { - "epoch": 0.64, - "learning_rate": 1.830838789259055e-06, - "loss": 0.9961, - "step": 24841 - }, - { - "epoch": 0.64, - "learning_rate": 1.8308233899690291e-06, - "loss": 1.041, - "step": 24842 - }, - { - "epoch": 0.64, - "learning_rate": 1.8308079900428796e-06, - "loss": 0.8018, - "step": 24843 - }, - { - "epoch": 0.64, - "learning_rate": 1.8307925894806186e-06, - "loss": 0.834, - "step": 24844 - }, - { - "epoch": 0.64, - "learning_rate": 1.8307771882822582e-06, - "loss": 0.7666, - "step": 24845 - }, - { - "epoch": 0.64, - "learning_rate": 1.8307617864478098e-06, - "loss": 0.8169, - "step": 24846 - }, - { - "epoch": 0.64, - "learning_rate": 1.8307463839772853e-06, - "loss": 0.833, - "step": 24847 - }, - { - "epoch": 0.64, - "learning_rate": 1.8307309808706966e-06, - "loss": 1.0068, - "step": 24848 - }, - { - "epoch": 0.64, - "learning_rate": 1.830715577128055e-06, - "loss": 0.5728, - "step": 24849 - }, - { - "epoch": 0.64, - "learning_rate": 1.8307001727493731e-06, - "loss": 0.8418, - "step": 24850 - }, - { - "epoch": 0.64, - "learning_rate": 1.8306847677346622e-06, - "loss": 0.957, - "step": 24851 - }, - { - "epoch": 0.64, - "learning_rate": 1.830669362083934e-06, - "loss": 0.9873, - "step": 24852 - }, - { - "epoch": 0.64, - "learning_rate": 1.8306539557972006e-06, - "loss": 0.9365, - "step": 24853 - }, - { - "epoch": 0.64, - "learning_rate": 1.8306385488744736e-06, - "loss": 0.7925, - "step": 24854 - }, - { - "epoch": 0.64, - "learning_rate": 1.8306231413157649e-06, - "loss": 0.6875, - "step": 24855 - }, - { - "epoch": 0.64, - "learning_rate": 1.830607733121086e-06, - "loss": 0.9688, - "step": 24856 - }, - { - "epoch": 0.64, - "learning_rate": 1.8305923242904493e-06, - "loss": 0.8311, - "step": 24857 - }, - { - "epoch": 0.64, - "learning_rate": 1.8305769148238662e-06, - "loss": 0.8438, - "step": 24858 - }, - { - "epoch": 0.64, - "learning_rate": 1.8305615047213483e-06, - "loss": 0.8301, - "step": 24859 - }, - { - "epoch": 0.64, - "learning_rate": 1.8305460939829075e-06, - "loss": 0.9473, - "step": 24860 - }, - { - "epoch": 0.64, - "learning_rate": 1.8305306826085563e-06, - "loss": 0.8682, - "step": 24861 - }, - { - "epoch": 0.64, - "learning_rate": 1.8305152705983055e-06, - "loss": 0.6018, - "step": 24862 - }, - { - "epoch": 0.64, - "learning_rate": 1.8304998579521678e-06, - "loss": 0.9277, - "step": 24863 - }, - { - "epoch": 0.64, - "learning_rate": 1.8304844446701542e-06, - "loss": 0.9541, - "step": 24864 - }, - { - "epoch": 0.64, - "learning_rate": 1.830469030752277e-06, - "loss": 0.791, - "step": 24865 - }, - { - "epoch": 0.64, - "learning_rate": 1.8304536161985477e-06, - "loss": 0.729, - "step": 24866 - }, - { - "epoch": 0.64, - "learning_rate": 1.8304382010089782e-06, - "loss": 0.9873, - "step": 24867 - }, - { - "epoch": 0.64, - "learning_rate": 1.8304227851835807e-06, - "loss": 0.5605, - "step": 24868 - }, - { - "epoch": 0.64, - "learning_rate": 1.8304073687223666e-06, - "loss": 0.9248, - "step": 24869 - }, - { - "epoch": 0.64, - "learning_rate": 1.8303919516253475e-06, - "loss": 0.5918, - "step": 24870 - }, - { - "epoch": 0.64, - "learning_rate": 1.8303765338925357e-06, - "loss": 0.7197, - "step": 24871 - }, - { - "epoch": 0.64, - "learning_rate": 1.8303611155239428e-06, - "loss": 0.7744, - "step": 24872 - }, - { - "epoch": 0.64, - "learning_rate": 1.83034569651958e-06, - "loss": 0.6045, - "step": 24873 - }, - { - "epoch": 0.64, - "learning_rate": 1.8303302768794601e-06, - "loss": 0.8906, - "step": 24874 - }, - { - "epoch": 0.64, - "learning_rate": 1.8303148566035946e-06, - "loss": 0.9688, - "step": 24875 - }, - { - "epoch": 0.64, - "learning_rate": 1.830299435691995e-06, - "loss": 0.835, - "step": 24876 - }, - { - "epoch": 0.64, - "learning_rate": 1.8302840141446735e-06, - "loss": 0.9766, - "step": 24877 - }, - { - "epoch": 0.64, - "learning_rate": 1.8302685919616415e-06, - "loss": 0.9805, - "step": 24878 - }, - { - "epoch": 0.64, - "learning_rate": 1.8302531691429111e-06, - "loss": 0.873, - "step": 24879 - }, - { - "epoch": 0.64, - "learning_rate": 1.830237745688494e-06, - "loss": 0.8506, - "step": 24880 - }, - { - "epoch": 0.64, - "learning_rate": 1.8302223215984021e-06, - "loss": 0.9082, - "step": 24881 - }, - { - "epoch": 0.64, - "learning_rate": 1.8302068968726471e-06, - "loss": 0.7949, - "step": 24882 - }, - { - "epoch": 0.64, - "learning_rate": 1.8301914715112407e-06, - "loss": 0.8306, - "step": 24883 - }, - { - "epoch": 0.64, - "learning_rate": 1.8301760455141953e-06, - "loss": 0.5898, - "step": 24884 - }, - { - "epoch": 0.64, - "learning_rate": 1.830160618881522e-06, - "loss": 0.6821, - "step": 24885 - }, - { - "epoch": 0.64, - "learning_rate": 1.8301451916132326e-06, - "loss": 0.6733, - "step": 24886 - }, - { - "epoch": 0.64, - "learning_rate": 1.8301297637093396e-06, - "loss": 0.6862, - "step": 24887 - }, - { - "epoch": 0.64, - "learning_rate": 1.8301143351698545e-06, - "loss": 0.6182, - "step": 24888 - }, - { - "epoch": 0.64, - "learning_rate": 1.8300989059947887e-06, - "loss": 0.7832, - "step": 24889 - }, - { - "epoch": 0.64, - "learning_rate": 1.8300834761841543e-06, - "loss": 0.8384, - "step": 24890 - }, - { - "epoch": 0.64, - "learning_rate": 1.8300680457379634e-06, - "loss": 0.7959, - "step": 24891 - }, - { - "epoch": 0.64, - "learning_rate": 1.8300526146562275e-06, - "loss": 0.9492, - "step": 24892 - }, - { - "epoch": 0.64, - "learning_rate": 1.8300371829389585e-06, - "loss": 0.8442, - "step": 24893 - }, - { - "epoch": 0.64, - "learning_rate": 1.8300217505861682e-06, - "loss": 0.8022, - "step": 24894 - }, - { - "epoch": 0.64, - "learning_rate": 1.8300063175978685e-06, - "loss": 0.9268, - "step": 24895 - }, - { - "epoch": 0.64, - "learning_rate": 1.8299908839740706e-06, - "loss": 0.6934, - "step": 24896 - }, - { - "epoch": 0.64, - "learning_rate": 1.8299754497147872e-06, - "loss": 0.8564, - "step": 24897 - }, - { - "epoch": 0.64, - "learning_rate": 1.8299600148200298e-06, - "loss": 0.7896, - "step": 24898 - }, - { - "epoch": 0.64, - "learning_rate": 1.8299445792898103e-06, - "loss": 0.8486, - "step": 24899 - }, - { - "epoch": 0.64, - "learning_rate": 1.8299291431241403e-06, - "loss": 0.8564, - "step": 24900 - }, - { - "epoch": 0.64, - "learning_rate": 1.8299137063230317e-06, - "loss": 0.8447, - "step": 24901 - }, - { - "epoch": 0.64, - "learning_rate": 1.8298982688864961e-06, - "loss": 0.749, - "step": 24902 - }, - { - "epoch": 0.64, - "learning_rate": 1.829882830814546e-06, - "loss": 1.0449, - "step": 24903 - }, - { - "epoch": 0.64, - "learning_rate": 1.8298673921071926e-06, - "loss": 0.8369, - "step": 24904 - }, - { - "epoch": 0.64, - "learning_rate": 1.829851952764448e-06, - "loss": 0.8604, - "step": 24905 - }, - { - "epoch": 0.64, - "learning_rate": 1.8298365127863233e-06, - "loss": 0.8379, - "step": 24906 - }, - { - "epoch": 0.64, - "learning_rate": 1.8298210721728316e-06, - "loss": 0.8672, - "step": 24907 - }, - { - "epoch": 0.64, - "learning_rate": 1.8298056309239837e-06, - "loss": 0.7041, - "step": 24908 - }, - { - "epoch": 0.64, - "learning_rate": 1.829790189039792e-06, - "loss": 0.7441, - "step": 24909 - }, - { - "epoch": 0.64, - "learning_rate": 1.8297747465202683e-06, - "loss": 0.9053, - "step": 24910 - }, - { - "epoch": 0.64, - "learning_rate": 1.8297593033654239e-06, - "loss": 1.085, - "step": 24911 - }, - { - "epoch": 0.64, - "learning_rate": 1.829743859575271e-06, - "loss": 0.9355, - "step": 24912 - }, - { - "epoch": 0.64, - "learning_rate": 1.8297284151498214e-06, - "loss": 0.9268, - "step": 24913 - }, - { - "epoch": 0.64, - "learning_rate": 1.829712970089087e-06, - "loss": 0.835, - "step": 24914 - }, - { - "epoch": 0.64, - "learning_rate": 1.8296975243930791e-06, - "loss": 0.998, - "step": 24915 - }, - { - "epoch": 0.64, - "learning_rate": 1.8296820780618106e-06, - "loss": 0.8066, - "step": 24916 - }, - { - "epoch": 0.64, - "learning_rate": 1.8296666310952925e-06, - "loss": 0.7886, - "step": 24917 - }, - { - "epoch": 0.64, - "learning_rate": 1.8296511834935363e-06, - "loss": 0.7603, - "step": 24918 - }, - { - "epoch": 0.64, - "learning_rate": 1.8296357352565548e-06, - "loss": 0.9492, - "step": 24919 - }, - { - "epoch": 0.64, - "learning_rate": 1.8296202863843595e-06, - "loss": 0.9844, - "step": 24920 - }, - { - "epoch": 0.64, - "learning_rate": 1.8296048368769616e-06, - "loss": 0.8379, - "step": 24921 - }, - { - "epoch": 0.64, - "learning_rate": 1.8295893867343738e-06, - "loss": 0.8154, - "step": 24922 - }, - { - "epoch": 0.64, - "learning_rate": 1.8295739359566075e-06, - "loss": 0.8262, - "step": 24923 - }, - { - "epoch": 0.64, - "learning_rate": 1.8295584845436744e-06, - "loss": 0.7637, - "step": 24924 - }, - { - "epoch": 0.64, - "learning_rate": 1.8295430324955867e-06, - "loss": 0.7314, - "step": 24925 - }, - { - "epoch": 0.64, - "learning_rate": 1.8295275798123563e-06, - "loss": 0.7529, - "step": 24926 - }, - { - "epoch": 0.64, - "learning_rate": 1.8295121264939942e-06, - "loss": 0.9082, - "step": 24927 - }, - { - "epoch": 0.64, - "learning_rate": 1.8294966725405131e-06, - "loss": 1.0029, - "step": 24928 - }, - { - "epoch": 0.64, - "learning_rate": 1.8294812179519248e-06, - "loss": 1.1426, - "step": 24929 - }, - { - "epoch": 0.64, - "learning_rate": 1.8294657627282403e-06, - "loss": 1.0635, - "step": 24930 - }, - { - "epoch": 0.64, - "learning_rate": 1.8294503068694725e-06, - "loss": 0.9688, - "step": 24931 - }, - { - "epoch": 0.64, - "learning_rate": 1.8294348503756324e-06, - "loss": 0.9502, - "step": 24932 - }, - { - "epoch": 0.64, - "learning_rate": 1.8294193932467324e-06, - "loss": 0.874, - "step": 24933 - }, - { - "epoch": 0.64, - "learning_rate": 1.8294039354827842e-06, - "loss": 0.9004, - "step": 24934 - }, - { - "epoch": 0.64, - "learning_rate": 1.8293884770837993e-06, - "loss": 0.8408, - "step": 24935 - }, - { - "epoch": 0.64, - "learning_rate": 1.8293730180497896e-06, - "loss": 1.0117, - "step": 24936 - }, - { - "epoch": 0.64, - "learning_rate": 1.8293575583807676e-06, - "loss": 0.7588, - "step": 24937 - }, - { - "epoch": 0.64, - "learning_rate": 1.8293420980767444e-06, - "loss": 0.7937, - "step": 24938 - }, - { - "epoch": 0.64, - "learning_rate": 1.829326637137732e-06, - "loss": 0.8184, - "step": 24939 - }, - { - "epoch": 0.64, - "learning_rate": 1.8293111755637426e-06, - "loss": 0.874, - "step": 24940 - }, - { - "epoch": 0.64, - "learning_rate": 1.8292957133547876e-06, - "loss": 0.9834, - "step": 24941 - }, - { - "epoch": 0.64, - "learning_rate": 1.829280250510879e-06, - "loss": 0.8398, - "step": 24942 - }, - { - "epoch": 0.64, - "learning_rate": 1.8292647870320285e-06, - "loss": 1.0488, - "step": 24943 - }, - { - "epoch": 0.64, - "learning_rate": 1.8292493229182485e-06, - "loss": 0.7363, - "step": 24944 - }, - { - "epoch": 0.64, - "learning_rate": 1.82923385816955e-06, - "loss": 0.9717, - "step": 24945 - }, - { - "epoch": 0.64, - "learning_rate": 1.8292183927859452e-06, - "loss": 0.8921, - "step": 24946 - }, - { - "epoch": 0.64, - "learning_rate": 1.8292029267674462e-06, - "loss": 0.8008, - "step": 24947 - }, - { - "epoch": 0.64, - "learning_rate": 1.8291874601140647e-06, - "loss": 0.7617, - "step": 24948 - }, - { - "epoch": 0.64, - "learning_rate": 1.8291719928258125e-06, - "loss": 0.9482, - "step": 24949 - }, - { - "epoch": 0.64, - "learning_rate": 1.8291565249027015e-06, - "loss": 0.7871, - "step": 24950 - }, - { - "epoch": 0.64, - "learning_rate": 1.8291410563447433e-06, - "loss": 0.8232, - "step": 24951 - }, - { - "epoch": 0.64, - "learning_rate": 1.82912558715195e-06, - "loss": 0.8164, - "step": 24952 - }, - { - "epoch": 0.64, - "learning_rate": 1.8291101173243333e-06, - "loss": 0.9971, - "step": 24953 - }, - { - "epoch": 0.64, - "learning_rate": 1.8290946468619052e-06, - "loss": 0.9531, - "step": 24954 - }, - { - "epoch": 0.64, - "learning_rate": 1.8290791757646774e-06, - "loss": 1.0869, - "step": 24955 - }, - { - "epoch": 0.64, - "learning_rate": 1.8290637040326618e-06, - "loss": 0.8438, - "step": 24956 - }, - { - "epoch": 0.64, - "learning_rate": 1.82904823166587e-06, - "loss": 0.7822, - "step": 24957 - }, - { - "epoch": 0.64, - "learning_rate": 1.8290327586643146e-06, - "loss": 0.605, - "step": 24958 - }, - { - "epoch": 0.64, - "learning_rate": 1.8290172850280066e-06, - "loss": 0.9443, - "step": 24959 - }, - { - "epoch": 0.64, - "learning_rate": 1.8290018107569582e-06, - "loss": 0.8022, - "step": 24960 - }, - { - "epoch": 0.64, - "learning_rate": 1.8289863358511814e-06, - "loss": 0.9023, - "step": 24961 - }, - { - "epoch": 0.64, - "learning_rate": 1.8289708603106876e-06, - "loss": 0.8047, - "step": 24962 - }, - { - "epoch": 0.64, - "learning_rate": 1.8289553841354892e-06, - "loss": 0.8574, - "step": 24963 - }, - { - "epoch": 0.64, - "learning_rate": 1.8289399073255978e-06, - "loss": 1.1006, - "step": 24964 - }, - { - "epoch": 0.64, - "learning_rate": 1.828924429881025e-06, - "loss": 0.7832, - "step": 24965 - }, - { - "epoch": 0.64, - "learning_rate": 1.828908951801783e-06, - "loss": 0.666, - "step": 24966 - }, - { - "epoch": 0.64, - "learning_rate": 1.8288934730878834e-06, - "loss": 0.71, - "step": 24967 - }, - { - "epoch": 0.64, - "learning_rate": 1.828877993739338e-06, - "loss": 0.8604, - "step": 24968 - }, - { - "epoch": 0.64, - "learning_rate": 1.8288625137561593e-06, - "loss": 0.8379, - "step": 24969 - }, - { - "epoch": 0.64, - "learning_rate": 1.8288470331383586e-06, - "loss": 0.7603, - "step": 24970 - }, - { - "epoch": 0.64, - "learning_rate": 1.8288315518859477e-06, - "loss": 0.8525, - "step": 24971 - }, - { - "epoch": 0.64, - "learning_rate": 1.8288160699989387e-06, - "loss": 0.9707, - "step": 24972 - }, - { - "epoch": 0.64, - "learning_rate": 1.8288005874773434e-06, - "loss": 1.0586, - "step": 24973 - }, - { - "epoch": 0.64, - "learning_rate": 1.8287851043211732e-06, - "loss": 0.8237, - "step": 24974 - }, - { - "epoch": 0.64, - "learning_rate": 1.828769620530441e-06, - "loss": 0.9951, - "step": 24975 - }, - { - "epoch": 0.64, - "learning_rate": 1.8287541361051575e-06, - "loss": 0.9824, - "step": 24976 - }, - { - "epoch": 0.64, - "learning_rate": 1.8287386510453354e-06, - "loss": 0.8613, - "step": 24977 - }, - { - "epoch": 0.64, - "learning_rate": 1.8287231653509857e-06, - "loss": 0.8789, - "step": 24978 - }, - { - "epoch": 0.64, - "learning_rate": 1.8287076790221213e-06, - "loss": 0.7793, - "step": 24979 - }, - { - "epoch": 0.64, - "learning_rate": 1.8286921920587532e-06, - "loss": 0.9277, - "step": 24980 - }, - { - "epoch": 0.64, - "learning_rate": 1.8286767044608937e-06, - "loss": 1.0166, - "step": 24981 - }, - { - "epoch": 0.64, - "learning_rate": 1.8286612162285548e-06, - "loss": 1.0381, - "step": 24982 - }, - { - "epoch": 0.64, - "learning_rate": 1.8286457273617478e-06, - "loss": 0.8379, - "step": 24983 - }, - { - "epoch": 0.64, - "learning_rate": 1.828630237860485e-06, - "loss": 0.9775, - "step": 24984 - }, - { - "epoch": 0.64, - "learning_rate": 1.828614747724778e-06, - "loss": 0.7275, - "step": 24985 - }, - { - "epoch": 0.64, - "learning_rate": 1.828599256954639e-06, - "loss": 0.748, - "step": 24986 - }, - { - "epoch": 0.64, - "learning_rate": 1.8285837655500793e-06, - "loss": 0.8281, - "step": 24987 - }, - { - "epoch": 0.64, - "learning_rate": 1.8285682735111117e-06, - "loss": 0.8975, - "step": 24988 - }, - { - "epoch": 0.64, - "learning_rate": 1.828552780837747e-06, - "loss": 0.8608, - "step": 24989 - }, - { - "epoch": 0.64, - "learning_rate": 1.8285372875299976e-06, - "loss": 0.9238, - "step": 24990 - }, - { - "epoch": 0.64, - "learning_rate": 1.828521793587875e-06, - "loss": 0.6577, - "step": 24991 - }, - { - "epoch": 0.64, - "learning_rate": 1.828506299011392e-06, - "loss": 0.8174, - "step": 24992 - }, - { - "epoch": 0.64, - "learning_rate": 1.8284908038005596e-06, - "loss": 0.7734, - "step": 24993 - }, - { - "epoch": 0.64, - "learning_rate": 1.8284753079553897e-06, - "loss": 0.9209, - "step": 24994 - }, - { - "epoch": 0.64, - "learning_rate": 1.8284598114758944e-06, - "loss": 1.0742, - "step": 24995 - }, - { - "epoch": 0.64, - "learning_rate": 1.8284443143620858e-06, - "loss": 0.9111, - "step": 24996 - }, - { - "epoch": 0.64, - "learning_rate": 1.8284288166139753e-06, - "loss": 0.731, - "step": 24997 - }, - { - "epoch": 0.64, - "learning_rate": 1.8284133182315745e-06, - "loss": 0.8394, - "step": 24998 - }, - { - "epoch": 0.64, - "learning_rate": 1.8283978192148962e-06, - "loss": 0.9048, - "step": 24999 - }, - { - "epoch": 0.64, - "learning_rate": 1.8283823195639518e-06, - "loss": 0.7412, - "step": 25000 - }, - { - "epoch": 0.64, - "learning_rate": 1.8283668192787532e-06, - "loss": 0.8442, - "step": 25001 - }, - { - "epoch": 0.64, - "learning_rate": 1.828351318359312e-06, - "loss": 0.8604, - "step": 25002 - }, - { - "epoch": 0.64, - "learning_rate": 1.8283358168056404e-06, - "loss": 0.792, - "step": 25003 - }, - { - "epoch": 0.64, - "learning_rate": 1.8283203146177502e-06, - "loss": 1.0547, - "step": 25004 - }, - { - "epoch": 0.64, - "learning_rate": 1.828304811795653e-06, - "loss": 0.8408, - "step": 25005 - }, - { - "epoch": 0.64, - "learning_rate": 1.8282893083393609e-06, - "loss": 0.9756, - "step": 25006 - }, - { - "epoch": 0.64, - "learning_rate": 1.8282738042488858e-06, - "loss": 0.96, - "step": 25007 - }, - { - "epoch": 0.64, - "learning_rate": 1.8282582995242397e-06, - "loss": 0.7148, - "step": 25008 - }, - { - "epoch": 0.64, - "learning_rate": 1.8282427941654344e-06, - "loss": 0.9424, - "step": 25009 - }, - { - "epoch": 0.64, - "learning_rate": 1.8282272881724813e-06, - "loss": 1.1211, - "step": 25010 - }, - { - "epoch": 0.64, - "learning_rate": 1.8282117815453929e-06, - "loss": 0.6592, - "step": 25011 - }, - { - "epoch": 0.64, - "learning_rate": 1.8281962742841808e-06, - "loss": 0.604, - "step": 25012 - }, - { - "epoch": 0.64, - "learning_rate": 1.828180766388857e-06, - "loss": 0.7178, - "step": 25013 - }, - { - "epoch": 0.64, - "learning_rate": 1.828165257859433e-06, - "loss": 0.7065, - "step": 25014 - }, - { - "epoch": 0.64, - "learning_rate": 1.828149748695921e-06, - "loss": 1.0059, - "step": 25015 - }, - { - "epoch": 0.64, - "learning_rate": 1.8281342388983329e-06, - "loss": 0.894, - "step": 25016 - }, - { - "epoch": 0.64, - "learning_rate": 1.8281187284666805e-06, - "loss": 0.8428, - "step": 25017 - }, - { - "epoch": 0.64, - "learning_rate": 1.8281032174009757e-06, - "loss": 0.9844, - "step": 25018 - }, - { - "epoch": 0.64, - "learning_rate": 1.8280877057012303e-06, - "loss": 0.7969, - "step": 25019 - }, - { - "epoch": 0.64, - "learning_rate": 1.8280721933674562e-06, - "loss": 0.8242, - "step": 25020 - }, - { - "epoch": 0.64, - "learning_rate": 1.8280566803996652e-06, - "loss": 0.8564, - "step": 25021 - }, - { - "epoch": 0.64, - "learning_rate": 1.8280411667978694e-06, - "loss": 0.7524, - "step": 25022 - }, - { - "epoch": 0.64, - "learning_rate": 1.8280256525620805e-06, - "loss": 0.9854, - "step": 25023 - }, - { - "epoch": 0.64, - "learning_rate": 1.8280101376923105e-06, - "loss": 0.7378, - "step": 25024 - }, - { - "epoch": 0.64, - "learning_rate": 1.8279946221885712e-06, - "loss": 0.7466, - "step": 25025 - }, - { - "epoch": 0.64, - "learning_rate": 1.8279791060508744e-06, - "loss": 0.8809, - "step": 25026 - }, - { - "epoch": 0.64, - "learning_rate": 1.8279635892792323e-06, - "loss": 0.6763, - "step": 25027 - }, - { - "epoch": 0.64, - "learning_rate": 1.8279480718736564e-06, - "loss": 1.0645, - "step": 25028 - }, - { - "epoch": 0.64, - "learning_rate": 1.8279325538341586e-06, - "loss": 0.7749, - "step": 25029 - }, - { - "epoch": 0.64, - "learning_rate": 1.827917035160751e-06, - "loss": 0.9775, - "step": 25030 - }, - { - "epoch": 0.64, - "learning_rate": 1.8279015158534454e-06, - "loss": 0.8203, - "step": 25031 - }, - { - "epoch": 0.64, - "learning_rate": 1.8278859959122537e-06, - "loss": 1.0107, - "step": 25032 - }, - { - "epoch": 0.64, - "learning_rate": 1.8278704753371876e-06, - "loss": 0.8857, - "step": 25033 - }, - { - "epoch": 0.64, - "learning_rate": 1.8278549541282596e-06, - "loss": 0.9443, - "step": 25034 - }, - { - "epoch": 0.64, - "learning_rate": 1.8278394322854806e-06, - "loss": 0.8945, - "step": 25035 - }, - { - "epoch": 0.64, - "learning_rate": 1.8278239098088632e-06, - "loss": 0.8086, - "step": 25036 - }, - { - "epoch": 0.64, - "learning_rate": 1.8278083866984194e-06, - "loss": 0.9131, - "step": 25037 - }, - { - "epoch": 0.64, - "learning_rate": 1.8277928629541606e-06, - "loss": 0.7827, - "step": 25038 - }, - { - "epoch": 0.64, - "learning_rate": 1.8277773385760987e-06, - "loss": 1.0449, - "step": 25039 - }, - { - "epoch": 0.64, - "learning_rate": 1.8277618135642459e-06, - "loss": 0.855, - "step": 25040 - }, - { - "epoch": 0.64, - "learning_rate": 1.8277462879186136e-06, - "loss": 0.9814, - "step": 25041 - }, - { - "epoch": 0.64, - "learning_rate": 1.8277307616392147e-06, - "loss": 0.8037, - "step": 25042 - }, - { - "epoch": 0.64, - "learning_rate": 1.8277152347260598e-06, - "loss": 0.9336, - "step": 25043 - }, - { - "epoch": 0.64, - "learning_rate": 1.8276997071791619e-06, - "loss": 1.1338, - "step": 25044 - }, - { - "epoch": 0.64, - "learning_rate": 1.8276841789985319e-06, - "loss": 0.8838, - "step": 25045 - }, - { - "epoch": 0.64, - "learning_rate": 1.8276686501841825e-06, - "loss": 0.7451, - "step": 25046 - }, - { - "epoch": 0.64, - "learning_rate": 1.827653120736125e-06, - "loss": 0.9297, - "step": 25047 - }, - { - "epoch": 0.64, - "learning_rate": 1.8276375906543718e-06, - "loss": 0.9375, - "step": 25048 - }, - { - "epoch": 0.64, - "learning_rate": 1.8276220599389345e-06, - "loss": 0.9414, - "step": 25049 - }, - { - "epoch": 0.64, - "learning_rate": 1.827606528589825e-06, - "loss": 0.7441, - "step": 25050 - }, - { - "epoch": 0.64, - "learning_rate": 1.8275909966070552e-06, - "loss": 0.6797, - "step": 25051 - }, - { - "epoch": 0.64, - "learning_rate": 1.8275754639906373e-06, - "loss": 0.8447, - "step": 25052 - }, - { - "epoch": 0.64, - "learning_rate": 1.8275599307405827e-06, - "loss": 0.9404, - "step": 25053 - }, - { - "epoch": 0.64, - "learning_rate": 1.8275443968569034e-06, - "loss": 0.7319, - "step": 25054 - }, - { - "epoch": 0.64, - "learning_rate": 1.8275288623396117e-06, - "loss": 1.002, - "step": 25055 - }, - { - "epoch": 0.64, - "learning_rate": 1.8275133271887188e-06, - "loss": 0.8403, - "step": 25056 - }, - { - "epoch": 0.64, - "learning_rate": 1.8274977914042374e-06, - "loss": 0.6787, - "step": 25057 - }, - { - "epoch": 0.64, - "learning_rate": 1.8274822549861787e-06, - "loss": 0.8027, - "step": 25058 - }, - { - "epoch": 0.64, - "learning_rate": 1.8274667179345551e-06, - "loss": 0.8613, - "step": 25059 - }, - { - "epoch": 0.64, - "learning_rate": 1.8274511802493782e-06, - "loss": 0.7886, - "step": 25060 - }, - { - "epoch": 0.64, - "learning_rate": 1.82743564193066e-06, - "loss": 1.0459, - "step": 25061 - }, - { - "epoch": 0.64, - "learning_rate": 1.8274201029784124e-06, - "loss": 0.8931, - "step": 25062 - }, - { - "epoch": 0.64, - "learning_rate": 1.8274045633926472e-06, - "loss": 0.7886, - "step": 25063 - }, - { - "epoch": 0.64, - "learning_rate": 1.8273890231733762e-06, - "loss": 0.729, - "step": 25064 - }, - { - "epoch": 0.64, - "learning_rate": 1.8273734823206117e-06, - "loss": 0.8906, - "step": 25065 - }, - { - "epoch": 0.64, - "learning_rate": 1.8273579408343655e-06, - "loss": 0.9277, - "step": 25066 - }, - { - "epoch": 0.64, - "learning_rate": 1.827342398714649e-06, - "loss": 0.8057, - "step": 25067 - }, - { - "epoch": 0.64, - "learning_rate": 1.8273268559614747e-06, - "loss": 1.0186, - "step": 25068 - }, - { - "epoch": 0.64, - "learning_rate": 1.8273113125748542e-06, - "loss": 0.8276, - "step": 25069 - }, - { - "epoch": 0.64, - "learning_rate": 1.8272957685547996e-06, - "loss": 0.7734, - "step": 25070 - }, - { - "epoch": 0.64, - "learning_rate": 1.8272802239013227e-06, - "loss": 0.792, - "step": 25071 - }, - { - "epoch": 0.64, - "learning_rate": 1.8272646786144352e-06, - "loss": 0.7505, - "step": 25072 - }, - { - "epoch": 0.64, - "learning_rate": 1.827249132694149e-06, - "loss": 0.6992, - "step": 25073 - }, - { - "epoch": 0.64, - "learning_rate": 1.8272335861404765e-06, - "loss": 1.0068, - "step": 25074 - }, - { - "epoch": 0.64, - "learning_rate": 1.827218038953429e-06, - "loss": 0.6348, - "step": 25075 - }, - { - "epoch": 0.64, - "learning_rate": 1.8272024911330192e-06, - "loss": 0.9805, - "step": 25076 - }, - { - "epoch": 0.64, - "learning_rate": 1.827186942679258e-06, - "loss": 0.6914, - "step": 25077 - }, - { - "epoch": 0.64, - "learning_rate": 1.827171393592158e-06, - "loss": 0.7119, - "step": 25078 - }, - { - "epoch": 0.64, - "learning_rate": 1.827155843871731e-06, - "loss": 0.9102, - "step": 25079 - }, - { - "epoch": 0.64, - "learning_rate": 1.8271402935179884e-06, - "loss": 0.9395, - "step": 25080 - }, - { - "epoch": 0.64, - "learning_rate": 1.827124742530943e-06, - "loss": 0.8398, - "step": 25081 - }, - { - "epoch": 0.64, - "learning_rate": 1.8271091909106059e-06, - "loss": 0.7617, - "step": 25082 - }, - { - "epoch": 0.64, - "learning_rate": 1.8270936386569893e-06, - "loss": 0.7783, - "step": 25083 - }, - { - "epoch": 0.64, - "learning_rate": 1.8270780857701053e-06, - "loss": 0.9629, - "step": 25084 - }, - { - "epoch": 0.64, - "learning_rate": 1.8270625322499654e-06, - "loss": 1.0293, - "step": 25085 - }, - { - "epoch": 0.64, - "learning_rate": 1.827046978096582e-06, - "loss": 0.7822, - "step": 25086 - }, - { - "epoch": 0.64, - "learning_rate": 1.8270314233099666e-06, - "loss": 0.7852, - "step": 25087 - }, - { - "epoch": 0.64, - "learning_rate": 1.8270158678901316e-06, - "loss": 0.7837, - "step": 25088 - }, - { - "epoch": 0.64, - "learning_rate": 1.827000311837088e-06, - "loss": 0.9951, - "step": 25089 - }, - { - "epoch": 0.64, - "learning_rate": 1.8269847551508488e-06, - "loss": 0.8906, - "step": 25090 - }, - { - "epoch": 0.64, - "learning_rate": 1.826969197831425e-06, - "loss": 0.7109, - "step": 25091 - }, - { - "epoch": 0.64, - "learning_rate": 1.8269536398788292e-06, - "loss": 0.9912, - "step": 25092 - }, - { - "epoch": 0.64, - "learning_rate": 1.826938081293073e-06, - "loss": 0.7534, - "step": 25093 - }, - { - "epoch": 0.64, - "learning_rate": 1.8269225220741683e-06, - "loss": 1.1621, - "step": 25094 - }, - { - "epoch": 0.64, - "learning_rate": 1.8269069622221269e-06, - "loss": 0.8374, - "step": 25095 - }, - { - "epoch": 0.64, - "learning_rate": 1.8268914017369613e-06, - "loss": 0.9121, - "step": 25096 - }, - { - "epoch": 0.64, - "learning_rate": 1.8268758406186825e-06, - "loss": 0.9365, - "step": 25097 - }, - { - "epoch": 0.64, - "learning_rate": 1.8268602788673028e-06, - "loss": 0.9106, - "step": 25098 - }, - { - "epoch": 0.64, - "learning_rate": 1.8268447164828346e-06, - "loss": 0.7051, - "step": 25099 - }, - { - "epoch": 0.64, - "learning_rate": 1.8268291534652894e-06, - "loss": 0.7852, - "step": 25100 - }, - { - "epoch": 0.64, - "learning_rate": 1.826813589814679e-06, - "loss": 0.873, - "step": 25101 - }, - { - "epoch": 0.64, - "learning_rate": 1.8267980255310153e-06, - "loss": 0.7363, - "step": 25102 - }, - { - "epoch": 0.64, - "learning_rate": 1.8267824606143106e-06, - "loss": 0.6475, - "step": 25103 - }, - { - "epoch": 0.64, - "learning_rate": 1.8267668950645764e-06, - "loss": 0.8652, - "step": 25104 - }, - { - "epoch": 0.64, - "learning_rate": 1.8267513288818251e-06, - "loss": 0.6851, - "step": 25105 - }, - { - "epoch": 0.64, - "learning_rate": 1.826735762066068e-06, - "loss": 0.9141, - "step": 25106 - }, - { - "epoch": 0.64, - "learning_rate": 1.8267201946173174e-06, - "loss": 0.7236, - "step": 25107 - }, - { - "epoch": 0.64, - "learning_rate": 1.8267046265355854e-06, - "loss": 0.7061, - "step": 25108 - }, - { - "epoch": 0.64, - "learning_rate": 1.8266890578208836e-06, - "loss": 0.9033, - "step": 25109 - }, - { - "epoch": 0.64, - "learning_rate": 1.8266734884732237e-06, - "loss": 0.7871, - "step": 25110 - }, - { - "epoch": 0.64, - "learning_rate": 1.8266579184926183e-06, - "loss": 0.8359, - "step": 25111 - }, - { - "epoch": 0.64, - "learning_rate": 1.8266423478790787e-06, - "loss": 0.8398, - "step": 25112 - }, - { - "epoch": 0.64, - "learning_rate": 1.8266267766326173e-06, - "loss": 0.9092, - "step": 25113 - }, - { - "epoch": 0.64, - "learning_rate": 1.8266112047532456e-06, - "loss": 0.6592, - "step": 25114 - }, - { - "epoch": 0.64, - "learning_rate": 1.8265956322409756e-06, - "loss": 0.8623, - "step": 25115 - }, - { - "epoch": 0.64, - "learning_rate": 1.8265800590958195e-06, - "loss": 0.7686, - "step": 25116 - }, - { - "epoch": 0.64, - "learning_rate": 1.826564485317789e-06, - "loss": 0.8486, - "step": 25117 - }, - { - "epoch": 0.64, - "learning_rate": 1.8265489109068963e-06, - "loss": 0.7246, - "step": 25118 - }, - { - "epoch": 0.64, - "learning_rate": 1.8265333358631527e-06, - "loss": 0.8213, - "step": 25119 - }, - { - "epoch": 0.64, - "learning_rate": 1.826517760186571e-06, - "loss": 0.8604, - "step": 25120 - }, - { - "epoch": 0.64, - "learning_rate": 1.8265021838771623e-06, - "loss": 0.8965, - "step": 25121 - }, - { - "epoch": 0.64, - "learning_rate": 1.826486606934939e-06, - "loss": 0.7163, - "step": 25122 - }, - { - "epoch": 0.64, - "learning_rate": 1.8264710293599128e-06, - "loss": 0.7715, - "step": 25123 - }, - { - "epoch": 0.64, - "learning_rate": 1.8264554511520959e-06, - "loss": 0.7861, - "step": 25124 - }, - { - "epoch": 0.64, - "learning_rate": 1.8264398723115e-06, - "loss": 0.8057, - "step": 25125 - }, - { - "epoch": 0.64, - "learning_rate": 1.826424292838137e-06, - "loss": 0.7021, - "step": 25126 - }, - { - "epoch": 0.64, - "learning_rate": 1.8264087127320188e-06, - "loss": 0.9512, - "step": 25127 - }, - { - "epoch": 0.64, - "learning_rate": 1.8263931319931577e-06, - "loss": 0.9424, - "step": 25128 - }, - { - "epoch": 0.64, - "learning_rate": 1.8263775506215656e-06, - "loss": 0.8721, - "step": 25129 - }, - { - "epoch": 0.64, - "learning_rate": 1.8263619686172538e-06, - "loss": 0.7554, - "step": 25130 - }, - { - "epoch": 0.64, - "learning_rate": 1.8263463859802348e-06, - "loss": 0.7061, - "step": 25131 - }, - { - "epoch": 0.64, - "learning_rate": 1.8263308027105202e-06, - "loss": 0.8389, - "step": 25132 - }, - { - "epoch": 0.64, - "learning_rate": 1.8263152188081223e-06, - "loss": 1.0342, - "step": 25133 - }, - { - "epoch": 0.64, - "learning_rate": 1.8262996342730529e-06, - "loss": 0.8105, - "step": 25134 - }, - { - "epoch": 0.64, - "learning_rate": 1.8262840491053235e-06, - "loss": 1.002, - "step": 25135 - }, - { - "epoch": 0.64, - "learning_rate": 1.8262684633049467e-06, - "loss": 0.9414, - "step": 25136 - }, - { - "epoch": 0.64, - "learning_rate": 1.8262528768719342e-06, - "loss": 0.9678, - "step": 25137 - }, - { - "epoch": 0.64, - "learning_rate": 1.8262372898062977e-06, - "loss": 0.8926, - "step": 25138 - }, - { - "epoch": 0.64, - "learning_rate": 1.8262217021080494e-06, - "loss": 0.8232, - "step": 25139 - }, - { - "epoch": 0.64, - "learning_rate": 1.8262061137772008e-06, - "loss": 0.7871, - "step": 25140 - }, - { - "epoch": 0.64, - "learning_rate": 1.8261905248137646e-06, - "loss": 0.8877, - "step": 25141 - }, - { - "epoch": 0.64, - "learning_rate": 1.826174935217752e-06, - "loss": 0.8721, - "step": 25142 - }, - { - "epoch": 0.64, - "learning_rate": 1.8261593449891755e-06, - "loss": 0.7266, - "step": 25143 - }, - { - "epoch": 0.64, - "learning_rate": 1.8261437541280467e-06, - "loss": 0.8364, - "step": 25144 - }, - { - "epoch": 0.64, - "learning_rate": 1.8261281626343776e-06, - "loss": 0.6733, - "step": 25145 - }, - { - "epoch": 0.64, - "learning_rate": 1.82611257050818e-06, - "loss": 0.9414, - "step": 25146 - }, - { - "epoch": 0.64, - "learning_rate": 1.826096977749466e-06, - "loss": 1.0703, - "step": 25147 - }, - { - "epoch": 0.64, - "learning_rate": 1.8260813843582477e-06, - "loss": 0.958, - "step": 25148 - }, - { - "epoch": 0.64, - "learning_rate": 1.8260657903345367e-06, - "loss": 0.7305, - "step": 25149 - }, - { - "epoch": 0.64, - "learning_rate": 1.8260501956783453e-06, - "loss": 0.9102, - "step": 25150 - }, - { - "epoch": 0.64, - "learning_rate": 1.8260346003896852e-06, - "loss": 1.0039, - "step": 25151 - }, - { - "epoch": 0.64, - "learning_rate": 1.8260190044685683e-06, - "loss": 0.6875, - "step": 25152 - }, - { - "epoch": 0.64, - "learning_rate": 1.8260034079150066e-06, - "loss": 0.9082, - "step": 25153 - }, - { - "epoch": 0.64, - "learning_rate": 1.8259878107290123e-06, - "loss": 0.7891, - "step": 25154 - }, - { - "epoch": 0.64, - "learning_rate": 1.8259722129105968e-06, - "loss": 0.7939, - "step": 25155 - }, - { - "epoch": 0.64, - "learning_rate": 1.8259566144597726e-06, - "loss": 0.8994, - "step": 25156 - }, - { - "epoch": 0.64, - "learning_rate": 1.8259410153765512e-06, - "loss": 0.7891, - "step": 25157 - }, - { - "epoch": 0.64, - "learning_rate": 1.825925415660945e-06, - "loss": 0.8672, - "step": 25158 - }, - { - "epoch": 0.64, - "learning_rate": 1.8259098153129656e-06, - "loss": 0.7329, - "step": 25159 - }, - { - "epoch": 0.64, - "learning_rate": 1.825894214332625e-06, - "loss": 0.8877, - "step": 25160 - }, - { - "epoch": 0.64, - "learning_rate": 1.8258786127199351e-06, - "loss": 0.7695, - "step": 25161 - }, - { - "epoch": 0.64, - "learning_rate": 1.825863010474908e-06, - "loss": 0.8779, - "step": 25162 - }, - { - "epoch": 0.64, - "learning_rate": 1.8258474075975556e-06, - "loss": 0.8857, - "step": 25163 - }, - { - "epoch": 0.64, - "learning_rate": 1.8258318040878897e-06, - "loss": 0.7808, - "step": 25164 - }, - { - "epoch": 0.64, - "learning_rate": 1.8258161999459225e-06, - "loss": 0.8604, - "step": 25165 - }, - { - "epoch": 0.65, - "learning_rate": 1.8258005951716657e-06, - "loss": 1.0205, - "step": 25166 - }, - { - "epoch": 0.65, - "learning_rate": 1.8257849897651312e-06, - "loss": 0.8711, - "step": 25167 - }, - { - "epoch": 0.65, - "learning_rate": 1.8257693837263313e-06, - "loss": 0.8232, - "step": 25168 - }, - { - "epoch": 0.65, - "learning_rate": 1.8257537770552777e-06, - "loss": 0.6792, - "step": 25169 - }, - { - "epoch": 0.65, - "learning_rate": 1.8257381697519825e-06, - "loss": 0.7734, - "step": 25170 - }, - { - "epoch": 0.65, - "learning_rate": 1.8257225618164575e-06, - "loss": 0.7695, - "step": 25171 - }, - { - "epoch": 0.65, - "learning_rate": 1.8257069532487148e-06, - "loss": 0.7388, - "step": 25172 - }, - { - "epoch": 0.65, - "learning_rate": 1.8256913440487661e-06, - "loss": 0.8525, - "step": 25173 - }, - { - "epoch": 0.65, - "learning_rate": 1.8256757342166234e-06, - "loss": 1.0547, - "step": 25174 - }, - { - "epoch": 0.65, - "learning_rate": 1.8256601237522991e-06, - "loss": 0.6147, - "step": 25175 - }, - { - "epoch": 0.65, - "learning_rate": 1.8256445126558045e-06, - "loss": 0.9814, - "step": 25176 - }, - { - "epoch": 0.65, - "learning_rate": 1.8256289009271518e-06, - "loss": 0.9385, - "step": 25177 - }, - { - "epoch": 0.65, - "learning_rate": 1.8256132885663536e-06, - "loss": 1.0371, - "step": 25178 - }, - { - "epoch": 0.65, - "learning_rate": 1.8255976755734206e-06, - "loss": 0.877, - "step": 25179 - }, - { - "epoch": 0.65, - "learning_rate": 1.8255820619483658e-06, - "loss": 0.9131, - "step": 25180 - }, - { - "epoch": 0.65, - "learning_rate": 1.8255664476912008e-06, - "loss": 1.0166, - "step": 25181 - }, - { - "epoch": 0.65, - "learning_rate": 1.8255508328019372e-06, - "loss": 0.9395, - "step": 25182 - }, - { - "epoch": 0.65, - "learning_rate": 1.8255352172805876e-06, - "loss": 0.915, - "step": 25183 - }, - { - "epoch": 0.65, - "learning_rate": 1.8255196011271633e-06, - "loss": 0.7627, - "step": 25184 - }, - { - "epoch": 0.65, - "learning_rate": 1.8255039843416768e-06, - "loss": 1.0332, - "step": 25185 - }, - { - "epoch": 0.65, - "learning_rate": 1.82548836692414e-06, - "loss": 0.7651, - "step": 25186 - }, - { - "epoch": 0.65, - "learning_rate": 1.8254727488745644e-06, - "loss": 0.9238, - "step": 25187 - }, - { - "epoch": 0.65, - "learning_rate": 1.8254571301929626e-06, - "loss": 0.7861, - "step": 25188 - }, - { - "epoch": 0.65, - "learning_rate": 1.825441510879346e-06, - "loss": 0.9062, - "step": 25189 - }, - { - "epoch": 0.65, - "learning_rate": 1.8254258909337268e-06, - "loss": 0.7905, - "step": 25190 - }, - { - "epoch": 0.65, - "learning_rate": 1.8254102703561171e-06, - "loss": 0.9082, - "step": 25191 - }, - { - "epoch": 0.65, - "learning_rate": 1.8253946491465285e-06, - "loss": 0.7412, - "step": 25192 - }, - { - "epoch": 0.65, - "learning_rate": 1.8253790273049735e-06, - "loss": 0.8408, - "step": 25193 - }, - { - "epoch": 0.65, - "learning_rate": 1.8253634048314634e-06, - "loss": 0.8291, - "step": 25194 - }, - { - "epoch": 0.65, - "learning_rate": 1.8253477817260107e-06, - "loss": 0.833, - "step": 25195 - }, - { - "epoch": 0.65, - "learning_rate": 1.8253321579886272e-06, - "loss": 1.0254, - "step": 25196 - }, - { - "epoch": 0.65, - "learning_rate": 1.8253165336193245e-06, - "loss": 0.7036, - "step": 25197 - }, - { - "epoch": 0.65, - "learning_rate": 1.8253009086181153e-06, - "loss": 0.79, - "step": 25198 - }, - { - "epoch": 0.65, - "learning_rate": 1.825285282985011e-06, - "loss": 1.0146, - "step": 25199 - }, - { - "epoch": 0.65, - "learning_rate": 1.8252696567200237e-06, - "loss": 0.7686, - "step": 25200 - }, - { - "epoch": 0.65, - "learning_rate": 1.825254029823165e-06, - "loss": 0.73, - "step": 25201 - }, - { - "epoch": 0.65, - "learning_rate": 1.8252384022944476e-06, - "loss": 0.8936, - "step": 25202 - }, - { - "epoch": 0.65, - "learning_rate": 1.825222774133883e-06, - "loss": 0.9443, - "step": 25203 - }, - { - "epoch": 0.65, - "learning_rate": 1.8252071453414835e-06, - "loss": 0.8936, - "step": 25204 - }, - { - "epoch": 0.65, - "learning_rate": 1.8251915159172606e-06, - "loss": 0.7959, - "step": 25205 - }, - { - "epoch": 0.65, - "learning_rate": 1.8251758858612262e-06, - "loss": 1.0381, - "step": 25206 - }, - { - "epoch": 0.65, - "learning_rate": 1.8251602551733932e-06, - "loss": 1.0381, - "step": 25207 - }, - { - "epoch": 0.65, - "learning_rate": 1.8251446238537725e-06, - "loss": 0.8525, - "step": 25208 - }, - { - "epoch": 0.65, - "learning_rate": 1.8251289919023767e-06, - "loss": 0.7285, - "step": 25209 - }, - { - "epoch": 0.65, - "learning_rate": 1.8251133593192175e-06, - "loss": 0.8672, - "step": 25210 - }, - { - "epoch": 0.65, - "learning_rate": 1.825097726104307e-06, - "loss": 0.8408, - "step": 25211 - }, - { - "epoch": 0.65, - "learning_rate": 1.825082092257657e-06, - "loss": 0.8459, - "step": 25212 - }, - { - "epoch": 0.65, - "learning_rate": 1.8250664577792795e-06, - "loss": 0.9785, - "step": 25213 - }, - { - "epoch": 0.65, - "learning_rate": 1.8250508226691868e-06, - "loss": 0.9336, - "step": 25214 - }, - { - "epoch": 0.65, - "learning_rate": 1.8250351869273906e-06, - "loss": 0.8159, - "step": 25215 - }, - { - "epoch": 0.65, - "learning_rate": 1.8250195505539025e-06, - "loss": 1.0859, - "step": 25216 - }, - { - "epoch": 0.65, - "learning_rate": 1.8250039135487355e-06, - "loss": 0.6733, - "step": 25217 - }, - { - "epoch": 0.65, - "learning_rate": 1.8249882759119007e-06, - "loss": 0.8213, - "step": 25218 - }, - { - "epoch": 0.65, - "learning_rate": 1.82497263764341e-06, - "loss": 1.1016, - "step": 25219 - }, - { - "epoch": 0.65, - "learning_rate": 1.8249569987432758e-06, - "loss": 0.9863, - "step": 25220 - }, - { - "epoch": 0.65, - "learning_rate": 1.8249413592115102e-06, - "loss": 0.6221, - "step": 25221 - }, - { - "epoch": 0.65, - "learning_rate": 1.824925719048125e-06, - "loss": 0.7969, - "step": 25222 - }, - { - "epoch": 0.65, - "learning_rate": 1.8249100782531318e-06, - "loss": 1.0264, - "step": 25223 - }, - { - "epoch": 0.65, - "learning_rate": 1.8248944368265428e-06, - "loss": 0.8901, - "step": 25224 - }, - { - "epoch": 0.65, - "learning_rate": 1.8248787947683703e-06, - "loss": 0.8047, - "step": 25225 - }, - { - "epoch": 0.65, - "learning_rate": 1.824863152078626e-06, - "loss": 0.998, - "step": 25226 - }, - { - "epoch": 0.65, - "learning_rate": 1.824847508757322e-06, - "loss": 0.999, - "step": 25227 - }, - { - "epoch": 0.65, - "learning_rate": 1.82483186480447e-06, - "loss": 0.7927, - "step": 25228 - }, - { - "epoch": 0.65, - "learning_rate": 1.8248162202200823e-06, - "loss": 0.666, - "step": 25229 - }, - { - "epoch": 0.65, - "learning_rate": 1.8248005750041705e-06, - "loss": 0.9473, - "step": 25230 - }, - { - "epoch": 0.65, - "learning_rate": 1.8247849291567472e-06, - "loss": 0.834, - "step": 25231 - }, - { - "epoch": 0.65, - "learning_rate": 1.8247692826778238e-06, - "loss": 0.9277, - "step": 25232 - }, - { - "epoch": 0.65, - "learning_rate": 1.8247536355674127e-06, - "loss": 0.9902, - "step": 25233 - }, - { - "epoch": 0.65, - "learning_rate": 1.8247379878255254e-06, - "loss": 0.9287, - "step": 25234 - }, - { - "epoch": 0.65, - "learning_rate": 1.8247223394521743e-06, - "loss": 0.9497, - "step": 25235 - }, - { - "epoch": 0.65, - "learning_rate": 1.8247066904473708e-06, - "loss": 0.8677, - "step": 25236 - }, - { - "epoch": 0.65, - "learning_rate": 1.8246910408111278e-06, - "loss": 0.8765, - "step": 25237 - }, - { - "epoch": 0.65, - "learning_rate": 1.8246753905434567e-06, - "loss": 0.8213, - "step": 25238 - }, - { - "epoch": 0.65, - "learning_rate": 1.8246597396443696e-06, - "loss": 0.8496, - "step": 25239 - }, - { - "epoch": 0.65, - "learning_rate": 1.8246440881138782e-06, - "loss": 0.9502, - "step": 25240 - }, - { - "epoch": 0.65, - "learning_rate": 1.824628435951995e-06, - "loss": 0.7148, - "step": 25241 - }, - { - "epoch": 0.65, - "learning_rate": 1.8246127831587316e-06, - "loss": 1.0273, - "step": 25242 - }, - { - "epoch": 0.65, - "learning_rate": 1.8245971297341e-06, - "loss": 0.709, - "step": 25243 - }, - { - "epoch": 0.65, - "learning_rate": 1.8245814756781127e-06, - "loss": 0.8301, - "step": 25244 - }, - { - "epoch": 0.65, - "learning_rate": 1.824565820990781e-06, - "loss": 0.876, - "step": 25245 - }, - { - "epoch": 0.65, - "learning_rate": 1.824550165672117e-06, - "loss": 0.9424, - "step": 25246 - }, - { - "epoch": 0.65, - "learning_rate": 1.8245345097221333e-06, - "loss": 0.9326, - "step": 25247 - }, - { - "epoch": 0.65, - "learning_rate": 1.824518853140841e-06, - "loss": 1.04, - "step": 25248 - }, - { - "epoch": 0.65, - "learning_rate": 1.8245031959282527e-06, - "loss": 0.9404, - "step": 25249 - }, - { - "epoch": 0.65, - "learning_rate": 1.8244875380843805e-06, - "loss": 0.9131, - "step": 25250 - }, - { - "epoch": 0.65, - "learning_rate": 1.8244718796092355e-06, - "loss": 0.8066, - "step": 25251 - }, - { - "epoch": 0.65, - "learning_rate": 1.8244562205028306e-06, - "loss": 1.0566, - "step": 25252 - }, - { - "epoch": 0.65, - "learning_rate": 1.8244405607651778e-06, - "loss": 0.7524, - "step": 25253 - }, - { - "epoch": 0.65, - "learning_rate": 1.8244249003962883e-06, - "loss": 0.8555, - "step": 25254 - }, - { - "epoch": 0.65, - "learning_rate": 1.8244092393961747e-06, - "loss": 0.8809, - "step": 25255 - }, - { - "epoch": 0.65, - "learning_rate": 1.8243935777648489e-06, - "loss": 0.4637, - "step": 25256 - }, - { - "epoch": 0.65, - "learning_rate": 1.8243779155023228e-06, - "loss": 0.7202, - "step": 25257 - }, - { - "epoch": 0.65, - "learning_rate": 1.8243622526086083e-06, - "loss": 0.823, - "step": 25258 - }, - { - "epoch": 0.65, - "learning_rate": 1.824346589083718e-06, - "loss": 0.8335, - "step": 25259 - }, - { - "epoch": 0.65, - "learning_rate": 1.824330924927663e-06, - "loss": 0.9424, - "step": 25260 - }, - { - "epoch": 0.65, - "learning_rate": 1.8243152601404558e-06, - "loss": 0.9307, - "step": 25261 - }, - { - "epoch": 0.65, - "learning_rate": 1.8242995947221084e-06, - "loss": 0.8594, - "step": 25262 - }, - { - "epoch": 0.65, - "learning_rate": 1.8242839286726327e-06, - "loss": 0.8984, - "step": 25263 - }, - { - "epoch": 0.65, - "learning_rate": 1.8242682619920403e-06, - "loss": 0.8901, - "step": 25264 - }, - { - "epoch": 0.65, - "learning_rate": 1.8242525946803443e-06, - "loss": 0.9043, - "step": 25265 - }, - { - "epoch": 0.65, - "learning_rate": 1.8242369267375554e-06, - "loss": 0.9414, - "step": 25266 - }, - { - "epoch": 0.65, - "learning_rate": 1.8242212581636864e-06, - "loss": 0.9131, - "step": 25267 - }, - { - "epoch": 0.65, - "learning_rate": 1.8242055889587494e-06, - "loss": 0.7148, - "step": 25268 - }, - { - "epoch": 0.65, - "learning_rate": 1.8241899191227556e-06, - "loss": 0.876, - "step": 25269 - }, - { - "epoch": 0.65, - "learning_rate": 1.8241742486557177e-06, - "loss": 0.8613, - "step": 25270 - }, - { - "epoch": 0.65, - "learning_rate": 1.8241585775576473e-06, - "loss": 0.6489, - "step": 25271 - }, - { - "epoch": 0.65, - "learning_rate": 1.8241429058285568e-06, - "loss": 0.9707, - "step": 25272 - }, - { - "epoch": 0.65, - "learning_rate": 1.8241272334684577e-06, - "loss": 0.9053, - "step": 25273 - }, - { - "epoch": 0.65, - "learning_rate": 1.8241115604773624e-06, - "loss": 0.6157, - "step": 25274 - }, - { - "epoch": 0.65, - "learning_rate": 1.824095886855283e-06, - "loss": 1.0117, - "step": 25275 - }, - { - "epoch": 0.65, - "learning_rate": 1.824080212602231e-06, - "loss": 0.9175, - "step": 25276 - }, - { - "epoch": 0.65, - "learning_rate": 1.8240645377182188e-06, - "loss": 0.8662, - "step": 25277 - }, - { - "epoch": 0.65, - "learning_rate": 1.824048862203258e-06, - "loss": 0.8799, - "step": 25278 - }, - { - "epoch": 0.65, - "learning_rate": 1.8240331860573612e-06, - "loss": 0.6228, - "step": 25279 - }, - { - "epoch": 0.65, - "learning_rate": 1.82401750928054e-06, - "loss": 1.0303, - "step": 25280 - }, - { - "epoch": 0.65, - "learning_rate": 1.8240018318728065e-06, - "loss": 0.8667, - "step": 25281 - }, - { - "epoch": 0.65, - "learning_rate": 1.8239861538341725e-06, - "loss": 0.8047, - "step": 25282 - }, - { - "epoch": 0.65, - "learning_rate": 1.8239704751646503e-06, - "loss": 0.8848, - "step": 25283 - }, - { - "epoch": 0.65, - "learning_rate": 1.823954795864252e-06, - "loss": 0.7275, - "step": 25284 - }, - { - "epoch": 0.65, - "learning_rate": 1.8239391159329891e-06, - "loss": 0.7871, - "step": 25285 - }, - { - "epoch": 0.65, - "learning_rate": 1.823923435370874e-06, - "loss": 1.0439, - "step": 25286 - }, - { - "epoch": 0.65, - "learning_rate": 1.8239077541779188e-06, - "loss": 0.8545, - "step": 25287 - }, - { - "epoch": 0.65, - "learning_rate": 1.8238920723541352e-06, - "loss": 0.6514, - "step": 25288 - }, - { - "epoch": 0.65, - "learning_rate": 1.823876389899535e-06, - "loss": 0.8076, - "step": 25289 - }, - { - "epoch": 0.65, - "learning_rate": 1.823860706814131e-06, - "loss": 1.1592, - "step": 25290 - }, - { - "epoch": 0.65, - "learning_rate": 1.8238450230979345e-06, - "loss": 1.0088, - "step": 25291 - }, - { - "epoch": 0.65, - "learning_rate": 1.8238293387509577e-06, - "loss": 1.0566, - "step": 25292 - }, - { - "epoch": 0.65, - "learning_rate": 1.8238136537732128e-06, - "loss": 0.8247, - "step": 25293 - }, - { - "epoch": 0.65, - "learning_rate": 1.8237979681647118e-06, - "loss": 0.876, - "step": 25294 - }, - { - "epoch": 0.65, - "learning_rate": 1.8237822819254665e-06, - "loss": 0.9023, - "step": 25295 - }, - { - "epoch": 0.65, - "learning_rate": 1.8237665950554888e-06, - "loss": 0.9893, - "step": 25296 - }, - { - "epoch": 0.65, - "learning_rate": 1.8237509075547908e-06, - "loss": 0.8516, - "step": 25297 - }, - { - "epoch": 0.65, - "learning_rate": 1.8237352194233847e-06, - "loss": 0.812, - "step": 25298 - }, - { - "epoch": 0.65, - "learning_rate": 1.8237195306612828e-06, - "loss": 0.751, - "step": 25299 - }, - { - "epoch": 0.65, - "learning_rate": 1.8237038412684964e-06, - "loss": 0.959, - "step": 25300 - }, - { - "epoch": 0.65, - "learning_rate": 1.8236881512450379e-06, - "loss": 0.8564, - "step": 25301 - }, - { - "epoch": 0.65, - "learning_rate": 1.8236724605909192e-06, - "loss": 1.083, - "step": 25302 - }, - { - "epoch": 0.65, - "learning_rate": 1.8236567693061524e-06, - "loss": 0.8086, - "step": 25303 - }, - { - "epoch": 0.65, - "learning_rate": 1.8236410773907497e-06, - "loss": 0.8345, - "step": 25304 - }, - { - "epoch": 0.65, - "learning_rate": 1.8236253848447224e-06, - "loss": 0.917, - "step": 25305 - }, - { - "epoch": 0.65, - "learning_rate": 1.8236096916680834e-06, - "loss": 0.6299, - "step": 25306 - }, - { - "epoch": 0.65, - "learning_rate": 1.8235939978608442e-06, - "loss": 1.0078, - "step": 25307 - }, - { - "epoch": 0.65, - "learning_rate": 1.823578303423017e-06, - "loss": 0.8896, - "step": 25308 - }, - { - "epoch": 0.65, - "learning_rate": 1.8235626083546136e-06, - "loss": 0.9766, - "step": 25309 - }, - { - "epoch": 0.65, - "learning_rate": 1.8235469126556464e-06, - "loss": 0.8516, - "step": 25310 - }, - { - "epoch": 0.65, - "learning_rate": 1.823531216326127e-06, - "loss": 0.9541, - "step": 25311 - }, - { - "epoch": 0.65, - "learning_rate": 1.8235155193660678e-06, - "loss": 1.0254, - "step": 25312 - }, - { - "epoch": 0.65, - "learning_rate": 1.8234998217754808e-06, - "loss": 0.9629, - "step": 25313 - }, - { - "epoch": 0.65, - "learning_rate": 1.8234841235543774e-06, - "loss": 0.6943, - "step": 25314 - }, - { - "epoch": 0.65, - "learning_rate": 1.8234684247027703e-06, - "loss": 0.8086, - "step": 25315 - }, - { - "epoch": 0.65, - "learning_rate": 1.8234527252206715e-06, - "loss": 0.9092, - "step": 25316 - }, - { - "epoch": 0.65, - "learning_rate": 1.8234370251080923e-06, - "loss": 0.6479, - "step": 25317 - }, - { - "epoch": 0.65, - "learning_rate": 1.8234213243650456e-06, - "loss": 0.8789, - "step": 25318 - }, - { - "epoch": 0.65, - "learning_rate": 1.8234056229915432e-06, - "loss": 0.731, - "step": 25319 - }, - { - "epoch": 0.65, - "learning_rate": 1.8233899209875966e-06, - "loss": 0.9678, - "step": 25320 - }, - { - "epoch": 0.65, - "learning_rate": 1.8233742183532183e-06, - "loss": 0.8623, - "step": 25321 - }, - { - "epoch": 0.65, - "learning_rate": 1.8233585150884204e-06, - "loss": 0.6382, - "step": 25322 - }, - { - "epoch": 0.65, - "learning_rate": 1.8233428111932145e-06, - "loss": 0.7061, - "step": 25323 - }, - { - "epoch": 0.65, - "learning_rate": 1.823327106667613e-06, - "loss": 0.8086, - "step": 25324 - }, - { - "epoch": 0.65, - "learning_rate": 1.8233114015116277e-06, - "loss": 0.6709, - "step": 25325 - }, - { - "epoch": 0.65, - "learning_rate": 1.823295695725271e-06, - "loss": 0.8696, - "step": 25326 - }, - { - "epoch": 0.65, - "learning_rate": 1.8232799893085543e-06, - "loss": 0.9863, - "step": 25327 - }, - { - "epoch": 0.65, - "learning_rate": 1.82326428226149e-06, - "loss": 0.769, - "step": 25328 - }, - { - "epoch": 0.65, - "learning_rate": 1.8232485745840904e-06, - "loss": 0.814, - "step": 25329 - }, - { - "epoch": 0.65, - "learning_rate": 1.823232866276367e-06, - "loss": 0.7998, - "step": 25330 - }, - { - "epoch": 0.65, - "learning_rate": 1.8232171573383321e-06, - "loss": 0.873, - "step": 25331 - }, - { - "epoch": 0.65, - "learning_rate": 1.8232014477699974e-06, - "loss": 0.6953, - "step": 25332 - }, - { - "epoch": 0.65, - "learning_rate": 1.8231857375713756e-06, - "loss": 0.6384, - "step": 25333 - }, - { - "epoch": 0.65, - "learning_rate": 1.823170026742478e-06, - "loss": 0.7705, - "step": 25334 - }, - { - "epoch": 0.65, - "learning_rate": 1.8231543152833172e-06, - "loss": 0.9668, - "step": 25335 - }, - { - "epoch": 0.65, - "learning_rate": 1.823138603193905e-06, - "loss": 0.8477, - "step": 25336 - }, - { - "epoch": 0.65, - "learning_rate": 1.8231228904742535e-06, - "loss": 0.792, - "step": 25337 - }, - { - "epoch": 0.65, - "learning_rate": 1.8231071771243743e-06, - "loss": 1.0615, - "step": 25338 - }, - { - "epoch": 0.65, - "learning_rate": 1.82309146314428e-06, - "loss": 0.5859, - "step": 25339 - }, - { - "epoch": 0.65, - "learning_rate": 1.8230757485339826e-06, - "loss": 0.9111, - "step": 25340 - }, - { - "epoch": 0.65, - "learning_rate": 1.8230600332934935e-06, - "loss": 0.7441, - "step": 25341 - }, - { - "epoch": 0.65, - "learning_rate": 1.8230443174228256e-06, - "loss": 1.0498, - "step": 25342 - }, - { - "epoch": 0.65, - "learning_rate": 1.8230286009219902e-06, - "loss": 0.873, - "step": 25343 - }, - { - "epoch": 0.65, - "learning_rate": 1.8230128837909998e-06, - "loss": 0.8525, - "step": 25344 - }, - { - "epoch": 0.65, - "learning_rate": 1.8229971660298662e-06, - "loss": 0.9727, - "step": 25345 - }, - { - "epoch": 0.65, - "learning_rate": 1.8229814476386015e-06, - "loss": 1.1367, - "step": 25346 - }, - { - "epoch": 0.65, - "learning_rate": 1.822965728617218e-06, - "loss": 0.5562, - "step": 25347 - }, - { - "epoch": 0.65, - "learning_rate": 1.8229500089657273e-06, - "loss": 0.916, - "step": 25348 - }, - { - "epoch": 0.65, - "learning_rate": 1.8229342886841415e-06, - "loss": 0.7607, - "step": 25349 - }, - { - "epoch": 0.65, - "learning_rate": 1.822918567772473e-06, - "loss": 0.9473, - "step": 25350 - }, - { - "epoch": 0.65, - "learning_rate": 1.8229028462307334e-06, - "loss": 0.7539, - "step": 25351 - }, - { - "epoch": 0.65, - "learning_rate": 1.822887124058935e-06, - "loss": 0.8135, - "step": 25352 - }, - { - "epoch": 0.65, - "learning_rate": 1.8228714012570898e-06, - "loss": 0.8223, - "step": 25353 - }, - { - "epoch": 0.65, - "learning_rate": 1.8228556778252098e-06, - "loss": 0.9473, - "step": 25354 - }, - { - "epoch": 0.65, - "learning_rate": 1.822839953763307e-06, - "loss": 0.9058, - "step": 25355 - }, - { - "epoch": 0.65, - "learning_rate": 1.8228242290713933e-06, - "loss": 0.916, - "step": 25356 - }, - { - "epoch": 0.65, - "learning_rate": 1.8228085037494812e-06, - "loss": 0.8652, - "step": 25357 - }, - { - "epoch": 0.65, - "learning_rate": 1.8227927777975824e-06, - "loss": 0.8428, - "step": 25358 - }, - { - "epoch": 0.65, - "learning_rate": 1.8227770512157088e-06, - "loss": 0.8682, - "step": 25359 - }, - { - "epoch": 0.65, - "learning_rate": 1.8227613240038729e-06, - "loss": 0.7344, - "step": 25360 - }, - { - "epoch": 0.65, - "learning_rate": 1.8227455961620865e-06, - "loss": 0.8057, - "step": 25361 - }, - { - "epoch": 0.65, - "learning_rate": 1.8227298676903615e-06, - "loss": 0.9229, - "step": 25362 - }, - { - "epoch": 0.65, - "learning_rate": 1.82271413858871e-06, - "loss": 0.9941, - "step": 25363 - }, - { - "epoch": 0.65, - "learning_rate": 1.8226984088571443e-06, - "loss": 1.0068, - "step": 25364 - }, - { - "epoch": 0.65, - "learning_rate": 1.822682678495676e-06, - "loss": 0.9609, - "step": 25365 - }, - { - "epoch": 0.65, - "learning_rate": 1.8226669475043177e-06, - "loss": 0.6938, - "step": 25366 - }, - { - "epoch": 0.65, - "learning_rate": 1.822651215883081e-06, - "loss": 0.8633, - "step": 25367 - }, - { - "epoch": 0.65, - "learning_rate": 1.8226354836319783e-06, - "loss": 0.8018, - "step": 25368 - }, - { - "epoch": 0.65, - "learning_rate": 1.8226197507510211e-06, - "loss": 0.7393, - "step": 25369 - }, - { - "epoch": 0.65, - "learning_rate": 1.8226040172402217e-06, - "loss": 0.6812, - "step": 25370 - }, - { - "epoch": 0.65, - "learning_rate": 1.8225882830995927e-06, - "loss": 0.7524, - "step": 25371 - }, - { - "epoch": 0.65, - "learning_rate": 1.8225725483291452e-06, - "loss": 0.8984, - "step": 25372 - }, - { - "epoch": 0.65, - "learning_rate": 1.8225568129288923e-06, - "loss": 0.8711, - "step": 25373 - }, - { - "epoch": 0.65, - "learning_rate": 1.8225410768988447e-06, - "loss": 1.043, - "step": 25374 - }, - { - "epoch": 0.65, - "learning_rate": 1.8225253402390157e-06, - "loss": 0.9287, - "step": 25375 - }, - { - "epoch": 0.65, - "learning_rate": 1.822509602949417e-06, - "loss": 0.874, - "step": 25376 - }, - { - "epoch": 0.65, - "learning_rate": 1.8224938650300604e-06, - "loss": 0.7417, - "step": 25377 - }, - { - "epoch": 0.65, - "learning_rate": 1.822478126480958e-06, - "loss": 1.0557, - "step": 25378 - }, - { - "epoch": 0.65, - "learning_rate": 1.8224623873021216e-06, - "loss": 0.9434, - "step": 25379 - }, - { - "epoch": 0.65, - "learning_rate": 1.822446647493564e-06, - "loss": 0.7959, - "step": 25380 - }, - { - "epoch": 0.65, - "learning_rate": 1.8224309070552967e-06, - "loss": 0.8438, - "step": 25381 - }, - { - "epoch": 0.65, - "learning_rate": 1.8224151659873319e-06, - "loss": 0.916, - "step": 25382 - }, - { - "epoch": 0.65, - "learning_rate": 1.8223994242896816e-06, - "loss": 0.8525, - "step": 25383 - }, - { - "epoch": 0.65, - "learning_rate": 1.8223836819623579e-06, - "loss": 1.0244, - "step": 25384 - }, - { - "epoch": 0.65, - "learning_rate": 1.8223679390053727e-06, - "loss": 0.8809, - "step": 25385 - }, - { - "epoch": 0.65, - "learning_rate": 1.8223521954187384e-06, - "loss": 0.917, - "step": 25386 - }, - { - "epoch": 0.65, - "learning_rate": 1.8223364512024668e-06, - "loss": 0.875, - "step": 25387 - }, - { - "epoch": 0.65, - "learning_rate": 1.8223207063565698e-06, - "loss": 0.7666, - "step": 25388 - }, - { - "epoch": 0.65, - "learning_rate": 1.8223049608810596e-06, - "loss": 0.9199, - "step": 25389 - }, - { - "epoch": 0.65, - "learning_rate": 1.8222892147759486e-06, - "loss": 0.751, - "step": 25390 - }, - { - "epoch": 0.65, - "learning_rate": 1.8222734680412484e-06, - "loss": 1.0312, - "step": 25391 - }, - { - "epoch": 0.65, - "learning_rate": 1.8222577206769712e-06, - "loss": 0.7197, - "step": 25392 - }, - { - "epoch": 0.65, - "learning_rate": 1.822241972683129e-06, - "loss": 0.8809, - "step": 25393 - }, - { - "epoch": 0.65, - "learning_rate": 1.822226224059734e-06, - "loss": 0.9541, - "step": 25394 - }, - { - "epoch": 0.65, - "learning_rate": 1.8222104748067984e-06, - "loss": 0.9102, - "step": 25395 - }, - { - "epoch": 0.65, - "learning_rate": 1.8221947249243338e-06, - "loss": 0.8955, - "step": 25396 - }, - { - "epoch": 0.65, - "learning_rate": 1.8221789744123526e-06, - "loss": 1.0049, - "step": 25397 - }, - { - "epoch": 0.65, - "learning_rate": 1.8221632232708667e-06, - "loss": 0.6216, - "step": 25398 - }, - { - "epoch": 0.65, - "learning_rate": 1.8221474714998882e-06, - "loss": 0.8232, - "step": 25399 - }, - { - "epoch": 0.65, - "learning_rate": 1.8221317190994295e-06, - "loss": 1.0371, - "step": 25400 - }, - { - "epoch": 0.65, - "learning_rate": 1.8221159660695018e-06, - "loss": 0.8657, - "step": 25401 - }, - { - "epoch": 0.65, - "learning_rate": 1.8221002124101181e-06, - "loss": 0.9238, - "step": 25402 - }, - { - "epoch": 0.65, - "learning_rate": 1.8220844581212899e-06, - "loss": 0.7058, - "step": 25403 - }, - { - "epoch": 0.65, - "learning_rate": 1.8220687032030293e-06, - "loss": 0.9141, - "step": 25404 - }, - { - "epoch": 0.65, - "learning_rate": 1.822052947655349e-06, - "loss": 0.999, - "step": 25405 - }, - { - "epoch": 0.65, - "learning_rate": 1.8220371914782602e-06, - "loss": 0.8857, - "step": 25406 - }, - { - "epoch": 0.65, - "learning_rate": 1.8220214346717752e-06, - "loss": 0.6919, - "step": 25407 - }, - { - "epoch": 0.65, - "learning_rate": 1.8220056772359063e-06, - "loss": 0.7954, - "step": 25408 - }, - { - "epoch": 0.65, - "learning_rate": 1.8219899191706655e-06, - "loss": 0.959, - "step": 25409 - }, - { - "epoch": 0.65, - "learning_rate": 1.8219741604760649e-06, - "loss": 0.7759, - "step": 25410 - }, - { - "epoch": 0.65, - "learning_rate": 1.8219584011521164e-06, - "loss": 0.7261, - "step": 25411 - }, - { - "epoch": 0.65, - "learning_rate": 1.8219426411988322e-06, - "loss": 0.9023, - "step": 25412 - }, - { - "epoch": 0.65, - "learning_rate": 1.8219268806162243e-06, - "loss": 0.6807, - "step": 25413 - }, - { - "epoch": 0.65, - "learning_rate": 1.8219111194043046e-06, - "loss": 0.8721, - "step": 25414 - }, - { - "epoch": 0.65, - "learning_rate": 1.8218953575630853e-06, - "loss": 0.9355, - "step": 25415 - }, - { - "epoch": 0.65, - "learning_rate": 1.8218795950925787e-06, - "loss": 0.7588, - "step": 25416 - }, - { - "epoch": 0.65, - "learning_rate": 1.8218638319927968e-06, - "loss": 0.9121, - "step": 25417 - }, - { - "epoch": 0.65, - "learning_rate": 1.8218480682637516e-06, - "loss": 0.7695, - "step": 25418 - }, - { - "epoch": 0.65, - "learning_rate": 1.8218323039054548e-06, - "loss": 0.8379, - "step": 25419 - }, - { - "epoch": 0.65, - "learning_rate": 1.821816538917919e-06, - "loss": 0.8691, - "step": 25420 - }, - { - "epoch": 0.65, - "learning_rate": 1.821800773301156e-06, - "loss": 0.917, - "step": 25421 - }, - { - "epoch": 0.65, - "learning_rate": 1.8217850070551778e-06, - "loss": 0.9775, - "step": 25422 - }, - { - "epoch": 0.65, - "learning_rate": 1.821769240179997e-06, - "loss": 0.7793, - "step": 25423 - }, - { - "epoch": 0.65, - "learning_rate": 1.8217534726756249e-06, - "loss": 0.708, - "step": 25424 - }, - { - "epoch": 0.65, - "learning_rate": 1.821737704542074e-06, - "loss": 0.7778, - "step": 25425 - }, - { - "epoch": 0.65, - "learning_rate": 1.8217219357793564e-06, - "loss": 0.8296, - "step": 25426 - }, - { - "epoch": 0.65, - "learning_rate": 1.8217061663874845e-06, - "loss": 0.8828, - "step": 25427 - }, - { - "epoch": 0.65, - "learning_rate": 1.8216903963664694e-06, - "loss": 0.6934, - "step": 25428 - }, - { - "epoch": 0.65, - "learning_rate": 1.8216746257163237e-06, - "loss": 0.9844, - "step": 25429 - }, - { - "epoch": 0.65, - "learning_rate": 1.82165885443706e-06, - "loss": 0.6143, - "step": 25430 - }, - { - "epoch": 0.65, - "learning_rate": 1.8216430825286894e-06, - "loss": 1.001, - "step": 25431 - }, - { - "epoch": 0.65, - "learning_rate": 1.821627309991225e-06, - "loss": 0.9541, - "step": 25432 - }, - { - "epoch": 0.65, - "learning_rate": 1.8216115368246778e-06, - "loss": 0.7432, - "step": 25433 - }, - { - "epoch": 0.65, - "learning_rate": 1.821595763029061e-06, - "loss": 0.792, - "step": 25434 - }, - { - "epoch": 0.65, - "learning_rate": 1.8215799886043856e-06, - "loss": 0.7412, - "step": 25435 - }, - { - "epoch": 0.65, - "learning_rate": 1.8215642135506643e-06, - "loss": 0.792, - "step": 25436 - }, - { - "epoch": 0.65, - "learning_rate": 1.8215484378679094e-06, - "loss": 0.7041, - "step": 25437 - }, - { - "epoch": 0.65, - "learning_rate": 1.8215326615561322e-06, - "loss": 0.8701, - "step": 25438 - }, - { - "epoch": 0.65, - "learning_rate": 1.8215168846153452e-06, - "loss": 0.8584, - "step": 25439 - }, - { - "epoch": 0.65, - "learning_rate": 1.8215011070455608e-06, - "loss": 0.6178, - "step": 25440 - }, - { - "epoch": 0.65, - "learning_rate": 1.8214853288467907e-06, - "loss": 0.6904, - "step": 25441 - }, - { - "epoch": 0.65, - "learning_rate": 1.8214695500190472e-06, - "loss": 0.7705, - "step": 25442 - }, - { - "epoch": 0.65, - "learning_rate": 1.8214537705623419e-06, - "loss": 1.0811, - "step": 25443 - }, - { - "epoch": 0.65, - "learning_rate": 1.8214379904766873e-06, - "loss": 0.8945, - "step": 25444 - }, - { - "epoch": 0.65, - "learning_rate": 1.8214222097620955e-06, - "loss": 0.9043, - "step": 25445 - }, - { - "epoch": 0.65, - "learning_rate": 1.8214064284185783e-06, - "loss": 0.595, - "step": 25446 - }, - { - "epoch": 0.65, - "learning_rate": 1.8213906464461481e-06, - "loss": 0.6636, - "step": 25447 - }, - { - "epoch": 0.65, - "learning_rate": 1.821374863844817e-06, - "loss": 0.8545, - "step": 25448 - }, - { - "epoch": 0.65, - "learning_rate": 1.8213590806145968e-06, - "loss": 0.7798, - "step": 25449 - }, - { - "epoch": 0.65, - "learning_rate": 1.8213432967554998e-06, - "loss": 0.8291, - "step": 25450 - }, - { - "epoch": 0.65, - "learning_rate": 1.8213275122675378e-06, - "loss": 1.0371, - "step": 25451 - }, - { - "epoch": 0.65, - "learning_rate": 1.8213117271507233e-06, - "loss": 0.9043, - "step": 25452 - }, - { - "epoch": 0.65, - "learning_rate": 1.8212959414050681e-06, - "loss": 0.8701, - "step": 25453 - }, - { - "epoch": 0.65, - "learning_rate": 1.8212801550305844e-06, - "loss": 1.0391, - "step": 25454 - }, - { - "epoch": 0.65, - "learning_rate": 1.8212643680272844e-06, - "loss": 0.8838, - "step": 25455 - }, - { - "epoch": 0.65, - "learning_rate": 1.8212485803951797e-06, - "loss": 0.6284, - "step": 25456 - }, - { - "epoch": 0.65, - "learning_rate": 1.8212327921342826e-06, - "loss": 0.7002, - "step": 25457 - }, - { - "epoch": 0.65, - "learning_rate": 1.8212170032446057e-06, - "loss": 0.7461, - "step": 25458 - }, - { - "epoch": 0.65, - "learning_rate": 1.8212012137261606e-06, - "loss": 0.7012, - "step": 25459 - }, - { - "epoch": 0.65, - "learning_rate": 1.8211854235789595e-06, - "loss": 0.832, - "step": 25460 - }, - { - "epoch": 0.65, - "learning_rate": 1.8211696328030143e-06, - "loss": 0.6621, - "step": 25461 - }, - { - "epoch": 0.65, - "learning_rate": 1.8211538413983373e-06, - "loss": 0.8721, - "step": 25462 - }, - { - "epoch": 0.65, - "learning_rate": 1.8211380493649408e-06, - "loss": 0.6099, - "step": 25463 - }, - { - "epoch": 0.65, - "learning_rate": 1.8211222567028367e-06, - "loss": 1.04, - "step": 25464 - }, - { - "epoch": 0.65, - "learning_rate": 1.8211064634120367e-06, - "loss": 0.645, - "step": 25465 - }, - { - "epoch": 0.65, - "learning_rate": 1.8210906694925536e-06, - "loss": 0.8916, - "step": 25466 - }, - { - "epoch": 0.65, - "learning_rate": 1.8210748749443989e-06, - "loss": 0.7334, - "step": 25467 - }, - { - "epoch": 0.65, - "learning_rate": 1.821059079767585e-06, - "loss": 0.7266, - "step": 25468 - }, - { - "epoch": 0.65, - "learning_rate": 1.821043283962124e-06, - "loss": 0.8066, - "step": 25469 - }, - { - "epoch": 0.65, - "learning_rate": 1.8210274875280275e-06, - "loss": 0.7134, - "step": 25470 - }, - { - "epoch": 0.65, - "learning_rate": 1.8210116904653083e-06, - "loss": 1.001, - "step": 25471 - }, - { - "epoch": 0.65, - "learning_rate": 1.8209958927739784e-06, - "loss": 0.8877, - "step": 25472 - }, - { - "epoch": 0.65, - "learning_rate": 1.8209800944540495e-06, - "loss": 0.7451, - "step": 25473 - }, - { - "epoch": 0.65, - "learning_rate": 1.8209642955055338e-06, - "loss": 0.9224, - "step": 25474 - }, - { - "epoch": 0.65, - "learning_rate": 1.8209484959284437e-06, - "loss": 0.8936, - "step": 25475 - }, - { - "epoch": 0.65, - "learning_rate": 1.820932695722791e-06, - "loss": 0.6396, - "step": 25476 - }, - { - "epoch": 0.65, - "learning_rate": 1.8209168948885876e-06, - "loss": 0.9912, - "step": 25477 - }, - { - "epoch": 0.65, - "learning_rate": 1.8209010934258463e-06, - "loss": 0.9355, - "step": 25478 - }, - { - "epoch": 0.65, - "learning_rate": 1.8208852913345786e-06, - "loss": 0.6162, - "step": 25479 - }, - { - "epoch": 0.65, - "learning_rate": 1.8208694886147967e-06, - "loss": 0.8711, - "step": 25480 - }, - { - "epoch": 0.65, - "learning_rate": 1.8208536852665128e-06, - "loss": 0.8799, - "step": 25481 - }, - { - "epoch": 0.65, - "learning_rate": 1.820837881289739e-06, - "loss": 1.0459, - "step": 25482 - }, - { - "epoch": 0.65, - "learning_rate": 1.8208220766844874e-06, - "loss": 0.8242, - "step": 25483 - }, - { - "epoch": 0.65, - "learning_rate": 1.8208062714507702e-06, - "loss": 0.8408, - "step": 25484 - }, - { - "epoch": 0.65, - "learning_rate": 1.8207904655885992e-06, - "loss": 0.8975, - "step": 25485 - }, - { - "epoch": 0.65, - "learning_rate": 1.8207746590979868e-06, - "loss": 0.6084, - "step": 25486 - }, - { - "epoch": 0.65, - "learning_rate": 1.8207588519789447e-06, - "loss": 0.8413, - "step": 25487 - }, - { - "epoch": 0.65, - "learning_rate": 1.8207430442314857e-06, - "loss": 0.7295, - "step": 25488 - }, - { - "epoch": 0.65, - "learning_rate": 1.8207272358556214e-06, - "loss": 0.7949, - "step": 25489 - }, - { - "epoch": 0.65, - "learning_rate": 1.8207114268513638e-06, - "loss": 1.0635, - "step": 25490 - }, - { - "epoch": 0.65, - "learning_rate": 1.8206956172187252e-06, - "loss": 0.7983, - "step": 25491 - }, - { - "epoch": 0.65, - "learning_rate": 1.820679806957718e-06, - "loss": 0.8818, - "step": 25492 - }, - { - "epoch": 0.65, - "learning_rate": 1.8206639960683537e-06, - "loss": 1.0029, - "step": 25493 - }, - { - "epoch": 0.65, - "learning_rate": 1.8206481845506448e-06, - "loss": 1.0225, - "step": 25494 - }, - { - "epoch": 0.65, - "learning_rate": 1.8206323724046034e-06, - "loss": 0.5024, - "step": 25495 - }, - { - "epoch": 0.65, - "learning_rate": 1.8206165596302414e-06, - "loss": 0.9043, - "step": 25496 - }, - { - "epoch": 0.65, - "learning_rate": 1.820600746227571e-06, - "loss": 0.7373, - "step": 25497 - }, - { - "epoch": 0.65, - "learning_rate": 1.8205849321966046e-06, - "loss": 0.8604, - "step": 25498 - }, - { - "epoch": 0.65, - "learning_rate": 1.820569117537354e-06, - "loss": 0.9102, - "step": 25499 - }, - { - "epoch": 0.65, - "learning_rate": 1.820553302249831e-06, - "loss": 0.8467, - "step": 25500 - }, - { - "epoch": 0.65, - "learning_rate": 1.8205374863340484e-06, - "loss": 0.7822, - "step": 25501 - }, - { - "epoch": 0.65, - "learning_rate": 1.8205216697900178e-06, - "loss": 0.6562, - "step": 25502 - }, - { - "epoch": 0.65, - "learning_rate": 1.8205058526177517e-06, - "loss": 0.875, - "step": 25503 - }, - { - "epoch": 0.65, - "learning_rate": 1.8204900348172619e-06, - "loss": 0.6895, - "step": 25504 - }, - { - "epoch": 0.65, - "learning_rate": 1.8204742163885605e-06, - "loss": 0.6646, - "step": 25505 - }, - { - "epoch": 0.65, - "learning_rate": 1.82045839733166e-06, - "loss": 0.9883, - "step": 25506 - }, - { - "epoch": 0.65, - "learning_rate": 1.8204425776465717e-06, - "loss": 0.8408, - "step": 25507 - }, - { - "epoch": 0.65, - "learning_rate": 1.8204267573333087e-06, - "loss": 0.4619, - "step": 25508 - }, - { - "epoch": 0.65, - "learning_rate": 1.8204109363918824e-06, - "loss": 0.8306, - "step": 25509 - }, - { - "epoch": 0.65, - "learning_rate": 1.8203951148223053e-06, - "loss": 0.9453, - "step": 25510 - }, - { - "epoch": 0.65, - "learning_rate": 1.8203792926245894e-06, - "loss": 0.8613, - "step": 25511 - }, - { - "epoch": 0.65, - "learning_rate": 1.820363469798747e-06, - "loss": 0.7612, - "step": 25512 - }, - { - "epoch": 0.65, - "learning_rate": 1.8203476463447896e-06, - "loss": 0.7764, - "step": 25513 - }, - { - "epoch": 0.65, - "learning_rate": 1.82033182226273e-06, - "loss": 0.9131, - "step": 25514 - }, - { - "epoch": 0.65, - "learning_rate": 1.82031599755258e-06, - "loss": 0.9932, - "step": 25515 - }, - { - "epoch": 0.65, - "learning_rate": 1.8203001722143516e-06, - "loss": 1.0225, - "step": 25516 - }, - { - "epoch": 0.65, - "learning_rate": 1.8202843462480573e-06, - "loss": 0.8037, - "step": 25517 - }, - { - "epoch": 0.65, - "learning_rate": 1.820268519653709e-06, - "loss": 1.1807, - "step": 25518 - }, - { - "epoch": 0.65, - "learning_rate": 1.8202526924313184e-06, - "loss": 0.8564, - "step": 25519 - }, - { - "epoch": 0.65, - "learning_rate": 1.8202368645808982e-06, - "loss": 0.7441, - "step": 25520 - }, - { - "epoch": 0.65, - "learning_rate": 1.8202210361024605e-06, - "loss": 0.7144, - "step": 25521 - }, - { - "epoch": 0.65, - "learning_rate": 1.8202052069960176e-06, - "loss": 1.0752, - "step": 25522 - }, - { - "epoch": 0.65, - "learning_rate": 1.8201893772615808e-06, - "loss": 0.8516, - "step": 25523 - }, - { - "epoch": 0.65, - "learning_rate": 1.8201735468991629e-06, - "loss": 0.9023, - "step": 25524 - }, - { - "epoch": 0.65, - "learning_rate": 1.8201577159087757e-06, - "loss": 0.8779, - "step": 25525 - }, - { - "epoch": 0.65, - "learning_rate": 1.8201418842904316e-06, - "loss": 1.0146, - "step": 25526 - }, - { - "epoch": 0.65, - "learning_rate": 1.8201260520441423e-06, - "loss": 0.5942, - "step": 25527 - }, - { - "epoch": 0.65, - "learning_rate": 1.8201102191699204e-06, - "loss": 0.8408, - "step": 25528 - }, - { - "epoch": 0.65, - "learning_rate": 1.8200943856677777e-06, - "loss": 0.7559, - "step": 25529 - }, - { - "epoch": 0.65, - "learning_rate": 1.8200785515377265e-06, - "loss": 1.0137, - "step": 25530 - }, - { - "epoch": 0.65, - "learning_rate": 1.820062716779779e-06, - "loss": 0.7158, - "step": 25531 - }, - { - "epoch": 0.65, - "learning_rate": 1.820046881393947e-06, - "loss": 1.1621, - "step": 25532 - }, - { - "epoch": 0.65, - "learning_rate": 1.8200310453802433e-06, - "loss": 0.9111, - "step": 25533 - }, - { - "epoch": 0.65, - "learning_rate": 1.8200152087386788e-06, - "loss": 0.9331, - "step": 25534 - }, - { - "epoch": 0.65, - "learning_rate": 1.8199993714692667e-06, - "loss": 0.9473, - "step": 25535 - }, - { - "epoch": 0.65, - "learning_rate": 1.8199835335720187e-06, - "loss": 0.8281, - "step": 25536 - }, - { - "epoch": 0.65, - "learning_rate": 1.8199676950469472e-06, - "loss": 0.9375, - "step": 25537 - }, - { - "epoch": 0.65, - "learning_rate": 1.8199518558940641e-06, - "loss": 0.834, - "step": 25538 - }, - { - "epoch": 0.65, - "learning_rate": 1.8199360161133814e-06, - "loss": 0.3955, - "step": 25539 - }, - { - "epoch": 0.65, - "learning_rate": 1.8199201757049116e-06, - "loss": 0.719, - "step": 25540 - }, - { - "epoch": 0.65, - "learning_rate": 1.8199043346686664e-06, - "loss": 0.7048, - "step": 25541 - }, - { - "epoch": 0.65, - "learning_rate": 1.8198884930046583e-06, - "loss": 0.8203, - "step": 25542 - }, - { - "epoch": 0.65, - "learning_rate": 1.8198726507128992e-06, - "loss": 0.7754, - "step": 25543 - }, - { - "epoch": 0.65, - "learning_rate": 1.8198568077934016e-06, - "loss": 0.6074, - "step": 25544 - }, - { - "epoch": 0.65, - "learning_rate": 1.8198409642461767e-06, - "loss": 0.7349, - "step": 25545 - }, - { - "epoch": 0.65, - "learning_rate": 1.8198251200712378e-06, - "loss": 1.1689, - "step": 25546 - }, - { - "epoch": 0.65, - "learning_rate": 1.8198092752685965e-06, - "loss": 0.8418, - "step": 25547 - }, - { - "epoch": 0.65, - "learning_rate": 1.8197934298382646e-06, - "loss": 0.791, - "step": 25548 - }, - { - "epoch": 0.65, - "learning_rate": 1.819777583780255e-06, - "loss": 1.0, - "step": 25549 - }, - { - "epoch": 0.65, - "learning_rate": 1.8197617370945788e-06, - "loss": 0.7329, - "step": 25550 - }, - { - "epoch": 0.65, - "learning_rate": 1.8197458897812492e-06, - "loss": 0.9395, - "step": 25551 - }, - { - "epoch": 0.65, - "learning_rate": 1.8197300418402776e-06, - "loss": 0.8018, - "step": 25552 - }, - { - "epoch": 0.65, - "learning_rate": 1.8197141932716766e-06, - "loss": 0.9453, - "step": 25553 - }, - { - "epoch": 0.65, - "learning_rate": 1.8196983440754584e-06, - "loss": 0.7334, - "step": 25554 - }, - { - "epoch": 0.65, - "learning_rate": 1.8196824942516344e-06, - "loss": 0.8828, - "step": 25555 - }, - { - "epoch": 0.66, - "learning_rate": 1.8196666438002174e-06, - "loss": 0.9014, - "step": 25556 - }, - { - "epoch": 0.66, - "learning_rate": 1.8196507927212193e-06, - "loss": 0.8691, - "step": 25557 - }, - { - "epoch": 0.66, - "learning_rate": 1.8196349410146521e-06, - "loss": 0.9238, - "step": 25558 - }, - { - "epoch": 0.66, - "learning_rate": 1.8196190886805284e-06, - "loss": 0.939, - "step": 25559 - }, - { - "epoch": 0.66, - "learning_rate": 1.81960323571886e-06, - "loss": 0.8174, - "step": 25560 - }, - { - "epoch": 0.66, - "learning_rate": 1.819587382129659e-06, - "loss": 0.6157, - "step": 25561 - }, - { - "epoch": 0.66, - "learning_rate": 1.8195715279129375e-06, - "loss": 0.9639, - "step": 25562 - }, - { - "epoch": 0.66, - "learning_rate": 1.819555673068708e-06, - "loss": 0.8975, - "step": 25563 - }, - { - "epoch": 0.66, - "learning_rate": 1.8195398175969825e-06, - "loss": 0.9111, - "step": 25564 - }, - { - "epoch": 0.66, - "learning_rate": 1.8195239614977726e-06, - "loss": 0.9229, - "step": 25565 - }, - { - "epoch": 0.66, - "learning_rate": 1.8195081047710912e-06, - "loss": 0.8022, - "step": 25566 - }, - { - "epoch": 0.66, - "learning_rate": 1.8194922474169503e-06, - "loss": 0.9541, - "step": 25567 - }, - { - "epoch": 0.66, - "learning_rate": 1.8194763894353615e-06, - "loss": 1.0059, - "step": 25568 - }, - { - "epoch": 0.66, - "learning_rate": 1.8194605308263375e-06, - "loss": 0.7729, - "step": 25569 - }, - { - "epoch": 0.66, - "learning_rate": 1.81944467158989e-06, - "loss": 0.8066, - "step": 25570 - }, - { - "epoch": 0.66, - "learning_rate": 1.8194288117260319e-06, - "loss": 0.7441, - "step": 25571 - }, - { - "epoch": 0.66, - "learning_rate": 1.8194129512347744e-06, - "loss": 0.791, - "step": 25572 - }, - { - "epoch": 0.66, - "learning_rate": 1.8193970901161305e-06, - "loss": 0.918, - "step": 25573 - }, - { - "epoch": 0.66, - "learning_rate": 1.8193812283701115e-06, - "loss": 0.9102, - "step": 25574 - }, - { - "epoch": 0.66, - "learning_rate": 1.81936536599673e-06, - "loss": 0.665, - "step": 25575 - }, - { - "epoch": 0.66, - "learning_rate": 1.8193495029959984e-06, - "loss": 0.9453, - "step": 25576 - }, - { - "epoch": 0.66, - "learning_rate": 1.819333639367928e-06, - "loss": 0.998, - "step": 25577 - }, - { - "epoch": 0.66, - "learning_rate": 1.8193177751125322e-06, - "loss": 0.917, - "step": 25578 - }, - { - "epoch": 0.66, - "learning_rate": 1.819301910229822e-06, - "loss": 0.7102, - "step": 25579 - }, - { - "epoch": 0.66, - "learning_rate": 1.8192860447198104e-06, - "loss": 0.7793, - "step": 25580 - }, - { - "epoch": 0.66, - "learning_rate": 1.8192701785825087e-06, - "loss": 0.8135, - "step": 25581 - }, - { - "epoch": 0.66, - "learning_rate": 1.81925431181793e-06, - "loss": 0.9609, - "step": 25582 - }, - { - "epoch": 0.66, - "learning_rate": 1.8192384444260855e-06, - "loss": 1.0615, - "step": 25583 - }, - { - "epoch": 0.66, - "learning_rate": 1.819222576406988e-06, - "loss": 0.8926, - "step": 25584 - }, - { - "epoch": 0.66, - "learning_rate": 1.8192067077606495e-06, - "loss": 0.7549, - "step": 25585 - }, - { - "epoch": 0.66, - "learning_rate": 1.8191908384870817e-06, - "loss": 1.1797, - "step": 25586 - }, - { - "epoch": 0.66, - "learning_rate": 1.8191749685862977e-06, - "loss": 0.877, - "step": 25587 - }, - { - "epoch": 0.66, - "learning_rate": 1.8191590980583084e-06, - "loss": 0.7139, - "step": 25588 - }, - { - "epoch": 0.66, - "learning_rate": 1.8191432269031273e-06, - "loss": 0.7441, - "step": 25589 - }, - { - "epoch": 0.66, - "learning_rate": 1.8191273551207656e-06, - "loss": 0.9434, - "step": 25590 - }, - { - "epoch": 0.66, - "learning_rate": 1.8191114827112358e-06, - "loss": 0.7859, - "step": 25591 - }, - { - "epoch": 0.66, - "learning_rate": 1.8190956096745499e-06, - "loss": 0.9932, - "step": 25592 - }, - { - "epoch": 0.66, - "learning_rate": 1.81907973601072e-06, - "loss": 0.9072, - "step": 25593 - }, - { - "epoch": 0.66, - "learning_rate": 1.8190638617197588e-06, - "loss": 0.8164, - "step": 25594 - }, - { - "epoch": 0.66, - "learning_rate": 1.819047986801678e-06, - "loss": 0.7148, - "step": 25595 - }, - { - "epoch": 0.66, - "learning_rate": 1.8190321112564896e-06, - "loss": 0.6992, - "step": 25596 - }, - { - "epoch": 0.66, - "learning_rate": 1.8190162350842063e-06, - "loss": 0.9619, - "step": 25597 - }, - { - "epoch": 0.66, - "learning_rate": 1.8190003582848397e-06, - "loss": 0.791, - "step": 25598 - }, - { - "epoch": 0.66, - "learning_rate": 1.8189844808584024e-06, - "loss": 0.8027, - "step": 25599 - }, - { - "epoch": 0.66, - "learning_rate": 1.8189686028049059e-06, - "loss": 0.7617, - "step": 25600 - }, - { - "epoch": 0.66, - "learning_rate": 1.818952724124363e-06, - "loss": 0.9551, - "step": 25601 - }, - { - "epoch": 0.66, - "learning_rate": 1.818936844816786e-06, - "loss": 0.8643, - "step": 25602 - }, - { - "epoch": 0.66, - "learning_rate": 1.8189209648821864e-06, - "loss": 0.9834, - "step": 25603 - }, - { - "epoch": 0.66, - "learning_rate": 1.8189050843205766e-06, - "loss": 0.9561, - "step": 25604 - }, - { - "epoch": 0.66, - "learning_rate": 1.818889203131969e-06, - "loss": 0.6658, - "step": 25605 - }, - { - "epoch": 0.66, - "learning_rate": 1.8188733213163754e-06, - "loss": 1.0703, - "step": 25606 - }, - { - "epoch": 0.66, - "learning_rate": 1.8188574388738083e-06, - "loss": 0.7822, - "step": 25607 - }, - { - "epoch": 0.66, - "learning_rate": 1.8188415558042797e-06, - "loss": 0.8955, - "step": 25608 - }, - { - "epoch": 0.66, - "learning_rate": 1.8188256721078017e-06, - "loss": 0.7905, - "step": 25609 - }, - { - "epoch": 0.66, - "learning_rate": 1.8188097877843867e-06, - "loss": 0.9727, - "step": 25610 - }, - { - "epoch": 0.66, - "learning_rate": 1.8187939028340464e-06, - "loss": 0.7314, - "step": 25611 - }, - { - "epoch": 0.66, - "learning_rate": 1.8187780172567938e-06, - "loss": 0.8369, - "step": 25612 - }, - { - "epoch": 0.66, - "learning_rate": 1.81876213105264e-06, - "loss": 1.0166, - "step": 25613 - }, - { - "epoch": 0.66, - "learning_rate": 1.8187462442215977e-06, - "loss": 0.7856, - "step": 25614 - }, - { - "epoch": 0.66, - "learning_rate": 1.8187303567636795e-06, - "loss": 0.8169, - "step": 25615 - }, - { - "epoch": 0.66, - "learning_rate": 1.8187144686788965e-06, - "loss": 0.8467, - "step": 25616 - }, - { - "epoch": 0.66, - "learning_rate": 1.8186985799672617e-06, - "loss": 0.9121, - "step": 25617 - }, - { - "epoch": 0.66, - "learning_rate": 1.8186826906287872e-06, - "loss": 0.8291, - "step": 25618 - }, - { - "epoch": 0.66, - "learning_rate": 1.818666800663485e-06, - "loss": 0.9385, - "step": 25619 - }, - { - "epoch": 0.66, - "learning_rate": 1.8186509100713673e-06, - "loss": 0.9502, - "step": 25620 - }, - { - "epoch": 0.66, - "learning_rate": 1.8186350188524461e-06, - "loss": 0.8652, - "step": 25621 - }, - { - "epoch": 0.66, - "learning_rate": 1.8186191270067338e-06, - "loss": 0.8516, - "step": 25622 - }, - { - "epoch": 0.66, - "learning_rate": 1.8186032345342424e-06, - "loss": 0.8506, - "step": 25623 - }, - { - "epoch": 0.66, - "learning_rate": 1.8185873414349842e-06, - "loss": 0.791, - "step": 25624 - }, - { - "epoch": 0.66, - "learning_rate": 1.8185714477089711e-06, - "loss": 0.7988, - "step": 25625 - }, - { - "epoch": 0.66, - "learning_rate": 1.8185555533562158e-06, - "loss": 1.0713, - "step": 25626 - }, - { - "epoch": 0.66, - "learning_rate": 1.81853965837673e-06, - "loss": 0.5459, - "step": 25627 - }, - { - "epoch": 0.66, - "learning_rate": 1.818523762770526e-06, - "loss": 0.7681, - "step": 25628 - }, - { - "epoch": 0.66, - "learning_rate": 1.818507866537616e-06, - "loss": 0.8379, - "step": 25629 - }, - { - "epoch": 0.66, - "learning_rate": 1.8184919696780124e-06, - "loss": 0.748, - "step": 25630 - }, - { - "epoch": 0.66, - "learning_rate": 1.8184760721917268e-06, - "loss": 0.7588, - "step": 25631 - }, - { - "epoch": 0.66, - "learning_rate": 1.818460174078772e-06, - "loss": 0.9043, - "step": 25632 - }, - { - "epoch": 0.66, - "learning_rate": 1.8184442753391596e-06, - "loss": 0.8042, - "step": 25633 - }, - { - "epoch": 0.66, - "learning_rate": 1.8184283759729022e-06, - "loss": 0.96, - "step": 25634 - }, - { - "epoch": 0.66, - "learning_rate": 1.8184124759800117e-06, - "loss": 0.8574, - "step": 25635 - }, - { - "epoch": 0.66, - "learning_rate": 1.8183965753605004e-06, - "loss": 0.8389, - "step": 25636 - }, - { - "epoch": 0.66, - "learning_rate": 1.8183806741143806e-06, - "loss": 0.7988, - "step": 25637 - }, - { - "epoch": 0.66, - "learning_rate": 1.8183647722416644e-06, - "loss": 0.8291, - "step": 25638 - }, - { - "epoch": 0.66, - "learning_rate": 1.8183488697423638e-06, - "loss": 0.6948, - "step": 25639 - }, - { - "epoch": 0.66, - "learning_rate": 1.818332966616491e-06, - "loss": 0.8755, - "step": 25640 - }, - { - "epoch": 0.66, - "learning_rate": 1.8183170628640588e-06, - "loss": 1.0312, - "step": 25641 - }, - { - "epoch": 0.66, - "learning_rate": 1.8183011584850782e-06, - "loss": 1.0146, - "step": 25642 - }, - { - "epoch": 0.66, - "learning_rate": 1.8182852534795623e-06, - "loss": 0.7803, - "step": 25643 - }, - { - "epoch": 0.66, - "learning_rate": 1.818269347847523e-06, - "loss": 0.8857, - "step": 25644 - }, - { - "epoch": 0.66, - "learning_rate": 1.8182534415889725e-06, - "loss": 0.7544, - "step": 25645 - }, - { - "epoch": 0.66, - "learning_rate": 1.818237534703923e-06, - "loss": 0.645, - "step": 25646 - }, - { - "epoch": 0.66, - "learning_rate": 1.8182216271923866e-06, - "loss": 0.7402, - "step": 25647 - }, - { - "epoch": 0.66, - "learning_rate": 1.8182057190543754e-06, - "loss": 0.7134, - "step": 25648 - }, - { - "epoch": 0.66, - "learning_rate": 1.818189810289902e-06, - "loss": 0.9189, - "step": 25649 - }, - { - "epoch": 0.66, - "learning_rate": 1.8181739008989779e-06, - "loss": 0.834, - "step": 25650 - }, - { - "epoch": 0.66, - "learning_rate": 1.8181579908816161e-06, - "loss": 0.7061, - "step": 25651 - }, - { - "epoch": 0.66, - "learning_rate": 1.818142080237828e-06, - "loss": 1.0283, - "step": 25652 - }, - { - "epoch": 0.66, - "learning_rate": 1.8181261689676262e-06, - "loss": 0.9873, - "step": 25653 - }, - { - "epoch": 0.66, - "learning_rate": 1.818110257071023e-06, - "loss": 0.8711, - "step": 25654 - }, - { - "epoch": 0.66, - "learning_rate": 1.8180943445480301e-06, - "loss": 0.7866, - "step": 25655 - }, - { - "epoch": 0.66, - "learning_rate": 1.81807843139866e-06, - "loss": 0.6836, - "step": 25656 - }, - { - "epoch": 0.66, - "learning_rate": 1.8180625176229253e-06, - "loss": 0.8555, - "step": 25657 - }, - { - "epoch": 0.66, - "learning_rate": 1.8180466032208373e-06, - "loss": 0.7183, - "step": 25658 - }, - { - "epoch": 0.66, - "learning_rate": 1.8180306881924086e-06, - "loss": 0.8291, - "step": 25659 - }, - { - "epoch": 0.66, - "learning_rate": 1.8180147725376516e-06, - "loss": 0.8594, - "step": 25660 - }, - { - "epoch": 0.66, - "learning_rate": 1.8179988562565782e-06, - "loss": 0.7037, - "step": 25661 - }, - { - "epoch": 0.66, - "learning_rate": 1.8179829393492008e-06, - "loss": 0.8057, - "step": 25662 - }, - { - "epoch": 0.66, - "learning_rate": 1.8179670218155315e-06, - "loss": 1.0273, - "step": 25663 - }, - { - "epoch": 0.66, - "learning_rate": 1.8179511036555825e-06, - "loss": 1.0137, - "step": 25664 - }, - { - "epoch": 0.66, - "learning_rate": 1.8179351848693658e-06, - "loss": 0.8186, - "step": 25665 - }, - { - "epoch": 0.66, - "learning_rate": 1.8179192654568937e-06, - "loss": 0.9697, - "step": 25666 - }, - { - "epoch": 0.66, - "learning_rate": 1.8179033454181786e-06, - "loss": 1.0693, - "step": 25667 - }, - { - "epoch": 0.66, - "learning_rate": 1.8178874247532322e-06, - "loss": 0.8994, - "step": 25668 - }, - { - "epoch": 0.66, - "learning_rate": 1.8178715034620673e-06, - "loss": 0.9209, - "step": 25669 - }, - { - "epoch": 0.66, - "learning_rate": 1.8178555815446959e-06, - "loss": 0.9111, - "step": 25670 - }, - { - "epoch": 0.66, - "learning_rate": 1.8178396590011297e-06, - "loss": 0.9746, - "step": 25671 - }, - { - "epoch": 0.66, - "learning_rate": 1.8178237358313817e-06, - "loss": 0.8525, - "step": 25672 - }, - { - "epoch": 0.66, - "learning_rate": 1.8178078120354633e-06, - "loss": 0.9111, - "step": 25673 - }, - { - "epoch": 0.66, - "learning_rate": 1.8177918876133873e-06, - "loss": 0.7305, - "step": 25674 - }, - { - "epoch": 0.66, - "learning_rate": 1.8177759625651658e-06, - "loss": 1.1494, - "step": 25675 - }, - { - "epoch": 0.66, - "learning_rate": 1.8177600368908106e-06, - "loss": 0.9634, - "step": 25676 - }, - { - "epoch": 0.66, - "learning_rate": 1.8177441105903342e-06, - "loss": 0.7031, - "step": 25677 - }, - { - "epoch": 0.66, - "learning_rate": 1.8177281836637488e-06, - "loss": 0.582, - "step": 25678 - }, - { - "epoch": 0.66, - "learning_rate": 1.8177122561110663e-06, - "loss": 0.8857, - "step": 25679 - }, - { - "epoch": 0.66, - "learning_rate": 1.8176963279322992e-06, - "loss": 0.8936, - "step": 25680 - }, - { - "epoch": 0.66, - "learning_rate": 1.8176803991274595e-06, - "loss": 0.6755, - "step": 25681 - }, - { - "epoch": 0.66, - "learning_rate": 1.81766446969656e-06, - "loss": 0.8076, - "step": 25682 - }, - { - "epoch": 0.66, - "learning_rate": 1.8176485396396121e-06, - "loss": 0.8135, - "step": 25683 - }, - { - "epoch": 0.66, - "learning_rate": 1.8176326089566283e-06, - "loss": 0.9775, - "step": 25684 - }, - { - "epoch": 0.66, - "learning_rate": 1.8176166776476206e-06, - "loss": 1.0186, - "step": 25685 - }, - { - "epoch": 0.66, - "learning_rate": 1.8176007457126019e-06, - "loss": 1.0488, - "step": 25686 - }, - { - "epoch": 0.66, - "learning_rate": 1.8175848131515836e-06, - "loss": 0.877, - "step": 25687 - }, - { - "epoch": 0.66, - "learning_rate": 1.817568879964578e-06, - "loss": 0.7607, - "step": 25688 - }, - { - "epoch": 0.66, - "learning_rate": 1.8175529461515979e-06, - "loss": 0.864, - "step": 25689 - }, - { - "epoch": 0.66, - "learning_rate": 1.8175370117126548e-06, - "loss": 1.1172, - "step": 25690 - }, - { - "epoch": 0.66, - "learning_rate": 1.8175210766477616e-06, - "loss": 0.9209, - "step": 25691 - }, - { - "epoch": 0.66, - "learning_rate": 1.8175051409569297e-06, - "loss": 0.9141, - "step": 25692 - }, - { - "epoch": 0.66, - "learning_rate": 1.817489204640172e-06, - "loss": 0.9043, - "step": 25693 - }, - { - "epoch": 0.66, - "learning_rate": 1.8174732676975002e-06, - "loss": 1.041, - "step": 25694 - }, - { - "epoch": 0.66, - "learning_rate": 1.8174573301289269e-06, - "loss": 0.8145, - "step": 25695 - }, - { - "epoch": 0.66, - "learning_rate": 1.817441391934464e-06, - "loss": 0.8887, - "step": 25696 - }, - { - "epoch": 0.66, - "learning_rate": 1.8174254531141238e-06, - "loss": 0.8623, - "step": 25697 - }, - { - "epoch": 0.66, - "learning_rate": 1.8174095136679184e-06, - "loss": 0.8623, - "step": 25698 - }, - { - "epoch": 0.66, - "learning_rate": 1.8173935735958604e-06, - "loss": 0.9824, - "step": 25699 - }, - { - "epoch": 0.66, - "learning_rate": 1.8173776328979616e-06, - "loss": 0.7441, - "step": 25700 - }, - { - "epoch": 0.66, - "learning_rate": 1.8173616915742343e-06, - "loss": 0.6372, - "step": 25701 - }, - { - "epoch": 0.66, - "learning_rate": 1.8173457496246906e-06, - "loss": 0.6699, - "step": 25702 - }, - { - "epoch": 0.66, - "learning_rate": 1.8173298070493428e-06, - "loss": 0.9121, - "step": 25703 - }, - { - "epoch": 0.66, - "learning_rate": 1.8173138638482035e-06, - "loss": 0.8311, - "step": 25704 - }, - { - "epoch": 0.66, - "learning_rate": 1.8172979200212843e-06, - "loss": 0.9609, - "step": 25705 - }, - { - "epoch": 0.66, - "learning_rate": 1.8172819755685976e-06, - "loss": 0.9326, - "step": 25706 - }, - { - "epoch": 0.66, - "learning_rate": 1.817266030490156e-06, - "loss": 0.9258, - "step": 25707 - }, - { - "epoch": 0.66, - "learning_rate": 1.8172500847859711e-06, - "loss": 0.7842, - "step": 25708 - }, - { - "epoch": 0.66, - "learning_rate": 1.8172341384560554e-06, - "loss": 0.8262, - "step": 25709 - }, - { - "epoch": 0.66, - "learning_rate": 1.8172181915004213e-06, - "loss": 0.6383, - "step": 25710 - }, - { - "epoch": 0.66, - "learning_rate": 1.8172022439190806e-06, - "loss": 0.7754, - "step": 25711 - }, - { - "epoch": 0.66, - "learning_rate": 1.8171862957120458e-06, - "loss": 1.0596, - "step": 25712 - }, - { - "epoch": 0.66, - "learning_rate": 1.8171703468793292e-06, - "loss": 1.0967, - "step": 25713 - }, - { - "epoch": 0.66, - "learning_rate": 1.8171543974209426e-06, - "loss": 0.772, - "step": 25714 - }, - { - "epoch": 0.66, - "learning_rate": 1.8171384473368984e-06, - "loss": 0.8252, - "step": 25715 - }, - { - "epoch": 0.66, - "learning_rate": 1.817122496627209e-06, - "loss": 0.8096, - "step": 25716 - }, - { - "epoch": 0.66, - "learning_rate": 1.8171065452918866e-06, - "loss": 0.7793, - "step": 25717 - }, - { - "epoch": 0.66, - "learning_rate": 1.8170905933309428e-06, - "loss": 0.7871, - "step": 25718 - }, - { - "epoch": 0.66, - "learning_rate": 1.8170746407443906e-06, - "loss": 0.7334, - "step": 25719 - }, - { - "epoch": 0.66, - "learning_rate": 1.817058687532242e-06, - "loss": 0.915, - "step": 25720 - }, - { - "epoch": 0.66, - "learning_rate": 1.8170427336945092e-06, - "loss": 0.8271, - "step": 25721 - }, - { - "epoch": 0.66, - "learning_rate": 1.8170267792312042e-06, - "loss": 0.9111, - "step": 25722 - }, - { - "epoch": 0.66, - "learning_rate": 1.8170108241423395e-06, - "loss": 0.9609, - "step": 25723 - }, - { - "epoch": 0.66, - "learning_rate": 1.8169948684279271e-06, - "loss": 1.0107, - "step": 25724 - }, - { - "epoch": 0.66, - "learning_rate": 1.8169789120879793e-06, - "loss": 0.7754, - "step": 25725 - }, - { - "epoch": 0.66, - "learning_rate": 1.8169629551225084e-06, - "loss": 0.917, - "step": 25726 - }, - { - "epoch": 0.66, - "learning_rate": 1.8169469975315263e-06, - "loss": 0.8574, - "step": 25727 - }, - { - "epoch": 0.66, - "learning_rate": 1.8169310393150456e-06, - "loss": 0.8281, - "step": 25728 - }, - { - "epoch": 0.66, - "learning_rate": 1.8169150804730783e-06, - "loss": 0.8125, - "step": 25729 - }, - { - "epoch": 0.66, - "learning_rate": 1.8168991210056368e-06, - "loss": 0.9897, - "step": 25730 - }, - { - "epoch": 0.66, - "learning_rate": 1.816883160912733e-06, - "loss": 0.9658, - "step": 25731 - }, - { - "epoch": 0.66, - "learning_rate": 1.8168672001943794e-06, - "loss": 0.7852, - "step": 25732 - }, - { - "epoch": 0.66, - "learning_rate": 1.8168512388505884e-06, - "loss": 0.6357, - "step": 25733 - }, - { - "epoch": 0.66, - "learning_rate": 1.8168352768813716e-06, - "loss": 0.9492, - "step": 25734 - }, - { - "epoch": 0.66, - "learning_rate": 1.816819314286742e-06, - "loss": 0.833, - "step": 25735 - }, - { - "epoch": 0.66, - "learning_rate": 1.816803351066711e-06, - "loss": 0.8965, - "step": 25736 - }, - { - "epoch": 0.66, - "learning_rate": 1.8167873872212914e-06, - "loss": 0.9297, - "step": 25737 - }, - { - "epoch": 0.66, - "learning_rate": 1.8167714227504951e-06, - "loss": 1.002, - "step": 25738 - }, - { - "epoch": 0.66, - "learning_rate": 1.8167554576543349e-06, - "loss": 0.8506, - "step": 25739 - }, - { - "epoch": 0.66, - "learning_rate": 1.816739491932822e-06, - "loss": 0.8076, - "step": 25740 - }, - { - "epoch": 0.66, - "learning_rate": 1.8167235255859698e-06, - "loss": 1.0527, - "step": 25741 - }, - { - "epoch": 0.66, - "learning_rate": 1.8167075586137897e-06, - "loss": 0.8711, - "step": 25742 - }, - { - "epoch": 0.66, - "learning_rate": 1.8166915910162942e-06, - "loss": 0.8799, - "step": 25743 - }, - { - "epoch": 0.66, - "learning_rate": 1.8166756227934954e-06, - "loss": 0.8037, - "step": 25744 - }, - { - "epoch": 0.66, - "learning_rate": 1.8166596539454058e-06, - "loss": 0.79, - "step": 25745 - }, - { - "epoch": 0.66, - "learning_rate": 1.8166436844720372e-06, - "loss": 0.791, - "step": 25746 - }, - { - "epoch": 0.66, - "learning_rate": 1.8166277143734022e-06, - "loss": 0.8682, - "step": 25747 - }, - { - "epoch": 0.66, - "learning_rate": 1.816611743649513e-06, - "loss": 0.8423, - "step": 25748 - }, - { - "epoch": 0.66, - "learning_rate": 1.8165957723003818e-06, - "loss": 0.7191, - "step": 25749 - }, - { - "epoch": 0.66, - "learning_rate": 1.8165798003260203e-06, - "loss": 0.8135, - "step": 25750 - }, - { - "epoch": 0.66, - "learning_rate": 1.816563827726442e-06, - "loss": 0.8706, - "step": 25751 - }, - { - "epoch": 0.66, - "learning_rate": 1.8165478545016576e-06, - "loss": 1.0635, - "step": 25752 - }, - { - "epoch": 0.66, - "learning_rate": 1.8165318806516804e-06, - "loss": 0.9727, - "step": 25753 - }, - { - "epoch": 0.66, - "learning_rate": 1.8165159061765223e-06, - "loss": 0.915, - "step": 25754 - }, - { - "epoch": 0.66, - "learning_rate": 1.8164999310761954e-06, - "loss": 0.8203, - "step": 25755 - }, - { - "epoch": 0.66, - "learning_rate": 1.8164839553507121e-06, - "loss": 0.8447, - "step": 25756 - }, - { - "epoch": 0.66, - "learning_rate": 1.8164679790000846e-06, - "loss": 0.8525, - "step": 25757 - }, - { - "epoch": 0.66, - "learning_rate": 1.816452002024325e-06, - "loss": 0.7959, - "step": 25758 - }, - { - "epoch": 0.66, - "learning_rate": 1.8164360244234459e-06, - "loss": 0.8496, - "step": 25759 - }, - { - "epoch": 0.66, - "learning_rate": 1.8164200461974588e-06, - "loss": 0.7305, - "step": 25760 - }, - { - "epoch": 0.66, - "learning_rate": 1.8164040673463767e-06, - "loss": 0.8672, - "step": 25761 - }, - { - "epoch": 0.66, - "learning_rate": 1.8163880878702116e-06, - "loss": 0.9521, - "step": 25762 - }, - { - "epoch": 0.66, - "learning_rate": 1.8163721077689757e-06, - "loss": 0.7515, - "step": 25763 - }, - { - "epoch": 0.66, - "learning_rate": 1.816356127042681e-06, - "loss": 0.8462, - "step": 25764 - }, - { - "epoch": 0.66, - "learning_rate": 1.8163401456913402e-06, - "loss": 0.9912, - "step": 25765 - }, - { - "epoch": 0.66, - "learning_rate": 1.816324163714965e-06, - "loss": 0.8301, - "step": 25766 - }, - { - "epoch": 0.66, - "learning_rate": 1.8163081811135683e-06, - "loss": 0.999, - "step": 25767 - }, - { - "epoch": 0.66, - "learning_rate": 1.8162921978871616e-06, - "loss": 0.5903, - "step": 25768 - }, - { - "epoch": 0.66, - "learning_rate": 1.8162762140357577e-06, - "loss": 0.7783, - "step": 25769 - }, - { - "epoch": 0.66, - "learning_rate": 1.8162602295593686e-06, - "loss": 0.8936, - "step": 25770 - }, - { - "epoch": 0.66, - "learning_rate": 1.8162442444580064e-06, - "loss": 0.8965, - "step": 25771 - }, - { - "epoch": 0.66, - "learning_rate": 1.8162282587316837e-06, - "loss": 0.7065, - "step": 25772 - }, - { - "epoch": 0.66, - "learning_rate": 1.8162122723804126e-06, - "loss": 0.7158, - "step": 25773 - }, - { - "epoch": 0.66, - "learning_rate": 1.8161962854042052e-06, - "loss": 0.8145, - "step": 25774 - }, - { - "epoch": 0.66, - "learning_rate": 1.8161802978030737e-06, - "loss": 0.6084, - "step": 25775 - }, - { - "epoch": 0.66, - "learning_rate": 1.8161643095770307e-06, - "loss": 0.8198, - "step": 25776 - }, - { - "epoch": 0.66, - "learning_rate": 1.8161483207260883e-06, - "loss": 1.04, - "step": 25777 - }, - { - "epoch": 0.66, - "learning_rate": 1.8161323312502584e-06, - "loss": 0.8564, - "step": 25778 - }, - { - "epoch": 0.66, - "learning_rate": 1.8161163411495538e-06, - "loss": 0.603, - "step": 25779 - }, - { - "epoch": 0.66, - "learning_rate": 1.8161003504239862e-06, - "loss": 0.7246, - "step": 25780 - }, - { - "epoch": 0.66, - "learning_rate": 1.8160843590735682e-06, - "loss": 0.5781, - "step": 25781 - }, - { - "epoch": 0.66, - "learning_rate": 1.8160683670983117e-06, - "loss": 0.8882, - "step": 25782 - }, - { - "epoch": 0.66, - "learning_rate": 1.8160523744982295e-06, - "loss": 0.7627, - "step": 25783 - }, - { - "epoch": 0.66, - "learning_rate": 1.8160363812733333e-06, - "loss": 1.0342, - "step": 25784 - }, - { - "epoch": 0.66, - "learning_rate": 1.8160203874236355e-06, - "loss": 0.7881, - "step": 25785 - }, - { - "epoch": 0.66, - "learning_rate": 1.8160043929491486e-06, - "loss": 0.8818, - "step": 25786 - }, - { - "epoch": 0.66, - "learning_rate": 1.8159883978498845e-06, - "loss": 0.7471, - "step": 25787 - }, - { - "epoch": 0.66, - "learning_rate": 1.815972402125856e-06, - "loss": 1.0322, - "step": 25788 - }, - { - "epoch": 0.66, - "learning_rate": 1.8159564057770744e-06, - "loss": 0.6826, - "step": 25789 - }, - { - "epoch": 0.66, - "learning_rate": 1.8159404088035527e-06, - "loss": 0.8701, - "step": 25790 - }, - { - "epoch": 0.66, - "learning_rate": 1.8159244112053032e-06, - "loss": 1.0215, - "step": 25791 - }, - { - "epoch": 0.66, - "learning_rate": 1.8159084129823376e-06, - "loss": 0.7031, - "step": 25792 - }, - { - "epoch": 0.66, - "learning_rate": 1.8158924141346686e-06, - "loss": 0.6851, - "step": 25793 - }, - { - "epoch": 0.66, - "learning_rate": 1.8158764146623082e-06, - "loss": 1.0088, - "step": 25794 - }, - { - "epoch": 0.66, - "learning_rate": 1.8158604145652687e-06, - "loss": 0.7266, - "step": 25795 - }, - { - "epoch": 0.66, - "learning_rate": 1.8158444138435626e-06, - "loss": 0.9238, - "step": 25796 - }, - { - "epoch": 0.66, - "learning_rate": 1.8158284124972015e-06, - "loss": 0.6162, - "step": 25797 - }, - { - "epoch": 0.66, - "learning_rate": 1.8158124105261984e-06, - "loss": 0.9463, - "step": 25798 - }, - { - "epoch": 0.66, - "learning_rate": 1.8157964079305655e-06, - "loss": 1.0576, - "step": 25799 - }, - { - "epoch": 0.66, - "learning_rate": 1.8157804047103147e-06, - "loss": 1.041, - "step": 25800 - }, - { - "epoch": 0.66, - "learning_rate": 1.8157644008654583e-06, - "loss": 0.7305, - "step": 25801 - }, - { - "epoch": 0.66, - "learning_rate": 1.8157483963960083e-06, - "loss": 1.0137, - "step": 25802 - }, - { - "epoch": 0.66, - "learning_rate": 1.8157323913019775e-06, - "loss": 0.6909, - "step": 25803 - }, - { - "epoch": 0.66, - "learning_rate": 1.815716385583378e-06, - "loss": 0.6221, - "step": 25804 - }, - { - "epoch": 0.66, - "learning_rate": 1.815700379240222e-06, - "loss": 0.8721, - "step": 25805 - }, - { - "epoch": 0.66, - "learning_rate": 1.8156843722725213e-06, - "loss": 0.7314, - "step": 25806 - }, - { - "epoch": 0.66, - "learning_rate": 1.815668364680289e-06, - "loss": 0.7129, - "step": 25807 - }, - { - "epoch": 0.66, - "learning_rate": 1.8156523564635369e-06, - "loss": 0.7588, - "step": 25808 - }, - { - "epoch": 0.66, - "learning_rate": 1.815636347622277e-06, - "loss": 0.7642, - "step": 25809 - }, - { - "epoch": 0.66, - "learning_rate": 1.8156203381565223e-06, - "loss": 0.7959, - "step": 25810 - }, - { - "epoch": 0.66, - "learning_rate": 1.8156043280662842e-06, - "loss": 0.9453, - "step": 25811 - }, - { - "epoch": 0.66, - "learning_rate": 1.8155883173515755e-06, - "loss": 1.248, - "step": 25812 - }, - { - "epoch": 0.66, - "learning_rate": 1.8155723060124086e-06, - "loss": 0.5811, - "step": 25813 - }, - { - "epoch": 0.66, - "learning_rate": 1.8155562940487951e-06, - "loss": 0.7881, - "step": 25814 - }, - { - "epoch": 0.66, - "learning_rate": 1.815540281460748e-06, - "loss": 0.7715, - "step": 25815 - }, - { - "epoch": 0.66, - "learning_rate": 1.8155242682482789e-06, - "loss": 0.8799, - "step": 25816 - }, - { - "epoch": 0.66, - "learning_rate": 1.8155082544114004e-06, - "loss": 0.9482, - "step": 25817 - }, - { - "epoch": 0.66, - "learning_rate": 1.8154922399501248e-06, - "loss": 0.6206, - "step": 25818 - }, - { - "epoch": 0.66, - "learning_rate": 1.8154762248644644e-06, - "loss": 0.9023, - "step": 25819 - }, - { - "epoch": 0.66, - "learning_rate": 1.8154602091544313e-06, - "loss": 0.7881, - "step": 25820 - }, - { - "epoch": 0.66, - "learning_rate": 1.8154441928200376e-06, - "loss": 0.8379, - "step": 25821 - }, - { - "epoch": 0.66, - "learning_rate": 1.815428175861296e-06, - "loss": 1.0215, - "step": 25822 - }, - { - "epoch": 0.66, - "learning_rate": 1.8154121582782184e-06, - "loss": 1.0469, - "step": 25823 - }, - { - "epoch": 0.66, - "learning_rate": 1.8153961400708172e-06, - "loss": 0.9395, - "step": 25824 - }, - { - "epoch": 0.66, - "learning_rate": 1.815380121239105e-06, - "loss": 0.793, - "step": 25825 - }, - { - "epoch": 0.66, - "learning_rate": 1.8153641017830933e-06, - "loss": 0.9053, - "step": 25826 - }, - { - "epoch": 0.66, - "learning_rate": 1.8153480817027951e-06, - "loss": 0.9121, - "step": 25827 - }, - { - "epoch": 0.66, - "learning_rate": 1.8153320609982222e-06, - "loss": 0.6235, - "step": 25828 - }, - { - "epoch": 0.66, - "learning_rate": 1.8153160396693871e-06, - "loss": 0.876, - "step": 25829 - }, - { - "epoch": 0.66, - "learning_rate": 1.815300017716302e-06, - "loss": 0.8408, - "step": 25830 - }, - { - "epoch": 0.66, - "learning_rate": 1.8152839951389791e-06, - "loss": 0.8086, - "step": 25831 - }, - { - "epoch": 0.66, - "learning_rate": 1.8152679719374308e-06, - "loss": 1.042, - "step": 25832 - }, - { - "epoch": 0.66, - "learning_rate": 1.8152519481116694e-06, - "loss": 0.8376, - "step": 25833 - }, - { - "epoch": 0.66, - "learning_rate": 1.815235923661707e-06, - "loss": 0.9453, - "step": 25834 - }, - { - "epoch": 0.66, - "learning_rate": 1.8152198985875558e-06, - "loss": 0.8984, - "step": 25835 - }, - { - "epoch": 0.66, - "learning_rate": 1.8152038728892282e-06, - "loss": 0.8594, - "step": 25836 - }, - { - "epoch": 0.66, - "learning_rate": 1.8151878465667366e-06, - "loss": 0.8115, - "step": 25837 - }, - { - "epoch": 0.66, - "learning_rate": 1.815171819620093e-06, - "loss": 0.9688, - "step": 25838 - }, - { - "epoch": 0.66, - "learning_rate": 1.81515579204931e-06, - "loss": 1.0273, - "step": 25839 - }, - { - "epoch": 0.66, - "learning_rate": 1.8151397638543997e-06, - "loss": 1.0264, - "step": 25840 - }, - { - "epoch": 0.66, - "learning_rate": 1.8151237350353742e-06, - "loss": 0.9844, - "step": 25841 - }, - { - "epoch": 0.66, - "learning_rate": 1.8151077055922462e-06, - "loss": 0.8828, - "step": 25842 - }, - { - "epoch": 0.66, - "learning_rate": 1.8150916755250276e-06, - "loss": 0.9316, - "step": 25843 - }, - { - "epoch": 0.66, - "learning_rate": 1.8150756448337305e-06, - "loss": 0.8477, - "step": 25844 - }, - { - "epoch": 0.66, - "learning_rate": 1.8150596135183678e-06, - "loss": 1.0059, - "step": 25845 - }, - { - "epoch": 0.66, - "learning_rate": 1.8150435815789513e-06, - "loss": 0.8916, - "step": 25846 - }, - { - "epoch": 0.66, - "learning_rate": 1.8150275490154934e-06, - "loss": 0.9102, - "step": 25847 - }, - { - "epoch": 0.66, - "learning_rate": 1.8150115158280066e-06, - "loss": 1.002, - "step": 25848 - }, - { - "epoch": 0.66, - "learning_rate": 1.8149954820165029e-06, - "loss": 0.8364, - "step": 25849 - }, - { - "epoch": 0.66, - "learning_rate": 1.8149794475809942e-06, - "loss": 0.7471, - "step": 25850 - }, - { - "epoch": 0.66, - "learning_rate": 1.8149634125214934e-06, - "loss": 0.6399, - "step": 25851 - }, - { - "epoch": 0.66, - "learning_rate": 1.8149473768380128e-06, - "loss": 0.8203, - "step": 25852 - }, - { - "epoch": 0.66, - "learning_rate": 1.8149313405305644e-06, - "loss": 0.9414, - "step": 25853 - }, - { - "epoch": 0.66, - "learning_rate": 1.8149153035991605e-06, - "loss": 0.8833, - "step": 25854 - }, - { - "epoch": 0.66, - "learning_rate": 1.8148992660438135e-06, - "loss": 0.9072, - "step": 25855 - }, - { - "epoch": 0.66, - "learning_rate": 1.8148832278645354e-06, - "loss": 0.9287, - "step": 25856 - }, - { - "epoch": 0.66, - "learning_rate": 1.814867189061339e-06, - "loss": 0.834, - "step": 25857 - }, - { - "epoch": 0.66, - "learning_rate": 1.814851149634236e-06, - "loss": 0.9824, - "step": 25858 - }, - { - "epoch": 0.66, - "learning_rate": 1.8148351095832389e-06, - "loss": 0.6895, - "step": 25859 - }, - { - "epoch": 0.66, - "learning_rate": 1.8148190689083601e-06, - "loss": 0.8735, - "step": 25860 - }, - { - "epoch": 0.66, - "learning_rate": 1.8148030276096118e-06, - "loss": 0.9092, - "step": 25861 - }, - { - "epoch": 0.66, - "learning_rate": 1.8147869856870065e-06, - "loss": 0.7388, - "step": 25862 - }, - { - "epoch": 0.66, - "learning_rate": 1.814770943140556e-06, - "loss": 0.8848, - "step": 25863 - }, - { - "epoch": 0.66, - "learning_rate": 1.814754899970273e-06, - "loss": 0.8682, - "step": 25864 - }, - { - "epoch": 0.66, - "learning_rate": 1.8147388561761696e-06, - "loss": 0.9502, - "step": 25865 - }, - { - "epoch": 0.66, - "learning_rate": 1.814722811758258e-06, - "loss": 0.7476, - "step": 25866 - }, - { - "epoch": 0.66, - "learning_rate": 1.8147067667165509e-06, - "loss": 0.8223, - "step": 25867 - }, - { - "epoch": 0.66, - "learning_rate": 1.81469072105106e-06, - "loss": 0.7588, - "step": 25868 - }, - { - "epoch": 0.66, - "learning_rate": 1.814674674761798e-06, - "loss": 0.8262, - "step": 25869 - }, - { - "epoch": 0.66, - "learning_rate": 1.814658627848777e-06, - "loss": 0.7471, - "step": 25870 - }, - { - "epoch": 0.66, - "learning_rate": 1.8146425803120095e-06, - "loss": 0.8555, - "step": 25871 - }, - { - "epoch": 0.66, - "learning_rate": 1.8146265321515074e-06, - "loss": 0.8721, - "step": 25872 - }, - { - "epoch": 0.66, - "learning_rate": 1.8146104833672834e-06, - "loss": 0.7236, - "step": 25873 - }, - { - "epoch": 0.66, - "learning_rate": 1.8145944339593495e-06, - "loss": 0.7722, - "step": 25874 - }, - { - "epoch": 0.66, - "learning_rate": 1.8145783839277181e-06, - "loss": 0.9277, - "step": 25875 - }, - { - "epoch": 0.66, - "learning_rate": 1.8145623332724016e-06, - "loss": 0.9326, - "step": 25876 - }, - { - "epoch": 0.66, - "learning_rate": 1.8145462819934121e-06, - "loss": 0.9238, - "step": 25877 - }, - { - "epoch": 0.66, - "learning_rate": 1.814530230090762e-06, - "loss": 0.6428, - "step": 25878 - }, - { - "epoch": 0.66, - "learning_rate": 1.8145141775644634e-06, - "loss": 0.7793, - "step": 25879 - }, - { - "epoch": 0.66, - "learning_rate": 1.8144981244145292e-06, - "loss": 1.1006, - "step": 25880 - }, - { - "epoch": 0.66, - "learning_rate": 1.8144820706409707e-06, - "loss": 1.0049, - "step": 25881 - }, - { - "epoch": 0.66, - "learning_rate": 1.814466016243801e-06, - "loss": 0.9229, - "step": 25882 - }, - { - "epoch": 0.66, - "learning_rate": 1.814449961223032e-06, - "loss": 0.9502, - "step": 25883 - }, - { - "epoch": 0.66, - "learning_rate": 1.8144339055786762e-06, - "loss": 0.6499, - "step": 25884 - }, - { - "epoch": 0.66, - "learning_rate": 1.8144178493107459e-06, - "loss": 0.9883, - "step": 25885 - }, - { - "epoch": 0.66, - "learning_rate": 1.8144017924192532e-06, - "loss": 0.9189, - "step": 25886 - }, - { - "epoch": 0.66, - "learning_rate": 1.8143857349042105e-06, - "loss": 0.9824, - "step": 25887 - }, - { - "epoch": 0.66, - "learning_rate": 1.81436967676563e-06, - "loss": 1.0186, - "step": 25888 - }, - { - "epoch": 0.66, - "learning_rate": 1.8143536180035241e-06, - "loss": 0.7598, - "step": 25889 - }, - { - "epoch": 0.66, - "learning_rate": 1.8143375586179053e-06, - "loss": 0.6914, - "step": 25890 - }, - { - "epoch": 0.66, - "learning_rate": 1.8143214986087854e-06, - "loss": 0.7268, - "step": 25891 - }, - { - "epoch": 0.66, - "learning_rate": 1.8143054379761772e-06, - "loss": 0.8789, - "step": 25892 - }, - { - "epoch": 0.66, - "learning_rate": 1.8142893767200927e-06, - "loss": 0.7861, - "step": 25893 - }, - { - "epoch": 0.66, - "learning_rate": 1.8142733148405442e-06, - "loss": 0.9141, - "step": 25894 - }, - { - "epoch": 0.66, - "learning_rate": 1.8142572523375442e-06, - "loss": 0.8584, - "step": 25895 - }, - { - "epoch": 0.66, - "learning_rate": 1.8142411892111045e-06, - "loss": 1.0225, - "step": 25896 - }, - { - "epoch": 0.66, - "learning_rate": 1.8142251254612381e-06, - "loss": 0.9297, - "step": 25897 - }, - { - "epoch": 0.66, - "learning_rate": 1.8142090610879568e-06, - "loss": 0.8936, - "step": 25898 - }, - { - "epoch": 0.66, - "learning_rate": 1.8141929960912732e-06, - "loss": 0.8389, - "step": 25899 - }, - { - "epoch": 0.66, - "learning_rate": 1.8141769304711994e-06, - "loss": 0.8848, - "step": 25900 - }, - { - "epoch": 0.66, - "learning_rate": 1.8141608642277477e-06, - "loss": 1.1172, - "step": 25901 - }, - { - "epoch": 0.66, - "learning_rate": 1.8141447973609308e-06, - "loss": 0.8867, - "step": 25902 - }, - { - "epoch": 0.66, - "learning_rate": 1.81412872987076e-06, - "loss": 0.8418, - "step": 25903 - }, - { - "epoch": 0.66, - "learning_rate": 1.814112661757249e-06, - "loss": 0.9072, - "step": 25904 - }, - { - "epoch": 0.66, - "learning_rate": 1.8140965930204088e-06, - "loss": 0.8926, - "step": 25905 - }, - { - "epoch": 0.66, - "learning_rate": 1.8140805236602525e-06, - "loss": 1.0654, - "step": 25906 - }, - { - "epoch": 0.66, - "learning_rate": 1.814064453676792e-06, - "loss": 0.9502, - "step": 25907 - }, - { - "epoch": 0.66, - "learning_rate": 1.81404838307004e-06, - "loss": 0.835, - "step": 25908 - }, - { - "epoch": 0.66, - "learning_rate": 1.8140323118400084e-06, - "loss": 0.7847, - "step": 25909 - }, - { - "epoch": 0.66, - "learning_rate": 1.81401623998671e-06, - "loss": 0.9346, - "step": 25910 - }, - { - "epoch": 0.66, - "learning_rate": 1.814000167510157e-06, - "loss": 1.0518, - "step": 25911 - }, - { - "epoch": 0.66, - "learning_rate": 1.8139840944103608e-06, - "loss": 0.9297, - "step": 25912 - }, - { - "epoch": 0.66, - "learning_rate": 1.8139680206873346e-06, - "loss": 0.9268, - "step": 25913 - }, - { - "epoch": 0.66, - "learning_rate": 1.8139519463410905e-06, - "loss": 0.7446, - "step": 25914 - }, - { - "epoch": 0.66, - "learning_rate": 1.8139358713716413e-06, - "loss": 0.8633, - "step": 25915 - }, - { - "epoch": 0.66, - "learning_rate": 1.8139197957789984e-06, - "loss": 0.835, - "step": 25916 - }, - { - "epoch": 0.66, - "learning_rate": 1.8139037195631746e-06, - "loss": 0.8003, - "step": 25917 - }, - { - "epoch": 0.66, - "learning_rate": 1.813887642724182e-06, - "loss": 0.6895, - "step": 25918 - }, - { - "epoch": 0.66, - "learning_rate": 1.8138715652620332e-06, - "loss": 0.9805, - "step": 25919 - }, - { - "epoch": 0.66, - "learning_rate": 1.8138554871767407e-06, - "loss": 0.9072, - "step": 25920 - }, - { - "epoch": 0.66, - "learning_rate": 1.8138394084683162e-06, - "loss": 0.7422, - "step": 25921 - }, - { - "epoch": 0.66, - "learning_rate": 1.8138233291367722e-06, - "loss": 0.9004, - "step": 25922 - }, - { - "epoch": 0.66, - "learning_rate": 1.813807249182121e-06, - "loss": 0.7754, - "step": 25923 - }, - { - "epoch": 0.66, - "learning_rate": 1.8137911686043752e-06, - "loss": 0.749, - "step": 25924 - }, - { - "epoch": 0.66, - "learning_rate": 1.8137750874035469e-06, - "loss": 0.6519, - "step": 25925 - }, - { - "epoch": 0.66, - "learning_rate": 1.8137590055796483e-06, - "loss": 0.7725, - "step": 25926 - }, - { - "epoch": 0.66, - "learning_rate": 1.813742923132692e-06, - "loss": 0.6763, - "step": 25927 - }, - { - "epoch": 0.66, - "learning_rate": 1.8137268400626902e-06, - "loss": 0.8389, - "step": 25928 - }, - { - "epoch": 0.66, - "learning_rate": 1.813710756369655e-06, - "loss": 0.7705, - "step": 25929 - }, - { - "epoch": 0.66, - "learning_rate": 1.813694672053599e-06, - "loss": 0.876, - "step": 25930 - }, - { - "epoch": 0.66, - "learning_rate": 1.8136785871145343e-06, - "loss": 1.0449, - "step": 25931 - }, - { - "epoch": 0.66, - "learning_rate": 1.8136625015524736e-06, - "loss": 0.9087, - "step": 25932 - }, - { - "epoch": 0.66, - "learning_rate": 1.8136464153674287e-06, - "loss": 0.6377, - "step": 25933 - }, - { - "epoch": 0.66, - "learning_rate": 1.813630328559412e-06, - "loss": 0.7549, - "step": 25934 - }, - { - "epoch": 0.66, - "learning_rate": 1.8136142411284362e-06, - "loss": 0.9883, - "step": 25935 - }, - { - "epoch": 0.66, - "learning_rate": 1.8135981530745136e-06, - "loss": 0.6226, - "step": 25936 - }, - { - "epoch": 0.66, - "learning_rate": 1.8135820643976558e-06, - "loss": 1.0234, - "step": 25937 - }, - { - "epoch": 0.66, - "learning_rate": 1.813565975097876e-06, - "loss": 0.7114, - "step": 25938 - }, - { - "epoch": 0.66, - "learning_rate": 1.813549885175186e-06, - "loss": 0.9092, - "step": 25939 - }, - { - "epoch": 0.66, - "learning_rate": 1.8135337946295984e-06, - "loss": 0.8965, - "step": 25940 - }, - { - "epoch": 0.66, - "learning_rate": 1.8135177034611254e-06, - "loss": 0.8623, - "step": 25941 - }, - { - "epoch": 0.66, - "learning_rate": 1.8135016116697787e-06, - "loss": 1.0254, - "step": 25942 - }, - { - "epoch": 0.66, - "learning_rate": 1.8134855192555718e-06, - "loss": 1.0098, - "step": 25943 - }, - { - "epoch": 0.66, - "learning_rate": 1.8134694262185164e-06, - "loss": 1.0225, - "step": 25944 - }, - { - "epoch": 0.66, - "learning_rate": 1.813453332558625e-06, - "loss": 0.7734, - "step": 25945 - }, - { - "epoch": 0.67, - "learning_rate": 1.8134372382759096e-06, - "loss": 0.9834, - "step": 25946 - }, - { - "epoch": 0.67, - "learning_rate": 1.8134211433703825e-06, - "loss": 1.0586, - "step": 25947 - }, - { - "epoch": 0.67, - "learning_rate": 1.8134050478420565e-06, - "loss": 0.7969, - "step": 25948 - }, - { - "epoch": 0.67, - "learning_rate": 1.8133889516909435e-06, - "loss": 0.7744, - "step": 25949 - }, - { - "epoch": 0.67, - "learning_rate": 1.813372854917056e-06, - "loss": 0.9619, - "step": 25950 - }, - { - "epoch": 0.67, - "learning_rate": 1.8133567575204065e-06, - "loss": 0.7827, - "step": 25951 - }, - { - "epoch": 0.67, - "learning_rate": 1.8133406595010067e-06, - "loss": 0.8652, - "step": 25952 - }, - { - "epoch": 0.67, - "learning_rate": 1.8133245608588698e-06, - "loss": 0.6391, - "step": 25953 - }, - { - "epoch": 0.67, - "learning_rate": 1.8133084615940074e-06, - "loss": 0.873, - "step": 25954 - }, - { - "epoch": 0.67, - "learning_rate": 1.8132923617064325e-06, - "loss": 1.0596, - "step": 25955 - }, - { - "epoch": 0.67, - "learning_rate": 1.8132762611961568e-06, - "loss": 1.0635, - "step": 25956 - }, - { - "epoch": 0.67, - "learning_rate": 1.8132601600631927e-06, - "loss": 0.9658, - "step": 25957 - }, - { - "epoch": 0.67, - "learning_rate": 1.813244058307553e-06, - "loss": 0.752, - "step": 25958 - }, - { - "epoch": 0.67, - "learning_rate": 1.8132279559292493e-06, - "loss": 0.6616, - "step": 25959 - }, - { - "epoch": 0.67, - "learning_rate": 1.8132118529282946e-06, - "loss": 0.771, - "step": 25960 - }, - { - "epoch": 0.67, - "learning_rate": 1.8131957493047013e-06, - "loss": 1.252, - "step": 25961 - }, - { - "epoch": 0.67, - "learning_rate": 1.8131796450584807e-06, - "loss": 1.0293, - "step": 25962 - }, - { - "epoch": 0.67, - "learning_rate": 1.8131635401896464e-06, - "loss": 0.7891, - "step": 25963 - }, - { - "epoch": 0.67, - "learning_rate": 1.8131474346982099e-06, - "loss": 0.9111, - "step": 25964 - }, - { - "epoch": 0.67, - "learning_rate": 1.813131328584184e-06, - "loss": 0.8779, - "step": 25965 - }, - { - "epoch": 0.67, - "learning_rate": 1.8131152218475804e-06, - "loss": 0.9834, - "step": 25966 - }, - { - "epoch": 0.67, - "learning_rate": 1.8130991144884123e-06, - "loss": 0.8311, - "step": 25967 - }, - { - "epoch": 0.67, - "learning_rate": 1.8130830065066915e-06, - "loss": 0.8291, - "step": 25968 - }, - { - "epoch": 0.67, - "learning_rate": 1.8130668979024303e-06, - "loss": 0.873, - "step": 25969 - }, - { - "epoch": 0.67, - "learning_rate": 1.8130507886756412e-06, - "loss": 1.0625, - "step": 25970 - }, - { - "epoch": 0.67, - "learning_rate": 1.8130346788263368e-06, - "loss": 0.7964, - "step": 25971 - }, - { - "epoch": 0.67, - "learning_rate": 1.8130185683545287e-06, - "loss": 0.7959, - "step": 25972 - }, - { - "epoch": 0.67, - "learning_rate": 1.81300245726023e-06, - "loss": 0.998, - "step": 25973 - }, - { - "epoch": 0.67, - "learning_rate": 1.8129863455434525e-06, - "loss": 0.9189, - "step": 25974 - }, - { - "epoch": 0.67, - "learning_rate": 1.8129702332042088e-06, - "loss": 0.8799, - "step": 25975 - }, - { - "epoch": 0.67, - "learning_rate": 1.812954120242511e-06, - "loss": 0.7192, - "step": 25976 - }, - { - "epoch": 0.67, - "learning_rate": 1.8129380066583719e-06, - "loss": 0.8857, - "step": 25977 - }, - { - "epoch": 0.67, - "learning_rate": 1.8129218924518032e-06, - "loss": 0.7964, - "step": 25978 - }, - { - "epoch": 0.67, - "learning_rate": 1.812905777622818e-06, - "loss": 0.7471, - "step": 25979 - }, - { - "epoch": 0.67, - "learning_rate": 1.812889662171428e-06, - "loss": 0.9951, - "step": 25980 - }, - { - "epoch": 0.67, - "learning_rate": 1.812873546097646e-06, - "loss": 0.575, - "step": 25981 - }, - { - "epoch": 0.67, - "learning_rate": 1.8128574294014838e-06, - "loss": 0.6853, - "step": 25982 - }, - { - "epoch": 0.67, - "learning_rate": 1.8128413120829541e-06, - "loss": 0.876, - "step": 25983 - }, - { - "epoch": 0.67, - "learning_rate": 1.8128251941420692e-06, - "loss": 0.7646, - "step": 25984 - }, - { - "epoch": 0.67, - "learning_rate": 1.8128090755788414e-06, - "loss": 0.7158, - "step": 25985 - }, - { - "epoch": 0.67, - "learning_rate": 1.812792956393283e-06, - "loss": 0.8096, - "step": 25986 - }, - { - "epoch": 0.67, - "learning_rate": 1.8127768365854066e-06, - "loss": 0.876, - "step": 25987 - }, - { - "epoch": 0.67, - "learning_rate": 1.8127607161552243e-06, - "loss": 0.9492, - "step": 25988 - }, - { - "epoch": 0.67, - "learning_rate": 1.8127445951027484e-06, - "loss": 0.999, - "step": 25989 - }, - { - "epoch": 0.67, - "learning_rate": 1.8127284734279914e-06, - "loss": 0.9355, - "step": 25990 - }, - { - "epoch": 0.67, - "learning_rate": 1.8127123511309657e-06, - "loss": 0.7654, - "step": 25991 - }, - { - "epoch": 0.67, - "learning_rate": 1.8126962282116834e-06, - "loss": 0.9521, - "step": 25992 - }, - { - "epoch": 0.67, - "learning_rate": 1.8126801046701566e-06, - "loss": 0.9287, - "step": 25993 - }, - { - "epoch": 0.67, - "learning_rate": 1.8126639805063989e-06, - "loss": 0.7261, - "step": 25994 - }, - { - "epoch": 0.67, - "learning_rate": 1.812647855720421e-06, - "loss": 1.0332, - "step": 25995 - }, - { - "epoch": 0.67, - "learning_rate": 1.812631730312236e-06, - "loss": 0.8672, - "step": 25996 - }, - { - "epoch": 0.67, - "learning_rate": 1.8126156042818566e-06, - "loss": 0.9375, - "step": 25997 - }, - { - "epoch": 0.67, - "learning_rate": 1.8125994776292948e-06, - "loss": 1.1074, - "step": 25998 - }, - { - "epoch": 0.67, - "learning_rate": 1.8125833503545627e-06, - "loss": 0.7734, - "step": 25999 - }, - { - "epoch": 0.67, - "learning_rate": 1.8125672224576732e-06, - "loss": 1.0771, - "step": 26000 - }, - { - "epoch": 0.67, - "learning_rate": 1.8125510939386382e-06, - "loss": 1.0781, - "step": 26001 - }, - { - "epoch": 0.67, - "learning_rate": 1.8125349647974699e-06, - "loss": 1.0527, - "step": 26002 - }, - { - "epoch": 0.67, - "learning_rate": 1.8125188350341812e-06, - "loss": 0.9023, - "step": 26003 - }, - { - "epoch": 0.67, - "learning_rate": 1.8125027046487841e-06, - "loss": 0.8594, - "step": 26004 - }, - { - "epoch": 0.67, - "learning_rate": 1.8124865736412913e-06, - "loss": 0.8652, - "step": 26005 - }, - { - "epoch": 0.67, - "learning_rate": 1.8124704420117144e-06, - "loss": 0.6719, - "step": 26006 - }, - { - "epoch": 0.67, - "learning_rate": 1.8124543097600666e-06, - "loss": 0.8809, - "step": 26007 - }, - { - "epoch": 0.67, - "learning_rate": 1.8124381768863598e-06, - "loss": 0.7139, - "step": 26008 - }, - { - "epoch": 0.67, - "learning_rate": 1.8124220433906067e-06, - "loss": 0.793, - "step": 26009 - }, - { - "epoch": 0.67, - "learning_rate": 1.8124059092728193e-06, - "loss": 0.8613, - "step": 26010 - }, - { - "epoch": 0.67, - "learning_rate": 1.8123897745330096e-06, - "loss": 0.9453, - "step": 26011 - }, - { - "epoch": 0.67, - "learning_rate": 1.812373639171191e-06, - "loss": 0.9727, - "step": 26012 - }, - { - "epoch": 0.67, - "learning_rate": 1.8123575031873748e-06, - "loss": 0.8652, - "step": 26013 - }, - { - "epoch": 0.67, - "learning_rate": 1.812341366581574e-06, - "loss": 0.8916, - "step": 26014 - }, - { - "epoch": 0.67, - "learning_rate": 1.8123252293538007e-06, - "loss": 0.6719, - "step": 26015 - }, - { - "epoch": 0.67, - "learning_rate": 1.8123090915040677e-06, - "loss": 0.8428, - "step": 26016 - }, - { - "epoch": 0.67, - "learning_rate": 1.8122929530323865e-06, - "loss": 0.6626, - "step": 26017 - }, - { - "epoch": 0.67, - "learning_rate": 1.8122768139387703e-06, - "loss": 0.7739, - "step": 26018 - }, - { - "epoch": 0.67, - "learning_rate": 1.8122606742232307e-06, - "loss": 0.918, - "step": 26019 - }, - { - "epoch": 0.67, - "learning_rate": 1.8122445338857805e-06, - "loss": 0.7842, - "step": 26020 - }, - { - "epoch": 0.67, - "learning_rate": 1.8122283929264324e-06, - "loss": 0.9404, - "step": 26021 - }, - { - "epoch": 0.67, - "learning_rate": 1.812212251345198e-06, - "loss": 0.8867, - "step": 26022 - }, - { - "epoch": 0.67, - "learning_rate": 1.8121961091420902e-06, - "loss": 0.8594, - "step": 26023 - }, - { - "epoch": 0.67, - "learning_rate": 1.812179966317121e-06, - "loss": 0.7549, - "step": 26024 - }, - { - "epoch": 0.67, - "learning_rate": 1.8121638228703033e-06, - "loss": 1.0312, - "step": 26025 - }, - { - "epoch": 0.67, - "learning_rate": 1.812147678801649e-06, - "loss": 0.8447, - "step": 26026 - }, - { - "epoch": 0.67, - "learning_rate": 1.8121315341111703e-06, - "loss": 0.9453, - "step": 26027 - }, - { - "epoch": 0.67, - "learning_rate": 1.81211538879888e-06, - "loss": 0.8057, - "step": 26028 - }, - { - "epoch": 0.67, - "learning_rate": 1.8120992428647903e-06, - "loss": 0.9414, - "step": 26029 - }, - { - "epoch": 0.67, - "learning_rate": 1.8120830963089136e-06, - "loss": 0.8281, - "step": 26030 - }, - { - "epoch": 0.67, - "learning_rate": 1.8120669491312622e-06, - "loss": 0.9707, - "step": 26031 - }, - { - "epoch": 0.67, - "learning_rate": 1.8120508013318482e-06, - "loss": 0.8076, - "step": 26032 - }, - { - "epoch": 0.67, - "learning_rate": 1.8120346529106844e-06, - "loss": 0.9004, - "step": 26033 - }, - { - "epoch": 0.67, - "learning_rate": 1.812018503867783e-06, - "loss": 0.7305, - "step": 26034 - }, - { - "epoch": 0.67, - "learning_rate": 1.8120023542031567e-06, - "loss": 0.9893, - "step": 26035 - }, - { - "epoch": 0.67, - "learning_rate": 1.8119862039168172e-06, - "loss": 0.8984, - "step": 26036 - }, - { - "epoch": 0.67, - "learning_rate": 1.8119700530087772e-06, - "loss": 0.9619, - "step": 26037 - }, - { - "epoch": 0.67, - "learning_rate": 1.811953901479049e-06, - "loss": 1.1406, - "step": 26038 - }, - { - "epoch": 0.67, - "learning_rate": 1.8119377493276453e-06, - "loss": 0.8877, - "step": 26039 - }, - { - "epoch": 0.67, - "learning_rate": 1.811921596554578e-06, - "loss": 0.813, - "step": 26040 - }, - { - "epoch": 0.67, - "learning_rate": 1.8119054431598598e-06, - "loss": 0.9297, - "step": 26041 - }, - { - "epoch": 0.67, - "learning_rate": 1.8118892891435026e-06, - "loss": 0.8145, - "step": 26042 - }, - { - "epoch": 0.67, - "learning_rate": 1.8118731345055196e-06, - "loss": 0.8643, - "step": 26043 - }, - { - "epoch": 0.67, - "learning_rate": 1.8118569792459223e-06, - "loss": 0.9619, - "step": 26044 - }, - { - "epoch": 0.67, - "learning_rate": 1.8118408233647236e-06, - "loss": 0.7549, - "step": 26045 - }, - { - "epoch": 0.67, - "learning_rate": 1.8118246668619357e-06, - "loss": 0.6851, - "step": 26046 - }, - { - "epoch": 0.67, - "learning_rate": 1.8118085097375709e-06, - "loss": 0.8408, - "step": 26047 - }, - { - "epoch": 0.67, - "learning_rate": 1.8117923519916419e-06, - "loss": 0.8223, - "step": 26048 - }, - { - "epoch": 0.67, - "learning_rate": 1.8117761936241607e-06, - "loss": 1.041, - "step": 26049 - }, - { - "epoch": 0.67, - "learning_rate": 1.8117600346351396e-06, - "loss": 0.7979, - "step": 26050 - }, - { - "epoch": 0.67, - "learning_rate": 1.8117438750245912e-06, - "loss": 0.71, - "step": 26051 - }, - { - "epoch": 0.67, - "learning_rate": 1.811727714792528e-06, - "loss": 0.8662, - "step": 26052 - }, - { - "epoch": 0.67, - "learning_rate": 1.8117115539389623e-06, - "loss": 0.9424, - "step": 26053 - }, - { - "epoch": 0.67, - "learning_rate": 1.811695392463906e-06, - "loss": 1.0098, - "step": 26054 - }, - { - "epoch": 0.67, - "learning_rate": 1.8116792303673722e-06, - "loss": 0.8809, - "step": 26055 - }, - { - "epoch": 0.67, - "learning_rate": 1.8116630676493729e-06, - "loss": 0.7061, - "step": 26056 - }, - { - "epoch": 0.67, - "learning_rate": 1.8116469043099205e-06, - "loss": 1.1426, - "step": 26057 - }, - { - "epoch": 0.67, - "learning_rate": 1.8116307403490274e-06, - "loss": 0.8853, - "step": 26058 - }, - { - "epoch": 0.67, - "learning_rate": 1.8116145757667058e-06, - "loss": 0.9453, - "step": 26059 - }, - { - "epoch": 0.67, - "learning_rate": 1.8115984105629683e-06, - "loss": 0.7744, - "step": 26060 - }, - { - "epoch": 0.67, - "learning_rate": 1.8115822447378272e-06, - "loss": 0.748, - "step": 26061 - }, - { - "epoch": 0.67, - "learning_rate": 1.8115660782912952e-06, - "loss": 0.8291, - "step": 26062 - }, - { - "epoch": 0.67, - "learning_rate": 1.8115499112233838e-06, - "loss": 1.0596, - "step": 26063 - }, - { - "epoch": 0.67, - "learning_rate": 1.8115337435341064e-06, - "loss": 0.9443, - "step": 26064 - }, - { - "epoch": 0.67, - "learning_rate": 1.8115175752234749e-06, - "loss": 0.5376, - "step": 26065 - }, - { - "epoch": 0.67, - "learning_rate": 1.8115014062915015e-06, - "loss": 0.8535, - "step": 26066 - }, - { - "epoch": 0.67, - "learning_rate": 1.811485236738199e-06, - "loss": 0.8457, - "step": 26067 - }, - { - "epoch": 0.67, - "learning_rate": 1.8114690665635793e-06, - "loss": 0.7354, - "step": 26068 - }, - { - "epoch": 0.67, - "learning_rate": 1.8114528957676552e-06, - "loss": 0.8154, - "step": 26069 - }, - { - "epoch": 0.67, - "learning_rate": 1.8114367243504389e-06, - "loss": 0.9102, - "step": 26070 - }, - { - "epoch": 0.67, - "learning_rate": 1.8114205523119427e-06, - "loss": 1.0449, - "step": 26071 - }, - { - "epoch": 0.67, - "learning_rate": 1.8114043796521794e-06, - "loss": 1.1445, - "step": 26072 - }, - { - "epoch": 0.67, - "learning_rate": 1.8113882063711609e-06, - "loss": 0.834, - "step": 26073 - }, - { - "epoch": 0.67, - "learning_rate": 1.8113720324689e-06, - "loss": 0.6655, - "step": 26074 - }, - { - "epoch": 0.67, - "learning_rate": 1.8113558579454084e-06, - "loss": 1.0654, - "step": 26075 - }, - { - "epoch": 0.67, - "learning_rate": 1.8113396828006993e-06, - "loss": 0.7891, - "step": 26076 - }, - { - "epoch": 0.67, - "learning_rate": 1.8113235070347846e-06, - "loss": 0.8105, - "step": 26077 - }, - { - "epoch": 0.67, - "learning_rate": 1.8113073306476766e-06, - "loss": 0.7593, - "step": 26078 - }, - { - "epoch": 0.67, - "learning_rate": 1.811291153639388e-06, - "loss": 0.9141, - "step": 26079 - }, - { - "epoch": 0.67, - "learning_rate": 1.811274976009931e-06, - "loss": 0.8193, - "step": 26080 - }, - { - "epoch": 0.67, - "learning_rate": 1.811258797759318e-06, - "loss": 0.5308, - "step": 26081 - }, - { - "epoch": 0.67, - "learning_rate": 1.8112426188875617e-06, - "loss": 0.9111, - "step": 26082 - }, - { - "epoch": 0.67, - "learning_rate": 1.8112264393946744e-06, - "loss": 1.124, - "step": 26083 - }, - { - "epoch": 0.67, - "learning_rate": 1.811210259280668e-06, - "loss": 1.0361, - "step": 26084 - }, - { - "epoch": 0.67, - "learning_rate": 1.811194078545555e-06, - "loss": 0.9648, - "step": 26085 - }, - { - "epoch": 0.67, - "learning_rate": 1.8111778971893484e-06, - "loss": 0.9727, - "step": 26086 - }, - { - "epoch": 0.67, - "learning_rate": 1.81116171521206e-06, - "loss": 0.9326, - "step": 26087 - }, - { - "epoch": 0.67, - "learning_rate": 1.8111455326137022e-06, - "loss": 0.6442, - "step": 26088 - }, - { - "epoch": 0.67, - "learning_rate": 1.8111293493942879e-06, - "loss": 0.8291, - "step": 26089 - }, - { - "epoch": 0.67, - "learning_rate": 1.811113165553829e-06, - "loss": 0.96, - "step": 26090 - }, - { - "epoch": 0.67, - "learning_rate": 1.811096981092338e-06, - "loss": 0.915, - "step": 26091 - }, - { - "epoch": 0.67, - "learning_rate": 1.8110807960098274e-06, - "loss": 0.6978, - "step": 26092 - }, - { - "epoch": 0.67, - "learning_rate": 1.8110646103063094e-06, - "loss": 0.9482, - "step": 26093 - }, - { - "epoch": 0.67, - "learning_rate": 1.8110484239817966e-06, - "loss": 0.8975, - "step": 26094 - }, - { - "epoch": 0.67, - "learning_rate": 1.8110322370363016e-06, - "loss": 0.9111, - "step": 26095 - }, - { - "epoch": 0.67, - "learning_rate": 1.811016049469836e-06, - "loss": 0.8486, - "step": 26096 - }, - { - "epoch": 0.67, - "learning_rate": 1.8109998612824132e-06, - "loss": 0.8564, - "step": 26097 - }, - { - "epoch": 0.67, - "learning_rate": 1.810983672474045e-06, - "loss": 0.8311, - "step": 26098 - }, - { - "epoch": 0.67, - "learning_rate": 1.8109674830447435e-06, - "loss": 0.7048, - "step": 26099 - }, - { - "epoch": 0.67, - "learning_rate": 1.810951292994522e-06, - "loss": 1.1367, - "step": 26100 - }, - { - "epoch": 0.67, - "learning_rate": 1.810935102323392e-06, - "loss": 1.0625, - "step": 26101 - }, - { - "epoch": 0.67, - "learning_rate": 1.8109189110313663e-06, - "loss": 0.9893, - "step": 26102 - }, - { - "epoch": 0.67, - "learning_rate": 1.8109027191184577e-06, - "loss": 0.6396, - "step": 26103 - }, - { - "epoch": 0.67, - "learning_rate": 1.8108865265846776e-06, - "loss": 1.0889, - "step": 26104 - }, - { - "epoch": 0.67, - "learning_rate": 1.8108703334300392e-06, - "loss": 0.5645, - "step": 26105 - }, - { - "epoch": 0.67, - "learning_rate": 1.810854139654555e-06, - "loss": 0.729, - "step": 26106 - }, - { - "epoch": 0.67, - "learning_rate": 1.8108379452582366e-06, - "loss": 0.6665, - "step": 26107 - }, - { - "epoch": 0.67, - "learning_rate": 1.810821750241097e-06, - "loss": 0.9165, - "step": 26108 - }, - { - "epoch": 0.67, - "learning_rate": 1.8108055546031484e-06, - "loss": 0.8394, - "step": 26109 - }, - { - "epoch": 0.67, - "learning_rate": 1.8107893583444034e-06, - "loss": 0.9189, - "step": 26110 - }, - { - "epoch": 0.67, - "learning_rate": 1.8107731614648742e-06, - "loss": 0.8984, - "step": 26111 - }, - { - "epoch": 0.67, - "learning_rate": 1.8107569639645735e-06, - "loss": 1.1328, - "step": 26112 - }, - { - "epoch": 0.67, - "learning_rate": 1.8107407658435132e-06, - "loss": 0.6914, - "step": 26113 - }, - { - "epoch": 0.67, - "learning_rate": 1.810724567101706e-06, - "loss": 0.8345, - "step": 26114 - }, - { - "epoch": 0.67, - "learning_rate": 1.8107083677391644e-06, - "loss": 0.7949, - "step": 26115 - }, - { - "epoch": 0.67, - "learning_rate": 1.8106921677559006e-06, - "loss": 0.8711, - "step": 26116 - }, - { - "epoch": 0.67, - "learning_rate": 1.8106759671519273e-06, - "loss": 0.8965, - "step": 26117 - }, - { - "epoch": 0.67, - "learning_rate": 1.8106597659272564e-06, - "loss": 0.8506, - "step": 26118 - }, - { - "epoch": 0.67, - "learning_rate": 1.8106435640819004e-06, - "loss": 0.7178, - "step": 26119 - }, - { - "epoch": 0.67, - "learning_rate": 1.8106273616158725e-06, - "loss": 0.9287, - "step": 26120 - }, - { - "epoch": 0.67, - "learning_rate": 1.8106111585291842e-06, - "loss": 1.0791, - "step": 26121 - }, - { - "epoch": 0.67, - "learning_rate": 1.810594954821848e-06, - "loss": 1.1143, - "step": 26122 - }, - { - "epoch": 0.67, - "learning_rate": 1.8105787504938768e-06, - "loss": 0.8281, - "step": 26123 - }, - { - "epoch": 0.67, - "learning_rate": 1.8105625455452826e-06, - "loss": 0.8511, - "step": 26124 - }, - { - "epoch": 0.67, - "learning_rate": 1.810546339976078e-06, - "loss": 0.9072, - "step": 26125 - }, - { - "epoch": 0.67, - "learning_rate": 1.8105301337862753e-06, - "loss": 0.9326, - "step": 26126 - }, - { - "epoch": 0.67, - "learning_rate": 1.810513926975887e-06, - "loss": 0.9375, - "step": 26127 - }, - { - "epoch": 0.67, - "learning_rate": 1.810497719544925e-06, - "loss": 0.7383, - "step": 26128 - }, - { - "epoch": 0.67, - "learning_rate": 1.8104815114934029e-06, - "loss": 0.8662, - "step": 26129 - }, - { - "epoch": 0.67, - "learning_rate": 1.8104653028213318e-06, - "loss": 0.918, - "step": 26130 - }, - { - "epoch": 0.67, - "learning_rate": 1.810449093528725e-06, - "loss": 0.9512, - "step": 26131 - }, - { - "epoch": 0.67, - "learning_rate": 1.8104328836155943e-06, - "loss": 0.7866, - "step": 26132 - }, - { - "epoch": 0.67, - "learning_rate": 1.8104166730819529e-06, - "loss": 0.8809, - "step": 26133 - }, - { - "epoch": 0.67, - "learning_rate": 1.8104004619278123e-06, - "loss": 0.9775, - "step": 26134 - }, - { - "epoch": 0.67, - "learning_rate": 1.8103842501531856e-06, - "loss": 0.8428, - "step": 26135 - }, - { - "epoch": 0.67, - "learning_rate": 1.8103680377580848e-06, - "loss": 0.7188, - "step": 26136 - }, - { - "epoch": 0.67, - "learning_rate": 1.8103518247425224e-06, - "loss": 0.9199, - "step": 26137 - }, - { - "epoch": 0.67, - "learning_rate": 1.810335611106511e-06, - "loss": 0.9531, - "step": 26138 - }, - { - "epoch": 0.67, - "learning_rate": 1.8103193968500627e-06, - "loss": 0.9863, - "step": 26139 - }, - { - "epoch": 0.67, - "learning_rate": 1.8103031819731905e-06, - "loss": 0.9561, - "step": 26140 - }, - { - "epoch": 0.67, - "learning_rate": 1.8102869664759059e-06, - "loss": 0.9229, - "step": 26141 - }, - { - "epoch": 0.67, - "learning_rate": 1.8102707503582221e-06, - "loss": 0.6638, - "step": 26142 - }, - { - "epoch": 0.67, - "learning_rate": 1.8102545336201511e-06, - "loss": 0.9756, - "step": 26143 - }, - { - "epoch": 0.67, - "learning_rate": 1.8102383162617056e-06, - "loss": 0.6807, - "step": 26144 - }, - { - "epoch": 0.67, - "learning_rate": 1.8102220982828977e-06, - "loss": 0.7461, - "step": 26145 - }, - { - "epoch": 0.67, - "learning_rate": 1.8102058796837403e-06, - "loss": 0.8169, - "step": 26146 - }, - { - "epoch": 0.67, - "learning_rate": 1.8101896604642452e-06, - "loss": 0.8633, - "step": 26147 - }, - { - "epoch": 0.67, - "learning_rate": 1.8101734406244255e-06, - "loss": 0.8008, - "step": 26148 - }, - { - "epoch": 0.67, - "learning_rate": 1.810157220164293e-06, - "loss": 0.8452, - "step": 26149 - }, - { - "epoch": 0.67, - "learning_rate": 1.8101409990838603e-06, - "loss": 0.9326, - "step": 26150 - }, - { - "epoch": 0.67, - "learning_rate": 1.8101247773831401e-06, - "loss": 1.041, - "step": 26151 - }, - { - "epoch": 0.67, - "learning_rate": 1.8101085550621443e-06, - "loss": 1.0332, - "step": 26152 - }, - { - "epoch": 0.67, - "learning_rate": 1.8100923321208858e-06, - "loss": 0.9287, - "step": 26153 - }, - { - "epoch": 0.67, - "learning_rate": 1.810076108559377e-06, - "loss": 0.6921, - "step": 26154 - }, - { - "epoch": 0.67, - "learning_rate": 1.81005988437763e-06, - "loss": 0.5059, - "step": 26155 - }, - { - "epoch": 0.67, - "learning_rate": 1.8100436595756575e-06, - "loss": 1.0156, - "step": 26156 - }, - { - "epoch": 0.67, - "learning_rate": 1.8100274341534716e-06, - "loss": 0.7588, - "step": 26157 - }, - { - "epoch": 0.67, - "learning_rate": 1.810011208111085e-06, - "loss": 0.7046, - "step": 26158 - }, - { - "epoch": 0.67, - "learning_rate": 1.8099949814485102e-06, - "loss": 0.7988, - "step": 26159 - }, - { - "epoch": 0.67, - "learning_rate": 1.8099787541657595e-06, - "loss": 0.6409, - "step": 26160 - }, - { - "epoch": 0.67, - "learning_rate": 1.8099625262628454e-06, - "loss": 0.8623, - "step": 26161 - }, - { - "epoch": 0.67, - "learning_rate": 1.8099462977397799e-06, - "loss": 0.8682, - "step": 26162 - }, - { - "epoch": 0.67, - "learning_rate": 1.809930068596576e-06, - "loss": 0.9238, - "step": 26163 - }, - { - "epoch": 0.67, - "learning_rate": 1.8099138388332458e-06, - "loss": 0.6104, - "step": 26164 - }, - { - "epoch": 0.67, - "learning_rate": 1.8098976084498018e-06, - "loss": 0.8223, - "step": 26165 - }, - { - "epoch": 0.67, - "learning_rate": 1.8098813774462567e-06, - "loss": 0.9248, - "step": 26166 - }, - { - "epoch": 0.67, - "learning_rate": 1.8098651458226222e-06, - "loss": 1.0186, - "step": 26167 - }, - { - "epoch": 0.67, - "learning_rate": 1.8098489135789118e-06, - "loss": 0.8916, - "step": 26168 - }, - { - "epoch": 0.67, - "learning_rate": 1.8098326807151368e-06, - "loss": 0.8086, - "step": 26169 - }, - { - "epoch": 0.67, - "learning_rate": 1.8098164472313102e-06, - "loss": 0.9688, - "step": 26170 - }, - { - "epoch": 0.67, - "learning_rate": 1.8098002131274446e-06, - "loss": 0.8198, - "step": 26171 - }, - { - "epoch": 0.67, - "learning_rate": 1.8097839784035523e-06, - "loss": 0.8115, - "step": 26172 - }, - { - "epoch": 0.67, - "learning_rate": 1.809767743059645e-06, - "loss": 0.6533, - "step": 26173 - }, - { - "epoch": 0.67, - "learning_rate": 1.8097515070957365e-06, - "loss": 0.8071, - "step": 26174 - }, - { - "epoch": 0.67, - "learning_rate": 1.8097352705118383e-06, - "loss": 0.8535, - "step": 26175 - }, - { - "epoch": 0.67, - "learning_rate": 1.8097190333079629e-06, - "loss": 0.7859, - "step": 26176 - }, - { - "epoch": 0.67, - "learning_rate": 1.809702795484123e-06, - "loss": 0.8311, - "step": 26177 - }, - { - "epoch": 0.67, - "learning_rate": 1.809686557040331e-06, - "loss": 0.7759, - "step": 26178 - }, - { - "epoch": 0.67, - "learning_rate": 1.809670317976599e-06, - "loss": 1.1348, - "step": 26179 - }, - { - "epoch": 0.67, - "learning_rate": 1.8096540782929397e-06, - "loss": 1.0605, - "step": 26180 - }, - { - "epoch": 0.67, - "learning_rate": 1.8096378379893655e-06, - "loss": 0.9375, - "step": 26181 - }, - { - "epoch": 0.67, - "learning_rate": 1.809621597065889e-06, - "loss": 0.7974, - "step": 26182 - }, - { - "epoch": 0.67, - "learning_rate": 1.8096053555225224e-06, - "loss": 1.0918, - "step": 26183 - }, - { - "epoch": 0.67, - "learning_rate": 1.809589113359278e-06, - "loss": 0.8096, - "step": 26184 - }, - { - "epoch": 0.67, - "learning_rate": 1.8095728705761686e-06, - "loss": 0.8662, - "step": 26185 - }, - { - "epoch": 0.67, - "learning_rate": 1.8095566271732065e-06, - "loss": 0.8115, - "step": 26186 - }, - { - "epoch": 0.67, - "learning_rate": 1.809540383150404e-06, - "loss": 0.876, - "step": 26187 - }, - { - "epoch": 0.67, - "learning_rate": 1.809524138507774e-06, - "loss": 0.6855, - "step": 26188 - }, - { - "epoch": 0.67, - "learning_rate": 1.8095078932453282e-06, - "loss": 0.6655, - "step": 26189 - }, - { - "epoch": 0.67, - "learning_rate": 1.8094916473630797e-06, - "loss": 0.8594, - "step": 26190 - }, - { - "epoch": 0.67, - "learning_rate": 1.8094754008610405e-06, - "loss": 0.8701, - "step": 26191 - }, - { - "epoch": 0.67, - "learning_rate": 1.8094591537392234e-06, - "loss": 0.7725, - "step": 26192 - }, - { - "epoch": 0.67, - "learning_rate": 1.8094429059976402e-06, - "loss": 0.8496, - "step": 26193 - }, - { - "epoch": 0.67, - "learning_rate": 1.8094266576363043e-06, - "loss": 0.8555, - "step": 26194 - }, - { - "epoch": 0.67, - "learning_rate": 1.809410408655227e-06, - "loss": 0.8164, - "step": 26195 - }, - { - "epoch": 0.67, - "learning_rate": 1.8093941590544222e-06, - "loss": 0.7246, - "step": 26196 - }, - { - "epoch": 0.67, - "learning_rate": 1.8093779088339009e-06, - "loss": 0.6268, - "step": 26197 - }, - { - "epoch": 0.67, - "learning_rate": 1.8093616579936763e-06, - "loss": 0.8848, - "step": 26198 - }, - { - "epoch": 0.67, - "learning_rate": 1.8093454065337607e-06, - "loss": 1.1348, - "step": 26199 - }, - { - "epoch": 0.67, - "learning_rate": 1.8093291544541666e-06, - "loss": 1.1416, - "step": 26200 - }, - { - "epoch": 0.67, - "learning_rate": 1.8093129017549066e-06, - "loss": 0.9316, - "step": 26201 - }, - { - "epoch": 0.67, - "learning_rate": 1.8092966484359925e-06, - "loss": 0.7568, - "step": 26202 - }, - { - "epoch": 0.67, - "learning_rate": 1.8092803944974373e-06, - "loss": 0.9502, - "step": 26203 - }, - { - "epoch": 0.67, - "learning_rate": 1.8092641399392533e-06, - "loss": 0.7622, - "step": 26204 - }, - { - "epoch": 0.67, - "learning_rate": 1.809247884761453e-06, - "loss": 0.8701, - "step": 26205 - }, - { - "epoch": 0.67, - "learning_rate": 1.8092316289640488e-06, - "loss": 0.9717, - "step": 26206 - }, - { - "epoch": 0.67, - "learning_rate": 1.809215372547053e-06, - "loss": 0.7852, - "step": 26207 - }, - { - "epoch": 0.67, - "learning_rate": 1.8091991155104784e-06, - "loss": 0.915, - "step": 26208 - }, - { - "epoch": 0.67, - "learning_rate": 1.8091828578543375e-06, - "loss": 0.8906, - "step": 26209 - }, - { - "epoch": 0.67, - "learning_rate": 1.8091665995786421e-06, - "loss": 0.7334, - "step": 26210 - }, - { - "epoch": 0.67, - "learning_rate": 1.8091503406834053e-06, - "loss": 0.9048, - "step": 26211 - }, - { - "epoch": 0.67, - "learning_rate": 1.809134081168639e-06, - "loss": 1.0664, - "step": 26212 - }, - { - "epoch": 0.67, - "learning_rate": 1.809117821034356e-06, - "loss": 1.1455, - "step": 26213 - }, - { - "epoch": 0.67, - "learning_rate": 1.8091015602805688e-06, - "loss": 1.0156, - "step": 26214 - }, - { - "epoch": 0.67, - "learning_rate": 1.8090852989072898e-06, - "loss": 1.0586, - "step": 26215 - }, - { - "epoch": 0.67, - "learning_rate": 1.8090690369145312e-06, - "loss": 0.7849, - "step": 26216 - }, - { - "epoch": 0.67, - "learning_rate": 1.8090527743023056e-06, - "loss": 0.9561, - "step": 26217 - }, - { - "epoch": 0.67, - "learning_rate": 1.8090365110706256e-06, - "loss": 0.8047, - "step": 26218 - }, - { - "epoch": 0.67, - "learning_rate": 1.8090202472195037e-06, - "loss": 0.9639, - "step": 26219 - }, - { - "epoch": 0.67, - "learning_rate": 1.809003982748952e-06, - "loss": 1.1172, - "step": 26220 - }, - { - "epoch": 0.67, - "learning_rate": 1.8089877176589834e-06, - "loss": 1.0586, - "step": 26221 - }, - { - "epoch": 0.67, - "learning_rate": 1.8089714519496097e-06, - "loss": 0.6582, - "step": 26222 - }, - { - "epoch": 0.67, - "learning_rate": 1.808955185620844e-06, - "loss": 0.5376, - "step": 26223 - }, - { - "epoch": 0.67, - "learning_rate": 1.8089389186726986e-06, - "loss": 0.8877, - "step": 26224 - }, - { - "epoch": 0.67, - "learning_rate": 1.8089226511051857e-06, - "loss": 0.9951, - "step": 26225 - }, - { - "epoch": 0.67, - "learning_rate": 1.808906382918318e-06, - "loss": 1.0703, - "step": 26226 - }, - { - "epoch": 0.67, - "learning_rate": 1.8088901141121079e-06, - "loss": 0.9453, - "step": 26227 - }, - { - "epoch": 0.67, - "learning_rate": 1.8088738446865676e-06, - "loss": 0.6709, - "step": 26228 - }, - { - "epoch": 0.67, - "learning_rate": 1.80885757464171e-06, - "loss": 0.8789, - "step": 26229 - }, - { - "epoch": 0.67, - "learning_rate": 1.8088413039775473e-06, - "loss": 0.8066, - "step": 26230 - }, - { - "epoch": 0.67, - "learning_rate": 1.808825032694092e-06, - "loss": 1.0547, - "step": 26231 - }, - { - "epoch": 0.67, - "learning_rate": 1.8088087607913568e-06, - "loss": 0.7642, - "step": 26232 - }, - { - "epoch": 0.67, - "learning_rate": 1.8087924882693537e-06, - "loss": 0.8408, - "step": 26233 - }, - { - "epoch": 0.67, - "learning_rate": 1.8087762151280953e-06, - "loss": 1.0332, - "step": 26234 - }, - { - "epoch": 0.67, - "learning_rate": 1.8087599413675943e-06, - "loss": 0.6987, - "step": 26235 - }, - { - "epoch": 0.67, - "learning_rate": 1.808743666987863e-06, - "loss": 0.8447, - "step": 26236 - }, - { - "epoch": 0.67, - "learning_rate": 1.8087273919889136e-06, - "loss": 0.709, - "step": 26237 - }, - { - "epoch": 0.67, - "learning_rate": 1.8087111163707588e-06, - "loss": 1.1611, - "step": 26238 - }, - { - "epoch": 0.67, - "learning_rate": 1.8086948401334116e-06, - "loss": 0.6577, - "step": 26239 - }, - { - "epoch": 0.67, - "learning_rate": 1.8086785632768834e-06, - "loss": 1.0078, - "step": 26240 - }, - { - "epoch": 0.67, - "learning_rate": 1.8086622858011875e-06, - "loss": 0.8291, - "step": 26241 - }, - { - "epoch": 0.67, - "learning_rate": 1.8086460077063362e-06, - "loss": 0.8784, - "step": 26242 - }, - { - "epoch": 0.67, - "learning_rate": 1.8086297289923416e-06, - "loss": 1.0117, - "step": 26243 - }, - { - "epoch": 0.67, - "learning_rate": 1.8086134496592164e-06, - "loss": 0.9062, - "step": 26244 - }, - { - "epoch": 0.67, - "learning_rate": 1.808597169706973e-06, - "loss": 0.7141, - "step": 26245 - }, - { - "epoch": 0.67, - "learning_rate": 1.8085808891356243e-06, - "loss": 0.9883, - "step": 26246 - }, - { - "epoch": 0.67, - "learning_rate": 1.8085646079451822e-06, - "loss": 0.8398, - "step": 26247 - }, - { - "epoch": 0.67, - "learning_rate": 1.8085483261356592e-06, - "loss": 0.8145, - "step": 26248 - }, - { - "epoch": 0.67, - "learning_rate": 1.8085320437070682e-06, - "loss": 0.915, - "step": 26249 - }, - { - "epoch": 0.67, - "learning_rate": 1.808515760659421e-06, - "loss": 0.6724, - "step": 26250 - }, - { - "epoch": 0.67, - "learning_rate": 1.8084994769927306e-06, - "loss": 0.9019, - "step": 26251 - }, - { - "epoch": 0.67, - "learning_rate": 1.8084831927070094e-06, - "loss": 0.834, - "step": 26252 - }, - { - "epoch": 0.67, - "learning_rate": 1.8084669078022698e-06, - "loss": 0.7041, - "step": 26253 - }, - { - "epoch": 0.67, - "learning_rate": 1.8084506222785243e-06, - "loss": 0.7031, - "step": 26254 - }, - { - "epoch": 0.67, - "learning_rate": 1.8084343361357853e-06, - "loss": 0.7881, - "step": 26255 - }, - { - "epoch": 0.67, - "learning_rate": 1.8084180493740653e-06, - "loss": 0.8857, - "step": 26256 - }, - { - "epoch": 0.67, - "learning_rate": 1.8084017619933766e-06, - "loss": 0.8911, - "step": 26257 - }, - { - "epoch": 0.67, - "learning_rate": 1.8083854739937321e-06, - "loss": 0.5557, - "step": 26258 - }, - { - "epoch": 0.67, - "learning_rate": 1.808369185375144e-06, - "loss": 0.8027, - "step": 26259 - }, - { - "epoch": 0.67, - "learning_rate": 1.8083528961376246e-06, - "loss": 0.8672, - "step": 26260 - }, - { - "epoch": 0.67, - "learning_rate": 1.8083366062811867e-06, - "loss": 1.1172, - "step": 26261 - }, - { - "epoch": 0.67, - "learning_rate": 1.8083203158058424e-06, - "loss": 0.6426, - "step": 26262 - }, - { - "epoch": 0.67, - "learning_rate": 1.8083040247116048e-06, - "loss": 0.7988, - "step": 26263 - }, - { - "epoch": 0.67, - "learning_rate": 1.8082877329984857e-06, - "loss": 0.8594, - "step": 26264 - }, - { - "epoch": 0.67, - "learning_rate": 1.808271440666498e-06, - "loss": 0.8594, - "step": 26265 - }, - { - "epoch": 0.67, - "learning_rate": 1.8082551477156538e-06, - "loss": 0.9678, - "step": 26266 - }, - { - "epoch": 0.67, - "learning_rate": 1.808238854145966e-06, - "loss": 0.9551, - "step": 26267 - }, - { - "epoch": 0.67, - "learning_rate": 1.8082225599574468e-06, - "loss": 0.8574, - "step": 26268 - }, - { - "epoch": 0.67, - "learning_rate": 1.8082062651501087e-06, - "loss": 0.6387, - "step": 26269 - }, - { - "epoch": 0.67, - "learning_rate": 1.8081899697239642e-06, - "loss": 0.8623, - "step": 26270 - }, - { - "epoch": 0.67, - "learning_rate": 1.8081736736790259e-06, - "loss": 0.6689, - "step": 26271 - }, - { - "epoch": 0.67, - "learning_rate": 1.8081573770153063e-06, - "loss": 0.833, - "step": 26272 - }, - { - "epoch": 0.67, - "learning_rate": 1.8081410797328177e-06, - "loss": 0.9346, - "step": 26273 - }, - { - "epoch": 0.67, - "learning_rate": 1.8081247818315726e-06, - "loss": 0.7349, - "step": 26274 - }, - { - "epoch": 0.67, - "learning_rate": 1.8081084833115835e-06, - "loss": 0.6982, - "step": 26275 - }, - { - "epoch": 0.67, - "learning_rate": 1.8080921841728624e-06, - "loss": 0.8491, - "step": 26276 - }, - { - "epoch": 0.67, - "learning_rate": 1.808075884415423e-06, - "loss": 0.6011, - "step": 26277 - }, - { - "epoch": 0.67, - "learning_rate": 1.8080595840392767e-06, - "loss": 0.9814, - "step": 26278 - }, - { - "epoch": 0.67, - "learning_rate": 1.8080432830444363e-06, - "loss": 0.7852, - "step": 26279 - }, - { - "epoch": 0.67, - "learning_rate": 1.8080269814309145e-06, - "loss": 0.9355, - "step": 26280 - }, - { - "epoch": 0.67, - "learning_rate": 1.8080106791987234e-06, - "loss": 0.9004, - "step": 26281 - }, - { - "epoch": 0.67, - "learning_rate": 1.807994376347876e-06, - "loss": 0.7871, - "step": 26282 - }, - { - "epoch": 0.67, - "learning_rate": 1.8079780728783841e-06, - "loss": 0.8291, - "step": 26283 - }, - { - "epoch": 0.67, - "learning_rate": 1.8079617687902609e-06, - "loss": 0.8154, - "step": 26284 - }, - { - "epoch": 0.67, - "learning_rate": 1.8079454640835183e-06, - "loss": 0.9453, - "step": 26285 - }, - { - "epoch": 0.67, - "learning_rate": 1.8079291587581688e-06, - "loss": 0.9941, - "step": 26286 - }, - { - "epoch": 0.67, - "learning_rate": 1.8079128528142254e-06, - "loss": 0.7886, - "step": 26287 - }, - { - "epoch": 0.67, - "learning_rate": 1.8078965462517001e-06, - "loss": 0.8604, - "step": 26288 - }, - { - "epoch": 0.67, - "learning_rate": 1.8078802390706058e-06, - "loss": 0.8584, - "step": 26289 - }, - { - "epoch": 0.67, - "learning_rate": 1.8078639312709546e-06, - "loss": 0.7168, - "step": 26290 - }, - { - "epoch": 0.67, - "learning_rate": 1.8078476228527593e-06, - "loss": 0.6382, - "step": 26291 - }, - { - "epoch": 0.67, - "learning_rate": 1.807831313816032e-06, - "loss": 0.7529, - "step": 26292 - }, - { - "epoch": 0.67, - "learning_rate": 1.8078150041607854e-06, - "loss": 0.752, - "step": 26293 - }, - { - "epoch": 0.67, - "learning_rate": 1.8077986938870323e-06, - "loss": 1.0449, - "step": 26294 - }, - { - "epoch": 0.67, - "learning_rate": 1.8077823829947842e-06, - "loss": 0.8682, - "step": 26295 - }, - { - "epoch": 0.67, - "learning_rate": 1.8077660714840551e-06, - "loss": 0.8352, - "step": 26296 - }, - { - "epoch": 0.67, - "learning_rate": 1.807749759354856e-06, - "loss": 0.9062, - "step": 26297 - }, - { - "epoch": 0.67, - "learning_rate": 1.8077334466072003e-06, - "loss": 1.0098, - "step": 26298 - }, - { - "epoch": 0.67, - "learning_rate": 1.8077171332411006e-06, - "loss": 0.9756, - "step": 26299 - }, - { - "epoch": 0.67, - "learning_rate": 1.8077008192565684e-06, - "loss": 0.9834, - "step": 26300 - }, - { - "epoch": 0.67, - "learning_rate": 1.8076845046536172e-06, - "loss": 0.9629, - "step": 26301 - }, - { - "epoch": 0.67, - "learning_rate": 1.807668189432259e-06, - "loss": 0.6904, - "step": 26302 - }, - { - "epoch": 0.67, - "learning_rate": 1.8076518735925066e-06, - "loss": 0.8125, - "step": 26303 - }, - { - "epoch": 0.67, - "learning_rate": 1.8076355571343722e-06, - "loss": 0.687, - "step": 26304 - }, - { - "epoch": 0.67, - "learning_rate": 1.8076192400578682e-06, - "loss": 0.9092, - "step": 26305 - }, - { - "epoch": 0.67, - "learning_rate": 1.8076029223630075e-06, - "loss": 0.7236, - "step": 26306 - }, - { - "epoch": 0.67, - "learning_rate": 1.8075866040498023e-06, - "loss": 0.9521, - "step": 26307 - }, - { - "epoch": 0.67, - "learning_rate": 1.807570285118265e-06, - "loss": 0.8447, - "step": 26308 - }, - { - "epoch": 0.67, - "learning_rate": 1.8075539655684085e-06, - "loss": 0.9736, - "step": 26309 - }, - { - "epoch": 0.67, - "learning_rate": 1.807537645400245e-06, - "loss": 0.8643, - "step": 26310 - }, - { - "epoch": 0.67, - "learning_rate": 1.807521324613787e-06, - "loss": 1.0664, - "step": 26311 - }, - { - "epoch": 0.67, - "learning_rate": 1.807505003209047e-06, - "loss": 0.6953, - "step": 26312 - }, - { - "epoch": 0.67, - "learning_rate": 1.8074886811860376e-06, - "loss": 0.874, - "step": 26313 - }, - { - "epoch": 0.67, - "learning_rate": 1.8074723585447715e-06, - "loss": 0.6323, - "step": 26314 - }, - { - "epoch": 0.67, - "learning_rate": 1.8074560352852605e-06, - "loss": 0.7732, - "step": 26315 - }, - { - "epoch": 0.67, - "learning_rate": 1.807439711407518e-06, - "loss": 0.8047, - "step": 26316 - }, - { - "epoch": 0.67, - "learning_rate": 1.8074233869115559e-06, - "loss": 0.8506, - "step": 26317 - }, - { - "epoch": 0.67, - "learning_rate": 1.8074070617973866e-06, - "loss": 0.5996, - "step": 26318 - }, - { - "epoch": 0.67, - "learning_rate": 1.807390736065023e-06, - "loss": 0.55, - "step": 26319 - }, - { - "epoch": 0.67, - "learning_rate": 1.8073744097144777e-06, - "loss": 0.8584, - "step": 26320 - }, - { - "epoch": 0.67, - "learning_rate": 1.8073580827457624e-06, - "loss": 0.8262, - "step": 26321 - }, - { - "epoch": 0.67, - "learning_rate": 1.8073417551588905e-06, - "loss": 0.9551, - "step": 26322 - }, - { - "epoch": 0.67, - "learning_rate": 1.807325426953874e-06, - "loss": 0.7749, - "step": 26323 - }, - { - "epoch": 0.67, - "learning_rate": 1.8073090981307258e-06, - "loss": 0.9717, - "step": 26324 - }, - { - "epoch": 0.67, - "learning_rate": 1.8072927686894578e-06, - "loss": 0.6816, - "step": 26325 - }, - { - "epoch": 0.67, - "learning_rate": 1.807276438630083e-06, - "loss": 0.8887, - "step": 26326 - }, - { - "epoch": 0.67, - "learning_rate": 1.8072601079526138e-06, - "loss": 0.5869, - "step": 26327 - }, - { - "epoch": 0.67, - "learning_rate": 1.8072437766570625e-06, - "loss": 1.0508, - "step": 26328 - }, - { - "epoch": 0.67, - "learning_rate": 1.8072274447434417e-06, - "loss": 0.9307, - "step": 26329 - }, - { - "epoch": 0.67, - "learning_rate": 1.8072111122117643e-06, - "loss": 0.9961, - "step": 26330 - }, - { - "epoch": 0.67, - "learning_rate": 1.8071947790620422e-06, - "loss": 0.7373, - "step": 26331 - }, - { - "epoch": 0.67, - "learning_rate": 1.8071784452942883e-06, - "loss": 0.9912, - "step": 26332 - }, - { - "epoch": 0.67, - "learning_rate": 1.8071621109085149e-06, - "loss": 0.9121, - "step": 26333 - }, - { - "epoch": 0.67, - "learning_rate": 1.8071457759047347e-06, - "loss": 0.6396, - "step": 26334 - }, - { - "epoch": 0.67, - "learning_rate": 1.80712944028296e-06, - "loss": 1.0254, - "step": 26335 - }, - { - "epoch": 0.68, - "learning_rate": 1.8071131040432033e-06, - "loss": 0.7139, - "step": 26336 - }, - { - "epoch": 0.68, - "learning_rate": 1.8070967671854774e-06, - "loss": 0.9219, - "step": 26337 - }, - { - "epoch": 0.68, - "learning_rate": 1.8070804297097944e-06, - "loss": 0.8662, - "step": 26338 - }, - { - "epoch": 0.68, - "learning_rate": 1.8070640916161674e-06, - "loss": 0.9199, - "step": 26339 - }, - { - "epoch": 0.68, - "learning_rate": 1.8070477529046081e-06, - "loss": 0.7324, - "step": 26340 - }, - { - "epoch": 0.68, - "learning_rate": 1.8070314135751296e-06, - "loss": 0.6992, - "step": 26341 - }, - { - "epoch": 0.68, - "learning_rate": 1.8070150736277445e-06, - "loss": 0.8564, - "step": 26342 - }, - { - "epoch": 0.68, - "learning_rate": 1.8069987330624648e-06, - "loss": 0.8223, - "step": 26343 - }, - { - "epoch": 0.68, - "learning_rate": 1.8069823918793032e-06, - "loss": 0.9463, - "step": 26344 - }, - { - "epoch": 0.68, - "learning_rate": 1.8069660500782727e-06, - "loss": 0.751, - "step": 26345 - }, - { - "epoch": 0.68, - "learning_rate": 1.8069497076593849e-06, - "loss": 0.6519, - "step": 26346 - }, - { - "epoch": 0.68, - "learning_rate": 1.8069333646226532e-06, - "loss": 0.9385, - "step": 26347 - }, - { - "epoch": 0.68, - "learning_rate": 1.8069170209680895e-06, - "loss": 0.9062, - "step": 26348 - }, - { - "epoch": 0.68, - "learning_rate": 1.8069006766957066e-06, - "loss": 0.874, - "step": 26349 - }, - { - "epoch": 0.68, - "learning_rate": 1.806884331805517e-06, - "loss": 0.9512, - "step": 26350 - }, - { - "epoch": 0.68, - "learning_rate": 1.8068679862975332e-06, - "loss": 0.7466, - "step": 26351 - }, - { - "epoch": 0.68, - "learning_rate": 1.8068516401717674e-06, - "loss": 0.6846, - "step": 26352 - }, - { - "epoch": 0.68, - "learning_rate": 1.8068352934282328e-06, - "loss": 0.9385, - "step": 26353 - }, - { - "epoch": 0.68, - "learning_rate": 1.8068189460669413e-06, - "loss": 0.7217, - "step": 26354 - }, - { - "epoch": 0.68, - "learning_rate": 1.8068025980879056e-06, - "loss": 0.8906, - "step": 26355 - }, - { - "epoch": 0.68, - "learning_rate": 1.8067862494911383e-06, - "loss": 0.7241, - "step": 26356 - }, - { - "epoch": 0.68, - "learning_rate": 1.8067699002766518e-06, - "loss": 0.9365, - "step": 26357 - }, - { - "epoch": 0.68, - "learning_rate": 1.8067535504444588e-06, - "loss": 0.8066, - "step": 26358 - }, - { - "epoch": 0.68, - "learning_rate": 1.8067371999945718e-06, - "loss": 0.833, - "step": 26359 - }, - { - "epoch": 0.68, - "learning_rate": 1.8067208489270033e-06, - "loss": 0.7705, - "step": 26360 - }, - { - "epoch": 0.68, - "learning_rate": 1.8067044972417653e-06, - "loss": 0.9463, - "step": 26361 - }, - { - "epoch": 0.68, - "learning_rate": 1.806688144938871e-06, - "loss": 0.959, - "step": 26362 - }, - { - "epoch": 0.68, - "learning_rate": 1.8066717920183325e-06, - "loss": 0.8125, - "step": 26363 - }, - { - "epoch": 0.68, - "learning_rate": 1.8066554384801628e-06, - "loss": 0.9453, - "step": 26364 - }, - { - "epoch": 0.68, - "learning_rate": 1.806639084324374e-06, - "loss": 0.9199, - "step": 26365 - }, - { - "epoch": 0.68, - "learning_rate": 1.8066227295509786e-06, - "loss": 0.8652, - "step": 26366 - }, - { - "epoch": 0.68, - "learning_rate": 1.8066063741599895e-06, - "loss": 0.6909, - "step": 26367 - }, - { - "epoch": 0.68, - "learning_rate": 1.8065900181514188e-06, - "loss": 0.8623, - "step": 26368 - }, - { - "epoch": 0.68, - "learning_rate": 1.8065736615252793e-06, - "loss": 0.8008, - "step": 26369 - }, - { - "epoch": 0.68, - "learning_rate": 1.8065573042815835e-06, - "loss": 0.7178, - "step": 26370 - }, - { - "epoch": 0.68, - "learning_rate": 1.8065409464203438e-06, - "loss": 0.9043, - "step": 26371 - }, - { - "epoch": 0.68, - "learning_rate": 1.8065245879415728e-06, - "loss": 0.9697, - "step": 26372 - }, - { - "epoch": 0.68, - "learning_rate": 1.806508228845283e-06, - "loss": 0.8809, - "step": 26373 - }, - { - "epoch": 0.68, - "learning_rate": 1.8064918691314869e-06, - "loss": 0.75, - "step": 26374 - }, - { - "epoch": 0.68, - "learning_rate": 1.8064755088001968e-06, - "loss": 0.793, - "step": 26375 - }, - { - "epoch": 0.68, - "learning_rate": 1.806459147851426e-06, - "loss": 0.7812, - "step": 26376 - }, - { - "epoch": 0.68, - "learning_rate": 1.8064427862851862e-06, - "loss": 0.7197, - "step": 26377 - }, - { - "epoch": 0.68, - "learning_rate": 1.8064264241014903e-06, - "loss": 0.9746, - "step": 26378 - }, - { - "epoch": 0.68, - "learning_rate": 1.8064100613003508e-06, - "loss": 0.8037, - "step": 26379 - }, - { - "epoch": 0.68, - "learning_rate": 1.8063936978817802e-06, - "loss": 0.9482, - "step": 26380 - }, - { - "epoch": 0.68, - "learning_rate": 1.8063773338457908e-06, - "loss": 0.7061, - "step": 26381 - }, - { - "epoch": 0.68, - "learning_rate": 1.8063609691923959e-06, - "loss": 0.9629, - "step": 26382 - }, - { - "epoch": 0.68, - "learning_rate": 1.806344603921607e-06, - "loss": 0.8755, - "step": 26383 - }, - { - "epoch": 0.68, - "learning_rate": 1.806328238033437e-06, - "loss": 0.7852, - "step": 26384 - }, - { - "epoch": 0.68, - "learning_rate": 1.806311871527899e-06, - "loss": 1.0225, - "step": 26385 - }, - { - "epoch": 0.68, - "learning_rate": 1.8062955044050047e-06, - "loss": 1.0225, - "step": 26386 - }, - { - "epoch": 0.68, - "learning_rate": 1.8062791366647674e-06, - "loss": 0.7988, - "step": 26387 - }, - { - "epoch": 0.68, - "learning_rate": 1.806262768307199e-06, - "loss": 0.7275, - "step": 26388 - }, - { - "epoch": 0.68, - "learning_rate": 1.8062463993323122e-06, - "loss": 0.7686, - "step": 26389 - }, - { - "epoch": 0.68, - "learning_rate": 1.8062300297401195e-06, - "loss": 0.7969, - "step": 26390 - }, - { - "epoch": 0.68, - "learning_rate": 1.806213659530634e-06, - "loss": 0.7859, - "step": 26391 - }, - { - "epoch": 0.68, - "learning_rate": 1.8061972887038675e-06, - "loss": 0.7588, - "step": 26392 - }, - { - "epoch": 0.68, - "learning_rate": 1.8061809172598327e-06, - "loss": 0.7695, - "step": 26393 - }, - { - "epoch": 0.68, - "learning_rate": 1.8061645451985424e-06, - "loss": 0.79, - "step": 26394 - }, - { - "epoch": 0.68, - "learning_rate": 1.8061481725200088e-06, - "loss": 0.8135, - "step": 26395 - }, - { - "epoch": 0.68, - "learning_rate": 1.8061317992242446e-06, - "loss": 0.8652, - "step": 26396 - }, - { - "epoch": 0.68, - "learning_rate": 1.8061154253112627e-06, - "loss": 0.8721, - "step": 26397 - }, - { - "epoch": 0.68, - "learning_rate": 1.806099050781075e-06, - "loss": 0.6992, - "step": 26398 - }, - { - "epoch": 0.68, - "learning_rate": 1.8060826756336945e-06, - "loss": 0.9062, - "step": 26399 - }, - { - "epoch": 0.68, - "learning_rate": 1.8060662998691333e-06, - "loss": 0.9434, - "step": 26400 - }, - { - "epoch": 0.68, - "learning_rate": 1.8060499234874045e-06, - "loss": 0.8311, - "step": 26401 - }, - { - "epoch": 0.68, - "learning_rate": 1.80603354648852e-06, - "loss": 0.8857, - "step": 26402 - }, - { - "epoch": 0.68, - "learning_rate": 1.806017168872493e-06, - "loss": 0.8311, - "step": 26403 - }, - { - "epoch": 0.68, - "learning_rate": 1.8060007906393354e-06, - "loss": 0.9814, - "step": 26404 - }, - { - "epoch": 0.68, - "learning_rate": 1.8059844117890604e-06, - "loss": 0.8262, - "step": 26405 - }, - { - "epoch": 0.68, - "learning_rate": 1.8059680323216798e-06, - "loss": 0.8276, - "step": 26406 - }, - { - "epoch": 0.68, - "learning_rate": 1.8059516522372068e-06, - "loss": 0.8613, - "step": 26407 - }, - { - "epoch": 0.68, - "learning_rate": 1.8059352715356538e-06, - "loss": 0.9863, - "step": 26408 - }, - { - "epoch": 0.68, - "learning_rate": 1.805918890217033e-06, - "loss": 1.0117, - "step": 26409 - }, - { - "epoch": 0.68, - "learning_rate": 1.8059025082813572e-06, - "loss": 0.9614, - "step": 26410 - }, - { - "epoch": 0.68, - "learning_rate": 1.805886125728639e-06, - "loss": 0.8389, - "step": 26411 - }, - { - "epoch": 0.68, - "learning_rate": 1.8058697425588906e-06, - "loss": 0.7031, - "step": 26412 - }, - { - "epoch": 0.68, - "learning_rate": 1.805853358772125e-06, - "loss": 1.0635, - "step": 26413 - }, - { - "epoch": 0.68, - "learning_rate": 1.8058369743683545e-06, - "loss": 0.8486, - "step": 26414 - }, - { - "epoch": 0.68, - "learning_rate": 1.8058205893475918e-06, - "loss": 0.96, - "step": 26415 - }, - { - "epoch": 0.68, - "learning_rate": 1.805804203709849e-06, - "loss": 0.9766, - "step": 26416 - }, - { - "epoch": 0.68, - "learning_rate": 1.8057878174551395e-06, - "loss": 0.645, - "step": 26417 - }, - { - "epoch": 0.68, - "learning_rate": 1.805771430583475e-06, - "loss": 0.7295, - "step": 26418 - }, - { - "epoch": 0.68, - "learning_rate": 1.8057550430948683e-06, - "loss": 0.7324, - "step": 26419 - }, - { - "epoch": 0.68, - "learning_rate": 1.8057386549893321e-06, - "loss": 0.7571, - "step": 26420 - }, - { - "epoch": 0.68, - "learning_rate": 1.805722266266879e-06, - "loss": 0.8594, - "step": 26421 - }, - { - "epoch": 0.68, - "learning_rate": 1.805705876927521e-06, - "loss": 0.8506, - "step": 26422 - }, - { - "epoch": 0.68, - "learning_rate": 1.8056894869712714e-06, - "loss": 0.8145, - "step": 26423 - }, - { - "epoch": 0.68, - "learning_rate": 1.8056730963981423e-06, - "loss": 0.7939, - "step": 26424 - }, - { - "epoch": 0.68, - "learning_rate": 1.8056567052081464e-06, - "loss": 0.8555, - "step": 26425 - }, - { - "epoch": 0.68, - "learning_rate": 1.8056403134012964e-06, - "loss": 0.8154, - "step": 26426 - }, - { - "epoch": 0.68, - "learning_rate": 1.805623920977604e-06, - "loss": 0.6304, - "step": 26427 - }, - { - "epoch": 0.68, - "learning_rate": 1.8056075279370831e-06, - "loss": 0.9717, - "step": 26428 - }, - { - "epoch": 0.68, - "learning_rate": 1.8055911342797453e-06, - "loss": 0.6558, - "step": 26429 - }, - { - "epoch": 0.68, - "learning_rate": 1.8055747400056033e-06, - "loss": 0.7764, - "step": 26430 - }, - { - "epoch": 0.68, - "learning_rate": 1.8055583451146702e-06, - "loss": 0.814, - "step": 26431 - }, - { - "epoch": 0.68, - "learning_rate": 1.8055419496069577e-06, - "loss": 0.7114, - "step": 26432 - }, - { - "epoch": 0.68, - "learning_rate": 1.8055255534824786e-06, - "loss": 0.6299, - "step": 26433 - }, - { - "epoch": 0.68, - "learning_rate": 1.805509156741246e-06, - "loss": 0.7842, - "step": 26434 - }, - { - "epoch": 0.68, - "learning_rate": 1.8054927593832718e-06, - "loss": 0.4966, - "step": 26435 - }, - { - "epoch": 0.68, - "learning_rate": 1.8054763614085693e-06, - "loss": 0.9834, - "step": 26436 - }, - { - "epoch": 0.68, - "learning_rate": 1.8054599628171502e-06, - "loss": 1.0186, - "step": 26437 - }, - { - "epoch": 0.68, - "learning_rate": 1.8054435636090275e-06, - "loss": 0.8064, - "step": 26438 - }, - { - "epoch": 0.68, - "learning_rate": 1.8054271637842139e-06, - "loss": 0.9399, - "step": 26439 - }, - { - "epoch": 0.68, - "learning_rate": 1.8054107633427213e-06, - "loss": 0.8555, - "step": 26440 - }, - { - "epoch": 0.68, - "learning_rate": 1.805394362284563e-06, - "loss": 0.8701, - "step": 26441 - }, - { - "epoch": 0.68, - "learning_rate": 1.8053779606097513e-06, - "loss": 0.8945, - "step": 26442 - }, - { - "epoch": 0.68, - "learning_rate": 1.8053615583182987e-06, - "loss": 0.752, - "step": 26443 - }, - { - "epoch": 0.68, - "learning_rate": 1.805345155410218e-06, - "loss": 0.8994, - "step": 26444 - }, - { - "epoch": 0.68, - "learning_rate": 1.8053287518855212e-06, - "loss": 0.7754, - "step": 26445 - }, - { - "epoch": 0.68, - "learning_rate": 1.805312347744221e-06, - "loss": 0.6875, - "step": 26446 - }, - { - "epoch": 0.68, - "learning_rate": 1.805295942986331e-06, - "loss": 0.7832, - "step": 26447 - }, - { - "epoch": 0.68, - "learning_rate": 1.8052795376118622e-06, - "loss": 0.877, - "step": 26448 - }, - { - "epoch": 0.68, - "learning_rate": 1.805263131620828e-06, - "loss": 0.6953, - "step": 26449 - }, - { - "epoch": 0.68, - "learning_rate": 1.805246725013241e-06, - "loss": 0.9639, - "step": 26450 - }, - { - "epoch": 0.68, - "learning_rate": 1.8052303177891135e-06, - "loss": 0.917, - "step": 26451 - }, - { - "epoch": 0.68, - "learning_rate": 1.8052139099484582e-06, - "loss": 1.1172, - "step": 26452 - }, - { - "epoch": 0.68, - "learning_rate": 1.8051975014912876e-06, - "loss": 0.8618, - "step": 26453 - }, - { - "epoch": 0.68, - "learning_rate": 1.8051810924176145e-06, - "loss": 0.8213, - "step": 26454 - }, - { - "epoch": 0.68, - "learning_rate": 1.8051646827274508e-06, - "loss": 1.082, - "step": 26455 - }, - { - "epoch": 0.68, - "learning_rate": 1.8051482724208103e-06, - "loss": 0.7144, - "step": 26456 - }, - { - "epoch": 0.68, - "learning_rate": 1.805131861497704e-06, - "loss": 0.9023, - "step": 26457 - }, - { - "epoch": 0.68, - "learning_rate": 1.8051154499581458e-06, - "loss": 0.9658, - "step": 26458 - }, - { - "epoch": 0.68, - "learning_rate": 1.8050990378021473e-06, - "loss": 0.5981, - "step": 26459 - }, - { - "epoch": 0.68, - "learning_rate": 1.8050826250297218e-06, - "loss": 0.9258, - "step": 26460 - }, - { - "epoch": 0.68, - "learning_rate": 1.8050662116408815e-06, - "loss": 0.8975, - "step": 26461 - }, - { - "epoch": 0.68, - "learning_rate": 1.8050497976356391e-06, - "loss": 0.9805, - "step": 26462 - }, - { - "epoch": 0.68, - "learning_rate": 1.805033383014007e-06, - "loss": 0.8604, - "step": 26463 - }, - { - "epoch": 0.68, - "learning_rate": 1.8050169677759977e-06, - "loss": 0.8477, - "step": 26464 - }, - { - "epoch": 0.68, - "learning_rate": 1.805000551921624e-06, - "loss": 0.8633, - "step": 26465 - }, - { - "epoch": 0.68, - "learning_rate": 1.8049841354508983e-06, - "loss": 0.8613, - "step": 26466 - }, - { - "epoch": 0.68, - "learning_rate": 1.8049677183638333e-06, - "loss": 1.1426, - "step": 26467 - }, - { - "epoch": 0.68, - "learning_rate": 1.8049513006604418e-06, - "loss": 0.873, - "step": 26468 - }, - { - "epoch": 0.68, - "learning_rate": 1.8049348823407357e-06, - "loss": 0.6055, - "step": 26469 - }, - { - "epoch": 0.68, - "learning_rate": 1.8049184634047283e-06, - "loss": 0.8623, - "step": 26470 - }, - { - "epoch": 0.68, - "learning_rate": 1.804902043852432e-06, - "loss": 0.7822, - "step": 26471 - }, - { - "epoch": 0.68, - "learning_rate": 1.8048856236838587e-06, - "loss": 0.501, - "step": 26472 - }, - { - "epoch": 0.68, - "learning_rate": 1.8048692028990219e-06, - "loss": 0.9175, - "step": 26473 - }, - { - "epoch": 0.68, - "learning_rate": 1.8048527814979336e-06, - "loss": 1.0449, - "step": 26474 - }, - { - "epoch": 0.68, - "learning_rate": 1.8048363594806064e-06, - "loss": 0.8203, - "step": 26475 - }, - { - "epoch": 0.68, - "learning_rate": 1.8048199368470535e-06, - "loss": 0.4724, - "step": 26476 - }, - { - "epoch": 0.68, - "learning_rate": 1.8048035135972863e-06, - "loss": 0.748, - "step": 26477 - }, - { - "epoch": 0.68, - "learning_rate": 1.8047870897313184e-06, - "loss": 0.708, - "step": 26478 - }, - { - "epoch": 0.68, - "learning_rate": 1.8047706652491618e-06, - "loss": 0.7363, - "step": 26479 - }, - { - "epoch": 0.68, - "learning_rate": 1.8047542401508298e-06, - "loss": 0.9004, - "step": 26480 - }, - { - "epoch": 0.68, - "learning_rate": 1.8047378144363342e-06, - "loss": 0.7773, - "step": 26481 - }, - { - "epoch": 0.68, - "learning_rate": 1.8047213881056878e-06, - "loss": 0.8291, - "step": 26482 - }, - { - "epoch": 0.68, - "learning_rate": 1.8047049611589031e-06, - "loss": 0.9199, - "step": 26483 - }, - { - "epoch": 0.68, - "learning_rate": 1.8046885335959932e-06, - "loss": 0.7568, - "step": 26484 - }, - { - "epoch": 0.68, - "learning_rate": 1.80467210541697e-06, - "loss": 0.7065, - "step": 26485 - }, - { - "epoch": 0.68, - "learning_rate": 1.8046556766218463e-06, - "loss": 1.0908, - "step": 26486 - }, - { - "epoch": 0.68, - "learning_rate": 1.8046392472106349e-06, - "loss": 0.873, - "step": 26487 - }, - { - "epoch": 0.68, - "learning_rate": 1.8046228171833482e-06, - "loss": 0.9883, - "step": 26488 - }, - { - "epoch": 0.68, - "learning_rate": 1.804606386539999e-06, - "loss": 0.74, - "step": 26489 - }, - { - "epoch": 0.68, - "learning_rate": 1.8045899552805995e-06, - "loss": 0.9814, - "step": 26490 - }, - { - "epoch": 0.68, - "learning_rate": 1.8045735234051626e-06, - "loss": 0.9023, - "step": 26491 - }, - { - "epoch": 0.68, - "learning_rate": 1.8045570909137004e-06, - "loss": 0.9082, - "step": 26492 - }, - { - "epoch": 0.68, - "learning_rate": 1.8045406578062261e-06, - "loss": 0.8008, - "step": 26493 - }, - { - "epoch": 0.68, - "learning_rate": 1.804524224082752e-06, - "loss": 0.9092, - "step": 26494 - }, - { - "epoch": 0.68, - "learning_rate": 1.8045077897432907e-06, - "loss": 0.8906, - "step": 26495 - }, - { - "epoch": 0.68, - "learning_rate": 1.8044913547878548e-06, - "loss": 1.001, - "step": 26496 - }, - { - "epoch": 0.68, - "learning_rate": 1.804474919216457e-06, - "loss": 0.6318, - "step": 26497 - }, - { - "epoch": 0.68, - "learning_rate": 1.8044584830291095e-06, - "loss": 0.8809, - "step": 26498 - }, - { - "epoch": 0.68, - "learning_rate": 1.8044420462258252e-06, - "loss": 0.6772, - "step": 26499 - }, - { - "epoch": 0.68, - "learning_rate": 1.8044256088066165e-06, - "loss": 0.666, - "step": 26500 - }, - { - "epoch": 0.68, - "learning_rate": 1.8044091707714963e-06, - "loss": 0.8018, - "step": 26501 - }, - { - "epoch": 0.68, - "learning_rate": 1.8043927321204768e-06, - "loss": 0.8086, - "step": 26502 - }, - { - "epoch": 0.68, - "learning_rate": 1.804376292853571e-06, - "loss": 0.9209, - "step": 26503 - }, - { - "epoch": 0.68, - "learning_rate": 1.8043598529707911e-06, - "loss": 0.7749, - "step": 26504 - }, - { - "epoch": 0.68, - "learning_rate": 1.8043434124721499e-06, - "loss": 0.8809, - "step": 26505 - }, - { - "epoch": 0.68, - "learning_rate": 1.8043269713576596e-06, - "loss": 0.6895, - "step": 26506 - }, - { - "epoch": 0.68, - "learning_rate": 1.8043105296273336e-06, - "loss": 0.7959, - "step": 26507 - }, - { - "epoch": 0.68, - "learning_rate": 1.8042940872811839e-06, - "loss": 0.7861, - "step": 26508 - }, - { - "epoch": 0.68, - "learning_rate": 1.804277644319223e-06, - "loss": 0.7793, - "step": 26509 - }, - { - "epoch": 0.68, - "learning_rate": 1.8042612007414637e-06, - "loss": 0.8213, - "step": 26510 - }, - { - "epoch": 0.68, - "learning_rate": 1.804244756547919e-06, - "loss": 0.7861, - "step": 26511 - }, - { - "epoch": 0.68, - "learning_rate": 1.8042283117386008e-06, - "loss": 0.9404, - "step": 26512 - }, - { - "epoch": 0.68, - "learning_rate": 1.8042118663135217e-06, - "loss": 1.0029, - "step": 26513 - }, - { - "epoch": 0.68, - "learning_rate": 1.8041954202726948e-06, - "loss": 0.8652, - "step": 26514 - }, - { - "epoch": 0.68, - "learning_rate": 1.8041789736161323e-06, - "loss": 0.8145, - "step": 26515 - }, - { - "epoch": 0.68, - "learning_rate": 1.8041625263438473e-06, - "loss": 0.4768, - "step": 26516 - }, - { - "epoch": 0.68, - "learning_rate": 1.8041460784558518e-06, - "loss": 0.665, - "step": 26517 - }, - { - "epoch": 0.68, - "learning_rate": 1.8041296299521587e-06, - "loss": 0.6768, - "step": 26518 - }, - { - "epoch": 0.68, - "learning_rate": 1.8041131808327803e-06, - "loss": 0.8604, - "step": 26519 - }, - { - "epoch": 0.68, - "learning_rate": 1.8040967310977297e-06, - "loss": 0.7998, - "step": 26520 - }, - { - "epoch": 0.68, - "learning_rate": 1.804080280747019e-06, - "loss": 0.7021, - "step": 26521 - }, - { - "epoch": 0.68, - "learning_rate": 1.8040638297806611e-06, - "loss": 0.6431, - "step": 26522 - }, - { - "epoch": 0.68, - "learning_rate": 1.8040473781986685e-06, - "loss": 0.9102, - "step": 26523 - }, - { - "epoch": 0.68, - "learning_rate": 1.8040309260010535e-06, - "loss": 0.9121, - "step": 26524 - }, - { - "epoch": 0.68, - "learning_rate": 1.8040144731878292e-06, - "loss": 0.9463, - "step": 26525 - }, - { - "epoch": 0.68, - "learning_rate": 1.8039980197590081e-06, - "loss": 0.6553, - "step": 26526 - }, - { - "epoch": 0.68, - "learning_rate": 1.8039815657146027e-06, - "loss": 0.9961, - "step": 26527 - }, - { - "epoch": 0.68, - "learning_rate": 1.8039651110546256e-06, - "loss": 0.4666, - "step": 26528 - }, - { - "epoch": 0.68, - "learning_rate": 1.8039486557790893e-06, - "loss": 0.553, - "step": 26529 - }, - { - "epoch": 0.68, - "learning_rate": 1.8039321998880063e-06, - "loss": 0.8794, - "step": 26530 - }, - { - "epoch": 0.68, - "learning_rate": 1.8039157433813895e-06, - "loss": 0.6924, - "step": 26531 - }, - { - "epoch": 0.68, - "learning_rate": 1.8038992862592515e-06, - "loss": 0.8711, - "step": 26532 - }, - { - "epoch": 0.68, - "learning_rate": 1.8038828285216048e-06, - "loss": 0.7412, - "step": 26533 - }, - { - "epoch": 0.68, - "learning_rate": 1.8038663701684617e-06, - "loss": 0.873, - "step": 26534 - }, - { - "epoch": 0.68, - "learning_rate": 1.8038499111998353e-06, - "loss": 0.999, - "step": 26535 - }, - { - "epoch": 0.68, - "learning_rate": 1.803833451615738e-06, - "loss": 0.8428, - "step": 26536 - }, - { - "epoch": 0.68, - "learning_rate": 1.8038169914161823e-06, - "loss": 0.585, - "step": 26537 - }, - { - "epoch": 0.68, - "learning_rate": 1.803800530601181e-06, - "loss": 0.8774, - "step": 26538 - }, - { - "epoch": 0.68, - "learning_rate": 1.8037840691707465e-06, - "loss": 0.9902, - "step": 26539 - }, - { - "epoch": 0.68, - "learning_rate": 1.8037676071248915e-06, - "loss": 1.0166, - "step": 26540 - }, - { - "epoch": 0.68, - "learning_rate": 1.8037511444636286e-06, - "loss": 0.8955, - "step": 26541 - }, - { - "epoch": 0.68, - "learning_rate": 1.8037346811869704e-06, - "loss": 0.8125, - "step": 26542 - }, - { - "epoch": 0.68, - "learning_rate": 1.8037182172949294e-06, - "loss": 0.8569, - "step": 26543 - }, - { - "epoch": 0.68, - "learning_rate": 1.8037017527875187e-06, - "loss": 0.8379, - "step": 26544 - }, - { - "epoch": 0.68, - "learning_rate": 1.80368528766475e-06, - "loss": 0.96, - "step": 26545 - }, - { - "epoch": 0.68, - "learning_rate": 1.803668821926637e-06, - "loss": 0.793, - "step": 26546 - }, - { - "epoch": 0.68, - "learning_rate": 1.8036523555731913e-06, - "loss": 0.6216, - "step": 26547 - }, - { - "epoch": 0.68, - "learning_rate": 1.8036358886044263e-06, - "loss": 0.5903, - "step": 26548 - }, - { - "epoch": 0.68, - "learning_rate": 1.803619421020354e-06, - "loss": 0.8428, - "step": 26549 - }, - { - "epoch": 0.68, - "learning_rate": 1.803602952820987e-06, - "loss": 0.5652, - "step": 26550 - }, - { - "epoch": 0.68, - "learning_rate": 1.8035864840063386e-06, - "loss": 0.6675, - "step": 26551 - }, - { - "epoch": 0.68, - "learning_rate": 1.803570014576421e-06, - "loss": 0.646, - "step": 26552 - }, - { - "epoch": 0.68, - "learning_rate": 1.8035535445312466e-06, - "loss": 0.9585, - "step": 26553 - }, - { - "epoch": 0.68, - "learning_rate": 1.8035370738708279e-06, - "loss": 1.0879, - "step": 26554 - }, - { - "epoch": 0.68, - "learning_rate": 1.8035206025951785e-06, - "loss": 0.52, - "step": 26555 - }, - { - "epoch": 0.68, - "learning_rate": 1.8035041307043097e-06, - "loss": 1.0029, - "step": 26556 - }, - { - "epoch": 0.68, - "learning_rate": 1.803487658198235e-06, - "loss": 0.6528, - "step": 26557 - }, - { - "epoch": 0.68, - "learning_rate": 1.803471185076967e-06, - "loss": 0.7939, - "step": 26558 - }, - { - "epoch": 0.68, - "learning_rate": 1.803454711340518e-06, - "loss": 0.7583, - "step": 26559 - }, - { - "epoch": 0.68, - "learning_rate": 1.8034382369889003e-06, - "loss": 0.9961, - "step": 26560 - }, - { - "epoch": 0.68, - "learning_rate": 1.8034217620221267e-06, - "loss": 1.0293, - "step": 26561 - }, - { - "epoch": 0.68, - "learning_rate": 1.8034052864402107e-06, - "loss": 0.8193, - "step": 26562 - }, - { - "epoch": 0.68, - "learning_rate": 1.8033888102431637e-06, - "loss": 0.7725, - "step": 26563 - }, - { - "epoch": 0.68, - "learning_rate": 1.8033723334309992e-06, - "loss": 0.7529, - "step": 26564 - }, - { - "epoch": 0.68, - "learning_rate": 1.803355856003729e-06, - "loss": 0.9893, - "step": 26565 - }, - { - "epoch": 0.68, - "learning_rate": 1.8033393779613667e-06, - "loss": 0.7676, - "step": 26566 - }, - { - "epoch": 0.68, - "learning_rate": 1.8033228993039238e-06, - "loss": 0.8066, - "step": 26567 - }, - { - "epoch": 0.68, - "learning_rate": 1.803306420031414e-06, - "loss": 0.6909, - "step": 26568 - }, - { - "epoch": 0.68, - "learning_rate": 1.803289940143849e-06, - "loss": 0.8691, - "step": 26569 - }, - { - "epoch": 0.68, - "learning_rate": 1.8032734596412422e-06, - "loss": 0.874, - "step": 26570 - }, - { - "epoch": 0.68, - "learning_rate": 1.8032569785236057e-06, - "loss": 0.8398, - "step": 26571 - }, - { - "epoch": 0.68, - "learning_rate": 1.803240496790952e-06, - "loss": 0.7573, - "step": 26572 - }, - { - "epoch": 0.68, - "learning_rate": 1.8032240144432943e-06, - "loss": 1.0273, - "step": 26573 - }, - { - "epoch": 0.68, - "learning_rate": 1.8032075314806447e-06, - "loss": 0.9473, - "step": 26574 - }, - { - "epoch": 0.68, - "learning_rate": 1.8031910479030163e-06, - "loss": 0.8975, - "step": 26575 - }, - { - "epoch": 0.68, - "learning_rate": 1.8031745637104213e-06, - "loss": 0.8535, - "step": 26576 - }, - { - "epoch": 0.68, - "learning_rate": 1.8031580789028725e-06, - "loss": 0.8003, - "step": 26577 - }, - { - "epoch": 0.68, - "learning_rate": 1.8031415934803824e-06, - "loss": 0.875, - "step": 26578 - }, - { - "epoch": 0.68, - "learning_rate": 1.8031251074429638e-06, - "loss": 0.6094, - "step": 26579 - }, - { - "epoch": 0.68, - "learning_rate": 1.8031086207906289e-06, - "loss": 0.5883, - "step": 26580 - }, - { - "epoch": 0.68, - "learning_rate": 1.8030921335233913e-06, - "loss": 0.9033, - "step": 26581 - }, - { - "epoch": 0.68, - "learning_rate": 1.8030756456412626e-06, - "loss": 0.834, - "step": 26582 - }, - { - "epoch": 0.68, - "learning_rate": 1.803059157144256e-06, - "loss": 1.0713, - "step": 26583 - }, - { - "epoch": 0.68, - "learning_rate": 1.8030426680323837e-06, - "loss": 0.6406, - "step": 26584 - }, - { - "epoch": 0.68, - "learning_rate": 1.8030261783056584e-06, - "loss": 0.915, - "step": 26585 - }, - { - "epoch": 0.68, - "learning_rate": 1.803009687964093e-06, - "loss": 0.6758, - "step": 26586 - }, - { - "epoch": 0.68, - "learning_rate": 1.8029931970077e-06, - "loss": 0.7314, - "step": 26587 - }, - { - "epoch": 0.68, - "learning_rate": 1.8029767054364924e-06, - "loss": 0.6099, - "step": 26588 - }, - { - "epoch": 0.68, - "learning_rate": 1.8029602132504822e-06, - "loss": 0.5947, - "step": 26589 - }, - { - "epoch": 0.68, - "learning_rate": 1.8029437204496823e-06, - "loss": 0.877, - "step": 26590 - }, - { - "epoch": 0.68, - "learning_rate": 1.8029272270341053e-06, - "loss": 0.834, - "step": 26591 - }, - { - "epoch": 0.68, - "learning_rate": 1.8029107330037638e-06, - "loss": 0.8838, - "step": 26592 - }, - { - "epoch": 0.68, - "learning_rate": 1.8028942383586708e-06, - "loss": 0.8525, - "step": 26593 - }, - { - "epoch": 0.68, - "learning_rate": 1.802877743098838e-06, - "loss": 0.8652, - "step": 26594 - }, - { - "epoch": 0.68, - "learning_rate": 1.802861247224279e-06, - "loss": 0.8398, - "step": 26595 - }, - { - "epoch": 0.68, - "learning_rate": 1.8028447507350059e-06, - "loss": 0.9531, - "step": 26596 - }, - { - "epoch": 0.68, - "learning_rate": 1.8028282536310315e-06, - "loss": 0.791, - "step": 26597 - }, - { - "epoch": 0.68, - "learning_rate": 1.8028117559123687e-06, - "loss": 0.8799, - "step": 26598 - }, - { - "epoch": 0.68, - "learning_rate": 1.8027952575790298e-06, - "loss": 0.7866, - "step": 26599 - }, - { - "epoch": 0.68, - "learning_rate": 1.8027787586310272e-06, - "loss": 0.8652, - "step": 26600 - }, - { - "epoch": 0.68, - "learning_rate": 1.802762259068374e-06, - "loss": 0.6741, - "step": 26601 - }, - { - "epoch": 0.68, - "learning_rate": 1.8027457588910826e-06, - "loss": 1.0547, - "step": 26602 - }, - { - "epoch": 0.68, - "learning_rate": 1.8027292580991657e-06, - "loss": 0.8252, - "step": 26603 - }, - { - "epoch": 0.68, - "learning_rate": 1.8027127566926358e-06, - "loss": 0.8203, - "step": 26604 - }, - { - "epoch": 0.68, - "learning_rate": 1.8026962546715056e-06, - "loss": 0.6934, - "step": 26605 - }, - { - "epoch": 0.68, - "learning_rate": 1.8026797520357881e-06, - "loss": 0.9053, - "step": 26606 - }, - { - "epoch": 0.68, - "learning_rate": 1.8026632487854956e-06, - "loss": 0.9443, - "step": 26607 - }, - { - "epoch": 0.68, - "learning_rate": 1.8026467449206406e-06, - "loss": 0.915, - "step": 26608 - }, - { - "epoch": 0.68, - "learning_rate": 1.8026302404412359e-06, - "loss": 0.8506, - "step": 26609 - }, - { - "epoch": 0.68, - "learning_rate": 1.8026137353472942e-06, - "loss": 0.7695, - "step": 26610 - }, - { - "epoch": 0.68, - "learning_rate": 1.802597229638828e-06, - "loss": 0.7422, - "step": 26611 - }, - { - "epoch": 0.68, - "learning_rate": 1.80258072331585e-06, - "loss": 0.9707, - "step": 26612 - }, - { - "epoch": 0.68, - "learning_rate": 1.802564216378373e-06, - "loss": 0.8037, - "step": 26613 - }, - { - "epoch": 0.68, - "learning_rate": 1.8025477088264091e-06, - "loss": 0.7539, - "step": 26614 - }, - { - "epoch": 0.68, - "learning_rate": 1.8025312006599719e-06, - "loss": 0.877, - "step": 26615 - }, - { - "epoch": 0.68, - "learning_rate": 1.802514691879073e-06, - "loss": 0.8799, - "step": 26616 - }, - { - "epoch": 0.68, - "learning_rate": 1.8024981824837258e-06, - "loss": 0.9697, - "step": 26617 - }, - { - "epoch": 0.68, - "learning_rate": 1.8024816724739424e-06, - "loss": 0.8115, - "step": 26618 - }, - { - "epoch": 0.68, - "learning_rate": 1.8024651618497354e-06, - "loss": 0.7607, - "step": 26619 - }, - { - "epoch": 0.68, - "learning_rate": 1.8024486506111184e-06, - "loss": 0.9482, - "step": 26620 - }, - { - "epoch": 0.68, - "learning_rate": 1.802432138758103e-06, - "loss": 0.7837, - "step": 26621 - }, - { - "epoch": 0.68, - "learning_rate": 1.8024156262907022e-06, - "loss": 0.9033, - "step": 26622 - }, - { - "epoch": 0.68, - "learning_rate": 1.8023991132089287e-06, - "loss": 0.8848, - "step": 26623 - }, - { - "epoch": 0.68, - "learning_rate": 1.802382599512795e-06, - "loss": 0.8213, - "step": 26624 - }, - { - "epoch": 0.68, - "learning_rate": 1.8023660852023142e-06, - "loss": 0.7612, - "step": 26625 - }, - { - "epoch": 0.68, - "learning_rate": 1.8023495702774983e-06, - "loss": 0.5889, - "step": 26626 - }, - { - "epoch": 0.68, - "learning_rate": 1.8023330547383602e-06, - "loss": 0.9541, - "step": 26627 - }, - { - "epoch": 0.68, - "learning_rate": 1.8023165385849126e-06, - "loss": 0.6699, - "step": 26628 - }, - { - "epoch": 0.68, - "learning_rate": 1.8023000218171683e-06, - "loss": 0.9082, - "step": 26629 - }, - { - "epoch": 0.68, - "learning_rate": 1.8022835044351394e-06, - "loss": 0.9199, - "step": 26630 - }, - { - "epoch": 0.68, - "learning_rate": 1.8022669864388393e-06, - "loss": 0.749, - "step": 26631 - }, - { - "epoch": 0.68, - "learning_rate": 1.80225046782828e-06, - "loss": 1.0713, - "step": 26632 - }, - { - "epoch": 0.68, - "learning_rate": 1.8022339486034745e-06, - "loss": 0.8174, - "step": 26633 - }, - { - "epoch": 0.68, - "learning_rate": 1.8022174287644354e-06, - "loss": 1.1494, - "step": 26634 - }, - { - "epoch": 0.68, - "learning_rate": 1.8022009083111751e-06, - "loss": 0.9619, - "step": 26635 - }, - { - "epoch": 0.68, - "learning_rate": 1.8021843872437067e-06, - "loss": 0.8799, - "step": 26636 - }, - { - "epoch": 0.68, - "learning_rate": 1.8021678655620424e-06, - "loss": 0.7861, - "step": 26637 - }, - { - "epoch": 0.68, - "learning_rate": 1.8021513432661952e-06, - "loss": 0.709, - "step": 26638 - }, - { - "epoch": 0.68, - "learning_rate": 1.8021348203561777e-06, - "loss": 0.7656, - "step": 26639 - }, - { - "epoch": 0.68, - "learning_rate": 1.802118296832002e-06, - "loss": 0.7461, - "step": 26640 - }, - { - "epoch": 0.68, - "learning_rate": 1.8021017726936816e-06, - "loss": 0.7744, - "step": 26641 - }, - { - "epoch": 0.68, - "learning_rate": 1.8020852479412288e-06, - "loss": 0.7588, - "step": 26642 - }, - { - "epoch": 0.68, - "learning_rate": 1.8020687225746559e-06, - "loss": 0.835, - "step": 26643 - }, - { - "epoch": 0.68, - "learning_rate": 1.8020521965939758e-06, - "loss": 0.873, - "step": 26644 - }, - { - "epoch": 0.68, - "learning_rate": 1.8020356699992013e-06, - "loss": 0.9316, - "step": 26645 - }, - { - "epoch": 0.68, - "learning_rate": 1.8020191427903453e-06, - "loss": 0.6826, - "step": 26646 - }, - { - "epoch": 0.68, - "learning_rate": 1.8020026149674199e-06, - "loss": 0.6274, - "step": 26647 - }, - { - "epoch": 0.68, - "learning_rate": 1.801986086530438e-06, - "loss": 0.8643, - "step": 26648 - }, - { - "epoch": 0.68, - "learning_rate": 1.8019695574794125e-06, - "loss": 0.9805, - "step": 26649 - }, - { - "epoch": 0.68, - "learning_rate": 1.8019530278143553e-06, - "loss": 0.8013, - "step": 26650 - }, - { - "epoch": 0.68, - "learning_rate": 1.8019364975352797e-06, - "loss": 1.0654, - "step": 26651 - }, - { - "epoch": 0.68, - "learning_rate": 1.8019199666421984e-06, - "loss": 0.958, - "step": 26652 - }, - { - "epoch": 0.68, - "learning_rate": 1.8019034351351237e-06, - "loss": 0.6455, - "step": 26653 - }, - { - "epoch": 0.68, - "learning_rate": 1.8018869030140685e-06, - "loss": 0.8746, - "step": 26654 - }, - { - "epoch": 0.68, - "learning_rate": 1.8018703702790452e-06, - "loss": 0.812, - "step": 26655 - }, - { - "epoch": 0.68, - "learning_rate": 1.8018538369300666e-06, - "loss": 0.8721, - "step": 26656 - }, - { - "epoch": 0.68, - "learning_rate": 1.8018373029671454e-06, - "loss": 0.9209, - "step": 26657 - }, - { - "epoch": 0.68, - "learning_rate": 1.8018207683902946e-06, - "loss": 0.874, - "step": 26658 - }, - { - "epoch": 0.68, - "learning_rate": 1.801804233199526e-06, - "loss": 0.6738, - "step": 26659 - }, - { - "epoch": 0.68, - "learning_rate": 1.801787697394853e-06, - "loss": 0.7334, - "step": 26660 - }, - { - "epoch": 0.68, - "learning_rate": 1.8017711609762883e-06, - "loss": 0.5825, - "step": 26661 - }, - { - "epoch": 0.68, - "learning_rate": 1.8017546239438438e-06, - "loss": 0.8003, - "step": 26662 - }, - { - "epoch": 0.68, - "learning_rate": 1.801738086297533e-06, - "loss": 0.793, - "step": 26663 - }, - { - "epoch": 0.68, - "learning_rate": 1.801721548037368e-06, - "loss": 1.0146, - "step": 26664 - }, - { - "epoch": 0.68, - "learning_rate": 1.8017050091633616e-06, - "loss": 0.6589, - "step": 26665 - }, - { - "epoch": 0.68, - "learning_rate": 1.8016884696755268e-06, - "loss": 0.9268, - "step": 26666 - }, - { - "epoch": 0.68, - "learning_rate": 1.801671929573876e-06, - "loss": 0.8838, - "step": 26667 - }, - { - "epoch": 0.68, - "learning_rate": 1.8016553888584217e-06, - "loss": 0.7236, - "step": 26668 - }, - { - "epoch": 0.68, - "learning_rate": 1.8016388475291769e-06, - "loss": 0.9648, - "step": 26669 - }, - { - "epoch": 0.68, - "learning_rate": 1.8016223055861542e-06, - "loss": 0.9766, - "step": 26670 - }, - { - "epoch": 0.68, - "learning_rate": 1.8016057630293657e-06, - "loss": 0.8208, - "step": 26671 - }, - { - "epoch": 0.68, - "learning_rate": 1.8015892198588247e-06, - "loss": 0.9224, - "step": 26672 - }, - { - "epoch": 0.68, - "learning_rate": 1.801572676074544e-06, - "loss": 0.8389, - "step": 26673 - }, - { - "epoch": 0.68, - "learning_rate": 1.8015561316765356e-06, - "loss": 0.6396, - "step": 26674 - }, - { - "epoch": 0.68, - "learning_rate": 1.8015395866648127e-06, - "loss": 0.7109, - "step": 26675 - }, - { - "epoch": 0.68, - "learning_rate": 1.8015230410393877e-06, - "loss": 0.748, - "step": 26676 - }, - { - "epoch": 0.68, - "learning_rate": 1.8015064948002734e-06, - "loss": 0.5356, - "step": 26677 - }, - { - "epoch": 0.68, - "learning_rate": 1.8014899479474825e-06, - "loss": 0.7139, - "step": 26678 - }, - { - "epoch": 0.68, - "learning_rate": 1.8014734004810276e-06, - "loss": 1.04, - "step": 26679 - }, - { - "epoch": 0.68, - "learning_rate": 1.8014568524009212e-06, - "loss": 0.7861, - "step": 26680 - }, - { - "epoch": 0.68, - "learning_rate": 1.8014403037071764e-06, - "loss": 0.9443, - "step": 26681 - }, - { - "epoch": 0.68, - "learning_rate": 1.8014237543998055e-06, - "loss": 0.9932, - "step": 26682 - }, - { - "epoch": 0.68, - "learning_rate": 1.801407204478821e-06, - "loss": 0.7236, - "step": 26683 - }, - { - "epoch": 0.68, - "learning_rate": 1.8013906539442362e-06, - "loss": 0.7686, - "step": 26684 - }, - { - "epoch": 0.68, - "learning_rate": 1.8013741027960635e-06, - "loss": 0.8369, - "step": 26685 - }, - { - "epoch": 0.68, - "learning_rate": 1.8013575510343153e-06, - "loss": 0.8972, - "step": 26686 - }, - { - "epoch": 0.68, - "learning_rate": 1.8013409986590044e-06, - "loss": 0.8232, - "step": 26687 - }, - { - "epoch": 0.68, - "learning_rate": 1.8013244456701435e-06, - "loss": 0.9561, - "step": 26688 - }, - { - "epoch": 0.68, - "learning_rate": 1.8013078920677455e-06, - "loss": 0.8359, - "step": 26689 - }, - { - "epoch": 0.68, - "learning_rate": 1.801291337851823e-06, - "loss": 0.9473, - "step": 26690 - }, - { - "epoch": 0.68, - "learning_rate": 1.8012747830223885e-06, - "loss": 1.0068, - "step": 26691 - }, - { - "epoch": 0.68, - "learning_rate": 1.8012582275794546e-06, - "loss": 0.9424, - "step": 26692 - }, - { - "epoch": 0.68, - "learning_rate": 1.801241671523034e-06, - "loss": 1.0107, - "step": 26693 - }, - { - "epoch": 0.68, - "learning_rate": 1.80122511485314e-06, - "loss": 0.9443, - "step": 26694 - }, - { - "epoch": 0.68, - "learning_rate": 1.8012085575697845e-06, - "loss": 1.0439, - "step": 26695 - }, - { - "epoch": 0.68, - "learning_rate": 1.80119199967298e-06, - "loss": 0.874, - "step": 26696 - }, - { - "epoch": 0.68, - "learning_rate": 1.8011754411627402e-06, - "loss": 1.0723, - "step": 26697 - }, - { - "epoch": 0.68, - "learning_rate": 1.801158882039077e-06, - "loss": 0.7764, - "step": 26698 - }, - { - "epoch": 0.68, - "learning_rate": 1.8011423223020032e-06, - "loss": 0.8477, - "step": 26699 - }, - { - "epoch": 0.68, - "learning_rate": 1.8011257619515318e-06, - "loss": 0.7612, - "step": 26700 - }, - { - "epoch": 0.68, - "learning_rate": 1.801109200987675e-06, - "loss": 0.8604, - "step": 26701 - }, - { - "epoch": 0.68, - "learning_rate": 1.801092639410446e-06, - "loss": 0.876, - "step": 26702 - }, - { - "epoch": 0.68, - "learning_rate": 1.8010760772198569e-06, - "loss": 0.8418, - "step": 26703 - }, - { - "epoch": 0.68, - "learning_rate": 1.8010595144159208e-06, - "loss": 0.7402, - "step": 26704 - }, - { - "epoch": 0.68, - "learning_rate": 1.8010429509986503e-06, - "loss": 0.7183, - "step": 26705 - }, - { - "epoch": 0.68, - "learning_rate": 1.801026386968058e-06, - "loss": 1.0635, - "step": 26706 - }, - { - "epoch": 0.68, - "learning_rate": 1.8010098223241568e-06, - "loss": 0.7241, - "step": 26707 - }, - { - "epoch": 0.68, - "learning_rate": 1.8009932570669588e-06, - "loss": 0.9727, - "step": 26708 - }, - { - "epoch": 0.68, - "learning_rate": 1.8009766911964772e-06, - "loss": 0.9502, - "step": 26709 - }, - { - "epoch": 0.68, - "learning_rate": 1.8009601247127248e-06, - "loss": 0.8921, - "step": 26710 - }, - { - "epoch": 0.68, - "learning_rate": 1.800943557615714e-06, - "loss": 0.8545, - "step": 26711 - }, - { - "epoch": 0.68, - "learning_rate": 1.8009269899054576e-06, - "loss": 0.873, - "step": 26712 - }, - { - "epoch": 0.68, - "learning_rate": 1.8009104215819684e-06, - "loss": 0.8359, - "step": 26713 - }, - { - "epoch": 0.68, - "learning_rate": 1.8008938526452586e-06, - "loss": 0.999, - "step": 26714 - }, - { - "epoch": 0.68, - "learning_rate": 1.8008772830953412e-06, - "loss": 0.8975, - "step": 26715 - }, - { - "epoch": 0.68, - "learning_rate": 1.8008607129322288e-06, - "loss": 0.8667, - "step": 26716 - }, - { - "epoch": 0.68, - "learning_rate": 1.8008441421559345e-06, - "loss": 0.8721, - "step": 26717 - }, - { - "epoch": 0.68, - "learning_rate": 1.8008275707664704e-06, - "loss": 0.7705, - "step": 26718 - }, - { - "epoch": 0.68, - "learning_rate": 1.8008109987638495e-06, - "loss": 0.8838, - "step": 26719 - }, - { - "epoch": 0.68, - "learning_rate": 1.8007944261480847e-06, - "loss": 1.0303, - "step": 26720 - }, - { - "epoch": 0.68, - "learning_rate": 1.8007778529191882e-06, - "loss": 0.8877, - "step": 26721 - }, - { - "epoch": 0.68, - "learning_rate": 1.800761279077173e-06, - "loss": 0.9639, - "step": 26722 - }, - { - "epoch": 0.68, - "learning_rate": 1.8007447046220516e-06, - "loss": 1.0488, - "step": 26723 - }, - { - "epoch": 0.68, - "learning_rate": 1.8007281295538368e-06, - "loss": 0.9561, - "step": 26724 - }, - { - "epoch": 0.68, - "learning_rate": 1.8007115538725416e-06, - "loss": 0.8575, - "step": 26725 - }, - { - "epoch": 0.69, - "learning_rate": 1.8006949775781782e-06, - "loss": 0.8047, - "step": 26726 - }, - { - "epoch": 0.69, - "learning_rate": 1.8006784006707592e-06, - "loss": 0.8701, - "step": 26727 - }, - { - "epoch": 0.69, - "learning_rate": 1.8006618231502978e-06, - "loss": 0.8428, - "step": 26728 - }, - { - "epoch": 0.69, - "learning_rate": 1.8006452450168065e-06, - "loss": 1.0518, - "step": 26729 - }, - { - "epoch": 0.69, - "learning_rate": 1.800628666270298e-06, - "loss": 0.8281, - "step": 26730 - }, - { - "epoch": 0.69, - "learning_rate": 1.8006120869107846e-06, - "loss": 1.1143, - "step": 26731 - }, - { - "epoch": 0.69, - "learning_rate": 1.8005955069382798e-06, - "loss": 0.6143, - "step": 26732 - }, - { - "epoch": 0.69, - "learning_rate": 1.8005789263527955e-06, - "loss": 1.0088, - "step": 26733 - }, - { - "epoch": 0.69, - "learning_rate": 1.8005623451543447e-06, - "loss": 0.9092, - "step": 26734 - }, - { - "epoch": 0.69, - "learning_rate": 1.8005457633429404e-06, - "loss": 0.9277, - "step": 26735 - }, - { - "epoch": 0.69, - "learning_rate": 1.8005291809185947e-06, - "loss": 0.8037, - "step": 26736 - }, - { - "epoch": 0.69, - "learning_rate": 1.8005125978813206e-06, - "loss": 0.9707, - "step": 26737 - }, - { - "epoch": 0.69, - "learning_rate": 1.8004960142311313e-06, - "loss": 0.5767, - "step": 26738 - }, - { - "epoch": 0.69, - "learning_rate": 1.8004794299680386e-06, - "loss": 0.9099, - "step": 26739 - }, - { - "epoch": 0.69, - "learning_rate": 1.8004628450920557e-06, - "loss": 0.9761, - "step": 26740 - }, - { - "epoch": 0.69, - "learning_rate": 1.8004462596031954e-06, - "loss": 0.7598, - "step": 26741 - }, - { - "epoch": 0.69, - "learning_rate": 1.8004296735014699e-06, - "loss": 0.7607, - "step": 26742 - }, - { - "epoch": 0.69, - "learning_rate": 1.8004130867868923e-06, - "loss": 0.8994, - "step": 26743 - }, - { - "epoch": 0.69, - "learning_rate": 1.8003964994594752e-06, - "loss": 0.7871, - "step": 26744 - }, - { - "epoch": 0.69, - "learning_rate": 1.8003799115192314e-06, - "loss": 0.9609, - "step": 26745 - }, - { - "epoch": 0.69, - "learning_rate": 1.8003633229661735e-06, - "loss": 0.7539, - "step": 26746 - }, - { - "epoch": 0.69, - "learning_rate": 1.800346733800314e-06, - "loss": 0.8203, - "step": 26747 - }, - { - "epoch": 0.69, - "learning_rate": 1.800330144021666e-06, - "loss": 0.8018, - "step": 26748 - }, - { - "epoch": 0.69, - "learning_rate": 1.8003135536302421e-06, - "loss": 0.7534, - "step": 26749 - }, - { - "epoch": 0.69, - "learning_rate": 1.8002969626260547e-06, - "loss": 0.7339, - "step": 26750 - }, - { - "epoch": 0.69, - "learning_rate": 1.8002803710091166e-06, - "loss": 0.999, - "step": 26751 - }, - { - "epoch": 0.69, - "learning_rate": 1.800263778779441e-06, - "loss": 1.043, - "step": 26752 - }, - { - "epoch": 0.69, - "learning_rate": 1.80024718593704e-06, - "loss": 0.9922, - "step": 26753 - }, - { - "epoch": 0.69, - "learning_rate": 1.8002305924819265e-06, - "loss": 0.6807, - "step": 26754 - }, - { - "epoch": 0.69, - "learning_rate": 1.8002139984141135e-06, - "loss": 0.7021, - "step": 26755 - }, - { - "epoch": 0.69, - "learning_rate": 1.800197403733613e-06, - "loss": 0.7607, - "step": 26756 - }, - { - "epoch": 0.69, - "learning_rate": 1.8001808084404383e-06, - "loss": 1.0488, - "step": 26757 - }, - { - "epoch": 0.69, - "learning_rate": 1.800164212534602e-06, - "loss": 0.5344, - "step": 26758 - }, - { - "epoch": 0.69, - "learning_rate": 1.8001476160161166e-06, - "loss": 0.8467, - "step": 26759 - }, - { - "epoch": 0.69, - "learning_rate": 1.8001310188849953e-06, - "loss": 0.7583, - "step": 26760 - }, - { - "epoch": 0.69, - "learning_rate": 1.8001144211412504e-06, - "loss": 0.8018, - "step": 26761 - }, - { - "epoch": 0.69, - "learning_rate": 1.8000978227848945e-06, - "loss": 1.0205, - "step": 26762 - }, - { - "epoch": 0.69, - "learning_rate": 1.8000812238159404e-06, - "loss": 1.001, - "step": 26763 - }, - { - "epoch": 0.69, - "learning_rate": 1.8000646242344013e-06, - "loss": 0.9697, - "step": 26764 - }, - { - "epoch": 0.69, - "learning_rate": 1.8000480240402892e-06, - "loss": 1.0449, - "step": 26765 - }, - { - "epoch": 0.69, - "learning_rate": 1.800031423233617e-06, - "loss": 0.8867, - "step": 26766 - }, - { - "epoch": 0.69, - "learning_rate": 1.8000148218143978e-06, - "loss": 0.8604, - "step": 26767 - }, - { - "epoch": 0.69, - "learning_rate": 1.799998219782644e-06, - "loss": 0.6729, - "step": 26768 - }, - { - "epoch": 0.69, - "learning_rate": 1.7999816171383682e-06, - "loss": 1.0283, - "step": 26769 - }, - { - "epoch": 0.69, - "learning_rate": 1.7999650138815834e-06, - "loss": 0.6274, - "step": 26770 - }, - { - "epoch": 0.69, - "learning_rate": 1.799948410012302e-06, - "loss": 0.6299, - "step": 26771 - }, - { - "epoch": 0.69, - "learning_rate": 1.799931805530537e-06, - "loss": 0.8926, - "step": 26772 - }, - { - "epoch": 0.69, - "learning_rate": 1.7999152004363012e-06, - "loss": 0.7568, - "step": 26773 - }, - { - "epoch": 0.69, - "learning_rate": 1.7998985947296068e-06, - "loss": 1.1191, - "step": 26774 - }, - { - "epoch": 0.69, - "learning_rate": 1.7998819884104669e-06, - "loss": 0.7808, - "step": 26775 - }, - { - "epoch": 0.69, - "learning_rate": 1.7998653814788942e-06, - "loss": 0.835, - "step": 26776 - }, - { - "epoch": 0.69, - "learning_rate": 1.7998487739349013e-06, - "loss": 0.918, - "step": 26777 - }, - { - "epoch": 0.69, - "learning_rate": 1.799832165778501e-06, - "loss": 0.8848, - "step": 26778 - }, - { - "epoch": 0.69, - "learning_rate": 1.799815557009706e-06, - "loss": 0.7112, - "step": 26779 - }, - { - "epoch": 0.69, - "learning_rate": 1.799798947628529e-06, - "loss": 1.0391, - "step": 26780 - }, - { - "epoch": 0.69, - "learning_rate": 1.7997823376349828e-06, - "loss": 0.9189, - "step": 26781 - }, - { - "epoch": 0.69, - "learning_rate": 1.79976572702908e-06, - "loss": 0.9932, - "step": 26782 - }, - { - "epoch": 0.69, - "learning_rate": 1.7997491158108332e-06, - "loss": 0.8652, - "step": 26783 - }, - { - "epoch": 0.69, - "learning_rate": 1.7997325039802553e-06, - "loss": 0.9053, - "step": 26784 - }, - { - "epoch": 0.69, - "learning_rate": 1.7997158915373594e-06, - "loss": 0.7559, - "step": 26785 - }, - { - "epoch": 0.69, - "learning_rate": 1.7996992784821572e-06, - "loss": 0.7388, - "step": 26786 - }, - { - "epoch": 0.69, - "learning_rate": 1.7996826648146626e-06, - "loss": 0.8486, - "step": 26787 - }, - { - "epoch": 0.69, - "learning_rate": 1.7996660505348873e-06, - "loss": 0.9268, - "step": 26788 - }, - { - "epoch": 0.69, - "learning_rate": 1.7996494356428446e-06, - "loss": 0.7588, - "step": 26789 - }, - { - "epoch": 0.69, - "learning_rate": 1.7996328201385472e-06, - "loss": 0.7783, - "step": 26790 - }, - { - "epoch": 0.69, - "learning_rate": 1.7996162040220078e-06, - "loss": 0.9365, - "step": 26791 - }, - { - "epoch": 0.69, - "learning_rate": 1.7995995872932388e-06, - "loss": 0.8125, - "step": 26792 - }, - { - "epoch": 0.69, - "learning_rate": 1.7995829699522533e-06, - "loss": 0.8081, - "step": 26793 - }, - { - "epoch": 0.69, - "learning_rate": 1.799566351999064e-06, - "loss": 0.9004, - "step": 26794 - }, - { - "epoch": 0.69, - "learning_rate": 1.7995497334336834e-06, - "loss": 0.8994, - "step": 26795 - }, - { - "epoch": 0.69, - "learning_rate": 1.7995331142561243e-06, - "loss": 0.8501, - "step": 26796 - }, - { - "epoch": 0.69, - "learning_rate": 1.7995164944663994e-06, - "loss": 0.8994, - "step": 26797 - }, - { - "epoch": 0.69, - "learning_rate": 1.7994998740645215e-06, - "loss": 0.8379, - "step": 26798 - }, - { - "epoch": 0.69, - "learning_rate": 1.7994832530505033e-06, - "loss": 0.7344, - "step": 26799 - }, - { - "epoch": 0.69, - "learning_rate": 1.7994666314243576e-06, - "loss": 0.8457, - "step": 26800 - }, - { - "epoch": 0.69, - "learning_rate": 1.7994500091860969e-06, - "loss": 0.7734, - "step": 26801 - }, - { - "epoch": 0.69, - "learning_rate": 1.7994333863357345e-06, - "loss": 0.9346, - "step": 26802 - }, - { - "epoch": 0.69, - "learning_rate": 1.7994167628732824e-06, - "loss": 0.7314, - "step": 26803 - }, - { - "epoch": 0.69, - "learning_rate": 1.7994001387987537e-06, - "loss": 0.9238, - "step": 26804 - }, - { - "epoch": 0.69, - "learning_rate": 1.799383514112161e-06, - "loss": 0.7734, - "step": 26805 - }, - { - "epoch": 0.69, - "learning_rate": 1.7993668888135172e-06, - "loss": 0.7944, - "step": 26806 - }, - { - "epoch": 0.69, - "learning_rate": 1.799350262902835e-06, - "loss": 0.8125, - "step": 26807 - }, - { - "epoch": 0.69, - "learning_rate": 1.799333636380127e-06, - "loss": 0.8496, - "step": 26808 - }, - { - "epoch": 0.69, - "learning_rate": 1.7993170092454058e-06, - "loss": 0.7178, - "step": 26809 - }, - { - "epoch": 0.69, - "learning_rate": 1.7993003814986844e-06, - "loss": 0.8916, - "step": 26810 - }, - { - "epoch": 0.69, - "learning_rate": 1.7992837531399757e-06, - "loss": 0.8242, - "step": 26811 - }, - { - "epoch": 0.69, - "learning_rate": 1.799267124169292e-06, - "loss": 0.5588, - "step": 26812 - }, - { - "epoch": 0.69, - "learning_rate": 1.799250494586646e-06, - "loss": 1.0801, - "step": 26813 - }, - { - "epoch": 0.69, - "learning_rate": 1.7992338643920508e-06, - "loss": 0.7959, - "step": 26814 - }, - { - "epoch": 0.69, - "learning_rate": 1.7992172335855194e-06, - "loss": 1.0088, - "step": 26815 - }, - { - "epoch": 0.69, - "learning_rate": 1.7992006021670636e-06, - "loss": 0.6978, - "step": 26816 - }, - { - "epoch": 0.69, - "learning_rate": 1.7991839701366969e-06, - "loss": 0.959, - "step": 26817 - }, - { - "epoch": 0.69, - "learning_rate": 1.7991673374944316e-06, - "loss": 0.6069, - "step": 26818 - }, - { - "epoch": 0.69, - "learning_rate": 1.7991507042402808e-06, - "loss": 0.771, - "step": 26819 - }, - { - "epoch": 0.69, - "learning_rate": 1.7991340703742566e-06, - "loss": 0.7549, - "step": 26820 - }, - { - "epoch": 0.69, - "learning_rate": 1.7991174358963725e-06, - "loss": 0.7705, - "step": 26821 - }, - { - "epoch": 0.69, - "learning_rate": 1.7991008008066411e-06, - "loss": 0.6062, - "step": 26822 - }, - { - "epoch": 0.69, - "learning_rate": 1.799084165105075e-06, - "loss": 1.1152, - "step": 26823 - }, - { - "epoch": 0.69, - "learning_rate": 1.7990675287916866e-06, - "loss": 0.7915, - "step": 26824 - }, - { - "epoch": 0.69, - "learning_rate": 1.799050891866489e-06, - "loss": 0.8379, - "step": 26825 - }, - { - "epoch": 0.69, - "learning_rate": 1.799034254329495e-06, - "loss": 0.748, - "step": 26826 - }, - { - "epoch": 0.69, - "learning_rate": 1.799017616180717e-06, - "loss": 0.7461, - "step": 26827 - }, - { - "epoch": 0.69, - "learning_rate": 1.7990009774201683e-06, - "loss": 0.9492, - "step": 26828 - }, - { - "epoch": 0.69, - "learning_rate": 1.798984338047861e-06, - "loss": 0.874, - "step": 26829 - }, - { - "epoch": 0.69, - "learning_rate": 1.7989676980638082e-06, - "loss": 0.7188, - "step": 26830 - }, - { - "epoch": 0.69, - "learning_rate": 1.7989510574680224e-06, - "loss": 0.8135, - "step": 26831 - }, - { - "epoch": 0.69, - "learning_rate": 1.7989344162605168e-06, - "loss": 0.9648, - "step": 26832 - }, - { - "epoch": 0.69, - "learning_rate": 1.7989177744413037e-06, - "loss": 0.9961, - "step": 26833 - }, - { - "epoch": 0.69, - "learning_rate": 1.7989011320103962e-06, - "loss": 0.8271, - "step": 26834 - }, - { - "epoch": 0.69, - "learning_rate": 1.7988844889678068e-06, - "loss": 1.0176, - "step": 26835 - }, - { - "epoch": 0.69, - "learning_rate": 1.7988678453135479e-06, - "loss": 0.8955, - "step": 26836 - }, - { - "epoch": 0.69, - "learning_rate": 1.798851201047633e-06, - "loss": 0.8169, - "step": 26837 - }, - { - "epoch": 0.69, - "learning_rate": 1.798834556170074e-06, - "loss": 0.9189, - "step": 26838 - }, - { - "epoch": 0.69, - "learning_rate": 1.7988179106808847e-06, - "loss": 0.9873, - "step": 26839 - }, - { - "epoch": 0.69, - "learning_rate": 1.798801264580077e-06, - "loss": 0.655, - "step": 26840 - }, - { - "epoch": 0.69, - "learning_rate": 1.798784617867664e-06, - "loss": 0.8145, - "step": 26841 - }, - { - "epoch": 0.69, - "learning_rate": 1.7987679705436583e-06, - "loss": 1.0161, - "step": 26842 - }, - { - "epoch": 0.69, - "learning_rate": 1.7987513226080725e-06, - "loss": 0.6978, - "step": 26843 - }, - { - "epoch": 0.69, - "learning_rate": 1.7987346740609197e-06, - "loss": 0.748, - "step": 26844 - }, - { - "epoch": 0.69, - "learning_rate": 1.7987180249022127e-06, - "loss": 0.8564, - "step": 26845 - }, - { - "epoch": 0.69, - "learning_rate": 1.7987013751319638e-06, - "loss": 0.6763, - "step": 26846 - }, - { - "epoch": 0.69, - "learning_rate": 1.798684724750186e-06, - "loss": 0.8213, - "step": 26847 - }, - { - "epoch": 0.69, - "learning_rate": 1.798668073756892e-06, - "loss": 0.5027, - "step": 26848 - }, - { - "epoch": 0.69, - "learning_rate": 1.7986514221520945e-06, - "loss": 0.9385, - "step": 26849 - }, - { - "epoch": 0.69, - "learning_rate": 1.7986347699358065e-06, - "loss": 0.9355, - "step": 26850 - }, - { - "epoch": 0.69, - "learning_rate": 1.7986181171080405e-06, - "loss": 0.958, - "step": 26851 - }, - { - "epoch": 0.69, - "learning_rate": 1.7986014636688093e-06, - "loss": 0.8682, - "step": 26852 - }, - { - "epoch": 0.69, - "learning_rate": 1.7985848096181258e-06, - "loss": 0.8306, - "step": 26853 - }, - { - "epoch": 0.69, - "learning_rate": 1.7985681549560026e-06, - "loss": 0.8867, - "step": 26854 - }, - { - "epoch": 0.69, - "learning_rate": 1.7985514996824525e-06, - "loss": 0.9434, - "step": 26855 - }, - { - "epoch": 0.69, - "learning_rate": 1.7985348437974882e-06, - "loss": 0.7617, - "step": 26856 - }, - { - "epoch": 0.69, - "learning_rate": 1.7985181873011226e-06, - "loss": 0.8789, - "step": 26857 - }, - { - "epoch": 0.69, - "learning_rate": 1.7985015301933682e-06, - "loss": 0.8203, - "step": 26858 - }, - { - "epoch": 0.69, - "learning_rate": 1.7984848724742379e-06, - "loss": 1.1396, - "step": 26859 - }, - { - "epoch": 0.69, - "learning_rate": 1.7984682141437442e-06, - "loss": 1.0557, - "step": 26860 - }, - { - "epoch": 0.69, - "learning_rate": 1.7984515552019004e-06, - "loss": 0.9219, - "step": 26861 - }, - { - "epoch": 0.69, - "learning_rate": 1.7984348956487189e-06, - "loss": 0.6011, - "step": 26862 - }, - { - "epoch": 0.69, - "learning_rate": 1.7984182354842125e-06, - "loss": 1.0547, - "step": 26863 - }, - { - "epoch": 0.69, - "learning_rate": 1.798401574708394e-06, - "loss": 0.4355, - "step": 26864 - }, - { - "epoch": 0.69, - "learning_rate": 1.7983849133212762e-06, - "loss": 0.9619, - "step": 26865 - }, - { - "epoch": 0.69, - "learning_rate": 1.7983682513228717e-06, - "loss": 0.8877, - "step": 26866 - }, - { - "epoch": 0.69, - "learning_rate": 1.7983515887131934e-06, - "loss": 0.8975, - "step": 26867 - }, - { - "epoch": 0.69, - "learning_rate": 1.798334925492254e-06, - "loss": 0.8545, - "step": 26868 - }, - { - "epoch": 0.69, - "learning_rate": 1.7983182616600662e-06, - "loss": 1.0586, - "step": 26869 - }, - { - "epoch": 0.69, - "learning_rate": 1.7983015972166426e-06, - "loss": 0.9297, - "step": 26870 - }, - { - "epoch": 0.69, - "learning_rate": 1.7982849321619963e-06, - "loss": 1.0479, - "step": 26871 - }, - { - "epoch": 0.69, - "learning_rate": 1.79826826649614e-06, - "loss": 0.8975, - "step": 26872 - }, - { - "epoch": 0.69, - "learning_rate": 1.7982516002190865e-06, - "loss": 0.876, - "step": 26873 - }, - { - "epoch": 0.69, - "learning_rate": 1.7982349333308485e-06, - "loss": 0.7876, - "step": 26874 - }, - { - "epoch": 0.69, - "learning_rate": 1.7982182658314385e-06, - "loss": 0.9795, - "step": 26875 - }, - { - "epoch": 0.69, - "learning_rate": 1.7982015977208695e-06, - "loss": 0.6941, - "step": 26876 - }, - { - "epoch": 0.69, - "learning_rate": 1.7981849289991545e-06, - "loss": 0.9761, - "step": 26877 - }, - { - "epoch": 0.69, - "learning_rate": 1.7981682596663057e-06, - "loss": 0.8535, - "step": 26878 - }, - { - "epoch": 0.69, - "learning_rate": 1.7981515897223362e-06, - "loss": 0.5573, - "step": 26879 - }, - { - "epoch": 0.69, - "learning_rate": 1.7981349191672589e-06, - "loss": 0.8276, - "step": 26880 - }, - { - "epoch": 0.69, - "learning_rate": 1.7981182480010864e-06, - "loss": 0.876, - "step": 26881 - }, - { - "epoch": 0.69, - "learning_rate": 1.7981015762238312e-06, - "loss": 0.9131, - "step": 26882 - }, - { - "epoch": 0.69, - "learning_rate": 1.7980849038355067e-06, - "loss": 0.7739, - "step": 26883 - }, - { - "epoch": 0.69, - "learning_rate": 1.7980682308361248e-06, - "loss": 0.96, - "step": 26884 - }, - { - "epoch": 0.69, - "learning_rate": 1.7980515572256988e-06, - "loss": 0.687, - "step": 26885 - }, - { - "epoch": 0.69, - "learning_rate": 1.7980348830042417e-06, - "loss": 0.7891, - "step": 26886 - }, - { - "epoch": 0.69, - "learning_rate": 1.798018208171766e-06, - "loss": 0.7393, - "step": 26887 - }, - { - "epoch": 0.69, - "learning_rate": 1.7980015327282843e-06, - "loss": 0.7031, - "step": 26888 - }, - { - "epoch": 0.69, - "learning_rate": 1.7979848566738095e-06, - "loss": 0.9688, - "step": 26889 - }, - { - "epoch": 0.69, - "learning_rate": 1.7979681800083547e-06, - "loss": 0.8662, - "step": 26890 - }, - { - "epoch": 0.69, - "learning_rate": 1.7979515027319318e-06, - "loss": 0.7373, - "step": 26891 - }, - { - "epoch": 0.69, - "learning_rate": 1.7979348248445544e-06, - "loss": 0.9424, - "step": 26892 - }, - { - "epoch": 0.69, - "learning_rate": 1.7979181463462352e-06, - "loss": 0.9375, - "step": 26893 - }, - { - "epoch": 0.69, - "learning_rate": 1.7979014672369868e-06, - "loss": 0.6829, - "step": 26894 - }, - { - "epoch": 0.69, - "learning_rate": 1.7978847875168218e-06, - "loss": 0.9629, - "step": 26895 - }, - { - "epoch": 0.69, - "learning_rate": 1.7978681071857528e-06, - "loss": 1.0615, - "step": 26896 - }, - { - "epoch": 0.69, - "learning_rate": 1.7978514262437932e-06, - "loss": 0.9639, - "step": 26897 - }, - { - "epoch": 0.69, - "learning_rate": 1.7978347446909555e-06, - "loss": 0.8545, - "step": 26898 - }, - { - "epoch": 0.69, - "learning_rate": 1.797818062527252e-06, - "loss": 0.8799, - "step": 26899 - }, - { - "epoch": 0.69, - "learning_rate": 1.7978013797526963e-06, - "loss": 0.7285, - "step": 26900 - }, - { - "epoch": 0.69, - "learning_rate": 1.7977846963673007e-06, - "loss": 0.7319, - "step": 26901 - }, - { - "epoch": 0.69, - "learning_rate": 1.797768012371078e-06, - "loss": 0.7041, - "step": 26902 - }, - { - "epoch": 0.69, - "learning_rate": 1.797751327764041e-06, - "loss": 1.0605, - "step": 26903 - }, - { - "epoch": 0.69, - "learning_rate": 1.7977346425462025e-06, - "loss": 1.0146, - "step": 26904 - }, - { - "epoch": 0.69, - "learning_rate": 1.7977179567175753e-06, - "loss": 1.0059, - "step": 26905 - }, - { - "epoch": 0.69, - "learning_rate": 1.7977012702781723e-06, - "loss": 1.0781, - "step": 26906 - }, - { - "epoch": 0.69, - "learning_rate": 1.7976845832280056e-06, - "loss": 0.9922, - "step": 26907 - }, - { - "epoch": 0.69, - "learning_rate": 1.797667895567089e-06, - "loss": 0.8291, - "step": 26908 - }, - { - "epoch": 0.69, - "learning_rate": 1.7976512072954344e-06, - "loss": 0.8921, - "step": 26909 - }, - { - "epoch": 0.69, - "learning_rate": 1.797634518413055e-06, - "loss": 0.9668, - "step": 26910 - }, - { - "epoch": 0.69, - "learning_rate": 1.797617828919964e-06, - "loss": 0.5967, - "step": 26911 - }, - { - "epoch": 0.69, - "learning_rate": 1.797601138816173e-06, - "loss": 0.793, - "step": 26912 - }, - { - "epoch": 0.69, - "learning_rate": 1.797584448101696e-06, - "loss": 1.1611, - "step": 26913 - }, - { - "epoch": 0.69, - "learning_rate": 1.797567756776545e-06, - "loss": 1.1133, - "step": 26914 - }, - { - "epoch": 0.69, - "learning_rate": 1.7975510648407332e-06, - "loss": 0.9512, - "step": 26915 - }, - { - "epoch": 0.69, - "learning_rate": 1.7975343722942733e-06, - "loss": 0.6719, - "step": 26916 - }, - { - "epoch": 0.69, - "learning_rate": 1.797517679137178e-06, - "loss": 0.8081, - "step": 26917 - }, - { - "epoch": 0.69, - "learning_rate": 1.7975009853694597e-06, - "loss": 0.8965, - "step": 26918 - }, - { - "epoch": 0.69, - "learning_rate": 1.7974842909911318e-06, - "loss": 0.8633, - "step": 26919 - }, - { - "epoch": 0.69, - "learning_rate": 1.797467596002207e-06, - "loss": 0.9463, - "step": 26920 - }, - { - "epoch": 0.69, - "learning_rate": 1.7974509004026976e-06, - "loss": 0.7915, - "step": 26921 - }, - { - "epoch": 0.69, - "learning_rate": 1.7974342041926171e-06, - "loss": 0.8574, - "step": 26922 - }, - { - "epoch": 0.69, - "learning_rate": 1.7974175073719777e-06, - "loss": 0.707, - "step": 26923 - }, - { - "epoch": 0.69, - "learning_rate": 1.7974008099407923e-06, - "loss": 0.6226, - "step": 26924 - }, - { - "epoch": 0.69, - "learning_rate": 1.797384111899074e-06, - "loss": 0.8159, - "step": 26925 - }, - { - "epoch": 0.69, - "learning_rate": 1.7973674132468353e-06, - "loss": 0.9141, - "step": 26926 - }, - { - "epoch": 0.69, - "learning_rate": 1.7973507139840888e-06, - "loss": 1.0273, - "step": 26927 - }, - { - "epoch": 0.69, - "learning_rate": 1.7973340141108477e-06, - "loss": 0.7969, - "step": 26928 - }, - { - "epoch": 0.69, - "learning_rate": 1.7973173136271245e-06, - "loss": 0.7959, - "step": 26929 - }, - { - "epoch": 0.69, - "learning_rate": 1.7973006125329322e-06, - "loss": 0.8799, - "step": 26930 - }, - { - "epoch": 0.69, - "learning_rate": 1.7972839108282837e-06, - "loss": 0.8623, - "step": 26931 - }, - { - "epoch": 0.69, - "learning_rate": 1.797267208513191e-06, - "loss": 0.7866, - "step": 26932 - }, - { - "epoch": 0.69, - "learning_rate": 1.7972505055876677e-06, - "loss": 0.814, - "step": 26933 - }, - { - "epoch": 0.69, - "learning_rate": 1.7972338020517265e-06, - "loss": 0.6987, - "step": 26934 - }, - { - "epoch": 0.69, - "learning_rate": 1.79721709790538e-06, - "loss": 0.5674, - "step": 26935 - }, - { - "epoch": 0.69, - "learning_rate": 1.7972003931486407e-06, - "loss": 0.8887, - "step": 26936 - }, - { - "epoch": 0.69, - "learning_rate": 1.7971836877815223e-06, - "loss": 0.8223, - "step": 26937 - }, - { - "epoch": 0.69, - "learning_rate": 1.7971669818040364e-06, - "loss": 0.8787, - "step": 26938 - }, - { - "epoch": 0.69, - "learning_rate": 1.797150275216197e-06, - "loss": 0.7085, - "step": 26939 - }, - { - "epoch": 0.69, - "learning_rate": 1.7971335680180159e-06, - "loss": 0.9277, - "step": 26940 - }, - { - "epoch": 0.69, - "learning_rate": 1.7971168602095063e-06, - "loss": 0.875, - "step": 26941 - }, - { - "epoch": 0.69, - "learning_rate": 1.7971001517906813e-06, - "loss": 0.7207, - "step": 26942 - }, - { - "epoch": 0.69, - "learning_rate": 1.797083442761553e-06, - "loss": 0.8252, - "step": 26943 - }, - { - "epoch": 0.69, - "learning_rate": 1.7970667331221346e-06, - "loss": 0.6284, - "step": 26944 - }, - { - "epoch": 0.69, - "learning_rate": 1.797050022872439e-06, - "loss": 0.5957, - "step": 26945 - }, - { - "epoch": 0.69, - "learning_rate": 1.7970333120124787e-06, - "loss": 1.0322, - "step": 26946 - }, - { - "epoch": 0.69, - "learning_rate": 1.7970166005422667e-06, - "loss": 0.9102, - "step": 26947 - }, - { - "epoch": 0.69, - "learning_rate": 1.7969998884618156e-06, - "loss": 0.8926, - "step": 26948 - }, - { - "epoch": 0.69, - "learning_rate": 1.7969831757711388e-06, - "loss": 0.7441, - "step": 26949 - }, - { - "epoch": 0.69, - "learning_rate": 1.7969664624702481e-06, - "loss": 0.7827, - "step": 26950 - }, - { - "epoch": 0.69, - "learning_rate": 1.7969497485591569e-06, - "loss": 0.8311, - "step": 26951 - }, - { - "epoch": 0.69, - "learning_rate": 1.7969330340378781e-06, - "loss": 0.8789, - "step": 26952 - }, - { - "epoch": 0.69, - "learning_rate": 1.7969163189064242e-06, - "loss": 0.8672, - "step": 26953 - }, - { - "epoch": 0.69, - "learning_rate": 1.7968996031648085e-06, - "loss": 0.8369, - "step": 26954 - }, - { - "epoch": 0.69, - "learning_rate": 1.796882886813043e-06, - "loss": 1.0459, - "step": 26955 - }, - { - "epoch": 0.69, - "learning_rate": 1.796866169851141e-06, - "loss": 0.6685, - "step": 26956 - }, - { - "epoch": 0.69, - "learning_rate": 1.7968494522791153e-06, - "loss": 0.7588, - "step": 26957 - }, - { - "epoch": 0.69, - "learning_rate": 1.7968327340969785e-06, - "loss": 0.6796, - "step": 26958 - }, - { - "epoch": 0.69, - "learning_rate": 1.7968160153047435e-06, - "loss": 0.9326, - "step": 26959 - }, - { - "epoch": 0.69, - "learning_rate": 1.7967992959024232e-06, - "loss": 0.6421, - "step": 26960 - }, - { - "epoch": 0.69, - "learning_rate": 1.7967825758900301e-06, - "loss": 0.8906, - "step": 26961 - }, - { - "epoch": 0.69, - "learning_rate": 1.7967658552675777e-06, - "loss": 0.6758, - "step": 26962 - }, - { - "epoch": 0.69, - "learning_rate": 1.7967491340350778e-06, - "loss": 0.8867, - "step": 26963 - }, - { - "epoch": 0.69, - "learning_rate": 1.796732412192544e-06, - "loss": 0.877, - "step": 26964 - }, - { - "epoch": 0.69, - "learning_rate": 1.7967156897399889e-06, - "loss": 0.8867, - "step": 26965 - }, - { - "epoch": 0.69, - "learning_rate": 1.7966989666774251e-06, - "loss": 0.7432, - "step": 26966 - }, - { - "epoch": 0.69, - "learning_rate": 1.7966822430048655e-06, - "loss": 0.9482, - "step": 26967 - }, - { - "epoch": 0.69, - "learning_rate": 1.796665518722323e-06, - "loss": 0.6914, - "step": 26968 - }, - { - "epoch": 0.69, - "learning_rate": 1.7966487938298106e-06, - "loss": 0.9717, - "step": 26969 - }, - { - "epoch": 0.69, - "learning_rate": 1.7966320683273403e-06, - "loss": 0.7866, - "step": 26970 - }, - { - "epoch": 0.69, - "learning_rate": 1.7966153422149258e-06, - "loss": 0.8975, - "step": 26971 - }, - { - "epoch": 0.69, - "learning_rate": 1.7965986154925793e-06, - "loss": 0.8066, - "step": 26972 - }, - { - "epoch": 0.69, - "learning_rate": 1.7965818881603144e-06, - "loss": 0.833, - "step": 26973 - }, - { - "epoch": 0.69, - "learning_rate": 1.7965651602181429e-06, - "loss": 0.8711, - "step": 26974 - }, - { - "epoch": 0.69, - "learning_rate": 1.7965484316660784e-06, - "loss": 0.8359, - "step": 26975 - }, - { - "epoch": 0.69, - "learning_rate": 1.796531702504133e-06, - "loss": 0.9297, - "step": 26976 - }, - { - "epoch": 0.69, - "learning_rate": 1.79651497273232e-06, - "loss": 0.8633, - "step": 26977 - }, - { - "epoch": 0.69, - "learning_rate": 1.7964982423506522e-06, - "loss": 0.8521, - "step": 26978 - }, - { - "epoch": 0.69, - "learning_rate": 1.7964815113591424e-06, - "loss": 0.8877, - "step": 26979 - }, - { - "epoch": 0.69, - "learning_rate": 1.7964647797578034e-06, - "loss": 0.8945, - "step": 26980 - }, - { - "epoch": 0.69, - "learning_rate": 1.7964480475466477e-06, - "loss": 0.9004, - "step": 26981 - }, - { - "epoch": 0.69, - "learning_rate": 1.7964313147256887e-06, - "loss": 0.9033, - "step": 26982 - }, - { - "epoch": 0.69, - "learning_rate": 1.7964145812949385e-06, - "loss": 0.8711, - "step": 26983 - }, - { - "epoch": 0.69, - "learning_rate": 1.7963978472544104e-06, - "loss": 0.8257, - "step": 26984 - }, - { - "epoch": 0.69, - "learning_rate": 1.7963811126041172e-06, - "loss": 0.916, - "step": 26985 - }, - { - "epoch": 0.69, - "learning_rate": 1.7963643773440715e-06, - "loss": 0.7568, - "step": 26986 - }, - { - "epoch": 0.69, - "learning_rate": 1.7963476414742861e-06, - "loss": 0.8477, - "step": 26987 - }, - { - "epoch": 0.69, - "learning_rate": 1.7963309049947739e-06, - "loss": 0.606, - "step": 26988 - }, - { - "epoch": 0.69, - "learning_rate": 1.7963141679055482e-06, - "loss": 0.6714, - "step": 26989 - }, - { - "epoch": 0.69, - "learning_rate": 1.796297430206621e-06, - "loss": 0.8071, - "step": 26990 - }, - { - "epoch": 0.69, - "learning_rate": 1.7962806918980053e-06, - "loss": 0.833, - "step": 26991 - }, - { - "epoch": 0.69, - "learning_rate": 1.7962639529797143e-06, - "loss": 0.6493, - "step": 26992 - }, - { - "epoch": 0.69, - "learning_rate": 1.7962472134517607e-06, - "loss": 0.7451, - "step": 26993 - }, - { - "epoch": 0.69, - "learning_rate": 1.796230473314157e-06, - "loss": 0.9707, - "step": 26994 - }, - { - "epoch": 0.69, - "learning_rate": 1.7962137325669167e-06, - "loss": 0.7949, - "step": 26995 - }, - { - "epoch": 0.69, - "learning_rate": 1.7961969912100517e-06, - "loss": 0.7666, - "step": 26996 - }, - { - "epoch": 0.69, - "learning_rate": 1.7961802492435752e-06, - "loss": 1.0029, - "step": 26997 - }, - { - "epoch": 0.69, - "learning_rate": 1.7961635066675003e-06, - "loss": 0.8467, - "step": 26998 - }, - { - "epoch": 0.69, - "learning_rate": 1.7961467634818397e-06, - "loss": 0.7568, - "step": 26999 - }, - { - "epoch": 0.69, - "learning_rate": 1.796130019686606e-06, - "loss": 1.083, - "step": 27000 - }, - { - "epoch": 0.69, - "learning_rate": 1.7961132752818121e-06, - "loss": 0.6743, - "step": 27001 - }, - { - "epoch": 0.69, - "learning_rate": 1.7960965302674711e-06, - "loss": 0.9629, - "step": 27002 - }, - { - "epoch": 0.69, - "learning_rate": 1.7960797846435955e-06, - "loss": 0.918, - "step": 27003 - }, - { - "epoch": 0.69, - "learning_rate": 1.7960630384101982e-06, - "loss": 0.8013, - "step": 27004 - }, - { - "epoch": 0.69, - "learning_rate": 1.7960462915672918e-06, - "loss": 0.9756, - "step": 27005 - }, - { - "epoch": 0.69, - "learning_rate": 1.7960295441148897e-06, - "loss": 0.9229, - "step": 27006 - }, - { - "epoch": 0.69, - "learning_rate": 1.796012796053004e-06, - "loss": 0.8472, - "step": 27007 - }, - { - "epoch": 0.69, - "learning_rate": 1.7959960473816483e-06, - "loss": 0.4858, - "step": 27008 - }, - { - "epoch": 0.69, - "learning_rate": 1.795979298100835e-06, - "loss": 0.8789, - "step": 27009 - }, - { - "epoch": 0.69, - "learning_rate": 1.7959625482105768e-06, - "loss": 0.7983, - "step": 27010 - }, - { - "epoch": 0.69, - "learning_rate": 1.7959457977108864e-06, - "loss": 0.7671, - "step": 27011 - }, - { - "epoch": 0.69, - "learning_rate": 1.7959290466017773e-06, - "loss": 0.8613, - "step": 27012 - }, - { - "epoch": 0.69, - "learning_rate": 1.795912294883262e-06, - "loss": 0.9844, - "step": 27013 - }, - { - "epoch": 0.69, - "learning_rate": 1.795895542555353e-06, - "loss": 0.7734, - "step": 27014 - }, - { - "epoch": 0.69, - "learning_rate": 1.7958787896180633e-06, - "loss": 0.8926, - "step": 27015 - }, - { - "epoch": 0.69, - "learning_rate": 1.7958620360714061e-06, - "loss": 0.8135, - "step": 27016 - }, - { - "epoch": 0.69, - "learning_rate": 1.7958452819153937e-06, - "loss": 0.8926, - "step": 27017 - }, - { - "epoch": 0.69, - "learning_rate": 1.7958285271500392e-06, - "loss": 0.6895, - "step": 27018 - }, - { - "epoch": 0.69, - "learning_rate": 1.7958117717753556e-06, - "loss": 0.9209, - "step": 27019 - }, - { - "epoch": 0.69, - "learning_rate": 1.7957950157913552e-06, - "loss": 0.6777, - "step": 27020 - }, - { - "epoch": 0.69, - "learning_rate": 1.7957782591980512e-06, - "loss": 0.6836, - "step": 27021 - }, - { - "epoch": 0.69, - "learning_rate": 1.7957615019954567e-06, - "loss": 0.7451, - "step": 27022 - }, - { - "epoch": 0.69, - "learning_rate": 1.795744744183584e-06, - "loss": 0.9355, - "step": 27023 - }, - { - "epoch": 0.69, - "learning_rate": 1.7957279857624461e-06, - "loss": 1.0654, - "step": 27024 - }, - { - "epoch": 0.69, - "learning_rate": 1.795711226732056e-06, - "loss": 1.0283, - "step": 27025 - }, - { - "epoch": 0.69, - "learning_rate": 1.795694467092426e-06, - "loss": 0.9268, - "step": 27026 - }, - { - "epoch": 0.69, - "learning_rate": 1.7956777068435697e-06, - "loss": 0.8213, - "step": 27027 - }, - { - "epoch": 0.69, - "learning_rate": 1.7956609459854997e-06, - "loss": 0.8604, - "step": 27028 - }, - { - "epoch": 0.69, - "learning_rate": 1.7956441845182285e-06, - "loss": 0.7554, - "step": 27029 - }, - { - "epoch": 0.69, - "learning_rate": 1.7956274224417691e-06, - "loss": 0.7808, - "step": 27030 - }, - { - "epoch": 0.69, - "learning_rate": 1.7956106597561345e-06, - "loss": 0.9072, - "step": 27031 - }, - { - "epoch": 0.69, - "learning_rate": 1.7955938964613372e-06, - "loss": 0.7822, - "step": 27032 - }, - { - "epoch": 0.69, - "learning_rate": 1.7955771325573903e-06, - "loss": 0.7358, - "step": 27033 - }, - { - "epoch": 0.69, - "learning_rate": 1.7955603680443066e-06, - "loss": 0.9717, - "step": 27034 - }, - { - "epoch": 0.69, - "learning_rate": 1.795543602922099e-06, - "loss": 0.8054, - "step": 27035 - }, - { - "epoch": 0.69, - "learning_rate": 1.79552683719078e-06, - "loss": 0.813, - "step": 27036 - }, - { - "epoch": 0.69, - "learning_rate": 1.795510070850363e-06, - "loss": 0.7705, - "step": 27037 - }, - { - "epoch": 0.69, - "learning_rate": 1.7954933039008604e-06, - "loss": 0.8398, - "step": 27038 - }, - { - "epoch": 0.69, - "learning_rate": 1.795476536342285e-06, - "loss": 0.856, - "step": 27039 - }, - { - "epoch": 0.69, - "learning_rate": 1.79545976817465e-06, - "loss": 0.9033, - "step": 27040 - }, - { - "epoch": 0.69, - "learning_rate": 1.7954429993979679e-06, - "loss": 0.9814, - "step": 27041 - }, - { - "epoch": 0.69, - "learning_rate": 1.7954262300122518e-06, - "loss": 0.8066, - "step": 27042 - }, - { - "epoch": 0.69, - "learning_rate": 1.7954094600175143e-06, - "loss": 0.9434, - "step": 27043 - }, - { - "epoch": 0.69, - "learning_rate": 1.7953926894137682e-06, - "loss": 0.7402, - "step": 27044 - }, - { - "epoch": 0.69, - "learning_rate": 1.7953759182010266e-06, - "loss": 0.7402, - "step": 27045 - }, - { - "epoch": 0.69, - "learning_rate": 1.7953591463793022e-06, - "loss": 0.9053, - "step": 27046 - }, - { - "epoch": 0.69, - "learning_rate": 1.7953423739486081e-06, - "loss": 0.8496, - "step": 27047 - }, - { - "epoch": 0.69, - "learning_rate": 1.7953256009089569e-06, - "loss": 0.9492, - "step": 27048 - }, - { - "epoch": 0.69, - "learning_rate": 1.7953088272603613e-06, - "loss": 0.9102, - "step": 27049 - }, - { - "epoch": 0.69, - "learning_rate": 1.7952920530028345e-06, - "loss": 0.9316, - "step": 27050 - }, - { - "epoch": 0.69, - "learning_rate": 1.7952752781363887e-06, - "loss": 0.7725, - "step": 27051 - }, - { - "epoch": 0.69, - "learning_rate": 1.7952585026610377e-06, - "loss": 0.7441, - "step": 27052 - }, - { - "epoch": 0.69, - "learning_rate": 1.7952417265767936e-06, - "loss": 0.6396, - "step": 27053 - }, - { - "epoch": 0.69, - "learning_rate": 1.7952249498836694e-06, - "loss": 0.7812, - "step": 27054 - }, - { - "epoch": 0.69, - "learning_rate": 1.795208172581678e-06, - "loss": 0.7717, - "step": 27055 - }, - { - "epoch": 0.69, - "learning_rate": 1.7951913946708324e-06, - "loss": 0.959, - "step": 27056 - }, - { - "epoch": 0.69, - "learning_rate": 1.7951746161511454e-06, - "loss": 0.9746, - "step": 27057 - }, - { - "epoch": 0.69, - "learning_rate": 1.7951578370226294e-06, - "loss": 1.0352, - "step": 27058 - }, - { - "epoch": 0.69, - "learning_rate": 1.795141057285298e-06, - "loss": 1.0312, - "step": 27059 - }, - { - "epoch": 0.69, - "learning_rate": 1.7951242769391634e-06, - "loss": 0.6328, - "step": 27060 - }, - { - "epoch": 0.69, - "learning_rate": 1.7951074959842387e-06, - "loss": 0.7236, - "step": 27061 - }, - { - "epoch": 0.69, - "learning_rate": 1.795090714420537e-06, - "loss": 0.811, - "step": 27062 - }, - { - "epoch": 0.69, - "learning_rate": 1.7950739322480708e-06, - "loss": 1.0215, - "step": 27063 - }, - { - "epoch": 0.69, - "learning_rate": 1.7950571494668529e-06, - "loss": 0.7295, - "step": 27064 - }, - { - "epoch": 0.69, - "learning_rate": 1.7950403660768965e-06, - "loss": 0.658, - "step": 27065 - }, - { - "epoch": 0.69, - "learning_rate": 1.795023582078214e-06, - "loss": 0.9551, - "step": 27066 - }, - { - "epoch": 0.69, - "learning_rate": 1.7950067974708188e-06, - "loss": 1.0293, - "step": 27067 - }, - { - "epoch": 0.69, - "learning_rate": 1.7949900122547233e-06, - "loss": 0.8311, - "step": 27068 - }, - { - "epoch": 0.69, - "learning_rate": 1.7949732264299404e-06, - "loss": 0.8975, - "step": 27069 - }, - { - "epoch": 0.69, - "learning_rate": 1.7949564399964833e-06, - "loss": 0.8027, - "step": 27070 - }, - { - "epoch": 0.69, - "learning_rate": 1.7949396529543643e-06, - "loss": 0.7017, - "step": 27071 - }, - { - "epoch": 0.69, - "learning_rate": 1.7949228653035967e-06, - "loss": 0.8394, - "step": 27072 - }, - { - "epoch": 0.69, - "learning_rate": 1.7949060770441932e-06, - "loss": 0.8496, - "step": 27073 - }, - { - "epoch": 0.69, - "learning_rate": 1.7948892881761668e-06, - "loss": 0.9795, - "step": 27074 - }, - { - "epoch": 0.69, - "learning_rate": 1.7948724986995301e-06, - "loss": 0.7334, - "step": 27075 - }, - { - "epoch": 0.69, - "learning_rate": 1.794855708614296e-06, - "loss": 0.7158, - "step": 27076 - }, - { - "epoch": 0.69, - "learning_rate": 1.7948389179204777e-06, - "loss": 0.7666, - "step": 27077 - }, - { - "epoch": 0.69, - "learning_rate": 1.7948221266180873e-06, - "loss": 0.8252, - "step": 27078 - }, - { - "epoch": 0.69, - "learning_rate": 1.7948053347071387e-06, - "loss": 0.8047, - "step": 27079 - }, - { - "epoch": 0.69, - "learning_rate": 1.7947885421876442e-06, - "loss": 0.4888, - "step": 27080 - }, - { - "epoch": 0.69, - "learning_rate": 1.7947717490596162e-06, - "loss": 0.8564, - "step": 27081 - }, - { - "epoch": 0.69, - "learning_rate": 1.7947549553230682e-06, - "loss": 0.6875, - "step": 27082 - }, - { - "epoch": 0.69, - "learning_rate": 1.794738160978013e-06, - "loss": 0.9658, - "step": 27083 - }, - { - "epoch": 0.69, - "learning_rate": 1.794721366024463e-06, - "loss": 0.9482, - "step": 27084 - }, - { - "epoch": 0.69, - "learning_rate": 1.7947045704624317e-06, - "loss": 1.0068, - "step": 27085 - }, - { - "epoch": 0.69, - "learning_rate": 1.7946877742919317e-06, - "loss": 0.4658, - "step": 27086 - }, - { - "epoch": 0.69, - "learning_rate": 1.7946709775129759e-06, - "loss": 0.8218, - "step": 27087 - }, - { - "epoch": 0.69, - "learning_rate": 1.7946541801255768e-06, - "loss": 1.0322, - "step": 27088 - }, - { - "epoch": 0.69, - "learning_rate": 1.7946373821297477e-06, - "loss": 0.9219, - "step": 27089 - }, - { - "epoch": 0.69, - "learning_rate": 1.794620583525501e-06, - "loss": 1.0703, - "step": 27090 - }, - { - "epoch": 0.69, - "learning_rate": 1.79460378431285e-06, - "loss": 0.8018, - "step": 27091 - }, - { - "epoch": 0.69, - "learning_rate": 1.7945869844918076e-06, - "loss": 0.5942, - "step": 27092 - }, - { - "epoch": 0.69, - "learning_rate": 1.7945701840623863e-06, - "loss": 0.7671, - "step": 27093 - }, - { - "epoch": 0.69, - "learning_rate": 1.794553383024599e-06, - "loss": 1.0645, - "step": 27094 - }, - { - "epoch": 0.69, - "learning_rate": 1.794536581378459e-06, - "loss": 0.8174, - "step": 27095 - }, - { - "epoch": 0.69, - "learning_rate": 1.794519779123979e-06, - "loss": 1.0137, - "step": 27096 - }, - { - "epoch": 0.69, - "learning_rate": 1.7945029762611715e-06, - "loss": 0.7236, - "step": 27097 - }, - { - "epoch": 0.69, - "learning_rate": 1.7944861727900496e-06, - "loss": 1.0156, - "step": 27098 - }, - { - "epoch": 0.69, - "learning_rate": 1.7944693687106263e-06, - "loss": 0.8438, - "step": 27099 - }, - { - "epoch": 0.69, - "learning_rate": 1.7944525640229142e-06, - "loss": 0.8184, - "step": 27100 - }, - { - "epoch": 0.69, - "learning_rate": 1.7944357587269263e-06, - "loss": 0.5933, - "step": 27101 - }, - { - "epoch": 0.69, - "learning_rate": 1.7944189528226757e-06, - "loss": 0.8926, - "step": 27102 - }, - { - "epoch": 0.69, - "learning_rate": 1.7944021463101747e-06, - "loss": 0.8672, - "step": 27103 - }, - { - "epoch": 0.69, - "learning_rate": 1.7943853391894366e-06, - "loss": 0.9854, - "step": 27104 - }, - { - "epoch": 0.69, - "learning_rate": 1.7943685314604742e-06, - "loss": 0.8926, - "step": 27105 - }, - { - "epoch": 0.69, - "learning_rate": 1.7943517231233005e-06, - "loss": 0.9897, - "step": 27106 - }, - { - "epoch": 0.69, - "learning_rate": 1.794334914177928e-06, - "loss": 1.0059, - "step": 27107 - }, - { - "epoch": 0.69, - "learning_rate": 1.7943181046243695e-06, - "loss": 0.9404, - "step": 27108 - }, - { - "epoch": 0.69, - "learning_rate": 1.7943012944626388e-06, - "loss": 0.8887, - "step": 27109 - }, - { - "epoch": 0.69, - "learning_rate": 1.7942844836927479e-06, - "loss": 0.8359, - "step": 27110 - }, - { - "epoch": 0.69, - "learning_rate": 1.7942676723147098e-06, - "loss": 0.7305, - "step": 27111 - }, - { - "epoch": 0.69, - "learning_rate": 1.7942508603285374e-06, - "loss": 0.8252, - "step": 27112 - }, - { - "epoch": 0.69, - "learning_rate": 1.7942340477342438e-06, - "loss": 0.7266, - "step": 27113 - }, - { - "epoch": 0.69, - "learning_rate": 1.7942172345318416e-06, - "loss": 0.8013, - "step": 27114 - }, - { - "epoch": 0.69, - "learning_rate": 1.7942004207213438e-06, - "loss": 0.9072, - "step": 27115 - }, - { - "epoch": 0.69, - "learning_rate": 1.7941836063027634e-06, - "loss": 0.6504, - "step": 27116 - }, - { - "epoch": 0.7, - "learning_rate": 1.7941667912761127e-06, - "loss": 0.6875, - "step": 27117 - }, - { - "epoch": 0.7, - "learning_rate": 1.7941499756414053e-06, - "loss": 0.8613, - "step": 27118 - }, - { - "epoch": 0.7, - "learning_rate": 1.794133159398654e-06, - "loss": 0.8354, - "step": 27119 - }, - { - "epoch": 0.7, - "learning_rate": 1.7941163425478712e-06, - "loss": 0.9336, - "step": 27120 - }, - { - "epoch": 0.7, - "learning_rate": 1.79409952508907e-06, - "loss": 0.9814, - "step": 27121 - }, - { - "epoch": 0.7, - "learning_rate": 1.7940827070222634e-06, - "loss": 0.6609, - "step": 27122 - }, - { - "epoch": 0.7, - "learning_rate": 1.7940658883474642e-06, - "loss": 0.9609, - "step": 27123 - }, - { - "epoch": 0.7, - "learning_rate": 1.7940490690646853e-06, - "loss": 0.7954, - "step": 27124 - }, - { - "epoch": 0.7, - "learning_rate": 1.7940322491739392e-06, - "loss": 0.8662, - "step": 27125 - }, - { - "epoch": 0.7, - "learning_rate": 1.7940154286752396e-06, - "loss": 0.7307, - "step": 27126 - }, - { - "epoch": 0.7, - "learning_rate": 1.7939986075685986e-06, - "loss": 0.8086, - "step": 27127 - }, - { - "epoch": 0.7, - "learning_rate": 1.7939817858540294e-06, - "loss": 0.9053, - "step": 27128 - }, - { - "epoch": 0.7, - "learning_rate": 1.793964963531545e-06, - "loss": 0.8857, - "step": 27129 - }, - { - "epoch": 0.7, - "learning_rate": 1.7939481406011582e-06, - "loss": 0.6133, - "step": 27130 - }, - { - "epoch": 0.7, - "learning_rate": 1.7939313170628813e-06, - "loss": 1.0479, - "step": 27131 - }, - { - "epoch": 0.7, - "learning_rate": 1.7939144929167282e-06, - "loss": 0.8018, - "step": 27132 - }, - { - "epoch": 0.7, - "learning_rate": 1.7938976681627111e-06, - "loss": 0.8831, - "step": 27133 - }, - { - "epoch": 0.7, - "learning_rate": 1.793880842800843e-06, - "loss": 0.8008, - "step": 27134 - }, - { - "epoch": 0.7, - "learning_rate": 1.793864016831137e-06, - "loss": 0.7734, - "step": 27135 - }, - { - "epoch": 0.7, - "learning_rate": 1.7938471902536056e-06, - "loss": 0.915, - "step": 27136 - }, - { - "epoch": 0.7, - "learning_rate": 1.7938303630682624e-06, - "loss": 0.7266, - "step": 27137 - }, - { - "epoch": 0.7, - "learning_rate": 1.7938135352751194e-06, - "loss": 1.0146, - "step": 27138 - }, - { - "epoch": 0.7, - "learning_rate": 1.7937967068741897e-06, - "loss": 0.8027, - "step": 27139 - }, - { - "epoch": 0.7, - "learning_rate": 1.7937798778654867e-06, - "loss": 0.8906, - "step": 27140 - }, - { - "epoch": 0.7, - "learning_rate": 1.7937630482490227e-06, - "loss": 0.9551, - "step": 27141 - }, - { - "epoch": 0.7, - "learning_rate": 1.793746218024811e-06, - "loss": 0.999, - "step": 27142 - }, - { - "epoch": 0.7, - "learning_rate": 1.7937293871928642e-06, - "loss": 0.7319, - "step": 27143 - }, - { - "epoch": 0.7, - "learning_rate": 1.7937125557531957e-06, - "loss": 0.9678, - "step": 27144 - }, - { - "epoch": 0.7, - "learning_rate": 1.7936957237058174e-06, - "loss": 0.9678, - "step": 27145 - }, - { - "epoch": 0.7, - "learning_rate": 1.7936788910507433e-06, - "loss": 0.792, - "step": 27146 - }, - { - "epoch": 0.7, - "learning_rate": 1.7936620577879854e-06, - "loss": 0.6633, - "step": 27147 - }, - { - "epoch": 0.7, - "learning_rate": 1.793645223917557e-06, - "loss": 0.7744, - "step": 27148 - }, - { - "epoch": 0.7, - "learning_rate": 1.7936283894394712e-06, - "loss": 0.8252, - "step": 27149 - }, - { - "epoch": 0.7, - "learning_rate": 1.7936115543537405e-06, - "loss": 0.7559, - "step": 27150 - }, - { - "epoch": 0.7, - "learning_rate": 1.793594718660378e-06, - "loss": 0.9512, - "step": 27151 - }, - { - "epoch": 0.7, - "learning_rate": 1.7935778823593964e-06, - "loss": 0.6655, - "step": 27152 - }, - { - "epoch": 0.7, - "learning_rate": 1.7935610454508086e-06, - "loss": 0.8857, - "step": 27153 - }, - { - "epoch": 0.7, - "learning_rate": 1.7935442079346276e-06, - "loss": 0.8164, - "step": 27154 - }, - { - "epoch": 0.7, - "learning_rate": 1.7935273698108665e-06, - "loss": 0.7329, - "step": 27155 - }, - { - "epoch": 0.7, - "learning_rate": 1.793510531079538e-06, - "loss": 0.8193, - "step": 27156 - }, - { - "epoch": 0.7, - "learning_rate": 1.7934936917406547e-06, - "loss": 0.998, - "step": 27157 - }, - { - "epoch": 0.7, - "learning_rate": 1.7934768517942298e-06, - "loss": 0.8721, - "step": 27158 - }, - { - "epoch": 0.7, - "learning_rate": 1.7934600112402763e-06, - "loss": 0.9697, - "step": 27159 - }, - { - "epoch": 0.7, - "learning_rate": 1.7934431700788068e-06, - "loss": 0.8721, - "step": 27160 - }, - { - "epoch": 0.7, - "learning_rate": 1.7934263283098348e-06, - "loss": 1.0234, - "step": 27161 - }, - { - "epoch": 0.7, - "learning_rate": 1.7934094859333721e-06, - "loss": 0.8555, - "step": 27162 - }, - { - "epoch": 0.7, - "learning_rate": 1.7933926429494325e-06, - "loss": 0.959, - "step": 27163 - }, - { - "epoch": 0.7, - "learning_rate": 1.793375799358029e-06, - "loss": 0.751, - "step": 27164 - }, - { - "epoch": 0.7, - "learning_rate": 1.793358955159174e-06, - "loss": 0.998, - "step": 27165 - }, - { - "epoch": 0.7, - "learning_rate": 1.79334211035288e-06, - "loss": 0.8652, - "step": 27166 - }, - { - "epoch": 0.7, - "learning_rate": 1.7933252649391611e-06, - "loss": 0.8809, - "step": 27167 - }, - { - "epoch": 0.7, - "learning_rate": 1.793308418918029e-06, - "loss": 0.9287, - "step": 27168 - }, - { - "epoch": 0.7, - "learning_rate": 1.7932915722894974e-06, - "loss": 0.917, - "step": 27169 - }, - { - "epoch": 0.7, - "learning_rate": 1.7932747250535786e-06, - "loss": 0.9248, - "step": 27170 - }, - { - "epoch": 0.7, - "learning_rate": 1.7932578772102861e-06, - "loss": 0.9365, - "step": 27171 - }, - { - "epoch": 0.7, - "learning_rate": 1.7932410287596327e-06, - "loss": 0.8574, - "step": 27172 - }, - { - "epoch": 0.7, - "learning_rate": 1.7932241797016308e-06, - "loss": 0.7959, - "step": 27173 - }, - { - "epoch": 0.7, - "learning_rate": 1.7932073300362938e-06, - "loss": 0.8418, - "step": 27174 - }, - { - "epoch": 0.7, - "learning_rate": 1.7931904797636342e-06, - "loss": 0.7295, - "step": 27175 - }, - { - "epoch": 0.7, - "learning_rate": 1.7931736288836653e-06, - "loss": 0.624, - "step": 27176 - }, - { - "epoch": 0.7, - "learning_rate": 1.7931567773963998e-06, - "loss": 0.9131, - "step": 27177 - }, - { - "epoch": 0.7, - "learning_rate": 1.7931399253018507e-06, - "loss": 0.8936, - "step": 27178 - }, - { - "epoch": 0.7, - "learning_rate": 1.7931230726000306e-06, - "loss": 0.8496, - "step": 27179 - }, - { - "epoch": 0.7, - "learning_rate": 1.7931062192909527e-06, - "loss": 0.74, - "step": 27180 - }, - { - "epoch": 0.7, - "learning_rate": 1.7930893653746299e-06, - "loss": 0.8584, - "step": 27181 - }, - { - "epoch": 0.7, - "learning_rate": 1.793072510851075e-06, - "loss": 0.832, - "step": 27182 - }, - { - "epoch": 0.7, - "learning_rate": 1.793055655720301e-06, - "loss": 0.5874, - "step": 27183 - }, - { - "epoch": 0.7, - "learning_rate": 1.793038799982321e-06, - "loss": 0.8643, - "step": 27184 - }, - { - "epoch": 0.7, - "learning_rate": 1.7930219436371472e-06, - "loss": 1.0459, - "step": 27185 - }, - { - "epoch": 0.7, - "learning_rate": 1.7930050866847932e-06, - "loss": 0.9473, - "step": 27186 - }, - { - "epoch": 0.7, - "learning_rate": 1.7929882291252715e-06, - "loss": 0.9043, - "step": 27187 - }, - { - "epoch": 0.7, - "learning_rate": 1.7929713709585954e-06, - "loss": 0.8799, - "step": 27188 - }, - { - "epoch": 0.7, - "learning_rate": 1.7929545121847775e-06, - "loss": 0.7891, - "step": 27189 - }, - { - "epoch": 0.7, - "learning_rate": 1.7929376528038307e-06, - "loss": 0.9316, - "step": 27190 - }, - { - "epoch": 0.7, - "learning_rate": 1.7929207928157682e-06, - "loss": 0.7119, - "step": 27191 - }, - { - "epoch": 0.7, - "learning_rate": 1.7929039322206026e-06, - "loss": 0.9502, - "step": 27192 - }, - { - "epoch": 0.7, - "learning_rate": 1.7928870710183468e-06, - "loss": 0.5837, - "step": 27193 - }, - { - "epoch": 0.7, - "learning_rate": 1.792870209209014e-06, - "loss": 0.9775, - "step": 27194 - }, - { - "epoch": 0.7, - "learning_rate": 1.7928533467926168e-06, - "loss": 0.8516, - "step": 27195 - }, - { - "epoch": 0.7, - "learning_rate": 1.7928364837691685e-06, - "loss": 0.8994, - "step": 27196 - }, - { - "epoch": 0.7, - "learning_rate": 1.7928196201386813e-06, - "loss": 0.9639, - "step": 27197 - }, - { - "epoch": 0.7, - "learning_rate": 1.7928027559011689e-06, - "loss": 0.8418, - "step": 27198 - }, - { - "epoch": 0.7, - "learning_rate": 1.7927858910566438e-06, - "loss": 0.9473, - "step": 27199 - }, - { - "epoch": 0.7, - "learning_rate": 1.792769025605119e-06, - "loss": 0.9727, - "step": 27200 - }, - { - "epoch": 0.7, - "learning_rate": 1.7927521595466075e-06, - "loss": 1.0664, - "step": 27201 - }, - { - "epoch": 0.7, - "learning_rate": 1.7927352928811221e-06, - "loss": 0.8809, - "step": 27202 - }, - { - "epoch": 0.7, - "learning_rate": 1.7927184256086756e-06, - "loss": 0.877, - "step": 27203 - }, - { - "epoch": 0.7, - "learning_rate": 1.7927015577292812e-06, - "loss": 0.7324, - "step": 27204 - }, - { - "epoch": 0.7, - "learning_rate": 1.7926846892429515e-06, - "loss": 0.7913, - "step": 27205 - }, - { - "epoch": 0.7, - "learning_rate": 1.7926678201497e-06, - "loss": 1.125, - "step": 27206 - }, - { - "epoch": 0.7, - "learning_rate": 1.7926509504495386e-06, - "loss": 0.7827, - "step": 27207 - }, - { - "epoch": 0.7, - "learning_rate": 1.792634080142481e-06, - "loss": 0.9443, - "step": 27208 - }, - { - "epoch": 0.7, - "learning_rate": 1.7926172092285403e-06, - "loss": 0.7197, - "step": 27209 - }, - { - "epoch": 0.7, - "learning_rate": 1.7926003377077287e-06, - "loss": 0.9688, - "step": 27210 - }, - { - "epoch": 0.7, - "learning_rate": 1.7925834655800599e-06, - "loss": 0.8721, - "step": 27211 - }, - { - "epoch": 0.7, - "learning_rate": 1.7925665928455457e-06, - "loss": 0.6855, - "step": 27212 - }, - { - "epoch": 0.7, - "learning_rate": 1.7925497195042e-06, - "loss": 0.8506, - "step": 27213 - }, - { - "epoch": 0.7, - "learning_rate": 1.7925328455560356e-06, - "loss": 0.7764, - "step": 27214 - }, - { - "epoch": 0.7, - "learning_rate": 1.7925159710010652e-06, - "loss": 0.8027, - "step": 27215 - }, - { - "epoch": 0.7, - "learning_rate": 1.7924990958393016e-06, - "loss": 0.6919, - "step": 27216 - }, - { - "epoch": 0.7, - "learning_rate": 1.7924822200707578e-06, - "loss": 0.7617, - "step": 27217 - }, - { - "epoch": 0.7, - "learning_rate": 1.792465343695447e-06, - "loss": 0.8848, - "step": 27218 - }, - { - "epoch": 0.7, - "learning_rate": 1.792448466713382e-06, - "loss": 0.8623, - "step": 27219 - }, - { - "epoch": 0.7, - "learning_rate": 1.7924315891245754e-06, - "loss": 0.7021, - "step": 27220 - }, - { - "epoch": 0.7, - "learning_rate": 1.7924147109290403e-06, - "loss": 0.6304, - "step": 27221 - }, - { - "epoch": 0.7, - "learning_rate": 1.79239783212679e-06, - "loss": 0.7471, - "step": 27222 - }, - { - "epoch": 0.7, - "learning_rate": 1.792380952717837e-06, - "loss": 0.688, - "step": 27223 - }, - { - "epoch": 0.7, - "learning_rate": 1.7923640727021944e-06, - "loss": 0.8096, - "step": 27224 - }, - { - "epoch": 0.7, - "learning_rate": 1.7923471920798748e-06, - "loss": 0.8203, - "step": 27225 - }, - { - "epoch": 0.7, - "learning_rate": 1.7923303108508918e-06, - "loss": 0.9336, - "step": 27226 - }, - { - "epoch": 0.7, - "learning_rate": 1.7923134290152577e-06, - "loss": 0.9551, - "step": 27227 - }, - { - "epoch": 0.7, - "learning_rate": 1.7922965465729858e-06, - "loss": 0.7434, - "step": 27228 - }, - { - "epoch": 0.7, - "learning_rate": 1.7922796635240887e-06, - "loss": 0.9053, - "step": 27229 - }, - { - "epoch": 0.7, - "learning_rate": 1.7922627798685795e-06, - "loss": 0.6255, - "step": 27230 - }, - { - "epoch": 0.7, - "learning_rate": 1.792245895606471e-06, - "loss": 0.6016, - "step": 27231 - }, - { - "epoch": 0.7, - "learning_rate": 1.7922290107377762e-06, - "loss": 0.8203, - "step": 27232 - }, - { - "epoch": 0.7, - "learning_rate": 1.7922121252625084e-06, - "loss": 1.0146, - "step": 27233 - }, - { - "epoch": 0.7, - "learning_rate": 1.7921952391806801e-06, - "loss": 0.7834, - "step": 27234 - }, - { - "epoch": 0.7, - "learning_rate": 1.7921783524923042e-06, - "loss": 0.8994, - "step": 27235 - }, - { - "epoch": 0.7, - "learning_rate": 1.7921614651973939e-06, - "loss": 0.9854, - "step": 27236 - }, - { - "epoch": 0.7, - "learning_rate": 1.792144577295962e-06, - "loss": 0.6863, - "step": 27237 - }, - { - "epoch": 0.7, - "learning_rate": 1.7921276887880212e-06, - "loss": 0.6853, - "step": 27238 - }, - { - "epoch": 0.7, - "learning_rate": 1.7921107996735846e-06, - "loss": 0.9482, - "step": 27239 - }, - { - "epoch": 0.7, - "learning_rate": 1.7920939099526656e-06, - "loss": 0.7051, - "step": 27240 - }, - { - "epoch": 0.7, - "learning_rate": 1.7920770196252767e-06, - "loss": 0.8975, - "step": 27241 - }, - { - "epoch": 0.7, - "learning_rate": 1.7920601286914306e-06, - "loss": 0.8555, - "step": 27242 - }, - { - "epoch": 0.7, - "learning_rate": 1.7920432371511405e-06, - "loss": 0.9766, - "step": 27243 - }, - { - "epoch": 0.7, - "learning_rate": 1.792026345004419e-06, - "loss": 0.6506, - "step": 27244 - }, - { - "epoch": 0.7, - "learning_rate": 1.7920094522512799e-06, - "loss": 0.8643, - "step": 27245 - }, - { - "epoch": 0.7, - "learning_rate": 1.7919925588917354e-06, - "loss": 0.9004, - "step": 27246 - }, - { - "epoch": 0.7, - "learning_rate": 1.7919756649257985e-06, - "loss": 0.9141, - "step": 27247 - }, - { - "epoch": 0.7, - "learning_rate": 1.7919587703534824e-06, - "loss": 0.8374, - "step": 27248 - }, - { - "epoch": 0.7, - "learning_rate": 1.7919418751747998e-06, - "loss": 0.9375, - "step": 27249 - }, - { - "epoch": 0.7, - "learning_rate": 1.7919249793897637e-06, - "loss": 1.0605, - "step": 27250 - }, - { - "epoch": 0.7, - "learning_rate": 1.791908082998387e-06, - "loss": 0.8887, - "step": 27251 - }, - { - "epoch": 0.7, - "learning_rate": 1.7918911860006829e-06, - "loss": 0.8643, - "step": 27252 - }, - { - "epoch": 0.7, - "learning_rate": 1.791874288396664e-06, - "loss": 0.6016, - "step": 27253 - }, - { - "epoch": 0.7, - "learning_rate": 1.7918573901863434e-06, - "loss": 0.7517, - "step": 27254 - }, - { - "epoch": 0.7, - "learning_rate": 1.7918404913697339e-06, - "loss": 0.9941, - "step": 27255 - }, - { - "epoch": 0.7, - "learning_rate": 1.7918235919468486e-06, - "loss": 0.7988, - "step": 27256 - }, - { - "epoch": 0.7, - "learning_rate": 1.7918066919177004e-06, - "loss": 0.7139, - "step": 27257 - }, - { - "epoch": 0.7, - "learning_rate": 1.7917897912823024e-06, - "loss": 1.0332, - "step": 27258 - }, - { - "epoch": 0.7, - "learning_rate": 1.7917728900406672e-06, - "loss": 0.7534, - "step": 27259 - }, - { - "epoch": 0.7, - "learning_rate": 1.7917559881928077e-06, - "loss": 0.8037, - "step": 27260 - }, - { - "epoch": 0.7, - "learning_rate": 1.7917390857387374e-06, - "loss": 0.8389, - "step": 27261 - }, - { - "epoch": 0.7, - "learning_rate": 1.7917221826784687e-06, - "loss": 0.9268, - "step": 27262 - }, - { - "epoch": 0.7, - "learning_rate": 1.7917052790120149e-06, - "loss": 1.0322, - "step": 27263 - }, - { - "epoch": 0.7, - "learning_rate": 1.7916883747393885e-06, - "loss": 0.8379, - "step": 27264 - }, - { - "epoch": 0.7, - "learning_rate": 1.7916714698606027e-06, - "loss": 0.6572, - "step": 27265 - }, - { - "epoch": 0.7, - "learning_rate": 1.7916545643756708e-06, - "loss": 0.8535, - "step": 27266 - }, - { - "epoch": 0.7, - "learning_rate": 1.7916376582846051e-06, - "loss": 0.9561, - "step": 27267 - }, - { - "epoch": 0.7, - "learning_rate": 1.7916207515874192e-06, - "loss": 1.1133, - "step": 27268 - }, - { - "epoch": 0.7, - "learning_rate": 1.7916038442841252e-06, - "loss": 0.7314, - "step": 27269 - }, - { - "epoch": 0.7, - "learning_rate": 1.7915869363747369e-06, - "loss": 0.9863, - "step": 27270 - }, - { - "epoch": 0.7, - "learning_rate": 1.7915700278592668e-06, - "loss": 0.8306, - "step": 27271 - }, - { - "epoch": 0.7, - "learning_rate": 1.791553118737728e-06, - "loss": 1.0244, - "step": 27272 - }, - { - "epoch": 0.7, - "learning_rate": 1.7915362090101331e-06, - "loss": 0.9775, - "step": 27273 - }, - { - "epoch": 0.7, - "learning_rate": 1.7915192986764956e-06, - "loss": 0.8662, - "step": 27274 - }, - { - "epoch": 0.7, - "learning_rate": 1.7915023877368278e-06, - "loss": 1.1162, - "step": 27275 - }, - { - "epoch": 0.7, - "learning_rate": 1.7914854761911435e-06, - "loss": 1.0098, - "step": 27276 - }, - { - "epoch": 0.7, - "learning_rate": 1.7914685640394548e-06, - "loss": 0.7988, - "step": 27277 - }, - { - "epoch": 0.7, - "learning_rate": 1.7914516512817752e-06, - "loss": 0.9365, - "step": 27278 - }, - { - "epoch": 0.7, - "learning_rate": 1.7914347379181175e-06, - "loss": 0.8794, - "step": 27279 - }, - { - "epoch": 0.7, - "learning_rate": 1.7914178239484942e-06, - "loss": 0.8486, - "step": 27280 - }, - { - "epoch": 0.7, - "learning_rate": 1.7914009093729193e-06, - "loss": 0.7969, - "step": 27281 - }, - { - "epoch": 0.7, - "learning_rate": 1.7913839941914047e-06, - "loss": 1.002, - "step": 27282 - }, - { - "epoch": 0.7, - "learning_rate": 1.791367078403964e-06, - "loss": 0.9189, - "step": 27283 - }, - { - "epoch": 0.7, - "learning_rate": 1.7913501620106097e-06, - "loss": 0.9893, - "step": 27284 - }, - { - "epoch": 0.7, - "learning_rate": 1.791333245011355e-06, - "loss": 0.8818, - "step": 27285 - }, - { - "epoch": 0.7, - "learning_rate": 1.7913163274062128e-06, - "loss": 0.8467, - "step": 27286 - }, - { - "epoch": 0.7, - "learning_rate": 1.7912994091951962e-06, - "loss": 0.9639, - "step": 27287 - }, - { - "epoch": 0.7, - "learning_rate": 1.791282490378318e-06, - "loss": 0.6951, - "step": 27288 - }, - { - "epoch": 0.7, - "learning_rate": 1.7912655709555912e-06, - "loss": 0.8193, - "step": 27289 - }, - { - "epoch": 0.7, - "learning_rate": 1.7912486509270286e-06, - "loss": 1.0186, - "step": 27290 - }, - { - "epoch": 0.7, - "learning_rate": 1.7912317302926433e-06, - "loss": 0.8477, - "step": 27291 - }, - { - "epoch": 0.7, - "learning_rate": 1.7912148090524484e-06, - "loss": 0.8428, - "step": 27292 - }, - { - "epoch": 0.7, - "learning_rate": 1.7911978872064566e-06, - "loss": 0.6992, - "step": 27293 - }, - { - "epoch": 0.7, - "learning_rate": 1.7911809647546812e-06, - "loss": 0.8076, - "step": 27294 - }, - { - "epoch": 0.7, - "learning_rate": 1.7911640416971346e-06, - "loss": 0.876, - "step": 27295 - }, - { - "epoch": 0.7, - "learning_rate": 1.7911471180338302e-06, - "loss": 1.1152, - "step": 27296 - }, - { - "epoch": 0.7, - "learning_rate": 1.7911301937647808e-06, - "loss": 0.6816, - "step": 27297 - }, - { - "epoch": 0.7, - "learning_rate": 1.7911132688899993e-06, - "loss": 0.6689, - "step": 27298 - }, - { - "epoch": 0.7, - "learning_rate": 1.791096343409499e-06, - "loss": 0.7495, - "step": 27299 - }, - { - "epoch": 0.7, - "learning_rate": 1.7910794173232922e-06, - "loss": 0.7676, - "step": 27300 - }, - { - "epoch": 0.7, - "learning_rate": 1.7910624906313925e-06, - "loss": 0.7529, - "step": 27301 - }, - { - "epoch": 0.7, - "learning_rate": 1.7910455633338128e-06, - "loss": 0.9482, - "step": 27302 - }, - { - "epoch": 0.7, - "learning_rate": 1.7910286354305658e-06, - "loss": 0.9199, - "step": 27303 - }, - { - "epoch": 0.7, - "learning_rate": 1.7910117069216644e-06, - "loss": 0.9375, - "step": 27304 - }, - { - "epoch": 0.7, - "learning_rate": 1.7909947778071217e-06, - "loss": 0.8613, - "step": 27305 - }, - { - "epoch": 0.7, - "learning_rate": 1.7909778480869507e-06, - "loss": 0.8936, - "step": 27306 - }, - { - "epoch": 0.7, - "learning_rate": 1.7909609177611644e-06, - "loss": 0.8408, - "step": 27307 - }, - { - "epoch": 0.7, - "learning_rate": 1.7909439868297755e-06, - "loss": 0.8115, - "step": 27308 - }, - { - "epoch": 0.7, - "learning_rate": 1.7909270552927976e-06, - "loss": 0.6313, - "step": 27309 - }, - { - "epoch": 0.7, - "learning_rate": 1.7909101231502427e-06, - "loss": 0.8047, - "step": 27310 - }, - { - "epoch": 0.7, - "learning_rate": 1.7908931904021248e-06, - "loss": 0.8242, - "step": 27311 - }, - { - "epoch": 0.7, - "learning_rate": 1.7908762570484558e-06, - "loss": 0.9736, - "step": 27312 - }, - { - "epoch": 0.7, - "learning_rate": 1.7908593230892498e-06, - "loss": 0.6235, - "step": 27313 - }, - { - "epoch": 0.7, - "learning_rate": 1.7908423885245187e-06, - "loss": 0.6914, - "step": 27314 - }, - { - "epoch": 0.7, - "learning_rate": 1.7908254533542762e-06, - "loss": 0.9004, - "step": 27315 - }, - { - "epoch": 0.7, - "learning_rate": 1.7908085175785349e-06, - "loss": 1.0801, - "step": 27316 - }, - { - "epoch": 0.7, - "learning_rate": 1.790791581197308e-06, - "loss": 0.8354, - "step": 27317 - }, - { - "epoch": 0.7, - "learning_rate": 1.7907746442106082e-06, - "loss": 0.5962, - "step": 27318 - }, - { - "epoch": 0.7, - "learning_rate": 1.7907577066184488e-06, - "loss": 1.0508, - "step": 27319 - }, - { - "epoch": 0.7, - "learning_rate": 1.7907407684208421e-06, - "loss": 0.9482, - "step": 27320 - }, - { - "epoch": 0.7, - "learning_rate": 1.7907238296178021e-06, - "loss": 0.8301, - "step": 27321 - }, - { - "epoch": 0.7, - "learning_rate": 1.7907068902093409e-06, - "loss": 0.6345, - "step": 27322 - }, - { - "epoch": 0.7, - "learning_rate": 1.790689950195472e-06, - "loss": 0.915, - "step": 27323 - }, - { - "epoch": 0.7, - "learning_rate": 1.7906730095762082e-06, - "loss": 0.8945, - "step": 27324 - }, - { - "epoch": 0.7, - "learning_rate": 1.7906560683515625e-06, - "loss": 0.5955, - "step": 27325 - }, - { - "epoch": 0.7, - "learning_rate": 1.7906391265215475e-06, - "loss": 0.7296, - "step": 27326 - }, - { - "epoch": 0.7, - "learning_rate": 1.7906221840861763e-06, - "loss": 0.8018, - "step": 27327 - }, - { - "epoch": 0.7, - "learning_rate": 1.7906052410454627e-06, - "loss": 0.7734, - "step": 27328 - }, - { - "epoch": 0.7, - "learning_rate": 1.7905882973994187e-06, - "loss": 0.7266, - "step": 27329 - }, - { - "epoch": 0.7, - "learning_rate": 1.7905713531480573e-06, - "loss": 0.8672, - "step": 27330 - }, - { - "epoch": 0.7, - "learning_rate": 1.790554408291392e-06, - "loss": 0.7065, - "step": 27331 - }, - { - "epoch": 0.7, - "learning_rate": 1.7905374628294356e-06, - "loss": 0.8643, - "step": 27332 - }, - { - "epoch": 0.7, - "learning_rate": 1.790520516762201e-06, - "loss": 0.7744, - "step": 27333 - }, - { - "epoch": 0.7, - "learning_rate": 1.7905035700897013e-06, - "loss": 0.8105, - "step": 27334 - }, - { - "epoch": 0.7, - "learning_rate": 1.790486622811949e-06, - "loss": 0.8408, - "step": 27335 - }, - { - "epoch": 0.7, - "learning_rate": 1.790469674928958e-06, - "loss": 0.7969, - "step": 27336 - }, - { - "epoch": 0.7, - "learning_rate": 1.7904527264407403e-06, - "loss": 0.8662, - "step": 27337 - }, - { - "epoch": 0.7, - "learning_rate": 1.7904357773473095e-06, - "loss": 0.9121, - "step": 27338 - }, - { - "epoch": 0.7, - "learning_rate": 1.7904188276486782e-06, - "loss": 0.7705, - "step": 27339 - }, - { - "epoch": 0.7, - "learning_rate": 1.7904018773448595e-06, - "loss": 0.8115, - "step": 27340 - }, - { - "epoch": 0.7, - "learning_rate": 1.7903849264358666e-06, - "loss": 0.8203, - "step": 27341 - }, - { - "epoch": 0.7, - "learning_rate": 1.7903679749217122e-06, - "loss": 0.834, - "step": 27342 - }, - { - "epoch": 0.7, - "learning_rate": 1.7903510228024094e-06, - "loss": 0.8818, - "step": 27343 - }, - { - "epoch": 0.7, - "learning_rate": 1.7903340700779712e-06, - "loss": 0.666, - "step": 27344 - }, - { - "epoch": 0.7, - "learning_rate": 1.7903171167484107e-06, - "loss": 0.7451, - "step": 27345 - }, - { - "epoch": 0.7, - "learning_rate": 1.7903001628137403e-06, - "loss": 0.8506, - "step": 27346 - }, - { - "epoch": 0.7, - "learning_rate": 1.7902832082739738e-06, - "loss": 0.8018, - "step": 27347 - }, - { - "epoch": 0.7, - "learning_rate": 1.7902662531291237e-06, - "loss": 0.853, - "step": 27348 - }, - { - "epoch": 0.7, - "learning_rate": 1.790249297379203e-06, - "loss": 0.9219, - "step": 27349 - }, - { - "epoch": 0.7, - "learning_rate": 1.7902323410242249e-06, - "loss": 0.8945, - "step": 27350 - }, - { - "epoch": 0.7, - "learning_rate": 1.790215384064202e-06, - "loss": 0.7402, - "step": 27351 - }, - { - "epoch": 0.7, - "learning_rate": 1.7901984264991477e-06, - "loss": 0.9551, - "step": 27352 - }, - { - "epoch": 0.7, - "learning_rate": 1.7901814683290746e-06, - "loss": 0.7188, - "step": 27353 - }, - { - "epoch": 0.7, - "learning_rate": 1.7901645095539961e-06, - "loss": 1.0889, - "step": 27354 - }, - { - "epoch": 0.7, - "learning_rate": 1.7901475501739248e-06, - "loss": 0.7881, - "step": 27355 - }, - { - "epoch": 0.7, - "learning_rate": 1.7901305901888738e-06, - "loss": 0.7695, - "step": 27356 - }, - { - "epoch": 0.7, - "learning_rate": 1.7901136295988563e-06, - "loss": 0.6953, - "step": 27357 - }, - { - "epoch": 0.7, - "learning_rate": 1.7900966684038852e-06, - "loss": 0.9893, - "step": 27358 - }, - { - "epoch": 0.7, - "learning_rate": 1.790079706603973e-06, - "loss": 0.9053, - "step": 27359 - }, - { - "epoch": 0.7, - "learning_rate": 1.7900627441991336e-06, - "loss": 0.9619, - "step": 27360 - }, - { - "epoch": 0.7, - "learning_rate": 1.7900457811893792e-06, - "loss": 0.9092, - "step": 27361 - }, - { - "epoch": 0.7, - "learning_rate": 1.7900288175747231e-06, - "loss": 0.9082, - "step": 27362 - }, - { - "epoch": 0.7, - "learning_rate": 1.7900118533551782e-06, - "loss": 0.9854, - "step": 27363 - }, - { - "epoch": 0.7, - "learning_rate": 1.789994888530758e-06, - "loss": 0.958, - "step": 27364 - }, - { - "epoch": 0.7, - "learning_rate": 1.7899779231014744e-06, - "loss": 1.165, - "step": 27365 - }, - { - "epoch": 0.7, - "learning_rate": 1.7899609570673416e-06, - "loss": 0.9297, - "step": 27366 - }, - { - "epoch": 0.7, - "learning_rate": 1.7899439904283716e-06, - "loss": 0.7617, - "step": 27367 - }, - { - "epoch": 0.7, - "learning_rate": 1.7899270231845777e-06, - "loss": 0.9082, - "step": 27368 - }, - { - "epoch": 0.7, - "learning_rate": 1.7899100553359735e-06, - "loss": 0.7529, - "step": 27369 - }, - { - "epoch": 0.7, - "learning_rate": 1.789893086882571e-06, - "loss": 0.8584, - "step": 27370 - }, - { - "epoch": 0.7, - "learning_rate": 1.789876117824384e-06, - "loss": 0.752, - "step": 27371 - }, - { - "epoch": 0.7, - "learning_rate": 1.789859148161425e-06, - "loss": 0.9893, - "step": 27372 - }, - { - "epoch": 0.7, - "learning_rate": 1.7898421778937074e-06, - "loss": 0.7354, - "step": 27373 - }, - { - "epoch": 0.7, - "learning_rate": 1.7898252070212439e-06, - "loss": 0.9033, - "step": 27374 - }, - { - "epoch": 0.7, - "learning_rate": 1.7898082355440473e-06, - "loss": 0.709, - "step": 27375 - }, - { - "epoch": 0.7, - "learning_rate": 1.7897912634621312e-06, - "loss": 0.9727, - "step": 27376 - }, - { - "epoch": 0.7, - "learning_rate": 1.789774290775508e-06, - "loss": 0.9053, - "step": 27377 - }, - { - "epoch": 0.7, - "learning_rate": 1.7897573174841912e-06, - "loss": 0.9375, - "step": 27378 - }, - { - "epoch": 0.7, - "learning_rate": 1.7897403435881931e-06, - "loss": 0.8291, - "step": 27379 - }, - { - "epoch": 0.7, - "learning_rate": 1.7897233690875275e-06, - "loss": 0.8164, - "step": 27380 - }, - { - "epoch": 0.7, - "learning_rate": 1.7897063939822071e-06, - "loss": 0.8906, - "step": 27381 - }, - { - "epoch": 0.7, - "learning_rate": 1.7896894182722444e-06, - "loss": 0.7437, - "step": 27382 - }, - { - "epoch": 0.7, - "learning_rate": 1.789672441957653e-06, - "loss": 0.7354, - "step": 27383 - }, - { - "epoch": 0.7, - "learning_rate": 1.7896554650384459e-06, - "loss": 0.8501, - "step": 27384 - }, - { - "epoch": 0.7, - "learning_rate": 1.7896384875146358e-06, - "loss": 0.9336, - "step": 27385 - }, - { - "epoch": 0.7, - "learning_rate": 1.7896215093862358e-06, - "loss": 1.0117, - "step": 27386 - }, - { - "epoch": 0.7, - "learning_rate": 1.789604530653259e-06, - "loss": 0.6309, - "step": 27387 - }, - { - "epoch": 0.7, - "learning_rate": 1.7895875513157184e-06, - "loss": 0.9746, - "step": 27388 - }, - { - "epoch": 0.7, - "learning_rate": 1.7895705713736267e-06, - "loss": 0.9219, - "step": 27389 - }, - { - "epoch": 0.7, - "learning_rate": 1.7895535908269972e-06, - "loss": 0.9258, - "step": 27390 - }, - { - "epoch": 0.7, - "learning_rate": 1.7895366096758426e-06, - "loss": 0.6377, - "step": 27391 - }, - { - "epoch": 0.7, - "learning_rate": 1.7895196279201765e-06, - "loss": 0.875, - "step": 27392 - }, - { - "epoch": 0.7, - "learning_rate": 1.7895026455600113e-06, - "loss": 0.8525, - "step": 27393 - }, - { - "epoch": 0.7, - "learning_rate": 1.7894856625953602e-06, - "loss": 0.7036, - "step": 27394 - }, - { - "epoch": 0.7, - "learning_rate": 1.7894686790262366e-06, - "loss": 0.7915, - "step": 27395 - }, - { - "epoch": 0.7, - "learning_rate": 1.7894516948526529e-06, - "loss": 1.0449, - "step": 27396 - }, - { - "epoch": 0.7, - "learning_rate": 1.789434710074622e-06, - "loss": 0.8213, - "step": 27397 - }, - { - "epoch": 0.7, - "learning_rate": 1.7894177246921575e-06, - "loss": 1.0283, - "step": 27398 - }, - { - "epoch": 0.7, - "learning_rate": 1.7894007387052723e-06, - "loss": 0.9287, - "step": 27399 - }, - { - "epoch": 0.7, - "learning_rate": 1.7893837521139792e-06, - "loss": 0.4854, - "step": 27400 - }, - { - "epoch": 0.7, - "learning_rate": 1.7893667649182912e-06, - "loss": 0.6299, - "step": 27401 - }, - { - "epoch": 0.7, - "learning_rate": 1.7893497771182212e-06, - "loss": 0.998, - "step": 27402 - }, - { - "epoch": 0.7, - "learning_rate": 1.7893327887137825e-06, - "loss": 0.9229, - "step": 27403 - }, - { - "epoch": 0.7, - "learning_rate": 1.789315799704988e-06, - "loss": 0.9224, - "step": 27404 - }, - { - "epoch": 0.7, - "learning_rate": 1.7892988100918509e-06, - "loss": 0.7271, - "step": 27405 - }, - { - "epoch": 0.7, - "learning_rate": 1.7892818198743838e-06, - "loss": 0.8643, - "step": 27406 - }, - { - "epoch": 0.7, - "learning_rate": 1.7892648290525999e-06, - "loss": 0.8262, - "step": 27407 - }, - { - "epoch": 0.7, - "learning_rate": 1.789247837626512e-06, - "loss": 1.083, - "step": 27408 - }, - { - "epoch": 0.7, - "learning_rate": 1.7892308455961337e-06, - "loss": 0.9502, - "step": 27409 - }, - { - "epoch": 0.7, - "learning_rate": 1.7892138529614773e-06, - "loss": 0.9043, - "step": 27410 - }, - { - "epoch": 0.7, - "learning_rate": 1.7891968597225563e-06, - "loss": 0.7822, - "step": 27411 - }, - { - "epoch": 0.7, - "learning_rate": 1.7891798658793835e-06, - "loss": 0.9082, - "step": 27412 - }, - { - "epoch": 0.7, - "learning_rate": 1.789162871431972e-06, - "loss": 0.8145, - "step": 27413 - }, - { - "epoch": 0.7, - "learning_rate": 1.7891458763803349e-06, - "loss": 0.9463, - "step": 27414 - }, - { - "epoch": 0.7, - "learning_rate": 1.7891288807244852e-06, - "loss": 1.0459, - "step": 27415 - }, - { - "epoch": 0.7, - "learning_rate": 1.7891118844644352e-06, - "loss": 0.5898, - "step": 27416 - }, - { - "epoch": 0.7, - "learning_rate": 1.789094887600199e-06, - "loss": 0.6682, - "step": 27417 - }, - { - "epoch": 0.7, - "learning_rate": 1.7890778901317888e-06, - "loss": 0.8623, - "step": 27418 - }, - { - "epoch": 0.7, - "learning_rate": 1.7890608920592186e-06, - "loss": 0.7969, - "step": 27419 - }, - { - "epoch": 0.7, - "learning_rate": 1.7890438933825e-06, - "loss": 1.0156, - "step": 27420 - }, - { - "epoch": 0.7, - "learning_rate": 1.789026894101647e-06, - "loss": 0.792, - "step": 27421 - }, - { - "epoch": 0.7, - "learning_rate": 1.7890098942166728e-06, - "loss": 0.7212, - "step": 27422 - }, - { - "epoch": 0.7, - "learning_rate": 1.7889928937275895e-06, - "loss": 0.8125, - "step": 27423 - }, - { - "epoch": 0.7, - "learning_rate": 1.7889758926344107e-06, - "loss": 0.7812, - "step": 27424 - }, - { - "epoch": 0.7, - "learning_rate": 1.7889588909371495e-06, - "loss": 0.7612, - "step": 27425 - }, - { - "epoch": 0.7, - "learning_rate": 1.7889418886358188e-06, - "loss": 0.8193, - "step": 27426 - }, - { - "epoch": 0.7, - "learning_rate": 1.7889248857304313e-06, - "loss": 0.8325, - "step": 27427 - }, - { - "epoch": 0.7, - "learning_rate": 1.7889078822210006e-06, - "loss": 0.8154, - "step": 27428 - }, - { - "epoch": 0.7, - "learning_rate": 1.7888908781075394e-06, - "loss": 0.7991, - "step": 27429 - }, - { - "epoch": 0.7, - "learning_rate": 1.7888738733900603e-06, - "loss": 0.707, - "step": 27430 - }, - { - "epoch": 0.7, - "learning_rate": 1.7888568680685772e-06, - "loss": 0.8335, - "step": 27431 - }, - { - "epoch": 0.7, - "learning_rate": 1.7888398621431025e-06, - "loss": 0.9531, - "step": 27432 - }, - { - "epoch": 0.7, - "learning_rate": 1.7888228556136493e-06, - "loss": 0.8877, - "step": 27433 - }, - { - "epoch": 0.7, - "learning_rate": 1.7888058484802308e-06, - "loss": 0.8525, - "step": 27434 - }, - { - "epoch": 0.7, - "learning_rate": 1.78878884074286e-06, - "loss": 1.1562, - "step": 27435 - }, - { - "epoch": 0.7, - "learning_rate": 1.78877183240155e-06, - "loss": 0.7383, - "step": 27436 - }, - { - "epoch": 0.7, - "learning_rate": 1.7887548234563132e-06, - "loss": 0.874, - "step": 27437 - }, - { - "epoch": 0.7, - "learning_rate": 1.7887378139071636e-06, - "loss": 0.8877, - "step": 27438 - }, - { - "epoch": 0.7, - "learning_rate": 1.7887208037541135e-06, - "loss": 0.7832, - "step": 27439 - }, - { - "epoch": 0.7, - "learning_rate": 1.788703792997176e-06, - "loss": 0.689, - "step": 27440 - }, - { - "epoch": 0.7, - "learning_rate": 1.7886867816363643e-06, - "loss": 0.8394, - "step": 27441 - }, - { - "epoch": 0.7, - "learning_rate": 1.7886697696716917e-06, - "loss": 0.9355, - "step": 27442 - }, - { - "epoch": 0.7, - "learning_rate": 1.7886527571031707e-06, - "loss": 0.8857, - "step": 27443 - }, - { - "epoch": 0.7, - "learning_rate": 1.7886357439308143e-06, - "loss": 0.749, - "step": 27444 - }, - { - "epoch": 0.7, - "learning_rate": 1.7886187301546363e-06, - "loss": 0.6707, - "step": 27445 - }, - { - "epoch": 0.7, - "learning_rate": 1.788601715774649e-06, - "loss": 1.0137, - "step": 27446 - }, - { - "epoch": 0.7, - "learning_rate": 1.7885847007908654e-06, - "loss": 0.8701, - "step": 27447 - }, - { - "epoch": 0.7, - "learning_rate": 1.788567685203299e-06, - "loss": 0.9277, - "step": 27448 - }, - { - "epoch": 0.7, - "learning_rate": 1.7885506690119624e-06, - "loss": 0.957, - "step": 27449 - }, - { - "epoch": 0.7, - "learning_rate": 1.788533652216869e-06, - "loss": 0.6099, - "step": 27450 - }, - { - "epoch": 0.7, - "learning_rate": 1.7885166348180317e-06, - "loss": 0.8955, - "step": 27451 - }, - { - "epoch": 0.7, - "learning_rate": 1.7884996168154634e-06, - "loss": 0.8555, - "step": 27452 - }, - { - "epoch": 0.7, - "learning_rate": 1.788482598209177e-06, - "loss": 0.8955, - "step": 27453 - }, - { - "epoch": 0.7, - "learning_rate": 1.7884655789991859e-06, - "loss": 0.9941, - "step": 27454 - }, - { - "epoch": 0.7, - "learning_rate": 1.788448559185503e-06, - "loss": 0.9014, - "step": 27455 - }, - { - "epoch": 0.7, - "learning_rate": 1.7884315387681413e-06, - "loss": 0.9824, - "step": 27456 - }, - { - "epoch": 0.7, - "learning_rate": 1.7884145177471135e-06, - "loss": 1.0332, - "step": 27457 - }, - { - "epoch": 0.7, - "learning_rate": 1.7883974961224332e-06, - "loss": 0.7871, - "step": 27458 - }, - { - "epoch": 0.7, - "learning_rate": 1.7883804738941133e-06, - "loss": 0.918, - "step": 27459 - }, - { - "epoch": 0.7, - "learning_rate": 1.7883634510621665e-06, - "loss": 0.875, - "step": 27460 - }, - { - "epoch": 0.7, - "learning_rate": 1.7883464276266062e-06, - "loss": 0.8359, - "step": 27461 - }, - { - "epoch": 0.7, - "learning_rate": 1.7883294035874452e-06, - "loss": 1.043, - "step": 27462 - }, - { - "epoch": 0.7, - "learning_rate": 1.7883123789446968e-06, - "loss": 0.769, - "step": 27463 - }, - { - "epoch": 0.7, - "learning_rate": 1.7882953536983739e-06, - "loss": 0.7314, - "step": 27464 - }, - { - "epoch": 0.7, - "learning_rate": 1.7882783278484891e-06, - "loss": 0.7256, - "step": 27465 - }, - { - "epoch": 0.7, - "learning_rate": 1.788261301395056e-06, - "loss": 0.8174, - "step": 27466 - }, - { - "epoch": 0.7, - "learning_rate": 1.7882442743380875e-06, - "loss": 1.0361, - "step": 27467 - }, - { - "epoch": 0.7, - "learning_rate": 1.7882272466775967e-06, - "loss": 0.9365, - "step": 27468 - }, - { - "epoch": 0.7, - "learning_rate": 1.7882102184135963e-06, - "loss": 0.9185, - "step": 27469 - }, - { - "epoch": 0.7, - "learning_rate": 1.7881931895461e-06, - "loss": 0.9971, - "step": 27470 - }, - { - "epoch": 0.7, - "learning_rate": 1.7881761600751202e-06, - "loss": 0.7358, - "step": 27471 - }, - { - "epoch": 0.7, - "learning_rate": 1.78815913000067e-06, - "loss": 1.0449, - "step": 27472 - }, - { - "epoch": 0.7, - "learning_rate": 1.7881420993227628e-06, - "loss": 0.8008, - "step": 27473 - }, - { - "epoch": 0.7, - "learning_rate": 1.7881250680414112e-06, - "loss": 0.9482, - "step": 27474 - }, - { - "epoch": 0.7, - "learning_rate": 1.7881080361566287e-06, - "loss": 0.7058, - "step": 27475 - }, - { - "epoch": 0.7, - "learning_rate": 1.788091003668428e-06, - "loss": 1.0391, - "step": 27476 - }, - { - "epoch": 0.7, - "learning_rate": 1.7880739705768221e-06, - "loss": 0.8457, - "step": 27477 - }, - { - "epoch": 0.7, - "learning_rate": 1.7880569368818245e-06, - "loss": 0.9473, - "step": 27478 - }, - { - "epoch": 0.7, - "learning_rate": 1.788039902583448e-06, - "loss": 0.8291, - "step": 27479 - }, - { - "epoch": 0.7, - "learning_rate": 1.7880228676817054e-06, - "loss": 0.8633, - "step": 27480 - }, - { - "epoch": 0.7, - "learning_rate": 1.7880058321766098e-06, - "loss": 0.7627, - "step": 27481 - }, - { - "epoch": 0.7, - "learning_rate": 1.7879887960681748e-06, - "loss": 0.9434, - "step": 27482 - }, - { - "epoch": 0.7, - "learning_rate": 1.7879717593564126e-06, - "loss": 0.7212, - "step": 27483 - }, - { - "epoch": 0.7, - "learning_rate": 1.7879547220413368e-06, - "loss": 0.7803, - "step": 27484 - }, - { - "epoch": 0.7, - "learning_rate": 1.7879376841229604e-06, - "loss": 0.9199, - "step": 27485 - }, - { - "epoch": 0.7, - "learning_rate": 1.787920645601296e-06, - "loss": 0.8218, - "step": 27486 - }, - { - "epoch": 0.7, - "learning_rate": 1.7879036064763574e-06, - "loss": 0.7715, - "step": 27487 - }, - { - "epoch": 0.7, - "learning_rate": 1.7878865667481571e-06, - "loss": 0.9736, - "step": 27488 - }, - { - "epoch": 0.7, - "learning_rate": 1.787869526416708e-06, - "loss": 0.7676, - "step": 27489 - }, - { - "epoch": 0.7, - "learning_rate": 1.7878524854820238e-06, - "loss": 1.0156, - "step": 27490 - }, - { - "epoch": 0.7, - "learning_rate": 1.7878354439441169e-06, - "loss": 0.9189, - "step": 27491 - }, - { - "epoch": 0.7, - "learning_rate": 1.7878184018030008e-06, - "loss": 0.8594, - "step": 27492 - }, - { - "epoch": 0.7, - "learning_rate": 1.7878013590586884e-06, - "loss": 0.8701, - "step": 27493 - }, - { - "epoch": 0.7, - "learning_rate": 1.7877843157111924e-06, - "loss": 0.8711, - "step": 27494 - }, - { - "epoch": 0.7, - "learning_rate": 1.7877672717605266e-06, - "loss": 0.8706, - "step": 27495 - }, - { - "epoch": 0.7, - "learning_rate": 1.7877502272067036e-06, - "loss": 0.8936, - "step": 27496 - }, - { - "epoch": 0.7, - "learning_rate": 1.7877331820497364e-06, - "loss": 0.9932, - "step": 27497 - }, - { - "epoch": 0.7, - "learning_rate": 1.7877161362896378e-06, - "loss": 0.6533, - "step": 27498 - }, - { - "epoch": 0.7, - "learning_rate": 1.7876990899264216e-06, - "loss": 1.0195, - "step": 27499 - }, - { - "epoch": 0.7, - "learning_rate": 1.7876820429601003e-06, - "loss": 0.8896, - "step": 27500 - }, - { - "epoch": 0.7, - "learning_rate": 1.787664995390687e-06, - "loss": 0.8018, - "step": 27501 - }, - { - "epoch": 0.7, - "learning_rate": 1.7876479472181946e-06, - "loss": 0.7197, - "step": 27502 - }, - { - "epoch": 0.7, - "learning_rate": 1.7876308984426369e-06, - "loss": 0.998, - "step": 27503 - }, - { - "epoch": 0.7, - "learning_rate": 1.787613849064026e-06, - "loss": 0.9121, - "step": 27504 - }, - { - "epoch": 0.7, - "learning_rate": 1.7875967990823758e-06, - "loss": 0.9346, - "step": 27505 - }, - { - "epoch": 0.7, - "learning_rate": 1.7875797484976986e-06, - "loss": 0.7842, - "step": 27506 - }, - { - "epoch": 0.71, - "learning_rate": 1.787562697310008e-06, - "loss": 0.834, - "step": 27507 - }, - { - "epoch": 0.71, - "learning_rate": 1.7875456455193167e-06, - "loss": 1.0049, - "step": 27508 - }, - { - "epoch": 0.71, - "learning_rate": 1.7875285931256382e-06, - "loss": 0.6953, - "step": 27509 - }, - { - "epoch": 0.71, - "learning_rate": 1.7875115401289849e-06, - "loss": 1.0049, - "step": 27510 - }, - { - "epoch": 0.71, - "learning_rate": 1.7874944865293703e-06, - "loss": 0.9014, - "step": 27511 - }, - { - "epoch": 0.71, - "learning_rate": 1.7874774323268077e-06, - "loss": 0.8789, - "step": 27512 - }, - { - "epoch": 0.71, - "learning_rate": 1.7874603775213096e-06, - "loss": 0.7637, - "step": 27513 - }, - { - "epoch": 0.71, - "learning_rate": 1.7874433221128892e-06, - "loss": 0.5981, - "step": 27514 - }, - { - "epoch": 0.71, - "learning_rate": 1.7874262661015597e-06, - "loss": 0.8857, - "step": 27515 - }, - { - "epoch": 0.71, - "learning_rate": 1.7874092094873343e-06, - "loss": 0.9199, - "step": 27516 - }, - { - "epoch": 0.71, - "learning_rate": 1.7873921522702257e-06, - "loss": 0.9473, - "step": 27517 - }, - { - "epoch": 0.71, - "learning_rate": 1.787375094450247e-06, - "loss": 0.8818, - "step": 27518 - }, - { - "epoch": 0.71, - "learning_rate": 1.7873580360274117e-06, - "loss": 0.8486, - "step": 27519 - }, - { - "epoch": 0.71, - "learning_rate": 1.7873409770017325e-06, - "loss": 0.6167, - "step": 27520 - }, - { - "epoch": 0.71, - "learning_rate": 1.7873239173732225e-06, - "loss": 0.8525, - "step": 27521 - }, - { - "epoch": 0.71, - "learning_rate": 1.7873068571418946e-06, - "loss": 0.917, - "step": 27522 - }, - { - "epoch": 0.71, - "learning_rate": 1.7872897963077623e-06, - "loss": 0.8887, - "step": 27523 - }, - { - "epoch": 0.71, - "learning_rate": 1.787272734870838e-06, - "loss": 0.9775, - "step": 27524 - }, - { - "epoch": 0.71, - "learning_rate": 1.7872556728311356e-06, - "loss": 0.999, - "step": 27525 - }, - { - "epoch": 0.71, - "learning_rate": 1.7872386101886676e-06, - "loss": 0.8682, - "step": 27526 - }, - { - "epoch": 0.71, - "learning_rate": 1.7872215469434471e-06, - "loss": 0.7314, - "step": 27527 - }, - { - "epoch": 0.71, - "learning_rate": 1.7872044830954876e-06, - "loss": 1.0566, - "step": 27528 - }, - { - "epoch": 0.71, - "learning_rate": 1.7871874186448012e-06, - "loss": 0.8604, - "step": 27529 - }, - { - "epoch": 0.71, - "learning_rate": 1.787170353591402e-06, - "loss": 0.7544, - "step": 27530 - }, - { - "epoch": 0.71, - "learning_rate": 1.7871532879353025e-06, - "loss": 0.9482, - "step": 27531 - }, - { - "epoch": 0.71, - "learning_rate": 1.7871362216765161e-06, - "loss": 0.7378, - "step": 27532 - }, - { - "epoch": 0.71, - "learning_rate": 1.7871191548150558e-06, - "loss": 1.0215, - "step": 27533 - }, - { - "epoch": 0.71, - "learning_rate": 1.7871020873509343e-06, - "loss": 1.2529, - "step": 27534 - }, - { - "epoch": 0.71, - "learning_rate": 1.787085019284165e-06, - "loss": 0.7285, - "step": 27535 - }, - { - "epoch": 0.71, - "learning_rate": 1.7870679506147608e-06, - "loss": 0.8975, - "step": 27536 - }, - { - "epoch": 0.71, - "learning_rate": 1.787050881342735e-06, - "loss": 0.8633, - "step": 27537 - }, - { - "epoch": 0.71, - "learning_rate": 1.7870338114681002e-06, - "loss": 0.7295, - "step": 27538 - }, - { - "epoch": 0.71, - "learning_rate": 1.7870167409908703e-06, - "loss": 0.7334, - "step": 27539 - }, - { - "epoch": 0.71, - "learning_rate": 1.7869996699110574e-06, - "loss": 0.9062, - "step": 27540 - }, - { - "epoch": 0.71, - "learning_rate": 1.7869825982286754e-06, - "loss": 0.6338, - "step": 27541 - }, - { - "epoch": 0.71, - "learning_rate": 1.7869655259437368e-06, - "loss": 0.9805, - "step": 27542 - }, - { - "epoch": 0.71, - "learning_rate": 1.7869484530562552e-06, - "loss": 1.0732, - "step": 27543 - }, - { - "epoch": 0.71, - "learning_rate": 1.7869313795662428e-06, - "loss": 0.9004, - "step": 27544 - }, - { - "epoch": 0.71, - "learning_rate": 1.7869143054737137e-06, - "loss": 1.0244, - "step": 27545 - }, - { - "epoch": 0.71, - "learning_rate": 1.7868972307786803e-06, - "loss": 0.9619, - "step": 27546 - }, - { - "epoch": 0.71, - "learning_rate": 1.7868801554811561e-06, - "loss": 0.8936, - "step": 27547 - }, - { - "epoch": 0.71, - "learning_rate": 1.7868630795811538e-06, - "loss": 0.8193, - "step": 27548 - }, - { - "epoch": 0.71, - "learning_rate": 1.7868460030786865e-06, - "loss": 1.0352, - "step": 27549 - }, - { - "epoch": 0.71, - "learning_rate": 1.7868289259737675e-06, - "loss": 0.6919, - "step": 27550 - }, - { - "epoch": 0.71, - "learning_rate": 1.7868118482664096e-06, - "loss": 0.9541, - "step": 27551 - }, - { - "epoch": 0.71, - "learning_rate": 1.7867947699566263e-06, - "loss": 0.8818, - "step": 27552 - }, - { - "epoch": 0.71, - "learning_rate": 1.7867776910444303e-06, - "loss": 0.8486, - "step": 27553 - }, - { - "epoch": 0.71, - "learning_rate": 1.7867606115298347e-06, - "loss": 0.5787, - "step": 27554 - }, - { - "epoch": 0.71, - "learning_rate": 1.786743531412853e-06, - "loss": 1.041, - "step": 27555 - }, - { - "epoch": 0.71, - "learning_rate": 1.7867264506934978e-06, - "loss": 0.9707, - "step": 27556 - }, - { - "epoch": 0.71, - "learning_rate": 1.786709369371782e-06, - "loss": 0.8135, - "step": 27557 - }, - { - "epoch": 0.71, - "learning_rate": 1.7866922874477194e-06, - "loss": 0.8564, - "step": 27558 - }, - { - "epoch": 0.71, - "learning_rate": 1.7866752049213226e-06, - "loss": 0.5417, - "step": 27559 - }, - { - "epoch": 0.71, - "learning_rate": 1.786658121792605e-06, - "loss": 0.9492, - "step": 27560 - }, - { - "epoch": 0.71, - "learning_rate": 1.786641038061579e-06, - "loss": 0.8994, - "step": 27561 - }, - { - "epoch": 0.71, - "learning_rate": 1.7866239537282583e-06, - "loss": 0.7278, - "step": 27562 - }, - { - "epoch": 0.71, - "learning_rate": 1.7866068687926559e-06, - "loss": 0.752, - "step": 27563 - }, - { - "epoch": 0.71, - "learning_rate": 1.7865897832547846e-06, - "loss": 0.7866, - "step": 27564 - }, - { - "epoch": 0.71, - "learning_rate": 1.786572697114658e-06, - "loss": 0.8125, - "step": 27565 - }, - { - "epoch": 0.71, - "learning_rate": 1.7865556103722884e-06, - "loss": 1.0068, - "step": 27566 - }, - { - "epoch": 0.71, - "learning_rate": 1.7865385230276898e-06, - "loss": 0.9717, - "step": 27567 - }, - { - "epoch": 0.71, - "learning_rate": 1.7865214350808744e-06, - "loss": 0.6672, - "step": 27568 - }, - { - "epoch": 0.71, - "learning_rate": 1.7865043465318559e-06, - "loss": 0.8379, - "step": 27569 - }, - { - "epoch": 0.71, - "learning_rate": 1.7864872573806473e-06, - "loss": 0.8657, - "step": 27570 - }, - { - "epoch": 0.71, - "learning_rate": 1.7864701676272614e-06, - "loss": 0.8115, - "step": 27571 - }, - { - "epoch": 0.71, - "learning_rate": 1.7864530772717116e-06, - "loss": 0.9541, - "step": 27572 - }, - { - "epoch": 0.71, - "learning_rate": 1.7864359863140108e-06, - "loss": 0.9268, - "step": 27573 - }, - { - "epoch": 0.71, - "learning_rate": 1.7864188947541718e-06, - "loss": 1.0039, - "step": 27574 - }, - { - "epoch": 0.71, - "learning_rate": 1.7864018025922085e-06, - "loss": 0.7871, - "step": 27575 - }, - { - "epoch": 0.71, - "learning_rate": 1.7863847098281332e-06, - "loss": 0.9395, - "step": 27576 - }, - { - "epoch": 0.71, - "learning_rate": 1.7863676164619595e-06, - "loss": 1.0283, - "step": 27577 - }, - { - "epoch": 0.71, - "learning_rate": 1.7863505224937002e-06, - "loss": 0.8457, - "step": 27578 - }, - { - "epoch": 0.71, - "learning_rate": 1.7863334279233684e-06, - "loss": 0.7881, - "step": 27579 - }, - { - "epoch": 0.71, - "learning_rate": 1.7863163327509772e-06, - "loss": 0.9785, - "step": 27580 - }, - { - "epoch": 0.71, - "learning_rate": 1.7862992369765398e-06, - "loss": 0.96, - "step": 27581 - }, - { - "epoch": 0.71, - "learning_rate": 1.7862821406000692e-06, - "loss": 1.0166, - "step": 27582 - }, - { - "epoch": 0.71, - "learning_rate": 1.7862650436215785e-06, - "loss": 0.7046, - "step": 27583 - }, - { - "epoch": 0.71, - "learning_rate": 1.786247946041081e-06, - "loss": 0.7686, - "step": 27584 - }, - { - "epoch": 0.71, - "learning_rate": 1.7862308478585894e-06, - "loss": 0.8789, - "step": 27585 - }, - { - "epoch": 0.71, - "learning_rate": 1.786213749074117e-06, - "loss": 0.7148, - "step": 27586 - }, - { - "epoch": 0.71, - "learning_rate": 1.786196649687677e-06, - "loss": 0.8018, - "step": 27587 - }, - { - "epoch": 0.71, - "learning_rate": 1.7861795496992824e-06, - "loss": 0.834, - "step": 27588 - }, - { - "epoch": 0.71, - "learning_rate": 1.786162449108946e-06, - "loss": 0.7725, - "step": 27589 - }, - { - "epoch": 0.71, - "learning_rate": 1.7861453479166815e-06, - "loss": 0.9834, - "step": 27590 - }, - { - "epoch": 0.71, - "learning_rate": 1.7861282461225016e-06, - "loss": 0.9395, - "step": 27591 - }, - { - "epoch": 0.71, - "learning_rate": 1.786111143726419e-06, - "loss": 0.6536, - "step": 27592 - }, - { - "epoch": 0.71, - "learning_rate": 1.786094040728448e-06, - "loss": 1.082, - "step": 27593 - }, - { - "epoch": 0.71, - "learning_rate": 1.7860769371286004e-06, - "loss": 0.9756, - "step": 27594 - }, - { - "epoch": 0.71, - "learning_rate": 1.7860598329268899e-06, - "loss": 0.7156, - "step": 27595 - }, - { - "epoch": 0.71, - "learning_rate": 1.7860427281233296e-06, - "loss": 0.9941, - "step": 27596 - }, - { - "epoch": 0.71, - "learning_rate": 1.7860256227179328e-06, - "loss": 0.7356, - "step": 27597 - }, - { - "epoch": 0.71, - "learning_rate": 1.7860085167107118e-06, - "loss": 0.7734, - "step": 27598 - }, - { - "epoch": 0.71, - "learning_rate": 1.7859914101016807e-06, - "loss": 0.9512, - "step": 27599 - }, - { - "epoch": 0.71, - "learning_rate": 1.7859743028908515e-06, - "loss": 0.8086, - "step": 27600 - }, - { - "epoch": 0.71, - "learning_rate": 1.7859571950782387e-06, - "loss": 0.6318, - "step": 27601 - }, - { - "epoch": 0.71, - "learning_rate": 1.7859400866638539e-06, - "loss": 0.8081, - "step": 27602 - }, - { - "epoch": 0.71, - "learning_rate": 1.7859229776477114e-06, - "loss": 0.7959, - "step": 27603 - }, - { - "epoch": 0.71, - "learning_rate": 1.7859058680298236e-06, - "loss": 0.8823, - "step": 27604 - }, - { - "epoch": 0.71, - "learning_rate": 1.7858887578102039e-06, - "loss": 0.6436, - "step": 27605 - }, - { - "epoch": 0.71, - "learning_rate": 1.7858716469888652e-06, - "loss": 0.9229, - "step": 27606 - }, - { - "epoch": 0.71, - "learning_rate": 1.7858545355658208e-06, - "loss": 0.6953, - "step": 27607 - }, - { - "epoch": 0.71, - "learning_rate": 1.7858374235410838e-06, - "loss": 0.998, - "step": 27608 - }, - { - "epoch": 0.71, - "learning_rate": 1.785820310914667e-06, - "loss": 0.9541, - "step": 27609 - }, - { - "epoch": 0.71, - "learning_rate": 1.785803197686584e-06, - "loss": 0.8936, - "step": 27610 - }, - { - "epoch": 0.71, - "learning_rate": 1.7857860838568474e-06, - "loss": 0.9443, - "step": 27611 - }, - { - "epoch": 0.71, - "learning_rate": 1.7857689694254705e-06, - "loss": 1.002, - "step": 27612 - }, - { - "epoch": 0.71, - "learning_rate": 1.7857518543924665e-06, - "loss": 0.7119, - "step": 27613 - }, - { - "epoch": 0.71, - "learning_rate": 1.7857347387578486e-06, - "loss": 0.605, - "step": 27614 - }, - { - "epoch": 0.71, - "learning_rate": 1.7857176225216294e-06, - "loss": 0.71, - "step": 27615 - }, - { - "epoch": 0.71, - "learning_rate": 1.7857005056838226e-06, - "loss": 1.0029, - "step": 27616 - }, - { - "epoch": 0.71, - "learning_rate": 1.785683388244441e-06, - "loss": 0.5664, - "step": 27617 - }, - { - "epoch": 0.71, - "learning_rate": 1.7856662702034977e-06, - "loss": 0.4883, - "step": 27618 - }, - { - "epoch": 0.71, - "learning_rate": 1.7856491515610062e-06, - "loss": 0.9111, - "step": 27619 - }, - { - "epoch": 0.71, - "learning_rate": 1.7856320323169788e-06, - "loss": 0.6033, - "step": 27620 - }, - { - "epoch": 0.71, - "learning_rate": 1.7856149124714293e-06, - "loss": 0.915, - "step": 27621 - }, - { - "epoch": 0.71, - "learning_rate": 1.7855977920243706e-06, - "loss": 0.6858, - "step": 27622 - }, - { - "epoch": 0.71, - "learning_rate": 1.7855806709758157e-06, - "loss": 0.6384, - "step": 27623 - }, - { - "epoch": 0.71, - "learning_rate": 1.7855635493257779e-06, - "loss": 0.6865, - "step": 27624 - }, - { - "epoch": 0.71, - "learning_rate": 1.7855464270742702e-06, - "loss": 0.9414, - "step": 27625 - }, - { - "epoch": 0.71, - "learning_rate": 1.7855293042213052e-06, - "loss": 0.7949, - "step": 27626 - }, - { - "epoch": 0.71, - "learning_rate": 1.7855121807668973e-06, - "loss": 0.8301, - "step": 27627 - }, - { - "epoch": 0.71, - "learning_rate": 1.7854950567110585e-06, - "loss": 0.874, - "step": 27628 - }, - { - "epoch": 0.71, - "learning_rate": 1.7854779320538024e-06, - "loss": 0.8481, - "step": 27629 - }, - { - "epoch": 0.71, - "learning_rate": 1.7854608067951418e-06, - "loss": 0.8223, - "step": 27630 - }, - { - "epoch": 0.71, - "learning_rate": 1.78544368093509e-06, - "loss": 0.8433, - "step": 27631 - }, - { - "epoch": 0.71, - "learning_rate": 1.7854265544736603e-06, - "loss": 0.9697, - "step": 27632 - }, - { - "epoch": 0.71, - "learning_rate": 1.7854094274108653e-06, - "loss": 0.8813, - "step": 27633 - }, - { - "epoch": 0.71, - "learning_rate": 1.7853922997467186e-06, - "loss": 0.9248, - "step": 27634 - }, - { - "epoch": 0.71, - "learning_rate": 1.785375171481233e-06, - "loss": 1.0029, - "step": 27635 - }, - { - "epoch": 0.71, - "learning_rate": 1.785358042614422e-06, - "loss": 0.9316, - "step": 27636 - }, - { - "epoch": 0.71, - "learning_rate": 1.7853409131462982e-06, - "loss": 0.707, - "step": 27637 - }, - { - "epoch": 0.71, - "learning_rate": 1.785323783076875e-06, - "loss": 0.8721, - "step": 27638 - }, - { - "epoch": 0.71, - "learning_rate": 1.7853066524061655e-06, - "loss": 0.9785, - "step": 27639 - }, - { - "epoch": 0.71, - "learning_rate": 1.785289521134183e-06, - "loss": 0.9609, - "step": 27640 - }, - { - "epoch": 0.71, - "learning_rate": 1.7852723892609403e-06, - "loss": 0.8262, - "step": 27641 - }, - { - "epoch": 0.71, - "learning_rate": 1.7852552567864506e-06, - "loss": 0.8262, - "step": 27642 - }, - { - "epoch": 0.71, - "learning_rate": 1.7852381237107271e-06, - "loss": 0.7773, - "step": 27643 - }, - { - "epoch": 0.71, - "learning_rate": 1.7852209900337826e-06, - "loss": 0.9248, - "step": 27644 - }, - { - "epoch": 0.71, - "learning_rate": 1.7852038557556309e-06, - "loss": 0.8545, - "step": 27645 - }, - { - "epoch": 0.71, - "learning_rate": 1.7851867208762846e-06, - "loss": 0.8398, - "step": 27646 - }, - { - "epoch": 0.71, - "learning_rate": 1.7851695853957568e-06, - "loss": 0.7506, - "step": 27647 - }, - { - "epoch": 0.71, - "learning_rate": 1.7851524493140606e-06, - "loss": 1.0098, - "step": 27648 - }, - { - "epoch": 0.71, - "learning_rate": 1.7851353126312096e-06, - "loss": 0.9844, - "step": 27649 - }, - { - "epoch": 0.71, - "learning_rate": 1.7851181753472164e-06, - "loss": 0.8604, - "step": 27650 - }, - { - "epoch": 0.71, - "learning_rate": 1.7851010374620947e-06, - "loss": 0.8633, - "step": 27651 - }, - { - "epoch": 0.71, - "learning_rate": 1.785083898975857e-06, - "loss": 1.0576, - "step": 27652 - }, - { - "epoch": 0.71, - "learning_rate": 1.7850667598885165e-06, - "loss": 0.9258, - "step": 27653 - }, - { - "epoch": 0.71, - "learning_rate": 1.7850496202000866e-06, - "loss": 0.9639, - "step": 27654 - }, - { - "epoch": 0.71, - "learning_rate": 1.7850324799105804e-06, - "loss": 0.7832, - "step": 27655 - }, - { - "epoch": 0.71, - "learning_rate": 1.7850153390200106e-06, - "loss": 1.0742, - "step": 27656 - }, - { - "epoch": 0.71, - "learning_rate": 1.784998197528391e-06, - "loss": 0.8994, - "step": 27657 - }, - { - "epoch": 0.71, - "learning_rate": 1.7849810554357343e-06, - "loss": 0.9141, - "step": 27658 - }, - { - "epoch": 0.71, - "learning_rate": 1.7849639127420534e-06, - "loss": 0.9502, - "step": 27659 - }, - { - "epoch": 0.71, - "learning_rate": 1.7849467694473621e-06, - "loss": 0.8301, - "step": 27660 - }, - { - "epoch": 0.71, - "learning_rate": 1.784929625551673e-06, - "loss": 0.7734, - "step": 27661 - }, - { - "epoch": 0.71, - "learning_rate": 1.7849124810549995e-06, - "loss": 0.9609, - "step": 27662 - }, - { - "epoch": 0.71, - "learning_rate": 1.7848953359573545e-06, - "loss": 1.0381, - "step": 27663 - }, - { - "epoch": 0.71, - "learning_rate": 1.7848781902587511e-06, - "loss": 1.0742, - "step": 27664 - }, - { - "epoch": 0.71, - "learning_rate": 1.7848610439592026e-06, - "loss": 0.5249, - "step": 27665 - }, - { - "epoch": 0.71, - "learning_rate": 1.7848438970587222e-06, - "loss": 0.7588, - "step": 27666 - }, - { - "epoch": 0.71, - "learning_rate": 1.784826749557323e-06, - "loss": 0.7747, - "step": 27667 - }, - { - "epoch": 0.71, - "learning_rate": 1.7848096014550179e-06, - "loss": 0.6714, - "step": 27668 - }, - { - "epoch": 0.71, - "learning_rate": 1.7847924527518203e-06, - "loss": 0.8477, - "step": 27669 - }, - { - "epoch": 0.71, - "learning_rate": 1.784775303447743e-06, - "loss": 0.7471, - "step": 27670 - }, - { - "epoch": 0.71, - "learning_rate": 1.7847581535427994e-06, - "loss": 0.9395, - "step": 27671 - }, - { - "epoch": 0.71, - "learning_rate": 1.7847410030370027e-06, - "loss": 0.7646, - "step": 27672 - }, - { - "epoch": 0.71, - "learning_rate": 1.7847238519303658e-06, - "loss": 0.6123, - "step": 27673 - }, - { - "epoch": 0.71, - "learning_rate": 1.784706700222902e-06, - "loss": 1.1836, - "step": 27674 - }, - { - "epoch": 0.71, - "learning_rate": 1.7846895479146242e-06, - "loss": 0.9229, - "step": 27675 - }, - { - "epoch": 0.71, - "learning_rate": 1.7846723950055457e-06, - "loss": 0.8281, - "step": 27676 - }, - { - "epoch": 0.71, - "learning_rate": 1.7846552414956799e-06, - "loss": 0.9541, - "step": 27677 - }, - { - "epoch": 0.71, - "learning_rate": 1.7846380873850396e-06, - "loss": 0.9141, - "step": 27678 - }, - { - "epoch": 0.71, - "learning_rate": 1.7846209326736376e-06, - "loss": 0.8125, - "step": 27679 - }, - { - "epoch": 0.71, - "learning_rate": 1.784603777361488e-06, - "loss": 0.8633, - "step": 27680 - }, - { - "epoch": 0.71, - "learning_rate": 1.784586621448603e-06, - "loss": 0.7764, - "step": 27681 - }, - { - "epoch": 0.71, - "learning_rate": 1.784569464934996e-06, - "loss": 0.9873, - "step": 27682 - }, - { - "epoch": 0.71, - "learning_rate": 1.7845523078206806e-06, - "loss": 0.9707, - "step": 27683 - }, - { - "epoch": 0.71, - "learning_rate": 1.7845351501056693e-06, - "loss": 0.73, - "step": 27684 - }, - { - "epoch": 0.71, - "learning_rate": 1.7845179917899755e-06, - "loss": 0.9961, - "step": 27685 - }, - { - "epoch": 0.71, - "learning_rate": 1.7845008328736127e-06, - "loss": 1.0127, - "step": 27686 - }, - { - "epoch": 0.71, - "learning_rate": 1.7844836733565932e-06, - "loss": 0.6528, - "step": 27687 - }, - { - "epoch": 0.71, - "learning_rate": 1.7844665132389308e-06, - "loss": 0.7573, - "step": 27688 - }, - { - "epoch": 0.71, - "learning_rate": 1.7844493525206389e-06, - "loss": 0.8408, - "step": 27689 - }, - { - "epoch": 0.71, - "learning_rate": 1.7844321912017296e-06, - "loss": 0.8945, - "step": 27690 - }, - { - "epoch": 0.71, - "learning_rate": 1.7844150292822168e-06, - "loss": 0.8906, - "step": 27691 - }, - { - "epoch": 0.71, - "learning_rate": 1.7843978667621136e-06, - "loss": 0.771, - "step": 27692 - }, - { - "epoch": 0.71, - "learning_rate": 1.7843807036414329e-06, - "loss": 0.8789, - "step": 27693 - }, - { - "epoch": 0.71, - "learning_rate": 1.784363539920188e-06, - "loss": 0.9492, - "step": 27694 - }, - { - "epoch": 0.71, - "learning_rate": 1.7843463755983921e-06, - "loss": 1.1133, - "step": 27695 - }, - { - "epoch": 0.71, - "learning_rate": 1.7843292106760582e-06, - "loss": 0.7407, - "step": 27696 - }, - { - "epoch": 0.71, - "learning_rate": 1.7843120451531994e-06, - "loss": 0.9531, - "step": 27697 - }, - { - "epoch": 0.71, - "learning_rate": 1.7842948790298289e-06, - "loss": 0.8184, - "step": 27698 - }, - { - "epoch": 0.71, - "learning_rate": 1.78427771230596e-06, - "loss": 0.7793, - "step": 27699 - }, - { - "epoch": 0.71, - "learning_rate": 1.7842605449816058e-06, - "loss": 0.9023, - "step": 27700 - }, - { - "epoch": 0.71, - "learning_rate": 1.784243377056779e-06, - "loss": 0.7363, - "step": 27701 - }, - { - "epoch": 0.71, - "learning_rate": 1.7842262085314937e-06, - "loss": 0.9521, - "step": 27702 - }, - { - "epoch": 0.71, - "learning_rate": 1.7842090394057619e-06, - "loss": 0.9717, - "step": 27703 - }, - { - "epoch": 0.71, - "learning_rate": 1.7841918696795975e-06, - "loss": 0.8887, - "step": 27704 - }, - { - "epoch": 0.71, - "learning_rate": 1.7841746993530133e-06, - "loss": 0.7773, - "step": 27705 - }, - { - "epoch": 0.71, - "learning_rate": 1.784157528426023e-06, - "loss": 0.7461, - "step": 27706 - }, - { - "epoch": 0.71, - "learning_rate": 1.784140356898639e-06, - "loss": 0.6714, - "step": 27707 - }, - { - "epoch": 0.71, - "learning_rate": 1.7841231847708745e-06, - "loss": 0.8379, - "step": 27708 - }, - { - "epoch": 0.71, - "learning_rate": 1.7841060120427436e-06, - "loss": 1.0029, - "step": 27709 - }, - { - "epoch": 0.71, - "learning_rate": 1.7840888387142586e-06, - "loss": 0.6686, - "step": 27710 - }, - { - "epoch": 0.71, - "learning_rate": 1.7840716647854324e-06, - "loss": 0.9512, - "step": 27711 - }, - { - "epoch": 0.71, - "learning_rate": 1.7840544902562788e-06, - "loss": 0.957, - "step": 27712 - }, - { - "epoch": 0.71, - "learning_rate": 1.784037315126811e-06, - "loss": 0.9561, - "step": 27713 - }, - { - "epoch": 0.71, - "learning_rate": 1.7840201393970417e-06, - "loss": 0.4406, - "step": 27714 - }, - { - "epoch": 0.71, - "learning_rate": 1.7840029630669843e-06, - "loss": 0.7329, - "step": 27715 - }, - { - "epoch": 0.71, - "learning_rate": 1.7839857861366517e-06, - "loss": 0.7246, - "step": 27716 - }, - { - "epoch": 0.71, - "learning_rate": 1.7839686086060572e-06, - "loss": 1.1064, - "step": 27717 - }, - { - "epoch": 0.71, - "learning_rate": 1.783951430475214e-06, - "loss": 0.7715, - "step": 27718 - }, - { - "epoch": 0.71, - "learning_rate": 1.7839342517441356e-06, - "loss": 0.7461, - "step": 27719 - }, - { - "epoch": 0.71, - "learning_rate": 1.7839170724128346e-06, - "loss": 1.0, - "step": 27720 - }, - { - "epoch": 0.71, - "learning_rate": 1.7838998924813242e-06, - "loss": 0.7529, - "step": 27721 - }, - { - "epoch": 0.71, - "learning_rate": 1.7838827119496176e-06, - "loss": 0.7292, - "step": 27722 - }, - { - "epoch": 0.71, - "learning_rate": 1.7838655308177284e-06, - "loss": 0.7715, - "step": 27723 - }, - { - "epoch": 0.71, - "learning_rate": 1.783848349085669e-06, - "loss": 0.9346, - "step": 27724 - }, - { - "epoch": 0.71, - "learning_rate": 1.7838311667534533e-06, - "loss": 0.8755, - "step": 27725 - }, - { - "epoch": 0.71, - "learning_rate": 1.7838139838210942e-06, - "loss": 0.6641, - "step": 27726 - }, - { - "epoch": 0.71, - "learning_rate": 1.7837968002886043e-06, - "loss": 0.8096, - "step": 27727 - }, - { - "epoch": 0.71, - "learning_rate": 1.7837796161559978e-06, - "loss": 0.6729, - "step": 27728 - }, - { - "epoch": 0.71, - "learning_rate": 1.7837624314232869e-06, - "loss": 1.0293, - "step": 27729 - }, - { - "epoch": 0.71, - "learning_rate": 1.7837452460904851e-06, - "loss": 0.9814, - "step": 27730 - }, - { - "epoch": 0.71, - "learning_rate": 1.7837280601576058e-06, - "loss": 0.9648, - "step": 27731 - }, - { - "epoch": 0.71, - "learning_rate": 1.783710873624662e-06, - "loss": 0.8186, - "step": 27732 - }, - { - "epoch": 0.71, - "learning_rate": 1.7836936864916666e-06, - "loss": 0.6187, - "step": 27733 - }, - { - "epoch": 0.71, - "learning_rate": 1.7836764987586333e-06, - "loss": 0.6562, - "step": 27734 - }, - { - "epoch": 0.71, - "learning_rate": 1.7836593104255745e-06, - "loss": 0.9609, - "step": 27735 - }, - { - "epoch": 0.71, - "learning_rate": 1.783642121492504e-06, - "loss": 1.1172, - "step": 27736 - }, - { - "epoch": 0.71, - "learning_rate": 1.783624931959435e-06, - "loss": 0.9023, - "step": 27737 - }, - { - "epoch": 0.71, - "learning_rate": 1.7836077418263801e-06, - "loss": 0.9082, - "step": 27738 - }, - { - "epoch": 0.71, - "learning_rate": 1.7835905510933529e-06, - "loss": 1.0371, - "step": 27739 - }, - { - "epoch": 0.71, - "learning_rate": 1.7835733597603664e-06, - "loss": 0.8428, - "step": 27740 - }, - { - "epoch": 0.71, - "learning_rate": 1.783556167827434e-06, - "loss": 0.957, - "step": 27741 - }, - { - "epoch": 0.71, - "learning_rate": 1.7835389752945686e-06, - "loss": 0.7676, - "step": 27742 - }, - { - "epoch": 0.71, - "learning_rate": 1.7835217821617833e-06, - "loss": 0.957, - "step": 27743 - }, - { - "epoch": 0.71, - "learning_rate": 1.7835045884290913e-06, - "loss": 0.8047, - "step": 27744 - }, - { - "epoch": 0.71, - "learning_rate": 1.783487394096506e-06, - "loss": 0.7808, - "step": 27745 - }, - { - "epoch": 0.71, - "learning_rate": 1.7834701991640406e-06, - "loss": 1.0186, - "step": 27746 - }, - { - "epoch": 0.71, - "learning_rate": 1.7834530036317079e-06, - "loss": 0.8535, - "step": 27747 - }, - { - "epoch": 0.71, - "learning_rate": 1.7834358074995213e-06, - "loss": 0.7671, - "step": 27748 - }, - { - "epoch": 0.71, - "learning_rate": 1.783418610767494e-06, - "loss": 0.877, - "step": 27749 - }, - { - "epoch": 0.71, - "learning_rate": 1.783401413435639e-06, - "loss": 0.7275, - "step": 27750 - }, - { - "epoch": 0.71, - "learning_rate": 1.7833842155039695e-06, - "loss": 1.0195, - "step": 27751 - }, - { - "epoch": 0.71, - "learning_rate": 1.783367016972499e-06, - "loss": 0.7446, - "step": 27752 - }, - { - "epoch": 0.71, - "learning_rate": 1.7833498178412402e-06, - "loss": 0.8994, - "step": 27753 - }, - { - "epoch": 0.71, - "learning_rate": 1.7833326181102067e-06, - "loss": 0.9678, - "step": 27754 - }, - { - "epoch": 0.71, - "learning_rate": 1.783315417779411e-06, - "loss": 0.9238, - "step": 27755 - }, - { - "epoch": 0.71, - "learning_rate": 1.7832982168488668e-06, - "loss": 0.9258, - "step": 27756 - }, - { - "epoch": 0.71, - "learning_rate": 1.7832810153185873e-06, - "loss": 0.8115, - "step": 27757 - }, - { - "epoch": 0.71, - "learning_rate": 1.7832638131885856e-06, - "loss": 1.0117, - "step": 27758 - }, - { - "epoch": 0.71, - "learning_rate": 1.7832466104588746e-06, - "loss": 0.6506, - "step": 27759 - }, - { - "epoch": 0.71, - "learning_rate": 1.7832294071294677e-06, - "loss": 0.8223, - "step": 27760 - }, - { - "epoch": 0.71, - "learning_rate": 1.7832122032003784e-06, - "loss": 0.9517, - "step": 27761 - }, - { - "epoch": 0.71, - "learning_rate": 1.7831949986716192e-06, - "loss": 0.8555, - "step": 27762 - }, - { - "epoch": 0.71, - "learning_rate": 1.7831777935432037e-06, - "loss": 1.0088, - "step": 27763 - }, - { - "epoch": 0.71, - "learning_rate": 1.783160587815145e-06, - "loss": 0.7217, - "step": 27764 - }, - { - "epoch": 0.71, - "learning_rate": 1.7831433814874563e-06, - "loss": 0.8364, - "step": 27765 - }, - { - "epoch": 0.71, - "learning_rate": 1.7831261745601507e-06, - "loss": 1.1641, - "step": 27766 - }, - { - "epoch": 0.71, - "learning_rate": 1.7831089670332413e-06, - "loss": 1.0166, - "step": 27767 - }, - { - "epoch": 0.71, - "learning_rate": 1.7830917589067417e-06, - "loss": 1.0303, - "step": 27768 - }, - { - "epoch": 0.71, - "learning_rate": 1.7830745501806644e-06, - "loss": 0.7988, - "step": 27769 - }, - { - "epoch": 0.71, - "learning_rate": 1.783057340855023e-06, - "loss": 0.9902, - "step": 27770 - }, - { - "epoch": 0.71, - "learning_rate": 1.7830401309298304e-06, - "loss": 0.7139, - "step": 27771 - }, - { - "epoch": 0.71, - "learning_rate": 1.7830229204051003e-06, - "loss": 0.8857, - "step": 27772 - }, - { - "epoch": 0.71, - "learning_rate": 1.7830057092808452e-06, - "loss": 0.9297, - "step": 27773 - }, - { - "epoch": 0.71, - "learning_rate": 1.782988497557079e-06, - "loss": 0.7578, - "step": 27774 - }, - { - "epoch": 0.71, - "learning_rate": 1.7829712852338146e-06, - "loss": 0.8418, - "step": 27775 - }, - { - "epoch": 0.71, - "learning_rate": 1.7829540723110648e-06, - "loss": 0.8457, - "step": 27776 - }, - { - "epoch": 0.71, - "learning_rate": 1.7829368587888428e-06, - "loss": 0.6592, - "step": 27777 - }, - { - "epoch": 0.71, - "learning_rate": 1.7829196446671625e-06, - "loss": 0.9067, - "step": 27778 - }, - { - "epoch": 0.71, - "learning_rate": 1.7829024299460364e-06, - "loss": 0.7678, - "step": 27779 - }, - { - "epoch": 0.71, - "learning_rate": 1.782885214625478e-06, - "loss": 0.9814, - "step": 27780 - }, - { - "epoch": 0.71, - "learning_rate": 1.7828679987055006e-06, - "loss": 0.6648, - "step": 27781 - }, - { - "epoch": 0.71, - "learning_rate": 1.782850782186117e-06, - "loss": 0.7822, - "step": 27782 - }, - { - "epoch": 0.71, - "learning_rate": 1.7828335650673406e-06, - "loss": 0.9297, - "step": 27783 - }, - { - "epoch": 0.71, - "learning_rate": 1.7828163473491845e-06, - "loss": 0.8145, - "step": 27784 - }, - { - "epoch": 0.71, - "learning_rate": 1.7827991290316617e-06, - "loss": 0.7358, - "step": 27785 - }, - { - "epoch": 0.71, - "learning_rate": 1.7827819101147856e-06, - "loss": 1.0791, - "step": 27786 - }, - { - "epoch": 0.71, - "learning_rate": 1.7827646905985695e-06, - "loss": 0.9922, - "step": 27787 - }, - { - "epoch": 0.71, - "learning_rate": 1.7827474704830268e-06, - "loss": 0.9609, - "step": 27788 - }, - { - "epoch": 0.71, - "learning_rate": 1.78273024976817e-06, - "loss": 0.8477, - "step": 27789 - }, - { - "epoch": 0.71, - "learning_rate": 1.7827130284540128e-06, - "loss": 0.7734, - "step": 27790 - }, - { - "epoch": 0.71, - "learning_rate": 1.7826958065405679e-06, - "loss": 0.7803, - "step": 27791 - }, - { - "epoch": 0.71, - "learning_rate": 1.7826785840278493e-06, - "loss": 0.8652, - "step": 27792 - }, - { - "epoch": 0.71, - "learning_rate": 1.7826613609158693e-06, - "loss": 0.877, - "step": 27793 - }, - { - "epoch": 0.71, - "learning_rate": 1.7826441372046417e-06, - "loss": 1.0107, - "step": 27794 - }, - { - "epoch": 0.71, - "learning_rate": 1.7826269128941795e-06, - "loss": 0.7715, - "step": 27795 - }, - { - "epoch": 0.71, - "learning_rate": 1.7826096879844958e-06, - "loss": 0.8906, - "step": 27796 - }, - { - "epoch": 0.71, - "learning_rate": 1.7825924624756038e-06, - "loss": 1.0566, - "step": 27797 - }, - { - "epoch": 0.71, - "learning_rate": 1.7825752363675166e-06, - "loss": 0.7485, - "step": 27798 - }, - { - "epoch": 0.71, - "learning_rate": 1.782558009660248e-06, - "loss": 0.8242, - "step": 27799 - }, - { - "epoch": 0.71, - "learning_rate": 1.7825407823538101e-06, - "loss": 0.9404, - "step": 27800 - }, - { - "epoch": 0.71, - "learning_rate": 1.7825235544482172e-06, - "loss": 1.1221, - "step": 27801 - }, - { - "epoch": 0.71, - "learning_rate": 1.7825063259434817e-06, - "loss": 0.6758, - "step": 27802 - }, - { - "epoch": 0.71, - "learning_rate": 1.782489096839617e-06, - "loss": 1.002, - "step": 27803 - }, - { - "epoch": 0.71, - "learning_rate": 1.7824718671366368e-06, - "loss": 0.9766, - "step": 27804 - }, - { - "epoch": 0.71, - "learning_rate": 1.7824546368345535e-06, - "loss": 0.6104, - "step": 27805 - }, - { - "epoch": 0.71, - "learning_rate": 1.7824374059333809e-06, - "loss": 0.8447, - "step": 27806 - }, - { - "epoch": 0.71, - "learning_rate": 1.7824201744331318e-06, - "loss": 0.9443, - "step": 27807 - }, - { - "epoch": 0.71, - "learning_rate": 1.7824029423338197e-06, - "loss": 0.9932, - "step": 27808 - }, - { - "epoch": 0.71, - "learning_rate": 1.7823857096354575e-06, - "loss": 0.9287, - "step": 27809 - }, - { - "epoch": 0.71, - "learning_rate": 1.7823684763380585e-06, - "loss": 1.0684, - "step": 27810 - }, - { - "epoch": 0.71, - "learning_rate": 1.7823512424416358e-06, - "loss": 1.0537, - "step": 27811 - }, - { - "epoch": 0.71, - "learning_rate": 1.7823340079462032e-06, - "loss": 0.8555, - "step": 27812 - }, - { - "epoch": 0.71, - "learning_rate": 1.7823167728517729e-06, - "loss": 0.7476, - "step": 27813 - }, - { - "epoch": 0.71, - "learning_rate": 1.7822995371583591e-06, - "loss": 0.8164, - "step": 27814 - }, - { - "epoch": 0.71, - "learning_rate": 1.7822823008659741e-06, - "loss": 1.0654, - "step": 27815 - }, - { - "epoch": 0.71, - "learning_rate": 1.782265063974632e-06, - "loss": 1.0996, - "step": 27816 - }, - { - "epoch": 0.71, - "learning_rate": 1.7822478264843452e-06, - "loss": 1.0732, - "step": 27817 - }, - { - "epoch": 0.71, - "learning_rate": 1.782230588395127e-06, - "loss": 0.8242, - "step": 27818 - }, - { - "epoch": 0.71, - "learning_rate": 1.7822133497069914e-06, - "loss": 1.0908, - "step": 27819 - }, - { - "epoch": 0.71, - "learning_rate": 1.7821961104199504e-06, - "loss": 0.9629, - "step": 27820 - }, - { - "epoch": 0.71, - "learning_rate": 1.7821788705340181e-06, - "loss": 0.897, - "step": 27821 - }, - { - "epoch": 0.71, - "learning_rate": 1.7821616300492073e-06, - "loss": 0.7554, - "step": 27822 - }, - { - "epoch": 0.71, - "learning_rate": 1.7821443889655315e-06, - "loss": 0.8467, - "step": 27823 - }, - { - "epoch": 0.71, - "learning_rate": 1.7821271472830034e-06, - "loss": 0.8862, - "step": 27824 - }, - { - "epoch": 0.71, - "learning_rate": 1.7821099050016366e-06, - "loss": 0.9844, - "step": 27825 - }, - { - "epoch": 0.71, - "learning_rate": 1.7820926621214443e-06, - "loss": 0.8701, - "step": 27826 - }, - { - "epoch": 0.71, - "learning_rate": 1.7820754186424396e-06, - "loss": 0.9307, - "step": 27827 - }, - { - "epoch": 0.71, - "learning_rate": 1.7820581745646357e-06, - "loss": 0.8789, - "step": 27828 - }, - { - "epoch": 0.71, - "learning_rate": 1.7820409298880458e-06, - "loss": 0.8457, - "step": 27829 - }, - { - "epoch": 0.71, - "learning_rate": 1.782023684612683e-06, - "loss": 0.8711, - "step": 27830 - }, - { - "epoch": 0.71, - "learning_rate": 1.782006438738561e-06, - "loss": 0.8164, - "step": 27831 - }, - { - "epoch": 0.71, - "learning_rate": 1.7819891922656922e-06, - "loss": 0.7744, - "step": 27832 - }, - { - "epoch": 0.71, - "learning_rate": 1.7819719451940904e-06, - "loss": 0.7744, - "step": 27833 - }, - { - "epoch": 0.71, - "learning_rate": 1.7819546975237687e-06, - "loss": 0.959, - "step": 27834 - }, - { - "epoch": 0.71, - "learning_rate": 1.7819374492547401e-06, - "loss": 0.8223, - "step": 27835 - }, - { - "epoch": 0.71, - "learning_rate": 1.7819202003870179e-06, - "loss": 0.8135, - "step": 27836 - }, - { - "epoch": 0.71, - "learning_rate": 1.7819029509206157e-06, - "loss": 0.8369, - "step": 27837 - }, - { - "epoch": 0.71, - "learning_rate": 1.781885700855546e-06, - "loss": 0.4861, - "step": 27838 - }, - { - "epoch": 0.71, - "learning_rate": 1.7818684501918226e-06, - "loss": 0.874, - "step": 27839 - }, - { - "epoch": 0.71, - "learning_rate": 1.7818511989294584e-06, - "loss": 0.7812, - "step": 27840 - }, - { - "epoch": 0.71, - "learning_rate": 1.781833947068467e-06, - "loss": 0.959, - "step": 27841 - }, - { - "epoch": 0.71, - "learning_rate": 1.7818166946088607e-06, - "loss": 0.834, - "step": 27842 - }, - { - "epoch": 0.71, - "learning_rate": 1.7817994415506536e-06, - "loss": 0.748, - "step": 27843 - }, - { - "epoch": 0.71, - "learning_rate": 1.7817821878938587e-06, - "loss": 0.6487, - "step": 27844 - }, - { - "epoch": 0.71, - "learning_rate": 1.781764933638489e-06, - "loss": 0.7681, - "step": 27845 - }, - { - "epoch": 0.71, - "learning_rate": 1.781747678784558e-06, - "loss": 0.6362, - "step": 27846 - }, - { - "epoch": 0.71, - "learning_rate": 1.7817304233320784e-06, - "loss": 0.8164, - "step": 27847 - }, - { - "epoch": 0.71, - "learning_rate": 1.781713167281064e-06, - "loss": 0.7285, - "step": 27848 - }, - { - "epoch": 0.71, - "learning_rate": 1.7816959106315279e-06, - "loss": 0.8457, - "step": 27849 - }, - { - "epoch": 0.71, - "learning_rate": 1.7816786533834831e-06, - "loss": 0.8877, - "step": 27850 - }, - { - "epoch": 0.71, - "learning_rate": 1.781661395536943e-06, - "loss": 0.958, - "step": 27851 - }, - { - "epoch": 0.71, - "learning_rate": 1.7816441370919204e-06, - "loss": 0.9053, - "step": 27852 - }, - { - "epoch": 0.71, - "learning_rate": 1.7816268780484288e-06, - "loss": 0.8457, - "step": 27853 - }, - { - "epoch": 0.71, - "learning_rate": 1.7816096184064818e-06, - "loss": 0.9141, - "step": 27854 - }, - { - "epoch": 0.71, - "learning_rate": 1.781592358166092e-06, - "loss": 0.9492, - "step": 27855 - }, - { - "epoch": 0.71, - "learning_rate": 1.781575097327273e-06, - "loss": 0.7842, - "step": 27856 - }, - { - "epoch": 0.71, - "learning_rate": 1.781557835890038e-06, - "loss": 0.7476, - "step": 27857 - }, - { - "epoch": 0.71, - "learning_rate": 1.7815405738543995e-06, - "loss": 0.8979, - "step": 27858 - }, - { - "epoch": 0.71, - "learning_rate": 1.7815233112203721e-06, - "loss": 0.8105, - "step": 27859 - }, - { - "epoch": 0.71, - "learning_rate": 1.7815060479879676e-06, - "loss": 0.7393, - "step": 27860 - }, - { - "epoch": 0.71, - "learning_rate": 1.7814887841572004e-06, - "loss": 0.7598, - "step": 27861 - }, - { - "epoch": 0.71, - "learning_rate": 1.7814715197280828e-06, - "loss": 0.709, - "step": 27862 - }, - { - "epoch": 0.71, - "learning_rate": 1.7814542547006285e-06, - "loss": 0.7949, - "step": 27863 - }, - { - "epoch": 0.71, - "learning_rate": 1.7814369890748506e-06, - "loss": 0.5498, - "step": 27864 - }, - { - "epoch": 0.71, - "learning_rate": 1.7814197228507624e-06, - "loss": 0.7346, - "step": 27865 - }, - { - "epoch": 0.71, - "learning_rate": 1.7814024560283769e-06, - "loss": 0.8955, - "step": 27866 - }, - { - "epoch": 0.71, - "learning_rate": 1.7813851886077074e-06, - "loss": 0.916, - "step": 27867 - }, - { - "epoch": 0.71, - "learning_rate": 1.7813679205887672e-06, - "loss": 0.9121, - "step": 27868 - }, - { - "epoch": 0.71, - "learning_rate": 1.7813506519715697e-06, - "loss": 0.9072, - "step": 27869 - }, - { - "epoch": 0.71, - "learning_rate": 1.781333382756128e-06, - "loss": 0.6814, - "step": 27870 - }, - { - "epoch": 0.71, - "learning_rate": 1.7813161129424552e-06, - "loss": 0.7422, - "step": 27871 - }, - { - "epoch": 0.71, - "learning_rate": 1.7812988425305643e-06, - "loss": 0.6494, - "step": 27872 - }, - { - "epoch": 0.71, - "learning_rate": 1.7812815715204693e-06, - "loss": 0.7832, - "step": 27873 - }, - { - "epoch": 0.71, - "learning_rate": 1.7812642999121827e-06, - "loss": 0.834, - "step": 27874 - }, - { - "epoch": 0.71, - "learning_rate": 1.7812470277057176e-06, - "loss": 0.8203, - "step": 27875 - }, - { - "epoch": 0.71, - "learning_rate": 1.781229754901088e-06, - "loss": 0.8364, - "step": 27876 - }, - { - "epoch": 0.71, - "learning_rate": 1.7812124814983066e-06, - "loss": 0.832, - "step": 27877 - }, - { - "epoch": 0.71, - "learning_rate": 1.7811952074973867e-06, - "loss": 0.9053, - "step": 27878 - }, - { - "epoch": 0.71, - "learning_rate": 1.7811779328983415e-06, - "loss": 1.2246, - "step": 27879 - }, - { - "epoch": 0.71, - "learning_rate": 1.7811606577011844e-06, - "loss": 0.7412, - "step": 27880 - }, - { - "epoch": 0.71, - "learning_rate": 1.7811433819059283e-06, - "loss": 0.8926, - "step": 27881 - }, - { - "epoch": 0.71, - "learning_rate": 1.781126105512587e-06, - "loss": 0.9082, - "step": 27882 - }, - { - "epoch": 0.71, - "learning_rate": 1.781108828521173e-06, - "loss": 0.7485, - "step": 27883 - }, - { - "epoch": 0.71, - "learning_rate": 1.7810915509317e-06, - "loss": 0.9199, - "step": 27884 - }, - { - "epoch": 0.71, - "learning_rate": 1.7810742727441812e-06, - "loss": 0.9541, - "step": 27885 - }, - { - "epoch": 0.71, - "learning_rate": 1.7810569939586295e-06, - "loss": 0.5928, - "step": 27886 - }, - { - "epoch": 0.71, - "learning_rate": 1.7810397145750585e-06, - "loss": 0.7239, - "step": 27887 - }, - { - "epoch": 0.71, - "learning_rate": 1.7810224345934815e-06, - "loss": 0.8877, - "step": 27888 - }, - { - "epoch": 0.71, - "learning_rate": 1.7810051540139113e-06, - "loss": 1.1602, - "step": 27889 - }, - { - "epoch": 0.71, - "learning_rate": 1.7809878728363614e-06, - "loss": 0.6157, - "step": 27890 - }, - { - "epoch": 0.71, - "learning_rate": 1.780970591060845e-06, - "loss": 0.9111, - "step": 27891 - }, - { - "epoch": 0.71, - "learning_rate": 1.7809533086873753e-06, - "loss": 0.8264, - "step": 27892 - }, - { - "epoch": 0.71, - "learning_rate": 1.7809360257159657e-06, - "loss": 0.9219, - "step": 27893 - }, - { - "epoch": 0.71, - "learning_rate": 1.7809187421466292e-06, - "loss": 0.9121, - "step": 27894 - }, - { - "epoch": 0.71, - "learning_rate": 1.7809014579793792e-06, - "loss": 0.9795, - "step": 27895 - }, - { - "epoch": 0.71, - "learning_rate": 1.7808841732142289e-06, - "loss": 1.0918, - "step": 27896 - }, - { - "epoch": 0.72, - "learning_rate": 1.7808668878511913e-06, - "loss": 0.6758, - "step": 27897 - }, - { - "epoch": 0.72, - "learning_rate": 1.78084960189028e-06, - "loss": 0.7363, - "step": 27898 - }, - { - "epoch": 0.72, - "learning_rate": 1.780832315331508e-06, - "loss": 0.8213, - "step": 27899 - }, - { - "epoch": 0.72, - "learning_rate": 1.7808150281748884e-06, - "loss": 0.9326, - "step": 27900 - }, - { - "epoch": 0.72, - "learning_rate": 1.7807977404204348e-06, - "loss": 0.4316, - "step": 27901 - }, - { - "epoch": 0.72, - "learning_rate": 1.7807804520681603e-06, - "loss": 0.9297, - "step": 27902 - }, - { - "epoch": 0.72, - "learning_rate": 1.7807631631180781e-06, - "loss": 0.7607, - "step": 27903 - }, - { - "epoch": 0.72, - "learning_rate": 1.7807458735702014e-06, - "loss": 0.833, - "step": 27904 - }, - { - "epoch": 0.72, - "learning_rate": 1.7807285834245435e-06, - "loss": 0.8574, - "step": 27905 - }, - { - "epoch": 0.72, - "learning_rate": 1.7807112926811179e-06, - "loss": 0.8838, - "step": 27906 - }, - { - "epoch": 0.72, - "learning_rate": 1.7806940013399375e-06, - "loss": 0.8398, - "step": 27907 - }, - { - "epoch": 0.72, - "learning_rate": 1.780676709401015e-06, - "loss": 1.0391, - "step": 27908 - }, - { - "epoch": 0.72, - "learning_rate": 1.7806594168643646e-06, - "loss": 0.5353, - "step": 27909 - }, - { - "epoch": 0.72, - "learning_rate": 1.7806421237299994e-06, - "loss": 0.8799, - "step": 27910 - }, - { - "epoch": 0.72, - "learning_rate": 1.7806248299979322e-06, - "loss": 0.7793, - "step": 27911 - }, - { - "epoch": 0.72, - "learning_rate": 1.7806075356681767e-06, - "loss": 0.8027, - "step": 27912 - }, - { - "epoch": 0.72, - "learning_rate": 1.7805902407407457e-06, - "loss": 0.9326, - "step": 27913 - }, - { - "epoch": 0.72, - "learning_rate": 1.7805729452156526e-06, - "loss": 0.7617, - "step": 27914 - }, - { - "epoch": 0.72, - "learning_rate": 1.7805556490929107e-06, - "loss": 0.8633, - "step": 27915 - }, - { - "epoch": 0.72, - "learning_rate": 1.7805383523725333e-06, - "loss": 0.8203, - "step": 27916 - }, - { - "epoch": 0.72, - "learning_rate": 1.7805210550545334e-06, - "loss": 0.8477, - "step": 27917 - }, - { - "epoch": 0.72, - "learning_rate": 1.7805037571389247e-06, - "loss": 0.6787, - "step": 27918 - }, - { - "epoch": 0.72, - "learning_rate": 1.7804864586257201e-06, - "loss": 0.8359, - "step": 27919 - }, - { - "epoch": 0.72, - "learning_rate": 1.780469159514933e-06, - "loss": 0.7539, - "step": 27920 - }, - { - "epoch": 0.72, - "learning_rate": 1.7804518598065762e-06, - "loss": 0.5693, - "step": 27921 - }, - { - "epoch": 0.72, - "learning_rate": 1.7804345595006636e-06, - "loss": 0.8789, - "step": 27922 - }, - { - "epoch": 0.72, - "learning_rate": 1.7804172585972078e-06, - "loss": 0.6768, - "step": 27923 - }, - { - "epoch": 0.72, - "learning_rate": 1.7803999570962228e-06, - "loss": 0.7891, - "step": 27924 - }, - { - "epoch": 0.72, - "learning_rate": 1.7803826549977213e-06, - "loss": 0.9902, - "step": 27925 - }, - { - "epoch": 0.72, - "learning_rate": 1.7803653523017168e-06, - "loss": 0.5569, - "step": 27926 - }, - { - "epoch": 0.72, - "learning_rate": 1.7803480490082224e-06, - "loss": 1.0137, - "step": 27927 - }, - { - "epoch": 0.72, - "learning_rate": 1.7803307451172511e-06, - "loss": 0.7822, - "step": 27928 - }, - { - "epoch": 0.72, - "learning_rate": 1.7803134406288165e-06, - "loss": 0.8789, - "step": 27929 - }, - { - "epoch": 0.72, - "learning_rate": 1.7802961355429318e-06, - "loss": 0.7007, - "step": 27930 - }, - { - "epoch": 0.72, - "learning_rate": 1.7802788298596102e-06, - "loss": 0.8193, - "step": 27931 - }, - { - "epoch": 0.72, - "learning_rate": 1.7802615235788655e-06, - "loss": 0.6792, - "step": 27932 - }, - { - "epoch": 0.72, - "learning_rate": 1.78024421670071e-06, - "loss": 0.9341, - "step": 27933 - }, - { - "epoch": 0.72, - "learning_rate": 1.7802269092251573e-06, - "loss": 0.8047, - "step": 27934 - }, - { - "epoch": 0.72, - "learning_rate": 1.7802096011522206e-06, - "loss": 0.9248, - "step": 27935 - }, - { - "epoch": 0.72, - "learning_rate": 1.7801922924819136e-06, - "loss": 0.6187, - "step": 27936 - }, - { - "epoch": 0.72, - "learning_rate": 1.7801749832142493e-06, - "loss": 0.7805, - "step": 27937 - }, - { - "epoch": 0.72, - "learning_rate": 1.7801576733492406e-06, - "loss": 0.7012, - "step": 27938 - }, - { - "epoch": 0.72, - "learning_rate": 1.780140362886901e-06, - "loss": 0.853, - "step": 27939 - }, - { - "epoch": 0.72, - "learning_rate": 1.780123051827244e-06, - "loss": 0.6995, - "step": 27940 - }, - { - "epoch": 0.72, - "learning_rate": 1.7801057401702826e-06, - "loss": 0.7617, - "step": 27941 - }, - { - "epoch": 0.72, - "learning_rate": 1.7800884279160303e-06, - "loss": 0.9741, - "step": 27942 - }, - { - "epoch": 0.72, - "learning_rate": 1.7800711150644997e-06, - "loss": 0.7793, - "step": 27943 - }, - { - "epoch": 0.72, - "learning_rate": 1.780053801615705e-06, - "loss": 0.8213, - "step": 27944 - }, - { - "epoch": 0.72, - "learning_rate": 1.7800364875696587e-06, - "loss": 1.0068, - "step": 27945 - }, - { - "epoch": 0.72, - "learning_rate": 1.7800191729263743e-06, - "loss": 0.8828, - "step": 27946 - }, - { - "epoch": 0.72, - "learning_rate": 1.7800018576858652e-06, - "loss": 0.9805, - "step": 27947 - }, - { - "epoch": 0.72, - "learning_rate": 1.7799845418481445e-06, - "loss": 0.6909, - "step": 27948 - }, - { - "epoch": 0.72, - "learning_rate": 1.7799672254132256e-06, - "loss": 1.0283, - "step": 27949 - }, - { - "epoch": 0.72, - "learning_rate": 1.7799499083811215e-06, - "loss": 0.708, - "step": 27950 - }, - { - "epoch": 0.72, - "learning_rate": 1.7799325907518459e-06, - "loss": 0.6514, - "step": 27951 - }, - { - "epoch": 0.72, - "learning_rate": 1.7799152725254114e-06, - "loss": 0.8955, - "step": 27952 - }, - { - "epoch": 0.72, - "learning_rate": 1.7798979537018318e-06, - "loss": 0.8086, - "step": 27953 - }, - { - "epoch": 0.72, - "learning_rate": 1.7798806342811204e-06, - "loss": 0.7256, - "step": 27954 - }, - { - "epoch": 0.72, - "learning_rate": 1.77986331426329e-06, - "loss": 0.7256, - "step": 27955 - }, - { - "epoch": 0.72, - "learning_rate": 1.7798459936483541e-06, - "loss": 0.875, - "step": 27956 - }, - { - "epoch": 0.72, - "learning_rate": 1.7798286724363263e-06, - "loss": 0.8193, - "step": 27957 - }, - { - "epoch": 0.72, - "learning_rate": 1.7798113506272192e-06, - "loss": 1.0439, - "step": 27958 - }, - { - "epoch": 0.72, - "learning_rate": 1.7797940282210464e-06, - "loss": 0.8149, - "step": 27959 - }, - { - "epoch": 0.72, - "learning_rate": 1.7797767052178215e-06, - "loss": 0.8564, - "step": 27960 - }, - { - "epoch": 0.72, - "learning_rate": 1.779759381617557e-06, - "loss": 0.8564, - "step": 27961 - }, - { - "epoch": 0.72, - "learning_rate": 1.779742057420267e-06, - "loss": 0.8867, - "step": 27962 - }, - { - "epoch": 0.72, - "learning_rate": 1.7797247326259641e-06, - "loss": 0.8926, - "step": 27963 - }, - { - "epoch": 0.72, - "learning_rate": 1.7797074072346618e-06, - "loss": 0.7832, - "step": 27964 - }, - { - "epoch": 0.72, - "learning_rate": 1.7796900812463735e-06, - "loss": 0.874, - "step": 27965 - }, - { - "epoch": 0.72, - "learning_rate": 1.7796727546611123e-06, - "loss": 1.0908, - "step": 27966 - }, - { - "epoch": 0.72, - "learning_rate": 1.7796554274788918e-06, - "loss": 0.9893, - "step": 27967 - }, - { - "epoch": 0.72, - "learning_rate": 1.7796380996997247e-06, - "loss": 0.8481, - "step": 27968 - }, - { - "epoch": 0.72, - "learning_rate": 1.7796207713236243e-06, - "loss": 0.9355, - "step": 27969 - }, - { - "epoch": 0.72, - "learning_rate": 1.7796034423506048e-06, - "loss": 0.9043, - "step": 27970 - }, - { - "epoch": 0.72, - "learning_rate": 1.7795861127806782e-06, - "loss": 0.748, - "step": 27971 - }, - { - "epoch": 0.72, - "learning_rate": 1.7795687826138589e-06, - "loss": 0.8818, - "step": 27972 - }, - { - "epoch": 0.72, - "learning_rate": 1.7795514518501592e-06, - "loss": 0.9277, - "step": 27973 - }, - { - "epoch": 0.72, - "learning_rate": 1.7795341204895928e-06, - "loss": 0.7139, - "step": 27974 - }, - { - "epoch": 0.72, - "learning_rate": 1.779516788532173e-06, - "loss": 0.7588, - "step": 27975 - }, - { - "epoch": 0.72, - "learning_rate": 1.779499455977913e-06, - "loss": 1.0371, - "step": 27976 - }, - { - "epoch": 0.72, - "learning_rate": 1.7794821228268264e-06, - "loss": 0.8486, - "step": 27977 - }, - { - "epoch": 0.72, - "learning_rate": 1.779464789078926e-06, - "loss": 0.8965, - "step": 27978 - }, - { - "epoch": 0.72, - "learning_rate": 1.7794474547342254e-06, - "loss": 1.0811, - "step": 27979 - }, - { - "epoch": 0.72, - "learning_rate": 1.7794301197927374e-06, - "loss": 0.9775, - "step": 27980 - }, - { - "epoch": 0.72, - "learning_rate": 1.7794127842544757e-06, - "loss": 0.958, - "step": 27981 - }, - { - "epoch": 0.72, - "learning_rate": 1.7793954481194535e-06, - "loss": 1.0498, - "step": 27982 - }, - { - "epoch": 0.72, - "learning_rate": 1.7793781113876842e-06, - "loss": 1.0732, - "step": 27983 - }, - { - "epoch": 0.72, - "learning_rate": 1.7793607740591808e-06, - "loss": 0.8779, - "step": 27984 - }, - { - "epoch": 0.72, - "learning_rate": 1.7793434361339569e-06, - "loss": 0.9922, - "step": 27985 - }, - { - "epoch": 0.72, - "learning_rate": 1.7793260976120253e-06, - "loss": 0.8457, - "step": 27986 - }, - { - "epoch": 0.72, - "learning_rate": 1.7793087584933995e-06, - "loss": 0.8291, - "step": 27987 - }, - { - "epoch": 0.72, - "learning_rate": 1.7792914187780932e-06, - "loss": 0.9971, - "step": 27988 - }, - { - "epoch": 0.72, - "learning_rate": 1.7792740784661189e-06, - "loss": 1.0967, - "step": 27989 - }, - { - "epoch": 0.72, - "learning_rate": 1.7792567375574903e-06, - "loss": 0.8711, - "step": 27990 - }, - { - "epoch": 0.72, - "learning_rate": 1.7792393960522207e-06, - "loss": 0.7715, - "step": 27991 - }, - { - "epoch": 0.72, - "learning_rate": 1.7792220539503236e-06, - "loss": 0.7407, - "step": 27992 - }, - { - "epoch": 0.72, - "learning_rate": 1.7792047112518116e-06, - "loss": 0.6982, - "step": 27993 - }, - { - "epoch": 0.72, - "learning_rate": 1.7791873679566986e-06, - "loss": 0.7905, - "step": 27994 - }, - { - "epoch": 0.72, - "learning_rate": 1.7791700240649977e-06, - "loss": 0.8213, - "step": 27995 - }, - { - "epoch": 0.72, - "learning_rate": 1.7791526795767217e-06, - "loss": 0.917, - "step": 27996 - }, - { - "epoch": 0.72, - "learning_rate": 1.7791353344918848e-06, - "loss": 0.6597, - "step": 27997 - }, - { - "epoch": 0.72, - "learning_rate": 1.7791179888104999e-06, - "loss": 0.832, - "step": 27998 - }, - { - "epoch": 0.72, - "learning_rate": 1.7791006425325796e-06, - "loss": 0.7598, - "step": 27999 - }, - { - "epoch": 0.72, - "learning_rate": 1.7790832956581384e-06, - "loss": 0.8418, - "step": 28000 - }, - { - "epoch": 0.72, - "learning_rate": 1.7790659481871883e-06, - "loss": 0.7783, - "step": 28001 - }, - { - "epoch": 0.72, - "learning_rate": 1.7790486001197437e-06, - "loss": 0.8994, - "step": 28002 - }, - { - "epoch": 0.72, - "learning_rate": 1.7790312514558172e-06, - "loss": 0.8711, - "step": 28003 - }, - { - "epoch": 0.72, - "learning_rate": 1.7790139021954224e-06, - "loss": 0.8994, - "step": 28004 - }, - { - "epoch": 0.72, - "learning_rate": 1.7789965523385726e-06, - "loss": 0.8633, - "step": 28005 - }, - { - "epoch": 0.72, - "learning_rate": 1.778979201885281e-06, - "loss": 0.9307, - "step": 28006 - }, - { - "epoch": 0.72, - "learning_rate": 1.7789618508355604e-06, - "loss": 0.9209, - "step": 28007 - }, - { - "epoch": 0.72, - "learning_rate": 1.778944499189425e-06, - "loss": 0.7354, - "step": 28008 - }, - { - "epoch": 0.72, - "learning_rate": 1.7789271469468874e-06, - "loss": 0.9482, - "step": 28009 - }, - { - "epoch": 0.72, - "learning_rate": 1.7789097941079609e-06, - "loss": 0.4575, - "step": 28010 - }, - { - "epoch": 0.72, - "learning_rate": 1.778892440672659e-06, - "loss": 0.9062, - "step": 28011 - }, - { - "epoch": 0.72, - "learning_rate": 1.7788750866409954e-06, - "loss": 0.9385, - "step": 28012 - }, - { - "epoch": 0.72, - "learning_rate": 1.7788577320129827e-06, - "loss": 0.709, - "step": 28013 - }, - { - "epoch": 0.72, - "learning_rate": 1.7788403767886344e-06, - "loss": 0.9229, - "step": 28014 - }, - { - "epoch": 0.72, - "learning_rate": 1.7788230209679637e-06, - "loss": 0.7719, - "step": 28015 - }, - { - "epoch": 0.72, - "learning_rate": 1.7788056645509846e-06, - "loss": 0.7451, - "step": 28016 - }, - { - "epoch": 0.72, - "learning_rate": 1.7787883075377093e-06, - "loss": 1.0254, - "step": 28017 - }, - { - "epoch": 0.72, - "learning_rate": 1.7787709499281518e-06, - "loss": 0.7432, - "step": 28018 - }, - { - "epoch": 0.72, - "learning_rate": 1.778753591722325e-06, - "loss": 0.833, - "step": 28019 - }, - { - "epoch": 0.72, - "learning_rate": 1.7787362329202424e-06, - "loss": 0.7959, - "step": 28020 - }, - { - "epoch": 0.72, - "learning_rate": 1.7787188735219175e-06, - "loss": 0.6389, - "step": 28021 - }, - { - "epoch": 0.72, - "learning_rate": 1.7787015135273632e-06, - "loss": 0.8496, - "step": 28022 - }, - { - "epoch": 0.72, - "learning_rate": 1.7786841529365933e-06, - "loss": 1.0718, - "step": 28023 - }, - { - "epoch": 0.72, - "learning_rate": 1.7786667917496203e-06, - "loss": 0.958, - "step": 28024 - }, - { - "epoch": 0.72, - "learning_rate": 1.778649429966458e-06, - "loss": 0.791, - "step": 28025 - }, - { - "epoch": 0.72, - "learning_rate": 1.7786320675871198e-06, - "loss": 0.6709, - "step": 28026 - }, - { - "epoch": 0.72, - "learning_rate": 1.778614704611619e-06, - "loss": 1.0957, - "step": 28027 - }, - { - "epoch": 0.72, - "learning_rate": 1.778597341039968e-06, - "loss": 0.8652, - "step": 28028 - }, - { - "epoch": 0.72, - "learning_rate": 1.7785799768721814e-06, - "loss": 0.853, - "step": 28029 - }, - { - "epoch": 0.72, - "learning_rate": 1.7785626121082719e-06, - "loss": 0.9297, - "step": 28030 - }, - { - "epoch": 0.72, - "learning_rate": 1.7785452467482526e-06, - "loss": 0.9678, - "step": 28031 - }, - { - "epoch": 0.72, - "learning_rate": 1.7785278807921373e-06, - "loss": 0.9014, - "step": 28032 - }, - { - "epoch": 0.72, - "learning_rate": 1.7785105142399388e-06, - "loss": 0.7128, - "step": 28033 - }, - { - "epoch": 0.72, - "learning_rate": 1.7784931470916706e-06, - "loss": 0.8789, - "step": 28034 - }, - { - "epoch": 0.72, - "learning_rate": 1.7784757793473459e-06, - "loss": 1.0254, - "step": 28035 - }, - { - "epoch": 0.72, - "learning_rate": 1.7784584110069783e-06, - "loss": 0.8379, - "step": 28036 - }, - { - "epoch": 0.72, - "learning_rate": 1.778441042070581e-06, - "loss": 0.6826, - "step": 28037 - }, - { - "epoch": 0.72, - "learning_rate": 1.778423672538167e-06, - "loss": 0.748, - "step": 28038 - }, - { - "epoch": 0.72, - "learning_rate": 1.7784063024097496e-06, - "loss": 0.8311, - "step": 28039 - }, - { - "epoch": 0.72, - "learning_rate": 1.7783889316853424e-06, - "loss": 0.5825, - "step": 28040 - }, - { - "epoch": 0.72, - "learning_rate": 1.7783715603649587e-06, - "loss": 0.8608, - "step": 28041 - }, - { - "epoch": 0.72, - "learning_rate": 1.7783541884486116e-06, - "loss": 0.7812, - "step": 28042 - }, - { - "epoch": 0.72, - "learning_rate": 1.7783368159363145e-06, - "loss": 0.709, - "step": 28043 - }, - { - "epoch": 0.72, - "learning_rate": 1.7783194428280808e-06, - "loss": 0.8223, - "step": 28044 - }, - { - "epoch": 0.72, - "learning_rate": 1.7783020691239234e-06, - "loss": 1.0381, - "step": 28045 - }, - { - "epoch": 0.72, - "learning_rate": 1.7782846948238564e-06, - "loss": 0.8145, - "step": 28046 - }, - { - "epoch": 0.72, - "learning_rate": 1.778267319927892e-06, - "loss": 0.7314, - "step": 28047 - }, - { - "epoch": 0.72, - "learning_rate": 1.7782499444360446e-06, - "loss": 1.1201, - "step": 28048 - }, - { - "epoch": 0.72, - "learning_rate": 1.7782325683483266e-06, - "loss": 0.8857, - "step": 28049 - }, - { - "epoch": 0.72, - "learning_rate": 1.7782151916647518e-06, - "loss": 0.6792, - "step": 28050 - }, - { - "epoch": 0.72, - "learning_rate": 1.7781978143853338e-06, - "loss": 1.001, - "step": 28051 - }, - { - "epoch": 0.72, - "learning_rate": 1.7781804365100853e-06, - "loss": 0.7812, - "step": 28052 - }, - { - "epoch": 0.72, - "learning_rate": 1.7781630580390194e-06, - "loss": 0.5264, - "step": 28053 - }, - { - "epoch": 0.72, - "learning_rate": 1.7781456789721504e-06, - "loss": 0.8828, - "step": 28054 - }, - { - "epoch": 0.72, - "learning_rate": 1.7781282993094906e-06, - "loss": 0.6543, - "step": 28055 - }, - { - "epoch": 0.72, - "learning_rate": 1.7781109190510541e-06, - "loss": 0.6685, - "step": 28056 - }, - { - "epoch": 0.72, - "learning_rate": 1.7780935381968537e-06, - "loss": 0.8408, - "step": 28057 - }, - { - "epoch": 0.72, - "learning_rate": 1.778076156746903e-06, - "loss": 0.5991, - "step": 28058 - }, - { - "epoch": 0.72, - "learning_rate": 1.7780587747012149e-06, - "loss": 0.9678, - "step": 28059 - }, - { - "epoch": 0.72, - "learning_rate": 1.778041392059803e-06, - "loss": 0.8311, - "step": 28060 - }, - { - "epoch": 0.72, - "learning_rate": 1.7780240088226806e-06, - "loss": 0.9434, - "step": 28061 - }, - { - "epoch": 0.72, - "learning_rate": 1.7780066249898612e-06, - "loss": 0.8218, - "step": 28062 - }, - { - "epoch": 0.72, - "learning_rate": 1.7779892405613576e-06, - "loss": 0.8223, - "step": 28063 - }, - { - "epoch": 0.72, - "learning_rate": 1.7779718555371837e-06, - "loss": 0.8105, - "step": 28064 - }, - { - "epoch": 0.72, - "learning_rate": 1.7779544699173522e-06, - "loss": 0.752, - "step": 28065 - }, - { - "epoch": 0.72, - "learning_rate": 1.777937083701877e-06, - "loss": 0.8096, - "step": 28066 - }, - { - "epoch": 0.72, - "learning_rate": 1.777919696890771e-06, - "loss": 0.9492, - "step": 28067 - }, - { - "epoch": 0.72, - "learning_rate": 1.7779023094840477e-06, - "loss": 0.6064, - "step": 28068 - }, - { - "epoch": 0.72, - "learning_rate": 1.7778849214817203e-06, - "loss": 0.7891, - "step": 28069 - }, - { - "epoch": 0.72, - "learning_rate": 1.7778675328838023e-06, - "loss": 0.8804, - "step": 28070 - }, - { - "epoch": 0.72, - "learning_rate": 1.7778501436903071e-06, - "loss": 0.6411, - "step": 28071 - }, - { - "epoch": 0.72, - "learning_rate": 1.7778327539012474e-06, - "loss": 0.9844, - "step": 28072 - }, - { - "epoch": 0.72, - "learning_rate": 1.777815363516637e-06, - "loss": 1.0205, - "step": 28073 - }, - { - "epoch": 0.72, - "learning_rate": 1.7777979725364895e-06, - "loss": 0.8906, - "step": 28074 - }, - { - "epoch": 0.72, - "learning_rate": 1.7777805809608174e-06, - "loss": 0.6069, - "step": 28075 - }, - { - "epoch": 0.72, - "learning_rate": 1.7777631887896346e-06, - "loss": 0.7002, - "step": 28076 - }, - { - "epoch": 0.72, - "learning_rate": 1.7777457960229544e-06, - "loss": 0.9751, - "step": 28077 - }, - { - "epoch": 0.72, - "learning_rate": 1.7777284026607901e-06, - "loss": 0.9844, - "step": 28078 - }, - { - "epoch": 0.72, - "learning_rate": 1.7777110087031547e-06, - "loss": 0.7749, - "step": 28079 - }, - { - "epoch": 0.72, - "learning_rate": 1.7776936141500621e-06, - "loss": 0.9482, - "step": 28080 - }, - { - "epoch": 0.72, - "learning_rate": 1.7776762190015248e-06, - "loss": 0.7441, - "step": 28081 - }, - { - "epoch": 0.72, - "learning_rate": 1.7776588232575568e-06, - "loss": 0.8081, - "step": 28082 - }, - { - "epoch": 0.72, - "learning_rate": 1.7776414269181715e-06, - "loss": 0.6748, - "step": 28083 - }, - { - "epoch": 0.72, - "learning_rate": 1.7776240299833813e-06, - "loss": 0.8408, - "step": 28084 - }, - { - "epoch": 0.72, - "learning_rate": 1.7776066324532004e-06, - "loss": 0.6055, - "step": 28085 - }, - { - "epoch": 0.72, - "learning_rate": 1.777589234327642e-06, - "loss": 0.8271, - "step": 28086 - }, - { - "epoch": 0.72, - "learning_rate": 1.777571835606719e-06, - "loss": 0.8687, - "step": 28087 - }, - { - "epoch": 0.72, - "learning_rate": 1.7775544362904453e-06, - "loss": 0.9961, - "step": 28088 - }, - { - "epoch": 0.72, - "learning_rate": 1.7775370363788338e-06, - "loss": 0.7285, - "step": 28089 - }, - { - "epoch": 0.72, - "learning_rate": 1.777519635871898e-06, - "loss": 0.7163, - "step": 28090 - }, - { - "epoch": 0.72, - "learning_rate": 1.777502234769651e-06, - "loss": 1.1113, - "step": 28091 - }, - { - "epoch": 0.72, - "learning_rate": 1.7774848330721063e-06, - "loss": 0.9707, - "step": 28092 - }, - { - "epoch": 0.72, - "learning_rate": 1.7774674307792772e-06, - "loss": 0.8975, - "step": 28093 - }, - { - "epoch": 0.72, - "learning_rate": 1.7774500278911774e-06, - "loss": 0.9307, - "step": 28094 - }, - { - "epoch": 0.72, - "learning_rate": 1.7774326244078194e-06, - "loss": 0.7192, - "step": 28095 - }, - { - "epoch": 0.72, - "learning_rate": 1.7774152203292172e-06, - "loss": 1.0059, - "step": 28096 - }, - { - "epoch": 0.72, - "learning_rate": 1.7773978156553838e-06, - "loss": 0.6453, - "step": 28097 - }, - { - "epoch": 0.72, - "learning_rate": 1.7773804103863328e-06, - "loss": 0.7651, - "step": 28098 - }, - { - "epoch": 0.72, - "learning_rate": 1.7773630045220774e-06, - "loss": 0.8545, - "step": 28099 - }, - { - "epoch": 0.72, - "learning_rate": 1.7773455980626308e-06, - "loss": 0.8516, - "step": 28100 - }, - { - "epoch": 0.72, - "learning_rate": 1.7773281910080064e-06, - "loss": 1.0566, - "step": 28101 - }, - { - "epoch": 0.72, - "learning_rate": 1.7773107833582174e-06, - "loss": 0.8164, - "step": 28102 - }, - { - "epoch": 0.72, - "learning_rate": 1.7772933751132774e-06, - "loss": 0.8032, - "step": 28103 - }, - { - "epoch": 0.72, - "learning_rate": 1.7772759662731999e-06, - "loss": 0.957, - "step": 28104 - }, - { - "epoch": 0.72, - "learning_rate": 1.7772585568379976e-06, - "loss": 0.8672, - "step": 28105 - }, - { - "epoch": 0.72, - "learning_rate": 1.7772411468076843e-06, - "loss": 0.7744, - "step": 28106 - }, - { - "epoch": 0.72, - "learning_rate": 1.777223736182273e-06, - "loss": 0.8594, - "step": 28107 - }, - { - "epoch": 0.72, - "learning_rate": 1.7772063249617775e-06, - "loss": 1.0054, - "step": 28108 - }, - { - "epoch": 0.72, - "learning_rate": 1.7771889131462106e-06, - "loss": 0.8574, - "step": 28109 - }, - { - "epoch": 0.72, - "learning_rate": 1.777171500735586e-06, - "loss": 1.0137, - "step": 28110 - }, - { - "epoch": 0.72, - "learning_rate": 1.777154087729917e-06, - "loss": 0.873, - "step": 28111 - }, - { - "epoch": 0.72, - "learning_rate": 1.7771366741292165e-06, - "loss": 0.5957, - "step": 28112 - }, - { - "epoch": 0.72, - "learning_rate": 1.7771192599334985e-06, - "loss": 0.9346, - "step": 28113 - }, - { - "epoch": 0.72, - "learning_rate": 1.777101845142776e-06, - "loss": 0.7383, - "step": 28114 - }, - { - "epoch": 0.72, - "learning_rate": 1.7770844297570622e-06, - "loss": 0.9434, - "step": 28115 - }, - { - "epoch": 0.72, - "learning_rate": 1.7770670137763707e-06, - "loss": 0.7559, - "step": 28116 - }, - { - "epoch": 0.72, - "learning_rate": 1.7770495972007145e-06, - "loss": 1.0225, - "step": 28117 - }, - { - "epoch": 0.72, - "learning_rate": 1.7770321800301073e-06, - "loss": 1.0205, - "step": 28118 - }, - { - "epoch": 0.72, - "learning_rate": 1.7770147622645623e-06, - "loss": 0.7041, - "step": 28119 - }, - { - "epoch": 0.72, - "learning_rate": 1.776997343904093e-06, - "loss": 0.6548, - "step": 28120 - }, - { - "epoch": 0.72, - "learning_rate": 1.7769799249487126e-06, - "loss": 0.9814, - "step": 28121 - }, - { - "epoch": 0.72, - "learning_rate": 1.776962505398434e-06, - "loss": 1.0898, - "step": 28122 - }, - { - "epoch": 0.72, - "learning_rate": 1.7769450852532712e-06, - "loss": 0.9268, - "step": 28123 - }, - { - "epoch": 0.72, - "learning_rate": 1.7769276645132374e-06, - "loss": 1.0283, - "step": 28124 - }, - { - "epoch": 0.72, - "learning_rate": 1.7769102431783454e-06, - "loss": 0.7585, - "step": 28125 - }, - { - "epoch": 0.72, - "learning_rate": 1.7768928212486092e-06, - "loss": 0.9912, - "step": 28126 - }, - { - "epoch": 0.72, - "learning_rate": 1.776875398724042e-06, - "loss": 0.7549, - "step": 28127 - }, - { - "epoch": 0.72, - "learning_rate": 1.7768579756046568e-06, - "loss": 0.8066, - "step": 28128 - }, - { - "epoch": 0.72, - "learning_rate": 1.7768405518904674e-06, - "loss": 0.9414, - "step": 28129 - }, - { - "epoch": 0.72, - "learning_rate": 1.7768231275814869e-06, - "loss": 0.7715, - "step": 28130 - }, - { - "epoch": 0.72, - "learning_rate": 1.7768057026777284e-06, - "loss": 0.8828, - "step": 28131 - }, - { - "epoch": 0.72, - "learning_rate": 1.7767882771792055e-06, - "loss": 0.8105, - "step": 28132 - }, - { - "epoch": 0.72, - "learning_rate": 1.7767708510859318e-06, - "loss": 0.7012, - "step": 28133 - }, - { - "epoch": 0.72, - "learning_rate": 1.77675342439792e-06, - "loss": 0.5427, - "step": 28134 - }, - { - "epoch": 0.72, - "learning_rate": 1.7767359971151843e-06, - "loss": 1.125, - "step": 28135 - }, - { - "epoch": 0.72, - "learning_rate": 1.7767185692377371e-06, - "loss": 1.0518, - "step": 28136 - }, - { - "epoch": 0.72, - "learning_rate": 1.7767011407655926e-06, - "loss": 0.9551, - "step": 28137 - }, - { - "epoch": 0.72, - "learning_rate": 1.7766837116987636e-06, - "loss": 0.8174, - "step": 28138 - }, - { - "epoch": 0.72, - "learning_rate": 1.7766662820372635e-06, - "loss": 1.0449, - "step": 28139 - }, - { - "epoch": 0.72, - "learning_rate": 1.7766488517811058e-06, - "loss": 0.918, - "step": 28140 - }, - { - "epoch": 0.72, - "learning_rate": 1.776631420930304e-06, - "loss": 0.9785, - "step": 28141 - }, - { - "epoch": 0.72, - "learning_rate": 1.7766139894848708e-06, - "loss": 0.9043, - "step": 28142 - }, - { - "epoch": 0.72, - "learning_rate": 1.7765965574448204e-06, - "loss": 0.9951, - "step": 28143 - }, - { - "epoch": 0.72, - "learning_rate": 1.7765791248101654e-06, - "loss": 1.0117, - "step": 28144 - }, - { - "epoch": 0.72, - "learning_rate": 1.7765616915809197e-06, - "loss": 0.6462, - "step": 28145 - }, - { - "epoch": 0.72, - "learning_rate": 1.7765442577570965e-06, - "loss": 0.6685, - "step": 28146 - }, - { - "epoch": 0.72, - "learning_rate": 1.7765268233387088e-06, - "loss": 0.8794, - "step": 28147 - }, - { - "epoch": 0.72, - "learning_rate": 1.77650938832577e-06, - "loss": 0.9238, - "step": 28148 - }, - { - "epoch": 0.72, - "learning_rate": 1.776491952718294e-06, - "loss": 0.8516, - "step": 28149 - }, - { - "epoch": 0.72, - "learning_rate": 1.776474516516294e-06, - "loss": 1.0146, - "step": 28150 - }, - { - "epoch": 0.72, - "learning_rate": 1.7764570797197829e-06, - "loss": 1.0898, - "step": 28151 - }, - { - "epoch": 0.72, - "learning_rate": 1.7764396423287744e-06, - "loss": 0.6934, - "step": 28152 - }, - { - "epoch": 0.72, - "learning_rate": 1.7764222043432816e-06, - "loss": 0.8789, - "step": 28153 - }, - { - "epoch": 0.72, - "learning_rate": 1.7764047657633184e-06, - "loss": 0.6484, - "step": 28154 - }, - { - "epoch": 0.72, - "learning_rate": 1.7763873265888974e-06, - "loss": 0.8416, - "step": 28155 - }, - { - "epoch": 0.72, - "learning_rate": 1.7763698868200324e-06, - "loss": 0.7632, - "step": 28156 - }, - { - "epoch": 0.72, - "learning_rate": 1.7763524464567368e-06, - "loss": 0.8838, - "step": 28157 - }, - { - "epoch": 0.72, - "learning_rate": 1.7763350054990238e-06, - "loss": 1.0088, - "step": 28158 - }, - { - "epoch": 0.72, - "learning_rate": 1.7763175639469065e-06, - "loss": 0.7588, - "step": 28159 - }, - { - "epoch": 0.72, - "learning_rate": 1.776300121800399e-06, - "loss": 0.6562, - "step": 28160 - }, - { - "epoch": 0.72, - "learning_rate": 1.776282679059514e-06, - "loss": 1.0059, - "step": 28161 - }, - { - "epoch": 0.72, - "learning_rate": 1.7762652357242649e-06, - "loss": 0.75, - "step": 28162 - }, - { - "epoch": 0.72, - "learning_rate": 1.7762477917946654e-06, - "loss": 0.9248, - "step": 28163 - }, - { - "epoch": 0.72, - "learning_rate": 1.7762303472707286e-06, - "loss": 0.7271, - "step": 28164 - }, - { - "epoch": 0.72, - "learning_rate": 1.7762129021524679e-06, - "loss": 0.7866, - "step": 28165 - }, - { - "epoch": 0.72, - "learning_rate": 1.7761954564398965e-06, - "loss": 0.9268, - "step": 28166 - }, - { - "epoch": 0.72, - "learning_rate": 1.7761780101330281e-06, - "loss": 0.8125, - "step": 28167 - }, - { - "epoch": 0.72, - "learning_rate": 1.776160563231876e-06, - "loss": 0.7979, - "step": 28168 - }, - { - "epoch": 0.72, - "learning_rate": 1.7761431157364533e-06, - "loss": 0.6687, - "step": 28169 - }, - { - "epoch": 0.72, - "learning_rate": 1.7761256676467735e-06, - "loss": 0.6309, - "step": 28170 - }, - { - "epoch": 0.72, - "learning_rate": 1.77610821896285e-06, - "loss": 0.7676, - "step": 28171 - }, - { - "epoch": 0.72, - "learning_rate": 1.776090769684696e-06, - "loss": 0.8496, - "step": 28172 - }, - { - "epoch": 0.72, - "learning_rate": 1.7760733198123253e-06, - "loss": 1.0244, - "step": 28173 - }, - { - "epoch": 0.72, - "learning_rate": 1.7760558693457507e-06, - "loss": 0.9365, - "step": 28174 - }, - { - "epoch": 0.72, - "learning_rate": 1.776038418284986e-06, - "loss": 0.9053, - "step": 28175 - }, - { - "epoch": 0.72, - "learning_rate": 1.7760209666300441e-06, - "loss": 0.9189, - "step": 28176 - }, - { - "epoch": 0.72, - "learning_rate": 1.7760035143809387e-06, - "loss": 0.874, - "step": 28177 - }, - { - "epoch": 0.72, - "learning_rate": 1.7759860615376831e-06, - "loss": 0.9258, - "step": 28178 - }, - { - "epoch": 0.72, - "learning_rate": 1.7759686081002907e-06, - "loss": 0.9111, - "step": 28179 - }, - { - "epoch": 0.72, - "learning_rate": 1.775951154068775e-06, - "loss": 0.8955, - "step": 28180 - }, - { - "epoch": 0.72, - "learning_rate": 1.7759336994431488e-06, - "loss": 0.9609, - "step": 28181 - }, - { - "epoch": 0.72, - "learning_rate": 1.775916244223426e-06, - "loss": 0.8506, - "step": 28182 - }, - { - "epoch": 0.72, - "learning_rate": 1.77589878840962e-06, - "loss": 0.8496, - "step": 28183 - }, - { - "epoch": 0.72, - "learning_rate": 1.7758813320017437e-06, - "loss": 0.7471, - "step": 28184 - }, - { - "epoch": 0.72, - "learning_rate": 1.7758638749998108e-06, - "loss": 1.0146, - "step": 28185 - }, - { - "epoch": 0.72, - "learning_rate": 1.7758464174038345e-06, - "loss": 0.9814, - "step": 28186 - }, - { - "epoch": 0.72, - "learning_rate": 1.7758289592138285e-06, - "loss": 0.9248, - "step": 28187 - }, - { - "epoch": 0.72, - "learning_rate": 1.775811500429806e-06, - "loss": 0.8955, - "step": 28188 - }, - { - "epoch": 0.72, - "learning_rate": 1.77579404105178e-06, - "loss": 0.8662, - "step": 28189 - }, - { - "epoch": 0.72, - "learning_rate": 1.7757765810797647e-06, - "loss": 0.7144, - "step": 28190 - }, - { - "epoch": 0.72, - "learning_rate": 1.7757591205137724e-06, - "loss": 0.7207, - "step": 28191 - }, - { - "epoch": 0.72, - "learning_rate": 1.7757416593538173e-06, - "loss": 0.8057, - "step": 28192 - }, - { - "epoch": 0.72, - "learning_rate": 1.7757241975999121e-06, - "loss": 0.7891, - "step": 28193 - }, - { - "epoch": 0.72, - "learning_rate": 1.775706735252071e-06, - "loss": 1.002, - "step": 28194 - }, - { - "epoch": 0.72, - "learning_rate": 1.775689272310307e-06, - "loss": 1.0654, - "step": 28195 - }, - { - "epoch": 0.72, - "learning_rate": 1.775671808774633e-06, - "loss": 0.6621, - "step": 28196 - }, - { - "epoch": 0.72, - "learning_rate": 1.775654344645063e-06, - "loss": 1.0293, - "step": 28197 - }, - { - "epoch": 0.72, - "learning_rate": 1.77563687992161e-06, - "loss": 0.7451, - "step": 28198 - }, - { - "epoch": 0.72, - "learning_rate": 1.7756194146042876e-06, - "loss": 0.7905, - "step": 28199 - }, - { - "epoch": 0.72, - "learning_rate": 1.775601948693109e-06, - "loss": 0.7178, - "step": 28200 - }, - { - "epoch": 0.72, - "learning_rate": 1.7755844821880877e-06, - "loss": 0.9277, - "step": 28201 - }, - { - "epoch": 0.72, - "learning_rate": 1.775567015089237e-06, - "loss": 0.8984, - "step": 28202 - }, - { - "epoch": 0.72, - "learning_rate": 1.7755495473965703e-06, - "loss": 0.8184, - "step": 28203 - }, - { - "epoch": 0.72, - "learning_rate": 1.7755320791101007e-06, - "loss": 0.7197, - "step": 28204 - }, - { - "epoch": 0.72, - "learning_rate": 1.7755146102298424e-06, - "loss": 0.8149, - "step": 28205 - }, - { - "epoch": 0.72, - "learning_rate": 1.775497140755808e-06, - "loss": 0.9404, - "step": 28206 - }, - { - "epoch": 0.72, - "learning_rate": 1.775479670688011e-06, - "loss": 0.9375, - "step": 28207 - }, - { - "epoch": 0.72, - "learning_rate": 1.7754622000264648e-06, - "loss": 0.9082, - "step": 28208 - }, - { - "epoch": 0.72, - "learning_rate": 1.775444728771183e-06, - "loss": 0.8516, - "step": 28209 - }, - { - "epoch": 0.72, - "learning_rate": 1.775427256922179e-06, - "loss": 0.8516, - "step": 28210 - }, - { - "epoch": 0.72, - "learning_rate": 1.7754097844794656e-06, - "loss": 0.9775, - "step": 28211 - }, - { - "epoch": 0.72, - "learning_rate": 1.7753923114430566e-06, - "loss": 0.9668, - "step": 28212 - }, - { - "epoch": 0.72, - "learning_rate": 1.7753748378129658e-06, - "loss": 0.9346, - "step": 28213 - }, - { - "epoch": 0.72, - "learning_rate": 1.7753573635892059e-06, - "loss": 0.7666, - "step": 28214 - }, - { - "epoch": 0.72, - "learning_rate": 1.7753398887717906e-06, - "loss": 0.8477, - "step": 28215 - }, - { - "epoch": 0.72, - "learning_rate": 1.775322413360733e-06, - "loss": 0.958, - "step": 28216 - }, - { - "epoch": 0.72, - "learning_rate": 1.7753049373560467e-06, - "loss": 0.7095, - "step": 28217 - }, - { - "epoch": 0.72, - "learning_rate": 1.7752874607577453e-06, - "loss": 0.8779, - "step": 28218 - }, - { - "epoch": 0.72, - "learning_rate": 1.7752699835658415e-06, - "loss": 0.8213, - "step": 28219 - }, - { - "epoch": 0.72, - "learning_rate": 1.7752525057803496e-06, - "loss": 0.7275, - "step": 28220 - }, - { - "epoch": 0.72, - "learning_rate": 1.7752350274012824e-06, - "loss": 0.8662, - "step": 28221 - }, - { - "epoch": 0.72, - "learning_rate": 1.7752175484286532e-06, - "loss": 0.8555, - "step": 28222 - }, - { - "epoch": 0.72, - "learning_rate": 1.7752000688624756e-06, - "loss": 0.7153, - "step": 28223 - }, - { - "epoch": 0.72, - "learning_rate": 1.775182588702763e-06, - "loss": 0.877, - "step": 28224 - }, - { - "epoch": 0.72, - "learning_rate": 1.7751651079495287e-06, - "loss": 0.9141, - "step": 28225 - }, - { - "epoch": 0.72, - "learning_rate": 1.775147626602786e-06, - "loss": 0.6384, - "step": 28226 - }, - { - "epoch": 0.72, - "learning_rate": 1.7751301446625488e-06, - "loss": 0.8184, - "step": 28227 - }, - { - "epoch": 0.72, - "learning_rate": 1.7751126621288298e-06, - "loss": 0.8242, - "step": 28228 - }, - { - "epoch": 0.72, - "learning_rate": 1.7750951790016425e-06, - "loss": 0.8506, - "step": 28229 - }, - { - "epoch": 0.72, - "learning_rate": 1.7750776952810009e-06, - "loss": 0.793, - "step": 28230 - }, - { - "epoch": 0.72, - "learning_rate": 1.7750602109669178e-06, - "loss": 0.9346, - "step": 28231 - }, - { - "epoch": 0.72, - "learning_rate": 1.7750427260594068e-06, - "loss": 0.8994, - "step": 28232 - }, - { - "epoch": 0.72, - "learning_rate": 1.7750252405584808e-06, - "loss": 0.7185, - "step": 28233 - }, - { - "epoch": 0.72, - "learning_rate": 1.775007754464154e-06, - "loss": 0.8794, - "step": 28234 - }, - { - "epoch": 0.72, - "learning_rate": 1.7749902677764394e-06, - "loss": 0.8545, - "step": 28235 - }, - { - "epoch": 0.72, - "learning_rate": 1.7749727804953503e-06, - "loss": 0.8115, - "step": 28236 - }, - { - "epoch": 0.72, - "learning_rate": 1.7749552926209001e-06, - "loss": 0.8887, - "step": 28237 - }, - { - "epoch": 0.72, - "learning_rate": 1.7749378041531023e-06, - "loss": 0.792, - "step": 28238 - }, - { - "epoch": 0.72, - "learning_rate": 1.7749203150919705e-06, - "loss": 0.915, - "step": 28239 - }, - { - "epoch": 0.72, - "learning_rate": 1.7749028254375174e-06, - "loss": 0.7847, - "step": 28240 - }, - { - "epoch": 0.72, - "learning_rate": 1.774885335189757e-06, - "loss": 0.8291, - "step": 28241 - }, - { - "epoch": 0.72, - "learning_rate": 1.774867844348703e-06, - "loss": 0.8501, - "step": 28242 - }, - { - "epoch": 0.72, - "learning_rate": 1.7748503529143677e-06, - "loss": 0.7437, - "step": 28243 - }, - { - "epoch": 0.72, - "learning_rate": 1.7748328608867653e-06, - "loss": 0.9014, - "step": 28244 - }, - { - "epoch": 0.72, - "learning_rate": 1.774815368265909e-06, - "loss": 0.6998, - "step": 28245 - }, - { - "epoch": 0.72, - "learning_rate": 1.7747978750518123e-06, - "loss": 0.8535, - "step": 28246 - }, - { - "epoch": 0.72, - "learning_rate": 1.7747803812444887e-06, - "loss": 1.0498, - "step": 28247 - }, - { - "epoch": 0.72, - "learning_rate": 1.7747628868439508e-06, - "loss": 0.8274, - "step": 28248 - }, - { - "epoch": 0.72, - "learning_rate": 1.7747453918502129e-06, - "loss": 0.9053, - "step": 28249 - }, - { - "epoch": 0.72, - "learning_rate": 1.774727896263288e-06, - "loss": 0.9238, - "step": 28250 - }, - { - "epoch": 0.72, - "learning_rate": 1.7747104000831898e-06, - "loss": 0.9004, - "step": 28251 - }, - { - "epoch": 0.72, - "learning_rate": 1.7746929033099312e-06, - "loss": 0.7935, - "step": 28252 - }, - { - "epoch": 0.72, - "learning_rate": 1.774675405943526e-06, - "loss": 0.8911, - "step": 28253 - }, - { - "epoch": 0.72, - "learning_rate": 1.7746579079839874e-06, - "loss": 0.8867, - "step": 28254 - }, - { - "epoch": 0.72, - "learning_rate": 1.774640409431329e-06, - "loss": 0.897, - "step": 28255 - }, - { - "epoch": 0.72, - "learning_rate": 1.774622910285564e-06, - "loss": 1.1309, - "step": 28256 - }, - { - "epoch": 0.72, - "learning_rate": 1.7746054105467058e-06, - "loss": 0.8926, - "step": 28257 - }, - { - "epoch": 0.72, - "learning_rate": 1.7745879102147679e-06, - "loss": 1.0752, - "step": 28258 - }, - { - "epoch": 0.72, - "learning_rate": 1.7745704092897634e-06, - "loss": 0.9492, - "step": 28259 - }, - { - "epoch": 0.72, - "learning_rate": 1.7745529077717066e-06, - "loss": 0.7939, - "step": 28260 - }, - { - "epoch": 0.72, - "learning_rate": 1.7745354056606096e-06, - "loss": 0.7329, - "step": 28261 - }, - { - "epoch": 0.72, - "learning_rate": 1.7745179029564868e-06, - "loss": 0.9189, - "step": 28262 - }, - { - "epoch": 0.72, - "learning_rate": 1.774500399659351e-06, - "loss": 1.0811, - "step": 28263 - }, - { - "epoch": 0.72, - "learning_rate": 1.7744828957692163e-06, - "loss": 0.7529, - "step": 28264 - }, - { - "epoch": 0.72, - "learning_rate": 1.7744653912860952e-06, - "loss": 0.9541, - "step": 28265 - }, - { - "epoch": 0.72, - "learning_rate": 1.7744478862100019e-06, - "loss": 0.9668, - "step": 28266 - }, - { - "epoch": 0.72, - "learning_rate": 1.7744303805409491e-06, - "loss": 1.1348, - "step": 28267 - }, - { - "epoch": 0.72, - "learning_rate": 1.7744128742789508e-06, - "loss": 0.5928, - "step": 28268 - }, - { - "epoch": 0.72, - "learning_rate": 1.7743953674240202e-06, - "loss": 0.8936, - "step": 28269 - }, - { - "epoch": 0.72, - "learning_rate": 1.7743778599761705e-06, - "loss": 0.7432, - "step": 28270 - }, - { - "epoch": 0.72, - "learning_rate": 1.7743603519354155e-06, - "loss": 0.8252, - "step": 28271 - }, - { - "epoch": 0.72, - "learning_rate": 1.7743428433017682e-06, - "loss": 1.0215, - "step": 28272 - }, - { - "epoch": 0.72, - "learning_rate": 1.7743253340752422e-06, - "loss": 0.7866, - "step": 28273 - }, - { - "epoch": 0.72, - "learning_rate": 1.7743078242558509e-06, - "loss": 0.8994, - "step": 28274 - }, - { - "epoch": 0.72, - "learning_rate": 1.7742903138436078e-06, - "loss": 0.8477, - "step": 28275 - }, - { - "epoch": 0.72, - "learning_rate": 1.7742728028385261e-06, - "loss": 0.8301, - "step": 28276 - }, - { - "epoch": 0.72, - "learning_rate": 1.7742552912406196e-06, - "loss": 0.8867, - "step": 28277 - }, - { - "epoch": 0.72, - "learning_rate": 1.7742377790499013e-06, - "loss": 0.8604, - "step": 28278 - }, - { - "epoch": 0.72, - "learning_rate": 1.7742202662663846e-06, - "loss": 0.9385, - "step": 28279 - }, - { - "epoch": 0.72, - "learning_rate": 1.7742027528900829e-06, - "loss": 0.96, - "step": 28280 - }, - { - "epoch": 0.72, - "learning_rate": 1.77418523892101e-06, - "loss": 0.9072, - "step": 28281 - }, - { - "epoch": 0.72, - "learning_rate": 1.7741677243591791e-06, - "loss": 0.8623, - "step": 28282 - }, - { - "epoch": 0.72, - "learning_rate": 1.7741502092046034e-06, - "loss": 0.7568, - "step": 28283 - }, - { - "epoch": 0.72, - "learning_rate": 1.7741326934572964e-06, - "loss": 0.8867, - "step": 28284 - }, - { - "epoch": 0.72, - "learning_rate": 1.774115177117272e-06, - "loss": 1.084, - "step": 28285 - }, - { - "epoch": 0.72, - "learning_rate": 1.7740976601845427e-06, - "loss": 0.6455, - "step": 28286 - }, - { - "epoch": 0.73, - "learning_rate": 1.7740801426591228e-06, - "loss": 0.9033, - "step": 28287 - }, - { - "epoch": 0.73, - "learning_rate": 1.774062624541025e-06, - "loss": 0.6909, - "step": 28288 - }, - { - "epoch": 0.73, - "learning_rate": 1.7740451058302633e-06, - "loss": 0.874, - "step": 28289 - }, - { - "epoch": 0.73, - "learning_rate": 1.7740275865268509e-06, - "loss": 0.8682, - "step": 28290 - }, - { - "epoch": 0.73, - "learning_rate": 1.7740100666308009e-06, - "loss": 0.7368, - "step": 28291 - }, - { - "epoch": 0.73, - "learning_rate": 1.7739925461421272e-06, - "loss": 0.9834, - "step": 28292 - }, - { - "epoch": 0.73, - "learning_rate": 1.7739750250608428e-06, - "loss": 1.0488, - "step": 28293 - }, - { - "epoch": 0.73, - "learning_rate": 1.7739575033869617e-06, - "loss": 0.8477, - "step": 28294 - }, - { - "epoch": 0.73, - "learning_rate": 1.7739399811204965e-06, - "loss": 0.917, - "step": 28295 - }, - { - "epoch": 0.73, - "learning_rate": 1.773922458261461e-06, - "loss": 0.8955, - "step": 28296 - }, - { - "epoch": 0.73, - "learning_rate": 1.773904934809869e-06, - "loss": 0.8086, - "step": 28297 - }, - { - "epoch": 0.73, - "learning_rate": 1.7738874107657336e-06, - "loss": 0.7295, - "step": 28298 - }, - { - "epoch": 0.73, - "learning_rate": 1.7738698861290678e-06, - "loss": 1.0371, - "step": 28299 - }, - { - "epoch": 0.73, - "learning_rate": 1.7738523608998857e-06, - "loss": 0.7632, - "step": 28300 - }, - { - "epoch": 0.73, - "learning_rate": 1.7738348350782003e-06, - "loss": 0.5583, - "step": 28301 - }, - { - "epoch": 0.73, - "learning_rate": 1.7738173086640253e-06, - "loss": 0.5886, - "step": 28302 - }, - { - "epoch": 0.73, - "learning_rate": 1.773799781657374e-06, - "loss": 1.0371, - "step": 28303 - }, - { - "epoch": 0.73, - "learning_rate": 1.7737822540582596e-06, - "loss": 0.7471, - "step": 28304 - }, - { - "epoch": 0.73, - "learning_rate": 1.7737647258666959e-06, - "loss": 0.8945, - "step": 28305 - }, - { - "epoch": 0.73, - "learning_rate": 1.773747197082696e-06, - "loss": 0.8262, - "step": 28306 - }, - { - "epoch": 0.73, - "learning_rate": 1.7737296677062734e-06, - "loss": 0.8975, - "step": 28307 - }, - { - "epoch": 0.73, - "learning_rate": 1.7737121377374416e-06, - "loss": 0.5657, - "step": 28308 - }, - { - "epoch": 0.73, - "learning_rate": 1.773694607176214e-06, - "loss": 0.7314, - "step": 28309 - }, - { - "epoch": 0.73, - "learning_rate": 1.7736770760226043e-06, - "loss": 0.6685, - "step": 28310 - }, - { - "epoch": 0.73, - "learning_rate": 1.7736595442766253e-06, - "loss": 0.6243, - "step": 28311 - }, - { - "epoch": 0.73, - "learning_rate": 1.7736420119382909e-06, - "loss": 0.7432, - "step": 28312 - }, - { - "epoch": 0.73, - "learning_rate": 1.7736244790076142e-06, - "loss": 0.958, - "step": 28313 - }, - { - "epoch": 0.73, - "learning_rate": 1.7736069454846087e-06, - "loss": 0.9297, - "step": 28314 - }, - { - "epoch": 0.73, - "learning_rate": 1.7735894113692882e-06, - "loss": 0.9932, - "step": 28315 - }, - { - "epoch": 0.73, - "learning_rate": 1.7735718766616658e-06, - "loss": 0.7324, - "step": 28316 - }, - { - "epoch": 0.73, - "learning_rate": 1.773554341361755e-06, - "loss": 0.7759, - "step": 28317 - }, - { - "epoch": 0.73, - "learning_rate": 1.7735368054695695e-06, - "loss": 0.7056, - "step": 28318 - }, - { - "epoch": 0.73, - "learning_rate": 1.773519268985122e-06, - "loss": 1.0518, - "step": 28319 - }, - { - "epoch": 0.73, - "learning_rate": 1.7735017319084266e-06, - "loss": 0.8018, - "step": 28320 - }, - { - "epoch": 0.73, - "learning_rate": 1.7734841942394963e-06, - "loss": 0.9678, - "step": 28321 - }, - { - "epoch": 0.73, - "learning_rate": 1.773466655978345e-06, - "loss": 0.7524, - "step": 28322 - }, - { - "epoch": 0.73, - "learning_rate": 1.7734491171249854e-06, - "loss": 0.8916, - "step": 28323 - }, - { - "epoch": 0.73, - "learning_rate": 1.7734315776794317e-06, - "loss": 1.0098, - "step": 28324 - }, - { - "epoch": 0.73, - "learning_rate": 1.7734140376416972e-06, - "loss": 0.7749, - "step": 28325 - }, - { - "epoch": 0.73, - "learning_rate": 1.7733964970117947e-06, - "loss": 0.8696, - "step": 28326 - }, - { - "epoch": 0.73, - "learning_rate": 1.7733789557897384e-06, - "loss": 0.9238, - "step": 28327 - }, - { - "epoch": 0.73, - "learning_rate": 1.7733614139755413e-06, - "loss": 0.9741, - "step": 28328 - }, - { - "epoch": 0.73, - "learning_rate": 1.7733438715692168e-06, - "loss": 1.0068, - "step": 28329 - }, - { - "epoch": 0.73, - "learning_rate": 1.7733263285707785e-06, - "loss": 0.9609, - "step": 28330 - }, - { - "epoch": 0.73, - "learning_rate": 1.77330878498024e-06, - "loss": 0.6895, - "step": 28331 - }, - { - "epoch": 0.73, - "learning_rate": 1.773291240797614e-06, - "loss": 0.604, - "step": 28332 - }, - { - "epoch": 0.73, - "learning_rate": 1.773273696022915e-06, - "loss": 0.7949, - "step": 28333 - }, - { - "epoch": 0.73, - "learning_rate": 1.7732561506561555e-06, - "loss": 0.8672, - "step": 28334 - }, - { - "epoch": 0.73, - "learning_rate": 1.7732386046973496e-06, - "loss": 0.6846, - "step": 28335 - }, - { - "epoch": 0.73, - "learning_rate": 1.7732210581465104e-06, - "loss": 0.9883, - "step": 28336 - }, - { - "epoch": 0.73, - "learning_rate": 1.7732035110036513e-06, - "loss": 0.8428, - "step": 28337 - }, - { - "epoch": 0.73, - "learning_rate": 1.7731859632687858e-06, - "loss": 0.7925, - "step": 28338 - }, - { - "epoch": 0.73, - "learning_rate": 1.7731684149419275e-06, - "loss": 0.8057, - "step": 28339 - }, - { - "epoch": 0.73, - "learning_rate": 1.7731508660230896e-06, - "loss": 1.0723, - "step": 28340 - }, - { - "epoch": 0.73, - "learning_rate": 1.7731333165122857e-06, - "loss": 1.0376, - "step": 28341 - }, - { - "epoch": 0.73, - "learning_rate": 1.773115766409529e-06, - "loss": 1.1201, - "step": 28342 - }, - { - "epoch": 0.73, - "learning_rate": 1.7730982157148333e-06, - "loss": 0.7041, - "step": 28343 - }, - { - "epoch": 0.73, - "learning_rate": 1.7730806644282118e-06, - "loss": 0.8037, - "step": 28344 - }, - { - "epoch": 0.73, - "learning_rate": 1.773063112549678e-06, - "loss": 0.8291, - "step": 28345 - }, - { - "epoch": 0.73, - "learning_rate": 1.7730455600792453e-06, - "loss": 0.9854, - "step": 28346 - }, - { - "epoch": 0.73, - "learning_rate": 1.773028007016927e-06, - "loss": 0.9102, - "step": 28347 - }, - { - "epoch": 0.73, - "learning_rate": 1.773010453362737e-06, - "loss": 0.8535, - "step": 28348 - }, - { - "epoch": 0.73, - "learning_rate": 1.772992899116688e-06, - "loss": 0.8926, - "step": 28349 - }, - { - "epoch": 0.73, - "learning_rate": 1.7729753442787945e-06, - "loss": 0.7061, - "step": 28350 - }, - { - "epoch": 0.73, - "learning_rate": 1.7729577888490688e-06, - "loss": 0.8301, - "step": 28351 - }, - { - "epoch": 0.73, - "learning_rate": 1.7729402328275252e-06, - "loss": 0.6719, - "step": 28352 - }, - { - "epoch": 0.73, - "learning_rate": 1.7729226762141764e-06, - "loss": 0.7588, - "step": 28353 - }, - { - "epoch": 0.73, - "learning_rate": 1.7729051190090364e-06, - "loss": 0.8232, - "step": 28354 - }, - { - "epoch": 0.73, - "learning_rate": 1.7728875612121187e-06, - "loss": 0.8071, - "step": 28355 - }, - { - "epoch": 0.73, - "learning_rate": 1.7728700028234365e-06, - "loss": 1.0391, - "step": 28356 - }, - { - "epoch": 0.73, - "learning_rate": 1.7728524438430032e-06, - "loss": 1.0098, - "step": 28357 - }, - { - "epoch": 0.73, - "learning_rate": 1.7728348842708325e-06, - "loss": 0.8418, - "step": 28358 - }, - { - "epoch": 0.73, - "learning_rate": 1.7728173241069372e-06, - "loss": 0.9316, - "step": 28359 - }, - { - "epoch": 0.73, - "learning_rate": 1.7727997633513314e-06, - "loss": 0.7993, - "step": 28360 - }, - { - "epoch": 0.73, - "learning_rate": 1.7727822020040287e-06, - "loss": 0.9043, - "step": 28361 - }, - { - "epoch": 0.73, - "learning_rate": 1.7727646400650418e-06, - "loss": 0.7803, - "step": 28362 - }, - { - "epoch": 0.73, - "learning_rate": 1.7727470775343846e-06, - "loss": 0.7925, - "step": 28363 - }, - { - "epoch": 0.73, - "learning_rate": 1.7727295144120706e-06, - "loss": 0.6357, - "step": 28364 - }, - { - "epoch": 0.73, - "learning_rate": 1.7727119506981133e-06, - "loss": 0.9629, - "step": 28365 - }, - { - "epoch": 0.73, - "learning_rate": 1.7726943863925258e-06, - "loss": 0.834, - "step": 28366 - }, - { - "epoch": 0.73, - "learning_rate": 1.7726768214953217e-06, - "loss": 1.0693, - "step": 28367 - }, - { - "epoch": 0.73, - "learning_rate": 1.7726592560065145e-06, - "loss": 0.635, - "step": 28368 - }, - { - "epoch": 0.73, - "learning_rate": 1.7726416899261176e-06, - "loss": 0.9717, - "step": 28369 - }, - { - "epoch": 0.73, - "learning_rate": 1.7726241232541447e-06, - "loss": 0.8984, - "step": 28370 - }, - { - "epoch": 0.73, - "learning_rate": 1.772606555990609e-06, - "loss": 0.6272, - "step": 28371 - }, - { - "epoch": 0.73, - "learning_rate": 1.7725889881355238e-06, - "loss": 0.7471, - "step": 28372 - }, - { - "epoch": 0.73, - "learning_rate": 1.7725714196889029e-06, - "loss": 0.8242, - "step": 28373 - }, - { - "epoch": 0.73, - "learning_rate": 1.7725538506507594e-06, - "loss": 0.7251, - "step": 28374 - }, - { - "epoch": 0.73, - "learning_rate": 1.7725362810211072e-06, - "loss": 0.8721, - "step": 28375 - }, - { - "epoch": 0.73, - "learning_rate": 1.7725187107999592e-06, - "loss": 0.892, - "step": 28376 - }, - { - "epoch": 0.73, - "learning_rate": 1.7725011399873293e-06, - "loss": 0.8066, - "step": 28377 - }, - { - "epoch": 0.73, - "learning_rate": 1.772483568583231e-06, - "loss": 0.6992, - "step": 28378 - }, - { - "epoch": 0.73, - "learning_rate": 1.7724659965876773e-06, - "loss": 0.9365, - "step": 28379 - }, - { - "epoch": 0.73, - "learning_rate": 1.772448424000682e-06, - "loss": 0.9917, - "step": 28380 - }, - { - "epoch": 0.73, - "learning_rate": 1.7724308508222584e-06, - "loss": 0.7612, - "step": 28381 - }, - { - "epoch": 0.73, - "learning_rate": 1.7724132770524199e-06, - "loss": 0.9268, - "step": 28382 - }, - { - "epoch": 0.73, - "learning_rate": 1.77239570269118e-06, - "loss": 0.7739, - "step": 28383 - }, - { - "epoch": 0.73, - "learning_rate": 1.7723781277385523e-06, - "loss": 0.9844, - "step": 28384 - }, - { - "epoch": 0.73, - "learning_rate": 1.7723605521945504e-06, - "loss": 1.1016, - "step": 28385 - }, - { - "epoch": 0.73, - "learning_rate": 1.7723429760591875e-06, - "loss": 1.0674, - "step": 28386 - }, - { - "epoch": 0.73, - "learning_rate": 1.7723253993324772e-06, - "loss": 0.8096, - "step": 28387 - }, - { - "epoch": 0.73, - "learning_rate": 1.7723078220144325e-06, - "loss": 0.8301, - "step": 28388 - }, - { - "epoch": 0.73, - "learning_rate": 1.7722902441050674e-06, - "loss": 0.6316, - "step": 28389 - }, - { - "epoch": 0.73, - "learning_rate": 1.772272665604395e-06, - "loss": 0.665, - "step": 28390 - }, - { - "epoch": 0.73, - "learning_rate": 1.772255086512429e-06, - "loss": 0.9673, - "step": 28391 - }, - { - "epoch": 0.73, - "learning_rate": 1.772237506829183e-06, - "loss": 0.9551, - "step": 28392 - }, - { - "epoch": 0.73, - "learning_rate": 1.7722199265546702e-06, - "loss": 1.0098, - "step": 28393 - }, - { - "epoch": 0.73, - "learning_rate": 1.772202345688904e-06, - "loss": 0.6725, - "step": 28394 - }, - { - "epoch": 0.73, - "learning_rate": 1.772184764231898e-06, - "loss": 0.8462, - "step": 28395 - }, - { - "epoch": 0.73, - "learning_rate": 1.7721671821836659e-06, - "loss": 0.8555, - "step": 28396 - }, - { - "epoch": 0.73, - "learning_rate": 1.7721495995442205e-06, - "loss": 0.6299, - "step": 28397 - }, - { - "epoch": 0.73, - "learning_rate": 1.7721320163135759e-06, - "loss": 0.6807, - "step": 28398 - }, - { - "epoch": 0.73, - "learning_rate": 1.7721144324917452e-06, - "loss": 0.874, - "step": 28399 - }, - { - "epoch": 0.73, - "learning_rate": 1.772096848078742e-06, - "loss": 0.7529, - "step": 28400 - }, - { - "epoch": 0.73, - "learning_rate": 1.7720792630745796e-06, - "loss": 0.7061, - "step": 28401 - }, - { - "epoch": 0.73, - "learning_rate": 1.7720616774792717e-06, - "loss": 0.9189, - "step": 28402 - }, - { - "epoch": 0.73, - "learning_rate": 1.7720440912928319e-06, - "loss": 0.752, - "step": 28403 - }, - { - "epoch": 0.73, - "learning_rate": 1.7720265045152734e-06, - "loss": 1.0293, - "step": 28404 - }, - { - "epoch": 0.73, - "learning_rate": 1.7720089171466093e-06, - "loss": 0.7578, - "step": 28405 - }, - { - "epoch": 0.73, - "learning_rate": 1.7719913291868537e-06, - "loss": 0.7749, - "step": 28406 - }, - { - "epoch": 0.73, - "learning_rate": 1.77197374063602e-06, - "loss": 0.957, - "step": 28407 - }, - { - "epoch": 0.73, - "learning_rate": 1.7719561514941215e-06, - "loss": 0.4404, - "step": 28408 - }, - { - "epoch": 0.73, - "learning_rate": 1.7719385617611713e-06, - "loss": 0.709, - "step": 28409 - }, - { - "epoch": 0.73, - "learning_rate": 1.7719209714371836e-06, - "loss": 0.7334, - "step": 28410 - }, - { - "epoch": 0.73, - "learning_rate": 1.7719033805221716e-06, - "loss": 0.6255, - "step": 28411 - }, - { - "epoch": 0.73, - "learning_rate": 1.7718857890161482e-06, - "loss": 0.7327, - "step": 28412 - }, - { - "epoch": 0.73, - "learning_rate": 1.7718681969191275e-06, - "loss": 0.9404, - "step": 28413 - }, - { - "epoch": 0.73, - "learning_rate": 1.771850604231123e-06, - "loss": 0.9766, - "step": 28414 - }, - { - "epoch": 0.73, - "learning_rate": 1.771833010952148e-06, - "loss": 0.7466, - "step": 28415 - }, - { - "epoch": 0.73, - "learning_rate": 1.771815417082216e-06, - "loss": 1.0039, - "step": 28416 - }, - { - "epoch": 0.73, - "learning_rate": 1.7717978226213402e-06, - "loss": 0.7783, - "step": 28417 - }, - { - "epoch": 0.73, - "learning_rate": 1.7717802275695344e-06, - "loss": 1.0586, - "step": 28418 - }, - { - "epoch": 0.73, - "learning_rate": 1.771762631926812e-06, - "loss": 0.7246, - "step": 28419 - }, - { - "epoch": 0.73, - "learning_rate": 1.7717450356931863e-06, - "loss": 0.7666, - "step": 28420 - }, - { - "epoch": 0.73, - "learning_rate": 1.771727438868671e-06, - "loss": 0.7578, - "step": 28421 - }, - { - "epoch": 0.73, - "learning_rate": 1.7717098414532794e-06, - "loss": 0.6885, - "step": 28422 - }, - { - "epoch": 0.73, - "learning_rate": 1.771692243447025e-06, - "loss": 1.0391, - "step": 28423 - }, - { - "epoch": 0.73, - "learning_rate": 1.7716746448499216e-06, - "loss": 0.9453, - "step": 28424 - }, - { - "epoch": 0.73, - "learning_rate": 1.7716570456619823e-06, - "loss": 0.8105, - "step": 28425 - }, - { - "epoch": 0.73, - "learning_rate": 1.7716394458832207e-06, - "loss": 0.7129, - "step": 28426 - }, - { - "epoch": 0.73, - "learning_rate": 1.7716218455136501e-06, - "loss": 0.7163, - "step": 28427 - }, - { - "epoch": 0.73, - "learning_rate": 1.771604244553284e-06, - "loss": 0.957, - "step": 28428 - }, - { - "epoch": 0.73, - "learning_rate": 1.7715866430021365e-06, - "loss": 0.7842, - "step": 28429 - }, - { - "epoch": 0.73, - "learning_rate": 1.7715690408602204e-06, - "loss": 0.5476, - "step": 28430 - }, - { - "epoch": 0.73, - "learning_rate": 1.7715514381275493e-06, - "loss": 0.8564, - "step": 28431 - }, - { - "epoch": 0.73, - "learning_rate": 1.7715338348041367e-06, - "loss": 0.9736, - "step": 28432 - }, - { - "epoch": 0.73, - "learning_rate": 1.7715162308899963e-06, - "loss": 0.6665, - "step": 28433 - }, - { - "epoch": 0.73, - "learning_rate": 1.7714986263851412e-06, - "loss": 1.0205, - "step": 28434 - }, - { - "epoch": 0.73, - "learning_rate": 1.7714810212895853e-06, - "loss": 0.9463, - "step": 28435 - }, - { - "epoch": 0.73, - "learning_rate": 1.7714634156033416e-06, - "loss": 1.0762, - "step": 28436 - }, - { - "epoch": 0.73, - "learning_rate": 1.771445809326424e-06, - "loss": 1.0801, - "step": 28437 - }, - { - "epoch": 0.73, - "learning_rate": 1.771428202458846e-06, - "loss": 0.874, - "step": 28438 - }, - { - "epoch": 0.73, - "learning_rate": 1.7714105950006203e-06, - "loss": 0.9502, - "step": 28439 - }, - { - "epoch": 0.73, - "learning_rate": 1.7713929869517612e-06, - "loss": 0.7793, - "step": 28440 - }, - { - "epoch": 0.73, - "learning_rate": 1.7713753783122821e-06, - "loss": 0.4625, - "step": 28441 - }, - { - "epoch": 0.73, - "learning_rate": 1.7713577690821966e-06, - "loss": 0.8457, - "step": 28442 - }, - { - "epoch": 0.73, - "learning_rate": 1.7713401592615176e-06, - "loss": 0.5254, - "step": 28443 - }, - { - "epoch": 0.73, - "learning_rate": 1.771322548850259e-06, - "loss": 0.8215, - "step": 28444 - }, - { - "epoch": 0.73, - "learning_rate": 1.7713049378484343e-06, - "loss": 0.9238, - "step": 28445 - }, - { - "epoch": 0.73, - "learning_rate": 1.7712873262560564e-06, - "loss": 0.7319, - "step": 28446 - }, - { - "epoch": 0.73, - "learning_rate": 1.7712697140731397e-06, - "loss": 0.6562, - "step": 28447 - }, - { - "epoch": 0.73, - "learning_rate": 1.771252101299697e-06, - "loss": 0.73, - "step": 28448 - }, - { - "epoch": 0.73, - "learning_rate": 1.7712344879357422e-06, - "loss": 1.0195, - "step": 28449 - }, - { - "epoch": 0.73, - "learning_rate": 1.7712168739812885e-06, - "loss": 0.4001, - "step": 28450 - }, - { - "epoch": 0.73, - "learning_rate": 1.7711992594363497e-06, - "loss": 0.9062, - "step": 28451 - }, - { - "epoch": 0.73, - "learning_rate": 1.771181644300939e-06, - "loss": 0.7422, - "step": 28452 - }, - { - "epoch": 0.73, - "learning_rate": 1.7711640285750698e-06, - "loss": 0.8389, - "step": 28453 - }, - { - "epoch": 0.73, - "learning_rate": 1.7711464122587557e-06, - "loss": 0.9111, - "step": 28454 - }, - { - "epoch": 0.73, - "learning_rate": 1.7711287953520106e-06, - "loss": 0.9092, - "step": 28455 - }, - { - "epoch": 0.73, - "learning_rate": 1.7711111778548475e-06, - "loss": 0.9053, - "step": 28456 - }, - { - "epoch": 0.73, - "learning_rate": 1.77109355976728e-06, - "loss": 0.645, - "step": 28457 - }, - { - "epoch": 0.73, - "learning_rate": 1.7710759410893217e-06, - "loss": 0.5415, - "step": 28458 - }, - { - "epoch": 0.73, - "learning_rate": 1.7710583218209858e-06, - "loss": 0.9717, - "step": 28459 - }, - { - "epoch": 0.73, - "learning_rate": 1.7710407019622862e-06, - "loss": 0.7129, - "step": 28460 - }, - { - "epoch": 0.73, - "learning_rate": 1.7710230815132362e-06, - "loss": 0.9863, - "step": 28461 - }, - { - "epoch": 0.73, - "learning_rate": 1.7710054604738493e-06, - "loss": 0.9189, - "step": 28462 - }, - { - "epoch": 0.73, - "learning_rate": 1.7709878388441388e-06, - "loss": 0.8799, - "step": 28463 - }, - { - "epoch": 0.73, - "learning_rate": 1.7709702166241185e-06, - "loss": 0.8838, - "step": 28464 - }, - { - "epoch": 0.73, - "learning_rate": 1.7709525938138015e-06, - "loss": 0.9297, - "step": 28465 - }, - { - "epoch": 0.73, - "learning_rate": 1.7709349704132018e-06, - "loss": 0.9175, - "step": 28466 - }, - { - "epoch": 0.73, - "learning_rate": 1.7709173464223326e-06, - "loss": 0.8789, - "step": 28467 - }, - { - "epoch": 0.73, - "learning_rate": 1.7708997218412075e-06, - "loss": 0.7129, - "step": 28468 - }, - { - "epoch": 0.73, - "learning_rate": 1.77088209666984e-06, - "loss": 0.6321, - "step": 28469 - }, - { - "epoch": 0.73, - "learning_rate": 1.7708644709082433e-06, - "loss": 0.9062, - "step": 28470 - }, - { - "epoch": 0.73, - "learning_rate": 1.7708468445564311e-06, - "loss": 0.7183, - "step": 28471 - }, - { - "epoch": 0.73, - "learning_rate": 1.770829217614417e-06, - "loss": 0.834, - "step": 28472 - }, - { - "epoch": 0.73, - "learning_rate": 1.7708115900822142e-06, - "loss": 1.0625, - "step": 28473 - }, - { - "epoch": 0.73, - "learning_rate": 1.7707939619598368e-06, - "loss": 0.9512, - "step": 28474 - }, - { - "epoch": 0.73, - "learning_rate": 1.770776333247298e-06, - "loss": 0.8174, - "step": 28475 - }, - { - "epoch": 0.73, - "learning_rate": 1.7707587039446106e-06, - "loss": 0.7578, - "step": 28476 - }, - { - "epoch": 0.73, - "learning_rate": 1.7707410740517893e-06, - "loss": 0.7881, - "step": 28477 - }, - { - "epoch": 0.73, - "learning_rate": 1.7707234435688464e-06, - "loss": 0.7932, - "step": 28478 - }, - { - "epoch": 0.73, - "learning_rate": 1.7707058124957963e-06, - "loss": 0.8525, - "step": 28479 - }, - { - "epoch": 0.73, - "learning_rate": 1.7706881808326524e-06, - "loss": 0.8369, - "step": 28480 - }, - { - "epoch": 0.73, - "learning_rate": 1.7706705485794279e-06, - "loss": 0.8154, - "step": 28481 - }, - { - "epoch": 0.73, - "learning_rate": 1.7706529157361362e-06, - "loss": 0.7461, - "step": 28482 - }, - { - "epoch": 0.73, - "learning_rate": 1.7706352823027913e-06, - "loss": 0.8223, - "step": 28483 - }, - { - "epoch": 0.73, - "learning_rate": 1.7706176482794062e-06, - "loss": 0.8735, - "step": 28484 - }, - { - "epoch": 0.73, - "learning_rate": 1.7706000136659945e-06, - "loss": 0.8359, - "step": 28485 - }, - { - "epoch": 0.73, - "learning_rate": 1.7705823784625698e-06, - "loss": 1.0166, - "step": 28486 - }, - { - "epoch": 0.73, - "learning_rate": 1.770564742669146e-06, - "loss": 0.9404, - "step": 28487 - }, - { - "epoch": 0.73, - "learning_rate": 1.7705471062857358e-06, - "loss": 0.8887, - "step": 28488 - }, - { - "epoch": 0.73, - "learning_rate": 1.7705294693123532e-06, - "loss": 0.7202, - "step": 28489 - }, - { - "epoch": 0.73, - "learning_rate": 1.7705118317490118e-06, - "loss": 0.7129, - "step": 28490 - }, - { - "epoch": 0.73, - "learning_rate": 1.7704941935957244e-06, - "loss": 1.0273, - "step": 28491 - }, - { - "epoch": 0.73, - "learning_rate": 1.7704765548525055e-06, - "loss": 0.9038, - "step": 28492 - }, - { - "epoch": 0.73, - "learning_rate": 1.7704589155193684e-06, - "loss": 0.8545, - "step": 28493 - }, - { - "epoch": 0.73, - "learning_rate": 1.7704412755963255e-06, - "loss": 0.9336, - "step": 28494 - }, - { - "epoch": 0.73, - "learning_rate": 1.770423635083392e-06, - "loss": 0.7988, - "step": 28495 - }, - { - "epoch": 0.73, - "learning_rate": 1.77040599398058e-06, - "loss": 0.9619, - "step": 28496 - }, - { - "epoch": 0.73, - "learning_rate": 1.7703883522879037e-06, - "loss": 0.9668, - "step": 28497 - }, - { - "epoch": 0.73, - "learning_rate": 1.7703707100053764e-06, - "loss": 0.8955, - "step": 28498 - }, - { - "epoch": 0.73, - "learning_rate": 1.770353067133012e-06, - "loss": 0.8965, - "step": 28499 - }, - { - "epoch": 0.73, - "learning_rate": 1.7703354236708235e-06, - "loss": 0.8369, - "step": 28500 - }, - { - "epoch": 0.73, - "learning_rate": 1.7703177796188243e-06, - "loss": 0.9482, - "step": 28501 - }, - { - "epoch": 0.73, - "learning_rate": 1.7703001349770284e-06, - "loss": 0.8564, - "step": 28502 - }, - { - "epoch": 0.73, - "learning_rate": 1.770282489745449e-06, - "loss": 0.7803, - "step": 28503 - }, - { - "epoch": 0.73, - "learning_rate": 1.7702648439240999e-06, - "loss": 0.7285, - "step": 28504 - }, - { - "epoch": 0.73, - "learning_rate": 1.7702471975129945e-06, - "loss": 0.7344, - "step": 28505 - }, - { - "epoch": 0.73, - "learning_rate": 1.770229550512146e-06, - "loss": 0.835, - "step": 28506 - }, - { - "epoch": 0.73, - "learning_rate": 1.7702119029215682e-06, - "loss": 0.8477, - "step": 28507 - }, - { - "epoch": 0.73, - "learning_rate": 1.7701942547412747e-06, - "loss": 0.8311, - "step": 28508 - }, - { - "epoch": 0.73, - "learning_rate": 1.7701766059712789e-06, - "loss": 0.873, - "step": 28509 - }, - { - "epoch": 0.73, - "learning_rate": 1.770158956611594e-06, - "loss": 0.9033, - "step": 28510 - }, - { - "epoch": 0.73, - "learning_rate": 1.770141306662234e-06, - "loss": 0.7773, - "step": 28511 - }, - { - "epoch": 0.73, - "learning_rate": 1.7701236561232122e-06, - "loss": 0.7021, - "step": 28512 - }, - { - "epoch": 0.73, - "learning_rate": 1.7701060049945422e-06, - "loss": 0.9072, - "step": 28513 - }, - { - "epoch": 0.73, - "learning_rate": 1.7700883532762371e-06, - "loss": 0.9033, - "step": 28514 - }, - { - "epoch": 0.73, - "learning_rate": 1.7700707009683111e-06, - "loss": 0.6938, - "step": 28515 - }, - { - "epoch": 0.73, - "learning_rate": 1.7700530480707774e-06, - "loss": 0.7808, - "step": 28516 - }, - { - "epoch": 0.73, - "learning_rate": 1.7700353945836492e-06, - "loss": 0.7598, - "step": 28517 - }, - { - "epoch": 0.73, - "learning_rate": 1.7700177405069405e-06, - "loss": 0.7422, - "step": 28518 - }, - { - "epoch": 0.73, - "learning_rate": 1.7700000858406647e-06, - "loss": 0.9141, - "step": 28519 - }, - { - "epoch": 0.73, - "learning_rate": 1.769982430584835e-06, - "loss": 0.7578, - "step": 28520 - }, - { - "epoch": 0.73, - "learning_rate": 1.7699647747394652e-06, - "loss": 0.7998, - "step": 28521 - }, - { - "epoch": 0.73, - "learning_rate": 1.769947118304569e-06, - "loss": 0.8784, - "step": 28522 - }, - { - "epoch": 0.73, - "learning_rate": 1.7699294612801596e-06, - "loss": 1.001, - "step": 28523 - }, - { - "epoch": 0.73, - "learning_rate": 1.7699118036662506e-06, - "loss": 0.9141, - "step": 28524 - }, - { - "epoch": 0.73, - "learning_rate": 1.7698941454628555e-06, - "loss": 0.73, - "step": 28525 - }, - { - "epoch": 0.73, - "learning_rate": 1.7698764866699878e-06, - "loss": 0.9043, - "step": 28526 - }, - { - "epoch": 0.73, - "learning_rate": 1.769858827287661e-06, - "loss": 0.9971, - "step": 28527 - }, - { - "epoch": 0.73, - "learning_rate": 1.769841167315889e-06, - "loss": 0.564, - "step": 28528 - }, - { - "epoch": 0.73, - "learning_rate": 1.7698235067546849e-06, - "loss": 0.8262, - "step": 28529 - }, - { - "epoch": 0.73, - "learning_rate": 1.7698058456040623e-06, - "loss": 1.0127, - "step": 28530 - }, - { - "epoch": 0.73, - "learning_rate": 1.7697881838640348e-06, - "loss": 0.8965, - "step": 28531 - }, - { - "epoch": 0.73, - "learning_rate": 1.7697705215346157e-06, - "loss": 0.6958, - "step": 28532 - }, - { - "epoch": 0.73, - "learning_rate": 1.7697528586158189e-06, - "loss": 0.8047, - "step": 28533 - }, - { - "epoch": 0.73, - "learning_rate": 1.7697351951076577e-06, - "loss": 0.6235, - "step": 28534 - }, - { - "epoch": 0.73, - "learning_rate": 1.7697175310101455e-06, - "loss": 0.9424, - "step": 28535 - }, - { - "epoch": 0.73, - "learning_rate": 1.7696998663232963e-06, - "loss": 1.0527, - "step": 28536 - }, - { - "epoch": 0.73, - "learning_rate": 1.7696822010471229e-06, - "loss": 0.9238, - "step": 28537 - }, - { - "epoch": 0.73, - "learning_rate": 1.7696645351816394e-06, - "loss": 0.7646, - "step": 28538 - }, - { - "epoch": 0.73, - "learning_rate": 1.7696468687268592e-06, - "loss": 0.7085, - "step": 28539 - }, - { - "epoch": 0.73, - "learning_rate": 1.769629201682796e-06, - "loss": 0.605, - "step": 28540 - }, - { - "epoch": 0.73, - "learning_rate": 1.7696115340494626e-06, - "loss": 0.8545, - "step": 28541 - }, - { - "epoch": 0.73, - "learning_rate": 1.7695938658268736e-06, - "loss": 0.8906, - "step": 28542 - }, - { - "epoch": 0.73, - "learning_rate": 1.7695761970150415e-06, - "loss": 0.606, - "step": 28543 - }, - { - "epoch": 0.73, - "learning_rate": 1.7695585276139807e-06, - "loss": 0.6021, - "step": 28544 - }, - { - "epoch": 0.73, - "learning_rate": 1.769540857623704e-06, - "loss": 0.8047, - "step": 28545 - }, - { - "epoch": 0.73, - "learning_rate": 1.7695231870442254e-06, - "loss": 0.8057, - "step": 28546 - }, - { - "epoch": 0.73, - "learning_rate": 1.7695055158755582e-06, - "loss": 0.7651, - "step": 28547 - }, - { - "epoch": 0.73, - "learning_rate": 1.7694878441177159e-06, - "loss": 0.9932, - "step": 28548 - }, - { - "epoch": 0.73, - "learning_rate": 1.7694701717707124e-06, - "loss": 0.77, - "step": 28549 - }, - { - "epoch": 0.73, - "learning_rate": 1.769452498834561e-06, - "loss": 0.7285, - "step": 28550 - }, - { - "epoch": 0.73, - "learning_rate": 1.7694348253092748e-06, - "loss": 0.9639, - "step": 28551 - }, - { - "epoch": 0.73, - "learning_rate": 1.769417151194868e-06, - "loss": 0.7324, - "step": 28552 - }, - { - "epoch": 0.73, - "learning_rate": 1.7693994764913538e-06, - "loss": 0.7114, - "step": 28553 - }, - { - "epoch": 0.73, - "learning_rate": 1.769381801198746e-06, - "loss": 0.9561, - "step": 28554 - }, - { - "epoch": 0.73, - "learning_rate": 1.7693641253170577e-06, - "loss": 0.9189, - "step": 28555 - }, - { - "epoch": 0.73, - "learning_rate": 1.7693464488463029e-06, - "loss": 0.8945, - "step": 28556 - }, - { - "epoch": 0.73, - "learning_rate": 1.7693287717864947e-06, - "loss": 1.085, - "step": 28557 - }, - { - "epoch": 0.73, - "learning_rate": 1.7693110941376468e-06, - "loss": 0.8975, - "step": 28558 - }, - { - "epoch": 0.73, - "learning_rate": 1.7692934158997727e-06, - "loss": 1.04, - "step": 28559 - }, - { - "epoch": 0.73, - "learning_rate": 1.769275737072886e-06, - "loss": 0.8867, - "step": 28560 - }, - { - "epoch": 0.73, - "learning_rate": 1.7692580576570006e-06, - "loss": 0.791, - "step": 28561 - }, - { - "epoch": 0.73, - "learning_rate": 1.7692403776521294e-06, - "loss": 0.769, - "step": 28562 - }, - { - "epoch": 0.73, - "learning_rate": 1.7692226970582862e-06, - "loss": 0.8076, - "step": 28563 - }, - { - "epoch": 0.73, - "learning_rate": 1.7692050158754848e-06, - "loss": 0.9824, - "step": 28564 - }, - { - "epoch": 0.73, - "learning_rate": 1.7691873341037384e-06, - "loss": 0.8389, - "step": 28565 - }, - { - "epoch": 0.73, - "learning_rate": 1.7691696517430606e-06, - "loss": 0.9473, - "step": 28566 - }, - { - "epoch": 0.73, - "learning_rate": 1.7691519687934649e-06, - "loss": 0.6777, - "step": 28567 - }, - { - "epoch": 0.73, - "learning_rate": 1.7691342852549646e-06, - "loss": 0.9717, - "step": 28568 - }, - { - "epoch": 0.73, - "learning_rate": 1.7691166011275743e-06, - "loss": 0.874, - "step": 28569 - }, - { - "epoch": 0.73, - "learning_rate": 1.7690989164113059e-06, - "loss": 0.7949, - "step": 28570 - }, - { - "epoch": 0.73, - "learning_rate": 1.7690812311061744e-06, - "loss": 0.9756, - "step": 28571 - }, - { - "epoch": 0.73, - "learning_rate": 1.7690635452121927e-06, - "loss": 0.8584, - "step": 28572 - }, - { - "epoch": 0.73, - "learning_rate": 1.7690458587293744e-06, - "loss": 0.615, - "step": 28573 - }, - { - "epoch": 0.73, - "learning_rate": 1.7690281716577329e-06, - "loss": 0.7026, - "step": 28574 - }, - { - "epoch": 0.73, - "learning_rate": 1.769010483997282e-06, - "loss": 0.667, - "step": 28575 - }, - { - "epoch": 0.73, - "learning_rate": 1.7689927957480353e-06, - "loss": 1.0088, - "step": 28576 - }, - { - "epoch": 0.73, - "learning_rate": 1.7689751069100059e-06, - "loss": 0.9092, - "step": 28577 - }, - { - "epoch": 0.73, - "learning_rate": 1.7689574174832077e-06, - "loss": 0.9541, - "step": 28578 - }, - { - "epoch": 0.73, - "learning_rate": 1.768939727467654e-06, - "loss": 0.8862, - "step": 28579 - }, - { - "epoch": 0.73, - "learning_rate": 1.7689220368633589e-06, - "loss": 0.8613, - "step": 28580 - }, - { - "epoch": 0.73, - "learning_rate": 1.768904345670335e-06, - "loss": 0.6733, - "step": 28581 - }, - { - "epoch": 0.73, - "learning_rate": 1.7688866538885967e-06, - "loss": 0.9375, - "step": 28582 - }, - { - "epoch": 0.73, - "learning_rate": 1.7688689615181572e-06, - "loss": 0.686, - "step": 28583 - }, - { - "epoch": 0.73, - "learning_rate": 1.7688512685590303e-06, - "loss": 0.7427, - "step": 28584 - }, - { - "epoch": 0.73, - "learning_rate": 1.7688335750112292e-06, - "loss": 0.8225, - "step": 28585 - }, - { - "epoch": 0.73, - "learning_rate": 1.7688158808747677e-06, - "loss": 0.7017, - "step": 28586 - }, - { - "epoch": 0.73, - "learning_rate": 1.768798186149659e-06, - "loss": 0.9521, - "step": 28587 - }, - { - "epoch": 0.73, - "learning_rate": 1.768780490835917e-06, - "loss": 1.0703, - "step": 28588 - }, - { - "epoch": 0.73, - "learning_rate": 1.768762794933555e-06, - "loss": 0.9414, - "step": 28589 - }, - { - "epoch": 0.73, - "learning_rate": 1.7687450984425868e-06, - "loss": 1.0908, - "step": 28590 - }, - { - "epoch": 0.73, - "learning_rate": 1.768727401363026e-06, - "loss": 0.7344, - "step": 28591 - }, - { - "epoch": 0.73, - "learning_rate": 1.7687097036948858e-06, - "loss": 0.8076, - "step": 28592 - }, - { - "epoch": 0.73, - "learning_rate": 1.7686920054381797e-06, - "loss": 1.0596, - "step": 28593 - }, - { - "epoch": 0.73, - "learning_rate": 1.7686743065929219e-06, - "loss": 0.8086, - "step": 28594 - }, - { - "epoch": 0.73, - "learning_rate": 1.768656607159125e-06, - "loss": 1.0742, - "step": 28595 - }, - { - "epoch": 0.73, - "learning_rate": 1.7686389071368035e-06, - "loss": 0.79, - "step": 28596 - }, - { - "epoch": 0.73, - "learning_rate": 1.7686212065259706e-06, - "loss": 0.9082, - "step": 28597 - }, - { - "epoch": 0.73, - "learning_rate": 1.7686035053266396e-06, - "loss": 0.8447, - "step": 28598 - }, - { - "epoch": 0.73, - "learning_rate": 1.768585803538824e-06, - "loss": 1.1465, - "step": 28599 - }, - { - "epoch": 0.73, - "learning_rate": 1.768568101162538e-06, - "loss": 0.9082, - "step": 28600 - }, - { - "epoch": 0.73, - "learning_rate": 1.7685503981977946e-06, - "loss": 0.73, - "step": 28601 - }, - { - "epoch": 0.73, - "learning_rate": 1.7685326946446074e-06, - "loss": 0.9111, - "step": 28602 - }, - { - "epoch": 0.73, - "learning_rate": 1.7685149905029904e-06, - "loss": 0.8984, - "step": 28603 - }, - { - "epoch": 0.73, - "learning_rate": 1.7684972857729564e-06, - "loss": 0.8682, - "step": 28604 - }, - { - "epoch": 0.73, - "learning_rate": 1.7684795804545197e-06, - "loss": 0.9756, - "step": 28605 - }, - { - "epoch": 0.73, - "learning_rate": 1.768461874547693e-06, - "loss": 0.4963, - "step": 28606 - }, - { - "epoch": 0.73, - "learning_rate": 1.7684441680524908e-06, - "loss": 0.9277, - "step": 28607 - }, - { - "epoch": 0.73, - "learning_rate": 1.7684264609689264e-06, - "loss": 0.9453, - "step": 28608 - }, - { - "epoch": 0.73, - "learning_rate": 1.7684087532970127e-06, - "loss": 0.7529, - "step": 28609 - }, - { - "epoch": 0.73, - "learning_rate": 1.768391045036764e-06, - "loss": 0.8066, - "step": 28610 - }, - { - "epoch": 0.73, - "learning_rate": 1.7683733361881937e-06, - "loss": 1.0029, - "step": 28611 - }, - { - "epoch": 0.73, - "learning_rate": 1.7683556267513153e-06, - "loss": 0.7441, - "step": 28612 - }, - { - "epoch": 0.73, - "learning_rate": 1.768337916726142e-06, - "loss": 0.9365, - "step": 28613 - }, - { - "epoch": 0.73, - "learning_rate": 1.7683202061126879e-06, - "loss": 0.8818, - "step": 28614 - }, - { - "epoch": 0.73, - "learning_rate": 1.7683024949109664e-06, - "loss": 1.0605, - "step": 28615 - }, - { - "epoch": 0.73, - "learning_rate": 1.768284783120991e-06, - "loss": 0.845, - "step": 28616 - }, - { - "epoch": 0.73, - "learning_rate": 1.7682670707427751e-06, - "loss": 0.8467, - "step": 28617 - }, - { - "epoch": 0.73, - "learning_rate": 1.7682493577763324e-06, - "loss": 0.8955, - "step": 28618 - }, - { - "epoch": 0.73, - "learning_rate": 1.7682316442216769e-06, - "loss": 1.002, - "step": 28619 - }, - { - "epoch": 0.73, - "learning_rate": 1.7682139300788213e-06, - "loss": 1.0234, - "step": 28620 - }, - { - "epoch": 0.73, - "learning_rate": 1.7681962153477799e-06, - "loss": 0.8584, - "step": 28621 - }, - { - "epoch": 0.73, - "learning_rate": 1.7681785000285658e-06, - "loss": 0.8079, - "step": 28622 - }, - { - "epoch": 0.73, - "learning_rate": 1.7681607841211927e-06, - "loss": 0.9014, - "step": 28623 - }, - { - "epoch": 0.73, - "learning_rate": 1.7681430676256746e-06, - "loss": 0.5098, - "step": 28624 - }, - { - "epoch": 0.73, - "learning_rate": 1.7681253505420241e-06, - "loss": 0.8633, - "step": 28625 - }, - { - "epoch": 0.73, - "learning_rate": 1.7681076328702558e-06, - "loss": 0.9756, - "step": 28626 - }, - { - "epoch": 0.73, - "learning_rate": 1.7680899146103826e-06, - "loss": 0.7739, - "step": 28627 - }, - { - "epoch": 0.73, - "learning_rate": 1.7680721957624183e-06, - "loss": 0.8066, - "step": 28628 - }, - { - "epoch": 0.73, - "learning_rate": 1.7680544763263765e-06, - "loss": 0.9375, - "step": 28629 - }, - { - "epoch": 0.73, - "learning_rate": 1.7680367563022707e-06, - "loss": 1.0244, - "step": 28630 - }, - { - "epoch": 0.73, - "learning_rate": 1.7680190356901143e-06, - "loss": 1.0713, - "step": 28631 - }, - { - "epoch": 0.73, - "learning_rate": 1.768001314489921e-06, - "loss": 0.8975, - "step": 28632 - }, - { - "epoch": 0.73, - "learning_rate": 1.7679835927017046e-06, - "loss": 0.8936, - "step": 28633 - }, - { - "epoch": 0.73, - "learning_rate": 1.7679658703254785e-06, - "loss": 0.8662, - "step": 28634 - }, - { - "epoch": 0.73, - "learning_rate": 1.7679481473612563e-06, - "loss": 0.8101, - "step": 28635 - }, - { - "epoch": 0.73, - "learning_rate": 1.7679304238090515e-06, - "loss": 0.7378, - "step": 28636 - }, - { - "epoch": 0.73, - "learning_rate": 1.7679126996688776e-06, - "loss": 0.6943, - "step": 28637 - }, - { - "epoch": 0.73, - "learning_rate": 1.767894974940748e-06, - "loss": 0.7212, - "step": 28638 - }, - { - "epoch": 0.73, - "learning_rate": 1.767877249624677e-06, - "loss": 0.9053, - "step": 28639 - }, - { - "epoch": 0.73, - "learning_rate": 1.7678595237206775e-06, - "loss": 0.9756, - "step": 28640 - }, - { - "epoch": 0.73, - "learning_rate": 1.7678417972287632e-06, - "loss": 0.9424, - "step": 28641 - }, - { - "epoch": 0.73, - "learning_rate": 1.7678240701489477e-06, - "loss": 0.6455, - "step": 28642 - }, - { - "epoch": 0.73, - "learning_rate": 1.767806342481245e-06, - "loss": 0.8965, - "step": 28643 - }, - { - "epoch": 0.73, - "learning_rate": 1.767788614225668e-06, - "loss": 1.0713, - "step": 28644 - }, - { - "epoch": 0.73, - "learning_rate": 1.7677708853822302e-06, - "loss": 0.7583, - "step": 28645 - }, - { - "epoch": 0.73, - "learning_rate": 1.767753155950946e-06, - "loss": 0.9434, - "step": 28646 - }, - { - "epoch": 0.73, - "learning_rate": 1.7677354259318285e-06, - "loss": 0.9326, - "step": 28647 - }, - { - "epoch": 0.73, - "learning_rate": 1.767717695324891e-06, - "loss": 0.9922, - "step": 28648 - }, - { - "epoch": 0.73, - "learning_rate": 1.7676999641301476e-06, - "loss": 0.7239, - "step": 28649 - }, - { - "epoch": 0.73, - "learning_rate": 1.7676822323476115e-06, - "loss": 0.7559, - "step": 28650 - }, - { - "epoch": 0.73, - "learning_rate": 1.7676644999772968e-06, - "loss": 0.6885, - "step": 28651 - }, - { - "epoch": 0.73, - "learning_rate": 1.7676467670192162e-06, - "loss": 0.4807, - "step": 28652 - }, - { - "epoch": 0.73, - "learning_rate": 1.7676290334733838e-06, - "loss": 0.8125, - "step": 28653 - }, - { - "epoch": 0.73, - "learning_rate": 1.7676112993398134e-06, - "loss": 0.8926, - "step": 28654 - }, - { - "epoch": 0.73, - "learning_rate": 1.7675935646185183e-06, - "loss": 0.8193, - "step": 28655 - }, - { - "epoch": 0.73, - "learning_rate": 1.7675758293095119e-06, - "loss": 0.8633, - "step": 28656 - }, - { - "epoch": 0.73, - "learning_rate": 1.7675580934128082e-06, - "loss": 0.6816, - "step": 28657 - }, - { - "epoch": 0.73, - "learning_rate": 1.7675403569284204e-06, - "loss": 0.8457, - "step": 28658 - }, - { - "epoch": 0.73, - "learning_rate": 1.7675226198563622e-06, - "loss": 0.9609, - "step": 28659 - }, - { - "epoch": 0.73, - "learning_rate": 1.7675048821966473e-06, - "loss": 0.6328, - "step": 28660 - }, - { - "epoch": 0.73, - "learning_rate": 1.7674871439492894e-06, - "loss": 0.9434, - "step": 28661 - }, - { - "epoch": 0.73, - "learning_rate": 1.7674694051143017e-06, - "loss": 1.0508, - "step": 28662 - }, - { - "epoch": 0.73, - "learning_rate": 1.767451665691698e-06, - "loss": 0.7324, - "step": 28663 - }, - { - "epoch": 0.73, - "learning_rate": 1.767433925681492e-06, - "loss": 0.6621, - "step": 28664 - }, - { - "epoch": 0.73, - "learning_rate": 1.7674161850836966e-06, - "loss": 0.792, - "step": 28665 - }, - { - "epoch": 0.73, - "learning_rate": 1.7673984438983265e-06, - "loss": 0.8594, - "step": 28666 - }, - { - "epoch": 0.73, - "learning_rate": 1.7673807021253944e-06, - "loss": 0.8086, - "step": 28667 - }, - { - "epoch": 0.73, - "learning_rate": 1.7673629597649142e-06, - "loss": 0.8975, - "step": 28668 - }, - { - "epoch": 0.73, - "learning_rate": 1.7673452168168997e-06, - "loss": 0.7334, - "step": 28669 - }, - { - "epoch": 0.73, - "learning_rate": 1.7673274732813638e-06, - "loss": 0.9902, - "step": 28670 - }, - { - "epoch": 0.73, - "learning_rate": 1.7673097291583209e-06, - "loss": 0.9893, - "step": 28671 - }, - { - "epoch": 0.73, - "learning_rate": 1.7672919844477843e-06, - "loss": 0.9512, - "step": 28672 - }, - { - "epoch": 0.73, - "learning_rate": 1.7672742391497673e-06, - "loss": 0.9297, - "step": 28673 - }, - { - "epoch": 0.73, - "learning_rate": 1.7672564932642836e-06, - "loss": 0.7871, - "step": 28674 - }, - { - "epoch": 0.73, - "learning_rate": 1.767238746791347e-06, - "loss": 1.1465, - "step": 28675 - }, - { - "epoch": 0.73, - "learning_rate": 1.767220999730971e-06, - "loss": 1.0508, - "step": 28676 - }, - { - "epoch": 0.74, - "learning_rate": 1.7672032520831693e-06, - "loss": 0.7471, - "step": 28677 - }, - { - "epoch": 0.74, - "learning_rate": 1.7671855038479548e-06, - "loss": 0.7051, - "step": 28678 - }, - { - "epoch": 0.74, - "learning_rate": 1.7671677550253424e-06, - "loss": 0.8848, - "step": 28679 - }, - { - "epoch": 0.74, - "learning_rate": 1.7671500056153445e-06, - "loss": 0.793, - "step": 28680 - }, - { - "epoch": 0.74, - "learning_rate": 1.7671322556179751e-06, - "loss": 0.9229, - "step": 28681 - }, - { - "epoch": 0.74, - "learning_rate": 1.767114505033248e-06, - "loss": 0.77, - "step": 28682 - }, - { - "epoch": 0.74, - "learning_rate": 1.7670967538611762e-06, - "loss": 0.6047, - "step": 28683 - }, - { - "epoch": 0.74, - "learning_rate": 1.767079002101774e-06, - "loss": 0.9746, - "step": 28684 - }, - { - "epoch": 0.74, - "learning_rate": 1.7670612497550548e-06, - "loss": 0.8271, - "step": 28685 - }, - { - "epoch": 0.74, - "learning_rate": 1.767043496821032e-06, - "loss": 0.7988, - "step": 28686 - }, - { - "epoch": 0.74, - "learning_rate": 1.7670257432997189e-06, - "loss": 1.0869, - "step": 28687 - }, - { - "epoch": 0.74, - "learning_rate": 1.7670079891911299e-06, - "loss": 0.6846, - "step": 28688 - }, - { - "epoch": 0.74, - "learning_rate": 1.766990234495278e-06, - "loss": 0.9434, - "step": 28689 - }, - { - "epoch": 0.74, - "learning_rate": 1.7669724792121769e-06, - "loss": 0.7817, - "step": 28690 - }, - { - "epoch": 0.74, - "learning_rate": 1.7669547233418402e-06, - "loss": 0.6108, - "step": 28691 - }, - { - "epoch": 0.74, - "learning_rate": 1.7669369668842817e-06, - "loss": 0.877, - "step": 28692 - }, - { - "epoch": 0.74, - "learning_rate": 1.7669192098395148e-06, - "loss": 1.1484, - "step": 28693 - }, - { - "epoch": 0.74, - "learning_rate": 1.7669014522075529e-06, - "loss": 0.9238, - "step": 28694 - }, - { - "epoch": 0.74, - "learning_rate": 1.76688369398841e-06, - "loss": 1.1055, - "step": 28695 - }, - { - "epoch": 0.74, - "learning_rate": 1.7668659351820993e-06, - "loss": 0.8311, - "step": 28696 - }, - { - "epoch": 0.74, - "learning_rate": 1.7668481757886348e-06, - "loss": 1.0156, - "step": 28697 - }, - { - "epoch": 0.74, - "learning_rate": 1.76683041580803e-06, - "loss": 0.6953, - "step": 28698 - }, - { - "epoch": 0.74, - "learning_rate": 1.7668126552402982e-06, - "loss": 0.7529, - "step": 28699 - }, - { - "epoch": 0.74, - "learning_rate": 1.7667948940854536e-06, - "loss": 0.8281, - "step": 28700 - }, - { - "epoch": 0.74, - "learning_rate": 1.766777132343509e-06, - "loss": 0.7891, - "step": 28701 - }, - { - "epoch": 0.74, - "learning_rate": 1.7667593700144785e-06, - "loss": 0.9023, - "step": 28702 - }, - { - "epoch": 0.74, - "learning_rate": 1.7667416070983757e-06, - "loss": 0.6768, - "step": 28703 - }, - { - "epoch": 0.74, - "learning_rate": 1.766723843595214e-06, - "loss": 0.9434, - "step": 28704 - }, - { - "epoch": 0.74, - "learning_rate": 1.7667060795050073e-06, - "loss": 1.041, - "step": 28705 - }, - { - "epoch": 0.74, - "learning_rate": 1.766688314827769e-06, - "loss": 0.9258, - "step": 28706 - }, - { - "epoch": 0.74, - "learning_rate": 1.7666705495635123e-06, - "loss": 0.8047, - "step": 28707 - }, - { - "epoch": 0.74, - "learning_rate": 1.7666527837122515e-06, - "loss": 0.9209, - "step": 28708 - }, - { - "epoch": 0.74, - "learning_rate": 1.766635017274e-06, - "loss": 0.7061, - "step": 28709 - }, - { - "epoch": 0.74, - "learning_rate": 1.7666172502487713e-06, - "loss": 1.0918, - "step": 28710 - }, - { - "epoch": 0.74, - "learning_rate": 1.766599482636579e-06, - "loss": 0.9043, - "step": 28711 - }, - { - "epoch": 0.74, - "learning_rate": 1.7665817144374367e-06, - "loss": 0.8555, - "step": 28712 - }, - { - "epoch": 0.74, - "learning_rate": 1.7665639456513579e-06, - "loss": 0.8564, - "step": 28713 - }, - { - "epoch": 0.74, - "learning_rate": 1.7665461762783564e-06, - "loss": 1.1133, - "step": 28714 - }, - { - "epoch": 0.74, - "learning_rate": 1.766528406318446e-06, - "loss": 0.998, - "step": 28715 - }, - { - "epoch": 0.74, - "learning_rate": 1.7665106357716395e-06, - "loss": 0.9209, - "step": 28716 - }, - { - "epoch": 0.74, - "learning_rate": 1.7664928646379516e-06, - "loss": 0.8545, - "step": 28717 - }, - { - "epoch": 0.74, - "learning_rate": 1.7664750929173953e-06, - "loss": 0.772, - "step": 28718 - }, - { - "epoch": 0.74, - "learning_rate": 1.7664573206099837e-06, - "loss": 0.7686, - "step": 28719 - }, - { - "epoch": 0.74, - "learning_rate": 1.7664395477157315e-06, - "loss": 0.7988, - "step": 28720 - }, - { - "epoch": 0.74, - "learning_rate": 1.7664217742346516e-06, - "loss": 0.7979, - "step": 28721 - }, - { - "epoch": 0.74, - "learning_rate": 1.766404000166758e-06, - "loss": 0.8438, - "step": 28722 - }, - { - "epoch": 0.74, - "learning_rate": 1.7663862255120639e-06, - "loss": 0.8848, - "step": 28723 - }, - { - "epoch": 0.74, - "learning_rate": 1.7663684502705832e-06, - "loss": 0.8691, - "step": 28724 - }, - { - "epoch": 0.74, - "learning_rate": 1.7663506744423292e-06, - "loss": 0.8838, - "step": 28725 - }, - { - "epoch": 0.74, - "learning_rate": 1.7663328980273162e-06, - "loss": 0.5798, - "step": 28726 - }, - { - "epoch": 0.74, - "learning_rate": 1.766315121025557e-06, - "loss": 0.9756, - "step": 28727 - }, - { - "epoch": 0.74, - "learning_rate": 1.7662973434370655e-06, - "loss": 0.9082, - "step": 28728 - }, - { - "epoch": 0.74, - "learning_rate": 1.7662795652618554e-06, - "loss": 0.8955, - "step": 28729 - }, - { - "epoch": 0.74, - "learning_rate": 1.7662617864999402e-06, - "loss": 0.9951, - "step": 28730 - }, - { - "epoch": 0.74, - "learning_rate": 1.7662440071513339e-06, - "loss": 0.8359, - "step": 28731 - }, - { - "epoch": 0.74, - "learning_rate": 1.7662262272160496e-06, - "loss": 0.7856, - "step": 28732 - }, - { - "epoch": 0.74, - "learning_rate": 1.766208446694101e-06, - "loss": 1.0264, - "step": 28733 - }, - { - "epoch": 0.74, - "learning_rate": 1.7661906655855018e-06, - "loss": 0.7051, - "step": 28734 - }, - { - "epoch": 0.74, - "learning_rate": 1.7661728838902658e-06, - "loss": 1.0059, - "step": 28735 - }, - { - "epoch": 0.74, - "learning_rate": 1.7661551016084064e-06, - "loss": 0.917, - "step": 28736 - }, - { - "epoch": 0.74, - "learning_rate": 1.7661373187399372e-06, - "loss": 0.7891, - "step": 28737 - }, - { - "epoch": 0.74, - "learning_rate": 1.7661195352848722e-06, - "loss": 0.7646, - "step": 28738 - }, - { - "epoch": 0.74, - "learning_rate": 1.7661017512432243e-06, - "loss": 0.6455, - "step": 28739 - }, - { - "epoch": 0.74, - "learning_rate": 1.7660839666150077e-06, - "loss": 0.8418, - "step": 28740 - }, - { - "epoch": 0.74, - "learning_rate": 1.766066181400236e-06, - "loss": 0.7314, - "step": 28741 - }, - { - "epoch": 0.74, - "learning_rate": 1.7660483955989222e-06, - "loss": 0.7598, - "step": 28742 - }, - { - "epoch": 0.74, - "learning_rate": 1.766030609211081e-06, - "loss": 0.7012, - "step": 28743 - }, - { - "epoch": 0.74, - "learning_rate": 1.7660128222367248e-06, - "loss": 0.6318, - "step": 28744 - }, - { - "epoch": 0.74, - "learning_rate": 1.765995034675868e-06, - "loss": 0.9326, - "step": 28745 - }, - { - "epoch": 0.74, - "learning_rate": 1.7659772465285242e-06, - "loss": 0.604, - "step": 28746 - }, - { - "epoch": 0.74, - "learning_rate": 1.7659594577947065e-06, - "loss": 0.6709, - "step": 28747 - }, - { - "epoch": 0.74, - "learning_rate": 1.7659416684744291e-06, - "loss": 0.8945, - "step": 28748 - }, - { - "epoch": 0.74, - "learning_rate": 1.7659238785677053e-06, - "loss": 0.9619, - "step": 28749 - }, - { - "epoch": 0.74, - "learning_rate": 1.7659060880745486e-06, - "loss": 0.8364, - "step": 28750 - }, - { - "epoch": 0.74, - "learning_rate": 1.7658882969949734e-06, - "loss": 0.7427, - "step": 28751 - }, - { - "epoch": 0.74, - "learning_rate": 1.7658705053289924e-06, - "loss": 0.9785, - "step": 28752 - }, - { - "epoch": 0.74, - "learning_rate": 1.7658527130766194e-06, - "loss": 0.6172, - "step": 28753 - }, - { - "epoch": 0.74, - "learning_rate": 1.7658349202378684e-06, - "loss": 0.9771, - "step": 28754 - }, - { - "epoch": 0.74, - "learning_rate": 1.7658171268127529e-06, - "loss": 0.584, - "step": 28755 - }, - { - "epoch": 0.74, - "learning_rate": 1.7657993328012864e-06, - "loss": 0.7871, - "step": 28756 - }, - { - "epoch": 0.74, - "learning_rate": 1.7657815382034821e-06, - "loss": 0.8276, - "step": 28757 - }, - { - "epoch": 0.74, - "learning_rate": 1.7657637430193547e-06, - "loss": 0.7441, - "step": 28758 - }, - { - "epoch": 0.74, - "learning_rate": 1.765745947248917e-06, - "loss": 0.6885, - "step": 28759 - }, - { - "epoch": 0.74, - "learning_rate": 1.765728150892183e-06, - "loss": 1.0078, - "step": 28760 - }, - { - "epoch": 0.74, - "learning_rate": 1.7657103539491657e-06, - "loss": 0.7119, - "step": 28761 - }, - { - "epoch": 0.74, - "learning_rate": 1.7656925564198795e-06, - "loss": 1.0127, - "step": 28762 - }, - { - "epoch": 0.74, - "learning_rate": 1.7656747583043377e-06, - "loss": 1.0195, - "step": 28763 - }, - { - "epoch": 0.74, - "learning_rate": 1.765656959602554e-06, - "loss": 0.8877, - "step": 28764 - }, - { - "epoch": 0.74, - "learning_rate": 1.7656391603145417e-06, - "loss": 0.7051, - "step": 28765 - }, - { - "epoch": 0.74, - "learning_rate": 1.7656213604403151e-06, - "loss": 1.041, - "step": 28766 - }, - { - "epoch": 0.74, - "learning_rate": 1.7656035599798873e-06, - "loss": 0.7886, - "step": 28767 - }, - { - "epoch": 0.74, - "learning_rate": 1.7655857589332718e-06, - "loss": 0.8477, - "step": 28768 - }, - { - "epoch": 0.74, - "learning_rate": 1.7655679573004826e-06, - "loss": 0.8135, - "step": 28769 - }, - { - "epoch": 0.74, - "learning_rate": 1.7655501550815335e-06, - "loss": 0.9834, - "step": 28770 - }, - { - "epoch": 0.74, - "learning_rate": 1.7655323522764376e-06, - "loss": 0.8574, - "step": 28771 - }, - { - "epoch": 0.74, - "learning_rate": 1.7655145488852088e-06, - "loss": 0.9004, - "step": 28772 - }, - { - "epoch": 0.74, - "learning_rate": 1.7654967449078608e-06, - "loss": 0.8975, - "step": 28773 - }, - { - "epoch": 0.74, - "learning_rate": 1.7654789403444071e-06, - "loss": 0.9199, - "step": 28774 - }, - { - "epoch": 0.74, - "learning_rate": 1.7654611351948612e-06, - "loss": 0.9375, - "step": 28775 - }, - { - "epoch": 0.74, - "learning_rate": 1.7654433294592371e-06, - "loss": 0.8408, - "step": 28776 - }, - { - "epoch": 0.74, - "learning_rate": 1.7654255231375484e-06, - "loss": 0.9473, - "step": 28777 - }, - { - "epoch": 0.74, - "learning_rate": 1.7654077162298084e-06, - "loss": 0.7715, - "step": 28778 - }, - { - "epoch": 0.74, - "learning_rate": 1.7653899087360306e-06, - "loss": 0.6406, - "step": 28779 - }, - { - "epoch": 0.74, - "learning_rate": 1.7653721006562291e-06, - "loss": 0.7703, - "step": 28780 - }, - { - "epoch": 0.74, - "learning_rate": 1.7653542919904178e-06, - "loss": 0.6851, - "step": 28781 - }, - { - "epoch": 0.74, - "learning_rate": 1.7653364827386094e-06, - "loss": 0.8613, - "step": 28782 - }, - { - "epoch": 0.74, - "learning_rate": 1.7653186729008183e-06, - "loss": 0.8569, - "step": 28783 - }, - { - "epoch": 0.74, - "learning_rate": 1.765300862477058e-06, - "loss": 0.564, - "step": 28784 - }, - { - "epoch": 0.74, - "learning_rate": 1.7652830514673418e-06, - "loss": 0.7744, - "step": 28785 - }, - { - "epoch": 0.74, - "learning_rate": 1.7652652398716836e-06, - "loss": 0.8643, - "step": 28786 - }, - { - "epoch": 0.74, - "learning_rate": 1.765247427690097e-06, - "loss": 0.9922, - "step": 28787 - }, - { - "epoch": 0.74, - "learning_rate": 1.7652296149225956e-06, - "loss": 0.999, - "step": 28788 - }, - { - "epoch": 0.74, - "learning_rate": 1.765211801569193e-06, - "loss": 0.7461, - "step": 28789 - }, - { - "epoch": 0.74, - "learning_rate": 1.7651939876299032e-06, - "loss": 0.6838, - "step": 28790 - }, - { - "epoch": 0.74, - "learning_rate": 1.7651761731047391e-06, - "loss": 1.1689, - "step": 28791 - }, - { - "epoch": 0.74, - "learning_rate": 1.765158357993715e-06, - "loss": 0.9043, - "step": 28792 - }, - { - "epoch": 0.74, - "learning_rate": 1.7651405422968443e-06, - "loss": 0.6729, - "step": 28793 - }, - { - "epoch": 0.74, - "learning_rate": 1.7651227260141411e-06, - "loss": 0.834, - "step": 28794 - }, - { - "epoch": 0.74, - "learning_rate": 1.765104909145618e-06, - "loss": 0.916, - "step": 28795 - }, - { - "epoch": 0.74, - "learning_rate": 1.7650870916912898e-06, - "loss": 1.0742, - "step": 28796 - }, - { - "epoch": 0.74, - "learning_rate": 1.7650692736511692e-06, - "loss": 1.002, - "step": 28797 - }, - { - "epoch": 0.74, - "learning_rate": 1.7650514550252704e-06, - "loss": 0.6519, - "step": 28798 - }, - { - "epoch": 0.74, - "learning_rate": 1.7650336358136067e-06, - "loss": 0.7915, - "step": 28799 - }, - { - "epoch": 0.74, - "learning_rate": 1.765015816016192e-06, - "loss": 0.8623, - "step": 28800 - }, - { - "epoch": 0.74, - "learning_rate": 1.76499799563304e-06, - "loss": 0.8057, - "step": 28801 - }, - { - "epoch": 0.74, - "learning_rate": 1.764980174664164e-06, - "loss": 0.9229, - "step": 28802 - }, - { - "epoch": 0.74, - "learning_rate": 1.764962353109578e-06, - "loss": 0.9629, - "step": 28803 - }, - { - "epoch": 0.74, - "learning_rate": 1.7649445309692954e-06, - "loss": 0.5957, - "step": 28804 - }, - { - "epoch": 0.74, - "learning_rate": 1.76492670824333e-06, - "loss": 0.6455, - "step": 28805 - }, - { - "epoch": 0.74, - "learning_rate": 1.7649088849316954e-06, - "loss": 1.04, - "step": 28806 - }, - { - "epoch": 0.74, - "learning_rate": 1.7648910610344053e-06, - "loss": 0.8276, - "step": 28807 - }, - { - "epoch": 0.74, - "learning_rate": 1.7648732365514732e-06, - "loss": 1.083, - "step": 28808 - }, - { - "epoch": 0.74, - "learning_rate": 1.764855411482913e-06, - "loss": 0.8584, - "step": 28809 - }, - { - "epoch": 0.74, - "learning_rate": 1.7648375858287378e-06, - "loss": 1.0859, - "step": 28810 - }, - { - "epoch": 0.74, - "learning_rate": 1.764819759588962e-06, - "loss": 0.917, - "step": 28811 - }, - { - "epoch": 0.74, - "learning_rate": 1.7648019327635986e-06, - "loss": 0.835, - "step": 28812 - }, - { - "epoch": 0.74, - "learning_rate": 1.7647841053526618e-06, - "loss": 1.0029, - "step": 28813 - }, - { - "epoch": 0.74, - "learning_rate": 1.7647662773561648e-06, - "loss": 0.8799, - "step": 28814 - }, - { - "epoch": 0.74, - "learning_rate": 1.7647484487741214e-06, - "loss": 0.6875, - "step": 28815 - }, - { - "epoch": 0.74, - "learning_rate": 1.7647306196065455e-06, - "loss": 0.8408, - "step": 28816 - }, - { - "epoch": 0.74, - "learning_rate": 1.7647127898534504e-06, - "loss": 0.6523, - "step": 28817 - }, - { - "epoch": 0.74, - "learning_rate": 1.7646949595148498e-06, - "loss": 1.0361, - "step": 28818 - }, - { - "epoch": 0.74, - "learning_rate": 1.7646771285907573e-06, - "loss": 0.8145, - "step": 28819 - }, - { - "epoch": 0.74, - "learning_rate": 1.7646592970811871e-06, - "loss": 0.9541, - "step": 28820 - }, - { - "epoch": 0.74, - "learning_rate": 1.7646414649861523e-06, - "loss": 0.8887, - "step": 28821 - }, - { - "epoch": 0.74, - "learning_rate": 1.7646236323056664e-06, - "loss": 0.9756, - "step": 28822 - }, - { - "epoch": 0.74, - "learning_rate": 1.7646057990397436e-06, - "loss": 0.9375, - "step": 28823 - }, - { - "epoch": 0.74, - "learning_rate": 1.7645879651883972e-06, - "loss": 0.6938, - "step": 28824 - }, - { - "epoch": 0.74, - "learning_rate": 1.764570130751641e-06, - "loss": 0.8203, - "step": 28825 - }, - { - "epoch": 0.74, - "learning_rate": 1.7645522957294886e-06, - "loss": 1.0127, - "step": 28826 - }, - { - "epoch": 0.74, - "learning_rate": 1.7645344601219535e-06, - "loss": 0.9258, - "step": 28827 - }, - { - "epoch": 0.74, - "learning_rate": 1.7645166239290497e-06, - "loss": 0.9014, - "step": 28828 - }, - { - "epoch": 0.74, - "learning_rate": 1.7644987871507909e-06, - "loss": 1.0039, - "step": 28829 - }, - { - "epoch": 0.74, - "learning_rate": 1.7644809497871899e-06, - "loss": 0.793, - "step": 28830 - }, - { - "epoch": 0.74, - "learning_rate": 1.7644631118382616e-06, - "loss": 0.6304, - "step": 28831 - }, - { - "epoch": 0.74, - "learning_rate": 1.7644452733040188e-06, - "loss": 0.8223, - "step": 28832 - }, - { - "epoch": 0.74, - "learning_rate": 1.7644274341844753e-06, - "loss": 0.8379, - "step": 28833 - }, - { - "epoch": 0.74, - "learning_rate": 1.7644095944796452e-06, - "loss": 0.9688, - "step": 28834 - }, - { - "epoch": 0.74, - "learning_rate": 1.7643917541895414e-06, - "loss": 0.8525, - "step": 28835 - }, - { - "epoch": 0.74, - "learning_rate": 1.7643739133141784e-06, - "loss": 0.8096, - "step": 28836 - }, - { - "epoch": 0.74, - "learning_rate": 1.764356071853569e-06, - "loss": 0.7275, - "step": 28837 - }, - { - "epoch": 0.74, - "learning_rate": 1.764338229807728e-06, - "loss": 1.0352, - "step": 28838 - }, - { - "epoch": 0.74, - "learning_rate": 1.7643203871766677e-06, - "loss": 0.7988, - "step": 28839 - }, - { - "epoch": 0.74, - "learning_rate": 1.7643025439604024e-06, - "loss": 0.8242, - "step": 28840 - }, - { - "epoch": 0.74, - "learning_rate": 1.7642847001589463e-06, - "loss": 0.79, - "step": 28841 - }, - { - "epoch": 0.74, - "learning_rate": 1.764266855772312e-06, - "loss": 0.6621, - "step": 28842 - }, - { - "epoch": 0.74, - "learning_rate": 1.7642490108005142e-06, - "loss": 0.8145, - "step": 28843 - }, - { - "epoch": 0.74, - "learning_rate": 1.7642311652435654e-06, - "loss": 0.8291, - "step": 28844 - }, - { - "epoch": 0.74, - "learning_rate": 1.7642133191014806e-06, - "loss": 0.9824, - "step": 28845 - }, - { - "epoch": 0.74, - "learning_rate": 1.7641954723742724e-06, - "loss": 0.5688, - "step": 28846 - }, - { - "epoch": 0.74, - "learning_rate": 1.7641776250619552e-06, - "loss": 0.8076, - "step": 28847 - }, - { - "epoch": 0.74, - "learning_rate": 1.7641597771645422e-06, - "loss": 0.7188, - "step": 28848 - }, - { - "epoch": 0.74, - "learning_rate": 1.764141928682047e-06, - "loss": 0.8975, - "step": 28849 - }, - { - "epoch": 0.74, - "learning_rate": 1.7641240796144836e-06, - "loss": 0.9902, - "step": 28850 - }, - { - "epoch": 0.74, - "learning_rate": 1.7641062299618656e-06, - "loss": 0.8721, - "step": 28851 - }, - { - "epoch": 0.74, - "learning_rate": 1.7640883797242067e-06, - "loss": 0.8018, - "step": 28852 - }, - { - "epoch": 0.74, - "learning_rate": 1.7640705289015203e-06, - "loss": 0.7217, - "step": 28853 - }, - { - "epoch": 0.74, - "learning_rate": 1.76405267749382e-06, - "loss": 0.9287, - "step": 28854 - }, - { - "epoch": 0.74, - "learning_rate": 1.76403482550112e-06, - "loss": 0.9873, - "step": 28855 - }, - { - "epoch": 0.74, - "learning_rate": 1.7640169729234337e-06, - "loss": 1.0098, - "step": 28856 - }, - { - "epoch": 0.74, - "learning_rate": 1.7639991197607746e-06, - "loss": 0.75, - "step": 28857 - }, - { - "epoch": 0.74, - "learning_rate": 1.7639812660131565e-06, - "loss": 0.8418, - "step": 28858 - }, - { - "epoch": 0.74, - "learning_rate": 1.763963411680593e-06, - "loss": 0.9648, - "step": 28859 - }, - { - "epoch": 0.74, - "learning_rate": 1.7639455567630982e-06, - "loss": 0.9277, - "step": 28860 - }, - { - "epoch": 0.74, - "learning_rate": 1.7639277012606852e-06, - "loss": 0.8359, - "step": 28861 - }, - { - "epoch": 0.74, - "learning_rate": 1.7639098451733675e-06, - "loss": 0.7778, - "step": 28862 - }, - { - "epoch": 0.74, - "learning_rate": 1.7638919885011599e-06, - "loss": 0.5789, - "step": 28863 - }, - { - "epoch": 0.74, - "learning_rate": 1.763874131244075e-06, - "loss": 0.7666, - "step": 28864 - }, - { - "epoch": 0.74, - "learning_rate": 1.7638562734021264e-06, - "loss": 0.8994, - "step": 28865 - }, - { - "epoch": 0.74, - "learning_rate": 1.7638384149753288e-06, - "loss": 1.0381, - "step": 28866 - }, - { - "epoch": 0.74, - "learning_rate": 1.7638205559636949e-06, - "loss": 0.9785, - "step": 28867 - }, - { - "epoch": 0.74, - "learning_rate": 1.7638026963672387e-06, - "loss": 0.8608, - "step": 28868 - }, - { - "epoch": 0.74, - "learning_rate": 1.763784836185974e-06, - "loss": 0.9199, - "step": 28869 - }, - { - "epoch": 0.74, - "learning_rate": 1.7637669754199146e-06, - "loss": 0.8857, - "step": 28870 - }, - { - "epoch": 0.74, - "learning_rate": 1.7637491140690734e-06, - "loss": 0.8359, - "step": 28871 - }, - { - "epoch": 0.74, - "learning_rate": 1.763731252133465e-06, - "loss": 0.6514, - "step": 28872 - }, - { - "epoch": 0.74, - "learning_rate": 1.7637133896131027e-06, - "loss": 0.708, - "step": 28873 - }, - { - "epoch": 0.74, - "learning_rate": 1.763695526508e-06, - "loss": 0.751, - "step": 28874 - }, - { - "epoch": 0.74, - "learning_rate": 1.763677662818171e-06, - "loss": 0.8613, - "step": 28875 - }, - { - "epoch": 0.74, - "learning_rate": 1.7636597985436287e-06, - "loss": 0.8213, - "step": 28876 - }, - { - "epoch": 0.74, - "learning_rate": 1.7636419336843875e-06, - "loss": 0.9736, - "step": 28877 - }, - { - "epoch": 0.74, - "learning_rate": 1.7636240682404608e-06, - "loss": 0.8379, - "step": 28878 - }, - { - "epoch": 0.74, - "learning_rate": 1.7636062022118622e-06, - "loss": 0.9512, - "step": 28879 - }, - { - "epoch": 0.74, - "learning_rate": 1.7635883355986057e-06, - "loss": 0.8965, - "step": 28880 - }, - { - "epoch": 0.74, - "learning_rate": 1.7635704684007044e-06, - "loss": 0.9824, - "step": 28881 - }, - { - "epoch": 0.74, - "learning_rate": 1.7635526006181722e-06, - "loss": 0.7212, - "step": 28882 - }, - { - "epoch": 0.74, - "learning_rate": 1.7635347322510232e-06, - "loss": 0.8262, - "step": 28883 - }, - { - "epoch": 0.74, - "learning_rate": 1.7635168632992707e-06, - "loss": 0.875, - "step": 28884 - }, - { - "epoch": 0.74, - "learning_rate": 1.7634989937629283e-06, - "loss": 0.6846, - "step": 28885 - }, - { - "epoch": 0.74, - "learning_rate": 1.76348112364201e-06, - "loss": 0.9355, - "step": 28886 - }, - { - "epoch": 0.74, - "learning_rate": 1.7634632529365292e-06, - "loss": 1.2227, - "step": 28887 - }, - { - "epoch": 0.74, - "learning_rate": 1.7634453816464995e-06, - "loss": 0.7319, - "step": 28888 - }, - { - "epoch": 0.74, - "learning_rate": 1.763427509771935e-06, - "loss": 0.8945, - "step": 28889 - }, - { - "epoch": 0.74, - "learning_rate": 1.7634096373128493e-06, - "loss": 0.6328, - "step": 28890 - }, - { - "epoch": 0.74, - "learning_rate": 1.7633917642692558e-06, - "loss": 0.8857, - "step": 28891 - }, - { - "epoch": 0.74, - "learning_rate": 1.7633738906411684e-06, - "loss": 1.0508, - "step": 28892 - }, - { - "epoch": 0.74, - "learning_rate": 1.7633560164286006e-06, - "loss": 0.7222, - "step": 28893 - }, - { - "epoch": 0.74, - "learning_rate": 1.763338141631566e-06, - "loss": 0.7842, - "step": 28894 - }, - { - "epoch": 0.74, - "learning_rate": 1.763320266250079e-06, - "loss": 0.6125, - "step": 28895 - }, - { - "epoch": 0.74, - "learning_rate": 1.7633023902841524e-06, - "loss": 0.832, - "step": 28896 - }, - { - "epoch": 0.74, - "learning_rate": 1.7632845137338005e-06, - "loss": 0.9805, - "step": 28897 - }, - { - "epoch": 0.74, - "learning_rate": 1.7632666365990363e-06, - "loss": 0.5728, - "step": 28898 - }, - { - "epoch": 0.74, - "learning_rate": 1.7632487588798743e-06, - "loss": 0.8057, - "step": 28899 - }, - { - "epoch": 0.74, - "learning_rate": 1.763230880576328e-06, - "loss": 0.9316, - "step": 28900 - }, - { - "epoch": 0.74, - "learning_rate": 1.7632130016884103e-06, - "loss": 0.8555, - "step": 28901 - }, - { - "epoch": 0.74, - "learning_rate": 1.763195122216136e-06, - "loss": 0.7764, - "step": 28902 - }, - { - "epoch": 0.74, - "learning_rate": 1.7631772421595178e-06, - "loss": 0.7246, - "step": 28903 - }, - { - "epoch": 0.74, - "learning_rate": 1.7631593615185705e-06, - "loss": 0.8379, - "step": 28904 - }, - { - "epoch": 0.74, - "learning_rate": 1.763141480293307e-06, - "loss": 0.7043, - "step": 28905 - }, - { - "epoch": 0.74, - "learning_rate": 1.7631235984837409e-06, - "loss": 1.0771, - "step": 28906 - }, - { - "epoch": 0.74, - "learning_rate": 1.7631057160898864e-06, - "loss": 0.8701, - "step": 28907 - }, - { - "epoch": 0.74, - "learning_rate": 1.7630878331117566e-06, - "loss": 1.1611, - "step": 28908 - }, - { - "epoch": 0.74, - "learning_rate": 1.763069949549366e-06, - "loss": 0.709, - "step": 28909 - }, - { - "epoch": 0.74, - "learning_rate": 1.7630520654027275e-06, - "loss": 0.9658, - "step": 28910 - }, - { - "epoch": 0.74, - "learning_rate": 1.763034180671855e-06, - "loss": 0.9102, - "step": 28911 - }, - { - "epoch": 0.74, - "learning_rate": 1.7630162953567627e-06, - "loss": 0.8691, - "step": 28912 - }, - { - "epoch": 0.74, - "learning_rate": 1.7629984094574636e-06, - "loss": 0.8516, - "step": 28913 - }, - { - "epoch": 0.74, - "learning_rate": 1.7629805229739718e-06, - "loss": 1.1572, - "step": 28914 - }, - { - "epoch": 0.74, - "learning_rate": 1.762962635906301e-06, - "loss": 0.8701, - "step": 28915 - }, - { - "epoch": 0.74, - "learning_rate": 1.7629447482544648e-06, - "loss": 0.7905, - "step": 28916 - }, - { - "epoch": 0.74, - "learning_rate": 1.7629268600184769e-06, - "loss": 0.8857, - "step": 28917 - }, - { - "epoch": 0.74, - "learning_rate": 1.7629089711983507e-06, - "loss": 0.9951, - "step": 28918 - }, - { - "epoch": 0.74, - "learning_rate": 1.7628910817941004e-06, - "loss": 0.6168, - "step": 28919 - }, - { - "epoch": 0.74, - "learning_rate": 1.7628731918057396e-06, - "loss": 0.8262, - "step": 28920 - }, - { - "epoch": 0.74, - "learning_rate": 1.7628553012332814e-06, - "loss": 0.9668, - "step": 28921 - }, - { - "epoch": 0.74, - "learning_rate": 1.7628374100767404e-06, - "loss": 0.9238, - "step": 28922 - }, - { - "epoch": 0.74, - "learning_rate": 1.76281951833613e-06, - "loss": 0.8721, - "step": 28923 - }, - { - "epoch": 0.74, - "learning_rate": 1.7628016260114634e-06, - "loss": 1.0332, - "step": 28924 - }, - { - "epoch": 0.74, - "learning_rate": 1.7627837331027547e-06, - "loss": 0.9395, - "step": 28925 - }, - { - "epoch": 0.74, - "learning_rate": 1.7627658396100178e-06, - "loss": 0.8496, - "step": 28926 - }, - { - "epoch": 0.74, - "learning_rate": 1.762747945533266e-06, - "loss": 0.834, - "step": 28927 - }, - { - "epoch": 0.74, - "learning_rate": 1.7627300508725132e-06, - "loss": 0.9551, - "step": 28928 - }, - { - "epoch": 0.74, - "learning_rate": 1.762712155627773e-06, - "loss": 0.8643, - "step": 28929 - }, - { - "epoch": 0.74, - "learning_rate": 1.7626942597990592e-06, - "loss": 0.9062, - "step": 28930 - }, - { - "epoch": 0.74, - "learning_rate": 1.7626763633863857e-06, - "loss": 0.7007, - "step": 28931 - }, - { - "epoch": 0.74, - "learning_rate": 1.762658466389766e-06, - "loss": 0.9502, - "step": 28932 - }, - { - "epoch": 0.74, - "learning_rate": 1.7626405688092134e-06, - "loss": 0.8584, - "step": 28933 - }, - { - "epoch": 0.74, - "learning_rate": 1.7626226706447421e-06, - "loss": 0.7898, - "step": 28934 - }, - { - "epoch": 0.74, - "learning_rate": 1.762604771896366e-06, - "loss": 0.9727, - "step": 28935 - }, - { - "epoch": 0.74, - "learning_rate": 1.762586872564098e-06, - "loss": 0.9346, - "step": 28936 - }, - { - "epoch": 0.74, - "learning_rate": 1.7625689726479526e-06, - "loss": 0.916, - "step": 28937 - }, - { - "epoch": 0.74, - "learning_rate": 1.7625510721479432e-06, - "loss": 0.9658, - "step": 28938 - }, - { - "epoch": 0.74, - "learning_rate": 1.7625331710640833e-06, - "loss": 0.7969, - "step": 28939 - }, - { - "epoch": 0.74, - "learning_rate": 1.762515269396387e-06, - "loss": 0.5625, - "step": 28940 - }, - { - "epoch": 0.74, - "learning_rate": 1.762497367144868e-06, - "loss": 0.9785, - "step": 28941 - }, - { - "epoch": 0.74, - "learning_rate": 1.7624794643095396e-06, - "loss": 0.918, - "step": 28942 - }, - { - "epoch": 0.74, - "learning_rate": 1.7624615608904156e-06, - "loss": 0.6248, - "step": 28943 - }, - { - "epoch": 0.74, - "learning_rate": 1.76244365688751e-06, - "loss": 0.7446, - "step": 28944 - }, - { - "epoch": 0.74, - "learning_rate": 1.7624257523008363e-06, - "loss": 0.915, - "step": 28945 - }, - { - "epoch": 0.74, - "learning_rate": 1.7624078471304084e-06, - "loss": 0.7585, - "step": 28946 - }, - { - "epoch": 0.74, - "learning_rate": 1.7623899413762399e-06, - "loss": 0.9648, - "step": 28947 - }, - { - "epoch": 0.74, - "learning_rate": 1.7623720350383443e-06, - "loss": 0.9551, - "step": 28948 - }, - { - "epoch": 0.74, - "learning_rate": 1.7623541281167356e-06, - "loss": 0.8584, - "step": 28949 - }, - { - "epoch": 0.74, - "learning_rate": 1.762336220611427e-06, - "loss": 0.572, - "step": 28950 - }, - { - "epoch": 0.74, - "learning_rate": 1.7623183125224332e-06, - "loss": 0.8203, - "step": 28951 - }, - { - "epoch": 0.74, - "learning_rate": 1.762300403849767e-06, - "loss": 0.9492, - "step": 28952 - }, - { - "epoch": 0.74, - "learning_rate": 1.7622824945934424e-06, - "loss": 0.8242, - "step": 28953 - }, - { - "epoch": 0.74, - "learning_rate": 1.7622645847534732e-06, - "loss": 0.7251, - "step": 28954 - }, - { - "epoch": 0.74, - "learning_rate": 1.7622466743298733e-06, - "loss": 1.0977, - "step": 28955 - }, - { - "epoch": 0.74, - "learning_rate": 1.7622287633226561e-06, - "loss": 0.7427, - "step": 28956 - }, - { - "epoch": 0.74, - "learning_rate": 1.7622108517318351e-06, - "loss": 0.8652, - "step": 28957 - }, - { - "epoch": 0.74, - "learning_rate": 1.7621929395574245e-06, - "loss": 1.0088, - "step": 28958 - }, - { - "epoch": 0.74, - "learning_rate": 1.7621750267994378e-06, - "loss": 0.6919, - "step": 28959 - }, - { - "epoch": 0.74, - "learning_rate": 1.7621571134578884e-06, - "loss": 0.8984, - "step": 28960 - }, - { - "epoch": 0.74, - "learning_rate": 1.7621391995327907e-06, - "loss": 0.7231, - "step": 28961 - }, - { - "epoch": 0.74, - "learning_rate": 1.762121285024158e-06, - "loss": 0.8564, - "step": 28962 - }, - { - "epoch": 0.74, - "learning_rate": 1.762103369932004e-06, - "loss": 0.7334, - "step": 28963 - }, - { - "epoch": 0.74, - "learning_rate": 1.7620854542563427e-06, - "loss": 0.7515, - "step": 28964 - }, - { - "epoch": 0.74, - "learning_rate": 1.7620675379971874e-06, - "loss": 0.7783, - "step": 28965 - }, - { - "epoch": 0.74, - "learning_rate": 1.762049621154552e-06, - "loss": 0.9316, - "step": 28966 - }, - { - "epoch": 0.74, - "learning_rate": 1.7620317037284504e-06, - "loss": 0.8184, - "step": 28967 - }, - { - "epoch": 0.74, - "learning_rate": 1.762013785718896e-06, - "loss": 0.6533, - "step": 28968 - }, - { - "epoch": 0.74, - "learning_rate": 1.761995867125903e-06, - "loss": 0.7495, - "step": 28969 - }, - { - "epoch": 0.74, - "learning_rate": 1.7619779479494845e-06, - "loss": 0.7974, - "step": 28970 - }, - { - "epoch": 0.74, - "learning_rate": 1.7619600281896548e-06, - "loss": 0.9521, - "step": 28971 - }, - { - "epoch": 0.74, - "learning_rate": 1.7619421078464269e-06, - "loss": 0.9062, - "step": 28972 - }, - { - "epoch": 0.74, - "learning_rate": 1.7619241869198154e-06, - "loss": 1.1006, - "step": 28973 - }, - { - "epoch": 0.74, - "learning_rate": 1.7619062654098333e-06, - "loss": 0.9277, - "step": 28974 - }, - { - "epoch": 0.74, - "learning_rate": 1.7618883433164947e-06, - "loss": 1.1689, - "step": 28975 - }, - { - "epoch": 0.74, - "learning_rate": 1.7618704206398132e-06, - "loss": 0.999, - "step": 28976 - }, - { - "epoch": 0.74, - "learning_rate": 1.7618524973798028e-06, - "loss": 0.7275, - "step": 28977 - }, - { - "epoch": 0.74, - "learning_rate": 1.7618345735364767e-06, - "loss": 1.0312, - "step": 28978 - }, - { - "epoch": 0.74, - "learning_rate": 1.761816649109849e-06, - "loss": 0.9375, - "step": 28979 - }, - { - "epoch": 0.74, - "learning_rate": 1.761798724099933e-06, - "loss": 0.957, - "step": 28980 - }, - { - "epoch": 0.74, - "learning_rate": 1.7617807985067432e-06, - "loss": 1.0137, - "step": 28981 - }, - { - "epoch": 0.74, - "learning_rate": 1.7617628723302927e-06, - "loss": 0.8359, - "step": 28982 - }, - { - "epoch": 0.74, - "learning_rate": 1.7617449455705954e-06, - "loss": 0.8828, - "step": 28983 - }, - { - "epoch": 0.74, - "learning_rate": 1.761727018227665e-06, - "loss": 0.8096, - "step": 28984 - }, - { - "epoch": 0.74, - "learning_rate": 1.7617090903015153e-06, - "loss": 0.4728, - "step": 28985 - }, - { - "epoch": 0.74, - "learning_rate": 1.7616911617921598e-06, - "loss": 0.9346, - "step": 28986 - }, - { - "epoch": 0.74, - "learning_rate": 1.7616732326996125e-06, - "loss": 0.6895, - "step": 28987 - }, - { - "epoch": 0.74, - "learning_rate": 1.761655303023887e-06, - "loss": 0.6963, - "step": 28988 - }, - { - "epoch": 0.74, - "learning_rate": 1.7616373727649974e-06, - "loss": 0.916, - "step": 28989 - }, - { - "epoch": 0.74, - "learning_rate": 1.7616194419229566e-06, - "loss": 0.792, - "step": 28990 - }, - { - "epoch": 0.74, - "learning_rate": 1.761601510497779e-06, - "loss": 0.7827, - "step": 28991 - }, - { - "epoch": 0.74, - "learning_rate": 1.761583578489478e-06, - "loss": 0.8691, - "step": 28992 - }, - { - "epoch": 0.74, - "learning_rate": 1.761565645898068e-06, - "loss": 0.8555, - "step": 28993 - }, - { - "epoch": 0.74, - "learning_rate": 1.7615477127235616e-06, - "loss": 0.8252, - "step": 28994 - }, - { - "epoch": 0.74, - "learning_rate": 1.7615297789659733e-06, - "loss": 0.9458, - "step": 28995 - }, - { - "epoch": 0.74, - "learning_rate": 1.7615118446253167e-06, - "loss": 0.6492, - "step": 28996 - }, - { - "epoch": 0.74, - "learning_rate": 1.7614939097016057e-06, - "loss": 0.9023, - "step": 28997 - }, - { - "epoch": 0.74, - "learning_rate": 1.7614759741948534e-06, - "loss": 0.709, - "step": 28998 - }, - { - "epoch": 0.74, - "learning_rate": 1.7614580381050743e-06, - "loss": 0.9658, - "step": 28999 - }, - { - "epoch": 0.74, - "learning_rate": 1.7614401014322819e-06, - "loss": 0.7598, - "step": 29000 - }, - { - "epoch": 0.74, - "learning_rate": 1.7614221641764896e-06, - "loss": 0.8569, - "step": 29001 - }, - { - "epoch": 0.74, - "learning_rate": 1.7614042263377113e-06, - "loss": 0.877, - "step": 29002 - }, - { - "epoch": 0.74, - "learning_rate": 1.7613862879159612e-06, - "loss": 0.9736, - "step": 29003 - }, - { - "epoch": 0.74, - "learning_rate": 1.7613683489112522e-06, - "loss": 0.874, - "step": 29004 - }, - { - "epoch": 0.74, - "learning_rate": 1.7613504093235985e-06, - "loss": 0.9951, - "step": 29005 - }, - { - "epoch": 0.74, - "learning_rate": 1.7613324691530139e-06, - "loss": 0.73, - "step": 29006 - }, - { - "epoch": 0.74, - "learning_rate": 1.761314528399512e-06, - "loss": 1.002, - "step": 29007 - }, - { - "epoch": 0.74, - "learning_rate": 1.7612965870631065e-06, - "loss": 0.8442, - "step": 29008 - }, - { - "epoch": 0.74, - "learning_rate": 1.7612786451438113e-06, - "loss": 0.8057, - "step": 29009 - }, - { - "epoch": 0.74, - "learning_rate": 1.7612607026416399e-06, - "loss": 0.8633, - "step": 29010 - }, - { - "epoch": 0.74, - "learning_rate": 1.7612427595566067e-06, - "loss": 0.9805, - "step": 29011 - }, - { - "epoch": 0.74, - "learning_rate": 1.7612248158887244e-06, - "loss": 0.5591, - "step": 29012 - }, - { - "epoch": 0.74, - "learning_rate": 1.7612068716380072e-06, - "loss": 0.9121, - "step": 29013 - }, - { - "epoch": 0.74, - "learning_rate": 1.7611889268044694e-06, - "loss": 0.937, - "step": 29014 - }, - { - "epoch": 0.74, - "learning_rate": 1.7611709813881239e-06, - "loss": 0.751, - "step": 29015 - }, - { - "epoch": 0.74, - "learning_rate": 1.7611530353889848e-06, - "loss": 0.8179, - "step": 29016 - }, - { - "epoch": 0.74, - "learning_rate": 1.7611350888070657e-06, - "loss": 0.9209, - "step": 29017 - }, - { - "epoch": 0.74, - "learning_rate": 1.7611171416423807e-06, - "loss": 0.9854, - "step": 29018 - }, - { - "epoch": 0.74, - "learning_rate": 1.7610991938949431e-06, - "loss": 0.8584, - "step": 29019 - }, - { - "epoch": 0.74, - "learning_rate": 1.761081245564767e-06, - "loss": 0.9219, - "step": 29020 - }, - { - "epoch": 0.74, - "learning_rate": 1.761063296651866e-06, - "loss": 0.8975, - "step": 29021 - }, - { - "epoch": 0.74, - "learning_rate": 1.7610453471562537e-06, - "loss": 0.6143, - "step": 29022 - }, - { - "epoch": 0.74, - "learning_rate": 1.761027397077944e-06, - "loss": 0.9453, - "step": 29023 - }, - { - "epoch": 0.74, - "learning_rate": 1.7610094464169506e-06, - "loss": 0.8301, - "step": 29024 - }, - { - "epoch": 0.74, - "learning_rate": 1.7609914951732874e-06, - "loss": 0.8457, - "step": 29025 - }, - { - "epoch": 0.74, - "learning_rate": 1.760973543346968e-06, - "loss": 0.9805, - "step": 29026 - }, - { - "epoch": 0.74, - "learning_rate": 1.760955590938006e-06, - "loss": 0.7656, - "step": 29027 - }, - { - "epoch": 0.74, - "learning_rate": 1.7609376379464153e-06, - "loss": 0.835, - "step": 29028 - }, - { - "epoch": 0.74, - "learning_rate": 1.7609196843722098e-06, - "loss": 0.8643, - "step": 29029 - }, - { - "epoch": 0.74, - "learning_rate": 1.7609017302154027e-06, - "loss": 0.9414, - "step": 29030 - }, - { - "epoch": 0.74, - "learning_rate": 1.7608837754760084e-06, - "loss": 0.7358, - "step": 29031 - }, - { - "epoch": 0.74, - "learning_rate": 1.7608658201540404e-06, - "loss": 0.8262, - "step": 29032 - }, - { - "epoch": 0.74, - "learning_rate": 1.7608478642495125e-06, - "loss": 0.8057, - "step": 29033 - }, - { - "epoch": 0.74, - "learning_rate": 1.7608299077624382e-06, - "loss": 0.7715, - "step": 29034 - }, - { - "epoch": 0.74, - "learning_rate": 1.7608119506928317e-06, - "loss": 0.9414, - "step": 29035 - }, - { - "epoch": 0.74, - "learning_rate": 1.7607939930407064e-06, - "loss": 0.832, - "step": 29036 - }, - { - "epoch": 0.74, - "learning_rate": 1.760776034806076e-06, - "loss": 0.9043, - "step": 29037 - }, - { - "epoch": 0.74, - "learning_rate": 1.7607580759889542e-06, - "loss": 0.5695, - "step": 29038 - }, - { - "epoch": 0.74, - "learning_rate": 1.7607401165893551e-06, - "loss": 0.9551, - "step": 29039 - }, - { - "epoch": 0.74, - "learning_rate": 1.7607221566072924e-06, - "loss": 0.7397, - "step": 29040 - }, - { - "epoch": 0.74, - "learning_rate": 1.7607041960427795e-06, - "loss": 0.7357, - "step": 29041 - }, - { - "epoch": 0.74, - "learning_rate": 1.7606862348958305e-06, - "loss": 0.875, - "step": 29042 - }, - { - "epoch": 0.74, - "learning_rate": 1.760668273166459e-06, - "loss": 0.6616, - "step": 29043 - }, - { - "epoch": 0.74, - "learning_rate": 1.7606503108546788e-06, - "loss": 0.8525, - "step": 29044 - }, - { - "epoch": 0.74, - "learning_rate": 1.7606323479605037e-06, - "loss": 0.8867, - "step": 29045 - }, - { - "epoch": 0.74, - "learning_rate": 1.7606143844839472e-06, - "loss": 0.9365, - "step": 29046 - }, - { - "epoch": 0.74, - "learning_rate": 1.7605964204250234e-06, - "loss": 0.7786, - "step": 29047 - }, - { - "epoch": 0.74, - "learning_rate": 1.760578455783746e-06, - "loss": 0.957, - "step": 29048 - }, - { - "epoch": 0.74, - "learning_rate": 1.7605604905601282e-06, - "loss": 0.8955, - "step": 29049 - }, - { - "epoch": 0.74, - "learning_rate": 1.7605425247541846e-06, - "loss": 1.0684, - "step": 29050 - }, - { - "epoch": 0.74, - "learning_rate": 1.7605245583659285e-06, - "loss": 0.8877, - "step": 29051 - }, - { - "epoch": 0.74, - "learning_rate": 1.7605065913953736e-06, - "loss": 0.9404, - "step": 29052 - }, - { - "epoch": 0.74, - "learning_rate": 1.7604886238425338e-06, - "loss": 0.9023, - "step": 29053 - }, - { - "epoch": 0.74, - "learning_rate": 1.7604706557074227e-06, - "loss": 0.918, - "step": 29054 - }, - { - "epoch": 0.74, - "learning_rate": 1.7604526869900545e-06, - "loss": 0.958, - "step": 29055 - }, - { - "epoch": 0.74, - "learning_rate": 1.7604347176904426e-06, - "loss": 0.7583, - "step": 29056 - }, - { - "epoch": 0.74, - "learning_rate": 1.7604167478086005e-06, - "loss": 0.9443, - "step": 29057 - }, - { - "epoch": 0.74, - "learning_rate": 1.7603987773445425e-06, - "loss": 0.7319, - "step": 29058 - }, - { - "epoch": 0.74, - "learning_rate": 1.7603808062982822e-06, - "loss": 0.9111, - "step": 29059 - }, - { - "epoch": 0.74, - "learning_rate": 1.7603628346698332e-06, - "loss": 1.0088, - "step": 29060 - }, - { - "epoch": 0.74, - "learning_rate": 1.7603448624592092e-06, - "loss": 0.9678, - "step": 29061 - }, - { - "epoch": 0.74, - "learning_rate": 1.7603268896664243e-06, - "loss": 0.7949, - "step": 29062 - }, - { - "epoch": 0.74, - "learning_rate": 1.7603089162914918e-06, - "loss": 0.7637, - "step": 29063 - }, - { - "epoch": 0.74, - "learning_rate": 1.7602909423344258e-06, - "loss": 0.7803, - "step": 29064 - }, - { - "epoch": 0.74, - "learning_rate": 1.7602729677952405e-06, - "loss": 0.791, - "step": 29065 - }, - { - "epoch": 0.74, - "learning_rate": 1.7602549926739484e-06, - "loss": 0.8042, - "step": 29066 - }, - { - "epoch": 0.75, - "learning_rate": 1.7602370169705646e-06, - "loss": 0.8438, - "step": 29067 - }, - { - "epoch": 0.75, - "learning_rate": 1.7602190406851016e-06, - "loss": 0.875, - "step": 29068 - }, - { - "epoch": 0.75, - "learning_rate": 1.7602010638175745e-06, - "loss": 0.7871, - "step": 29069 - }, - { - "epoch": 0.75, - "learning_rate": 1.7601830863679962e-06, - "loss": 1.0615, - "step": 29070 - }, - { - "epoch": 0.75, - "learning_rate": 1.7601651083363805e-06, - "loss": 0.8926, - "step": 29071 - }, - { - "epoch": 0.75, - "learning_rate": 1.7601471297227413e-06, - "loss": 0.5347, - "step": 29072 - }, - { - "epoch": 0.75, - "learning_rate": 1.7601291505270925e-06, - "loss": 0.7402, - "step": 29073 - }, - { - "epoch": 0.75, - "learning_rate": 1.7601111707494477e-06, - "loss": 0.7852, - "step": 29074 - }, - { - "epoch": 0.75, - "learning_rate": 1.760093190389821e-06, - "loss": 0.7744, - "step": 29075 - }, - { - "epoch": 0.75, - "learning_rate": 1.7600752094482255e-06, - "loss": 0.6675, - "step": 29076 - }, - { - "epoch": 0.75, - "learning_rate": 1.7600572279246756e-06, - "loss": 0.8599, - "step": 29077 - }, - { - "epoch": 0.75, - "learning_rate": 1.7600392458191849e-06, - "loss": 0.7728, - "step": 29078 - }, - { - "epoch": 0.75, - "learning_rate": 1.760021263131767e-06, - "loss": 0.8916, - "step": 29079 - }, - { - "epoch": 0.75, - "learning_rate": 1.7600032798624358e-06, - "loss": 0.8867, - "step": 29080 - }, - { - "epoch": 0.75, - "learning_rate": 1.7599852960112049e-06, - "loss": 0.8906, - "step": 29081 - }, - { - "epoch": 0.75, - "learning_rate": 1.7599673115780883e-06, - "loss": 0.8633, - "step": 29082 - }, - { - "epoch": 0.75, - "learning_rate": 1.7599493265630997e-06, - "loss": 0.7314, - "step": 29083 - }, - { - "epoch": 0.75, - "learning_rate": 1.7599313409662529e-06, - "loss": 0.9375, - "step": 29084 - }, - { - "epoch": 0.75, - "learning_rate": 1.7599133547875615e-06, - "loss": 0.7451, - "step": 29085 - }, - { - "epoch": 0.75, - "learning_rate": 1.7598953680270394e-06, - "loss": 1.043, - "step": 29086 - }, - { - "epoch": 0.75, - "learning_rate": 1.7598773806847005e-06, - "loss": 0.9629, - "step": 29087 - }, - { - "epoch": 0.75, - "learning_rate": 1.7598593927605582e-06, - "loss": 0.5767, - "step": 29088 - }, - { - "epoch": 0.75, - "learning_rate": 1.7598414042546265e-06, - "loss": 0.7192, - "step": 29089 - }, - { - "epoch": 0.75, - "learning_rate": 1.7598234151669193e-06, - "loss": 0.8457, - "step": 29090 - }, - { - "epoch": 0.75, - "learning_rate": 1.7598054254974501e-06, - "loss": 0.8135, - "step": 29091 - }, - { - "epoch": 0.75, - "learning_rate": 1.7597874352462332e-06, - "loss": 0.8828, - "step": 29092 - }, - { - "epoch": 0.75, - "learning_rate": 1.7597694444132815e-06, - "loss": 1.0449, - "step": 29093 - }, - { - "epoch": 0.75, - "learning_rate": 1.7597514529986096e-06, - "loss": 0.749, - "step": 29094 - }, - { - "epoch": 0.75, - "learning_rate": 1.7597334610022309e-06, - "loss": 0.624, - "step": 29095 - }, - { - "epoch": 0.75, - "learning_rate": 1.7597154684241592e-06, - "loss": 0.6152, - "step": 29096 - }, - { - "epoch": 0.75, - "learning_rate": 1.7596974752644082e-06, - "loss": 0.7871, - "step": 29097 - }, - { - "epoch": 0.75, - "learning_rate": 1.7596794815229919e-06, - "loss": 0.9248, - "step": 29098 - }, - { - "epoch": 0.75, - "learning_rate": 1.7596614871999237e-06, - "loss": 0.8799, - "step": 29099 - }, - { - "epoch": 0.75, - "learning_rate": 1.7596434922952182e-06, - "loss": 0.8403, - "step": 29100 - }, - { - "epoch": 0.75, - "learning_rate": 1.759625496808888e-06, - "loss": 1.04, - "step": 29101 - }, - { - "epoch": 0.75, - "learning_rate": 1.759607500740948e-06, - "loss": 0.8457, - "step": 29102 - }, - { - "epoch": 0.75, - "learning_rate": 1.7595895040914113e-06, - "loss": 0.9229, - "step": 29103 - }, - { - "epoch": 0.75, - "learning_rate": 1.7595715068602916e-06, - "loss": 0.8125, - "step": 29104 - }, - { - "epoch": 0.75, - "learning_rate": 1.7595535090476031e-06, - "loss": 0.8115, - "step": 29105 - }, - { - "epoch": 0.75, - "learning_rate": 1.7595355106533592e-06, - "loss": 1.0215, - "step": 29106 - }, - { - "epoch": 0.75, - "learning_rate": 1.7595175116775742e-06, - "loss": 0.9268, - "step": 29107 - }, - { - "epoch": 0.75, - "learning_rate": 1.7594995121202613e-06, - "loss": 1.0742, - "step": 29108 - }, - { - "epoch": 0.75, - "learning_rate": 1.7594815119814346e-06, - "loss": 1.0049, - "step": 29109 - }, - { - "epoch": 0.75, - "learning_rate": 1.759463511261108e-06, - "loss": 0.6343, - "step": 29110 - }, - { - "epoch": 0.75, - "learning_rate": 1.7594455099592952e-06, - "loss": 0.8242, - "step": 29111 - }, - { - "epoch": 0.75, - "learning_rate": 1.7594275080760097e-06, - "loss": 0.7976, - "step": 29112 - }, - { - "epoch": 0.75, - "learning_rate": 1.7594095056112655e-06, - "loss": 0.8623, - "step": 29113 - }, - { - "epoch": 0.75, - "learning_rate": 1.7593915025650761e-06, - "loss": 0.7393, - "step": 29114 - }, - { - "epoch": 0.75, - "learning_rate": 1.7593734989374559e-06, - "loss": 0.8096, - "step": 29115 - }, - { - "epoch": 0.75, - "learning_rate": 1.7593554947284182e-06, - "loss": 0.5864, - "step": 29116 - }, - { - "epoch": 0.75, - "learning_rate": 1.7593374899379767e-06, - "loss": 0.6895, - "step": 29117 - }, - { - "epoch": 0.75, - "learning_rate": 1.7593194845661458e-06, - "loss": 1.0146, - "step": 29118 - }, - { - "epoch": 0.75, - "learning_rate": 1.7593014786129388e-06, - "loss": 1.0586, - "step": 29119 - }, - { - "epoch": 0.75, - "learning_rate": 1.7592834720783694e-06, - "loss": 0.8369, - "step": 29120 - }, - { - "epoch": 0.75, - "learning_rate": 1.7592654649624517e-06, - "loss": 1.1377, - "step": 29121 - }, - { - "epoch": 0.75, - "learning_rate": 1.7592474572651992e-06, - "loss": 0.8574, - "step": 29122 - }, - { - "epoch": 0.75, - "learning_rate": 1.759229448986626e-06, - "loss": 0.9082, - "step": 29123 - }, - { - "epoch": 0.75, - "learning_rate": 1.7592114401267454e-06, - "loss": 1.0522, - "step": 29124 - }, - { - "epoch": 0.75, - "learning_rate": 1.7591934306855719e-06, - "loss": 0.7241, - "step": 29125 - }, - { - "epoch": 0.75, - "learning_rate": 1.7591754206631186e-06, - "loss": 0.6106, - "step": 29126 - }, - { - "epoch": 0.75, - "learning_rate": 1.7591574100593998e-06, - "loss": 0.6812, - "step": 29127 - }, - { - "epoch": 0.75, - "learning_rate": 1.759139398874429e-06, - "loss": 0.8848, - "step": 29128 - }, - { - "epoch": 0.75, - "learning_rate": 1.75912138710822e-06, - "loss": 0.876, - "step": 29129 - }, - { - "epoch": 0.75, - "learning_rate": 1.7591033747607868e-06, - "loss": 0.7852, - "step": 29130 - }, - { - "epoch": 0.75, - "learning_rate": 1.7590853618321431e-06, - "loss": 0.9756, - "step": 29131 - }, - { - "epoch": 0.75, - "learning_rate": 1.7590673483223023e-06, - "loss": 0.8701, - "step": 29132 - }, - { - "epoch": 0.75, - "learning_rate": 1.7590493342312788e-06, - "loss": 0.6606, - "step": 29133 - }, - { - "epoch": 0.75, - "learning_rate": 1.759031319559086e-06, - "loss": 0.7891, - "step": 29134 - }, - { - "epoch": 0.75, - "learning_rate": 1.7590133043057382e-06, - "loss": 0.8857, - "step": 29135 - }, - { - "epoch": 0.75, - "learning_rate": 1.7589952884712485e-06, - "loss": 0.8506, - "step": 29136 - }, - { - "epoch": 0.75, - "learning_rate": 1.7589772720556312e-06, - "loss": 0.835, - "step": 29137 - }, - { - "epoch": 0.75, - "learning_rate": 1.7589592550588996e-06, - "loss": 0.9941, - "step": 29138 - }, - { - "epoch": 0.75, - "learning_rate": 1.7589412374810677e-06, - "loss": 1.0068, - "step": 29139 - }, - { - "epoch": 0.75, - "learning_rate": 1.7589232193221498e-06, - "loss": 0.7666, - "step": 29140 - }, - { - "epoch": 0.75, - "learning_rate": 1.7589052005821592e-06, - "loss": 0.7715, - "step": 29141 - }, - { - "epoch": 0.75, - "learning_rate": 1.7588871812611095e-06, - "loss": 1.0645, - "step": 29142 - }, - { - "epoch": 0.75, - "learning_rate": 1.758869161359015e-06, - "loss": 0.9414, - "step": 29143 - }, - { - "epoch": 0.75, - "learning_rate": 1.758851140875889e-06, - "loss": 0.7241, - "step": 29144 - }, - { - "epoch": 0.75, - "learning_rate": 1.7588331198117462e-06, - "loss": 0.7964, - "step": 29145 - }, - { - "epoch": 0.75, - "learning_rate": 1.7588150981665992e-06, - "loss": 0.7803, - "step": 29146 - }, - { - "epoch": 0.75, - "learning_rate": 1.7587970759404627e-06, - "loss": 0.834, - "step": 29147 - }, - { - "epoch": 0.75, - "learning_rate": 1.75877905313335e-06, - "loss": 0.5481, - "step": 29148 - }, - { - "epoch": 0.75, - "learning_rate": 1.7587610297452748e-06, - "loss": 0.9141, - "step": 29149 - }, - { - "epoch": 0.75, - "learning_rate": 1.7587430057762517e-06, - "loss": 0.7401, - "step": 29150 - }, - { - "epoch": 0.75, - "learning_rate": 1.7587249812262938e-06, - "loss": 0.7393, - "step": 29151 - }, - { - "epoch": 0.75, - "learning_rate": 1.758706956095415e-06, - "loss": 0.7266, - "step": 29152 - }, - { - "epoch": 0.75, - "learning_rate": 1.758688930383629e-06, - "loss": 0.8599, - "step": 29153 - }, - { - "epoch": 0.75, - "learning_rate": 1.75867090409095e-06, - "loss": 0.832, - "step": 29154 - }, - { - "epoch": 0.75, - "learning_rate": 1.7586528772173917e-06, - "loss": 0.8955, - "step": 29155 - }, - { - "epoch": 0.75, - "learning_rate": 1.7586348497629676e-06, - "loss": 0.9717, - "step": 29156 - }, - { - "epoch": 0.75, - "learning_rate": 1.7586168217276916e-06, - "loss": 0.8164, - "step": 29157 - }, - { - "epoch": 0.75, - "learning_rate": 1.7585987931115777e-06, - "loss": 0.793, - "step": 29158 - }, - { - "epoch": 0.75, - "learning_rate": 1.7585807639146395e-06, - "loss": 0.9199, - "step": 29159 - }, - { - "epoch": 0.75, - "learning_rate": 1.758562734136891e-06, - "loss": 1.0996, - "step": 29160 - }, - { - "epoch": 0.75, - "learning_rate": 1.7585447037783458e-06, - "loss": 0.7407, - "step": 29161 - }, - { - "epoch": 0.75, - "learning_rate": 1.7585266728390179e-06, - "loss": 0.8291, - "step": 29162 - }, - { - "epoch": 0.75, - "learning_rate": 1.7585086413189207e-06, - "loss": 0.9473, - "step": 29163 - }, - { - "epoch": 0.75, - "learning_rate": 1.7584906092180685e-06, - "loss": 0.7959, - "step": 29164 - }, - { - "epoch": 0.75, - "learning_rate": 1.7584725765364751e-06, - "loss": 0.7188, - "step": 29165 - }, - { - "epoch": 0.75, - "learning_rate": 1.758454543274154e-06, - "loss": 0.7344, - "step": 29166 - }, - { - "epoch": 0.75, - "learning_rate": 1.7584365094311192e-06, - "loss": 0.8555, - "step": 29167 - }, - { - "epoch": 0.75, - "learning_rate": 1.7584184750073842e-06, - "loss": 0.7559, - "step": 29168 - }, - { - "epoch": 0.75, - "learning_rate": 1.7584004400029632e-06, - "loss": 0.749, - "step": 29169 - }, - { - "epoch": 0.75, - "learning_rate": 1.7583824044178698e-06, - "loss": 0.9541, - "step": 29170 - }, - { - "epoch": 0.75, - "learning_rate": 1.758364368252118e-06, - "loss": 0.7866, - "step": 29171 - }, - { - "epoch": 0.75, - "learning_rate": 1.7583463315057214e-06, - "loss": 0.834, - "step": 29172 - }, - { - "epoch": 0.75, - "learning_rate": 1.7583282941786938e-06, - "loss": 0.7803, - "step": 29173 - }, - { - "epoch": 0.75, - "learning_rate": 1.7583102562710492e-06, - "loss": 0.7549, - "step": 29174 - }, - { - "epoch": 0.75, - "learning_rate": 1.7582922177828014e-06, - "loss": 0.771, - "step": 29175 - }, - { - "epoch": 0.75, - "learning_rate": 1.758274178713964e-06, - "loss": 1.0029, - "step": 29176 - }, - { - "epoch": 0.75, - "learning_rate": 1.7582561390645507e-06, - "loss": 0.8105, - "step": 29177 - }, - { - "epoch": 0.75, - "learning_rate": 1.758238098834576e-06, - "loss": 0.7988, - "step": 29178 - }, - { - "epoch": 0.75, - "learning_rate": 1.7582200580240529e-06, - "loss": 0.8135, - "step": 29179 - }, - { - "epoch": 0.75, - "learning_rate": 1.7582020166329956e-06, - "loss": 0.8154, - "step": 29180 - }, - { - "epoch": 0.75, - "learning_rate": 1.758183974661418e-06, - "loss": 0.7646, - "step": 29181 - }, - { - "epoch": 0.75, - "learning_rate": 1.7581659321093338e-06, - "loss": 0.9268, - "step": 29182 - }, - { - "epoch": 0.75, - "learning_rate": 1.7581478889767567e-06, - "loss": 0.6875, - "step": 29183 - }, - { - "epoch": 0.75, - "learning_rate": 1.7581298452637005e-06, - "loss": 0.8169, - "step": 29184 - }, - { - "epoch": 0.75, - "learning_rate": 1.7581118009701794e-06, - "loss": 1.1191, - "step": 29185 - }, - { - "epoch": 0.75, - "learning_rate": 1.758093756096207e-06, - "loss": 0.9551, - "step": 29186 - }, - { - "epoch": 0.75, - "learning_rate": 1.7580757106417968e-06, - "loss": 0.7451, - "step": 29187 - }, - { - "epoch": 0.75, - "learning_rate": 1.7580576646069632e-06, - "loss": 0.9619, - "step": 29188 - }, - { - "epoch": 0.75, - "learning_rate": 1.7580396179917195e-06, - "loss": 0.8945, - "step": 29189 - }, - { - "epoch": 0.75, - "learning_rate": 1.7580215707960795e-06, - "loss": 0.793, - "step": 29190 - }, - { - "epoch": 0.75, - "learning_rate": 1.7580035230200576e-06, - "loss": 0.8936, - "step": 29191 - }, - { - "epoch": 0.75, - "learning_rate": 1.757985474663667e-06, - "loss": 0.917, - "step": 29192 - }, - { - "epoch": 0.75, - "learning_rate": 1.7579674257269218e-06, - "loss": 0.9131, - "step": 29193 - }, - { - "epoch": 0.75, - "learning_rate": 1.757949376209836e-06, - "loss": 0.873, - "step": 29194 - }, - { - "epoch": 0.75, - "learning_rate": 1.7579313261124234e-06, - "loss": 1.0, - "step": 29195 - }, - { - "epoch": 0.75, - "learning_rate": 1.7579132754346972e-06, - "loss": 0.7949, - "step": 29196 - }, - { - "epoch": 0.75, - "learning_rate": 1.7578952241766718e-06, - "loss": 0.9951, - "step": 29197 - }, - { - "epoch": 0.75, - "learning_rate": 1.757877172338361e-06, - "loss": 0.8633, - "step": 29198 - }, - { - "epoch": 0.75, - "learning_rate": 1.7578591199197782e-06, - "loss": 0.9844, - "step": 29199 - }, - { - "epoch": 0.75, - "learning_rate": 1.757841066920938e-06, - "loss": 0.7407, - "step": 29200 - }, - { - "epoch": 0.75, - "learning_rate": 1.7578230133418533e-06, - "loss": 0.7402, - "step": 29201 - }, - { - "epoch": 0.75, - "learning_rate": 1.7578049591825386e-06, - "loss": 0.96, - "step": 29202 - }, - { - "epoch": 0.75, - "learning_rate": 1.7577869044430074e-06, - "loss": 0.9541, - "step": 29203 - }, - { - "epoch": 0.75, - "learning_rate": 1.7577688491232737e-06, - "loss": 0.9297, - "step": 29204 - }, - { - "epoch": 0.75, - "learning_rate": 1.757750793223351e-06, - "loss": 0.8105, - "step": 29205 - }, - { - "epoch": 0.75, - "learning_rate": 1.7577327367432535e-06, - "loss": 0.873, - "step": 29206 - }, - { - "epoch": 0.75, - "learning_rate": 1.7577146796829948e-06, - "loss": 0.9424, - "step": 29207 - }, - { - "epoch": 0.75, - "learning_rate": 1.7576966220425888e-06, - "loss": 0.8271, - "step": 29208 - }, - { - "epoch": 0.75, - "learning_rate": 1.7576785638220497e-06, - "loss": 0.998, - "step": 29209 - }, - { - "epoch": 0.75, - "learning_rate": 1.7576605050213905e-06, - "loss": 0.9941, - "step": 29210 - }, - { - "epoch": 0.75, - "learning_rate": 1.7576424456406259e-06, - "loss": 1.1641, - "step": 29211 - }, - { - "epoch": 0.75, - "learning_rate": 1.7576243856797689e-06, - "loss": 0.8906, - "step": 29212 - }, - { - "epoch": 0.75, - "learning_rate": 1.757606325138834e-06, - "loss": 0.9492, - "step": 29213 - }, - { - "epoch": 0.75, - "learning_rate": 1.7575882640178348e-06, - "loss": 0.6353, - "step": 29214 - }, - { - "epoch": 0.75, - "learning_rate": 1.7575702023167848e-06, - "loss": 0.5163, - "step": 29215 - }, - { - "epoch": 0.75, - "learning_rate": 1.7575521400356986e-06, - "loss": 0.7764, - "step": 29216 - }, - { - "epoch": 0.75, - "learning_rate": 1.7575340771745893e-06, - "loss": 0.9102, - "step": 29217 - }, - { - "epoch": 0.75, - "learning_rate": 1.757516013733471e-06, - "loss": 0.79, - "step": 29218 - }, - { - "epoch": 0.75, - "learning_rate": 1.7574979497123574e-06, - "loss": 1.001, - "step": 29219 - }, - { - "epoch": 0.75, - "learning_rate": 1.7574798851112625e-06, - "loss": 0.7822, - "step": 29220 - }, - { - "epoch": 0.75, - "learning_rate": 1.7574618199302004e-06, - "loss": 0.7891, - "step": 29221 - }, - { - "epoch": 0.75, - "learning_rate": 1.7574437541691842e-06, - "loss": 1.0166, - "step": 29222 - }, - { - "epoch": 0.75, - "learning_rate": 1.7574256878282284e-06, - "loss": 0.7227, - "step": 29223 - }, - { - "epoch": 0.75, - "learning_rate": 1.7574076209073466e-06, - "loss": 0.6729, - "step": 29224 - }, - { - "epoch": 0.75, - "learning_rate": 1.7573895534065523e-06, - "loss": 0.8105, - "step": 29225 - }, - { - "epoch": 0.75, - "learning_rate": 1.7573714853258598e-06, - "loss": 0.7021, - "step": 29226 - }, - { - "epoch": 0.75, - "learning_rate": 1.7573534166652829e-06, - "loss": 0.8154, - "step": 29227 - }, - { - "epoch": 0.75, - "learning_rate": 1.7573353474248354e-06, - "loss": 0.9531, - "step": 29228 - }, - { - "epoch": 0.75, - "learning_rate": 1.7573172776045306e-06, - "loss": 0.9756, - "step": 29229 - }, - { - "epoch": 0.75, - "learning_rate": 1.757299207204383e-06, - "loss": 0.7393, - "step": 29230 - }, - { - "epoch": 0.75, - "learning_rate": 1.7572811362244064e-06, - "loss": 0.9814, - "step": 29231 - }, - { - "epoch": 0.75, - "learning_rate": 1.7572630646646144e-06, - "loss": 0.7002, - "step": 29232 - }, - { - "epoch": 0.75, - "learning_rate": 1.7572449925250207e-06, - "loss": 0.9224, - "step": 29233 - }, - { - "epoch": 0.75, - "learning_rate": 1.7572269198056395e-06, - "loss": 1.0605, - "step": 29234 - }, - { - "epoch": 0.75, - "learning_rate": 1.7572088465064844e-06, - "loss": 0.9443, - "step": 29235 - }, - { - "epoch": 0.75, - "learning_rate": 1.7571907726275693e-06, - "loss": 0.7275, - "step": 29236 - }, - { - "epoch": 0.75, - "learning_rate": 1.757172698168908e-06, - "loss": 1.043, - "step": 29237 - }, - { - "epoch": 0.75, - "learning_rate": 1.7571546231305146e-06, - "loss": 1.0615, - "step": 29238 - }, - { - "epoch": 0.75, - "learning_rate": 1.7571365475124024e-06, - "loss": 0.7061, - "step": 29239 - }, - { - "epoch": 0.75, - "learning_rate": 1.757118471314586e-06, - "loss": 0.9043, - "step": 29240 - }, - { - "epoch": 0.75, - "learning_rate": 1.7571003945370784e-06, - "loss": 0.79, - "step": 29241 - }, - { - "epoch": 0.75, - "learning_rate": 1.7570823171798941e-06, - "loss": 0.9521, - "step": 29242 - }, - { - "epoch": 0.75, - "learning_rate": 1.7570642392430464e-06, - "loss": 0.8242, - "step": 29243 - }, - { - "epoch": 0.75, - "learning_rate": 1.7570461607265497e-06, - "loss": 0.8428, - "step": 29244 - }, - { - "epoch": 0.75, - "learning_rate": 1.7570280816304176e-06, - "loss": 0.8057, - "step": 29245 - }, - { - "epoch": 0.75, - "learning_rate": 1.7570100019546636e-06, - "loss": 0.7437, - "step": 29246 - }, - { - "epoch": 0.75, - "learning_rate": 1.7569919216993018e-06, - "loss": 0.9785, - "step": 29247 - }, - { - "epoch": 0.75, - "learning_rate": 1.7569738408643463e-06, - "loss": 0.9473, - "step": 29248 - }, - { - "epoch": 0.75, - "learning_rate": 1.756955759449811e-06, - "loss": 0.9258, - "step": 29249 - }, - { - "epoch": 0.75, - "learning_rate": 1.756937677455709e-06, - "loss": 0.8325, - "step": 29250 - }, - { - "epoch": 0.75, - "learning_rate": 1.756919594882055e-06, - "loss": 0.9531, - "step": 29251 - }, - { - "epoch": 0.75, - "learning_rate": 1.756901511728862e-06, - "loss": 0.6982, - "step": 29252 - }, - { - "epoch": 0.75, - "learning_rate": 1.7568834279961448e-06, - "loss": 0.7842, - "step": 29253 - }, - { - "epoch": 0.75, - "learning_rate": 1.7568653436839167e-06, - "loss": 0.8945, - "step": 29254 - }, - { - "epoch": 0.75, - "learning_rate": 1.7568472587921911e-06, - "loss": 0.9531, - "step": 29255 - }, - { - "epoch": 0.75, - "learning_rate": 1.756829173320983e-06, - "loss": 0.7832, - "step": 29256 - }, - { - "epoch": 0.75, - "learning_rate": 1.7568110872703055e-06, - "loss": 0.7363, - "step": 29257 - }, - { - "epoch": 0.75, - "learning_rate": 1.7567930006401723e-06, - "loss": 0.7891, - "step": 29258 - }, - { - "epoch": 0.75, - "learning_rate": 1.7567749134305977e-06, - "loss": 0.6631, - "step": 29259 - }, - { - "epoch": 0.75, - "learning_rate": 1.7567568256415953e-06, - "loss": 0.9561, - "step": 29260 - }, - { - "epoch": 0.75, - "learning_rate": 1.7567387372731788e-06, - "loss": 0.6631, - "step": 29261 - }, - { - "epoch": 0.75, - "learning_rate": 1.7567206483253623e-06, - "loss": 0.9473, - "step": 29262 - }, - { - "epoch": 0.75, - "learning_rate": 1.7567025587981596e-06, - "loss": 0.9482, - "step": 29263 - }, - { - "epoch": 0.75, - "learning_rate": 1.7566844686915847e-06, - "loss": 0.8569, - "step": 29264 - }, - { - "epoch": 0.75, - "learning_rate": 1.7566663780056513e-06, - "loss": 0.9736, - "step": 29265 - }, - { - "epoch": 0.75, - "learning_rate": 1.756648286740373e-06, - "loss": 0.8721, - "step": 29266 - }, - { - "epoch": 0.75, - "learning_rate": 1.7566301948957643e-06, - "loss": 0.7852, - "step": 29267 - }, - { - "epoch": 0.75, - "learning_rate": 1.7566121024718381e-06, - "loss": 0.7271, - "step": 29268 - }, - { - "epoch": 0.75, - "learning_rate": 1.7565940094686091e-06, - "loss": 0.8105, - "step": 29269 - }, - { - "epoch": 0.75, - "learning_rate": 1.7565759158860911e-06, - "loss": 0.8633, - "step": 29270 - }, - { - "epoch": 0.75, - "learning_rate": 1.7565578217242973e-06, - "loss": 0.8267, - "step": 29271 - }, - { - "epoch": 0.75, - "learning_rate": 1.7565397269832423e-06, - "loss": 0.8193, - "step": 29272 - }, - { - "epoch": 0.75, - "learning_rate": 1.7565216316629395e-06, - "loss": 0.8867, - "step": 29273 - }, - { - "epoch": 0.75, - "learning_rate": 1.7565035357634029e-06, - "loss": 0.9229, - "step": 29274 - }, - { - "epoch": 0.75, - "learning_rate": 1.756485439284646e-06, - "loss": 0.9668, - "step": 29275 - }, - { - "epoch": 0.75, - "learning_rate": 1.7564673422266833e-06, - "loss": 0.7998, - "step": 29276 - }, - { - "epoch": 0.75, - "learning_rate": 1.7564492445895283e-06, - "loss": 0.7866, - "step": 29277 - }, - { - "epoch": 0.75, - "learning_rate": 1.7564311463731948e-06, - "loss": 0.959, - "step": 29278 - }, - { - "epoch": 0.75, - "learning_rate": 1.756413047577697e-06, - "loss": 0.999, - "step": 29279 - }, - { - "epoch": 0.75, - "learning_rate": 1.7563949482030483e-06, - "loss": 0.8594, - "step": 29280 - }, - { - "epoch": 0.75, - "learning_rate": 1.7563768482492626e-06, - "loss": 0.7036, - "step": 29281 - }, - { - "epoch": 0.75, - "learning_rate": 1.7563587477163542e-06, - "loss": 0.6567, - "step": 29282 - }, - { - "epoch": 0.75, - "learning_rate": 1.7563406466043367e-06, - "loss": 0.6025, - "step": 29283 - }, - { - "epoch": 0.75, - "learning_rate": 1.7563225449132238e-06, - "loss": 0.8086, - "step": 29284 - }, - { - "epoch": 0.75, - "learning_rate": 1.7563044426430296e-06, - "loss": 0.9141, - "step": 29285 - }, - { - "epoch": 0.75, - "learning_rate": 1.756286339793768e-06, - "loss": 0.9805, - "step": 29286 - }, - { - "epoch": 0.75, - "learning_rate": 1.7562682363654524e-06, - "loss": 0.9287, - "step": 29287 - }, - { - "epoch": 0.75, - "learning_rate": 1.7562501323580971e-06, - "loss": 0.9355, - "step": 29288 - }, - { - "epoch": 0.75, - "learning_rate": 1.7562320277717159e-06, - "loss": 1.0068, - "step": 29289 - }, - { - "epoch": 0.75, - "learning_rate": 1.7562139226063226e-06, - "loss": 0.7764, - "step": 29290 - }, - { - "epoch": 0.75, - "learning_rate": 1.756195816861931e-06, - "loss": 0.8174, - "step": 29291 - }, - { - "epoch": 0.75, - "learning_rate": 1.756177710538555e-06, - "loss": 0.6621, - "step": 29292 - }, - { - "epoch": 0.75, - "learning_rate": 1.7561596036362087e-06, - "loss": 0.8389, - "step": 29293 - }, - { - "epoch": 0.75, - "learning_rate": 1.756141496154906e-06, - "loss": 0.7896, - "step": 29294 - }, - { - "epoch": 0.75, - "learning_rate": 1.7561233880946599e-06, - "loss": 0.7705, - "step": 29295 - }, - { - "epoch": 0.75, - "learning_rate": 1.7561052794554852e-06, - "loss": 0.8027, - "step": 29296 - }, - { - "epoch": 0.75, - "learning_rate": 1.7560871702373954e-06, - "loss": 0.8867, - "step": 29297 - }, - { - "epoch": 0.75, - "learning_rate": 1.7560690604404044e-06, - "loss": 0.8789, - "step": 29298 - }, - { - "epoch": 0.75, - "learning_rate": 1.7560509500645263e-06, - "loss": 0.8442, - "step": 29299 - }, - { - "epoch": 0.75, - "learning_rate": 1.7560328391097744e-06, - "loss": 0.9785, - "step": 29300 - }, - { - "epoch": 0.75, - "learning_rate": 1.7560147275761632e-06, - "loss": 0.6812, - "step": 29301 - }, - { - "epoch": 0.75, - "learning_rate": 1.7559966154637062e-06, - "loss": 0.7842, - "step": 29302 - }, - { - "epoch": 0.75, - "learning_rate": 1.7559785027724171e-06, - "loss": 0.791, - "step": 29303 - }, - { - "epoch": 0.75, - "learning_rate": 1.7559603895023104e-06, - "loss": 0.8164, - "step": 29304 - }, - { - "epoch": 0.75, - "learning_rate": 1.7559422756533997e-06, - "loss": 1.0254, - "step": 29305 - }, - { - "epoch": 0.75, - "learning_rate": 1.7559241612256984e-06, - "loss": 0.9922, - "step": 29306 - }, - { - "epoch": 0.75, - "learning_rate": 1.7559060462192207e-06, - "loss": 0.6636, - "step": 29307 - }, - { - "epoch": 0.75, - "learning_rate": 1.755887930633981e-06, - "loss": 0.7988, - "step": 29308 - }, - { - "epoch": 0.75, - "learning_rate": 1.7558698144699919e-06, - "loss": 0.7832, - "step": 29309 - }, - { - "epoch": 0.75, - "learning_rate": 1.7558516977272686e-06, - "loss": 0.7783, - "step": 29310 - }, - { - "epoch": 0.75, - "learning_rate": 1.7558335804058241e-06, - "loss": 0.6406, - "step": 29311 - }, - { - "epoch": 0.75, - "learning_rate": 1.755815462505673e-06, - "loss": 0.916, - "step": 29312 - }, - { - "epoch": 0.75, - "learning_rate": 1.7557973440268284e-06, - "loss": 0.958, - "step": 29313 - }, - { - "epoch": 0.75, - "learning_rate": 1.7557792249693047e-06, - "loss": 0.8291, - "step": 29314 - }, - { - "epoch": 0.75, - "learning_rate": 1.7557611053331154e-06, - "loss": 0.9023, - "step": 29315 - }, - { - "epoch": 0.75, - "learning_rate": 1.7557429851182748e-06, - "loss": 0.9961, - "step": 29316 - }, - { - "epoch": 0.75, - "learning_rate": 1.7557248643247964e-06, - "loss": 0.9648, - "step": 29317 - }, - { - "epoch": 0.75, - "learning_rate": 1.7557067429526942e-06, - "loss": 0.8691, - "step": 29318 - }, - { - "epoch": 0.75, - "learning_rate": 1.7556886210019822e-06, - "loss": 0.7041, - "step": 29319 - }, - { - "epoch": 0.75, - "learning_rate": 1.755670498472674e-06, - "loss": 1.0322, - "step": 29320 - }, - { - "epoch": 0.75, - "learning_rate": 1.7556523753647838e-06, - "loss": 0.7217, - "step": 29321 - }, - { - "epoch": 0.75, - "learning_rate": 1.7556342516783254e-06, - "loss": 0.9082, - "step": 29322 - }, - { - "epoch": 0.75, - "learning_rate": 1.7556161274133124e-06, - "loss": 0.4453, - "step": 29323 - }, - { - "epoch": 0.75, - "learning_rate": 1.755598002569759e-06, - "loss": 0.5957, - "step": 29324 - }, - { - "epoch": 0.75, - "learning_rate": 1.7555798771476788e-06, - "loss": 0.7715, - "step": 29325 - }, - { - "epoch": 0.75, - "learning_rate": 1.755561751147086e-06, - "loss": 0.8984, - "step": 29326 - }, - { - "epoch": 0.75, - "learning_rate": 1.7555436245679943e-06, - "loss": 0.811, - "step": 29327 - }, - { - "epoch": 0.75, - "learning_rate": 1.7555254974104173e-06, - "loss": 0.6172, - "step": 29328 - }, - { - "epoch": 0.75, - "learning_rate": 1.7555073696743696e-06, - "loss": 0.8291, - "step": 29329 - }, - { - "epoch": 0.75, - "learning_rate": 1.7554892413598643e-06, - "loss": 0.9629, - "step": 29330 - }, - { - "epoch": 0.75, - "learning_rate": 1.755471112466916e-06, - "loss": 0.9648, - "step": 29331 - }, - { - "epoch": 0.75, - "learning_rate": 1.7554529829955378e-06, - "loss": 0.833, - "step": 29332 - }, - { - "epoch": 0.75, - "learning_rate": 1.7554348529457444e-06, - "loss": 0.6108, - "step": 29333 - }, - { - "epoch": 0.75, - "learning_rate": 1.755416722317549e-06, - "loss": 0.7832, - "step": 29334 - }, - { - "epoch": 0.75, - "learning_rate": 1.7553985911109658e-06, - "loss": 0.9634, - "step": 29335 - }, - { - "epoch": 0.75, - "learning_rate": 1.7553804593260087e-06, - "loss": 0.9707, - "step": 29336 - }, - { - "epoch": 0.75, - "learning_rate": 1.7553623269626914e-06, - "loss": 0.8564, - "step": 29337 - }, - { - "epoch": 0.75, - "learning_rate": 1.7553441940210278e-06, - "loss": 1.1221, - "step": 29338 - }, - { - "epoch": 0.75, - "learning_rate": 1.7553260605010323e-06, - "loss": 0.9502, - "step": 29339 - }, - { - "epoch": 0.75, - "learning_rate": 1.7553079264027177e-06, - "loss": 0.8457, - "step": 29340 - }, - { - "epoch": 0.75, - "learning_rate": 1.7552897917260992e-06, - "loss": 0.9775, - "step": 29341 - }, - { - "epoch": 0.75, - "learning_rate": 1.7552716564711899e-06, - "loss": 0.8379, - "step": 29342 - }, - { - "epoch": 0.75, - "learning_rate": 1.7552535206380035e-06, - "loss": 0.9189, - "step": 29343 - }, - { - "epoch": 0.75, - "learning_rate": 1.7552353842265544e-06, - "loss": 0.9004, - "step": 29344 - }, - { - "epoch": 0.75, - "learning_rate": 1.7552172472368562e-06, - "loss": 0.8789, - "step": 29345 - }, - { - "epoch": 0.75, - "learning_rate": 1.7551991096689229e-06, - "loss": 0.6431, - "step": 29346 - }, - { - "epoch": 0.75, - "learning_rate": 1.7551809715227685e-06, - "loss": 0.7124, - "step": 29347 - }, - { - "epoch": 0.75, - "learning_rate": 1.7551628327984067e-06, - "loss": 0.667, - "step": 29348 - }, - { - "epoch": 0.75, - "learning_rate": 1.7551446934958516e-06, - "loss": 0.9844, - "step": 29349 - }, - { - "epoch": 0.75, - "learning_rate": 1.7551265536151166e-06, - "loss": 0.8096, - "step": 29350 - }, - { - "epoch": 0.75, - "learning_rate": 1.7551084131562162e-06, - "loss": 0.8408, - "step": 29351 - }, - { - "epoch": 0.75, - "learning_rate": 1.755090272119164e-06, - "loss": 0.9844, - "step": 29352 - }, - { - "epoch": 0.75, - "learning_rate": 1.7550721305039734e-06, - "loss": 1.0488, - "step": 29353 - }, - { - "epoch": 0.75, - "learning_rate": 1.7550539883106596e-06, - "loss": 0.8457, - "step": 29354 - }, - { - "epoch": 0.75, - "learning_rate": 1.7550358455392352e-06, - "loss": 0.9697, - "step": 29355 - }, - { - "epoch": 0.75, - "learning_rate": 1.7550177021897146e-06, - "loss": 0.8506, - "step": 29356 - }, - { - "epoch": 0.75, - "learning_rate": 1.7549995582621118e-06, - "loss": 0.71, - "step": 29357 - }, - { - "epoch": 0.75, - "learning_rate": 1.7549814137564402e-06, - "loss": 0.8711, - "step": 29358 - }, - { - "epoch": 0.75, - "learning_rate": 1.7549632686727145e-06, - "loss": 0.7583, - "step": 29359 - }, - { - "epoch": 0.75, - "learning_rate": 1.7549451230109477e-06, - "loss": 0.6836, - "step": 29360 - }, - { - "epoch": 0.75, - "learning_rate": 1.7549269767711548e-06, - "loss": 0.9102, - "step": 29361 - }, - { - "epoch": 0.75, - "learning_rate": 1.7549088299533484e-06, - "loss": 0.917, - "step": 29362 - }, - { - "epoch": 0.75, - "learning_rate": 1.7548906825575431e-06, - "loss": 0.8975, - "step": 29363 - }, - { - "epoch": 0.75, - "learning_rate": 1.754872534583753e-06, - "loss": 0.7061, - "step": 29364 - }, - { - "epoch": 0.75, - "learning_rate": 1.7548543860319916e-06, - "loss": 0.9521, - "step": 29365 - }, - { - "epoch": 0.75, - "learning_rate": 1.7548362369022727e-06, - "loss": 0.8506, - "step": 29366 - }, - { - "epoch": 0.75, - "learning_rate": 1.7548180871946102e-06, - "loss": 0.9023, - "step": 29367 - }, - { - "epoch": 0.75, - "learning_rate": 1.754799936909019e-06, - "loss": 1.1436, - "step": 29368 - }, - { - "epoch": 0.75, - "learning_rate": 1.7547817860455116e-06, - "loss": 0.7109, - "step": 29369 - }, - { - "epoch": 0.75, - "learning_rate": 1.7547636346041025e-06, - "loss": 0.8813, - "step": 29370 - }, - { - "epoch": 0.75, - "learning_rate": 1.754745482584806e-06, - "loss": 0.8096, - "step": 29371 - }, - { - "epoch": 0.75, - "learning_rate": 1.7547273299876354e-06, - "loss": 0.7495, - "step": 29372 - }, - { - "epoch": 0.75, - "learning_rate": 1.7547091768126046e-06, - "loss": 0.791, - "step": 29373 - }, - { - "epoch": 0.75, - "learning_rate": 1.7546910230597275e-06, - "loss": 0.8853, - "step": 29374 - }, - { - "epoch": 0.75, - "learning_rate": 1.7546728687290185e-06, - "loss": 1.1035, - "step": 29375 - }, - { - "epoch": 0.75, - "learning_rate": 1.7546547138204914e-06, - "loss": 0.9053, - "step": 29376 - }, - { - "epoch": 0.75, - "learning_rate": 1.7546365583341595e-06, - "loss": 0.5188, - "step": 29377 - }, - { - "epoch": 0.75, - "learning_rate": 1.7546184022700372e-06, - "loss": 0.6292, - "step": 29378 - }, - { - "epoch": 0.75, - "learning_rate": 1.7546002456281383e-06, - "loss": 0.6953, - "step": 29379 - }, - { - "epoch": 0.75, - "learning_rate": 1.7545820884084767e-06, - "loss": 1.0127, - "step": 29380 - }, - { - "epoch": 0.75, - "learning_rate": 1.7545639306110664e-06, - "loss": 0.7896, - "step": 29381 - }, - { - "epoch": 0.75, - "learning_rate": 1.7545457722359212e-06, - "loss": 1.001, - "step": 29382 - }, - { - "epoch": 0.75, - "learning_rate": 1.754527613283055e-06, - "loss": 0.8984, - "step": 29383 - }, - { - "epoch": 0.75, - "learning_rate": 1.7545094537524814e-06, - "loss": 0.7871, - "step": 29384 - }, - { - "epoch": 0.75, - "learning_rate": 1.7544912936442149e-06, - "loss": 1.0811, - "step": 29385 - }, - { - "epoch": 0.75, - "learning_rate": 1.7544731329582687e-06, - "loss": 1.0518, - "step": 29386 - }, - { - "epoch": 0.75, - "learning_rate": 1.7544549716946576e-06, - "loss": 0.8188, - "step": 29387 - }, - { - "epoch": 0.75, - "learning_rate": 1.7544368098533947e-06, - "loss": 1.0039, - "step": 29388 - }, - { - "epoch": 0.75, - "learning_rate": 1.7544186474344943e-06, - "loss": 0.9717, - "step": 29389 - }, - { - "epoch": 0.75, - "learning_rate": 1.7544004844379706e-06, - "loss": 0.7891, - "step": 29390 - }, - { - "epoch": 0.75, - "learning_rate": 1.7543823208638367e-06, - "loss": 0.7471, - "step": 29391 - }, - { - "epoch": 0.75, - "learning_rate": 1.754364156712107e-06, - "loss": 0.7793, - "step": 29392 - }, - { - "epoch": 0.75, - "learning_rate": 1.7543459919827953e-06, - "loss": 0.7075, - "step": 29393 - }, - { - "epoch": 0.75, - "learning_rate": 1.7543278266759158e-06, - "loss": 0.7285, - "step": 29394 - }, - { - "epoch": 0.75, - "learning_rate": 1.754309660791482e-06, - "loss": 0.7979, - "step": 29395 - }, - { - "epoch": 0.75, - "learning_rate": 1.7542914943295082e-06, - "loss": 0.9033, - "step": 29396 - }, - { - "epoch": 0.75, - "learning_rate": 1.7542733272900078e-06, - "loss": 0.958, - "step": 29397 - }, - { - "epoch": 0.75, - "learning_rate": 1.7542551596729952e-06, - "loss": 0.6611, - "step": 29398 - }, - { - "epoch": 0.75, - "learning_rate": 1.754236991478484e-06, - "loss": 1.042, - "step": 29399 - }, - { - "epoch": 0.75, - "learning_rate": 1.7542188227064881e-06, - "loss": 0.8096, - "step": 29400 - }, - { - "epoch": 0.75, - "learning_rate": 1.7542006533570216e-06, - "loss": 0.6611, - "step": 29401 - }, - { - "epoch": 0.75, - "learning_rate": 1.7541824834300987e-06, - "loss": 0.79, - "step": 29402 - }, - { - "epoch": 0.75, - "learning_rate": 1.7541643129257327e-06, - "loss": 0.8662, - "step": 29403 - }, - { - "epoch": 0.75, - "learning_rate": 1.7541461418439373e-06, - "loss": 0.8027, - "step": 29404 - }, - { - "epoch": 0.75, - "learning_rate": 1.7541279701847276e-06, - "loss": 0.876, - "step": 29405 - }, - { - "epoch": 0.75, - "learning_rate": 1.7541097979481165e-06, - "loss": 0.8462, - "step": 29406 - }, - { - "epoch": 0.75, - "learning_rate": 1.754091625134118e-06, - "loss": 0.7949, - "step": 29407 - }, - { - "epoch": 0.75, - "learning_rate": 1.7540734517427465e-06, - "loss": 0.9512, - "step": 29408 - }, - { - "epoch": 0.75, - "learning_rate": 1.7540552777740155e-06, - "loss": 1.0781, - "step": 29409 - }, - { - "epoch": 0.75, - "learning_rate": 1.7540371032279388e-06, - "loss": 0.6641, - "step": 29410 - }, - { - "epoch": 0.75, - "learning_rate": 1.7540189281045312e-06, - "loss": 0.8691, - "step": 29411 - }, - { - "epoch": 0.75, - "learning_rate": 1.7540007524038054e-06, - "loss": 0.9502, - "step": 29412 - }, - { - "epoch": 0.75, - "learning_rate": 1.753982576125776e-06, - "loss": 0.606, - "step": 29413 - }, - { - "epoch": 0.75, - "learning_rate": 1.7539643992704572e-06, - "loss": 0.75, - "step": 29414 - }, - { - "epoch": 0.75, - "learning_rate": 1.7539462218378622e-06, - "loss": 1.0166, - "step": 29415 - }, - { - "epoch": 0.75, - "learning_rate": 1.7539280438280052e-06, - "loss": 0.9229, - "step": 29416 - }, - { - "epoch": 0.75, - "learning_rate": 1.7539098652409004e-06, - "loss": 0.7842, - "step": 29417 - }, - { - "epoch": 0.75, - "learning_rate": 1.7538916860765612e-06, - "loss": 0.792, - "step": 29418 - }, - { - "epoch": 0.75, - "learning_rate": 1.7538735063350018e-06, - "loss": 0.8506, - "step": 29419 - }, - { - "epoch": 0.75, - "learning_rate": 1.7538553260162363e-06, - "loss": 0.9268, - "step": 29420 - }, - { - "epoch": 0.75, - "learning_rate": 1.7538371451202787e-06, - "loss": 0.8828, - "step": 29421 - }, - { - "epoch": 0.75, - "learning_rate": 1.7538189636471424e-06, - "loss": 0.9434, - "step": 29422 - }, - { - "epoch": 0.75, - "learning_rate": 1.7538007815968415e-06, - "loss": 0.9033, - "step": 29423 - }, - { - "epoch": 0.75, - "learning_rate": 1.7537825989693896e-06, - "loss": 0.7178, - "step": 29424 - }, - { - "epoch": 0.75, - "learning_rate": 1.7537644157648017e-06, - "loss": 0.9062, - "step": 29425 - }, - { - "epoch": 0.75, - "learning_rate": 1.753746231983091e-06, - "loss": 0.877, - "step": 29426 - }, - { - "epoch": 0.75, - "learning_rate": 1.7537280476242711e-06, - "loss": 1.0537, - "step": 29427 - }, - { - "epoch": 0.75, - "learning_rate": 1.7537098626883564e-06, - "loss": 0.6348, - "step": 29428 - }, - { - "epoch": 0.75, - "learning_rate": 1.7536916771753608e-06, - "loss": 0.7307, - "step": 29429 - }, - { - "epoch": 0.75, - "learning_rate": 1.7536734910852982e-06, - "loss": 1.0488, - "step": 29430 - }, - { - "epoch": 0.75, - "learning_rate": 1.7536553044181824e-06, - "loss": 0.8643, - "step": 29431 - }, - { - "epoch": 0.75, - "learning_rate": 1.7536371171740273e-06, - "loss": 0.9619, - "step": 29432 - }, - { - "epoch": 0.75, - "learning_rate": 1.753618929352847e-06, - "loss": 0.8525, - "step": 29433 - }, - { - "epoch": 0.75, - "learning_rate": 1.7536007409546554e-06, - "loss": 1.0293, - "step": 29434 - }, - { - "epoch": 0.75, - "learning_rate": 1.7535825519794663e-06, - "loss": 0.7007, - "step": 29435 - }, - { - "epoch": 0.75, - "learning_rate": 1.7535643624272935e-06, - "loss": 0.7144, - "step": 29436 - }, - { - "epoch": 0.75, - "learning_rate": 1.7535461722981514e-06, - "loss": 0.7832, - "step": 29437 - }, - { - "epoch": 0.75, - "learning_rate": 1.7535279815920534e-06, - "loss": 0.6006, - "step": 29438 - }, - { - "epoch": 0.75, - "learning_rate": 1.7535097903090139e-06, - "loss": 0.8789, - "step": 29439 - }, - { - "epoch": 0.75, - "learning_rate": 1.7534915984490465e-06, - "loss": 1.0684, - "step": 29440 - }, - { - "epoch": 0.75, - "learning_rate": 1.7534734060121652e-06, - "loss": 1.0664, - "step": 29441 - }, - { - "epoch": 0.75, - "learning_rate": 1.753455212998384e-06, - "loss": 0.9766, - "step": 29442 - }, - { - "epoch": 0.75, - "learning_rate": 1.753437019407717e-06, - "loss": 0.8174, - "step": 29443 - }, - { - "epoch": 0.75, - "learning_rate": 1.7534188252401777e-06, - "loss": 0.8789, - "step": 29444 - }, - { - "epoch": 0.75, - "learning_rate": 1.75340063049578e-06, - "loss": 0.8896, - "step": 29445 - }, - { - "epoch": 0.75, - "learning_rate": 1.7533824351745385e-06, - "loss": 0.8389, - "step": 29446 - }, - { - "epoch": 0.75, - "learning_rate": 1.7533642392764665e-06, - "loss": 1.0459, - "step": 29447 - }, - { - "epoch": 0.75, - "learning_rate": 1.7533460428015784e-06, - "loss": 0.667, - "step": 29448 - }, - { - "epoch": 0.75, - "learning_rate": 1.7533278457498875e-06, - "loss": 0.9297, - "step": 29449 - }, - { - "epoch": 0.75, - "learning_rate": 1.7533096481214083e-06, - "loss": 0.8447, - "step": 29450 - }, - { - "epoch": 0.75, - "learning_rate": 1.7532914499161544e-06, - "loss": 0.8418, - "step": 29451 - }, - { - "epoch": 0.75, - "learning_rate": 1.7532732511341402e-06, - "loss": 0.6748, - "step": 29452 - }, - { - "epoch": 0.75, - "learning_rate": 1.7532550517753787e-06, - "loss": 0.8347, - "step": 29453 - }, - { - "epoch": 0.75, - "learning_rate": 1.753236851839885e-06, - "loss": 0.8389, - "step": 29454 - }, - { - "epoch": 0.75, - "learning_rate": 1.7532186513276724e-06, - "loss": 0.8604, - "step": 29455 - }, - { - "epoch": 0.75, - "learning_rate": 1.7532004502387548e-06, - "loss": 1.0938, - "step": 29456 - }, - { - "epoch": 0.75, - "learning_rate": 1.7531822485731463e-06, - "loss": 0.9287, - "step": 29457 - }, - { - "epoch": 0.76, - "learning_rate": 1.7531640463308608e-06, - "loss": 0.6924, - "step": 29458 - }, - { - "epoch": 0.76, - "learning_rate": 1.7531458435119122e-06, - "loss": 0.7363, - "step": 29459 - }, - { - "epoch": 0.76, - "learning_rate": 1.7531276401163142e-06, - "loss": 0.8262, - "step": 29460 - }, - { - "epoch": 0.76, - "learning_rate": 1.7531094361440815e-06, - "loss": 0.8555, - "step": 29461 - }, - { - "epoch": 0.76, - "learning_rate": 1.753091231595227e-06, - "loss": 0.7959, - "step": 29462 - }, - { - "epoch": 0.76, - "learning_rate": 1.7530730264697655e-06, - "loss": 0.9111, - "step": 29463 - }, - { - "epoch": 0.76, - "learning_rate": 1.7530548207677106e-06, - "loss": 0.9795, - "step": 29464 - }, - { - "epoch": 0.76, - "learning_rate": 1.7530366144890762e-06, - "loss": 0.644, - "step": 29465 - }, - { - "epoch": 0.76, - "learning_rate": 1.7530184076338764e-06, - "loss": 0.6816, - "step": 29466 - }, - { - "epoch": 0.76, - "learning_rate": 1.7530002002021246e-06, - "loss": 1.2051, - "step": 29467 - }, - { - "epoch": 0.76, - "learning_rate": 1.7529819921938358e-06, - "loss": 0.7744, - "step": 29468 - }, - { - "epoch": 0.76, - "learning_rate": 1.752963783609023e-06, - "loss": 0.9229, - "step": 29469 - }, - { - "epoch": 0.76, - "learning_rate": 1.7529455744477005e-06, - "loss": 0.8184, - "step": 29470 - }, - { - "epoch": 0.76, - "learning_rate": 1.7529273647098821e-06, - "loss": 0.6426, - "step": 29471 - }, - { - "epoch": 0.76, - "learning_rate": 1.752909154395582e-06, - "loss": 0.8984, - "step": 29472 - }, - { - "epoch": 0.76, - "learning_rate": 1.7528909435048137e-06, - "loss": 0.5981, - "step": 29473 - }, - { - "epoch": 0.76, - "learning_rate": 1.7528727320375917e-06, - "loss": 0.8496, - "step": 29474 - }, - { - "epoch": 0.76, - "learning_rate": 1.7528545199939293e-06, - "loss": 0.7744, - "step": 29475 - }, - { - "epoch": 0.76, - "learning_rate": 1.7528363073738412e-06, - "loss": 0.7383, - "step": 29476 - }, - { - "epoch": 0.76, - "learning_rate": 1.752818094177341e-06, - "loss": 1.0117, - "step": 29477 - }, - { - "epoch": 0.76, - "learning_rate": 1.752799880404442e-06, - "loss": 0.9727, - "step": 29478 - }, - { - "epoch": 0.76, - "learning_rate": 1.7527816660551596e-06, - "loss": 0.8359, - "step": 29479 - }, - { - "epoch": 0.76, - "learning_rate": 1.7527634511295063e-06, - "loss": 0.8633, - "step": 29480 - }, - { - "epoch": 0.76, - "learning_rate": 1.7527452356274967e-06, - "loss": 1.0498, - "step": 29481 - }, - { - "epoch": 0.76, - "learning_rate": 1.752727019549145e-06, - "loss": 0.7632, - "step": 29482 - }, - { - "epoch": 0.76, - "learning_rate": 1.7527088028944646e-06, - "loss": 0.9736, - "step": 29483 - }, - { - "epoch": 0.76, - "learning_rate": 1.7526905856634695e-06, - "loss": 0.9062, - "step": 29484 - }, - { - "epoch": 0.76, - "learning_rate": 1.7526723678561741e-06, - "loss": 0.9092, - "step": 29485 - }, - { - "epoch": 0.76, - "learning_rate": 1.752654149472592e-06, - "loss": 0.9521, - "step": 29486 - }, - { - "epoch": 0.76, - "learning_rate": 1.7526359305127373e-06, - "loss": 0.7148, - "step": 29487 - }, - { - "epoch": 0.76, - "learning_rate": 1.7526177109766237e-06, - "loss": 0.7881, - "step": 29488 - }, - { - "epoch": 0.76, - "learning_rate": 1.7525994908642656e-06, - "loss": 0.6658, - "step": 29489 - }, - { - "epoch": 0.76, - "learning_rate": 1.7525812701756763e-06, - "loss": 0.6611, - "step": 29490 - }, - { - "epoch": 0.76, - "learning_rate": 1.7525630489108704e-06, - "loss": 0.7969, - "step": 29491 - }, - { - "epoch": 0.76, - "learning_rate": 1.7525448270698618e-06, - "loss": 0.8018, - "step": 29492 - }, - { - "epoch": 0.76, - "learning_rate": 1.752526604652664e-06, - "loss": 0.9424, - "step": 29493 - }, - { - "epoch": 0.76, - "learning_rate": 1.752508381659291e-06, - "loss": 0.7817, - "step": 29494 - }, - { - "epoch": 0.76, - "learning_rate": 1.752490158089757e-06, - "loss": 0.7847, - "step": 29495 - }, - { - "epoch": 0.76, - "learning_rate": 1.752471933944076e-06, - "loss": 0.9717, - "step": 29496 - }, - { - "epoch": 0.76, - "learning_rate": 1.7524537092222617e-06, - "loss": 0.749, - "step": 29497 - }, - { - "epoch": 0.76, - "learning_rate": 1.7524354839243283e-06, - "loss": 0.8311, - "step": 29498 - }, - { - "epoch": 0.76, - "learning_rate": 1.7524172580502895e-06, - "loss": 0.5977, - "step": 29499 - }, - { - "epoch": 0.76, - "learning_rate": 1.7523990316001594e-06, - "loss": 0.8506, - "step": 29500 - }, - { - "epoch": 0.76, - "learning_rate": 1.7523808045739523e-06, - "loss": 0.4318, - "step": 29501 - }, - { - "epoch": 0.76, - "learning_rate": 1.7523625769716814e-06, - "loss": 0.9082, - "step": 29502 - }, - { - "epoch": 0.76, - "learning_rate": 1.7523443487933614e-06, - "loss": 1.0898, - "step": 29503 - }, - { - "epoch": 0.76, - "learning_rate": 1.752326120039006e-06, - "loss": 0.7676, - "step": 29504 - }, - { - "epoch": 0.76, - "learning_rate": 1.7523078907086286e-06, - "loss": 0.6621, - "step": 29505 - }, - { - "epoch": 0.76, - "learning_rate": 1.7522896608022439e-06, - "loss": 0.6895, - "step": 29506 - }, - { - "epoch": 0.76, - "learning_rate": 1.7522714303198655e-06, - "loss": 0.9055, - "step": 29507 - }, - { - "epoch": 0.76, - "learning_rate": 1.7522531992615078e-06, - "loss": 0.9941, - "step": 29508 - }, - { - "epoch": 0.76, - "learning_rate": 1.752234967627184e-06, - "loss": 0.8857, - "step": 29509 - }, - { - "epoch": 0.76, - "learning_rate": 1.752216735416909e-06, - "loss": 0.8691, - "step": 29510 - }, - { - "epoch": 0.76, - "learning_rate": 1.7521985026306956e-06, - "loss": 0.8711, - "step": 29511 - }, - { - "epoch": 0.76, - "learning_rate": 1.7521802692685586e-06, - "loss": 0.9111, - "step": 29512 - }, - { - "epoch": 0.76, - "learning_rate": 1.752162035330512e-06, - "loss": 0.6248, - "step": 29513 - }, - { - "epoch": 0.76, - "learning_rate": 1.7521438008165692e-06, - "loss": 0.9434, - "step": 29514 - }, - { - "epoch": 0.76, - "learning_rate": 1.752125565726745e-06, - "loss": 1.0957, - "step": 29515 - }, - { - "epoch": 0.76, - "learning_rate": 1.7521073300610523e-06, - "loss": 0.6787, - "step": 29516 - }, - { - "epoch": 0.76, - "learning_rate": 1.7520890938195057e-06, - "loss": 0.9248, - "step": 29517 - }, - { - "epoch": 0.76, - "learning_rate": 1.7520708570021193e-06, - "loss": 0.915, - "step": 29518 - }, - { - "epoch": 0.76, - "learning_rate": 1.7520526196089065e-06, - "loss": 0.9199, - "step": 29519 - }, - { - "epoch": 0.76, - "learning_rate": 1.7520343816398817e-06, - "loss": 0.8164, - "step": 29520 - }, - { - "epoch": 0.76, - "learning_rate": 1.7520161430950586e-06, - "loss": 0.8467, - "step": 29521 - }, - { - "epoch": 0.76, - "learning_rate": 1.7519979039744517e-06, - "loss": 0.8379, - "step": 29522 - }, - { - "epoch": 0.76, - "learning_rate": 1.7519796642780744e-06, - "loss": 0.8828, - "step": 29523 - }, - { - "epoch": 0.76, - "learning_rate": 1.7519614240059408e-06, - "loss": 1.0059, - "step": 29524 - }, - { - "epoch": 0.76, - "learning_rate": 1.751943183158065e-06, - "loss": 0.7744, - "step": 29525 - }, - { - "epoch": 0.76, - "learning_rate": 1.7519249417344608e-06, - "loss": 0.939, - "step": 29526 - }, - { - "epoch": 0.76, - "learning_rate": 1.7519066997351422e-06, - "loss": 0.8701, - "step": 29527 - }, - { - "epoch": 0.76, - "learning_rate": 1.7518884571601236e-06, - "loss": 1.0098, - "step": 29528 - }, - { - "epoch": 0.76, - "learning_rate": 1.751870214009418e-06, - "loss": 1.0693, - "step": 29529 - }, - { - "epoch": 0.76, - "learning_rate": 1.7518519702830402e-06, - "loss": 0.8208, - "step": 29530 - }, - { - "epoch": 0.76, - "learning_rate": 1.751833725981004e-06, - "loss": 1.0537, - "step": 29531 - }, - { - "epoch": 0.76, - "learning_rate": 1.7518154811033235e-06, - "loss": 0.8398, - "step": 29532 - }, - { - "epoch": 0.76, - "learning_rate": 1.7517972356500122e-06, - "loss": 0.7773, - "step": 29533 - }, - { - "epoch": 0.76, - "learning_rate": 1.751778989621084e-06, - "loss": 0.8359, - "step": 29534 - }, - { - "epoch": 0.76, - "learning_rate": 1.7517607430165535e-06, - "loss": 1.0156, - "step": 29535 - }, - { - "epoch": 0.76, - "learning_rate": 1.7517424958364346e-06, - "loss": 0.6748, - "step": 29536 - }, - { - "epoch": 0.76, - "learning_rate": 1.7517242480807406e-06, - "loss": 1.0234, - "step": 29537 - }, - { - "epoch": 0.76, - "learning_rate": 1.7517059997494862e-06, - "loss": 0.8281, - "step": 29538 - }, - { - "epoch": 0.76, - "learning_rate": 1.751687750842685e-06, - "loss": 0.8701, - "step": 29539 - }, - { - "epoch": 0.76, - "learning_rate": 1.751669501360351e-06, - "loss": 0.8965, - "step": 29540 - }, - { - "epoch": 0.76, - "learning_rate": 1.7516512513024983e-06, - "loss": 0.8008, - "step": 29541 - }, - { - "epoch": 0.76, - "learning_rate": 1.751633000669141e-06, - "loss": 0.8921, - "step": 29542 - }, - { - "epoch": 0.76, - "learning_rate": 1.7516147494602924e-06, - "loss": 0.7842, - "step": 29543 - }, - { - "epoch": 0.76, - "learning_rate": 1.7515964976759672e-06, - "loss": 0.7959, - "step": 29544 - }, - { - "epoch": 0.76, - "learning_rate": 1.7515782453161792e-06, - "loss": 0.7881, - "step": 29545 - }, - { - "epoch": 0.76, - "learning_rate": 1.751559992380942e-06, - "loss": 0.7671, - "step": 29546 - }, - { - "epoch": 0.76, - "learning_rate": 1.7515417388702703e-06, - "loss": 0.8047, - "step": 29547 - }, - { - "epoch": 0.76, - "learning_rate": 1.7515234847841773e-06, - "loss": 0.9033, - "step": 29548 - }, - { - "epoch": 0.76, - "learning_rate": 1.7515052301226777e-06, - "loss": 0.9497, - "step": 29549 - }, - { - "epoch": 0.76, - "learning_rate": 1.7514869748857848e-06, - "loss": 0.8047, - "step": 29550 - }, - { - "epoch": 0.76, - "learning_rate": 1.751468719073513e-06, - "loss": 0.8535, - "step": 29551 - }, - { - "epoch": 0.76, - "learning_rate": 1.751450462685876e-06, - "loss": 0.7329, - "step": 29552 - }, - { - "epoch": 0.76, - "learning_rate": 1.7514322057228879e-06, - "loss": 0.6675, - "step": 29553 - }, - { - "epoch": 0.76, - "learning_rate": 1.7514139481845628e-06, - "loss": 0.9463, - "step": 29554 - }, - { - "epoch": 0.76, - "learning_rate": 1.7513956900709146e-06, - "loss": 0.7471, - "step": 29555 - }, - { - "epoch": 0.76, - "learning_rate": 1.7513774313819573e-06, - "loss": 0.9033, - "step": 29556 - }, - { - "epoch": 0.76, - "learning_rate": 1.751359172117705e-06, - "loss": 0.8193, - "step": 29557 - }, - { - "epoch": 0.76, - "learning_rate": 1.7513409122781716e-06, - "loss": 0.6587, - "step": 29558 - }, - { - "epoch": 0.76, - "learning_rate": 1.7513226518633705e-06, - "loss": 0.8027, - "step": 29559 - }, - { - "epoch": 0.76, - "learning_rate": 1.7513043908733165e-06, - "loss": 0.916, - "step": 29560 - }, - { - "epoch": 0.76, - "learning_rate": 1.7512861293080232e-06, - "loss": 0.6597, - "step": 29561 - }, - { - "epoch": 0.76, - "learning_rate": 1.7512678671675047e-06, - "loss": 0.666, - "step": 29562 - }, - { - "epoch": 0.76, - "learning_rate": 1.751249604451775e-06, - "loss": 0.7783, - "step": 29563 - }, - { - "epoch": 0.76, - "learning_rate": 1.751231341160848e-06, - "loss": 0.9736, - "step": 29564 - }, - { - "epoch": 0.76, - "learning_rate": 1.7512130772947376e-06, - "loss": 0.8369, - "step": 29565 - }, - { - "epoch": 0.76, - "learning_rate": 1.7511948128534582e-06, - "loss": 0.6826, - "step": 29566 - }, - { - "epoch": 0.76, - "learning_rate": 1.751176547837023e-06, - "loss": 0.9629, - "step": 29567 - }, - { - "epoch": 0.76, - "learning_rate": 1.7511582822454468e-06, - "loss": 0.9502, - "step": 29568 - }, - { - "epoch": 0.76, - "learning_rate": 1.751140016078743e-06, - "loss": 0.6616, - "step": 29569 - }, - { - "epoch": 0.76, - "learning_rate": 1.751121749336926e-06, - "loss": 0.8291, - "step": 29570 - }, - { - "epoch": 0.76, - "learning_rate": 1.7511034820200097e-06, - "loss": 0.5261, - "step": 29571 - }, - { - "epoch": 0.76, - "learning_rate": 1.7510852141280078e-06, - "loss": 0.8838, - "step": 29572 - }, - { - "epoch": 0.76, - "learning_rate": 1.7510669456609346e-06, - "loss": 0.7559, - "step": 29573 - }, - { - "epoch": 0.76, - "learning_rate": 1.751048676618804e-06, - "loss": 0.5625, - "step": 29574 - }, - { - "epoch": 0.76, - "learning_rate": 1.7510304070016298e-06, - "loss": 0.8389, - "step": 29575 - }, - { - "epoch": 0.76, - "learning_rate": 1.7510121368094262e-06, - "loss": 0.998, - "step": 29576 - }, - { - "epoch": 0.76, - "learning_rate": 1.7509938660422073e-06, - "loss": 0.6504, - "step": 29577 - }, - { - "epoch": 0.76, - "learning_rate": 1.750975594699987e-06, - "loss": 0.7788, - "step": 29578 - }, - { - "epoch": 0.76, - "learning_rate": 1.7509573227827788e-06, - "loss": 0.6208, - "step": 29579 - }, - { - "epoch": 0.76, - "learning_rate": 1.7509390502905971e-06, - "loss": 0.8252, - "step": 29580 - }, - { - "epoch": 0.76, - "learning_rate": 1.7509207772234565e-06, - "loss": 0.7727, - "step": 29581 - }, - { - "epoch": 0.76, - "learning_rate": 1.7509025035813699e-06, - "loss": 0.9609, - "step": 29582 - }, - { - "epoch": 0.76, - "learning_rate": 1.750884229364352e-06, - "loss": 0.6948, - "step": 29583 - }, - { - "epoch": 0.76, - "learning_rate": 1.7508659545724164e-06, - "loss": 0.7246, - "step": 29584 - }, - { - "epoch": 0.76, - "learning_rate": 1.7508476792055773e-06, - "loss": 0.9795, - "step": 29585 - }, - { - "epoch": 0.76, - "learning_rate": 1.750829403263849e-06, - "loss": 0.7744, - "step": 29586 - }, - { - "epoch": 0.76, - "learning_rate": 1.7508111267472448e-06, - "loss": 0.7866, - "step": 29587 - }, - { - "epoch": 0.76, - "learning_rate": 1.7507928496557789e-06, - "loss": 0.7422, - "step": 29588 - }, - { - "epoch": 0.76, - "learning_rate": 1.7507745719894658e-06, - "loss": 0.999, - "step": 29589 - }, - { - "epoch": 0.76, - "learning_rate": 1.7507562937483189e-06, - "loss": 0.9097, - "step": 29590 - }, - { - "epoch": 0.76, - "learning_rate": 1.7507380149323523e-06, - "loss": 0.9229, - "step": 29591 - }, - { - "epoch": 0.76, - "learning_rate": 1.7507197355415803e-06, - "loss": 0.6128, - "step": 29592 - }, - { - "epoch": 0.76, - "learning_rate": 1.7507014555760168e-06, - "loss": 0.7725, - "step": 29593 - }, - { - "epoch": 0.76, - "learning_rate": 1.7506831750356756e-06, - "loss": 0.6284, - "step": 29594 - }, - { - "epoch": 0.76, - "learning_rate": 1.750664893920571e-06, - "loss": 0.6504, - "step": 29595 - }, - { - "epoch": 0.76, - "learning_rate": 1.7506466122307166e-06, - "loss": 0.8711, - "step": 29596 - }, - { - "epoch": 0.76, - "learning_rate": 1.7506283299661266e-06, - "loss": 0.6694, - "step": 29597 - }, - { - "epoch": 0.76, - "learning_rate": 1.7506100471268152e-06, - "loss": 0.9863, - "step": 29598 - }, - { - "epoch": 0.76, - "learning_rate": 1.7505917637127961e-06, - "loss": 0.7939, - "step": 29599 - }, - { - "epoch": 0.76, - "learning_rate": 1.7505734797240832e-06, - "loss": 0.9229, - "step": 29600 - }, - { - "epoch": 0.76, - "learning_rate": 1.7505551951606908e-06, - "loss": 0.8672, - "step": 29601 - }, - { - "epoch": 0.76, - "learning_rate": 1.750536910022633e-06, - "loss": 0.9443, - "step": 29602 - }, - { - "epoch": 0.76, - "learning_rate": 1.7505186243099237e-06, - "loss": 0.834, - "step": 29603 - }, - { - "epoch": 0.76, - "learning_rate": 1.7505003380225764e-06, - "loss": 0.9062, - "step": 29604 - }, - { - "epoch": 0.76, - "learning_rate": 1.7504820511606057e-06, - "loss": 0.8374, - "step": 29605 - }, - { - "epoch": 0.76, - "learning_rate": 1.7504637637240253e-06, - "loss": 0.7803, - "step": 29606 - }, - { - "epoch": 0.76, - "learning_rate": 1.7504454757128495e-06, - "loss": 0.6929, - "step": 29607 - }, - { - "epoch": 0.76, - "learning_rate": 1.7504271871270918e-06, - "loss": 0.9609, - "step": 29608 - }, - { - "epoch": 0.76, - "learning_rate": 1.7504088979667668e-06, - "loss": 1.0303, - "step": 29609 - }, - { - "epoch": 0.76, - "learning_rate": 1.7503906082318882e-06, - "loss": 0.7412, - "step": 29610 - }, - { - "epoch": 0.76, - "learning_rate": 1.7503723179224696e-06, - "loss": 1.0029, - "step": 29611 - }, - { - "epoch": 0.76, - "learning_rate": 1.7503540270385258e-06, - "loss": 0.8223, - "step": 29612 - }, - { - "epoch": 0.76, - "learning_rate": 1.7503357355800705e-06, - "loss": 0.8232, - "step": 29613 - }, - { - "epoch": 0.76, - "learning_rate": 1.7503174435471175e-06, - "loss": 0.7749, - "step": 29614 - }, - { - "epoch": 0.76, - "learning_rate": 1.7502991509396809e-06, - "loss": 0.8145, - "step": 29615 - }, - { - "epoch": 0.76, - "learning_rate": 1.7502808577577749e-06, - "loss": 0.9424, - "step": 29616 - }, - { - "epoch": 0.76, - "learning_rate": 1.750262564001413e-06, - "loss": 0.9297, - "step": 29617 - }, - { - "epoch": 0.76, - "learning_rate": 1.7502442696706097e-06, - "loss": 0.4971, - "step": 29618 - }, - { - "epoch": 0.76, - "learning_rate": 1.750225974765379e-06, - "loss": 0.5254, - "step": 29619 - }, - { - "epoch": 0.76, - "learning_rate": 1.7502076792857347e-06, - "loss": 1.0547, - "step": 29620 - }, - { - "epoch": 0.76, - "learning_rate": 1.750189383231691e-06, - "loss": 0.8193, - "step": 29621 - }, - { - "epoch": 0.76, - "learning_rate": 1.7501710866032614e-06, - "loss": 0.8457, - "step": 29622 - }, - { - "epoch": 0.76, - "learning_rate": 1.7501527894004608e-06, - "loss": 0.9854, - "step": 29623 - }, - { - "epoch": 0.76, - "learning_rate": 1.7501344916233024e-06, - "loss": 0.7227, - "step": 29624 - }, - { - "epoch": 0.76, - "learning_rate": 1.7501161932718005e-06, - "loss": 0.9121, - "step": 29625 - }, - { - "epoch": 0.76, - "learning_rate": 1.750097894345969e-06, - "loss": 0.9102, - "step": 29626 - }, - { - "epoch": 0.76, - "learning_rate": 1.7500795948458222e-06, - "loss": 0.9551, - "step": 29627 - }, - { - "epoch": 0.76, - "learning_rate": 1.750061294771374e-06, - "loss": 0.5867, - "step": 29628 - }, - { - "epoch": 0.76, - "learning_rate": 1.7500429941226384e-06, - "loss": 0.8857, - "step": 29629 - }, - { - "epoch": 0.76, - "learning_rate": 1.7500246928996294e-06, - "loss": 0.7852, - "step": 29630 - }, - { - "epoch": 0.76, - "learning_rate": 1.7500063911023605e-06, - "loss": 0.7856, - "step": 29631 - }, - { - "epoch": 0.76, - "learning_rate": 1.7499880887308467e-06, - "loss": 0.7595, - "step": 29632 - }, - { - "epoch": 0.76, - "learning_rate": 1.7499697857851015e-06, - "loss": 0.6714, - "step": 29633 - }, - { - "epoch": 0.76, - "learning_rate": 1.7499514822651386e-06, - "loss": 0.7622, - "step": 29634 - }, - { - "epoch": 0.76, - "learning_rate": 1.7499331781709726e-06, - "loss": 0.8994, - "step": 29635 - }, - { - "epoch": 0.76, - "learning_rate": 1.7499148735026173e-06, - "loss": 0.6841, - "step": 29636 - }, - { - "epoch": 0.76, - "learning_rate": 1.7498965682600861e-06, - "loss": 0.9238, - "step": 29637 - }, - { - "epoch": 0.76, - "learning_rate": 1.7498782624433943e-06, - "loss": 1.001, - "step": 29638 - }, - { - "epoch": 0.76, - "learning_rate": 1.7498599560525546e-06, - "loss": 0.875, - "step": 29639 - }, - { - "epoch": 0.76, - "learning_rate": 1.7498416490875823e-06, - "loss": 0.9346, - "step": 29640 - }, - { - "epoch": 0.76, - "learning_rate": 1.74982334154849e-06, - "loss": 1.0322, - "step": 29641 - }, - { - "epoch": 0.76, - "learning_rate": 1.7498050334352929e-06, - "loss": 0.6284, - "step": 29642 - }, - { - "epoch": 0.76, - "learning_rate": 1.7497867247480045e-06, - "loss": 0.8047, - "step": 29643 - }, - { - "epoch": 0.76, - "learning_rate": 1.7497684154866387e-06, - "loss": 0.8105, - "step": 29644 - }, - { - "epoch": 0.76, - "learning_rate": 1.74975010565121e-06, - "loss": 0.7979, - "step": 29645 - }, - { - "epoch": 0.76, - "learning_rate": 1.749731795241732e-06, - "loss": 0.8857, - "step": 29646 - }, - { - "epoch": 0.76, - "learning_rate": 1.7497134842582186e-06, - "loss": 0.7852, - "step": 29647 - }, - { - "epoch": 0.76, - "learning_rate": 1.7496951727006843e-06, - "loss": 0.999, - "step": 29648 - }, - { - "epoch": 0.76, - "learning_rate": 1.7496768605691427e-06, - "loss": 0.7305, - "step": 29649 - }, - { - "epoch": 0.76, - "learning_rate": 1.7496585478636084e-06, - "loss": 0.8994, - "step": 29650 - }, - { - "epoch": 0.76, - "learning_rate": 1.7496402345840946e-06, - "loss": 0.9805, - "step": 29651 - }, - { - "epoch": 0.76, - "learning_rate": 1.7496219207306157e-06, - "loss": 0.7627, - "step": 29652 - }, - { - "epoch": 0.76, - "learning_rate": 1.7496036063031858e-06, - "loss": 0.9033, - "step": 29653 - }, - { - "epoch": 0.76, - "learning_rate": 1.7495852913018193e-06, - "loss": 0.9834, - "step": 29654 - }, - { - "epoch": 0.76, - "learning_rate": 1.7495669757265295e-06, - "loss": 0.8135, - "step": 29655 - }, - { - "epoch": 0.76, - "learning_rate": 1.7495486595773308e-06, - "loss": 1.0586, - "step": 29656 - }, - { - "epoch": 0.76, - "learning_rate": 1.7495303428542368e-06, - "loss": 0.8311, - "step": 29657 - }, - { - "epoch": 0.76, - "learning_rate": 1.7495120255572624e-06, - "loss": 0.9062, - "step": 29658 - }, - { - "epoch": 0.76, - "learning_rate": 1.749493707686421e-06, - "loss": 1.0068, - "step": 29659 - }, - { - "epoch": 0.76, - "learning_rate": 1.7494753892417266e-06, - "loss": 1.2227, - "step": 29660 - }, - { - "epoch": 0.76, - "learning_rate": 1.7494570702231935e-06, - "loss": 0.562, - "step": 29661 - }, - { - "epoch": 0.76, - "learning_rate": 1.7494387506308353e-06, - "loss": 0.8643, - "step": 29662 - }, - { - "epoch": 0.76, - "learning_rate": 1.7494204304646665e-06, - "loss": 0.874, - "step": 29663 - }, - { - "epoch": 0.76, - "learning_rate": 1.749402109724701e-06, - "loss": 0.6768, - "step": 29664 - }, - { - "epoch": 0.76, - "learning_rate": 1.7493837884109526e-06, - "loss": 0.7266, - "step": 29665 - }, - { - "epoch": 0.76, - "learning_rate": 1.7493654665234355e-06, - "loss": 0.9175, - "step": 29666 - }, - { - "epoch": 0.76, - "learning_rate": 1.7493471440621638e-06, - "loss": 0.7529, - "step": 29667 - }, - { - "epoch": 0.76, - "learning_rate": 1.7493288210271516e-06, - "loss": 0.8994, - "step": 29668 - }, - { - "epoch": 0.76, - "learning_rate": 1.7493104974184125e-06, - "loss": 0.6943, - "step": 29669 - }, - { - "epoch": 0.76, - "learning_rate": 1.7492921732359612e-06, - "loss": 0.9531, - "step": 29670 - }, - { - "epoch": 0.76, - "learning_rate": 1.7492738484798108e-06, - "loss": 0.8809, - "step": 29671 - }, - { - "epoch": 0.76, - "learning_rate": 1.7492555231499761e-06, - "loss": 0.9673, - "step": 29672 - }, - { - "epoch": 0.76, - "learning_rate": 1.749237197246471e-06, - "loss": 0.9658, - "step": 29673 - }, - { - "epoch": 0.76, - "learning_rate": 1.7492188707693094e-06, - "loss": 0.6162, - "step": 29674 - }, - { - "epoch": 0.76, - "learning_rate": 1.7492005437185053e-06, - "loss": 0.9541, - "step": 29675 - }, - { - "epoch": 0.76, - "learning_rate": 1.7491822160940725e-06, - "loss": 0.9092, - "step": 29676 - }, - { - "epoch": 0.76, - "learning_rate": 1.7491638878960259e-06, - "loss": 0.9053, - "step": 29677 - }, - { - "epoch": 0.76, - "learning_rate": 1.7491455591243786e-06, - "loss": 0.8271, - "step": 29678 - }, - { - "epoch": 0.76, - "learning_rate": 1.749127229779145e-06, - "loss": 0.9209, - "step": 29679 - }, - { - "epoch": 0.76, - "learning_rate": 1.749108899860339e-06, - "loss": 0.8232, - "step": 29680 - }, - { - "epoch": 0.76, - "learning_rate": 1.7490905693679751e-06, - "loss": 0.8467, - "step": 29681 - }, - { - "epoch": 0.76, - "learning_rate": 1.7490722383020668e-06, - "loss": 0.9287, - "step": 29682 - }, - { - "epoch": 0.76, - "learning_rate": 1.7490539066626286e-06, - "loss": 0.7192, - "step": 29683 - }, - { - "epoch": 0.76, - "learning_rate": 1.749035574449674e-06, - "loss": 0.9141, - "step": 29684 - }, - { - "epoch": 0.76, - "learning_rate": 1.7490172416632176e-06, - "loss": 0.9268, - "step": 29685 - }, - { - "epoch": 0.76, - "learning_rate": 1.7489989083032727e-06, - "loss": 0.9043, - "step": 29686 - }, - { - "epoch": 0.76, - "learning_rate": 1.748980574369854e-06, - "loss": 0.9434, - "step": 29687 - }, - { - "epoch": 0.76, - "learning_rate": 1.7489622398629754e-06, - "loss": 0.7881, - "step": 29688 - }, - { - "epoch": 0.76, - "learning_rate": 1.7489439047826507e-06, - "loss": 0.8447, - "step": 29689 - }, - { - "epoch": 0.76, - "learning_rate": 1.748925569128894e-06, - "loss": 0.8052, - "step": 29690 - }, - { - "epoch": 0.76, - "learning_rate": 1.7489072329017196e-06, - "loss": 0.7446, - "step": 29691 - }, - { - "epoch": 0.76, - "learning_rate": 1.7488888961011413e-06, - "loss": 1.0049, - "step": 29692 - }, - { - "epoch": 0.76, - "learning_rate": 1.7488705587271736e-06, - "loss": 1.0156, - "step": 29693 - }, - { - "epoch": 0.76, - "learning_rate": 1.7488522207798296e-06, - "loss": 1.0068, - "step": 29694 - }, - { - "epoch": 0.76, - "learning_rate": 1.748833882259124e-06, - "loss": 0.7559, - "step": 29695 - }, - { - "epoch": 0.76, - "learning_rate": 1.7488155431650707e-06, - "loss": 0.8188, - "step": 29696 - }, - { - "epoch": 0.76, - "learning_rate": 1.748797203497684e-06, - "loss": 0.7139, - "step": 29697 - }, - { - "epoch": 0.76, - "learning_rate": 1.7487788632569775e-06, - "loss": 0.9629, - "step": 29698 - }, - { - "epoch": 0.76, - "learning_rate": 1.7487605224429657e-06, - "loss": 0.8242, - "step": 29699 - }, - { - "epoch": 0.76, - "learning_rate": 1.748742181055662e-06, - "loss": 0.8691, - "step": 29700 - }, - { - "epoch": 0.76, - "learning_rate": 1.748723839095081e-06, - "loss": 0.6353, - "step": 29701 - }, - { - "epoch": 0.76, - "learning_rate": 1.7487054965612367e-06, - "loss": 0.7803, - "step": 29702 - }, - { - "epoch": 0.76, - "learning_rate": 1.748687153454143e-06, - "loss": 0.6091, - "step": 29703 - }, - { - "epoch": 0.76, - "learning_rate": 1.748668809773814e-06, - "loss": 0.8984, - "step": 29704 - }, - { - "epoch": 0.76, - "learning_rate": 1.7486504655202636e-06, - "loss": 0.9062, - "step": 29705 - }, - { - "epoch": 0.76, - "learning_rate": 1.748632120693506e-06, - "loss": 0.5796, - "step": 29706 - }, - { - "epoch": 0.76, - "learning_rate": 1.7486137752935553e-06, - "loss": 0.7773, - "step": 29707 - }, - { - "epoch": 0.76, - "learning_rate": 1.7485954293204255e-06, - "loss": 0.8037, - "step": 29708 - }, - { - "epoch": 0.76, - "learning_rate": 1.7485770827741305e-06, - "loss": 0.6772, - "step": 29709 - }, - { - "epoch": 0.76, - "learning_rate": 1.7485587356546843e-06, - "loss": 0.7783, - "step": 29710 - }, - { - "epoch": 0.76, - "learning_rate": 1.7485403879621012e-06, - "loss": 0.9072, - "step": 29711 - }, - { - "epoch": 0.76, - "learning_rate": 1.7485220396963954e-06, - "loss": 0.7417, - "step": 29712 - }, - { - "epoch": 0.76, - "learning_rate": 1.7485036908575803e-06, - "loss": 0.9053, - "step": 29713 - }, - { - "epoch": 0.76, - "learning_rate": 1.7484853414456706e-06, - "loss": 0.8936, - "step": 29714 - }, - { - "epoch": 0.76, - "learning_rate": 1.74846699146068e-06, - "loss": 0.9346, - "step": 29715 - }, - { - "epoch": 0.76, - "learning_rate": 1.7484486409026228e-06, - "loss": 1.126, - "step": 29716 - }, - { - "epoch": 0.76, - "learning_rate": 1.7484302897715125e-06, - "loss": 1.1035, - "step": 29717 - }, - { - "epoch": 0.76, - "learning_rate": 1.7484119380673639e-06, - "loss": 0.751, - "step": 29718 - }, - { - "epoch": 0.76, - "learning_rate": 1.7483935857901907e-06, - "loss": 0.8906, - "step": 29719 - }, - { - "epoch": 0.76, - "learning_rate": 1.7483752329400065e-06, - "loss": 0.823, - "step": 29720 - }, - { - "epoch": 0.76, - "learning_rate": 1.7483568795168263e-06, - "loss": 0.9033, - "step": 29721 - }, - { - "epoch": 0.76, - "learning_rate": 1.7483385255206633e-06, - "loss": 0.9219, - "step": 29722 - }, - { - "epoch": 0.76, - "learning_rate": 1.748320170951532e-06, - "loss": 0.834, - "step": 29723 - }, - { - "epoch": 0.76, - "learning_rate": 1.7483018158094465e-06, - "loss": 0.9561, - "step": 29724 - }, - { - "epoch": 0.76, - "learning_rate": 1.7482834600944204e-06, - "loss": 0.9629, - "step": 29725 - }, - { - "epoch": 0.76, - "learning_rate": 1.7482651038064685e-06, - "loss": 0.9551, - "step": 29726 - }, - { - "epoch": 0.76, - "learning_rate": 1.748246746945604e-06, - "loss": 0.8301, - "step": 29727 - }, - { - "epoch": 0.76, - "learning_rate": 1.748228389511842e-06, - "loss": 0.6792, - "step": 29728 - }, - { - "epoch": 0.76, - "learning_rate": 1.7482100315051953e-06, - "loss": 0.9243, - "step": 29729 - }, - { - "epoch": 0.76, - "learning_rate": 1.748191672925679e-06, - "loss": 0.8896, - "step": 29730 - }, - { - "epoch": 0.76, - "learning_rate": 1.7481733137733063e-06, - "loss": 0.8984, - "step": 29731 - }, - { - "epoch": 0.76, - "learning_rate": 1.748154954048092e-06, - "loss": 0.9414, - "step": 29732 - }, - { - "epoch": 0.76, - "learning_rate": 1.7481365937500497e-06, - "loss": 0.7822, - "step": 29733 - }, - { - "epoch": 0.76, - "learning_rate": 1.7481182328791934e-06, - "loss": 0.5864, - "step": 29734 - }, - { - "epoch": 0.76, - "learning_rate": 1.7480998714355379e-06, - "loss": 0.7852, - "step": 29735 - }, - { - "epoch": 0.76, - "learning_rate": 1.7480815094190966e-06, - "loss": 0.937, - "step": 29736 - }, - { - "epoch": 0.76, - "learning_rate": 1.7480631468298835e-06, - "loss": 0.9473, - "step": 29737 - }, - { - "epoch": 0.76, - "learning_rate": 1.7480447836679128e-06, - "loss": 1.041, - "step": 29738 - }, - { - "epoch": 0.76, - "learning_rate": 1.7480264199331987e-06, - "loss": 0.8164, - "step": 29739 - }, - { - "epoch": 0.76, - "learning_rate": 1.7480080556257553e-06, - "loss": 0.9004, - "step": 29740 - }, - { - "epoch": 0.76, - "learning_rate": 1.7479896907455962e-06, - "loss": 0.7808, - "step": 29741 - }, - { - "epoch": 0.76, - "learning_rate": 1.747971325292736e-06, - "loss": 0.8369, - "step": 29742 - }, - { - "epoch": 0.76, - "learning_rate": 1.7479529592671885e-06, - "loss": 0.9014, - "step": 29743 - }, - { - "epoch": 0.76, - "learning_rate": 1.747934592668968e-06, - "loss": 0.7783, - "step": 29744 - }, - { - "epoch": 0.76, - "learning_rate": 1.747916225498088e-06, - "loss": 0.8115, - "step": 29745 - }, - { - "epoch": 0.76, - "learning_rate": 1.7478978577545634e-06, - "loss": 0.77, - "step": 29746 - }, - { - "epoch": 0.76, - "learning_rate": 1.7478794894384072e-06, - "loss": 1.0186, - "step": 29747 - }, - { - "epoch": 0.76, - "learning_rate": 1.7478611205496346e-06, - "loss": 0.7617, - "step": 29748 - }, - { - "epoch": 0.76, - "learning_rate": 1.747842751088259e-06, - "loss": 0.9844, - "step": 29749 - }, - { - "epoch": 0.76, - "learning_rate": 1.7478243810542944e-06, - "loss": 0.665, - "step": 29750 - }, - { - "epoch": 0.76, - "learning_rate": 1.7478060104477552e-06, - "loss": 0.9102, - "step": 29751 - }, - { - "epoch": 0.76, - "learning_rate": 1.7477876392686555e-06, - "loss": 0.8818, - "step": 29752 - }, - { - "epoch": 0.76, - "learning_rate": 1.7477692675170088e-06, - "loss": 0.5962, - "step": 29753 - }, - { - "epoch": 0.76, - "learning_rate": 1.7477508951928299e-06, - "loss": 0.9434, - "step": 29754 - }, - { - "epoch": 0.76, - "learning_rate": 1.7477325222961325e-06, - "loss": 0.8555, - "step": 29755 - }, - { - "epoch": 0.76, - "learning_rate": 1.7477141488269304e-06, - "loss": 0.7612, - "step": 29756 - }, - { - "epoch": 0.76, - "learning_rate": 1.7476957747852384e-06, - "loss": 0.6255, - "step": 29757 - }, - { - "epoch": 0.76, - "learning_rate": 1.7476774001710697e-06, - "loss": 1.0117, - "step": 29758 - }, - { - "epoch": 0.76, - "learning_rate": 1.7476590249844389e-06, - "loss": 0.96, - "step": 29759 - }, - { - "epoch": 0.76, - "learning_rate": 1.74764064922536e-06, - "loss": 1.0811, - "step": 29760 - }, - { - "epoch": 0.76, - "learning_rate": 1.747622272893847e-06, - "loss": 0.9346, - "step": 29761 - }, - { - "epoch": 0.76, - "learning_rate": 1.747603895989914e-06, - "loss": 0.7231, - "step": 29762 - }, - { - "epoch": 0.76, - "learning_rate": 1.7475855185135753e-06, - "loss": 0.6377, - "step": 29763 - }, - { - "epoch": 0.76, - "learning_rate": 1.7475671404648445e-06, - "loss": 0.8174, - "step": 29764 - }, - { - "epoch": 0.76, - "learning_rate": 1.7475487618437358e-06, - "loss": 0.8574, - "step": 29765 - }, - { - "epoch": 0.76, - "learning_rate": 1.7475303826502637e-06, - "loss": 0.9795, - "step": 29766 - }, - { - "epoch": 0.76, - "learning_rate": 1.7475120028844419e-06, - "loss": 0.8672, - "step": 29767 - }, - { - "epoch": 0.76, - "learning_rate": 1.747493622546284e-06, - "loss": 0.8604, - "step": 29768 - }, - { - "epoch": 0.76, - "learning_rate": 1.7474752416358055e-06, - "loss": 0.8242, - "step": 29769 - }, - { - "epoch": 0.76, - "learning_rate": 1.747456860153019e-06, - "loss": 0.6777, - "step": 29770 - }, - { - "epoch": 0.76, - "learning_rate": 1.7474384780979393e-06, - "loss": 0.7402, - "step": 29771 - }, - { - "epoch": 0.76, - "learning_rate": 1.7474200954705803e-06, - "loss": 0.7075, - "step": 29772 - }, - { - "epoch": 0.76, - "learning_rate": 1.7474017122709562e-06, - "loss": 0.7068, - "step": 29773 - }, - { - "epoch": 0.76, - "learning_rate": 1.7473833284990808e-06, - "loss": 0.6768, - "step": 29774 - }, - { - "epoch": 0.76, - "learning_rate": 1.7473649441549686e-06, - "loss": 0.71, - "step": 29775 - }, - { - "epoch": 0.76, - "learning_rate": 1.7473465592386331e-06, - "loss": 1.0293, - "step": 29776 - }, - { - "epoch": 0.76, - "learning_rate": 1.747328173750089e-06, - "loss": 0.6071, - "step": 29777 - }, - { - "epoch": 0.76, - "learning_rate": 1.74730978768935e-06, - "loss": 1.002, - "step": 29778 - }, - { - "epoch": 0.76, - "learning_rate": 1.74729140105643e-06, - "loss": 0.6572, - "step": 29779 - }, - { - "epoch": 0.76, - "learning_rate": 1.7472730138513435e-06, - "loss": 0.8477, - "step": 29780 - }, - { - "epoch": 0.76, - "learning_rate": 1.7472546260741045e-06, - "loss": 0.6689, - "step": 29781 - }, - { - "epoch": 0.76, - "learning_rate": 1.747236237724727e-06, - "loss": 0.8203, - "step": 29782 - }, - { - "epoch": 0.76, - "learning_rate": 1.747217848803225e-06, - "loss": 0.8447, - "step": 29783 - }, - { - "epoch": 0.76, - "learning_rate": 1.7471994593096126e-06, - "loss": 0.771, - "step": 29784 - }, - { - "epoch": 0.76, - "learning_rate": 1.7471810692439042e-06, - "loss": 0.8535, - "step": 29785 - }, - { - "epoch": 0.76, - "learning_rate": 1.7471626786061134e-06, - "loss": 0.8516, - "step": 29786 - }, - { - "epoch": 0.76, - "learning_rate": 1.7471442873962543e-06, - "loss": 0.5986, - "step": 29787 - }, - { - "epoch": 0.76, - "learning_rate": 1.7471258956143413e-06, - "loss": 1.0, - "step": 29788 - }, - { - "epoch": 0.76, - "learning_rate": 1.7471075032603885e-06, - "loss": 0.9111, - "step": 29789 - }, - { - "epoch": 0.76, - "learning_rate": 1.74708911033441e-06, - "loss": 0.7559, - "step": 29790 - }, - { - "epoch": 0.76, - "learning_rate": 1.7470707168364195e-06, - "loss": 0.9609, - "step": 29791 - }, - { - "epoch": 0.76, - "learning_rate": 1.747052322766431e-06, - "loss": 1.0625, - "step": 29792 - }, - { - "epoch": 0.76, - "learning_rate": 1.7470339281244592e-06, - "loss": 1.0166, - "step": 29793 - }, - { - "epoch": 0.76, - "learning_rate": 1.747015532910518e-06, - "loss": 0.8174, - "step": 29794 - }, - { - "epoch": 0.76, - "learning_rate": 1.7469971371246213e-06, - "loss": 0.96, - "step": 29795 - }, - { - "epoch": 0.76, - "learning_rate": 1.7469787407667828e-06, - "loss": 0.7593, - "step": 29796 - }, - { - "epoch": 0.76, - "learning_rate": 1.7469603438370174e-06, - "loss": 0.6311, - "step": 29797 - }, - { - "epoch": 0.76, - "learning_rate": 1.746941946335339e-06, - "loss": 0.8613, - "step": 29798 - }, - { - "epoch": 0.76, - "learning_rate": 1.7469235482617612e-06, - "loss": 0.8267, - "step": 29799 - }, - { - "epoch": 0.76, - "learning_rate": 1.7469051496162985e-06, - "loss": 0.6553, - "step": 29800 - }, - { - "epoch": 0.76, - "learning_rate": 1.7468867503989648e-06, - "loss": 0.8535, - "step": 29801 - }, - { - "epoch": 0.76, - "learning_rate": 1.7468683506097743e-06, - "loss": 0.7217, - "step": 29802 - }, - { - "epoch": 0.76, - "learning_rate": 1.746849950248741e-06, - "loss": 0.7896, - "step": 29803 - }, - { - "epoch": 0.76, - "learning_rate": 1.7468315493158793e-06, - "loss": 0.7366, - "step": 29804 - }, - { - "epoch": 0.76, - "learning_rate": 1.7468131478112027e-06, - "loss": 0.8525, - "step": 29805 - }, - { - "epoch": 0.76, - "learning_rate": 1.7467947457347255e-06, - "loss": 0.8135, - "step": 29806 - }, - { - "epoch": 0.76, - "learning_rate": 1.7467763430864624e-06, - "loss": 0.7271, - "step": 29807 - }, - { - "epoch": 0.76, - "learning_rate": 1.7467579398664266e-06, - "loss": 0.8096, - "step": 29808 - }, - { - "epoch": 0.76, - "learning_rate": 1.7467395360746327e-06, - "loss": 0.7397, - "step": 29809 - }, - { - "epoch": 0.76, - "learning_rate": 1.7467211317110946e-06, - "loss": 0.8984, - "step": 29810 - }, - { - "epoch": 0.76, - "learning_rate": 1.7467027267758266e-06, - "loss": 0.7266, - "step": 29811 - }, - { - "epoch": 0.76, - "learning_rate": 1.7466843212688425e-06, - "loss": 0.9678, - "step": 29812 - }, - { - "epoch": 0.76, - "learning_rate": 1.7466659151901566e-06, - "loss": 0.748, - "step": 29813 - }, - { - "epoch": 0.76, - "learning_rate": 1.7466475085397829e-06, - "loss": 0.8936, - "step": 29814 - }, - { - "epoch": 0.76, - "learning_rate": 1.7466291013177358e-06, - "loss": 0.8174, - "step": 29815 - }, - { - "epoch": 0.76, - "learning_rate": 1.7466106935240289e-06, - "loss": 0.8115, - "step": 29816 - }, - { - "epoch": 0.76, - "learning_rate": 1.7465922851586766e-06, - "loss": 0.7314, - "step": 29817 - }, - { - "epoch": 0.76, - "learning_rate": 1.7465738762216927e-06, - "loss": 0.9541, - "step": 29818 - }, - { - "epoch": 0.76, - "learning_rate": 1.7465554667130918e-06, - "loss": 0.9922, - "step": 29819 - }, - { - "epoch": 0.76, - "learning_rate": 1.7465370566328876e-06, - "loss": 0.834, - "step": 29820 - }, - { - "epoch": 0.76, - "learning_rate": 1.7465186459810942e-06, - "loss": 1.0449, - "step": 29821 - }, - { - "epoch": 0.76, - "learning_rate": 1.7465002347577257e-06, - "loss": 0.7734, - "step": 29822 - }, - { - "epoch": 0.76, - "learning_rate": 1.7464818229627966e-06, - "loss": 0.6428, - "step": 29823 - }, - { - "epoch": 0.76, - "learning_rate": 1.7464634105963207e-06, - "loss": 0.8813, - "step": 29824 - }, - { - "epoch": 0.76, - "learning_rate": 1.7464449976583119e-06, - "loss": 0.8062, - "step": 29825 - }, - { - "epoch": 0.76, - "learning_rate": 1.7464265841487845e-06, - "loss": 0.8115, - "step": 29826 - }, - { - "epoch": 0.76, - "learning_rate": 1.7464081700677528e-06, - "loss": 0.7783, - "step": 29827 - }, - { - "epoch": 0.76, - "learning_rate": 1.7463897554152305e-06, - "loss": 0.9531, - "step": 29828 - }, - { - "epoch": 0.76, - "learning_rate": 1.7463713401912318e-06, - "loss": 0.8037, - "step": 29829 - }, - { - "epoch": 0.76, - "learning_rate": 1.746352924395771e-06, - "loss": 0.9043, - "step": 29830 - }, - { - "epoch": 0.76, - "learning_rate": 1.7463345080288622e-06, - "loss": 0.7769, - "step": 29831 - }, - { - "epoch": 0.76, - "learning_rate": 1.7463160910905192e-06, - "loss": 0.6768, - "step": 29832 - }, - { - "epoch": 0.76, - "learning_rate": 1.7462976735807561e-06, - "loss": 1.0225, - "step": 29833 - }, - { - "epoch": 0.76, - "learning_rate": 1.7462792554995876e-06, - "loss": 0.7656, - "step": 29834 - }, - { - "epoch": 0.76, - "learning_rate": 1.7462608368470272e-06, - "loss": 0.7314, - "step": 29835 - }, - { - "epoch": 0.76, - "learning_rate": 1.7462424176230892e-06, - "loss": 0.9121, - "step": 29836 - }, - { - "epoch": 0.76, - "learning_rate": 1.7462239978277877e-06, - "loss": 0.646, - "step": 29837 - }, - { - "epoch": 0.76, - "learning_rate": 1.746205577461137e-06, - "loss": 0.6738, - "step": 29838 - }, - { - "epoch": 0.76, - "learning_rate": 1.7461871565231507e-06, - "loss": 0.8467, - "step": 29839 - }, - { - "epoch": 0.76, - "learning_rate": 1.7461687350138434e-06, - "loss": 0.7559, - "step": 29840 - }, - { - "epoch": 0.76, - "learning_rate": 1.7461503129332286e-06, - "loss": 0.957, - "step": 29841 - }, - { - "epoch": 0.76, - "learning_rate": 1.7461318902813214e-06, - "loss": 0.8384, - "step": 29842 - }, - { - "epoch": 0.76, - "learning_rate": 1.746113467058135e-06, - "loss": 0.6167, - "step": 29843 - }, - { - "epoch": 0.76, - "learning_rate": 1.746095043263684e-06, - "loss": 0.8359, - "step": 29844 - }, - { - "epoch": 0.76, - "learning_rate": 1.7460766188979822e-06, - "loss": 0.9277, - "step": 29845 - }, - { - "epoch": 0.76, - "learning_rate": 1.7460581939610438e-06, - "loss": 0.7959, - "step": 29846 - }, - { - "epoch": 0.76, - "learning_rate": 1.7460397684528828e-06, - "loss": 0.7222, - "step": 29847 - }, - { - "epoch": 0.77, - "learning_rate": 1.7460213423735138e-06, - "loss": 0.7222, - "step": 29848 - }, - { - "epoch": 0.77, - "learning_rate": 1.7460029157229504e-06, - "loss": 0.8032, - "step": 29849 - }, - { - "epoch": 0.77, - "learning_rate": 1.745984488501207e-06, - "loss": 0.5918, - "step": 29850 - }, - { - "epoch": 0.77, - "learning_rate": 1.7459660607082974e-06, - "loss": 0.8516, - "step": 29851 - }, - { - "epoch": 0.77, - "learning_rate": 1.745947632344236e-06, - "loss": 0.8623, - "step": 29852 - }, - { - "epoch": 0.77, - "learning_rate": 1.7459292034090365e-06, - "loss": 0.5393, - "step": 29853 - }, - { - "epoch": 0.77, - "learning_rate": 1.7459107739027136e-06, - "loss": 0.8398, - "step": 29854 - }, - { - "epoch": 0.77, - "learning_rate": 1.745892343825281e-06, - "loss": 0.9502, - "step": 29855 - }, - { - "epoch": 0.77, - "learning_rate": 1.7458739131767531e-06, - "loss": 0.7354, - "step": 29856 - }, - { - "epoch": 0.77, - "learning_rate": 1.7458554819571437e-06, - "loss": 0.8062, - "step": 29857 - }, - { - "epoch": 0.77, - "learning_rate": 1.7458370501664672e-06, - "loss": 1.0176, - "step": 29858 - }, - { - "epoch": 0.77, - "learning_rate": 1.7458186178047374e-06, - "loss": 0.8369, - "step": 29859 - }, - { - "epoch": 0.77, - "learning_rate": 1.7458001848719687e-06, - "loss": 0.9443, - "step": 29860 - }, - { - "epoch": 0.77, - "learning_rate": 1.7457817513681748e-06, - "loss": 1.0635, - "step": 29861 - }, - { - "epoch": 0.77, - "learning_rate": 1.7457633172933704e-06, - "loss": 0.8076, - "step": 29862 - }, - { - "epoch": 0.77, - "learning_rate": 1.7457448826475694e-06, - "loss": 0.8193, - "step": 29863 - }, - { - "epoch": 0.77, - "learning_rate": 1.7457264474307855e-06, - "loss": 0.9805, - "step": 29864 - }, - { - "epoch": 0.77, - "learning_rate": 1.7457080116430333e-06, - "loss": 0.6702, - "step": 29865 - }, - { - "epoch": 0.77, - "learning_rate": 1.7456895752843268e-06, - "loss": 0.7588, - "step": 29866 - }, - { - "epoch": 0.77, - "learning_rate": 1.7456711383546802e-06, - "loss": 0.811, - "step": 29867 - }, - { - "epoch": 0.77, - "learning_rate": 1.7456527008541074e-06, - "loss": 0.9297, - "step": 29868 - }, - { - "epoch": 0.77, - "learning_rate": 1.7456342627826227e-06, - "loss": 0.7451, - "step": 29869 - }, - { - "epoch": 0.77, - "learning_rate": 1.74561582414024e-06, - "loss": 0.6326, - "step": 29870 - }, - { - "epoch": 0.77, - "learning_rate": 1.7455973849269735e-06, - "loss": 0.7314, - "step": 29871 - }, - { - "epoch": 0.77, - "learning_rate": 1.7455789451428373e-06, - "loss": 0.5981, - "step": 29872 - }, - { - "epoch": 0.77, - "learning_rate": 1.7455605047878458e-06, - "loss": 0.7852, - "step": 29873 - }, - { - "epoch": 0.77, - "learning_rate": 1.7455420638620128e-06, - "loss": 0.8359, - "step": 29874 - }, - { - "epoch": 0.77, - "learning_rate": 1.7455236223653524e-06, - "loss": 0.9395, - "step": 29875 - }, - { - "epoch": 0.77, - "learning_rate": 1.745505180297879e-06, - "loss": 1.127, - "step": 29876 - }, - { - "epoch": 0.77, - "learning_rate": 1.7454867376596067e-06, - "loss": 0.7246, - "step": 29877 - }, - { - "epoch": 0.77, - "learning_rate": 1.7454682944505491e-06, - "loss": 1.0547, - "step": 29878 - }, - { - "epoch": 0.77, - "learning_rate": 1.7454498506707212e-06, - "loss": 1.082, - "step": 29879 - }, - { - "epoch": 0.77, - "learning_rate": 1.7454314063201362e-06, - "loss": 0.9951, - "step": 29880 - }, - { - "epoch": 0.77, - "learning_rate": 1.745412961398809e-06, - "loss": 0.9941, - "step": 29881 - }, - { - "epoch": 0.77, - "learning_rate": 1.745394515906753e-06, - "loss": 0.9307, - "step": 29882 - }, - { - "epoch": 0.77, - "learning_rate": 1.7453760698439827e-06, - "loss": 0.7988, - "step": 29883 - }, - { - "epoch": 0.77, - "learning_rate": 1.7453576232105124e-06, - "loss": 0.7881, - "step": 29884 - }, - { - "epoch": 0.77, - "learning_rate": 1.745339176006356e-06, - "loss": 0.9463, - "step": 29885 - }, - { - "epoch": 0.77, - "learning_rate": 1.7453207282315278e-06, - "loss": 0.8535, - "step": 29886 - }, - { - "epoch": 0.77, - "learning_rate": 1.7453022798860417e-06, - "loss": 1.0156, - "step": 29887 - }, - { - "epoch": 0.77, - "learning_rate": 1.745283830969912e-06, - "loss": 0.8672, - "step": 29888 - }, - { - "epoch": 0.77, - "learning_rate": 1.7452653814831524e-06, - "loss": 0.6631, - "step": 29889 - }, - { - "epoch": 0.77, - "learning_rate": 1.7452469314257775e-06, - "loss": 0.9512, - "step": 29890 - }, - { - "epoch": 0.77, - "learning_rate": 1.7452284807978015e-06, - "loss": 0.9307, - "step": 29891 - }, - { - "epoch": 0.77, - "learning_rate": 1.7452100295992382e-06, - "loss": 0.7808, - "step": 29892 - }, - { - "epoch": 0.77, - "learning_rate": 1.7451915778301021e-06, - "loss": 0.6035, - "step": 29893 - }, - { - "epoch": 0.77, - "learning_rate": 1.7451731254904067e-06, - "loss": 0.9062, - "step": 29894 - }, - { - "epoch": 0.77, - "learning_rate": 1.7451546725801667e-06, - "loss": 0.9502, - "step": 29895 - }, - { - "epoch": 0.77, - "learning_rate": 1.745136219099396e-06, - "loss": 0.4932, - "step": 29896 - }, - { - "epoch": 0.77, - "learning_rate": 1.7451177650481087e-06, - "loss": 0.9023, - "step": 29897 - }, - { - "epoch": 0.77, - "learning_rate": 1.745099310426319e-06, - "loss": 0.8926, - "step": 29898 - }, - { - "epoch": 0.77, - "learning_rate": 1.745080855234041e-06, - "loss": 1.0068, - "step": 29899 - }, - { - "epoch": 0.77, - "learning_rate": 1.7450623994712888e-06, - "loss": 0.7202, - "step": 29900 - }, - { - "epoch": 0.77, - "learning_rate": 1.7450439431380768e-06, - "loss": 0.9067, - "step": 29901 - }, - { - "epoch": 0.77, - "learning_rate": 1.7450254862344186e-06, - "loss": 0.8398, - "step": 29902 - }, - { - "epoch": 0.77, - "learning_rate": 1.7450070287603289e-06, - "loss": 0.7612, - "step": 29903 - }, - { - "epoch": 0.77, - "learning_rate": 1.7449885707158215e-06, - "loss": 0.7778, - "step": 29904 - }, - { - "epoch": 0.77, - "learning_rate": 1.7449701121009107e-06, - "loss": 0.8008, - "step": 29905 - }, - { - "epoch": 0.77, - "learning_rate": 1.7449516529156104e-06, - "loss": 1.0, - "step": 29906 - }, - { - "epoch": 0.77, - "learning_rate": 1.7449331931599347e-06, - "loss": 0.7734, - "step": 29907 - }, - { - "epoch": 0.77, - "learning_rate": 1.7449147328338983e-06, - "loss": 0.7949, - "step": 29908 - }, - { - "epoch": 0.77, - "learning_rate": 1.7448962719375146e-06, - "loss": 0.7424, - "step": 29909 - }, - { - "epoch": 0.77, - "learning_rate": 1.7448778104707983e-06, - "loss": 1.1328, - "step": 29910 - }, - { - "epoch": 0.77, - "learning_rate": 1.7448593484337632e-06, - "loss": 0.5593, - "step": 29911 - }, - { - "epoch": 0.77, - "learning_rate": 1.7448408858264236e-06, - "loss": 0.833, - "step": 29912 - }, - { - "epoch": 0.77, - "learning_rate": 1.7448224226487936e-06, - "loss": 0.7529, - "step": 29913 - }, - { - "epoch": 0.77, - "learning_rate": 1.7448039589008873e-06, - "loss": 0.9893, - "step": 29914 - }, - { - "epoch": 0.77, - "learning_rate": 1.744785494582719e-06, - "loss": 0.9951, - "step": 29915 - }, - { - "epoch": 0.77, - "learning_rate": 1.7447670296943025e-06, - "loss": 0.7666, - "step": 29916 - }, - { - "epoch": 0.77, - "learning_rate": 1.7447485642356522e-06, - "loss": 0.873, - "step": 29917 - }, - { - "epoch": 0.77, - "learning_rate": 1.7447300982067818e-06, - "loss": 0.7261, - "step": 29918 - }, - { - "epoch": 0.77, - "learning_rate": 1.7447116316077063e-06, - "loss": 1.0508, - "step": 29919 - }, - { - "epoch": 0.77, - "learning_rate": 1.744693164438439e-06, - "loss": 0.9287, - "step": 29920 - }, - { - "epoch": 0.77, - "learning_rate": 1.7446746966989948e-06, - "loss": 0.7476, - "step": 29921 - }, - { - "epoch": 0.77, - "learning_rate": 1.744656228389387e-06, - "loss": 0.8433, - "step": 29922 - }, - { - "epoch": 0.77, - "learning_rate": 1.7446377595096304e-06, - "loss": 0.8926, - "step": 29923 - }, - { - "epoch": 0.77, - "learning_rate": 1.744619290059739e-06, - "loss": 0.8047, - "step": 29924 - }, - { - "epoch": 0.77, - "learning_rate": 1.7446008200397267e-06, - "loss": 0.9526, - "step": 29925 - }, - { - "epoch": 0.77, - "learning_rate": 1.7445823494496076e-06, - "loss": 0.8037, - "step": 29926 - }, - { - "epoch": 0.77, - "learning_rate": 1.7445638782893965e-06, - "loss": 1.0908, - "step": 29927 - }, - { - "epoch": 0.77, - "learning_rate": 1.7445454065591067e-06, - "loss": 0.9551, - "step": 29928 - }, - { - "epoch": 0.77, - "learning_rate": 1.744526934258753e-06, - "loss": 1.1055, - "step": 29929 - }, - { - "epoch": 0.77, - "learning_rate": 1.744508461388349e-06, - "loss": 0.9199, - "step": 29930 - }, - { - "epoch": 0.77, - "learning_rate": 1.744489987947909e-06, - "loss": 0.7983, - "step": 29931 - }, - { - "epoch": 0.77, - "learning_rate": 1.7444715139374475e-06, - "loss": 1.0137, - "step": 29932 - }, - { - "epoch": 0.77, - "learning_rate": 1.7444530393569784e-06, - "loss": 0.9023, - "step": 29933 - }, - { - "epoch": 0.77, - "learning_rate": 1.744434564206516e-06, - "loss": 0.8413, - "step": 29934 - }, - { - "epoch": 0.77, - "learning_rate": 1.744416088486074e-06, - "loss": 0.8428, - "step": 29935 - }, - { - "epoch": 0.77, - "learning_rate": 1.7443976121956667e-06, - "loss": 0.8252, - "step": 29936 - }, - { - "epoch": 0.77, - "learning_rate": 1.7443791353353086e-06, - "loss": 0.9414, - "step": 29937 - }, - { - "epoch": 0.77, - "learning_rate": 1.7443606579050137e-06, - "loss": 1.0234, - "step": 29938 - }, - { - "epoch": 0.77, - "learning_rate": 1.744342179904796e-06, - "loss": 0.6484, - "step": 29939 - }, - { - "epoch": 0.77, - "learning_rate": 1.7443237013346696e-06, - "loss": 0.6494, - "step": 29940 - }, - { - "epoch": 0.77, - "learning_rate": 1.744305222194649e-06, - "loss": 0.7832, - "step": 29941 - }, - { - "epoch": 0.77, - "learning_rate": 1.744286742484748e-06, - "loss": 1.0371, - "step": 29942 - }, - { - "epoch": 0.77, - "learning_rate": 1.7442682622049807e-06, - "loss": 0.8955, - "step": 29943 - }, - { - "epoch": 0.77, - "learning_rate": 1.7442497813553617e-06, - "loss": 0.6309, - "step": 29944 - }, - { - "epoch": 0.77, - "learning_rate": 1.7442312999359046e-06, - "loss": 0.9629, - "step": 29945 - }, - { - "epoch": 0.77, - "learning_rate": 1.7442128179466239e-06, - "loss": 0.9639, - "step": 29946 - }, - { - "epoch": 0.77, - "learning_rate": 1.7441943353875335e-06, - "loss": 0.7236, - "step": 29947 - }, - { - "epoch": 0.77, - "learning_rate": 1.7441758522586481e-06, - "loss": 0.8506, - "step": 29948 - }, - { - "epoch": 0.77, - "learning_rate": 1.744157368559981e-06, - "loss": 1.002, - "step": 29949 - }, - { - "epoch": 0.77, - "learning_rate": 1.7441388842915474e-06, - "loss": 0.9414, - "step": 29950 - }, - { - "epoch": 0.77, - "learning_rate": 1.7441203994533604e-06, - "loss": 0.6055, - "step": 29951 - }, - { - "epoch": 0.77, - "learning_rate": 1.744101914045435e-06, - "loss": 0.9619, - "step": 29952 - }, - { - "epoch": 0.77, - "learning_rate": 1.7440834280677844e-06, - "loss": 0.8281, - "step": 29953 - }, - { - "epoch": 0.77, - "learning_rate": 1.744064941520424e-06, - "loss": 0.7891, - "step": 29954 - }, - { - "epoch": 0.77, - "learning_rate": 1.744046454403367e-06, - "loss": 0.8262, - "step": 29955 - }, - { - "epoch": 0.77, - "learning_rate": 1.7440279667166277e-06, - "loss": 0.8477, - "step": 29956 - }, - { - "epoch": 0.77, - "learning_rate": 1.7440094784602206e-06, - "loss": 0.7871, - "step": 29957 - }, - { - "epoch": 0.77, - "learning_rate": 1.7439909896341596e-06, - "loss": 0.8604, - "step": 29958 - }, - { - "epoch": 0.77, - "learning_rate": 1.743972500238459e-06, - "loss": 1.0059, - "step": 29959 - }, - { - "epoch": 0.77, - "learning_rate": 1.7439540102731325e-06, - "loss": 0.8955, - "step": 29960 - }, - { - "epoch": 0.77, - "learning_rate": 1.743935519738195e-06, - "loss": 0.6138, - "step": 29961 - }, - { - "epoch": 0.77, - "learning_rate": 1.7439170286336601e-06, - "loss": 0.9482, - "step": 29962 - }, - { - "epoch": 0.77, - "learning_rate": 1.7438985369595424e-06, - "loss": 0.874, - "step": 29963 - }, - { - "epoch": 0.77, - "learning_rate": 1.7438800447158553e-06, - "loss": 0.8545, - "step": 29964 - }, - { - "epoch": 0.77, - "learning_rate": 1.7438615519026139e-06, - "loss": 0.7124, - "step": 29965 - }, - { - "epoch": 0.77, - "learning_rate": 1.7438430585198316e-06, - "loss": 0.7646, - "step": 29966 - }, - { - "epoch": 0.77, - "learning_rate": 1.7438245645675232e-06, - "loss": 0.958, - "step": 29967 - }, - { - "epoch": 0.77, - "learning_rate": 1.7438060700457022e-06, - "loss": 0.5366, - "step": 29968 - }, - { - "epoch": 0.77, - "learning_rate": 1.7437875749543833e-06, - "loss": 0.8408, - "step": 29969 - }, - { - "epoch": 0.77, - "learning_rate": 1.7437690792935805e-06, - "loss": 0.6396, - "step": 29970 - }, - { - "epoch": 0.77, - "learning_rate": 1.7437505830633076e-06, - "loss": 0.9971, - "step": 29971 - }, - { - "epoch": 0.77, - "learning_rate": 1.7437320862635793e-06, - "loss": 0.9893, - "step": 29972 - }, - { - "epoch": 0.77, - "learning_rate": 1.7437135888944097e-06, - "loss": 0.7593, - "step": 29973 - }, - { - "epoch": 0.77, - "learning_rate": 1.7436950909558128e-06, - "loss": 0.874, - "step": 29974 - }, - { - "epoch": 0.77, - "learning_rate": 1.7436765924478025e-06, - "loss": 0.728, - "step": 29975 - }, - { - "epoch": 0.77, - "learning_rate": 1.7436580933703936e-06, - "loss": 0.6943, - "step": 29976 - }, - { - "epoch": 0.77, - "learning_rate": 1.7436395937235996e-06, - "loss": 0.9238, - "step": 29977 - }, - { - "epoch": 0.77, - "learning_rate": 1.7436210935074347e-06, - "loss": 0.793, - "step": 29978 - }, - { - "epoch": 0.77, - "learning_rate": 1.7436025927219137e-06, - "loss": 0.7437, - "step": 29979 - }, - { - "epoch": 0.77, - "learning_rate": 1.7435840913670504e-06, - "loss": 0.8682, - "step": 29980 - }, - { - "epoch": 0.77, - "learning_rate": 1.7435655894428586e-06, - "loss": 0.5166, - "step": 29981 - }, - { - "epoch": 0.77, - "learning_rate": 1.7435470869493533e-06, - "loss": 0.9609, - "step": 29982 - }, - { - "epoch": 0.77, - "learning_rate": 1.7435285838865478e-06, - "loss": 0.7979, - "step": 29983 - }, - { - "epoch": 0.77, - "learning_rate": 1.7435100802544568e-06, - "loss": 0.8105, - "step": 29984 - }, - { - "epoch": 0.77, - "learning_rate": 1.7434915760530944e-06, - "loss": 0.9551, - "step": 29985 - }, - { - "epoch": 0.77, - "learning_rate": 1.7434730712824746e-06, - "loss": 0.6812, - "step": 29986 - }, - { - "epoch": 0.77, - "learning_rate": 1.7434545659426117e-06, - "loss": 0.6943, - "step": 29987 - }, - { - "epoch": 0.77, - "learning_rate": 1.74343606003352e-06, - "loss": 0.9707, - "step": 29988 - }, - { - "epoch": 0.77, - "learning_rate": 1.743417553555213e-06, - "loss": 0.9004, - "step": 29989 - }, - { - "epoch": 0.77, - "learning_rate": 1.7433990465077057e-06, - "loss": 0.9434, - "step": 29990 - }, - { - "epoch": 0.77, - "learning_rate": 1.743380538891012e-06, - "loss": 0.8809, - "step": 29991 - }, - { - "epoch": 0.77, - "learning_rate": 1.7433620307051458e-06, - "loss": 0.7568, - "step": 29992 - }, - { - "epoch": 0.77, - "learning_rate": 1.7433435219501214e-06, - "loss": 0.8203, - "step": 29993 - }, - { - "epoch": 0.77, - "learning_rate": 1.743325012625953e-06, - "loss": 0.8721, - "step": 29994 - }, - { - "epoch": 0.77, - "learning_rate": 1.7433065027326553e-06, - "loss": 0.7441, - "step": 29995 - }, - { - "epoch": 0.77, - "learning_rate": 1.7432879922702416e-06, - "loss": 0.9316, - "step": 29996 - }, - { - "epoch": 0.77, - "learning_rate": 1.7432694812387267e-06, - "loss": 0.7119, - "step": 29997 - }, - { - "epoch": 0.77, - "learning_rate": 1.7432509696381244e-06, - "loss": 0.8809, - "step": 29998 - }, - { - "epoch": 0.77, - "learning_rate": 1.743232457468449e-06, - "loss": 0.96, - "step": 29999 - }, - { - "epoch": 0.77, - "learning_rate": 1.7432139447297147e-06, - "loss": 0.6895, - "step": 30000 - }, - { - "epoch": 0.77, - "learning_rate": 1.7431954314219354e-06, - "loss": 0.73, - "step": 30001 - }, - { - "epoch": 0.77, - "learning_rate": 1.7431769175451262e-06, - "loss": 0.8896, - "step": 30002 - }, - { - "epoch": 0.77, - "learning_rate": 1.7431584030992999e-06, - "loss": 0.8604, - "step": 30003 - }, - { - "epoch": 0.77, - "learning_rate": 1.7431398880844718e-06, - "loss": 0.9375, - "step": 30004 - }, - { - "epoch": 0.77, - "learning_rate": 1.7431213725006555e-06, - "loss": 1.0127, - "step": 30005 - }, - { - "epoch": 0.77, - "learning_rate": 1.7431028563478653e-06, - "loss": 0.9746, - "step": 30006 - }, - { - "epoch": 0.77, - "learning_rate": 1.7430843396261155e-06, - "loss": 1.0654, - "step": 30007 - }, - { - "epoch": 0.77, - "learning_rate": 1.7430658223354202e-06, - "loss": 0.8325, - "step": 30008 - }, - { - "epoch": 0.77, - "learning_rate": 1.7430473044757934e-06, - "loss": 0.8613, - "step": 30009 - }, - { - "epoch": 0.77, - "learning_rate": 1.7430287860472497e-06, - "loss": 0.7666, - "step": 30010 - }, - { - "epoch": 0.77, - "learning_rate": 1.7430102670498027e-06, - "loss": 0.9316, - "step": 30011 - }, - { - "epoch": 0.77, - "learning_rate": 1.742991747483467e-06, - "loss": 0.8403, - "step": 30012 - }, - { - "epoch": 0.77, - "learning_rate": 1.742973227348257e-06, - "loss": 0.8047, - "step": 30013 - }, - { - "epoch": 0.77, - "learning_rate": 1.7429547066441862e-06, - "loss": 0.8672, - "step": 30014 - }, - { - "epoch": 0.77, - "learning_rate": 1.742936185371269e-06, - "loss": 1.0479, - "step": 30015 - }, - { - "epoch": 0.77, - "learning_rate": 1.7429176635295204e-06, - "loss": 0.8672, - "step": 30016 - }, - { - "epoch": 0.77, - "learning_rate": 1.7428991411189535e-06, - "loss": 0.792, - "step": 30017 - }, - { - "epoch": 0.77, - "learning_rate": 1.742880618139583e-06, - "loss": 1.0469, - "step": 30018 - }, - { - "epoch": 0.77, - "learning_rate": 1.7428620945914228e-06, - "loss": 0.9912, - "step": 30019 - }, - { - "epoch": 0.77, - "learning_rate": 1.7428435704744873e-06, - "loss": 0.9141, - "step": 30020 - }, - { - "epoch": 0.77, - "learning_rate": 1.7428250457887907e-06, - "loss": 0.8887, - "step": 30021 - }, - { - "epoch": 0.77, - "learning_rate": 1.742806520534347e-06, - "loss": 0.9609, - "step": 30022 - }, - { - "epoch": 0.77, - "learning_rate": 1.7427879947111705e-06, - "loss": 0.7607, - "step": 30023 - }, - { - "epoch": 0.77, - "learning_rate": 1.7427694683192758e-06, - "loss": 0.9001, - "step": 30024 - }, - { - "epoch": 0.77, - "learning_rate": 1.742750941358676e-06, - "loss": 0.9395, - "step": 30025 - }, - { - "epoch": 0.77, - "learning_rate": 1.7427324138293865e-06, - "loss": 0.6309, - "step": 30026 - }, - { - "epoch": 0.77, - "learning_rate": 1.7427138857314207e-06, - "loss": 0.9854, - "step": 30027 - }, - { - "epoch": 0.77, - "learning_rate": 1.742695357064793e-06, - "loss": 0.7715, - "step": 30028 - }, - { - "epoch": 0.77, - "learning_rate": 1.7426768278295175e-06, - "loss": 0.5098, - "step": 30029 - }, - { - "epoch": 0.77, - "learning_rate": 1.742658298025609e-06, - "loss": 0.8594, - "step": 30030 - }, - { - "epoch": 0.77, - "learning_rate": 1.7426397676530806e-06, - "loss": 0.6719, - "step": 30031 - }, - { - "epoch": 0.77, - "learning_rate": 1.7426212367119475e-06, - "loss": 1.0283, - "step": 30032 - }, - { - "epoch": 0.77, - "learning_rate": 1.7426027052022234e-06, - "loss": 0.8555, - "step": 30033 - }, - { - "epoch": 0.77, - "learning_rate": 1.7425841731239223e-06, - "loss": 0.8174, - "step": 30034 - }, - { - "epoch": 0.77, - "learning_rate": 1.7425656404770588e-06, - "loss": 0.9258, - "step": 30035 - }, - { - "epoch": 0.77, - "learning_rate": 1.7425471072616471e-06, - "loss": 0.9824, - "step": 30036 - }, - { - "epoch": 0.77, - "learning_rate": 1.7425285734777008e-06, - "loss": 0.9385, - "step": 30037 - }, - { - "epoch": 0.77, - "learning_rate": 1.742510039125235e-06, - "loss": 1.1328, - "step": 30038 - }, - { - "epoch": 0.77, - "learning_rate": 1.7424915042042632e-06, - "loss": 0.9463, - "step": 30039 - }, - { - "epoch": 0.77, - "learning_rate": 1.7424729687147997e-06, - "loss": 1.1299, - "step": 30040 - }, - { - "epoch": 0.77, - "learning_rate": 1.742454432656859e-06, - "loss": 0.8906, - "step": 30041 - }, - { - "epoch": 0.77, - "learning_rate": 1.7424358960304549e-06, - "loss": 0.8525, - "step": 30042 - }, - { - "epoch": 0.77, - "learning_rate": 1.7424173588356017e-06, - "loss": 1.0215, - "step": 30043 - }, - { - "epoch": 0.77, - "learning_rate": 1.7423988210723136e-06, - "loss": 0.9785, - "step": 30044 - }, - { - "epoch": 0.77, - "learning_rate": 1.7423802827406052e-06, - "loss": 1.0156, - "step": 30045 - }, - { - "epoch": 0.77, - "learning_rate": 1.7423617438404903e-06, - "loss": 0.9365, - "step": 30046 - }, - { - "epoch": 0.77, - "learning_rate": 1.7423432043719833e-06, - "loss": 0.7378, - "step": 30047 - }, - { - "epoch": 0.77, - "learning_rate": 1.7423246643350978e-06, - "loss": 0.96, - "step": 30048 - }, - { - "epoch": 0.77, - "learning_rate": 1.7423061237298486e-06, - "loss": 0.7695, - "step": 30049 - }, - { - "epoch": 0.77, - "learning_rate": 1.7422875825562498e-06, - "loss": 0.7852, - "step": 30050 - }, - { - "epoch": 0.77, - "learning_rate": 1.7422690408143154e-06, - "loss": 1.0078, - "step": 30051 - }, - { - "epoch": 0.77, - "learning_rate": 1.74225049850406e-06, - "loss": 0.8975, - "step": 30052 - }, - { - "epoch": 0.77, - "learning_rate": 1.7422319556254972e-06, - "loss": 0.8242, - "step": 30053 - }, - { - "epoch": 0.77, - "learning_rate": 1.7422134121786415e-06, - "loss": 0.6711, - "step": 30054 - }, - { - "epoch": 0.77, - "learning_rate": 1.7421948681635075e-06, - "loss": 0.8564, - "step": 30055 - }, - { - "epoch": 0.77, - "learning_rate": 1.7421763235801085e-06, - "loss": 0.8779, - "step": 30056 - }, - { - "epoch": 0.77, - "learning_rate": 1.7421577784284595e-06, - "loss": 1.0498, - "step": 30057 - }, - { - "epoch": 0.77, - "learning_rate": 1.7421392327085746e-06, - "loss": 0.8994, - "step": 30058 - }, - { - "epoch": 0.77, - "learning_rate": 1.7421206864204679e-06, - "loss": 0.8682, - "step": 30059 - }, - { - "epoch": 0.77, - "learning_rate": 1.742102139564153e-06, - "loss": 0.6389, - "step": 30060 - }, - { - "epoch": 0.77, - "learning_rate": 1.7420835921396448e-06, - "loss": 0.9697, - "step": 30061 - }, - { - "epoch": 0.77, - "learning_rate": 1.7420650441469573e-06, - "loss": 0.6621, - "step": 30062 - }, - { - "epoch": 0.77, - "learning_rate": 1.7420464955861049e-06, - "loss": 0.9287, - "step": 30063 - }, - { - "epoch": 0.77, - "learning_rate": 1.7420279464571017e-06, - "loss": 0.8994, - "step": 30064 - }, - { - "epoch": 0.77, - "learning_rate": 1.7420093967599616e-06, - "loss": 0.9678, - "step": 30065 - }, - { - "epoch": 0.77, - "learning_rate": 1.741990846494699e-06, - "loss": 0.8489, - "step": 30066 - }, - { - "epoch": 0.77, - "learning_rate": 1.7419722956613284e-06, - "loss": 0.9453, - "step": 30067 - }, - { - "epoch": 0.77, - "learning_rate": 1.7419537442598633e-06, - "loss": 0.728, - "step": 30068 - }, - { - "epoch": 0.77, - "learning_rate": 1.7419351922903184e-06, - "loss": 0.8184, - "step": 30069 - }, - { - "epoch": 0.77, - "learning_rate": 1.7419166397527083e-06, - "loss": 0.8877, - "step": 30070 - }, - { - "epoch": 0.77, - "learning_rate": 1.7418980866470464e-06, - "loss": 0.6064, - "step": 30071 - }, - { - "epoch": 0.77, - "learning_rate": 1.741879532973347e-06, - "loss": 0.8477, - "step": 30072 - }, - { - "epoch": 0.77, - "learning_rate": 1.741860978731625e-06, - "loss": 0.7124, - "step": 30073 - }, - { - "epoch": 0.77, - "learning_rate": 1.741842423921894e-06, - "loss": 0.7188, - "step": 30074 - }, - { - "epoch": 0.77, - "learning_rate": 1.7418238685441684e-06, - "loss": 0.6265, - "step": 30075 - }, - { - "epoch": 0.77, - "learning_rate": 1.7418053125984624e-06, - "loss": 0.6475, - "step": 30076 - }, - { - "epoch": 0.77, - "learning_rate": 1.7417867560847901e-06, - "loss": 0.6787, - "step": 30077 - }, - { - "epoch": 0.77, - "learning_rate": 1.741768199003166e-06, - "loss": 0.9756, - "step": 30078 - }, - { - "epoch": 0.77, - "learning_rate": 1.7417496413536034e-06, - "loss": 1.0234, - "step": 30079 - }, - { - "epoch": 0.77, - "learning_rate": 1.741731083136118e-06, - "loss": 0.9351, - "step": 30080 - }, - { - "epoch": 0.77, - "learning_rate": 1.741712524350723e-06, - "loss": 0.9102, - "step": 30081 - }, - { - "epoch": 0.77, - "learning_rate": 1.7416939649974327e-06, - "loss": 1.0098, - "step": 30082 - }, - { - "epoch": 0.77, - "learning_rate": 1.7416754050762612e-06, - "loss": 0.8119, - "step": 30083 - }, - { - "epoch": 0.77, - "learning_rate": 1.7416568445872235e-06, - "loss": 0.8242, - "step": 30084 - }, - { - "epoch": 0.77, - "learning_rate": 1.7416382835303329e-06, - "loss": 0.917, - "step": 30085 - }, - { - "epoch": 0.77, - "learning_rate": 1.741619721905604e-06, - "loss": 1.0117, - "step": 30086 - }, - { - "epoch": 0.77, - "learning_rate": 1.741601159713051e-06, - "loss": 0.916, - "step": 30087 - }, - { - "epoch": 0.77, - "learning_rate": 1.7415825969526882e-06, - "loss": 0.6831, - "step": 30088 - }, - { - "epoch": 0.77, - "learning_rate": 1.7415640336245297e-06, - "loss": 0.9668, - "step": 30089 - }, - { - "epoch": 0.77, - "learning_rate": 1.7415454697285896e-06, - "loss": 0.8506, - "step": 30090 - }, - { - "epoch": 0.77, - "learning_rate": 1.7415269052648825e-06, - "loss": 0.9053, - "step": 30091 - }, - { - "epoch": 0.77, - "learning_rate": 1.7415083402334219e-06, - "loss": 0.7109, - "step": 30092 - }, - { - "epoch": 0.77, - "learning_rate": 1.7414897746342226e-06, - "loss": 1.0107, - "step": 30093 - }, - { - "epoch": 0.77, - "learning_rate": 1.741471208467299e-06, - "loss": 0.7842, - "step": 30094 - }, - { - "epoch": 0.77, - "learning_rate": 1.7414526417326645e-06, - "loss": 0.7759, - "step": 30095 - }, - { - "epoch": 0.77, - "learning_rate": 1.7414340744303341e-06, - "loss": 0.9102, - "step": 30096 - }, - { - "epoch": 0.77, - "learning_rate": 1.7414155065603217e-06, - "loss": 0.7686, - "step": 30097 - }, - { - "epoch": 0.77, - "learning_rate": 1.7413969381226416e-06, - "loss": 0.9473, - "step": 30098 - }, - { - "epoch": 0.77, - "learning_rate": 1.7413783691173079e-06, - "loss": 1.0576, - "step": 30099 - }, - { - "epoch": 0.77, - "learning_rate": 1.7413597995443349e-06, - "loss": 0.605, - "step": 30100 - }, - { - "epoch": 0.77, - "learning_rate": 1.7413412294037367e-06, - "loss": 1.0273, - "step": 30101 - }, - { - "epoch": 0.77, - "learning_rate": 1.7413226586955275e-06, - "loss": 0.8276, - "step": 30102 - }, - { - "epoch": 0.77, - "learning_rate": 1.7413040874197216e-06, - "loss": 0.8486, - "step": 30103 - }, - { - "epoch": 0.77, - "learning_rate": 1.7412855155763335e-06, - "loss": 0.9004, - "step": 30104 - }, - { - "epoch": 0.77, - "learning_rate": 1.7412669431653773e-06, - "loss": 0.6589, - "step": 30105 - }, - { - "epoch": 0.77, - "learning_rate": 1.7412483701868668e-06, - "loss": 1.0703, - "step": 30106 - }, - { - "epoch": 0.77, - "learning_rate": 1.7412297966408165e-06, - "loss": 0.9082, - "step": 30107 - }, - { - "epoch": 0.77, - "learning_rate": 1.7412112225272405e-06, - "loss": 0.9766, - "step": 30108 - }, - { - "epoch": 0.77, - "learning_rate": 1.7411926478461534e-06, - "loss": 0.9307, - "step": 30109 - }, - { - "epoch": 0.77, - "learning_rate": 1.7411740725975692e-06, - "loss": 0.8652, - "step": 30110 - }, - { - "epoch": 0.77, - "learning_rate": 1.7411554967815021e-06, - "loss": 0.8672, - "step": 30111 - }, - { - "epoch": 0.77, - "learning_rate": 1.7411369203979662e-06, - "loss": 0.9072, - "step": 30112 - }, - { - "epoch": 0.77, - "learning_rate": 1.7411183434469758e-06, - "loss": 1.04, - "step": 30113 - }, - { - "epoch": 0.77, - "learning_rate": 1.741099765928545e-06, - "loss": 0.8672, - "step": 30114 - }, - { - "epoch": 0.77, - "learning_rate": 1.7410811878426887e-06, - "loss": 0.7842, - "step": 30115 - }, - { - "epoch": 0.77, - "learning_rate": 1.7410626091894202e-06, - "loss": 0.8511, - "step": 30116 - }, - { - "epoch": 0.77, - "learning_rate": 1.7410440299687544e-06, - "loss": 0.9414, - "step": 30117 - }, - { - "epoch": 0.77, - "learning_rate": 1.741025450180705e-06, - "loss": 0.7871, - "step": 30118 - }, - { - "epoch": 0.77, - "learning_rate": 1.7410068698252866e-06, - "loss": 0.9775, - "step": 30119 - }, - { - "epoch": 0.77, - "learning_rate": 1.7409882889025134e-06, - "loss": 0.9014, - "step": 30120 - }, - { - "epoch": 0.77, - "learning_rate": 1.7409697074123994e-06, - "loss": 0.7017, - "step": 30121 - }, - { - "epoch": 0.77, - "learning_rate": 1.740951125354959e-06, - "loss": 1.0225, - "step": 30122 - }, - { - "epoch": 0.77, - "learning_rate": 1.7409325427302064e-06, - "loss": 0.7537, - "step": 30123 - }, - { - "epoch": 0.77, - "learning_rate": 1.7409139595381559e-06, - "loss": 0.853, - "step": 30124 - }, - { - "epoch": 0.77, - "learning_rate": 1.7408953757788214e-06, - "loss": 0.8369, - "step": 30125 - }, - { - "epoch": 0.77, - "learning_rate": 1.7408767914522177e-06, - "loss": 0.8428, - "step": 30126 - }, - { - "epoch": 0.77, - "learning_rate": 1.7408582065583585e-06, - "loss": 0.9619, - "step": 30127 - }, - { - "epoch": 0.77, - "learning_rate": 1.7408396210972582e-06, - "loss": 1.0498, - "step": 30128 - }, - { - "epoch": 0.77, - "learning_rate": 1.7408210350689314e-06, - "loss": 0.8613, - "step": 30129 - }, - { - "epoch": 0.77, - "learning_rate": 1.7408024484733916e-06, - "loss": 0.8013, - "step": 30130 - }, - { - "epoch": 0.77, - "learning_rate": 1.7407838613106537e-06, - "loss": 0.8193, - "step": 30131 - }, - { - "epoch": 0.77, - "learning_rate": 1.7407652735807313e-06, - "loss": 0.9072, - "step": 30132 - }, - { - "epoch": 0.77, - "learning_rate": 1.7407466852836395e-06, - "loss": 0.875, - "step": 30133 - }, - { - "epoch": 0.77, - "learning_rate": 1.7407280964193918e-06, - "loss": 1.0312, - "step": 30134 - }, - { - "epoch": 0.77, - "learning_rate": 1.7407095069880024e-06, - "loss": 0.9639, - "step": 30135 - }, - { - "epoch": 0.77, - "learning_rate": 1.7406909169894863e-06, - "loss": 0.7524, - "step": 30136 - }, - { - "epoch": 0.77, - "learning_rate": 1.7406723264238567e-06, - "loss": 0.6846, - "step": 30137 - }, - { - "epoch": 0.77, - "learning_rate": 1.7406537352911287e-06, - "loss": 0.8516, - "step": 30138 - }, - { - "epoch": 0.77, - "learning_rate": 1.7406351435913163e-06, - "loss": 0.6411, - "step": 30139 - }, - { - "epoch": 0.77, - "learning_rate": 1.7406165513244332e-06, - "loss": 0.8232, - "step": 30140 - }, - { - "epoch": 0.77, - "learning_rate": 1.7405979584904945e-06, - "loss": 0.8765, - "step": 30141 - }, - { - "epoch": 0.77, - "learning_rate": 1.7405793650895135e-06, - "loss": 1.0625, - "step": 30142 - }, - { - "epoch": 0.77, - "learning_rate": 1.7405607711215054e-06, - "loss": 1.0586, - "step": 30143 - }, - { - "epoch": 0.77, - "learning_rate": 1.7405421765864837e-06, - "loss": 0.6953, - "step": 30144 - }, - { - "epoch": 0.77, - "learning_rate": 1.740523581484463e-06, - "loss": 0.8872, - "step": 30145 - }, - { - "epoch": 0.77, - "learning_rate": 1.7405049858154573e-06, - "loss": 1.042, - "step": 30146 - }, - { - "epoch": 0.77, - "learning_rate": 1.7404863895794813e-06, - "loss": 0.7988, - "step": 30147 - }, - { - "epoch": 0.77, - "learning_rate": 1.7404677927765485e-06, - "loss": 0.9473, - "step": 30148 - }, - { - "epoch": 0.77, - "learning_rate": 1.7404491954066738e-06, - "loss": 0.7305, - "step": 30149 - }, - { - "epoch": 0.77, - "learning_rate": 1.7404305974698712e-06, - "loss": 0.8945, - "step": 30150 - }, - { - "epoch": 0.77, - "learning_rate": 1.740411998966155e-06, - "loss": 0.8506, - "step": 30151 - }, - { - "epoch": 0.77, - "learning_rate": 1.7403933998955393e-06, - "loss": 0.8779, - "step": 30152 - }, - { - "epoch": 0.77, - "learning_rate": 1.7403748002580386e-06, - "loss": 0.7495, - "step": 30153 - }, - { - "epoch": 0.77, - "learning_rate": 1.7403562000536668e-06, - "loss": 0.9785, - "step": 30154 - }, - { - "epoch": 0.77, - "learning_rate": 1.740337599282438e-06, - "loss": 0.9492, - "step": 30155 - }, - { - "epoch": 0.77, - "learning_rate": 1.740318997944367e-06, - "loss": 0.7407, - "step": 30156 - }, - { - "epoch": 0.77, - "learning_rate": 1.7403003960394678e-06, - "loss": 1.1143, - "step": 30157 - }, - { - "epoch": 0.77, - "learning_rate": 1.7402817935677545e-06, - "loss": 0.657, - "step": 30158 - }, - { - "epoch": 0.77, - "learning_rate": 1.7402631905292418e-06, - "loss": 0.9424, - "step": 30159 - }, - { - "epoch": 0.77, - "learning_rate": 1.7402445869239434e-06, - "loss": 0.6904, - "step": 30160 - }, - { - "epoch": 0.77, - "learning_rate": 1.7402259827518738e-06, - "loss": 0.6812, - "step": 30161 - }, - { - "epoch": 0.77, - "learning_rate": 1.740207378013047e-06, - "loss": 0.8228, - "step": 30162 - }, - { - "epoch": 0.77, - "learning_rate": 1.7401887727074777e-06, - "loss": 0.9106, - "step": 30163 - }, - { - "epoch": 0.77, - "learning_rate": 1.7401701668351799e-06, - "loss": 0.75, - "step": 30164 - }, - { - "epoch": 0.77, - "learning_rate": 1.7401515603961676e-06, - "loss": 0.7104, - "step": 30165 - }, - { - "epoch": 0.77, - "learning_rate": 1.7401329533904554e-06, - "loss": 1.0049, - "step": 30166 - }, - { - "epoch": 0.77, - "learning_rate": 1.7401143458180573e-06, - "loss": 0.9951, - "step": 30167 - }, - { - "epoch": 0.77, - "learning_rate": 1.7400957376789881e-06, - "loss": 0.6538, - "step": 30168 - }, - { - "epoch": 0.77, - "learning_rate": 1.7400771289732613e-06, - "loss": 0.873, - "step": 30169 - }, - { - "epoch": 0.77, - "learning_rate": 1.7400585197008914e-06, - "loss": 1.0586, - "step": 30170 - }, - { - "epoch": 0.77, - "learning_rate": 1.740039909861893e-06, - "loss": 0.7783, - "step": 30171 - }, - { - "epoch": 0.77, - "learning_rate": 1.7400212994562796e-06, - "loss": 0.999, - "step": 30172 - }, - { - "epoch": 0.77, - "learning_rate": 1.7400026884840667e-06, - "loss": 0.9355, - "step": 30173 - }, - { - "epoch": 0.77, - "learning_rate": 1.739984076945267e-06, - "loss": 0.8682, - "step": 30174 - }, - { - "epoch": 0.77, - "learning_rate": 1.739965464839896e-06, - "loss": 0.8291, - "step": 30175 - }, - { - "epoch": 0.77, - "learning_rate": 1.7399468521679672e-06, - "loss": 0.6477, - "step": 30176 - }, - { - "epoch": 0.77, - "learning_rate": 1.7399282389294952e-06, - "loss": 0.9854, - "step": 30177 - }, - { - "epoch": 0.77, - "learning_rate": 1.7399096251244943e-06, - "loss": 0.8579, - "step": 30178 - }, - { - "epoch": 0.77, - "learning_rate": 1.7398910107529785e-06, - "loss": 0.7935, - "step": 30179 - }, - { - "epoch": 0.77, - "learning_rate": 1.7398723958149621e-06, - "loss": 0.9609, - "step": 30180 - }, - { - "epoch": 0.77, - "learning_rate": 1.7398537803104593e-06, - "loss": 0.7815, - "step": 30181 - }, - { - "epoch": 0.77, - "learning_rate": 1.739835164239485e-06, - "loss": 0.8408, - "step": 30182 - }, - { - "epoch": 0.77, - "learning_rate": 1.7398165476020522e-06, - "loss": 0.6514, - "step": 30183 - }, - { - "epoch": 0.77, - "learning_rate": 1.7397979303981764e-06, - "loss": 0.9893, - "step": 30184 - }, - { - "epoch": 0.77, - "learning_rate": 1.7397793126278714e-06, - "loss": 0.8281, - "step": 30185 - }, - { - "epoch": 0.77, - "learning_rate": 1.7397606942911513e-06, - "loss": 0.7368, - "step": 30186 - }, - { - "epoch": 0.77, - "learning_rate": 1.7397420753880306e-06, - "loss": 0.8271, - "step": 30187 - }, - { - "epoch": 0.77, - "learning_rate": 1.739723455918523e-06, - "loss": 0.8574, - "step": 30188 - }, - { - "epoch": 0.77, - "learning_rate": 1.7397048358826432e-06, - "loss": 0.7236, - "step": 30189 - }, - { - "epoch": 0.77, - "learning_rate": 1.7396862152804057e-06, - "loss": 0.7354, - "step": 30190 - }, - { - "epoch": 0.77, - "learning_rate": 1.7396675941118245e-06, - "loss": 0.8447, - "step": 30191 - }, - { - "epoch": 0.77, - "learning_rate": 1.7396489723769134e-06, - "loss": 0.9609, - "step": 30192 - }, - { - "epoch": 0.77, - "learning_rate": 1.7396303500756875e-06, - "loss": 0.6792, - "step": 30193 - }, - { - "epoch": 0.77, - "learning_rate": 1.7396117272081606e-06, - "loss": 0.8379, - "step": 30194 - }, - { - "epoch": 0.77, - "learning_rate": 1.739593103774347e-06, - "loss": 0.8652, - "step": 30195 - }, - { - "epoch": 0.77, - "learning_rate": 1.7395744797742609e-06, - "loss": 0.7949, - "step": 30196 - }, - { - "epoch": 0.77, - "learning_rate": 1.7395558552079166e-06, - "loss": 0.6934, - "step": 30197 - }, - { - "epoch": 0.77, - "learning_rate": 1.7395372300753283e-06, - "loss": 0.8174, - "step": 30198 - }, - { - "epoch": 0.77, - "learning_rate": 1.7395186043765103e-06, - "loss": 0.9131, - "step": 30199 - }, - { - "epoch": 0.77, - "learning_rate": 1.7394999781114773e-06, - "loss": 0.8418, - "step": 30200 - }, - { - "epoch": 0.77, - "learning_rate": 1.739481351280243e-06, - "loss": 1.0859, - "step": 30201 - }, - { - "epoch": 0.77, - "learning_rate": 1.7394627238828216e-06, - "loss": 0.7998, - "step": 30202 - }, - { - "epoch": 0.77, - "learning_rate": 1.7394440959192279e-06, - "loss": 0.729, - "step": 30203 - }, - { - "epoch": 0.77, - "learning_rate": 1.7394254673894757e-06, - "loss": 0.7725, - "step": 30204 - }, - { - "epoch": 0.77, - "learning_rate": 1.7394068382935796e-06, - "loss": 0.875, - "step": 30205 - }, - { - "epoch": 0.77, - "learning_rate": 1.7393882086315535e-06, - "loss": 0.7285, - "step": 30206 - }, - { - "epoch": 0.77, - "learning_rate": 1.7393695784034117e-06, - "loss": 0.793, - "step": 30207 - }, - { - "epoch": 0.77, - "learning_rate": 1.739350947609169e-06, - "loss": 0.8779, - "step": 30208 - }, - { - "epoch": 0.77, - "learning_rate": 1.7393323162488392e-06, - "loss": 0.9805, - "step": 30209 - }, - { - "epoch": 0.77, - "learning_rate": 1.7393136843224363e-06, - "loss": 0.6309, - "step": 30210 - }, - { - "epoch": 0.77, - "learning_rate": 1.7392950518299751e-06, - "loss": 0.7703, - "step": 30211 - }, - { - "epoch": 0.77, - "learning_rate": 1.7392764187714696e-06, - "loss": 0.8018, - "step": 30212 - }, - { - "epoch": 0.77, - "learning_rate": 1.7392577851469343e-06, - "loss": 0.7725, - "step": 30213 - }, - { - "epoch": 0.77, - "learning_rate": 1.7392391509563834e-06, - "loss": 0.7744, - "step": 30214 - }, - { - "epoch": 0.77, - "learning_rate": 1.7392205161998308e-06, - "loss": 0.8311, - "step": 30215 - }, - { - "epoch": 0.77, - "learning_rate": 1.739201880877291e-06, - "loss": 0.8701, - "step": 30216 - }, - { - "epoch": 0.77, - "learning_rate": 1.7391832449887784e-06, - "loss": 0.7534, - "step": 30217 - }, - { - "epoch": 0.77, - "learning_rate": 1.7391646085343075e-06, - "loss": 0.6035, - "step": 30218 - }, - { - "epoch": 0.77, - "learning_rate": 1.739145971513892e-06, - "loss": 0.7715, - "step": 30219 - }, - { - "epoch": 0.77, - "learning_rate": 1.7391273339275463e-06, - "loss": 0.8525, - "step": 30220 - }, - { - "epoch": 0.77, - "learning_rate": 1.7391086957752847e-06, - "loss": 0.8438, - "step": 30221 - }, - { - "epoch": 0.77, - "learning_rate": 1.7390900570571218e-06, - "loss": 0.7949, - "step": 30222 - }, - { - "epoch": 0.77, - "learning_rate": 1.7390714177730717e-06, - "loss": 0.7783, - "step": 30223 - }, - { - "epoch": 0.77, - "learning_rate": 1.7390527779231485e-06, - "loss": 0.8828, - "step": 30224 - }, - { - "epoch": 0.77, - "learning_rate": 1.7390341375073664e-06, - "loss": 0.6558, - "step": 30225 - }, - { - "epoch": 0.77, - "learning_rate": 1.7390154965257399e-06, - "loss": 0.8223, - "step": 30226 - }, - { - "epoch": 0.77, - "learning_rate": 1.7389968549782835e-06, - "loss": 1.0234, - "step": 30227 - }, - { - "epoch": 0.77, - "learning_rate": 1.7389782128650107e-06, - "loss": 1.001, - "step": 30228 - }, - { - "epoch": 0.77, - "learning_rate": 1.7389595701859367e-06, - "loss": 0.8154, - "step": 30229 - }, - { - "epoch": 0.77, - "learning_rate": 1.7389409269410752e-06, - "loss": 1.0703, - "step": 30230 - }, - { - "epoch": 0.77, - "learning_rate": 1.7389222831304406e-06, - "loss": 1.1436, - "step": 30231 - }, - { - "epoch": 0.77, - "learning_rate": 1.7389036387540472e-06, - "loss": 0.8828, - "step": 30232 - }, - { - "epoch": 0.77, - "learning_rate": 1.7388849938119093e-06, - "loss": 0.4924, - "step": 30233 - }, - { - "epoch": 0.77, - "learning_rate": 1.7388663483040409e-06, - "loss": 0.792, - "step": 30234 - }, - { - "epoch": 0.77, - "learning_rate": 1.7388477022304567e-06, - "loss": 0.8311, - "step": 30235 - }, - { - "epoch": 0.77, - "learning_rate": 1.7388290555911706e-06, - "loss": 1.0156, - "step": 30236 - }, - { - "epoch": 0.77, - "learning_rate": 1.7388104083861975e-06, - "loss": 0.6714, - "step": 30237 - }, - { - "epoch": 0.78, - "learning_rate": 1.7387917606155509e-06, - "loss": 0.8828, - "step": 30238 - }, - { - "epoch": 0.78, - "learning_rate": 1.7387731122792454e-06, - "loss": 0.7871, - "step": 30239 - }, - { - "epoch": 0.78, - "learning_rate": 1.7387544633772952e-06, - "loss": 0.8174, - "step": 30240 - }, - { - "epoch": 0.78, - "learning_rate": 1.7387358139097153e-06, - "loss": 1.0166, - "step": 30241 - }, - { - "epoch": 0.78, - "learning_rate": 1.7387171638765189e-06, - "loss": 0.9453, - "step": 30242 - }, - { - "epoch": 0.78, - "learning_rate": 1.7386985132777205e-06, - "loss": 1.0244, - "step": 30243 - }, - { - "epoch": 0.78, - "learning_rate": 1.7386798621133349e-06, - "loss": 0.8242, - "step": 30244 - }, - { - "epoch": 0.78, - "learning_rate": 1.738661210383376e-06, - "loss": 0.8535, - "step": 30245 - }, - { - "epoch": 0.78, - "learning_rate": 1.7386425580878585e-06, - "loss": 1.0713, - "step": 30246 - }, - { - "epoch": 0.78, - "learning_rate": 1.738623905226796e-06, - "loss": 0.9316, - "step": 30247 - }, - { - "epoch": 0.78, - "learning_rate": 1.7386052518002033e-06, - "loss": 0.8516, - "step": 30248 - }, - { - "epoch": 0.78, - "learning_rate": 1.7385865978080942e-06, - "loss": 0.6208, - "step": 30249 - }, - { - "epoch": 0.78, - "learning_rate": 1.7385679432504836e-06, - "loss": 0.8916, - "step": 30250 - }, - { - "epoch": 0.78, - "learning_rate": 1.7385492881273855e-06, - "loss": 0.8545, - "step": 30251 - }, - { - "epoch": 0.78, - "learning_rate": 1.738530632438814e-06, - "loss": 0.9424, - "step": 30252 - }, - { - "epoch": 0.78, - "learning_rate": 1.738511976184784e-06, - "loss": 0.5132, - "step": 30253 - }, - { - "epoch": 0.78, - "learning_rate": 1.7384933193653088e-06, - "loss": 0.9106, - "step": 30254 - }, - { - "epoch": 0.78, - "learning_rate": 1.7384746619804034e-06, - "loss": 0.9678, - "step": 30255 - }, - { - "epoch": 0.78, - "learning_rate": 1.738456004030082e-06, - "loss": 0.9316, - "step": 30256 - }, - { - "epoch": 0.78, - "learning_rate": 1.7384373455143586e-06, - "loss": 0.7559, - "step": 30257 - }, - { - "epoch": 0.78, - "learning_rate": 1.738418686433248e-06, - "loss": 0.7959, - "step": 30258 - }, - { - "epoch": 0.78, - "learning_rate": 1.7384000267867638e-06, - "loss": 0.9883, - "step": 30259 - }, - { - "epoch": 0.78, - "learning_rate": 1.738381366574921e-06, - "loss": 0.835, - "step": 30260 - }, - { - "epoch": 0.78, - "learning_rate": 1.7383627057977332e-06, - "loss": 0.8623, - "step": 30261 - }, - { - "epoch": 0.78, - "learning_rate": 1.7383440444552152e-06, - "loss": 0.9297, - "step": 30262 - }, - { - "epoch": 0.78, - "learning_rate": 1.7383253825473814e-06, - "loss": 0.8213, - "step": 30263 - }, - { - "epoch": 0.78, - "learning_rate": 1.7383067200742452e-06, - "loss": 0.8599, - "step": 30264 - }, - { - "epoch": 0.78, - "learning_rate": 1.738288057035822e-06, - "loss": 0.8857, - "step": 30265 - }, - { - "epoch": 0.78, - "learning_rate": 1.7382693934321253e-06, - "loss": 0.832, - "step": 30266 - }, - { - "epoch": 0.78, - "learning_rate": 1.7382507292631696e-06, - "loss": 0.7212, - "step": 30267 - }, - { - "epoch": 0.78, - "learning_rate": 1.7382320645289697e-06, - "loss": 0.8838, - "step": 30268 - }, - { - "epoch": 0.78, - "learning_rate": 1.738213399229539e-06, - "loss": 0.8926, - "step": 30269 - }, - { - "epoch": 0.78, - "learning_rate": 1.7381947333648923e-06, - "loss": 1.0518, - "step": 30270 - }, - { - "epoch": 0.78, - "learning_rate": 1.7381760669350443e-06, - "loss": 0.9883, - "step": 30271 - }, - { - "epoch": 0.78, - "learning_rate": 1.7381573999400082e-06, - "loss": 0.458, - "step": 30272 - }, - { - "epoch": 0.78, - "learning_rate": 1.7381387323797994e-06, - "loss": 0.8584, - "step": 30273 - }, - { - "epoch": 0.78, - "learning_rate": 1.7381200642544314e-06, - "loss": 0.7959, - "step": 30274 - }, - { - "epoch": 0.78, - "learning_rate": 1.7381013955639188e-06, - "loss": 0.7988, - "step": 30275 - }, - { - "epoch": 0.78, - "learning_rate": 1.738082726308276e-06, - "loss": 0.6157, - "step": 30276 - }, - { - "epoch": 0.78, - "learning_rate": 1.7380640564875172e-06, - "loss": 0.5559, - "step": 30277 - }, - { - "epoch": 0.78, - "learning_rate": 1.7380453861016569e-06, - "loss": 0.9351, - "step": 30278 - }, - { - "epoch": 0.78, - "learning_rate": 1.738026715150709e-06, - "loss": 0.999, - "step": 30279 - }, - { - "epoch": 0.78, - "learning_rate": 1.738008043634688e-06, - "loss": 1.0986, - "step": 30280 - }, - { - "epoch": 0.78, - "learning_rate": 1.737989371553608e-06, - "loss": 0.7803, - "step": 30281 - }, - { - "epoch": 0.78, - "learning_rate": 1.7379706989074835e-06, - "loss": 0.874, - "step": 30282 - }, - { - "epoch": 0.78, - "learning_rate": 1.737952025696329e-06, - "loss": 1.1289, - "step": 30283 - }, - { - "epoch": 0.78, - "learning_rate": 1.7379333519201584e-06, - "loss": 1.0225, - "step": 30284 - }, - { - "epoch": 0.78, - "learning_rate": 1.737914677578986e-06, - "loss": 0.67, - "step": 30285 - }, - { - "epoch": 0.78, - "learning_rate": 1.7378960026728269e-06, - "loss": 0.9209, - "step": 30286 - }, - { - "epoch": 0.78, - "learning_rate": 1.7378773272016941e-06, - "loss": 1.0312, - "step": 30287 - }, - { - "epoch": 0.78, - "learning_rate": 1.7378586511656027e-06, - "loss": 0.7856, - "step": 30288 - }, - { - "epoch": 0.78, - "learning_rate": 1.737839974564567e-06, - "loss": 0.8936, - "step": 30289 - }, - { - "epoch": 0.78, - "learning_rate": 1.737821297398601e-06, - "loss": 0.9736, - "step": 30290 - }, - { - "epoch": 0.78, - "learning_rate": 1.7378026196677197e-06, - "loss": 1.0264, - "step": 30291 - }, - { - "epoch": 0.78, - "learning_rate": 1.7377839413719362e-06, - "loss": 0.6729, - "step": 30292 - }, - { - "epoch": 0.78, - "learning_rate": 1.7377652625112658e-06, - "loss": 0.8789, - "step": 30293 - }, - { - "epoch": 0.78, - "learning_rate": 1.7377465830857223e-06, - "loss": 0.8611, - "step": 30294 - }, - { - "epoch": 0.78, - "learning_rate": 1.7377279030953202e-06, - "loss": 0.8027, - "step": 30295 - }, - { - "epoch": 0.78, - "learning_rate": 1.7377092225400738e-06, - "loss": 0.7178, - "step": 30296 - }, - { - "epoch": 0.78, - "learning_rate": 1.7376905414199975e-06, - "loss": 0.7063, - "step": 30297 - }, - { - "epoch": 0.78, - "learning_rate": 1.7376718597351052e-06, - "loss": 0.9229, - "step": 30298 - }, - { - "epoch": 0.78, - "learning_rate": 1.7376531774854115e-06, - "loss": 0.4912, - "step": 30299 - }, - { - "epoch": 0.78, - "learning_rate": 1.7376344946709306e-06, - "loss": 1.0498, - "step": 30300 - }, - { - "epoch": 0.78, - "learning_rate": 1.7376158112916772e-06, - "loss": 0.957, - "step": 30301 - }, - { - "epoch": 0.78, - "learning_rate": 1.7375971273476653e-06, - "loss": 0.7397, - "step": 30302 - }, - { - "epoch": 0.78, - "learning_rate": 1.737578442838909e-06, - "loss": 0.9224, - "step": 30303 - }, - { - "epoch": 0.78, - "learning_rate": 1.737559757765423e-06, - "loss": 0.6968, - "step": 30304 - }, - { - "epoch": 0.78, - "learning_rate": 1.737541072127221e-06, - "loss": 0.8496, - "step": 30305 - }, - { - "epoch": 0.78, - "learning_rate": 1.737522385924318e-06, - "loss": 0.8818, - "step": 30306 - }, - { - "epoch": 0.78, - "learning_rate": 1.737503699156728e-06, - "loss": 0.834, - "step": 30307 - }, - { - "epoch": 0.78, - "learning_rate": 1.7374850118244653e-06, - "loss": 1.0293, - "step": 30308 - }, - { - "epoch": 0.78, - "learning_rate": 1.7374663239275443e-06, - "loss": 0.9229, - "step": 30309 - }, - { - "epoch": 0.78, - "learning_rate": 1.7374476354659793e-06, - "loss": 0.7646, - "step": 30310 - }, - { - "epoch": 0.78, - "learning_rate": 1.7374289464397842e-06, - "loss": 0.9375, - "step": 30311 - }, - { - "epoch": 0.78, - "learning_rate": 1.7374102568489742e-06, - "loss": 0.9668, - "step": 30312 - }, - { - "epoch": 0.78, - "learning_rate": 1.7373915666935628e-06, - "loss": 0.8223, - "step": 30313 - }, - { - "epoch": 0.78, - "learning_rate": 1.7373728759735645e-06, - "loss": 1.0098, - "step": 30314 - }, - { - "epoch": 0.78, - "learning_rate": 1.7373541846889937e-06, - "loss": 0.8125, - "step": 30315 - }, - { - "epoch": 0.78, - "learning_rate": 1.7373354928398648e-06, - "loss": 0.7646, - "step": 30316 - }, - { - "epoch": 0.78, - "learning_rate": 1.737316800426192e-06, - "loss": 0.8721, - "step": 30317 - }, - { - "epoch": 0.78, - "learning_rate": 1.7372981074479895e-06, - "loss": 0.8506, - "step": 30318 - }, - { - "epoch": 0.78, - "learning_rate": 1.737279413905272e-06, - "loss": 0.5801, - "step": 30319 - }, - { - "epoch": 0.78, - "learning_rate": 1.7372607197980533e-06, - "loss": 0.9014, - "step": 30320 - }, - { - "epoch": 0.78, - "learning_rate": 1.7372420251263482e-06, - "loss": 0.6562, - "step": 30321 - }, - { - "epoch": 0.78, - "learning_rate": 1.7372233298901705e-06, - "loss": 0.6641, - "step": 30322 - }, - { - "epoch": 0.78, - "learning_rate": 1.737204634089535e-06, - "loss": 0.8643, - "step": 30323 - }, - { - "epoch": 0.78, - "learning_rate": 1.7371859377244558e-06, - "loss": 0.9082, - "step": 30324 - }, - { - "epoch": 0.78, - "learning_rate": 1.7371672407949474e-06, - "loss": 0.8652, - "step": 30325 - }, - { - "epoch": 0.78, - "learning_rate": 1.7371485433010235e-06, - "loss": 0.9053, - "step": 30326 - }, - { - "epoch": 0.78, - "learning_rate": 1.7371298452426993e-06, - "loss": 0.8364, - "step": 30327 - }, - { - "epoch": 0.78, - "learning_rate": 1.7371111466199881e-06, - "loss": 0.8066, - "step": 30328 - }, - { - "epoch": 0.78, - "learning_rate": 1.7370924474329055e-06, - "loss": 0.6079, - "step": 30329 - }, - { - "epoch": 0.78, - "learning_rate": 1.7370737476814645e-06, - "loss": 0.8218, - "step": 30330 - }, - { - "epoch": 0.78, - "learning_rate": 1.7370550473656804e-06, - "loss": 0.811, - "step": 30331 - }, - { - "epoch": 0.78, - "learning_rate": 1.7370363464855671e-06, - "loss": 0.8223, - "step": 30332 - }, - { - "epoch": 0.78, - "learning_rate": 1.737017645041139e-06, - "loss": 0.6294, - "step": 30333 - }, - { - "epoch": 0.78, - "learning_rate": 1.7369989430324102e-06, - "loss": 0.9473, - "step": 30334 - }, - { - "epoch": 0.78, - "learning_rate": 1.736980240459395e-06, - "loss": 0.9619, - "step": 30335 - }, - { - "epoch": 0.78, - "learning_rate": 1.7369615373221082e-06, - "loss": 0.8083, - "step": 30336 - }, - { - "epoch": 0.78, - "learning_rate": 1.7369428336205638e-06, - "loss": 0.6841, - "step": 30337 - }, - { - "epoch": 0.78, - "learning_rate": 1.7369241293547764e-06, - "loss": 0.7646, - "step": 30338 - }, - { - "epoch": 0.78, - "learning_rate": 1.7369054245247596e-06, - "loss": 0.9561, - "step": 30339 - }, - { - "epoch": 0.78, - "learning_rate": 1.7368867191305285e-06, - "loss": 0.9238, - "step": 30340 - }, - { - "epoch": 0.78, - "learning_rate": 1.736868013172097e-06, - "loss": 0.9028, - "step": 30341 - }, - { - "epoch": 0.78, - "learning_rate": 1.7368493066494796e-06, - "loss": 0.6772, - "step": 30342 - }, - { - "epoch": 0.78, - "learning_rate": 1.7368305995626905e-06, - "loss": 0.8584, - "step": 30343 - }, - { - "epoch": 0.78, - "learning_rate": 1.7368118919117442e-06, - "loss": 0.8086, - "step": 30344 - }, - { - "epoch": 0.78, - "learning_rate": 1.736793183696655e-06, - "loss": 0.8525, - "step": 30345 - }, - { - "epoch": 0.78, - "learning_rate": 1.7367744749174368e-06, - "loss": 0.9971, - "step": 30346 - }, - { - "epoch": 0.78, - "learning_rate": 1.7367557655741045e-06, - "loss": 0.8477, - "step": 30347 - }, - { - "epoch": 0.78, - "learning_rate": 1.7367370556666722e-06, - "loss": 0.9004, - "step": 30348 - }, - { - "epoch": 0.78, - "learning_rate": 1.7367183451951545e-06, - "loss": 0.9785, - "step": 30349 - }, - { - "epoch": 0.78, - "learning_rate": 1.736699634159565e-06, - "loss": 0.6392, - "step": 30350 - }, - { - "epoch": 0.78, - "learning_rate": 1.7366809225599183e-06, - "loss": 0.9531, - "step": 30351 - }, - { - "epoch": 0.78, - "learning_rate": 1.7366622103962293e-06, - "loss": 0.8154, - "step": 30352 - }, - { - "epoch": 0.78, - "learning_rate": 1.7366434976685118e-06, - "loss": 0.7285, - "step": 30353 - }, - { - "epoch": 0.78, - "learning_rate": 1.7366247843767803e-06, - "loss": 0.8096, - "step": 30354 - }, - { - "epoch": 0.78, - "learning_rate": 1.736606070521049e-06, - "loss": 0.7668, - "step": 30355 - }, - { - "epoch": 0.78, - "learning_rate": 1.7365873561013324e-06, - "loss": 0.9199, - "step": 30356 - }, - { - "epoch": 0.78, - "learning_rate": 1.7365686411176445e-06, - "loss": 0.8145, - "step": 30357 - }, - { - "epoch": 0.78, - "learning_rate": 1.7365499255700002e-06, - "loss": 0.9717, - "step": 30358 - }, - { - "epoch": 0.78, - "learning_rate": 1.736531209458413e-06, - "loss": 0.7241, - "step": 30359 - }, - { - "epoch": 0.78, - "learning_rate": 1.7365124927828982e-06, - "loss": 0.8271, - "step": 30360 - }, - { - "epoch": 0.78, - "learning_rate": 1.7364937755434695e-06, - "loss": 0.7866, - "step": 30361 - }, - { - "epoch": 0.78, - "learning_rate": 1.7364750577401413e-06, - "loss": 1.0381, - "step": 30362 - }, - { - "epoch": 0.78, - "learning_rate": 1.736456339372928e-06, - "loss": 1.0342, - "step": 30363 - }, - { - "epoch": 0.78, - "learning_rate": 1.736437620441844e-06, - "loss": 0.856, - "step": 30364 - }, - { - "epoch": 0.78, - "learning_rate": 1.7364189009469036e-06, - "loss": 0.6858, - "step": 30365 - }, - { - "epoch": 0.78, - "learning_rate": 1.736400180888121e-06, - "loss": 0.7666, - "step": 30366 - }, - { - "epoch": 0.78, - "learning_rate": 1.7363814602655106e-06, - "loss": 0.9805, - "step": 30367 - }, - { - "epoch": 0.78, - "learning_rate": 1.7363627390790869e-06, - "loss": 0.7764, - "step": 30368 - }, - { - "epoch": 0.78, - "learning_rate": 1.7363440173288645e-06, - "loss": 0.7876, - "step": 30369 - }, - { - "epoch": 0.78, - "learning_rate": 1.7363252950148567e-06, - "loss": 0.8164, - "step": 30370 - }, - { - "epoch": 0.78, - "learning_rate": 1.7363065721370789e-06, - "loss": 1.0156, - "step": 30371 - }, - { - "epoch": 0.78, - "learning_rate": 1.7362878486955449e-06, - "loss": 0.8711, - "step": 30372 - }, - { - "epoch": 0.78, - "learning_rate": 1.736269124690269e-06, - "loss": 0.6108, - "step": 30373 - }, - { - "epoch": 0.78, - "learning_rate": 1.7362504001212658e-06, - "loss": 0.793, - "step": 30374 - }, - { - "epoch": 0.78, - "learning_rate": 1.7362316749885494e-06, - "loss": 0.8994, - "step": 30375 - }, - { - "epoch": 0.78, - "learning_rate": 1.7362129492921343e-06, - "loss": 0.8867, - "step": 30376 - }, - { - "epoch": 0.78, - "learning_rate": 1.7361942230320347e-06, - "loss": 0.7246, - "step": 30377 - }, - { - "epoch": 0.78, - "learning_rate": 1.7361754962082653e-06, - "loss": 1.0, - "step": 30378 - }, - { - "epoch": 0.78, - "learning_rate": 1.73615676882084e-06, - "loss": 0.7754, - "step": 30379 - }, - { - "epoch": 0.78, - "learning_rate": 1.7361380408697736e-06, - "loss": 0.7783, - "step": 30380 - }, - { - "epoch": 0.78, - "learning_rate": 1.73611931235508e-06, - "loss": 0.9141, - "step": 30381 - }, - { - "epoch": 0.78, - "learning_rate": 1.7361005832767734e-06, - "loss": 0.7754, - "step": 30382 - }, - { - "epoch": 0.78, - "learning_rate": 1.7360818536348689e-06, - "loss": 0.8477, - "step": 30383 - }, - { - "epoch": 0.78, - "learning_rate": 1.73606312342938e-06, - "loss": 1.002, - "step": 30384 - }, - { - "epoch": 0.78, - "learning_rate": 1.7360443926603216e-06, - "loss": 0.8555, - "step": 30385 - }, - { - "epoch": 0.78, - "learning_rate": 1.7360256613277077e-06, - "loss": 0.8359, - "step": 30386 - }, - { - "epoch": 0.78, - "learning_rate": 1.736006929431553e-06, - "loss": 0.4766, - "step": 30387 - }, - { - "epoch": 0.78, - "learning_rate": 1.7359881969718716e-06, - "loss": 0.8652, - "step": 30388 - }, - { - "epoch": 0.78, - "learning_rate": 1.7359694639486774e-06, - "loss": 0.8398, - "step": 30389 - }, - { - "epoch": 0.78, - "learning_rate": 1.7359507303619859e-06, - "loss": 0.9033, - "step": 30390 - }, - { - "epoch": 0.78, - "learning_rate": 1.7359319962118103e-06, - "loss": 0.793, - "step": 30391 - }, - { - "epoch": 0.78, - "learning_rate": 1.7359132614981658e-06, - "loss": 0.687, - "step": 30392 - }, - { - "epoch": 0.78, - "learning_rate": 1.735894526221066e-06, - "loss": 0.7871, - "step": 30393 - }, - { - "epoch": 0.78, - "learning_rate": 1.735875790380526e-06, - "loss": 0.834, - "step": 30394 - }, - { - "epoch": 0.78, - "learning_rate": 1.7358570539765593e-06, - "loss": 0.7656, - "step": 30395 - }, - { - "epoch": 0.78, - "learning_rate": 1.7358383170091807e-06, - "loss": 0.7188, - "step": 30396 - }, - { - "epoch": 0.78, - "learning_rate": 1.735819579478405e-06, - "loss": 0.9629, - "step": 30397 - }, - { - "epoch": 0.78, - "learning_rate": 1.7358008413842456e-06, - "loss": 0.9473, - "step": 30398 - }, - { - "epoch": 0.78, - "learning_rate": 1.7357821027267177e-06, - "loss": 0.7524, - "step": 30399 - }, - { - "epoch": 0.78, - "learning_rate": 1.735763363505835e-06, - "loss": 1.0625, - "step": 30400 - }, - { - "epoch": 0.78, - "learning_rate": 1.7357446237216123e-06, - "loss": 0.9697, - "step": 30401 - }, - { - "epoch": 0.78, - "learning_rate": 1.7357258833740637e-06, - "loss": 1.0645, - "step": 30402 - }, - { - "epoch": 0.78, - "learning_rate": 1.7357071424632034e-06, - "loss": 0.5676, - "step": 30403 - }, - { - "epoch": 0.78, - "learning_rate": 1.7356884009890465e-06, - "loss": 0.9717, - "step": 30404 - }, - { - "epoch": 0.78, - "learning_rate": 1.7356696589516064e-06, - "loss": 0.9316, - "step": 30405 - }, - { - "epoch": 0.78, - "learning_rate": 1.7356509163508978e-06, - "loss": 1.1523, - "step": 30406 - }, - { - "epoch": 0.78, - "learning_rate": 1.7356321731869354e-06, - "loss": 0.8955, - "step": 30407 - }, - { - "epoch": 0.78, - "learning_rate": 1.7356134294597333e-06, - "loss": 0.8975, - "step": 30408 - }, - { - "epoch": 0.78, - "learning_rate": 1.7355946851693054e-06, - "loss": 0.6885, - "step": 30409 - }, - { - "epoch": 0.78, - "learning_rate": 1.7355759403156669e-06, - "loss": 0.874, - "step": 30410 - }, - { - "epoch": 0.78, - "learning_rate": 1.7355571948988317e-06, - "loss": 0.9355, - "step": 30411 - }, - { - "epoch": 0.78, - "learning_rate": 1.735538448918814e-06, - "loss": 0.9609, - "step": 30412 - }, - { - "epoch": 0.78, - "learning_rate": 1.7355197023756282e-06, - "loss": 0.8965, - "step": 30413 - }, - { - "epoch": 0.78, - "learning_rate": 1.735500955269289e-06, - "loss": 0.9951, - "step": 30414 - }, - { - "epoch": 0.78, - "learning_rate": 1.7354822075998108e-06, - "loss": 0.8281, - "step": 30415 - }, - { - "epoch": 0.78, - "learning_rate": 1.7354634593672073e-06, - "loss": 0.9629, - "step": 30416 - }, - { - "epoch": 0.78, - "learning_rate": 1.7354447105714933e-06, - "loss": 0.7324, - "step": 30417 - }, - { - "epoch": 0.78, - "learning_rate": 1.7354259612126832e-06, - "loss": 0.7095, - "step": 30418 - }, - { - "epoch": 0.78, - "learning_rate": 1.7354072112907912e-06, - "loss": 0.7957, - "step": 30419 - }, - { - "epoch": 0.78, - "learning_rate": 1.7353884608058318e-06, - "loss": 0.9199, - "step": 30420 - }, - { - "epoch": 0.78, - "learning_rate": 1.735369709757819e-06, - "loss": 0.9746, - "step": 30421 - }, - { - "epoch": 0.78, - "learning_rate": 1.7353509581467676e-06, - "loss": 0.9316, - "step": 30422 - }, - { - "epoch": 0.78, - "learning_rate": 1.7353322059726917e-06, - "loss": 1.0078, - "step": 30423 - }, - { - "epoch": 0.78, - "learning_rate": 1.735313453235606e-06, - "loss": 0.6899, - "step": 30424 - }, - { - "epoch": 0.78, - "learning_rate": 1.7352946999355247e-06, - "loss": 0.7977, - "step": 30425 - }, - { - "epoch": 0.78, - "learning_rate": 1.7352759460724617e-06, - "loss": 0.7266, - "step": 30426 - }, - { - "epoch": 0.78, - "learning_rate": 1.7352571916464318e-06, - "loss": 0.8389, - "step": 30427 - }, - { - "epoch": 0.78, - "learning_rate": 1.7352384366574492e-06, - "loss": 0.9033, - "step": 30428 - }, - { - "epoch": 0.78, - "learning_rate": 1.7352196811055287e-06, - "loss": 0.7617, - "step": 30429 - }, - { - "epoch": 0.78, - "learning_rate": 1.735200924990684e-06, - "loss": 0.8818, - "step": 30430 - }, - { - "epoch": 0.78, - "learning_rate": 1.7351821683129298e-06, - "loss": 0.6753, - "step": 30431 - }, - { - "epoch": 0.78, - "learning_rate": 1.7351634110722801e-06, - "loss": 0.8887, - "step": 30432 - }, - { - "epoch": 0.78, - "learning_rate": 1.7351446532687502e-06, - "loss": 0.7773, - "step": 30433 - }, - { - "epoch": 0.78, - "learning_rate": 1.7351258949023536e-06, - "loss": 0.9092, - "step": 30434 - }, - { - "epoch": 0.78, - "learning_rate": 1.7351071359731043e-06, - "loss": 0.9736, - "step": 30435 - }, - { - "epoch": 0.78, - "learning_rate": 1.735088376481018e-06, - "loss": 0.7393, - "step": 30436 - }, - { - "epoch": 0.78, - "learning_rate": 1.735069616426108e-06, - "loss": 0.7231, - "step": 30437 - }, - { - "epoch": 0.78, - "learning_rate": 1.7350508558083892e-06, - "loss": 0.9727, - "step": 30438 - }, - { - "epoch": 0.78, - "learning_rate": 1.7350320946278757e-06, - "loss": 0.8271, - "step": 30439 - }, - { - "epoch": 0.78, - "learning_rate": 1.735013332884582e-06, - "loss": 0.7329, - "step": 30440 - }, - { - "epoch": 0.78, - "learning_rate": 1.7349945705785223e-06, - "loss": 0.7881, - "step": 30441 - }, - { - "epoch": 0.78, - "learning_rate": 1.734975807709711e-06, - "loss": 0.9746, - "step": 30442 - }, - { - "epoch": 0.78, - "learning_rate": 1.7349570442781624e-06, - "loss": 0.6055, - "step": 30443 - }, - { - "epoch": 0.78, - "learning_rate": 1.7349382802838912e-06, - "loss": 0.9287, - "step": 30444 - }, - { - "epoch": 0.78, - "learning_rate": 1.7349195157269117e-06, - "loss": 0.7637, - "step": 30445 - }, - { - "epoch": 0.78, - "learning_rate": 1.7349007506072378e-06, - "loss": 0.7705, - "step": 30446 - }, - { - "epoch": 0.78, - "learning_rate": 1.7348819849248844e-06, - "loss": 0.9512, - "step": 30447 - }, - { - "epoch": 0.78, - "learning_rate": 1.7348632186798656e-06, - "loss": 0.8486, - "step": 30448 - }, - { - "epoch": 0.78, - "learning_rate": 1.7348444518721958e-06, - "loss": 0.7852, - "step": 30449 - }, - { - "epoch": 0.78, - "learning_rate": 1.7348256845018894e-06, - "loss": 0.5398, - "step": 30450 - }, - { - "epoch": 0.78, - "learning_rate": 1.7348069165689607e-06, - "loss": 0.6875, - "step": 30451 - }, - { - "epoch": 0.78, - "learning_rate": 1.734788148073424e-06, - "loss": 1.1006, - "step": 30452 - }, - { - "epoch": 0.78, - "learning_rate": 1.7347693790152941e-06, - "loss": 0.9321, - "step": 30453 - }, - { - "epoch": 0.78, - "learning_rate": 1.734750609394585e-06, - "loss": 0.9775, - "step": 30454 - }, - { - "epoch": 0.78, - "learning_rate": 1.734731839211311e-06, - "loss": 0.9697, - "step": 30455 - }, - { - "epoch": 0.78, - "learning_rate": 1.7347130684654868e-06, - "loss": 0.9287, - "step": 30456 - }, - { - "epoch": 0.78, - "learning_rate": 1.7346942971571266e-06, - "loss": 0.6709, - "step": 30457 - }, - { - "epoch": 0.78, - "learning_rate": 1.7346755252862443e-06, - "loss": 0.5254, - "step": 30458 - }, - { - "epoch": 0.78, - "learning_rate": 1.7346567528528554e-06, - "loss": 0.5513, - "step": 30459 - }, - { - "epoch": 0.78, - "learning_rate": 1.734637979856973e-06, - "loss": 0.9453, - "step": 30460 - }, - { - "epoch": 0.78, - "learning_rate": 1.7346192062986124e-06, - "loss": 0.9609, - "step": 30461 - }, - { - "epoch": 0.78, - "learning_rate": 1.7346004321777875e-06, - "loss": 0.7346, - "step": 30462 - }, - { - "epoch": 0.78, - "learning_rate": 1.7345816574945132e-06, - "loss": 0.915, - "step": 30463 - }, - { - "epoch": 0.78, - "learning_rate": 1.7345628822488031e-06, - "loss": 0.9121, - "step": 30464 - }, - { - "epoch": 0.78, - "learning_rate": 1.7345441064406723e-06, - "loss": 0.8682, - "step": 30465 - }, - { - "epoch": 0.78, - "learning_rate": 1.7345253300701346e-06, - "loss": 0.9775, - "step": 30466 - }, - { - "epoch": 0.78, - "learning_rate": 1.7345065531372048e-06, - "loss": 0.9287, - "step": 30467 - }, - { - "epoch": 0.78, - "learning_rate": 1.734487775641897e-06, - "loss": 0.9219, - "step": 30468 - }, - { - "epoch": 0.78, - "learning_rate": 1.7344689975842255e-06, - "loss": 0.7517, - "step": 30469 - }, - { - "epoch": 0.78, - "learning_rate": 1.7344502189642053e-06, - "loss": 1.0527, - "step": 30470 - }, - { - "epoch": 0.78, - "learning_rate": 1.7344314397818498e-06, - "loss": 0.636, - "step": 30471 - }, - { - "epoch": 0.78, - "learning_rate": 1.7344126600371744e-06, - "loss": 0.8555, - "step": 30472 - }, - { - "epoch": 0.78, - "learning_rate": 1.734393879730193e-06, - "loss": 0.9053, - "step": 30473 - }, - { - "epoch": 0.78, - "learning_rate": 1.7343750988609196e-06, - "loss": 0.9199, - "step": 30474 - }, - { - "epoch": 0.78, - "learning_rate": 1.7343563174293692e-06, - "loss": 0.769, - "step": 30475 - }, - { - "epoch": 0.78, - "learning_rate": 1.7343375354355557e-06, - "loss": 0.8955, - "step": 30476 - }, - { - "epoch": 0.78, - "learning_rate": 1.734318752879494e-06, - "loss": 0.8574, - "step": 30477 - }, - { - "epoch": 0.78, - "learning_rate": 1.7342999697611979e-06, - "loss": 0.8267, - "step": 30478 - }, - { - "epoch": 0.78, - "learning_rate": 1.7342811860806824e-06, - "loss": 0.998, - "step": 30479 - }, - { - "epoch": 0.78, - "learning_rate": 1.7342624018379612e-06, - "loss": 0.7568, - "step": 30480 - }, - { - "epoch": 0.78, - "learning_rate": 1.7342436170330493e-06, - "loss": 0.6804, - "step": 30481 - }, - { - "epoch": 0.78, - "learning_rate": 1.7342248316659606e-06, - "loss": 0.8516, - "step": 30482 - }, - { - "epoch": 0.78, - "learning_rate": 1.7342060457367102e-06, - "loss": 0.9766, - "step": 30483 - }, - { - "epoch": 0.78, - "learning_rate": 1.7341872592453116e-06, - "loss": 1.1631, - "step": 30484 - }, - { - "epoch": 0.78, - "learning_rate": 1.7341684721917797e-06, - "loss": 0.8999, - "step": 30485 - }, - { - "epoch": 0.78, - "learning_rate": 1.7341496845761286e-06, - "loss": 0.8945, - "step": 30486 - }, - { - "epoch": 0.78, - "learning_rate": 1.7341308963983733e-06, - "loss": 0.9268, - "step": 30487 - }, - { - "epoch": 0.78, - "learning_rate": 1.734112107658527e-06, - "loss": 0.7632, - "step": 30488 - }, - { - "epoch": 0.78, - "learning_rate": 1.7340933183566053e-06, - "loss": 0.7451, - "step": 30489 - }, - { - "epoch": 0.78, - "learning_rate": 1.734074528492622e-06, - "loss": 0.791, - "step": 30490 - }, - { - "epoch": 0.78, - "learning_rate": 1.7340557380665916e-06, - "loss": 0.6831, - "step": 30491 - }, - { - "epoch": 0.78, - "learning_rate": 1.7340369470785286e-06, - "loss": 1.0508, - "step": 30492 - }, - { - "epoch": 0.78, - "learning_rate": 1.734018155528447e-06, - "loss": 0.9355, - "step": 30493 - }, - { - "epoch": 0.78, - "learning_rate": 1.7339993634163618e-06, - "loss": 0.8164, - "step": 30494 - }, - { - "epoch": 0.78, - "learning_rate": 1.7339805707422866e-06, - "loss": 0.7178, - "step": 30495 - }, - { - "epoch": 0.78, - "learning_rate": 1.7339617775062364e-06, - "loss": 0.9414, - "step": 30496 - }, - { - "epoch": 0.78, - "learning_rate": 1.7339429837082256e-06, - "loss": 0.8706, - "step": 30497 - }, - { - "epoch": 0.78, - "learning_rate": 1.7339241893482682e-06, - "loss": 0.8223, - "step": 30498 - }, - { - "epoch": 0.78, - "learning_rate": 1.7339053944263787e-06, - "loss": 0.9092, - "step": 30499 - }, - { - "epoch": 0.78, - "learning_rate": 1.7338865989425718e-06, - "loss": 0.8975, - "step": 30500 - }, - { - "epoch": 0.78, - "learning_rate": 1.7338678028968617e-06, - "loss": 0.8462, - "step": 30501 - }, - { - "epoch": 0.78, - "learning_rate": 1.7338490062892625e-06, - "loss": 0.8555, - "step": 30502 - }, - { - "epoch": 0.78, - "learning_rate": 1.7338302091197891e-06, - "loss": 0.7319, - "step": 30503 - }, - { - "epoch": 0.78, - "learning_rate": 1.7338114113884555e-06, - "loss": 0.8154, - "step": 30504 - }, - { - "epoch": 0.78, - "learning_rate": 1.7337926130952764e-06, - "loss": 0.8486, - "step": 30505 - }, - { - "epoch": 0.78, - "learning_rate": 1.733773814240266e-06, - "loss": 0.8848, - "step": 30506 - }, - { - "epoch": 0.78, - "learning_rate": 1.7337550148234387e-06, - "loss": 0.9111, - "step": 30507 - }, - { - "epoch": 0.78, - "learning_rate": 1.733736214844809e-06, - "loss": 0.6182, - "step": 30508 - }, - { - "epoch": 0.78, - "learning_rate": 1.7337174143043911e-06, - "loss": 0.8281, - "step": 30509 - }, - { - "epoch": 0.78, - "learning_rate": 1.7336986132021996e-06, - "loss": 0.9531, - "step": 30510 - }, - { - "epoch": 0.78, - "learning_rate": 1.7336798115382485e-06, - "loss": 0.8115, - "step": 30511 - }, - { - "epoch": 0.78, - "learning_rate": 1.733661009312553e-06, - "loss": 1.0127, - "step": 30512 - }, - { - "epoch": 0.78, - "learning_rate": 1.7336422065251268e-06, - "loss": 0.7402, - "step": 30513 - }, - { - "epoch": 0.78, - "learning_rate": 1.7336234031759841e-06, - "loss": 0.9121, - "step": 30514 - }, - { - "epoch": 0.78, - "learning_rate": 1.7336045992651402e-06, - "loss": 0.6697, - "step": 30515 - }, - { - "epoch": 0.78, - "learning_rate": 1.733585794792609e-06, - "loss": 0.9053, - "step": 30516 - }, - { - "epoch": 0.78, - "learning_rate": 1.7335669897584047e-06, - "loss": 0.9092, - "step": 30517 - }, - { - "epoch": 0.78, - "learning_rate": 1.733548184162542e-06, - "loss": 0.8135, - "step": 30518 - }, - { - "epoch": 0.78, - "learning_rate": 1.733529378005035e-06, - "loss": 0.8057, - "step": 30519 - }, - { - "epoch": 0.78, - "learning_rate": 1.7335105712858983e-06, - "loss": 0.9346, - "step": 30520 - }, - { - "epoch": 0.78, - "learning_rate": 1.7334917640051466e-06, - "loss": 0.8418, - "step": 30521 - }, - { - "epoch": 0.78, - "learning_rate": 1.7334729561627938e-06, - "loss": 0.8701, - "step": 30522 - }, - { - "epoch": 0.78, - "learning_rate": 1.7334541477588545e-06, - "loss": 1.0752, - "step": 30523 - }, - { - "epoch": 0.78, - "learning_rate": 1.7334353387933428e-06, - "loss": 0.7444, - "step": 30524 - }, - { - "epoch": 0.78, - "learning_rate": 1.7334165292662734e-06, - "loss": 0.7549, - "step": 30525 - }, - { - "epoch": 0.78, - "learning_rate": 1.733397719177661e-06, - "loss": 0.8662, - "step": 30526 - }, - { - "epoch": 0.78, - "learning_rate": 1.7333789085275198e-06, - "loss": 0.9736, - "step": 30527 - }, - { - "epoch": 0.78, - "learning_rate": 1.7333600973158637e-06, - "loss": 1.002, - "step": 30528 - }, - { - "epoch": 0.78, - "learning_rate": 1.7333412855427077e-06, - "loss": 0.8721, - "step": 30529 - }, - { - "epoch": 0.78, - "learning_rate": 1.7333224732080661e-06, - "loss": 0.7183, - "step": 30530 - }, - { - "epoch": 0.78, - "learning_rate": 1.7333036603119528e-06, - "loss": 1.3154, - "step": 30531 - }, - { - "epoch": 0.78, - "learning_rate": 1.733284846854383e-06, - "loss": 0.6633, - "step": 30532 - }, - { - "epoch": 0.78, - "learning_rate": 1.7332660328353708e-06, - "loss": 0.9033, - "step": 30533 - }, - { - "epoch": 0.78, - "learning_rate": 1.73324721825493e-06, - "loss": 0.7578, - "step": 30534 - }, - { - "epoch": 0.78, - "learning_rate": 1.733228403113076e-06, - "loss": 0.8159, - "step": 30535 - }, - { - "epoch": 0.78, - "learning_rate": 1.7332095874098224e-06, - "loss": 0.8262, - "step": 30536 - }, - { - "epoch": 0.78, - "learning_rate": 1.733190771145184e-06, - "loss": 0.7373, - "step": 30537 - }, - { - "epoch": 0.78, - "learning_rate": 1.7331719543191755e-06, - "loss": 0.875, - "step": 30538 - }, - { - "epoch": 0.78, - "learning_rate": 1.7331531369318104e-06, - "loss": 0.7832, - "step": 30539 - }, - { - "epoch": 0.78, - "learning_rate": 1.733134318983104e-06, - "loss": 1.0068, - "step": 30540 - }, - { - "epoch": 0.78, - "learning_rate": 1.73311550047307e-06, - "loss": 0.6387, - "step": 30541 - }, - { - "epoch": 0.78, - "learning_rate": 1.733096681401724e-06, - "loss": 0.4897, - "step": 30542 - }, - { - "epoch": 0.78, - "learning_rate": 1.7330778617690788e-06, - "loss": 0.9326, - "step": 30543 - }, - { - "epoch": 0.78, - "learning_rate": 1.7330590415751497e-06, - "loss": 0.7754, - "step": 30544 - }, - { - "epoch": 0.78, - "learning_rate": 1.7330402208199514e-06, - "loss": 0.7222, - "step": 30545 - }, - { - "epoch": 0.78, - "learning_rate": 1.7330213995034975e-06, - "loss": 0.5425, - "step": 30546 - }, - { - "epoch": 0.78, - "learning_rate": 1.733002577625803e-06, - "loss": 0.9404, - "step": 30547 - }, - { - "epoch": 0.78, - "learning_rate": 1.732983755186882e-06, - "loss": 0.8896, - "step": 30548 - }, - { - "epoch": 0.78, - "learning_rate": 1.732964932186749e-06, - "loss": 1.0615, - "step": 30549 - }, - { - "epoch": 0.78, - "learning_rate": 1.7329461086254188e-06, - "loss": 0.752, - "step": 30550 - }, - { - "epoch": 0.78, - "learning_rate": 1.7329272845029053e-06, - "loss": 0.9912, - "step": 30551 - }, - { - "epoch": 0.78, - "learning_rate": 1.7329084598192228e-06, - "loss": 0.915, - "step": 30552 - }, - { - "epoch": 0.78, - "learning_rate": 1.7328896345743864e-06, - "loss": 0.8042, - "step": 30553 - }, - { - "epoch": 0.78, - "learning_rate": 1.7328708087684096e-06, - "loss": 1.0801, - "step": 30554 - }, - { - "epoch": 0.78, - "learning_rate": 1.732851982401308e-06, - "loss": 0.9268, - "step": 30555 - }, - { - "epoch": 0.78, - "learning_rate": 1.7328331554730948e-06, - "loss": 0.7891, - "step": 30556 - }, - { - "epoch": 0.78, - "learning_rate": 1.7328143279837853e-06, - "loss": 0.958, - "step": 30557 - }, - { - "epoch": 0.78, - "learning_rate": 1.732795499933393e-06, - "loss": 0.8281, - "step": 30558 - }, - { - "epoch": 0.78, - "learning_rate": 1.7327766713219334e-06, - "loss": 0.9209, - "step": 30559 - }, - { - "epoch": 0.78, - "learning_rate": 1.7327578421494201e-06, - "loss": 0.8965, - "step": 30560 - }, - { - "epoch": 0.78, - "learning_rate": 1.7327390124158682e-06, - "loss": 0.8203, - "step": 30561 - }, - { - "epoch": 0.78, - "learning_rate": 1.7327201821212916e-06, - "loss": 0.8018, - "step": 30562 - }, - { - "epoch": 0.78, - "learning_rate": 1.7327013512657048e-06, - "loss": 1.082, - "step": 30563 - }, - { - "epoch": 0.78, - "learning_rate": 1.732682519849122e-06, - "loss": 0.6718, - "step": 30564 - }, - { - "epoch": 0.78, - "learning_rate": 1.7326636878715584e-06, - "loss": 0.5869, - "step": 30565 - }, - { - "epoch": 0.78, - "learning_rate": 1.7326448553330274e-06, - "loss": 0.8535, - "step": 30566 - }, - { - "epoch": 0.78, - "learning_rate": 1.732626022233544e-06, - "loss": 0.8374, - "step": 30567 - }, - { - "epoch": 0.78, - "learning_rate": 1.7326071885731228e-06, - "loss": 0.9932, - "step": 30568 - }, - { - "epoch": 0.78, - "learning_rate": 1.732588354351778e-06, - "loss": 0.7178, - "step": 30569 - }, - { - "epoch": 0.78, - "learning_rate": 1.7325695195695236e-06, - "loss": 0.6948, - "step": 30570 - }, - { - "epoch": 0.78, - "learning_rate": 1.7325506842263746e-06, - "loss": 0.8452, - "step": 30571 - }, - { - "epoch": 0.78, - "learning_rate": 1.7325318483223454e-06, - "loss": 0.8237, - "step": 30572 - }, - { - "epoch": 0.78, - "learning_rate": 1.73251301185745e-06, - "loss": 0.6733, - "step": 30573 - }, - { - "epoch": 0.78, - "learning_rate": 1.7324941748317033e-06, - "loss": 0.7646, - "step": 30574 - }, - { - "epoch": 0.78, - "learning_rate": 1.7324753372451192e-06, - "loss": 0.9355, - "step": 30575 - }, - { - "epoch": 0.78, - "learning_rate": 1.7324564990977127e-06, - "loss": 0.8018, - "step": 30576 - }, - { - "epoch": 0.78, - "learning_rate": 1.7324376603894977e-06, - "loss": 0.8105, - "step": 30577 - }, - { - "epoch": 0.78, - "learning_rate": 1.7324188211204889e-06, - "loss": 0.8164, - "step": 30578 - }, - { - "epoch": 0.78, - "learning_rate": 1.7323999812907006e-06, - "loss": 0.8276, - "step": 30579 - }, - { - "epoch": 0.78, - "learning_rate": 1.7323811409001475e-06, - "loss": 0.9834, - "step": 30580 - }, - { - "epoch": 0.78, - "learning_rate": 1.732362299948844e-06, - "loss": 0.9404, - "step": 30581 - }, - { - "epoch": 0.78, - "learning_rate": 1.732343458436804e-06, - "loss": 0.8856, - "step": 30582 - }, - { - "epoch": 0.78, - "learning_rate": 1.7323246163640425e-06, - "loss": 0.9883, - "step": 30583 - }, - { - "epoch": 0.78, - "learning_rate": 1.7323057737305737e-06, - "loss": 0.8076, - "step": 30584 - }, - { - "epoch": 0.78, - "learning_rate": 1.7322869305364121e-06, - "loss": 1.0283, - "step": 30585 - }, - { - "epoch": 0.78, - "learning_rate": 1.7322680867815719e-06, - "loss": 0.8428, - "step": 30586 - }, - { - "epoch": 0.78, - "learning_rate": 1.732249242466068e-06, - "loss": 0.7949, - "step": 30587 - }, - { - "epoch": 0.78, - "learning_rate": 1.7322303975899141e-06, - "loss": 0.7578, - "step": 30588 - }, - { - "epoch": 0.78, - "learning_rate": 1.7322115521531252e-06, - "loss": 0.958, - "step": 30589 - }, - { - "epoch": 0.78, - "learning_rate": 1.7321927061557155e-06, - "loss": 0.689, - "step": 30590 - }, - { - "epoch": 0.78, - "learning_rate": 1.7321738595977e-06, - "loss": 0.7959, - "step": 30591 - }, - { - "epoch": 0.78, - "learning_rate": 1.732155012479092e-06, - "loss": 0.686, - "step": 30592 - }, - { - "epoch": 0.78, - "learning_rate": 1.732136164799907e-06, - "loss": 0.8398, - "step": 30593 - }, - { - "epoch": 0.78, - "learning_rate": 1.7321173165601588e-06, - "loss": 1.126, - "step": 30594 - }, - { - "epoch": 0.78, - "learning_rate": 1.732098467759862e-06, - "loss": 0.5806, - "step": 30595 - }, - { - "epoch": 0.78, - "learning_rate": 1.7320796183990312e-06, - "loss": 0.9243, - "step": 30596 - }, - { - "epoch": 0.78, - "learning_rate": 1.7320607684776807e-06, - "loss": 0.7998, - "step": 30597 - }, - { - "epoch": 0.78, - "learning_rate": 1.7320419179958247e-06, - "loss": 0.7847, - "step": 30598 - }, - { - "epoch": 0.78, - "learning_rate": 1.732023066953478e-06, - "loss": 0.7148, - "step": 30599 - }, - { - "epoch": 0.78, - "learning_rate": 1.7320042153506554e-06, - "loss": 0.9365, - "step": 30600 - }, - { - "epoch": 0.78, - "learning_rate": 1.7319853631873703e-06, - "loss": 0.7783, - "step": 30601 - }, - { - "epoch": 0.78, - "learning_rate": 1.7319665104636378e-06, - "loss": 1.0088, - "step": 30602 - }, - { - "epoch": 0.78, - "learning_rate": 1.731947657179472e-06, - "loss": 0.8848, - "step": 30603 - }, - { - "epoch": 0.78, - "learning_rate": 1.7319288033348877e-06, - "loss": 0.8232, - "step": 30604 - }, - { - "epoch": 0.78, - "learning_rate": 1.7319099489298992e-06, - "loss": 0.7803, - "step": 30605 - }, - { - "epoch": 0.78, - "learning_rate": 1.7318910939645207e-06, - "loss": 0.8047, - "step": 30606 - }, - { - "epoch": 0.78, - "learning_rate": 1.7318722384387673e-06, - "loss": 0.8945, - "step": 30607 - }, - { - "epoch": 0.78, - "learning_rate": 1.7318533823526524e-06, - "loss": 0.7021, - "step": 30608 - }, - { - "epoch": 0.78, - "learning_rate": 1.7318345257061916e-06, - "loss": 0.7354, - "step": 30609 - }, - { - "epoch": 0.78, - "learning_rate": 1.7318156684993983e-06, - "loss": 1.1035, - "step": 30610 - }, - { - "epoch": 0.78, - "learning_rate": 1.7317968107322875e-06, - "loss": 0.9072, - "step": 30611 - }, - { - "epoch": 0.78, - "learning_rate": 1.7317779524048736e-06, - "loss": 1.0566, - "step": 30612 - }, - { - "epoch": 0.78, - "learning_rate": 1.7317590935171708e-06, - "loss": 0.707, - "step": 30613 - }, - { - "epoch": 0.78, - "learning_rate": 1.731740234069194e-06, - "loss": 0.9629, - "step": 30614 - }, - { - "epoch": 0.78, - "learning_rate": 1.731721374060957e-06, - "loss": 1.0205, - "step": 30615 - }, - { - "epoch": 0.78, - "learning_rate": 1.7317025134924749e-06, - "loss": 0.8296, - "step": 30616 - }, - { - "epoch": 0.78, - "learning_rate": 1.7316836523637618e-06, - "loss": 0.8252, - "step": 30617 - }, - { - "epoch": 0.78, - "learning_rate": 1.731664790674832e-06, - "loss": 0.9951, - "step": 30618 - }, - { - "epoch": 0.78, - "learning_rate": 1.7316459284257001e-06, - "loss": 0.874, - "step": 30619 - }, - { - "epoch": 0.78, - "learning_rate": 1.7316270656163807e-06, - "loss": 0.6406, - "step": 30620 - }, - { - "epoch": 0.78, - "learning_rate": 1.731608202246888e-06, - "loss": 0.8818, - "step": 30621 - }, - { - "epoch": 0.78, - "learning_rate": 1.7315893383172369e-06, - "loss": 0.9746, - "step": 30622 - }, - { - "epoch": 0.78, - "learning_rate": 1.731570473827441e-06, - "loss": 0.7412, - "step": 30623 - }, - { - "epoch": 0.78, - "learning_rate": 1.7315516087775156e-06, - "loss": 1.0381, - "step": 30624 - }, - { - "epoch": 0.78, - "learning_rate": 1.7315327431674744e-06, - "loss": 0.6729, - "step": 30625 - }, - { - "epoch": 0.78, - "learning_rate": 1.7315138769973326e-06, - "loss": 1.002, - "step": 30626 - }, - { - "epoch": 0.78, - "learning_rate": 1.7314950102671038e-06, - "loss": 1.1914, - "step": 30627 - }, - { - "epoch": 0.79, - "learning_rate": 1.7314761429768032e-06, - "loss": 0.8379, - "step": 30628 - }, - { - "epoch": 0.79, - "learning_rate": 1.7314572751264448e-06, - "loss": 0.8652, - "step": 30629 - }, - { - "epoch": 0.79, - "learning_rate": 1.7314384067160434e-06, - "loss": 0.8247, - "step": 30630 - }, - { - "epoch": 0.79, - "learning_rate": 1.7314195377456131e-06, - "loss": 0.6304, - "step": 30631 - }, - { - "epoch": 0.79, - "learning_rate": 1.7314006682151688e-06, - "loss": 0.8838, - "step": 30632 - }, - { - "epoch": 0.79, - "learning_rate": 1.7313817981247242e-06, - "loss": 0.7842, - "step": 30633 - }, - { - "epoch": 0.79, - "learning_rate": 1.7313629274742946e-06, - "loss": 0.8135, - "step": 30634 - }, - { - "epoch": 0.79, - "learning_rate": 1.7313440562638935e-06, - "loss": 0.8188, - "step": 30635 - }, - { - "epoch": 0.79, - "learning_rate": 1.7313251844935364e-06, - "loss": 0.6675, - "step": 30636 - }, - { - "epoch": 0.79, - "learning_rate": 1.7313063121632369e-06, - "loss": 0.7959, - "step": 30637 - }, - { - "epoch": 0.79, - "learning_rate": 1.7312874392730099e-06, - "loss": 0.6084, - "step": 30638 - }, - { - "epoch": 0.79, - "learning_rate": 1.7312685658228697e-06, - "loss": 0.7371, - "step": 30639 - }, - { - "epoch": 0.79, - "learning_rate": 1.7312496918128308e-06, - "loss": 0.8535, - "step": 30640 - }, - { - "epoch": 0.79, - "learning_rate": 1.7312308172429076e-06, - "loss": 0.7988, - "step": 30641 - }, - { - "epoch": 0.79, - "learning_rate": 1.7312119421131146e-06, - "loss": 0.7402, - "step": 30642 - }, - { - "epoch": 0.79, - "learning_rate": 1.7311930664234664e-06, - "loss": 0.9268, - "step": 30643 - }, - { - "epoch": 0.79, - "learning_rate": 1.7311741901739772e-06, - "loss": 0.8018, - "step": 30644 - }, - { - "epoch": 0.79, - "learning_rate": 1.7311553133646615e-06, - "loss": 0.8467, - "step": 30645 - }, - { - "epoch": 0.79, - "learning_rate": 1.7311364359955337e-06, - "loss": 0.7932, - "step": 30646 - }, - { - "epoch": 0.79, - "learning_rate": 1.7311175580666085e-06, - "loss": 0.8853, - "step": 30647 - }, - { - "epoch": 0.79, - "learning_rate": 1.7310986795779003e-06, - "loss": 0.8682, - "step": 30648 - }, - { - "epoch": 0.79, - "learning_rate": 1.7310798005294234e-06, - "loss": 0.7578, - "step": 30649 - }, - { - "epoch": 0.79, - "learning_rate": 1.7310609209211919e-06, - "loss": 0.9893, - "step": 30650 - }, - { - "epoch": 0.79, - "learning_rate": 1.7310420407532211e-06, - "loss": 1.0547, - "step": 30651 - }, - { - "epoch": 0.79, - "learning_rate": 1.731023160025525e-06, - "loss": 0.9307, - "step": 30652 - }, - { - "epoch": 0.79, - "learning_rate": 1.7310042787381182e-06, - "loss": 0.8369, - "step": 30653 - }, - { - "epoch": 0.79, - "learning_rate": 1.7309853968910147e-06, - "loss": 0.9434, - "step": 30654 - }, - { - "epoch": 0.79, - "learning_rate": 1.7309665144842294e-06, - "loss": 0.8984, - "step": 30655 - }, - { - "epoch": 0.79, - "learning_rate": 1.7309476315177767e-06, - "loss": 0.9951, - "step": 30656 - }, - { - "epoch": 0.79, - "learning_rate": 1.7309287479916708e-06, - "loss": 0.6865, - "step": 30657 - }, - { - "epoch": 0.79, - "learning_rate": 1.7309098639059268e-06, - "loss": 0.8862, - "step": 30658 - }, - { - "epoch": 0.79, - "learning_rate": 1.7308909792605584e-06, - "loss": 0.9023, - "step": 30659 - }, - { - "epoch": 0.79, - "learning_rate": 1.7308720940555804e-06, - "loss": 0.5674, - "step": 30660 - }, - { - "epoch": 0.79, - "learning_rate": 1.7308532082910072e-06, - "loss": 0.9004, - "step": 30661 - }, - { - "epoch": 0.79, - "learning_rate": 1.7308343219668535e-06, - "loss": 0.9258, - "step": 30662 - }, - { - "epoch": 0.79, - "learning_rate": 1.7308154350831337e-06, - "loss": 0.7988, - "step": 30663 - }, - { - "epoch": 0.79, - "learning_rate": 1.730796547639862e-06, - "loss": 0.9365, - "step": 30664 - }, - { - "epoch": 0.79, - "learning_rate": 1.7307776596370526e-06, - "loss": 0.9473, - "step": 30665 - }, - { - "epoch": 0.79, - "learning_rate": 1.7307587710747207e-06, - "loss": 1.0078, - "step": 30666 - }, - { - "epoch": 0.79, - "learning_rate": 1.7307398819528802e-06, - "loss": 0.9219, - "step": 30667 - }, - { - "epoch": 0.79, - "learning_rate": 1.730720992271546e-06, - "loss": 0.7881, - "step": 30668 - }, - { - "epoch": 0.79, - "learning_rate": 1.7307021020307325e-06, - "loss": 0.8232, - "step": 30669 - }, - { - "epoch": 0.79, - "learning_rate": 1.7306832112304535e-06, - "loss": 0.9795, - "step": 30670 - }, - { - "epoch": 0.79, - "learning_rate": 1.7306643198707243e-06, - "loss": 0.7393, - "step": 30671 - }, - { - "epoch": 0.79, - "learning_rate": 1.730645427951559e-06, - "loss": 0.9336, - "step": 30672 - }, - { - "epoch": 0.79, - "learning_rate": 1.7306265354729722e-06, - "loss": 0.5161, - "step": 30673 - }, - { - "epoch": 0.79, - "learning_rate": 1.730607642434978e-06, - "loss": 0.7217, - "step": 30674 - }, - { - "epoch": 0.79, - "learning_rate": 1.730588748837591e-06, - "loss": 0.998, - "step": 30675 - }, - { - "epoch": 0.79, - "learning_rate": 1.7305698546808261e-06, - "loss": 1.0957, - "step": 30676 - }, - { - "epoch": 0.79, - "learning_rate": 1.7305509599646976e-06, - "loss": 0.9785, - "step": 30677 - }, - { - "epoch": 0.79, - "learning_rate": 1.7305320646892193e-06, - "loss": 0.8037, - "step": 30678 - }, - { - "epoch": 0.79, - "learning_rate": 1.7305131688544065e-06, - "loss": 0.8936, - "step": 30679 - }, - { - "epoch": 0.79, - "learning_rate": 1.7304942724602734e-06, - "loss": 0.9551, - "step": 30680 - }, - { - "epoch": 0.79, - "learning_rate": 1.7304753755068342e-06, - "loss": 0.8755, - "step": 30681 - }, - { - "epoch": 0.79, - "learning_rate": 1.7304564779941039e-06, - "loss": 0.8535, - "step": 30682 - }, - { - "epoch": 0.79, - "learning_rate": 1.7304375799220962e-06, - "loss": 0.9248, - "step": 30683 - }, - { - "epoch": 0.79, - "learning_rate": 1.7304186812908265e-06, - "loss": 0.915, - "step": 30684 - }, - { - "epoch": 0.79, - "learning_rate": 1.7303997821003086e-06, - "loss": 0.9404, - "step": 30685 - }, - { - "epoch": 0.79, - "learning_rate": 1.7303808823505572e-06, - "loss": 0.8135, - "step": 30686 - }, - { - "epoch": 0.79, - "learning_rate": 1.730361982041587e-06, - "loss": 0.8438, - "step": 30687 - }, - { - "epoch": 0.79, - "learning_rate": 1.7303430811734119e-06, - "loss": 0.6401, - "step": 30688 - }, - { - "epoch": 0.79, - "learning_rate": 1.7303241797460468e-06, - "loss": 0.9736, - "step": 30689 - }, - { - "epoch": 0.79, - "learning_rate": 1.730305277759506e-06, - "loss": 0.7427, - "step": 30690 - }, - { - "epoch": 0.79, - "learning_rate": 1.730286375213804e-06, - "loss": 0.6758, - "step": 30691 - }, - { - "epoch": 0.79, - "learning_rate": 1.7302674721089555e-06, - "loss": 0.8867, - "step": 30692 - }, - { - "epoch": 0.79, - "learning_rate": 1.7302485684449745e-06, - "loss": 0.8105, - "step": 30693 - }, - { - "epoch": 0.79, - "learning_rate": 1.7302296642218758e-06, - "loss": 0.959, - "step": 30694 - }, - { - "epoch": 0.79, - "learning_rate": 1.7302107594396738e-06, - "loss": 1.0459, - "step": 30695 - }, - { - "epoch": 0.79, - "learning_rate": 1.7301918540983832e-06, - "loss": 0.7739, - "step": 30696 - }, - { - "epoch": 0.79, - "learning_rate": 1.7301729481980182e-06, - "loss": 0.8809, - "step": 30697 - }, - { - "epoch": 0.79, - "learning_rate": 1.730154041738593e-06, - "loss": 0.7354, - "step": 30698 - }, - { - "epoch": 0.79, - "learning_rate": 1.7301351347201232e-06, - "loss": 0.8906, - "step": 30699 - }, - { - "epoch": 0.79, - "learning_rate": 1.7301162271426218e-06, - "loss": 0.7607, - "step": 30700 - }, - { - "epoch": 0.79, - "learning_rate": 1.7300973190061044e-06, - "loss": 0.7153, - "step": 30701 - }, - { - "epoch": 0.79, - "learning_rate": 1.7300784103105847e-06, - "loss": 0.9541, - "step": 30702 - }, - { - "epoch": 0.79, - "learning_rate": 1.7300595010560777e-06, - "loss": 0.8428, - "step": 30703 - }, - { - "epoch": 0.79, - "learning_rate": 1.7300405912425978e-06, - "loss": 0.8223, - "step": 30704 - }, - { - "epoch": 0.79, - "learning_rate": 1.730021680870159e-06, - "loss": 0.9473, - "step": 30705 - }, - { - "epoch": 0.79, - "learning_rate": 1.7300027699387765e-06, - "loss": 0.8545, - "step": 30706 - }, - { - "epoch": 0.79, - "learning_rate": 1.7299838584484644e-06, - "loss": 0.7676, - "step": 30707 - }, - { - "epoch": 0.79, - "learning_rate": 1.7299649463992374e-06, - "loss": 1.1797, - "step": 30708 - }, - { - "epoch": 0.79, - "learning_rate": 1.7299460337911097e-06, - "loss": 0.7607, - "step": 30709 - }, - { - "epoch": 0.79, - "learning_rate": 1.7299271206240954e-06, - "loss": 0.7832, - "step": 30710 - }, - { - "epoch": 0.79, - "learning_rate": 1.7299082068982101e-06, - "loss": 0.8047, - "step": 30711 - }, - { - "epoch": 0.79, - "learning_rate": 1.7298892926134677e-06, - "loss": 0.7607, - "step": 30712 - }, - { - "epoch": 0.79, - "learning_rate": 1.729870377769882e-06, - "loss": 0.9463, - "step": 30713 - }, - { - "epoch": 0.79, - "learning_rate": 1.7298514623674688e-06, - "loss": 0.8525, - "step": 30714 - }, - { - "epoch": 0.79, - "learning_rate": 1.7298325464062415e-06, - "loss": 0.9541, - "step": 30715 - }, - { - "epoch": 0.79, - "learning_rate": 1.729813629886215e-06, - "loss": 0.8672, - "step": 30716 - }, - { - "epoch": 0.79, - "learning_rate": 1.7297947128074037e-06, - "loss": 1.0127, - "step": 30717 - }, - { - "epoch": 0.79, - "learning_rate": 1.7297757951698224e-06, - "loss": 0.8555, - "step": 30718 - }, - { - "epoch": 0.79, - "learning_rate": 1.729756876973485e-06, - "loss": 0.8232, - "step": 30719 - }, - { - "epoch": 0.79, - "learning_rate": 1.7297379582184066e-06, - "loss": 0.9443, - "step": 30720 - }, - { - "epoch": 0.79, - "learning_rate": 1.7297190389046013e-06, - "loss": 0.8086, - "step": 30721 - }, - { - "epoch": 0.79, - "learning_rate": 1.7297001190320837e-06, - "loss": 0.6499, - "step": 30722 - }, - { - "epoch": 0.79, - "learning_rate": 1.7296811986008681e-06, - "loss": 0.7642, - "step": 30723 - }, - { - "epoch": 0.79, - "learning_rate": 1.7296622776109695e-06, - "loss": 0.8613, - "step": 30724 - }, - { - "epoch": 0.79, - "learning_rate": 1.7296433560624018e-06, - "loss": 0.7678, - "step": 30725 - }, - { - "epoch": 0.79, - "learning_rate": 1.7296244339551797e-06, - "loss": 0.6841, - "step": 30726 - }, - { - "epoch": 0.79, - "learning_rate": 1.7296055112893178e-06, - "loss": 0.835, - "step": 30727 - }, - { - "epoch": 0.79, - "learning_rate": 1.7295865880648304e-06, - "loss": 0.9883, - "step": 30728 - }, - { - "epoch": 0.79, - "learning_rate": 1.7295676642817324e-06, - "loss": 0.917, - "step": 30729 - }, - { - "epoch": 0.79, - "learning_rate": 1.7295487399400376e-06, - "loss": 1.0215, - "step": 30730 - }, - { - "epoch": 0.79, - "learning_rate": 1.7295298150397612e-06, - "loss": 0.5799, - "step": 30731 - }, - { - "epoch": 0.79, - "learning_rate": 1.7295108895809171e-06, - "loss": 0.9072, - "step": 30732 - }, - { - "epoch": 0.79, - "learning_rate": 1.7294919635635203e-06, - "loss": 0.9473, - "step": 30733 - }, - { - "epoch": 0.79, - "learning_rate": 1.7294730369875849e-06, - "loss": 0.9014, - "step": 30734 - }, - { - "epoch": 0.79, - "learning_rate": 1.7294541098531256e-06, - "loss": 0.7461, - "step": 30735 - }, - { - "epoch": 0.79, - "learning_rate": 1.7294351821601566e-06, - "loss": 0.6836, - "step": 30736 - }, - { - "epoch": 0.79, - "learning_rate": 1.7294162539086932e-06, - "loss": 0.6914, - "step": 30737 - }, - { - "epoch": 0.79, - "learning_rate": 1.7293973250987488e-06, - "loss": 0.9395, - "step": 30738 - }, - { - "epoch": 0.79, - "learning_rate": 1.7293783957303387e-06, - "loss": 0.6709, - "step": 30739 - }, - { - "epoch": 0.79, - "learning_rate": 1.7293594658034768e-06, - "loss": 0.7412, - "step": 30740 - }, - { - "epoch": 0.79, - "learning_rate": 1.729340535318178e-06, - "loss": 1.0283, - "step": 30741 - }, - { - "epoch": 0.79, - "learning_rate": 1.7293216042744568e-06, - "loss": 1.0615, - "step": 30742 - }, - { - "epoch": 0.79, - "learning_rate": 1.7293026726723276e-06, - "loss": 1.0049, - "step": 30743 - }, - { - "epoch": 0.79, - "learning_rate": 1.7292837405118048e-06, - "loss": 0.8662, - "step": 30744 - }, - { - "epoch": 0.79, - "learning_rate": 1.729264807792903e-06, - "loss": 0.8394, - "step": 30745 - }, - { - "epoch": 0.79, - "learning_rate": 1.7292458745156365e-06, - "loss": 0.8701, - "step": 30746 - }, - { - "epoch": 0.79, - "learning_rate": 1.72922694068002e-06, - "loss": 0.8379, - "step": 30747 - }, - { - "epoch": 0.79, - "learning_rate": 1.7292080062860681e-06, - "loss": 0.8882, - "step": 30748 - }, - { - "epoch": 0.79, - "learning_rate": 1.729189071333795e-06, - "loss": 0.6709, - "step": 30749 - }, - { - "epoch": 0.79, - "learning_rate": 1.7291701358232155e-06, - "loss": 0.9414, - "step": 30750 - }, - { - "epoch": 0.79, - "learning_rate": 1.729151199754344e-06, - "loss": 0.9365, - "step": 30751 - }, - { - "epoch": 0.79, - "learning_rate": 1.729132263127195e-06, - "loss": 0.6064, - "step": 30752 - }, - { - "epoch": 0.79, - "learning_rate": 1.7291133259417827e-06, - "loss": 0.8164, - "step": 30753 - }, - { - "epoch": 0.79, - "learning_rate": 1.7290943881981221e-06, - "loss": 0.7495, - "step": 30754 - }, - { - "epoch": 0.79, - "learning_rate": 1.7290754498962272e-06, - "loss": 1.1338, - "step": 30755 - }, - { - "epoch": 0.79, - "learning_rate": 1.7290565110361128e-06, - "loss": 0.9697, - "step": 30756 - }, - { - "epoch": 0.79, - "learning_rate": 1.7290375716177938e-06, - "loss": 0.9658, - "step": 30757 - }, - { - "epoch": 0.79, - "learning_rate": 1.7290186316412838e-06, - "loss": 0.917, - "step": 30758 - }, - { - "epoch": 0.79, - "learning_rate": 1.7289996911065977e-06, - "loss": 0.7979, - "step": 30759 - }, - { - "epoch": 0.79, - "learning_rate": 1.7289807500137502e-06, - "loss": 1.0078, - "step": 30760 - }, - { - "epoch": 0.79, - "learning_rate": 1.7289618083627557e-06, - "loss": 0.7764, - "step": 30761 - }, - { - "epoch": 0.79, - "learning_rate": 1.7289428661536286e-06, - "loss": 0.7451, - "step": 30762 - }, - { - "epoch": 0.79, - "learning_rate": 1.7289239233863838e-06, - "loss": 0.7949, - "step": 30763 - }, - { - "epoch": 0.79, - "learning_rate": 1.728904980061035e-06, - "loss": 0.8408, - "step": 30764 - }, - { - "epoch": 0.79, - "learning_rate": 1.7288860361775974e-06, - "loss": 0.9346, - "step": 30765 - }, - { - "epoch": 0.79, - "learning_rate": 1.728867091736085e-06, - "loss": 0.7803, - "step": 30766 - }, - { - "epoch": 0.79, - "learning_rate": 1.728848146736513e-06, - "loss": 0.8271, - "step": 30767 - }, - { - "epoch": 0.79, - "learning_rate": 1.7288292011788955e-06, - "loss": 0.9258, - "step": 30768 - }, - { - "epoch": 0.79, - "learning_rate": 1.7288102550632466e-06, - "loss": 0.7881, - "step": 30769 - }, - { - "epoch": 0.79, - "learning_rate": 1.728791308389581e-06, - "loss": 0.8535, - "step": 30770 - }, - { - "epoch": 0.79, - "learning_rate": 1.7287723611579141e-06, - "loss": 0.9434, - "step": 30771 - }, - { - "epoch": 0.79, - "learning_rate": 1.7287534133682594e-06, - "loss": 1.1094, - "step": 30772 - }, - { - "epoch": 0.79, - "learning_rate": 1.7287344650206317e-06, - "loss": 0.8115, - "step": 30773 - }, - { - "epoch": 0.79, - "learning_rate": 1.7287155161150455e-06, - "loss": 0.9668, - "step": 30774 - }, - { - "epoch": 0.79, - "learning_rate": 1.7286965666515154e-06, - "loss": 0.7739, - "step": 30775 - }, - { - "epoch": 0.79, - "learning_rate": 1.7286776166300557e-06, - "loss": 0.7461, - "step": 30776 - }, - { - "epoch": 0.79, - "learning_rate": 1.7286586660506814e-06, - "loss": 0.8396, - "step": 30777 - }, - { - "epoch": 0.79, - "learning_rate": 1.7286397149134064e-06, - "loss": 1.3643, - "step": 30778 - }, - { - "epoch": 0.79, - "learning_rate": 1.7286207632182455e-06, - "loss": 0.3237, - "step": 30779 - }, - { - "epoch": 0.79, - "learning_rate": 1.7286018109652132e-06, - "loss": 0.8613, - "step": 30780 - }, - { - "epoch": 0.79, - "learning_rate": 1.7285828581543238e-06, - "loss": 0.9844, - "step": 30781 - }, - { - "epoch": 0.79, - "learning_rate": 1.7285639047855923e-06, - "loss": 0.9209, - "step": 30782 - }, - { - "epoch": 0.79, - "learning_rate": 1.7285449508590331e-06, - "loss": 0.6904, - "step": 30783 - }, - { - "epoch": 0.79, - "learning_rate": 1.7285259963746602e-06, - "loss": 0.7217, - "step": 30784 - }, - { - "epoch": 0.79, - "learning_rate": 1.7285070413324885e-06, - "loss": 0.8623, - "step": 30785 - }, - { - "epoch": 0.79, - "learning_rate": 1.7284880857325324e-06, - "loss": 0.7988, - "step": 30786 - }, - { - "epoch": 0.79, - "learning_rate": 1.7284691295748065e-06, - "loss": 0.7505, - "step": 30787 - }, - { - "epoch": 0.79, - "learning_rate": 1.7284501728593252e-06, - "loss": 0.9697, - "step": 30788 - }, - { - "epoch": 0.79, - "learning_rate": 1.7284312155861033e-06, - "loss": 0.5938, - "step": 30789 - }, - { - "epoch": 0.79, - "learning_rate": 1.728412257755155e-06, - "loss": 0.9629, - "step": 30790 - }, - { - "epoch": 0.79, - "learning_rate": 1.7283932993664948e-06, - "loss": 0.7476, - "step": 30791 - }, - { - "epoch": 0.79, - "learning_rate": 1.7283743404201374e-06, - "loss": 0.833, - "step": 30792 - }, - { - "epoch": 0.79, - "learning_rate": 1.7283553809160974e-06, - "loss": 0.7886, - "step": 30793 - }, - { - "epoch": 0.79, - "learning_rate": 1.7283364208543892e-06, - "loss": 0.7654, - "step": 30794 - }, - { - "epoch": 0.79, - "learning_rate": 1.7283174602350271e-06, - "loss": 0.8564, - "step": 30795 - }, - { - "epoch": 0.79, - "learning_rate": 1.728298499058026e-06, - "loss": 0.8252, - "step": 30796 - }, - { - "epoch": 0.79, - "learning_rate": 1.7282795373234002e-06, - "loss": 0.7617, - "step": 30797 - }, - { - "epoch": 0.79, - "learning_rate": 1.728260575031164e-06, - "loss": 1.0146, - "step": 30798 - }, - { - "epoch": 0.79, - "learning_rate": 1.7282416121813326e-06, - "loss": 0.7578, - "step": 30799 - }, - { - "epoch": 0.79, - "learning_rate": 1.72822264877392e-06, - "loss": 0.7676, - "step": 30800 - }, - { - "epoch": 0.79, - "learning_rate": 1.7282036848089404e-06, - "loss": 0.8965, - "step": 30801 - }, - { - "epoch": 0.79, - "learning_rate": 1.728184720286409e-06, - "loss": 0.9629, - "step": 30802 - }, - { - "epoch": 0.79, - "learning_rate": 1.72816575520634e-06, - "loss": 0.667, - "step": 30803 - }, - { - "epoch": 0.79, - "learning_rate": 1.7281467895687481e-06, - "loss": 0.9229, - "step": 30804 - }, - { - "epoch": 0.79, - "learning_rate": 1.7281278233736477e-06, - "loss": 0.9121, - "step": 30805 - }, - { - "epoch": 0.79, - "learning_rate": 1.7281088566210528e-06, - "loss": 0.7524, - "step": 30806 - }, - { - "epoch": 0.79, - "learning_rate": 1.728089889310979e-06, - "loss": 0.8926, - "step": 30807 - }, - { - "epoch": 0.79, - "learning_rate": 1.7280709214434398e-06, - "loss": 0.7563, - "step": 30808 - }, - { - "epoch": 0.79, - "learning_rate": 1.7280519530184506e-06, - "loss": 0.8652, - "step": 30809 - }, - { - "epoch": 0.79, - "learning_rate": 1.7280329840360252e-06, - "loss": 1.0264, - "step": 30810 - }, - { - "epoch": 0.79, - "learning_rate": 1.7280140144961788e-06, - "loss": 0.9258, - "step": 30811 - }, - { - "epoch": 0.79, - "learning_rate": 1.7279950443989252e-06, - "loss": 0.9375, - "step": 30812 - }, - { - "epoch": 0.79, - "learning_rate": 1.7279760737442795e-06, - "loss": 0.9346, - "step": 30813 - }, - { - "epoch": 0.79, - "learning_rate": 1.7279571025322554e-06, - "loss": 0.9365, - "step": 30814 - }, - { - "epoch": 0.79, - "learning_rate": 1.7279381307628686e-06, - "loss": 0.7412, - "step": 30815 - }, - { - "epoch": 0.79, - "learning_rate": 1.727919158436133e-06, - "loss": 0.8342, - "step": 30816 - }, - { - "epoch": 0.79, - "learning_rate": 1.727900185552063e-06, - "loss": 0.9189, - "step": 30817 - }, - { - "epoch": 0.79, - "learning_rate": 1.7278812121106734e-06, - "loss": 0.7227, - "step": 30818 - }, - { - "epoch": 0.79, - "learning_rate": 1.7278622381119784e-06, - "loss": 0.7285, - "step": 30819 - }, - { - "epoch": 0.79, - "learning_rate": 1.727843263555993e-06, - "loss": 1.1104, - "step": 30820 - }, - { - "epoch": 0.79, - "learning_rate": 1.7278242884427316e-06, - "loss": 0.8984, - "step": 30821 - }, - { - "epoch": 0.79, - "learning_rate": 1.7278053127722086e-06, - "loss": 0.8809, - "step": 30822 - }, - { - "epoch": 0.79, - "learning_rate": 1.727786336544438e-06, - "loss": 0.7734, - "step": 30823 - }, - { - "epoch": 0.79, - "learning_rate": 1.7277673597594356e-06, - "loss": 0.7505, - "step": 30824 - }, - { - "epoch": 0.79, - "learning_rate": 1.7277483824172147e-06, - "loss": 0.8125, - "step": 30825 - }, - { - "epoch": 0.79, - "learning_rate": 1.7277294045177903e-06, - "loss": 0.8115, - "step": 30826 - }, - { - "epoch": 0.79, - "learning_rate": 1.7277104260611773e-06, - "loss": 0.8604, - "step": 30827 - }, - { - "epoch": 0.79, - "learning_rate": 1.7276914470473898e-06, - "loss": 0.6641, - "step": 30828 - }, - { - "epoch": 0.79, - "learning_rate": 1.7276724674764422e-06, - "loss": 1.0703, - "step": 30829 - }, - { - "epoch": 0.79, - "learning_rate": 1.7276534873483492e-06, - "loss": 0.6675, - "step": 30830 - }, - { - "epoch": 0.79, - "learning_rate": 1.7276345066631258e-06, - "loss": 0.8984, - "step": 30831 - }, - { - "epoch": 0.79, - "learning_rate": 1.7276155254207857e-06, - "loss": 0.998, - "step": 30832 - }, - { - "epoch": 0.79, - "learning_rate": 1.727596543621344e-06, - "loss": 1.1318, - "step": 30833 - }, - { - "epoch": 0.79, - "learning_rate": 1.7275775612648151e-06, - "loss": 0.7549, - "step": 30834 - }, - { - "epoch": 0.79, - "learning_rate": 1.7275585783512136e-06, - "loss": 0.8301, - "step": 30835 - }, - { - "epoch": 0.79, - "learning_rate": 1.7275395948805539e-06, - "loss": 0.8984, - "step": 30836 - }, - { - "epoch": 0.79, - "learning_rate": 1.7275206108528506e-06, - "loss": 0.915, - "step": 30837 - }, - { - "epoch": 0.79, - "learning_rate": 1.727501626268118e-06, - "loss": 0.8535, - "step": 30838 - }, - { - "epoch": 0.79, - "learning_rate": 1.7274826411263712e-06, - "loss": 0.6948, - "step": 30839 - }, - { - "epoch": 0.79, - "learning_rate": 1.7274636554276243e-06, - "loss": 0.9629, - "step": 30840 - }, - { - "epoch": 0.79, - "learning_rate": 1.727444669171892e-06, - "loss": 0.8662, - "step": 30841 - }, - { - "epoch": 0.79, - "learning_rate": 1.7274256823591883e-06, - "loss": 0.5795, - "step": 30842 - }, - { - "epoch": 0.79, - "learning_rate": 1.7274066949895288e-06, - "loss": 0.7158, - "step": 30843 - }, - { - "epoch": 0.79, - "learning_rate": 1.727387707062927e-06, - "loss": 0.8926, - "step": 30844 - }, - { - "epoch": 0.79, - "learning_rate": 1.7273687185793978e-06, - "loss": 0.9131, - "step": 30845 - }, - { - "epoch": 0.79, - "learning_rate": 1.7273497295389563e-06, - "loss": 0.9062, - "step": 30846 - }, - { - "epoch": 0.79, - "learning_rate": 1.7273307399416162e-06, - "loss": 0.9111, - "step": 30847 - }, - { - "epoch": 0.79, - "learning_rate": 1.7273117497873926e-06, - "loss": 0.917, - "step": 30848 - }, - { - "epoch": 0.79, - "learning_rate": 1.7272927590762997e-06, - "loss": 0.8555, - "step": 30849 - }, - { - "epoch": 0.79, - "learning_rate": 1.7272737678083521e-06, - "loss": 0.6226, - "step": 30850 - }, - { - "epoch": 0.79, - "learning_rate": 1.7272547759835646e-06, - "loss": 0.8052, - "step": 30851 - }, - { - "epoch": 0.79, - "learning_rate": 1.7272357836019516e-06, - "loss": 0.8379, - "step": 30852 - }, - { - "epoch": 0.79, - "learning_rate": 1.7272167906635276e-06, - "loss": 0.8438, - "step": 30853 - }, - { - "epoch": 0.79, - "learning_rate": 1.7271977971683073e-06, - "loss": 1.0205, - "step": 30854 - }, - { - "epoch": 0.79, - "learning_rate": 1.7271788031163044e-06, - "loss": 0.9951, - "step": 30855 - }, - { - "epoch": 0.79, - "learning_rate": 1.7271598085075348e-06, - "loss": 0.6318, - "step": 30856 - }, - { - "epoch": 0.79, - "learning_rate": 1.727140813342012e-06, - "loss": 0.5947, - "step": 30857 - }, - { - "epoch": 0.79, - "learning_rate": 1.7271218176197511e-06, - "loss": 0.6785, - "step": 30858 - }, - { - "epoch": 0.79, - "learning_rate": 1.7271028213407663e-06, - "loss": 1.0205, - "step": 30859 - }, - { - "epoch": 0.79, - "learning_rate": 1.7270838245050725e-06, - "loss": 0.834, - "step": 30860 - }, - { - "epoch": 0.79, - "learning_rate": 1.727064827112684e-06, - "loss": 0.7422, - "step": 30861 - }, - { - "epoch": 0.79, - "learning_rate": 1.7270458291636153e-06, - "loss": 0.9854, - "step": 30862 - }, - { - "epoch": 0.79, - "learning_rate": 1.727026830657881e-06, - "loss": 0.7017, - "step": 30863 - }, - { - "epoch": 0.79, - "learning_rate": 1.727007831595496e-06, - "loss": 0.9648, - "step": 30864 - }, - { - "epoch": 0.79, - "learning_rate": 1.726988831976474e-06, - "loss": 0.9546, - "step": 30865 - }, - { - "epoch": 0.79, - "learning_rate": 1.7269698318008304e-06, - "loss": 0.8252, - "step": 30866 - }, - { - "epoch": 0.79, - "learning_rate": 1.7269508310685794e-06, - "loss": 0.7969, - "step": 30867 - }, - { - "epoch": 0.79, - "learning_rate": 1.7269318297797354e-06, - "loss": 0.7014, - "step": 30868 - }, - { - "epoch": 0.79, - "learning_rate": 1.7269128279343135e-06, - "loss": 0.9746, - "step": 30869 - }, - { - "epoch": 0.79, - "learning_rate": 1.7268938255323277e-06, - "loss": 0.9131, - "step": 30870 - }, - { - "epoch": 0.79, - "learning_rate": 1.7268748225737925e-06, - "loss": 0.5811, - "step": 30871 - }, - { - "epoch": 0.79, - "learning_rate": 1.726855819058723e-06, - "loss": 0.9307, - "step": 30872 - }, - { - "epoch": 0.79, - "learning_rate": 1.7268368149871333e-06, - "loss": 0.6079, - "step": 30873 - }, - { - "epoch": 0.79, - "learning_rate": 1.7268178103590382e-06, - "loss": 0.7808, - "step": 30874 - }, - { - "epoch": 0.79, - "learning_rate": 1.7267988051744519e-06, - "loss": 0.7905, - "step": 30875 - }, - { - "epoch": 0.79, - "learning_rate": 1.7267797994333893e-06, - "loss": 0.8799, - "step": 30876 - }, - { - "epoch": 0.79, - "learning_rate": 1.7267607931358648e-06, - "loss": 0.916, - "step": 30877 - }, - { - "epoch": 0.79, - "learning_rate": 1.7267417862818929e-06, - "loss": 0.8447, - "step": 30878 - }, - { - "epoch": 0.79, - "learning_rate": 1.7267227788714882e-06, - "loss": 0.6489, - "step": 30879 - }, - { - "epoch": 0.79, - "learning_rate": 1.7267037709046655e-06, - "loss": 0.8613, - "step": 30880 - }, - { - "epoch": 0.79, - "learning_rate": 1.726684762381439e-06, - "loss": 0.8574, - "step": 30881 - }, - { - "epoch": 0.79, - "learning_rate": 1.7266657533018231e-06, - "loss": 0.8115, - "step": 30882 - }, - { - "epoch": 0.79, - "learning_rate": 1.7266467436658329e-06, - "loss": 0.8203, - "step": 30883 - }, - { - "epoch": 0.79, - "learning_rate": 1.726627733473483e-06, - "loss": 0.9375, - "step": 30884 - }, - { - "epoch": 0.79, - "learning_rate": 1.7266087227247875e-06, - "loss": 0.8433, - "step": 30885 - }, - { - "epoch": 0.79, - "learning_rate": 1.726589711419761e-06, - "loss": 0.9668, - "step": 30886 - }, - { - "epoch": 0.79, - "learning_rate": 1.726570699558418e-06, - "loss": 0.8721, - "step": 30887 - }, - { - "epoch": 0.79, - "learning_rate": 1.7265516871407736e-06, - "loss": 0.7227, - "step": 30888 - }, - { - "epoch": 0.79, - "learning_rate": 1.7265326741668416e-06, - "loss": 0.8584, - "step": 30889 - }, - { - "epoch": 0.79, - "learning_rate": 1.726513660636637e-06, - "loss": 0.6096, - "step": 30890 - }, - { - "epoch": 0.79, - "learning_rate": 1.7264946465501745e-06, - "loss": 0.9502, - "step": 30891 - }, - { - "epoch": 0.79, - "learning_rate": 1.7264756319074684e-06, - "loss": 1.085, - "step": 30892 - }, - { - "epoch": 0.79, - "learning_rate": 1.7264566167085332e-06, - "loss": 0.668, - "step": 30893 - }, - { - "epoch": 0.79, - "learning_rate": 1.7264376009533838e-06, - "loss": 0.833, - "step": 30894 - }, - { - "epoch": 0.79, - "learning_rate": 1.7264185846420344e-06, - "loss": 0.9814, - "step": 30895 - }, - { - "epoch": 0.79, - "learning_rate": 1.7263995677744997e-06, - "loss": 0.7217, - "step": 30896 - }, - { - "epoch": 0.79, - "learning_rate": 1.7263805503507945e-06, - "loss": 0.6875, - "step": 30897 - }, - { - "epoch": 0.79, - "learning_rate": 1.7263615323709326e-06, - "loss": 0.7966, - "step": 30898 - }, - { - "epoch": 0.79, - "learning_rate": 1.7263425138349295e-06, - "loss": 0.7261, - "step": 30899 - }, - { - "epoch": 0.79, - "learning_rate": 1.726323494742799e-06, - "loss": 0.9727, - "step": 30900 - }, - { - "epoch": 0.79, - "learning_rate": 1.7263044750945563e-06, - "loss": 0.7759, - "step": 30901 - }, - { - "epoch": 0.79, - "learning_rate": 1.7262854548902154e-06, - "loss": 0.8057, - "step": 30902 - }, - { - "epoch": 0.79, - "learning_rate": 1.7262664341297912e-06, - "loss": 0.8311, - "step": 30903 - }, - { - "epoch": 0.79, - "learning_rate": 1.7262474128132983e-06, - "loss": 0.7666, - "step": 30904 - }, - { - "epoch": 0.79, - "learning_rate": 1.726228390940751e-06, - "loss": 0.8926, - "step": 30905 - }, - { - "epoch": 0.79, - "learning_rate": 1.7262093685121642e-06, - "loss": 0.999, - "step": 30906 - }, - { - "epoch": 0.79, - "learning_rate": 1.7261903455275521e-06, - "loss": 0.7432, - "step": 30907 - }, - { - "epoch": 0.79, - "learning_rate": 1.7261713219869295e-06, - "loss": 0.7808, - "step": 30908 - }, - { - "epoch": 0.79, - "learning_rate": 1.726152297890311e-06, - "loss": 1.0039, - "step": 30909 - }, - { - "epoch": 0.79, - "learning_rate": 1.7261332732377109e-06, - "loss": 0.8984, - "step": 30910 - }, - { - "epoch": 0.79, - "learning_rate": 1.726114248029144e-06, - "loss": 0.9717, - "step": 30911 - }, - { - "epoch": 0.79, - "learning_rate": 1.7260952222646249e-06, - "loss": 0.646, - "step": 30912 - }, - { - "epoch": 0.79, - "learning_rate": 1.726076195944168e-06, - "loss": 1.0166, - "step": 30913 - }, - { - "epoch": 0.79, - "learning_rate": 1.7260571690677879e-06, - "loss": 0.5547, - "step": 30914 - }, - { - "epoch": 0.79, - "learning_rate": 1.7260381416354992e-06, - "loss": 0.9209, - "step": 30915 - }, - { - "epoch": 0.79, - "learning_rate": 1.7260191136473168e-06, - "loss": 0.5781, - "step": 30916 - }, - { - "epoch": 0.79, - "learning_rate": 1.7260000851032547e-06, - "loss": 0.7217, - "step": 30917 - }, - { - "epoch": 0.79, - "learning_rate": 1.7259810560033277e-06, - "loss": 0.8848, - "step": 30918 - }, - { - "epoch": 0.79, - "learning_rate": 1.7259620263475503e-06, - "loss": 0.7539, - "step": 30919 - }, - { - "epoch": 0.79, - "learning_rate": 1.7259429961359371e-06, - "loss": 1.0293, - "step": 30920 - }, - { - "epoch": 0.79, - "learning_rate": 1.7259239653685032e-06, - "loss": 0.6611, - "step": 30921 - }, - { - "epoch": 0.79, - "learning_rate": 1.7259049340452622e-06, - "loss": 0.8193, - "step": 30922 - }, - { - "epoch": 0.79, - "learning_rate": 1.7258859021662293e-06, - "loss": 0.6641, - "step": 30923 - }, - { - "epoch": 0.79, - "learning_rate": 1.7258668697314192e-06, - "loss": 0.9102, - "step": 30924 - }, - { - "epoch": 0.79, - "learning_rate": 1.7258478367408459e-06, - "loss": 0.8252, - "step": 30925 - }, - { - "epoch": 0.79, - "learning_rate": 1.7258288031945243e-06, - "loss": 1.0122, - "step": 30926 - }, - { - "epoch": 0.79, - "learning_rate": 1.7258097690924691e-06, - "loss": 0.9561, - "step": 30927 - }, - { - "epoch": 0.79, - "learning_rate": 1.7257907344346947e-06, - "loss": 0.8613, - "step": 30928 - }, - { - "epoch": 0.79, - "learning_rate": 1.7257716992212154e-06, - "loss": 0.79, - "step": 30929 - }, - { - "epoch": 0.79, - "learning_rate": 1.7257526634520464e-06, - "loss": 0.7197, - "step": 30930 - }, - { - "epoch": 0.79, - "learning_rate": 1.725733627127202e-06, - "loss": 0.7122, - "step": 30931 - }, - { - "epoch": 0.79, - "learning_rate": 1.7257145902466967e-06, - "loss": 0.6953, - "step": 30932 - }, - { - "epoch": 0.79, - "learning_rate": 1.7256955528105453e-06, - "loss": 0.7808, - "step": 30933 - }, - { - "epoch": 0.79, - "learning_rate": 1.7256765148187617e-06, - "loss": 0.7471, - "step": 30934 - }, - { - "epoch": 0.79, - "learning_rate": 1.7256574762713614e-06, - "loss": 0.8066, - "step": 30935 - }, - { - "epoch": 0.79, - "learning_rate": 1.7256384371683584e-06, - "loss": 1.1328, - "step": 30936 - }, - { - "epoch": 0.79, - "learning_rate": 1.7256193975097673e-06, - "loss": 0.6895, - "step": 30937 - }, - { - "epoch": 0.79, - "learning_rate": 1.7256003572956028e-06, - "loss": 0.7656, - "step": 30938 - }, - { - "epoch": 0.79, - "learning_rate": 1.7255813165258796e-06, - "loss": 0.7168, - "step": 30939 - }, - { - "epoch": 0.79, - "learning_rate": 1.725562275200612e-06, - "loss": 0.9619, - "step": 30940 - }, - { - "epoch": 0.79, - "learning_rate": 1.725543233319815e-06, - "loss": 0.8496, - "step": 30941 - }, - { - "epoch": 0.79, - "learning_rate": 1.7255241908835027e-06, - "loss": 0.7505, - "step": 30942 - }, - { - "epoch": 0.79, - "learning_rate": 1.72550514789169e-06, - "loss": 0.7407, - "step": 30943 - }, - { - "epoch": 0.79, - "learning_rate": 1.7254861043443911e-06, - "loss": 0.9502, - "step": 30944 - }, - { - "epoch": 0.79, - "learning_rate": 1.725467060241621e-06, - "loss": 0.9121, - "step": 30945 - }, - { - "epoch": 0.79, - "learning_rate": 1.7254480155833942e-06, - "loss": 0.6084, - "step": 30946 - }, - { - "epoch": 0.79, - "learning_rate": 1.725428970369725e-06, - "loss": 0.8867, - "step": 30947 - }, - { - "epoch": 0.79, - "learning_rate": 1.7254099246006283e-06, - "loss": 0.9629, - "step": 30948 - }, - { - "epoch": 0.79, - "learning_rate": 1.7253908782761187e-06, - "loss": 0.9277, - "step": 30949 - }, - { - "epoch": 0.79, - "learning_rate": 1.7253718313962105e-06, - "loss": 0.8975, - "step": 30950 - }, - { - "epoch": 0.79, - "learning_rate": 1.7253527839609188e-06, - "loss": 1.0146, - "step": 30951 - }, - { - "epoch": 0.79, - "learning_rate": 1.7253337359702575e-06, - "loss": 0.9434, - "step": 30952 - }, - { - "epoch": 0.79, - "learning_rate": 1.7253146874242414e-06, - "loss": 0.8203, - "step": 30953 - }, - { - "epoch": 0.79, - "learning_rate": 1.7252956383228857e-06, - "loss": 0.8965, - "step": 30954 - }, - { - "epoch": 0.79, - "learning_rate": 1.7252765886662037e-06, - "loss": 0.915, - "step": 30955 - }, - { - "epoch": 0.79, - "learning_rate": 1.7252575384542114e-06, - "loss": 0.6187, - "step": 30956 - }, - { - "epoch": 0.79, - "learning_rate": 1.7252384876869225e-06, - "loss": 0.7583, - "step": 30957 - }, - { - "epoch": 0.79, - "learning_rate": 1.7252194363643523e-06, - "loss": 0.7102, - "step": 30958 - }, - { - "epoch": 0.79, - "learning_rate": 1.7252003844865143e-06, - "loss": 1.0117, - "step": 30959 - }, - { - "epoch": 0.79, - "learning_rate": 1.725181332053424e-06, - "loss": 0.8633, - "step": 30960 - }, - { - "epoch": 0.79, - "learning_rate": 1.7251622790650954e-06, - "loss": 0.5498, - "step": 30961 - }, - { - "epoch": 0.79, - "learning_rate": 1.7251432255215436e-06, - "loss": 0.9658, - "step": 30962 - }, - { - "epoch": 0.79, - "learning_rate": 1.725124171422783e-06, - "loss": 0.4546, - "step": 30963 - }, - { - "epoch": 0.79, - "learning_rate": 1.7251051167688284e-06, - "loss": 1.1436, - "step": 30964 - }, - { - "epoch": 0.79, - "learning_rate": 1.725086061559694e-06, - "loss": 0.873, - "step": 30965 - }, - { - "epoch": 0.79, - "learning_rate": 1.7250670057953943e-06, - "loss": 0.7964, - "step": 30966 - }, - { - "epoch": 0.79, - "learning_rate": 1.7250479494759442e-06, - "loss": 0.9375, - "step": 30967 - }, - { - "epoch": 0.79, - "learning_rate": 1.7250288926013582e-06, - "loss": 0.7354, - "step": 30968 - }, - { - "epoch": 0.79, - "learning_rate": 1.725009835171651e-06, - "loss": 1.002, - "step": 30969 - }, - { - "epoch": 0.79, - "learning_rate": 1.7249907771868374e-06, - "loss": 1.0029, - "step": 30970 - }, - { - "epoch": 0.79, - "learning_rate": 1.7249717186469313e-06, - "loss": 0.7441, - "step": 30971 - }, - { - "epoch": 0.79, - "learning_rate": 1.7249526595519477e-06, - "loss": 1.0234, - "step": 30972 - }, - { - "epoch": 0.79, - "learning_rate": 1.7249335999019014e-06, - "loss": 1.043, - "step": 30973 - }, - { - "epoch": 0.79, - "learning_rate": 1.7249145396968067e-06, - "loss": 0.7227, - "step": 30974 - }, - { - "epoch": 0.79, - "learning_rate": 1.7248954789366784e-06, - "loss": 0.855, - "step": 30975 - }, - { - "epoch": 0.79, - "learning_rate": 1.7248764176215306e-06, - "loss": 1.1406, - "step": 30976 - }, - { - "epoch": 0.79, - "learning_rate": 1.7248573557513786e-06, - "loss": 0.6768, - "step": 30977 - }, - { - "epoch": 0.79, - "learning_rate": 1.7248382933262365e-06, - "loss": 0.9111, - "step": 30978 - }, - { - "epoch": 0.79, - "learning_rate": 1.7248192303461191e-06, - "loss": 0.9805, - "step": 30979 - }, - { - "epoch": 0.79, - "learning_rate": 1.7248001668110408e-06, - "loss": 0.8467, - "step": 30980 - }, - { - "epoch": 0.79, - "learning_rate": 1.7247811027210163e-06, - "loss": 0.5366, - "step": 30981 - }, - { - "epoch": 0.79, - "learning_rate": 1.7247620380760605e-06, - "loss": 0.6313, - "step": 30982 - }, - { - "epoch": 0.79, - "learning_rate": 1.7247429728761876e-06, - "loss": 1.0205, - "step": 30983 - }, - { - "epoch": 0.79, - "learning_rate": 1.7247239071214124e-06, - "loss": 0.8154, - "step": 30984 - }, - { - "epoch": 0.79, - "learning_rate": 1.7247048408117495e-06, - "loss": 0.9131, - "step": 30985 - }, - { - "epoch": 0.79, - "learning_rate": 1.7246857739472132e-06, - "loss": 0.5234, - "step": 30986 - }, - { - "epoch": 0.79, - "learning_rate": 1.7246667065278183e-06, - "loss": 0.7632, - "step": 30987 - }, - { - "epoch": 0.79, - "learning_rate": 1.7246476385535798e-06, - "loss": 1.042, - "step": 30988 - }, - { - "epoch": 0.79, - "learning_rate": 1.7246285700245115e-06, - "loss": 0.8901, - "step": 30989 - }, - { - "epoch": 0.79, - "learning_rate": 1.7246095009406285e-06, - "loss": 0.9092, - "step": 30990 - }, - { - "epoch": 0.79, - "learning_rate": 1.7245904313019457e-06, - "loss": 0.8096, - "step": 30991 - }, - { - "epoch": 0.79, - "learning_rate": 1.724571361108477e-06, - "loss": 0.791, - "step": 30992 - }, - { - "epoch": 0.79, - "learning_rate": 1.724552290360237e-06, - "loss": 0.9658, - "step": 30993 - }, - { - "epoch": 0.79, - "learning_rate": 1.7245332190572413e-06, - "loss": 0.6792, - "step": 30994 - }, - { - "epoch": 0.79, - "learning_rate": 1.7245141471995033e-06, - "loss": 0.833, - "step": 30995 - }, - { - "epoch": 0.79, - "learning_rate": 1.7244950747870383e-06, - "loss": 0.8691, - "step": 30996 - }, - { - "epoch": 0.79, - "learning_rate": 1.724476001819861e-06, - "loss": 0.7969, - "step": 30997 - }, - { - "epoch": 0.79, - "learning_rate": 1.7244569282979856e-06, - "loss": 0.7949, - "step": 30998 - }, - { - "epoch": 0.79, - "learning_rate": 1.7244378542214267e-06, - "loss": 0.8877, - "step": 30999 - }, - { - "epoch": 0.79, - "learning_rate": 1.724418779590199e-06, - "loss": 0.8154, - "step": 31000 - }, - { - "epoch": 0.79, - "learning_rate": 1.7243997044043176e-06, - "loss": 0.8594, - "step": 31001 - }, - { - "epoch": 0.79, - "learning_rate": 1.724380628663796e-06, - "loss": 0.7969, - "step": 31002 - }, - { - "epoch": 0.79, - "learning_rate": 1.72436155236865e-06, - "loss": 0.9062, - "step": 31003 - }, - { - "epoch": 0.79, - "learning_rate": 1.7243424755188934e-06, - "loss": 1.0107, - "step": 31004 - }, - { - "epoch": 0.79, - "learning_rate": 1.724323398114541e-06, - "loss": 1.0371, - "step": 31005 - }, - { - "epoch": 0.79, - "learning_rate": 1.7243043201556077e-06, - "loss": 0.8467, - "step": 31006 - }, - { - "epoch": 0.79, - "learning_rate": 1.7242852416421076e-06, - "loss": 0.8774, - "step": 31007 - }, - { - "epoch": 0.79, - "learning_rate": 1.724266162574056e-06, - "loss": 0.8994, - "step": 31008 - }, - { - "epoch": 0.79, - "learning_rate": 1.724247082951467e-06, - "loss": 0.998, - "step": 31009 - }, - { - "epoch": 0.79, - "learning_rate": 1.724228002774355e-06, - "loss": 0.7471, - "step": 31010 - }, - { - "epoch": 0.79, - "learning_rate": 1.7242089220427353e-06, - "loss": 0.6445, - "step": 31011 - }, - { - "epoch": 0.79, - "learning_rate": 1.724189840756622e-06, - "loss": 0.8398, - "step": 31012 - }, - { - "epoch": 0.79, - "learning_rate": 1.7241707589160295e-06, - "loss": 0.8652, - "step": 31013 - }, - { - "epoch": 0.79, - "learning_rate": 1.724151676520973e-06, - "loss": 0.7451, - "step": 31014 - }, - { - "epoch": 0.79, - "learning_rate": 1.724132593571467e-06, - "loss": 0.7783, - "step": 31015 - }, - { - "epoch": 0.79, - "learning_rate": 1.724113510067526e-06, - "loss": 0.6699, - "step": 31016 - }, - { - "epoch": 0.79, - "learning_rate": 1.7240944260091643e-06, - "loss": 0.9883, - "step": 31017 - }, - { - "epoch": 0.8, - "learning_rate": 1.724075341396397e-06, - "loss": 0.8984, - "step": 31018 - }, - { - "epoch": 0.8, - "learning_rate": 1.7240562562292383e-06, - "loss": 0.8574, - "step": 31019 - }, - { - "epoch": 0.8, - "learning_rate": 1.724037170507703e-06, - "loss": 0.8887, - "step": 31020 - }, - { - "epoch": 0.8, - "learning_rate": 1.724018084231806e-06, - "loss": 0.6758, - "step": 31021 - }, - { - "epoch": 0.8, - "learning_rate": 1.7239989974015616e-06, - "loss": 0.8203, - "step": 31022 - }, - { - "epoch": 0.8, - "learning_rate": 1.7239799100169844e-06, - "loss": 0.9404, - "step": 31023 - }, - { - "epoch": 0.8, - "learning_rate": 1.723960822078089e-06, - "loss": 0.7275, - "step": 31024 - }, - { - "epoch": 0.8, - "learning_rate": 1.72394173358489e-06, - "loss": 0.8818, - "step": 31025 - }, - { - "epoch": 0.8, - "learning_rate": 1.7239226445374025e-06, - "loss": 0.7051, - "step": 31026 - }, - { - "epoch": 0.8, - "learning_rate": 1.7239035549356405e-06, - "loss": 0.8447, - "step": 31027 - }, - { - "epoch": 0.8, - "learning_rate": 1.7238844647796188e-06, - "loss": 1.0176, - "step": 31028 - }, - { - "epoch": 0.8, - "learning_rate": 1.7238653740693518e-06, - "loss": 0.9102, - "step": 31029 - }, - { - "epoch": 0.8, - "learning_rate": 1.7238462828048548e-06, - "loss": 0.9736, - "step": 31030 - }, - { - "epoch": 0.8, - "learning_rate": 1.7238271909861419e-06, - "loss": 0.8301, - "step": 31031 - }, - { - "epoch": 0.8, - "learning_rate": 1.7238080986132278e-06, - "loss": 0.595, - "step": 31032 - }, - { - "epoch": 0.8, - "learning_rate": 1.723789005686127e-06, - "loss": 0.6909, - "step": 31033 - }, - { - "epoch": 0.8, - "learning_rate": 1.723769912204854e-06, - "loss": 0.8662, - "step": 31034 - }, - { - "epoch": 0.8, - "learning_rate": 1.723750818169424e-06, - "loss": 0.9883, - "step": 31035 - }, - { - "epoch": 0.8, - "learning_rate": 1.7237317235798513e-06, - "loss": 1.0752, - "step": 31036 - }, - { - "epoch": 0.8, - "learning_rate": 1.7237126284361506e-06, - "loss": 0.6611, - "step": 31037 - }, - { - "epoch": 0.8, - "learning_rate": 1.723693532738336e-06, - "loss": 0.7383, - "step": 31038 - }, - { - "epoch": 0.8, - "learning_rate": 1.7236744364864226e-06, - "loss": 1.0088, - "step": 31039 - }, - { - "epoch": 0.8, - "learning_rate": 1.723655339680425e-06, - "loss": 0.8574, - "step": 31040 - }, - { - "epoch": 0.8, - "learning_rate": 1.723636242320358e-06, - "loss": 0.7446, - "step": 31041 - }, - { - "epoch": 0.8, - "learning_rate": 1.723617144406236e-06, - "loss": 0.7732, - "step": 31042 - }, - { - "epoch": 0.8, - "learning_rate": 1.7235980459380736e-06, - "loss": 0.9268, - "step": 31043 - }, - { - "epoch": 0.8, - "learning_rate": 1.7235789469158853e-06, - "loss": 1.0498, - "step": 31044 - }, - { - "epoch": 0.8, - "learning_rate": 1.7235598473396857e-06, - "loss": 0.9502, - "step": 31045 - }, - { - "epoch": 0.8, - "learning_rate": 1.72354074720949e-06, - "loss": 0.7266, - "step": 31046 - }, - { - "epoch": 0.8, - "learning_rate": 1.723521646525312e-06, - "loss": 0.7529, - "step": 31047 - }, - { - "epoch": 0.8, - "learning_rate": 1.7235025452871672e-06, - "loss": 0.5576, - "step": 31048 - }, - { - "epoch": 0.8, - "learning_rate": 1.7234834434950699e-06, - "loss": 0.834, - "step": 31049 - }, - { - "epoch": 0.8, - "learning_rate": 1.7234643411490342e-06, - "loss": 0.9219, - "step": 31050 - }, - { - "epoch": 0.8, - "learning_rate": 1.723445238249075e-06, - "loss": 0.9297, - "step": 31051 - }, - { - "epoch": 0.8, - "learning_rate": 1.7234261347952073e-06, - "loss": 0.9189, - "step": 31052 - }, - { - "epoch": 0.8, - "learning_rate": 1.7234070307874452e-06, - "loss": 0.7417, - "step": 31053 - }, - { - "epoch": 0.8, - "learning_rate": 1.723387926225804e-06, - "loss": 1.0361, - "step": 31054 - }, - { - "epoch": 0.8, - "learning_rate": 1.7233688211102976e-06, - "loss": 0.9922, - "step": 31055 - }, - { - "epoch": 0.8, - "learning_rate": 1.7233497154409413e-06, - "loss": 0.7852, - "step": 31056 - }, - { - "epoch": 0.8, - "learning_rate": 1.723330609217749e-06, - "loss": 0.5734, - "step": 31057 - }, - { - "epoch": 0.8, - "learning_rate": 1.723311502440736e-06, - "loss": 0.8608, - "step": 31058 - }, - { - "epoch": 0.8, - "learning_rate": 1.7232923951099166e-06, - "loss": 0.9209, - "step": 31059 - }, - { - "epoch": 0.8, - "learning_rate": 1.7232732872253051e-06, - "loss": 0.749, - "step": 31060 - }, - { - "epoch": 0.8, - "learning_rate": 1.723254178786917e-06, - "loss": 0.7578, - "step": 31061 - }, - { - "epoch": 0.8, - "learning_rate": 1.7232350697947663e-06, - "loss": 0.8037, - "step": 31062 - }, - { - "epoch": 0.8, - "learning_rate": 1.7232159602488675e-06, - "loss": 0.8643, - "step": 31063 - }, - { - "epoch": 0.8, - "learning_rate": 1.7231968501492356e-06, - "loss": 0.8574, - "step": 31064 - }, - { - "epoch": 0.8, - "learning_rate": 1.7231777394958852e-06, - "loss": 0.8877, - "step": 31065 - }, - { - "epoch": 0.8, - "learning_rate": 1.7231586282888307e-06, - "loss": 0.9082, - "step": 31066 - }, - { - "epoch": 0.8, - "learning_rate": 1.7231395165280874e-06, - "loss": 0.8633, - "step": 31067 - }, - { - "epoch": 0.8, - "learning_rate": 1.723120404213669e-06, - "loss": 0.6313, - "step": 31068 - }, - { - "epoch": 0.8, - "learning_rate": 1.7231012913455905e-06, - "loss": 0.7075, - "step": 31069 - }, - { - "epoch": 0.8, - "learning_rate": 1.723082177923867e-06, - "loss": 0.9971, - "step": 31070 - }, - { - "epoch": 0.8, - "learning_rate": 1.7230630639485124e-06, - "loss": 0.7485, - "step": 31071 - }, - { - "epoch": 0.8, - "learning_rate": 1.7230439494195417e-06, - "loss": 0.8975, - "step": 31072 - }, - { - "epoch": 0.8, - "learning_rate": 1.7230248343369693e-06, - "loss": 0.9707, - "step": 31073 - }, - { - "epoch": 0.8, - "learning_rate": 1.7230057187008103e-06, - "loss": 0.9619, - "step": 31074 - }, - { - "epoch": 0.8, - "learning_rate": 1.7229866025110789e-06, - "loss": 0.8413, - "step": 31075 - }, - { - "epoch": 0.8, - "learning_rate": 1.72296748576779e-06, - "loss": 0.7266, - "step": 31076 - }, - { - "epoch": 0.8, - "learning_rate": 1.7229483684709583e-06, - "loss": 0.5337, - "step": 31077 - }, - { - "epoch": 0.8, - "learning_rate": 1.722929250620598e-06, - "loss": 0.7969, - "step": 31078 - }, - { - "epoch": 0.8, - "learning_rate": 1.7229101322167244e-06, - "loss": 0.9092, - "step": 31079 - }, - { - "epoch": 0.8, - "learning_rate": 1.7228910132593513e-06, - "loss": 0.7441, - "step": 31080 - }, - { - "epoch": 0.8, - "learning_rate": 1.7228718937484939e-06, - "loss": 0.8936, - "step": 31081 - }, - { - "epoch": 0.8, - "learning_rate": 1.7228527736841669e-06, - "loss": 0.6597, - "step": 31082 - }, - { - "epoch": 0.8, - "learning_rate": 1.7228336530663846e-06, - "loss": 0.5833, - "step": 31083 - }, - { - "epoch": 0.8, - "learning_rate": 1.7228145318951617e-06, - "loss": 0.7783, - "step": 31084 - }, - { - "epoch": 0.8, - "learning_rate": 1.7227954101705132e-06, - "loss": 0.7192, - "step": 31085 - }, - { - "epoch": 0.8, - "learning_rate": 1.7227762878924535e-06, - "loss": 0.7881, - "step": 31086 - }, - { - "epoch": 0.8, - "learning_rate": 1.7227571650609972e-06, - "loss": 0.9092, - "step": 31087 - }, - { - "epoch": 0.8, - "learning_rate": 1.722738041676159e-06, - "loss": 0.8828, - "step": 31088 - }, - { - "epoch": 0.8, - "learning_rate": 1.722718917737953e-06, - "loss": 0.9404, - "step": 31089 - }, - { - "epoch": 0.8, - "learning_rate": 1.7226997932463951e-06, - "loss": 1.0361, - "step": 31090 - }, - { - "epoch": 0.8, - "learning_rate": 1.722680668201499e-06, - "loss": 0.5918, - "step": 31091 - }, - { - "epoch": 0.8, - "learning_rate": 1.7226615426032792e-06, - "loss": 0.4253, - "step": 31092 - }, - { - "epoch": 0.8, - "learning_rate": 1.722642416451751e-06, - "loss": 0.9307, - "step": 31093 - }, - { - "epoch": 0.8, - "learning_rate": 1.7226232897469286e-06, - "loss": 0.9893, - "step": 31094 - }, - { - "epoch": 0.8, - "learning_rate": 1.7226041624888268e-06, - "loss": 0.6304, - "step": 31095 - }, - { - "epoch": 0.8, - "learning_rate": 1.7225850346774605e-06, - "loss": 0.873, - "step": 31096 - }, - { - "epoch": 0.8, - "learning_rate": 1.7225659063128438e-06, - "loss": 1.0137, - "step": 31097 - }, - { - "epoch": 0.8, - "learning_rate": 1.7225467773949914e-06, - "loss": 0.8594, - "step": 31098 - }, - { - "epoch": 0.8, - "learning_rate": 1.7225276479239184e-06, - "loss": 0.8682, - "step": 31099 - }, - { - "epoch": 0.8, - "learning_rate": 1.722508517899639e-06, - "loss": 0.875, - "step": 31100 - }, - { - "epoch": 0.8, - "learning_rate": 1.7224893873221685e-06, - "loss": 0.793, - "step": 31101 - }, - { - "epoch": 0.8, - "learning_rate": 1.7224702561915208e-06, - "loss": 0.8086, - "step": 31102 - }, - { - "epoch": 0.8, - "learning_rate": 1.7224511245077107e-06, - "loss": 0.9395, - "step": 31103 - }, - { - "epoch": 0.8, - "learning_rate": 1.7224319922707533e-06, - "loss": 1.0508, - "step": 31104 - }, - { - "epoch": 0.8, - "learning_rate": 1.7224128594806626e-06, - "loss": 0.9375, - "step": 31105 - }, - { - "epoch": 0.8, - "learning_rate": 1.7223937261374539e-06, - "loss": 1.0645, - "step": 31106 - }, - { - "epoch": 0.8, - "learning_rate": 1.7223745922411411e-06, - "loss": 1.0029, - "step": 31107 - }, - { - "epoch": 0.8, - "learning_rate": 1.7223554577917398e-06, - "loss": 0.7744, - "step": 31108 - }, - { - "epoch": 0.8, - "learning_rate": 1.722336322789264e-06, - "loss": 0.7842, - "step": 31109 - }, - { - "epoch": 0.8, - "learning_rate": 1.7223171872337286e-06, - "loss": 0.7246, - "step": 31110 - }, - { - "epoch": 0.8, - "learning_rate": 1.7222980511251479e-06, - "loss": 0.8623, - "step": 31111 - }, - { - "epoch": 0.8, - "learning_rate": 1.7222789144635368e-06, - "loss": 0.8936, - "step": 31112 - }, - { - "epoch": 0.8, - "learning_rate": 1.7222597772489103e-06, - "loss": 0.8115, - "step": 31113 - }, - { - "epoch": 0.8, - "learning_rate": 1.7222406394812824e-06, - "loss": 0.8828, - "step": 31114 - }, - { - "epoch": 0.8, - "learning_rate": 1.7222215011606677e-06, - "loss": 0.7324, - "step": 31115 - }, - { - "epoch": 0.8, - "learning_rate": 1.7222023622870818e-06, - "loss": 1.0391, - "step": 31116 - }, - { - "epoch": 0.8, - "learning_rate": 1.7221832228605386e-06, - "loss": 0.7754, - "step": 31117 - }, - { - "epoch": 0.8, - "learning_rate": 1.722164082881053e-06, - "loss": 0.8711, - "step": 31118 - }, - { - "epoch": 0.8, - "learning_rate": 1.7221449423486392e-06, - "loss": 0.7515, - "step": 31119 - }, - { - "epoch": 0.8, - "learning_rate": 1.7221258012633126e-06, - "loss": 0.6846, - "step": 31120 - }, - { - "epoch": 0.8, - "learning_rate": 1.7221066596250873e-06, - "loss": 0.9746, - "step": 31121 - }, - { - "epoch": 0.8, - "learning_rate": 1.7220875174339779e-06, - "loss": 0.7969, - "step": 31122 - }, - { - "epoch": 0.8, - "learning_rate": 1.7220683746899999e-06, - "loss": 0.7227, - "step": 31123 - }, - { - "epoch": 0.8, - "learning_rate": 1.722049231393167e-06, - "loss": 0.9102, - "step": 31124 - }, - { - "epoch": 0.8, - "learning_rate": 1.7220300875434938e-06, - "loss": 1.0117, - "step": 31125 - }, - { - "epoch": 0.8, - "learning_rate": 1.722010943140996e-06, - "loss": 0.9062, - "step": 31126 - }, - { - "epoch": 0.8, - "learning_rate": 1.7219917981856873e-06, - "loss": 1.0361, - "step": 31127 - }, - { - "epoch": 0.8, - "learning_rate": 1.7219726526775828e-06, - "loss": 0.8508, - "step": 31128 - }, - { - "epoch": 0.8, - "learning_rate": 1.721953506616697e-06, - "loss": 0.8701, - "step": 31129 - }, - { - "epoch": 0.8, - "learning_rate": 1.7219343600030448e-06, - "loss": 0.9492, - "step": 31130 - }, - { - "epoch": 0.8, - "learning_rate": 1.7219152128366404e-06, - "loss": 0.8301, - "step": 31131 - }, - { - "epoch": 0.8, - "learning_rate": 1.7218960651174985e-06, - "loss": 0.9209, - "step": 31132 - }, - { - "epoch": 0.8, - "learning_rate": 1.7218769168456344e-06, - "loss": 0.9873, - "step": 31133 - }, - { - "epoch": 0.8, - "learning_rate": 1.7218577680210622e-06, - "loss": 0.9414, - "step": 31134 - }, - { - "epoch": 0.8, - "learning_rate": 1.7218386186437968e-06, - "loss": 0.9053, - "step": 31135 - }, - { - "epoch": 0.8, - "learning_rate": 1.7218194687138526e-06, - "loss": 0.7891, - "step": 31136 - }, - { - "epoch": 0.8, - "learning_rate": 1.7218003182312443e-06, - "loss": 1.0039, - "step": 31137 - }, - { - "epoch": 0.8, - "learning_rate": 1.721781167195987e-06, - "loss": 0.8545, - "step": 31138 - }, - { - "epoch": 0.8, - "learning_rate": 1.7217620156080948e-06, - "loss": 0.79, - "step": 31139 - }, - { - "epoch": 0.8, - "learning_rate": 1.7217428634675829e-06, - "loss": 0.7031, - "step": 31140 - }, - { - "epoch": 0.8, - "learning_rate": 1.7217237107744653e-06, - "loss": 0.7932, - "step": 31141 - }, - { - "epoch": 0.8, - "learning_rate": 1.7217045575287572e-06, - "loss": 0.6641, - "step": 31142 - }, - { - "epoch": 0.8, - "learning_rate": 1.7216854037304732e-06, - "loss": 0.7141, - "step": 31143 - }, - { - "epoch": 0.8, - "learning_rate": 1.721666249379628e-06, - "loss": 0.9189, - "step": 31144 - }, - { - "epoch": 0.8, - "learning_rate": 1.7216470944762357e-06, - "loss": 0.7861, - "step": 31145 - }, - { - "epoch": 0.8, - "learning_rate": 1.7216279390203118e-06, - "loss": 0.782, - "step": 31146 - }, - { - "epoch": 0.8, - "learning_rate": 1.7216087830118703e-06, - "loss": 0.8867, - "step": 31147 - }, - { - "epoch": 0.8, - "learning_rate": 1.7215896264509263e-06, - "loss": 0.875, - "step": 31148 - }, - { - "epoch": 0.8, - "learning_rate": 1.7215704693374944e-06, - "loss": 0.9834, - "step": 31149 - }, - { - "epoch": 0.8, - "learning_rate": 1.7215513116715888e-06, - "loss": 0.9785, - "step": 31150 - }, - { - "epoch": 0.8, - "learning_rate": 1.7215321534532247e-06, - "loss": 0.8503, - "step": 31151 - }, - { - "epoch": 0.8, - "learning_rate": 1.7215129946824168e-06, - "loss": 0.9756, - "step": 31152 - }, - { - "epoch": 0.8, - "learning_rate": 1.7214938353591792e-06, - "loss": 0.8828, - "step": 31153 - }, - { - "epoch": 0.8, - "learning_rate": 1.7214746754835274e-06, - "loss": 0.5942, - "step": 31154 - }, - { - "epoch": 0.8, - "learning_rate": 1.7214555150554752e-06, - "loss": 0.7822, - "step": 31155 - }, - { - "epoch": 0.8, - "learning_rate": 1.7214363540750381e-06, - "loss": 0.96, - "step": 31156 - }, - { - "epoch": 0.8, - "learning_rate": 1.72141719254223e-06, - "loss": 0.7568, - "step": 31157 - }, - { - "epoch": 0.8, - "learning_rate": 1.7213980304570664e-06, - "loss": 0.8789, - "step": 31158 - }, - { - "epoch": 0.8, - "learning_rate": 1.7213788678195612e-06, - "loss": 1.1016, - "step": 31159 - }, - { - "epoch": 0.8, - "learning_rate": 1.7213597046297293e-06, - "loss": 0.6943, - "step": 31160 - }, - { - "epoch": 0.8, - "learning_rate": 1.7213405408875853e-06, - "loss": 1.0293, - "step": 31161 - }, - { - "epoch": 0.8, - "learning_rate": 1.7213213765931443e-06, - "loss": 0.8545, - "step": 31162 - }, - { - "epoch": 0.8, - "learning_rate": 1.7213022117464205e-06, - "loss": 0.7324, - "step": 31163 - }, - { - "epoch": 0.8, - "learning_rate": 1.7212830463474288e-06, - "loss": 0.6758, - "step": 31164 - }, - { - "epoch": 0.8, - "learning_rate": 1.7212638803961838e-06, - "loss": 0.7542, - "step": 31165 - }, - { - "epoch": 0.8, - "learning_rate": 1.7212447138927003e-06, - "loss": 0.8457, - "step": 31166 - }, - { - "epoch": 0.8, - "learning_rate": 1.721225546836993e-06, - "loss": 0.6719, - "step": 31167 - }, - { - "epoch": 0.8, - "learning_rate": 1.7212063792290766e-06, - "loss": 0.9775, - "step": 31168 - }, - { - "epoch": 0.8, - "learning_rate": 1.7211872110689652e-06, - "loss": 0.9307, - "step": 31169 - }, - { - "epoch": 0.8, - "learning_rate": 1.7211680423566742e-06, - "loss": 0.7358, - "step": 31170 - }, - { - "epoch": 0.8, - "learning_rate": 1.7211488730922176e-06, - "loss": 1.0098, - "step": 31171 - }, - { - "epoch": 0.8, - "learning_rate": 1.721129703275611e-06, - "loss": 0.8804, - "step": 31172 - }, - { - "epoch": 0.8, - "learning_rate": 1.7211105329068682e-06, - "loss": 0.8076, - "step": 31173 - }, - { - "epoch": 0.8, - "learning_rate": 1.7210913619860042e-06, - "loss": 0.8008, - "step": 31174 - }, - { - "epoch": 0.8, - "learning_rate": 1.721072190513034e-06, - "loss": 0.8936, - "step": 31175 - }, - { - "epoch": 0.8, - "learning_rate": 1.7210530184879716e-06, - "loss": 0.7944, - "step": 31176 - }, - { - "epoch": 0.8, - "learning_rate": 1.7210338459108323e-06, - "loss": 0.5916, - "step": 31177 - }, - { - "epoch": 0.8, - "learning_rate": 1.7210146727816306e-06, - "loss": 0.8838, - "step": 31178 - }, - { - "epoch": 0.8, - "learning_rate": 1.720995499100381e-06, - "loss": 0.7119, - "step": 31179 - }, - { - "epoch": 0.8, - "learning_rate": 1.7209763248670983e-06, - "loss": 0.9199, - "step": 31180 - }, - { - "epoch": 0.8, - "learning_rate": 1.7209571500817972e-06, - "loss": 0.8545, - "step": 31181 - }, - { - "epoch": 0.8, - "learning_rate": 1.7209379747444922e-06, - "loss": 0.6396, - "step": 31182 - }, - { - "epoch": 0.8, - "learning_rate": 1.7209187988551985e-06, - "loss": 0.7695, - "step": 31183 - }, - { - "epoch": 0.8, - "learning_rate": 1.7208996224139302e-06, - "loss": 0.8018, - "step": 31184 - }, - { - "epoch": 0.8, - "learning_rate": 1.7208804454207022e-06, - "loss": 0.7725, - "step": 31185 - }, - { - "epoch": 0.8, - "learning_rate": 1.7208612678755292e-06, - "loss": 0.8145, - "step": 31186 - }, - { - "epoch": 0.8, - "learning_rate": 1.720842089778426e-06, - "loss": 0.9014, - "step": 31187 - }, - { - "epoch": 0.8, - "learning_rate": 1.720822911129407e-06, - "loss": 0.7939, - "step": 31188 - }, - { - "epoch": 0.8, - "learning_rate": 1.7208037319284872e-06, - "loss": 0.9883, - "step": 31189 - }, - { - "epoch": 0.8, - "learning_rate": 1.720784552175681e-06, - "loss": 0.8882, - "step": 31190 - }, - { - "epoch": 0.8, - "learning_rate": 1.720765371871003e-06, - "loss": 0.8223, - "step": 31191 - }, - { - "epoch": 0.8, - "learning_rate": 1.7207461910144684e-06, - "loss": 1.0029, - "step": 31192 - }, - { - "epoch": 0.8, - "learning_rate": 1.7207270096060916e-06, - "loss": 0.9209, - "step": 31193 - }, - { - "epoch": 0.8, - "learning_rate": 1.7207078276458872e-06, - "loss": 0.6989, - "step": 31194 - }, - { - "epoch": 0.8, - "learning_rate": 1.7206886451338698e-06, - "loss": 1.2227, - "step": 31195 - }, - { - "epoch": 0.8, - "learning_rate": 1.7206694620700544e-06, - "loss": 1.0215, - "step": 31196 - }, - { - "epoch": 0.8, - "learning_rate": 1.7206502784544554e-06, - "loss": 1.0566, - "step": 31197 - }, - { - "epoch": 0.8, - "learning_rate": 1.7206310942870879e-06, - "loss": 0.9023, - "step": 31198 - }, - { - "epoch": 0.8, - "learning_rate": 1.720611909567966e-06, - "loss": 0.5334, - "step": 31199 - }, - { - "epoch": 0.8, - "learning_rate": 1.7205927242971048e-06, - "loss": 0.9375, - "step": 31200 - }, - { - "epoch": 0.8, - "learning_rate": 1.7205735384745191e-06, - "loss": 0.5137, - "step": 31201 - }, - { - "epoch": 0.8, - "learning_rate": 1.720554352100223e-06, - "loss": 0.8799, - "step": 31202 - }, - { - "epoch": 0.8, - "learning_rate": 1.720535165174232e-06, - "loss": 0.8828, - "step": 31203 - }, - { - "epoch": 0.8, - "learning_rate": 1.7205159776965598e-06, - "loss": 0.7695, - "step": 31204 - }, - { - "epoch": 0.8, - "learning_rate": 1.720496789667222e-06, - "loss": 1.0098, - "step": 31205 - }, - { - "epoch": 0.8, - "learning_rate": 1.7204776010862329e-06, - "loss": 0.7773, - "step": 31206 - }, - { - "epoch": 0.8, - "learning_rate": 1.7204584119536074e-06, - "loss": 0.668, - "step": 31207 - }, - { - "epoch": 0.8, - "learning_rate": 1.7204392222693597e-06, - "loss": 0.7417, - "step": 31208 - }, - { - "epoch": 0.8, - "learning_rate": 1.720420032033505e-06, - "loss": 0.6729, - "step": 31209 - }, - { - "epoch": 0.8, - "learning_rate": 1.7204008412460578e-06, - "loss": 0.8438, - "step": 31210 - }, - { - "epoch": 0.8, - "learning_rate": 1.7203816499070326e-06, - "loss": 1.0723, - "step": 31211 - }, - { - "epoch": 0.8, - "learning_rate": 1.7203624580164444e-06, - "loss": 0.916, - "step": 31212 - }, - { - "epoch": 0.8, - "learning_rate": 1.720343265574308e-06, - "loss": 0.8916, - "step": 31213 - }, - { - "epoch": 0.8, - "learning_rate": 1.7203240725806376e-06, - "loss": 0.9678, - "step": 31214 - }, - { - "epoch": 0.8, - "learning_rate": 1.7203048790354484e-06, - "loss": 0.9229, - "step": 31215 - }, - { - "epoch": 0.8, - "learning_rate": 1.7202856849387548e-06, - "loss": 1.1953, - "step": 31216 - }, - { - "epoch": 0.8, - "learning_rate": 1.7202664902905718e-06, - "loss": 0.6743, - "step": 31217 - }, - { - "epoch": 0.8, - "learning_rate": 1.7202472950909135e-06, - "loss": 0.9336, - "step": 31218 - }, - { - "epoch": 0.8, - "learning_rate": 1.7202280993397951e-06, - "loss": 0.8076, - "step": 31219 - }, - { - "epoch": 0.8, - "learning_rate": 1.7202089030372312e-06, - "loss": 0.9023, - "step": 31220 - }, - { - "epoch": 0.8, - "learning_rate": 1.7201897061832363e-06, - "loss": 0.7285, - "step": 31221 - }, - { - "epoch": 0.8, - "learning_rate": 1.720170508777825e-06, - "loss": 0.6909, - "step": 31222 - }, - { - "epoch": 0.8, - "learning_rate": 1.7201513108210128e-06, - "loss": 0.7114, - "step": 31223 - }, - { - "epoch": 0.8, - "learning_rate": 1.7201321123128136e-06, - "loss": 1.0547, - "step": 31224 - }, - { - "epoch": 0.8, - "learning_rate": 1.7201129132532425e-06, - "loss": 0.606, - "step": 31225 - }, - { - "epoch": 0.8, - "learning_rate": 1.7200937136423142e-06, - "loss": 0.6963, - "step": 31226 - }, - { - "epoch": 0.8, - "learning_rate": 1.7200745134800428e-06, - "loss": 0.8701, - "step": 31227 - }, - { - "epoch": 0.8, - "learning_rate": 1.7200553127664438e-06, - "loss": 1.0273, - "step": 31228 - }, - { - "epoch": 0.8, - "learning_rate": 1.7200361115015315e-06, - "loss": 0.5615, - "step": 31229 - }, - { - "epoch": 0.8, - "learning_rate": 1.7200169096853205e-06, - "loss": 0.9971, - "step": 31230 - }, - { - "epoch": 0.8, - "learning_rate": 1.7199977073178257e-06, - "loss": 0.8672, - "step": 31231 - }, - { - "epoch": 0.8, - "learning_rate": 1.719978504399062e-06, - "loss": 0.4878, - "step": 31232 - }, - { - "epoch": 0.8, - "learning_rate": 1.7199593009290435e-06, - "loss": 0.8447, - "step": 31233 - }, - { - "epoch": 0.8, - "learning_rate": 1.7199400969077856e-06, - "loss": 0.8252, - "step": 31234 - }, - { - "epoch": 0.8, - "learning_rate": 1.7199208923353027e-06, - "loss": 0.917, - "step": 31235 - }, - { - "epoch": 0.8, - "learning_rate": 1.719901687211609e-06, - "loss": 0.8828, - "step": 31236 - }, - { - "epoch": 0.8, - "learning_rate": 1.71988248153672e-06, - "loss": 0.9287, - "step": 31237 - }, - { - "epoch": 0.8, - "learning_rate": 1.71986327531065e-06, - "loss": 0.6245, - "step": 31238 - }, - { - "epoch": 0.8, - "learning_rate": 1.7198440685334141e-06, - "loss": 0.6816, - "step": 31239 - }, - { - "epoch": 0.8, - "learning_rate": 1.7198248612050263e-06, - "loss": 0.7451, - "step": 31240 - }, - { - "epoch": 0.8, - "learning_rate": 1.719805653325502e-06, - "loss": 0.917, - "step": 31241 - }, - { - "epoch": 0.8, - "learning_rate": 1.7197864448948556e-06, - "loss": 0.6787, - "step": 31242 - }, - { - "epoch": 0.8, - "learning_rate": 1.7197672359131014e-06, - "loss": 0.7373, - "step": 31243 - }, - { - "epoch": 0.8, - "learning_rate": 1.7197480263802549e-06, - "loss": 0.8223, - "step": 31244 - }, - { - "epoch": 0.8, - "learning_rate": 1.7197288162963304e-06, - "loss": 0.8359, - "step": 31245 - }, - { - "epoch": 0.8, - "learning_rate": 1.7197096056613424e-06, - "loss": 0.9844, - "step": 31246 - }, - { - "epoch": 0.8, - "learning_rate": 1.719690394475306e-06, - "loss": 0.6466, - "step": 31247 - }, - { - "epoch": 0.8, - "learning_rate": 1.719671182738236e-06, - "loss": 1.0454, - "step": 31248 - }, - { - "epoch": 0.8, - "learning_rate": 1.7196519704501466e-06, - "loss": 0.6433, - "step": 31249 - }, - { - "epoch": 0.8, - "learning_rate": 1.7196327576110527e-06, - "loss": 0.8574, - "step": 31250 - }, - { - "epoch": 0.8, - "learning_rate": 1.7196135442209693e-06, - "loss": 0.7881, - "step": 31251 - }, - { - "epoch": 0.8, - "learning_rate": 1.7195943302799107e-06, - "loss": 0.9221, - "step": 31252 - }, - { - "epoch": 0.8, - "learning_rate": 1.719575115787892e-06, - "loss": 0.6362, - "step": 31253 - }, - { - "epoch": 0.8, - "learning_rate": 1.7195559007449277e-06, - "loss": 0.7678, - "step": 31254 - }, - { - "epoch": 0.8, - "learning_rate": 1.7195366851510325e-06, - "loss": 0.7871, - "step": 31255 - }, - { - "epoch": 0.8, - "learning_rate": 1.719517469006221e-06, - "loss": 0.9639, - "step": 31256 - }, - { - "epoch": 0.8, - "learning_rate": 1.7194982523105081e-06, - "loss": 0.8887, - "step": 31257 - }, - { - "epoch": 0.8, - "learning_rate": 1.7194790350639087e-06, - "loss": 0.9355, - "step": 31258 - }, - { - "epoch": 0.8, - "learning_rate": 1.7194598172664372e-06, - "loss": 1.0605, - "step": 31259 - }, - { - "epoch": 0.8, - "learning_rate": 1.7194405989181082e-06, - "loss": 1.0381, - "step": 31260 - }, - { - "epoch": 0.8, - "learning_rate": 1.7194213800189367e-06, - "loss": 0.9043, - "step": 31261 - }, - { - "epoch": 0.8, - "learning_rate": 1.7194021605689374e-06, - "loss": 0.998, - "step": 31262 - }, - { - "epoch": 0.8, - "learning_rate": 1.719382940568125e-06, - "loss": 0.5486, - "step": 31263 - }, - { - "epoch": 0.8, - "learning_rate": 1.7193637200165139e-06, - "loss": 0.9482, - "step": 31264 - }, - { - "epoch": 0.8, - "learning_rate": 1.7193444989141193e-06, - "loss": 0.791, - "step": 31265 - }, - { - "epoch": 0.8, - "learning_rate": 1.719325277260956e-06, - "loss": 0.7197, - "step": 31266 - }, - { - "epoch": 0.8, - "learning_rate": 1.719306055057038e-06, - "loss": 0.9258, - "step": 31267 - }, - { - "epoch": 0.8, - "learning_rate": 1.71928683230238e-06, - "loss": 0.9844, - "step": 31268 - }, - { - "epoch": 0.8, - "learning_rate": 1.719267608996998e-06, - "loss": 0.6836, - "step": 31269 - }, - { - "epoch": 0.8, - "learning_rate": 1.7192483851409055e-06, - "loss": 1.0176, - "step": 31270 - }, - { - "epoch": 0.8, - "learning_rate": 1.7192291607341174e-06, - "loss": 0.7939, - "step": 31271 - }, - { - "epoch": 0.8, - "learning_rate": 1.7192099357766489e-06, - "loss": 0.7307, - "step": 31272 - }, - { - "epoch": 0.8, - "learning_rate": 1.7191907102685143e-06, - "loss": 1.0488, - "step": 31273 - }, - { - "epoch": 0.8, - "learning_rate": 1.7191714842097284e-06, - "loss": 0.6807, - "step": 31274 - }, - { - "epoch": 0.8, - "learning_rate": 1.7191522576003061e-06, - "loss": 1.0723, - "step": 31275 - }, - { - "epoch": 0.8, - "learning_rate": 1.719133030440262e-06, - "loss": 0.9395, - "step": 31276 - }, - { - "epoch": 0.8, - "learning_rate": 1.7191138027296105e-06, - "loss": 0.8384, - "step": 31277 - }, - { - "epoch": 0.8, - "learning_rate": 1.7190945744683669e-06, - "loss": 1.0303, - "step": 31278 - }, - { - "epoch": 0.8, - "learning_rate": 1.7190753456565456e-06, - "loss": 0.835, - "step": 31279 - }, - { - "epoch": 0.8, - "learning_rate": 1.7190561162941614e-06, - "loss": 1.0078, - "step": 31280 - }, - { - "epoch": 0.8, - "learning_rate": 1.7190368863812287e-06, - "loss": 0.7979, - "step": 31281 - }, - { - "epoch": 0.8, - "learning_rate": 1.719017655917763e-06, - "loss": 0.8311, - "step": 31282 - }, - { - "epoch": 0.8, - "learning_rate": 1.7189984249037784e-06, - "loss": 0.9443, - "step": 31283 - }, - { - "epoch": 0.8, - "learning_rate": 1.7189791933392894e-06, - "loss": 0.8438, - "step": 31284 - }, - { - "epoch": 0.8, - "learning_rate": 1.7189599612243116e-06, - "loss": 0.4159, - "step": 31285 - }, - { - "epoch": 0.8, - "learning_rate": 1.718940728558859e-06, - "loss": 0.7905, - "step": 31286 - }, - { - "epoch": 0.8, - "learning_rate": 1.7189214953429466e-06, - "loss": 0.7554, - "step": 31287 - }, - { - "epoch": 0.8, - "learning_rate": 1.7189022615765887e-06, - "loss": 1.0059, - "step": 31288 - }, - { - "epoch": 0.8, - "learning_rate": 1.7188830272598008e-06, - "loss": 0.8462, - "step": 31289 - }, - { - "epoch": 0.8, - "learning_rate": 1.7188637923925971e-06, - "loss": 0.9072, - "step": 31290 - }, - { - "epoch": 0.8, - "learning_rate": 1.7188445569749925e-06, - "loss": 0.8223, - "step": 31291 - }, - { - "epoch": 0.8, - "learning_rate": 1.7188253210070016e-06, - "loss": 0.833, - "step": 31292 - }, - { - "epoch": 0.8, - "learning_rate": 1.7188060844886391e-06, - "loss": 0.7861, - "step": 31293 - }, - { - "epoch": 0.8, - "learning_rate": 1.7187868474199202e-06, - "loss": 0.9268, - "step": 31294 - }, - { - "epoch": 0.8, - "learning_rate": 1.7187676098008587e-06, - "loss": 0.8213, - "step": 31295 - }, - { - "epoch": 0.8, - "learning_rate": 1.7187483716314704e-06, - "loss": 0.8643, - "step": 31296 - }, - { - "epoch": 0.8, - "learning_rate": 1.7187291329117693e-06, - "loss": 0.8525, - "step": 31297 - }, - { - "epoch": 0.8, - "learning_rate": 1.7187098936417703e-06, - "loss": 0.9199, - "step": 31298 - }, - { - "epoch": 0.8, - "learning_rate": 1.7186906538214886e-06, - "loss": 1.0967, - "step": 31299 - }, - { - "epoch": 0.8, - "learning_rate": 1.718671413450938e-06, - "loss": 0.7021, - "step": 31300 - }, - { - "epoch": 0.8, - "learning_rate": 1.7186521725301339e-06, - "loss": 0.8369, - "step": 31301 - }, - { - "epoch": 0.8, - "learning_rate": 1.718632931059091e-06, - "loss": 0.8867, - "step": 31302 - }, - { - "epoch": 0.8, - "learning_rate": 1.7186136890378238e-06, - "loss": 0.7271, - "step": 31303 - }, - { - "epoch": 0.8, - "learning_rate": 1.718594446466347e-06, - "loss": 0.791, - "step": 31304 - }, - { - "epoch": 0.8, - "learning_rate": 1.7185752033446756e-06, - "loss": 0.8979, - "step": 31305 - }, - { - "epoch": 0.8, - "learning_rate": 1.7185559596728243e-06, - "loss": 0.8838, - "step": 31306 - }, - { - "epoch": 0.8, - "learning_rate": 1.7185367154508077e-06, - "loss": 0.6624, - "step": 31307 - }, - { - "epoch": 0.8, - "learning_rate": 1.7185174706786405e-06, - "loss": 0.6304, - "step": 31308 - }, - { - "epoch": 0.8, - "learning_rate": 1.7184982253563376e-06, - "loss": 1.1016, - "step": 31309 - }, - { - "epoch": 0.8, - "learning_rate": 1.7184789794839135e-06, - "loss": 0.9434, - "step": 31310 - }, - { - "epoch": 0.8, - "learning_rate": 1.7184597330613833e-06, - "loss": 0.8486, - "step": 31311 - }, - { - "epoch": 0.8, - "learning_rate": 1.7184404860887613e-06, - "loss": 0.9023, - "step": 31312 - }, - { - "epoch": 0.8, - "learning_rate": 1.7184212385660625e-06, - "loss": 0.5947, - "step": 31313 - }, - { - "epoch": 0.8, - "learning_rate": 1.7184019904933018e-06, - "loss": 0.9795, - "step": 31314 - }, - { - "epoch": 0.8, - "learning_rate": 1.7183827418704938e-06, - "loss": 1.0469, - "step": 31315 - }, - { - "epoch": 0.8, - "learning_rate": 1.7183634926976528e-06, - "loss": 0.9414, - "step": 31316 - }, - { - "epoch": 0.8, - "learning_rate": 1.718344242974794e-06, - "loss": 1.0869, - "step": 31317 - }, - { - "epoch": 0.8, - "learning_rate": 1.7183249927019321e-06, - "loss": 0.6885, - "step": 31318 - }, - { - "epoch": 0.8, - "learning_rate": 1.7183057418790818e-06, - "loss": 0.9902, - "step": 31319 - }, - { - "epoch": 0.8, - "learning_rate": 1.7182864905062577e-06, - "loss": 0.6494, - "step": 31320 - }, - { - "epoch": 0.8, - "learning_rate": 1.718267238583475e-06, - "loss": 0.832, - "step": 31321 - }, - { - "epoch": 0.8, - "learning_rate": 1.718247986110748e-06, - "loss": 0.8799, - "step": 31322 - }, - { - "epoch": 0.8, - "learning_rate": 1.7182287330880913e-06, - "loss": 0.7402, - "step": 31323 - }, - { - "epoch": 0.8, - "learning_rate": 1.71820947951552e-06, - "loss": 0.5845, - "step": 31324 - }, - { - "epoch": 0.8, - "learning_rate": 1.7181902253930486e-06, - "loss": 0.9385, - "step": 31325 - }, - { - "epoch": 0.8, - "learning_rate": 1.7181709707206921e-06, - "loss": 0.9287, - "step": 31326 - }, - { - "epoch": 0.8, - "learning_rate": 1.7181517154984651e-06, - "loss": 0.9131, - "step": 31327 - }, - { - "epoch": 0.8, - "learning_rate": 1.7181324597263824e-06, - "loss": 0.8965, - "step": 31328 - }, - { - "epoch": 0.8, - "learning_rate": 1.7181132034044587e-06, - "loss": 1.0986, - "step": 31329 - }, - { - "epoch": 0.8, - "learning_rate": 1.7180939465327087e-06, - "loss": 1.0684, - "step": 31330 - }, - { - "epoch": 0.8, - "learning_rate": 1.7180746891111471e-06, - "loss": 0.9248, - "step": 31331 - }, - { - "epoch": 0.8, - "learning_rate": 1.7180554311397887e-06, - "loss": 0.8271, - "step": 31332 - }, - { - "epoch": 0.8, - "learning_rate": 1.7180361726186483e-06, - "loss": 1.0674, - "step": 31333 - }, - { - "epoch": 0.8, - "learning_rate": 1.718016913547741e-06, - "loss": 0.7949, - "step": 31334 - }, - { - "epoch": 0.8, - "learning_rate": 1.717997653927081e-06, - "loss": 0.9697, - "step": 31335 - }, - { - "epoch": 0.8, - "learning_rate": 1.7179783937566827e-06, - "loss": 0.8926, - "step": 31336 - }, - { - "epoch": 0.8, - "learning_rate": 1.7179591330365617e-06, - "loss": 0.7891, - "step": 31337 - }, - { - "epoch": 0.8, - "learning_rate": 1.7179398717667323e-06, - "loss": 0.5605, - "step": 31338 - }, - { - "epoch": 0.8, - "learning_rate": 1.7179206099472096e-06, - "loss": 0.7568, - "step": 31339 - }, - { - "epoch": 0.8, - "learning_rate": 1.7179013475780079e-06, - "loss": 0.6387, - "step": 31340 - }, - { - "epoch": 0.8, - "learning_rate": 1.7178820846591423e-06, - "loss": 0.8613, - "step": 31341 - }, - { - "epoch": 0.8, - "learning_rate": 1.7178628211906275e-06, - "loss": 0.8379, - "step": 31342 - }, - { - "epoch": 0.8, - "learning_rate": 1.7178435571724782e-06, - "loss": 0.8652, - "step": 31343 - }, - { - "epoch": 0.8, - "learning_rate": 1.7178242926047086e-06, - "loss": 0.9834, - "step": 31344 - }, - { - "epoch": 0.8, - "learning_rate": 1.7178050274873343e-06, - "loss": 0.7803, - "step": 31345 - }, - { - "epoch": 0.8, - "learning_rate": 1.7177857618203694e-06, - "loss": 0.8984, - "step": 31346 - }, - { - "epoch": 0.8, - "learning_rate": 1.7177664956038295e-06, - "loss": 0.9199, - "step": 31347 - }, - { - "epoch": 0.8, - "learning_rate": 1.7177472288377284e-06, - "loss": 0.6509, - "step": 31348 - }, - { - "epoch": 0.8, - "learning_rate": 1.7177279615220812e-06, - "loss": 1.0049, - "step": 31349 - }, - { - "epoch": 0.8, - "learning_rate": 1.7177086936569028e-06, - "loss": 0.6841, - "step": 31350 - }, - { - "epoch": 0.8, - "learning_rate": 1.7176894252422078e-06, - "loss": 0.6843, - "step": 31351 - }, - { - "epoch": 0.8, - "learning_rate": 1.717670156278011e-06, - "loss": 0.6846, - "step": 31352 - }, - { - "epoch": 0.8, - "learning_rate": 1.7176508867643274e-06, - "loss": 0.9463, - "step": 31353 - }, - { - "epoch": 0.8, - "learning_rate": 1.7176316167011713e-06, - "loss": 0.7861, - "step": 31354 - }, - { - "epoch": 0.8, - "learning_rate": 1.7176123460885577e-06, - "loss": 1.0273, - "step": 31355 - }, - { - "epoch": 0.8, - "learning_rate": 1.7175930749265013e-06, - "loss": 0.875, - "step": 31356 - }, - { - "epoch": 0.8, - "learning_rate": 1.7175738032150168e-06, - "loss": 0.9062, - "step": 31357 - }, - { - "epoch": 0.8, - "learning_rate": 1.7175545309541192e-06, - "loss": 0.9521, - "step": 31358 - }, - { - "epoch": 0.8, - "learning_rate": 1.7175352581438229e-06, - "loss": 1.0322, - "step": 31359 - }, - { - "epoch": 0.8, - "learning_rate": 1.7175159847841431e-06, - "loss": 0.5898, - "step": 31360 - }, - { - "epoch": 0.8, - "learning_rate": 1.7174967108750943e-06, - "loss": 0.6841, - "step": 31361 - }, - { - "epoch": 0.8, - "learning_rate": 1.7174774364166913e-06, - "loss": 0.8152, - "step": 31362 - }, - { - "epoch": 0.8, - "learning_rate": 1.7174581614089486e-06, - "loss": 0.8486, - "step": 31363 - }, - { - "epoch": 0.8, - "learning_rate": 1.7174388858518811e-06, - "loss": 0.9727, - "step": 31364 - }, - { - "epoch": 0.8, - "learning_rate": 1.717419609745504e-06, - "loss": 0.6404, - "step": 31365 - }, - { - "epoch": 0.8, - "learning_rate": 1.7174003330898311e-06, - "loss": 0.9863, - "step": 31366 - }, - { - "epoch": 0.8, - "learning_rate": 1.7173810558848784e-06, - "loss": 0.8115, - "step": 31367 - }, - { - "epoch": 0.8, - "learning_rate": 1.7173617781306598e-06, - "loss": 0.5669, - "step": 31368 - }, - { - "epoch": 0.8, - "learning_rate": 1.71734249982719e-06, - "loss": 0.9082, - "step": 31369 - }, - { - "epoch": 0.8, - "learning_rate": 1.7173232209744843e-06, - "loss": 0.7622, - "step": 31370 - }, - { - "epoch": 0.8, - "learning_rate": 1.717303941572557e-06, - "loss": 0.896, - "step": 31371 - }, - { - "epoch": 0.8, - "learning_rate": 1.7172846616214232e-06, - "loss": 0.8916, - "step": 31372 - }, - { - "epoch": 0.8, - "learning_rate": 1.7172653811210975e-06, - "loss": 1.0059, - "step": 31373 - }, - { - "epoch": 0.8, - "learning_rate": 1.7172461000715948e-06, - "loss": 0.8335, - "step": 31374 - }, - { - "epoch": 0.8, - "learning_rate": 1.7172268184729295e-06, - "loss": 0.8818, - "step": 31375 - }, - { - "epoch": 0.8, - "learning_rate": 1.717207536325117e-06, - "loss": 0.8125, - "step": 31376 - }, - { - "epoch": 0.8, - "learning_rate": 1.7171882536281712e-06, - "loss": 0.8652, - "step": 31377 - }, - { - "epoch": 0.8, - "learning_rate": 1.7171689703821075e-06, - "loss": 0.8574, - "step": 31378 - }, - { - "epoch": 0.8, - "learning_rate": 1.7171496865869405e-06, - "loss": 0.6934, - "step": 31379 - }, - { - "epoch": 0.8, - "learning_rate": 1.7171304022426849e-06, - "loss": 0.9141, - "step": 31380 - }, - { - "epoch": 0.8, - "learning_rate": 1.7171111173493556e-06, - "loss": 0.5537, - "step": 31381 - }, - { - "epoch": 0.8, - "learning_rate": 1.7170918319069675e-06, - "loss": 1.0625, - "step": 31382 - }, - { - "epoch": 0.8, - "learning_rate": 1.717072545915535e-06, - "loss": 0.9648, - "step": 31383 - }, - { - "epoch": 0.8, - "learning_rate": 1.7170532593750728e-06, - "loss": 0.6079, - "step": 31384 - }, - { - "epoch": 0.8, - "learning_rate": 1.7170339722855962e-06, - "loss": 0.9717, - "step": 31385 - }, - { - "epoch": 0.8, - "learning_rate": 1.7170146846471193e-06, - "loss": 0.793, - "step": 31386 - }, - { - "epoch": 0.8, - "learning_rate": 1.7169953964596575e-06, - "loss": 1.0088, - "step": 31387 - }, - { - "epoch": 0.8, - "learning_rate": 1.7169761077232252e-06, - "loss": 0.7544, - "step": 31388 - }, - { - "epoch": 0.8, - "learning_rate": 1.7169568184378376e-06, - "loss": 1.0225, - "step": 31389 - }, - { - "epoch": 0.8, - "learning_rate": 1.7169375286035086e-06, - "loss": 0.9512, - "step": 31390 - }, - { - "epoch": 0.8, - "learning_rate": 1.7169182382202539e-06, - "loss": 1.1172, - "step": 31391 - }, - { - "epoch": 0.8, - "learning_rate": 1.7168989472880875e-06, - "loss": 0.7344, - "step": 31392 - }, - { - "epoch": 0.8, - "learning_rate": 1.7168796558070246e-06, - "loss": 0.686, - "step": 31393 - }, - { - "epoch": 0.8, - "learning_rate": 1.7168603637770802e-06, - "loss": 1.0449, - "step": 31394 - }, - { - "epoch": 0.8, - "learning_rate": 1.7168410711982686e-06, - "loss": 0.6147, - "step": 31395 - }, - { - "epoch": 0.8, - "learning_rate": 1.7168217780706047e-06, - "loss": 0.8525, - "step": 31396 - }, - { - "epoch": 0.8, - "learning_rate": 1.7168024843941036e-06, - "loss": 0.644, - "step": 31397 - }, - { - "epoch": 0.8, - "learning_rate": 1.7167831901687794e-06, - "loss": 0.792, - "step": 31398 - }, - { - "epoch": 0.8, - "learning_rate": 1.7167638953946477e-06, - "loss": 0.8818, - "step": 31399 - }, - { - "epoch": 0.8, - "learning_rate": 1.7167446000717225e-06, - "loss": 0.8506, - "step": 31400 - }, - { - "epoch": 0.8, - "learning_rate": 1.7167253042000191e-06, - "loss": 0.7822, - "step": 31401 - }, - { - "epoch": 0.8, - "learning_rate": 1.716706007779552e-06, - "loss": 0.7534, - "step": 31402 - }, - { - "epoch": 0.8, - "learning_rate": 1.716686710810336e-06, - "loss": 0.9375, - "step": 31403 - }, - { - "epoch": 0.8, - "learning_rate": 1.716667413292386e-06, - "loss": 0.6499, - "step": 31404 - }, - { - "epoch": 0.8, - "learning_rate": 1.716648115225717e-06, - "loss": 0.939, - "step": 31405 - }, - { - "epoch": 0.8, - "learning_rate": 1.716628816610343e-06, - "loss": 1.0137, - "step": 31406 - }, - { - "epoch": 0.8, - "learning_rate": 1.7166095174462795e-06, - "loss": 0.625, - "step": 31407 - }, - { - "epoch": 0.81, - "learning_rate": 1.7165902177335411e-06, - "loss": 0.7832, - "step": 31408 - }, - { - "epoch": 0.81, - "learning_rate": 1.7165709174721426e-06, - "loss": 0.5706, - "step": 31409 - }, - { - "epoch": 0.81, - "learning_rate": 1.7165516166620986e-06, - "loss": 0.7651, - "step": 31410 - }, - { - "epoch": 0.81, - "learning_rate": 1.716532315303424e-06, - "loss": 0.7783, - "step": 31411 - }, - { - "epoch": 0.81, - "learning_rate": 1.7165130133961335e-06, - "loss": 0.7578, - "step": 31412 - }, - { - "epoch": 0.81, - "learning_rate": 1.7164937109402418e-06, - "loss": 0.8438, - "step": 31413 - }, - { - "epoch": 0.81, - "learning_rate": 1.7164744079357641e-06, - "loss": 0.8545, - "step": 31414 - }, - { - "epoch": 0.81, - "learning_rate": 1.7164551043827147e-06, - "loss": 0.876, - "step": 31415 - }, - { - "epoch": 0.81, - "learning_rate": 1.7164358002811085e-06, - "loss": 0.7622, - "step": 31416 - }, - { - "epoch": 0.81, - "learning_rate": 1.7164164956309604e-06, - "loss": 0.9072, - "step": 31417 - }, - { - "epoch": 0.81, - "learning_rate": 1.7163971904322851e-06, - "loss": 0.8838, - "step": 31418 - }, - { - "epoch": 0.81, - "learning_rate": 1.7163778846850976e-06, - "loss": 0.9639, - "step": 31419 - }, - { - "epoch": 0.81, - "learning_rate": 1.7163585783894123e-06, - "loss": 0.8054, - "step": 31420 - }, - { - "epoch": 0.81, - "learning_rate": 1.7163392715452442e-06, - "loss": 0.769, - "step": 31421 - }, - { - "epoch": 0.81, - "learning_rate": 1.7163199641526082e-06, - "loss": 0.9873, - "step": 31422 - }, - { - "epoch": 0.81, - "learning_rate": 1.7163006562115188e-06, - "loss": 0.9043, - "step": 31423 - }, - { - "epoch": 0.81, - "learning_rate": 1.7162813477219912e-06, - "loss": 0.8301, - "step": 31424 - }, - { - "epoch": 0.81, - "learning_rate": 1.7162620386840394e-06, - "loss": 0.9434, - "step": 31425 - }, - { - "epoch": 0.81, - "learning_rate": 1.716242729097679e-06, - "loss": 0.8174, - "step": 31426 - }, - { - "epoch": 0.81, - "learning_rate": 1.7162234189629246e-06, - "loss": 0.9355, - "step": 31427 - }, - { - "epoch": 0.81, - "learning_rate": 1.7162041082797907e-06, - "loss": 1.0742, - "step": 31428 - }, - { - "epoch": 0.81, - "learning_rate": 1.7161847970482923e-06, - "loss": 0.8662, - "step": 31429 - }, - { - "epoch": 0.81, - "learning_rate": 1.7161654852684443e-06, - "loss": 0.6682, - "step": 31430 - }, - { - "epoch": 0.81, - "learning_rate": 1.716146172940261e-06, - "loss": 0.6797, - "step": 31431 - }, - { - "epoch": 0.81, - "learning_rate": 1.7161268600637574e-06, - "loss": 1.1807, - "step": 31432 - }, - { - "epoch": 0.81, - "learning_rate": 1.7161075466389487e-06, - "loss": 0.8252, - "step": 31433 - }, - { - "epoch": 0.81, - "learning_rate": 1.7160882326658493e-06, - "loss": 0.8311, - "step": 31434 - }, - { - "epoch": 0.81, - "learning_rate": 1.716068918144474e-06, - "loss": 1.0381, - "step": 31435 - }, - { - "epoch": 0.81, - "learning_rate": 1.7160496030748377e-06, - "loss": 0.8467, - "step": 31436 - }, - { - "epoch": 0.81, - "learning_rate": 1.7160302874569552e-06, - "loss": 0.7129, - "step": 31437 - }, - { - "epoch": 0.81, - "learning_rate": 1.7160109712908413e-06, - "loss": 0.8691, - "step": 31438 - }, - { - "epoch": 0.81, - "learning_rate": 1.7159916545765105e-06, - "loss": 0.9678, - "step": 31439 - }, - { - "epoch": 0.81, - "learning_rate": 1.7159723373139778e-06, - "loss": 0.9707, - "step": 31440 - }, - { - "epoch": 0.81, - "learning_rate": 1.7159530195032584e-06, - "loss": 0.873, - "step": 31441 - }, - { - "epoch": 0.81, - "learning_rate": 1.7159337011443663e-06, - "loss": 0.7612, - "step": 31442 - }, - { - "epoch": 0.81, - "learning_rate": 1.7159143822373169e-06, - "loss": 0.8369, - "step": 31443 - }, - { - "epoch": 0.81, - "learning_rate": 1.7158950627821244e-06, - "loss": 0.5562, - "step": 31444 - }, - { - "epoch": 0.81, - "learning_rate": 1.7158757427788045e-06, - "loss": 0.8149, - "step": 31445 - }, - { - "epoch": 0.81, - "learning_rate": 1.715856422227371e-06, - "loss": 0.707, - "step": 31446 - }, - { - "epoch": 0.81, - "learning_rate": 1.7158371011278395e-06, - "loss": 0.915, - "step": 31447 - }, - { - "epoch": 0.81, - "learning_rate": 1.7158177794802242e-06, - "loss": 0.752, - "step": 31448 - }, - { - "epoch": 0.81, - "learning_rate": 1.7157984572845403e-06, - "loss": 1.043, - "step": 31449 - }, - { - "epoch": 0.81, - "learning_rate": 1.7157791345408024e-06, - "loss": 0.7559, - "step": 31450 - }, - { - "epoch": 0.81, - "learning_rate": 1.7157598112490253e-06, - "loss": 0.8271, - "step": 31451 - }, - { - "epoch": 0.81, - "learning_rate": 1.7157404874092238e-06, - "loss": 0.9463, - "step": 31452 - }, - { - "epoch": 0.81, - "learning_rate": 1.7157211630214127e-06, - "loss": 0.7998, - "step": 31453 - }, - { - "epoch": 0.81, - "learning_rate": 1.715701838085607e-06, - "loss": 0.918, - "step": 31454 - }, - { - "epoch": 0.81, - "learning_rate": 1.715682512601821e-06, - "loss": 0.7314, - "step": 31455 - }, - { - "epoch": 0.81, - "learning_rate": 1.7156631865700701e-06, - "loss": 0.8164, - "step": 31456 - }, - { - "epoch": 0.81, - "learning_rate": 1.7156438599903686e-06, - "loss": 0.9609, - "step": 31457 - }, - { - "epoch": 0.81, - "learning_rate": 1.7156245328627316e-06, - "loss": 0.8311, - "step": 31458 - }, - { - "epoch": 0.81, - "learning_rate": 1.7156052051871738e-06, - "loss": 1.0059, - "step": 31459 - }, - { - "epoch": 0.81, - "learning_rate": 1.7155858769637102e-06, - "loss": 0.8428, - "step": 31460 - }, - { - "epoch": 0.81, - "learning_rate": 1.7155665481923552e-06, - "loss": 1.0049, - "step": 31461 - }, - { - "epoch": 0.81, - "learning_rate": 1.7155472188731238e-06, - "loss": 0.8916, - "step": 31462 - }, - { - "epoch": 0.81, - "learning_rate": 1.7155278890060306e-06, - "loss": 0.8086, - "step": 31463 - }, - { - "epoch": 0.81, - "learning_rate": 1.715508558591091e-06, - "loss": 1.0088, - "step": 31464 - }, - { - "epoch": 0.81, - "learning_rate": 1.715489227628319e-06, - "loss": 0.8467, - "step": 31465 - }, - { - "epoch": 0.81, - "learning_rate": 1.71546989611773e-06, - "loss": 0.77, - "step": 31466 - }, - { - "epoch": 0.81, - "learning_rate": 1.7154505640593386e-06, - "loss": 0.7305, - "step": 31467 - }, - { - "epoch": 0.81, - "learning_rate": 1.7154312314531597e-06, - "loss": 0.9707, - "step": 31468 - }, - { - "epoch": 0.81, - "learning_rate": 1.715411898299208e-06, - "loss": 0.9453, - "step": 31469 - }, - { - "epoch": 0.81, - "learning_rate": 1.715392564597498e-06, - "loss": 0.6025, - "step": 31470 - }, - { - "epoch": 0.81, - "learning_rate": 1.715373230348045e-06, - "loss": 0.8965, - "step": 31471 - }, - { - "epoch": 0.81, - "learning_rate": 1.7153538955508635e-06, - "loss": 0.8428, - "step": 31472 - }, - { - "epoch": 0.81, - "learning_rate": 1.7153345602059685e-06, - "loss": 0.6797, - "step": 31473 - }, - { - "epoch": 0.81, - "learning_rate": 1.7153152243133747e-06, - "loss": 0.8174, - "step": 31474 - }, - { - "epoch": 0.81, - "learning_rate": 1.715295887873097e-06, - "loss": 1.0596, - "step": 31475 - }, - { - "epoch": 0.81, - "learning_rate": 1.71527655088515e-06, - "loss": 1.0186, - "step": 31476 - }, - { - "epoch": 0.81, - "learning_rate": 1.715257213349549e-06, - "loss": 0.874, - "step": 31477 - }, - { - "epoch": 0.81, - "learning_rate": 1.715237875266308e-06, - "loss": 0.5916, - "step": 31478 - }, - { - "epoch": 0.81, - "learning_rate": 1.7152185366354424e-06, - "loss": 0.957, - "step": 31479 - }, - { - "epoch": 0.81, - "learning_rate": 1.715199197456967e-06, - "loss": 0.8955, - "step": 31480 - }, - { - "epoch": 0.81, - "learning_rate": 1.7151798577308963e-06, - "loss": 0.958, - "step": 31481 - }, - { - "epoch": 0.81, - "learning_rate": 1.7151605174572455e-06, - "loss": 0.9121, - "step": 31482 - }, - { - "epoch": 0.81, - "learning_rate": 1.715141176636029e-06, - "loss": 0.7686, - "step": 31483 - }, - { - "epoch": 0.81, - "learning_rate": 1.7151218352672613e-06, - "loss": 0.8145, - "step": 31484 - }, - { - "epoch": 0.81, - "learning_rate": 1.715102493350958e-06, - "loss": 0.8984, - "step": 31485 - }, - { - "epoch": 0.81, - "learning_rate": 1.715083150887134e-06, - "loss": 0.7236, - "step": 31486 - }, - { - "epoch": 0.81, - "learning_rate": 1.7150638078758035e-06, - "loss": 0.6587, - "step": 31487 - }, - { - "epoch": 0.81, - "learning_rate": 1.7150444643169816e-06, - "loss": 0.8298, - "step": 31488 - }, - { - "epoch": 0.81, - "learning_rate": 1.7150251202106829e-06, - "loss": 1.0342, - "step": 31489 - }, - { - "epoch": 0.81, - "learning_rate": 1.7150057755569222e-06, - "loss": 0.8936, - "step": 31490 - }, - { - "epoch": 0.81, - "learning_rate": 1.7149864303557147e-06, - "loss": 0.8921, - "step": 31491 - }, - { - "epoch": 0.81, - "learning_rate": 1.7149670846070748e-06, - "loss": 0.8418, - "step": 31492 - }, - { - "epoch": 0.81, - "learning_rate": 1.7149477383110176e-06, - "loss": 0.8203, - "step": 31493 - }, - { - "epoch": 0.81, - "learning_rate": 1.7149283914675578e-06, - "loss": 0.688, - "step": 31494 - }, - { - "epoch": 0.81, - "learning_rate": 1.7149090440767101e-06, - "loss": 1.0928, - "step": 31495 - }, - { - "epoch": 0.81, - "learning_rate": 1.7148896961384892e-06, - "loss": 0.9258, - "step": 31496 - }, - { - "epoch": 0.81, - "learning_rate": 1.7148703476529108e-06, - "loss": 0.8613, - "step": 31497 - }, - { - "epoch": 0.81, - "learning_rate": 1.7148509986199885e-06, - "loss": 0.7852, - "step": 31498 - }, - { - "epoch": 0.81, - "learning_rate": 1.714831649039738e-06, - "loss": 0.9863, - "step": 31499 - }, - { - "epoch": 0.81, - "learning_rate": 1.7148122989121734e-06, - "loss": 1.0596, - "step": 31500 - }, - { - "epoch": 0.81, - "learning_rate": 1.71479294823731e-06, - "loss": 0.7012, - "step": 31501 - }, - { - "epoch": 0.81, - "learning_rate": 1.7147735970151627e-06, - "loss": 0.5493, - "step": 31502 - }, - { - "epoch": 0.81, - "learning_rate": 1.7147542452457459e-06, - "loss": 0.6846, - "step": 31503 - }, - { - "epoch": 0.81, - "learning_rate": 1.7147348929290747e-06, - "loss": 0.8936, - "step": 31504 - }, - { - "epoch": 0.81, - "learning_rate": 1.714715540065164e-06, - "loss": 0.9014, - "step": 31505 - }, - { - "epoch": 0.81, - "learning_rate": 1.7146961866540284e-06, - "loss": 0.7236, - "step": 31506 - }, - { - "epoch": 0.81, - "learning_rate": 1.7146768326956827e-06, - "loss": 0.7188, - "step": 31507 - }, - { - "epoch": 0.81, - "learning_rate": 1.714657478190142e-06, - "loss": 0.8379, - "step": 31508 - }, - { - "epoch": 0.81, - "learning_rate": 1.7146381231374205e-06, - "loss": 0.7852, - "step": 31509 - }, - { - "epoch": 0.81, - "learning_rate": 1.714618767537534e-06, - "loss": 0.8682, - "step": 31510 - }, - { - "epoch": 0.81, - "learning_rate": 1.7145994113904965e-06, - "loss": 0.708, - "step": 31511 - }, - { - "epoch": 0.81, - "learning_rate": 1.7145800546963233e-06, - "loss": 0.7598, - "step": 31512 - }, - { - "epoch": 0.81, - "learning_rate": 1.7145606974550283e-06, - "loss": 0.9678, - "step": 31513 - }, - { - "epoch": 0.81, - "learning_rate": 1.7145413396666278e-06, - "loss": 1.0557, - "step": 31514 - }, - { - "epoch": 0.81, - "learning_rate": 1.7145219813311355e-06, - "loss": 1.0029, - "step": 31515 - }, - { - "epoch": 0.81, - "learning_rate": 1.7145026224485669e-06, - "loss": 0.8096, - "step": 31516 - }, - { - "epoch": 0.81, - "learning_rate": 1.7144832630189363e-06, - "loss": 0.6533, - "step": 31517 - }, - { - "epoch": 0.81, - "learning_rate": 1.7144639030422586e-06, - "loss": 0.8975, - "step": 31518 - }, - { - "epoch": 0.81, - "learning_rate": 1.7144445425185488e-06, - "loss": 0.7808, - "step": 31519 - }, - { - "epoch": 0.81, - "learning_rate": 1.7144251814478217e-06, - "loss": 0.8252, - "step": 31520 - }, - { - "epoch": 0.81, - "learning_rate": 1.714405819830092e-06, - "loss": 0.8594, - "step": 31521 - }, - { - "epoch": 0.81, - "learning_rate": 1.7143864576653748e-06, - "loss": 0.75, - "step": 31522 - }, - { - "epoch": 0.81, - "learning_rate": 1.7143670949536847e-06, - "loss": 0.7554, - "step": 31523 - }, - { - "epoch": 0.81, - "learning_rate": 1.7143477316950366e-06, - "loss": 0.7363, - "step": 31524 - }, - { - "epoch": 0.81, - "learning_rate": 1.714328367889445e-06, - "loss": 1.0303, - "step": 31525 - }, - { - "epoch": 0.81, - "learning_rate": 1.7143090035369253e-06, - "loss": 0.8701, - "step": 31526 - }, - { - "epoch": 0.81, - "learning_rate": 1.714289638637492e-06, - "loss": 0.957, - "step": 31527 - }, - { - "epoch": 0.81, - "learning_rate": 1.7142702731911598e-06, - "loss": 1.167, - "step": 31528 - }, - { - "epoch": 0.81, - "learning_rate": 1.7142509071979437e-06, - "loss": 0.8418, - "step": 31529 - }, - { - "epoch": 0.81, - "learning_rate": 1.7142315406578586e-06, - "loss": 0.8667, - "step": 31530 - }, - { - "epoch": 0.81, - "learning_rate": 1.714212173570919e-06, - "loss": 0.8818, - "step": 31531 - }, - { - "epoch": 0.81, - "learning_rate": 1.7141928059371406e-06, - "loss": 0.7852, - "step": 31532 - }, - { - "epoch": 0.81, - "learning_rate": 1.7141734377565374e-06, - "loss": 0.5671, - "step": 31533 - }, - { - "epoch": 0.81, - "learning_rate": 1.7141540690291244e-06, - "loss": 0.6848, - "step": 31534 - }, - { - "epoch": 0.81, - "learning_rate": 1.7141346997549162e-06, - "loss": 0.7695, - "step": 31535 - }, - { - "epoch": 0.81, - "learning_rate": 1.7141153299339282e-06, - "loss": 0.5859, - "step": 31536 - }, - { - "epoch": 0.81, - "learning_rate": 1.7140959595661745e-06, - "loss": 1.0, - "step": 31537 - }, - { - "epoch": 0.81, - "learning_rate": 1.7140765886516707e-06, - "loss": 0.9492, - "step": 31538 - }, - { - "epoch": 0.81, - "learning_rate": 1.7140572171904314e-06, - "loss": 0.7988, - "step": 31539 - }, - { - "epoch": 0.81, - "learning_rate": 1.7140378451824708e-06, - "loss": 0.8359, - "step": 31540 - }, - { - "epoch": 0.81, - "learning_rate": 1.7140184726278048e-06, - "loss": 1.0283, - "step": 31541 - }, - { - "epoch": 0.81, - "learning_rate": 1.7139990995264475e-06, - "loss": 0.7466, - "step": 31542 - }, - { - "epoch": 0.81, - "learning_rate": 1.7139797258784139e-06, - "loss": 0.791, - "step": 31543 - }, - { - "epoch": 0.81, - "learning_rate": 1.7139603516837192e-06, - "loss": 0.791, - "step": 31544 - }, - { - "epoch": 0.81, - "learning_rate": 1.713940976942377e-06, - "loss": 0.7896, - "step": 31545 - }, - { - "epoch": 0.81, - "learning_rate": 1.713921601654404e-06, - "loss": 0.8594, - "step": 31546 - }, - { - "epoch": 0.81, - "learning_rate": 1.7139022258198135e-06, - "loss": 0.625, - "step": 31547 - }, - { - "epoch": 0.81, - "learning_rate": 1.7138828494386211e-06, - "loss": 0.9971, - "step": 31548 - }, - { - "epoch": 0.81, - "learning_rate": 1.7138634725108414e-06, - "loss": 0.8975, - "step": 31549 - }, - { - "epoch": 0.81, - "learning_rate": 1.713844095036489e-06, - "loss": 0.96, - "step": 31550 - }, - { - "epoch": 0.81, - "learning_rate": 1.7138247170155795e-06, - "loss": 1.043, - "step": 31551 - }, - { - "epoch": 0.81, - "learning_rate": 1.713805338448127e-06, - "loss": 0.7788, - "step": 31552 - }, - { - "epoch": 0.81, - "learning_rate": 1.7137859593341465e-06, - "loss": 0.7385, - "step": 31553 - }, - { - "epoch": 0.81, - "learning_rate": 1.7137665796736527e-06, - "loss": 0.8936, - "step": 31554 - }, - { - "epoch": 0.81, - "learning_rate": 1.713747199466661e-06, - "loss": 0.7202, - "step": 31555 - }, - { - "epoch": 0.81, - "learning_rate": 1.7137278187131858e-06, - "loss": 0.7266, - "step": 31556 - }, - { - "epoch": 0.81, - "learning_rate": 1.713708437413242e-06, - "loss": 0.9395, - "step": 31557 - }, - { - "epoch": 0.81, - "learning_rate": 1.7136890555668444e-06, - "loss": 0.748, - "step": 31558 - }, - { - "epoch": 0.81, - "learning_rate": 1.713669673174008e-06, - "loss": 0.9648, - "step": 31559 - }, - { - "epoch": 0.81, - "learning_rate": 1.7136502902347477e-06, - "loss": 1.0635, - "step": 31560 - }, - { - "epoch": 0.81, - "learning_rate": 1.713630906749078e-06, - "loss": 0.7246, - "step": 31561 - }, - { - "epoch": 0.81, - "learning_rate": 1.7136115227170139e-06, - "loss": 0.9805, - "step": 31562 - }, - { - "epoch": 0.81, - "learning_rate": 1.7135921381385702e-06, - "loss": 0.9756, - "step": 31563 - }, - { - "epoch": 0.81, - "learning_rate": 1.7135727530137621e-06, - "loss": 0.9541, - "step": 31564 - }, - { - "epoch": 0.81, - "learning_rate": 1.713553367342604e-06, - "loss": 0.8057, - "step": 31565 - }, - { - "epoch": 0.81, - "learning_rate": 1.713533981125111e-06, - "loss": 0.666, - "step": 31566 - }, - { - "epoch": 0.81, - "learning_rate": 1.7135145943612974e-06, - "loss": 0.8662, - "step": 31567 - }, - { - "epoch": 0.81, - "learning_rate": 1.7134952070511789e-06, - "loss": 0.8604, - "step": 31568 - }, - { - "epoch": 0.81, - "learning_rate": 1.71347581919477e-06, - "loss": 0.875, - "step": 31569 - }, - { - "epoch": 0.81, - "learning_rate": 1.7134564307920854e-06, - "loss": 0.9893, - "step": 31570 - }, - { - "epoch": 0.81, - "learning_rate": 1.7134370418431395e-06, - "loss": 0.6816, - "step": 31571 - }, - { - "epoch": 0.81, - "learning_rate": 1.7134176523479483e-06, - "loss": 0.8257, - "step": 31572 - }, - { - "epoch": 0.81, - "learning_rate": 1.7133982623065258e-06, - "loss": 0.8652, - "step": 31573 - }, - { - "epoch": 0.81, - "learning_rate": 1.713378871718887e-06, - "loss": 0.8896, - "step": 31574 - }, - { - "epoch": 0.81, - "learning_rate": 1.7133594805850469e-06, - "loss": 0.5898, - "step": 31575 - }, - { - "epoch": 0.81, - "learning_rate": 1.7133400889050203e-06, - "loss": 0.9551, - "step": 31576 - }, - { - "epoch": 0.81, - "learning_rate": 1.7133206966788216e-06, - "loss": 0.6616, - "step": 31577 - }, - { - "epoch": 0.81, - "learning_rate": 1.7133013039064666e-06, - "loss": 0.7788, - "step": 31578 - }, - { - "epoch": 0.81, - "learning_rate": 1.7132819105879692e-06, - "loss": 0.917, - "step": 31579 - }, - { - "epoch": 0.81, - "learning_rate": 1.7132625167233447e-06, - "loss": 0.7202, - "step": 31580 - }, - { - "epoch": 0.81, - "learning_rate": 1.713243122312608e-06, - "loss": 0.877, - "step": 31581 - }, - { - "epoch": 0.81, - "learning_rate": 1.7132237273557737e-06, - "loss": 0.6106, - "step": 31582 - }, - { - "epoch": 0.81, - "learning_rate": 1.7132043318528568e-06, - "loss": 1.0264, - "step": 31583 - }, - { - "epoch": 0.81, - "learning_rate": 1.7131849358038724e-06, - "loss": 0.7744, - "step": 31584 - }, - { - "epoch": 0.81, - "learning_rate": 1.713165539208835e-06, - "loss": 0.8926, - "step": 31585 - }, - { - "epoch": 0.81, - "learning_rate": 1.7131461420677593e-06, - "loss": 0.9385, - "step": 31586 - }, - { - "epoch": 0.81, - "learning_rate": 1.7131267443806606e-06, - "loss": 0.8154, - "step": 31587 - }, - { - "epoch": 0.81, - "learning_rate": 1.713107346147553e-06, - "loss": 0.7803, - "step": 31588 - }, - { - "epoch": 0.81, - "learning_rate": 1.7130879473684527e-06, - "loss": 0.8662, - "step": 31589 - }, - { - "epoch": 0.81, - "learning_rate": 1.7130685480433736e-06, - "loss": 0.8252, - "step": 31590 - }, - { - "epoch": 0.81, - "learning_rate": 1.7130491481723303e-06, - "loss": 0.9609, - "step": 31591 - }, - { - "epoch": 0.81, - "learning_rate": 1.7130297477553382e-06, - "loss": 0.9189, - "step": 31592 - }, - { - "epoch": 0.81, - "learning_rate": 1.7130103467924122e-06, - "loss": 1.002, - "step": 31593 - }, - { - "epoch": 0.81, - "learning_rate": 1.7129909452835668e-06, - "loss": 0.8164, - "step": 31594 - }, - { - "epoch": 0.81, - "learning_rate": 1.712971543228817e-06, - "loss": 0.8394, - "step": 31595 - }, - { - "epoch": 0.81, - "learning_rate": 1.7129521406281778e-06, - "loss": 0.8735, - "step": 31596 - }, - { - "epoch": 0.81, - "learning_rate": 1.7129327374816636e-06, - "loss": 0.6709, - "step": 31597 - }, - { - "epoch": 0.81, - "learning_rate": 1.7129133337892898e-06, - "loss": 0.9795, - "step": 31598 - }, - { - "epoch": 0.81, - "learning_rate": 1.7128939295510714e-06, - "loss": 0.6934, - "step": 31599 - }, - { - "epoch": 0.81, - "learning_rate": 1.7128745247670225e-06, - "loss": 0.6772, - "step": 31600 - }, - { - "epoch": 0.81, - "learning_rate": 1.7128551194371582e-06, - "loss": 0.6548, - "step": 31601 - }, - { - "epoch": 0.81, - "learning_rate": 1.712835713561494e-06, - "loss": 1.0391, - "step": 31602 - }, - { - "epoch": 0.81, - "learning_rate": 1.7128163071400439e-06, - "loss": 0.73, - "step": 31603 - }, - { - "epoch": 0.81, - "learning_rate": 1.7127969001728232e-06, - "loss": 0.9814, - "step": 31604 - }, - { - "epoch": 0.81, - "learning_rate": 1.7127774926598465e-06, - "loss": 0.8389, - "step": 31605 - }, - { - "epoch": 0.81, - "learning_rate": 1.7127580846011295e-06, - "loss": 0.9756, - "step": 31606 - }, - { - "epoch": 0.81, - "learning_rate": 1.712738675996686e-06, - "loss": 0.8025, - "step": 31607 - }, - { - "epoch": 0.81, - "learning_rate": 1.7127192668465312e-06, - "loss": 0.9297, - "step": 31608 - }, - { - "epoch": 0.81, - "learning_rate": 1.71269985715068e-06, - "loss": 0.9409, - "step": 31609 - }, - { - "epoch": 0.81, - "learning_rate": 1.7126804469091473e-06, - "loss": 0.7236, - "step": 31610 - }, - { - "epoch": 0.81, - "learning_rate": 1.7126610361219482e-06, - "loss": 0.7905, - "step": 31611 - }, - { - "epoch": 0.81, - "learning_rate": 1.7126416247890969e-06, - "loss": 0.8906, - "step": 31612 - }, - { - "epoch": 0.81, - "learning_rate": 1.7126222129106091e-06, - "loss": 0.6943, - "step": 31613 - }, - { - "epoch": 0.81, - "learning_rate": 1.712602800486499e-06, - "loss": 0.8184, - "step": 31614 - }, - { - "epoch": 0.81, - "learning_rate": 1.7125833875167817e-06, - "loss": 0.665, - "step": 31615 - }, - { - "epoch": 0.81, - "learning_rate": 1.712563974001472e-06, - "loss": 1.0322, - "step": 31616 - }, - { - "epoch": 0.81, - "learning_rate": 1.7125445599405853e-06, - "loss": 0.7979, - "step": 31617 - }, - { - "epoch": 0.81, - "learning_rate": 1.7125251453341356e-06, - "loss": 0.957, - "step": 31618 - }, - { - "epoch": 0.81, - "learning_rate": 1.7125057301821379e-06, - "loss": 0.5947, - "step": 31619 - }, - { - "epoch": 0.81, - "learning_rate": 1.7124863144846077e-06, - "loss": 0.5942, - "step": 31620 - }, - { - "epoch": 0.81, - "learning_rate": 1.7124668982415595e-06, - "loss": 0.8525, - "step": 31621 - }, - { - "epoch": 0.81, - "learning_rate": 1.7124474814530081e-06, - "loss": 0.804, - "step": 31622 - }, - { - "epoch": 0.81, - "learning_rate": 1.7124280641189684e-06, - "loss": 0.793, - "step": 31623 - }, - { - "epoch": 0.81, - "learning_rate": 1.712408646239455e-06, - "loss": 0.7119, - "step": 31624 - }, - { - "epoch": 0.81, - "learning_rate": 1.7123892278144835e-06, - "loss": 0.9463, - "step": 31625 - }, - { - "epoch": 0.81, - "learning_rate": 1.7123698088440684e-06, - "loss": 0.9053, - "step": 31626 - }, - { - "epoch": 0.81, - "learning_rate": 1.712350389328224e-06, - "loss": 0.8975, - "step": 31627 - }, - { - "epoch": 0.81, - "learning_rate": 1.7123309692669658e-06, - "loss": 0.7656, - "step": 31628 - }, - { - "epoch": 0.81, - "learning_rate": 1.7123115486603088e-06, - "loss": 0.9834, - "step": 31629 - }, - { - "epoch": 0.81, - "learning_rate": 1.7122921275082677e-06, - "loss": 0.9111, - "step": 31630 - }, - { - "epoch": 0.81, - "learning_rate": 1.712272705810857e-06, - "loss": 0.7271, - "step": 31631 - }, - { - "epoch": 0.81, - "learning_rate": 1.7122532835680916e-06, - "loss": 1.124, - "step": 31632 - }, - { - "epoch": 0.81, - "learning_rate": 1.712233860779987e-06, - "loss": 1.2744, - "step": 31633 - }, - { - "epoch": 0.81, - "learning_rate": 1.7122144374465575e-06, - "loss": 0.854, - "step": 31634 - }, - { - "epoch": 0.81, - "learning_rate": 1.7121950135678182e-06, - "loss": 0.8848, - "step": 31635 - }, - { - "epoch": 0.81, - "learning_rate": 1.7121755891437842e-06, - "loss": 0.9111, - "step": 31636 - }, - { - "epoch": 0.81, - "learning_rate": 1.7121561641744696e-06, - "loss": 0.7334, - "step": 31637 - }, - { - "epoch": 0.81, - "learning_rate": 1.71213673865989e-06, - "loss": 0.8086, - "step": 31638 - }, - { - "epoch": 0.81, - "learning_rate": 1.7121173126000602e-06, - "loss": 0.999, - "step": 31639 - }, - { - "epoch": 0.81, - "learning_rate": 1.7120978859949945e-06, - "loss": 1.042, - "step": 31640 - }, - { - "epoch": 0.81, - "learning_rate": 1.7120784588447086e-06, - "loss": 0.5464, - "step": 31641 - }, - { - "epoch": 0.81, - "learning_rate": 1.712059031149217e-06, - "loss": 0.8887, - "step": 31642 - }, - { - "epoch": 0.81, - "learning_rate": 1.712039602908534e-06, - "loss": 0.9321, - "step": 31643 - }, - { - "epoch": 0.81, - "learning_rate": 1.7120201741226756e-06, - "loss": 0.8315, - "step": 31644 - }, - { - "epoch": 0.81, - "learning_rate": 1.7120007447916559e-06, - "loss": 1.0566, - "step": 31645 - }, - { - "epoch": 0.81, - "learning_rate": 1.7119813149154898e-06, - "loss": 0.9346, - "step": 31646 - }, - { - "epoch": 0.81, - "learning_rate": 1.7119618844941926e-06, - "loss": 0.7676, - "step": 31647 - }, - { - "epoch": 0.81, - "learning_rate": 1.7119424535277788e-06, - "loss": 0.8623, - "step": 31648 - }, - { - "epoch": 0.81, - "learning_rate": 1.7119230220162634e-06, - "loss": 0.6523, - "step": 31649 - }, - { - "epoch": 0.81, - "learning_rate": 1.7119035899596615e-06, - "loss": 0.5405, - "step": 31650 - }, - { - "epoch": 0.81, - "learning_rate": 1.7118841573579873e-06, - "loss": 0.9131, - "step": 31651 - }, - { - "epoch": 0.81, - "learning_rate": 1.7118647242112566e-06, - "loss": 0.7017, - "step": 31652 - }, - { - "epoch": 0.81, - "learning_rate": 1.7118452905194834e-06, - "loss": 0.815, - "step": 31653 - }, - { - "epoch": 0.81, - "learning_rate": 1.7118258562826833e-06, - "loss": 0.8887, - "step": 31654 - }, - { - "epoch": 0.81, - "learning_rate": 1.7118064215008707e-06, - "loss": 0.9854, - "step": 31655 - }, - { - "epoch": 0.81, - "learning_rate": 1.7117869861740605e-06, - "loss": 0.5005, - "step": 31656 - }, - { - "epoch": 0.81, - "learning_rate": 1.7117675503022682e-06, - "loss": 0.8979, - "step": 31657 - }, - { - "epoch": 0.81, - "learning_rate": 1.711748113885508e-06, - "loss": 0.7466, - "step": 31658 - }, - { - "epoch": 0.81, - "learning_rate": 1.7117286769237948e-06, - "loss": 1.1523, - "step": 31659 - }, - { - "epoch": 0.81, - "learning_rate": 1.7117092394171438e-06, - "loss": 0.8848, - "step": 31660 - }, - { - "epoch": 0.81, - "learning_rate": 1.71168980136557e-06, - "loss": 0.875, - "step": 31661 - }, - { - "epoch": 0.81, - "learning_rate": 1.7116703627690878e-06, - "loss": 0.4827, - "step": 31662 - }, - { - "epoch": 0.81, - "learning_rate": 1.7116509236277122e-06, - "loss": 0.6553, - "step": 31663 - }, - { - "epoch": 0.81, - "learning_rate": 1.7116314839414585e-06, - "loss": 0.8198, - "step": 31664 - }, - { - "epoch": 0.81, - "learning_rate": 1.7116120437103411e-06, - "loss": 0.7329, - "step": 31665 - }, - { - "epoch": 0.81, - "learning_rate": 1.7115926029343753e-06, - "loss": 0.8428, - "step": 31666 - }, - { - "epoch": 0.81, - "learning_rate": 1.7115731616135754e-06, - "loss": 0.9219, - "step": 31667 - }, - { - "epoch": 0.81, - "learning_rate": 1.7115537197479568e-06, - "loss": 0.9346, - "step": 31668 - }, - { - "epoch": 0.81, - "learning_rate": 1.7115342773375346e-06, - "loss": 0.9229, - "step": 31669 - }, - { - "epoch": 0.81, - "learning_rate": 1.711514834382323e-06, - "loss": 0.8242, - "step": 31670 - }, - { - "epoch": 0.81, - "learning_rate": 1.7114953908823371e-06, - "loss": 0.8301, - "step": 31671 - }, - { - "epoch": 0.81, - "learning_rate": 1.711475946837592e-06, - "loss": 0.9365, - "step": 31672 - }, - { - "epoch": 0.81, - "learning_rate": 1.7114565022481023e-06, - "loss": 0.79, - "step": 31673 - }, - { - "epoch": 0.81, - "learning_rate": 1.7114370571138835e-06, - "loss": 0.6304, - "step": 31674 - }, - { - "epoch": 0.81, - "learning_rate": 1.7114176114349496e-06, - "loss": 0.9043, - "step": 31675 - }, - { - "epoch": 0.81, - "learning_rate": 1.7113981652113163e-06, - "loss": 0.9678, - "step": 31676 - }, - { - "epoch": 0.81, - "learning_rate": 1.711378718442998e-06, - "loss": 0.9453, - "step": 31677 - }, - { - "epoch": 0.81, - "learning_rate": 1.7113592711300098e-06, - "loss": 1.0166, - "step": 31678 - }, - { - "epoch": 0.81, - "learning_rate": 1.7113398232723664e-06, - "loss": 1.0088, - "step": 31679 - }, - { - "epoch": 0.81, - "learning_rate": 1.7113203748700829e-06, - "loss": 0.5432, - "step": 31680 - }, - { - "epoch": 0.81, - "learning_rate": 1.7113009259231741e-06, - "loss": 0.7109, - "step": 31681 - }, - { - "epoch": 0.81, - "learning_rate": 1.7112814764316547e-06, - "loss": 0.7793, - "step": 31682 - }, - { - "epoch": 0.81, - "learning_rate": 1.71126202639554e-06, - "loss": 0.9785, - "step": 31683 - }, - { - "epoch": 0.81, - "learning_rate": 1.7112425758148446e-06, - "loss": 0.7539, - "step": 31684 - }, - { - "epoch": 0.81, - "learning_rate": 1.7112231246895833e-06, - "loss": 0.9238, - "step": 31685 - }, - { - "epoch": 0.81, - "learning_rate": 1.7112036730197713e-06, - "loss": 0.9775, - "step": 31686 - }, - { - "epoch": 0.81, - "learning_rate": 1.7111842208054235e-06, - "loss": 0.918, - "step": 31687 - }, - { - "epoch": 0.81, - "learning_rate": 1.7111647680465543e-06, - "loss": 0.8564, - "step": 31688 - }, - { - "epoch": 0.81, - "learning_rate": 1.7111453147431792e-06, - "loss": 0.8496, - "step": 31689 - }, - { - "epoch": 0.81, - "learning_rate": 1.7111258608953128e-06, - "loss": 1.0068, - "step": 31690 - }, - { - "epoch": 0.81, - "learning_rate": 1.7111064065029698e-06, - "loss": 0.9365, - "step": 31691 - }, - { - "epoch": 0.81, - "learning_rate": 1.7110869515661657e-06, - "loss": 0.8584, - "step": 31692 - }, - { - "epoch": 0.81, - "learning_rate": 1.711067496084915e-06, - "loss": 0.876, - "step": 31693 - }, - { - "epoch": 0.81, - "learning_rate": 1.7110480400592322e-06, - "loss": 0.8271, - "step": 31694 - }, - { - "epoch": 0.81, - "learning_rate": 1.7110285834891332e-06, - "loss": 0.6111, - "step": 31695 - }, - { - "epoch": 0.81, - "learning_rate": 1.7110091263746317e-06, - "loss": 1.0117, - "step": 31696 - }, - { - "epoch": 0.81, - "learning_rate": 1.7109896687157437e-06, - "loss": 0.7432, - "step": 31697 - }, - { - "epoch": 0.81, - "learning_rate": 1.7109702105124833e-06, - "loss": 0.8574, - "step": 31698 - }, - { - "epoch": 0.81, - "learning_rate": 1.7109507517648659e-06, - "loss": 0.4272, - "step": 31699 - }, - { - "epoch": 0.81, - "learning_rate": 1.7109312924729057e-06, - "loss": 0.7622, - "step": 31700 - }, - { - "epoch": 0.81, - "learning_rate": 1.7109118326366187e-06, - "loss": 0.9658, - "step": 31701 - }, - { - "epoch": 0.81, - "learning_rate": 1.710892372256019e-06, - "loss": 1.0967, - "step": 31702 - }, - { - "epoch": 0.81, - "learning_rate": 1.7108729113311218e-06, - "loss": 0.6372, - "step": 31703 - }, - { - "epoch": 0.81, - "learning_rate": 1.7108534498619416e-06, - "loss": 0.707, - "step": 31704 - }, - { - "epoch": 0.81, - "learning_rate": 1.7108339878484936e-06, - "loss": 0.998, - "step": 31705 - }, - { - "epoch": 0.81, - "learning_rate": 1.710814525290793e-06, - "loss": 0.7935, - "step": 31706 - }, - { - "epoch": 0.81, - "learning_rate": 1.7107950621888543e-06, - "loss": 0.8154, - "step": 31707 - }, - { - "epoch": 0.81, - "learning_rate": 1.7107755985426925e-06, - "loss": 0.791, - "step": 31708 - }, - { - "epoch": 0.81, - "learning_rate": 1.7107561343523224e-06, - "loss": 0.9219, - "step": 31709 - }, - { - "epoch": 0.81, - "learning_rate": 1.7107366696177593e-06, - "loss": 1.0156, - "step": 31710 - }, - { - "epoch": 0.81, - "learning_rate": 1.7107172043390175e-06, - "loss": 1.1221, - "step": 31711 - }, - { - "epoch": 0.81, - "learning_rate": 1.7106977385161122e-06, - "loss": 0.875, - "step": 31712 - }, - { - "epoch": 0.81, - "learning_rate": 1.7106782721490585e-06, - "loss": 0.8882, - "step": 31713 - }, - { - "epoch": 0.81, - "learning_rate": 1.710658805237871e-06, - "loss": 0.6064, - "step": 31714 - }, - { - "epoch": 0.81, - "learning_rate": 1.710639337782565e-06, - "loss": 0.707, - "step": 31715 - }, - { - "epoch": 0.81, - "learning_rate": 1.710619869783155e-06, - "loss": 0.7026, - "step": 31716 - }, - { - "epoch": 0.81, - "learning_rate": 1.7106004012396557e-06, - "loss": 1.0264, - "step": 31717 - }, - { - "epoch": 0.81, - "learning_rate": 1.7105809321520827e-06, - "loss": 0.6914, - "step": 31718 - }, - { - "epoch": 0.81, - "learning_rate": 1.7105614625204504e-06, - "loss": 0.9033, - "step": 31719 - }, - { - "epoch": 0.81, - "learning_rate": 1.710541992344774e-06, - "loss": 0.7705, - "step": 31720 - }, - { - "epoch": 0.81, - "learning_rate": 1.7105225216250682e-06, - "loss": 0.605, - "step": 31721 - }, - { - "epoch": 0.81, - "learning_rate": 1.710503050361348e-06, - "loss": 0.7803, - "step": 31722 - }, - { - "epoch": 0.81, - "learning_rate": 1.7104835785536285e-06, - "loss": 0.8516, - "step": 31723 - }, - { - "epoch": 0.81, - "learning_rate": 1.710464106201924e-06, - "loss": 0.6602, - "step": 31724 - }, - { - "epoch": 0.81, - "learning_rate": 1.7104446333062498e-06, - "loss": 1.082, - "step": 31725 - }, - { - "epoch": 0.81, - "learning_rate": 1.710425159866621e-06, - "loss": 0.8154, - "step": 31726 - }, - { - "epoch": 0.81, - "learning_rate": 1.7104056858830523e-06, - "loss": 0.7158, - "step": 31727 - }, - { - "epoch": 0.81, - "learning_rate": 1.7103862113555584e-06, - "loss": 0.8613, - "step": 31728 - }, - { - "epoch": 0.81, - "learning_rate": 1.710366736284155e-06, - "loss": 1.0176, - "step": 31729 - }, - { - "epoch": 0.81, - "learning_rate": 1.710347260668856e-06, - "loss": 0.8447, - "step": 31730 - }, - { - "epoch": 0.81, - "learning_rate": 1.710327784509677e-06, - "loss": 0.8076, - "step": 31731 - }, - { - "epoch": 0.81, - "learning_rate": 1.7103083078066326e-06, - "loss": 0.7773, - "step": 31732 - }, - { - "epoch": 0.81, - "learning_rate": 1.7102888305597377e-06, - "loss": 0.9443, - "step": 31733 - }, - { - "epoch": 0.81, - "learning_rate": 1.7102693527690074e-06, - "loss": 1.0068, - "step": 31734 - }, - { - "epoch": 0.81, - "learning_rate": 1.7102498744344564e-06, - "loss": 0.7344, - "step": 31735 - }, - { - "epoch": 0.81, - "learning_rate": 1.7102303955560998e-06, - "loss": 0.8555, - "step": 31736 - }, - { - "epoch": 0.81, - "learning_rate": 1.7102109161339525e-06, - "loss": 0.8672, - "step": 31737 - }, - { - "epoch": 0.81, - "learning_rate": 1.7101914361680291e-06, - "loss": 0.6929, - "step": 31738 - }, - { - "epoch": 0.81, - "learning_rate": 1.710171955658345e-06, - "loss": 0.9395, - "step": 31739 - }, - { - "epoch": 0.81, - "learning_rate": 1.7101524746049146e-06, - "loss": 0.769, - "step": 31740 - }, - { - "epoch": 0.81, - "learning_rate": 1.7101329930077536e-06, - "loss": 0.6631, - "step": 31741 - }, - { - "epoch": 0.81, - "learning_rate": 1.7101135108668762e-06, - "loss": 0.7695, - "step": 31742 - }, - { - "epoch": 0.81, - "learning_rate": 1.7100940281822975e-06, - "loss": 0.8462, - "step": 31743 - }, - { - "epoch": 0.81, - "learning_rate": 1.7100745449540326e-06, - "loss": 0.7246, - "step": 31744 - }, - { - "epoch": 0.81, - "learning_rate": 1.710055061182096e-06, - "loss": 0.8887, - "step": 31745 - }, - { - "epoch": 0.81, - "learning_rate": 1.710035576866503e-06, - "loss": 0.8125, - "step": 31746 - }, - { - "epoch": 0.81, - "learning_rate": 1.7100160920072687e-06, - "loss": 0.7285, - "step": 31747 - }, - { - "epoch": 0.81, - "learning_rate": 1.7099966066044075e-06, - "loss": 0.7334, - "step": 31748 - }, - { - "epoch": 0.81, - "learning_rate": 1.7099771206579345e-06, - "loss": 0.873, - "step": 31749 - }, - { - "epoch": 0.81, - "learning_rate": 1.7099576341678646e-06, - "loss": 0.9033, - "step": 31750 - }, - { - "epoch": 0.81, - "learning_rate": 1.709938147134213e-06, - "loss": 0.8818, - "step": 31751 - }, - { - "epoch": 0.81, - "learning_rate": 1.7099186595569938e-06, - "loss": 0.6418, - "step": 31752 - }, - { - "epoch": 0.81, - "learning_rate": 1.7098991714362232e-06, - "loss": 1.0029, - "step": 31753 - }, - { - "epoch": 0.81, - "learning_rate": 1.7098796827719152e-06, - "loss": 0.647, - "step": 31754 - }, - { - "epoch": 0.81, - "learning_rate": 1.709860193564085e-06, - "loss": 0.8394, - "step": 31755 - }, - { - "epoch": 0.81, - "learning_rate": 1.7098407038127477e-06, - "loss": 0.6973, - "step": 31756 - }, - { - "epoch": 0.81, - "learning_rate": 1.7098212135179178e-06, - "loss": 0.6797, - "step": 31757 - }, - { - "epoch": 0.81, - "learning_rate": 1.7098017226796103e-06, - "loss": 0.7441, - "step": 31758 - }, - { - "epoch": 0.81, - "learning_rate": 1.7097822312978404e-06, - "loss": 0.8467, - "step": 31759 - }, - { - "epoch": 0.81, - "learning_rate": 1.7097627393726229e-06, - "loss": 0.8086, - "step": 31760 - }, - { - "epoch": 0.81, - "learning_rate": 1.7097432469039727e-06, - "loss": 0.8438, - "step": 31761 - }, - { - "epoch": 0.81, - "learning_rate": 1.7097237538919047e-06, - "loss": 0.6538, - "step": 31762 - }, - { - "epoch": 0.81, - "learning_rate": 1.709704260336434e-06, - "loss": 0.9258, - "step": 31763 - }, - { - "epoch": 0.81, - "learning_rate": 1.7096847662375753e-06, - "loss": 0.9365, - "step": 31764 - }, - { - "epoch": 0.81, - "learning_rate": 1.7096652715953433e-06, - "loss": 1.0283, - "step": 31765 - }, - { - "epoch": 0.81, - "learning_rate": 1.7096457764097536e-06, - "loss": 0.8613, - "step": 31766 - }, - { - "epoch": 0.81, - "learning_rate": 1.7096262806808207e-06, - "loss": 0.8589, - "step": 31767 - }, - { - "epoch": 0.81, - "learning_rate": 1.7096067844085595e-06, - "loss": 0.9688, - "step": 31768 - }, - { - "epoch": 0.81, - "learning_rate": 1.7095872875929852e-06, - "loss": 0.8066, - "step": 31769 - }, - { - "epoch": 0.81, - "learning_rate": 1.709567790234112e-06, - "loss": 0.7622, - "step": 31770 - }, - { - "epoch": 0.81, - "learning_rate": 1.7095482923319562e-06, - "loss": 0.7832, - "step": 31771 - }, - { - "epoch": 0.81, - "learning_rate": 1.7095287938865312e-06, - "loss": 0.8369, - "step": 31772 - }, - { - "epoch": 0.81, - "learning_rate": 1.709509294897853e-06, - "loss": 0.9766, - "step": 31773 - }, - { - "epoch": 0.81, - "learning_rate": 1.709489795365936e-06, - "loss": 0.9248, - "step": 31774 - }, - { - "epoch": 0.81, - "learning_rate": 1.7094702952907953e-06, - "loss": 1.0195, - "step": 31775 - }, - { - "epoch": 0.81, - "learning_rate": 1.7094507946724458e-06, - "loss": 0.8271, - "step": 31776 - }, - { - "epoch": 0.81, - "learning_rate": 1.7094312935109025e-06, - "loss": 0.8057, - "step": 31777 - }, - { - "epoch": 0.81, - "learning_rate": 1.7094117918061803e-06, - "loss": 0.8154, - "step": 31778 - }, - { - "epoch": 0.81, - "learning_rate": 1.7093922895582942e-06, - "loss": 0.8447, - "step": 31779 - }, - { - "epoch": 0.81, - "learning_rate": 1.709372786767259e-06, - "loss": 0.7207, - "step": 31780 - }, - { - "epoch": 0.81, - "learning_rate": 1.7093532834330896e-06, - "loss": 0.7373, - "step": 31781 - }, - { - "epoch": 0.81, - "learning_rate": 1.709333779555801e-06, - "loss": 0.7747, - "step": 31782 - }, - { - "epoch": 0.81, - "learning_rate": 1.709314275135408e-06, - "loss": 0.8599, - "step": 31783 - }, - { - "epoch": 0.81, - "learning_rate": 1.709294770171926e-06, - "loss": 0.958, - "step": 31784 - }, - { - "epoch": 0.81, - "learning_rate": 1.7092752646653695e-06, - "loss": 0.7944, - "step": 31785 - }, - { - "epoch": 0.81, - "learning_rate": 1.7092557586157535e-06, - "loss": 0.8145, - "step": 31786 - }, - { - "epoch": 0.81, - "learning_rate": 1.7092362520230927e-06, - "loss": 0.7646, - "step": 31787 - }, - { - "epoch": 0.81, - "learning_rate": 1.7092167448874028e-06, - "loss": 0.6885, - "step": 31788 - }, - { - "epoch": 0.81, - "learning_rate": 1.709197237208698e-06, - "loss": 0.8525, - "step": 31789 - }, - { - "epoch": 0.81, - "learning_rate": 1.7091777289869933e-06, - "loss": 0.7922, - "step": 31790 - }, - { - "epoch": 0.81, - "learning_rate": 1.7091582202223044e-06, - "loss": 0.8105, - "step": 31791 - }, - { - "epoch": 0.81, - "learning_rate": 1.7091387109146451e-06, - "loss": 0.7158, - "step": 31792 - }, - { - "epoch": 0.81, - "learning_rate": 1.709119201064031e-06, - "loss": 0.916, - "step": 31793 - }, - { - "epoch": 0.81, - "learning_rate": 1.7090996906704768e-06, - "loss": 0.7483, - "step": 31794 - }, - { - "epoch": 0.81, - "learning_rate": 1.709080179733998e-06, - "loss": 0.9883, - "step": 31795 - }, - { - "epoch": 0.81, - "learning_rate": 1.709060668254609e-06, - "loss": 0.9824, - "step": 31796 - }, - { - "epoch": 0.81, - "learning_rate": 1.7090411562323247e-06, - "loss": 0.9082, - "step": 31797 - }, - { - "epoch": 0.81, - "learning_rate": 1.7090216436671603e-06, - "loss": 0.7998, - "step": 31798 - }, - { - "epoch": 0.82, - "learning_rate": 1.7090021305591304e-06, - "loss": 0.9033, - "step": 31799 - }, - { - "epoch": 0.82, - "learning_rate": 1.7089826169082505e-06, - "loss": 0.8164, - "step": 31800 - }, - { - "epoch": 0.82, - "learning_rate": 1.7089631027145348e-06, - "loss": 0.8779, - "step": 31801 - }, - { - "epoch": 0.82, - "learning_rate": 1.708943587977999e-06, - "loss": 0.875, - "step": 31802 - }, - { - "epoch": 0.82, - "learning_rate": 1.7089240726986577e-06, - "loss": 1.1104, - "step": 31803 - }, - { - "epoch": 0.82, - "learning_rate": 1.7089045568765256e-06, - "loss": 0.7979, - "step": 31804 - }, - { - "epoch": 0.82, - "learning_rate": 1.708885040511618e-06, - "loss": 0.8838, - "step": 31805 - }, - { - "epoch": 0.82, - "learning_rate": 1.7088655236039498e-06, - "loss": 0.8828, - "step": 31806 - }, - { - "epoch": 0.82, - "learning_rate": 1.7088460061535356e-06, - "loss": 0.8467, - "step": 31807 - }, - { - "epoch": 0.82, - "learning_rate": 1.7088264881603908e-06, - "loss": 0.9307, - "step": 31808 - }, - { - "epoch": 0.82, - "learning_rate": 1.7088069696245303e-06, - "loss": 0.8203, - "step": 31809 - }, - { - "epoch": 0.82, - "learning_rate": 1.7087874505459687e-06, - "loss": 0.832, - "step": 31810 - }, - { - "epoch": 0.82, - "learning_rate": 1.708767930924721e-06, - "loss": 0.6553, - "step": 31811 - }, - { - "epoch": 0.82, - "learning_rate": 1.7087484107608028e-06, - "loss": 0.8926, - "step": 31812 - }, - { - "epoch": 0.82, - "learning_rate": 1.7087288900542283e-06, - "loss": 0.9512, - "step": 31813 - }, - { - "epoch": 0.82, - "learning_rate": 1.7087093688050124e-06, - "loss": 0.9033, - "step": 31814 - }, - { - "epoch": 0.82, - "learning_rate": 1.7086898470131705e-06, - "loss": 0.8896, - "step": 31815 - }, - { - "epoch": 0.82, - "learning_rate": 1.7086703246787173e-06, - "loss": 0.8843, - "step": 31816 - }, - { - "epoch": 0.82, - "learning_rate": 1.7086508018016682e-06, - "loss": 0.8408, - "step": 31817 - }, - { - "epoch": 0.82, - "learning_rate": 1.7086312783820373e-06, - "loss": 0.6875, - "step": 31818 - }, - { - "epoch": 0.82, - "learning_rate": 1.7086117544198403e-06, - "loss": 0.6951, - "step": 31819 - }, - { - "epoch": 0.82, - "learning_rate": 1.7085922299150917e-06, - "loss": 0.7422, - "step": 31820 - }, - { - "epoch": 0.82, - "learning_rate": 1.7085727048678066e-06, - "loss": 0.8838, - "step": 31821 - }, - { - "epoch": 0.82, - "learning_rate": 1.7085531792779997e-06, - "loss": 0.8037, - "step": 31822 - }, - { - "epoch": 0.82, - "learning_rate": 1.7085336531456867e-06, - "loss": 0.79, - "step": 31823 - }, - { - "epoch": 0.82, - "learning_rate": 1.7085141264708817e-06, - "loss": 0.751, - "step": 31824 - }, - { - "epoch": 0.82, - "learning_rate": 1.7084945992536004e-06, - "loss": 0.8711, - "step": 31825 - }, - { - "epoch": 0.82, - "learning_rate": 1.708475071493857e-06, - "loss": 0.7178, - "step": 31826 - }, - { - "epoch": 0.82, - "learning_rate": 1.708455543191667e-06, - "loss": 0.8516, - "step": 31827 - }, - { - "epoch": 0.82, - "learning_rate": 1.708436014347045e-06, - "loss": 1.0156, - "step": 31828 - }, - { - "epoch": 0.82, - "learning_rate": 1.7084164849600065e-06, - "loss": 0.9229, - "step": 31829 - }, - { - "epoch": 0.82, - "learning_rate": 1.7083969550305657e-06, - "loss": 0.6924, - "step": 31830 - }, - { - "epoch": 0.82, - "learning_rate": 1.7083774245587382e-06, - "loss": 0.8613, - "step": 31831 - }, - { - "epoch": 0.82, - "learning_rate": 1.7083578935445385e-06, - "loss": 0.9736, - "step": 31832 - }, - { - "epoch": 0.82, - "learning_rate": 1.7083383619879817e-06, - "loss": 0.6699, - "step": 31833 - }, - { - "epoch": 0.82, - "learning_rate": 1.7083188298890829e-06, - "loss": 0.9639, - "step": 31834 - }, - { - "epoch": 0.82, - "learning_rate": 1.7082992972478568e-06, - "loss": 0.5278, - "step": 31835 - }, - { - "epoch": 0.82, - "learning_rate": 1.7082797640643185e-06, - "loss": 0.9189, - "step": 31836 - }, - { - "epoch": 0.82, - "learning_rate": 1.708260230338483e-06, - "loss": 0.7744, - "step": 31837 - }, - { - "epoch": 0.82, - "learning_rate": 1.7082406960703652e-06, - "loss": 0.7646, - "step": 31838 - }, - { - "epoch": 0.82, - "learning_rate": 1.7082211612599805e-06, - "loss": 0.7246, - "step": 31839 - }, - { - "epoch": 0.82, - "learning_rate": 1.7082016259073426e-06, - "loss": 0.7881, - "step": 31840 - }, - { - "epoch": 0.82, - "learning_rate": 1.708182090012468e-06, - "loss": 0.7441, - "step": 31841 - }, - { - "epoch": 0.82, - "learning_rate": 1.7081625535753704e-06, - "loss": 0.7156, - "step": 31842 - }, - { - "epoch": 0.82, - "learning_rate": 1.7081430165960655e-06, - "loss": 1.0742, - "step": 31843 - }, - { - "epoch": 0.82, - "learning_rate": 1.708123479074568e-06, - "loss": 1.0654, - "step": 31844 - }, - { - "epoch": 0.82, - "learning_rate": 1.708103941010893e-06, - "loss": 0.7002, - "step": 31845 - }, - { - "epoch": 0.82, - "learning_rate": 1.7080844024050556e-06, - "loss": 0.5337, - "step": 31846 - }, - { - "epoch": 0.82, - "learning_rate": 1.7080648632570702e-06, - "loss": 0.7986, - "step": 31847 - }, - { - "epoch": 0.82, - "learning_rate": 1.7080453235669524e-06, - "loss": 0.6611, - "step": 31848 - }, - { - "epoch": 0.82, - "learning_rate": 1.7080257833347165e-06, - "loss": 1.0635, - "step": 31849 - }, - { - "epoch": 0.82, - "learning_rate": 1.7080062425603781e-06, - "loss": 0.8574, - "step": 31850 - }, - { - "epoch": 0.82, - "learning_rate": 1.7079867012439518e-06, - "loss": 0.877, - "step": 31851 - }, - { - "epoch": 0.82, - "learning_rate": 1.7079671593854523e-06, - "loss": 0.9199, - "step": 31852 - }, - { - "epoch": 0.82, - "learning_rate": 1.7079476169848955e-06, - "loss": 1.0596, - "step": 31853 - }, - { - "epoch": 0.82, - "learning_rate": 1.7079280740422953e-06, - "loss": 0.9561, - "step": 31854 - }, - { - "epoch": 0.82, - "learning_rate": 1.7079085305576672e-06, - "loss": 0.9824, - "step": 31855 - }, - { - "epoch": 0.82, - "learning_rate": 1.7078889865310262e-06, - "loss": 0.6748, - "step": 31856 - }, - { - "epoch": 0.82, - "learning_rate": 1.7078694419623872e-06, - "loss": 0.7803, - "step": 31857 - }, - { - "epoch": 0.82, - "learning_rate": 1.7078498968517648e-06, - "loss": 0.8804, - "step": 31858 - }, - { - "epoch": 0.82, - "learning_rate": 1.7078303511991746e-06, - "loss": 1.0449, - "step": 31859 - }, - { - "epoch": 0.82, - "learning_rate": 1.707810805004631e-06, - "loss": 0.3906, - "step": 31860 - }, - { - "epoch": 0.82, - "learning_rate": 1.7077912582681495e-06, - "loss": 0.8066, - "step": 31861 - }, - { - "epoch": 0.82, - "learning_rate": 1.7077717109897445e-06, - "loss": 0.8311, - "step": 31862 - }, - { - "epoch": 0.82, - "learning_rate": 1.7077521631694314e-06, - "loss": 0.9639, - "step": 31863 - }, - { - "epoch": 0.82, - "learning_rate": 1.707732614807225e-06, - "loss": 1.001, - "step": 31864 - }, - { - "epoch": 0.82, - "learning_rate": 1.7077130659031402e-06, - "loss": 0.8379, - "step": 31865 - }, - { - "epoch": 0.82, - "learning_rate": 1.7076935164571921e-06, - "loss": 0.9541, - "step": 31866 - }, - { - "epoch": 0.82, - "learning_rate": 1.7076739664693958e-06, - "loss": 0.9453, - "step": 31867 - }, - { - "epoch": 0.82, - "learning_rate": 1.7076544159397658e-06, - "loss": 0.8975, - "step": 31868 - }, - { - "epoch": 0.82, - "learning_rate": 1.7076348648683174e-06, - "loss": 0.7393, - "step": 31869 - }, - { - "epoch": 0.82, - "learning_rate": 1.707615313255066e-06, - "loss": 1.041, - "step": 31870 - }, - { - "epoch": 0.82, - "learning_rate": 1.7075957611000256e-06, - "loss": 0.8027, - "step": 31871 - }, - { - "epoch": 0.82, - "learning_rate": 1.7075762084032115e-06, - "loss": 0.9009, - "step": 31872 - }, - { - "epoch": 0.82, - "learning_rate": 1.7075566551646392e-06, - "loss": 0.8486, - "step": 31873 - }, - { - "epoch": 0.82, - "learning_rate": 1.7075371013843232e-06, - "loss": 0.8457, - "step": 31874 - }, - { - "epoch": 0.82, - "learning_rate": 1.7075175470622787e-06, - "loss": 0.813, - "step": 31875 - }, - { - "epoch": 0.82, - "learning_rate": 1.7074979921985203e-06, - "loss": 1.0288, - "step": 31876 - }, - { - "epoch": 0.82, - "learning_rate": 1.7074784367930633e-06, - "loss": 0.7559, - "step": 31877 - }, - { - "epoch": 0.82, - "learning_rate": 1.7074588808459228e-06, - "loss": 0.8662, - "step": 31878 - }, - { - "epoch": 0.82, - "learning_rate": 1.707439324357113e-06, - "loss": 0.7549, - "step": 31879 - }, - { - "epoch": 0.82, - "learning_rate": 1.70741976732665e-06, - "loss": 0.6968, - "step": 31880 - }, - { - "epoch": 0.82, - "learning_rate": 1.7074002097545481e-06, - "loss": 0.9131, - "step": 31881 - }, - { - "epoch": 0.82, - "learning_rate": 1.7073806516408223e-06, - "loss": 0.9131, - "step": 31882 - }, - { - "epoch": 0.82, - "learning_rate": 1.7073610929854877e-06, - "loss": 0.7212, - "step": 31883 - }, - { - "epoch": 0.82, - "learning_rate": 1.707341533788559e-06, - "loss": 1.084, - "step": 31884 - }, - { - "epoch": 0.82, - "learning_rate": 1.7073219740500518e-06, - "loss": 1.0547, - "step": 31885 - }, - { - "epoch": 0.82, - "learning_rate": 1.7073024137699804e-06, - "loss": 0.8545, - "step": 31886 - }, - { - "epoch": 0.82, - "learning_rate": 1.70728285294836e-06, - "loss": 0.8828, - "step": 31887 - }, - { - "epoch": 0.82, - "learning_rate": 1.707263291585206e-06, - "loss": 0.5757, - "step": 31888 - }, - { - "epoch": 0.82, - "learning_rate": 1.7072437296805328e-06, - "loss": 0.877, - "step": 31889 - }, - { - "epoch": 0.82, - "learning_rate": 1.7072241672343556e-06, - "loss": 0.9346, - "step": 31890 - }, - { - "epoch": 0.82, - "learning_rate": 1.7072046042466894e-06, - "loss": 0.9805, - "step": 31891 - }, - { - "epoch": 0.82, - "learning_rate": 1.7071850407175492e-06, - "loss": 0.9268, - "step": 31892 - }, - { - "epoch": 0.82, - "learning_rate": 1.70716547664695e-06, - "loss": 0.6416, - "step": 31893 - }, - { - "epoch": 0.82, - "learning_rate": 1.7071459120349065e-06, - "loss": 0.8438, - "step": 31894 - }, - { - "epoch": 0.82, - "learning_rate": 1.7071263468814341e-06, - "loss": 1.0215, - "step": 31895 - }, - { - "epoch": 0.82, - "learning_rate": 1.7071067811865474e-06, - "loss": 1.0059, - "step": 31896 - }, - { - "epoch": 0.82, - "learning_rate": 1.7070872149502616e-06, - "loss": 0.7842, - "step": 31897 - }, - { - "epoch": 0.82, - "learning_rate": 1.7070676481725915e-06, - "loss": 0.7197, - "step": 31898 - }, - { - "epoch": 0.82, - "learning_rate": 1.7070480808535526e-06, - "loss": 0.9395, - "step": 31899 - }, - { - "epoch": 0.82, - "learning_rate": 1.7070285129931593e-06, - "loss": 0.7822, - "step": 31900 - }, - { - "epoch": 0.82, - "learning_rate": 1.707008944591427e-06, - "loss": 1.2422, - "step": 31901 - }, - { - "epoch": 0.82, - "learning_rate": 1.7069893756483697e-06, - "loss": 1.1035, - "step": 31902 - }, - { - "epoch": 0.82, - "learning_rate": 1.7069698061640039e-06, - "loss": 0.9023, - "step": 31903 - }, - { - "epoch": 0.82, - "learning_rate": 1.7069502361383434e-06, - "loss": 0.6616, - "step": 31904 - }, - { - "epoch": 0.82, - "learning_rate": 1.706930665571404e-06, - "loss": 1.0166, - "step": 31905 - }, - { - "epoch": 0.82, - "learning_rate": 1.7069110944632e-06, - "loss": 0.6484, - "step": 31906 - }, - { - "epoch": 0.82, - "learning_rate": 1.7068915228137465e-06, - "loss": 0.9043, - "step": 31907 - }, - { - "epoch": 0.82, - "learning_rate": 1.706871950623059e-06, - "loss": 0.8369, - "step": 31908 - }, - { - "epoch": 0.82, - "learning_rate": 1.7068523778911522e-06, - "loss": 0.8584, - "step": 31909 - }, - { - "epoch": 0.82, - "learning_rate": 1.7068328046180409e-06, - "loss": 0.5923, - "step": 31910 - }, - { - "epoch": 0.82, - "learning_rate": 1.70681323080374e-06, - "loss": 0.8301, - "step": 31911 - }, - { - "epoch": 0.82, - "learning_rate": 1.7067936564482653e-06, - "loss": 0.9619, - "step": 31912 - }, - { - "epoch": 0.82, - "learning_rate": 1.7067740815516304e-06, - "loss": 0.6206, - "step": 31913 - }, - { - "epoch": 0.82, - "learning_rate": 1.7067545061138517e-06, - "loss": 0.8037, - "step": 31914 - }, - { - "epoch": 0.82, - "learning_rate": 1.7067349301349435e-06, - "loss": 0.8223, - "step": 31915 - }, - { - "epoch": 0.82, - "learning_rate": 1.7067153536149207e-06, - "loss": 0.7354, - "step": 31916 - }, - { - "epoch": 0.82, - "learning_rate": 1.7066957765537984e-06, - "loss": 0.8066, - "step": 31917 - }, - { - "epoch": 0.82, - "learning_rate": 1.706676198951592e-06, - "loss": 0.835, - "step": 31918 - }, - { - "epoch": 0.82, - "learning_rate": 1.7066566208083158e-06, - "loss": 0.7285, - "step": 31919 - }, - { - "epoch": 0.82, - "learning_rate": 1.7066370421239853e-06, - "loss": 0.8311, - "step": 31920 - }, - { - "epoch": 0.82, - "learning_rate": 1.706617462898615e-06, - "loss": 0.6943, - "step": 31921 - }, - { - "epoch": 0.82, - "learning_rate": 1.7065978831322205e-06, - "loss": 0.6741, - "step": 31922 - }, - { - "epoch": 0.82, - "learning_rate": 1.7065783028248163e-06, - "loss": 0.6816, - "step": 31923 - }, - { - "epoch": 0.82, - "learning_rate": 1.7065587219764176e-06, - "loss": 0.8574, - "step": 31924 - }, - { - "epoch": 0.82, - "learning_rate": 1.7065391405870396e-06, - "loss": 0.8809, - "step": 31925 - }, - { - "epoch": 0.82, - "learning_rate": 1.706519558656697e-06, - "loss": 0.9375, - "step": 31926 - }, - { - "epoch": 0.82, - "learning_rate": 1.7064999761854045e-06, - "loss": 0.7651, - "step": 31927 - }, - { - "epoch": 0.82, - "learning_rate": 1.7064803931731778e-06, - "loss": 0.5275, - "step": 31928 - }, - { - "epoch": 0.82, - "learning_rate": 1.7064608096200314e-06, - "loss": 0.9512, - "step": 31929 - }, - { - "epoch": 0.82, - "learning_rate": 1.7064412255259806e-06, - "loss": 0.9268, - "step": 31930 - }, - { - "epoch": 0.82, - "learning_rate": 1.7064216408910401e-06, - "loss": 0.7144, - "step": 31931 - }, - { - "epoch": 0.82, - "learning_rate": 1.706402055715225e-06, - "loss": 0.9492, - "step": 31932 - }, - { - "epoch": 0.82, - "learning_rate": 1.7063824699985505e-06, - "loss": 0.7993, - "step": 31933 - }, - { - "epoch": 0.82, - "learning_rate": 1.7063628837410312e-06, - "loss": 0.9697, - "step": 31934 - }, - { - "epoch": 0.82, - "learning_rate": 1.7063432969426827e-06, - "loss": 0.573, - "step": 31935 - }, - { - "epoch": 0.82, - "learning_rate": 1.7063237096035192e-06, - "loss": 0.8057, - "step": 31936 - }, - { - "epoch": 0.82, - "learning_rate": 1.7063041217235564e-06, - "loss": 0.8486, - "step": 31937 - }, - { - "epoch": 0.82, - "learning_rate": 1.7062845333028085e-06, - "loss": 1.0703, - "step": 31938 - }, - { - "epoch": 0.82, - "learning_rate": 1.7062649443412918e-06, - "loss": 0.686, - "step": 31939 - }, - { - "epoch": 0.82, - "learning_rate": 1.70624535483902e-06, - "loss": 0.9316, - "step": 31940 - }, - { - "epoch": 0.82, - "learning_rate": 1.7062257647960087e-06, - "loss": 0.8564, - "step": 31941 - }, - { - "epoch": 0.82, - "learning_rate": 1.7062061742122728e-06, - "loss": 0.6753, - "step": 31942 - }, - { - "epoch": 0.82, - "learning_rate": 1.7061865830878276e-06, - "loss": 1.0469, - "step": 31943 - }, - { - "epoch": 0.82, - "learning_rate": 1.7061669914226875e-06, - "loss": 0.6016, - "step": 31944 - }, - { - "epoch": 0.82, - "learning_rate": 1.7061473992168675e-06, - "loss": 0.7007, - "step": 31945 - }, - { - "epoch": 0.82, - "learning_rate": 1.7061278064703832e-06, - "loss": 0.887, - "step": 31946 - }, - { - "epoch": 0.82, - "learning_rate": 1.7061082131832495e-06, - "loss": 1.042, - "step": 31947 - }, - { - "epoch": 0.82, - "learning_rate": 1.7060886193554808e-06, - "loss": 0.7671, - "step": 31948 - }, - { - "epoch": 0.82, - "learning_rate": 1.706069024987093e-06, - "loss": 0.8135, - "step": 31949 - }, - { - "epoch": 0.82, - "learning_rate": 1.7060494300781003e-06, - "loss": 0.834, - "step": 31950 - }, - { - "epoch": 0.82, - "learning_rate": 1.7060298346285182e-06, - "loss": 0.6138, - "step": 31951 - }, - { - "epoch": 0.82, - "learning_rate": 1.7060102386383614e-06, - "loss": 0.8486, - "step": 31952 - }, - { - "epoch": 0.82, - "learning_rate": 1.7059906421076452e-06, - "loss": 0.8848, - "step": 31953 - }, - { - "epoch": 0.82, - "learning_rate": 1.7059710450363842e-06, - "loss": 0.6306, - "step": 31954 - }, - { - "epoch": 0.82, - "learning_rate": 1.7059514474245935e-06, - "loss": 0.6919, - "step": 31955 - }, - { - "epoch": 0.82, - "learning_rate": 1.7059318492722885e-06, - "loss": 0.9854, - "step": 31956 - }, - { - "epoch": 0.82, - "learning_rate": 1.7059122505794838e-06, - "loss": 0.5931, - "step": 31957 - }, - { - "epoch": 0.82, - "learning_rate": 1.7058926513461946e-06, - "loss": 0.9678, - "step": 31958 - }, - { - "epoch": 0.82, - "learning_rate": 1.705873051572436e-06, - "loss": 0.7949, - "step": 31959 - }, - { - "epoch": 0.82, - "learning_rate": 1.7058534512582227e-06, - "loss": 0.6143, - "step": 31960 - }, - { - "epoch": 0.82, - "learning_rate": 1.70583385040357e-06, - "loss": 0.7241, - "step": 31961 - }, - { - "epoch": 0.82, - "learning_rate": 1.7058142490084925e-06, - "loss": 0.9766, - "step": 31962 - }, - { - "epoch": 0.82, - "learning_rate": 1.7057946470730058e-06, - "loss": 0.7627, - "step": 31963 - }, - { - "epoch": 0.82, - "learning_rate": 1.7057750445971247e-06, - "loss": 0.7812, - "step": 31964 - }, - { - "epoch": 0.82, - "learning_rate": 1.7057554415808637e-06, - "loss": 0.8066, - "step": 31965 - }, - { - "epoch": 0.82, - "learning_rate": 1.7057358380242383e-06, - "loss": 0.7988, - "step": 31966 - }, - { - "epoch": 0.82, - "learning_rate": 1.7057162339272634e-06, - "loss": 0.8359, - "step": 31967 - }, - { - "epoch": 0.82, - "learning_rate": 1.7056966292899542e-06, - "loss": 0.9619, - "step": 31968 - }, - { - "epoch": 0.82, - "learning_rate": 1.7056770241123256e-06, - "loss": 0.8359, - "step": 31969 - }, - { - "epoch": 0.82, - "learning_rate": 1.7056574183943925e-06, - "loss": 0.9531, - "step": 31970 - }, - { - "epoch": 0.82, - "learning_rate": 1.7056378121361696e-06, - "loss": 1.0078, - "step": 31971 - }, - { - "epoch": 0.82, - "learning_rate": 1.7056182053376725e-06, - "loss": 0.8242, - "step": 31972 - }, - { - "epoch": 0.82, - "learning_rate": 1.7055985979989162e-06, - "loss": 0.8359, - "step": 31973 - }, - { - "epoch": 0.82, - "learning_rate": 1.7055789901199153e-06, - "loss": 1.0156, - "step": 31974 - }, - { - "epoch": 0.82, - "learning_rate": 1.705559381700685e-06, - "loss": 0.5875, - "step": 31975 - }, - { - "epoch": 0.82, - "learning_rate": 1.7055397727412403e-06, - "loss": 0.793, - "step": 31976 - }, - { - "epoch": 0.82, - "learning_rate": 1.7055201632415962e-06, - "loss": 0.7822, - "step": 31977 - }, - { - "epoch": 0.82, - "learning_rate": 1.7055005532017681e-06, - "loss": 0.8364, - "step": 31978 - }, - { - "epoch": 0.82, - "learning_rate": 1.7054809426217704e-06, - "loss": 0.6084, - "step": 31979 - }, - { - "epoch": 0.82, - "learning_rate": 1.7054613315016185e-06, - "loss": 0.874, - "step": 31980 - }, - { - "epoch": 0.82, - "learning_rate": 1.705441719841327e-06, - "loss": 1.1133, - "step": 31981 - }, - { - "epoch": 0.82, - "learning_rate": 1.7054221076409113e-06, - "loss": 0.791, - "step": 31982 - }, - { - "epoch": 0.82, - "learning_rate": 1.7054024949003867e-06, - "loss": 0.9355, - "step": 31983 - }, - { - "epoch": 0.82, - "learning_rate": 1.7053828816197675e-06, - "loss": 1.0479, - "step": 31984 - }, - { - "epoch": 0.82, - "learning_rate": 1.7053632677990693e-06, - "loss": 0.9531, - "step": 31985 - }, - { - "epoch": 0.82, - "learning_rate": 1.7053436534383066e-06, - "loss": 0.8037, - "step": 31986 - }, - { - "epoch": 0.82, - "learning_rate": 1.7053240385374947e-06, - "loss": 0.9531, - "step": 31987 - }, - { - "epoch": 0.82, - "learning_rate": 1.7053044230966486e-06, - "loss": 0.7842, - "step": 31988 - }, - { - "epoch": 0.82, - "learning_rate": 1.7052848071157837e-06, - "loss": 1.1133, - "step": 31989 - }, - { - "epoch": 0.82, - "learning_rate": 1.7052651905949144e-06, - "loss": 0.6694, - "step": 31990 - }, - { - "epoch": 0.82, - "learning_rate": 1.7052455735340558e-06, - "loss": 0.7563, - "step": 31991 - }, - { - "epoch": 0.82, - "learning_rate": 1.7052259559332237e-06, - "loss": 0.6404, - "step": 31992 - }, - { - "epoch": 0.82, - "learning_rate": 1.7052063377924317e-06, - "loss": 0.9736, - "step": 31993 - }, - { - "epoch": 0.82, - "learning_rate": 1.7051867191116961e-06, - "loss": 0.7715, - "step": 31994 - }, - { - "epoch": 0.82, - "learning_rate": 1.7051670998910316e-06, - "loss": 0.8408, - "step": 31995 - }, - { - "epoch": 0.82, - "learning_rate": 1.7051474801304529e-06, - "loss": 0.8926, - "step": 31996 - }, - { - "epoch": 0.82, - "learning_rate": 1.7051278598299751e-06, - "loss": 0.7891, - "step": 31997 - }, - { - "epoch": 0.82, - "learning_rate": 1.7051082389896134e-06, - "loss": 1.1318, - "step": 31998 - }, - { - "epoch": 0.82, - "learning_rate": 1.7050886176093827e-06, - "loss": 0.9248, - "step": 31999 - }, - { - "epoch": 0.82, - "learning_rate": 1.7050689956892981e-06, - "loss": 0.8721, - "step": 32000 - }, - { - "epoch": 0.82, - "learning_rate": 1.7050493732293744e-06, - "loss": 0.6841, - "step": 32001 - }, - { - "epoch": 0.82, - "learning_rate": 1.705029750229627e-06, - "loss": 0.79, - "step": 32002 - }, - { - "epoch": 0.82, - "learning_rate": 1.7050101266900706e-06, - "loss": 0.7979, - "step": 32003 - }, - { - "epoch": 0.82, - "learning_rate": 1.7049905026107208e-06, - "loss": 0.9229, - "step": 32004 - }, - { - "epoch": 0.82, - "learning_rate": 1.704970877991592e-06, - "loss": 0.688, - "step": 32005 - }, - { - "epoch": 0.82, - "learning_rate": 1.704951252832699e-06, - "loss": 0.8115, - "step": 32006 - }, - { - "epoch": 0.82, - "learning_rate": 1.7049316271340576e-06, - "loss": 1.0566, - "step": 32007 - }, - { - "epoch": 0.82, - "learning_rate": 1.7049120008956824e-06, - "loss": 1.0635, - "step": 32008 - }, - { - "epoch": 0.82, - "learning_rate": 1.7048923741175888e-06, - "loss": 0.6826, - "step": 32009 - }, - { - "epoch": 0.82, - "learning_rate": 1.704872746799791e-06, - "loss": 0.7827, - "step": 32010 - }, - { - "epoch": 0.82, - "learning_rate": 1.7048531189423048e-06, - "loss": 0.6406, - "step": 32011 - }, - { - "epoch": 0.82, - "learning_rate": 1.704833490545145e-06, - "loss": 0.7168, - "step": 32012 - }, - { - "epoch": 0.82, - "learning_rate": 1.7048138616083265e-06, - "loss": 0.8682, - "step": 32013 - }, - { - "epoch": 0.82, - "learning_rate": 1.7047942321318644e-06, - "loss": 0.728, - "step": 32014 - }, - { - "epoch": 0.82, - "learning_rate": 1.7047746021157741e-06, - "loss": 0.8643, - "step": 32015 - }, - { - "epoch": 0.82, - "learning_rate": 1.70475497156007e-06, - "loss": 0.8672, - "step": 32016 - }, - { - "epoch": 0.82, - "learning_rate": 1.7047353404647672e-06, - "loss": 0.8008, - "step": 32017 - }, - { - "epoch": 0.82, - "learning_rate": 1.7047157088298814e-06, - "loss": 0.8696, - "step": 32018 - }, - { - "epoch": 0.82, - "learning_rate": 1.704696076655427e-06, - "loss": 0.7451, - "step": 32019 - }, - { - "epoch": 0.82, - "learning_rate": 1.7046764439414193e-06, - "loss": 0.834, - "step": 32020 - }, - { - "epoch": 0.82, - "learning_rate": 1.7046568106878731e-06, - "loss": 0.7339, - "step": 32021 - }, - { - "epoch": 0.82, - "learning_rate": 1.7046371768948036e-06, - "loss": 0.7729, - "step": 32022 - }, - { - "epoch": 0.82, - "learning_rate": 1.704617542562226e-06, - "loss": 0.8945, - "step": 32023 - }, - { - "epoch": 0.82, - "learning_rate": 1.704597907690155e-06, - "loss": 0.9033, - "step": 32024 - }, - { - "epoch": 0.82, - "learning_rate": 1.7045782722786058e-06, - "loss": 0.8525, - "step": 32025 - }, - { - "epoch": 0.82, - "learning_rate": 1.7045586363275932e-06, - "loss": 0.7744, - "step": 32026 - }, - { - "epoch": 0.82, - "learning_rate": 1.7045389998371327e-06, - "loss": 0.8545, - "step": 32027 - }, - { - "epoch": 0.82, - "learning_rate": 1.704519362807239e-06, - "loss": 1.0, - "step": 32028 - }, - { - "epoch": 0.82, - "learning_rate": 1.7044997252379274e-06, - "loss": 0.9346, - "step": 32029 - }, - { - "epoch": 0.82, - "learning_rate": 1.7044800871292124e-06, - "loss": 0.77, - "step": 32030 - }, - { - "epoch": 0.82, - "learning_rate": 1.7044604484811099e-06, - "loss": 0.6118, - "step": 32031 - }, - { - "epoch": 0.82, - "learning_rate": 1.704440809293634e-06, - "loss": 0.874, - "step": 32032 - }, - { - "epoch": 0.82, - "learning_rate": 1.7044211695668003e-06, - "loss": 0.9951, - "step": 32033 - }, - { - "epoch": 0.82, - "learning_rate": 1.7044015293006237e-06, - "loss": 0.7725, - "step": 32034 - }, - { - "epoch": 0.82, - "learning_rate": 1.7043818884951192e-06, - "loss": 0.7949, - "step": 32035 - }, - { - "epoch": 0.82, - "learning_rate": 1.704362247150302e-06, - "loss": 0.9785, - "step": 32036 - }, - { - "epoch": 0.82, - "learning_rate": 1.7043426052661869e-06, - "loss": 0.7197, - "step": 32037 - }, - { - "epoch": 0.82, - "learning_rate": 1.7043229628427889e-06, - "loss": 0.9346, - "step": 32038 - }, - { - "epoch": 0.82, - "learning_rate": 1.7043033198801236e-06, - "loss": 0.7637, - "step": 32039 - }, - { - "epoch": 0.82, - "learning_rate": 1.7042836763782053e-06, - "loss": 0.8779, - "step": 32040 - }, - { - "epoch": 0.82, - "learning_rate": 1.7042640323370496e-06, - "loss": 0.71, - "step": 32041 - }, - { - "epoch": 0.82, - "learning_rate": 1.7042443877566712e-06, - "loss": 0.55, - "step": 32042 - }, - { - "epoch": 0.82, - "learning_rate": 1.7042247426370851e-06, - "loss": 0.8516, - "step": 32043 - }, - { - "epoch": 0.82, - "learning_rate": 1.7042050969783065e-06, - "loss": 0.8301, - "step": 32044 - }, - { - "epoch": 0.82, - "learning_rate": 1.7041854507803506e-06, - "loss": 0.9688, - "step": 32045 - }, - { - "epoch": 0.82, - "learning_rate": 1.7041658040432325e-06, - "loss": 0.8345, - "step": 32046 - }, - { - "epoch": 0.82, - "learning_rate": 1.7041461567669666e-06, - "loss": 0.9609, - "step": 32047 - }, - { - "epoch": 0.82, - "learning_rate": 1.7041265089515688e-06, - "loss": 0.835, - "step": 32048 - }, - { - "epoch": 0.82, - "learning_rate": 1.7041068605970534e-06, - "loss": 0.6689, - "step": 32049 - }, - { - "epoch": 0.82, - "learning_rate": 1.7040872117034357e-06, - "loss": 0.835, - "step": 32050 - }, - { - "epoch": 0.82, - "learning_rate": 1.704067562270731e-06, - "loss": 0.7905, - "step": 32051 - }, - { - "epoch": 0.82, - "learning_rate": 1.7040479122989538e-06, - "loss": 0.8447, - "step": 32052 - }, - { - "epoch": 0.82, - "learning_rate": 1.7040282617881201e-06, - "loss": 0.8638, - "step": 32053 - }, - { - "epoch": 0.82, - "learning_rate": 1.7040086107382439e-06, - "loss": 0.7334, - "step": 32054 - }, - { - "epoch": 0.82, - "learning_rate": 1.7039889591493406e-06, - "loss": 0.9648, - "step": 32055 - }, - { - "epoch": 0.82, - "learning_rate": 1.7039693070214253e-06, - "loss": 0.835, - "step": 32056 - }, - { - "epoch": 0.82, - "learning_rate": 1.7039496543545134e-06, - "loss": 0.8936, - "step": 32057 - }, - { - "epoch": 0.82, - "learning_rate": 1.7039300011486195e-06, - "loss": 0.6211, - "step": 32058 - }, - { - "epoch": 0.82, - "learning_rate": 1.7039103474037586e-06, - "loss": 0.8838, - "step": 32059 - }, - { - "epoch": 0.82, - "learning_rate": 1.7038906931199461e-06, - "loss": 0.7476, - "step": 32060 - }, - { - "epoch": 0.82, - "learning_rate": 1.7038710382971968e-06, - "loss": 0.8726, - "step": 32061 - }, - { - "epoch": 0.82, - "learning_rate": 1.7038513829355256e-06, - "loss": 0.8408, - "step": 32062 - }, - { - "epoch": 0.82, - "learning_rate": 1.7038317270349483e-06, - "loss": 0.9023, - "step": 32063 - }, - { - "epoch": 0.82, - "learning_rate": 1.7038120705954788e-06, - "loss": 0.7056, - "step": 32064 - }, - { - "epoch": 0.82, - "learning_rate": 1.7037924136171332e-06, - "loss": 0.791, - "step": 32065 - }, - { - "epoch": 0.82, - "learning_rate": 1.703772756099926e-06, - "loss": 1.0332, - "step": 32066 - }, - { - "epoch": 0.82, - "learning_rate": 1.703753098043872e-06, - "loss": 1.1289, - "step": 32067 - }, - { - "epoch": 0.82, - "learning_rate": 1.7037334394489871e-06, - "loss": 0.54, - "step": 32068 - }, - { - "epoch": 0.82, - "learning_rate": 1.7037137803152857e-06, - "loss": 0.6609, - "step": 32069 - }, - { - "epoch": 0.82, - "learning_rate": 1.7036941206427828e-06, - "loss": 0.7283, - "step": 32070 - }, - { - "epoch": 0.82, - "learning_rate": 1.703674460431494e-06, - "loss": 0.8408, - "step": 32071 - }, - { - "epoch": 0.82, - "learning_rate": 1.703654799681434e-06, - "loss": 0.8613, - "step": 32072 - }, - { - "epoch": 0.82, - "learning_rate": 1.7036351383926178e-06, - "loss": 0.9185, - "step": 32073 - }, - { - "epoch": 0.82, - "learning_rate": 1.7036154765650602e-06, - "loss": 0.9775, - "step": 32074 - }, - { - "epoch": 0.82, - "learning_rate": 1.7035958141987772e-06, - "loss": 0.6895, - "step": 32075 - }, - { - "epoch": 0.82, - "learning_rate": 1.7035761512937827e-06, - "loss": 0.8779, - "step": 32076 - }, - { - "epoch": 0.82, - "learning_rate": 1.7035564878500925e-06, - "loss": 0.6382, - "step": 32077 - }, - { - "epoch": 0.82, - "learning_rate": 1.7035368238677217e-06, - "loss": 0.8633, - "step": 32078 - }, - { - "epoch": 0.82, - "learning_rate": 1.7035171593466848e-06, - "loss": 0.9658, - "step": 32079 - }, - { - "epoch": 0.82, - "learning_rate": 1.703497494286997e-06, - "loss": 0.9922, - "step": 32080 - }, - { - "epoch": 0.82, - "learning_rate": 1.703477828688674e-06, - "loss": 0.8525, - "step": 32081 - }, - { - "epoch": 0.82, - "learning_rate": 1.7034581625517299e-06, - "loss": 1.0098, - "step": 32082 - }, - { - "epoch": 0.82, - "learning_rate": 1.7034384958761805e-06, - "loss": 0.7983, - "step": 32083 - }, - { - "epoch": 0.82, - "learning_rate": 1.7034188286620403e-06, - "loss": 0.9951, - "step": 32084 - }, - { - "epoch": 0.82, - "learning_rate": 1.703399160909325e-06, - "loss": 1.0908, - "step": 32085 - }, - { - "epoch": 0.82, - "learning_rate": 1.7033794926180495e-06, - "loss": 0.79, - "step": 32086 - }, - { - "epoch": 0.82, - "learning_rate": 1.703359823788228e-06, - "loss": 0.7207, - "step": 32087 - }, - { - "epoch": 0.82, - "learning_rate": 1.7033401544198766e-06, - "loss": 0.9092, - "step": 32088 - }, - { - "epoch": 0.82, - "learning_rate": 1.70332048451301e-06, - "loss": 0.8906, - "step": 32089 - }, - { - "epoch": 0.82, - "learning_rate": 1.703300814067643e-06, - "loss": 0.668, - "step": 32090 - }, - { - "epoch": 0.82, - "learning_rate": 1.7032811430837912e-06, - "loss": 0.8081, - "step": 32091 - }, - { - "epoch": 0.82, - "learning_rate": 1.7032614715614693e-06, - "loss": 0.9651, - "step": 32092 - }, - { - "epoch": 0.82, - "learning_rate": 1.7032417995006926e-06, - "loss": 0.6914, - "step": 32093 - }, - { - "epoch": 0.82, - "learning_rate": 1.7032221269014756e-06, - "loss": 1.0498, - "step": 32094 - }, - { - "epoch": 0.82, - "learning_rate": 1.7032024537638342e-06, - "loss": 0.9326, - "step": 32095 - }, - { - "epoch": 0.82, - "learning_rate": 1.7031827800877825e-06, - "loss": 0.7827, - "step": 32096 - }, - { - "epoch": 0.82, - "learning_rate": 1.7031631058733362e-06, - "loss": 1.2617, - "step": 32097 - }, - { - "epoch": 0.82, - "learning_rate": 1.7031434311205107e-06, - "loss": 0.9619, - "step": 32098 - }, - { - "epoch": 0.82, - "learning_rate": 1.7031237558293201e-06, - "loss": 0.7256, - "step": 32099 - }, - { - "epoch": 0.82, - "learning_rate": 1.7031040799997802e-06, - "loss": 0.8428, - "step": 32100 - }, - { - "epoch": 0.82, - "learning_rate": 1.7030844036319055e-06, - "loss": 0.9209, - "step": 32101 - }, - { - "epoch": 0.82, - "learning_rate": 1.703064726725712e-06, - "loss": 0.8125, - "step": 32102 - }, - { - "epoch": 0.82, - "learning_rate": 1.7030450492812138e-06, - "loss": 0.6917, - "step": 32103 - }, - { - "epoch": 0.82, - "learning_rate": 1.7030253712984263e-06, - "loss": 0.5117, - "step": 32104 - }, - { - "epoch": 0.82, - "learning_rate": 1.7030056927773648e-06, - "loss": 0.8125, - "step": 32105 - }, - { - "epoch": 0.82, - "learning_rate": 1.702986013718044e-06, - "loss": 0.623, - "step": 32106 - }, - { - "epoch": 0.82, - "learning_rate": 1.702966334120479e-06, - "loss": 0.9131, - "step": 32107 - }, - { - "epoch": 0.82, - "learning_rate": 1.7029466539846853e-06, - "loss": 0.8147, - "step": 32108 - }, - { - "epoch": 0.82, - "learning_rate": 1.7029269733106774e-06, - "loss": 0.958, - "step": 32109 - }, - { - "epoch": 0.82, - "learning_rate": 1.7029072920984708e-06, - "loss": 0.9932, - "step": 32110 - }, - { - "epoch": 0.82, - "learning_rate": 1.7028876103480805e-06, - "loss": 0.7432, - "step": 32111 - }, - { - "epoch": 0.82, - "learning_rate": 1.7028679280595216e-06, - "loss": 0.8115, - "step": 32112 - }, - { - "epoch": 0.82, - "learning_rate": 1.7028482452328087e-06, - "loss": 0.8496, - "step": 32113 - }, - { - "epoch": 0.82, - "learning_rate": 1.7028285618679574e-06, - "loss": 0.9688, - "step": 32114 - }, - { - "epoch": 0.82, - "learning_rate": 1.7028088779649824e-06, - "loss": 0.8296, - "step": 32115 - }, - { - "epoch": 0.82, - "learning_rate": 1.702789193523899e-06, - "loss": 0.5969, - "step": 32116 - }, - { - "epoch": 0.82, - "learning_rate": 1.7027695085447224e-06, - "loss": 1.0039, - "step": 32117 - }, - { - "epoch": 0.82, - "learning_rate": 1.7027498230274676e-06, - "loss": 0.7275, - "step": 32118 - }, - { - "epoch": 0.82, - "learning_rate": 1.7027301369721493e-06, - "loss": 0.8086, - "step": 32119 - }, - { - "epoch": 0.82, - "learning_rate": 1.7027104503787828e-06, - "loss": 0.9043, - "step": 32120 - }, - { - "epoch": 0.82, - "learning_rate": 1.7026907632473835e-06, - "loss": 0.8262, - "step": 32121 - }, - { - "epoch": 0.82, - "learning_rate": 1.7026710755779662e-06, - "loss": 0.7026, - "step": 32122 - }, - { - "epoch": 0.82, - "learning_rate": 1.7026513873705458e-06, - "loss": 0.8662, - "step": 32123 - }, - { - "epoch": 0.82, - "learning_rate": 1.7026316986251374e-06, - "loss": 0.9648, - "step": 32124 - }, - { - "epoch": 0.82, - "learning_rate": 1.7026120093417565e-06, - "loss": 0.8867, - "step": 32125 - }, - { - "epoch": 0.82, - "learning_rate": 1.7025923195204177e-06, - "loss": 0.6958, - "step": 32126 - }, - { - "epoch": 0.82, - "learning_rate": 1.702572629161136e-06, - "loss": 0.959, - "step": 32127 - }, - { - "epoch": 0.82, - "learning_rate": 1.7025529382639272e-06, - "loss": 0.8506, - "step": 32128 - }, - { - "epoch": 0.82, - "learning_rate": 1.702533246828806e-06, - "loss": 0.8955, - "step": 32129 - }, - { - "epoch": 0.82, - "learning_rate": 1.702513554855787e-06, - "loss": 0.6958, - "step": 32130 - }, - { - "epoch": 0.82, - "learning_rate": 1.7024938623448862e-06, - "loss": 0.9521, - "step": 32131 - }, - { - "epoch": 0.82, - "learning_rate": 1.7024741692961174e-06, - "loss": 0.918, - "step": 32132 - }, - { - "epoch": 0.82, - "learning_rate": 1.702454475709497e-06, - "loss": 0.7754, - "step": 32133 - }, - { - "epoch": 0.82, - "learning_rate": 1.7024347815850396e-06, - "loss": 0.6245, - "step": 32134 - }, - { - "epoch": 0.82, - "learning_rate": 1.70241508692276e-06, - "loss": 0.7939, - "step": 32135 - }, - { - "epoch": 0.82, - "learning_rate": 1.702395391722673e-06, - "loss": 0.6794, - "step": 32136 - }, - { - "epoch": 0.82, - "learning_rate": 1.7023756959847946e-06, - "loss": 0.7188, - "step": 32137 - }, - { - "epoch": 0.82, - "learning_rate": 1.7023559997091395e-06, - "loss": 0.7832, - "step": 32138 - }, - { - "epoch": 0.82, - "learning_rate": 1.7023363028957225e-06, - "loss": 0.8584, - "step": 32139 - }, - { - "epoch": 0.82, - "learning_rate": 1.702316605544559e-06, - "loss": 0.957, - "step": 32140 - }, - { - "epoch": 0.82, - "learning_rate": 1.702296907655664e-06, - "loss": 0.7002, - "step": 32141 - }, - { - "epoch": 0.82, - "learning_rate": 1.7022772092290523e-06, - "loss": 0.9004, - "step": 32142 - }, - { - "epoch": 0.82, - "learning_rate": 1.7022575102647395e-06, - "loss": 0.6733, - "step": 32143 - }, - { - "epoch": 0.82, - "learning_rate": 1.7022378107627404e-06, - "loss": 0.7734, - "step": 32144 - }, - { - "epoch": 0.82, - "learning_rate": 1.70221811072307e-06, - "loss": 0.8252, - "step": 32145 - }, - { - "epoch": 0.82, - "learning_rate": 1.7021984101457436e-06, - "loss": 0.801, - "step": 32146 - }, - { - "epoch": 0.82, - "learning_rate": 1.702178709030776e-06, - "loss": 0.627, - "step": 32147 - }, - { - "epoch": 0.82, - "learning_rate": 1.7021590073781827e-06, - "loss": 0.9365, - "step": 32148 - }, - { - "epoch": 0.82, - "learning_rate": 1.7021393051879781e-06, - "loss": 0.96, - "step": 32149 - }, - { - "epoch": 0.82, - "learning_rate": 1.7021196024601781e-06, - "loss": 0.8516, - "step": 32150 - }, - { - "epoch": 0.82, - "learning_rate": 1.7020998991947972e-06, - "loss": 0.8809, - "step": 32151 - }, - { - "epoch": 0.82, - "learning_rate": 1.7020801953918506e-06, - "loss": 0.6533, - "step": 32152 - }, - { - "epoch": 0.82, - "learning_rate": 1.7020604910513538e-06, - "loss": 0.8193, - "step": 32153 - }, - { - "epoch": 0.82, - "learning_rate": 1.7020407861733215e-06, - "loss": 0.7256, - "step": 32154 - }, - { - "epoch": 0.82, - "learning_rate": 1.7020210807577686e-06, - "loss": 0.96, - "step": 32155 - }, - { - "epoch": 0.82, - "learning_rate": 1.7020013748047108e-06, - "loss": 0.5815, - "step": 32156 - }, - { - "epoch": 0.82, - "learning_rate": 1.7019816683141626e-06, - "loss": 0.8076, - "step": 32157 - }, - { - "epoch": 0.82, - "learning_rate": 1.7019619612861393e-06, - "loss": 0.8535, - "step": 32158 - }, - { - "epoch": 0.82, - "learning_rate": 1.7019422537206563e-06, - "loss": 0.9414, - "step": 32159 - }, - { - "epoch": 0.82, - "learning_rate": 1.701922545617728e-06, - "loss": 0.8701, - "step": 32160 - }, - { - "epoch": 0.82, - "learning_rate": 1.70190283697737e-06, - "loss": 0.7041, - "step": 32161 - }, - { - "epoch": 0.82, - "learning_rate": 1.701883127799597e-06, - "loss": 0.9775, - "step": 32162 - }, - { - "epoch": 0.82, - "learning_rate": 1.701863418084425e-06, - "loss": 0.7129, - "step": 32163 - }, - { - "epoch": 0.82, - "learning_rate": 1.7018437078318679e-06, - "loss": 0.9688, - "step": 32164 - }, - { - "epoch": 0.82, - "learning_rate": 1.7018239970419418e-06, - "loss": 1.0107, - "step": 32165 - }, - { - "epoch": 0.82, - "learning_rate": 1.701804285714661e-06, - "loss": 0.8535, - "step": 32166 - }, - { - "epoch": 0.82, - "learning_rate": 1.701784573850041e-06, - "loss": 0.7676, - "step": 32167 - }, - { - "epoch": 0.82, - "learning_rate": 1.701764861448097e-06, - "loss": 0.7134, - "step": 32168 - }, - { - "epoch": 0.82, - "learning_rate": 1.7017451485088436e-06, - "loss": 0.7998, - "step": 32169 - }, - { - "epoch": 0.82, - "learning_rate": 1.7017254350322965e-06, - "loss": 0.7646, - "step": 32170 - }, - { - "epoch": 0.82, - "learning_rate": 1.7017057210184702e-06, - "loss": 0.8037, - "step": 32171 - }, - { - "epoch": 0.82, - "learning_rate": 1.7016860064673803e-06, - "loss": 0.9111, - "step": 32172 - }, - { - "epoch": 0.82, - "learning_rate": 1.7016662913790417e-06, - "loss": 0.7803, - "step": 32173 - }, - { - "epoch": 0.82, - "learning_rate": 1.7016465757534695e-06, - "loss": 0.8398, - "step": 32174 - }, - { - "epoch": 0.82, - "learning_rate": 1.7016268595906787e-06, - "loss": 1.1387, - "step": 32175 - }, - { - "epoch": 0.82, - "learning_rate": 1.7016071428906844e-06, - "loss": 0.9141, - "step": 32176 - }, - { - "epoch": 0.82, - "learning_rate": 1.7015874256535018e-06, - "loss": 0.9922, - "step": 32177 - }, - { - "epoch": 0.82, - "learning_rate": 1.701567707879146e-06, - "loss": 0.9766, - "step": 32178 - }, - { - "epoch": 0.82, - "learning_rate": 1.7015479895676322e-06, - "loss": 0.6973, - "step": 32179 - }, - { - "epoch": 0.82, - "learning_rate": 1.7015282707189753e-06, - "loss": 0.8599, - "step": 32180 - }, - { - "epoch": 0.82, - "learning_rate": 1.70150855133319e-06, - "loss": 0.7964, - "step": 32181 - }, - { - "epoch": 0.82, - "learning_rate": 1.7014888314102923e-06, - "loss": 0.9727, - "step": 32182 - }, - { - "epoch": 0.82, - "learning_rate": 1.7014691109502972e-06, - "loss": 0.8164, - "step": 32183 - }, - { - "epoch": 0.82, - "learning_rate": 1.701449389953219e-06, - "loss": 0.6577, - "step": 32184 - }, - { - "epoch": 0.82, - "learning_rate": 1.7014296684190733e-06, - "loss": 0.9092, - "step": 32185 - }, - { - "epoch": 0.82, - "learning_rate": 1.701409946347875e-06, - "loss": 0.7754, - "step": 32186 - }, - { - "epoch": 0.82, - "learning_rate": 1.7013902237396397e-06, - "loss": 0.9316, - "step": 32187 - }, - { - "epoch": 0.82, - "learning_rate": 1.7013705005943821e-06, - "loss": 0.6982, - "step": 32188 - }, - { - "epoch": 0.83, - "learning_rate": 1.7013507769121174e-06, - "loss": 0.7837, - "step": 32189 - }, - { - "epoch": 0.83, - "learning_rate": 1.7013310526928604e-06, - "loss": 1.1074, - "step": 32190 - }, - { - "epoch": 0.83, - "learning_rate": 1.7013113279366266e-06, - "loss": 0.8149, - "step": 32191 - }, - { - "epoch": 0.83, - "learning_rate": 1.701291602643431e-06, - "loss": 1.1914, - "step": 32192 - }, - { - "epoch": 0.83, - "learning_rate": 1.7012718768132886e-06, - "loss": 0.627, - "step": 32193 - }, - { - "epoch": 0.83, - "learning_rate": 1.7012521504462146e-06, - "loss": 0.8379, - "step": 32194 - }, - { - "epoch": 0.83, - "learning_rate": 1.701232423542224e-06, - "loss": 0.8428, - "step": 32195 - }, - { - "epoch": 0.83, - "learning_rate": 1.701212696101332e-06, - "loss": 1.0283, - "step": 32196 - }, - { - "epoch": 0.83, - "learning_rate": 1.7011929681235538e-06, - "loss": 0.6528, - "step": 32197 - }, - { - "epoch": 0.83, - "learning_rate": 1.7011732396089042e-06, - "loss": 0.8926, - "step": 32198 - }, - { - "epoch": 0.83, - "learning_rate": 1.7011535105573985e-06, - "loss": 0.9136, - "step": 32199 - }, - { - "epoch": 0.83, - "learning_rate": 1.7011337809690521e-06, - "loss": 0.9688, - "step": 32200 - }, - { - "epoch": 0.83, - "learning_rate": 1.7011140508438793e-06, - "loss": 0.8379, - "step": 32201 - }, - { - "epoch": 0.83, - "learning_rate": 1.7010943201818961e-06, - "loss": 0.7153, - "step": 32202 - }, - { - "epoch": 0.83, - "learning_rate": 1.7010745889831173e-06, - "loss": 0.998, - "step": 32203 - }, - { - "epoch": 0.83, - "learning_rate": 1.7010548572475578e-06, - "loss": 0.9932, - "step": 32204 - }, - { - "epoch": 0.83, - "learning_rate": 1.7010351249752327e-06, - "loss": 0.9551, - "step": 32205 - }, - { - "epoch": 0.83, - "learning_rate": 1.7010153921661572e-06, - "loss": 0.8633, - "step": 32206 - }, - { - "epoch": 0.83, - "learning_rate": 1.7009956588203466e-06, - "loss": 1.1104, - "step": 32207 - }, - { - "epoch": 0.83, - "learning_rate": 1.7009759249378156e-06, - "loss": 0.875, - "step": 32208 - }, - { - "epoch": 0.83, - "learning_rate": 1.70095619051858e-06, - "loss": 0.6794, - "step": 32209 - }, - { - "epoch": 0.83, - "learning_rate": 1.7009364555626542e-06, - "loss": 0.7539, - "step": 32210 - }, - { - "epoch": 0.83, - "learning_rate": 1.7009167200700536e-06, - "loss": 0.9209, - "step": 32211 - }, - { - "epoch": 0.83, - "learning_rate": 1.7008969840407935e-06, - "loss": 0.7036, - "step": 32212 - }, - { - "epoch": 0.83, - "learning_rate": 1.7008772474748886e-06, - "loss": 0.6338, - "step": 32213 - }, - { - "epoch": 0.83, - "learning_rate": 1.7008575103723541e-06, - "loss": 0.7097, - "step": 32214 - }, - { - "epoch": 0.83, - "learning_rate": 1.7008377727332056e-06, - "loss": 0.5322, - "step": 32215 - }, - { - "epoch": 0.83, - "learning_rate": 1.7008180345574577e-06, - "loss": 0.8844, - "step": 32216 - }, - { - "epoch": 0.83, - "learning_rate": 1.7007982958451254e-06, - "loss": 1.0, - "step": 32217 - }, - { - "epoch": 0.83, - "learning_rate": 1.7007785565962242e-06, - "loss": 0.8975, - "step": 32218 - }, - { - "epoch": 0.83, - "learning_rate": 1.7007588168107691e-06, - "loss": 0.75, - "step": 32219 - }, - { - "epoch": 0.83, - "learning_rate": 1.7007390764887752e-06, - "loss": 0.7549, - "step": 32220 - }, - { - "epoch": 0.83, - "learning_rate": 1.7007193356302578e-06, - "loss": 0.7114, - "step": 32221 - }, - { - "epoch": 0.83, - "learning_rate": 1.7006995942352317e-06, - "loss": 0.6616, - "step": 32222 - }, - { - "epoch": 0.83, - "learning_rate": 1.700679852303712e-06, - "loss": 0.8447, - "step": 32223 - }, - { - "epoch": 0.83, - "learning_rate": 1.7006601098357144e-06, - "loss": 1.1289, - "step": 32224 - }, - { - "epoch": 0.83, - "learning_rate": 1.700640366831253e-06, - "loss": 0.7959, - "step": 32225 - }, - { - "epoch": 0.83, - "learning_rate": 1.7006206232903437e-06, - "loss": 0.7192, - "step": 32226 - }, - { - "epoch": 0.83, - "learning_rate": 1.7006008792130014e-06, - "loss": 0.917, - "step": 32227 - }, - { - "epoch": 0.83, - "learning_rate": 1.7005811345992415e-06, - "loss": 1.0361, - "step": 32228 - }, - { - "epoch": 0.83, - "learning_rate": 1.7005613894490785e-06, - "loss": 0.6829, - "step": 32229 - }, - { - "epoch": 0.83, - "learning_rate": 1.700541643762528e-06, - "loss": 0.7236, - "step": 32230 - }, - { - "epoch": 0.83, - "learning_rate": 1.7005218975396049e-06, - "loss": 0.7773, - "step": 32231 - }, - { - "epoch": 0.83, - "learning_rate": 1.7005021507803243e-06, - "loss": 0.8599, - "step": 32232 - }, - { - "epoch": 0.83, - "learning_rate": 1.7004824034847016e-06, - "loss": 1.0938, - "step": 32233 - }, - { - "epoch": 0.83, - "learning_rate": 1.7004626556527518e-06, - "loss": 0.7676, - "step": 32234 - }, - { - "epoch": 0.83, - "learning_rate": 1.7004429072844897e-06, - "loss": 0.6851, - "step": 32235 - }, - { - "epoch": 0.83, - "learning_rate": 1.7004231583799307e-06, - "loss": 0.7417, - "step": 32236 - }, - { - "epoch": 0.83, - "learning_rate": 1.7004034089390901e-06, - "loss": 0.835, - "step": 32237 - }, - { - "epoch": 0.83, - "learning_rate": 1.7003836589619826e-06, - "loss": 0.7705, - "step": 32238 - }, - { - "epoch": 0.83, - "learning_rate": 1.7003639084486236e-06, - "loss": 0.8604, - "step": 32239 - }, - { - "epoch": 0.83, - "learning_rate": 1.7003441573990282e-06, - "loss": 1.0645, - "step": 32240 - }, - { - "epoch": 0.83, - "learning_rate": 1.7003244058132115e-06, - "loss": 0.8701, - "step": 32241 - }, - { - "epoch": 0.83, - "learning_rate": 1.7003046536911887e-06, - "loss": 0.6855, - "step": 32242 - }, - { - "epoch": 0.83, - "learning_rate": 1.7002849010329748e-06, - "loss": 0.7651, - "step": 32243 - }, - { - "epoch": 0.83, - "learning_rate": 1.7002651478385848e-06, - "loss": 0.7793, - "step": 32244 - }, - { - "epoch": 0.83, - "learning_rate": 1.700245394108034e-06, - "loss": 0.7725, - "step": 32245 - }, - { - "epoch": 0.83, - "learning_rate": 1.7002256398413375e-06, - "loss": 0.8887, - "step": 32246 - }, - { - "epoch": 0.83, - "learning_rate": 1.7002058850385105e-06, - "loss": 0.9199, - "step": 32247 - }, - { - "epoch": 0.83, - "learning_rate": 1.700186129699568e-06, - "loss": 0.8467, - "step": 32248 - }, - { - "epoch": 0.83, - "learning_rate": 1.7001663738245253e-06, - "loss": 0.9678, - "step": 32249 - }, - { - "epoch": 0.83, - "learning_rate": 1.7001466174133972e-06, - "loss": 0.9092, - "step": 32250 - }, - { - "epoch": 0.83, - "learning_rate": 1.7001268604661992e-06, - "loss": 0.7993, - "step": 32251 - }, - { - "epoch": 0.83, - "learning_rate": 1.700107102982946e-06, - "loss": 0.7163, - "step": 32252 - }, - { - "epoch": 0.83, - "learning_rate": 1.7000873449636532e-06, - "loss": 0.9531, - "step": 32253 - }, - { - "epoch": 0.83, - "learning_rate": 1.7000675864083357e-06, - "loss": 0.8521, - "step": 32254 - }, - { - "epoch": 0.83, - "learning_rate": 1.7000478273170086e-06, - "loss": 1.0391, - "step": 32255 - }, - { - "epoch": 0.83, - "learning_rate": 1.700028067689687e-06, - "loss": 0.7715, - "step": 32256 - }, - { - "epoch": 0.83, - "learning_rate": 1.700008307526386e-06, - "loss": 0.688, - "step": 32257 - }, - { - "epoch": 0.83, - "learning_rate": 1.699988546827121e-06, - "loss": 0.8975, - "step": 32258 - }, - { - "epoch": 0.83, - "learning_rate": 1.6999687855919072e-06, - "loss": 0.541, - "step": 32259 - }, - { - "epoch": 0.83, - "learning_rate": 1.6999490238207591e-06, - "loss": 0.9619, - "step": 32260 - }, - { - "epoch": 0.83, - "learning_rate": 1.6999292615136924e-06, - "loss": 0.8457, - "step": 32261 - }, - { - "epoch": 0.83, - "learning_rate": 1.699909498670722e-06, - "loss": 0.593, - "step": 32262 - }, - { - "epoch": 0.83, - "learning_rate": 1.6998897352918632e-06, - "loss": 0.8691, - "step": 32263 - }, - { - "epoch": 0.83, - "learning_rate": 1.6998699713771307e-06, - "loss": 0.7422, - "step": 32264 - }, - { - "epoch": 0.83, - "learning_rate": 1.6998502069265404e-06, - "loss": 0.9219, - "step": 32265 - }, - { - "epoch": 0.83, - "learning_rate": 1.6998304419401066e-06, - "loss": 0.6094, - "step": 32266 - }, - { - "epoch": 0.83, - "learning_rate": 1.699810676417845e-06, - "loss": 0.8804, - "step": 32267 - }, - { - "epoch": 0.83, - "learning_rate": 1.6997909103597703e-06, - "loss": 0.9307, - "step": 32268 - }, - { - "epoch": 0.83, - "learning_rate": 1.699771143765898e-06, - "loss": 0.9756, - "step": 32269 - }, - { - "epoch": 0.83, - "learning_rate": 1.6997513766362433e-06, - "loss": 0.8477, - "step": 32270 - }, - { - "epoch": 0.83, - "learning_rate": 1.699731608970821e-06, - "loss": 0.7915, - "step": 32271 - }, - { - "epoch": 0.83, - "learning_rate": 1.6997118407696463e-06, - "loss": 1.0957, - "step": 32272 - }, - { - "epoch": 0.83, - "learning_rate": 1.6996920720327345e-06, - "loss": 0.7051, - "step": 32273 - }, - { - "epoch": 0.83, - "learning_rate": 1.6996723027601008e-06, - "loss": 0.8506, - "step": 32274 - }, - { - "epoch": 0.83, - "learning_rate": 1.6996525329517599e-06, - "loss": 0.7861, - "step": 32275 - }, - { - "epoch": 0.83, - "learning_rate": 1.6996327626077273e-06, - "loss": 0.6855, - "step": 32276 - }, - { - "epoch": 0.83, - "learning_rate": 1.6996129917280183e-06, - "loss": 0.8545, - "step": 32277 - }, - { - "epoch": 0.83, - "learning_rate": 1.6995932203126477e-06, - "loss": 1.0879, - "step": 32278 - }, - { - "epoch": 0.83, - "learning_rate": 1.6995734483616306e-06, - "loss": 0.6411, - "step": 32279 - }, - { - "epoch": 0.83, - "learning_rate": 1.6995536758749825e-06, - "loss": 0.6772, - "step": 32280 - }, - { - "epoch": 0.83, - "learning_rate": 1.699533902852718e-06, - "loss": 0.7695, - "step": 32281 - }, - { - "epoch": 0.83, - "learning_rate": 1.6995141292948527e-06, - "loss": 0.9795, - "step": 32282 - }, - { - "epoch": 0.83, - "learning_rate": 1.6994943552014015e-06, - "loss": 0.791, - "step": 32283 - }, - { - "epoch": 0.83, - "learning_rate": 1.6994745805723799e-06, - "loss": 0.8457, - "step": 32284 - }, - { - "epoch": 0.83, - "learning_rate": 1.6994548054078026e-06, - "loss": 0.835, - "step": 32285 - }, - { - "epoch": 0.83, - "learning_rate": 1.699435029707685e-06, - "loss": 0.9463, - "step": 32286 - }, - { - "epoch": 0.83, - "learning_rate": 1.699415253472042e-06, - "loss": 0.9951, - "step": 32287 - }, - { - "epoch": 0.83, - "learning_rate": 1.6993954767008891e-06, - "loss": 0.7285, - "step": 32288 - }, - { - "epoch": 0.83, - "learning_rate": 1.699375699394241e-06, - "loss": 0.7822, - "step": 32289 - }, - { - "epoch": 0.83, - "learning_rate": 1.6993559215521133e-06, - "loss": 0.8252, - "step": 32290 - }, - { - "epoch": 0.83, - "learning_rate": 1.6993361431745209e-06, - "loss": 0.542, - "step": 32291 - }, - { - "epoch": 0.83, - "learning_rate": 1.6993163642614787e-06, - "loss": 0.8301, - "step": 32292 - }, - { - "epoch": 0.83, - "learning_rate": 1.6992965848130028e-06, - "loss": 0.6802, - "step": 32293 - }, - { - "epoch": 0.83, - "learning_rate": 1.699276804829107e-06, - "loss": 0.875, - "step": 32294 - }, - { - "epoch": 0.83, - "learning_rate": 1.6992570243098073e-06, - "loss": 0.9189, - "step": 32295 - }, - { - "epoch": 0.83, - "learning_rate": 1.6992372432551188e-06, - "loss": 0.7192, - "step": 32296 - }, - { - "epoch": 0.83, - "learning_rate": 1.6992174616650563e-06, - "loss": 0.8135, - "step": 32297 - }, - { - "epoch": 0.83, - "learning_rate": 1.6991976795396353e-06, - "loss": 0.8828, - "step": 32298 - }, - { - "epoch": 0.83, - "learning_rate": 1.6991778968788706e-06, - "loss": 0.9512, - "step": 32299 - }, - { - "epoch": 0.83, - "learning_rate": 1.6991581136827775e-06, - "loss": 0.8672, - "step": 32300 - }, - { - "epoch": 0.83, - "learning_rate": 1.6991383299513713e-06, - "loss": 1.1553, - "step": 32301 - }, - { - "epoch": 0.83, - "learning_rate": 1.6991185456846671e-06, - "loss": 0.9697, - "step": 32302 - }, - { - "epoch": 0.83, - "learning_rate": 1.69909876088268e-06, - "loss": 0.8926, - "step": 32303 - }, - { - "epoch": 0.83, - "learning_rate": 1.6990789755454249e-06, - "loss": 0.8096, - "step": 32304 - }, - { - "epoch": 0.83, - "learning_rate": 1.6990591896729173e-06, - "loss": 0.8994, - "step": 32305 - }, - { - "epoch": 0.83, - "learning_rate": 1.6990394032651722e-06, - "loss": 0.9053, - "step": 32306 - }, - { - "epoch": 0.83, - "learning_rate": 1.6990196163222047e-06, - "loss": 0.689, - "step": 32307 - }, - { - "epoch": 0.83, - "learning_rate": 1.6989998288440304e-06, - "loss": 0.8389, - "step": 32308 - }, - { - "epoch": 0.83, - "learning_rate": 1.6989800408306636e-06, - "loss": 0.96, - "step": 32309 - }, - { - "epoch": 0.83, - "learning_rate": 1.69896025228212e-06, - "loss": 0.97, - "step": 32310 - }, - { - "epoch": 0.83, - "learning_rate": 1.698940463198415e-06, - "loss": 0.6951, - "step": 32311 - }, - { - "epoch": 0.83, - "learning_rate": 1.698920673579563e-06, - "loss": 1.0059, - "step": 32312 - }, - { - "epoch": 0.83, - "learning_rate": 1.69890088342558e-06, - "loss": 0.8887, - "step": 32313 - }, - { - "epoch": 0.83, - "learning_rate": 1.6988810927364805e-06, - "loss": 0.8247, - "step": 32314 - }, - { - "epoch": 0.83, - "learning_rate": 1.6988613015122799e-06, - "loss": 0.9268, - "step": 32315 - }, - { - "epoch": 0.83, - "learning_rate": 1.6988415097529933e-06, - "loss": 0.9053, - "step": 32316 - }, - { - "epoch": 0.83, - "learning_rate": 1.698821717458636e-06, - "loss": 0.6719, - "step": 32317 - }, - { - "epoch": 0.83, - "learning_rate": 1.6988019246292228e-06, - "loss": 0.7959, - "step": 32318 - }, - { - "epoch": 0.83, - "learning_rate": 1.6987821312647694e-06, - "loss": 0.6631, - "step": 32319 - }, - { - "epoch": 0.83, - "learning_rate": 1.6987623373652906e-06, - "loss": 0.8965, - "step": 32320 - }, - { - "epoch": 0.83, - "learning_rate": 1.6987425429308014e-06, - "loss": 0.8711, - "step": 32321 - }, - { - "epoch": 0.83, - "learning_rate": 1.6987227479613174e-06, - "loss": 0.8438, - "step": 32322 - }, - { - "epoch": 0.83, - "learning_rate": 1.6987029524568532e-06, - "loss": 0.873, - "step": 32323 - }, - { - "epoch": 0.83, - "learning_rate": 1.6986831564174246e-06, - "loss": 0.7769, - "step": 32324 - }, - { - "epoch": 0.83, - "learning_rate": 1.6986633598430463e-06, - "loss": 0.9033, - "step": 32325 - }, - { - "epoch": 0.83, - "learning_rate": 1.6986435627337336e-06, - "loss": 0.9961, - "step": 32326 - }, - { - "epoch": 0.83, - "learning_rate": 1.6986237650895016e-06, - "loss": 0.9014, - "step": 32327 - }, - { - "epoch": 0.83, - "learning_rate": 1.6986039669103657e-06, - "loss": 0.8301, - "step": 32328 - }, - { - "epoch": 0.83, - "learning_rate": 1.6985841681963406e-06, - "loss": 0.9033, - "step": 32329 - }, - { - "epoch": 0.83, - "learning_rate": 1.698564368947442e-06, - "loss": 0.8965, - "step": 32330 - }, - { - "epoch": 0.83, - "learning_rate": 1.6985445691636846e-06, - "loss": 0.9766, - "step": 32331 - }, - { - "epoch": 0.83, - "learning_rate": 1.698524768845084e-06, - "loss": 0.7666, - "step": 32332 - }, - { - "epoch": 0.83, - "learning_rate": 1.6985049679916545e-06, - "loss": 0.7681, - "step": 32333 - }, - { - "epoch": 0.83, - "learning_rate": 1.6984851666034126e-06, - "loss": 0.7793, - "step": 32334 - }, - { - "epoch": 0.83, - "learning_rate": 1.698465364680372e-06, - "loss": 0.834, - "step": 32335 - }, - { - "epoch": 0.83, - "learning_rate": 1.698445562222549e-06, - "loss": 0.8232, - "step": 32336 - }, - { - "epoch": 0.83, - "learning_rate": 1.6984257592299583e-06, - "loss": 0.8447, - "step": 32337 - }, - { - "epoch": 0.83, - "learning_rate": 1.6984059557026153e-06, - "loss": 0.6357, - "step": 32338 - }, - { - "epoch": 0.83, - "learning_rate": 1.698386151640535e-06, - "loss": 0.7979, - "step": 32339 - }, - { - "epoch": 0.83, - "learning_rate": 1.6983663470437322e-06, - "loss": 0.8574, - "step": 32340 - }, - { - "epoch": 0.83, - "learning_rate": 1.6983465419122226e-06, - "loss": 0.7104, - "step": 32341 - }, - { - "epoch": 0.83, - "learning_rate": 1.6983267362460213e-06, - "loss": 0.9609, - "step": 32342 - }, - { - "epoch": 0.83, - "learning_rate": 1.6983069300451427e-06, - "loss": 1.0723, - "step": 32343 - }, - { - "epoch": 0.83, - "learning_rate": 1.698287123309603e-06, - "loss": 0.8525, - "step": 32344 - }, - { - "epoch": 0.83, - "learning_rate": 1.6982673160394172e-06, - "loss": 0.6587, - "step": 32345 - }, - { - "epoch": 0.83, - "learning_rate": 1.6982475082346e-06, - "loss": 1.0449, - "step": 32346 - }, - { - "epoch": 0.83, - "learning_rate": 1.6982276998951668e-06, - "loss": 0.9092, - "step": 32347 - }, - { - "epoch": 0.83, - "learning_rate": 1.6982078910211329e-06, - "loss": 0.8237, - "step": 32348 - }, - { - "epoch": 0.83, - "learning_rate": 1.698188081612513e-06, - "loss": 0.6575, - "step": 32349 - }, - { - "epoch": 0.83, - "learning_rate": 1.6981682716693226e-06, - "loss": 0.4856, - "step": 32350 - }, - { - "epoch": 0.83, - "learning_rate": 1.698148461191577e-06, - "loss": 0.7871, - "step": 32351 - }, - { - "epoch": 0.83, - "learning_rate": 1.6981286501792913e-06, - "loss": 0.9355, - "step": 32352 - }, - { - "epoch": 0.83, - "learning_rate": 1.6981088386324807e-06, - "loss": 0.9824, - "step": 32353 - }, - { - "epoch": 0.83, - "learning_rate": 1.6980890265511598e-06, - "loss": 0.8032, - "step": 32354 - }, - { - "epoch": 0.83, - "learning_rate": 1.6980692139353445e-06, - "loss": 0.9258, - "step": 32355 - }, - { - "epoch": 0.83, - "learning_rate": 1.69804940078505e-06, - "loss": 1.0498, - "step": 32356 - }, - { - "epoch": 0.83, - "learning_rate": 1.6980295871002908e-06, - "loss": 0.9043, - "step": 32357 - }, - { - "epoch": 0.83, - "learning_rate": 1.6980097728810826e-06, - "loss": 0.9121, - "step": 32358 - }, - { - "epoch": 0.83, - "learning_rate": 1.6979899581274402e-06, - "loss": 0.6704, - "step": 32359 - }, - { - "epoch": 0.83, - "learning_rate": 1.6979701428393791e-06, - "loss": 0.792, - "step": 32360 - }, - { - "epoch": 0.83, - "learning_rate": 1.6979503270169144e-06, - "loss": 1.0654, - "step": 32361 - }, - { - "epoch": 0.83, - "learning_rate": 1.6979305106600612e-06, - "loss": 0.8213, - "step": 32362 - }, - { - "epoch": 0.83, - "learning_rate": 1.6979106937688349e-06, - "loss": 0.8652, - "step": 32363 - }, - { - "epoch": 0.83, - "learning_rate": 1.69789087634325e-06, - "loss": 0.6978, - "step": 32364 - }, - { - "epoch": 0.83, - "learning_rate": 1.6978710583833228e-06, - "loss": 1.0186, - "step": 32365 - }, - { - "epoch": 0.83, - "learning_rate": 1.6978512398890673e-06, - "loss": 0.7866, - "step": 32366 - }, - { - "epoch": 0.83, - "learning_rate": 1.6978314208604994e-06, - "loss": 0.7007, - "step": 32367 - }, - { - "epoch": 0.83, - "learning_rate": 1.697811601297634e-06, - "loss": 0.7207, - "step": 32368 - }, - { - "epoch": 0.83, - "learning_rate": 1.6977917812004864e-06, - "loss": 0.7422, - "step": 32369 - }, - { - "epoch": 0.83, - "learning_rate": 1.6977719605690717e-06, - "loss": 0.8359, - "step": 32370 - }, - { - "epoch": 0.83, - "learning_rate": 1.697752139403405e-06, - "loss": 0.9795, - "step": 32371 - }, - { - "epoch": 0.83, - "learning_rate": 1.6977323177035014e-06, - "loss": 0.9033, - "step": 32372 - }, - { - "epoch": 0.83, - "learning_rate": 1.6977124954693767e-06, - "loss": 0.8008, - "step": 32373 - }, - { - "epoch": 0.83, - "learning_rate": 1.6976926727010455e-06, - "loss": 0.814, - "step": 32374 - }, - { - "epoch": 0.83, - "learning_rate": 1.6976728493985228e-06, - "loss": 0.835, - "step": 32375 - }, - { - "epoch": 0.83, - "learning_rate": 1.6976530255618245e-06, - "loss": 1.0059, - "step": 32376 - }, - { - "epoch": 0.83, - "learning_rate": 1.697633201190965e-06, - "loss": 0.9214, - "step": 32377 - }, - { - "epoch": 0.83, - "learning_rate": 1.6976133762859601e-06, - "loss": 0.6667, - "step": 32378 - }, - { - "epoch": 0.83, - "learning_rate": 1.6975935508468245e-06, - "loss": 0.9092, - "step": 32379 - }, - { - "epoch": 0.83, - "learning_rate": 1.6975737248735737e-06, - "loss": 0.8506, - "step": 32380 - }, - { - "epoch": 0.83, - "learning_rate": 1.6975538983662229e-06, - "loss": 1.0098, - "step": 32381 - }, - { - "epoch": 0.83, - "learning_rate": 1.697534071324787e-06, - "loss": 0.7852, - "step": 32382 - }, - { - "epoch": 0.83, - "learning_rate": 1.697514243749281e-06, - "loss": 0.8506, - "step": 32383 - }, - { - "epoch": 0.83, - "learning_rate": 1.697494415639721e-06, - "loss": 0.439, - "step": 32384 - }, - { - "epoch": 0.83, - "learning_rate": 1.6974745869961213e-06, - "loss": 0.7764, - "step": 32385 - }, - { - "epoch": 0.83, - "learning_rate": 1.6974547578184974e-06, - "loss": 0.7871, - "step": 32386 - }, - { - "epoch": 0.83, - "learning_rate": 1.6974349281068648e-06, - "loss": 0.5645, - "step": 32387 - }, - { - "epoch": 0.83, - "learning_rate": 1.697415097861238e-06, - "loss": 0.7637, - "step": 32388 - }, - { - "epoch": 0.83, - "learning_rate": 1.6973952670816325e-06, - "loss": 0.8301, - "step": 32389 - }, - { - "epoch": 0.83, - "learning_rate": 1.6973754357680634e-06, - "loss": 0.9873, - "step": 32390 - }, - { - "epoch": 0.83, - "learning_rate": 1.6973556039205463e-06, - "loss": 0.8613, - "step": 32391 - }, - { - "epoch": 0.83, - "learning_rate": 1.6973357715390961e-06, - "loss": 0.7593, - "step": 32392 - }, - { - "epoch": 0.83, - "learning_rate": 1.6973159386237278e-06, - "loss": 1.0947, - "step": 32393 - }, - { - "epoch": 0.83, - "learning_rate": 1.6972961051744568e-06, - "loss": 0.5903, - "step": 32394 - }, - { - "epoch": 0.83, - "learning_rate": 1.6972762711912982e-06, - "loss": 0.9502, - "step": 32395 - }, - { - "epoch": 0.83, - "learning_rate": 1.6972564366742672e-06, - "loss": 0.9482, - "step": 32396 - }, - { - "epoch": 0.83, - "learning_rate": 1.6972366016233793e-06, - "loss": 0.8867, - "step": 32397 - }, - { - "epoch": 0.83, - "learning_rate": 1.697216766038649e-06, - "loss": 0.9453, - "step": 32398 - }, - { - "epoch": 0.83, - "learning_rate": 1.6971969299200919e-06, - "loss": 1.041, - "step": 32399 - }, - { - "epoch": 0.83, - "learning_rate": 1.6971770932677232e-06, - "loss": 0.8066, - "step": 32400 - }, - { - "epoch": 0.83, - "learning_rate": 1.6971572560815585e-06, - "loss": 0.958, - "step": 32401 - }, - { - "epoch": 0.83, - "learning_rate": 1.6971374183616121e-06, - "loss": 0.7461, - "step": 32402 - }, - { - "epoch": 0.83, - "learning_rate": 1.6971175801078993e-06, - "loss": 1.0215, - "step": 32403 - }, - { - "epoch": 0.83, - "learning_rate": 1.6970977413204364e-06, - "loss": 0.9463, - "step": 32404 - }, - { - "epoch": 0.83, - "learning_rate": 1.6970779019992372e-06, - "loss": 0.8574, - "step": 32405 - }, - { - "epoch": 0.83, - "learning_rate": 1.6970580621443178e-06, - "loss": 0.9648, - "step": 32406 - }, - { - "epoch": 0.83, - "learning_rate": 1.6970382217556934e-06, - "loss": 0.917, - "step": 32407 - }, - { - "epoch": 0.83, - "learning_rate": 1.6970183808333785e-06, - "loss": 0.8574, - "step": 32408 - }, - { - "epoch": 0.83, - "learning_rate": 1.6969985393773887e-06, - "loss": 0.7856, - "step": 32409 - }, - { - "epoch": 0.83, - "learning_rate": 1.6969786973877392e-06, - "loss": 0.9355, - "step": 32410 - }, - { - "epoch": 0.83, - "learning_rate": 1.6969588548644448e-06, - "loss": 0.8506, - "step": 32411 - }, - { - "epoch": 0.83, - "learning_rate": 1.6969390118075216e-06, - "loss": 0.834, - "step": 32412 - }, - { - "epoch": 0.83, - "learning_rate": 1.696919168216984e-06, - "loss": 0.833, - "step": 32413 - }, - { - "epoch": 0.83, - "learning_rate": 1.6968993240928476e-06, - "loss": 0.9414, - "step": 32414 - }, - { - "epoch": 0.83, - "learning_rate": 1.6968794794351272e-06, - "loss": 0.6855, - "step": 32415 - }, - { - "epoch": 0.83, - "learning_rate": 1.6968596342438382e-06, - "loss": 0.8672, - "step": 32416 - }, - { - "epoch": 0.83, - "learning_rate": 1.696839788518996e-06, - "loss": 1.1602, - "step": 32417 - }, - { - "epoch": 0.83, - "learning_rate": 1.6968199422606157e-06, - "loss": 0.7227, - "step": 32418 - }, - { - "epoch": 0.83, - "learning_rate": 1.6968000954687123e-06, - "loss": 0.7236, - "step": 32419 - }, - { - "epoch": 0.83, - "learning_rate": 1.696780248143301e-06, - "loss": 0.7363, - "step": 32420 - }, - { - "epoch": 0.83, - "learning_rate": 1.6967604002843972e-06, - "loss": 0.8301, - "step": 32421 - }, - { - "epoch": 0.83, - "learning_rate": 1.6967405518920161e-06, - "loss": 0.6475, - "step": 32422 - }, - { - "epoch": 0.83, - "learning_rate": 1.6967207029661727e-06, - "loss": 0.9497, - "step": 32423 - }, - { - "epoch": 0.83, - "learning_rate": 1.6967008535068823e-06, - "loss": 0.8315, - "step": 32424 - }, - { - "epoch": 0.83, - "learning_rate": 1.6966810035141598e-06, - "loss": 0.9717, - "step": 32425 - }, - { - "epoch": 0.83, - "learning_rate": 1.696661152988021e-06, - "loss": 0.8223, - "step": 32426 - }, - { - "epoch": 0.83, - "learning_rate": 1.6966413019284809e-06, - "loss": 0.625, - "step": 32427 - }, - { - "epoch": 0.83, - "learning_rate": 1.6966214503355545e-06, - "loss": 0.7445, - "step": 32428 - }, - { - "epoch": 0.83, - "learning_rate": 1.696601598209257e-06, - "loss": 0.9512, - "step": 32429 - }, - { - "epoch": 0.83, - "learning_rate": 1.6965817455496036e-06, - "loss": 0.8232, - "step": 32430 - }, - { - "epoch": 0.83, - "learning_rate": 1.6965618923566098e-06, - "loss": 0.7329, - "step": 32431 - }, - { - "epoch": 0.83, - "learning_rate": 1.6965420386302903e-06, - "loss": 0.7134, - "step": 32432 - }, - { - "epoch": 0.83, - "learning_rate": 1.696522184370661e-06, - "loss": 0.6416, - "step": 32433 - }, - { - "epoch": 0.83, - "learning_rate": 1.6965023295777362e-06, - "loss": 0.8672, - "step": 32434 - }, - { - "epoch": 0.83, - "learning_rate": 1.696482474251532e-06, - "loss": 0.8955, - "step": 32435 - }, - { - "epoch": 0.83, - "learning_rate": 1.696462618392063e-06, - "loss": 0.7227, - "step": 32436 - }, - { - "epoch": 0.83, - "learning_rate": 1.6964427619993447e-06, - "loss": 0.9277, - "step": 32437 - }, - { - "epoch": 0.83, - "learning_rate": 1.6964229050733922e-06, - "loss": 0.6787, - "step": 32438 - }, - { - "epoch": 0.83, - "learning_rate": 1.6964030476142206e-06, - "loss": 1.041, - "step": 32439 - }, - { - "epoch": 0.83, - "learning_rate": 1.6963831896218453e-06, - "loss": 0.6553, - "step": 32440 - }, - { - "epoch": 0.83, - "learning_rate": 1.6963633310962812e-06, - "loss": 0.7954, - "step": 32441 - }, - { - "epoch": 0.83, - "learning_rate": 1.6963434720375442e-06, - "loss": 0.7744, - "step": 32442 - }, - { - "epoch": 0.83, - "learning_rate": 1.6963236124456487e-06, - "loss": 0.833, - "step": 32443 - }, - { - "epoch": 0.83, - "learning_rate": 1.69630375232061e-06, - "loss": 0.8818, - "step": 32444 - }, - { - "epoch": 0.83, - "learning_rate": 1.696283891662444e-06, - "loss": 0.783, - "step": 32445 - }, - { - "epoch": 0.83, - "learning_rate": 1.6962640304711654e-06, - "loss": 0.9336, - "step": 32446 - }, - { - "epoch": 0.83, - "learning_rate": 1.696244168746789e-06, - "loss": 0.9375, - "step": 32447 - }, - { - "epoch": 0.83, - "learning_rate": 1.6962243064893308e-06, - "loss": 1.0742, - "step": 32448 - }, - { - "epoch": 0.83, - "learning_rate": 1.6962044436988054e-06, - "loss": 0.7729, - "step": 32449 - }, - { - "epoch": 0.83, - "learning_rate": 1.6961845803752283e-06, - "loss": 0.8115, - "step": 32450 - }, - { - "epoch": 0.83, - "learning_rate": 1.696164716518615e-06, - "loss": 0.9619, - "step": 32451 - }, - { - "epoch": 0.83, - "learning_rate": 1.6961448521289805e-06, - "loss": 1.0195, - "step": 32452 - }, - { - "epoch": 0.83, - "learning_rate": 1.6961249872063394e-06, - "loss": 0.8789, - "step": 32453 - }, - { - "epoch": 0.83, - "learning_rate": 1.6961051217507077e-06, - "loss": 0.7451, - "step": 32454 - }, - { - "epoch": 0.83, - "learning_rate": 1.6960852557621002e-06, - "loss": 0.644, - "step": 32455 - }, - { - "epoch": 0.83, - "learning_rate": 1.696065389240532e-06, - "loss": 0.8047, - "step": 32456 - }, - { - "epoch": 0.83, - "learning_rate": 1.6960455221860191e-06, - "loss": 0.9346, - "step": 32457 - }, - { - "epoch": 0.83, - "learning_rate": 1.6960256545985758e-06, - "loss": 0.7788, - "step": 32458 - }, - { - "epoch": 0.83, - "learning_rate": 1.6960057864782176e-06, - "loss": 0.9326, - "step": 32459 - }, - { - "epoch": 0.83, - "learning_rate": 1.69598591782496e-06, - "loss": 0.5102, - "step": 32460 - }, - { - "epoch": 0.83, - "learning_rate": 1.6959660486388177e-06, - "loss": 0.8799, - "step": 32461 - }, - { - "epoch": 0.83, - "learning_rate": 1.6959461789198066e-06, - "loss": 0.5645, - "step": 32462 - }, - { - "epoch": 0.83, - "learning_rate": 1.695926308667941e-06, - "loss": 0.8301, - "step": 32463 - }, - { - "epoch": 0.83, - "learning_rate": 1.6959064378832371e-06, - "loss": 0.8379, - "step": 32464 - }, - { - "epoch": 0.83, - "learning_rate": 1.6958865665657093e-06, - "loss": 0.6826, - "step": 32465 - }, - { - "epoch": 0.83, - "learning_rate": 1.6958666947153734e-06, - "loss": 0.8096, - "step": 32466 - }, - { - "epoch": 0.83, - "learning_rate": 1.6958468223322444e-06, - "loss": 0.6465, - "step": 32467 - }, - { - "epoch": 0.83, - "learning_rate": 1.6958269494163374e-06, - "loss": 0.8398, - "step": 32468 - }, - { - "epoch": 0.83, - "learning_rate": 1.6958070759676675e-06, - "loss": 1.0303, - "step": 32469 - }, - { - "epoch": 0.83, - "learning_rate": 1.69578720198625e-06, - "loss": 0.9414, - "step": 32470 - }, - { - "epoch": 0.83, - "learning_rate": 1.6957673274721005e-06, - "loss": 0.9902, - "step": 32471 - }, - { - "epoch": 0.83, - "learning_rate": 1.695747452425234e-06, - "loss": 0.9766, - "step": 32472 - }, - { - "epoch": 0.83, - "learning_rate": 1.6957275768456656e-06, - "loss": 1.0557, - "step": 32473 - }, - { - "epoch": 0.83, - "learning_rate": 1.6957077007334108e-06, - "loss": 0.8438, - "step": 32474 - }, - { - "epoch": 0.83, - "learning_rate": 1.6956878240884842e-06, - "loss": 0.9668, - "step": 32475 - }, - { - "epoch": 0.83, - "learning_rate": 1.6956679469109017e-06, - "loss": 0.9092, - "step": 32476 - }, - { - "epoch": 0.83, - "learning_rate": 1.6956480692006783e-06, - "loss": 0.8086, - "step": 32477 - }, - { - "epoch": 0.83, - "learning_rate": 1.695628190957829e-06, - "loss": 0.5361, - "step": 32478 - }, - { - "epoch": 0.83, - "learning_rate": 1.6956083121823692e-06, - "loss": 0.6602, - "step": 32479 - }, - { - "epoch": 0.83, - "learning_rate": 1.695588432874314e-06, - "loss": 0.8027, - "step": 32480 - }, - { - "epoch": 0.83, - "learning_rate": 1.6955685530336787e-06, - "loss": 0.9365, - "step": 32481 - }, - { - "epoch": 0.83, - "learning_rate": 1.6955486726604789e-06, - "loss": 0.8486, - "step": 32482 - }, - { - "epoch": 0.83, - "learning_rate": 1.6955287917547293e-06, - "loss": 0.8398, - "step": 32483 - }, - { - "epoch": 0.83, - "learning_rate": 1.695508910316445e-06, - "loss": 0.73, - "step": 32484 - }, - { - "epoch": 0.83, - "learning_rate": 1.6954890283456417e-06, - "loss": 0.6985, - "step": 32485 - }, - { - "epoch": 0.83, - "learning_rate": 1.6954691458423346e-06, - "loss": 0.8955, - "step": 32486 - }, - { - "epoch": 0.83, - "learning_rate": 1.6954492628065385e-06, - "loss": 0.7969, - "step": 32487 - }, - { - "epoch": 0.83, - "learning_rate": 1.695429379238269e-06, - "loss": 0.7515, - "step": 32488 - }, - { - "epoch": 0.83, - "learning_rate": 1.6954094951375411e-06, - "loss": 0.8447, - "step": 32489 - }, - { - "epoch": 0.83, - "learning_rate": 1.6953896105043701e-06, - "loss": 1.0205, - "step": 32490 - }, - { - "epoch": 0.83, - "learning_rate": 1.6953697253387715e-06, - "loss": 0.8423, - "step": 32491 - }, - { - "epoch": 0.83, - "learning_rate": 1.6953498396407603e-06, - "loss": 0.8643, - "step": 32492 - }, - { - "epoch": 0.83, - "learning_rate": 1.6953299534103513e-06, - "loss": 0.7881, - "step": 32493 - }, - { - "epoch": 0.83, - "learning_rate": 1.6953100666475605e-06, - "loss": 0.8828, - "step": 32494 - }, - { - "epoch": 0.83, - "learning_rate": 1.6952901793524025e-06, - "loss": 0.8262, - "step": 32495 - }, - { - "epoch": 0.83, - "learning_rate": 1.6952702915248928e-06, - "loss": 0.8726, - "step": 32496 - }, - { - "epoch": 0.83, - "learning_rate": 1.6952504031650468e-06, - "loss": 0.6685, - "step": 32497 - }, - { - "epoch": 0.83, - "learning_rate": 1.6952305142728793e-06, - "loss": 0.9209, - "step": 32498 - }, - { - "epoch": 0.83, - "learning_rate": 1.695210624848406e-06, - "loss": 0.8359, - "step": 32499 - }, - { - "epoch": 0.83, - "learning_rate": 1.6951907348916419e-06, - "loss": 0.8029, - "step": 32500 - }, - { - "epoch": 0.83, - "learning_rate": 1.695170844402602e-06, - "loss": 0.877, - "step": 32501 - }, - { - "epoch": 0.83, - "learning_rate": 1.695150953381302e-06, - "loss": 0.5042, - "step": 32502 - }, - { - "epoch": 0.83, - "learning_rate": 1.6951310618277566e-06, - "loss": 0.9033, - "step": 32503 - }, - { - "epoch": 0.83, - "learning_rate": 1.6951111697419816e-06, - "loss": 0.6904, - "step": 32504 - }, - { - "epoch": 0.83, - "learning_rate": 1.6950912771239917e-06, - "loss": 0.6943, - "step": 32505 - }, - { - "epoch": 0.83, - "learning_rate": 1.6950713839738024e-06, - "loss": 0.7197, - "step": 32506 - }, - { - "epoch": 0.83, - "learning_rate": 1.695051490291429e-06, - "loss": 0.6885, - "step": 32507 - }, - { - "epoch": 0.83, - "learning_rate": 1.6950315960768866e-06, - "loss": 0.7842, - "step": 32508 - }, - { - "epoch": 0.83, - "learning_rate": 1.6950117013301902e-06, - "loss": 0.9268, - "step": 32509 - }, - { - "epoch": 0.83, - "learning_rate": 1.6949918060513558e-06, - "loss": 0.7417, - "step": 32510 - }, - { - "epoch": 0.83, - "learning_rate": 1.694971910240398e-06, - "loss": 0.9336, - "step": 32511 - }, - { - "epoch": 0.83, - "learning_rate": 1.6949520138973318e-06, - "loss": 0.9326, - "step": 32512 - }, - { - "epoch": 0.83, - "learning_rate": 1.694932117022173e-06, - "loss": 0.5508, - "step": 32513 - }, - { - "epoch": 0.83, - "learning_rate": 1.6949122196149368e-06, - "loss": 0.5701, - "step": 32514 - }, - { - "epoch": 0.83, - "learning_rate": 1.6948923216756382e-06, - "loss": 1.0352, - "step": 32515 - }, - { - "epoch": 0.83, - "learning_rate": 1.6948724232042924e-06, - "loss": 1.0107, - "step": 32516 - }, - { - "epoch": 0.83, - "learning_rate": 1.6948525242009147e-06, - "loss": 0.8193, - "step": 32517 - }, - { - "epoch": 0.83, - "learning_rate": 1.6948326246655204e-06, - "loss": 0.7593, - "step": 32518 - }, - { - "epoch": 0.83, - "learning_rate": 1.6948127245981247e-06, - "loss": 0.96, - "step": 32519 - }, - { - "epoch": 0.83, - "learning_rate": 1.694792823998743e-06, - "loss": 0.9023, - "step": 32520 - }, - { - "epoch": 0.83, - "learning_rate": 1.6947729228673904e-06, - "loss": 0.5811, - "step": 32521 - }, - { - "epoch": 0.83, - "learning_rate": 1.694753021204082e-06, - "loss": 0.7451, - "step": 32522 - }, - { - "epoch": 0.83, - "learning_rate": 1.6947331190088333e-06, - "loss": 0.751, - "step": 32523 - }, - { - "epoch": 0.83, - "learning_rate": 1.6947132162816591e-06, - "loss": 0.8633, - "step": 32524 - }, - { - "epoch": 0.83, - "learning_rate": 1.6946933130225752e-06, - "loss": 1.0264, - "step": 32525 - }, - { - "epoch": 0.83, - "learning_rate": 1.6946734092315964e-06, - "loss": 0.7637, - "step": 32526 - }, - { - "epoch": 0.83, - "learning_rate": 1.6946535049087382e-06, - "loss": 1.0039, - "step": 32527 - }, - { - "epoch": 0.83, - "learning_rate": 1.6946336000540159e-06, - "loss": 0.7178, - "step": 32528 - }, - { - "epoch": 0.83, - "learning_rate": 1.6946136946674443e-06, - "loss": 0.8848, - "step": 32529 - }, - { - "epoch": 0.83, - "learning_rate": 1.694593788749039e-06, - "loss": 0.8594, - "step": 32530 - }, - { - "epoch": 0.83, - "learning_rate": 1.6945738822988152e-06, - "loss": 0.6758, - "step": 32531 - }, - { - "epoch": 0.83, - "learning_rate": 1.694553975316788e-06, - "loss": 0.8647, - "step": 32532 - }, - { - "epoch": 0.83, - "learning_rate": 1.6945340678029729e-06, - "loss": 1.0186, - "step": 32533 - }, - { - "epoch": 0.83, - "learning_rate": 1.6945141597573851e-06, - "loss": 0.8086, - "step": 32534 - }, - { - "epoch": 0.83, - "learning_rate": 1.6944942511800394e-06, - "loss": 0.9277, - "step": 32535 - }, - { - "epoch": 0.83, - "learning_rate": 1.694474342070952e-06, - "loss": 0.7588, - "step": 32536 - }, - { - "epoch": 0.83, - "learning_rate": 1.6944544324301372e-06, - "loss": 1.0303, - "step": 32537 - }, - { - "epoch": 0.83, - "learning_rate": 1.6944345222576104e-06, - "loss": 0.915, - "step": 32538 - }, - { - "epoch": 0.83, - "learning_rate": 1.6944146115533872e-06, - "loss": 0.6445, - "step": 32539 - }, - { - "epoch": 0.83, - "learning_rate": 1.6943947003174826e-06, - "loss": 0.6758, - "step": 32540 - }, - { - "epoch": 0.83, - "learning_rate": 1.6943747885499118e-06, - "loss": 0.749, - "step": 32541 - }, - { - "epoch": 0.83, - "learning_rate": 1.6943548762506904e-06, - "loss": 0.7026, - "step": 32542 - }, - { - "epoch": 0.83, - "learning_rate": 1.6943349634198333e-06, - "loss": 0.8047, - "step": 32543 - }, - { - "epoch": 0.83, - "learning_rate": 1.6943150500573558e-06, - "loss": 0.7705, - "step": 32544 - }, - { - "epoch": 0.83, - "learning_rate": 1.6942951361632732e-06, - "loss": 0.8511, - "step": 32545 - }, - { - "epoch": 0.83, - "learning_rate": 1.6942752217376008e-06, - "loss": 0.8447, - "step": 32546 - }, - { - "epoch": 0.83, - "learning_rate": 1.6942553067803538e-06, - "loss": 0.6807, - "step": 32547 - }, - { - "epoch": 0.83, - "learning_rate": 1.6942353912915474e-06, - "loss": 0.8936, - "step": 32548 - }, - { - "epoch": 0.83, - "learning_rate": 1.6942154752711968e-06, - "loss": 0.874, - "step": 32549 - }, - { - "epoch": 0.83, - "learning_rate": 1.6941955587193173e-06, - "loss": 0.8142, - "step": 32550 - }, - { - "epoch": 0.83, - "learning_rate": 1.6941756416359242e-06, - "loss": 0.8174, - "step": 32551 - }, - { - "epoch": 0.83, - "learning_rate": 1.6941557240210328e-06, - "loss": 0.8535, - "step": 32552 - }, - { - "epoch": 0.83, - "learning_rate": 1.6941358058746583e-06, - "loss": 0.9795, - "step": 32553 - }, - { - "epoch": 0.83, - "learning_rate": 1.6941158871968159e-06, - "loss": 0.8047, - "step": 32554 - }, - { - "epoch": 0.83, - "learning_rate": 1.694095967987521e-06, - "loss": 0.8359, - "step": 32555 - }, - { - "epoch": 0.83, - "learning_rate": 1.6940760482467887e-06, - "loss": 0.9775, - "step": 32556 - }, - { - "epoch": 0.83, - "learning_rate": 1.6940561279746342e-06, - "loss": 0.8145, - "step": 32557 - }, - { - "epoch": 0.83, - "learning_rate": 1.6940362071710729e-06, - "loss": 0.8857, - "step": 32558 - }, - { - "epoch": 0.83, - "learning_rate": 1.6940162858361195e-06, - "loss": 0.8945, - "step": 32559 - }, - { - "epoch": 0.83, - "learning_rate": 1.6939963639697903e-06, - "loss": 0.793, - "step": 32560 - }, - { - "epoch": 0.83, - "learning_rate": 1.6939764415720998e-06, - "loss": 0.8169, - "step": 32561 - }, - { - "epoch": 0.83, - "learning_rate": 1.6939565186430636e-06, - "loss": 0.9189, - "step": 32562 - }, - { - "epoch": 0.83, - "learning_rate": 1.6939365951826966e-06, - "loss": 0.752, - "step": 32563 - }, - { - "epoch": 0.83, - "learning_rate": 1.6939166711910144e-06, - "loss": 0.8604, - "step": 32564 - }, - { - "epoch": 0.83, - "learning_rate": 1.6938967466680323e-06, - "loss": 0.959, - "step": 32565 - }, - { - "epoch": 0.83, - "learning_rate": 1.6938768216137648e-06, - "loss": 0.8018, - "step": 32566 - }, - { - "epoch": 0.83, - "learning_rate": 1.6938568960282286e-06, - "loss": 0.7383, - "step": 32567 - }, - { - "epoch": 0.83, - "learning_rate": 1.6938369699114375e-06, - "loss": 0.8379, - "step": 32568 - }, - { - "epoch": 0.83, - "learning_rate": 1.6938170432634072e-06, - "loss": 0.7842, - "step": 32569 - }, - { - "epoch": 0.83, - "learning_rate": 1.6937971160841533e-06, - "loss": 0.9688, - "step": 32570 - }, - { - "epoch": 0.83, - "learning_rate": 1.6937771883736906e-06, - "loss": 0.9102, - "step": 32571 - }, - { - "epoch": 0.83, - "learning_rate": 1.693757260132035e-06, - "loss": 0.8286, - "step": 32572 - }, - { - "epoch": 0.83, - "learning_rate": 1.6937373313592015e-06, - "loss": 0.7295, - "step": 32573 - }, - { - "epoch": 0.83, - "learning_rate": 1.6937174020552047e-06, - "loss": 0.8594, - "step": 32574 - }, - { - "epoch": 0.83, - "learning_rate": 1.6936974722200606e-06, - "loss": 1.043, - "step": 32575 - }, - { - "epoch": 0.83, - "learning_rate": 1.6936775418537842e-06, - "loss": 0.874, - "step": 32576 - }, - { - "epoch": 0.83, - "learning_rate": 1.693657610956391e-06, - "loss": 0.7769, - "step": 32577 - }, - { - "epoch": 0.83, - "learning_rate": 1.6936376795278959e-06, - "loss": 0.7236, - "step": 32578 - }, - { - "epoch": 0.84, - "learning_rate": 1.6936177475683143e-06, - "loss": 0.8418, - "step": 32579 - }, - { - "epoch": 0.84, - "learning_rate": 1.6935978150776613e-06, - "loss": 0.876, - "step": 32580 - }, - { - "epoch": 0.84, - "learning_rate": 1.6935778820559527e-06, - "loss": 0.8398, - "step": 32581 - }, - { - "epoch": 0.84, - "learning_rate": 1.6935579485032035e-06, - "loss": 0.8818, - "step": 32582 - }, - { - "epoch": 0.84, - "learning_rate": 1.6935380144194285e-06, - "loss": 0.8472, - "step": 32583 - }, - { - "epoch": 0.84, - "learning_rate": 1.6935180798046434e-06, - "loss": 0.9492, - "step": 32584 - }, - { - "epoch": 0.84, - "learning_rate": 1.6934981446588635e-06, - "loss": 0.9355, - "step": 32585 - }, - { - "epoch": 0.84, - "learning_rate": 1.693478208982104e-06, - "loss": 0.9341, - "step": 32586 - }, - { - "epoch": 0.84, - "learning_rate": 1.69345827277438e-06, - "loss": 0.6836, - "step": 32587 - }, - { - "epoch": 0.84, - "learning_rate": 1.6934383360357072e-06, - "loss": 0.9756, - "step": 32588 - }, - { - "epoch": 0.84, - "learning_rate": 1.6934183987661002e-06, - "loss": 0.8457, - "step": 32589 - }, - { - "epoch": 0.84, - "learning_rate": 1.6933984609655747e-06, - "loss": 0.793, - "step": 32590 - }, - { - "epoch": 0.84, - "learning_rate": 1.6933785226341458e-06, - "loss": 0.7036, - "step": 32591 - }, - { - "epoch": 0.84, - "learning_rate": 1.6933585837718289e-06, - "loss": 0.7363, - "step": 32592 - }, - { - "epoch": 0.84, - "learning_rate": 1.6933386443786396e-06, - "loss": 0.8477, - "step": 32593 - }, - { - "epoch": 0.84, - "learning_rate": 1.693318704454592e-06, - "loss": 1.0586, - "step": 32594 - }, - { - "epoch": 0.84, - "learning_rate": 1.6932987639997028e-06, - "loss": 0.5798, - "step": 32595 - }, - { - "epoch": 0.84, - "learning_rate": 1.6932788230139863e-06, - "loss": 0.9023, - "step": 32596 - }, - { - "epoch": 0.84, - "learning_rate": 1.6932588814974582e-06, - "loss": 1.0205, - "step": 32597 - }, - { - "epoch": 0.84, - "learning_rate": 1.6932389394501337e-06, - "loss": 0.6011, - "step": 32598 - }, - { - "epoch": 0.84, - "learning_rate": 1.6932189968720279e-06, - "loss": 0.6641, - "step": 32599 - }, - { - "epoch": 0.84, - "learning_rate": 1.6931990537631564e-06, - "loss": 0.8779, - "step": 32600 - }, - { - "epoch": 0.84, - "learning_rate": 1.693179110123534e-06, - "loss": 0.8223, - "step": 32601 - }, - { - "epoch": 0.84, - "learning_rate": 1.6931591659531763e-06, - "loss": 0.7847, - "step": 32602 - }, - { - "epoch": 0.84, - "learning_rate": 1.6931392212520986e-06, - "loss": 0.8242, - "step": 32603 - }, - { - "epoch": 0.84, - "learning_rate": 1.6931192760203159e-06, - "loss": 0.6538, - "step": 32604 - }, - { - "epoch": 0.84, - "learning_rate": 1.6930993302578439e-06, - "loss": 1.0166, - "step": 32605 - }, - { - "epoch": 0.84, - "learning_rate": 1.6930793839646973e-06, - "loss": 0.7764, - "step": 32606 - }, - { - "epoch": 0.84, - "learning_rate": 1.6930594371408917e-06, - "loss": 0.8213, - "step": 32607 - }, - { - "epoch": 0.84, - "learning_rate": 1.6930394897864427e-06, - "loss": 1.0322, - "step": 32608 - }, - { - "epoch": 0.84, - "learning_rate": 1.693019541901365e-06, - "loss": 1.2217, - "step": 32609 - }, - { - "epoch": 0.84, - "learning_rate": 1.692999593485674e-06, - "loss": 0.7891, - "step": 32610 - }, - { - "epoch": 0.84, - "learning_rate": 1.692979644539385e-06, - "loss": 0.8867, - "step": 32611 - }, - { - "epoch": 0.84, - "learning_rate": 1.6929596950625137e-06, - "loss": 1.1074, - "step": 32612 - }, - { - "epoch": 0.84, - "learning_rate": 1.692939745055075e-06, - "loss": 0.8477, - "step": 32613 - }, - { - "epoch": 0.84, - "learning_rate": 1.6929197945170841e-06, - "loss": 0.8271, - "step": 32614 - }, - { - "epoch": 0.84, - "learning_rate": 1.6928998434485563e-06, - "loss": 0.9463, - "step": 32615 - }, - { - "epoch": 0.84, - "learning_rate": 1.692879891849507e-06, - "loss": 0.7681, - "step": 32616 - }, - { - "epoch": 0.84, - "learning_rate": 1.6928599397199515e-06, - "loss": 0.6245, - "step": 32617 - }, - { - "epoch": 0.84, - "learning_rate": 1.6928399870599052e-06, - "loss": 0.8633, - "step": 32618 - }, - { - "epoch": 0.84, - "learning_rate": 1.6928200338693826e-06, - "loss": 0.9141, - "step": 32619 - }, - { - "epoch": 0.84, - "learning_rate": 1.6928000801484e-06, - "loss": 0.7495, - "step": 32620 - }, - { - "epoch": 0.84, - "learning_rate": 1.6927801258969718e-06, - "loss": 0.6797, - "step": 32621 - }, - { - "epoch": 0.84, - "learning_rate": 1.6927601711151143e-06, - "loss": 0.9307, - "step": 32622 - }, - { - "epoch": 0.84, - "learning_rate": 1.692740215802842e-06, - "loss": 0.5938, - "step": 32623 - }, - { - "epoch": 0.84, - "learning_rate": 1.6927202599601699e-06, - "loss": 0.7573, - "step": 32624 - }, - { - "epoch": 0.84, - "learning_rate": 1.6927003035871144e-06, - "loss": 0.6396, - "step": 32625 - }, - { - "epoch": 0.84, - "learning_rate": 1.6926803466836896e-06, - "loss": 0.9355, - "step": 32626 - }, - { - "epoch": 0.84, - "learning_rate": 1.6926603892499119e-06, - "loss": 1.0977, - "step": 32627 - }, - { - "epoch": 0.84, - "learning_rate": 1.6926404312857954e-06, - "loss": 0.5513, - "step": 32628 - }, - { - "epoch": 0.84, - "learning_rate": 1.6926204727913562e-06, - "loss": 0.7222, - "step": 32629 - }, - { - "epoch": 0.84, - "learning_rate": 1.6926005137666092e-06, - "loss": 1.1328, - "step": 32630 - }, - { - "epoch": 0.84, - "learning_rate": 1.69258055421157e-06, - "loss": 0.6992, - "step": 32631 - }, - { - "epoch": 0.84, - "learning_rate": 1.692560594126254e-06, - "loss": 1.0674, - "step": 32632 - }, - { - "epoch": 0.84, - "learning_rate": 1.692540633510676e-06, - "loss": 0.7119, - "step": 32633 - }, - { - "epoch": 0.84, - "learning_rate": 1.6925206723648513e-06, - "loss": 0.9014, - "step": 32634 - }, - { - "epoch": 0.84, - "learning_rate": 1.6925007106887955e-06, - "loss": 0.8447, - "step": 32635 - }, - { - "epoch": 0.84, - "learning_rate": 1.6924807484825237e-06, - "loss": 1.0742, - "step": 32636 - }, - { - "epoch": 0.84, - "learning_rate": 1.6924607857460514e-06, - "loss": 0.811, - "step": 32637 - }, - { - "epoch": 0.84, - "learning_rate": 1.6924408224793933e-06, - "loss": 0.8398, - "step": 32638 - }, - { - "epoch": 0.84, - "learning_rate": 1.6924208586825651e-06, - "loss": 0.8789, - "step": 32639 - }, - { - "epoch": 0.84, - "learning_rate": 1.6924008943555825e-06, - "loss": 0.7852, - "step": 32640 - }, - { - "epoch": 0.84, - "learning_rate": 1.6923809294984603e-06, - "loss": 0.6685, - "step": 32641 - }, - { - "epoch": 0.84, - "learning_rate": 1.6923609641112137e-06, - "loss": 0.7725, - "step": 32642 - }, - { - "epoch": 0.84, - "learning_rate": 1.6923409981938583e-06, - "loss": 0.8467, - "step": 32643 - }, - { - "epoch": 0.84, - "learning_rate": 1.692321031746409e-06, - "loss": 0.8252, - "step": 32644 - }, - { - "epoch": 0.84, - "learning_rate": 1.6923010647688818e-06, - "loss": 0.8311, - "step": 32645 - }, - { - "epoch": 0.84, - "learning_rate": 1.692281097261291e-06, - "loss": 1.1221, - "step": 32646 - }, - { - "epoch": 0.84, - "learning_rate": 1.6922611292236527e-06, - "loss": 0.8213, - "step": 32647 - }, - { - "epoch": 0.84, - "learning_rate": 1.6922411606559816e-06, - "loss": 0.9199, - "step": 32648 - }, - { - "epoch": 0.84, - "learning_rate": 1.6922211915582936e-06, - "loss": 0.6226, - "step": 32649 - }, - { - "epoch": 0.84, - "learning_rate": 1.6922012219306035e-06, - "loss": 1.0371, - "step": 32650 - }, - { - "epoch": 0.84, - "learning_rate": 1.6921812517729266e-06, - "loss": 0.8081, - "step": 32651 - }, - { - "epoch": 0.84, - "learning_rate": 1.6921612810852786e-06, - "loss": 0.7993, - "step": 32652 - }, - { - "epoch": 0.84, - "learning_rate": 1.6921413098676744e-06, - "loss": 0.7378, - "step": 32653 - }, - { - "epoch": 0.84, - "learning_rate": 1.6921213381201294e-06, - "loss": 1.001, - "step": 32654 - }, - { - "epoch": 0.84, - "learning_rate": 1.692101365842659e-06, - "loss": 0.835, - "step": 32655 - }, - { - "epoch": 0.84, - "learning_rate": 1.6920813930352785e-06, - "loss": 0.791, - "step": 32656 - }, - { - "epoch": 0.84, - "learning_rate": 1.692061419698003e-06, - "loss": 0.8696, - "step": 32657 - }, - { - "epoch": 0.84, - "learning_rate": 1.6920414458308478e-06, - "loss": 0.7393, - "step": 32658 - }, - { - "epoch": 0.84, - "learning_rate": 1.6920214714338284e-06, - "loss": 1.0811, - "step": 32659 - }, - { - "epoch": 0.84, - "learning_rate": 1.6920014965069598e-06, - "loss": 0.9404, - "step": 32660 - }, - { - "epoch": 0.84, - "learning_rate": 1.6919815210502577e-06, - "loss": 0.4829, - "step": 32661 - }, - { - "epoch": 0.84, - "learning_rate": 1.6919615450637371e-06, - "loss": 0.9502, - "step": 32662 - }, - { - "epoch": 0.84, - "learning_rate": 1.6919415685474135e-06, - "loss": 0.9092, - "step": 32663 - }, - { - "epoch": 0.84, - "learning_rate": 1.6919215915013015e-06, - "loss": 0.8848, - "step": 32664 - }, - { - "epoch": 0.84, - "learning_rate": 1.6919016139254177e-06, - "loss": 0.677, - "step": 32665 - }, - { - "epoch": 0.84, - "learning_rate": 1.6918816358197763e-06, - "loss": 0.8066, - "step": 32666 - }, - { - "epoch": 0.84, - "learning_rate": 1.691861657184393e-06, - "loss": 0.9316, - "step": 32667 - }, - { - "epoch": 0.84, - "learning_rate": 1.6918416780192825e-06, - "loss": 0.7729, - "step": 32668 - }, - { - "epoch": 0.84, - "learning_rate": 1.6918216983244612e-06, - "loss": 0.7424, - "step": 32669 - }, - { - "epoch": 0.84, - "learning_rate": 1.6918017180999437e-06, - "loss": 0.9834, - "step": 32670 - }, - { - "epoch": 0.84, - "learning_rate": 1.6917817373457457e-06, - "loss": 0.8486, - "step": 32671 - }, - { - "epoch": 0.84, - "learning_rate": 1.691761756061882e-06, - "loss": 0.7158, - "step": 32672 - }, - { - "epoch": 0.84, - "learning_rate": 1.6917417742483682e-06, - "loss": 1.0215, - "step": 32673 - }, - { - "epoch": 0.84, - "learning_rate": 1.6917217919052194e-06, - "loss": 0.9209, - "step": 32674 - }, - { - "epoch": 0.84, - "learning_rate": 1.691701809032451e-06, - "loss": 0.8516, - "step": 32675 - }, - { - "epoch": 0.84, - "learning_rate": 1.6916818256300787e-06, - "loss": 0.6421, - "step": 32676 - }, - { - "epoch": 0.84, - "learning_rate": 1.6916618416981171e-06, - "loss": 0.7856, - "step": 32677 - }, - { - "epoch": 0.84, - "learning_rate": 1.6916418572365817e-06, - "loss": 0.833, - "step": 32678 - }, - { - "epoch": 0.84, - "learning_rate": 1.6916218722454883e-06, - "loss": 0.6514, - "step": 32679 - }, - { - "epoch": 0.84, - "learning_rate": 1.6916018867248515e-06, - "loss": 1.0576, - "step": 32680 - }, - { - "epoch": 0.84, - "learning_rate": 1.6915819006746874e-06, - "loss": 1.0625, - "step": 32681 - }, - { - "epoch": 0.84, - "learning_rate": 1.6915619140950106e-06, - "loss": 0.6445, - "step": 32682 - }, - { - "epoch": 0.84, - "learning_rate": 1.6915419269858365e-06, - "loss": 0.7544, - "step": 32683 - }, - { - "epoch": 0.84, - "learning_rate": 1.6915219393471807e-06, - "loss": 0.8557, - "step": 32684 - }, - { - "epoch": 0.84, - "learning_rate": 1.6915019511790583e-06, - "loss": 0.5503, - "step": 32685 - }, - { - "epoch": 0.84, - "learning_rate": 1.6914819624814847e-06, - "loss": 0.7061, - "step": 32686 - }, - { - "epoch": 0.84, - "learning_rate": 1.691461973254475e-06, - "loss": 0.7959, - "step": 32687 - }, - { - "epoch": 0.84, - "learning_rate": 1.6914419834980447e-06, - "loss": 0.8188, - "step": 32688 - }, - { - "epoch": 0.84, - "learning_rate": 1.6914219932122091e-06, - "loss": 0.7051, - "step": 32689 - }, - { - "epoch": 0.84, - "learning_rate": 1.6914020023969835e-06, - "loss": 0.7407, - "step": 32690 - }, - { - "epoch": 0.84, - "learning_rate": 1.6913820110523834e-06, - "loss": 0.9854, - "step": 32691 - }, - { - "epoch": 0.84, - "learning_rate": 1.6913620191784235e-06, - "loss": 0.8574, - "step": 32692 - }, - { - "epoch": 0.84, - "learning_rate": 1.6913420267751194e-06, - "loss": 0.8633, - "step": 32693 - }, - { - "epoch": 0.84, - "learning_rate": 1.691322033842487e-06, - "loss": 0.9883, - "step": 32694 - }, - { - "epoch": 0.84, - "learning_rate": 1.6913020403805408e-06, - "loss": 0.668, - "step": 32695 - }, - { - "epoch": 0.84, - "learning_rate": 1.6912820463892964e-06, - "loss": 0.6665, - "step": 32696 - }, - { - "epoch": 0.84, - "learning_rate": 1.6912620518687692e-06, - "loss": 0.8506, - "step": 32697 - }, - { - "epoch": 0.84, - "learning_rate": 1.6912420568189744e-06, - "loss": 0.8237, - "step": 32698 - }, - { - "epoch": 0.84, - "learning_rate": 1.6912220612399275e-06, - "loss": 0.9629, - "step": 32699 - }, - { - "epoch": 0.84, - "learning_rate": 1.6912020651316435e-06, - "loss": 0.8994, - "step": 32700 - }, - { - "epoch": 0.84, - "learning_rate": 1.6911820684941378e-06, - "loss": 0.6746, - "step": 32701 - }, - { - "epoch": 0.84, - "learning_rate": 1.691162071327426e-06, - "loss": 1.001, - "step": 32702 - }, - { - "epoch": 0.84, - "learning_rate": 1.691142073631523e-06, - "loss": 0.8535, - "step": 32703 - }, - { - "epoch": 0.84, - "learning_rate": 1.6911220754064442e-06, - "loss": 0.7261, - "step": 32704 - }, - { - "epoch": 0.84, - "learning_rate": 1.6911020766522051e-06, - "loss": 0.8379, - "step": 32705 - }, - { - "epoch": 0.84, - "learning_rate": 1.6910820773688211e-06, - "loss": 0.9697, - "step": 32706 - }, - { - "epoch": 0.84, - "learning_rate": 1.691062077556307e-06, - "loss": 0.8252, - "step": 32707 - }, - { - "epoch": 0.84, - "learning_rate": 1.6910420772146786e-06, - "loss": 0.7197, - "step": 32708 - }, - { - "epoch": 0.84, - "learning_rate": 1.691022076343951e-06, - "loss": 0.7344, - "step": 32709 - }, - { - "epoch": 0.84, - "learning_rate": 1.6910020749441399e-06, - "loss": 0.7603, - "step": 32710 - }, - { - "epoch": 0.84, - "learning_rate": 1.69098207301526e-06, - "loss": 0.9014, - "step": 32711 - }, - { - "epoch": 0.84, - "learning_rate": 1.690962070557327e-06, - "loss": 0.8418, - "step": 32712 - }, - { - "epoch": 0.84, - "learning_rate": 1.6909420675703558e-06, - "loss": 0.8428, - "step": 32713 - }, - { - "epoch": 0.84, - "learning_rate": 1.6909220640543621e-06, - "loss": 0.8369, - "step": 32714 - }, - { - "epoch": 0.84, - "learning_rate": 1.6909020600093614e-06, - "loss": 0.8701, - "step": 32715 - }, - { - "epoch": 0.84, - "learning_rate": 1.6908820554353688e-06, - "loss": 1.0547, - "step": 32716 - }, - { - "epoch": 0.84, - "learning_rate": 1.6908620503323996e-06, - "loss": 0.6548, - "step": 32717 - }, - { - "epoch": 0.84, - "learning_rate": 1.690842044700469e-06, - "loss": 0.7949, - "step": 32718 - }, - { - "epoch": 0.84, - "learning_rate": 1.6908220385395923e-06, - "loss": 0.8369, - "step": 32719 - }, - { - "epoch": 0.84, - "learning_rate": 1.6908020318497848e-06, - "loss": 0.9326, - "step": 32720 - }, - { - "epoch": 0.84, - "learning_rate": 1.6907820246310624e-06, - "loss": 0.6157, - "step": 32721 - }, - { - "epoch": 0.84, - "learning_rate": 1.6907620168834397e-06, - "loss": 0.8066, - "step": 32722 - }, - { - "epoch": 0.84, - "learning_rate": 1.6907420086069322e-06, - "loss": 0.8926, - "step": 32723 - }, - { - "epoch": 0.84, - "learning_rate": 1.6907219998015554e-06, - "loss": 0.9893, - "step": 32724 - }, - { - "epoch": 0.84, - "learning_rate": 1.6907019904673244e-06, - "loss": 0.7612, - "step": 32725 - }, - { - "epoch": 0.84, - "learning_rate": 1.690681980604255e-06, - "loss": 0.9502, - "step": 32726 - }, - { - "epoch": 0.84, - "learning_rate": 1.6906619702123618e-06, - "loss": 0.8428, - "step": 32727 - }, - { - "epoch": 0.84, - "learning_rate": 1.6906419592916606e-06, - "loss": 0.8506, - "step": 32728 - }, - { - "epoch": 0.84, - "learning_rate": 1.6906219478421666e-06, - "loss": 1.0342, - "step": 32729 - }, - { - "epoch": 0.84, - "learning_rate": 1.6906019358638951e-06, - "loss": 0.9082, - "step": 32730 - }, - { - "epoch": 0.84, - "learning_rate": 1.6905819233568617e-06, - "loss": 0.6787, - "step": 32731 - }, - { - "epoch": 0.84, - "learning_rate": 1.6905619103210812e-06, - "loss": 0.9209, - "step": 32732 - }, - { - "epoch": 0.84, - "learning_rate": 1.6905418967565693e-06, - "loss": 0.9453, - "step": 32733 - }, - { - "epoch": 0.84, - "learning_rate": 1.690521882663341e-06, - "loss": 0.9717, - "step": 32734 - }, - { - "epoch": 0.84, - "learning_rate": 1.6905018680414122e-06, - "loss": 0.959, - "step": 32735 - }, - { - "epoch": 0.84, - "learning_rate": 1.6904818528907978e-06, - "loss": 0.5698, - "step": 32736 - }, - { - "epoch": 0.84, - "learning_rate": 1.6904618372115131e-06, - "loss": 0.832, - "step": 32737 - }, - { - "epoch": 0.84, - "learning_rate": 1.6904418210035733e-06, - "loss": 0.541, - "step": 32738 - }, - { - "epoch": 0.84, - "learning_rate": 1.6904218042669944e-06, - "loss": 0.79, - "step": 32739 - }, - { - "epoch": 0.84, - "learning_rate": 1.690401787001791e-06, - "loss": 0.9102, - "step": 32740 - }, - { - "epoch": 0.84, - "learning_rate": 1.690381769207979e-06, - "loss": 0.9531, - "step": 32741 - }, - { - "epoch": 0.84, - "learning_rate": 1.690361750885573e-06, - "loss": 0.8096, - "step": 32742 - }, - { - "epoch": 0.84, - "learning_rate": 1.690341732034589e-06, - "loss": 0.9004, - "step": 32743 - }, - { - "epoch": 0.84, - "learning_rate": 1.690321712655042e-06, - "loss": 1.1875, - "step": 32744 - }, - { - "epoch": 0.84, - "learning_rate": 1.690301692746947e-06, - "loss": 0.9346, - "step": 32745 - }, - { - "epoch": 0.84, - "learning_rate": 1.6902816723103206e-06, - "loss": 0.6777, - "step": 32746 - }, - { - "epoch": 0.84, - "learning_rate": 1.6902616513451768e-06, - "loss": 0.6724, - "step": 32747 - }, - { - "epoch": 0.84, - "learning_rate": 1.6902416298515312e-06, - "loss": 0.832, - "step": 32748 - }, - { - "epoch": 0.84, - "learning_rate": 1.6902216078293997e-06, - "loss": 0.9062, - "step": 32749 - }, - { - "epoch": 0.84, - "learning_rate": 1.690201585278797e-06, - "loss": 0.9248, - "step": 32750 - }, - { - "epoch": 0.84, - "learning_rate": 1.6901815621997388e-06, - "loss": 0.9785, - "step": 32751 - }, - { - "epoch": 0.84, - "learning_rate": 1.6901615385922403e-06, - "loss": 0.6389, - "step": 32752 - }, - { - "epoch": 0.84, - "learning_rate": 1.6901415144563167e-06, - "loss": 0.6914, - "step": 32753 - }, - { - "epoch": 0.84, - "learning_rate": 1.6901214897919837e-06, - "loss": 0.5713, - "step": 32754 - }, - { - "epoch": 0.84, - "learning_rate": 1.6901014645992563e-06, - "loss": 0.7368, - "step": 32755 - }, - { - "epoch": 0.84, - "learning_rate": 1.69008143887815e-06, - "loss": 0.813, - "step": 32756 - }, - { - "epoch": 0.84, - "learning_rate": 1.6900614126286798e-06, - "loss": 0.8262, - "step": 32757 - }, - { - "epoch": 0.84, - "learning_rate": 1.6900413858508615e-06, - "loss": 0.7095, - "step": 32758 - }, - { - "epoch": 0.84, - "learning_rate": 1.6900213585447103e-06, - "loss": 1.1133, - "step": 32759 - }, - { - "epoch": 0.84, - "learning_rate": 1.6900013307102414e-06, - "loss": 0.9297, - "step": 32760 - }, - { - "epoch": 0.84, - "learning_rate": 1.6899813023474706e-06, - "loss": 0.8818, - "step": 32761 - }, - { - "epoch": 0.84, - "learning_rate": 1.6899612734564122e-06, - "loss": 0.7549, - "step": 32762 - }, - { - "epoch": 0.84, - "learning_rate": 1.6899412440370825e-06, - "loss": 0.8662, - "step": 32763 - }, - { - "epoch": 0.84, - "learning_rate": 1.6899212140894962e-06, - "loss": 0.6445, - "step": 32764 - }, - { - "epoch": 0.84, - "learning_rate": 1.6899011836136693e-06, - "loss": 0.8975, - "step": 32765 - }, - { - "epoch": 0.84, - "learning_rate": 1.689881152609617e-06, - "loss": 0.8535, - "step": 32766 - }, - { - "epoch": 0.84, - "learning_rate": 1.6898611210773538e-06, - "loss": 0.9395, - "step": 32767 - }, - { - "epoch": 0.84, - "learning_rate": 1.6898410890168962e-06, - "loss": 0.7998, - "step": 32768 - }, - { - "epoch": 0.84, - "learning_rate": 1.6898210564282586e-06, - "loss": 0.6821, - "step": 32769 - }, - { - "epoch": 0.84, - "learning_rate": 1.689801023311457e-06, - "loss": 0.5591, - "step": 32770 - }, - { - "epoch": 0.84, - "learning_rate": 1.6897809896665068e-06, - "loss": 0.876, - "step": 32771 - }, - { - "epoch": 0.84, - "learning_rate": 1.6897609554934221e-06, - "loss": 0.7334, - "step": 32772 - }, - { - "epoch": 0.84, - "learning_rate": 1.6897409207922198e-06, - "loss": 0.9072, - "step": 32773 - }, - { - "epoch": 0.84, - "learning_rate": 1.6897208855629145e-06, - "loss": 0.8491, - "step": 32774 - }, - { - "epoch": 0.84, - "learning_rate": 1.6897008498055217e-06, - "loss": 0.9688, - "step": 32775 - }, - { - "epoch": 0.84, - "learning_rate": 1.6896808135200567e-06, - "loss": 0.7336, - "step": 32776 - }, - { - "epoch": 0.84, - "learning_rate": 1.6896607767065344e-06, - "loss": 0.7573, - "step": 32777 - }, - { - "epoch": 0.84, - "learning_rate": 1.6896407393649708e-06, - "loss": 1.1504, - "step": 32778 - }, - { - "epoch": 0.84, - "learning_rate": 1.6896207014953812e-06, - "loss": 0.8164, - "step": 32779 - }, - { - "epoch": 0.84, - "learning_rate": 1.6896006630977807e-06, - "loss": 0.8149, - "step": 32780 - }, - { - "epoch": 0.84, - "learning_rate": 1.6895806241721843e-06, - "loss": 0.877, - "step": 32781 - }, - { - "epoch": 0.84, - "learning_rate": 1.689560584718608e-06, - "loss": 0.6904, - "step": 32782 - }, - { - "epoch": 0.84, - "learning_rate": 1.6895405447370669e-06, - "loss": 0.8906, - "step": 32783 - }, - { - "epoch": 0.84, - "learning_rate": 1.6895205042275763e-06, - "loss": 0.7686, - "step": 32784 - }, - { - "epoch": 0.84, - "learning_rate": 1.6895004631901512e-06, - "loss": 0.8672, - "step": 32785 - }, - { - "epoch": 0.84, - "learning_rate": 1.689480421624808e-06, - "loss": 0.6331, - "step": 32786 - }, - { - "epoch": 0.84, - "learning_rate": 1.6894603795315606e-06, - "loss": 0.8574, - "step": 32787 - }, - { - "epoch": 0.84, - "learning_rate": 1.6894403369104256e-06, - "loss": 0.6338, - "step": 32788 - }, - { - "epoch": 0.84, - "learning_rate": 1.6894202937614177e-06, - "loss": 0.667, - "step": 32789 - }, - { - "epoch": 0.84, - "learning_rate": 1.6894002500845522e-06, - "loss": 0.8154, - "step": 32790 - }, - { - "epoch": 0.84, - "learning_rate": 1.689380205879845e-06, - "loss": 0.8027, - "step": 32791 - }, - { - "epoch": 0.84, - "learning_rate": 1.6893601611473108e-06, - "loss": 0.7673, - "step": 32792 - }, - { - "epoch": 0.84, - "learning_rate": 1.6893401158869653e-06, - "loss": 0.8066, - "step": 32793 - }, - { - "epoch": 0.84, - "learning_rate": 1.6893200700988238e-06, - "loss": 0.6328, - "step": 32794 - }, - { - "epoch": 0.84, - "learning_rate": 1.6893000237829016e-06, - "loss": 0.749, - "step": 32795 - }, - { - "epoch": 0.84, - "learning_rate": 1.689279976939214e-06, - "loss": 0.8584, - "step": 32796 - }, - { - "epoch": 0.84, - "learning_rate": 1.6892599295677762e-06, - "loss": 1.0449, - "step": 32797 - }, - { - "epoch": 0.84, - "learning_rate": 1.6892398816686042e-06, - "loss": 1.1133, - "step": 32798 - }, - { - "epoch": 0.84, - "learning_rate": 1.6892198332417126e-06, - "loss": 0.8936, - "step": 32799 - }, - { - "epoch": 0.84, - "learning_rate": 1.6891997842871172e-06, - "loss": 0.856, - "step": 32800 - }, - { - "epoch": 0.84, - "learning_rate": 1.6891797348048334e-06, - "loss": 0.7666, - "step": 32801 - }, - { - "epoch": 0.84, - "learning_rate": 1.6891596847948762e-06, - "loss": 0.9814, - "step": 32802 - }, - { - "epoch": 0.84, - "learning_rate": 1.6891396342572609e-06, - "loss": 0.8652, - "step": 32803 - }, - { - "epoch": 0.84, - "learning_rate": 1.6891195831920034e-06, - "loss": 0.8926, - "step": 32804 - }, - { - "epoch": 0.84, - "learning_rate": 1.6890995315991186e-06, - "loss": 0.856, - "step": 32805 - }, - { - "epoch": 0.84, - "learning_rate": 1.6890794794786222e-06, - "loss": 0.8374, - "step": 32806 - }, - { - "epoch": 0.84, - "learning_rate": 1.689059426830529e-06, - "loss": 0.9067, - "step": 32807 - }, - { - "epoch": 0.84, - "learning_rate": 1.6890393736548546e-06, - "loss": 0.6797, - "step": 32808 - }, - { - "epoch": 0.84, - "learning_rate": 1.6890193199516146e-06, - "loss": 0.9697, - "step": 32809 - }, - { - "epoch": 0.84, - "learning_rate": 1.688999265720824e-06, - "loss": 0.6309, - "step": 32810 - }, - { - "epoch": 0.84, - "learning_rate": 1.6889792109624988e-06, - "loss": 1.1328, - "step": 32811 - }, - { - "epoch": 0.84, - "learning_rate": 1.6889591556766535e-06, - "loss": 0.6685, - "step": 32812 - }, - { - "epoch": 0.84, - "learning_rate": 1.688939099863304e-06, - "loss": 0.96, - "step": 32813 - }, - { - "epoch": 0.84, - "learning_rate": 1.6889190435224654e-06, - "loss": 0.6001, - "step": 32814 - }, - { - "epoch": 0.84, - "learning_rate": 1.6888989866541533e-06, - "loss": 1.0146, - "step": 32815 - }, - { - "epoch": 0.84, - "learning_rate": 1.688878929258383e-06, - "loss": 1.0586, - "step": 32816 - }, - { - "epoch": 0.84, - "learning_rate": 1.6888588713351697e-06, - "loss": 0.8428, - "step": 32817 - }, - { - "epoch": 0.84, - "learning_rate": 1.6888388128845288e-06, - "loss": 0.9707, - "step": 32818 - }, - { - "epoch": 0.84, - "learning_rate": 1.6888187539064756e-06, - "loss": 0.8301, - "step": 32819 - }, - { - "epoch": 0.84, - "learning_rate": 1.6887986944010258e-06, - "loss": 0.7666, - "step": 32820 - }, - { - "epoch": 0.84, - "learning_rate": 1.6887786343681942e-06, - "loss": 0.9443, - "step": 32821 - }, - { - "epoch": 0.84, - "learning_rate": 1.6887585738079966e-06, - "loss": 0.8281, - "step": 32822 - }, - { - "epoch": 0.84, - "learning_rate": 1.688738512720448e-06, - "loss": 1.0312, - "step": 32823 - }, - { - "epoch": 0.84, - "learning_rate": 1.6887184511055646e-06, - "loss": 0.8008, - "step": 32824 - }, - { - "epoch": 0.84, - "learning_rate": 1.6886983889633605e-06, - "loss": 0.6516, - "step": 32825 - }, - { - "epoch": 0.84, - "learning_rate": 1.6886783262938522e-06, - "loss": 1.0273, - "step": 32826 - }, - { - "epoch": 0.84, - "learning_rate": 1.6886582630970544e-06, - "loss": 0.7251, - "step": 32827 - }, - { - "epoch": 0.84, - "learning_rate": 1.6886381993729825e-06, - "loss": 0.8887, - "step": 32828 - }, - { - "epoch": 0.84, - "learning_rate": 1.6886181351216522e-06, - "loss": 0.6699, - "step": 32829 - }, - { - "epoch": 0.84, - "learning_rate": 1.6885980703430786e-06, - "loss": 0.7305, - "step": 32830 - }, - { - "epoch": 0.84, - "learning_rate": 1.6885780050372772e-06, - "loss": 0.6895, - "step": 32831 - }, - { - "epoch": 0.84, - "learning_rate": 1.688557939204263e-06, - "loss": 1.1113, - "step": 32832 - }, - { - "epoch": 0.84, - "learning_rate": 1.6885378728440518e-06, - "loss": 0.8867, - "step": 32833 - }, - { - "epoch": 0.84, - "learning_rate": 1.688517805956659e-06, - "loss": 0.7852, - "step": 32834 - }, - { - "epoch": 0.84, - "learning_rate": 1.6884977385420992e-06, - "loss": 1.0957, - "step": 32835 - }, - { - "epoch": 0.84, - "learning_rate": 1.6884776706003891e-06, - "loss": 0.793, - "step": 32836 - }, - { - "epoch": 0.84, - "learning_rate": 1.688457602131543e-06, - "loss": 0.96, - "step": 32837 - }, - { - "epoch": 0.84, - "learning_rate": 1.6884375331355764e-06, - "loss": 0.7458, - "step": 32838 - }, - { - "epoch": 0.84, - "learning_rate": 1.6884174636125051e-06, - "loss": 0.4956, - "step": 32839 - }, - { - "epoch": 0.84, - "learning_rate": 1.6883973935623439e-06, - "loss": 0.7754, - "step": 32840 - }, - { - "epoch": 0.84, - "learning_rate": 1.6883773229851087e-06, - "loss": 0.7852, - "step": 32841 - }, - { - "epoch": 0.84, - "learning_rate": 1.6883572518808148e-06, - "loss": 0.7513, - "step": 32842 - }, - { - "epoch": 0.84, - "learning_rate": 1.6883371802494768e-06, - "loss": 0.6484, - "step": 32843 - }, - { - "epoch": 0.84, - "learning_rate": 1.6883171080911111e-06, - "loss": 0.8135, - "step": 32844 - }, - { - "epoch": 0.84, - "learning_rate": 1.6882970354057327e-06, - "loss": 1.0049, - "step": 32845 - }, - { - "epoch": 0.84, - "learning_rate": 1.6882769621933565e-06, - "loss": 0.8623, - "step": 32846 - }, - { - "epoch": 0.84, - "learning_rate": 1.6882568884539987e-06, - "loss": 1.1406, - "step": 32847 - }, - { - "epoch": 0.84, - "learning_rate": 1.6882368141876742e-06, - "loss": 0.8477, - "step": 32848 - }, - { - "epoch": 0.84, - "learning_rate": 1.6882167393943983e-06, - "loss": 0.9629, - "step": 32849 - }, - { - "epoch": 0.84, - "learning_rate": 1.6881966640741865e-06, - "loss": 0.8477, - "step": 32850 - }, - { - "epoch": 0.84, - "learning_rate": 1.6881765882270541e-06, - "loss": 0.8225, - "step": 32851 - }, - { - "epoch": 0.84, - "learning_rate": 1.6881565118530167e-06, - "loss": 0.8418, - "step": 32852 - }, - { - "epoch": 0.84, - "learning_rate": 1.6881364349520894e-06, - "loss": 0.9404, - "step": 32853 - }, - { - "epoch": 0.84, - "learning_rate": 1.6881163575242877e-06, - "loss": 1.1133, - "step": 32854 - }, - { - "epoch": 0.84, - "learning_rate": 1.6880962795696268e-06, - "loss": 0.8408, - "step": 32855 - }, - { - "epoch": 0.84, - "learning_rate": 1.6880762010881227e-06, - "loss": 0.6523, - "step": 32856 - }, - { - "epoch": 0.84, - "learning_rate": 1.6880561220797897e-06, - "loss": 0.8691, - "step": 32857 - }, - { - "epoch": 0.84, - "learning_rate": 1.688036042544644e-06, - "loss": 0.9619, - "step": 32858 - }, - { - "epoch": 0.84, - "learning_rate": 1.6880159624827006e-06, - "loss": 0.854, - "step": 32859 - }, - { - "epoch": 0.84, - "learning_rate": 1.6879958818939753e-06, - "loss": 0.8608, - "step": 32860 - }, - { - "epoch": 0.84, - "learning_rate": 1.6879758007784833e-06, - "loss": 0.8159, - "step": 32861 - }, - { - "epoch": 0.84, - "learning_rate": 1.6879557191362395e-06, - "loss": 0.689, - "step": 32862 - }, - { - "epoch": 0.84, - "learning_rate": 1.6879356369672598e-06, - "loss": 0.9434, - "step": 32863 - }, - { - "epoch": 0.84, - "learning_rate": 1.687915554271559e-06, - "loss": 0.9492, - "step": 32864 - }, - { - "epoch": 0.84, - "learning_rate": 1.6878954710491533e-06, - "loss": 0.7939, - "step": 32865 - }, - { - "epoch": 0.84, - "learning_rate": 1.6878753873000578e-06, - "loss": 0.627, - "step": 32866 - }, - { - "epoch": 0.84, - "learning_rate": 1.6878553030242875e-06, - "loss": 0.8281, - "step": 32867 - }, - { - "epoch": 0.84, - "learning_rate": 1.687835218221858e-06, - "loss": 0.8682, - "step": 32868 - }, - { - "epoch": 0.84, - "learning_rate": 1.6878151328927848e-06, - "loss": 0.8232, - "step": 32869 - }, - { - "epoch": 0.84, - "learning_rate": 1.6877950470370832e-06, - "loss": 0.8723, - "step": 32870 - }, - { - "epoch": 0.84, - "learning_rate": 1.6877749606547687e-06, - "loss": 0.8711, - "step": 32871 - }, - { - "epoch": 0.84, - "learning_rate": 1.687754873745856e-06, - "loss": 0.7817, - "step": 32872 - }, - { - "epoch": 0.84, - "learning_rate": 1.6877347863103615e-06, - "loss": 0.958, - "step": 32873 - }, - { - "epoch": 0.84, - "learning_rate": 1.6877146983482999e-06, - "loss": 0.8174, - "step": 32874 - }, - { - "epoch": 0.84, - "learning_rate": 1.6876946098596868e-06, - "loss": 0.7344, - "step": 32875 - }, - { - "epoch": 0.84, - "learning_rate": 1.6876745208445379e-06, - "loss": 0.8105, - "step": 32876 - }, - { - "epoch": 0.84, - "learning_rate": 1.6876544313028678e-06, - "loss": 0.79, - "step": 32877 - }, - { - "epoch": 0.84, - "learning_rate": 1.6876343412346926e-06, - "loss": 1.0615, - "step": 32878 - }, - { - "epoch": 0.84, - "learning_rate": 1.6876142506400272e-06, - "loss": 0.9375, - "step": 32879 - }, - { - "epoch": 0.84, - "learning_rate": 1.6875941595188871e-06, - "loss": 1.0381, - "step": 32880 - }, - { - "epoch": 0.84, - "learning_rate": 1.6875740678712882e-06, - "loss": 0.7832, - "step": 32881 - }, - { - "epoch": 0.84, - "learning_rate": 1.687553975697245e-06, - "loss": 0.791, - "step": 32882 - }, - { - "epoch": 0.84, - "learning_rate": 1.6875338829967736e-06, - "loss": 0.8457, - "step": 32883 - }, - { - "epoch": 0.84, - "learning_rate": 1.687513789769889e-06, - "loss": 0.6855, - "step": 32884 - }, - { - "epoch": 0.84, - "learning_rate": 1.6874936960166067e-06, - "loss": 0.8247, - "step": 32885 - }, - { - "epoch": 0.84, - "learning_rate": 1.6874736017369422e-06, - "loss": 0.9189, - "step": 32886 - }, - { - "epoch": 0.84, - "learning_rate": 1.6874535069309106e-06, - "loss": 0.7178, - "step": 32887 - }, - { - "epoch": 0.84, - "learning_rate": 1.6874334115985276e-06, - "loss": 0.8477, - "step": 32888 - }, - { - "epoch": 0.84, - "learning_rate": 1.6874133157398084e-06, - "loss": 0.8438, - "step": 32889 - }, - { - "epoch": 0.84, - "learning_rate": 1.6873932193547683e-06, - "loss": 0.8223, - "step": 32890 - }, - { - "epoch": 0.84, - "learning_rate": 1.687373122443423e-06, - "loss": 0.9658, - "step": 32891 - }, - { - "epoch": 0.84, - "learning_rate": 1.6873530250057877e-06, - "loss": 0.8418, - "step": 32892 - }, - { - "epoch": 0.84, - "learning_rate": 1.687332927041878e-06, - "loss": 1.0166, - "step": 32893 - }, - { - "epoch": 0.84, - "learning_rate": 1.6873128285517084e-06, - "loss": 0.8496, - "step": 32894 - }, - { - "epoch": 0.84, - "learning_rate": 1.6872927295352955e-06, - "loss": 0.8174, - "step": 32895 - }, - { - "epoch": 0.84, - "learning_rate": 1.6872726299926543e-06, - "loss": 0.6748, - "step": 32896 - }, - { - "epoch": 0.84, - "learning_rate": 1.6872525299238e-06, - "loss": 0.8047, - "step": 32897 - }, - { - "epoch": 0.84, - "learning_rate": 1.6872324293287474e-06, - "loss": 0.7783, - "step": 32898 - }, - { - "epoch": 0.84, - "learning_rate": 1.6872123282075133e-06, - "loss": 0.7334, - "step": 32899 - }, - { - "epoch": 0.84, - "learning_rate": 1.6871922265601118e-06, - "loss": 0.7119, - "step": 32900 - }, - { - "epoch": 0.84, - "learning_rate": 1.6871721243865592e-06, - "loss": 0.6597, - "step": 32901 - }, - { - "epoch": 0.84, - "learning_rate": 1.6871520216868703e-06, - "loss": 0.8379, - "step": 32902 - }, - { - "epoch": 0.84, - "learning_rate": 1.6871319184610606e-06, - "loss": 0.6753, - "step": 32903 - }, - { - "epoch": 0.84, - "learning_rate": 1.6871118147091457e-06, - "loss": 1.0, - "step": 32904 - }, - { - "epoch": 0.84, - "learning_rate": 1.687091710431141e-06, - "loss": 0.9551, - "step": 32905 - }, - { - "epoch": 0.84, - "learning_rate": 1.6870716056270618e-06, - "loss": 1.1973, - "step": 32906 - }, - { - "epoch": 0.84, - "learning_rate": 1.6870515002969233e-06, - "loss": 0.7393, - "step": 32907 - }, - { - "epoch": 0.84, - "learning_rate": 1.6870313944407407e-06, - "loss": 0.8398, - "step": 32908 - }, - { - "epoch": 0.84, - "learning_rate": 1.6870112880585304e-06, - "loss": 0.6387, - "step": 32909 - }, - { - "epoch": 0.84, - "learning_rate": 1.6869911811503066e-06, - "loss": 0.8613, - "step": 32910 - }, - { - "epoch": 0.84, - "learning_rate": 1.6869710737160856e-06, - "loss": 0.8574, - "step": 32911 - }, - { - "epoch": 0.84, - "learning_rate": 1.6869509657558823e-06, - "loss": 0.9893, - "step": 32912 - }, - { - "epoch": 0.84, - "learning_rate": 1.6869308572697124e-06, - "loss": 0.8926, - "step": 32913 - }, - { - "epoch": 0.84, - "learning_rate": 1.6869107482575911e-06, - "loss": 0.7959, - "step": 32914 - }, - { - "epoch": 0.84, - "learning_rate": 1.6868906387195335e-06, - "loss": 0.9473, - "step": 32915 - }, - { - "epoch": 0.84, - "learning_rate": 1.6868705286555556e-06, - "loss": 0.8304, - "step": 32916 - }, - { - "epoch": 0.84, - "learning_rate": 1.6868504180656724e-06, - "loss": 0.8965, - "step": 32917 - }, - { - "epoch": 0.84, - "learning_rate": 1.6868303069498995e-06, - "loss": 0.9424, - "step": 32918 - }, - { - "epoch": 0.84, - "learning_rate": 1.6868101953082521e-06, - "loss": 1.0, - "step": 32919 - }, - { - "epoch": 0.84, - "learning_rate": 1.686790083140746e-06, - "loss": 0.833, - "step": 32920 - }, - { - "epoch": 0.84, - "learning_rate": 1.686769970447396e-06, - "loss": 0.9629, - "step": 32921 - }, - { - "epoch": 0.84, - "learning_rate": 1.686749857228218e-06, - "loss": 0.6719, - "step": 32922 - }, - { - "epoch": 0.84, - "learning_rate": 1.686729743483227e-06, - "loss": 0.5156, - "step": 32923 - }, - { - "epoch": 0.84, - "learning_rate": 1.686709629212439e-06, - "loss": 0.8965, - "step": 32924 - }, - { - "epoch": 0.84, - "learning_rate": 1.6866895144158686e-06, - "loss": 0.917, - "step": 32925 - }, - { - "epoch": 0.84, - "learning_rate": 1.6866693990935319e-06, - "loss": 0.8877, - "step": 32926 - }, - { - "epoch": 0.84, - "learning_rate": 1.686649283245444e-06, - "loss": 0.8633, - "step": 32927 - }, - { - "epoch": 0.84, - "learning_rate": 1.6866291668716202e-06, - "loss": 0.9434, - "step": 32928 - }, - { - "epoch": 0.84, - "learning_rate": 1.686609049972076e-06, - "loss": 0.8276, - "step": 32929 - }, - { - "epoch": 0.84, - "learning_rate": 1.6865889325468268e-06, - "loss": 0.6685, - "step": 32930 - }, - { - "epoch": 0.84, - "learning_rate": 1.6865688145958881e-06, - "loss": 0.6406, - "step": 32931 - }, - { - "epoch": 0.84, - "learning_rate": 1.6865486961192753e-06, - "loss": 0.6655, - "step": 32932 - }, - { - "epoch": 0.84, - "learning_rate": 1.6865285771170035e-06, - "loss": 0.7617, - "step": 32933 - }, - { - "epoch": 0.84, - "learning_rate": 1.6865084575890887e-06, - "loss": 0.9463, - "step": 32934 - }, - { - "epoch": 0.84, - "learning_rate": 1.6864883375355457e-06, - "loss": 0.8516, - "step": 32935 - }, - { - "epoch": 0.84, - "learning_rate": 1.6864682169563902e-06, - "loss": 0.8828, - "step": 32936 - }, - { - "epoch": 0.84, - "learning_rate": 1.6864480958516371e-06, - "loss": 0.8049, - "step": 32937 - }, - { - "epoch": 0.84, - "learning_rate": 1.6864279742213027e-06, - "loss": 0.8262, - "step": 32938 - }, - { - "epoch": 0.84, - "learning_rate": 1.6864078520654021e-06, - "loss": 0.8213, - "step": 32939 - }, - { - "epoch": 0.84, - "learning_rate": 1.6863877293839504e-06, - "loss": 0.7539, - "step": 32940 - }, - { - "epoch": 0.84, - "learning_rate": 1.6863676061769635e-06, - "loss": 0.7534, - "step": 32941 - }, - { - "epoch": 0.84, - "learning_rate": 1.686347482444456e-06, - "loss": 0.9746, - "step": 32942 - }, - { - "epoch": 0.84, - "learning_rate": 1.6863273581864438e-06, - "loss": 0.8174, - "step": 32943 - }, - { - "epoch": 0.84, - "learning_rate": 1.6863072334029424e-06, - "loss": 0.8125, - "step": 32944 - }, - { - "epoch": 0.84, - "learning_rate": 1.6862871080939674e-06, - "loss": 0.4692, - "step": 32945 - }, - { - "epoch": 0.84, - "learning_rate": 1.6862669822595336e-06, - "loss": 0.9492, - "step": 32946 - }, - { - "epoch": 0.84, - "learning_rate": 1.6862468558996569e-06, - "loss": 0.9443, - "step": 32947 - }, - { - "epoch": 0.84, - "learning_rate": 1.6862267290143525e-06, - "loss": 0.8301, - "step": 32948 - }, - { - "epoch": 0.84, - "learning_rate": 1.6862066016036357e-06, - "loss": 0.9546, - "step": 32949 - }, - { - "epoch": 0.84, - "learning_rate": 1.686186473667522e-06, - "loss": 0.6885, - "step": 32950 - }, - { - "epoch": 0.84, - "learning_rate": 1.6861663452060273e-06, - "loss": 0.8369, - "step": 32951 - }, - { - "epoch": 0.84, - "learning_rate": 1.6861462162191662e-06, - "loss": 0.7227, - "step": 32952 - }, - { - "epoch": 0.84, - "learning_rate": 1.6861260867069547e-06, - "loss": 0.6719, - "step": 32953 - }, - { - "epoch": 0.84, - "learning_rate": 1.6861059566694076e-06, - "loss": 0.7261, - "step": 32954 - }, - { - "epoch": 0.84, - "learning_rate": 1.6860858261065412e-06, - "loss": 0.9727, - "step": 32955 - }, - { - "epoch": 0.84, - "learning_rate": 1.68606569501837e-06, - "loss": 1.0176, - "step": 32956 - }, - { - "epoch": 0.84, - "learning_rate": 1.6860455634049102e-06, - "loss": 0.8096, - "step": 32957 - }, - { - "epoch": 0.84, - "learning_rate": 1.6860254312661768e-06, - "loss": 0.9648, - "step": 32958 - }, - { - "epoch": 0.84, - "learning_rate": 1.6860052986021854e-06, - "loss": 0.9102, - "step": 32959 - }, - { - "epoch": 0.84, - "learning_rate": 1.685985165412951e-06, - "loss": 0.6504, - "step": 32960 - }, - { - "epoch": 0.84, - "learning_rate": 1.6859650316984895e-06, - "loss": 0.8618, - "step": 32961 - }, - { - "epoch": 0.84, - "learning_rate": 1.6859448974588157e-06, - "loss": 0.9023, - "step": 32962 - }, - { - "epoch": 0.84, - "learning_rate": 1.685924762693946e-06, - "loss": 0.7427, - "step": 32963 - }, - { - "epoch": 0.84, - "learning_rate": 1.685904627403895e-06, - "loss": 0.8936, - "step": 32964 - }, - { - "epoch": 0.84, - "learning_rate": 1.6858844915886784e-06, - "loss": 0.7671, - "step": 32965 - }, - { - "epoch": 0.84, - "learning_rate": 1.6858643552483115e-06, - "loss": 0.7935, - "step": 32966 - }, - { - "epoch": 0.84, - "learning_rate": 1.6858442183828099e-06, - "loss": 1.0396, - "step": 32967 - }, - { - "epoch": 0.84, - "learning_rate": 1.6858240809921887e-06, - "loss": 0.5015, - "step": 32968 - }, - { - "epoch": 0.85, - "learning_rate": 1.6858039430764638e-06, - "loss": 0.9209, - "step": 32969 - }, - { - "epoch": 0.85, - "learning_rate": 1.6857838046356503e-06, - "loss": 1.127, - "step": 32970 - }, - { - "epoch": 0.85, - "learning_rate": 1.6857636656697638e-06, - "loss": 0.7959, - "step": 32971 - }, - { - "epoch": 0.85, - "learning_rate": 1.6857435261788192e-06, - "loss": 0.8398, - "step": 32972 - }, - { - "epoch": 0.85, - "learning_rate": 1.6857233861628327e-06, - "loss": 0.9268, - "step": 32973 - }, - { - "epoch": 0.85, - "learning_rate": 1.685703245621819e-06, - "loss": 0.7295, - "step": 32974 - }, - { - "epoch": 0.85, - "learning_rate": 1.6856831045557941e-06, - "loss": 0.8877, - "step": 32975 - }, - { - "epoch": 0.85, - "learning_rate": 1.685662962964773e-06, - "loss": 0.9961, - "step": 32976 - }, - { - "epoch": 0.85, - "learning_rate": 1.6856428208487716e-06, - "loss": 1.0312, - "step": 32977 - }, - { - "epoch": 0.85, - "learning_rate": 1.6856226782078046e-06, - "loss": 0.8877, - "step": 32978 - }, - { - "epoch": 0.85, - "learning_rate": 1.6856025350418883e-06, - "loss": 0.7644, - "step": 32979 - }, - { - "epoch": 0.85, - "learning_rate": 1.6855823913510373e-06, - "loss": 0.7227, - "step": 32980 - }, - { - "epoch": 0.85, - "learning_rate": 1.6855622471352675e-06, - "loss": 0.8848, - "step": 32981 - }, - { - "epoch": 0.85, - "learning_rate": 1.6855421023945944e-06, - "loss": 1.0703, - "step": 32982 - }, - { - "epoch": 0.85, - "learning_rate": 1.685521957129033e-06, - "loss": 0.9648, - "step": 32983 - }, - { - "epoch": 0.85, - "learning_rate": 1.6855018113385988e-06, - "loss": 0.6128, - "step": 32984 - }, - { - "epoch": 0.85, - "learning_rate": 1.6854816650233077e-06, - "loss": 0.9639, - "step": 32985 - }, - { - "epoch": 0.85, - "learning_rate": 1.6854615181831746e-06, - "loss": 1.0244, - "step": 32986 - }, - { - "epoch": 0.85, - "learning_rate": 1.6854413708182153e-06, - "loss": 1.1152, - "step": 32987 - }, - { - "epoch": 0.85, - "learning_rate": 1.685421222928445e-06, - "loss": 0.8672, - "step": 32988 - }, - { - "epoch": 0.85, - "learning_rate": 1.685401074513879e-06, - "loss": 0.7832, - "step": 32989 - }, - { - "epoch": 0.85, - "learning_rate": 1.6853809255745335e-06, - "loss": 0.6543, - "step": 32990 - }, - { - "epoch": 0.85, - "learning_rate": 1.6853607761104226e-06, - "loss": 0.7881, - "step": 32991 - }, - { - "epoch": 0.85, - "learning_rate": 1.685340626121563e-06, - "loss": 0.8008, - "step": 32992 - }, - { - "epoch": 0.85, - "learning_rate": 1.6853204756079694e-06, - "loss": 0.7383, - "step": 32993 - }, - { - "epoch": 0.85, - "learning_rate": 1.6853003245696575e-06, - "loss": 0.9893, - "step": 32994 - }, - { - "epoch": 0.85, - "learning_rate": 1.6852801730066426e-06, - "loss": 0.7168, - "step": 32995 - }, - { - "epoch": 0.85, - "learning_rate": 1.6852600209189403e-06, - "loss": 0.8623, - "step": 32996 - }, - { - "epoch": 0.85, - "learning_rate": 1.6852398683065655e-06, - "loss": 0.9941, - "step": 32997 - }, - { - "epoch": 0.85, - "learning_rate": 1.6852197151695343e-06, - "loss": 0.6924, - "step": 32998 - }, - { - "epoch": 0.85, - "learning_rate": 1.6851995615078619e-06, - "loss": 0.8154, - "step": 32999 - }, - { - "epoch": 0.85, - "learning_rate": 1.6851794073215637e-06, - "loss": 0.7725, - "step": 33000 - }, - { - "epoch": 0.85, - "learning_rate": 1.685159252610655e-06, - "loss": 0.791, - "step": 33001 - }, - { - "epoch": 0.85, - "learning_rate": 1.6851390973751515e-06, - "loss": 0.6465, - "step": 33002 - }, - { - "epoch": 0.85, - "learning_rate": 1.6851189416150687e-06, - "loss": 0.7275, - "step": 33003 - }, - { - "epoch": 0.85, - "learning_rate": 1.6850987853304215e-06, - "loss": 0.7603, - "step": 33004 - }, - { - "epoch": 0.85, - "learning_rate": 1.685078628521226e-06, - "loss": 0.8052, - "step": 33005 - }, - { - "epoch": 0.85, - "learning_rate": 1.6850584711874969e-06, - "loss": 1.1309, - "step": 33006 - }, - { - "epoch": 0.85, - "learning_rate": 1.68503831332925e-06, - "loss": 0.9556, - "step": 33007 - }, - { - "epoch": 0.85, - "learning_rate": 1.6850181549465013e-06, - "loss": 1.0557, - "step": 33008 - }, - { - "epoch": 0.85, - "learning_rate": 1.6849979960392652e-06, - "loss": 0.9238, - "step": 33009 - }, - { - "epoch": 0.85, - "learning_rate": 1.6849778366075577e-06, - "loss": 0.8906, - "step": 33010 - }, - { - "epoch": 0.85, - "learning_rate": 1.6849576766513941e-06, - "loss": 0.8467, - "step": 33011 - }, - { - "epoch": 0.85, - "learning_rate": 1.68493751617079e-06, - "loss": 0.646, - "step": 33012 - }, - { - "epoch": 0.85, - "learning_rate": 1.684917355165761e-06, - "loss": 0.9404, - "step": 33013 - }, - { - "epoch": 0.85, - "learning_rate": 1.6848971936363221e-06, - "loss": 0.8027, - "step": 33014 - }, - { - "epoch": 0.85, - "learning_rate": 1.6848770315824888e-06, - "loss": 0.7627, - "step": 33015 - }, - { - "epoch": 0.85, - "learning_rate": 1.6848568690042768e-06, - "loss": 0.9258, - "step": 33016 - }, - { - "epoch": 0.85, - "learning_rate": 1.6848367059017013e-06, - "loss": 0.8154, - "step": 33017 - }, - { - "epoch": 0.85, - "learning_rate": 1.684816542274778e-06, - "loss": 0.9072, - "step": 33018 - }, - { - "epoch": 0.85, - "learning_rate": 1.6847963781235217e-06, - "loss": 0.9854, - "step": 33019 - }, - { - "epoch": 0.85, - "learning_rate": 1.6847762134479489e-06, - "loss": 0.5991, - "step": 33020 - }, - { - "epoch": 0.85, - "learning_rate": 1.684756048248074e-06, - "loss": 0.7129, - "step": 33021 - }, - { - "epoch": 0.85, - "learning_rate": 1.684735882523913e-06, - "loss": 0.9492, - "step": 33022 - }, - { - "epoch": 0.85, - "learning_rate": 1.6847157162754814e-06, - "loss": 0.6731, - "step": 33023 - }, - { - "epoch": 0.85, - "learning_rate": 1.684695549502794e-06, - "loss": 1.0938, - "step": 33024 - }, - { - "epoch": 0.85, - "learning_rate": 1.6846753822058673e-06, - "loss": 0.7378, - "step": 33025 - }, - { - "epoch": 0.85, - "learning_rate": 1.6846552143847157e-06, - "loss": 0.8301, - "step": 33026 - }, - { - "epoch": 0.85, - "learning_rate": 1.6846350460393553e-06, - "loss": 0.9346, - "step": 33027 - }, - { - "epoch": 0.85, - "learning_rate": 1.6846148771698013e-06, - "loss": 0.9893, - "step": 33028 - }, - { - "epoch": 0.85, - "learning_rate": 1.6845947077760688e-06, - "loss": 0.8042, - "step": 33029 - }, - { - "epoch": 0.85, - "learning_rate": 1.6845745378581744e-06, - "loss": 0.7773, - "step": 33030 - }, - { - "epoch": 0.85, - "learning_rate": 1.684554367416132e-06, - "loss": 0.9111, - "step": 33031 - }, - { - "epoch": 0.85, - "learning_rate": 1.6845341964499582e-06, - "loss": 0.7764, - "step": 33032 - }, - { - "epoch": 0.85, - "learning_rate": 1.684514024959668e-06, - "loss": 0.8506, - "step": 33033 - }, - { - "epoch": 0.85, - "learning_rate": 1.6844938529452766e-06, - "loss": 0.8271, - "step": 33034 - }, - { - "epoch": 0.85, - "learning_rate": 1.6844736804068e-06, - "loss": 0.8682, - "step": 33035 - }, - { - "epoch": 0.85, - "learning_rate": 1.6844535073442534e-06, - "loss": 0.853, - "step": 33036 - }, - { - "epoch": 0.85, - "learning_rate": 1.684433333757652e-06, - "loss": 0.7705, - "step": 33037 - }, - { - "epoch": 0.85, - "learning_rate": 1.6844131596470117e-06, - "loss": 0.9111, - "step": 33038 - }, - { - "epoch": 0.85, - "learning_rate": 1.6843929850123474e-06, - "loss": 1.0742, - "step": 33039 - }, - { - "epoch": 0.85, - "learning_rate": 1.6843728098536754e-06, - "loss": 0.7861, - "step": 33040 - }, - { - "epoch": 0.85, - "learning_rate": 1.6843526341710103e-06, - "loss": 1.1553, - "step": 33041 - }, - { - "epoch": 0.85, - "learning_rate": 1.6843324579643676e-06, - "loss": 0.8789, - "step": 33042 - }, - { - "epoch": 0.85, - "learning_rate": 1.6843122812337634e-06, - "loss": 0.75, - "step": 33043 - }, - { - "epoch": 0.85, - "learning_rate": 1.6842921039792124e-06, - "loss": 0.8799, - "step": 33044 - }, - { - "epoch": 0.85, - "learning_rate": 1.6842719262007309e-06, - "loss": 1.165, - "step": 33045 - }, - { - "epoch": 0.85, - "learning_rate": 1.6842517478983334e-06, - "loss": 0.9961, - "step": 33046 - }, - { - "epoch": 0.85, - "learning_rate": 1.6842315690720359e-06, - "loss": 0.585, - "step": 33047 - }, - { - "epoch": 0.85, - "learning_rate": 1.6842113897218538e-06, - "loss": 0.8301, - "step": 33048 - }, - { - "epoch": 0.85, - "learning_rate": 1.6841912098478024e-06, - "loss": 0.7686, - "step": 33049 - }, - { - "epoch": 0.85, - "learning_rate": 1.6841710294498977e-06, - "loss": 0.9238, - "step": 33050 - }, - { - "epoch": 0.85, - "learning_rate": 1.6841508485281542e-06, - "loss": 0.6978, - "step": 33051 - }, - { - "epoch": 0.85, - "learning_rate": 1.684130667082588e-06, - "loss": 0.9678, - "step": 33052 - }, - { - "epoch": 0.85, - "learning_rate": 1.6841104851132143e-06, - "loss": 0.9258, - "step": 33053 - }, - { - "epoch": 0.85, - "learning_rate": 1.6840903026200487e-06, - "loss": 0.8008, - "step": 33054 - }, - { - "epoch": 0.85, - "learning_rate": 1.6840701196031068e-06, - "loss": 0.8726, - "step": 33055 - }, - { - "epoch": 0.85, - "learning_rate": 1.6840499360624039e-06, - "loss": 0.7959, - "step": 33056 - }, - { - "epoch": 0.85, - "learning_rate": 1.684029751997955e-06, - "loss": 0.8506, - "step": 33057 - }, - { - "epoch": 0.85, - "learning_rate": 1.6840095674097763e-06, - "loss": 0.7681, - "step": 33058 - }, - { - "epoch": 0.85, - "learning_rate": 1.6839893822978828e-06, - "loss": 0.7649, - "step": 33059 - }, - { - "epoch": 0.85, - "learning_rate": 1.6839691966622901e-06, - "loss": 0.8281, - "step": 33060 - }, - { - "epoch": 0.85, - "learning_rate": 1.683949010503014e-06, - "loss": 0.9473, - "step": 33061 - }, - { - "epoch": 0.85, - "learning_rate": 1.683928823820069e-06, - "loss": 0.9902, - "step": 33062 - }, - { - "epoch": 0.85, - "learning_rate": 1.6839086366134713e-06, - "loss": 0.7407, - "step": 33063 - }, - { - "epoch": 0.85, - "learning_rate": 1.6838884488832363e-06, - "loss": 0.8203, - "step": 33064 - }, - { - "epoch": 0.85, - "learning_rate": 1.6838682606293797e-06, - "loss": 0.9014, - "step": 33065 - }, - { - "epoch": 0.85, - "learning_rate": 1.6838480718519162e-06, - "loss": 0.793, - "step": 33066 - }, - { - "epoch": 0.85, - "learning_rate": 1.6838278825508615e-06, - "loss": 0.7197, - "step": 33067 - }, - { - "epoch": 0.85, - "learning_rate": 1.6838076927262317e-06, - "loss": 0.6079, - "step": 33068 - }, - { - "epoch": 0.85, - "learning_rate": 1.6837875023780415e-06, - "loss": 0.7148, - "step": 33069 - }, - { - "epoch": 0.85, - "learning_rate": 1.683767311506307e-06, - "loss": 0.8965, - "step": 33070 - }, - { - "epoch": 0.85, - "learning_rate": 1.683747120111043e-06, - "loss": 0.9375, - "step": 33071 - }, - { - "epoch": 0.85, - "learning_rate": 1.6837269281922652e-06, - "loss": 0.9648, - "step": 33072 - }, - { - "epoch": 0.85, - "learning_rate": 1.6837067357499893e-06, - "loss": 0.7793, - "step": 33073 - }, - { - "epoch": 0.85, - "learning_rate": 1.6836865427842303e-06, - "loss": 0.7131, - "step": 33074 - }, - { - "epoch": 0.85, - "learning_rate": 1.6836663492950045e-06, - "loss": 0.9531, - "step": 33075 - }, - { - "epoch": 0.85, - "learning_rate": 1.6836461552823266e-06, - "loss": 0.8735, - "step": 33076 - }, - { - "epoch": 0.85, - "learning_rate": 1.6836259607462119e-06, - "loss": 0.8232, - "step": 33077 - }, - { - "epoch": 0.85, - "learning_rate": 1.6836057656866766e-06, - "loss": 0.731, - "step": 33078 - }, - { - "epoch": 0.85, - "learning_rate": 1.6835855701037355e-06, - "loss": 1.0254, - "step": 33079 - }, - { - "epoch": 0.85, - "learning_rate": 1.6835653739974047e-06, - "loss": 0.686, - "step": 33080 - }, - { - "epoch": 0.85, - "learning_rate": 1.6835451773676993e-06, - "loss": 0.7408, - "step": 33081 - }, - { - "epoch": 0.85, - "learning_rate": 1.6835249802146348e-06, - "loss": 0.6836, - "step": 33082 - }, - { - "epoch": 0.85, - "learning_rate": 1.6835047825382262e-06, - "loss": 0.6543, - "step": 33083 - }, - { - "epoch": 0.85, - "learning_rate": 1.6834845843384899e-06, - "loss": 0.8091, - "step": 33084 - }, - { - "epoch": 0.85, - "learning_rate": 1.683464385615441e-06, - "loss": 0.9424, - "step": 33085 - }, - { - "epoch": 0.85, - "learning_rate": 1.6834441863690944e-06, - "loss": 0.8721, - "step": 33086 - }, - { - "epoch": 0.85, - "learning_rate": 1.6834239865994664e-06, - "loss": 0.8496, - "step": 33087 - }, - { - "epoch": 0.85, - "learning_rate": 1.6834037863065715e-06, - "loss": 0.9551, - "step": 33088 - }, - { - "epoch": 0.85, - "learning_rate": 1.6833835854904263e-06, - "loss": 0.7783, - "step": 33089 - }, - { - "epoch": 0.85, - "learning_rate": 1.6833633841510455e-06, - "loss": 0.8135, - "step": 33090 - }, - { - "epoch": 0.85, - "learning_rate": 1.683343182288445e-06, - "loss": 0.6313, - "step": 33091 - }, - { - "epoch": 0.85, - "learning_rate": 1.6833229799026397e-06, - "loss": 0.8213, - "step": 33092 - }, - { - "epoch": 0.85, - "learning_rate": 1.6833027769936456e-06, - "loss": 0.7988, - "step": 33093 - }, - { - "epoch": 0.85, - "learning_rate": 1.683282573561478e-06, - "loss": 0.9873, - "step": 33094 - }, - { - "epoch": 0.85, - "learning_rate": 1.6832623696061523e-06, - "loss": 0.7393, - "step": 33095 - }, - { - "epoch": 0.85, - "learning_rate": 1.6832421651276839e-06, - "loss": 0.6987, - "step": 33096 - }, - { - "epoch": 0.85, - "learning_rate": 1.6832219601260883e-06, - "loss": 0.9785, - "step": 33097 - }, - { - "epoch": 0.85, - "learning_rate": 1.6832017546013814e-06, - "loss": 0.8916, - "step": 33098 - }, - { - "epoch": 0.85, - "learning_rate": 1.6831815485535784e-06, - "loss": 0.7324, - "step": 33099 - }, - { - "epoch": 0.85, - "learning_rate": 1.6831613419826947e-06, - "loss": 0.729, - "step": 33100 - }, - { - "epoch": 0.85, - "learning_rate": 1.6831411348887455e-06, - "loss": 0.8213, - "step": 33101 - }, - { - "epoch": 0.85, - "learning_rate": 1.6831209272717466e-06, - "loss": 0.9209, - "step": 33102 - }, - { - "epoch": 0.85, - "learning_rate": 1.6831007191317132e-06, - "loss": 0.9404, - "step": 33103 - }, - { - "epoch": 0.85, - "learning_rate": 1.6830805104686615e-06, - "loss": 0.8926, - "step": 33104 - }, - { - "epoch": 0.85, - "learning_rate": 1.683060301282606e-06, - "loss": 0.9678, - "step": 33105 - }, - { - "epoch": 0.85, - "learning_rate": 1.683040091573563e-06, - "loss": 0.8755, - "step": 33106 - }, - { - "epoch": 0.85, - "learning_rate": 1.6830198813415472e-06, - "loss": 0.7759, - "step": 33107 - }, - { - "epoch": 0.85, - "learning_rate": 1.6829996705865749e-06, - "loss": 0.7783, - "step": 33108 - }, - { - "epoch": 0.85, - "learning_rate": 1.6829794593086609e-06, - "loss": 0.6855, - "step": 33109 - }, - { - "epoch": 0.85, - "learning_rate": 1.6829592475078211e-06, - "loss": 0.73, - "step": 33110 - }, - { - "epoch": 0.85, - "learning_rate": 1.6829390351840707e-06, - "loss": 0.9014, - "step": 33111 - }, - { - "epoch": 0.85, - "learning_rate": 1.6829188223374252e-06, - "loss": 0.7861, - "step": 33112 - }, - { - "epoch": 0.85, - "learning_rate": 1.6828986089679004e-06, - "loss": 0.7031, - "step": 33113 - }, - { - "epoch": 0.85, - "learning_rate": 1.6828783950755112e-06, - "loss": 0.7275, - "step": 33114 - }, - { - "epoch": 0.85, - "learning_rate": 1.6828581806602738e-06, - "loss": 0.9932, - "step": 33115 - }, - { - "epoch": 0.85, - "learning_rate": 1.682837965722203e-06, - "loss": 0.7563, - "step": 33116 - }, - { - "epoch": 0.85, - "learning_rate": 1.6828177502613148e-06, - "loss": 0.9473, - "step": 33117 - }, - { - "epoch": 0.85, - "learning_rate": 1.6827975342776241e-06, - "loss": 0.833, - "step": 33118 - }, - { - "epoch": 0.85, - "learning_rate": 1.6827773177711468e-06, - "loss": 0.9365, - "step": 33119 - }, - { - "epoch": 0.85, - "learning_rate": 1.6827571007418988e-06, - "loss": 0.6934, - "step": 33120 - }, - { - "epoch": 0.85, - "learning_rate": 1.6827368831898947e-06, - "loss": 0.874, - "step": 33121 - }, - { - "epoch": 0.85, - "learning_rate": 1.68271666511515e-06, - "loss": 0.9941, - "step": 33122 - }, - { - "epoch": 0.85, - "learning_rate": 1.6826964465176812e-06, - "loss": 0.8525, - "step": 33123 - }, - { - "epoch": 0.85, - "learning_rate": 1.6826762273975029e-06, - "loss": 0.9023, - "step": 33124 - }, - { - "epoch": 0.85, - "learning_rate": 1.6826560077546307e-06, - "loss": 0.9131, - "step": 33125 - }, - { - "epoch": 0.85, - "learning_rate": 1.6826357875890802e-06, - "loss": 0.7744, - "step": 33126 - }, - { - "epoch": 0.85, - "learning_rate": 1.6826155669008669e-06, - "loss": 0.7793, - "step": 33127 - }, - { - "epoch": 0.85, - "learning_rate": 1.6825953456900061e-06, - "loss": 0.793, - "step": 33128 - }, - { - "epoch": 0.85, - "learning_rate": 1.6825751239565137e-06, - "loss": 0.7681, - "step": 33129 - }, - { - "epoch": 0.85, - "learning_rate": 1.6825549017004047e-06, - "loss": 0.8477, - "step": 33130 - }, - { - "epoch": 0.85, - "learning_rate": 1.682534678921695e-06, - "loss": 0.9199, - "step": 33131 - }, - { - "epoch": 0.85, - "learning_rate": 1.6825144556203998e-06, - "loss": 0.7627, - "step": 33132 - }, - { - "epoch": 0.85, - "learning_rate": 1.6824942317965345e-06, - "loss": 0.7891, - "step": 33133 - }, - { - "epoch": 0.85, - "learning_rate": 1.6824740074501148e-06, - "loss": 0.9326, - "step": 33134 - }, - { - "epoch": 0.85, - "learning_rate": 1.6824537825811565e-06, - "loss": 0.9678, - "step": 33135 - }, - { - "epoch": 0.85, - "learning_rate": 1.6824335571896744e-06, - "loss": 0.9785, - "step": 33136 - }, - { - "epoch": 0.85, - "learning_rate": 1.682413331275684e-06, - "loss": 0.8301, - "step": 33137 - }, - { - "epoch": 0.85, - "learning_rate": 1.6823931048392014e-06, - "loss": 0.8281, - "step": 33138 - }, - { - "epoch": 0.85, - "learning_rate": 1.6823728778802419e-06, - "loss": 0.8213, - "step": 33139 - }, - { - "epoch": 0.85, - "learning_rate": 1.6823526503988208e-06, - "loss": 0.9023, - "step": 33140 - }, - { - "epoch": 0.85, - "learning_rate": 1.6823324223949537e-06, - "loss": 0.915, - "step": 33141 - }, - { - "epoch": 0.85, - "learning_rate": 1.682312193868656e-06, - "loss": 1.0244, - "step": 33142 - }, - { - "epoch": 0.85, - "learning_rate": 1.6822919648199432e-06, - "loss": 1.0049, - "step": 33143 - }, - { - "epoch": 0.85, - "learning_rate": 1.6822717352488308e-06, - "loss": 1.0215, - "step": 33144 - }, - { - "epoch": 0.85, - "learning_rate": 1.6822515051553343e-06, - "loss": 0.8232, - "step": 33145 - }, - { - "epoch": 0.85, - "learning_rate": 1.682231274539469e-06, - "loss": 0.918, - "step": 33146 - }, - { - "epoch": 0.85, - "learning_rate": 1.682211043401251e-06, - "loss": 0.7617, - "step": 33147 - }, - { - "epoch": 0.85, - "learning_rate": 1.6821908117406951e-06, - "loss": 0.6885, - "step": 33148 - }, - { - "epoch": 0.85, - "learning_rate": 1.682170579557817e-06, - "loss": 0.8613, - "step": 33149 - }, - { - "epoch": 0.85, - "learning_rate": 1.6821503468526325e-06, - "loss": 0.6475, - "step": 33150 - }, - { - "epoch": 0.85, - "learning_rate": 1.6821301136251567e-06, - "loss": 0.6631, - "step": 33151 - }, - { - "epoch": 0.85, - "learning_rate": 1.6821098798754055e-06, - "loss": 0.8555, - "step": 33152 - }, - { - "epoch": 0.85, - "learning_rate": 1.6820896456033936e-06, - "loss": 0.7539, - "step": 33153 - }, - { - "epoch": 0.85, - "learning_rate": 1.6820694108091373e-06, - "loss": 0.7744, - "step": 33154 - }, - { - "epoch": 0.85, - "learning_rate": 1.682049175492652e-06, - "loss": 0.7549, - "step": 33155 - }, - { - "epoch": 0.85, - "learning_rate": 1.6820289396539526e-06, - "loss": 1.0459, - "step": 33156 - }, - { - "epoch": 0.85, - "learning_rate": 1.6820087032930555e-06, - "loss": 0.7656, - "step": 33157 - }, - { - "epoch": 0.85, - "learning_rate": 1.6819884664099752e-06, - "loss": 1.0586, - "step": 33158 - }, - { - "epoch": 0.85, - "learning_rate": 1.681968229004728e-06, - "loss": 0.915, - "step": 33159 - }, - { - "epoch": 0.85, - "learning_rate": 1.681947991077329e-06, - "loss": 0.9492, - "step": 33160 - }, - { - "epoch": 0.85, - "learning_rate": 1.6819277526277937e-06, - "loss": 0.9062, - "step": 33161 - }, - { - "epoch": 0.85, - "learning_rate": 1.6819075136561377e-06, - "loss": 1.0029, - "step": 33162 - }, - { - "epoch": 0.85, - "learning_rate": 1.6818872741623764e-06, - "loss": 0.8159, - "step": 33163 - }, - { - "epoch": 0.85, - "learning_rate": 1.6818670341465255e-06, - "loss": 0.7871, - "step": 33164 - }, - { - "epoch": 0.85, - "learning_rate": 1.6818467936086007e-06, - "loss": 0.8281, - "step": 33165 - }, - { - "epoch": 0.85, - "learning_rate": 1.6818265525486166e-06, - "loss": 0.8115, - "step": 33166 - }, - { - "epoch": 0.85, - "learning_rate": 1.6818063109665897e-06, - "loss": 0.6548, - "step": 33167 - }, - { - "epoch": 0.85, - "learning_rate": 1.6817860688625345e-06, - "loss": 0.8984, - "step": 33168 - }, - { - "epoch": 0.85, - "learning_rate": 1.6817658262364675e-06, - "loss": 0.707, - "step": 33169 - }, - { - "epoch": 0.85, - "learning_rate": 1.6817455830884038e-06, - "loss": 0.917, - "step": 33170 - }, - { - "epoch": 0.85, - "learning_rate": 1.6817253394183587e-06, - "loss": 0.874, - "step": 33171 - }, - { - "epoch": 0.85, - "learning_rate": 1.6817050952263476e-06, - "loss": 0.9023, - "step": 33172 - }, - { - "epoch": 0.85, - "learning_rate": 1.6816848505123866e-06, - "loss": 0.8389, - "step": 33173 - }, - { - "epoch": 0.85, - "learning_rate": 1.6816646052764906e-06, - "loss": 0.9404, - "step": 33174 - }, - { - "epoch": 0.85, - "learning_rate": 1.681644359518676e-06, - "loss": 0.9727, - "step": 33175 - }, - { - "epoch": 0.85, - "learning_rate": 1.6816241132389571e-06, - "loss": 0.6934, - "step": 33176 - }, - { - "epoch": 0.85, - "learning_rate": 1.6816038664373498e-06, - "loss": 0.7507, - "step": 33177 - }, - { - "epoch": 0.85, - "learning_rate": 1.6815836191138701e-06, - "loss": 0.7729, - "step": 33178 - }, - { - "epoch": 0.85, - "learning_rate": 1.6815633712685329e-06, - "loss": 0.8086, - "step": 33179 - }, - { - "epoch": 0.85, - "learning_rate": 1.6815431229013543e-06, - "loss": 0.71, - "step": 33180 - }, - { - "epoch": 0.85, - "learning_rate": 1.6815228740123492e-06, - "loss": 0.8608, - "step": 33181 - }, - { - "epoch": 0.85, - "learning_rate": 1.6815026246015335e-06, - "loss": 0.7344, - "step": 33182 - }, - { - "epoch": 0.85, - "learning_rate": 1.6814823746689224e-06, - "loss": 0.7432, - "step": 33183 - }, - { - "epoch": 0.85, - "learning_rate": 1.6814621242145318e-06, - "loss": 0.8691, - "step": 33184 - }, - { - "epoch": 0.85, - "learning_rate": 1.681441873238377e-06, - "loss": 0.5488, - "step": 33185 - }, - { - "epoch": 0.85, - "learning_rate": 1.6814216217404735e-06, - "loss": 0.8955, - "step": 33186 - }, - { - "epoch": 0.85, - "learning_rate": 1.6814013697208366e-06, - "loss": 0.7581, - "step": 33187 - }, - { - "epoch": 0.85, - "learning_rate": 1.681381117179482e-06, - "loss": 0.9512, - "step": 33188 - }, - { - "epoch": 0.85, - "learning_rate": 1.6813608641164251e-06, - "loss": 0.9043, - "step": 33189 - }, - { - "epoch": 0.85, - "learning_rate": 1.681340610531682e-06, - "loss": 0.8809, - "step": 33190 - }, - { - "epoch": 0.85, - "learning_rate": 1.6813203564252673e-06, - "loss": 1.0215, - "step": 33191 - }, - { - "epoch": 0.85, - "learning_rate": 1.6813001017971973e-06, - "loss": 0.7627, - "step": 33192 - }, - { - "epoch": 0.85, - "learning_rate": 1.6812798466474869e-06, - "loss": 0.8882, - "step": 33193 - }, - { - "epoch": 0.85, - "learning_rate": 1.6812595909761517e-06, - "loss": 0.7344, - "step": 33194 - }, - { - "epoch": 0.85, - "learning_rate": 1.6812393347832078e-06, - "loss": 0.7754, - "step": 33195 - }, - { - "epoch": 0.85, - "learning_rate": 1.6812190780686699e-06, - "loss": 0.8457, - "step": 33196 - }, - { - "epoch": 0.85, - "learning_rate": 1.681198820832554e-06, - "loss": 1.0049, - "step": 33197 - }, - { - "epoch": 0.85, - "learning_rate": 1.6811785630748753e-06, - "loss": 0.6338, - "step": 33198 - }, - { - "epoch": 0.85, - "learning_rate": 1.6811583047956496e-06, - "loss": 0.6562, - "step": 33199 - }, - { - "epoch": 0.85, - "learning_rate": 1.6811380459948924e-06, - "loss": 0.7144, - "step": 33200 - }, - { - "epoch": 0.85, - "learning_rate": 1.6811177866726191e-06, - "loss": 0.7598, - "step": 33201 - }, - { - "epoch": 0.85, - "learning_rate": 1.6810975268288453e-06, - "loss": 1.0488, - "step": 33202 - }, - { - "epoch": 0.85, - "learning_rate": 1.6810772664635864e-06, - "loss": 0.9961, - "step": 33203 - }, - { - "epoch": 0.85, - "learning_rate": 1.681057005576858e-06, - "loss": 0.8359, - "step": 33204 - }, - { - "epoch": 0.85, - "learning_rate": 1.6810367441686751e-06, - "loss": 0.8447, - "step": 33205 - }, - { - "epoch": 0.85, - "learning_rate": 1.6810164822390542e-06, - "loss": 0.582, - "step": 33206 - }, - { - "epoch": 0.85, - "learning_rate": 1.68099621978801e-06, - "loss": 0.8047, - "step": 33207 - }, - { - "epoch": 0.85, - "learning_rate": 1.6809759568155586e-06, - "loss": 0.9658, - "step": 33208 - }, - { - "epoch": 0.85, - "learning_rate": 1.680955693321715e-06, - "loss": 0.9199, - "step": 33209 - }, - { - "epoch": 0.85, - "learning_rate": 1.680935429306495e-06, - "loss": 0.6914, - "step": 33210 - }, - { - "epoch": 0.85, - "learning_rate": 1.6809151647699142e-06, - "loss": 0.7314, - "step": 33211 - }, - { - "epoch": 0.85, - "learning_rate": 1.6808948997119878e-06, - "loss": 0.8447, - "step": 33212 - }, - { - "epoch": 0.85, - "learning_rate": 1.6808746341327313e-06, - "loss": 0.6143, - "step": 33213 - }, - { - "epoch": 0.85, - "learning_rate": 1.6808543680321607e-06, - "loss": 0.9023, - "step": 33214 - }, - { - "epoch": 0.85, - "learning_rate": 1.6808341014102911e-06, - "loss": 1.0264, - "step": 33215 - }, - { - "epoch": 0.85, - "learning_rate": 1.6808138342671384e-06, - "loss": 0.7598, - "step": 33216 - }, - { - "epoch": 0.85, - "learning_rate": 1.6807935666027175e-06, - "loss": 0.9209, - "step": 33217 - }, - { - "epoch": 0.85, - "learning_rate": 1.6807732984170443e-06, - "loss": 1.0049, - "step": 33218 - }, - { - "epoch": 0.85, - "learning_rate": 1.6807530297101345e-06, - "loss": 0.7026, - "step": 33219 - }, - { - "epoch": 0.85, - "learning_rate": 1.6807327604820031e-06, - "loss": 0.792, - "step": 33220 - }, - { - "epoch": 0.85, - "learning_rate": 1.6807124907326662e-06, - "loss": 1.0156, - "step": 33221 - }, - { - "epoch": 0.85, - "learning_rate": 1.6806922204621388e-06, - "loss": 0.8369, - "step": 33222 - }, - { - "epoch": 0.85, - "learning_rate": 1.680671949670437e-06, - "loss": 0.8574, - "step": 33223 - }, - { - "epoch": 0.85, - "learning_rate": 1.6806516783575757e-06, - "loss": 0.9097, - "step": 33224 - }, - { - "epoch": 0.85, - "learning_rate": 1.6806314065235708e-06, - "loss": 1.0117, - "step": 33225 - }, - { - "epoch": 0.85, - "learning_rate": 1.6806111341684378e-06, - "loss": 1.0801, - "step": 33226 - }, - { - "epoch": 0.85, - "learning_rate": 1.6805908612921919e-06, - "loss": 0.9609, - "step": 33227 - }, - { - "epoch": 0.85, - "learning_rate": 1.680570587894849e-06, - "loss": 0.8115, - "step": 33228 - }, - { - "epoch": 0.85, - "learning_rate": 1.6805503139764248e-06, - "loss": 0.8906, - "step": 33229 - }, - { - "epoch": 0.85, - "learning_rate": 1.6805300395369342e-06, - "loss": 0.7266, - "step": 33230 - }, - { - "epoch": 0.85, - "learning_rate": 1.680509764576393e-06, - "loss": 0.9287, - "step": 33231 - }, - { - "epoch": 0.85, - "learning_rate": 1.680489489094817e-06, - "loss": 0.7158, - "step": 33232 - }, - { - "epoch": 0.85, - "learning_rate": 1.6804692130922212e-06, - "loss": 0.7407, - "step": 33233 - }, - { - "epoch": 0.85, - "learning_rate": 1.6804489365686218e-06, - "loss": 0.9541, - "step": 33234 - }, - { - "epoch": 0.85, - "learning_rate": 1.6804286595240336e-06, - "loss": 0.751, - "step": 33235 - }, - { - "epoch": 0.85, - "learning_rate": 1.6804083819584727e-06, - "loss": 0.9629, - "step": 33236 - }, - { - "epoch": 0.85, - "learning_rate": 1.6803881038719543e-06, - "loss": 0.8926, - "step": 33237 - }, - { - "epoch": 0.85, - "learning_rate": 1.6803678252644938e-06, - "loss": 0.8525, - "step": 33238 - }, - { - "epoch": 0.85, - "learning_rate": 1.680347546136107e-06, - "loss": 0.6763, - "step": 33239 - }, - { - "epoch": 0.85, - "learning_rate": 1.6803272664868096e-06, - "loss": 0.751, - "step": 33240 - }, - { - "epoch": 0.85, - "learning_rate": 1.6803069863166169e-06, - "loss": 0.7988, - "step": 33241 - }, - { - "epoch": 0.85, - "learning_rate": 1.6802867056255444e-06, - "loss": 0.9204, - "step": 33242 - }, - { - "epoch": 0.85, - "learning_rate": 1.6802664244136072e-06, - "loss": 0.8428, - "step": 33243 - }, - { - "epoch": 0.85, - "learning_rate": 1.6802461426808217e-06, - "loss": 0.8276, - "step": 33244 - }, - { - "epoch": 0.85, - "learning_rate": 1.6802258604272028e-06, - "loss": 0.9004, - "step": 33245 - }, - { - "epoch": 0.85, - "learning_rate": 1.6802055776527664e-06, - "loss": 0.583, - "step": 33246 - }, - { - "epoch": 0.85, - "learning_rate": 1.6801852943575278e-06, - "loss": 0.9385, - "step": 33247 - }, - { - "epoch": 0.85, - "learning_rate": 1.6801650105415028e-06, - "loss": 0.9316, - "step": 33248 - }, - { - "epoch": 0.85, - "learning_rate": 1.6801447262047065e-06, - "loss": 0.7104, - "step": 33249 - }, - { - "epoch": 0.85, - "learning_rate": 1.6801244413471548e-06, - "loss": 0.8486, - "step": 33250 - }, - { - "epoch": 0.85, - "learning_rate": 1.680104155968863e-06, - "loss": 0.8867, - "step": 33251 - }, - { - "epoch": 0.85, - "learning_rate": 1.6800838700698465e-06, - "loss": 0.9092, - "step": 33252 - }, - { - "epoch": 0.85, - "learning_rate": 1.6800635836501214e-06, - "loss": 0.8369, - "step": 33253 - }, - { - "epoch": 0.85, - "learning_rate": 1.680043296709703e-06, - "loss": 0.9355, - "step": 33254 - }, - { - "epoch": 0.85, - "learning_rate": 1.6800230092486062e-06, - "loss": 0.833, - "step": 33255 - }, - { - "epoch": 0.85, - "learning_rate": 1.6800027212668476e-06, - "loss": 0.7441, - "step": 33256 - }, - { - "epoch": 0.85, - "learning_rate": 1.6799824327644417e-06, - "loss": 0.8389, - "step": 33257 - }, - { - "epoch": 0.85, - "learning_rate": 1.6799621437414046e-06, - "loss": 0.9277, - "step": 33258 - }, - { - "epoch": 0.85, - "learning_rate": 1.6799418541977521e-06, - "loss": 0.8242, - "step": 33259 - }, - { - "epoch": 0.85, - "learning_rate": 1.6799215641334993e-06, - "loss": 0.8945, - "step": 33260 - }, - { - "epoch": 0.85, - "learning_rate": 1.6799012735486614e-06, - "loss": 0.9219, - "step": 33261 - }, - { - "epoch": 0.85, - "learning_rate": 1.6798809824432547e-06, - "loss": 0.9707, - "step": 33262 - }, - { - "epoch": 0.85, - "learning_rate": 1.6798606908172944e-06, - "loss": 0.8154, - "step": 33263 - }, - { - "epoch": 0.85, - "learning_rate": 1.6798403986707959e-06, - "loss": 0.709, - "step": 33264 - }, - { - "epoch": 0.85, - "learning_rate": 1.6798201060037749e-06, - "loss": 0.8877, - "step": 33265 - }, - { - "epoch": 0.85, - "learning_rate": 1.679799812816247e-06, - "loss": 0.3755, - "step": 33266 - }, - { - "epoch": 0.85, - "learning_rate": 1.6797795191082276e-06, - "loss": 0.8027, - "step": 33267 - }, - { - "epoch": 0.85, - "learning_rate": 1.6797592248797323e-06, - "loss": 0.8984, - "step": 33268 - }, - { - "epoch": 0.85, - "learning_rate": 1.6797389301307766e-06, - "loss": 1.0361, - "step": 33269 - }, - { - "epoch": 0.85, - "learning_rate": 1.6797186348613758e-06, - "loss": 0.8281, - "step": 33270 - }, - { - "epoch": 0.85, - "learning_rate": 1.6796983390715461e-06, - "loss": 0.8125, - "step": 33271 - }, - { - "epoch": 0.85, - "learning_rate": 1.6796780427613024e-06, - "loss": 0.9863, - "step": 33272 - }, - { - "epoch": 0.85, - "learning_rate": 1.6796577459306604e-06, - "loss": 0.8379, - "step": 33273 - }, - { - "epoch": 0.85, - "learning_rate": 1.6796374485796362e-06, - "loss": 0.853, - "step": 33274 - }, - { - "epoch": 0.85, - "learning_rate": 1.6796171507082444e-06, - "loss": 0.8848, - "step": 33275 - }, - { - "epoch": 0.85, - "learning_rate": 1.6795968523165008e-06, - "loss": 0.8428, - "step": 33276 - }, - { - "epoch": 0.85, - "learning_rate": 1.6795765534044218e-06, - "loss": 0.9375, - "step": 33277 - }, - { - "epoch": 0.85, - "learning_rate": 1.6795562539720218e-06, - "loss": 0.7969, - "step": 33278 - }, - { - "epoch": 0.85, - "learning_rate": 1.679535954019317e-06, - "loss": 0.917, - "step": 33279 - }, - { - "epoch": 0.85, - "learning_rate": 1.6795156535463226e-06, - "loss": 0.9771, - "step": 33280 - }, - { - "epoch": 0.85, - "learning_rate": 1.6794953525530543e-06, - "loss": 0.876, - "step": 33281 - }, - { - "epoch": 0.85, - "learning_rate": 1.6794750510395278e-06, - "loss": 0.6279, - "step": 33282 - }, - { - "epoch": 0.85, - "learning_rate": 1.6794547490057584e-06, - "loss": 0.5913, - "step": 33283 - }, - { - "epoch": 0.85, - "learning_rate": 1.6794344464517622e-06, - "loss": 0.6807, - "step": 33284 - }, - { - "epoch": 0.85, - "learning_rate": 1.6794141433775536e-06, - "loss": 0.8994, - "step": 33285 - }, - { - "epoch": 0.85, - "learning_rate": 1.6793938397831493e-06, - "loss": 1.0391, - "step": 33286 - }, - { - "epoch": 0.85, - "learning_rate": 1.6793735356685642e-06, - "loss": 0.7295, - "step": 33287 - }, - { - "epoch": 0.85, - "learning_rate": 1.679353231033814e-06, - "loss": 0.8076, - "step": 33288 - }, - { - "epoch": 0.85, - "learning_rate": 1.6793329258789145e-06, - "loss": 0.8486, - "step": 33289 - }, - { - "epoch": 0.85, - "learning_rate": 1.6793126202038806e-06, - "loss": 0.8132, - "step": 33290 - }, - { - "epoch": 0.85, - "learning_rate": 1.6792923140087285e-06, - "loss": 0.8467, - "step": 33291 - }, - { - "epoch": 0.85, - "learning_rate": 1.6792720072934734e-06, - "loss": 0.918, - "step": 33292 - }, - { - "epoch": 0.85, - "learning_rate": 1.6792517000581313e-06, - "loss": 0.9561, - "step": 33293 - }, - { - "epoch": 0.85, - "learning_rate": 1.679231392302717e-06, - "loss": 0.8306, - "step": 33294 - }, - { - "epoch": 0.85, - "learning_rate": 1.6792110840272464e-06, - "loss": 0.7542, - "step": 33295 - }, - { - "epoch": 0.85, - "learning_rate": 1.6791907752317353e-06, - "loss": 0.6335, - "step": 33296 - }, - { - "epoch": 0.85, - "learning_rate": 1.6791704659161992e-06, - "loss": 0.7988, - "step": 33297 - }, - { - "epoch": 0.85, - "learning_rate": 1.6791501560806532e-06, - "loss": 0.7451, - "step": 33298 - }, - { - "epoch": 0.85, - "learning_rate": 1.6791298457251135e-06, - "loss": 0.9902, - "step": 33299 - }, - { - "epoch": 0.85, - "learning_rate": 1.6791095348495952e-06, - "loss": 0.9248, - "step": 33300 - }, - { - "epoch": 0.85, - "learning_rate": 1.6790892234541135e-06, - "loss": 0.9844, - "step": 33301 - }, - { - "epoch": 0.85, - "learning_rate": 1.679068911538685e-06, - "loss": 0.8154, - "step": 33302 - }, - { - "epoch": 0.85, - "learning_rate": 1.6790485991033246e-06, - "loss": 0.6509, - "step": 33303 - }, - { - "epoch": 0.85, - "learning_rate": 1.6790282861480476e-06, - "loss": 0.8652, - "step": 33304 - }, - { - "epoch": 0.85, - "learning_rate": 1.6790079726728701e-06, - "loss": 0.8857, - "step": 33305 - }, - { - "epoch": 0.85, - "learning_rate": 1.6789876586778073e-06, - "loss": 0.7856, - "step": 33306 - }, - { - "epoch": 0.85, - "learning_rate": 1.678967344162875e-06, - "loss": 0.9023, - "step": 33307 - }, - { - "epoch": 0.85, - "learning_rate": 1.6789470291280883e-06, - "loss": 1.0332, - "step": 33308 - }, - { - "epoch": 0.85, - "learning_rate": 1.6789267135734635e-06, - "loss": 0.9043, - "step": 33309 - }, - { - "epoch": 0.85, - "learning_rate": 1.6789063974990154e-06, - "loss": 0.585, - "step": 33310 - }, - { - "epoch": 0.85, - "learning_rate": 1.67888608090476e-06, - "loss": 0.8901, - "step": 33311 - }, - { - "epoch": 0.85, - "learning_rate": 1.6788657637907128e-06, - "loss": 0.8667, - "step": 33312 - }, - { - "epoch": 0.85, - "learning_rate": 1.6788454461568896e-06, - "loss": 0.8633, - "step": 33313 - }, - { - "epoch": 0.85, - "learning_rate": 1.678825128003305e-06, - "loss": 0.9668, - "step": 33314 - }, - { - "epoch": 0.85, - "learning_rate": 1.6788048093299756e-06, - "loss": 0.5161, - "step": 33315 - }, - { - "epoch": 0.85, - "learning_rate": 1.6787844901369165e-06, - "loss": 1.0068, - "step": 33316 - }, - { - "epoch": 0.85, - "learning_rate": 1.6787641704241432e-06, - "loss": 0.707, - "step": 33317 - }, - { - "epoch": 0.85, - "learning_rate": 1.6787438501916714e-06, - "loss": 0.8232, - "step": 33318 - }, - { - "epoch": 0.85, - "learning_rate": 1.6787235294395172e-06, - "loss": 0.71, - "step": 33319 - }, - { - "epoch": 0.85, - "learning_rate": 1.678703208167695e-06, - "loss": 0.7375, - "step": 33320 - }, - { - "epoch": 0.85, - "learning_rate": 1.678682886376221e-06, - "loss": 0.5332, - "step": 33321 - }, - { - "epoch": 0.85, - "learning_rate": 1.678662564065111e-06, - "loss": 0.5955, - "step": 33322 - }, - { - "epoch": 0.85, - "learning_rate": 1.67864224123438e-06, - "loss": 0.8965, - "step": 33323 - }, - { - "epoch": 0.85, - "learning_rate": 1.6786219178840442e-06, - "loss": 0.8994, - "step": 33324 - }, - { - "epoch": 0.85, - "learning_rate": 1.6786015940141185e-06, - "loss": 0.71, - "step": 33325 - }, - { - "epoch": 0.85, - "learning_rate": 1.6785812696246189e-06, - "loss": 0.8076, - "step": 33326 - }, - { - "epoch": 0.85, - "learning_rate": 1.6785609447155606e-06, - "loss": 0.7991, - "step": 33327 - }, - { - "epoch": 0.85, - "learning_rate": 1.6785406192869595e-06, - "loss": 0.7686, - "step": 33328 - }, - { - "epoch": 0.85, - "learning_rate": 1.678520293338831e-06, - "loss": 0.7979, - "step": 33329 - }, - { - "epoch": 0.85, - "learning_rate": 1.678499966871191e-06, - "loss": 0.5913, - "step": 33330 - }, - { - "epoch": 0.85, - "learning_rate": 1.6784796398840547e-06, - "loss": 0.9912, - "step": 33331 - }, - { - "epoch": 0.85, - "learning_rate": 1.6784593123774376e-06, - "loss": 0.7812, - "step": 33332 - }, - { - "epoch": 0.85, - "learning_rate": 1.6784389843513553e-06, - "loss": 0.8271, - "step": 33333 - }, - { - "epoch": 0.85, - "learning_rate": 1.6784186558058236e-06, - "loss": 0.6426, - "step": 33334 - }, - { - "epoch": 0.85, - "learning_rate": 1.678398326740858e-06, - "loss": 0.8594, - "step": 33335 - }, - { - "epoch": 0.85, - "learning_rate": 1.6783779971564737e-06, - "loss": 0.8105, - "step": 33336 - }, - { - "epoch": 0.85, - "learning_rate": 1.6783576670526869e-06, - "loss": 0.8984, - "step": 33337 - }, - { - "epoch": 0.85, - "learning_rate": 1.6783373364295126e-06, - "loss": 0.8584, - "step": 33338 - }, - { - "epoch": 0.85, - "learning_rate": 1.6783170052869668e-06, - "loss": 0.6719, - "step": 33339 - }, - { - "epoch": 0.85, - "learning_rate": 1.6782966736250648e-06, - "loss": 0.8203, - "step": 33340 - }, - { - "epoch": 0.85, - "learning_rate": 1.678276341443822e-06, - "loss": 0.7598, - "step": 33341 - }, - { - "epoch": 0.85, - "learning_rate": 1.6782560087432544e-06, - "loss": 0.9834, - "step": 33342 - }, - { - "epoch": 0.85, - "learning_rate": 1.6782356755233772e-06, - "loss": 0.8525, - "step": 33343 - }, - { - "epoch": 0.85, - "learning_rate": 1.6782153417842063e-06, - "loss": 0.728, - "step": 33344 - }, - { - "epoch": 0.85, - "learning_rate": 1.6781950075257572e-06, - "loss": 0.8896, - "step": 33345 - }, - { - "epoch": 0.85, - "learning_rate": 1.678174672748045e-06, - "loss": 1.0469, - "step": 33346 - }, - { - "epoch": 0.85, - "learning_rate": 1.678154337451086e-06, - "loss": 0.6934, - "step": 33347 - }, - { - "epoch": 0.85, - "learning_rate": 1.6781340016348953e-06, - "loss": 0.9082, - "step": 33348 - }, - { - "epoch": 0.85, - "learning_rate": 1.6781136652994886e-06, - "loss": 0.7231, - "step": 33349 - }, - { - "epoch": 0.85, - "learning_rate": 1.6780933284448814e-06, - "loss": 0.8418, - "step": 33350 - }, - { - "epoch": 0.85, - "learning_rate": 1.6780729910710894e-06, - "loss": 0.5332, - "step": 33351 - }, - { - "epoch": 0.85, - "learning_rate": 1.6780526531781278e-06, - "loss": 0.9795, - "step": 33352 - }, - { - "epoch": 0.85, - "learning_rate": 1.6780323147660127e-06, - "loss": 0.999, - "step": 33353 - }, - { - "epoch": 0.85, - "learning_rate": 1.6780119758347592e-06, - "loss": 0.8115, - "step": 33354 - }, - { - "epoch": 0.85, - "learning_rate": 1.6779916363843834e-06, - "loss": 0.8037, - "step": 33355 - }, - { - "epoch": 0.85, - "learning_rate": 1.6779712964149004e-06, - "loss": 0.8867, - "step": 33356 - }, - { - "epoch": 0.85, - "learning_rate": 1.6779509559263262e-06, - "loss": 0.9023, - "step": 33357 - }, - { - "epoch": 0.85, - "learning_rate": 1.6779306149186758e-06, - "loss": 0.791, - "step": 33358 - }, - { - "epoch": 0.86, - "learning_rate": 1.6779102733919653e-06, - "loss": 0.9678, - "step": 33359 - }, - { - "epoch": 0.86, - "learning_rate": 1.67788993134621e-06, - "loss": 0.6895, - "step": 33360 - }, - { - "epoch": 0.86, - "learning_rate": 1.6778695887814257e-06, - "loss": 0.875, - "step": 33361 - }, - { - "epoch": 0.86, - "learning_rate": 1.6778492456976276e-06, - "loss": 0.999, - "step": 33362 - }, - { - "epoch": 0.86, - "learning_rate": 1.6778289020948316e-06, - "loss": 1.0293, - "step": 33363 - }, - { - "epoch": 0.86, - "learning_rate": 1.6778085579730533e-06, - "loss": 0.9482, - "step": 33364 - }, - { - "epoch": 0.86, - "learning_rate": 1.6777882133323077e-06, - "loss": 0.8486, - "step": 33365 - }, - { - "epoch": 0.86, - "learning_rate": 1.6777678681726113e-06, - "loss": 0.6895, - "step": 33366 - }, - { - "epoch": 0.86, - "learning_rate": 1.6777475224939793e-06, - "loss": 0.77, - "step": 33367 - }, - { - "epoch": 0.86, - "learning_rate": 1.6777271762964268e-06, - "loss": 0.832, - "step": 33368 - }, - { - "epoch": 0.86, - "learning_rate": 1.6777068295799702e-06, - "loss": 0.915, - "step": 33369 - }, - { - "epoch": 0.86, - "learning_rate": 1.6776864823446242e-06, - "loss": 0.811, - "step": 33370 - }, - { - "epoch": 0.86, - "learning_rate": 1.6776661345904049e-06, - "loss": 0.7017, - "step": 33371 - }, - { - "epoch": 0.86, - "learning_rate": 1.6776457863173277e-06, - "loss": 0.6433, - "step": 33372 - }, - { - "epoch": 0.86, - "learning_rate": 1.6776254375254087e-06, - "loss": 0.9736, - "step": 33373 - }, - { - "epoch": 0.86, - "learning_rate": 1.6776050882146628e-06, - "loss": 0.8145, - "step": 33374 - }, - { - "epoch": 0.86, - "learning_rate": 1.6775847383851058e-06, - "loss": 0.6987, - "step": 33375 - }, - { - "epoch": 0.86, - "learning_rate": 1.6775643880367534e-06, - "loss": 0.835, - "step": 33376 - }, - { - "epoch": 0.86, - "learning_rate": 1.677544037169621e-06, - "loss": 0.6592, - "step": 33377 - }, - { - "epoch": 0.86, - "learning_rate": 1.6775236857837243e-06, - "loss": 0.6748, - "step": 33378 - }, - { - "epoch": 0.86, - "learning_rate": 1.6775033338790791e-06, - "loss": 0.8242, - "step": 33379 - }, - { - "epoch": 0.86, - "learning_rate": 1.6774829814557006e-06, - "loss": 0.6904, - "step": 33380 - }, - { - "epoch": 0.86, - "learning_rate": 1.6774626285136043e-06, - "loss": 0.7246, - "step": 33381 - }, - { - "epoch": 0.86, - "learning_rate": 1.6774422750528063e-06, - "loss": 0.793, - "step": 33382 - }, - { - "epoch": 0.86, - "learning_rate": 1.6774219210733217e-06, - "loss": 0.834, - "step": 33383 - }, - { - "epoch": 0.86, - "learning_rate": 1.677401566575167e-06, - "loss": 0.8174, - "step": 33384 - }, - { - "epoch": 0.86, - "learning_rate": 1.677381211558356e-06, - "loss": 0.8281, - "step": 33385 - }, - { - "epoch": 0.86, - "learning_rate": 1.677360856022906e-06, - "loss": 0.833, - "step": 33386 - }, - { - "epoch": 0.86, - "learning_rate": 1.6773404999688317e-06, - "loss": 0.7412, - "step": 33387 - }, - { - "epoch": 0.86, - "learning_rate": 1.677320143396149e-06, - "loss": 0.792, - "step": 33388 - }, - { - "epoch": 0.86, - "learning_rate": 1.6772997863048737e-06, - "loss": 0.7031, - "step": 33389 - }, - { - "epoch": 0.86, - "learning_rate": 1.6772794286950207e-06, - "loss": 0.9229, - "step": 33390 - }, - { - "epoch": 0.86, - "learning_rate": 1.6772590705666062e-06, - "loss": 0.8154, - "step": 33391 - }, - { - "epoch": 0.86, - "learning_rate": 1.6772387119196454e-06, - "loss": 0.6592, - "step": 33392 - }, - { - "epoch": 0.86, - "learning_rate": 1.6772183527541542e-06, - "loss": 0.7715, - "step": 33393 - }, - { - "epoch": 0.86, - "learning_rate": 1.677197993070148e-06, - "loss": 1.335, - "step": 33394 - }, - { - "epoch": 0.86, - "learning_rate": 1.677177632867642e-06, - "loss": 0.6533, - "step": 33395 - }, - { - "epoch": 0.86, - "learning_rate": 1.677157272146653e-06, - "loss": 0.9365, - "step": 33396 - }, - { - "epoch": 0.86, - "learning_rate": 1.6771369109071954e-06, - "loss": 0.7124, - "step": 33397 - }, - { - "epoch": 0.86, - "learning_rate": 1.6771165491492851e-06, - "loss": 0.8945, - "step": 33398 - }, - { - "epoch": 0.86, - "learning_rate": 1.6770961868729381e-06, - "loss": 0.8779, - "step": 33399 - }, - { - "epoch": 0.86, - "learning_rate": 1.6770758240781695e-06, - "loss": 0.7217, - "step": 33400 - }, - { - "epoch": 0.86, - "learning_rate": 1.677055460764995e-06, - "loss": 0.8096, - "step": 33401 - }, - { - "epoch": 0.86, - "learning_rate": 1.6770350969334303e-06, - "loss": 0.8164, - "step": 33402 - }, - { - "epoch": 0.86, - "learning_rate": 1.677014732583491e-06, - "loss": 0.8203, - "step": 33403 - }, - { - "epoch": 0.86, - "learning_rate": 1.6769943677151927e-06, - "loss": 0.9692, - "step": 33404 - }, - { - "epoch": 0.86, - "learning_rate": 1.676974002328551e-06, - "loss": 0.7939, - "step": 33405 - }, - { - "epoch": 0.86, - "learning_rate": 1.6769536364235814e-06, - "loss": 0.9336, - "step": 33406 - }, - { - "epoch": 0.86, - "learning_rate": 1.6769332700002994e-06, - "loss": 0.7109, - "step": 33407 - }, - { - "epoch": 0.86, - "learning_rate": 1.6769129030587209e-06, - "loss": 0.728, - "step": 33408 - }, - { - "epoch": 0.86, - "learning_rate": 1.6768925355988613e-06, - "loss": 0.8345, - "step": 33409 - }, - { - "epoch": 0.86, - "learning_rate": 1.6768721676207357e-06, - "loss": 0.8555, - "step": 33410 - }, - { - "epoch": 0.86, - "learning_rate": 1.676851799124361e-06, - "loss": 0.9521, - "step": 33411 - }, - { - "epoch": 0.86, - "learning_rate": 1.6768314301097514e-06, - "loss": 1.0361, - "step": 33412 - }, - { - "epoch": 0.86, - "learning_rate": 1.6768110605769233e-06, - "loss": 0.795, - "step": 33413 - }, - { - "epoch": 0.86, - "learning_rate": 1.6767906905258924e-06, - "loss": 0.6631, - "step": 33414 - }, - { - "epoch": 0.86, - "learning_rate": 1.6767703199566733e-06, - "loss": 0.7822, - "step": 33415 - }, - { - "epoch": 0.86, - "learning_rate": 1.676749948869283e-06, - "loss": 0.6885, - "step": 33416 - }, - { - "epoch": 0.86, - "learning_rate": 1.676729577263736e-06, - "loss": 0.9277, - "step": 33417 - }, - { - "epoch": 0.86, - "learning_rate": 1.6767092051400482e-06, - "loss": 0.7983, - "step": 33418 - }, - { - "epoch": 0.86, - "learning_rate": 1.6766888324982355e-06, - "loss": 0.8223, - "step": 33419 - }, - { - "epoch": 0.86, - "learning_rate": 1.6766684593383134e-06, - "loss": 0.8799, - "step": 33420 - }, - { - "epoch": 0.86, - "learning_rate": 1.6766480856602971e-06, - "loss": 1.0107, - "step": 33421 - }, - { - "epoch": 0.86, - "learning_rate": 1.6766277114642024e-06, - "loss": 0.918, - "step": 33422 - }, - { - "epoch": 0.86, - "learning_rate": 1.6766073367500452e-06, - "loss": 0.8672, - "step": 33423 - }, - { - "epoch": 0.86, - "learning_rate": 1.6765869615178408e-06, - "loss": 0.6785, - "step": 33424 - }, - { - "epoch": 0.86, - "learning_rate": 1.6765665857676047e-06, - "loss": 0.8867, - "step": 33425 - }, - { - "epoch": 0.86, - "learning_rate": 1.676546209499353e-06, - "loss": 0.9707, - "step": 33426 - }, - { - "epoch": 0.86, - "learning_rate": 1.6765258327131008e-06, - "loss": 0.9033, - "step": 33427 - }, - { - "epoch": 0.86, - "learning_rate": 1.676505455408864e-06, - "loss": 0.8447, - "step": 33428 - }, - { - "epoch": 0.86, - "learning_rate": 1.676485077586658e-06, - "loss": 0.6846, - "step": 33429 - }, - { - "epoch": 0.86, - "learning_rate": 1.6764646992464984e-06, - "loss": 0.8213, - "step": 33430 - }, - { - "epoch": 0.86, - "learning_rate": 1.6764443203884008e-06, - "loss": 0.7783, - "step": 33431 - }, - { - "epoch": 0.86, - "learning_rate": 1.676423941012381e-06, - "loss": 0.7092, - "step": 33432 - }, - { - "epoch": 0.86, - "learning_rate": 1.6764035611184546e-06, - "loss": 0.5874, - "step": 33433 - }, - { - "epoch": 0.86, - "learning_rate": 1.6763831807066372e-06, - "loss": 0.8203, - "step": 33434 - }, - { - "epoch": 0.86, - "learning_rate": 1.676362799776944e-06, - "loss": 1.0713, - "step": 33435 - }, - { - "epoch": 0.86, - "learning_rate": 1.676342418329391e-06, - "loss": 0.7881, - "step": 33436 - }, - { - "epoch": 0.86, - "learning_rate": 1.6763220363639938e-06, - "loss": 0.6855, - "step": 33437 - }, - { - "epoch": 0.86, - "learning_rate": 1.6763016538807676e-06, - "loss": 0.6611, - "step": 33438 - }, - { - "epoch": 0.86, - "learning_rate": 1.6762812708797286e-06, - "loss": 0.9248, - "step": 33439 - }, - { - "epoch": 0.86, - "learning_rate": 1.6762608873608924e-06, - "loss": 0.7915, - "step": 33440 - }, - { - "epoch": 0.86, - "learning_rate": 1.6762405033242739e-06, - "loss": 0.8135, - "step": 33441 - }, - { - "epoch": 0.86, - "learning_rate": 1.6762201187698893e-06, - "loss": 0.9414, - "step": 33442 - }, - { - "epoch": 0.86, - "learning_rate": 1.6761997336977541e-06, - "loss": 0.7559, - "step": 33443 - }, - { - "epoch": 0.86, - "learning_rate": 1.6761793481078836e-06, - "loss": 0.7629, - "step": 33444 - }, - { - "epoch": 0.86, - "learning_rate": 1.676158962000294e-06, - "loss": 0.9014, - "step": 33445 - }, - { - "epoch": 0.86, - "learning_rate": 1.6761385753750003e-06, - "loss": 0.8838, - "step": 33446 - }, - { - "epoch": 0.86, - "learning_rate": 1.6761181882320185e-06, - "loss": 0.8252, - "step": 33447 - }, - { - "epoch": 0.86, - "learning_rate": 1.676097800571364e-06, - "loss": 1.0391, - "step": 33448 - }, - { - "epoch": 0.86, - "learning_rate": 1.6760774123930529e-06, - "loss": 1.0986, - "step": 33449 - }, - { - "epoch": 0.86, - "learning_rate": 1.6760570236970998e-06, - "loss": 0.7783, - "step": 33450 - }, - { - "epoch": 0.86, - "learning_rate": 1.676036634483521e-06, - "loss": 0.8389, - "step": 33451 - }, - { - "epoch": 0.86, - "learning_rate": 1.6760162447523323e-06, - "loss": 0.8154, - "step": 33452 - }, - { - "epoch": 0.86, - "learning_rate": 1.6759958545035491e-06, - "loss": 0.793, - "step": 33453 - }, - { - "epoch": 0.86, - "learning_rate": 1.675975463737187e-06, - "loss": 0.6865, - "step": 33454 - }, - { - "epoch": 0.86, - "learning_rate": 1.6759550724532613e-06, - "loss": 0.9346, - "step": 33455 - }, - { - "epoch": 0.86, - "learning_rate": 1.675934680651788e-06, - "loss": 0.7568, - "step": 33456 - }, - { - "epoch": 0.86, - "learning_rate": 1.6759142883327826e-06, - "loss": 0.7637, - "step": 33457 - }, - { - "epoch": 0.86, - "learning_rate": 1.6758938954962606e-06, - "loss": 0.9258, - "step": 33458 - }, - { - "epoch": 0.86, - "learning_rate": 1.6758735021422381e-06, - "loss": 0.7695, - "step": 33459 - }, - { - "epoch": 0.86, - "learning_rate": 1.6758531082707302e-06, - "loss": 0.9668, - "step": 33460 - }, - { - "epoch": 0.86, - "learning_rate": 1.6758327138817525e-06, - "loss": 0.9355, - "step": 33461 - }, - { - "epoch": 0.86, - "learning_rate": 1.6758123189753207e-06, - "loss": 0.8779, - "step": 33462 - }, - { - "epoch": 0.86, - "learning_rate": 1.6757919235514506e-06, - "loss": 0.9541, - "step": 33463 - }, - { - "epoch": 0.86, - "learning_rate": 1.6757715276101577e-06, - "loss": 0.8623, - "step": 33464 - }, - { - "epoch": 0.86, - "learning_rate": 1.6757511311514575e-06, - "loss": 0.8184, - "step": 33465 - }, - { - "epoch": 0.86, - "learning_rate": 1.6757307341753659e-06, - "loss": 0.7969, - "step": 33466 - }, - { - "epoch": 0.86, - "learning_rate": 1.675710336681898e-06, - "loss": 0.9785, - "step": 33467 - }, - { - "epoch": 0.86, - "learning_rate": 1.6756899386710701e-06, - "loss": 0.8037, - "step": 33468 - }, - { - "epoch": 0.86, - "learning_rate": 1.6756695401428976e-06, - "loss": 0.8193, - "step": 33469 - }, - { - "epoch": 0.86, - "learning_rate": 1.6756491410973958e-06, - "loss": 0.8623, - "step": 33470 - }, - { - "epoch": 0.86, - "learning_rate": 1.6756287415345803e-06, - "loss": 0.6733, - "step": 33471 - }, - { - "epoch": 0.86, - "learning_rate": 1.6756083414544672e-06, - "loss": 0.9189, - "step": 33472 - }, - { - "epoch": 0.86, - "learning_rate": 1.675587940857072e-06, - "loss": 0.6123, - "step": 33473 - }, - { - "epoch": 0.86, - "learning_rate": 1.6755675397424097e-06, - "loss": 0.9268, - "step": 33474 - }, - { - "epoch": 0.86, - "learning_rate": 1.6755471381104971e-06, - "loss": 0.8398, - "step": 33475 - }, - { - "epoch": 0.86, - "learning_rate": 1.6755267359613485e-06, - "loss": 0.6865, - "step": 33476 - }, - { - "epoch": 0.86, - "learning_rate": 1.6755063332949804e-06, - "loss": 1.0703, - "step": 33477 - }, - { - "epoch": 0.86, - "learning_rate": 1.675485930111408e-06, - "loss": 0.7715, - "step": 33478 - }, - { - "epoch": 0.86, - "learning_rate": 1.6754655264106475e-06, - "loss": 0.7202, - "step": 33479 - }, - { - "epoch": 0.86, - "learning_rate": 1.6754451221927136e-06, - "loss": 0.7148, - "step": 33480 - }, - { - "epoch": 0.86, - "learning_rate": 1.6754247174576225e-06, - "loss": 0.8857, - "step": 33481 - }, - { - "epoch": 0.86, - "learning_rate": 1.6754043122053903e-06, - "loss": 0.8428, - "step": 33482 - }, - { - "epoch": 0.86, - "learning_rate": 1.6753839064360315e-06, - "loss": 0.8291, - "step": 33483 - }, - { - "epoch": 0.86, - "learning_rate": 1.6753635001495625e-06, - "loss": 0.9326, - "step": 33484 - }, - { - "epoch": 0.86, - "learning_rate": 1.6753430933459986e-06, - "loss": 1.1074, - "step": 33485 - }, - { - "epoch": 0.86, - "learning_rate": 1.6753226860253557e-06, - "loss": 0.8115, - "step": 33486 - }, - { - "epoch": 0.86, - "learning_rate": 1.6753022781876492e-06, - "loss": 0.793, - "step": 33487 - }, - { - "epoch": 0.86, - "learning_rate": 1.6752818698328948e-06, - "loss": 0.8457, - "step": 33488 - }, - { - "epoch": 0.86, - "learning_rate": 1.6752614609611082e-06, - "loss": 0.8154, - "step": 33489 - }, - { - "epoch": 0.86, - "learning_rate": 1.6752410515723048e-06, - "loss": 0.7715, - "step": 33490 - }, - { - "epoch": 0.86, - "learning_rate": 1.6752206416665005e-06, - "loss": 0.5874, - "step": 33491 - }, - { - "epoch": 0.86, - "learning_rate": 1.6752002312437106e-06, - "loss": 0.5474, - "step": 33492 - }, - { - "epoch": 0.86, - "learning_rate": 1.6751798203039511e-06, - "loss": 0.4722, - "step": 33493 - }, - { - "epoch": 0.86, - "learning_rate": 1.6751594088472377e-06, - "loss": 0.8633, - "step": 33494 - }, - { - "epoch": 0.86, - "learning_rate": 1.6751389968735854e-06, - "loss": 0.7891, - "step": 33495 - }, - { - "epoch": 0.86, - "learning_rate": 1.6751185843830102e-06, - "loss": 0.8311, - "step": 33496 - }, - { - "epoch": 0.86, - "learning_rate": 1.675098171375528e-06, - "loss": 0.8374, - "step": 33497 - }, - { - "epoch": 0.86, - "learning_rate": 1.675077757851154e-06, - "loss": 0.8574, - "step": 33498 - }, - { - "epoch": 0.86, - "learning_rate": 1.6750573438099043e-06, - "loss": 0.8999, - "step": 33499 - }, - { - "epoch": 0.86, - "learning_rate": 1.6750369292517935e-06, - "loss": 0.8418, - "step": 33500 - }, - { - "epoch": 0.86, - "learning_rate": 1.6750165141768387e-06, - "loss": 0.9521, - "step": 33501 - }, - { - "epoch": 0.86, - "learning_rate": 1.6749960985850544e-06, - "loss": 0.6766, - "step": 33502 - }, - { - "epoch": 0.86, - "learning_rate": 1.674975682476457e-06, - "loss": 0.8789, - "step": 33503 - }, - { - "epoch": 0.86, - "learning_rate": 1.6749552658510615e-06, - "loss": 0.9287, - "step": 33504 - }, - { - "epoch": 0.86, - "learning_rate": 1.6749348487088838e-06, - "loss": 0.9141, - "step": 33505 - }, - { - "epoch": 0.86, - "learning_rate": 1.6749144310499394e-06, - "loss": 1.0781, - "step": 33506 - }, - { - "epoch": 0.86, - "learning_rate": 1.6748940128742444e-06, - "loss": 0.7676, - "step": 33507 - }, - { - "epoch": 0.86, - "learning_rate": 1.6748735941818137e-06, - "loss": 0.9209, - "step": 33508 - }, - { - "epoch": 0.86, - "learning_rate": 1.6748531749726636e-06, - "loss": 0.7344, - "step": 33509 - }, - { - "epoch": 0.86, - "learning_rate": 1.6748327552468093e-06, - "loss": 0.7588, - "step": 33510 - }, - { - "epoch": 0.86, - "learning_rate": 1.6748123350042667e-06, - "loss": 0.7998, - "step": 33511 - }, - { - "epoch": 0.86, - "learning_rate": 1.674791914245051e-06, - "loss": 0.8125, - "step": 33512 - }, - { - "epoch": 0.86, - "learning_rate": 1.6747714929691785e-06, - "loss": 0.6616, - "step": 33513 - }, - { - "epoch": 0.86, - "learning_rate": 1.6747510711766645e-06, - "loss": 0.9229, - "step": 33514 - }, - { - "epoch": 0.86, - "learning_rate": 1.6747306488675244e-06, - "loss": 0.8521, - "step": 33515 - }, - { - "epoch": 0.86, - "learning_rate": 1.6747102260417743e-06, - "loss": 0.918, - "step": 33516 - }, - { - "epoch": 0.86, - "learning_rate": 1.6746898026994293e-06, - "loss": 0.7686, - "step": 33517 - }, - { - "epoch": 0.86, - "learning_rate": 1.6746693788405058e-06, - "loss": 0.7197, - "step": 33518 - }, - { - "epoch": 0.86, - "learning_rate": 1.674648954465019e-06, - "loss": 0.7744, - "step": 33519 - }, - { - "epoch": 0.86, - "learning_rate": 1.6746285295729838e-06, - "loss": 0.9414, - "step": 33520 - }, - { - "epoch": 0.86, - "learning_rate": 1.6746081041644171e-06, - "loss": 0.9219, - "step": 33521 - }, - { - "epoch": 0.86, - "learning_rate": 1.6745876782393338e-06, - "loss": 1.0752, - "step": 33522 - }, - { - "epoch": 0.86, - "learning_rate": 1.67456725179775e-06, - "loss": 0.9727, - "step": 33523 - }, - { - "epoch": 0.86, - "learning_rate": 1.6745468248396807e-06, - "loss": 0.8662, - "step": 33524 - }, - { - "epoch": 0.86, - "learning_rate": 1.6745263973651423e-06, - "loss": 0.7534, - "step": 33525 - }, - { - "epoch": 0.86, - "learning_rate": 1.6745059693741499e-06, - "loss": 0.834, - "step": 33526 - }, - { - "epoch": 0.86, - "learning_rate": 1.6744855408667191e-06, - "loss": 0.8604, - "step": 33527 - }, - { - "epoch": 0.86, - "learning_rate": 1.6744651118428662e-06, - "loss": 0.7637, - "step": 33528 - }, - { - "epoch": 0.86, - "learning_rate": 1.6744446823026062e-06, - "loss": 0.8975, - "step": 33529 - }, - { - "epoch": 0.86, - "learning_rate": 1.6744242522459543e-06, - "loss": 0.8613, - "step": 33530 - }, - { - "epoch": 0.86, - "learning_rate": 1.6744038216729274e-06, - "loss": 1.0049, - "step": 33531 - }, - { - "epoch": 0.86, - "learning_rate": 1.6743833905835404e-06, - "loss": 1.042, - "step": 33532 - }, - { - "epoch": 0.86, - "learning_rate": 1.674362958977809e-06, - "loss": 0.7812, - "step": 33533 - }, - { - "epoch": 0.86, - "learning_rate": 1.674342526855749e-06, - "loss": 0.8555, - "step": 33534 - }, - { - "epoch": 0.86, - "learning_rate": 1.6743220942173757e-06, - "loss": 0.8042, - "step": 33535 - }, - { - "epoch": 0.86, - "learning_rate": 1.6743016610627052e-06, - "loss": 0.915, - "step": 33536 - }, - { - "epoch": 0.86, - "learning_rate": 1.6742812273917527e-06, - "loss": 0.6133, - "step": 33537 - }, - { - "epoch": 0.86, - "learning_rate": 1.6742607932045343e-06, - "loss": 0.6862, - "step": 33538 - }, - { - "epoch": 0.86, - "learning_rate": 1.6742403585010654e-06, - "loss": 0.7766, - "step": 33539 - }, - { - "epoch": 0.86, - "learning_rate": 1.6742199232813614e-06, - "loss": 0.9561, - "step": 33540 - }, - { - "epoch": 0.86, - "learning_rate": 1.6741994875454383e-06, - "loss": 0.8325, - "step": 33541 - }, - { - "epoch": 0.86, - "learning_rate": 1.6741790512933118e-06, - "loss": 0.6388, - "step": 33542 - }, - { - "epoch": 0.86, - "learning_rate": 1.6741586145249976e-06, - "loss": 0.916, - "step": 33543 - }, - { - "epoch": 0.86, - "learning_rate": 1.6741381772405109e-06, - "loss": 0.8252, - "step": 33544 - }, - { - "epoch": 0.86, - "learning_rate": 1.6741177394398672e-06, - "loss": 0.8047, - "step": 33545 - }, - { - "epoch": 0.86, - "learning_rate": 1.674097301123083e-06, - "loss": 0.8193, - "step": 33546 - }, - { - "epoch": 0.86, - "learning_rate": 1.6740768622901735e-06, - "loss": 0.8535, - "step": 33547 - }, - { - "epoch": 0.86, - "learning_rate": 1.6740564229411543e-06, - "loss": 0.6626, - "step": 33548 - }, - { - "epoch": 0.86, - "learning_rate": 1.674035983076041e-06, - "loss": 1.2129, - "step": 33549 - }, - { - "epoch": 0.86, - "learning_rate": 1.6740155426948495e-06, - "loss": 0.7812, - "step": 33550 - }, - { - "epoch": 0.86, - "learning_rate": 1.6739951017975951e-06, - "loss": 0.9883, - "step": 33551 - }, - { - "epoch": 0.86, - "learning_rate": 1.6739746603842937e-06, - "loss": 0.9941, - "step": 33552 - }, - { - "epoch": 0.86, - "learning_rate": 1.6739542184549608e-06, - "loss": 0.8604, - "step": 33553 - }, - { - "epoch": 0.86, - "learning_rate": 1.6739337760096124e-06, - "loss": 0.8682, - "step": 33554 - }, - { - "epoch": 0.86, - "learning_rate": 1.6739133330482637e-06, - "loss": 0.8311, - "step": 33555 - }, - { - "epoch": 0.86, - "learning_rate": 1.6738928895709306e-06, - "loss": 0.8877, - "step": 33556 - }, - { - "epoch": 0.86, - "learning_rate": 1.6738724455776287e-06, - "loss": 0.835, - "step": 33557 - }, - { - "epoch": 0.86, - "learning_rate": 1.6738520010683738e-06, - "loss": 0.9238, - "step": 33558 - }, - { - "epoch": 0.86, - "learning_rate": 1.673831556043181e-06, - "loss": 0.8105, - "step": 33559 - }, - { - "epoch": 0.86, - "learning_rate": 1.6738111105020667e-06, - "loss": 0.7007, - "step": 33560 - }, - { - "epoch": 0.86, - "learning_rate": 1.6737906644450461e-06, - "loss": 0.8174, - "step": 33561 - }, - { - "epoch": 0.86, - "learning_rate": 1.6737702178721352e-06, - "loss": 1.0771, - "step": 33562 - }, - { - "epoch": 0.86, - "learning_rate": 1.6737497707833493e-06, - "loss": 0.8594, - "step": 33563 - }, - { - "epoch": 0.86, - "learning_rate": 1.673729323178704e-06, - "loss": 1.1504, - "step": 33564 - }, - { - "epoch": 0.86, - "learning_rate": 1.6737088750582152e-06, - "loss": 0.8813, - "step": 33565 - }, - { - "epoch": 0.86, - "learning_rate": 1.6736884264218985e-06, - "loss": 0.7053, - "step": 33566 - }, - { - "epoch": 0.86, - "learning_rate": 1.6736679772697696e-06, - "loss": 0.751, - "step": 33567 - }, - { - "epoch": 0.86, - "learning_rate": 1.6736475276018443e-06, - "loss": 0.918, - "step": 33568 - }, - { - "epoch": 0.86, - "learning_rate": 1.6736270774181378e-06, - "loss": 1.0, - "step": 33569 - }, - { - "epoch": 0.86, - "learning_rate": 1.6736066267186662e-06, - "loss": 0.6814, - "step": 33570 - }, - { - "epoch": 0.86, - "learning_rate": 1.6735861755034447e-06, - "loss": 0.8506, - "step": 33571 - }, - { - "epoch": 0.86, - "learning_rate": 1.6735657237724894e-06, - "loss": 0.8311, - "step": 33572 - }, - { - "epoch": 0.86, - "learning_rate": 1.6735452715258158e-06, - "loss": 0.565, - "step": 33573 - }, - { - "epoch": 0.86, - "learning_rate": 1.6735248187634397e-06, - "loss": 0.9463, - "step": 33574 - }, - { - "epoch": 0.86, - "learning_rate": 1.6735043654853764e-06, - "loss": 0.6903, - "step": 33575 - }, - { - "epoch": 0.86, - "learning_rate": 1.6734839116916417e-06, - "loss": 0.8809, - "step": 33576 - }, - { - "epoch": 0.86, - "learning_rate": 1.6734634573822514e-06, - "loss": 0.8496, - "step": 33577 - }, - { - "epoch": 0.86, - "learning_rate": 1.6734430025572213e-06, - "loss": 0.959, - "step": 33578 - }, - { - "epoch": 0.86, - "learning_rate": 1.6734225472165665e-06, - "loss": 0.8945, - "step": 33579 - }, - { - "epoch": 0.86, - "learning_rate": 1.6734020913603035e-06, - "loss": 0.8125, - "step": 33580 - }, - { - "epoch": 0.86, - "learning_rate": 1.673381634988447e-06, - "loss": 0.7466, - "step": 33581 - }, - { - "epoch": 0.86, - "learning_rate": 1.6733611781010135e-06, - "loss": 0.8711, - "step": 33582 - }, - { - "epoch": 0.86, - "learning_rate": 1.673340720698018e-06, - "loss": 0.8936, - "step": 33583 - }, - { - "epoch": 0.86, - "learning_rate": 1.673320262779477e-06, - "loss": 0.8008, - "step": 33584 - }, - { - "epoch": 0.86, - "learning_rate": 1.6732998043454053e-06, - "loss": 0.6743, - "step": 33585 - }, - { - "epoch": 0.86, - "learning_rate": 1.6732793453958188e-06, - "loss": 1.0273, - "step": 33586 - }, - { - "epoch": 0.86, - "learning_rate": 1.6732588859307333e-06, - "loss": 0.8896, - "step": 33587 - }, - { - "epoch": 0.86, - "learning_rate": 1.6732384259501646e-06, - "loss": 0.7021, - "step": 33588 - }, - { - "epoch": 0.86, - "learning_rate": 1.673217965454128e-06, - "loss": 0.8955, - "step": 33589 - }, - { - "epoch": 0.86, - "learning_rate": 1.6731975044426395e-06, - "loss": 0.6929, - "step": 33590 - }, - { - "epoch": 0.86, - "learning_rate": 1.6731770429157145e-06, - "loss": 0.9639, - "step": 33591 - }, - { - "epoch": 0.86, - "learning_rate": 1.673156580873369e-06, - "loss": 0.9541, - "step": 33592 - }, - { - "epoch": 0.86, - "learning_rate": 1.6731361183156183e-06, - "loss": 0.8286, - "step": 33593 - }, - { - "epoch": 0.86, - "learning_rate": 1.673115655242478e-06, - "loss": 0.7393, - "step": 33594 - }, - { - "epoch": 0.86, - "learning_rate": 1.6730951916539644e-06, - "loss": 0.8115, - "step": 33595 - }, - { - "epoch": 0.86, - "learning_rate": 1.6730747275500927e-06, - "loss": 0.6504, - "step": 33596 - }, - { - "epoch": 0.86, - "learning_rate": 1.6730542629308784e-06, - "loss": 0.8945, - "step": 33597 - }, - { - "epoch": 0.86, - "learning_rate": 1.6730337977963376e-06, - "loss": 0.9736, - "step": 33598 - }, - { - "epoch": 0.86, - "learning_rate": 1.6730133321464857e-06, - "loss": 1.0479, - "step": 33599 - }, - { - "epoch": 0.86, - "learning_rate": 1.6729928659813385e-06, - "loss": 0.8643, - "step": 33600 - }, - { - "epoch": 0.86, - "learning_rate": 1.6729723993009115e-06, - "loss": 0.835, - "step": 33601 - }, - { - "epoch": 0.86, - "learning_rate": 1.6729519321052204e-06, - "loss": 0.5422, - "step": 33602 - }, - { - "epoch": 0.86, - "learning_rate": 1.672931464394281e-06, - "loss": 0.7734, - "step": 33603 - }, - { - "epoch": 0.86, - "learning_rate": 1.6729109961681091e-06, - "loss": 1.1172, - "step": 33604 - }, - { - "epoch": 0.86, - "learning_rate": 1.67289052742672e-06, - "loss": 0.9463, - "step": 33605 - }, - { - "epoch": 0.86, - "learning_rate": 1.6728700581701297e-06, - "loss": 0.6938, - "step": 33606 - }, - { - "epoch": 0.86, - "learning_rate": 1.6728495883983537e-06, - "loss": 0.9014, - "step": 33607 - }, - { - "epoch": 0.86, - "learning_rate": 1.6728291181114078e-06, - "loss": 0.8936, - "step": 33608 - }, - { - "epoch": 0.86, - "learning_rate": 1.6728086473093072e-06, - "loss": 0.8818, - "step": 33609 - }, - { - "epoch": 0.86, - "learning_rate": 1.6727881759920684e-06, - "loss": 0.8359, - "step": 33610 - }, - { - "epoch": 0.86, - "learning_rate": 1.6727677041597064e-06, - "loss": 0.636, - "step": 33611 - }, - { - "epoch": 0.86, - "learning_rate": 1.672747231812237e-06, - "loss": 0.79, - "step": 33612 - }, - { - "epoch": 0.86, - "learning_rate": 1.6727267589496764e-06, - "loss": 0.8604, - "step": 33613 - }, - { - "epoch": 0.86, - "learning_rate": 1.6727062855720396e-06, - "loss": 0.7842, - "step": 33614 - }, - { - "epoch": 0.86, - "learning_rate": 1.6726858116793422e-06, - "loss": 0.6167, - "step": 33615 - }, - { - "epoch": 0.86, - "learning_rate": 1.6726653372716007e-06, - "loss": 0.9092, - "step": 33616 - }, - { - "epoch": 0.86, - "learning_rate": 1.67264486234883e-06, - "loss": 0.9707, - "step": 33617 - }, - { - "epoch": 0.86, - "learning_rate": 1.6726243869110464e-06, - "loss": 0.8604, - "step": 33618 - }, - { - "epoch": 0.86, - "learning_rate": 1.6726039109582648e-06, - "loss": 0.7773, - "step": 33619 - }, - { - "epoch": 0.86, - "learning_rate": 1.6725834344905017e-06, - "loss": 0.9111, - "step": 33620 - }, - { - "epoch": 0.86, - "learning_rate": 1.672562957507772e-06, - "loss": 0.9482, - "step": 33621 - }, - { - "epoch": 0.86, - "learning_rate": 1.672542480010092e-06, - "loss": 0.8105, - "step": 33622 - }, - { - "epoch": 0.86, - "learning_rate": 1.672522001997477e-06, - "loss": 0.7139, - "step": 33623 - }, - { - "epoch": 0.86, - "learning_rate": 1.672501523469943e-06, - "loss": 0.8584, - "step": 33624 - }, - { - "epoch": 0.86, - "learning_rate": 1.6724810444275055e-06, - "loss": 0.6855, - "step": 33625 - }, - { - "epoch": 0.86, - "learning_rate": 1.6724605648701802e-06, - "loss": 0.7969, - "step": 33626 - }, - { - "epoch": 0.86, - "learning_rate": 1.6724400847979828e-06, - "loss": 0.9199, - "step": 33627 - }, - { - "epoch": 0.86, - "learning_rate": 1.6724196042109286e-06, - "loss": 0.7871, - "step": 33628 - }, - { - "epoch": 0.86, - "learning_rate": 1.672399123109034e-06, - "loss": 0.5742, - "step": 33629 - }, - { - "epoch": 0.86, - "learning_rate": 1.672378641492314e-06, - "loss": 0.8262, - "step": 33630 - }, - { - "epoch": 0.86, - "learning_rate": 1.672358159360785e-06, - "loss": 0.7588, - "step": 33631 - }, - { - "epoch": 0.86, - "learning_rate": 1.6723376767144619e-06, - "loss": 0.8447, - "step": 33632 - }, - { - "epoch": 0.86, - "learning_rate": 1.672317193553361e-06, - "loss": 0.6621, - "step": 33633 - }, - { - "epoch": 0.86, - "learning_rate": 1.6722967098774976e-06, - "loss": 0.9209, - "step": 33634 - }, - { - "epoch": 0.86, - "learning_rate": 1.6722762256868875e-06, - "loss": 0.791, - "step": 33635 - }, - { - "epoch": 0.86, - "learning_rate": 1.6722557409815465e-06, - "loss": 0.9678, - "step": 33636 - }, - { - "epoch": 0.86, - "learning_rate": 1.67223525576149e-06, - "loss": 0.918, - "step": 33637 - }, - { - "epoch": 0.86, - "learning_rate": 1.6722147700267341e-06, - "loss": 0.7017, - "step": 33638 - }, - { - "epoch": 0.86, - "learning_rate": 1.6721942837772941e-06, - "loss": 0.7935, - "step": 33639 - }, - { - "epoch": 0.86, - "learning_rate": 1.672173797013186e-06, - "loss": 0.8774, - "step": 33640 - }, - { - "epoch": 0.86, - "learning_rate": 1.6721533097344254e-06, - "loss": 0.8369, - "step": 33641 - }, - { - "epoch": 0.86, - "learning_rate": 1.6721328219410276e-06, - "loss": 0.6992, - "step": 33642 - }, - { - "epoch": 0.86, - "learning_rate": 1.672112333633009e-06, - "loss": 0.875, - "step": 33643 - }, - { - "epoch": 0.86, - "learning_rate": 1.6720918448103847e-06, - "loss": 0.8213, - "step": 33644 - }, - { - "epoch": 0.86, - "learning_rate": 1.6720713554731704e-06, - "loss": 0.8818, - "step": 33645 - }, - { - "epoch": 0.86, - "learning_rate": 1.6720508656213821e-06, - "loss": 0.8574, - "step": 33646 - }, - { - "epoch": 0.86, - "learning_rate": 1.6720303752550353e-06, - "loss": 1.0352, - "step": 33647 - }, - { - "epoch": 0.86, - "learning_rate": 1.672009884374146e-06, - "loss": 1.0029, - "step": 33648 - }, - { - "epoch": 0.86, - "learning_rate": 1.6719893929787295e-06, - "loss": 0.6704, - "step": 33649 - }, - { - "epoch": 0.86, - "learning_rate": 1.6719689010688013e-06, - "loss": 0.7422, - "step": 33650 - }, - { - "epoch": 0.86, - "learning_rate": 1.6719484086443779e-06, - "loss": 0.9766, - "step": 33651 - }, - { - "epoch": 0.86, - "learning_rate": 1.6719279157054742e-06, - "loss": 1.1641, - "step": 33652 - }, - { - "epoch": 0.86, - "learning_rate": 1.6719074222521065e-06, - "loss": 0.7783, - "step": 33653 - }, - { - "epoch": 0.86, - "learning_rate": 1.6718869282842897e-06, - "loss": 0.958, - "step": 33654 - }, - { - "epoch": 0.86, - "learning_rate": 1.6718664338020404e-06, - "loss": 0.9287, - "step": 33655 - }, - { - "epoch": 0.86, - "learning_rate": 1.6718459388053736e-06, - "loss": 0.9893, - "step": 33656 - }, - { - "epoch": 0.86, - "learning_rate": 1.6718254432943053e-06, - "loss": 0.8291, - "step": 33657 - }, - { - "epoch": 0.86, - "learning_rate": 1.6718049472688513e-06, - "loss": 0.6533, - "step": 33658 - }, - { - "epoch": 0.86, - "learning_rate": 1.671784450729027e-06, - "loss": 0.6348, - "step": 33659 - }, - { - "epoch": 0.86, - "learning_rate": 1.6717639536748483e-06, - "loss": 0.9531, - "step": 33660 - }, - { - "epoch": 0.86, - "learning_rate": 1.671743456106331e-06, - "loss": 0.832, - "step": 33661 - }, - { - "epoch": 0.86, - "learning_rate": 1.6717229580234902e-06, - "loss": 0.7559, - "step": 33662 - }, - { - "epoch": 0.86, - "learning_rate": 1.6717024594263425e-06, - "loss": 0.8789, - "step": 33663 - }, - { - "epoch": 0.86, - "learning_rate": 1.6716819603149025e-06, - "loss": 0.9424, - "step": 33664 - }, - { - "epoch": 0.86, - "learning_rate": 1.671661460689187e-06, - "loss": 1.0264, - "step": 33665 - }, - { - "epoch": 0.86, - "learning_rate": 1.6716409605492112e-06, - "loss": 0.9893, - "step": 33666 - }, - { - "epoch": 0.86, - "learning_rate": 1.6716204598949905e-06, - "loss": 0.876, - "step": 33667 - }, - { - "epoch": 0.86, - "learning_rate": 1.6715999587265413e-06, - "loss": 0.5815, - "step": 33668 - }, - { - "epoch": 0.86, - "learning_rate": 1.6715794570438786e-06, - "loss": 0.8643, - "step": 33669 - }, - { - "epoch": 0.86, - "learning_rate": 1.6715589548470183e-06, - "loss": 0.8779, - "step": 33670 - }, - { - "epoch": 0.86, - "learning_rate": 1.6715384521359765e-06, - "loss": 0.9541, - "step": 33671 - }, - { - "epoch": 0.86, - "learning_rate": 1.6715179489107683e-06, - "loss": 1.0352, - "step": 33672 - }, - { - "epoch": 0.86, - "learning_rate": 1.67149744517141e-06, - "loss": 0.7578, - "step": 33673 - }, - { - "epoch": 0.86, - "learning_rate": 1.6714769409179165e-06, - "loss": 0.7666, - "step": 33674 - }, - { - "epoch": 0.86, - "learning_rate": 1.6714564361503043e-06, - "loss": 0.7949, - "step": 33675 - }, - { - "epoch": 0.86, - "learning_rate": 1.6714359308685888e-06, - "loss": 0.9482, - "step": 33676 - }, - { - "epoch": 0.86, - "learning_rate": 1.6714154250727855e-06, - "loss": 0.689, - "step": 33677 - }, - { - "epoch": 0.86, - "learning_rate": 1.6713949187629107e-06, - "loss": 0.8604, - "step": 33678 - }, - { - "epoch": 0.86, - "learning_rate": 1.6713744119389795e-06, - "loss": 0.9092, - "step": 33679 - }, - { - "epoch": 0.86, - "learning_rate": 1.6713539046010074e-06, - "loss": 0.9805, - "step": 33680 - }, - { - "epoch": 0.86, - "learning_rate": 1.6713333967490107e-06, - "loss": 0.8511, - "step": 33681 - }, - { - "epoch": 0.86, - "learning_rate": 1.671312888383005e-06, - "loss": 0.8398, - "step": 33682 - }, - { - "epoch": 0.86, - "learning_rate": 1.671292379503006e-06, - "loss": 0.8828, - "step": 33683 - }, - { - "epoch": 0.86, - "learning_rate": 1.6712718701090293e-06, - "loss": 0.79, - "step": 33684 - }, - { - "epoch": 0.86, - "learning_rate": 1.67125136020109e-06, - "loss": 0.8867, - "step": 33685 - }, - { - "epoch": 0.86, - "learning_rate": 1.6712308497792049e-06, - "loss": 1.0195, - "step": 33686 - }, - { - "epoch": 0.86, - "learning_rate": 1.6712103388433892e-06, - "loss": 0.8438, - "step": 33687 - }, - { - "epoch": 0.86, - "learning_rate": 1.6711898273936586e-06, - "loss": 0.835, - "step": 33688 - }, - { - "epoch": 0.86, - "learning_rate": 1.6711693154300286e-06, - "loss": 0.9277, - "step": 33689 - }, - { - "epoch": 0.86, - "learning_rate": 1.6711488029525154e-06, - "loss": 0.5605, - "step": 33690 - }, - { - "epoch": 0.86, - "learning_rate": 1.671128289961134e-06, - "loss": 0.9229, - "step": 33691 - }, - { - "epoch": 0.86, - "learning_rate": 1.6711077764559009e-06, - "loss": 0.8369, - "step": 33692 - }, - { - "epoch": 0.86, - "learning_rate": 1.6710872624368316e-06, - "loss": 0.8701, - "step": 33693 - }, - { - "epoch": 0.86, - "learning_rate": 1.6710667479039412e-06, - "loss": 1.0156, - "step": 33694 - }, - { - "epoch": 0.86, - "learning_rate": 1.671046232857246e-06, - "loss": 0.9004, - "step": 33695 - }, - { - "epoch": 0.86, - "learning_rate": 1.6710257172967616e-06, - "loss": 0.8213, - "step": 33696 - }, - { - "epoch": 0.86, - "learning_rate": 1.6710052012225036e-06, - "loss": 0.9277, - "step": 33697 - }, - { - "epoch": 0.86, - "learning_rate": 1.670984684634488e-06, - "loss": 0.8857, - "step": 33698 - }, - { - "epoch": 0.86, - "learning_rate": 1.67096416753273e-06, - "loss": 0.7559, - "step": 33699 - }, - { - "epoch": 0.86, - "learning_rate": 1.6709436499172458e-06, - "loss": 0.8164, - "step": 33700 - }, - { - "epoch": 0.86, - "learning_rate": 1.6709231317880508e-06, - "loss": 0.9531, - "step": 33701 - }, - { - "epoch": 0.86, - "learning_rate": 1.6709026131451607e-06, - "loss": 0.8804, - "step": 33702 - }, - { - "epoch": 0.86, - "learning_rate": 1.6708820939885918e-06, - "loss": 1.0303, - "step": 33703 - }, - { - "epoch": 0.86, - "learning_rate": 1.6708615743183585e-06, - "loss": 0.8232, - "step": 33704 - }, - { - "epoch": 0.86, - "learning_rate": 1.670841054134478e-06, - "loss": 0.9111, - "step": 33705 - }, - { - "epoch": 0.86, - "learning_rate": 1.6708205334369652e-06, - "loss": 1.1113, - "step": 33706 - }, - { - "epoch": 0.86, - "learning_rate": 1.6708000122258357e-06, - "loss": 0.6646, - "step": 33707 - }, - { - "epoch": 0.86, - "learning_rate": 1.6707794905011058e-06, - "loss": 0.812, - "step": 33708 - }, - { - "epoch": 0.86, - "learning_rate": 1.6707589682627907e-06, - "loss": 0.3755, - "step": 33709 - }, - { - "epoch": 0.86, - "learning_rate": 1.6707384455109063e-06, - "loss": 0.8438, - "step": 33710 - }, - { - "epoch": 0.86, - "learning_rate": 1.6707179222454684e-06, - "loss": 1.0342, - "step": 33711 - }, - { - "epoch": 0.86, - "learning_rate": 1.6706973984664926e-06, - "loss": 1.0049, - "step": 33712 - }, - { - "epoch": 0.86, - "learning_rate": 1.6706768741739947e-06, - "loss": 0.8315, - "step": 33713 - }, - { - "epoch": 0.86, - "learning_rate": 1.6706563493679902e-06, - "loss": 0.8945, - "step": 33714 - }, - { - "epoch": 0.86, - "learning_rate": 1.670635824048495e-06, - "loss": 0.9961, - "step": 33715 - }, - { - "epoch": 0.86, - "learning_rate": 1.6706152982155247e-06, - "loss": 0.9971, - "step": 33716 - }, - { - "epoch": 0.86, - "learning_rate": 1.6705947718690955e-06, - "loss": 0.9697, - "step": 33717 - }, - { - "epoch": 0.86, - "learning_rate": 1.6705742450092225e-06, - "loss": 0.9092, - "step": 33718 - }, - { - "epoch": 0.86, - "learning_rate": 1.6705537176359217e-06, - "loss": 0.7539, - "step": 33719 - }, - { - "epoch": 0.86, - "learning_rate": 1.6705331897492086e-06, - "loss": 0.6257, - "step": 33720 - }, - { - "epoch": 0.86, - "learning_rate": 1.670512661349099e-06, - "loss": 0.9531, - "step": 33721 - }, - { - "epoch": 0.86, - "learning_rate": 1.670492132435609e-06, - "loss": 0.7207, - "step": 33722 - }, - { - "epoch": 0.86, - "learning_rate": 1.6704716030087538e-06, - "loss": 0.6108, - "step": 33723 - }, - { - "epoch": 0.86, - "learning_rate": 1.6704510730685493e-06, - "loss": 0.6836, - "step": 33724 - }, - { - "epoch": 0.86, - "learning_rate": 1.670430542615011e-06, - "loss": 0.8818, - "step": 33725 - }, - { - "epoch": 0.86, - "learning_rate": 1.6704100116481552e-06, - "loss": 0.6943, - "step": 33726 - }, - { - "epoch": 0.86, - "learning_rate": 1.6703894801679974e-06, - "loss": 1.0615, - "step": 33727 - }, - { - "epoch": 0.86, - "learning_rate": 1.670368948174553e-06, - "loss": 0.8408, - "step": 33728 - }, - { - "epoch": 0.86, - "learning_rate": 1.670348415667838e-06, - "loss": 0.9209, - "step": 33729 - }, - { - "epoch": 0.86, - "learning_rate": 1.670327882647868e-06, - "loss": 0.7065, - "step": 33730 - }, - { - "epoch": 0.86, - "learning_rate": 1.6703073491146586e-06, - "loss": 0.9385, - "step": 33731 - }, - { - "epoch": 0.86, - "learning_rate": 1.6702868150682258e-06, - "loss": 0.7939, - "step": 33732 - }, - { - "epoch": 0.86, - "learning_rate": 1.6702662805085855e-06, - "loss": 0.9219, - "step": 33733 - }, - { - "epoch": 0.86, - "learning_rate": 1.6702457454357529e-06, - "loss": 0.8975, - "step": 33734 - }, - { - "epoch": 0.86, - "learning_rate": 1.6702252098497439e-06, - "loss": 0.9326, - "step": 33735 - }, - { - "epoch": 0.86, - "learning_rate": 1.6702046737505741e-06, - "loss": 0.9453, - "step": 33736 - }, - { - "epoch": 0.86, - "learning_rate": 1.6701841371382598e-06, - "loss": 0.7603, - "step": 33737 - }, - { - "epoch": 0.86, - "learning_rate": 1.6701636000128158e-06, - "loss": 0.6826, - "step": 33738 - }, - { - "epoch": 0.86, - "learning_rate": 1.670143062374259e-06, - "loss": 0.6948, - "step": 33739 - }, - { - "epoch": 0.86, - "learning_rate": 1.670122524222604e-06, - "loss": 0.5615, - "step": 33740 - }, - { - "epoch": 0.86, - "learning_rate": 1.6701019855578671e-06, - "loss": 0.7852, - "step": 33741 - }, - { - "epoch": 0.86, - "learning_rate": 1.6700814463800638e-06, - "loss": 0.8604, - "step": 33742 - }, - { - "epoch": 0.86, - "learning_rate": 1.6700609066892101e-06, - "loss": 0.9092, - "step": 33743 - }, - { - "epoch": 0.86, - "learning_rate": 1.6700403664853217e-06, - "loss": 0.7285, - "step": 33744 - }, - { - "epoch": 0.86, - "learning_rate": 1.6700198257684142e-06, - "loss": 0.8071, - "step": 33745 - }, - { - "epoch": 0.86, - "learning_rate": 1.6699992845385032e-06, - "loss": 0.7227, - "step": 33746 - }, - { - "epoch": 0.86, - "learning_rate": 1.6699787427956046e-06, - "loss": 0.6128, - "step": 33747 - }, - { - "epoch": 0.86, - "learning_rate": 1.669958200539734e-06, - "loss": 0.8262, - "step": 33748 - }, - { - "epoch": 0.87, - "learning_rate": 1.6699376577709071e-06, - "loss": 0.9014, - "step": 33749 - }, - { - "epoch": 0.87, - "learning_rate": 1.66991711448914e-06, - "loss": 0.8105, - "step": 33750 - }, - { - "epoch": 0.87, - "learning_rate": 1.6698965706944482e-06, - "loss": 0.8096, - "step": 33751 - }, - { - "epoch": 0.87, - "learning_rate": 1.6698760263868469e-06, - "loss": 1.0361, - "step": 33752 - }, - { - "epoch": 0.87, - "learning_rate": 1.669855481566353e-06, - "loss": 0.999, - "step": 33753 - }, - { - "epoch": 0.87, - "learning_rate": 1.669834936232981e-06, - "loss": 0.8389, - "step": 33754 - }, - { - "epoch": 0.87, - "learning_rate": 1.6698143903867474e-06, - "loss": 1.0508, - "step": 33755 - }, - { - "epoch": 0.87, - "learning_rate": 1.669793844027668e-06, - "loss": 0.9609, - "step": 33756 - }, - { - "epoch": 0.87, - "learning_rate": 1.6697732971557578e-06, - "loss": 0.8242, - "step": 33757 - }, - { - "epoch": 0.87, - "learning_rate": 1.6697527497710332e-06, - "loss": 0.6426, - "step": 33758 - }, - { - "epoch": 0.87, - "learning_rate": 1.6697322018735098e-06, - "loss": 0.9434, - "step": 33759 - }, - { - "epoch": 0.87, - "learning_rate": 1.669711653463203e-06, - "loss": 0.6416, - "step": 33760 - }, - { - "epoch": 0.87, - "learning_rate": 1.6696911045401292e-06, - "loss": 0.8926, - "step": 33761 - }, - { - "epoch": 0.87, - "learning_rate": 1.6696705551043033e-06, - "loss": 0.728, - "step": 33762 - }, - { - "epoch": 0.87, - "learning_rate": 1.6696500051557417e-06, - "loss": 0.8154, - "step": 33763 - }, - { - "epoch": 0.87, - "learning_rate": 1.6696294546944598e-06, - "loss": 0.9795, - "step": 33764 - }, - { - "epoch": 0.87, - "learning_rate": 1.6696089037204732e-06, - "loss": 0.7734, - "step": 33765 - }, - { - "epoch": 0.87, - "learning_rate": 1.6695883522337982e-06, - "loss": 0.7241, - "step": 33766 - }, - { - "epoch": 0.87, - "learning_rate": 1.66956780023445e-06, - "loss": 0.6963, - "step": 33767 - }, - { - "epoch": 0.87, - "learning_rate": 1.6695472477224446e-06, - "loss": 0.9775, - "step": 33768 - }, - { - "epoch": 0.87, - "learning_rate": 1.6695266946977977e-06, - "loss": 0.8975, - "step": 33769 - }, - { - "epoch": 0.87, - "learning_rate": 1.6695061411605246e-06, - "loss": 0.8633, - "step": 33770 - }, - { - "epoch": 0.87, - "learning_rate": 1.669485587110642e-06, - "loss": 0.6726, - "step": 33771 - }, - { - "epoch": 0.87, - "learning_rate": 1.6694650325481646e-06, - "loss": 0.791, - "step": 33772 - }, - { - "epoch": 0.87, - "learning_rate": 1.669444477473109e-06, - "loss": 0.7256, - "step": 33773 - }, - { - "epoch": 0.87, - "learning_rate": 1.6694239218854905e-06, - "loss": 0.8159, - "step": 33774 - }, - { - "epoch": 0.87, - "learning_rate": 1.6694033657853246e-06, - "loss": 0.7339, - "step": 33775 - }, - { - "epoch": 0.87, - "learning_rate": 1.6693828091726275e-06, - "loss": 0.7124, - "step": 33776 - }, - { - "epoch": 0.87, - "learning_rate": 1.6693622520474147e-06, - "loss": 0.8174, - "step": 33777 - }, - { - "epoch": 0.87, - "learning_rate": 1.669341694409702e-06, - "loss": 0.7354, - "step": 33778 - }, - { - "epoch": 0.87, - "learning_rate": 1.6693211362595051e-06, - "loss": 0.9102, - "step": 33779 - }, - { - "epoch": 0.87, - "learning_rate": 1.6693005775968399e-06, - "loss": 0.8027, - "step": 33780 - }, - { - "epoch": 0.87, - "learning_rate": 1.669280018421722e-06, - "loss": 0.8379, - "step": 33781 - }, - { - "epoch": 0.87, - "learning_rate": 1.6692594587341672e-06, - "loss": 0.6938, - "step": 33782 - }, - { - "epoch": 0.87, - "learning_rate": 1.6692388985341912e-06, - "loss": 0.9902, - "step": 33783 - }, - { - "epoch": 0.87, - "learning_rate": 1.6692183378218098e-06, - "loss": 0.7773, - "step": 33784 - }, - { - "epoch": 0.87, - "learning_rate": 1.6691977765970384e-06, - "loss": 0.5803, - "step": 33785 - }, - { - "epoch": 0.87, - "learning_rate": 1.6691772148598932e-06, - "loss": 0.7715, - "step": 33786 - }, - { - "epoch": 0.87, - "learning_rate": 1.6691566526103897e-06, - "loss": 0.5513, - "step": 33787 - }, - { - "epoch": 0.87, - "learning_rate": 1.669136089848544e-06, - "loss": 0.8086, - "step": 33788 - }, - { - "epoch": 0.87, - "learning_rate": 1.6691155265743712e-06, - "loss": 0.7832, - "step": 33789 - }, - { - "epoch": 0.87, - "learning_rate": 1.6690949627878878e-06, - "loss": 0.9395, - "step": 33790 - }, - { - "epoch": 0.87, - "learning_rate": 1.669074398489109e-06, - "loss": 0.7339, - "step": 33791 - }, - { - "epoch": 0.87, - "learning_rate": 1.6690538336780505e-06, - "loss": 0.9902, - "step": 33792 - }, - { - "epoch": 0.87, - "learning_rate": 1.6690332683547283e-06, - "loss": 0.9082, - "step": 33793 - }, - { - "epoch": 0.87, - "learning_rate": 1.6690127025191583e-06, - "loss": 0.7734, - "step": 33794 - }, - { - "epoch": 0.87, - "learning_rate": 1.668992136171356e-06, - "loss": 1.0244, - "step": 33795 - }, - { - "epoch": 0.87, - "learning_rate": 1.668971569311337e-06, - "loss": 0.8408, - "step": 33796 - }, - { - "epoch": 0.87, - "learning_rate": 1.6689510019391173e-06, - "loss": 0.7803, - "step": 33797 - }, - { - "epoch": 0.87, - "learning_rate": 1.6689304340547127e-06, - "loss": 0.7944, - "step": 33798 - }, - { - "epoch": 0.87, - "learning_rate": 1.6689098656581386e-06, - "loss": 0.7148, - "step": 33799 - }, - { - "epoch": 0.87, - "learning_rate": 1.6688892967494113e-06, - "loss": 0.8359, - "step": 33800 - }, - { - "epoch": 0.87, - "learning_rate": 1.668868727328546e-06, - "loss": 0.9785, - "step": 33801 - }, - { - "epoch": 0.87, - "learning_rate": 1.6688481573955586e-06, - "loss": 0.959, - "step": 33802 - }, - { - "epoch": 0.87, - "learning_rate": 1.668827586950465e-06, - "loss": 0.6887, - "step": 33803 - }, - { - "epoch": 0.87, - "learning_rate": 1.668807015993281e-06, - "loss": 0.7109, - "step": 33804 - }, - { - "epoch": 0.87, - "learning_rate": 1.6687864445240218e-06, - "loss": 0.8252, - "step": 33805 - }, - { - "epoch": 0.87, - "learning_rate": 1.668765872542704e-06, - "loss": 0.626, - "step": 33806 - }, - { - "epoch": 0.87, - "learning_rate": 1.668745300049343e-06, - "loss": 0.5913, - "step": 33807 - }, - { - "epoch": 0.87, - "learning_rate": 1.6687247270439543e-06, - "loss": 0.9365, - "step": 33808 - }, - { - "epoch": 0.87, - "learning_rate": 1.6687041535265535e-06, - "loss": 0.7861, - "step": 33809 - }, - { - "epoch": 0.87, - "learning_rate": 1.668683579497157e-06, - "loss": 0.8877, - "step": 33810 - }, - { - "epoch": 0.87, - "learning_rate": 1.6686630049557802e-06, - "loss": 0.8291, - "step": 33811 - }, - { - "epoch": 0.87, - "learning_rate": 1.668642429902439e-06, - "loss": 0.9229, - "step": 33812 - }, - { - "epoch": 0.87, - "learning_rate": 1.6686218543371488e-06, - "loss": 0.8857, - "step": 33813 - }, - { - "epoch": 0.87, - "learning_rate": 1.668601278259926e-06, - "loss": 0.752, - "step": 33814 - }, - { - "epoch": 0.87, - "learning_rate": 1.6685807016707853e-06, - "loss": 0.6377, - "step": 33815 - }, - { - "epoch": 0.87, - "learning_rate": 1.6685601245697436e-06, - "loss": 0.8555, - "step": 33816 - }, - { - "epoch": 0.87, - "learning_rate": 1.668539546956816e-06, - "loss": 0.6631, - "step": 33817 - }, - { - "epoch": 0.87, - "learning_rate": 1.6685189688320186e-06, - "loss": 0.7354, - "step": 33818 - }, - { - "epoch": 0.87, - "learning_rate": 1.6684983901953667e-06, - "loss": 0.7764, - "step": 33819 - }, - { - "epoch": 0.87, - "learning_rate": 1.6684778110468764e-06, - "loss": 0.7715, - "step": 33820 - }, - { - "epoch": 0.87, - "learning_rate": 1.6684572313865634e-06, - "loss": 0.9219, - "step": 33821 - }, - { - "epoch": 0.87, - "learning_rate": 1.6684366512144434e-06, - "loss": 1.0596, - "step": 33822 - }, - { - "epoch": 0.87, - "learning_rate": 1.6684160705305321e-06, - "loss": 1.0381, - "step": 33823 - }, - { - "epoch": 0.87, - "learning_rate": 1.6683954893348457e-06, - "loss": 0.8975, - "step": 33824 - }, - { - "epoch": 0.87, - "learning_rate": 1.6683749076273991e-06, - "loss": 0.8574, - "step": 33825 - }, - { - "epoch": 0.87, - "learning_rate": 1.668354325408209e-06, - "loss": 0.8066, - "step": 33826 - }, - { - "epoch": 0.87, - "learning_rate": 1.6683337426772905e-06, - "loss": 0.7275, - "step": 33827 - }, - { - "epoch": 0.87, - "learning_rate": 1.6683131594346596e-06, - "loss": 0.7725, - "step": 33828 - }, - { - "epoch": 0.87, - "learning_rate": 1.668292575680332e-06, - "loss": 0.9004, - "step": 33829 - }, - { - "epoch": 0.87, - "learning_rate": 1.6682719914143237e-06, - "loss": 0.7031, - "step": 33830 - }, - { - "epoch": 0.87, - "learning_rate": 1.6682514066366502e-06, - "loss": 0.833, - "step": 33831 - }, - { - "epoch": 0.87, - "learning_rate": 1.6682308213473272e-06, - "loss": 0.9648, - "step": 33832 - }, - { - "epoch": 0.87, - "learning_rate": 1.6682102355463707e-06, - "loss": 0.9648, - "step": 33833 - }, - { - "epoch": 0.87, - "learning_rate": 1.6681896492337963e-06, - "loss": 0.8506, - "step": 33834 - }, - { - "epoch": 0.87, - "learning_rate": 1.6681690624096198e-06, - "loss": 0.8779, - "step": 33835 - }, - { - "epoch": 0.87, - "learning_rate": 1.668148475073857e-06, - "loss": 0.8389, - "step": 33836 - }, - { - "epoch": 0.87, - "learning_rate": 1.668127887226524e-06, - "loss": 0.623, - "step": 33837 - }, - { - "epoch": 0.87, - "learning_rate": 1.6681072988676355e-06, - "loss": 0.7891, - "step": 33838 - }, - { - "epoch": 0.87, - "learning_rate": 1.6680867099972082e-06, - "loss": 0.8828, - "step": 33839 - }, - { - "epoch": 0.87, - "learning_rate": 1.6680661206152577e-06, - "loss": 0.7158, - "step": 33840 - }, - { - "epoch": 0.87, - "learning_rate": 1.6680455307217997e-06, - "loss": 0.7144, - "step": 33841 - }, - { - "epoch": 0.87, - "learning_rate": 1.66802494031685e-06, - "loss": 0.96, - "step": 33842 - }, - { - "epoch": 0.87, - "learning_rate": 1.6680043494004244e-06, - "loss": 0.5376, - "step": 33843 - }, - { - "epoch": 0.87, - "learning_rate": 1.6679837579725385e-06, - "loss": 1.0137, - "step": 33844 - }, - { - "epoch": 0.87, - "learning_rate": 1.6679631660332079e-06, - "loss": 0.6233, - "step": 33845 - }, - { - "epoch": 0.87, - "learning_rate": 1.6679425735824488e-06, - "loss": 0.8779, - "step": 33846 - }, - { - "epoch": 0.87, - "learning_rate": 1.667921980620277e-06, - "loss": 0.8184, - "step": 33847 - }, - { - "epoch": 0.87, - "learning_rate": 1.6679013871467078e-06, - "loss": 0.915, - "step": 33848 - }, - { - "epoch": 0.87, - "learning_rate": 1.6678807931617573e-06, - "loss": 0.7607, - "step": 33849 - }, - { - "epoch": 0.87, - "learning_rate": 1.667860198665441e-06, - "loss": 0.8438, - "step": 33850 - }, - { - "epoch": 0.87, - "learning_rate": 1.667839603657775e-06, - "loss": 0.9355, - "step": 33851 - }, - { - "epoch": 0.87, - "learning_rate": 1.667819008138775e-06, - "loss": 0.8867, - "step": 33852 - }, - { - "epoch": 0.87, - "learning_rate": 1.6677984121084567e-06, - "loss": 0.8115, - "step": 33853 - }, - { - "epoch": 0.87, - "learning_rate": 1.6677778155668358e-06, - "loss": 0.6685, - "step": 33854 - }, - { - "epoch": 0.87, - "learning_rate": 1.667757218513928e-06, - "loss": 0.7603, - "step": 33855 - }, - { - "epoch": 0.87, - "learning_rate": 1.6677366209497495e-06, - "loss": 0.8027, - "step": 33856 - }, - { - "epoch": 0.87, - "learning_rate": 1.6677160228743157e-06, - "loss": 1.0596, - "step": 33857 - }, - { - "epoch": 0.87, - "learning_rate": 1.6676954242876425e-06, - "loss": 0.5299, - "step": 33858 - }, - { - "epoch": 0.87, - "learning_rate": 1.6676748251897453e-06, - "loss": 1.0693, - "step": 33859 - }, - { - "epoch": 0.87, - "learning_rate": 1.6676542255806402e-06, - "loss": 0.9697, - "step": 33860 - }, - { - "epoch": 0.87, - "learning_rate": 1.6676336254603432e-06, - "loss": 0.8474, - "step": 33861 - }, - { - "epoch": 0.87, - "learning_rate": 1.6676130248288698e-06, - "loss": 0.8271, - "step": 33862 - }, - { - "epoch": 0.87, - "learning_rate": 1.6675924236862357e-06, - "loss": 0.9268, - "step": 33863 - }, - { - "epoch": 0.87, - "learning_rate": 1.6675718220324568e-06, - "loss": 0.8008, - "step": 33864 - }, - { - "epoch": 0.87, - "learning_rate": 1.667551219867549e-06, - "loss": 0.9443, - "step": 33865 - }, - { - "epoch": 0.87, - "learning_rate": 1.6675306171915278e-06, - "loss": 0.9111, - "step": 33866 - }, - { - "epoch": 0.87, - "learning_rate": 1.6675100140044093e-06, - "loss": 0.9336, - "step": 33867 - }, - { - "epoch": 0.87, - "learning_rate": 1.6674894103062088e-06, - "loss": 1.0215, - "step": 33868 - }, - { - "epoch": 0.87, - "learning_rate": 1.6674688060969423e-06, - "loss": 0.8169, - "step": 33869 - }, - { - "epoch": 0.87, - "learning_rate": 1.6674482013766257e-06, - "loss": 0.9297, - "step": 33870 - }, - { - "epoch": 0.87, - "learning_rate": 1.667427596145275e-06, - "loss": 0.8677, - "step": 33871 - }, - { - "epoch": 0.87, - "learning_rate": 1.6674069904029053e-06, - "loss": 0.9277, - "step": 33872 - }, - { - "epoch": 0.87, - "learning_rate": 1.6673863841495327e-06, - "loss": 1.0693, - "step": 33873 - }, - { - "epoch": 0.87, - "learning_rate": 1.6673657773851732e-06, - "loss": 0.9473, - "step": 33874 - }, - { - "epoch": 0.87, - "learning_rate": 1.6673451701098427e-06, - "loss": 0.7285, - "step": 33875 - }, - { - "epoch": 0.87, - "learning_rate": 1.6673245623235563e-06, - "loss": 0.916, - "step": 33876 - }, - { - "epoch": 0.87, - "learning_rate": 1.6673039540263303e-06, - "loss": 0.6084, - "step": 33877 - }, - { - "epoch": 0.87, - "learning_rate": 1.6672833452181804e-06, - "loss": 1.0, - "step": 33878 - }, - { - "epoch": 0.87, - "learning_rate": 1.6672627358991222e-06, - "loss": 0.8564, - "step": 33879 - }, - { - "epoch": 0.87, - "learning_rate": 1.6672421260691717e-06, - "loss": 1.0342, - "step": 33880 - }, - { - "epoch": 0.87, - "learning_rate": 1.6672215157283445e-06, - "loss": 0.5425, - "step": 33881 - }, - { - "epoch": 0.87, - "learning_rate": 1.6672009048766567e-06, - "loss": 0.7812, - "step": 33882 - }, - { - "epoch": 0.87, - "learning_rate": 1.6671802935141237e-06, - "loss": 1.0332, - "step": 33883 - }, - { - "epoch": 0.87, - "learning_rate": 1.6671596816407614e-06, - "loss": 0.832, - "step": 33884 - }, - { - "epoch": 0.87, - "learning_rate": 1.6671390692565854e-06, - "loss": 0.6567, - "step": 33885 - }, - { - "epoch": 0.87, - "learning_rate": 1.6671184563616118e-06, - "loss": 1.0215, - "step": 33886 - }, - { - "epoch": 0.87, - "learning_rate": 1.6670978429558567e-06, - "loss": 0.916, - "step": 33887 - }, - { - "epoch": 0.87, - "learning_rate": 1.667077229039335e-06, - "loss": 0.9121, - "step": 33888 - }, - { - "epoch": 0.87, - "learning_rate": 1.667056614612063e-06, - "loss": 1.0938, - "step": 33889 - }, - { - "epoch": 0.87, - "learning_rate": 1.6670359996740567e-06, - "loss": 0.9668, - "step": 33890 - }, - { - "epoch": 0.87, - "learning_rate": 1.667015384225331e-06, - "loss": 0.7017, - "step": 33891 - }, - { - "epoch": 0.87, - "learning_rate": 1.6669947682659029e-06, - "loss": 0.959, - "step": 33892 - }, - { - "epoch": 0.87, - "learning_rate": 1.666974151795787e-06, - "loss": 0.7295, - "step": 33893 - }, - { - "epoch": 0.87, - "learning_rate": 1.6669535348150002e-06, - "loss": 0.7363, - "step": 33894 - }, - { - "epoch": 0.87, - "learning_rate": 1.6669329173235576e-06, - "loss": 0.8828, - "step": 33895 - }, - { - "epoch": 0.87, - "learning_rate": 1.666912299321475e-06, - "loss": 0.6953, - "step": 33896 - }, - { - "epoch": 0.87, - "learning_rate": 1.6668916808087684e-06, - "loss": 0.9268, - "step": 33897 - }, - { - "epoch": 0.87, - "learning_rate": 1.6668710617854535e-06, - "loss": 0.8457, - "step": 33898 - }, - { - "epoch": 0.87, - "learning_rate": 1.6668504422515462e-06, - "loss": 0.7227, - "step": 33899 - }, - { - "epoch": 0.87, - "learning_rate": 1.6668298222070623e-06, - "loss": 0.7246, - "step": 33900 - }, - { - "epoch": 0.87, - "learning_rate": 1.666809201652017e-06, - "loss": 0.6772, - "step": 33901 - }, - { - "epoch": 0.87, - "learning_rate": 1.6667885805864271e-06, - "loss": 0.96, - "step": 33902 - }, - { - "epoch": 0.87, - "learning_rate": 1.6667679590103073e-06, - "loss": 0.7852, - "step": 33903 - }, - { - "epoch": 0.87, - "learning_rate": 1.6667473369236742e-06, - "loss": 0.7329, - "step": 33904 - }, - { - "epoch": 0.87, - "learning_rate": 1.6667267143265433e-06, - "loss": 0.9072, - "step": 33905 - }, - { - "epoch": 0.87, - "learning_rate": 1.6667060912189305e-06, - "loss": 0.7114, - "step": 33906 - }, - { - "epoch": 0.87, - "learning_rate": 1.6666854676008515e-06, - "loss": 0.8096, - "step": 33907 - }, - { - "epoch": 0.87, - "learning_rate": 1.666664843472322e-06, - "loss": 0.8438, - "step": 33908 - }, - { - "epoch": 0.87, - "learning_rate": 1.6666442188333578e-06, - "loss": 0.5942, - "step": 33909 - }, - { - "epoch": 0.87, - "learning_rate": 1.6666235936839749e-06, - "loss": 0.8311, - "step": 33910 - }, - { - "epoch": 0.87, - "learning_rate": 1.666602968024189e-06, - "loss": 0.8318, - "step": 33911 - }, - { - "epoch": 0.87, - "learning_rate": 1.6665823418540157e-06, - "loss": 0.6421, - "step": 33912 - }, - { - "epoch": 0.87, - "learning_rate": 1.6665617151734713e-06, - "loss": 0.7598, - "step": 33913 - }, - { - "epoch": 0.87, - "learning_rate": 1.6665410879825708e-06, - "loss": 0.9072, - "step": 33914 - }, - { - "epoch": 0.87, - "learning_rate": 1.6665204602813305e-06, - "loss": 0.999, - "step": 33915 - }, - { - "epoch": 0.87, - "learning_rate": 1.6664998320697664e-06, - "loss": 0.9678, - "step": 33916 - }, - { - "epoch": 0.87, - "learning_rate": 1.666479203347894e-06, - "loss": 0.6821, - "step": 33917 - }, - { - "epoch": 0.87, - "learning_rate": 1.6664585741157288e-06, - "loss": 0.8281, - "step": 33918 - }, - { - "epoch": 0.87, - "learning_rate": 1.6664379443732873e-06, - "loss": 0.7358, - "step": 33919 - }, - { - "epoch": 0.87, - "learning_rate": 1.6664173141205846e-06, - "loss": 0.7783, - "step": 33920 - }, - { - "epoch": 0.87, - "learning_rate": 1.6663966833576368e-06, - "loss": 1.0078, - "step": 33921 - }, - { - "epoch": 0.87, - "learning_rate": 1.6663760520844598e-06, - "loss": 0.8311, - "step": 33922 - }, - { - "epoch": 0.87, - "learning_rate": 1.6663554203010695e-06, - "loss": 0.9355, - "step": 33923 - }, - { - "epoch": 0.87, - "learning_rate": 1.6663347880074814e-06, - "loss": 0.5664, - "step": 33924 - }, - { - "epoch": 0.87, - "learning_rate": 1.666314155203711e-06, - "loss": 0.999, - "step": 33925 - }, - { - "epoch": 0.87, - "learning_rate": 1.6662935218897748e-06, - "loss": 0.9346, - "step": 33926 - }, - { - "epoch": 0.87, - "learning_rate": 1.6662728880656886e-06, - "loss": 0.916, - "step": 33927 - }, - { - "epoch": 0.87, - "learning_rate": 1.6662522537314673e-06, - "loss": 1.0859, - "step": 33928 - }, - { - "epoch": 0.87, - "learning_rate": 1.6662316188871276e-06, - "loss": 0.6875, - "step": 33929 - }, - { - "epoch": 0.87, - "learning_rate": 1.666210983532685e-06, - "loss": 0.8066, - "step": 33930 - }, - { - "epoch": 0.87, - "learning_rate": 1.6661903476681553e-06, - "loss": 0.7222, - "step": 33931 - }, - { - "epoch": 0.87, - "learning_rate": 1.6661697112935543e-06, - "loss": 0.8008, - "step": 33932 - }, - { - "epoch": 0.87, - "learning_rate": 1.6661490744088975e-06, - "loss": 0.8169, - "step": 33933 - }, - { - "epoch": 0.87, - "learning_rate": 1.6661284370142013e-06, - "loss": 0.8252, - "step": 33934 - }, - { - "epoch": 0.87, - "learning_rate": 1.666107799109481e-06, - "loss": 0.7686, - "step": 33935 - }, - { - "epoch": 0.87, - "learning_rate": 1.6660871606947525e-06, - "loss": 0.7463, - "step": 33936 - }, - { - "epoch": 0.87, - "learning_rate": 1.666066521770032e-06, - "loss": 0.7617, - "step": 33937 - }, - { - "epoch": 0.87, - "learning_rate": 1.6660458823353348e-06, - "loss": 0.833, - "step": 33938 - }, - { - "epoch": 0.87, - "learning_rate": 1.666025242390677e-06, - "loss": 0.791, - "step": 33939 - }, - { - "epoch": 0.87, - "learning_rate": 1.6660046019360742e-06, - "loss": 0.7217, - "step": 33940 - }, - { - "epoch": 0.87, - "learning_rate": 1.6659839609715422e-06, - "loss": 0.9678, - "step": 33941 - }, - { - "epoch": 0.87, - "learning_rate": 1.6659633194970972e-06, - "loss": 0.8535, - "step": 33942 - }, - { - "epoch": 0.87, - "learning_rate": 1.6659426775127545e-06, - "loss": 0.8418, - "step": 33943 - }, - { - "epoch": 0.87, - "learning_rate": 1.6659220350185301e-06, - "loss": 0.832, - "step": 33944 - }, - { - "epoch": 0.87, - "learning_rate": 1.6659013920144398e-06, - "loss": 0.8916, - "step": 33945 - }, - { - "epoch": 0.87, - "learning_rate": 1.6658807485004995e-06, - "loss": 0.8408, - "step": 33946 - }, - { - "epoch": 0.87, - "learning_rate": 1.6658601044767249e-06, - "loss": 1.0762, - "step": 33947 - }, - { - "epoch": 0.87, - "learning_rate": 1.6658394599431321e-06, - "loss": 0.9434, - "step": 33948 - }, - { - "epoch": 0.87, - "learning_rate": 1.6658188148997362e-06, - "loss": 0.7783, - "step": 33949 - }, - { - "epoch": 0.87, - "learning_rate": 1.6657981693465536e-06, - "loss": 0.8252, - "step": 33950 - }, - { - "epoch": 0.87, - "learning_rate": 1.6657775232836e-06, - "loss": 0.7393, - "step": 33951 - }, - { - "epoch": 0.87, - "learning_rate": 1.6657568767108913e-06, - "loss": 1.0625, - "step": 33952 - }, - { - "epoch": 0.87, - "learning_rate": 1.665736229628443e-06, - "loss": 0.9893, - "step": 33953 - }, - { - "epoch": 0.87, - "learning_rate": 1.6657155820362712e-06, - "loss": 0.959, - "step": 33954 - }, - { - "epoch": 0.87, - "learning_rate": 1.6656949339343914e-06, - "loss": 0.7354, - "step": 33955 - }, - { - "epoch": 0.87, - "learning_rate": 1.6656742853228197e-06, - "loss": 0.7998, - "step": 33956 - }, - { - "epoch": 0.87, - "learning_rate": 1.6656536362015716e-06, - "loss": 0.6416, - "step": 33957 - }, - { - "epoch": 0.87, - "learning_rate": 1.6656329865706635e-06, - "loss": 0.8125, - "step": 33958 - }, - { - "epoch": 0.87, - "learning_rate": 1.6656123364301107e-06, - "loss": 0.7529, - "step": 33959 - }, - { - "epoch": 0.87, - "learning_rate": 1.665591685779929e-06, - "loss": 0.9512, - "step": 33960 - }, - { - "epoch": 0.87, - "learning_rate": 1.6655710346201346e-06, - "loss": 0.8252, - "step": 33961 - }, - { - "epoch": 0.87, - "learning_rate": 1.6655503829507426e-06, - "loss": 0.7881, - "step": 33962 - }, - { - "epoch": 0.87, - "learning_rate": 1.6655297307717697e-06, - "loss": 0.8213, - "step": 33963 - }, - { - "epoch": 0.87, - "learning_rate": 1.6655090780832312e-06, - "loss": 0.686, - "step": 33964 - }, - { - "epoch": 0.87, - "learning_rate": 1.6654884248851428e-06, - "loss": 0.9434, - "step": 33965 - }, - { - "epoch": 0.87, - "learning_rate": 1.6654677711775208e-06, - "loss": 0.6631, - "step": 33966 - }, - { - "epoch": 0.87, - "learning_rate": 1.6654471169603808e-06, - "loss": 0.9507, - "step": 33967 - }, - { - "epoch": 0.87, - "learning_rate": 1.6654264622337384e-06, - "loss": 0.9062, - "step": 33968 - }, - { - "epoch": 0.87, - "learning_rate": 1.6654058069976094e-06, - "loss": 0.9453, - "step": 33969 - }, - { - "epoch": 0.87, - "learning_rate": 1.6653851512520099e-06, - "loss": 0.6138, - "step": 33970 - }, - { - "epoch": 0.87, - "learning_rate": 1.6653644949969554e-06, - "loss": 0.7046, - "step": 33971 - }, - { - "epoch": 0.87, - "learning_rate": 1.6653438382324622e-06, - "loss": 0.9141, - "step": 33972 - }, - { - "epoch": 0.87, - "learning_rate": 1.6653231809585457e-06, - "loss": 0.6384, - "step": 33973 - }, - { - "epoch": 0.87, - "learning_rate": 1.6653025231752218e-06, - "loss": 0.9229, - "step": 33974 - }, - { - "epoch": 0.87, - "learning_rate": 1.6652818648825063e-06, - "loss": 0.8887, - "step": 33975 - }, - { - "epoch": 0.87, - "learning_rate": 1.665261206080415e-06, - "loss": 0.8008, - "step": 33976 - }, - { - "epoch": 0.87, - "learning_rate": 1.6652405467689641e-06, - "loss": 0.96, - "step": 33977 - }, - { - "epoch": 0.87, - "learning_rate": 1.665219886948169e-06, - "loss": 0.668, - "step": 33978 - }, - { - "epoch": 0.87, - "learning_rate": 1.6651992266180455e-06, - "loss": 1.0566, - "step": 33979 - }, - { - "epoch": 0.87, - "learning_rate": 1.6651785657786094e-06, - "loss": 1.0625, - "step": 33980 - }, - { - "epoch": 0.87, - "learning_rate": 1.665157904429877e-06, - "loss": 1.0889, - "step": 33981 - }, - { - "epoch": 0.87, - "learning_rate": 1.6651372425718634e-06, - "loss": 0.751, - "step": 33982 - }, - { - "epoch": 0.87, - "learning_rate": 1.665116580204585e-06, - "loss": 0.7549, - "step": 33983 - }, - { - "epoch": 0.87, - "learning_rate": 1.6650959173280574e-06, - "loss": 0.6484, - "step": 33984 - }, - { - "epoch": 0.87, - "learning_rate": 1.6650752539422965e-06, - "loss": 0.7437, - "step": 33985 - }, - { - "epoch": 0.87, - "learning_rate": 1.665054590047318e-06, - "loss": 0.917, - "step": 33986 - }, - { - "epoch": 0.87, - "learning_rate": 1.6650339256431378e-06, - "loss": 0.9414, - "step": 33987 - }, - { - "epoch": 0.87, - "learning_rate": 1.6650132607297718e-06, - "loss": 0.6943, - "step": 33988 - }, - { - "epoch": 0.87, - "learning_rate": 1.6649925953072357e-06, - "loss": 0.9365, - "step": 33989 - }, - { - "epoch": 0.87, - "learning_rate": 1.664971929375545e-06, - "loss": 0.8594, - "step": 33990 - }, - { - "epoch": 0.87, - "learning_rate": 1.6649512629347163e-06, - "loss": 0.9658, - "step": 33991 - }, - { - "epoch": 0.87, - "learning_rate": 1.664930595984765e-06, - "loss": 0.9561, - "step": 33992 - }, - { - "epoch": 0.87, - "learning_rate": 1.6649099285257067e-06, - "loss": 1.0322, - "step": 33993 - }, - { - "epoch": 0.87, - "learning_rate": 1.6648892605575573e-06, - "loss": 0.8853, - "step": 33994 - }, - { - "epoch": 0.87, - "learning_rate": 1.664868592080333e-06, - "loss": 0.8916, - "step": 33995 - }, - { - "epoch": 0.87, - "learning_rate": 1.6648479230940493e-06, - "loss": 0.9141, - "step": 33996 - }, - { - "epoch": 0.87, - "learning_rate": 1.6648272535987223e-06, - "loss": 0.6904, - "step": 33997 - }, - { - "epoch": 0.87, - "learning_rate": 1.6648065835943674e-06, - "loss": 0.9785, - "step": 33998 - }, - { - "epoch": 0.87, - "learning_rate": 1.6647859130810007e-06, - "loss": 0.8418, - "step": 33999 - }, - { - "epoch": 0.87, - "learning_rate": 1.6647652420586382e-06, - "loss": 0.7588, - "step": 34000 - }, - { - "epoch": 0.87, - "learning_rate": 1.6647445705272954e-06, - "loss": 0.8711, - "step": 34001 - }, - { - "epoch": 0.87, - "learning_rate": 1.6647238984869883e-06, - "loss": 0.7607, - "step": 34002 - }, - { - "epoch": 0.87, - "learning_rate": 1.6647032259377327e-06, - "loss": 0.6333, - "step": 34003 - }, - { - "epoch": 0.87, - "learning_rate": 1.6646825528795443e-06, - "loss": 0.9658, - "step": 34004 - }, - { - "epoch": 0.87, - "learning_rate": 1.664661879312439e-06, - "loss": 0.7729, - "step": 34005 - }, - { - "epoch": 0.87, - "learning_rate": 1.6646412052364327e-06, - "loss": 1.0166, - "step": 34006 - }, - { - "epoch": 0.87, - "learning_rate": 1.664620530651541e-06, - "loss": 0.7549, - "step": 34007 - }, - { - "epoch": 0.87, - "learning_rate": 1.6645998555577802e-06, - "loss": 1.0312, - "step": 34008 - }, - { - "epoch": 0.87, - "learning_rate": 1.6645791799551657e-06, - "loss": 0.9775, - "step": 34009 - }, - { - "epoch": 0.87, - "learning_rate": 1.6645585038437135e-06, - "loss": 0.7969, - "step": 34010 - }, - { - "epoch": 0.87, - "learning_rate": 1.6645378272234397e-06, - "loss": 0.9482, - "step": 34011 - }, - { - "epoch": 0.87, - "learning_rate": 1.6645171500943595e-06, - "loss": 0.8633, - "step": 34012 - }, - { - "epoch": 0.87, - "learning_rate": 1.6644964724564892e-06, - "loss": 0.8887, - "step": 34013 - }, - { - "epoch": 0.87, - "learning_rate": 1.6644757943098444e-06, - "loss": 0.917, - "step": 34014 - }, - { - "epoch": 0.87, - "learning_rate": 1.664455115654441e-06, - "loss": 0.5789, - "step": 34015 - }, - { - "epoch": 0.87, - "learning_rate": 1.6644344364902952e-06, - "loss": 0.8613, - "step": 34016 - }, - { - "epoch": 0.87, - "learning_rate": 1.6644137568174224e-06, - "loss": 0.8752, - "step": 34017 - }, - { - "epoch": 0.87, - "learning_rate": 1.6643930766358382e-06, - "loss": 0.9766, - "step": 34018 - }, - { - "epoch": 0.87, - "learning_rate": 1.6643723959455592e-06, - "loss": 1.0459, - "step": 34019 - }, - { - "epoch": 0.87, - "learning_rate": 1.6643517147466003e-06, - "loss": 0.8613, - "step": 34020 - }, - { - "epoch": 0.87, - "learning_rate": 1.6643310330389785e-06, - "loss": 0.7397, - "step": 34021 - }, - { - "epoch": 0.87, - "learning_rate": 1.6643103508227084e-06, - "loss": 0.7778, - "step": 34022 - }, - { - "epoch": 0.87, - "learning_rate": 1.6642896680978068e-06, - "loss": 0.9375, - "step": 34023 - }, - { - "epoch": 0.87, - "learning_rate": 1.664268984864289e-06, - "loss": 0.6675, - "step": 34024 - }, - { - "epoch": 0.87, - "learning_rate": 1.6642483011221708e-06, - "loss": 0.7339, - "step": 34025 - }, - { - "epoch": 0.87, - "learning_rate": 1.6642276168714685e-06, - "loss": 0.96, - "step": 34026 - }, - { - "epoch": 0.87, - "learning_rate": 1.6642069321121974e-06, - "loss": 1.0088, - "step": 34027 - }, - { - "epoch": 0.87, - "learning_rate": 1.6641862468443737e-06, - "loss": 0.8916, - "step": 34028 - }, - { - "epoch": 0.87, - "learning_rate": 1.6641655610680131e-06, - "loss": 0.8584, - "step": 34029 - }, - { - "epoch": 0.87, - "learning_rate": 1.6641448747831315e-06, - "loss": 1.0181, - "step": 34030 - }, - { - "epoch": 0.87, - "learning_rate": 1.6641241879897447e-06, - "loss": 0.9648, - "step": 34031 - }, - { - "epoch": 0.87, - "learning_rate": 1.6641035006878688e-06, - "loss": 0.79, - "step": 34032 - }, - { - "epoch": 0.87, - "learning_rate": 1.6640828128775191e-06, - "loss": 0.6348, - "step": 34033 - }, - { - "epoch": 0.87, - "learning_rate": 1.6640621245587117e-06, - "loss": 0.9678, - "step": 34034 - }, - { - "epoch": 0.87, - "learning_rate": 1.6640414357314624e-06, - "loss": 0.8047, - "step": 34035 - }, - { - "epoch": 0.87, - "learning_rate": 1.6640207463957873e-06, - "loss": 0.8896, - "step": 34036 - }, - { - "epoch": 0.87, - "learning_rate": 1.6640000565517023e-06, - "loss": 0.9243, - "step": 34037 - }, - { - "epoch": 0.87, - "learning_rate": 1.6639793661992228e-06, - "loss": 0.8525, - "step": 34038 - }, - { - "epoch": 0.87, - "learning_rate": 1.6639586753383645e-06, - "loss": 0.6357, - "step": 34039 - }, - { - "epoch": 0.87, - "learning_rate": 1.6639379839691437e-06, - "loss": 0.9033, - "step": 34040 - }, - { - "epoch": 0.87, - "learning_rate": 1.6639172920915762e-06, - "loss": 0.833, - "step": 34041 - }, - { - "epoch": 0.87, - "learning_rate": 1.6638965997056779e-06, - "loss": 0.8906, - "step": 34042 - }, - { - "epoch": 0.87, - "learning_rate": 1.6638759068114645e-06, - "loss": 0.752, - "step": 34043 - }, - { - "epoch": 0.87, - "learning_rate": 1.6638552134089517e-06, - "loss": 0.707, - "step": 34044 - }, - { - "epoch": 0.87, - "learning_rate": 1.6638345194981553e-06, - "loss": 0.6777, - "step": 34045 - }, - { - "epoch": 0.87, - "learning_rate": 1.6638138250790916e-06, - "loss": 0.9043, - "step": 34046 - }, - { - "epoch": 0.87, - "learning_rate": 1.663793130151776e-06, - "loss": 0.9619, - "step": 34047 - }, - { - "epoch": 0.87, - "learning_rate": 1.6637724347162248e-06, - "loss": 0.7744, - "step": 34048 - }, - { - "epoch": 0.87, - "learning_rate": 1.6637517387724533e-06, - "loss": 0.9014, - "step": 34049 - }, - { - "epoch": 0.87, - "learning_rate": 1.6637310423204779e-06, - "loss": 0.8701, - "step": 34050 - }, - { - "epoch": 0.87, - "learning_rate": 1.6637103453603138e-06, - "loss": 0.7043, - "step": 34051 - }, - { - "epoch": 0.87, - "learning_rate": 1.6636896478919774e-06, - "loss": 0.7773, - "step": 34052 - }, - { - "epoch": 0.87, - "learning_rate": 1.6636689499154844e-06, - "loss": 0.8462, - "step": 34053 - }, - { - "epoch": 0.87, - "learning_rate": 1.6636482514308506e-06, - "loss": 1.0635, - "step": 34054 - }, - { - "epoch": 0.87, - "learning_rate": 1.6636275524380916e-06, - "loss": 0.8379, - "step": 34055 - }, - { - "epoch": 0.87, - "learning_rate": 1.6636068529372237e-06, - "loss": 0.7974, - "step": 34056 - }, - { - "epoch": 0.87, - "learning_rate": 1.6635861529282626e-06, - "loss": 0.8867, - "step": 34057 - }, - { - "epoch": 0.87, - "learning_rate": 1.6635654524112242e-06, - "loss": 0.8604, - "step": 34058 - }, - { - "epoch": 0.87, - "learning_rate": 1.6635447513861238e-06, - "loss": 0.8193, - "step": 34059 - }, - { - "epoch": 0.87, - "learning_rate": 1.663524049852978e-06, - "loss": 0.7178, - "step": 34060 - }, - { - "epoch": 0.87, - "learning_rate": 1.6635033478118023e-06, - "loss": 0.7812, - "step": 34061 - }, - { - "epoch": 0.87, - "learning_rate": 1.6634826452626127e-06, - "loss": 0.8994, - "step": 34062 - }, - { - "epoch": 0.87, - "learning_rate": 1.663461942205425e-06, - "loss": 0.6953, - "step": 34063 - }, - { - "epoch": 0.87, - "learning_rate": 1.6634412386402548e-06, - "loss": 0.9189, - "step": 34064 - }, - { - "epoch": 0.87, - "learning_rate": 1.663420534567118e-06, - "loss": 0.7246, - "step": 34065 - }, - { - "epoch": 0.87, - "learning_rate": 1.663399829986031e-06, - "loss": 0.9111, - "step": 34066 - }, - { - "epoch": 0.87, - "learning_rate": 1.663379124897009e-06, - "loss": 0.874, - "step": 34067 - }, - { - "epoch": 0.87, - "learning_rate": 1.663358419300068e-06, - "loss": 1.0352, - "step": 34068 - }, - { - "epoch": 0.87, - "learning_rate": 1.6633377131952245e-06, - "loss": 0.6226, - "step": 34069 - }, - { - "epoch": 0.87, - "learning_rate": 1.6633170065824932e-06, - "loss": 1.1113, - "step": 34070 - }, - { - "epoch": 0.87, - "learning_rate": 1.6632962994618907e-06, - "loss": 0.9434, - "step": 34071 - }, - { - "epoch": 0.87, - "learning_rate": 1.6632755918334329e-06, - "loss": 1.0732, - "step": 34072 - }, - { - "epoch": 0.87, - "learning_rate": 1.6632548836971354e-06, - "loss": 0.9053, - "step": 34073 - }, - { - "epoch": 0.87, - "learning_rate": 1.663234175053014e-06, - "loss": 1.0576, - "step": 34074 - }, - { - "epoch": 0.87, - "learning_rate": 1.663213465901085e-06, - "loss": 1.0049, - "step": 34075 - }, - { - "epoch": 0.87, - "learning_rate": 1.6631927562413637e-06, - "loss": 0.7427, - "step": 34076 - }, - { - "epoch": 0.87, - "learning_rate": 1.6631720460738664e-06, - "loss": 0.7285, - "step": 34077 - }, - { - "epoch": 0.87, - "learning_rate": 1.6631513353986084e-06, - "loss": 0.8486, - "step": 34078 - }, - { - "epoch": 0.87, - "learning_rate": 1.6631306242156062e-06, - "loss": 0.8682, - "step": 34079 - }, - { - "epoch": 0.87, - "learning_rate": 1.6631099125248754e-06, - "loss": 0.7439, - "step": 34080 - }, - { - "epoch": 0.87, - "learning_rate": 1.6630892003264317e-06, - "loss": 0.8428, - "step": 34081 - }, - { - "epoch": 0.87, - "learning_rate": 1.6630684876202913e-06, - "loss": 0.9795, - "step": 34082 - }, - { - "epoch": 0.87, - "learning_rate": 1.6630477744064698e-06, - "loss": 0.8501, - "step": 34083 - }, - { - "epoch": 0.87, - "learning_rate": 1.6630270606849827e-06, - "loss": 0.835, - "step": 34084 - }, - { - "epoch": 0.87, - "learning_rate": 1.6630063464558466e-06, - "loss": 0.8242, - "step": 34085 - }, - { - "epoch": 0.87, - "learning_rate": 1.6629856317190768e-06, - "loss": 0.6221, - "step": 34086 - }, - { - "epoch": 0.87, - "learning_rate": 1.66296491647469e-06, - "loss": 0.9678, - "step": 34087 - }, - { - "epoch": 0.87, - "learning_rate": 1.6629442007227008e-06, - "loss": 0.8555, - "step": 34088 - }, - { - "epoch": 0.87, - "learning_rate": 1.662923484463126e-06, - "loss": 0.8154, - "step": 34089 - }, - { - "epoch": 0.87, - "learning_rate": 1.6629027676959811e-06, - "loss": 0.8643, - "step": 34090 - }, - { - "epoch": 0.87, - "learning_rate": 1.6628820504212819e-06, - "loss": 0.7344, - "step": 34091 - }, - { - "epoch": 0.87, - "learning_rate": 1.6628613326390446e-06, - "loss": 0.647, - "step": 34092 - }, - { - "epoch": 0.87, - "learning_rate": 1.6628406143492848e-06, - "loss": 0.8379, - "step": 34093 - }, - { - "epoch": 0.87, - "learning_rate": 1.6628198955520184e-06, - "loss": 0.9717, - "step": 34094 - }, - { - "epoch": 0.87, - "learning_rate": 1.6627991762472614e-06, - "loss": 0.8154, - "step": 34095 - }, - { - "epoch": 0.87, - "learning_rate": 1.6627784564350291e-06, - "loss": 1.0293, - "step": 34096 - }, - { - "epoch": 0.87, - "learning_rate": 1.6627577361153383e-06, - "loss": 0.6709, - "step": 34097 - }, - { - "epoch": 0.87, - "learning_rate": 1.6627370152882043e-06, - "loss": 0.9238, - "step": 34098 - }, - { - "epoch": 0.87, - "learning_rate": 1.6627162939536427e-06, - "loss": 0.6348, - "step": 34099 - }, - { - "epoch": 0.87, - "learning_rate": 1.66269557211167e-06, - "loss": 0.7671, - "step": 34100 - }, - { - "epoch": 0.87, - "learning_rate": 1.6626748497623018e-06, - "loss": 0.8916, - "step": 34101 - }, - { - "epoch": 0.87, - "learning_rate": 1.6626541269055538e-06, - "loss": 0.8242, - "step": 34102 - }, - { - "epoch": 0.87, - "learning_rate": 1.6626334035414422e-06, - "loss": 1.0605, - "step": 34103 - }, - { - "epoch": 0.87, - "learning_rate": 1.6626126796699826e-06, - "loss": 0.7861, - "step": 34104 - }, - { - "epoch": 0.87, - "learning_rate": 1.662591955291191e-06, - "loss": 0.5156, - "step": 34105 - }, - { - "epoch": 0.87, - "learning_rate": 1.6625712304050827e-06, - "loss": 0.957, - "step": 34106 - }, - { - "epoch": 0.87, - "learning_rate": 1.6625505050116745e-06, - "loss": 0.5942, - "step": 34107 - }, - { - "epoch": 0.87, - "learning_rate": 1.662529779110982e-06, - "loss": 1.0264, - "step": 34108 - }, - { - "epoch": 0.87, - "learning_rate": 1.6625090527030208e-06, - "loss": 0.7505, - "step": 34109 - }, - { - "epoch": 0.87, - "learning_rate": 1.6624883257878066e-06, - "loss": 0.9502, - "step": 34110 - }, - { - "epoch": 0.87, - "learning_rate": 1.6624675983653558e-06, - "loss": 0.9355, - "step": 34111 - }, - { - "epoch": 0.87, - "learning_rate": 1.662446870435684e-06, - "loss": 1.0059, - "step": 34112 - }, - { - "epoch": 0.87, - "learning_rate": 1.6624261419988073e-06, - "loss": 0.8018, - "step": 34113 - }, - { - "epoch": 0.87, - "learning_rate": 1.6624054130547412e-06, - "loss": 0.9443, - "step": 34114 - }, - { - "epoch": 0.87, - "learning_rate": 1.6623846836035014e-06, - "loss": 0.8203, - "step": 34115 - }, - { - "epoch": 0.87, - "learning_rate": 1.6623639536451045e-06, - "loss": 0.8438, - "step": 34116 - }, - { - "epoch": 0.87, - "learning_rate": 1.6623432231795658e-06, - "loss": 0.6953, - "step": 34117 - }, - { - "epoch": 0.87, - "learning_rate": 1.6623224922069014e-06, - "loss": 0.8013, - "step": 34118 - }, - { - "epoch": 0.87, - "learning_rate": 1.662301760727127e-06, - "loss": 0.9941, - "step": 34119 - }, - { - "epoch": 0.87, - "learning_rate": 1.6622810287402587e-06, - "loss": 1.0205, - "step": 34120 - }, - { - "epoch": 0.87, - "learning_rate": 1.6622602962463124e-06, - "loss": 0.8984, - "step": 34121 - }, - { - "epoch": 0.87, - "learning_rate": 1.6622395632453037e-06, - "loss": 0.8223, - "step": 34122 - }, - { - "epoch": 0.87, - "learning_rate": 1.6622188297372485e-06, - "loss": 0.7815, - "step": 34123 - }, - { - "epoch": 0.87, - "learning_rate": 1.662198095722163e-06, - "loss": 0.7271, - "step": 34124 - }, - { - "epoch": 0.87, - "learning_rate": 1.662177361200063e-06, - "loss": 0.7939, - "step": 34125 - }, - { - "epoch": 0.87, - "learning_rate": 1.6621566261709638e-06, - "loss": 0.9912, - "step": 34126 - }, - { - "epoch": 0.87, - "learning_rate": 1.6621358906348822e-06, - "loss": 0.8447, - "step": 34127 - }, - { - "epoch": 0.87, - "learning_rate": 1.6621151545918332e-06, - "loss": 0.7881, - "step": 34128 - }, - { - "epoch": 0.87, - "learning_rate": 1.6620944180418333e-06, - "loss": 0.8186, - "step": 34129 - }, - { - "epoch": 0.87, - "learning_rate": 1.6620736809848981e-06, - "loss": 0.7485, - "step": 34130 - }, - { - "epoch": 0.87, - "learning_rate": 1.6620529434210436e-06, - "loss": 0.6404, - "step": 34131 - }, - { - "epoch": 0.87, - "learning_rate": 1.6620322053502854e-06, - "loss": 0.6953, - "step": 34132 - }, - { - "epoch": 0.87, - "learning_rate": 1.6620114667726398e-06, - "loss": 0.9365, - "step": 34133 - }, - { - "epoch": 0.87, - "learning_rate": 1.661990727688122e-06, - "loss": 0.7266, - "step": 34134 - }, - { - "epoch": 0.87, - "learning_rate": 1.6619699880967489e-06, - "loss": 0.6877, - "step": 34135 - }, - { - "epoch": 0.87, - "learning_rate": 1.6619492479985355e-06, - "loss": 0.7134, - "step": 34136 - }, - { - "epoch": 0.87, - "learning_rate": 1.6619285073934981e-06, - "loss": 0.8276, - "step": 34137 - }, - { - "epoch": 0.87, - "learning_rate": 1.6619077662816526e-06, - "loss": 0.8906, - "step": 34138 - }, - { - "epoch": 0.88, - "learning_rate": 1.6618870246630145e-06, - "loss": 0.79, - "step": 34139 - }, - { - "epoch": 0.88, - "learning_rate": 1.6618662825376002e-06, - "loss": 0.6687, - "step": 34140 - }, - { - "epoch": 0.88, - "learning_rate": 1.6618455399054251e-06, - "loss": 1.0576, - "step": 34141 - }, - { - "epoch": 0.88, - "learning_rate": 1.6618247967665054e-06, - "loss": 1.1064, - "step": 34142 - }, - { - "epoch": 0.88, - "learning_rate": 1.661804053120857e-06, - "loss": 0.9277, - "step": 34143 - }, - { - "epoch": 0.88, - "learning_rate": 1.6617833089684955e-06, - "loss": 0.7563, - "step": 34144 - }, - { - "epoch": 0.88, - "learning_rate": 1.6617625643094369e-06, - "loss": 0.8604, - "step": 34145 - }, - { - "epoch": 0.88, - "learning_rate": 1.6617418191436973e-06, - "loss": 0.6997, - "step": 34146 - }, - { - "epoch": 0.88, - "learning_rate": 1.6617210734712923e-06, - "loss": 0.5957, - "step": 34147 - }, - { - "epoch": 0.88, - "learning_rate": 1.661700327292238e-06, - "loss": 0.9844, - "step": 34148 - }, - { - "epoch": 0.88, - "learning_rate": 1.6616795806065503e-06, - "loss": 0.6543, - "step": 34149 - }, - { - "epoch": 0.88, - "learning_rate": 1.6616588334142448e-06, - "loss": 0.6042, - "step": 34150 - }, - { - "epoch": 0.88, - "learning_rate": 1.6616380857153374e-06, - "loss": 0.9121, - "step": 34151 - }, - { - "epoch": 0.88, - "learning_rate": 1.6616173375098444e-06, - "loss": 1.043, - "step": 34152 - }, - { - "epoch": 0.88, - "learning_rate": 1.6615965887977812e-06, - "loss": 0.731, - "step": 34153 - }, - { - "epoch": 0.88, - "learning_rate": 1.6615758395791639e-06, - "loss": 0.8926, - "step": 34154 - }, - { - "epoch": 0.88, - "learning_rate": 1.6615550898540084e-06, - "loss": 0.8369, - "step": 34155 - }, - { - "epoch": 0.88, - "learning_rate": 1.661534339622331e-06, - "loss": 1.0859, - "step": 34156 - }, - { - "epoch": 0.88, - "learning_rate": 1.661513588884147e-06, - "loss": 0.8408, - "step": 34157 - }, - { - "epoch": 0.88, - "learning_rate": 1.6614928376394722e-06, - "loss": 0.8857, - "step": 34158 - }, - { - "epoch": 0.88, - "learning_rate": 1.6614720858883228e-06, - "loss": 0.8896, - "step": 34159 - }, - { - "epoch": 0.88, - "learning_rate": 1.661451333630715e-06, - "loss": 0.9717, - "step": 34160 - }, - { - "epoch": 0.88, - "learning_rate": 1.6614305808666643e-06, - "loss": 0.7896, - "step": 34161 - }, - { - "epoch": 0.88, - "learning_rate": 1.661409827596186e-06, - "loss": 0.7031, - "step": 34162 - }, - { - "epoch": 0.88, - "learning_rate": 1.661389073819297e-06, - "loss": 0.7808, - "step": 34163 - }, - { - "epoch": 0.88, - "learning_rate": 1.6613683195360129e-06, - "loss": 0.771, - "step": 34164 - }, - { - "epoch": 0.88, - "learning_rate": 1.6613475647463494e-06, - "loss": 0.6191, - "step": 34165 - }, - { - "epoch": 0.88, - "learning_rate": 1.6613268094503226e-06, - "loss": 0.8545, - "step": 34166 - }, - { - "epoch": 0.88, - "learning_rate": 1.661306053647948e-06, - "loss": 0.9385, - "step": 34167 - }, - { - "epoch": 0.88, - "learning_rate": 1.661285297339242e-06, - "loss": 0.999, - "step": 34168 - }, - { - "epoch": 0.88, - "learning_rate": 1.66126454052422e-06, - "loss": 1.0996, - "step": 34169 - }, - { - "epoch": 0.88, - "learning_rate": 1.6612437832028982e-06, - "loss": 0.7837, - "step": 34170 - }, - { - "epoch": 0.88, - "learning_rate": 1.661223025375293e-06, - "loss": 0.8516, - "step": 34171 - }, - { - "epoch": 0.88, - "learning_rate": 1.661202267041419e-06, - "loss": 0.73, - "step": 34172 - }, - { - "epoch": 0.88, - "learning_rate": 1.6611815082012933e-06, - "loss": 0.9048, - "step": 34173 - }, - { - "epoch": 0.88, - "learning_rate": 1.661160748854931e-06, - "loss": 0.8672, - "step": 34174 - }, - { - "epoch": 0.88, - "learning_rate": 1.6611399890023484e-06, - "loss": 0.8096, - "step": 34175 - }, - { - "epoch": 0.88, - "learning_rate": 1.6611192286435616e-06, - "loss": 0.8022, - "step": 34176 - }, - { - "epoch": 0.88, - "learning_rate": 1.661098467778586e-06, - "loss": 0.9033, - "step": 34177 - }, - { - "epoch": 0.88, - "learning_rate": 1.6610777064074376e-06, - "loss": 0.8154, - "step": 34178 - }, - { - "epoch": 0.88, - "learning_rate": 1.661056944530132e-06, - "loss": 0.7136, - "step": 34179 - }, - { - "epoch": 0.88, - "learning_rate": 1.6610361821466862e-06, - "loss": 1.0117, - "step": 34180 - }, - { - "epoch": 0.88, - "learning_rate": 1.6610154192571151e-06, - "loss": 0.8477, - "step": 34181 - }, - { - "epoch": 0.88, - "learning_rate": 1.6609946558614349e-06, - "loss": 0.9355, - "step": 34182 - }, - { - "epoch": 0.88, - "learning_rate": 1.6609738919596616e-06, - "loss": 1.0488, - "step": 34183 - }, - { - "epoch": 0.88, - "learning_rate": 1.660953127551811e-06, - "loss": 0.7666, - "step": 34184 - }, - { - "epoch": 0.88, - "learning_rate": 1.6609323626378987e-06, - "loss": 0.729, - "step": 34185 - }, - { - "epoch": 0.88, - "learning_rate": 1.6609115972179412e-06, - "loss": 0.791, - "step": 34186 - }, - { - "epoch": 0.88, - "learning_rate": 1.660890831291954e-06, - "loss": 1.0225, - "step": 34187 - }, - { - "epoch": 0.88, - "learning_rate": 1.660870064859953e-06, - "loss": 0.731, - "step": 34188 - }, - { - "epoch": 0.88, - "learning_rate": 1.660849297921954e-06, - "loss": 0.9365, - "step": 34189 - }, - { - "epoch": 0.88, - "learning_rate": 1.6608285304779735e-06, - "loss": 0.8525, - "step": 34190 - }, - { - "epoch": 0.88, - "learning_rate": 1.6608077625280266e-06, - "loss": 0.7441, - "step": 34191 - }, - { - "epoch": 0.88, - "learning_rate": 1.6607869940721298e-06, - "loss": 0.7393, - "step": 34192 - }, - { - "epoch": 0.88, - "learning_rate": 1.6607662251102988e-06, - "loss": 0.8564, - "step": 34193 - }, - { - "epoch": 0.88, - "learning_rate": 1.6607454556425493e-06, - "loss": 0.9609, - "step": 34194 - }, - { - "epoch": 0.88, - "learning_rate": 1.6607246856688974e-06, - "loss": 1.0518, - "step": 34195 - }, - { - "epoch": 0.88, - "learning_rate": 1.6607039151893592e-06, - "loss": 1.1182, - "step": 34196 - }, - { - "epoch": 0.88, - "learning_rate": 1.6606831442039504e-06, - "loss": 0.8984, - "step": 34197 - }, - { - "epoch": 0.88, - "learning_rate": 1.6606623727126867e-06, - "loss": 0.8828, - "step": 34198 - }, - { - "epoch": 0.88, - "learning_rate": 1.6606416007155844e-06, - "loss": 0.748, - "step": 34199 - }, - { - "epoch": 0.88, - "learning_rate": 1.6606208282126588e-06, - "loss": 1.0342, - "step": 34200 - }, - { - "epoch": 0.88, - "learning_rate": 1.6606000552039267e-06, - "loss": 0.6328, - "step": 34201 - }, - { - "epoch": 0.88, - "learning_rate": 1.660579281689403e-06, - "loss": 0.6836, - "step": 34202 - }, - { - "epoch": 0.88, - "learning_rate": 1.6605585076691048e-06, - "loss": 0.8516, - "step": 34203 - }, - { - "epoch": 0.88, - "learning_rate": 1.6605377331430467e-06, - "loss": 0.79, - "step": 34204 - }, - { - "epoch": 0.88, - "learning_rate": 1.6605169581112454e-06, - "loss": 1.0596, - "step": 34205 - }, - { - "epoch": 0.88, - "learning_rate": 1.6604961825737167e-06, - "loss": 0.9004, - "step": 34206 - }, - { - "epoch": 0.88, - "learning_rate": 1.6604754065304768e-06, - "loss": 0.8594, - "step": 34207 - }, - { - "epoch": 0.88, - "learning_rate": 1.6604546299815408e-06, - "loss": 0.8311, - "step": 34208 - }, - { - "epoch": 0.88, - "learning_rate": 1.6604338529269249e-06, - "loss": 0.8252, - "step": 34209 - }, - { - "epoch": 0.88, - "learning_rate": 1.6604130753666455e-06, - "loss": 0.8525, - "step": 34210 - }, - { - "epoch": 0.88, - "learning_rate": 1.660392297300718e-06, - "loss": 0.9473, - "step": 34211 - }, - { - "epoch": 0.88, - "learning_rate": 1.6603715187291586e-06, - "loss": 0.8445, - "step": 34212 - }, - { - "epoch": 0.88, - "learning_rate": 1.6603507396519832e-06, - "loss": 0.8271, - "step": 34213 - }, - { - "epoch": 0.88, - "learning_rate": 1.6603299600692073e-06, - "loss": 1.0713, - "step": 34214 - }, - { - "epoch": 0.88, - "learning_rate": 1.6603091799808474e-06, - "loss": 0.812, - "step": 34215 - }, - { - "epoch": 0.88, - "learning_rate": 1.6602883993869191e-06, - "loss": 0.9717, - "step": 34216 - }, - { - "epoch": 0.88, - "learning_rate": 1.6602676182874382e-06, - "loss": 0.6768, - "step": 34217 - }, - { - "epoch": 0.88, - "learning_rate": 1.6602468366824206e-06, - "loss": 0.8789, - "step": 34218 - }, - { - "epoch": 0.88, - "learning_rate": 1.6602260545718826e-06, - "loss": 0.7695, - "step": 34219 - }, - { - "epoch": 0.88, - "learning_rate": 1.66020527195584e-06, - "loss": 0.8662, - "step": 34220 - }, - { - "epoch": 0.88, - "learning_rate": 1.6601844888343085e-06, - "loss": 1.041, - "step": 34221 - }, - { - "epoch": 0.88, - "learning_rate": 1.6601637052073039e-06, - "loss": 0.6768, - "step": 34222 - }, - { - "epoch": 0.88, - "learning_rate": 1.6601429210748423e-06, - "loss": 0.8164, - "step": 34223 - }, - { - "epoch": 0.88, - "learning_rate": 1.6601221364369399e-06, - "loss": 1.0566, - "step": 34224 - }, - { - "epoch": 0.88, - "learning_rate": 1.660101351293612e-06, - "loss": 0.8799, - "step": 34225 - }, - { - "epoch": 0.88, - "learning_rate": 1.660080565644875e-06, - "loss": 0.6855, - "step": 34226 - }, - { - "epoch": 0.88, - "learning_rate": 1.6600597794907447e-06, - "loss": 0.6545, - "step": 34227 - }, - { - "epoch": 0.88, - "learning_rate": 1.6600389928312368e-06, - "loss": 0.8516, - "step": 34228 - }, - { - "epoch": 0.88, - "learning_rate": 1.6600182056663674e-06, - "loss": 0.8984, - "step": 34229 - }, - { - "epoch": 0.88, - "learning_rate": 1.6599974179961527e-06, - "loss": 0.7134, - "step": 34230 - }, - { - "epoch": 0.88, - "learning_rate": 1.659976629820608e-06, - "loss": 0.8896, - "step": 34231 - }, - { - "epoch": 0.88, - "learning_rate": 1.6599558411397498e-06, - "loss": 0.9707, - "step": 34232 - }, - { - "epoch": 0.88, - "learning_rate": 1.6599350519535937e-06, - "loss": 0.999, - "step": 34233 - }, - { - "epoch": 0.88, - "learning_rate": 1.6599142622621557e-06, - "loss": 0.9072, - "step": 34234 - }, - { - "epoch": 0.88, - "learning_rate": 1.6598934720654513e-06, - "loss": 0.6304, - "step": 34235 - }, - { - "epoch": 0.88, - "learning_rate": 1.6598726813634975e-06, - "loss": 0.7256, - "step": 34236 - }, - { - "epoch": 0.88, - "learning_rate": 1.659851890156309e-06, - "loss": 0.644, - "step": 34237 - }, - { - "epoch": 0.88, - "learning_rate": 1.6598310984439024e-06, - "loss": 0.8848, - "step": 34238 - }, - { - "epoch": 0.88, - "learning_rate": 1.6598103062262934e-06, - "loss": 0.7117, - "step": 34239 - }, - { - "epoch": 0.88, - "learning_rate": 1.6597895135034983e-06, - "loss": 0.8223, - "step": 34240 - }, - { - "epoch": 0.88, - "learning_rate": 1.6597687202755324e-06, - "loss": 1.0859, - "step": 34241 - }, - { - "epoch": 0.88, - "learning_rate": 1.659747926542412e-06, - "loss": 0.7168, - "step": 34242 - }, - { - "epoch": 0.88, - "learning_rate": 1.6597271323041531e-06, - "loss": 0.8896, - "step": 34243 - }, - { - "epoch": 0.88, - "learning_rate": 1.6597063375607712e-06, - "loss": 0.6392, - "step": 34244 - }, - { - "epoch": 0.88, - "learning_rate": 1.6596855423122827e-06, - "loss": 0.8359, - "step": 34245 - }, - { - "epoch": 0.88, - "learning_rate": 1.6596647465587031e-06, - "loss": 0.8867, - "step": 34246 - }, - { - "epoch": 0.88, - "learning_rate": 1.6596439503000489e-06, - "loss": 0.7271, - "step": 34247 - }, - { - "epoch": 0.88, - "learning_rate": 1.659623153536335e-06, - "loss": 0.8613, - "step": 34248 - }, - { - "epoch": 0.88, - "learning_rate": 1.6596023562675786e-06, - "loss": 0.8936, - "step": 34249 - }, - { - "epoch": 0.88, - "learning_rate": 1.659581558493795e-06, - "loss": 0.5469, - "step": 34250 - }, - { - "epoch": 0.88, - "learning_rate": 1.6595607602149997e-06, - "loss": 0.9058, - "step": 34251 - }, - { - "epoch": 0.88, - "learning_rate": 1.6595399614312094e-06, - "loss": 0.9668, - "step": 34252 - }, - { - "epoch": 0.88, - "learning_rate": 1.6595191621424394e-06, - "loss": 0.8662, - "step": 34253 - }, - { - "epoch": 0.88, - "learning_rate": 1.6594983623487063e-06, - "loss": 0.9834, - "step": 34254 - }, - { - "epoch": 0.88, - "learning_rate": 1.659477562050025e-06, - "loss": 0.9697, - "step": 34255 - }, - { - "epoch": 0.88, - "learning_rate": 1.6594567612464128e-06, - "loss": 0.7827, - "step": 34256 - }, - { - "epoch": 0.88, - "learning_rate": 1.6594359599378845e-06, - "loss": 0.8025, - "step": 34257 - }, - { - "epoch": 0.88, - "learning_rate": 1.6594151581244561e-06, - "loss": 0.7976, - "step": 34258 - }, - { - "epoch": 0.88, - "learning_rate": 1.6593943558061442e-06, - "loss": 0.6943, - "step": 34259 - }, - { - "epoch": 0.88, - "learning_rate": 1.6593735529829645e-06, - "loss": 0.8633, - "step": 34260 - }, - { - "epoch": 0.88, - "learning_rate": 1.6593527496549328e-06, - "loss": 0.9775, - "step": 34261 - }, - { - "epoch": 0.88, - "learning_rate": 1.6593319458220648e-06, - "loss": 0.9199, - "step": 34262 - }, - { - "epoch": 0.88, - "learning_rate": 1.6593111414843769e-06, - "loss": 1.0557, - "step": 34263 - }, - { - "epoch": 0.88, - "learning_rate": 1.6592903366418841e-06, - "loss": 0.9131, - "step": 34264 - }, - { - "epoch": 0.88, - "learning_rate": 1.6592695312946034e-06, - "loss": 1.0869, - "step": 34265 - }, - { - "epoch": 0.88, - "learning_rate": 1.6592487254425508e-06, - "loss": 1.0879, - "step": 34266 - }, - { - "epoch": 0.88, - "learning_rate": 1.6592279190857412e-06, - "loss": 0.563, - "step": 34267 - }, - { - "epoch": 0.88, - "learning_rate": 1.6592071122241913e-06, - "loss": 0.6777, - "step": 34268 - }, - { - "epoch": 0.88, - "learning_rate": 1.6591863048579167e-06, - "loss": 0.8291, - "step": 34269 - }, - { - "epoch": 0.88, - "learning_rate": 1.6591654969869335e-06, - "loss": 0.8408, - "step": 34270 - }, - { - "epoch": 0.88, - "learning_rate": 1.6591446886112578e-06, - "loss": 0.9014, - "step": 34271 - }, - { - "epoch": 0.88, - "learning_rate": 1.659123879730905e-06, - "loss": 0.9023, - "step": 34272 - }, - { - "epoch": 0.88, - "learning_rate": 1.6591030703458917e-06, - "loss": 0.7671, - "step": 34273 - }, - { - "epoch": 0.88, - "learning_rate": 1.659082260456233e-06, - "loss": 0.7471, - "step": 34274 - }, - { - "epoch": 0.88, - "learning_rate": 1.6590614500619457e-06, - "loss": 0.9492, - "step": 34275 - }, - { - "epoch": 0.88, - "learning_rate": 1.6590406391630454e-06, - "loss": 0.916, - "step": 34276 - }, - { - "epoch": 0.88, - "learning_rate": 1.6590198277595477e-06, - "loss": 0.6265, - "step": 34277 - }, - { - "epoch": 0.88, - "learning_rate": 1.6589990158514691e-06, - "loss": 0.9111, - "step": 34278 - }, - { - "epoch": 0.88, - "learning_rate": 1.658978203438825e-06, - "loss": 0.834, - "step": 34279 - }, - { - "epoch": 0.88, - "learning_rate": 1.6589573905216318e-06, - "loss": 0.7124, - "step": 34280 - }, - { - "epoch": 0.88, - "learning_rate": 1.6589365770999053e-06, - "loss": 0.8428, - "step": 34281 - }, - { - "epoch": 0.88, - "learning_rate": 1.658915763173661e-06, - "loss": 1.0938, - "step": 34282 - }, - { - "epoch": 0.88, - "learning_rate": 1.6588949487429154e-06, - "loss": 0.7793, - "step": 34283 - }, - { - "epoch": 0.88, - "learning_rate": 1.6588741338076844e-06, - "loss": 0.9062, - "step": 34284 - }, - { - "epoch": 0.88, - "learning_rate": 1.6588533183679833e-06, - "loss": 0.6089, - "step": 34285 - }, - { - "epoch": 0.88, - "learning_rate": 1.658832502423829e-06, - "loss": 0.8838, - "step": 34286 - }, - { - "epoch": 0.88, - "learning_rate": 1.6588116859752367e-06, - "loss": 0.9971, - "step": 34287 - }, - { - "epoch": 0.88, - "learning_rate": 1.6587908690222227e-06, - "loss": 0.8369, - "step": 34288 - }, - { - "epoch": 0.88, - "learning_rate": 1.6587700515648026e-06, - "loss": 0.9004, - "step": 34289 - }, - { - "epoch": 0.88, - "learning_rate": 1.6587492336029927e-06, - "loss": 0.8691, - "step": 34290 - }, - { - "epoch": 0.88, - "learning_rate": 1.6587284151368093e-06, - "loss": 0.7393, - "step": 34291 - }, - { - "epoch": 0.88, - "learning_rate": 1.6587075961662672e-06, - "loss": 0.7861, - "step": 34292 - }, - { - "epoch": 0.88, - "learning_rate": 1.658686776691383e-06, - "loss": 0.6919, - "step": 34293 - }, - { - "epoch": 0.88, - "learning_rate": 1.6586659567121729e-06, - "loss": 0.5806, - "step": 34294 - }, - { - "epoch": 0.88, - "learning_rate": 1.6586451362286522e-06, - "loss": 0.7402, - "step": 34295 - }, - { - "epoch": 0.88, - "learning_rate": 1.6586243152408376e-06, - "loss": 0.7285, - "step": 34296 - }, - { - "epoch": 0.88, - "learning_rate": 1.6586034937487445e-06, - "loss": 0.6689, - "step": 34297 - }, - { - "epoch": 0.88, - "learning_rate": 1.658582671752389e-06, - "loss": 0.8877, - "step": 34298 - }, - { - "epoch": 0.88, - "learning_rate": 1.6585618492517868e-06, - "loss": 0.7812, - "step": 34299 - }, - { - "epoch": 0.88, - "learning_rate": 1.6585410262469544e-06, - "loss": 0.9775, - "step": 34300 - }, - { - "epoch": 0.88, - "learning_rate": 1.6585202027379075e-06, - "loss": 0.7954, - "step": 34301 - }, - { - "epoch": 0.88, - "learning_rate": 1.6584993787246616e-06, - "loss": 0.876, - "step": 34302 - }, - { - "epoch": 0.88, - "learning_rate": 1.658478554207233e-06, - "loss": 0.8027, - "step": 34303 - }, - { - "epoch": 0.88, - "learning_rate": 1.6584577291856378e-06, - "loss": 0.6594, - "step": 34304 - }, - { - "epoch": 0.88, - "learning_rate": 1.658436903659892e-06, - "loss": 0.8154, - "step": 34305 - }, - { - "epoch": 0.88, - "learning_rate": 1.658416077630011e-06, - "loss": 0.7168, - "step": 34306 - }, - { - "epoch": 0.88, - "learning_rate": 1.6583952510960115e-06, - "loss": 0.959, - "step": 34307 - }, - { - "epoch": 0.88, - "learning_rate": 1.6583744240579085e-06, - "loss": 1.1162, - "step": 34308 - }, - { - "epoch": 0.88, - "learning_rate": 1.6583535965157189e-06, - "loss": 0.7617, - "step": 34309 - }, - { - "epoch": 0.88, - "learning_rate": 1.658332768469458e-06, - "loss": 1.0615, - "step": 34310 - }, - { - "epoch": 0.88, - "learning_rate": 1.6583119399191422e-06, - "loss": 0.8247, - "step": 34311 - }, - { - "epoch": 0.88, - "learning_rate": 1.658291110864787e-06, - "loss": 0.7583, - "step": 34312 - }, - { - "epoch": 0.88, - "learning_rate": 1.6582702813064086e-06, - "loss": 0.7163, - "step": 34313 - }, - { - "epoch": 0.88, - "learning_rate": 1.6582494512440228e-06, - "loss": 0.9092, - "step": 34314 - }, - { - "epoch": 0.88, - "learning_rate": 1.658228620677646e-06, - "loss": 0.6323, - "step": 34315 - }, - { - "epoch": 0.88, - "learning_rate": 1.6582077896072935e-06, - "loss": 1.04, - "step": 34316 - }, - { - "epoch": 0.88, - "learning_rate": 1.6581869580329815e-06, - "loss": 0.7715, - "step": 34317 - }, - { - "epoch": 0.88, - "learning_rate": 1.658166125954726e-06, - "loss": 0.9639, - "step": 34318 - }, - { - "epoch": 0.88, - "learning_rate": 1.6581452933725434e-06, - "loss": 0.7559, - "step": 34319 - }, - { - "epoch": 0.88, - "learning_rate": 1.6581244602864488e-06, - "loss": 0.897, - "step": 34320 - }, - { - "epoch": 0.88, - "learning_rate": 1.6581036266964587e-06, - "loss": 0.9775, - "step": 34321 - }, - { - "epoch": 0.88, - "learning_rate": 1.658082792602589e-06, - "loss": 1.0732, - "step": 34322 - }, - { - "epoch": 0.88, - "learning_rate": 1.6580619580048555e-06, - "loss": 0.8604, - "step": 34323 - }, - { - "epoch": 0.88, - "learning_rate": 1.6580411229032742e-06, - "loss": 0.9775, - "step": 34324 - }, - { - "epoch": 0.88, - "learning_rate": 1.658020287297861e-06, - "loss": 0.6465, - "step": 34325 - }, - { - "epoch": 0.88, - "learning_rate": 1.6579994511886322e-06, - "loss": 0.6143, - "step": 34326 - }, - { - "epoch": 0.88, - "learning_rate": 1.6579786145756031e-06, - "loss": 0.9512, - "step": 34327 - }, - { - "epoch": 0.88, - "learning_rate": 1.6579577774587902e-06, - "loss": 0.874, - "step": 34328 - }, - { - "epoch": 0.88, - "learning_rate": 1.6579369398382093e-06, - "loss": 0.8149, - "step": 34329 - }, - { - "epoch": 0.88, - "learning_rate": 1.6579161017138763e-06, - "loss": 0.875, - "step": 34330 - }, - { - "epoch": 0.88, - "learning_rate": 1.6578952630858073e-06, - "loss": 0.8691, - "step": 34331 - }, - { - "epoch": 0.88, - "learning_rate": 1.6578744239540182e-06, - "loss": 0.873, - "step": 34332 - }, - { - "epoch": 0.88, - "learning_rate": 1.6578535843185246e-06, - "loss": 0.8457, - "step": 34333 - }, - { - "epoch": 0.88, - "learning_rate": 1.657832744179343e-06, - "loss": 0.8789, - "step": 34334 - }, - { - "epoch": 0.88, - "learning_rate": 1.6578119035364888e-06, - "loss": 0.7139, - "step": 34335 - }, - { - "epoch": 0.88, - "learning_rate": 1.6577910623899789e-06, - "loss": 0.7905, - "step": 34336 - }, - { - "epoch": 0.88, - "learning_rate": 1.657770220739828e-06, - "loss": 0.7285, - "step": 34337 - }, - { - "epoch": 0.88, - "learning_rate": 1.657749378586053e-06, - "loss": 0.6013, - "step": 34338 - }, - { - "epoch": 0.88, - "learning_rate": 1.6577285359286694e-06, - "loss": 0.7295, - "step": 34339 - }, - { - "epoch": 0.88, - "learning_rate": 1.6577076927676935e-06, - "loss": 0.75, - "step": 34340 - }, - { - "epoch": 0.88, - "learning_rate": 1.657686849103141e-06, - "loss": 0.9336, - "step": 34341 - }, - { - "epoch": 0.88, - "learning_rate": 1.6576660049350278e-06, - "loss": 0.6709, - "step": 34342 - }, - { - "epoch": 0.88, - "learning_rate": 1.65764516026337e-06, - "loss": 0.7434, - "step": 34343 - }, - { - "epoch": 0.88, - "learning_rate": 1.6576243150881834e-06, - "loss": 0.7891, - "step": 34344 - }, - { - "epoch": 0.88, - "learning_rate": 1.6576034694094845e-06, - "loss": 0.7178, - "step": 34345 - }, - { - "epoch": 0.88, - "learning_rate": 1.6575826232272886e-06, - "loss": 0.603, - "step": 34346 - }, - { - "epoch": 0.88, - "learning_rate": 1.6575617765416122e-06, - "loss": 0.8242, - "step": 34347 - }, - { - "epoch": 0.88, - "learning_rate": 1.6575409293524705e-06, - "loss": 0.9355, - "step": 34348 - }, - { - "epoch": 0.88, - "learning_rate": 1.65752008165988e-06, - "loss": 0.8457, - "step": 34349 - }, - { - "epoch": 0.88, - "learning_rate": 1.657499233463857e-06, - "loss": 0.8154, - "step": 34350 - }, - { - "epoch": 0.88, - "learning_rate": 1.657478384764417e-06, - "loss": 0.7456, - "step": 34351 - }, - { - "epoch": 0.88, - "learning_rate": 1.6574575355615759e-06, - "loss": 0.9551, - "step": 34352 - }, - { - "epoch": 0.88, - "learning_rate": 1.6574366858553497e-06, - "loss": 0.7524, - "step": 34353 - }, - { - "epoch": 0.88, - "learning_rate": 1.6574158356457546e-06, - "loss": 0.9453, - "step": 34354 - }, - { - "epoch": 0.88, - "learning_rate": 1.6573949849328065e-06, - "loss": 0.6885, - "step": 34355 - }, - { - "epoch": 0.88, - "learning_rate": 1.657374133716521e-06, - "loss": 0.9727, - "step": 34356 - }, - { - "epoch": 0.88, - "learning_rate": 1.6573532819969144e-06, - "loss": 0.8408, - "step": 34357 - }, - { - "epoch": 0.88, - "learning_rate": 1.6573324297740028e-06, - "loss": 0.9492, - "step": 34358 - }, - { - "epoch": 0.88, - "learning_rate": 1.6573115770478018e-06, - "loss": 0.8604, - "step": 34359 - }, - { - "epoch": 0.88, - "learning_rate": 1.6572907238183278e-06, - "loss": 0.7578, - "step": 34360 - }, - { - "epoch": 0.88, - "learning_rate": 1.6572698700855962e-06, - "loss": 0.7783, - "step": 34361 - }, - { - "epoch": 0.88, - "learning_rate": 1.6572490158496234e-06, - "loss": 0.6738, - "step": 34362 - }, - { - "epoch": 0.88, - "learning_rate": 1.6572281611104255e-06, - "loss": 0.9385, - "step": 34363 - }, - { - "epoch": 0.88, - "learning_rate": 1.657207305868018e-06, - "loss": 0.8252, - "step": 34364 - }, - { - "epoch": 0.88, - "learning_rate": 1.6571864501224174e-06, - "loss": 0.8149, - "step": 34365 - }, - { - "epoch": 0.88, - "learning_rate": 1.6571655938736391e-06, - "loss": 0.8506, - "step": 34366 - }, - { - "epoch": 0.88, - "learning_rate": 1.657144737121699e-06, - "loss": 1.0176, - "step": 34367 - }, - { - "epoch": 0.88, - "learning_rate": 1.6571238798666137e-06, - "loss": 0.7217, - "step": 34368 - }, - { - "epoch": 0.88, - "learning_rate": 1.6571030221083988e-06, - "loss": 0.7095, - "step": 34369 - }, - { - "epoch": 0.88, - "learning_rate": 1.6570821638470704e-06, - "loss": 0.9229, - "step": 34370 - }, - { - "epoch": 0.88, - "learning_rate": 1.6570613050826445e-06, - "loss": 0.8945, - "step": 34371 - }, - { - "epoch": 0.88, - "learning_rate": 1.6570404458151367e-06, - "loss": 0.7842, - "step": 34372 - }, - { - "epoch": 0.88, - "learning_rate": 1.6570195860445635e-06, - "loss": 0.5664, - "step": 34373 - }, - { - "epoch": 0.88, - "learning_rate": 1.6569987257709403e-06, - "loss": 0.873, - "step": 34374 - }, - { - "epoch": 0.88, - "learning_rate": 1.6569778649942836e-06, - "loss": 0.8633, - "step": 34375 - }, - { - "epoch": 0.88, - "learning_rate": 1.6569570037146095e-06, - "loss": 0.7402, - "step": 34376 - }, - { - "epoch": 0.88, - "learning_rate": 1.6569361419319333e-06, - "loss": 0.5537, - "step": 34377 - }, - { - "epoch": 0.88, - "learning_rate": 1.6569152796462711e-06, - "loss": 0.9297, - "step": 34378 - }, - { - "epoch": 0.88, - "learning_rate": 1.6568944168576393e-06, - "loss": 0.8613, - "step": 34379 - }, - { - "epoch": 0.88, - "learning_rate": 1.6568735535660533e-06, - "loss": 0.9268, - "step": 34380 - }, - { - "epoch": 0.88, - "learning_rate": 1.6568526897715303e-06, - "loss": 0.6685, - "step": 34381 - }, - { - "epoch": 0.88, - "learning_rate": 1.6568318254740844e-06, - "loss": 0.7773, - "step": 34382 - }, - { - "epoch": 0.88, - "learning_rate": 1.656810960673733e-06, - "loss": 0.9326, - "step": 34383 - }, - { - "epoch": 0.88, - "learning_rate": 1.656790095370492e-06, - "loss": 0.8633, - "step": 34384 - }, - { - "epoch": 0.88, - "learning_rate": 1.6567692295643764e-06, - "loss": 0.79, - "step": 34385 - }, - { - "epoch": 0.88, - "learning_rate": 1.656748363255403e-06, - "loss": 0.7639, - "step": 34386 - }, - { - "epoch": 0.88, - "learning_rate": 1.6567274964435877e-06, - "loss": 0.9062, - "step": 34387 - }, - { - "epoch": 0.88, - "learning_rate": 1.6567066291289463e-06, - "loss": 0.8545, - "step": 34388 - }, - { - "epoch": 0.88, - "learning_rate": 1.6566857613114947e-06, - "loss": 0.7612, - "step": 34389 - }, - { - "epoch": 0.88, - "learning_rate": 1.6566648929912493e-06, - "loss": 0.7451, - "step": 34390 - }, - { - "epoch": 0.88, - "learning_rate": 1.6566440241682256e-06, - "loss": 0.8779, - "step": 34391 - }, - { - "epoch": 0.88, - "learning_rate": 1.6566231548424398e-06, - "loss": 0.8506, - "step": 34392 - }, - { - "epoch": 0.88, - "learning_rate": 1.656602285013908e-06, - "loss": 0.9434, - "step": 34393 - }, - { - "epoch": 0.88, - "learning_rate": 1.6565814146826455e-06, - "loss": 0.709, - "step": 34394 - }, - { - "epoch": 0.88, - "learning_rate": 1.6565605438486695e-06, - "loss": 0.7773, - "step": 34395 - }, - { - "epoch": 0.88, - "learning_rate": 1.6565396725119948e-06, - "loss": 0.8291, - "step": 34396 - }, - { - "epoch": 0.88, - "learning_rate": 1.6565188006726381e-06, - "loss": 1.0176, - "step": 34397 - }, - { - "epoch": 0.88, - "learning_rate": 1.6564979283306148e-06, - "loss": 0.8633, - "step": 34398 - }, - { - "epoch": 0.88, - "learning_rate": 1.6564770554859418e-06, - "loss": 0.7114, - "step": 34399 - }, - { - "epoch": 0.88, - "learning_rate": 1.656456182138634e-06, - "loss": 0.8037, - "step": 34400 - }, - { - "epoch": 0.88, - "learning_rate": 1.6564353082887081e-06, - "loss": 0.8174, - "step": 34401 - }, - { - "epoch": 0.88, - "learning_rate": 1.6564144339361799e-06, - "loss": 0.874, - "step": 34402 - }, - { - "epoch": 0.88, - "learning_rate": 1.6563935590810653e-06, - "loss": 0.8428, - "step": 34403 - }, - { - "epoch": 0.88, - "learning_rate": 1.6563726837233802e-06, - "loss": 0.9717, - "step": 34404 - }, - { - "epoch": 0.88, - "learning_rate": 1.6563518078631407e-06, - "loss": 1.0225, - "step": 34405 - }, - { - "epoch": 0.88, - "learning_rate": 1.6563309315003631e-06, - "loss": 0.876, - "step": 34406 - }, - { - "epoch": 0.88, - "learning_rate": 1.6563100546350627e-06, - "loss": 0.6743, - "step": 34407 - }, - { - "epoch": 0.88, - "learning_rate": 1.656289177267256e-06, - "loss": 0.8691, - "step": 34408 - }, - { - "epoch": 0.88, - "learning_rate": 1.656268299396959e-06, - "loss": 0.8047, - "step": 34409 - }, - { - "epoch": 0.88, - "learning_rate": 1.6562474210241878e-06, - "loss": 0.8496, - "step": 34410 - }, - { - "epoch": 0.88, - "learning_rate": 1.6562265421489576e-06, - "loss": 0.7964, - "step": 34411 - }, - { - "epoch": 0.88, - "learning_rate": 1.6562056627712852e-06, - "loss": 0.875, - "step": 34412 - }, - { - "epoch": 0.88, - "learning_rate": 1.6561847828911862e-06, - "loss": 0.8311, - "step": 34413 - }, - { - "epoch": 0.88, - "learning_rate": 1.6561639025086764e-06, - "loss": 0.7568, - "step": 34414 - }, - { - "epoch": 0.88, - "learning_rate": 1.6561430216237726e-06, - "loss": 0.6426, - "step": 34415 - }, - { - "epoch": 0.88, - "learning_rate": 1.65612214023649e-06, - "loss": 0.9707, - "step": 34416 - }, - { - "epoch": 0.88, - "learning_rate": 1.6561012583468448e-06, - "loss": 0.6792, - "step": 34417 - }, - { - "epoch": 0.88, - "learning_rate": 1.6560803759548532e-06, - "loss": 0.9678, - "step": 34418 - }, - { - "epoch": 0.88, - "learning_rate": 1.656059493060531e-06, - "loss": 0.8555, - "step": 34419 - }, - { - "epoch": 0.88, - "learning_rate": 1.6560386096638941e-06, - "loss": 0.7686, - "step": 34420 - }, - { - "epoch": 0.88, - "learning_rate": 1.6560177257649586e-06, - "loss": 0.6611, - "step": 34421 - }, - { - "epoch": 0.88, - "learning_rate": 1.6559968413637405e-06, - "loss": 0.7783, - "step": 34422 - }, - { - "epoch": 0.88, - "learning_rate": 1.6559759564602558e-06, - "loss": 0.8052, - "step": 34423 - }, - { - "epoch": 0.88, - "learning_rate": 1.6559550710545204e-06, - "loss": 0.9814, - "step": 34424 - }, - { - "epoch": 0.88, - "learning_rate": 1.6559341851465504e-06, - "loss": 0.8789, - "step": 34425 - }, - { - "epoch": 0.88, - "learning_rate": 1.6559132987363618e-06, - "loss": 0.9385, - "step": 34426 - }, - { - "epoch": 0.88, - "learning_rate": 1.6558924118239706e-06, - "loss": 0.9199, - "step": 34427 - }, - { - "epoch": 0.88, - "learning_rate": 1.6558715244093928e-06, - "loss": 0.7402, - "step": 34428 - }, - { - "epoch": 0.88, - "learning_rate": 1.655850636492644e-06, - "loss": 0.9121, - "step": 34429 - }, - { - "epoch": 0.88, - "learning_rate": 1.6558297480737408e-06, - "loss": 0.7715, - "step": 34430 - }, - { - "epoch": 0.88, - "learning_rate": 1.655808859152699e-06, - "loss": 1.0635, - "step": 34431 - }, - { - "epoch": 0.88, - "learning_rate": 1.6557879697295342e-06, - "loss": 0.8486, - "step": 34432 - }, - { - "epoch": 0.88, - "learning_rate": 1.655767079804263e-06, - "loss": 0.7126, - "step": 34433 - }, - { - "epoch": 0.88, - "learning_rate": 1.655746189376901e-06, - "loss": 0.6156, - "step": 34434 - }, - { - "epoch": 0.88, - "learning_rate": 1.6557252984474644e-06, - "loss": 0.8584, - "step": 34435 - }, - { - "epoch": 0.88, - "learning_rate": 1.655704407015969e-06, - "loss": 0.7073, - "step": 34436 - }, - { - "epoch": 0.88, - "learning_rate": 1.6556835150824306e-06, - "loss": 0.9824, - "step": 34437 - }, - { - "epoch": 0.88, - "learning_rate": 1.6556626226468657e-06, - "loss": 0.583, - "step": 34438 - }, - { - "epoch": 0.88, - "learning_rate": 1.65564172970929e-06, - "loss": 0.7046, - "step": 34439 - }, - { - "epoch": 0.88, - "learning_rate": 1.65562083626972e-06, - "loss": 0.8652, - "step": 34440 - }, - { - "epoch": 0.88, - "learning_rate": 1.655599942328171e-06, - "loss": 0.9053, - "step": 34441 - }, - { - "epoch": 0.88, - "learning_rate": 1.6555790478846592e-06, - "loss": 0.8408, - "step": 34442 - }, - { - "epoch": 0.88, - "learning_rate": 1.6555581529392004e-06, - "loss": 0.9033, - "step": 34443 - }, - { - "epoch": 0.88, - "learning_rate": 1.6555372574918113e-06, - "loss": 0.833, - "step": 34444 - }, - { - "epoch": 0.88, - "learning_rate": 1.6555163615425075e-06, - "loss": 0.9697, - "step": 34445 - }, - { - "epoch": 0.88, - "learning_rate": 1.6554954650913047e-06, - "loss": 0.8857, - "step": 34446 - }, - { - "epoch": 0.88, - "learning_rate": 1.6554745681382192e-06, - "loss": 0.8018, - "step": 34447 - }, - { - "epoch": 0.88, - "learning_rate": 1.6554536706832671e-06, - "loss": 0.6953, - "step": 34448 - }, - { - "epoch": 0.88, - "learning_rate": 1.655432772726464e-06, - "loss": 0.8008, - "step": 34449 - }, - { - "epoch": 0.88, - "learning_rate": 1.6554118742678265e-06, - "loss": 0.8838, - "step": 34450 - }, - { - "epoch": 0.88, - "learning_rate": 1.65539097530737e-06, - "loss": 0.8467, - "step": 34451 - }, - { - "epoch": 0.88, - "learning_rate": 1.6553700758451109e-06, - "loss": 0.5132, - "step": 34452 - }, - { - "epoch": 0.88, - "learning_rate": 1.6553491758810649e-06, - "loss": 0.7666, - "step": 34453 - }, - { - "epoch": 0.88, - "learning_rate": 1.6553282754152484e-06, - "loss": 0.6992, - "step": 34454 - }, - { - "epoch": 0.88, - "learning_rate": 1.6553073744476772e-06, - "loss": 0.7471, - "step": 34455 - }, - { - "epoch": 0.88, - "learning_rate": 1.655286472978367e-06, - "loss": 0.8159, - "step": 34456 - }, - { - "epoch": 0.88, - "learning_rate": 1.6552655710073342e-06, - "loss": 0.7451, - "step": 34457 - }, - { - "epoch": 0.88, - "learning_rate": 1.655244668534595e-06, - "loss": 0.7764, - "step": 34458 - }, - { - "epoch": 0.88, - "learning_rate": 1.6552237655601645e-06, - "loss": 0.8525, - "step": 34459 - }, - { - "epoch": 0.88, - "learning_rate": 1.6552028620840596e-06, - "loss": 0.4675, - "step": 34460 - }, - { - "epoch": 0.88, - "learning_rate": 1.6551819581062963e-06, - "loss": 0.8809, - "step": 34461 - }, - { - "epoch": 0.88, - "learning_rate": 1.6551610536268896e-06, - "loss": 0.8555, - "step": 34462 - }, - { - "epoch": 0.88, - "learning_rate": 1.6551401486458567e-06, - "loss": 0.8701, - "step": 34463 - }, - { - "epoch": 0.88, - "learning_rate": 1.6551192431632132e-06, - "loss": 0.7832, - "step": 34464 - }, - { - "epoch": 0.88, - "learning_rate": 1.6550983371789747e-06, - "loss": 0.8281, - "step": 34465 - }, - { - "epoch": 0.88, - "learning_rate": 1.6550774306931577e-06, - "loss": 0.8525, - "step": 34466 - }, - { - "epoch": 0.88, - "learning_rate": 1.655056523705778e-06, - "loss": 0.7852, - "step": 34467 - }, - { - "epoch": 0.88, - "learning_rate": 1.6550356162168515e-06, - "loss": 1.082, - "step": 34468 - }, - { - "epoch": 0.88, - "learning_rate": 1.6550147082263944e-06, - "loss": 0.9902, - "step": 34469 - }, - { - "epoch": 0.88, - "learning_rate": 1.6549937997344228e-06, - "loss": 0.7646, - "step": 34470 - }, - { - "epoch": 0.88, - "learning_rate": 1.6549728907409524e-06, - "loss": 0.7188, - "step": 34471 - }, - { - "epoch": 0.88, - "learning_rate": 1.6549519812459996e-06, - "loss": 0.8945, - "step": 34472 - }, - { - "epoch": 0.88, - "learning_rate": 1.65493107124958e-06, - "loss": 0.4934, - "step": 34473 - }, - { - "epoch": 0.88, - "learning_rate": 1.6549101607517098e-06, - "loss": 0.772, - "step": 34474 - }, - { - "epoch": 0.88, - "learning_rate": 1.6548892497524053e-06, - "loss": 0.9111, - "step": 34475 - }, - { - "epoch": 0.88, - "learning_rate": 1.6548683382516816e-06, - "loss": 0.71, - "step": 34476 - }, - { - "epoch": 0.88, - "learning_rate": 1.6548474262495557e-06, - "loss": 0.7188, - "step": 34477 - }, - { - "epoch": 0.88, - "learning_rate": 1.6548265137460433e-06, - "loss": 0.7783, - "step": 34478 - }, - { - "epoch": 0.88, - "learning_rate": 1.6548056007411604e-06, - "loss": 0.7468, - "step": 34479 - }, - { - "epoch": 0.88, - "learning_rate": 1.654784687234923e-06, - "loss": 0.958, - "step": 34480 - }, - { - "epoch": 0.88, - "learning_rate": 1.6547637732273468e-06, - "loss": 0.918, - "step": 34481 - }, - { - "epoch": 0.88, - "learning_rate": 1.6547428587184479e-06, - "loss": 0.6821, - "step": 34482 - }, - { - "epoch": 0.88, - "learning_rate": 1.6547219437082429e-06, - "loss": 0.8057, - "step": 34483 - }, - { - "epoch": 0.88, - "learning_rate": 1.6547010281967473e-06, - "loss": 0.5962, - "step": 34484 - }, - { - "epoch": 0.88, - "learning_rate": 1.6546801121839773e-06, - "loss": 0.875, - "step": 34485 - }, - { - "epoch": 0.88, - "learning_rate": 1.6546591956699488e-06, - "loss": 0.7244, - "step": 34486 - }, - { - "epoch": 0.88, - "learning_rate": 1.6546382786546779e-06, - "loss": 0.8926, - "step": 34487 - }, - { - "epoch": 0.88, - "learning_rate": 1.6546173611381803e-06, - "loss": 1.0742, - "step": 34488 - }, - { - "epoch": 0.88, - "learning_rate": 1.6545964431204724e-06, - "loss": 0.7451, - "step": 34489 - }, - { - "epoch": 0.88, - "learning_rate": 1.6545755246015704e-06, - "loss": 1.0068, - "step": 34490 - }, - { - "epoch": 0.88, - "learning_rate": 1.6545546055814898e-06, - "loss": 1.1768, - "step": 34491 - }, - { - "epoch": 0.88, - "learning_rate": 1.6545336860602467e-06, - "loss": 0.729, - "step": 34492 - }, - { - "epoch": 0.88, - "learning_rate": 1.6545127660378574e-06, - "loss": 0.7874, - "step": 34493 - }, - { - "epoch": 0.88, - "learning_rate": 1.6544918455143376e-06, - "loss": 0.7021, - "step": 34494 - }, - { - "epoch": 0.88, - "learning_rate": 1.6544709244897036e-06, - "loss": 0.8896, - "step": 34495 - }, - { - "epoch": 0.88, - "learning_rate": 1.6544500029639717e-06, - "loss": 0.7539, - "step": 34496 - }, - { - "epoch": 0.88, - "learning_rate": 1.654429080937157e-06, - "loss": 0.8643, - "step": 34497 - }, - { - "epoch": 0.88, - "learning_rate": 1.6544081584092763e-06, - "loss": 1.0723, - "step": 34498 - }, - { - "epoch": 0.88, - "learning_rate": 1.6543872353803453e-06, - "loss": 0.666, - "step": 34499 - }, - { - "epoch": 0.88, - "learning_rate": 1.65436631185038e-06, - "loss": 0.7461, - "step": 34500 - }, - { - "epoch": 0.88, - "learning_rate": 1.6543453878193968e-06, - "loss": 0.9912, - "step": 34501 - }, - { - "epoch": 0.88, - "learning_rate": 1.6543244632874109e-06, - "loss": 0.9854, - "step": 34502 - }, - { - "epoch": 0.88, - "learning_rate": 1.6543035382544393e-06, - "loss": 1.123, - "step": 34503 - }, - { - "epoch": 0.88, - "learning_rate": 1.6542826127204972e-06, - "loss": 0.9912, - "step": 34504 - }, - { - "epoch": 0.88, - "learning_rate": 1.6542616866856017e-06, - "loss": 1.0908, - "step": 34505 - }, - { - "epoch": 0.88, - "learning_rate": 1.6542407601497673e-06, - "loss": 0.8252, - "step": 34506 - }, - { - "epoch": 0.88, - "learning_rate": 1.6542198331130114e-06, - "loss": 0.8906, - "step": 34507 - }, - { - "epoch": 0.88, - "learning_rate": 1.654198905575349e-06, - "loss": 0.6123, - "step": 34508 - }, - { - "epoch": 0.88, - "learning_rate": 1.6541779775367966e-06, - "loss": 0.6273, - "step": 34509 - }, - { - "epoch": 0.88, - "learning_rate": 1.6541570489973707e-06, - "loss": 0.6318, - "step": 34510 - }, - { - "epoch": 0.88, - "learning_rate": 1.6541361199570863e-06, - "loss": 0.9326, - "step": 34511 - }, - { - "epoch": 0.88, - "learning_rate": 1.6541151904159603e-06, - "loss": 0.7979, - "step": 34512 - }, - { - "epoch": 0.88, - "learning_rate": 1.6540942603740081e-06, - "loss": 0.9043, - "step": 34513 - }, - { - "epoch": 0.88, - "learning_rate": 1.654073329831246e-06, - "loss": 0.6992, - "step": 34514 - }, - { - "epoch": 0.88, - "learning_rate": 1.6540523987876903e-06, - "loss": 0.8389, - "step": 34515 - }, - { - "epoch": 0.88, - "learning_rate": 1.6540314672433567e-06, - "loss": 0.7461, - "step": 34516 - }, - { - "epoch": 0.88, - "learning_rate": 1.6540105351982611e-06, - "loss": 0.8623, - "step": 34517 - }, - { - "epoch": 0.88, - "learning_rate": 1.6539896026524199e-06, - "loss": 0.6924, - "step": 34518 - }, - { - "epoch": 0.88, - "learning_rate": 1.6539686696058487e-06, - "loss": 0.5852, - "step": 34519 - }, - { - "epoch": 0.88, - "learning_rate": 1.6539477360585638e-06, - "loss": 0.666, - "step": 34520 - }, - { - "epoch": 0.88, - "learning_rate": 1.6539268020105815e-06, - "loss": 0.448, - "step": 34521 - }, - { - "epoch": 0.88, - "learning_rate": 1.6539058674619173e-06, - "loss": 0.8574, - "step": 34522 - }, - { - "epoch": 0.88, - "learning_rate": 1.6538849324125871e-06, - "loss": 0.8755, - "step": 34523 - }, - { - "epoch": 0.88, - "learning_rate": 1.6538639968626078e-06, - "loss": 0.5488, - "step": 34524 - }, - { - "epoch": 0.88, - "learning_rate": 1.6538430608119947e-06, - "loss": 0.6567, - "step": 34525 - }, - { - "epoch": 0.88, - "learning_rate": 1.6538221242607641e-06, - "loss": 0.7383, - "step": 34526 - }, - { - "epoch": 0.88, - "learning_rate": 1.6538011872089318e-06, - "loss": 0.9766, - "step": 34527 - }, - { - "epoch": 0.88, - "learning_rate": 1.6537802496565143e-06, - "loss": 0.772, - "step": 34528 - }, - { - "epoch": 0.88, - "learning_rate": 1.653759311603527e-06, - "loss": 0.9727, - "step": 34529 - }, - { - "epoch": 0.89, - "learning_rate": 1.6537383730499865e-06, - "loss": 0.7969, - "step": 34530 - }, - { - "epoch": 0.89, - "learning_rate": 1.6537174339959083e-06, - "loss": 0.668, - "step": 34531 - }, - { - "epoch": 0.89, - "learning_rate": 1.653696494441309e-06, - "loss": 0.9717, - "step": 34532 - }, - { - "epoch": 0.89, - "learning_rate": 1.6536755543862042e-06, - "loss": 1.0986, - "step": 34533 - }, - { - "epoch": 0.89, - "learning_rate": 1.6536546138306102e-06, - "loss": 0.8623, - "step": 34534 - }, - { - "epoch": 0.89, - "learning_rate": 1.6536336727745427e-06, - "loss": 1.0361, - "step": 34535 - }, - { - "epoch": 0.89, - "learning_rate": 1.6536127312180183e-06, - "loss": 1.0195, - "step": 34536 - }, - { - "epoch": 0.89, - "learning_rate": 1.6535917891610524e-06, - "loss": 0.915, - "step": 34537 - }, - { - "epoch": 0.89, - "learning_rate": 1.6535708466036616e-06, - "loss": 0.5605, - "step": 34538 - }, - { - "epoch": 0.89, - "learning_rate": 1.653549903545861e-06, - "loss": 0.873, - "step": 34539 - }, - { - "epoch": 0.89, - "learning_rate": 1.653528959987668e-06, - "loss": 1.001, - "step": 34540 - }, - { - "epoch": 0.89, - "learning_rate": 1.6535080159290974e-06, - "loss": 0.96, - "step": 34541 - }, - { - "epoch": 0.89, - "learning_rate": 1.6534870713701662e-06, - "loss": 0.7395, - "step": 34542 - }, - { - "epoch": 0.89, - "learning_rate": 1.65346612631089e-06, - "loss": 0.8906, - "step": 34543 - }, - { - "epoch": 0.89, - "learning_rate": 1.6534451807512847e-06, - "loss": 0.9404, - "step": 34544 - }, - { - "epoch": 0.89, - "learning_rate": 1.6534242346913664e-06, - "loss": 0.9316, - "step": 34545 - }, - { - "epoch": 0.89, - "learning_rate": 1.6534032881311512e-06, - "loss": 0.8945, - "step": 34546 - }, - { - "epoch": 0.89, - "learning_rate": 1.6533823410706552e-06, - "loss": 0.792, - "step": 34547 - }, - { - "epoch": 0.89, - "learning_rate": 1.6533613935098943e-06, - "loss": 0.9717, - "step": 34548 - }, - { - "epoch": 0.89, - "learning_rate": 1.6533404454488847e-06, - "loss": 1.1738, - "step": 34549 - }, - { - "epoch": 0.89, - "learning_rate": 1.6533194968876426e-06, - "loss": 0.627, - "step": 34550 - }, - { - "epoch": 0.89, - "learning_rate": 1.6532985478261835e-06, - "loss": 0.877, - "step": 34551 - }, - { - "epoch": 0.89, - "learning_rate": 1.6532775982645237e-06, - "loss": 0.7944, - "step": 34552 - }, - { - "epoch": 0.89, - "learning_rate": 1.6532566482026793e-06, - "loss": 0.8188, - "step": 34553 - }, - { - "epoch": 0.89, - "learning_rate": 1.6532356976406664e-06, - "loss": 0.8193, - "step": 34554 - }, - { - "epoch": 0.89, - "learning_rate": 1.653214746578501e-06, - "loss": 0.8057, - "step": 34555 - }, - { - "epoch": 0.89, - "learning_rate": 1.6531937950161992e-06, - "loss": 0.7202, - "step": 34556 - }, - { - "epoch": 0.89, - "learning_rate": 1.6531728429537765e-06, - "loss": 0.8789, - "step": 34557 - }, - { - "epoch": 0.89, - "learning_rate": 1.65315189039125e-06, - "loss": 0.8184, - "step": 34558 - }, - { - "epoch": 0.89, - "learning_rate": 1.6531309373286346e-06, - "loss": 0.8301, - "step": 34559 - }, - { - "epoch": 0.89, - "learning_rate": 1.6531099837659475e-06, - "loss": 0.6694, - "step": 34560 - }, - { - "epoch": 0.89, - "learning_rate": 1.6530890297032034e-06, - "loss": 0.9346, - "step": 34561 - }, - { - "epoch": 0.89, - "learning_rate": 1.6530680751404197e-06, - "loss": 0.8008, - "step": 34562 - }, - { - "epoch": 0.89, - "learning_rate": 1.6530471200776112e-06, - "loss": 0.7192, - "step": 34563 - }, - { - "epoch": 0.89, - "learning_rate": 1.653026164514795e-06, - "loss": 0.7217, - "step": 34564 - }, - { - "epoch": 0.89, - "learning_rate": 1.6530052084519865e-06, - "loss": 0.9604, - "step": 34565 - }, - { - "epoch": 0.89, - "learning_rate": 1.6529842518892019e-06, - "loss": 0.8594, - "step": 34566 - }, - { - "epoch": 0.89, - "learning_rate": 1.6529632948264574e-06, - "loss": 0.9287, - "step": 34567 - }, - { - "epoch": 0.89, - "learning_rate": 1.6529423372637688e-06, - "loss": 0.8828, - "step": 34568 - }, - { - "epoch": 0.89, - "learning_rate": 1.6529213792011524e-06, - "loss": 0.7759, - "step": 34569 - }, - { - "epoch": 0.89, - "learning_rate": 1.652900420638624e-06, - "loss": 0.9307, - "step": 34570 - }, - { - "epoch": 0.89, - "learning_rate": 1.6528794615762e-06, - "loss": 0.6533, - "step": 34571 - }, - { - "epoch": 0.89, - "learning_rate": 1.652858502013896e-06, - "loss": 0.7222, - "step": 34572 - }, - { - "epoch": 0.89, - "learning_rate": 1.6528375419517281e-06, - "loss": 0.7236, - "step": 34573 - }, - { - "epoch": 0.89, - "learning_rate": 1.6528165813897129e-06, - "loss": 0.7783, - "step": 34574 - }, - { - "epoch": 0.89, - "learning_rate": 1.6527956203278662e-06, - "loss": 0.8555, - "step": 34575 - }, - { - "epoch": 0.89, - "learning_rate": 1.6527746587662034e-06, - "loss": 0.7231, - "step": 34576 - }, - { - "epoch": 0.89, - "learning_rate": 1.6527536967047412e-06, - "loss": 0.8577, - "step": 34577 - }, - { - "epoch": 0.89, - "learning_rate": 1.6527327341434957e-06, - "loss": 0.9287, - "step": 34578 - }, - { - "epoch": 0.89, - "learning_rate": 1.6527117710824827e-06, - "loss": 0.8848, - "step": 34579 - }, - { - "epoch": 0.89, - "learning_rate": 1.6526908075217184e-06, - "loss": 1.0254, - "step": 34580 - }, - { - "epoch": 0.89, - "learning_rate": 1.6526698434612186e-06, - "loss": 0.8174, - "step": 34581 - }, - { - "epoch": 0.89, - "learning_rate": 1.6526488789009995e-06, - "loss": 0.8506, - "step": 34582 - }, - { - "epoch": 0.89, - "learning_rate": 1.652627913841077e-06, - "loss": 0.8311, - "step": 34583 - }, - { - "epoch": 0.89, - "learning_rate": 1.6526069482814674e-06, - "loss": 0.6572, - "step": 34584 - }, - { - "epoch": 0.89, - "learning_rate": 1.6525859822221867e-06, - "loss": 0.7617, - "step": 34585 - }, - { - "epoch": 0.89, - "learning_rate": 1.652565015663251e-06, - "loss": 0.6914, - "step": 34586 - }, - { - "epoch": 0.89, - "learning_rate": 1.6525440486046765e-06, - "loss": 0.8213, - "step": 34587 - }, - { - "epoch": 0.89, - "learning_rate": 1.6525230810464789e-06, - "loss": 0.8081, - "step": 34588 - }, - { - "epoch": 0.89, - "learning_rate": 1.6525021129886741e-06, - "loss": 0.9814, - "step": 34589 - }, - { - "epoch": 0.89, - "learning_rate": 1.6524811444312787e-06, - "loss": 0.8535, - "step": 34590 - }, - { - "epoch": 0.89, - "learning_rate": 1.6524601753743084e-06, - "loss": 0.9873, - "step": 34591 - }, - { - "epoch": 0.89, - "learning_rate": 1.6524392058177793e-06, - "loss": 0.5947, - "step": 34592 - }, - { - "epoch": 0.89, - "learning_rate": 1.6524182357617073e-06, - "loss": 0.8271, - "step": 34593 - }, - { - "epoch": 0.89, - "learning_rate": 1.652397265206109e-06, - "loss": 0.8145, - "step": 34594 - }, - { - "epoch": 0.89, - "learning_rate": 1.6523762941510002e-06, - "loss": 0.9336, - "step": 34595 - }, - { - "epoch": 0.89, - "learning_rate": 1.6523553225963967e-06, - "loss": 0.7881, - "step": 34596 - }, - { - "epoch": 0.89, - "learning_rate": 1.6523343505423145e-06, - "loss": 0.7051, - "step": 34597 - }, - { - "epoch": 0.89, - "learning_rate": 1.65231337798877e-06, - "loss": 0.8213, - "step": 34598 - }, - { - "epoch": 0.89, - "learning_rate": 1.6522924049357791e-06, - "loss": 0.9521, - "step": 34599 - }, - { - "epoch": 0.89, - "learning_rate": 1.6522714313833583e-06, - "loss": 0.7861, - "step": 34600 - }, - { - "epoch": 0.89, - "learning_rate": 1.6522504573315228e-06, - "loss": 0.8279, - "step": 34601 - }, - { - "epoch": 0.89, - "learning_rate": 1.6522294827802893e-06, - "loss": 0.9619, - "step": 34602 - }, - { - "epoch": 0.89, - "learning_rate": 1.6522085077296737e-06, - "loss": 0.8848, - "step": 34603 - }, - { - "epoch": 0.89, - "learning_rate": 1.6521875321796918e-06, - "loss": 0.9023, - "step": 34604 - }, - { - "epoch": 0.89, - "learning_rate": 1.6521665561303603e-06, - "loss": 0.4976, - "step": 34605 - }, - { - "epoch": 0.89, - "learning_rate": 1.6521455795816947e-06, - "loss": 0.8848, - "step": 34606 - }, - { - "epoch": 0.89, - "learning_rate": 1.6521246025337111e-06, - "loss": 0.9702, - "step": 34607 - }, - { - "epoch": 0.89, - "learning_rate": 1.652103624986426e-06, - "loss": 0.6973, - "step": 34608 - }, - { - "epoch": 0.89, - "learning_rate": 1.6520826469398546e-06, - "loss": 0.8701, - "step": 34609 - }, - { - "epoch": 0.89, - "learning_rate": 1.652061668394014e-06, - "loss": 1.0889, - "step": 34610 - }, - { - "epoch": 0.89, - "learning_rate": 1.6520406893489197e-06, - "loss": 0.7271, - "step": 34611 - }, - { - "epoch": 0.89, - "learning_rate": 1.6520197098045873e-06, - "loss": 0.6699, - "step": 34612 - }, - { - "epoch": 0.89, - "learning_rate": 1.6519987297610339e-06, - "loss": 0.8867, - "step": 34613 - }, - { - "epoch": 0.89, - "learning_rate": 1.651977749218275e-06, - "loss": 0.8252, - "step": 34614 - }, - { - "epoch": 0.89, - "learning_rate": 1.6519567681763267e-06, - "loss": 0.9131, - "step": 34615 - }, - { - "epoch": 0.89, - "learning_rate": 1.6519357866352049e-06, - "loss": 0.9053, - "step": 34616 - }, - { - "epoch": 0.89, - "learning_rate": 1.6519148045949258e-06, - "loss": 0.6357, - "step": 34617 - }, - { - "epoch": 0.89, - "learning_rate": 1.6518938220555057e-06, - "loss": 0.7817, - "step": 34618 - }, - { - "epoch": 0.89, - "learning_rate": 1.6518728390169604e-06, - "loss": 0.8496, - "step": 34619 - }, - { - "epoch": 0.89, - "learning_rate": 1.6518518554793063e-06, - "loss": 0.5593, - "step": 34620 - }, - { - "epoch": 0.89, - "learning_rate": 1.651830871442559e-06, - "loss": 0.5693, - "step": 34621 - }, - { - "epoch": 0.89, - "learning_rate": 1.6518098869067347e-06, - "loss": 1.043, - "step": 34622 - }, - { - "epoch": 0.89, - "learning_rate": 1.6517889018718496e-06, - "loss": 0.5894, - "step": 34623 - }, - { - "epoch": 0.89, - "learning_rate": 1.6517679163379196e-06, - "loss": 0.9209, - "step": 34624 - }, - { - "epoch": 0.89, - "learning_rate": 1.651746930304961e-06, - "loss": 0.8613, - "step": 34625 - }, - { - "epoch": 0.89, - "learning_rate": 1.6517259437729898e-06, - "loss": 1.0381, - "step": 34626 - }, - { - "epoch": 0.89, - "learning_rate": 1.651704956742022e-06, - "loss": 0.9502, - "step": 34627 - }, - { - "epoch": 0.89, - "learning_rate": 1.6516839692120737e-06, - "loss": 0.874, - "step": 34628 - }, - { - "epoch": 0.89, - "learning_rate": 1.6516629811831608e-06, - "loss": 0.7983, - "step": 34629 - }, - { - "epoch": 0.89, - "learning_rate": 1.6516419926553e-06, - "loss": 0.9883, - "step": 34630 - }, - { - "epoch": 0.89, - "learning_rate": 1.6516210036285061e-06, - "loss": 0.8604, - "step": 34631 - }, - { - "epoch": 0.89, - "learning_rate": 1.6516000141027964e-06, - "loss": 0.8813, - "step": 34632 - }, - { - "epoch": 0.89, - "learning_rate": 1.6515790240781864e-06, - "loss": 0.4575, - "step": 34633 - }, - { - "epoch": 0.89, - "learning_rate": 1.6515580335546923e-06, - "loss": 0.8174, - "step": 34634 - }, - { - "epoch": 0.89, - "learning_rate": 1.6515370425323302e-06, - "loss": 0.9043, - "step": 34635 - }, - { - "epoch": 0.89, - "learning_rate": 1.6515160510111163e-06, - "loss": 0.8936, - "step": 34636 - }, - { - "epoch": 0.89, - "learning_rate": 1.6514950589910663e-06, - "loss": 0.7988, - "step": 34637 - }, - { - "epoch": 0.89, - "learning_rate": 1.6514740664721969e-06, - "loss": 0.6274, - "step": 34638 - }, - { - "epoch": 0.89, - "learning_rate": 1.6514530734545233e-06, - "loss": 0.9121, - "step": 34639 - }, - { - "epoch": 0.89, - "learning_rate": 1.6514320799380623e-06, - "loss": 0.8999, - "step": 34640 - }, - { - "epoch": 0.89, - "learning_rate": 1.6514110859228295e-06, - "loss": 0.9233, - "step": 34641 - }, - { - "epoch": 0.89, - "learning_rate": 1.6513900914088413e-06, - "loss": 0.8975, - "step": 34642 - }, - { - "epoch": 0.89, - "learning_rate": 1.6513690963961136e-06, - "loss": 0.8281, - "step": 34643 - }, - { - "epoch": 0.89, - "learning_rate": 1.6513481008846628e-06, - "loss": 0.8379, - "step": 34644 - }, - { - "epoch": 0.89, - "learning_rate": 1.6513271048745044e-06, - "loss": 0.5896, - "step": 34645 - }, - { - "epoch": 0.89, - "learning_rate": 1.651306108365655e-06, - "loss": 0.6904, - "step": 34646 - }, - { - "epoch": 0.89, - "learning_rate": 1.6512851113581303e-06, - "loss": 0.6885, - "step": 34647 - }, - { - "epoch": 0.89, - "learning_rate": 1.6512641138519465e-06, - "loss": 0.8975, - "step": 34648 - }, - { - "epoch": 0.89, - "learning_rate": 1.6512431158471197e-06, - "loss": 0.7646, - "step": 34649 - }, - { - "epoch": 0.89, - "learning_rate": 1.6512221173436663e-06, - "loss": 0.8926, - "step": 34650 - }, - { - "epoch": 0.89, - "learning_rate": 1.6512011183416016e-06, - "loss": 0.8447, - "step": 34651 - }, - { - "epoch": 0.89, - "learning_rate": 1.6511801188409424e-06, - "loss": 0.6069, - "step": 34652 - }, - { - "epoch": 0.89, - "learning_rate": 1.6511591188417046e-06, - "loss": 0.6877, - "step": 34653 - }, - { - "epoch": 0.89, - "learning_rate": 1.6511381183439042e-06, - "loss": 0.5923, - "step": 34654 - }, - { - "epoch": 0.89, - "learning_rate": 1.651117117347557e-06, - "loss": 0.9023, - "step": 34655 - }, - { - "epoch": 0.89, - "learning_rate": 1.6510961158526796e-06, - "loss": 1.0361, - "step": 34656 - }, - { - "epoch": 0.89, - "learning_rate": 1.651075113859288e-06, - "loss": 0.9102, - "step": 34657 - }, - { - "epoch": 0.89, - "learning_rate": 1.6510541113673978e-06, - "loss": 0.8613, - "step": 34658 - }, - { - "epoch": 0.89, - "learning_rate": 1.6510331083770256e-06, - "loss": 0.8516, - "step": 34659 - }, - { - "epoch": 0.89, - "learning_rate": 1.6510121048881875e-06, - "loss": 0.8555, - "step": 34660 - }, - { - "epoch": 0.89, - "learning_rate": 1.650991100900899e-06, - "loss": 0.9463, - "step": 34661 - }, - { - "epoch": 0.89, - "learning_rate": 1.6509700964151767e-06, - "loss": 0.6099, - "step": 34662 - }, - { - "epoch": 0.89, - "learning_rate": 1.6509490914310363e-06, - "loss": 0.8418, - "step": 34663 - }, - { - "epoch": 0.89, - "learning_rate": 1.6509280859484942e-06, - "loss": 0.9824, - "step": 34664 - }, - { - "epoch": 0.89, - "learning_rate": 1.6509070799675667e-06, - "loss": 0.8472, - "step": 34665 - }, - { - "epoch": 0.89, - "learning_rate": 1.6508860734882693e-06, - "loss": 0.7036, - "step": 34666 - }, - { - "epoch": 0.89, - "learning_rate": 1.6508650665106182e-06, - "loss": 0.9365, - "step": 34667 - }, - { - "epoch": 0.89, - "learning_rate": 1.65084405903463e-06, - "loss": 0.7002, - "step": 34668 - }, - { - "epoch": 0.89, - "learning_rate": 1.6508230510603202e-06, - "loss": 0.9199, - "step": 34669 - }, - { - "epoch": 0.89, - "learning_rate": 1.6508020425877055e-06, - "loss": 1.0693, - "step": 34670 - }, - { - "epoch": 0.89, - "learning_rate": 1.6507810336168012e-06, - "loss": 0.8438, - "step": 34671 - }, - { - "epoch": 0.89, - "learning_rate": 1.6507600241476238e-06, - "loss": 0.9746, - "step": 34672 - }, - { - "epoch": 0.89, - "learning_rate": 1.6507390141801895e-06, - "loss": 0.9414, - "step": 34673 - }, - { - "epoch": 0.89, - "learning_rate": 1.6507180037145143e-06, - "loss": 0.8115, - "step": 34674 - }, - { - "epoch": 0.89, - "learning_rate": 1.650696992750614e-06, - "loss": 0.8467, - "step": 34675 - }, - { - "epoch": 0.89, - "learning_rate": 1.650675981288505e-06, - "loss": 0.8223, - "step": 34676 - }, - { - "epoch": 0.89, - "learning_rate": 1.6506549693282036e-06, - "loss": 0.7141, - "step": 34677 - }, - { - "epoch": 0.89, - "learning_rate": 1.6506339568697254e-06, - "loss": 0.9424, - "step": 34678 - }, - { - "epoch": 0.89, - "learning_rate": 1.6506129439130867e-06, - "loss": 0.8506, - "step": 34679 - }, - { - "epoch": 0.89, - "learning_rate": 1.6505919304583038e-06, - "loss": 1.0049, - "step": 34680 - }, - { - "epoch": 0.89, - "learning_rate": 1.6505709165053925e-06, - "loss": 0.8984, - "step": 34681 - }, - { - "epoch": 0.89, - "learning_rate": 1.6505499020543688e-06, - "loss": 0.688, - "step": 34682 - }, - { - "epoch": 0.89, - "learning_rate": 1.6505288871052487e-06, - "loss": 0.6343, - "step": 34683 - }, - { - "epoch": 0.89, - "learning_rate": 1.6505078716580489e-06, - "loss": 0.7324, - "step": 34684 - }, - { - "epoch": 0.89, - "learning_rate": 1.6504868557127854e-06, - "loss": 0.8613, - "step": 34685 - }, - { - "epoch": 0.89, - "learning_rate": 1.6504658392694736e-06, - "loss": 0.7383, - "step": 34686 - }, - { - "epoch": 0.89, - "learning_rate": 1.6504448223281303e-06, - "loss": 0.8701, - "step": 34687 - }, - { - "epoch": 0.89, - "learning_rate": 1.6504238048887708e-06, - "loss": 0.917, - "step": 34688 - }, - { - "epoch": 0.89, - "learning_rate": 1.650402786951412e-06, - "loss": 0.9561, - "step": 34689 - }, - { - "epoch": 0.89, - "learning_rate": 1.65038176851607e-06, - "loss": 0.6553, - "step": 34690 - }, - { - "epoch": 0.89, - "learning_rate": 1.6503607495827603e-06, - "loss": 0.9502, - "step": 34691 - }, - { - "epoch": 0.89, - "learning_rate": 1.6503397301514993e-06, - "loss": 0.7744, - "step": 34692 - }, - { - "epoch": 0.89, - "learning_rate": 1.6503187102223027e-06, - "loss": 1.0029, - "step": 34693 - }, - { - "epoch": 0.89, - "learning_rate": 1.6502976897951874e-06, - "loss": 1.0654, - "step": 34694 - }, - { - "epoch": 0.89, - "learning_rate": 1.6502766688701692e-06, - "loss": 0.9375, - "step": 34695 - }, - { - "epoch": 0.89, - "learning_rate": 1.6502556474472637e-06, - "loss": 0.8018, - "step": 34696 - }, - { - "epoch": 0.89, - "learning_rate": 1.6502346255264875e-06, - "loss": 0.957, - "step": 34697 - }, - { - "epoch": 0.89, - "learning_rate": 1.6502136031078563e-06, - "loss": 0.8652, - "step": 34698 - }, - { - "epoch": 0.89, - "learning_rate": 1.650192580191387e-06, - "loss": 0.9883, - "step": 34699 - }, - { - "epoch": 0.89, - "learning_rate": 1.6501715567770948e-06, - "loss": 0.9268, - "step": 34700 - }, - { - "epoch": 0.89, - "learning_rate": 1.650150532864996e-06, - "loss": 0.7949, - "step": 34701 - }, - { - "epoch": 0.89, - "learning_rate": 1.650129508455107e-06, - "loss": 0.7441, - "step": 34702 - }, - { - "epoch": 0.89, - "learning_rate": 1.6501084835474438e-06, - "loss": 0.7852, - "step": 34703 - }, - { - "epoch": 0.89, - "learning_rate": 1.6500874581420221e-06, - "loss": 1.0254, - "step": 34704 - }, - { - "epoch": 0.89, - "learning_rate": 1.650066432238859e-06, - "loss": 1.0869, - "step": 34705 - }, - { - "epoch": 0.89, - "learning_rate": 1.6500454058379694e-06, - "loss": 1.0352, - "step": 34706 - }, - { - "epoch": 0.89, - "learning_rate": 1.6500243789393697e-06, - "loss": 0.7793, - "step": 34707 - }, - { - "epoch": 0.89, - "learning_rate": 1.6500033515430767e-06, - "loss": 0.8423, - "step": 34708 - }, - { - "epoch": 0.89, - "learning_rate": 1.649982323649106e-06, - "loss": 0.749, - "step": 34709 - }, - { - "epoch": 0.89, - "learning_rate": 1.6499612952574734e-06, - "loss": 0.7607, - "step": 34710 - }, - { - "epoch": 0.89, - "learning_rate": 1.6499402663681955e-06, - "loss": 0.8281, - "step": 34711 - }, - { - "epoch": 0.89, - "learning_rate": 1.6499192369812885e-06, - "loss": 0.8555, - "step": 34712 - }, - { - "epoch": 0.89, - "learning_rate": 1.6498982070967678e-06, - "loss": 0.8159, - "step": 34713 - }, - { - "epoch": 0.89, - "learning_rate": 1.64987717671465e-06, - "loss": 0.592, - "step": 34714 - }, - { - "epoch": 0.89, - "learning_rate": 1.6498561458349514e-06, - "loss": 0.8042, - "step": 34715 - }, - { - "epoch": 0.89, - "learning_rate": 1.6498351144576877e-06, - "loss": 0.6831, - "step": 34716 - }, - { - "epoch": 0.89, - "learning_rate": 1.6498140825828748e-06, - "loss": 0.7793, - "step": 34717 - }, - { - "epoch": 0.89, - "learning_rate": 1.6497930502105292e-06, - "loss": 1.0684, - "step": 34718 - }, - { - "epoch": 0.89, - "learning_rate": 1.6497720173406674e-06, - "loss": 0.8389, - "step": 34719 - }, - { - "epoch": 0.89, - "learning_rate": 1.6497509839733046e-06, - "loss": 0.6382, - "step": 34720 - }, - { - "epoch": 0.89, - "learning_rate": 1.6497299501084576e-06, - "loss": 0.9746, - "step": 34721 - }, - { - "epoch": 0.89, - "learning_rate": 1.6497089157461421e-06, - "loss": 0.8457, - "step": 34722 - }, - { - "epoch": 0.89, - "learning_rate": 1.6496878808863746e-06, - "loss": 0.7871, - "step": 34723 - }, - { - "epoch": 0.89, - "learning_rate": 1.6496668455291709e-06, - "loss": 0.998, - "step": 34724 - }, - { - "epoch": 0.89, - "learning_rate": 1.6496458096745469e-06, - "loss": 1.0186, - "step": 34725 - }, - { - "epoch": 0.89, - "learning_rate": 1.649624773322519e-06, - "loss": 0.9023, - "step": 34726 - }, - { - "epoch": 0.89, - "learning_rate": 1.6496037364731037e-06, - "loss": 0.8682, - "step": 34727 - }, - { - "epoch": 0.89, - "learning_rate": 1.6495826991263164e-06, - "loss": 0.8564, - "step": 34728 - }, - { - "epoch": 0.89, - "learning_rate": 1.6495616612821736e-06, - "loss": 0.8535, - "step": 34729 - }, - { - "epoch": 0.89, - "learning_rate": 1.6495406229406909e-06, - "loss": 0.7988, - "step": 34730 - }, - { - "epoch": 0.89, - "learning_rate": 1.649519584101885e-06, - "loss": 0.9102, - "step": 34731 - }, - { - "epoch": 0.89, - "learning_rate": 1.6494985447657723e-06, - "loss": 0.7368, - "step": 34732 - }, - { - "epoch": 0.89, - "learning_rate": 1.6494775049323679e-06, - "loss": 0.7627, - "step": 34733 - }, - { - "epoch": 0.89, - "learning_rate": 1.6494564646016889e-06, - "loss": 0.5718, - "step": 34734 - }, - { - "epoch": 0.89, - "learning_rate": 1.6494354237737507e-06, - "loss": 0.8506, - "step": 34735 - }, - { - "epoch": 0.89, - "learning_rate": 1.6494143824485693e-06, - "loss": 0.9062, - "step": 34736 - }, - { - "epoch": 0.89, - "learning_rate": 1.6493933406261617e-06, - "loss": 0.7056, - "step": 34737 - }, - { - "epoch": 0.89, - "learning_rate": 1.649372298306543e-06, - "loss": 0.8652, - "step": 34738 - }, - { - "epoch": 0.89, - "learning_rate": 1.6493512554897305e-06, - "loss": 0.9463, - "step": 34739 - }, - { - "epoch": 0.89, - "learning_rate": 1.649330212175739e-06, - "loss": 0.7344, - "step": 34740 - }, - { - "epoch": 0.89, - "learning_rate": 1.6493091683645853e-06, - "loss": 0.5061, - "step": 34741 - }, - { - "epoch": 0.89, - "learning_rate": 1.6492881240562855e-06, - "loss": 0.6191, - "step": 34742 - }, - { - "epoch": 0.89, - "learning_rate": 1.6492670792508555e-06, - "loss": 0.8574, - "step": 34743 - }, - { - "epoch": 0.89, - "learning_rate": 1.6492460339483119e-06, - "loss": 0.7061, - "step": 34744 - }, - { - "epoch": 0.89, - "learning_rate": 1.6492249881486702e-06, - "loss": 0.8154, - "step": 34745 - }, - { - "epoch": 0.89, - "learning_rate": 1.6492039418519468e-06, - "loss": 0.73, - "step": 34746 - }, - { - "epoch": 0.89, - "learning_rate": 1.6491828950581578e-06, - "loss": 1.0762, - "step": 34747 - }, - { - "epoch": 0.89, - "learning_rate": 1.6491618477673193e-06, - "loss": 0.9688, - "step": 34748 - }, - { - "epoch": 0.89, - "learning_rate": 1.6491407999794476e-06, - "loss": 0.9199, - "step": 34749 - }, - { - "epoch": 0.89, - "learning_rate": 1.6491197516945583e-06, - "loss": 0.6592, - "step": 34750 - }, - { - "epoch": 0.89, - "learning_rate": 1.6490987029126682e-06, - "loss": 0.6309, - "step": 34751 - }, - { - "epoch": 0.89, - "learning_rate": 1.649077653633793e-06, - "loss": 0.8359, - "step": 34752 - }, - { - "epoch": 0.89, - "learning_rate": 1.6490566038579487e-06, - "loss": 0.833, - "step": 34753 - }, - { - "epoch": 0.89, - "learning_rate": 1.6490355535851519e-06, - "loss": 1.0088, - "step": 34754 - }, - { - "epoch": 0.89, - "learning_rate": 1.6490145028154182e-06, - "loss": 0.7104, - "step": 34755 - }, - { - "epoch": 0.89, - "learning_rate": 1.6489934515487637e-06, - "loss": 0.9814, - "step": 34756 - }, - { - "epoch": 0.89, - "learning_rate": 1.648972399785205e-06, - "loss": 0.9072, - "step": 34757 - }, - { - "epoch": 0.89, - "learning_rate": 1.6489513475247581e-06, - "loss": 0.8135, - "step": 34758 - }, - { - "epoch": 0.89, - "learning_rate": 1.6489302947674387e-06, - "loss": 0.7178, - "step": 34759 - }, - { - "epoch": 0.89, - "learning_rate": 1.6489092415132638e-06, - "loss": 0.9824, - "step": 34760 - }, - { - "epoch": 0.89, - "learning_rate": 1.6488881877622482e-06, - "loss": 0.6331, - "step": 34761 - }, - { - "epoch": 0.89, - "learning_rate": 1.6488671335144094e-06, - "loss": 0.9092, - "step": 34762 - }, - { - "epoch": 0.89, - "learning_rate": 1.6488460787697624e-06, - "loss": 0.7021, - "step": 34763 - }, - { - "epoch": 0.89, - "learning_rate": 1.648825023528324e-06, - "loss": 0.8076, - "step": 34764 - }, - { - "epoch": 0.89, - "learning_rate": 1.6488039677901097e-06, - "loss": 0.6738, - "step": 34765 - }, - { - "epoch": 0.89, - "learning_rate": 1.6487829115551367e-06, - "loss": 0.8799, - "step": 34766 - }, - { - "epoch": 0.89, - "learning_rate": 1.64876185482342e-06, - "loss": 0.614, - "step": 34767 - }, - { - "epoch": 0.89, - "learning_rate": 1.6487407975949763e-06, - "loss": 0.9126, - "step": 34768 - }, - { - "epoch": 0.89, - "learning_rate": 1.6487197398698216e-06, - "loss": 0.8047, - "step": 34769 - }, - { - "epoch": 0.89, - "learning_rate": 1.6486986816479721e-06, - "loss": 0.7576, - "step": 34770 - }, - { - "epoch": 0.89, - "learning_rate": 1.6486776229294439e-06, - "loss": 0.9404, - "step": 34771 - }, - { - "epoch": 0.89, - "learning_rate": 1.648656563714253e-06, - "loss": 0.6182, - "step": 34772 - }, - { - "epoch": 0.89, - "learning_rate": 1.6486355040024153e-06, - "loss": 0.8237, - "step": 34773 - }, - { - "epoch": 0.89, - "learning_rate": 1.6486144437939477e-06, - "loss": 0.8867, - "step": 34774 - }, - { - "epoch": 0.89, - "learning_rate": 1.6485933830888656e-06, - "loss": 0.8896, - "step": 34775 - }, - { - "epoch": 0.89, - "learning_rate": 1.6485723218871853e-06, - "loss": 0.915, - "step": 34776 - }, - { - "epoch": 0.89, - "learning_rate": 1.648551260188923e-06, - "loss": 0.8555, - "step": 34777 - }, - { - "epoch": 0.89, - "learning_rate": 1.6485301979940952e-06, - "loss": 0.8359, - "step": 34778 - }, - { - "epoch": 0.89, - "learning_rate": 1.6485091353027175e-06, - "loss": 0.6987, - "step": 34779 - }, - { - "epoch": 0.89, - "learning_rate": 1.648488072114806e-06, - "loss": 0.8662, - "step": 34780 - }, - { - "epoch": 0.89, - "learning_rate": 1.648467008430377e-06, - "loss": 0.7627, - "step": 34781 - }, - { - "epoch": 0.89, - "learning_rate": 1.6484459442494465e-06, - "loss": 0.9756, - "step": 34782 - }, - { - "epoch": 0.89, - "learning_rate": 1.648424879572031e-06, - "loss": 0.8418, - "step": 34783 - }, - { - "epoch": 0.89, - "learning_rate": 1.6484038143981462e-06, - "loss": 0.9004, - "step": 34784 - }, - { - "epoch": 0.89, - "learning_rate": 1.6483827487278087e-06, - "loss": 1.042, - "step": 34785 - }, - { - "epoch": 0.89, - "learning_rate": 1.648361682561034e-06, - "loss": 0.7832, - "step": 34786 - }, - { - "epoch": 0.89, - "learning_rate": 1.6483406158978388e-06, - "loss": 0.7886, - "step": 34787 - }, - { - "epoch": 0.89, - "learning_rate": 1.6483195487382391e-06, - "loss": 0.7334, - "step": 34788 - }, - { - "epoch": 0.89, - "learning_rate": 1.6482984810822508e-06, - "loss": 0.8242, - "step": 34789 - }, - { - "epoch": 0.89, - "learning_rate": 1.6482774129298899e-06, - "loss": 0.7471, - "step": 34790 - }, - { - "epoch": 0.89, - "learning_rate": 1.6482563442811732e-06, - "loss": 0.8174, - "step": 34791 - }, - { - "epoch": 0.89, - "learning_rate": 1.6482352751361162e-06, - "loss": 0.8887, - "step": 34792 - }, - { - "epoch": 0.89, - "learning_rate": 1.6482142054947351e-06, - "loss": 0.9229, - "step": 34793 - }, - { - "epoch": 0.89, - "learning_rate": 1.6481931353570465e-06, - "loss": 0.7617, - "step": 34794 - }, - { - "epoch": 0.89, - "learning_rate": 1.6481720647230661e-06, - "loss": 1.0039, - "step": 34795 - }, - { - "epoch": 0.89, - "learning_rate": 1.6481509935928101e-06, - "loss": 0.9365, - "step": 34796 - }, - { - "epoch": 0.89, - "learning_rate": 1.6481299219662947e-06, - "loss": 0.6914, - "step": 34797 - }, - { - "epoch": 0.89, - "learning_rate": 1.6481088498435364e-06, - "loss": 0.7734, - "step": 34798 - }, - { - "epoch": 0.89, - "learning_rate": 1.6480877772245507e-06, - "loss": 0.8271, - "step": 34799 - }, - { - "epoch": 0.89, - "learning_rate": 1.648066704109354e-06, - "loss": 0.957, - "step": 34800 - }, - { - "epoch": 0.89, - "learning_rate": 1.648045630497962e-06, - "loss": 0.8672, - "step": 34801 - }, - { - "epoch": 0.89, - "learning_rate": 1.6480245563903918e-06, - "loss": 0.8193, - "step": 34802 - }, - { - "epoch": 0.89, - "learning_rate": 1.6480034817866585e-06, - "loss": 0.7061, - "step": 34803 - }, - { - "epoch": 0.89, - "learning_rate": 1.647982406686779e-06, - "loss": 0.6987, - "step": 34804 - }, - { - "epoch": 0.89, - "learning_rate": 1.6479613310907695e-06, - "loss": 0.8496, - "step": 34805 - }, - { - "epoch": 0.89, - "learning_rate": 1.6479402549986453e-06, - "loss": 0.9043, - "step": 34806 - }, - { - "epoch": 0.89, - "learning_rate": 1.6479191784104233e-06, - "loss": 0.8608, - "step": 34807 - }, - { - "epoch": 0.89, - "learning_rate": 1.6478981013261195e-06, - "loss": 0.9199, - "step": 34808 - }, - { - "epoch": 0.89, - "learning_rate": 1.6478770237457495e-06, - "loss": 0.8682, - "step": 34809 - }, - { - "epoch": 0.89, - "learning_rate": 1.6478559456693302e-06, - "loss": 0.998, - "step": 34810 - }, - { - "epoch": 0.89, - "learning_rate": 1.6478348670968774e-06, - "loss": 0.8945, - "step": 34811 - }, - { - "epoch": 0.89, - "learning_rate": 1.647813788028407e-06, - "loss": 0.8154, - "step": 34812 - }, - { - "epoch": 0.89, - "learning_rate": 1.6477927084639353e-06, - "loss": 0.6431, - "step": 34813 - }, - { - "epoch": 0.89, - "learning_rate": 1.6477716284034788e-06, - "loss": 0.8174, - "step": 34814 - }, - { - "epoch": 0.89, - "learning_rate": 1.6477505478470533e-06, - "loss": 0.7891, - "step": 34815 - }, - { - "epoch": 0.89, - "learning_rate": 1.6477294667946747e-06, - "loss": 0.9541, - "step": 34816 - }, - { - "epoch": 0.89, - "learning_rate": 1.64770838524636e-06, - "loss": 0.8135, - "step": 34817 - }, - { - "epoch": 0.89, - "learning_rate": 1.6476873032021242e-06, - "loss": 1.0195, - "step": 34818 - }, - { - "epoch": 0.89, - "learning_rate": 1.6476662206619842e-06, - "loss": 0.8926, - "step": 34819 - }, - { - "epoch": 0.89, - "learning_rate": 1.6476451376259561e-06, - "loss": 0.8203, - "step": 34820 - }, - { - "epoch": 0.89, - "learning_rate": 1.6476240540940557e-06, - "loss": 0.8623, - "step": 34821 - }, - { - "epoch": 0.89, - "learning_rate": 1.6476029700662997e-06, - "loss": 0.917, - "step": 34822 - }, - { - "epoch": 0.89, - "learning_rate": 1.6475818855427033e-06, - "loss": 0.8574, - "step": 34823 - }, - { - "epoch": 0.89, - "learning_rate": 1.647560800523284e-06, - "loss": 0.6821, - "step": 34824 - }, - { - "epoch": 0.89, - "learning_rate": 1.6475397150080564e-06, - "loss": 0.8154, - "step": 34825 - }, - { - "epoch": 0.89, - "learning_rate": 1.6475186289970377e-06, - "loss": 0.8633, - "step": 34826 - }, - { - "epoch": 0.89, - "learning_rate": 1.6474975424902437e-06, - "loss": 0.9238, - "step": 34827 - }, - { - "epoch": 0.89, - "learning_rate": 1.6474764554876908e-06, - "loss": 0.9209, - "step": 34828 - }, - { - "epoch": 0.89, - "learning_rate": 1.6474553679893947e-06, - "loss": 0.8428, - "step": 34829 - }, - { - "epoch": 0.89, - "learning_rate": 1.6474342799953722e-06, - "loss": 0.877, - "step": 34830 - }, - { - "epoch": 0.89, - "learning_rate": 1.6474131915056386e-06, - "loss": 0.562, - "step": 34831 - }, - { - "epoch": 0.89, - "learning_rate": 1.6473921025202108e-06, - "loss": 0.8271, - "step": 34832 - }, - { - "epoch": 0.89, - "learning_rate": 1.6473710130391044e-06, - "loss": 1.0723, - "step": 34833 - }, - { - "epoch": 0.89, - "learning_rate": 1.647349923062336e-06, - "loss": 0.6689, - "step": 34834 - }, - { - "epoch": 0.89, - "learning_rate": 1.6473288325899213e-06, - "loss": 1.0234, - "step": 34835 - }, - { - "epoch": 0.89, - "learning_rate": 1.6473077416218769e-06, - "loss": 0.9141, - "step": 34836 - }, - { - "epoch": 0.89, - "learning_rate": 1.6472866501582185e-06, - "loss": 0.999, - "step": 34837 - }, - { - "epoch": 0.89, - "learning_rate": 1.6472655581989624e-06, - "loss": 1.0176, - "step": 34838 - }, - { - "epoch": 0.89, - "learning_rate": 1.6472444657441253e-06, - "loss": 1.0469, - "step": 34839 - }, - { - "epoch": 0.89, - "learning_rate": 1.6472233727937226e-06, - "loss": 1.0645, - "step": 34840 - }, - { - "epoch": 0.89, - "learning_rate": 1.6472022793477708e-06, - "loss": 0.9512, - "step": 34841 - }, - { - "epoch": 0.89, - "learning_rate": 1.6471811854062858e-06, - "loss": 0.8711, - "step": 34842 - }, - { - "epoch": 0.89, - "learning_rate": 1.6471600909692839e-06, - "loss": 0.5391, - "step": 34843 - }, - { - "epoch": 0.89, - "learning_rate": 1.6471389960367816e-06, - "loss": 0.8926, - "step": 34844 - }, - { - "epoch": 0.89, - "learning_rate": 1.6471179006087946e-06, - "loss": 0.8701, - "step": 34845 - }, - { - "epoch": 0.89, - "learning_rate": 1.6470968046853391e-06, - "loss": 0.8862, - "step": 34846 - }, - { - "epoch": 0.89, - "learning_rate": 1.6470757082664313e-06, - "loss": 1.0098, - "step": 34847 - }, - { - "epoch": 0.89, - "learning_rate": 1.6470546113520873e-06, - "loss": 0.7783, - "step": 34848 - }, - { - "epoch": 0.89, - "learning_rate": 1.6470335139423233e-06, - "loss": 0.8477, - "step": 34849 - }, - { - "epoch": 0.89, - "learning_rate": 1.647012416037156e-06, - "loss": 0.7446, - "step": 34850 - }, - { - "epoch": 0.89, - "learning_rate": 1.6469913176366003e-06, - "loss": 0.7861, - "step": 34851 - }, - { - "epoch": 0.89, - "learning_rate": 1.6469702187406736e-06, - "loss": 0.7227, - "step": 34852 - }, - { - "epoch": 0.89, - "learning_rate": 1.6469491193493914e-06, - "loss": 0.9395, - "step": 34853 - }, - { - "epoch": 0.89, - "learning_rate": 1.6469280194627703e-06, - "loss": 0.7993, - "step": 34854 - }, - { - "epoch": 0.89, - "learning_rate": 1.6469069190808256e-06, - "loss": 0.8521, - "step": 34855 - }, - { - "epoch": 0.89, - "learning_rate": 1.6468858182035743e-06, - "loss": 0.6147, - "step": 34856 - }, - { - "epoch": 0.89, - "learning_rate": 1.6468647168310323e-06, - "loss": 0.8613, - "step": 34857 - }, - { - "epoch": 0.89, - "learning_rate": 1.6468436149632157e-06, - "loss": 0.7812, - "step": 34858 - }, - { - "epoch": 0.89, - "learning_rate": 1.6468225126001406e-06, - "loss": 0.752, - "step": 34859 - }, - { - "epoch": 0.89, - "learning_rate": 1.6468014097418234e-06, - "loss": 0.6709, - "step": 34860 - }, - { - "epoch": 0.89, - "learning_rate": 1.64678030638828e-06, - "loss": 0.8633, - "step": 34861 - }, - { - "epoch": 0.89, - "learning_rate": 1.646759202539527e-06, - "loss": 0.8545, - "step": 34862 - }, - { - "epoch": 0.89, - "learning_rate": 1.6467380981955797e-06, - "loss": 0.8218, - "step": 34863 - }, - { - "epoch": 0.89, - "learning_rate": 1.6467169933564554e-06, - "loss": 0.8145, - "step": 34864 - }, - { - "epoch": 0.89, - "learning_rate": 1.6466958880221691e-06, - "loss": 0.6699, - "step": 34865 - }, - { - "epoch": 0.89, - "learning_rate": 1.6466747821927375e-06, - "loss": 0.6982, - "step": 34866 - }, - { - "epoch": 0.89, - "learning_rate": 1.646653675868177e-06, - "loss": 0.8467, - "step": 34867 - }, - { - "epoch": 0.89, - "learning_rate": 1.6466325690485031e-06, - "loss": 0.876, - "step": 34868 - }, - { - "epoch": 0.89, - "learning_rate": 1.646611461733733e-06, - "loss": 0.6685, - "step": 34869 - }, - { - "epoch": 0.89, - "learning_rate": 1.6465903539238818e-06, - "loss": 0.6924, - "step": 34870 - }, - { - "epoch": 0.89, - "learning_rate": 1.6465692456189663e-06, - "loss": 1.0742, - "step": 34871 - }, - { - "epoch": 0.89, - "learning_rate": 1.6465481368190025e-06, - "loss": 1.043, - "step": 34872 - }, - { - "epoch": 0.89, - "learning_rate": 1.6465270275240063e-06, - "loss": 0.8066, - "step": 34873 - }, - { - "epoch": 0.89, - "learning_rate": 1.6465059177339939e-06, - "loss": 0.7104, - "step": 34874 - }, - { - "epoch": 0.89, - "learning_rate": 1.6464848074489822e-06, - "loss": 0.833, - "step": 34875 - }, - { - "epoch": 0.89, - "learning_rate": 1.6464636966689863e-06, - "loss": 0.6382, - "step": 34876 - }, - { - "epoch": 0.89, - "learning_rate": 1.6464425853940234e-06, - "loss": 0.9375, - "step": 34877 - }, - { - "epoch": 0.89, - "learning_rate": 1.6464214736241086e-06, - "loss": 1.1475, - "step": 34878 - }, - { - "epoch": 0.89, - "learning_rate": 1.6464003613592588e-06, - "loss": 0.9736, - "step": 34879 - }, - { - "epoch": 0.89, - "learning_rate": 1.64637924859949e-06, - "loss": 0.8408, - "step": 34880 - }, - { - "epoch": 0.89, - "learning_rate": 1.6463581353448183e-06, - "loss": 0.6826, - "step": 34881 - }, - { - "epoch": 0.89, - "learning_rate": 1.6463370215952602e-06, - "loss": 0.8416, - "step": 34882 - }, - { - "epoch": 0.89, - "learning_rate": 1.6463159073508311e-06, - "loss": 0.7344, - "step": 34883 - }, - { - "epoch": 0.89, - "learning_rate": 1.646294792611548e-06, - "loss": 0.8408, - "step": 34884 - }, - { - "epoch": 0.89, - "learning_rate": 1.6462736773774264e-06, - "loss": 0.606, - "step": 34885 - }, - { - "epoch": 0.89, - "learning_rate": 1.646252561648483e-06, - "loss": 0.6787, - "step": 34886 - }, - { - "epoch": 0.89, - "learning_rate": 1.6462314454247333e-06, - "loss": 0.7695, - "step": 34887 - }, - { - "epoch": 0.89, - "learning_rate": 1.6462103287061942e-06, - "loss": 0.7312, - "step": 34888 - }, - { - "epoch": 0.89, - "learning_rate": 1.6461892114928819e-06, - "loss": 0.7891, - "step": 34889 - }, - { - "epoch": 0.89, - "learning_rate": 1.6461680937848116e-06, - "loss": 0.7979, - "step": 34890 - }, - { - "epoch": 0.89, - "learning_rate": 1.6461469755820006e-06, - "loss": 0.7354, - "step": 34891 - }, - { - "epoch": 0.89, - "learning_rate": 1.6461258568844642e-06, - "loss": 0.9004, - "step": 34892 - }, - { - "epoch": 0.89, - "learning_rate": 1.646104737692219e-06, - "loss": 1.0283, - "step": 34893 - }, - { - "epoch": 0.89, - "learning_rate": 1.6460836180052815e-06, - "loss": 0.8711, - "step": 34894 - }, - { - "epoch": 0.89, - "learning_rate": 1.6460624978236671e-06, - "loss": 1.0186, - "step": 34895 - }, - { - "epoch": 0.89, - "learning_rate": 1.6460413771473927e-06, - "loss": 1.04, - "step": 34896 - }, - { - "epoch": 0.89, - "learning_rate": 1.6460202559764737e-06, - "loss": 0.9912, - "step": 34897 - }, - { - "epoch": 0.89, - "learning_rate": 1.645999134310927e-06, - "loss": 0.8896, - "step": 34898 - }, - { - "epoch": 0.89, - "learning_rate": 1.6459780121507683e-06, - "loss": 0.8164, - "step": 34899 - }, - { - "epoch": 0.89, - "learning_rate": 1.6459568894960138e-06, - "loss": 0.8887, - "step": 34900 - }, - { - "epoch": 0.89, - "learning_rate": 1.64593576634668e-06, - "loss": 0.7109, - "step": 34901 - }, - { - "epoch": 0.89, - "learning_rate": 1.6459146427027828e-06, - "loss": 0.9346, - "step": 34902 - }, - { - "epoch": 0.89, - "learning_rate": 1.6458935185643386e-06, - "loss": 0.7253, - "step": 34903 - }, - { - "epoch": 0.89, - "learning_rate": 1.6458723939313634e-06, - "loss": 0.8721, - "step": 34904 - }, - { - "epoch": 0.89, - "learning_rate": 1.6458512688038735e-06, - "loss": 0.6919, - "step": 34905 - }, - { - "epoch": 0.89, - "learning_rate": 1.6458301431818846e-06, - "loss": 0.7217, - "step": 34906 - }, - { - "epoch": 0.89, - "learning_rate": 1.6458090170654138e-06, - "loss": 0.7236, - "step": 34907 - }, - { - "epoch": 0.89, - "learning_rate": 1.6457878904544763e-06, - "loss": 0.7695, - "step": 34908 - }, - { - "epoch": 0.89, - "learning_rate": 1.6457667633490888e-06, - "loss": 0.8394, - "step": 34909 - }, - { - "epoch": 0.89, - "learning_rate": 1.6457456357492676e-06, - "loss": 0.8887, - "step": 34910 - }, - { - "epoch": 0.89, - "learning_rate": 1.6457245076550286e-06, - "loss": 0.8555, - "step": 34911 - }, - { - "epoch": 0.89, - "learning_rate": 1.6457033790663877e-06, - "loss": 0.7651, - "step": 34912 - }, - { - "epoch": 0.89, - "learning_rate": 1.6456822499833615e-06, - "loss": 0.9336, - "step": 34913 - }, - { - "epoch": 0.89, - "learning_rate": 1.6456611204059666e-06, - "loss": 0.5151, - "step": 34914 - }, - { - "epoch": 0.89, - "learning_rate": 1.6456399903342182e-06, - "loss": 0.9258, - "step": 34915 - }, - { - "epoch": 0.89, - "learning_rate": 1.6456188597681328e-06, - "loss": 0.6289, - "step": 34916 - }, - { - "epoch": 0.89, - "learning_rate": 1.645597728707727e-06, - "loss": 0.6133, - "step": 34917 - }, - { - "epoch": 0.89, - "learning_rate": 1.6455765971530168e-06, - "loss": 0.8037, - "step": 34918 - }, - { - "epoch": 0.89, - "learning_rate": 1.6455554651040183e-06, - "loss": 1.0088, - "step": 34919 - }, - { - "epoch": 0.9, - "learning_rate": 1.6455343325607474e-06, - "loss": 0.8232, - "step": 34920 - }, - { - "epoch": 0.9, - "learning_rate": 1.6455131995232206e-06, - "loss": 0.9209, - "step": 34921 - }, - { - "epoch": 0.9, - "learning_rate": 1.645492065991454e-06, - "loss": 0.6553, - "step": 34922 - }, - { - "epoch": 0.9, - "learning_rate": 1.6454709319654641e-06, - "loss": 0.9639, - "step": 34923 - }, - { - "epoch": 0.9, - "learning_rate": 1.6454497974452667e-06, - "loss": 0.9736, - "step": 34924 - }, - { - "epoch": 0.9, - "learning_rate": 1.6454286624308778e-06, - "loss": 0.9287, - "step": 34925 - }, - { - "epoch": 0.9, - "learning_rate": 1.6454075269223138e-06, - "loss": 0.9844, - "step": 34926 - }, - { - "epoch": 0.9, - "learning_rate": 1.645386390919591e-06, - "loss": 0.875, - "step": 34927 - }, - { - "epoch": 0.9, - "learning_rate": 1.6453652544227259e-06, - "loss": 0.917, - "step": 34928 - }, - { - "epoch": 0.9, - "learning_rate": 1.6453441174317342e-06, - "loss": 0.8345, - "step": 34929 - }, - { - "epoch": 0.9, - "learning_rate": 1.645322979946632e-06, - "loss": 0.7578, - "step": 34930 - }, - { - "epoch": 0.9, - "learning_rate": 1.6453018419674357e-06, - "loss": 0.877, - "step": 34931 - }, - { - "epoch": 0.9, - "learning_rate": 1.6452807034941613e-06, - "loss": 0.8271, - "step": 34932 - }, - { - "epoch": 0.9, - "learning_rate": 1.6452595645268255e-06, - "loss": 0.7957, - "step": 34933 - }, - { - "epoch": 0.9, - "learning_rate": 1.6452384250654438e-06, - "loss": 0.8311, - "step": 34934 - }, - { - "epoch": 0.9, - "learning_rate": 1.645217285110033e-06, - "loss": 0.7666, - "step": 34935 - }, - { - "epoch": 0.9, - "learning_rate": 1.6451961446606085e-06, - "loss": 0.9668, - "step": 34936 - }, - { - "epoch": 0.9, - "learning_rate": 1.6451750037171875e-06, - "loss": 0.73, - "step": 34937 - }, - { - "epoch": 0.9, - "learning_rate": 1.6451538622797854e-06, - "loss": 0.8271, - "step": 34938 - }, - { - "epoch": 0.9, - "learning_rate": 1.6451327203484186e-06, - "loss": 0.811, - "step": 34939 - }, - { - "epoch": 0.9, - "learning_rate": 1.6451115779231036e-06, - "loss": 0.9697, - "step": 34940 - }, - { - "epoch": 0.9, - "learning_rate": 1.6450904350038562e-06, - "loss": 0.9014, - "step": 34941 - }, - { - "epoch": 0.9, - "learning_rate": 1.6450692915906924e-06, - "loss": 0.6943, - "step": 34942 - }, - { - "epoch": 0.9, - "learning_rate": 1.645048147683629e-06, - "loss": 0.9424, - "step": 34943 - }, - { - "epoch": 0.9, - "learning_rate": 1.6450270032826821e-06, - "loss": 0.7573, - "step": 34944 - }, - { - "epoch": 0.9, - "learning_rate": 1.6450058583878674e-06, - "loss": 0.8887, - "step": 34945 - }, - { - "epoch": 0.9, - "learning_rate": 1.6449847129992013e-06, - "loss": 0.8252, - "step": 34946 - }, - { - "epoch": 0.9, - "learning_rate": 1.6449635671167004e-06, - "loss": 0.7979, - "step": 34947 - }, - { - "epoch": 0.9, - "learning_rate": 1.6449424207403801e-06, - "loss": 0.8125, - "step": 34948 - }, - { - "epoch": 0.9, - "learning_rate": 1.6449212738702576e-06, - "loss": 0.7891, - "step": 34949 - }, - { - "epoch": 0.9, - "learning_rate": 1.6449001265063482e-06, - "loss": 0.8945, - "step": 34950 - }, - { - "epoch": 0.9, - "learning_rate": 1.6448789786486685e-06, - "loss": 0.9248, - "step": 34951 - }, - { - "epoch": 0.9, - "learning_rate": 1.6448578302972345e-06, - "loss": 0.8105, - "step": 34952 - }, - { - "epoch": 0.9, - "learning_rate": 1.6448366814520624e-06, - "loss": 0.9453, - "step": 34953 - }, - { - "epoch": 0.9, - "learning_rate": 1.644815532113169e-06, - "loss": 0.9961, - "step": 34954 - }, - { - "epoch": 0.9, - "learning_rate": 1.6447943822805694e-06, - "loss": 0.7529, - "step": 34955 - }, - { - "epoch": 0.9, - "learning_rate": 1.6447732319542808e-06, - "loss": 0.7104, - "step": 34956 - }, - { - "epoch": 0.9, - "learning_rate": 1.6447520811343187e-06, - "loss": 0.8809, - "step": 34957 - }, - { - "epoch": 0.9, - "learning_rate": 1.6447309298207e-06, - "loss": 0.7803, - "step": 34958 - }, - { - "epoch": 0.9, - "learning_rate": 1.6447097780134403e-06, - "loss": 1.1113, - "step": 34959 - }, - { - "epoch": 0.9, - "learning_rate": 1.644688625712556e-06, - "loss": 1.0791, - "step": 34960 - }, - { - "epoch": 0.9, - "learning_rate": 1.6446674729180629e-06, - "loss": 0.7656, - "step": 34961 - }, - { - "epoch": 0.9, - "learning_rate": 1.6446463196299779e-06, - "loss": 0.9141, - "step": 34962 - }, - { - "epoch": 0.9, - "learning_rate": 1.6446251658483169e-06, - "loss": 1.0156, - "step": 34963 - }, - { - "epoch": 0.9, - "learning_rate": 1.6446040115730957e-06, - "loss": 0.9404, - "step": 34964 - }, - { - "epoch": 0.9, - "learning_rate": 1.6445828568043312e-06, - "loss": 0.7363, - "step": 34965 - }, - { - "epoch": 0.9, - "learning_rate": 1.644561701542039e-06, - "loss": 0.8369, - "step": 34966 - }, - { - "epoch": 0.9, - "learning_rate": 1.6445405457862354e-06, - "loss": 0.7876, - "step": 34967 - }, - { - "epoch": 0.9, - "learning_rate": 1.6445193895369372e-06, - "loss": 0.8857, - "step": 34968 - }, - { - "epoch": 0.9, - "learning_rate": 1.64449823279416e-06, - "loss": 0.7725, - "step": 34969 - }, - { - "epoch": 0.9, - "learning_rate": 1.6444770755579201e-06, - "loss": 0.5283, - "step": 34970 - }, - { - "epoch": 0.9, - "learning_rate": 1.6444559178282336e-06, - "loss": 0.7793, - "step": 34971 - }, - { - "epoch": 0.9, - "learning_rate": 1.6444347596051168e-06, - "loss": 1.0898, - "step": 34972 - }, - { - "epoch": 0.9, - "learning_rate": 1.6444136008885861e-06, - "loss": 0.9209, - "step": 34973 - }, - { - "epoch": 0.9, - "learning_rate": 1.6443924416786577e-06, - "loss": 0.9746, - "step": 34974 - }, - { - "epoch": 0.9, - "learning_rate": 1.6443712819753474e-06, - "loss": 0.6064, - "step": 34975 - }, - { - "epoch": 0.9, - "learning_rate": 1.6443501217786718e-06, - "loss": 0.8652, - "step": 34976 - }, - { - "epoch": 0.9, - "learning_rate": 1.6443289610886467e-06, - "loss": 0.8184, - "step": 34977 - }, - { - "epoch": 0.9, - "learning_rate": 1.6443077999052886e-06, - "loss": 0.7471, - "step": 34978 - }, - { - "epoch": 0.9, - "learning_rate": 1.6442866382286139e-06, - "loss": 1.0234, - "step": 34979 - }, - { - "epoch": 0.9, - "learning_rate": 1.6442654760586382e-06, - "loss": 0.876, - "step": 34980 - }, - { - "epoch": 0.9, - "learning_rate": 1.644244313395378e-06, - "loss": 0.916, - "step": 34981 - }, - { - "epoch": 0.9, - "learning_rate": 1.64422315023885e-06, - "loss": 0.8325, - "step": 34982 - }, - { - "epoch": 0.9, - "learning_rate": 1.6442019865890698e-06, - "loss": 0.7144, - "step": 34983 - }, - { - "epoch": 0.9, - "learning_rate": 1.6441808224460537e-06, - "loss": 1.0293, - "step": 34984 - }, - { - "epoch": 0.9, - "learning_rate": 1.6441596578098179e-06, - "loss": 0.8545, - "step": 34985 - }, - { - "epoch": 0.9, - "learning_rate": 1.6441384926803785e-06, - "loss": 0.7983, - "step": 34986 - }, - { - "epoch": 0.9, - "learning_rate": 1.6441173270577521e-06, - "loss": 0.8203, - "step": 34987 - }, - { - "epoch": 0.9, - "learning_rate": 1.6440961609419545e-06, - "loss": 0.7812, - "step": 34988 - }, - { - "epoch": 0.9, - "learning_rate": 1.6440749943330025e-06, - "loss": 0.9209, - "step": 34989 - }, - { - "epoch": 0.9, - "learning_rate": 1.6440538272309117e-06, - "loss": 1.1465, - "step": 34990 - }, - { - "epoch": 0.9, - "learning_rate": 1.6440326596356983e-06, - "loss": 0.8779, - "step": 34991 - }, - { - "epoch": 0.9, - "learning_rate": 1.6440114915473789e-06, - "loss": 0.9116, - "step": 34992 - }, - { - "epoch": 0.9, - "learning_rate": 1.6439903229659696e-06, - "loss": 0.8906, - "step": 34993 - }, - { - "epoch": 0.9, - "learning_rate": 1.6439691538914864e-06, - "loss": 0.9287, - "step": 34994 - }, - { - "epoch": 0.9, - "learning_rate": 1.6439479843239457e-06, - "loss": 0.7588, - "step": 34995 - }, - { - "epoch": 0.9, - "learning_rate": 1.6439268142633634e-06, - "loss": 0.7314, - "step": 34996 - }, - { - "epoch": 0.9, - "learning_rate": 1.6439056437097559e-06, - "loss": 0.8369, - "step": 34997 - }, - { - "epoch": 0.9, - "learning_rate": 1.6438844726631396e-06, - "loss": 0.9453, - "step": 34998 - }, - { - "epoch": 0.9, - "learning_rate": 1.643863301123531e-06, - "loss": 0.7656, - "step": 34999 - }, - { - "epoch": 0.9, - "learning_rate": 1.6438421290909452e-06, - "loss": 0.9951, - "step": 35000 - }, - { - "epoch": 0.9, - "learning_rate": 1.6438209565653996e-06, - "loss": 0.8135, - "step": 35001 - }, - { - "epoch": 0.9, - "learning_rate": 1.6437997835469095e-06, - "loss": 0.7607, - "step": 35002 - }, - { - "epoch": 0.9, - "learning_rate": 1.643778610035492e-06, - "loss": 0.8057, - "step": 35003 - }, - { - "epoch": 0.9, - "learning_rate": 1.6437574360311624e-06, - "loss": 1.0967, - "step": 35004 - }, - { - "epoch": 0.9, - "learning_rate": 1.6437362615339371e-06, - "loss": 0.8838, - "step": 35005 - }, - { - "epoch": 0.9, - "learning_rate": 1.6437150865438332e-06, - "loss": 0.8555, - "step": 35006 - }, - { - "epoch": 0.9, - "learning_rate": 1.6436939110608655e-06, - "loss": 0.957, - "step": 35007 - }, - { - "epoch": 0.9, - "learning_rate": 1.643672735085052e-06, - "loss": 0.8291, - "step": 35008 - }, - { - "epoch": 0.9, - "learning_rate": 1.6436515586164071e-06, - "loss": 0.6753, - "step": 35009 - }, - { - "epoch": 0.9, - "learning_rate": 1.643630381654948e-06, - "loss": 0.7783, - "step": 35010 - }, - { - "epoch": 0.9, - "learning_rate": 1.6436092042006906e-06, - "loss": 0.8076, - "step": 35011 - }, - { - "epoch": 0.9, - "learning_rate": 1.6435880262536512e-06, - "loss": 0.7256, - "step": 35012 - }, - { - "epoch": 0.9, - "learning_rate": 1.6435668478138466e-06, - "loss": 0.7852, - "step": 35013 - }, - { - "epoch": 0.9, - "learning_rate": 1.6435456688812917e-06, - "loss": 0.8643, - "step": 35014 - }, - { - "epoch": 0.9, - "learning_rate": 1.6435244894560038e-06, - "loss": 0.8613, - "step": 35015 - }, - { - "epoch": 0.9, - "learning_rate": 1.6435033095379988e-06, - "loss": 0.7842, - "step": 35016 - }, - { - "epoch": 0.9, - "learning_rate": 1.6434821291272928e-06, - "loss": 0.6729, - "step": 35017 - }, - { - "epoch": 0.9, - "learning_rate": 1.6434609482239024e-06, - "loss": 0.8096, - "step": 35018 - }, - { - "epoch": 0.9, - "learning_rate": 1.6434397668278433e-06, - "loss": 0.9668, - "step": 35019 - }, - { - "epoch": 0.9, - "learning_rate": 1.643418584939132e-06, - "loss": 0.9766, - "step": 35020 - }, - { - "epoch": 0.9, - "learning_rate": 1.6433974025577847e-06, - "loss": 0.6406, - "step": 35021 - }, - { - "epoch": 0.9, - "learning_rate": 1.6433762196838174e-06, - "loss": 0.6526, - "step": 35022 - }, - { - "epoch": 0.9, - "learning_rate": 1.643355036317247e-06, - "loss": 0.8003, - "step": 35023 - }, - { - "epoch": 0.9, - "learning_rate": 1.643333852458089e-06, - "loss": 0.8828, - "step": 35024 - }, - { - "epoch": 0.9, - "learning_rate": 1.6433126681063596e-06, - "loss": 0.998, - "step": 35025 - }, - { - "epoch": 0.9, - "learning_rate": 1.6432914832620753e-06, - "loss": 0.7227, - "step": 35026 - }, - { - "epoch": 0.9, - "learning_rate": 1.6432702979252526e-06, - "loss": 0.8828, - "step": 35027 - }, - { - "epoch": 0.9, - "learning_rate": 1.643249112095907e-06, - "loss": 0.8691, - "step": 35028 - }, - { - "epoch": 0.9, - "learning_rate": 1.6432279257740555e-06, - "loss": 0.8994, - "step": 35029 - }, - { - "epoch": 0.9, - "learning_rate": 1.643206738959714e-06, - "loss": 0.9229, - "step": 35030 - }, - { - "epoch": 0.9, - "learning_rate": 1.6431855516528983e-06, - "loss": 0.9502, - "step": 35031 - }, - { - "epoch": 0.9, - "learning_rate": 1.6431643638536252e-06, - "loss": 1.0684, - "step": 35032 - }, - { - "epoch": 0.9, - "learning_rate": 1.6431431755619109e-06, - "loss": 0.7749, - "step": 35033 - }, - { - "epoch": 0.9, - "learning_rate": 1.6431219867777712e-06, - "loss": 0.6562, - "step": 35034 - }, - { - "epoch": 0.9, - "learning_rate": 1.6431007975012225e-06, - "loss": 0.873, - "step": 35035 - }, - { - "epoch": 0.9, - "learning_rate": 1.6430796077322812e-06, - "loss": 0.6775, - "step": 35036 - }, - { - "epoch": 0.9, - "learning_rate": 1.6430584174709635e-06, - "loss": 0.8301, - "step": 35037 - }, - { - "epoch": 0.9, - "learning_rate": 1.6430372267172854e-06, - "loss": 0.6914, - "step": 35038 - }, - { - "epoch": 0.9, - "learning_rate": 1.6430160354712635e-06, - "loss": 0.5869, - "step": 35039 - }, - { - "epoch": 0.9, - "learning_rate": 1.6429948437329135e-06, - "loss": 0.6592, - "step": 35040 - }, - { - "epoch": 0.9, - "learning_rate": 1.642973651502252e-06, - "loss": 0.7432, - "step": 35041 - }, - { - "epoch": 0.9, - "learning_rate": 1.6429524587792952e-06, - "loss": 0.6467, - "step": 35042 - }, - { - "epoch": 0.9, - "learning_rate": 1.6429312655640596e-06, - "loss": 0.958, - "step": 35043 - }, - { - "epoch": 0.9, - "learning_rate": 1.6429100718565606e-06, - "loss": 0.3379, - "step": 35044 - }, - { - "epoch": 0.9, - "learning_rate": 1.642888877656815e-06, - "loss": 0.646, - "step": 35045 - }, - { - "epoch": 0.9, - "learning_rate": 1.642867682964839e-06, - "loss": 0.8315, - "step": 35046 - }, - { - "epoch": 0.9, - "learning_rate": 1.6428464877806488e-06, - "loss": 0.6299, - "step": 35047 - }, - { - "epoch": 0.9, - "learning_rate": 1.6428252921042605e-06, - "loss": 0.9131, - "step": 35048 - }, - { - "epoch": 0.9, - "learning_rate": 1.6428040959356905e-06, - "loss": 0.7612, - "step": 35049 - }, - { - "epoch": 0.9, - "learning_rate": 1.6427828992749548e-06, - "loss": 0.5732, - "step": 35050 - }, - { - "epoch": 0.9, - "learning_rate": 1.6427617021220701e-06, - "loss": 0.8301, - "step": 35051 - }, - { - "epoch": 0.9, - "learning_rate": 1.642740504477052e-06, - "loss": 1.0225, - "step": 35052 - }, - { - "epoch": 0.9, - "learning_rate": 1.6427193063399174e-06, - "loss": 0.8838, - "step": 35053 - }, - { - "epoch": 0.9, - "learning_rate": 1.642698107710682e-06, - "loss": 0.8428, - "step": 35054 - }, - { - "epoch": 0.9, - "learning_rate": 1.6426769085893622e-06, - "loss": 0.9756, - "step": 35055 - }, - { - "epoch": 0.9, - "learning_rate": 1.6426557089759742e-06, - "loss": 0.7627, - "step": 35056 - }, - { - "epoch": 0.9, - "learning_rate": 1.6426345088705343e-06, - "loss": 0.9775, - "step": 35057 - }, - { - "epoch": 0.9, - "learning_rate": 1.6426133082730588e-06, - "loss": 0.5925, - "step": 35058 - }, - { - "epoch": 0.9, - "learning_rate": 1.6425921071835637e-06, - "loss": 0.9707, - "step": 35059 - }, - { - "epoch": 0.9, - "learning_rate": 1.6425709056020657e-06, - "loss": 0.8047, - "step": 35060 - }, - { - "epoch": 0.9, - "learning_rate": 1.6425497035285805e-06, - "loss": 0.9521, - "step": 35061 - }, - { - "epoch": 0.9, - "learning_rate": 1.6425285009631243e-06, - "loss": 0.71, - "step": 35062 - }, - { - "epoch": 0.9, - "learning_rate": 1.642507297905714e-06, - "loss": 0.835, - "step": 35063 - }, - { - "epoch": 0.9, - "learning_rate": 1.6424860943563653e-06, - "loss": 0.6899, - "step": 35064 - }, - { - "epoch": 0.9, - "learning_rate": 1.6424648903150942e-06, - "loss": 0.875, - "step": 35065 - }, - { - "epoch": 0.9, - "learning_rate": 1.6424436857819174e-06, - "loss": 0.8311, - "step": 35066 - }, - { - "epoch": 0.9, - "learning_rate": 1.642422480756851e-06, - "loss": 0.9268, - "step": 35067 - }, - { - "epoch": 0.9, - "learning_rate": 1.6424012752399117e-06, - "loss": 0.7451, - "step": 35068 - }, - { - "epoch": 0.9, - "learning_rate": 1.6423800692311148e-06, - "loss": 0.6836, - "step": 35069 - }, - { - "epoch": 0.9, - "learning_rate": 1.642358862730477e-06, - "loss": 0.8379, - "step": 35070 - }, - { - "epoch": 0.9, - "learning_rate": 1.6423376557380148e-06, - "loss": 0.7139, - "step": 35071 - }, - { - "epoch": 0.9, - "learning_rate": 1.6423164482537438e-06, - "loss": 0.9766, - "step": 35072 - }, - { - "epoch": 0.9, - "learning_rate": 1.6422952402776811e-06, - "loss": 0.9619, - "step": 35073 - }, - { - "epoch": 0.9, - "learning_rate": 1.6422740318098423e-06, - "loss": 0.7158, - "step": 35074 - }, - { - "epoch": 0.9, - "learning_rate": 1.642252822850244e-06, - "loss": 0.875, - "step": 35075 - }, - { - "epoch": 0.9, - "learning_rate": 1.642231613398902e-06, - "loss": 0.7471, - "step": 35076 - }, - { - "epoch": 0.9, - "learning_rate": 1.6422104034558325e-06, - "loss": 0.9561, - "step": 35077 - }, - { - "epoch": 0.9, - "learning_rate": 1.6421891930210526e-06, - "loss": 0.834, - "step": 35078 - }, - { - "epoch": 0.9, - "learning_rate": 1.6421679820945778e-06, - "loss": 0.958, - "step": 35079 - }, - { - "epoch": 0.9, - "learning_rate": 1.6421467706764242e-06, - "loss": 0.9248, - "step": 35080 - }, - { - "epoch": 0.9, - "learning_rate": 1.6421255587666085e-06, - "loss": 0.8599, - "step": 35081 - }, - { - "epoch": 0.9, - "learning_rate": 1.642104346365147e-06, - "loss": 0.8594, - "step": 35082 - }, - { - "epoch": 0.9, - "learning_rate": 1.6420831334720555e-06, - "loss": 0.8574, - "step": 35083 - }, - { - "epoch": 0.9, - "learning_rate": 1.6420619200873508e-06, - "loss": 1.0703, - "step": 35084 - }, - { - "epoch": 0.9, - "learning_rate": 1.6420407062110484e-06, - "loss": 0.5884, - "step": 35085 - }, - { - "epoch": 0.9, - "learning_rate": 1.6420194918431652e-06, - "loss": 0.7832, - "step": 35086 - }, - { - "epoch": 0.9, - "learning_rate": 1.6419982769837168e-06, - "loss": 0.877, - "step": 35087 - }, - { - "epoch": 0.9, - "learning_rate": 1.6419770616327205e-06, - "loss": 0.4651, - "step": 35088 - }, - { - "epoch": 0.9, - "learning_rate": 1.6419558457901915e-06, - "loss": 0.7671, - "step": 35089 - }, - { - "epoch": 0.9, - "learning_rate": 1.6419346294561463e-06, - "loss": 0.5342, - "step": 35090 - }, - { - "epoch": 0.9, - "learning_rate": 1.6419134126306013e-06, - "loss": 0.7769, - "step": 35091 - }, - { - "epoch": 0.9, - "learning_rate": 1.641892195313573e-06, - "loss": 0.48, - "step": 35092 - }, - { - "epoch": 0.9, - "learning_rate": 1.6418709775050772e-06, - "loss": 0.8687, - "step": 35093 - }, - { - "epoch": 0.9, - "learning_rate": 1.6418497592051303e-06, - "loss": 0.8564, - "step": 35094 - }, - { - "epoch": 0.9, - "learning_rate": 1.6418285404137486e-06, - "loss": 0.9385, - "step": 35095 - }, - { - "epoch": 0.9, - "learning_rate": 1.641807321130948e-06, - "loss": 1.0312, - "step": 35096 - }, - { - "epoch": 0.9, - "learning_rate": 1.6417861013567453e-06, - "loss": 0.7178, - "step": 35097 - }, - { - "epoch": 0.9, - "learning_rate": 1.6417648810911567e-06, - "loss": 0.8867, - "step": 35098 - }, - { - "epoch": 0.9, - "learning_rate": 1.6417436603341978e-06, - "loss": 0.7117, - "step": 35099 - }, - { - "epoch": 0.9, - "learning_rate": 1.6417224390858854e-06, - "loss": 0.626, - "step": 35100 - }, - { - "epoch": 0.9, - "learning_rate": 1.641701217346236e-06, - "loss": 0.7852, - "step": 35101 - }, - { - "epoch": 0.9, - "learning_rate": 1.6416799951152651e-06, - "loss": 0.6909, - "step": 35102 - }, - { - "epoch": 0.9, - "learning_rate": 1.6416587723929894e-06, - "loss": 0.8916, - "step": 35103 - }, - { - "epoch": 0.9, - "learning_rate": 1.6416375491794253e-06, - "loss": 0.8369, - "step": 35104 - }, - { - "epoch": 0.9, - "learning_rate": 1.6416163254745887e-06, - "loss": 0.7222, - "step": 35105 - }, - { - "epoch": 0.9, - "learning_rate": 1.641595101278496e-06, - "loss": 1.0264, - "step": 35106 - }, - { - "epoch": 0.9, - "learning_rate": 1.6415738765911633e-06, - "loss": 0.8701, - "step": 35107 - }, - { - "epoch": 0.9, - "learning_rate": 1.6415526514126073e-06, - "loss": 0.9453, - "step": 35108 - }, - { - "epoch": 0.9, - "learning_rate": 1.6415314257428437e-06, - "loss": 1.0361, - "step": 35109 - }, - { - "epoch": 0.9, - "learning_rate": 1.6415101995818889e-06, - "loss": 0.8223, - "step": 35110 - }, - { - "epoch": 0.9, - "learning_rate": 1.6414889729297594e-06, - "loss": 0.8555, - "step": 35111 - }, - { - "epoch": 0.9, - "learning_rate": 1.6414677457864712e-06, - "loss": 1.0156, - "step": 35112 - }, - { - "epoch": 0.9, - "learning_rate": 1.641446518152041e-06, - "loss": 1.0029, - "step": 35113 - }, - { - "epoch": 0.9, - "learning_rate": 1.641425290026484e-06, - "loss": 0.8262, - "step": 35114 - }, - { - "epoch": 0.9, - "learning_rate": 1.6414040614098177e-06, - "loss": 0.8252, - "step": 35115 - }, - { - "epoch": 0.9, - "learning_rate": 1.6413828323020575e-06, - "loss": 0.7471, - "step": 35116 - }, - { - "epoch": 0.9, - "learning_rate": 1.64136160270322e-06, - "loss": 0.8896, - "step": 35117 - }, - { - "epoch": 0.9, - "learning_rate": 1.6413403726133215e-06, - "loss": 1.083, - "step": 35118 - }, - { - "epoch": 0.9, - "learning_rate": 1.6413191420323783e-06, - "loss": 0.8398, - "step": 35119 - }, - { - "epoch": 0.9, - "learning_rate": 1.6412979109604063e-06, - "loss": 0.7324, - "step": 35120 - }, - { - "epoch": 0.9, - "learning_rate": 1.6412766793974222e-06, - "loss": 0.958, - "step": 35121 - }, - { - "epoch": 0.9, - "learning_rate": 1.6412554473434417e-06, - "loss": 0.9941, - "step": 35122 - }, - { - "epoch": 0.9, - "learning_rate": 1.6412342147984817e-06, - "loss": 0.9204, - "step": 35123 - }, - { - "epoch": 0.9, - "learning_rate": 1.641212981762558e-06, - "loss": 0.8154, - "step": 35124 - }, - { - "epoch": 0.9, - "learning_rate": 1.641191748235687e-06, - "loss": 0.6792, - "step": 35125 - }, - { - "epoch": 0.9, - "learning_rate": 1.6411705142178849e-06, - "loss": 1.0547, - "step": 35126 - }, - { - "epoch": 0.9, - "learning_rate": 1.6411492797091682e-06, - "loss": 0.7646, - "step": 35127 - }, - { - "epoch": 0.9, - "learning_rate": 1.641128044709553e-06, - "loss": 0.8301, - "step": 35128 - }, - { - "epoch": 0.9, - "learning_rate": 1.6411068092190555e-06, - "loss": 1.1201, - "step": 35129 - }, - { - "epoch": 0.9, - "learning_rate": 1.6410855732376918e-06, - "loss": 1.1445, - "step": 35130 - }, - { - "epoch": 0.9, - "learning_rate": 1.6410643367654781e-06, - "loss": 0.8301, - "step": 35131 - }, - { - "epoch": 0.9, - "learning_rate": 1.6410430998024314e-06, - "loss": 0.8975, - "step": 35132 - }, - { - "epoch": 0.9, - "learning_rate": 1.6410218623485673e-06, - "loss": 0.7217, - "step": 35133 - }, - { - "epoch": 0.9, - "learning_rate": 1.6410006244039026e-06, - "loss": 0.7178, - "step": 35134 - }, - { - "epoch": 0.9, - "learning_rate": 1.640979385968453e-06, - "loss": 0.9736, - "step": 35135 - }, - { - "epoch": 0.9, - "learning_rate": 1.6409581470422347e-06, - "loss": 0.9141, - "step": 35136 - }, - { - "epoch": 0.9, - "learning_rate": 1.6409369076252642e-06, - "loss": 0.9121, - "step": 35137 - }, - { - "epoch": 0.9, - "learning_rate": 1.6409156677175583e-06, - "loss": 0.7339, - "step": 35138 - }, - { - "epoch": 0.9, - "learning_rate": 1.6408944273191322e-06, - "loss": 0.875, - "step": 35139 - }, - { - "epoch": 0.9, - "learning_rate": 1.640873186430003e-06, - "loss": 0.9023, - "step": 35140 - }, - { - "epoch": 0.9, - "learning_rate": 1.6408519450501866e-06, - "loss": 0.7695, - "step": 35141 - }, - { - "epoch": 0.9, - "learning_rate": 1.640830703179699e-06, - "loss": 1.082, - "step": 35142 - }, - { - "epoch": 0.9, - "learning_rate": 1.6408094608185572e-06, - "loss": 0.5334, - "step": 35143 - }, - { - "epoch": 0.9, - "learning_rate": 1.6407882179667769e-06, - "loss": 0.8467, - "step": 35144 - }, - { - "epoch": 0.9, - "learning_rate": 1.6407669746243745e-06, - "loss": 0.8125, - "step": 35145 - }, - { - "epoch": 0.9, - "learning_rate": 1.6407457307913663e-06, - "loss": 0.9092, - "step": 35146 - }, - { - "epoch": 0.9, - "learning_rate": 1.6407244864677688e-06, - "loss": 0.8594, - "step": 35147 - }, - { - "epoch": 0.9, - "learning_rate": 1.6407032416535978e-06, - "loss": 0.9941, - "step": 35148 - }, - { - "epoch": 0.9, - "learning_rate": 1.64068199634887e-06, - "loss": 0.877, - "step": 35149 - }, - { - "epoch": 0.9, - "learning_rate": 1.6406607505536012e-06, - "loss": 0.7666, - "step": 35150 - }, - { - "epoch": 0.9, - "learning_rate": 1.640639504267808e-06, - "loss": 0.9551, - "step": 35151 - }, - { - "epoch": 0.9, - "learning_rate": 1.6406182574915066e-06, - "loss": 0.8115, - "step": 35152 - }, - { - "epoch": 0.9, - "learning_rate": 1.6405970102247134e-06, - "loss": 0.8945, - "step": 35153 - }, - { - "epoch": 0.9, - "learning_rate": 1.6405757624674444e-06, - "loss": 0.9175, - "step": 35154 - }, - { - "epoch": 0.9, - "learning_rate": 1.6405545142197159e-06, - "loss": 0.9521, - "step": 35155 - }, - { - "epoch": 0.9, - "learning_rate": 1.6405332654815442e-06, - "loss": 0.7378, - "step": 35156 - }, - { - "epoch": 0.9, - "learning_rate": 1.6405120162529458e-06, - "loss": 0.9805, - "step": 35157 - }, - { - "epoch": 0.9, - "learning_rate": 1.640490766533937e-06, - "loss": 0.8486, - "step": 35158 - }, - { - "epoch": 0.9, - "learning_rate": 1.6404695163245334e-06, - "loss": 0.9004, - "step": 35159 - }, - { - "epoch": 0.9, - "learning_rate": 1.640448265624752e-06, - "loss": 0.874, - "step": 35160 - }, - { - "epoch": 0.9, - "learning_rate": 1.640427014434609e-06, - "loss": 0.9014, - "step": 35161 - }, - { - "epoch": 0.9, - "learning_rate": 1.6404057627541201e-06, - "loss": 1.0771, - "step": 35162 - }, - { - "epoch": 0.9, - "learning_rate": 1.6403845105833024e-06, - "loss": 0.8486, - "step": 35163 - }, - { - "epoch": 0.9, - "learning_rate": 1.6403632579221713e-06, - "loss": 0.9482, - "step": 35164 - }, - { - "epoch": 0.9, - "learning_rate": 1.6403420047707438e-06, - "loss": 0.8516, - "step": 35165 - }, - { - "epoch": 0.9, - "learning_rate": 1.6403207511290353e-06, - "loss": 0.835, - "step": 35166 - }, - { - "epoch": 0.9, - "learning_rate": 1.640299496997063e-06, - "loss": 0.6279, - "step": 35167 - }, - { - "epoch": 0.9, - "learning_rate": 1.640278242374843e-06, - "loss": 0.9033, - "step": 35168 - }, - { - "epoch": 0.9, - "learning_rate": 1.6402569872623912e-06, - "loss": 0.9727, - "step": 35169 - }, - { - "epoch": 0.9, - "learning_rate": 1.6402357316597244e-06, - "loss": 0.7549, - "step": 35170 - }, - { - "epoch": 0.9, - "learning_rate": 1.640214475566858e-06, - "loss": 0.7939, - "step": 35171 - }, - { - "epoch": 0.9, - "learning_rate": 1.6401932189838092e-06, - "loss": 0.6001, - "step": 35172 - }, - { - "epoch": 0.9, - "learning_rate": 1.640171961910594e-06, - "loss": 0.8008, - "step": 35173 - }, - { - "epoch": 0.9, - "learning_rate": 1.6401507043472283e-06, - "loss": 1.0166, - "step": 35174 - }, - { - "epoch": 0.9, - "learning_rate": 1.6401294462937284e-06, - "loss": 0.9346, - "step": 35175 - }, - { - "epoch": 0.9, - "learning_rate": 1.6401081877501113e-06, - "loss": 0.8838, - "step": 35176 - }, - { - "epoch": 0.9, - "learning_rate": 1.6400869287163925e-06, - "loss": 0.9092, - "step": 35177 - }, - { - "epoch": 0.9, - "learning_rate": 1.6400656691925889e-06, - "loss": 0.7393, - "step": 35178 - }, - { - "epoch": 0.9, - "learning_rate": 1.6400444091787161e-06, - "loss": 1.2139, - "step": 35179 - }, - { - "epoch": 0.9, - "learning_rate": 1.6400231486747908e-06, - "loss": 0.7891, - "step": 35180 - }, - { - "epoch": 0.9, - "learning_rate": 1.6400018876808296e-06, - "loss": 0.7551, - "step": 35181 - }, - { - "epoch": 0.9, - "learning_rate": 1.6399806261968477e-06, - "loss": 1.0254, - "step": 35182 - }, - { - "epoch": 0.9, - "learning_rate": 1.6399593642228626e-06, - "loss": 0.958, - "step": 35183 - }, - { - "epoch": 0.9, - "learning_rate": 1.6399381017588896e-06, - "loss": 0.8828, - "step": 35184 - }, - { - "epoch": 0.9, - "learning_rate": 1.6399168388049458e-06, - "loss": 0.9053, - "step": 35185 - }, - { - "epoch": 0.9, - "learning_rate": 1.6398955753610468e-06, - "loss": 0.7695, - "step": 35186 - }, - { - "epoch": 0.9, - "learning_rate": 1.6398743114272096e-06, - "loss": 0.6487, - "step": 35187 - }, - { - "epoch": 0.9, - "learning_rate": 1.6398530470034495e-06, - "loss": 0.8638, - "step": 35188 - }, - { - "epoch": 0.9, - "learning_rate": 1.6398317820897838e-06, - "loss": 0.7881, - "step": 35189 - }, - { - "epoch": 0.9, - "learning_rate": 1.6398105166862282e-06, - "loss": 0.6929, - "step": 35190 - }, - { - "epoch": 0.9, - "learning_rate": 1.6397892507927988e-06, - "loss": 0.9883, - "step": 35191 - }, - { - "epoch": 0.9, - "learning_rate": 1.6397679844095125e-06, - "loss": 0.8896, - "step": 35192 - }, - { - "epoch": 0.9, - "learning_rate": 1.6397467175363854e-06, - "loss": 0.7725, - "step": 35193 - }, - { - "epoch": 0.9, - "learning_rate": 1.6397254501734335e-06, - "loss": 0.7021, - "step": 35194 - }, - { - "epoch": 0.9, - "learning_rate": 1.6397041823206732e-06, - "loss": 0.8457, - "step": 35195 - }, - { - "epoch": 0.9, - "learning_rate": 1.6396829139781207e-06, - "loss": 0.958, - "step": 35196 - }, - { - "epoch": 0.9, - "learning_rate": 1.6396616451457926e-06, - "loss": 0.6938, - "step": 35197 - }, - { - "epoch": 0.9, - "learning_rate": 1.639640375823705e-06, - "loss": 0.9014, - "step": 35198 - }, - { - "epoch": 0.9, - "learning_rate": 1.6396191060118743e-06, - "loss": 0.9434, - "step": 35199 - }, - { - "epoch": 0.9, - "learning_rate": 1.6395978357103163e-06, - "loss": 0.8936, - "step": 35200 - }, - { - "epoch": 0.9, - "learning_rate": 1.6395765649190477e-06, - "loss": 0.6826, - "step": 35201 - }, - { - "epoch": 0.9, - "learning_rate": 1.639555293638085e-06, - "loss": 0.8564, - "step": 35202 - }, - { - "epoch": 0.9, - "learning_rate": 1.639534021867444e-06, - "loss": 0.6855, - "step": 35203 - }, - { - "epoch": 0.9, - "learning_rate": 1.6395127496071415e-06, - "loss": 0.8877, - "step": 35204 - }, - { - "epoch": 0.9, - "learning_rate": 1.6394914768571932e-06, - "loss": 0.7603, - "step": 35205 - }, - { - "epoch": 0.9, - "learning_rate": 1.6394702036176157e-06, - "loss": 1.0459, - "step": 35206 - }, - { - "epoch": 0.9, - "learning_rate": 1.6394489298884254e-06, - "loss": 0.7656, - "step": 35207 - }, - { - "epoch": 0.9, - "learning_rate": 1.6394276556696384e-06, - "loss": 0.8232, - "step": 35208 - }, - { - "epoch": 0.9, - "learning_rate": 1.639406380961271e-06, - "loss": 0.8125, - "step": 35209 - }, - { - "epoch": 0.9, - "learning_rate": 1.6393851057633397e-06, - "loss": 0.9463, - "step": 35210 - }, - { - "epoch": 0.9, - "learning_rate": 1.6393638300758603e-06, - "loss": 0.7568, - "step": 35211 - }, - { - "epoch": 0.9, - "learning_rate": 1.6393425538988498e-06, - "loss": 0.6707, - "step": 35212 - }, - { - "epoch": 0.9, - "learning_rate": 1.639321277232324e-06, - "loss": 0.8809, - "step": 35213 - }, - { - "epoch": 0.9, - "learning_rate": 1.639300000076299e-06, - "loss": 0.6279, - "step": 35214 - }, - { - "epoch": 0.9, - "learning_rate": 1.6392787224307917e-06, - "loss": 0.9902, - "step": 35215 - }, - { - "epoch": 0.9, - "learning_rate": 1.6392574442958177e-06, - "loss": 0.814, - "step": 35216 - }, - { - "epoch": 0.9, - "learning_rate": 1.639236165671394e-06, - "loss": 1.0566, - "step": 35217 - }, - { - "epoch": 0.9, - "learning_rate": 1.6392148865575367e-06, - "loss": 0.9414, - "step": 35218 - }, - { - "epoch": 0.9, - "learning_rate": 1.6391936069542616e-06, - "loss": 0.8169, - "step": 35219 - }, - { - "epoch": 0.9, - "learning_rate": 1.6391723268615855e-06, - "loss": 0.8765, - "step": 35220 - }, - { - "epoch": 0.9, - "learning_rate": 1.6391510462795247e-06, - "loss": 0.8145, - "step": 35221 - }, - { - "epoch": 0.9, - "learning_rate": 1.639129765208095e-06, - "loss": 0.9492, - "step": 35222 - }, - { - "epoch": 0.9, - "learning_rate": 1.6391084836473132e-06, - "loss": 0.917, - "step": 35223 - }, - { - "epoch": 0.9, - "learning_rate": 1.6390872015971955e-06, - "loss": 0.9219, - "step": 35224 - }, - { - "epoch": 0.9, - "learning_rate": 1.6390659190577577e-06, - "loss": 0.6758, - "step": 35225 - }, - { - "epoch": 0.9, - "learning_rate": 1.639044636029017e-06, - "loss": 0.8525, - "step": 35226 - }, - { - "epoch": 0.9, - "learning_rate": 1.639023352510989e-06, - "loss": 0.6753, - "step": 35227 - }, - { - "epoch": 0.9, - "learning_rate": 1.6390020685036905e-06, - "loss": 0.834, - "step": 35228 - }, - { - "epoch": 0.9, - "learning_rate": 1.6389807840071372e-06, - "loss": 0.8604, - "step": 35229 - }, - { - "epoch": 0.9, - "learning_rate": 1.6389594990213457e-06, - "loss": 0.8936, - "step": 35230 - }, - { - "epoch": 0.9, - "learning_rate": 1.6389382135463323e-06, - "loss": 0.8555, - "step": 35231 - }, - { - "epoch": 0.9, - "learning_rate": 1.6389169275821132e-06, - "loss": 0.9258, - "step": 35232 - }, - { - "epoch": 0.9, - "learning_rate": 1.638895641128705e-06, - "loss": 0.667, - "step": 35233 - }, - { - "epoch": 0.9, - "learning_rate": 1.6388743541861239e-06, - "loss": 0.8975, - "step": 35234 - }, - { - "epoch": 0.9, - "learning_rate": 1.6388530667543856e-06, - "loss": 0.9277, - "step": 35235 - }, - { - "epoch": 0.9, - "learning_rate": 1.638831778833507e-06, - "loss": 0.9922, - "step": 35236 - }, - { - "epoch": 0.9, - "learning_rate": 1.6388104904235046e-06, - "loss": 0.7549, - "step": 35237 - }, - { - "epoch": 0.9, - "learning_rate": 1.6387892015243945e-06, - "loss": 0.7266, - "step": 35238 - }, - { - "epoch": 0.9, - "learning_rate": 1.6387679121361925e-06, - "loss": 0.8374, - "step": 35239 - }, - { - "epoch": 0.9, - "learning_rate": 1.6387466222589153e-06, - "loss": 0.8779, - "step": 35240 - }, - { - "epoch": 0.9, - "learning_rate": 1.6387253318925791e-06, - "loss": 0.793, - "step": 35241 - }, - { - "epoch": 0.9, - "learning_rate": 1.6387040410372007e-06, - "loss": 1.0479, - "step": 35242 - }, - { - "epoch": 0.9, - "learning_rate": 1.6386827496927957e-06, - "loss": 1.1123, - "step": 35243 - }, - { - "epoch": 0.9, - "learning_rate": 1.6386614578593807e-06, - "loss": 0.8643, - "step": 35244 - }, - { - "epoch": 0.9, - "learning_rate": 1.638640165536972e-06, - "loss": 0.6284, - "step": 35245 - }, - { - "epoch": 0.9, - "learning_rate": 1.638618872725586e-06, - "loss": 0.9121, - "step": 35246 - }, - { - "epoch": 0.9, - "learning_rate": 1.6385975794252388e-06, - "loss": 1.0576, - "step": 35247 - }, - { - "epoch": 0.9, - "learning_rate": 1.6385762856359467e-06, - "loss": 0.6167, - "step": 35248 - }, - { - "epoch": 0.9, - "learning_rate": 1.6385549913577261e-06, - "loss": 0.7773, - "step": 35249 - }, - { - "epoch": 0.9, - "learning_rate": 1.6385336965905934e-06, - "loss": 0.7881, - "step": 35250 - }, - { - "epoch": 0.9, - "learning_rate": 1.6385124013345647e-06, - "loss": 0.8721, - "step": 35251 - }, - { - "epoch": 0.9, - "learning_rate": 1.6384911055896566e-06, - "loss": 0.958, - "step": 35252 - }, - { - "epoch": 0.9, - "learning_rate": 1.638469809355885e-06, - "loss": 0.8545, - "step": 35253 - }, - { - "epoch": 0.9, - "learning_rate": 1.6384485126332667e-06, - "loss": 0.9082, - "step": 35254 - }, - { - "epoch": 0.9, - "learning_rate": 1.6384272154218177e-06, - "loss": 0.5962, - "step": 35255 - }, - { - "epoch": 0.9, - "learning_rate": 1.6384059177215544e-06, - "loss": 0.7417, - "step": 35256 - }, - { - "epoch": 0.9, - "learning_rate": 1.6383846195324926e-06, - "loss": 0.7163, - "step": 35257 - }, - { - "epoch": 0.9, - "learning_rate": 1.6383633208546495e-06, - "loss": 0.783, - "step": 35258 - }, - { - "epoch": 0.9, - "learning_rate": 1.6383420216880408e-06, - "loss": 0.8193, - "step": 35259 - }, - { - "epoch": 0.9, - "learning_rate": 1.6383207220326826e-06, - "loss": 0.7417, - "step": 35260 - }, - { - "epoch": 0.9, - "learning_rate": 1.638299421888592e-06, - "loss": 1.0186, - "step": 35261 - }, - { - "epoch": 0.9, - "learning_rate": 1.6382781212557849e-06, - "loss": 0.4438, - "step": 35262 - }, - { - "epoch": 0.9, - "learning_rate": 1.6382568201342775e-06, - "loss": 0.916, - "step": 35263 - }, - { - "epoch": 0.9, - "learning_rate": 1.638235518524086e-06, - "loss": 1.0137, - "step": 35264 - }, - { - "epoch": 0.9, - "learning_rate": 1.6382142164252272e-06, - "loss": 0.9717, - "step": 35265 - }, - { - "epoch": 0.9, - "learning_rate": 1.6381929138377171e-06, - "loss": 0.915, - "step": 35266 - }, - { - "epoch": 0.9, - "learning_rate": 1.638171610761572e-06, - "loss": 0.8047, - "step": 35267 - }, - { - "epoch": 0.9, - "learning_rate": 1.6381503071968084e-06, - "loss": 0.6865, - "step": 35268 - }, - { - "epoch": 0.9, - "learning_rate": 1.638129003143442e-06, - "loss": 0.8506, - "step": 35269 - }, - { - "epoch": 0.9, - "learning_rate": 1.63810769860149e-06, - "loss": 0.8213, - "step": 35270 - }, - { - "epoch": 0.9, - "learning_rate": 1.6380863935709679e-06, - "loss": 0.7297, - "step": 35271 - }, - { - "epoch": 0.9, - "learning_rate": 1.6380650880518924e-06, - "loss": 0.9199, - "step": 35272 - }, - { - "epoch": 0.9, - "learning_rate": 1.6380437820442804e-06, - "loss": 0.8174, - "step": 35273 - }, - { - "epoch": 0.9, - "learning_rate": 1.638022475548147e-06, - "loss": 0.6479, - "step": 35274 - }, - { - "epoch": 0.9, - "learning_rate": 1.6380011685635092e-06, - "loss": 0.8662, - "step": 35275 - }, - { - "epoch": 0.9, - "learning_rate": 1.6379798610903834e-06, - "loss": 0.6294, - "step": 35276 - }, - { - "epoch": 0.9, - "learning_rate": 1.6379585531287856e-06, - "loss": 0.8584, - "step": 35277 - }, - { - "epoch": 0.9, - "learning_rate": 1.6379372446787328e-06, - "loss": 0.9453, - "step": 35278 - }, - { - "epoch": 0.9, - "learning_rate": 1.6379159357402402e-06, - "loss": 0.6133, - "step": 35279 - }, - { - "epoch": 0.9, - "learning_rate": 1.637894626313325e-06, - "loss": 0.5513, - "step": 35280 - }, - { - "epoch": 0.9, - "learning_rate": 1.6378733163980028e-06, - "loss": 0.8242, - "step": 35281 - }, - { - "epoch": 0.9, - "learning_rate": 1.6378520059942906e-06, - "loss": 1.0186, - "step": 35282 - }, - { - "epoch": 0.9, - "learning_rate": 1.6378306951022048e-06, - "loss": 0.8779, - "step": 35283 - }, - { - "epoch": 0.9, - "learning_rate": 1.6378093837217609e-06, - "loss": 0.7441, - "step": 35284 - }, - { - "epoch": 0.9, - "learning_rate": 1.6377880718529758e-06, - "loss": 0.8027, - "step": 35285 - }, - { - "epoch": 0.9, - "learning_rate": 1.6377667594958658e-06, - "loss": 0.9824, - "step": 35286 - }, - { - "epoch": 0.9, - "learning_rate": 1.6377454466504469e-06, - "loss": 0.793, - "step": 35287 - }, - { - "epoch": 0.9, - "learning_rate": 1.6377241333167357e-06, - "loss": 0.7422, - "step": 35288 - }, - { - "epoch": 0.9, - "learning_rate": 1.6377028194947487e-06, - "loss": 0.9531, - "step": 35289 - }, - { - "epoch": 0.9, - "learning_rate": 1.6376815051845017e-06, - "loss": 0.8882, - "step": 35290 - }, - { - "epoch": 0.9, - "learning_rate": 1.6376601903860111e-06, - "loss": 0.8818, - "step": 35291 - }, - { - "epoch": 0.9, - "learning_rate": 1.6376388750992937e-06, - "loss": 0.8701, - "step": 35292 - }, - { - "epoch": 0.9, - "learning_rate": 1.637617559324366e-06, - "loss": 0.7676, - "step": 35293 - }, - { - "epoch": 0.9, - "learning_rate": 1.6375962430612433e-06, - "loss": 0.8018, - "step": 35294 - }, - { - "epoch": 0.9, - "learning_rate": 1.6375749263099424e-06, - "loss": 0.9248, - "step": 35295 - }, - { - "epoch": 0.9, - "learning_rate": 1.6375536090704799e-06, - "loss": 0.718, - "step": 35296 - }, - { - "epoch": 0.9, - "learning_rate": 1.6375322913428719e-06, - "loss": 0.9902, - "step": 35297 - }, - { - "epoch": 0.9, - "learning_rate": 1.6375109731271347e-06, - "loss": 0.8145, - "step": 35298 - }, - { - "epoch": 0.9, - "learning_rate": 1.6374896544232848e-06, - "loss": 1.0283, - "step": 35299 - }, - { - "epoch": 0.9, - "learning_rate": 1.637468335231338e-06, - "loss": 0.832, - "step": 35300 - }, - { - "epoch": 0.9, - "learning_rate": 1.6374470155513115e-06, - "loss": 0.9473, - "step": 35301 - }, - { - "epoch": 0.9, - "learning_rate": 1.637425695383221e-06, - "loss": 0.8516, - "step": 35302 - }, - { - "epoch": 0.9, - "learning_rate": 1.6374043747270827e-06, - "loss": 0.6699, - "step": 35303 - }, - { - "epoch": 0.9, - "learning_rate": 1.6373830535829135e-06, - "loss": 0.9316, - "step": 35304 - }, - { - "epoch": 0.9, - "learning_rate": 1.6373617319507288e-06, - "loss": 0.7463, - "step": 35305 - }, - { - "epoch": 0.9, - "learning_rate": 1.637340409830546e-06, - "loss": 0.6592, - "step": 35306 - }, - { - "epoch": 0.9, - "learning_rate": 1.637319087222381e-06, - "loss": 0.6699, - "step": 35307 - }, - { - "epoch": 0.9, - "learning_rate": 1.63729776412625e-06, - "loss": 0.8047, - "step": 35308 - }, - { - "epoch": 0.9, - "learning_rate": 1.6372764405421695e-06, - "loss": 0.5991, - "step": 35309 - }, - { - "epoch": 0.91, - "learning_rate": 1.6372551164701556e-06, - "loss": 0.8096, - "step": 35310 - }, - { - "epoch": 0.91, - "learning_rate": 1.6372337919102246e-06, - "loss": 0.6616, - "step": 35311 - }, - { - "epoch": 0.91, - "learning_rate": 1.6372124668623936e-06, - "loss": 0.7334, - "step": 35312 - }, - { - "epoch": 0.91, - "learning_rate": 1.6371911413266777e-06, - "loss": 1.0059, - "step": 35313 - }, - { - "epoch": 0.91, - "learning_rate": 1.6371698153030939e-06, - "loss": 1.0371, - "step": 35314 - }, - { - "epoch": 0.91, - "learning_rate": 1.6371484887916587e-06, - "loss": 0.8262, - "step": 35315 - }, - { - "epoch": 0.91, - "learning_rate": 1.637127161792388e-06, - "loss": 0.7812, - "step": 35316 - }, - { - "epoch": 0.91, - "learning_rate": 1.6371058343052986e-06, - "loss": 0.5088, - "step": 35317 - }, - { - "epoch": 0.91, - "learning_rate": 1.6370845063304065e-06, - "loss": 0.7944, - "step": 35318 - }, - { - "epoch": 0.91, - "learning_rate": 1.637063177867728e-06, - "loss": 0.7275, - "step": 35319 - }, - { - "epoch": 0.91, - "learning_rate": 1.6370418489172794e-06, - "loss": 0.6138, - "step": 35320 - }, - { - "epoch": 0.91, - "learning_rate": 1.6370205194790771e-06, - "loss": 0.9619, - "step": 35321 - }, - { - "epoch": 0.91, - "learning_rate": 1.6369991895531378e-06, - "loss": 0.9199, - "step": 35322 - }, - { - "epoch": 0.91, - "learning_rate": 1.636977859139477e-06, - "loss": 0.6738, - "step": 35323 - }, - { - "epoch": 0.91, - "learning_rate": 1.636956528238112e-06, - "loss": 1.0508, - "step": 35324 - }, - { - "epoch": 0.91, - "learning_rate": 1.6369351968490586e-06, - "loss": 0.8779, - "step": 35325 - }, - { - "epoch": 0.91, - "learning_rate": 1.636913864972333e-06, - "loss": 0.7002, - "step": 35326 - }, - { - "epoch": 0.91, - "learning_rate": 1.6368925326079521e-06, - "loss": 0.8887, - "step": 35327 - }, - { - "epoch": 0.91, - "learning_rate": 1.6368711997559318e-06, - "loss": 0.9912, - "step": 35328 - }, - { - "epoch": 0.91, - "learning_rate": 1.636849866416288e-06, - "loss": 0.8052, - "step": 35329 - }, - { - "epoch": 0.91, - "learning_rate": 1.636828532589038e-06, - "loss": 0.7588, - "step": 35330 - }, - { - "epoch": 0.91, - "learning_rate": 1.6368071982741975e-06, - "loss": 1.1348, - "step": 35331 - }, - { - "epoch": 0.91, - "learning_rate": 1.6367858634717834e-06, - "loss": 0.9883, - "step": 35332 - }, - { - "epoch": 0.91, - "learning_rate": 1.6367645281818114e-06, - "loss": 0.9189, - "step": 35333 - }, - { - "epoch": 0.91, - "learning_rate": 1.6367431924042978e-06, - "loss": 0.8887, - "step": 35334 - }, - { - "epoch": 0.91, - "learning_rate": 1.6367218561392594e-06, - "loss": 1.041, - "step": 35335 - }, - { - "epoch": 0.91, - "learning_rate": 1.6367005193867125e-06, - "loss": 0.75, - "step": 35336 - }, - { - "epoch": 0.91, - "learning_rate": 1.6366791821466733e-06, - "loss": 0.5796, - "step": 35337 - }, - { - "epoch": 0.91, - "learning_rate": 1.6366578444191582e-06, - "loss": 0.9961, - "step": 35338 - }, - { - "epoch": 0.91, - "learning_rate": 1.6366365062041832e-06, - "loss": 0.7666, - "step": 35339 - }, - { - "epoch": 0.91, - "learning_rate": 1.6366151675017647e-06, - "loss": 0.832, - "step": 35340 - }, - { - "epoch": 0.91, - "learning_rate": 1.6365938283119194e-06, - "loss": 0.9805, - "step": 35341 - }, - { - "epoch": 0.91, - "learning_rate": 1.6365724886346639e-06, - "loss": 0.6187, - "step": 35342 - }, - { - "epoch": 0.91, - "learning_rate": 1.6365511484700137e-06, - "loss": 0.7124, - "step": 35343 - }, - { - "epoch": 0.91, - "learning_rate": 1.6365298078179856e-06, - "loss": 0.7773, - "step": 35344 - }, - { - "epoch": 0.91, - "learning_rate": 1.6365084666785957e-06, - "loss": 0.9512, - "step": 35345 - }, - { - "epoch": 0.91, - "learning_rate": 1.636487125051861e-06, - "loss": 1.0723, - "step": 35346 - }, - { - "epoch": 0.91, - "learning_rate": 1.6364657829377973e-06, - "loss": 0.752, - "step": 35347 - }, - { - "epoch": 0.91, - "learning_rate": 1.636444440336421e-06, - "loss": 0.8281, - "step": 35348 - }, - { - "epoch": 0.91, - "learning_rate": 1.6364230972477482e-06, - "loss": 1.0254, - "step": 35349 - }, - { - "epoch": 0.91, - "learning_rate": 1.6364017536717954e-06, - "loss": 0.6978, - "step": 35350 - }, - { - "epoch": 0.91, - "learning_rate": 1.6363804096085793e-06, - "loss": 0.9697, - "step": 35351 - }, - { - "epoch": 0.91, - "learning_rate": 1.6363590650581162e-06, - "loss": 0.8291, - "step": 35352 - }, - { - "epoch": 0.91, - "learning_rate": 1.6363377200204221e-06, - "loss": 0.8062, - "step": 35353 - }, - { - "epoch": 0.91, - "learning_rate": 1.636316374495513e-06, - "loss": 0.9414, - "step": 35354 - }, - { - "epoch": 0.91, - "learning_rate": 1.636295028483406e-06, - "loss": 0.9502, - "step": 35355 - }, - { - "epoch": 0.91, - "learning_rate": 1.6362736819841172e-06, - "loss": 1.2451, - "step": 35356 - }, - { - "epoch": 0.91, - "learning_rate": 1.6362523349976631e-06, - "loss": 0.8867, - "step": 35357 - }, - { - "epoch": 0.91, - "learning_rate": 1.6362309875240597e-06, - "loss": 0.7905, - "step": 35358 - }, - { - "epoch": 0.91, - "learning_rate": 1.6362096395633233e-06, - "loss": 0.7852, - "step": 35359 - }, - { - "epoch": 0.91, - "learning_rate": 1.6361882911154706e-06, - "loss": 0.8164, - "step": 35360 - }, - { - "epoch": 0.91, - "learning_rate": 1.6361669421805178e-06, - "loss": 0.8916, - "step": 35361 - }, - { - "epoch": 0.91, - "learning_rate": 1.6361455927584813e-06, - "loss": 0.9141, - "step": 35362 - }, - { - "epoch": 0.91, - "learning_rate": 1.636124242849377e-06, - "loss": 0.832, - "step": 35363 - }, - { - "epoch": 0.91, - "learning_rate": 1.6361028924532221e-06, - "loss": 0.6985, - "step": 35364 - }, - { - "epoch": 0.91, - "learning_rate": 1.6360815415700322e-06, - "loss": 0.9185, - "step": 35365 - }, - { - "epoch": 0.91, - "learning_rate": 1.6360601901998239e-06, - "loss": 0.9404, - "step": 35366 - }, - { - "epoch": 0.91, - "learning_rate": 1.6360388383426135e-06, - "loss": 0.874, - "step": 35367 - }, - { - "epoch": 0.91, - "learning_rate": 1.6360174859984175e-06, - "loss": 1.0293, - "step": 35368 - }, - { - "epoch": 0.91, - "learning_rate": 1.6359961331672523e-06, - "loss": 0.709, - "step": 35369 - }, - { - "epoch": 0.91, - "learning_rate": 1.6359747798491338e-06, - "loss": 0.9492, - "step": 35370 - }, - { - "epoch": 0.91, - "learning_rate": 1.6359534260440789e-06, - "loss": 0.627, - "step": 35371 - }, - { - "epoch": 0.91, - "learning_rate": 1.6359320717521037e-06, - "loss": 0.8008, - "step": 35372 - }, - { - "epoch": 0.91, - "learning_rate": 1.6359107169732243e-06, - "loss": 0.9736, - "step": 35373 - }, - { - "epoch": 0.91, - "learning_rate": 1.6358893617074573e-06, - "loss": 0.9424, - "step": 35374 - }, - { - "epoch": 0.91, - "learning_rate": 1.6358680059548193e-06, - "loss": 0.7349, - "step": 35375 - }, - { - "epoch": 0.91, - "learning_rate": 1.6358466497153263e-06, - "loss": 0.6035, - "step": 35376 - }, - { - "epoch": 0.91, - "learning_rate": 1.635825292988995e-06, - "loss": 0.5889, - "step": 35377 - }, - { - "epoch": 0.91, - "learning_rate": 1.6358039357758414e-06, - "loss": 0.8428, - "step": 35378 - }, - { - "epoch": 0.91, - "learning_rate": 1.6357825780758816e-06, - "loss": 0.8252, - "step": 35379 - }, - { - "epoch": 0.91, - "learning_rate": 1.6357612198891327e-06, - "loss": 0.604, - "step": 35380 - }, - { - "epoch": 0.91, - "learning_rate": 1.6357398612156103e-06, - "loss": 0.8652, - "step": 35381 - }, - { - "epoch": 0.91, - "learning_rate": 1.6357185020553316e-06, - "loss": 0.7461, - "step": 35382 - }, - { - "epoch": 0.91, - "learning_rate": 1.6356971424083123e-06, - "loss": 0.6738, - "step": 35383 - }, - { - "epoch": 0.91, - "learning_rate": 1.6356757822745688e-06, - "loss": 0.9043, - "step": 35384 - }, - { - "epoch": 0.91, - "learning_rate": 1.6356544216541178e-06, - "loss": 0.5308, - "step": 35385 - }, - { - "epoch": 0.91, - "learning_rate": 1.6356330605469753e-06, - "loss": 1.0449, - "step": 35386 - }, - { - "epoch": 0.91, - "learning_rate": 1.6356116989531576e-06, - "loss": 0.8789, - "step": 35387 - }, - { - "epoch": 0.91, - "learning_rate": 1.6355903368726813e-06, - "loss": 0.9165, - "step": 35388 - }, - { - "epoch": 0.91, - "learning_rate": 1.6355689743055629e-06, - "loss": 0.8867, - "step": 35389 - }, - { - "epoch": 0.91, - "learning_rate": 1.6355476112518185e-06, - "loss": 0.7925, - "step": 35390 - }, - { - "epoch": 0.91, - "learning_rate": 1.6355262477114646e-06, - "loss": 0.8994, - "step": 35391 - }, - { - "epoch": 0.91, - "learning_rate": 1.6355048836845175e-06, - "loss": 0.7217, - "step": 35392 - }, - { - "epoch": 0.91, - "learning_rate": 1.6354835191709934e-06, - "loss": 0.918, - "step": 35393 - }, - { - "epoch": 0.91, - "learning_rate": 1.6354621541709088e-06, - "loss": 1.0449, - "step": 35394 - }, - { - "epoch": 0.91, - "learning_rate": 1.63544078868428e-06, - "loss": 0.9258, - "step": 35395 - }, - { - "epoch": 0.91, - "learning_rate": 1.6354194227111233e-06, - "loss": 0.8145, - "step": 35396 - }, - { - "epoch": 0.91, - "learning_rate": 1.6353980562514555e-06, - "loss": 0.7151, - "step": 35397 - }, - { - "epoch": 0.91, - "learning_rate": 1.6353766893052926e-06, - "loss": 0.8994, - "step": 35398 - }, - { - "epoch": 0.91, - "learning_rate": 1.635355321872651e-06, - "loss": 0.8379, - "step": 35399 - }, - { - "epoch": 0.91, - "learning_rate": 1.6353339539535463e-06, - "loss": 0.9141, - "step": 35400 - }, - { - "epoch": 0.91, - "learning_rate": 1.6353125855479963e-06, - "loss": 0.7471, - "step": 35401 - }, - { - "epoch": 0.91, - "learning_rate": 1.6352912166560166e-06, - "loss": 0.6362, - "step": 35402 - }, - { - "epoch": 0.91, - "learning_rate": 1.6352698472776236e-06, - "loss": 1.0439, - "step": 35403 - }, - { - "epoch": 0.91, - "learning_rate": 1.635248477412834e-06, - "loss": 0.9736, - "step": 35404 - }, - { - "epoch": 0.91, - "learning_rate": 1.6352271070616632e-06, - "loss": 0.8311, - "step": 35405 - }, - { - "epoch": 0.91, - "learning_rate": 1.6352057362241284e-06, - "loss": 0.8755, - "step": 35406 - }, - { - "epoch": 0.91, - "learning_rate": 1.6351843649002462e-06, - "loss": 0.8789, - "step": 35407 - }, - { - "epoch": 0.91, - "learning_rate": 1.6351629930900321e-06, - "loss": 0.7747, - "step": 35408 - }, - { - "epoch": 0.91, - "learning_rate": 1.6351416207935032e-06, - "loss": 0.7666, - "step": 35409 - }, - { - "epoch": 0.91, - "learning_rate": 1.6351202480106751e-06, - "loss": 0.75, - "step": 35410 - }, - { - "epoch": 0.91, - "learning_rate": 1.635098874741565e-06, - "loss": 0.7888, - "step": 35411 - }, - { - "epoch": 0.91, - "learning_rate": 1.635077500986189e-06, - "loss": 0.8242, - "step": 35412 - }, - { - "epoch": 0.91, - "learning_rate": 1.6350561267445632e-06, - "loss": 0.8098, - "step": 35413 - }, - { - "epoch": 0.91, - "learning_rate": 1.635034752016704e-06, - "loss": 0.876, - "step": 35414 - }, - { - "epoch": 0.91, - "learning_rate": 1.635013376802628e-06, - "loss": 0.9395, - "step": 35415 - }, - { - "epoch": 0.91, - "learning_rate": 1.6349920011023516e-06, - "loss": 0.8877, - "step": 35416 - }, - { - "epoch": 0.91, - "learning_rate": 1.634970624915891e-06, - "loss": 0.9424, - "step": 35417 - }, - { - "epoch": 0.91, - "learning_rate": 1.6349492482432623e-06, - "loss": 1.0205, - "step": 35418 - }, - { - "epoch": 0.91, - "learning_rate": 1.6349278710844822e-06, - "loss": 0.7061, - "step": 35419 - }, - { - "epoch": 0.91, - "learning_rate": 1.6349064934395673e-06, - "loss": 1.0098, - "step": 35420 - }, - { - "epoch": 0.91, - "learning_rate": 1.6348851153085336e-06, - "loss": 0.9414, - "step": 35421 - }, - { - "epoch": 0.91, - "learning_rate": 1.6348637366913976e-06, - "loss": 0.7305, - "step": 35422 - }, - { - "epoch": 0.91, - "learning_rate": 1.6348423575881753e-06, - "loss": 0.9062, - "step": 35423 - }, - { - "epoch": 0.91, - "learning_rate": 1.6348209779988837e-06, - "loss": 0.9131, - "step": 35424 - }, - { - "epoch": 0.91, - "learning_rate": 1.6347995979235388e-06, - "loss": 0.8496, - "step": 35425 - }, - { - "epoch": 0.91, - "learning_rate": 1.6347782173621568e-06, - "loss": 0.8398, - "step": 35426 - }, - { - "epoch": 0.91, - "learning_rate": 1.634756836314755e-06, - "loss": 0.8252, - "step": 35427 - }, - { - "epoch": 0.91, - "learning_rate": 1.6347354547813486e-06, - "loss": 0.7559, - "step": 35428 - }, - { - "epoch": 0.91, - "learning_rate": 1.6347140727619544e-06, - "loss": 0.8623, - "step": 35429 - }, - { - "epoch": 0.91, - "learning_rate": 1.6346926902565887e-06, - "loss": 0.8779, - "step": 35430 - }, - { - "epoch": 0.91, - "learning_rate": 1.6346713072652683e-06, - "loss": 0.5322, - "step": 35431 - }, - { - "epoch": 0.91, - "learning_rate": 1.634649923788009e-06, - "loss": 0.7314, - "step": 35432 - }, - { - "epoch": 0.91, - "learning_rate": 1.6346285398248276e-06, - "loss": 0.6641, - "step": 35433 - }, - { - "epoch": 0.91, - "learning_rate": 1.6346071553757404e-06, - "loss": 1.1748, - "step": 35434 - }, - { - "epoch": 0.91, - "learning_rate": 1.6345857704407636e-06, - "loss": 0.7227, - "step": 35435 - }, - { - "epoch": 0.91, - "learning_rate": 1.6345643850199136e-06, - "loss": 0.6941, - "step": 35436 - }, - { - "epoch": 0.91, - "learning_rate": 1.634542999113207e-06, - "loss": 1.0498, - "step": 35437 - }, - { - "epoch": 0.91, - "learning_rate": 1.6345216127206599e-06, - "loss": 0.8047, - "step": 35438 - }, - { - "epoch": 0.91, - "learning_rate": 1.6345002258422883e-06, - "loss": 0.8081, - "step": 35439 - }, - { - "epoch": 0.91, - "learning_rate": 1.6344788384781097e-06, - "loss": 0.7373, - "step": 35440 - }, - { - "epoch": 0.91, - "learning_rate": 1.6344574506281395e-06, - "loss": 0.8721, - "step": 35441 - }, - { - "epoch": 0.91, - "learning_rate": 1.6344360622923946e-06, - "loss": 0.9629, - "step": 35442 - }, - { - "epoch": 0.91, - "learning_rate": 1.634414673470891e-06, - "loss": 0.7539, - "step": 35443 - }, - { - "epoch": 0.91, - "learning_rate": 1.6343932841636455e-06, - "loss": 0.9111, - "step": 35444 - }, - { - "epoch": 0.91, - "learning_rate": 1.6343718943706742e-06, - "loss": 1.0186, - "step": 35445 - }, - { - "epoch": 0.91, - "learning_rate": 1.634350504091993e-06, - "loss": 0.9023, - "step": 35446 - }, - { - "epoch": 0.91, - "learning_rate": 1.6343291133276194e-06, - "loss": 0.8555, - "step": 35447 - }, - { - "epoch": 0.91, - "learning_rate": 1.634307722077569e-06, - "loss": 0.8428, - "step": 35448 - }, - { - "epoch": 0.91, - "learning_rate": 1.6342863303418582e-06, - "loss": 0.8301, - "step": 35449 - }, - { - "epoch": 0.91, - "learning_rate": 1.6342649381205036e-06, - "loss": 0.7861, - "step": 35450 - }, - { - "epoch": 0.91, - "learning_rate": 1.6342435454135215e-06, - "loss": 0.7803, - "step": 35451 - }, - { - "epoch": 0.91, - "learning_rate": 1.6342221522209285e-06, - "loss": 0.8311, - "step": 35452 - }, - { - "epoch": 0.91, - "learning_rate": 1.6342007585427403e-06, - "loss": 0.563, - "step": 35453 - }, - { - "epoch": 0.91, - "learning_rate": 1.634179364378974e-06, - "loss": 1.1055, - "step": 35454 - }, - { - "epoch": 0.91, - "learning_rate": 1.6341579697296459e-06, - "loss": 0.8311, - "step": 35455 - }, - { - "epoch": 0.91, - "learning_rate": 1.634136574594772e-06, - "loss": 1.0605, - "step": 35456 - }, - { - "epoch": 0.91, - "learning_rate": 1.6341151789743688e-06, - "loss": 0.9707, - "step": 35457 - }, - { - "epoch": 0.91, - "learning_rate": 1.634093782868453e-06, - "loss": 0.6287, - "step": 35458 - }, - { - "epoch": 0.91, - "learning_rate": 1.6340723862770405e-06, - "loss": 0.4653, - "step": 35459 - }, - { - "epoch": 0.91, - "learning_rate": 1.6340509892001479e-06, - "loss": 1.0098, - "step": 35460 - }, - { - "epoch": 0.91, - "learning_rate": 1.6340295916377917e-06, - "loss": 0.7383, - "step": 35461 - }, - { - "epoch": 0.91, - "learning_rate": 1.6340081935899886e-06, - "loss": 0.9365, - "step": 35462 - }, - { - "epoch": 0.91, - "learning_rate": 1.6339867950567542e-06, - "loss": 0.8193, - "step": 35463 - }, - { - "epoch": 0.91, - "learning_rate": 1.6339653960381052e-06, - "loss": 0.7471, - "step": 35464 - }, - { - "epoch": 0.91, - "learning_rate": 1.633943996534058e-06, - "loss": 0.8652, - "step": 35465 - }, - { - "epoch": 0.91, - "learning_rate": 1.6339225965446292e-06, - "loss": 0.7676, - "step": 35466 - }, - { - "epoch": 0.91, - "learning_rate": 1.6339011960698352e-06, - "loss": 0.8428, - "step": 35467 - }, - { - "epoch": 0.91, - "learning_rate": 1.6338797951096918e-06, - "loss": 1.0049, - "step": 35468 - }, - { - "epoch": 0.91, - "learning_rate": 1.6338583936642158e-06, - "loss": 0.9482, - "step": 35469 - }, - { - "epoch": 0.91, - "learning_rate": 1.6338369917334238e-06, - "loss": 0.7578, - "step": 35470 - }, - { - "epoch": 0.91, - "learning_rate": 1.633815589317332e-06, - "loss": 0.7822, - "step": 35471 - }, - { - "epoch": 0.91, - "learning_rate": 1.6337941864159567e-06, - "loss": 0.8022, - "step": 35472 - }, - { - "epoch": 0.91, - "learning_rate": 1.6337727830293143e-06, - "loss": 0.8906, - "step": 35473 - }, - { - "epoch": 0.91, - "learning_rate": 1.6337513791574211e-06, - "loss": 0.9551, - "step": 35474 - }, - { - "epoch": 0.91, - "learning_rate": 1.6337299748002937e-06, - "loss": 0.9546, - "step": 35475 - }, - { - "epoch": 0.91, - "learning_rate": 1.6337085699579485e-06, - "loss": 0.8076, - "step": 35476 - }, - { - "epoch": 0.91, - "learning_rate": 1.6336871646304019e-06, - "loss": 0.7793, - "step": 35477 - }, - { - "epoch": 0.91, - "learning_rate": 1.6336657588176697e-06, - "loss": 0.9414, - "step": 35478 - }, - { - "epoch": 0.91, - "learning_rate": 1.6336443525197691e-06, - "loss": 1.0723, - "step": 35479 - }, - { - "epoch": 0.91, - "learning_rate": 1.6336229457367158e-06, - "loss": 0.8447, - "step": 35480 - }, - { - "epoch": 0.91, - "learning_rate": 1.6336015384685272e-06, - "loss": 1.0527, - "step": 35481 - }, - { - "epoch": 0.91, - "learning_rate": 1.6335801307152188e-06, - "loss": 0.8271, - "step": 35482 - }, - { - "epoch": 0.91, - "learning_rate": 1.633558722476807e-06, - "loss": 0.8096, - "step": 35483 - }, - { - "epoch": 0.91, - "learning_rate": 1.6335373137533084e-06, - "loss": 0.9756, - "step": 35484 - }, - { - "epoch": 0.91, - "learning_rate": 1.6335159045447396e-06, - "loss": 0.8379, - "step": 35485 - }, - { - "epoch": 0.91, - "learning_rate": 1.6334944948511168e-06, - "loss": 0.7627, - "step": 35486 - }, - { - "epoch": 0.91, - "learning_rate": 1.6334730846724562e-06, - "loss": 0.835, - "step": 35487 - }, - { - "epoch": 0.91, - "learning_rate": 1.6334516740087746e-06, - "loss": 0.915, - "step": 35488 - }, - { - "epoch": 0.91, - "learning_rate": 1.633430262860088e-06, - "loss": 0.5811, - "step": 35489 - }, - { - "epoch": 0.91, - "learning_rate": 1.633408851226413e-06, - "loss": 0.8105, - "step": 35490 - }, - { - "epoch": 0.91, - "learning_rate": 1.633387439107766e-06, - "loss": 0.8496, - "step": 35491 - }, - { - "epoch": 0.91, - "learning_rate": 1.6333660265041639e-06, - "loss": 0.8721, - "step": 35492 - }, - { - "epoch": 0.91, - "learning_rate": 1.633344613415622e-06, - "loss": 0.9053, - "step": 35493 - }, - { - "epoch": 0.91, - "learning_rate": 1.633323199842157e-06, - "loss": 0.8701, - "step": 35494 - }, - { - "epoch": 0.91, - "learning_rate": 1.633301785783786e-06, - "loss": 0.8125, - "step": 35495 - }, - { - "epoch": 0.91, - "learning_rate": 1.6332803712405245e-06, - "loss": 0.5515, - "step": 35496 - }, - { - "epoch": 0.91, - "learning_rate": 1.6332589562123898e-06, - "loss": 0.8789, - "step": 35497 - }, - { - "epoch": 0.91, - "learning_rate": 1.633237540699398e-06, - "loss": 0.9326, - "step": 35498 - }, - { - "epoch": 0.91, - "learning_rate": 1.6332161247015645e-06, - "loss": 0.6948, - "step": 35499 - }, - { - "epoch": 0.91, - "learning_rate": 1.6331947082189074e-06, - "loss": 0.7959, - "step": 35500 - }, - { - "epoch": 0.91, - "learning_rate": 1.6331732912514418e-06, - "loss": 0.8047, - "step": 35501 - }, - { - "epoch": 0.91, - "learning_rate": 1.6331518737991846e-06, - "loss": 0.8091, - "step": 35502 - }, - { - "epoch": 0.91, - "learning_rate": 1.633130455862152e-06, - "loss": 0.6245, - "step": 35503 - }, - { - "epoch": 0.91, - "learning_rate": 1.6331090374403607e-06, - "loss": 1.0791, - "step": 35504 - }, - { - "epoch": 0.91, - "learning_rate": 1.6330876185338267e-06, - "loss": 0.8408, - "step": 35505 - }, - { - "epoch": 0.91, - "learning_rate": 1.6330661991425666e-06, - "loss": 0.8438, - "step": 35506 - }, - { - "epoch": 0.91, - "learning_rate": 1.6330447792665973e-06, - "loss": 0.8545, - "step": 35507 - }, - { - "epoch": 0.91, - "learning_rate": 1.6330233589059342e-06, - "loss": 0.8579, - "step": 35508 - }, - { - "epoch": 0.91, - "learning_rate": 1.6330019380605945e-06, - "loss": 0.7583, - "step": 35509 - }, - { - "epoch": 0.91, - "learning_rate": 1.6329805167305942e-06, - "loss": 0.7129, - "step": 35510 - }, - { - "epoch": 0.91, - "learning_rate": 1.6329590949159498e-06, - "loss": 1.1748, - "step": 35511 - }, - { - "epoch": 0.91, - "learning_rate": 1.6329376726166778e-06, - "loss": 0.7666, - "step": 35512 - }, - { - "epoch": 0.91, - "learning_rate": 1.6329162498327946e-06, - "loss": 0.874, - "step": 35513 - }, - { - "epoch": 0.91, - "learning_rate": 1.6328948265643166e-06, - "loss": 0.9346, - "step": 35514 - }, - { - "epoch": 0.91, - "learning_rate": 1.63287340281126e-06, - "loss": 0.7285, - "step": 35515 - }, - { - "epoch": 0.91, - "learning_rate": 1.6328519785736411e-06, - "loss": 0.7949, - "step": 35516 - }, - { - "epoch": 0.91, - "learning_rate": 1.6328305538514772e-06, - "loss": 0.7803, - "step": 35517 - }, - { - "epoch": 0.91, - "learning_rate": 1.6328091286447834e-06, - "loss": 0.8076, - "step": 35518 - }, - { - "epoch": 0.91, - "learning_rate": 1.6327877029535771e-06, - "loss": 0.9277, - "step": 35519 - }, - { - "epoch": 0.91, - "learning_rate": 1.632766276777874e-06, - "loss": 0.7212, - "step": 35520 - }, - { - "epoch": 0.91, - "learning_rate": 1.6327448501176911e-06, - "loss": 0.6763, - "step": 35521 - }, - { - "epoch": 0.91, - "learning_rate": 1.6327234229730444e-06, - "loss": 0.9785, - "step": 35522 - }, - { - "epoch": 0.91, - "learning_rate": 1.6327019953439506e-06, - "loss": 0.9385, - "step": 35523 - }, - { - "epoch": 0.91, - "learning_rate": 1.632680567230426e-06, - "loss": 0.8486, - "step": 35524 - }, - { - "epoch": 0.91, - "learning_rate": 1.632659138632487e-06, - "loss": 0.7944, - "step": 35525 - }, - { - "epoch": 0.91, - "learning_rate": 1.63263770955015e-06, - "loss": 0.8145, - "step": 35526 - }, - { - "epoch": 0.91, - "learning_rate": 1.6326162799834316e-06, - "loss": 0.6875, - "step": 35527 - }, - { - "epoch": 0.91, - "learning_rate": 1.6325948499323477e-06, - "loss": 0.8726, - "step": 35528 - }, - { - "epoch": 0.91, - "learning_rate": 1.6325734193969146e-06, - "loss": 0.6401, - "step": 35529 - }, - { - "epoch": 0.91, - "learning_rate": 1.6325519883771496e-06, - "loss": 0.8115, - "step": 35530 - }, - { - "epoch": 0.91, - "learning_rate": 1.6325305568730688e-06, - "loss": 0.9521, - "step": 35531 - }, - { - "epoch": 0.91, - "learning_rate": 1.6325091248846883e-06, - "loss": 0.8506, - "step": 35532 - }, - { - "epoch": 0.91, - "learning_rate": 1.6324876924120246e-06, - "loss": 0.7568, - "step": 35533 - }, - { - "epoch": 0.91, - "learning_rate": 1.6324662594550942e-06, - "loss": 0.8066, - "step": 35534 - }, - { - "epoch": 0.91, - "learning_rate": 1.6324448260139132e-06, - "loss": 0.7871, - "step": 35535 - }, - { - "epoch": 0.91, - "learning_rate": 1.6324233920884986e-06, - "loss": 1.0068, - "step": 35536 - }, - { - "epoch": 0.91, - "learning_rate": 1.6324019576788667e-06, - "loss": 0.8906, - "step": 35537 - }, - { - "epoch": 0.91, - "learning_rate": 1.632380522785033e-06, - "loss": 0.8379, - "step": 35538 - }, - { - "epoch": 0.91, - "learning_rate": 1.632359087407015e-06, - "loss": 0.8438, - "step": 35539 - }, - { - "epoch": 0.91, - "learning_rate": 1.6323376515448289e-06, - "loss": 0.6968, - "step": 35540 - }, - { - "epoch": 0.91, - "learning_rate": 1.6323162151984904e-06, - "loss": 0.8506, - "step": 35541 - }, - { - "epoch": 0.91, - "learning_rate": 1.632294778368017e-06, - "loss": 0.6729, - "step": 35542 - }, - { - "epoch": 0.91, - "learning_rate": 1.6322733410534245e-06, - "loss": 0.9268, - "step": 35543 - }, - { - "epoch": 0.91, - "learning_rate": 1.632251903254729e-06, - "loss": 0.7568, - "step": 35544 - }, - { - "epoch": 0.91, - "learning_rate": 1.6322304649719474e-06, - "loss": 0.9443, - "step": 35545 - }, - { - "epoch": 0.91, - "learning_rate": 1.6322090262050963e-06, - "loss": 1.0039, - "step": 35546 - }, - { - "epoch": 0.91, - "learning_rate": 1.6321875869541914e-06, - "loss": 0.8135, - "step": 35547 - }, - { - "epoch": 0.91, - "learning_rate": 1.6321661472192497e-06, - "loss": 0.8271, - "step": 35548 - }, - { - "epoch": 0.91, - "learning_rate": 1.6321447070002879e-06, - "loss": 0.8008, - "step": 35549 - }, - { - "epoch": 0.91, - "learning_rate": 1.6321232662973214e-06, - "loss": 0.8389, - "step": 35550 - }, - { - "epoch": 0.91, - "learning_rate": 1.6321018251103673e-06, - "loss": 0.7705, - "step": 35551 - }, - { - "epoch": 0.91, - "learning_rate": 1.632080383439442e-06, - "loss": 0.5488, - "step": 35552 - }, - { - "epoch": 0.91, - "learning_rate": 1.632058941284562e-06, - "loss": 0.9629, - "step": 35553 - }, - { - "epoch": 0.91, - "learning_rate": 1.6320374986457433e-06, - "loss": 0.8018, - "step": 35554 - }, - { - "epoch": 0.91, - "learning_rate": 1.6320160555230023e-06, - "loss": 0.917, - "step": 35555 - }, - { - "epoch": 0.91, - "learning_rate": 1.6319946119163559e-06, - "loss": 0.9116, - "step": 35556 - }, - { - "epoch": 0.91, - "learning_rate": 1.6319731678258207e-06, - "loss": 0.8687, - "step": 35557 - }, - { - "epoch": 0.91, - "learning_rate": 1.6319517232514122e-06, - "loss": 0.8975, - "step": 35558 - }, - { - "epoch": 0.91, - "learning_rate": 1.6319302781931472e-06, - "loss": 0.9082, - "step": 35559 - }, - { - "epoch": 0.91, - "learning_rate": 1.6319088326510427e-06, - "loss": 0.8062, - "step": 35560 - }, - { - "epoch": 0.91, - "learning_rate": 1.6318873866251143e-06, - "loss": 0.873, - "step": 35561 - }, - { - "epoch": 0.91, - "learning_rate": 1.6318659401153791e-06, - "loss": 0.9229, - "step": 35562 - }, - { - "epoch": 0.91, - "learning_rate": 1.6318444931218532e-06, - "loss": 0.8652, - "step": 35563 - }, - { - "epoch": 0.91, - "learning_rate": 1.6318230456445527e-06, - "loss": 0.8145, - "step": 35564 - }, - { - "epoch": 0.91, - "learning_rate": 1.6318015976834946e-06, - "loss": 0.8291, - "step": 35565 - }, - { - "epoch": 0.91, - "learning_rate": 1.6317801492386946e-06, - "loss": 0.7578, - "step": 35566 - }, - { - "epoch": 0.91, - "learning_rate": 1.6317587003101702e-06, - "loss": 0.8726, - "step": 35567 - }, - { - "epoch": 0.91, - "learning_rate": 1.6317372508979369e-06, - "loss": 0.696, - "step": 35568 - }, - { - "epoch": 0.91, - "learning_rate": 1.6317158010020115e-06, - "loss": 0.7939, - "step": 35569 - }, - { - "epoch": 0.91, - "learning_rate": 1.6316943506224104e-06, - "loss": 1.0225, - "step": 35570 - }, - { - "epoch": 0.91, - "learning_rate": 1.6316728997591497e-06, - "loss": 0.9287, - "step": 35571 - }, - { - "epoch": 0.91, - "learning_rate": 1.6316514484122465e-06, - "loss": 0.8486, - "step": 35572 - }, - { - "epoch": 0.91, - "learning_rate": 1.6316299965817168e-06, - "loss": 0.8721, - "step": 35573 - }, - { - "epoch": 0.91, - "learning_rate": 1.631608544267577e-06, - "loss": 0.8708, - "step": 35574 - }, - { - "epoch": 0.91, - "learning_rate": 1.6315870914698433e-06, - "loss": 0.6333, - "step": 35575 - }, - { - "epoch": 0.91, - "learning_rate": 1.6315656381885329e-06, - "loss": 0.6001, - "step": 35576 - }, - { - "epoch": 0.91, - "learning_rate": 1.6315441844236615e-06, - "loss": 0.8193, - "step": 35577 - }, - { - "epoch": 0.91, - "learning_rate": 1.6315227301752454e-06, - "loss": 0.584, - "step": 35578 - }, - { - "epoch": 0.91, - "learning_rate": 1.6315012754433017e-06, - "loss": 0.9424, - "step": 35579 - }, - { - "epoch": 0.91, - "learning_rate": 1.6314798202278466e-06, - "loss": 0.8613, - "step": 35580 - }, - { - "epoch": 0.91, - "learning_rate": 1.6314583645288962e-06, - "loss": 0.8975, - "step": 35581 - }, - { - "epoch": 0.91, - "learning_rate": 1.6314369083464676e-06, - "loss": 0.6929, - "step": 35582 - }, - { - "epoch": 0.91, - "learning_rate": 1.6314154516805766e-06, - "loss": 0.6714, - "step": 35583 - }, - { - "epoch": 0.91, - "learning_rate": 1.6313939945312396e-06, - "loss": 0.9443, - "step": 35584 - }, - { - "epoch": 0.91, - "learning_rate": 1.6313725368984731e-06, - "loss": 0.8579, - "step": 35585 - }, - { - "epoch": 0.91, - "learning_rate": 1.631351078782294e-06, - "loss": 0.9424, - "step": 35586 - }, - { - "epoch": 0.91, - "learning_rate": 1.6313296201827184e-06, - "loss": 0.8906, - "step": 35587 - }, - { - "epoch": 0.91, - "learning_rate": 1.631308161099763e-06, - "loss": 0.7988, - "step": 35588 - }, - { - "epoch": 0.91, - "learning_rate": 1.6312867015334434e-06, - "loss": 0.7666, - "step": 35589 - }, - { - "epoch": 0.91, - "learning_rate": 1.631265241483777e-06, - "loss": 0.8975, - "step": 35590 - }, - { - "epoch": 0.91, - "learning_rate": 1.6312437809507796e-06, - "loss": 1.0293, - "step": 35591 - }, - { - "epoch": 0.91, - "learning_rate": 1.6312223199344678e-06, - "loss": 0.8281, - "step": 35592 - }, - { - "epoch": 0.91, - "learning_rate": 1.6312008584348583e-06, - "loss": 0.8574, - "step": 35593 - }, - { - "epoch": 0.91, - "learning_rate": 1.6311793964519676e-06, - "loss": 0.6997, - "step": 35594 - }, - { - "epoch": 0.91, - "learning_rate": 1.6311579339858112e-06, - "loss": 0.7441, - "step": 35595 - }, - { - "epoch": 0.91, - "learning_rate": 1.6311364710364067e-06, - "loss": 0.9102, - "step": 35596 - }, - { - "epoch": 0.91, - "learning_rate": 1.6311150076037698e-06, - "loss": 0.7148, - "step": 35597 - }, - { - "epoch": 0.91, - "learning_rate": 1.631093543687917e-06, - "loss": 0.5958, - "step": 35598 - }, - { - "epoch": 0.91, - "learning_rate": 1.6310720792888653e-06, - "loss": 0.7622, - "step": 35599 - }, - { - "epoch": 0.91, - "learning_rate": 1.6310506144066306e-06, - "loss": 0.7656, - "step": 35600 - }, - { - "epoch": 0.91, - "learning_rate": 1.6310291490412296e-06, - "loss": 0.8262, - "step": 35601 - }, - { - "epoch": 0.91, - "learning_rate": 1.6310076831926781e-06, - "loss": 0.8037, - "step": 35602 - }, - { - "epoch": 0.91, - "learning_rate": 1.6309862168609936e-06, - "loss": 0.7012, - "step": 35603 - }, - { - "epoch": 0.91, - "learning_rate": 1.6309647500461914e-06, - "loss": 0.8545, - "step": 35604 - }, - { - "epoch": 0.91, - "learning_rate": 1.630943282748289e-06, - "loss": 0.6826, - "step": 35605 - }, - { - "epoch": 0.91, - "learning_rate": 1.6309218149673024e-06, - "loss": 0.75, - "step": 35606 - }, - { - "epoch": 0.91, - "learning_rate": 1.6309003467032473e-06, - "loss": 0.5825, - "step": 35607 - }, - { - "epoch": 0.91, - "learning_rate": 1.6308788779561412e-06, - "loss": 0.9102, - "step": 35608 - }, - { - "epoch": 0.91, - "learning_rate": 1.6308574087260004e-06, - "loss": 0.5508, - "step": 35609 - }, - { - "epoch": 0.91, - "learning_rate": 1.6308359390128408e-06, - "loss": 0.8662, - "step": 35610 - }, - { - "epoch": 0.91, - "learning_rate": 1.6308144688166792e-06, - "loss": 0.6008, - "step": 35611 - }, - { - "epoch": 0.91, - "learning_rate": 1.6307929981375318e-06, - "loss": 0.5984, - "step": 35612 - }, - { - "epoch": 0.91, - "learning_rate": 1.6307715269754154e-06, - "loss": 0.8604, - "step": 35613 - }, - { - "epoch": 0.91, - "learning_rate": 1.6307500553303463e-06, - "loss": 0.6636, - "step": 35614 - }, - { - "epoch": 0.91, - "learning_rate": 1.6307285832023406e-06, - "loss": 0.8506, - "step": 35615 - }, - { - "epoch": 0.91, - "learning_rate": 1.6307071105914156e-06, - "loss": 0.9365, - "step": 35616 - }, - { - "epoch": 0.91, - "learning_rate": 1.6306856374975868e-06, - "loss": 0.7803, - "step": 35617 - }, - { - "epoch": 0.91, - "learning_rate": 1.630664163920871e-06, - "loss": 0.7148, - "step": 35618 - }, - { - "epoch": 0.91, - "learning_rate": 1.6306426898612843e-06, - "loss": 0.8467, - "step": 35619 - }, - { - "epoch": 0.91, - "learning_rate": 1.6306212153188438e-06, - "loss": 0.9707, - "step": 35620 - }, - { - "epoch": 0.91, - "learning_rate": 1.630599740293566e-06, - "loss": 0.9668, - "step": 35621 - }, - { - "epoch": 0.91, - "learning_rate": 1.6305782647854666e-06, - "loss": 0.5068, - "step": 35622 - }, - { - "epoch": 0.91, - "learning_rate": 1.6305567887945623e-06, - "loss": 0.4688, - "step": 35623 - }, - { - "epoch": 0.91, - "learning_rate": 1.6305353123208701e-06, - "loss": 0.791, - "step": 35624 - }, - { - "epoch": 0.91, - "learning_rate": 1.6305138353644054e-06, - "loss": 0.916, - "step": 35625 - }, - { - "epoch": 0.91, - "learning_rate": 1.6304923579251857e-06, - "loss": 0.9521, - "step": 35626 - }, - { - "epoch": 0.91, - "learning_rate": 1.630470880003227e-06, - "loss": 0.7314, - "step": 35627 - }, - { - "epoch": 0.91, - "learning_rate": 1.6304494015985455e-06, - "loss": 0.832, - "step": 35628 - }, - { - "epoch": 0.91, - "learning_rate": 1.630427922711158e-06, - "loss": 1.0269, - "step": 35629 - }, - { - "epoch": 0.91, - "learning_rate": 1.630406443341081e-06, - "loss": 0.9424, - "step": 35630 - }, - { - "epoch": 0.91, - "learning_rate": 1.6303849634883305e-06, - "loss": 0.8984, - "step": 35631 - }, - { - "epoch": 0.91, - "learning_rate": 1.6303634831529232e-06, - "loss": 0.998, - "step": 35632 - }, - { - "epoch": 0.91, - "learning_rate": 1.6303420023348755e-06, - "loss": 0.8291, - "step": 35633 - }, - { - "epoch": 0.91, - "learning_rate": 1.6303205210342043e-06, - "loss": 0.8613, - "step": 35634 - }, - { - "epoch": 0.91, - "learning_rate": 1.6302990392509256e-06, - "loss": 0.752, - "step": 35635 - }, - { - "epoch": 0.91, - "learning_rate": 1.6302775569850555e-06, - "loss": 0.6558, - "step": 35636 - }, - { - "epoch": 0.91, - "learning_rate": 1.6302560742366112e-06, - "loss": 0.8335, - "step": 35637 - }, - { - "epoch": 0.91, - "learning_rate": 1.6302345910056085e-06, - "loss": 1.1309, - "step": 35638 - }, - { - "epoch": 0.91, - "learning_rate": 1.6302131072920645e-06, - "loss": 0.835, - "step": 35639 - }, - { - "epoch": 0.91, - "learning_rate": 1.6301916230959952e-06, - "loss": 0.6473, - "step": 35640 - }, - { - "epoch": 0.91, - "learning_rate": 1.6301701384174172e-06, - "loss": 0.8955, - "step": 35641 - }, - { - "epoch": 0.91, - "learning_rate": 1.630148653256347e-06, - "loss": 0.6694, - "step": 35642 - }, - { - "epoch": 0.91, - "learning_rate": 1.6301271676128004e-06, - "loss": 0.7979, - "step": 35643 - }, - { - "epoch": 0.91, - "learning_rate": 1.6301056814867947e-06, - "loss": 0.9648, - "step": 35644 - }, - { - "epoch": 0.91, - "learning_rate": 1.6300841948783462e-06, - "loss": 0.8062, - "step": 35645 - }, - { - "epoch": 0.91, - "learning_rate": 1.6300627077874713e-06, - "loss": 0.8516, - "step": 35646 - }, - { - "epoch": 0.91, - "learning_rate": 1.6300412202141861e-06, - "loss": 0.9443, - "step": 35647 - }, - { - "epoch": 0.91, - "learning_rate": 1.6300197321585075e-06, - "loss": 0.6758, - "step": 35648 - }, - { - "epoch": 0.91, - "learning_rate": 1.6299982436204514e-06, - "loss": 0.8359, - "step": 35649 - }, - { - "epoch": 0.91, - "learning_rate": 1.629976754600035e-06, - "loss": 0.7021, - "step": 35650 - }, - { - "epoch": 0.91, - "learning_rate": 1.6299552650972744e-06, - "loss": 1.0361, - "step": 35651 - }, - { - "epoch": 0.91, - "learning_rate": 1.6299337751121858e-06, - "loss": 0.8066, - "step": 35652 - }, - { - "epoch": 0.91, - "learning_rate": 1.629912284644786e-06, - "loss": 0.8516, - "step": 35653 - }, - { - "epoch": 0.91, - "learning_rate": 1.629890793695091e-06, - "loss": 0.8799, - "step": 35654 - }, - { - "epoch": 0.91, - "learning_rate": 1.6298693022631177e-06, - "loss": 0.8408, - "step": 35655 - }, - { - "epoch": 0.91, - "learning_rate": 1.6298478103488828e-06, - "loss": 0.6284, - "step": 35656 - }, - { - "epoch": 0.91, - "learning_rate": 1.629826317952402e-06, - "loss": 0.8643, - "step": 35657 - }, - { - "epoch": 0.91, - "learning_rate": 1.6298048250736924e-06, - "loss": 0.7539, - "step": 35658 - }, - { - "epoch": 0.91, - "learning_rate": 1.62978333171277e-06, - "loss": 0.7998, - "step": 35659 - }, - { - "epoch": 0.91, - "learning_rate": 1.6297618378696517e-06, - "loss": 0.7715, - "step": 35660 - }, - { - "epoch": 0.91, - "learning_rate": 1.6297403435443537e-06, - "loss": 0.7168, - "step": 35661 - }, - { - "epoch": 0.91, - "learning_rate": 1.6297188487368922e-06, - "loss": 0.7183, - "step": 35662 - }, - { - "epoch": 0.91, - "learning_rate": 1.629697353447284e-06, - "loss": 0.9443, - "step": 35663 - }, - { - "epoch": 0.91, - "learning_rate": 1.6296758576755459e-06, - "loss": 0.835, - "step": 35664 - }, - { - "epoch": 0.91, - "learning_rate": 1.6296543614216934e-06, - "loss": 0.8584, - "step": 35665 - }, - { - "epoch": 0.91, - "learning_rate": 1.6296328646857437e-06, - "loss": 0.6082, - "step": 35666 - }, - { - "epoch": 0.91, - "learning_rate": 1.6296113674677133e-06, - "loss": 1.0366, - "step": 35667 - }, - { - "epoch": 0.91, - "learning_rate": 1.6295898697676183e-06, - "loss": 0.8364, - "step": 35668 - }, - { - "epoch": 0.91, - "learning_rate": 1.629568371585475e-06, - "loss": 0.9385, - "step": 35669 - }, - { - "epoch": 0.91, - "learning_rate": 1.6295468729213004e-06, - "loss": 0.8662, - "step": 35670 - }, - { - "epoch": 0.91, - "learning_rate": 1.6295253737751108e-06, - "loss": 1.082, - "step": 35671 - }, - { - "epoch": 0.91, - "learning_rate": 1.6295038741469224e-06, - "loss": 0.6631, - "step": 35672 - }, - { - "epoch": 0.91, - "learning_rate": 1.629482374036752e-06, - "loss": 0.8848, - "step": 35673 - }, - { - "epoch": 0.91, - "learning_rate": 1.6294608734446155e-06, - "loss": 0.9609, - "step": 35674 - }, - { - "epoch": 0.91, - "learning_rate": 1.6294393723705302e-06, - "loss": 0.8232, - "step": 35675 - }, - { - "epoch": 0.91, - "learning_rate": 1.629417870814512e-06, - "loss": 0.9258, - "step": 35676 - }, - { - "epoch": 0.91, - "learning_rate": 1.6293963687765776e-06, - "loss": 1.0273, - "step": 35677 - }, - { - "epoch": 0.91, - "learning_rate": 1.629374866256743e-06, - "loss": 0.7314, - "step": 35678 - }, - { - "epoch": 0.91, - "learning_rate": 1.6293533632550252e-06, - "loss": 0.9473, - "step": 35679 - }, - { - "epoch": 0.91, - "learning_rate": 1.6293318597714402e-06, - "loss": 0.75, - "step": 35680 - }, - { - "epoch": 0.91, - "learning_rate": 1.629310355806005e-06, - "loss": 0.8159, - "step": 35681 - }, - { - "epoch": 0.91, - "learning_rate": 1.6292888513587357e-06, - "loss": 0.9355, - "step": 35682 - }, - { - "epoch": 0.91, - "learning_rate": 1.629267346429649e-06, - "loss": 0.875, - "step": 35683 - }, - { - "epoch": 0.91, - "learning_rate": 1.6292458410187613e-06, - "loss": 0.6841, - "step": 35684 - }, - { - "epoch": 0.91, - "learning_rate": 1.6292243351260888e-06, - "loss": 0.8672, - "step": 35685 - }, - { - "epoch": 0.91, - "learning_rate": 1.6292028287516482e-06, - "loss": 0.9131, - "step": 35686 - }, - { - "epoch": 0.91, - "learning_rate": 1.629181321895456e-06, - "loss": 0.8613, - "step": 35687 - }, - { - "epoch": 0.91, - "learning_rate": 1.6291598145575284e-06, - "loss": 0.9111, - "step": 35688 - }, - { - "epoch": 0.91, - "learning_rate": 1.6291383067378822e-06, - "loss": 1.0215, - "step": 35689 - }, - { - "epoch": 0.91, - "learning_rate": 1.6291167984365334e-06, - "loss": 0.7783, - "step": 35690 - }, - { - "epoch": 0.91, - "learning_rate": 1.6290952896534992e-06, - "loss": 0.9512, - "step": 35691 - }, - { - "epoch": 0.91, - "learning_rate": 1.6290737803887957e-06, - "loss": 0.9014, - "step": 35692 - }, - { - "epoch": 0.91, - "learning_rate": 1.6290522706424392e-06, - "loss": 0.8057, - "step": 35693 - }, - { - "epoch": 0.91, - "learning_rate": 1.6290307604144462e-06, - "loss": 0.4137, - "step": 35694 - }, - { - "epoch": 0.91, - "learning_rate": 1.6290092497048335e-06, - "loss": 0.7373, - "step": 35695 - }, - { - "epoch": 0.91, - "learning_rate": 1.6289877385136173e-06, - "loss": 0.8828, - "step": 35696 - }, - { - "epoch": 0.91, - "learning_rate": 1.628966226840814e-06, - "loss": 0.9238, - "step": 35697 - }, - { - "epoch": 0.91, - "learning_rate": 1.6289447146864401e-06, - "loss": 0.7656, - "step": 35698 - }, - { - "epoch": 0.91, - "learning_rate": 1.628923202050512e-06, - "loss": 0.7148, - "step": 35699 - }, - { - "epoch": 0.92, - "learning_rate": 1.628901688933047e-06, - "loss": 0.7354, - "step": 35700 - }, - { - "epoch": 0.92, - "learning_rate": 1.6288801753340602e-06, - "loss": 1.0088, - "step": 35701 - }, - { - "epoch": 0.92, - "learning_rate": 1.6288586612535691e-06, - "loss": 0.7734, - "step": 35702 - }, - { - "epoch": 0.92, - "learning_rate": 1.6288371466915897e-06, - "loss": 0.8252, - "step": 35703 - }, - { - "epoch": 0.92, - "learning_rate": 1.6288156316481386e-06, - "loss": 0.8594, - "step": 35704 - }, - { - "epoch": 0.92, - "learning_rate": 1.6287941161232323e-06, - "loss": 0.7485, - "step": 35705 - }, - { - "epoch": 0.92, - "learning_rate": 1.6287726001168875e-06, - "loss": 0.9912, - "step": 35706 - }, - { - "epoch": 0.92, - "learning_rate": 1.6287510836291203e-06, - "loss": 0.8037, - "step": 35707 - }, - { - "epoch": 0.92, - "learning_rate": 1.6287295666599472e-06, - "loss": 0.9121, - "step": 35708 - }, - { - "epoch": 0.92, - "learning_rate": 1.628708049209385e-06, - "loss": 0.748, - "step": 35709 - }, - { - "epoch": 0.92, - "learning_rate": 1.6286865312774496e-06, - "loss": 0.8809, - "step": 35710 - }, - { - "epoch": 0.92, - "learning_rate": 1.6286650128641582e-06, - "loss": 1.0234, - "step": 35711 - }, - { - "epoch": 0.92, - "learning_rate": 1.628643493969527e-06, - "loss": 0.7886, - "step": 35712 - }, - { - "epoch": 0.92, - "learning_rate": 1.628621974593572e-06, - "loss": 0.8291, - "step": 35713 - }, - { - "epoch": 0.92, - "learning_rate": 1.62860045473631e-06, - "loss": 0.71, - "step": 35714 - }, - { - "epoch": 0.92, - "learning_rate": 1.6285789343977576e-06, - "loss": 0.6509, - "step": 35715 - }, - { - "epoch": 0.92, - "learning_rate": 1.6285574135779316e-06, - "loss": 0.5269, - "step": 35716 - }, - { - "epoch": 0.92, - "learning_rate": 1.6285358922768478e-06, - "loss": 0.8633, - "step": 35717 - }, - { - "epoch": 0.92, - "learning_rate": 1.6285143704945228e-06, - "loss": 0.874, - "step": 35718 - }, - { - "epoch": 0.92, - "learning_rate": 1.6284928482309734e-06, - "loss": 0.8408, - "step": 35719 - }, - { - "epoch": 0.92, - "learning_rate": 1.628471325486216e-06, - "loss": 0.9482, - "step": 35720 - }, - { - "epoch": 0.92, - "learning_rate": 1.628449802260267e-06, - "loss": 0.8398, - "step": 35721 - }, - { - "epoch": 0.92, - "learning_rate": 1.6284282785531426e-06, - "loss": 0.7729, - "step": 35722 - }, - { - "epoch": 0.92, - "learning_rate": 1.62840675436486e-06, - "loss": 0.873, - "step": 35723 - }, - { - "epoch": 0.92, - "learning_rate": 1.628385229695435e-06, - "loss": 0.8311, - "step": 35724 - }, - { - "epoch": 0.92, - "learning_rate": 1.6283637045448844e-06, - "loss": 0.5376, - "step": 35725 - }, - { - "epoch": 0.92, - "learning_rate": 1.6283421789132246e-06, - "loss": 0.9277, - "step": 35726 - }, - { - "epoch": 0.92, - "learning_rate": 1.628320652800472e-06, - "loss": 0.8418, - "step": 35727 - }, - { - "epoch": 0.92, - "learning_rate": 1.6282991262066432e-06, - "loss": 0.7832, - "step": 35728 - }, - { - "epoch": 0.92, - "learning_rate": 1.6282775991317546e-06, - "loss": 0.7725, - "step": 35729 - }, - { - "epoch": 0.92, - "learning_rate": 1.6282560715758229e-06, - "loss": 0.9238, - "step": 35730 - }, - { - "epoch": 0.92, - "learning_rate": 1.6282345435388646e-06, - "loss": 1.0127, - "step": 35731 - }, - { - "epoch": 0.92, - "learning_rate": 1.6282130150208955e-06, - "loss": 0.8965, - "step": 35732 - }, - { - "epoch": 0.92, - "learning_rate": 1.6281914860219328e-06, - "loss": 0.7793, - "step": 35733 - }, - { - "epoch": 0.92, - "learning_rate": 1.6281699565419929e-06, - "loss": 0.8662, - "step": 35734 - }, - { - "epoch": 0.92, - "learning_rate": 1.6281484265810915e-06, - "loss": 0.5859, - "step": 35735 - }, - { - "epoch": 0.92, - "learning_rate": 1.6281268961392468e-06, - "loss": 0.9287, - "step": 35736 - }, - { - "epoch": 0.92, - "learning_rate": 1.6281053652164735e-06, - "loss": 1.1426, - "step": 35737 - }, - { - "epoch": 0.92, - "learning_rate": 1.628083833812789e-06, - "loss": 0.6318, - "step": 35738 - }, - { - "epoch": 0.92, - "learning_rate": 1.6280623019282093e-06, - "loss": 1.04, - "step": 35739 - }, - { - "epoch": 0.92, - "learning_rate": 1.6280407695627516e-06, - "loss": 1.0332, - "step": 35740 - }, - { - "epoch": 0.92, - "learning_rate": 1.628019236716432e-06, - "loss": 0.7007, - "step": 35741 - }, - { - "epoch": 0.92, - "learning_rate": 1.6279977033892664e-06, - "loss": 1.0459, - "step": 35742 - }, - { - "epoch": 0.92, - "learning_rate": 1.6279761695812723e-06, - "loss": 0.9111, - "step": 35743 - }, - { - "epoch": 0.92, - "learning_rate": 1.6279546352924656e-06, - "loss": 0.8086, - "step": 35744 - }, - { - "epoch": 0.92, - "learning_rate": 1.627933100522863e-06, - "loss": 0.7588, - "step": 35745 - }, - { - "epoch": 0.92, - "learning_rate": 1.6279115652724808e-06, - "loss": 0.9238, - "step": 35746 - }, - { - "epoch": 0.92, - "learning_rate": 1.6278900295413354e-06, - "loss": 0.9106, - "step": 35747 - }, - { - "epoch": 0.92, - "learning_rate": 1.6278684933294438e-06, - "loss": 0.7422, - "step": 35748 - }, - { - "epoch": 0.92, - "learning_rate": 1.627846956636822e-06, - "loss": 0.8623, - "step": 35749 - }, - { - "epoch": 0.92, - "learning_rate": 1.6278254194634866e-06, - "loss": 0.7607, - "step": 35750 - }, - { - "epoch": 0.92, - "learning_rate": 1.6278038818094544e-06, - "loss": 0.7417, - "step": 35751 - }, - { - "epoch": 0.92, - "learning_rate": 1.6277823436747413e-06, - "loss": 0.7363, - "step": 35752 - }, - { - "epoch": 0.92, - "learning_rate": 1.6277608050593642e-06, - "loss": 0.7383, - "step": 35753 - }, - { - "epoch": 0.92, - "learning_rate": 1.6277392659633398e-06, - "loss": 0.9395, - "step": 35754 - }, - { - "epoch": 0.92, - "learning_rate": 1.6277177263866841e-06, - "loss": 0.8916, - "step": 35755 - }, - { - "epoch": 0.92, - "learning_rate": 1.627696186329414e-06, - "loss": 0.7601, - "step": 35756 - }, - { - "epoch": 0.92, - "learning_rate": 1.6276746457915454e-06, - "loss": 1.0112, - "step": 35757 - }, - { - "epoch": 0.92, - "learning_rate": 1.6276531047730955e-06, - "loss": 0.9287, - "step": 35758 - }, - { - "epoch": 0.92, - "learning_rate": 1.6276315632740803e-06, - "loss": 0.8357, - "step": 35759 - }, - { - "epoch": 0.92, - "learning_rate": 1.6276100212945165e-06, - "loss": 0.7979, - "step": 35760 - }, - { - "epoch": 0.92, - "learning_rate": 1.6275884788344206e-06, - "loss": 0.9102, - "step": 35761 - }, - { - "epoch": 0.92, - "learning_rate": 1.6275669358938092e-06, - "loss": 0.6953, - "step": 35762 - }, - { - "epoch": 0.92, - "learning_rate": 1.6275453924726984e-06, - "loss": 0.8936, - "step": 35763 - }, - { - "epoch": 0.92, - "learning_rate": 1.627523848571105e-06, - "loss": 0.771, - "step": 35764 - }, - { - "epoch": 0.92, - "learning_rate": 1.6275023041890457e-06, - "loss": 1.001, - "step": 35765 - }, - { - "epoch": 0.92, - "learning_rate": 1.6274807593265366e-06, - "loss": 0.7688, - "step": 35766 - }, - { - "epoch": 0.92, - "learning_rate": 1.6274592139835942e-06, - "loss": 0.9922, - "step": 35767 - }, - { - "epoch": 0.92, - "learning_rate": 1.627437668160235e-06, - "loss": 0.9082, - "step": 35768 - }, - { - "epoch": 0.92, - "learning_rate": 1.6274161218564759e-06, - "loss": 0.9238, - "step": 35769 - }, - { - "epoch": 0.92, - "learning_rate": 1.627394575072333e-06, - "loss": 0.7021, - "step": 35770 - }, - { - "epoch": 0.92, - "learning_rate": 1.6273730278078231e-06, - "loss": 0.7725, - "step": 35771 - }, - { - "epoch": 0.92, - "learning_rate": 1.6273514800629623e-06, - "loss": 0.8491, - "step": 35772 - }, - { - "epoch": 0.92, - "learning_rate": 1.6273299318377676e-06, - "loss": 0.7261, - "step": 35773 - }, - { - "epoch": 0.92, - "learning_rate": 1.627308383132255e-06, - "loss": 0.8232, - "step": 35774 - }, - { - "epoch": 0.92, - "learning_rate": 1.6272868339464412e-06, - "loss": 0.897, - "step": 35775 - }, - { - "epoch": 0.92, - "learning_rate": 1.6272652842803426e-06, - "loss": 0.9209, - "step": 35776 - }, - { - "epoch": 0.92, - "learning_rate": 1.6272437341339762e-06, - "loss": 0.6318, - "step": 35777 - }, - { - "epoch": 0.92, - "learning_rate": 1.6272221835073579e-06, - "loss": 0.8735, - "step": 35778 - }, - { - "epoch": 0.92, - "learning_rate": 1.6272006324005045e-06, - "loss": 0.9678, - "step": 35779 - }, - { - "epoch": 0.92, - "learning_rate": 1.6271790808134322e-06, - "loss": 0.9912, - "step": 35780 - }, - { - "epoch": 0.92, - "learning_rate": 1.6271575287461578e-06, - "loss": 0.752, - "step": 35781 - }, - { - "epoch": 0.92, - "learning_rate": 1.6271359761986977e-06, - "loss": 0.9053, - "step": 35782 - }, - { - "epoch": 0.92, - "learning_rate": 1.6271144231710684e-06, - "loss": 0.6409, - "step": 35783 - }, - { - "epoch": 0.92, - "learning_rate": 1.6270928696632869e-06, - "loss": 0.835, - "step": 35784 - }, - { - "epoch": 0.92, - "learning_rate": 1.6270713156753687e-06, - "loss": 0.7461, - "step": 35785 - }, - { - "epoch": 0.92, - "learning_rate": 1.627049761207331e-06, - "loss": 1.0889, - "step": 35786 - }, - { - "epoch": 0.92, - "learning_rate": 1.6270282062591903e-06, - "loss": 0.6846, - "step": 35787 - }, - { - "epoch": 0.92, - "learning_rate": 1.6270066508309626e-06, - "loss": 0.6914, - "step": 35788 - }, - { - "epoch": 0.92, - "learning_rate": 1.6269850949226647e-06, - "loss": 0.7573, - "step": 35789 - }, - { - "epoch": 0.92, - "learning_rate": 1.6269635385343134e-06, - "loss": 0.9658, - "step": 35790 - }, - { - "epoch": 0.92, - "learning_rate": 1.626941981665925e-06, - "loss": 1.0049, - "step": 35791 - }, - { - "epoch": 0.92, - "learning_rate": 1.6269204243175154e-06, - "loss": 0.7939, - "step": 35792 - }, - { - "epoch": 0.92, - "learning_rate": 1.6268988664891024e-06, - "loss": 0.9277, - "step": 35793 - }, - { - "epoch": 0.92, - "learning_rate": 1.6268773081807012e-06, - "loss": 0.8057, - "step": 35794 - }, - { - "epoch": 0.92, - "learning_rate": 1.6268557493923289e-06, - "loss": 0.5688, - "step": 35795 - }, - { - "epoch": 0.92, - "learning_rate": 1.6268341901240024e-06, - "loss": 0.7695, - "step": 35796 - }, - { - "epoch": 0.92, - "learning_rate": 1.6268126303757374e-06, - "loss": 0.9619, - "step": 35797 - }, - { - "epoch": 0.92, - "learning_rate": 1.626791070147551e-06, - "loss": 0.9141, - "step": 35798 - }, - { - "epoch": 0.92, - "learning_rate": 1.6267695094394596e-06, - "loss": 0.9961, - "step": 35799 - }, - { - "epoch": 0.92, - "learning_rate": 1.6267479482514795e-06, - "loss": 0.5913, - "step": 35800 - }, - { - "epoch": 0.92, - "learning_rate": 1.6267263865836273e-06, - "loss": 0.8213, - "step": 35801 - }, - { - "epoch": 0.92, - "learning_rate": 1.6267048244359193e-06, - "loss": 0.8896, - "step": 35802 - }, - { - "epoch": 0.92, - "learning_rate": 1.6266832618083726e-06, - "loss": 0.8867, - "step": 35803 - }, - { - "epoch": 0.92, - "learning_rate": 1.6266616987010032e-06, - "loss": 0.7466, - "step": 35804 - }, - { - "epoch": 0.92, - "learning_rate": 1.6266401351138275e-06, - "loss": 0.697, - "step": 35805 - }, - { - "epoch": 0.92, - "learning_rate": 1.6266185710468627e-06, - "loss": 0.8066, - "step": 35806 - }, - { - "epoch": 0.92, - "learning_rate": 1.6265970065001246e-06, - "loss": 0.9961, - "step": 35807 - }, - { - "epoch": 0.92, - "learning_rate": 1.6265754414736299e-06, - "loss": 0.7246, - "step": 35808 - }, - { - "epoch": 0.92, - "learning_rate": 1.6265538759673954e-06, - "loss": 0.8994, - "step": 35809 - }, - { - "epoch": 0.92, - "learning_rate": 1.6265323099814372e-06, - "loss": 0.8887, - "step": 35810 - }, - { - "epoch": 0.92, - "learning_rate": 1.626510743515772e-06, - "loss": 0.6855, - "step": 35811 - }, - { - "epoch": 0.92, - "learning_rate": 1.6264891765704167e-06, - "loss": 0.9805, - "step": 35812 - }, - { - "epoch": 0.92, - "learning_rate": 1.6264676091453872e-06, - "loss": 0.9199, - "step": 35813 - }, - { - "epoch": 0.92, - "learning_rate": 1.6264460412407001e-06, - "loss": 0.8965, - "step": 35814 - }, - { - "epoch": 0.92, - "learning_rate": 1.6264244728563724e-06, - "loss": 0.7905, - "step": 35815 - }, - { - "epoch": 0.92, - "learning_rate": 1.6264029039924203e-06, - "loss": 0.7461, - "step": 35816 - }, - { - "epoch": 0.92, - "learning_rate": 1.62638133464886e-06, - "loss": 0.9014, - "step": 35817 - }, - { - "epoch": 0.92, - "learning_rate": 1.6263597648257084e-06, - "loss": 0.5918, - "step": 35818 - }, - { - "epoch": 0.92, - "learning_rate": 1.6263381945229821e-06, - "loss": 0.877, - "step": 35819 - }, - { - "epoch": 0.92, - "learning_rate": 1.6263166237406973e-06, - "loss": 0.8018, - "step": 35820 - }, - { - "epoch": 0.92, - "learning_rate": 1.6262950524788708e-06, - "loss": 0.7278, - "step": 35821 - }, - { - "epoch": 0.92, - "learning_rate": 1.626273480737519e-06, - "loss": 0.9316, - "step": 35822 - }, - { - "epoch": 0.92, - "learning_rate": 1.6262519085166582e-06, - "loss": 0.7974, - "step": 35823 - }, - { - "epoch": 0.92, - "learning_rate": 1.626230335816305e-06, - "loss": 0.71, - "step": 35824 - }, - { - "epoch": 0.92, - "learning_rate": 1.6262087626364762e-06, - "loss": 0.6541, - "step": 35825 - }, - { - "epoch": 0.92, - "learning_rate": 1.6261871889771883e-06, - "loss": 0.792, - "step": 35826 - }, - { - "epoch": 0.92, - "learning_rate": 1.6261656148384574e-06, - "loss": 0.6631, - "step": 35827 - }, - { - "epoch": 0.92, - "learning_rate": 1.6261440402203004e-06, - "loss": 0.7686, - "step": 35828 - }, - { - "epoch": 0.92, - "learning_rate": 1.6261224651227336e-06, - "loss": 0.915, - "step": 35829 - }, - { - "epoch": 0.92, - "learning_rate": 1.6261008895457735e-06, - "loss": 0.7896, - "step": 35830 - }, - { - "epoch": 0.92, - "learning_rate": 1.6260793134894372e-06, - "loss": 0.7163, - "step": 35831 - }, - { - "epoch": 0.92, - "learning_rate": 1.6260577369537404e-06, - "loss": 0.833, - "step": 35832 - }, - { - "epoch": 0.92, - "learning_rate": 1.6260361599387e-06, - "loss": 0.791, - "step": 35833 - }, - { - "epoch": 0.92, - "learning_rate": 1.6260145824443327e-06, - "loss": 0.9277, - "step": 35834 - }, - { - "epoch": 0.92, - "learning_rate": 1.6259930044706547e-06, - "loss": 0.75, - "step": 35835 - }, - { - "epoch": 0.92, - "learning_rate": 1.6259714260176827e-06, - "loss": 0.8379, - "step": 35836 - }, - { - "epoch": 0.92, - "learning_rate": 1.6259498470854329e-06, - "loss": 0.8179, - "step": 35837 - }, - { - "epoch": 0.92, - "learning_rate": 1.6259282676739224e-06, - "loss": 0.6426, - "step": 35838 - }, - { - "epoch": 0.92, - "learning_rate": 1.625906687783167e-06, - "loss": 0.6636, - "step": 35839 - }, - { - "epoch": 0.92, - "learning_rate": 1.6258851074131838e-06, - "loss": 0.96, - "step": 35840 - }, - { - "epoch": 0.92, - "learning_rate": 1.6258635265639895e-06, - "loss": 0.96, - "step": 35841 - }, - { - "epoch": 0.92, - "learning_rate": 1.6258419452356003e-06, - "loss": 0.8145, - "step": 35842 - }, - { - "epoch": 0.92, - "learning_rate": 1.625820363428032e-06, - "loss": 0.8174, - "step": 35843 - }, - { - "epoch": 0.92, - "learning_rate": 1.6257987811413023e-06, - "loss": 0.3842, - "step": 35844 - }, - { - "epoch": 0.92, - "learning_rate": 1.6257771983754273e-06, - "loss": 0.7256, - "step": 35845 - }, - { - "epoch": 0.92, - "learning_rate": 1.6257556151304238e-06, - "loss": 0.7969, - "step": 35846 - }, - { - "epoch": 0.92, - "learning_rate": 1.6257340314063074e-06, - "loss": 0.7661, - "step": 35847 - }, - { - "epoch": 0.92, - "learning_rate": 1.6257124472030953e-06, - "loss": 0.9023, - "step": 35848 - }, - { - "epoch": 0.92, - "learning_rate": 1.6256908625208042e-06, - "loss": 0.5884, - "step": 35849 - }, - { - "epoch": 0.92, - "learning_rate": 1.62566927735945e-06, - "loss": 0.959, - "step": 35850 - }, - { - "epoch": 0.92, - "learning_rate": 1.6256476917190501e-06, - "loss": 0.7642, - "step": 35851 - }, - { - "epoch": 0.92, - "learning_rate": 1.62562610559962e-06, - "loss": 0.8213, - "step": 35852 - }, - { - "epoch": 0.92, - "learning_rate": 1.625604519001177e-06, - "loss": 0.6338, - "step": 35853 - }, - { - "epoch": 0.92, - "learning_rate": 1.6255829319237375e-06, - "loss": 0.8193, - "step": 35854 - }, - { - "epoch": 0.92, - "learning_rate": 1.6255613443673176e-06, - "loss": 0.6411, - "step": 35855 - }, - { - "epoch": 0.92, - "learning_rate": 1.6255397563319346e-06, - "loss": 0.792, - "step": 35856 - }, - { - "epoch": 0.92, - "learning_rate": 1.6255181678176041e-06, - "loss": 0.8252, - "step": 35857 - }, - { - "epoch": 0.92, - "learning_rate": 1.6254965788243435e-06, - "loss": 0.8223, - "step": 35858 - }, - { - "epoch": 0.92, - "learning_rate": 1.625474989352169e-06, - "loss": 0.8672, - "step": 35859 - }, - { - "epoch": 0.92, - "learning_rate": 1.6254533994010966e-06, - "loss": 0.7061, - "step": 35860 - }, - { - "epoch": 0.92, - "learning_rate": 1.6254318089711437e-06, - "loss": 0.9258, - "step": 35861 - }, - { - "epoch": 0.92, - "learning_rate": 1.625410218062326e-06, - "loss": 0.793, - "step": 35862 - }, - { - "epoch": 0.92, - "learning_rate": 1.6253886266746609e-06, - "loss": 0.8623, - "step": 35863 - }, - { - "epoch": 0.92, - "learning_rate": 1.625367034808164e-06, - "loss": 0.8662, - "step": 35864 - }, - { - "epoch": 0.92, - "learning_rate": 1.6253454424628527e-06, - "loss": 0.7969, - "step": 35865 - }, - { - "epoch": 0.92, - "learning_rate": 1.6253238496387432e-06, - "loss": 0.7803, - "step": 35866 - }, - { - "epoch": 0.92, - "learning_rate": 1.6253022563358518e-06, - "loss": 0.8638, - "step": 35867 - }, - { - "epoch": 0.92, - "learning_rate": 1.625280662554195e-06, - "loss": 0.875, - "step": 35868 - }, - { - "epoch": 0.92, - "learning_rate": 1.6252590682937899e-06, - "loss": 0.5085, - "step": 35869 - }, - { - "epoch": 0.92, - "learning_rate": 1.6252374735546526e-06, - "loss": 0.877, - "step": 35870 - }, - { - "epoch": 0.92, - "learning_rate": 1.6252158783368e-06, - "loss": 0.7744, - "step": 35871 - }, - { - "epoch": 0.92, - "learning_rate": 1.6251942826402478e-06, - "loss": 0.6128, - "step": 35872 - }, - { - "epoch": 0.92, - "learning_rate": 1.6251726864650132e-06, - "loss": 0.8467, - "step": 35873 - }, - { - "epoch": 0.92, - "learning_rate": 1.6251510898111129e-06, - "loss": 0.6753, - "step": 35874 - }, - { - "epoch": 0.92, - "learning_rate": 1.6251294926785631e-06, - "loss": 0.6992, - "step": 35875 - }, - { - "epoch": 0.92, - "learning_rate": 1.6251078950673803e-06, - "loss": 0.9277, - "step": 35876 - }, - { - "epoch": 0.92, - "learning_rate": 1.6250862969775812e-06, - "loss": 0.9111, - "step": 35877 - }, - { - "epoch": 0.92, - "learning_rate": 1.625064698409182e-06, - "loss": 0.793, - "step": 35878 - }, - { - "epoch": 0.92, - "learning_rate": 1.6250430993621996e-06, - "loss": 0.8574, - "step": 35879 - }, - { - "epoch": 0.92, - "learning_rate": 1.6250214998366505e-06, - "loss": 0.8545, - "step": 35880 - }, - { - "epoch": 0.92, - "learning_rate": 1.6249998998325513e-06, - "loss": 0.8252, - "step": 35881 - }, - { - "epoch": 0.92, - "learning_rate": 1.624978299349918e-06, - "loss": 0.7783, - "step": 35882 - }, - { - "epoch": 0.92, - "learning_rate": 1.6249566983887682e-06, - "loss": 0.7827, - "step": 35883 - }, - { - "epoch": 0.92, - "learning_rate": 1.6249350969491173e-06, - "loss": 0.9238, - "step": 35884 - }, - { - "epoch": 0.92, - "learning_rate": 1.6249134950309826e-06, - "loss": 0.8159, - "step": 35885 - }, - { - "epoch": 0.92, - "learning_rate": 1.6248918926343804e-06, - "loss": 0.9229, - "step": 35886 - }, - { - "epoch": 0.92, - "learning_rate": 1.624870289759327e-06, - "loss": 0.8447, - "step": 35887 - }, - { - "epoch": 0.92, - "learning_rate": 1.6248486864058392e-06, - "loss": 0.7998, - "step": 35888 - }, - { - "epoch": 0.92, - "learning_rate": 1.6248270825739335e-06, - "loss": 0.958, - "step": 35889 - }, - { - "epoch": 0.92, - "learning_rate": 1.6248054782636268e-06, - "loss": 0.8037, - "step": 35890 - }, - { - "epoch": 0.92, - "learning_rate": 1.6247838734749347e-06, - "loss": 0.8477, - "step": 35891 - }, - { - "epoch": 0.92, - "learning_rate": 1.6247622682078746e-06, - "loss": 0.8887, - "step": 35892 - }, - { - "epoch": 0.92, - "learning_rate": 1.6247406624624626e-06, - "loss": 0.8867, - "step": 35893 - }, - { - "epoch": 0.92, - "learning_rate": 1.6247190562387155e-06, - "loss": 0.8047, - "step": 35894 - }, - { - "epoch": 0.92, - "learning_rate": 1.6246974495366498e-06, - "loss": 0.7056, - "step": 35895 - }, - { - "epoch": 0.92, - "learning_rate": 1.6246758423562819e-06, - "loss": 0.6155, - "step": 35896 - }, - { - "epoch": 0.92, - "learning_rate": 1.6246542346976285e-06, - "loss": 0.8682, - "step": 35897 - }, - { - "epoch": 0.92, - "learning_rate": 1.624632626560706e-06, - "loss": 1.0293, - "step": 35898 - }, - { - "epoch": 0.92, - "learning_rate": 1.624611017945531e-06, - "loss": 0.7607, - "step": 35899 - }, - { - "epoch": 0.92, - "learning_rate": 1.6245894088521202e-06, - "loss": 0.8545, - "step": 35900 - }, - { - "epoch": 0.92, - "learning_rate": 1.6245677992804897e-06, - "loss": 0.8984, - "step": 35901 - }, - { - "epoch": 0.92, - "learning_rate": 1.6245461892306566e-06, - "loss": 0.8438, - "step": 35902 - }, - { - "epoch": 0.92, - "learning_rate": 1.6245245787026374e-06, - "loss": 0.7959, - "step": 35903 - }, - { - "epoch": 0.92, - "learning_rate": 1.6245029676964482e-06, - "loss": 0.9766, - "step": 35904 - }, - { - "epoch": 0.92, - "learning_rate": 1.6244813562121057e-06, - "loss": 0.876, - "step": 35905 - }, - { - "epoch": 0.92, - "learning_rate": 1.6244597442496267e-06, - "loss": 0.9307, - "step": 35906 - }, - { - "epoch": 0.92, - "learning_rate": 1.6244381318090276e-06, - "loss": 0.5574, - "step": 35907 - }, - { - "epoch": 0.92, - "learning_rate": 1.6244165188903249e-06, - "loss": 0.916, - "step": 35908 - }, - { - "epoch": 0.92, - "learning_rate": 1.624394905493535e-06, - "loss": 0.7061, - "step": 35909 - }, - { - "epoch": 0.92, - "learning_rate": 1.624373291618675e-06, - "loss": 0.98, - "step": 35910 - }, - { - "epoch": 0.92, - "learning_rate": 1.6243516772657608e-06, - "loss": 0.9551, - "step": 35911 - }, - { - "epoch": 0.92, - "learning_rate": 1.6243300624348094e-06, - "loss": 0.7532, - "step": 35912 - }, - { - "epoch": 0.92, - "learning_rate": 1.6243084471258368e-06, - "loss": 0.6694, - "step": 35913 - }, - { - "epoch": 0.92, - "learning_rate": 1.6242868313388604e-06, - "loss": 0.9258, - "step": 35914 - }, - { - "epoch": 0.92, - "learning_rate": 1.6242652150738962e-06, - "loss": 0.3662, - "step": 35915 - }, - { - "epoch": 0.92, - "learning_rate": 1.6242435983309606e-06, - "loss": 0.7405, - "step": 35916 - }, - { - "epoch": 0.92, - "learning_rate": 1.6242219811100705e-06, - "loss": 0.751, - "step": 35917 - }, - { - "epoch": 0.92, - "learning_rate": 1.6242003634112425e-06, - "loss": 0.8496, - "step": 35918 - }, - { - "epoch": 0.92, - "learning_rate": 1.6241787452344927e-06, - "loss": 0.6826, - "step": 35919 - }, - { - "epoch": 0.92, - "learning_rate": 1.6241571265798378e-06, - "loss": 0.7412, - "step": 35920 - }, - { - "epoch": 0.92, - "learning_rate": 1.624135507447295e-06, - "loss": 0.4719, - "step": 35921 - }, - { - "epoch": 0.92, - "learning_rate": 1.6241138878368801e-06, - "loss": 0.7598, - "step": 35922 - }, - { - "epoch": 0.92, - "learning_rate": 1.6240922677486099e-06, - "loss": 0.8438, - "step": 35923 - }, - { - "epoch": 0.92, - "learning_rate": 1.624070647182501e-06, - "loss": 0.7114, - "step": 35924 - }, - { - "epoch": 0.92, - "learning_rate": 1.6240490261385697e-06, - "loss": 0.876, - "step": 35925 - }, - { - "epoch": 0.92, - "learning_rate": 1.624027404616833e-06, - "loss": 0.9785, - "step": 35926 - }, - { - "epoch": 0.92, - "learning_rate": 1.6240057826173069e-06, - "loss": 0.6162, - "step": 35927 - }, - { - "epoch": 0.92, - "learning_rate": 1.6239841601400084e-06, - "loss": 0.7671, - "step": 35928 - }, - { - "epoch": 0.92, - "learning_rate": 1.6239625371849539e-06, - "loss": 0.9648, - "step": 35929 - }, - { - "epoch": 0.92, - "learning_rate": 1.6239409137521603e-06, - "loss": 0.7871, - "step": 35930 - }, - { - "epoch": 0.92, - "learning_rate": 1.6239192898416437e-06, - "loss": 0.8477, - "step": 35931 - }, - { - "epoch": 0.92, - "learning_rate": 1.6238976654534207e-06, - "loss": 0.9424, - "step": 35932 - }, - { - "epoch": 0.92, - "learning_rate": 1.6238760405875077e-06, - "loss": 0.8916, - "step": 35933 - }, - { - "epoch": 0.92, - "learning_rate": 1.6238544152439217e-06, - "loss": 0.8999, - "step": 35934 - }, - { - "epoch": 0.92, - "learning_rate": 1.6238327894226792e-06, - "loss": 0.7153, - "step": 35935 - }, - { - "epoch": 0.92, - "learning_rate": 1.6238111631237966e-06, - "loss": 1.0645, - "step": 35936 - }, - { - "epoch": 0.92, - "learning_rate": 1.6237895363472903e-06, - "loss": 0.6816, - "step": 35937 - }, - { - "epoch": 0.92, - "learning_rate": 1.623767909093177e-06, - "loss": 0.9619, - "step": 35938 - }, - { - "epoch": 0.92, - "learning_rate": 1.6237462813614733e-06, - "loss": 0.834, - "step": 35939 - }, - { - "epoch": 0.92, - "learning_rate": 1.623724653152196e-06, - "loss": 0.7617, - "step": 35940 - }, - { - "epoch": 0.92, - "learning_rate": 1.6237030244653614e-06, - "loss": 0.8438, - "step": 35941 - }, - { - "epoch": 0.92, - "learning_rate": 1.6236813953009857e-06, - "loss": 0.79, - "step": 35942 - }, - { - "epoch": 0.92, - "learning_rate": 1.6236597656590861e-06, - "loss": 0.9453, - "step": 35943 - }, - { - "epoch": 0.92, - "learning_rate": 1.623638135539679e-06, - "loss": 0.709, - "step": 35944 - }, - { - "epoch": 0.92, - "learning_rate": 1.6236165049427807e-06, - "loss": 0.8281, - "step": 35945 - }, - { - "epoch": 0.92, - "learning_rate": 1.623594873868408e-06, - "loss": 0.8489, - "step": 35946 - }, - { - "epoch": 0.92, - "learning_rate": 1.6235732423165774e-06, - "loss": 1.0283, - "step": 35947 - }, - { - "epoch": 0.92, - "learning_rate": 1.6235516102873051e-06, - "loss": 0.96, - "step": 35948 - }, - { - "epoch": 0.92, - "learning_rate": 1.6235299777806084e-06, - "loss": 0.5596, - "step": 35949 - }, - { - "epoch": 0.92, - "learning_rate": 1.6235083447965034e-06, - "loss": 0.917, - "step": 35950 - }, - { - "epoch": 0.92, - "learning_rate": 1.6234867113350066e-06, - "loss": 0.6865, - "step": 35951 - }, - { - "epoch": 0.92, - "learning_rate": 1.6234650773961347e-06, - "loss": 0.7715, - "step": 35952 - }, - { - "epoch": 0.92, - "learning_rate": 1.6234434429799043e-06, - "loss": 0.562, - "step": 35953 - }, - { - "epoch": 0.92, - "learning_rate": 1.623421808086332e-06, - "loss": 0.8574, - "step": 35954 - }, - { - "epoch": 0.92, - "learning_rate": 1.623400172715434e-06, - "loss": 0.772, - "step": 35955 - }, - { - "epoch": 0.92, - "learning_rate": 1.6233785368672278e-06, - "loss": 0.8516, - "step": 35956 - }, - { - "epoch": 0.92, - "learning_rate": 1.6233569005417285e-06, - "loss": 0.8516, - "step": 35957 - }, - { - "epoch": 0.92, - "learning_rate": 1.623335263738954e-06, - "loss": 0.9561, - "step": 35958 - }, - { - "epoch": 0.92, - "learning_rate": 1.6233136264589202e-06, - "loss": 0.8008, - "step": 35959 - }, - { - "epoch": 0.92, - "learning_rate": 1.6232919887016441e-06, - "loss": 0.8179, - "step": 35960 - }, - { - "epoch": 0.92, - "learning_rate": 1.6232703504671416e-06, - "loss": 0.8203, - "step": 35961 - }, - { - "epoch": 0.92, - "learning_rate": 1.6232487117554297e-06, - "loss": 0.8037, - "step": 35962 - }, - { - "epoch": 0.92, - "learning_rate": 1.623227072566525e-06, - "loss": 0.8389, - "step": 35963 - }, - { - "epoch": 0.92, - "learning_rate": 1.6232054329004439e-06, - "loss": 0.8779, - "step": 35964 - }, - { - "epoch": 0.92, - "learning_rate": 1.6231837927572032e-06, - "loss": 0.8076, - "step": 35965 - }, - { - "epoch": 0.92, - "learning_rate": 1.6231621521368192e-06, - "loss": 0.6655, - "step": 35966 - }, - { - "epoch": 0.92, - "learning_rate": 1.6231405110393087e-06, - "loss": 0.8594, - "step": 35967 - }, - { - "epoch": 0.92, - "learning_rate": 1.6231188694646881e-06, - "loss": 0.8457, - "step": 35968 - }, - { - "epoch": 0.92, - "learning_rate": 1.6230972274129743e-06, - "loss": 0.8066, - "step": 35969 - }, - { - "epoch": 0.92, - "learning_rate": 1.6230755848841833e-06, - "loss": 0.7324, - "step": 35970 - }, - { - "epoch": 0.92, - "learning_rate": 1.6230539418783317e-06, - "loss": 0.686, - "step": 35971 - }, - { - "epoch": 0.92, - "learning_rate": 1.6230322983954367e-06, - "loss": 0.7676, - "step": 35972 - }, - { - "epoch": 0.92, - "learning_rate": 1.6230106544355143e-06, - "loss": 0.8076, - "step": 35973 - }, - { - "epoch": 0.92, - "learning_rate": 1.6229890099985818e-06, - "loss": 0.7295, - "step": 35974 - }, - { - "epoch": 0.92, - "learning_rate": 1.6229673650846549e-06, - "loss": 0.957, - "step": 35975 - }, - { - "epoch": 0.92, - "learning_rate": 1.6229457196937508e-06, - "loss": 1.0547, - "step": 35976 - }, - { - "epoch": 0.92, - "learning_rate": 1.6229240738258856e-06, - "loss": 0.6523, - "step": 35977 - }, - { - "epoch": 0.92, - "learning_rate": 1.622902427481076e-06, - "loss": 0.874, - "step": 35978 - }, - { - "epoch": 0.92, - "learning_rate": 1.6228807806593386e-06, - "loss": 0.9336, - "step": 35979 - }, - { - "epoch": 0.92, - "learning_rate": 1.6228591333606902e-06, - "loss": 0.7549, - "step": 35980 - }, - { - "epoch": 0.92, - "learning_rate": 1.6228374855851472e-06, - "loss": 0.9668, - "step": 35981 - }, - { - "epoch": 0.92, - "learning_rate": 1.622815837332726e-06, - "loss": 0.9678, - "step": 35982 - }, - { - "epoch": 0.92, - "learning_rate": 1.6227941886034435e-06, - "loss": 0.9287, - "step": 35983 - }, - { - "epoch": 0.92, - "learning_rate": 1.622772539397316e-06, - "loss": 0.875, - "step": 35984 - }, - { - "epoch": 0.92, - "learning_rate": 1.6227508897143605e-06, - "loss": 0.4636, - "step": 35985 - }, - { - "epoch": 0.92, - "learning_rate": 1.6227292395545931e-06, - "loss": 0.5842, - "step": 35986 - }, - { - "epoch": 0.92, - "learning_rate": 1.6227075889180303e-06, - "loss": 0.6948, - "step": 35987 - }, - { - "epoch": 0.92, - "learning_rate": 1.6226859378046894e-06, - "loss": 0.7881, - "step": 35988 - }, - { - "epoch": 0.92, - "learning_rate": 1.622664286214586e-06, - "loss": 0.9004, - "step": 35989 - }, - { - "epoch": 0.92, - "learning_rate": 1.6226426341477378e-06, - "loss": 0.9707, - "step": 35990 - }, - { - "epoch": 0.92, - "learning_rate": 1.6226209816041604e-06, - "loss": 0.8809, - "step": 35991 - }, - { - "epoch": 0.92, - "learning_rate": 1.6225993285838706e-06, - "loss": 0.6445, - "step": 35992 - }, - { - "epoch": 0.92, - "learning_rate": 1.6225776750868852e-06, - "loss": 0.6782, - "step": 35993 - }, - { - "epoch": 0.92, - "learning_rate": 1.6225560211132207e-06, - "loss": 0.8838, - "step": 35994 - }, - { - "epoch": 0.92, - "learning_rate": 1.6225343666628942e-06, - "loss": 0.7773, - "step": 35995 - }, - { - "epoch": 0.92, - "learning_rate": 1.6225127117359213e-06, - "loss": 1.0215, - "step": 35996 - }, - { - "epoch": 0.92, - "learning_rate": 1.6224910563323189e-06, - "loss": 1.0391, - "step": 35997 - }, - { - "epoch": 0.92, - "learning_rate": 1.622469400452104e-06, - "loss": 0.8142, - "step": 35998 - }, - { - "epoch": 0.92, - "learning_rate": 1.6224477440952926e-06, - "loss": 0.8682, - "step": 35999 - }, - { - "epoch": 0.92, - "learning_rate": 1.622426087261902e-06, - "loss": 1.1377, - "step": 36000 - }, - { - "epoch": 0.92, - "learning_rate": 1.6224044299519481e-06, - "loss": 0.9082, - "step": 36001 - }, - { - "epoch": 0.92, - "learning_rate": 1.6223827721654477e-06, - "loss": 0.7227, - "step": 36002 - }, - { - "epoch": 0.92, - "learning_rate": 1.6223611139024175e-06, - "loss": 0.834, - "step": 36003 - }, - { - "epoch": 0.92, - "learning_rate": 1.6223394551628743e-06, - "loss": 0.9082, - "step": 36004 - }, - { - "epoch": 0.92, - "learning_rate": 1.622317795946834e-06, - "loss": 0.8115, - "step": 36005 - }, - { - "epoch": 0.92, - "learning_rate": 1.6222961362543137e-06, - "loss": 0.6672, - "step": 36006 - }, - { - "epoch": 0.92, - "learning_rate": 1.6222744760853297e-06, - "loss": 0.8789, - "step": 36007 - }, - { - "epoch": 0.92, - "learning_rate": 1.622252815439899e-06, - "loss": 0.7617, - "step": 36008 - }, - { - "epoch": 0.92, - "learning_rate": 1.6222311543180378e-06, - "loss": 0.9961, - "step": 36009 - }, - { - "epoch": 0.92, - "learning_rate": 1.6222094927197629e-06, - "loss": 0.9805, - "step": 36010 - }, - { - "epoch": 0.92, - "learning_rate": 1.6221878306450908e-06, - "loss": 0.876, - "step": 36011 - }, - { - "epoch": 0.92, - "learning_rate": 1.6221661680940382e-06, - "loss": 0.6919, - "step": 36012 - }, - { - "epoch": 0.92, - "learning_rate": 1.6221445050666213e-06, - "loss": 0.8901, - "step": 36013 - }, - { - "epoch": 0.92, - "learning_rate": 1.6221228415628573e-06, - "loss": 0.7651, - "step": 36014 - }, - { - "epoch": 0.92, - "learning_rate": 1.622101177582762e-06, - "loss": 0.8262, - "step": 36015 - }, - { - "epoch": 0.92, - "learning_rate": 1.6220795131263528e-06, - "loss": 0.6797, - "step": 36016 - }, - { - "epoch": 0.92, - "learning_rate": 1.6220578481936458e-06, - "loss": 0.6616, - "step": 36017 - }, - { - "epoch": 0.92, - "learning_rate": 1.6220361827846575e-06, - "loss": 0.7373, - "step": 36018 - }, - { - "epoch": 0.92, - "learning_rate": 1.6220145168994048e-06, - "loss": 0.6484, - "step": 36019 - }, - { - "epoch": 0.92, - "learning_rate": 1.6219928505379047e-06, - "loss": 0.7229, - "step": 36020 - }, - { - "epoch": 0.92, - "learning_rate": 1.6219711837001725e-06, - "loss": 0.7456, - "step": 36021 - }, - { - "epoch": 0.92, - "learning_rate": 1.621949516386226e-06, - "loss": 0.9297, - "step": 36022 - }, - { - "epoch": 0.92, - "learning_rate": 1.6219278485960813e-06, - "loss": 0.8027, - "step": 36023 - }, - { - "epoch": 0.92, - "learning_rate": 1.6219061803297549e-06, - "loss": 0.522, - "step": 36024 - }, - { - "epoch": 0.92, - "learning_rate": 1.6218845115872637e-06, - "loss": 0.7083, - "step": 36025 - }, - { - "epoch": 0.92, - "learning_rate": 1.6218628423686243e-06, - "loss": 0.6572, - "step": 36026 - }, - { - "epoch": 0.92, - "learning_rate": 1.6218411726738528e-06, - "loss": 0.8218, - "step": 36027 - }, - { - "epoch": 0.92, - "learning_rate": 1.6218195025029661e-06, - "loss": 0.7678, - "step": 36028 - }, - { - "epoch": 0.92, - "learning_rate": 1.621797831855981e-06, - "loss": 0.8447, - "step": 36029 - }, - { - "epoch": 0.92, - "learning_rate": 1.6217761607329137e-06, - "loss": 1.0107, - "step": 36030 - }, - { - "epoch": 0.92, - "learning_rate": 1.621754489133781e-06, - "loss": 0.8271, - "step": 36031 - }, - { - "epoch": 0.92, - "learning_rate": 1.6217328170585997e-06, - "loss": 0.5933, - "step": 36032 - }, - { - "epoch": 0.92, - "learning_rate": 1.621711144507386e-06, - "loss": 0.9287, - "step": 36033 - }, - { - "epoch": 0.92, - "learning_rate": 1.6216894714801566e-06, - "loss": 1.0537, - "step": 36034 - }, - { - "epoch": 0.92, - "learning_rate": 1.6216677979769282e-06, - "loss": 0.8784, - "step": 36035 - }, - { - "epoch": 0.92, - "learning_rate": 1.6216461239977176e-06, - "loss": 1.0469, - "step": 36036 - }, - { - "epoch": 0.92, - "learning_rate": 1.6216244495425406e-06, - "loss": 0.6504, - "step": 36037 - }, - { - "epoch": 0.92, - "learning_rate": 1.6216027746114146e-06, - "loss": 0.9912, - "step": 36038 - }, - { - "epoch": 0.92, - "learning_rate": 1.6215810992043562e-06, - "loss": 0.9688, - "step": 36039 - }, - { - "epoch": 0.92, - "learning_rate": 1.6215594233213816e-06, - "loss": 0.7178, - "step": 36040 - }, - { - "epoch": 0.92, - "learning_rate": 1.6215377469625072e-06, - "loss": 0.7861, - "step": 36041 - }, - { - "epoch": 0.92, - "learning_rate": 1.6215160701277505e-06, - "loss": 0.7578, - "step": 36042 - }, - { - "epoch": 0.92, - "learning_rate": 1.621494392817127e-06, - "loss": 0.9668, - "step": 36043 - }, - { - "epoch": 0.92, - "learning_rate": 1.621472715030654e-06, - "loss": 1.001, - "step": 36044 - }, - { - "epoch": 0.92, - "learning_rate": 1.6214510367683484e-06, - "loss": 1.0264, - "step": 36045 - }, - { - "epoch": 0.92, - "learning_rate": 1.6214293580302256e-06, - "loss": 0.8076, - "step": 36046 - }, - { - "epoch": 0.92, - "learning_rate": 1.6214076788163032e-06, - "loss": 0.7764, - "step": 36047 - }, - { - "epoch": 0.92, - "learning_rate": 1.6213859991265975e-06, - "loss": 0.7451, - "step": 36048 - }, - { - "epoch": 0.92, - "learning_rate": 1.6213643189611253e-06, - "loss": 0.9678, - "step": 36049 - }, - { - "epoch": 0.92, - "learning_rate": 1.6213426383199029e-06, - "loss": 0.8135, - "step": 36050 - }, - { - "epoch": 0.92, - "learning_rate": 1.621320957202947e-06, - "loss": 0.8906, - "step": 36051 - }, - { - "epoch": 0.92, - "learning_rate": 1.621299275610274e-06, - "loss": 0.9111, - "step": 36052 - }, - { - "epoch": 0.92, - "learning_rate": 1.6212775935419007e-06, - "loss": 1.0537, - "step": 36053 - }, - { - "epoch": 0.92, - "learning_rate": 1.6212559109978438e-06, - "loss": 0.8271, - "step": 36054 - }, - { - "epoch": 0.92, - "learning_rate": 1.6212342279781202e-06, - "loss": 0.646, - "step": 36055 - }, - { - "epoch": 0.92, - "learning_rate": 1.621212544482746e-06, - "loss": 0.8789, - "step": 36056 - }, - { - "epoch": 0.92, - "learning_rate": 1.6211908605117374e-06, - "loss": 0.8965, - "step": 36057 - }, - { - "epoch": 0.92, - "learning_rate": 1.6211691760651119e-06, - "loss": 0.9619, - "step": 36058 - }, - { - "epoch": 0.92, - "learning_rate": 1.6211474911428856e-06, - "loss": 1.1113, - "step": 36059 - }, - { - "epoch": 0.92, - "learning_rate": 1.6211258057450753e-06, - "loss": 0.6841, - "step": 36060 - }, - { - "epoch": 0.92, - "learning_rate": 1.6211041198716977e-06, - "loss": 0.9062, - "step": 36061 - }, - { - "epoch": 0.92, - "learning_rate": 1.621082433522769e-06, - "loss": 0.7319, - "step": 36062 - }, - { - "epoch": 0.92, - "learning_rate": 1.6210607466983062e-06, - "loss": 0.7466, - "step": 36063 - }, - { - "epoch": 0.92, - "learning_rate": 1.6210390593983254e-06, - "loss": 1.0303, - "step": 36064 - }, - { - "epoch": 0.92, - "learning_rate": 1.6210173716228441e-06, - "loss": 0.8867, - "step": 36065 - }, - { - "epoch": 0.92, - "learning_rate": 1.6209956833718779e-06, - "loss": 0.959, - "step": 36066 - }, - { - "epoch": 0.92, - "learning_rate": 1.620973994645444e-06, - "loss": 0.6753, - "step": 36067 - }, - { - "epoch": 0.92, - "learning_rate": 1.6209523054435587e-06, - "loss": 0.8828, - "step": 36068 - }, - { - "epoch": 0.92, - "learning_rate": 1.620930615766239e-06, - "loss": 0.584, - "step": 36069 - }, - { - "epoch": 0.92, - "learning_rate": 1.6209089256135014e-06, - "loss": 0.8887, - "step": 36070 - }, - { - "epoch": 0.92, - "learning_rate": 1.6208872349853622e-06, - "loss": 0.7344, - "step": 36071 - }, - { - "epoch": 0.92, - "learning_rate": 1.6208655438818382e-06, - "loss": 0.6177, - "step": 36072 - }, - { - "epoch": 0.92, - "learning_rate": 1.620843852302946e-06, - "loss": 0.7388, - "step": 36073 - }, - { - "epoch": 0.92, - "learning_rate": 1.6208221602487021e-06, - "loss": 0.9121, - "step": 36074 - }, - { - "epoch": 0.92, - "learning_rate": 1.6208004677191237e-06, - "loss": 0.7397, - "step": 36075 - }, - { - "epoch": 0.92, - "learning_rate": 1.6207787747142265e-06, - "loss": 0.8193, - "step": 36076 - }, - { - "epoch": 0.92, - "learning_rate": 1.6207570812340274e-06, - "loss": 0.7666, - "step": 36077 - }, - { - "epoch": 0.92, - "learning_rate": 1.6207353872785433e-06, - "loss": 0.5269, - "step": 36078 - }, - { - "epoch": 0.92, - "learning_rate": 1.620713692847791e-06, - "loss": 0.853, - "step": 36079 - }, - { - "epoch": 0.92, - "learning_rate": 1.6206919979417864e-06, - "loss": 0.7305, - "step": 36080 - }, - { - "epoch": 0.92, - "learning_rate": 1.6206703025605463e-06, - "loss": 0.9004, - "step": 36081 - }, - { - "epoch": 0.92, - "learning_rate": 1.6206486067040878e-06, - "loss": 0.9316, - "step": 36082 - }, - { - "epoch": 0.92, - "learning_rate": 1.6206269103724272e-06, - "loss": 0.8975, - "step": 36083 - }, - { - "epoch": 0.92, - "learning_rate": 1.620605213565581e-06, - "loss": 0.71, - "step": 36084 - }, - { - "epoch": 0.92, - "learning_rate": 1.620583516283566e-06, - "loss": 0.9717, - "step": 36085 - }, - { - "epoch": 0.92, - "learning_rate": 1.6205618185263988e-06, - "loss": 0.7188, - "step": 36086 - }, - { - "epoch": 0.92, - "learning_rate": 1.6205401202940958e-06, - "loss": 0.6924, - "step": 36087 - }, - { - "epoch": 0.92, - "learning_rate": 1.6205184215866737e-06, - "loss": 0.8896, - "step": 36088 - }, - { - "epoch": 0.92, - "learning_rate": 1.6204967224041494e-06, - "loss": 0.8145, - "step": 36089 - }, - { - "epoch": 0.93, - "learning_rate": 1.620475022746539e-06, - "loss": 0.8896, - "step": 36090 - }, - { - "epoch": 0.93, - "learning_rate": 1.6204533226138599e-06, - "loss": 0.7554, - "step": 36091 - }, - { - "epoch": 0.93, - "learning_rate": 1.6204316220061278e-06, - "loss": 1.0381, - "step": 36092 - }, - { - "epoch": 0.93, - "learning_rate": 1.6204099209233597e-06, - "loss": 0.7832, - "step": 36093 - }, - { - "epoch": 0.93, - "learning_rate": 1.6203882193655726e-06, - "loss": 1.0586, - "step": 36094 - }, - { - "epoch": 0.93, - "learning_rate": 1.6203665173327825e-06, - "loss": 0.8105, - "step": 36095 - }, - { - "epoch": 0.93, - "learning_rate": 1.6203448148250064e-06, - "loss": 0.7578, - "step": 36096 - }, - { - "epoch": 0.93, - "learning_rate": 1.6203231118422606e-06, - "loss": 0.6323, - "step": 36097 - }, - { - "epoch": 0.93, - "learning_rate": 1.620301408384562e-06, - "loss": 0.8896, - "step": 36098 - }, - { - "epoch": 0.93, - "learning_rate": 1.6202797044519275e-06, - "loss": 0.9102, - "step": 36099 - }, - { - "epoch": 0.93, - "learning_rate": 1.6202580000443732e-06, - "loss": 0.8057, - "step": 36100 - }, - { - "epoch": 0.93, - "learning_rate": 1.6202362951619154e-06, - "loss": 0.9707, - "step": 36101 - }, - { - "epoch": 0.93, - "learning_rate": 1.6202145898045717e-06, - "loss": 0.8594, - "step": 36102 - }, - { - "epoch": 0.93, - "learning_rate": 1.6201928839723577e-06, - "loss": 0.6189, - "step": 36103 - }, - { - "epoch": 0.93, - "learning_rate": 1.620171177665291e-06, - "loss": 0.8379, - "step": 36104 - }, - { - "epoch": 0.93, - "learning_rate": 1.6201494708833879e-06, - "loss": 1.0322, - "step": 36105 - }, - { - "epoch": 0.93, - "learning_rate": 1.6201277636266642e-06, - "loss": 0.8457, - "step": 36106 - }, - { - "epoch": 0.93, - "learning_rate": 1.6201060558951376e-06, - "loss": 0.9512, - "step": 36107 - }, - { - "epoch": 0.93, - "learning_rate": 1.6200843476888242e-06, - "loss": 1.0449, - "step": 36108 - }, - { - "epoch": 0.93, - "learning_rate": 1.6200626390077407e-06, - "loss": 1.0049, - "step": 36109 - }, - { - "epoch": 0.93, - "learning_rate": 1.6200409298519039e-06, - "loss": 0.8711, - "step": 36110 - }, - { - "epoch": 0.93, - "learning_rate": 1.6200192202213303e-06, - "loss": 0.752, - "step": 36111 - }, - { - "epoch": 0.93, - "learning_rate": 1.6199975101160363e-06, - "loss": 0.8657, - "step": 36112 - }, - { - "epoch": 0.93, - "learning_rate": 1.6199757995360388e-06, - "loss": 0.9092, - "step": 36113 - }, - { - "epoch": 0.93, - "learning_rate": 1.6199540884813543e-06, - "loss": 0.8457, - "step": 36114 - }, - { - "epoch": 0.93, - "learning_rate": 1.6199323769519997e-06, - "loss": 0.9141, - "step": 36115 - }, - { - "epoch": 0.93, - "learning_rate": 1.6199106649479913e-06, - "loss": 0.9844, - "step": 36116 - }, - { - "epoch": 0.93, - "learning_rate": 1.6198889524693455e-06, - "loss": 0.999, - "step": 36117 - }, - { - "epoch": 0.93, - "learning_rate": 1.6198672395160796e-06, - "loss": 0.8652, - "step": 36118 - }, - { - "epoch": 0.93, - "learning_rate": 1.6198455260882095e-06, - "loss": 0.7026, - "step": 36119 - }, - { - "epoch": 0.93, - "learning_rate": 1.6198238121857523e-06, - "loss": 0.8306, - "step": 36120 - }, - { - "epoch": 0.93, - "learning_rate": 1.6198020978087246e-06, - "loss": 0.7119, - "step": 36121 - }, - { - "epoch": 0.93, - "learning_rate": 1.619780382957143e-06, - "loss": 0.8887, - "step": 36122 - }, - { - "epoch": 0.93, - "learning_rate": 1.6197586676310237e-06, - "loss": 1.1035, - "step": 36123 - }, - { - "epoch": 0.93, - "learning_rate": 1.6197369518303841e-06, - "loss": 0.7285, - "step": 36124 - }, - { - "epoch": 0.93, - "learning_rate": 1.6197152355552403e-06, - "loss": 1.1201, - "step": 36125 - }, - { - "epoch": 0.93, - "learning_rate": 1.619693518805609e-06, - "loss": 0.8301, - "step": 36126 - }, - { - "epoch": 0.93, - "learning_rate": 1.6196718015815068e-06, - "loss": 0.8311, - "step": 36127 - }, - { - "epoch": 0.93, - "learning_rate": 1.6196500838829503e-06, - "loss": 0.6008, - "step": 36128 - }, - { - "epoch": 0.93, - "learning_rate": 1.6196283657099565e-06, - "loss": 0.8721, - "step": 36129 - }, - { - "epoch": 0.93, - "learning_rate": 1.6196066470625417e-06, - "loss": 0.7427, - "step": 36130 - }, - { - "epoch": 0.93, - "learning_rate": 1.6195849279407226e-06, - "loss": 0.7266, - "step": 36131 - }, - { - "epoch": 0.93, - "learning_rate": 1.6195632083445157e-06, - "loss": 0.8701, - "step": 36132 - }, - { - "epoch": 0.93, - "learning_rate": 1.6195414882739375e-06, - "loss": 0.8906, - "step": 36133 - }, - { - "epoch": 0.93, - "learning_rate": 1.6195197677290052e-06, - "loss": 0.9629, - "step": 36134 - }, - { - "epoch": 0.93, - "learning_rate": 1.6194980467097353e-06, - "loss": 0.8213, - "step": 36135 - }, - { - "epoch": 0.93, - "learning_rate": 1.6194763252161439e-06, - "loss": 0.8774, - "step": 36136 - }, - { - "epoch": 0.93, - "learning_rate": 1.6194546032482479e-06, - "loss": 0.8672, - "step": 36137 - }, - { - "epoch": 0.93, - "learning_rate": 1.6194328808060642e-06, - "loss": 0.9336, - "step": 36138 - }, - { - "epoch": 0.93, - "learning_rate": 1.619411157889609e-06, - "loss": 0.9375, - "step": 36139 - }, - { - "epoch": 0.93, - "learning_rate": 1.6193894344988993e-06, - "loss": 0.752, - "step": 36140 - }, - { - "epoch": 0.93, - "learning_rate": 1.6193677106339515e-06, - "loss": 0.7871, - "step": 36141 - }, - { - "epoch": 0.93, - "learning_rate": 1.6193459862947828e-06, - "loss": 0.8672, - "step": 36142 - }, - { - "epoch": 0.93, - "learning_rate": 1.6193242614814088e-06, - "loss": 0.7891, - "step": 36143 - }, - { - "epoch": 0.93, - "learning_rate": 1.6193025361938469e-06, - "loss": 0.8398, - "step": 36144 - }, - { - "epoch": 0.93, - "learning_rate": 1.6192808104321136e-06, - "loss": 0.6797, - "step": 36145 - }, - { - "epoch": 0.93, - "learning_rate": 1.619259084196225e-06, - "loss": 0.8818, - "step": 36146 - }, - { - "epoch": 0.93, - "learning_rate": 1.6192373574861988e-06, - "loss": 0.7966, - "step": 36147 - }, - { - "epoch": 0.93, - "learning_rate": 1.6192156303020507e-06, - "loss": 0.918, - "step": 36148 - }, - { - "epoch": 0.93, - "learning_rate": 1.6191939026437978e-06, - "loss": 0.7119, - "step": 36149 - }, - { - "epoch": 0.93, - "learning_rate": 1.6191721745114567e-06, - "loss": 0.6406, - "step": 36150 - }, - { - "epoch": 0.93, - "learning_rate": 1.6191504459050435e-06, - "loss": 0.793, - "step": 36151 - }, - { - "epoch": 0.93, - "learning_rate": 1.6191287168245754e-06, - "loss": 0.8604, - "step": 36152 - }, - { - "epoch": 0.93, - "learning_rate": 1.6191069872700692e-06, - "loss": 0.9697, - "step": 36153 - }, - { - "epoch": 0.93, - "learning_rate": 1.619085257241541e-06, - "loss": 0.6533, - "step": 36154 - }, - { - "epoch": 0.93, - "learning_rate": 1.619063526739008e-06, - "loss": 0.8359, - "step": 36155 - }, - { - "epoch": 0.93, - "learning_rate": 1.6190417957624863e-06, - "loss": 0.686, - "step": 36156 - }, - { - "epoch": 0.93, - "learning_rate": 1.6190200643119927e-06, - "loss": 0.7314, - "step": 36157 - }, - { - "epoch": 0.93, - "learning_rate": 1.618998332387544e-06, - "loss": 0.8359, - "step": 36158 - }, - { - "epoch": 0.93, - "learning_rate": 1.6189765999891564e-06, - "loss": 0.9033, - "step": 36159 - }, - { - "epoch": 0.93, - "learning_rate": 1.6189548671168475e-06, - "loss": 0.8413, - "step": 36160 - }, - { - "epoch": 0.93, - "learning_rate": 1.618933133770633e-06, - "loss": 0.8223, - "step": 36161 - }, - { - "epoch": 0.93, - "learning_rate": 1.6189113999505298e-06, - "loss": 0.7627, - "step": 36162 - }, - { - "epoch": 0.93, - "learning_rate": 1.6188896656565547e-06, - "loss": 0.7324, - "step": 36163 - }, - { - "epoch": 0.93, - "learning_rate": 1.6188679308887241e-06, - "loss": 0.9434, - "step": 36164 - }, - { - "epoch": 0.93, - "learning_rate": 1.6188461956470549e-06, - "loss": 0.7422, - "step": 36165 - }, - { - "epoch": 0.93, - "learning_rate": 1.6188244599315638e-06, - "loss": 0.7627, - "step": 36166 - }, - { - "epoch": 0.93, - "learning_rate": 1.618802723742267e-06, - "loss": 0.9932, - "step": 36167 - }, - { - "epoch": 0.93, - "learning_rate": 1.6187809870791815e-06, - "loss": 0.8086, - "step": 36168 - }, - { - "epoch": 0.93, - "learning_rate": 1.6187592499423237e-06, - "loss": 0.7295, - "step": 36169 - }, - { - "epoch": 0.93, - "learning_rate": 1.6187375123317106e-06, - "loss": 0.7559, - "step": 36170 - }, - { - "epoch": 0.93, - "learning_rate": 1.6187157742473585e-06, - "loss": 0.8584, - "step": 36171 - }, - { - "epoch": 0.93, - "learning_rate": 1.6186940356892844e-06, - "loss": 1.0635, - "step": 36172 - }, - { - "epoch": 0.93, - "learning_rate": 1.6186722966575044e-06, - "loss": 0.7949, - "step": 36173 - }, - { - "epoch": 0.93, - "learning_rate": 1.6186505571520356e-06, - "loss": 0.9141, - "step": 36174 - }, - { - "epoch": 0.93, - "learning_rate": 1.6186288171728948e-06, - "loss": 0.96, - "step": 36175 - }, - { - "epoch": 0.93, - "learning_rate": 1.6186070767200982e-06, - "loss": 0.546, - "step": 36176 - }, - { - "epoch": 0.93, - "learning_rate": 1.6185853357936624e-06, - "loss": 0.6758, - "step": 36177 - }, - { - "epoch": 0.93, - "learning_rate": 1.6185635943936043e-06, - "loss": 0.9443, - "step": 36178 - }, - { - "epoch": 0.93, - "learning_rate": 1.6185418525199404e-06, - "loss": 0.7969, - "step": 36179 - }, - { - "epoch": 0.93, - "learning_rate": 1.618520110172688e-06, - "loss": 0.7375, - "step": 36180 - }, - { - "epoch": 0.93, - "learning_rate": 1.6184983673518627e-06, - "loss": 0.9453, - "step": 36181 - }, - { - "epoch": 0.93, - "learning_rate": 1.6184766240574817e-06, - "loss": 0.9492, - "step": 36182 - }, - { - "epoch": 0.93, - "learning_rate": 1.6184548802895615e-06, - "loss": 0.8105, - "step": 36183 - }, - { - "epoch": 0.93, - "learning_rate": 1.618433136048119e-06, - "loss": 0.9932, - "step": 36184 - }, - { - "epoch": 0.93, - "learning_rate": 1.6184113913331706e-06, - "loss": 0.5708, - "step": 36185 - }, - { - "epoch": 0.93, - "learning_rate": 1.6183896461447333e-06, - "loss": 0.8906, - "step": 36186 - }, - { - "epoch": 0.93, - "learning_rate": 1.618367900482823e-06, - "loss": 0.9902, - "step": 36187 - }, - { - "epoch": 0.93, - "learning_rate": 1.6183461543474573e-06, - "loss": 0.8096, - "step": 36188 - }, - { - "epoch": 0.93, - "learning_rate": 1.618324407738652e-06, - "loss": 0.6846, - "step": 36189 - }, - { - "epoch": 0.93, - "learning_rate": 1.6183026606564244e-06, - "loss": 0.8359, - "step": 36190 - }, - { - "epoch": 0.93, - "learning_rate": 1.618280913100791e-06, - "loss": 0.9072, - "step": 36191 - }, - { - "epoch": 0.93, - "learning_rate": 1.6182591650717679e-06, - "loss": 0.5708, - "step": 36192 - }, - { - "epoch": 0.93, - "learning_rate": 1.6182374165693724e-06, - "loss": 0.6807, - "step": 36193 - }, - { - "epoch": 0.93, - "learning_rate": 1.618215667593621e-06, - "loss": 0.6753, - "step": 36194 - }, - { - "epoch": 0.93, - "learning_rate": 1.6181939181445303e-06, - "loss": 0.8779, - "step": 36195 - }, - { - "epoch": 0.93, - "learning_rate": 1.6181721682221167e-06, - "loss": 0.7441, - "step": 36196 - }, - { - "epoch": 0.93, - "learning_rate": 1.6181504178263974e-06, - "loss": 0.833, - "step": 36197 - }, - { - "epoch": 0.93, - "learning_rate": 1.6181286669573887e-06, - "loss": 0.8027, - "step": 36198 - }, - { - "epoch": 0.93, - "learning_rate": 1.6181069156151073e-06, - "loss": 0.9863, - "step": 36199 - }, - { - "epoch": 0.93, - "learning_rate": 1.6180851637995695e-06, - "loss": 0.8296, - "step": 36200 - }, - { - "epoch": 0.93, - "learning_rate": 1.6180634115107928e-06, - "loss": 1.0049, - "step": 36201 - }, - { - "epoch": 0.93, - "learning_rate": 1.6180416587487931e-06, - "loss": 0.8345, - "step": 36202 - }, - { - "epoch": 0.93, - "learning_rate": 1.6180199055135875e-06, - "loss": 0.7656, - "step": 36203 - }, - { - "epoch": 0.93, - "learning_rate": 1.6179981518051925e-06, - "loss": 0.876, - "step": 36204 - }, - { - "epoch": 0.93, - "learning_rate": 1.6179763976236242e-06, - "loss": 0.7173, - "step": 36205 - }, - { - "epoch": 0.93, - "learning_rate": 1.6179546429689005e-06, - "loss": 0.7598, - "step": 36206 - }, - { - "epoch": 0.93, - "learning_rate": 1.6179328878410368e-06, - "loss": 0.7495, - "step": 36207 - }, - { - "epoch": 0.93, - "learning_rate": 1.6179111322400506e-06, - "loss": 0.5125, - "step": 36208 - }, - { - "epoch": 0.93, - "learning_rate": 1.6178893761659583e-06, - "loss": 0.8428, - "step": 36209 - }, - { - "epoch": 0.93, - "learning_rate": 1.6178676196187762e-06, - "loss": 0.9209, - "step": 36210 - }, - { - "epoch": 0.93, - "learning_rate": 1.6178458625985214e-06, - "loss": 0.8291, - "step": 36211 - }, - { - "epoch": 0.93, - "learning_rate": 1.6178241051052107e-06, - "loss": 0.6836, - "step": 36212 - }, - { - "epoch": 0.93, - "learning_rate": 1.6178023471388602e-06, - "loss": 0.7969, - "step": 36213 - }, - { - "epoch": 0.93, - "learning_rate": 1.617780588699487e-06, - "loss": 0.7129, - "step": 36214 - }, - { - "epoch": 0.93, - "learning_rate": 1.6177588297871077e-06, - "loss": 0.8076, - "step": 36215 - }, - { - "epoch": 0.93, - "learning_rate": 1.6177370704017386e-06, - "loss": 0.915, - "step": 36216 - }, - { - "epoch": 0.93, - "learning_rate": 1.6177153105433967e-06, - "loss": 0.8594, - "step": 36217 - }, - { - "epoch": 0.93, - "learning_rate": 1.6176935502120986e-06, - "loss": 0.7969, - "step": 36218 - }, - { - "epoch": 0.93, - "learning_rate": 1.617671789407861e-06, - "loss": 0.9248, - "step": 36219 - }, - { - "epoch": 0.93, - "learning_rate": 1.6176500281307006e-06, - "loss": 0.9297, - "step": 36220 - }, - { - "epoch": 0.93, - "learning_rate": 1.6176282663806338e-06, - "loss": 0.79, - "step": 36221 - }, - { - "epoch": 0.93, - "learning_rate": 1.6176065041576776e-06, - "loss": 0.8525, - "step": 36222 - }, - { - "epoch": 0.93, - "learning_rate": 1.617584741461848e-06, - "loss": 0.792, - "step": 36223 - }, - { - "epoch": 0.93, - "learning_rate": 1.6175629782931631e-06, - "loss": 0.9316, - "step": 36224 - }, - { - "epoch": 0.93, - "learning_rate": 1.6175412146516379e-06, - "loss": 0.8457, - "step": 36225 - }, - { - "epoch": 0.93, - "learning_rate": 1.61751945053729e-06, - "loss": 0.9746, - "step": 36226 - }, - { - "epoch": 0.93, - "learning_rate": 1.6174976859501359e-06, - "loss": 0.916, - "step": 36227 - }, - { - "epoch": 0.93, - "learning_rate": 1.6174759208901921e-06, - "loss": 0.9238, - "step": 36228 - }, - { - "epoch": 0.93, - "learning_rate": 1.6174541553574756e-06, - "loss": 0.8262, - "step": 36229 - }, - { - "epoch": 0.93, - "learning_rate": 1.6174323893520026e-06, - "loss": 0.8428, - "step": 36230 - }, - { - "epoch": 0.93, - "learning_rate": 1.6174106228737898e-06, - "loss": 0.7373, - "step": 36231 - }, - { - "epoch": 0.93, - "learning_rate": 1.6173888559228543e-06, - "loss": 0.8418, - "step": 36232 - }, - { - "epoch": 0.93, - "learning_rate": 1.6173670884992129e-06, - "loss": 1.0127, - "step": 36233 - }, - { - "epoch": 0.93, - "learning_rate": 1.6173453206028814e-06, - "loss": 0.6846, - "step": 36234 - }, - { - "epoch": 0.93, - "learning_rate": 1.6173235522338773e-06, - "loss": 0.6431, - "step": 36235 - }, - { - "epoch": 0.93, - "learning_rate": 1.6173017833922167e-06, - "loss": 1.1553, - "step": 36236 - }, - { - "epoch": 0.93, - "learning_rate": 1.6172800140779167e-06, - "loss": 0.9248, - "step": 36237 - }, - { - "epoch": 0.93, - "learning_rate": 1.6172582442909936e-06, - "loss": 0.6699, - "step": 36238 - }, - { - "epoch": 0.93, - "learning_rate": 1.6172364740314646e-06, - "loss": 0.594, - "step": 36239 - }, - { - "epoch": 0.93, - "learning_rate": 1.6172147032993457e-06, - "loss": 0.6385, - "step": 36240 - }, - { - "epoch": 0.93, - "learning_rate": 1.617192932094654e-06, - "loss": 0.9443, - "step": 36241 - }, - { - "epoch": 0.93, - "learning_rate": 1.617171160417406e-06, - "loss": 0.7417, - "step": 36242 - }, - { - "epoch": 0.93, - "learning_rate": 1.6171493882676183e-06, - "loss": 0.8955, - "step": 36243 - }, - { - "epoch": 0.93, - "learning_rate": 1.6171276156453079e-06, - "loss": 0.9307, - "step": 36244 - }, - { - "epoch": 0.93, - "learning_rate": 1.6171058425504911e-06, - "loss": 0.9473, - "step": 36245 - }, - { - "epoch": 0.93, - "learning_rate": 1.6170840689831848e-06, - "loss": 0.8701, - "step": 36246 - }, - { - "epoch": 0.93, - "learning_rate": 1.6170622949434056e-06, - "loss": 0.9277, - "step": 36247 - }, - { - "epoch": 0.93, - "learning_rate": 1.6170405204311704e-06, - "loss": 0.7627, - "step": 36248 - }, - { - "epoch": 0.93, - "learning_rate": 1.6170187454464955e-06, - "loss": 0.8633, - "step": 36249 - }, - { - "epoch": 0.93, - "learning_rate": 1.6169969699893974e-06, - "loss": 0.7759, - "step": 36250 - }, - { - "epoch": 0.93, - "learning_rate": 1.6169751940598934e-06, - "loss": 0.7354, - "step": 36251 - }, - { - "epoch": 0.93, - "learning_rate": 1.6169534176579998e-06, - "loss": 0.9258, - "step": 36252 - }, - { - "epoch": 0.93, - "learning_rate": 1.6169316407837333e-06, - "loss": 0.7549, - "step": 36253 - }, - { - "epoch": 0.93, - "learning_rate": 1.6169098634371107e-06, - "loss": 0.9185, - "step": 36254 - }, - { - "epoch": 0.93, - "learning_rate": 1.6168880856181483e-06, - "loss": 0.9111, - "step": 36255 - }, - { - "epoch": 0.93, - "learning_rate": 1.6168663073268634e-06, - "loss": 0.7178, - "step": 36256 - }, - { - "epoch": 0.93, - "learning_rate": 1.6168445285632721e-06, - "loss": 0.7793, - "step": 36257 - }, - { - "epoch": 0.93, - "learning_rate": 1.6168227493273915e-06, - "loss": 1.0547, - "step": 36258 - }, - { - "epoch": 0.93, - "learning_rate": 1.6168009696192382e-06, - "loss": 0.9746, - "step": 36259 - }, - { - "epoch": 0.93, - "learning_rate": 1.6167791894388284e-06, - "loss": 0.7627, - "step": 36260 - }, - { - "epoch": 0.93, - "learning_rate": 1.6167574087861793e-06, - "loss": 0.752, - "step": 36261 - }, - { - "epoch": 0.93, - "learning_rate": 1.6167356276613075e-06, - "loss": 0.6592, - "step": 36262 - }, - { - "epoch": 0.93, - "learning_rate": 1.6167138460642296e-06, - "loss": 0.6948, - "step": 36263 - }, - { - "epoch": 0.93, - "learning_rate": 1.6166920639949622e-06, - "loss": 0.6924, - "step": 36264 - }, - { - "epoch": 0.93, - "learning_rate": 1.6166702814535218e-06, - "loss": 0.8076, - "step": 36265 - }, - { - "epoch": 0.93, - "learning_rate": 1.6166484984399255e-06, - "loss": 0.8877, - "step": 36266 - }, - { - "epoch": 0.93, - "learning_rate": 1.6166267149541899e-06, - "loss": 0.8555, - "step": 36267 - }, - { - "epoch": 0.93, - "learning_rate": 1.6166049309963314e-06, - "loss": 0.5864, - "step": 36268 - }, - { - "epoch": 0.93, - "learning_rate": 1.6165831465663673e-06, - "loss": 0.6846, - "step": 36269 - }, - { - "epoch": 0.93, - "learning_rate": 1.6165613616643134e-06, - "loss": 0.5808, - "step": 36270 - }, - { - "epoch": 0.93, - "learning_rate": 1.616539576290187e-06, - "loss": 1.0488, - "step": 36271 - }, - { - "epoch": 0.93, - "learning_rate": 1.6165177904440044e-06, - "loss": 0.9189, - "step": 36272 - }, - { - "epoch": 0.93, - "learning_rate": 1.6164960041257825e-06, - "loss": 1.0635, - "step": 36273 - }, - { - "epoch": 0.93, - "learning_rate": 1.6164742173355382e-06, - "loss": 0.8135, - "step": 36274 - }, - { - "epoch": 0.93, - "learning_rate": 1.6164524300732878e-06, - "loss": 0.8975, - "step": 36275 - }, - { - "epoch": 0.93, - "learning_rate": 1.6164306423390479e-06, - "loss": 0.835, - "step": 36276 - }, - { - "epoch": 0.93, - "learning_rate": 1.6164088541328358e-06, - "loss": 0.9072, - "step": 36277 - }, - { - "epoch": 0.93, - "learning_rate": 1.6163870654546675e-06, - "loss": 0.834, - "step": 36278 - }, - { - "epoch": 0.93, - "learning_rate": 1.6163652763045601e-06, - "loss": 0.7007, - "step": 36279 - }, - { - "epoch": 0.93, - "learning_rate": 1.61634348668253e-06, - "loss": 0.9268, - "step": 36280 - }, - { - "epoch": 0.93, - "learning_rate": 1.616321696588594e-06, - "loss": 0.8174, - "step": 36281 - }, - { - "epoch": 0.93, - "learning_rate": 1.616299906022769e-06, - "loss": 0.6924, - "step": 36282 - }, - { - "epoch": 0.93, - "learning_rate": 1.6162781149850715e-06, - "loss": 0.9102, - "step": 36283 - }, - { - "epoch": 0.93, - "learning_rate": 1.6162563234755183e-06, - "loss": 0.9375, - "step": 36284 - }, - { - "epoch": 0.93, - "learning_rate": 1.6162345314941257e-06, - "loss": 0.877, - "step": 36285 - }, - { - "epoch": 0.93, - "learning_rate": 1.6162127390409107e-06, - "loss": 0.8164, - "step": 36286 - }, - { - "epoch": 0.93, - "learning_rate": 1.61619094611589e-06, - "loss": 0.8022, - "step": 36287 - }, - { - "epoch": 0.93, - "learning_rate": 1.6161691527190801e-06, - "loss": 0.7148, - "step": 36288 - }, - { - "epoch": 0.93, - "learning_rate": 1.616147358850498e-06, - "loss": 0.9189, - "step": 36289 - }, - { - "epoch": 0.93, - "learning_rate": 1.6161255645101602e-06, - "loss": 0.9512, - "step": 36290 - }, - { - "epoch": 0.93, - "learning_rate": 1.6161037696980834e-06, - "loss": 0.791, - "step": 36291 - }, - { - "epoch": 0.93, - "learning_rate": 1.6160819744142841e-06, - "loss": 0.5991, - "step": 36292 - }, - { - "epoch": 0.93, - "learning_rate": 1.6160601786587793e-06, - "loss": 0.6641, - "step": 36293 - }, - { - "epoch": 0.93, - "learning_rate": 1.6160383824315855e-06, - "loss": 0.5469, - "step": 36294 - }, - { - "epoch": 0.93, - "learning_rate": 1.6160165857327195e-06, - "loss": 0.5046, - "step": 36295 - }, - { - "epoch": 0.93, - "learning_rate": 1.6159947885621978e-06, - "loss": 0.7725, - "step": 36296 - }, - { - "epoch": 0.93, - "learning_rate": 1.6159729909200372e-06, - "loss": 0.8599, - "step": 36297 - }, - { - "epoch": 0.93, - "learning_rate": 1.6159511928062545e-06, - "loss": 0.8242, - "step": 36298 - }, - { - "epoch": 0.93, - "learning_rate": 1.6159293942208666e-06, - "loss": 0.918, - "step": 36299 - }, - { - "epoch": 0.93, - "learning_rate": 1.6159075951638894e-06, - "loss": 0.9131, - "step": 36300 - }, - { - "epoch": 0.93, - "learning_rate": 1.6158857956353402e-06, - "loss": 1.0127, - "step": 36301 - }, - { - "epoch": 0.93, - "learning_rate": 1.6158639956352355e-06, - "loss": 0.917, - "step": 36302 - }, - { - "epoch": 0.93, - "learning_rate": 1.615842195163592e-06, - "loss": 0.5266, - "step": 36303 - }, - { - "epoch": 0.93, - "learning_rate": 1.615820394220427e-06, - "loss": 0.6777, - "step": 36304 - }, - { - "epoch": 0.93, - "learning_rate": 1.6157985928057562e-06, - "loss": 0.8418, - "step": 36305 - }, - { - "epoch": 0.93, - "learning_rate": 1.6157767909195967e-06, - "loss": 0.751, - "step": 36306 - }, - { - "epoch": 0.93, - "learning_rate": 1.6157549885619653e-06, - "loss": 0.793, - "step": 36307 - }, - { - "epoch": 0.93, - "learning_rate": 1.6157331857328784e-06, - "loss": 0.8154, - "step": 36308 - }, - { - "epoch": 0.93, - "learning_rate": 1.6157113824323534e-06, - "loss": 0.9004, - "step": 36309 - }, - { - "epoch": 0.93, - "learning_rate": 1.6156895786604063e-06, - "loss": 0.9111, - "step": 36310 - }, - { - "epoch": 0.93, - "learning_rate": 1.6156677744170537e-06, - "loss": 0.6958, - "step": 36311 - }, - { - "epoch": 0.93, - "learning_rate": 1.6156459697023127e-06, - "loss": 0.9229, - "step": 36312 - }, - { - "epoch": 0.93, - "learning_rate": 1.6156241645162001e-06, - "loss": 0.9014, - "step": 36313 - }, - { - "epoch": 0.93, - "learning_rate": 1.6156023588587325e-06, - "loss": 0.8311, - "step": 36314 - }, - { - "epoch": 0.93, - "learning_rate": 1.6155805527299262e-06, - "loss": 0.8672, - "step": 36315 - }, - { - "epoch": 0.93, - "learning_rate": 1.6155587461297984e-06, - "loss": 0.6958, - "step": 36316 - }, - { - "epoch": 0.93, - "learning_rate": 1.6155369390583653e-06, - "loss": 0.897, - "step": 36317 - }, - { - "epoch": 0.93, - "learning_rate": 1.615515131515644e-06, - "loss": 0.7812, - "step": 36318 - }, - { - "epoch": 0.93, - "learning_rate": 1.6154933235016513e-06, - "loss": 0.999, - "step": 36319 - }, - { - "epoch": 0.93, - "learning_rate": 1.6154715150164034e-06, - "loss": 0.7578, - "step": 36320 - }, - { - "epoch": 0.93, - "learning_rate": 1.6154497060599173e-06, - "loss": 0.8975, - "step": 36321 - }, - { - "epoch": 0.93, - "learning_rate": 1.6154278966322097e-06, - "loss": 0.8721, - "step": 36322 - }, - { - "epoch": 0.93, - "learning_rate": 1.615406086733297e-06, - "loss": 0.7627, - "step": 36323 - }, - { - "epoch": 0.93, - "learning_rate": 1.6153842763631965e-06, - "loss": 0.9248, - "step": 36324 - }, - { - "epoch": 0.93, - "learning_rate": 1.6153624655219243e-06, - "loss": 0.603, - "step": 36325 - }, - { - "epoch": 0.93, - "learning_rate": 1.6153406542094974e-06, - "loss": 0.873, - "step": 36326 - }, - { - "epoch": 0.93, - "learning_rate": 1.6153188424259328e-06, - "loss": 0.7842, - "step": 36327 - }, - { - "epoch": 0.93, - "learning_rate": 1.6152970301712466e-06, - "loss": 0.9043, - "step": 36328 - }, - { - "epoch": 0.93, - "learning_rate": 1.615275217445456e-06, - "loss": 0.6538, - "step": 36329 - }, - { - "epoch": 0.93, - "learning_rate": 1.6152534042485768e-06, - "loss": 0.7334, - "step": 36330 - }, - { - "epoch": 0.93, - "learning_rate": 1.6152315905806267e-06, - "loss": 0.8984, - "step": 36331 - }, - { - "epoch": 0.93, - "learning_rate": 1.6152097764416221e-06, - "loss": 0.9082, - "step": 36332 - }, - { - "epoch": 0.93, - "learning_rate": 1.6151879618315797e-06, - "loss": 0.9785, - "step": 36333 - }, - { - "epoch": 0.93, - "learning_rate": 1.6151661467505165e-06, - "loss": 0.8398, - "step": 36334 - }, - { - "epoch": 0.93, - "learning_rate": 1.6151443311984484e-06, - "loss": 0.8379, - "step": 36335 - }, - { - "epoch": 0.93, - "learning_rate": 1.6151225151753924e-06, - "loss": 0.7671, - "step": 36336 - }, - { - "epoch": 0.93, - "learning_rate": 1.6151006986813658e-06, - "loss": 0.8584, - "step": 36337 - }, - { - "epoch": 0.93, - "learning_rate": 1.6150788817163848e-06, - "loss": 1.0107, - "step": 36338 - }, - { - "epoch": 0.93, - "learning_rate": 1.6150570642804663e-06, - "loss": 0.9824, - "step": 36339 - }, - { - "epoch": 0.93, - "learning_rate": 1.6150352463736266e-06, - "loss": 0.9424, - "step": 36340 - }, - { - "epoch": 0.93, - "learning_rate": 1.6150134279958828e-06, - "loss": 0.9238, - "step": 36341 - }, - { - "epoch": 0.93, - "learning_rate": 1.6149916091472515e-06, - "loss": 0.8735, - "step": 36342 - }, - { - "epoch": 0.93, - "learning_rate": 1.6149697898277492e-06, - "loss": 0.9297, - "step": 36343 - }, - { - "epoch": 0.93, - "learning_rate": 1.614947970037393e-06, - "loss": 0.8779, - "step": 36344 - }, - { - "epoch": 0.93, - "learning_rate": 1.6149261497761995e-06, - "loss": 0.7388, - "step": 36345 - }, - { - "epoch": 0.93, - "learning_rate": 1.6149043290441852e-06, - "loss": 0.7749, - "step": 36346 - }, - { - "epoch": 0.93, - "learning_rate": 1.614882507841367e-06, - "loss": 0.8848, - "step": 36347 - }, - { - "epoch": 0.93, - "learning_rate": 1.6148606861677615e-06, - "loss": 0.71, - "step": 36348 - }, - { - "epoch": 0.93, - "learning_rate": 1.6148388640233854e-06, - "loss": 0.9463, - "step": 36349 - }, - { - "epoch": 0.93, - "learning_rate": 1.6148170414082558e-06, - "loss": 0.9326, - "step": 36350 - }, - { - "epoch": 0.93, - "learning_rate": 1.6147952183223886e-06, - "loss": 0.9531, - "step": 36351 - }, - { - "epoch": 0.93, - "learning_rate": 1.614773394765801e-06, - "loss": 0.8398, - "step": 36352 - }, - { - "epoch": 0.93, - "learning_rate": 1.6147515707385097e-06, - "loss": 0.8193, - "step": 36353 - }, - { - "epoch": 0.93, - "learning_rate": 1.6147297462405318e-06, - "loss": 0.6724, - "step": 36354 - }, - { - "epoch": 0.93, - "learning_rate": 1.6147079212718832e-06, - "loss": 0.7988, - "step": 36355 - }, - { - "epoch": 0.93, - "learning_rate": 1.6146860958325811e-06, - "loss": 0.999, - "step": 36356 - }, - { - "epoch": 0.93, - "learning_rate": 1.6146642699226423e-06, - "loss": 0.6785, - "step": 36357 - }, - { - "epoch": 0.93, - "learning_rate": 1.6146424435420832e-06, - "loss": 0.5757, - "step": 36358 - }, - { - "epoch": 0.93, - "learning_rate": 1.6146206166909205e-06, - "loss": 0.8086, - "step": 36359 - }, - { - "epoch": 0.93, - "learning_rate": 1.6145987893691712e-06, - "loss": 0.8994, - "step": 36360 - }, - { - "epoch": 0.93, - "learning_rate": 1.6145769615768518e-06, - "loss": 0.7529, - "step": 36361 - }, - { - "epoch": 0.93, - "learning_rate": 1.6145551333139792e-06, - "loss": 0.7925, - "step": 36362 - }, - { - "epoch": 0.93, - "learning_rate": 1.6145333045805698e-06, - "loss": 0.7197, - "step": 36363 - }, - { - "epoch": 0.93, - "learning_rate": 1.6145114753766408e-06, - "loss": 1.1016, - "step": 36364 - }, - { - "epoch": 0.93, - "learning_rate": 1.6144896457022083e-06, - "loss": 0.8711, - "step": 36365 - }, - { - "epoch": 0.93, - "learning_rate": 1.6144678155572894e-06, - "loss": 0.9971, - "step": 36366 - }, - { - "epoch": 0.93, - "learning_rate": 1.614445984941901e-06, - "loss": 0.6147, - "step": 36367 - }, - { - "epoch": 0.93, - "learning_rate": 1.6144241538560594e-06, - "loss": 0.708, - "step": 36368 - }, - { - "epoch": 0.93, - "learning_rate": 1.6144023222997816e-06, - "loss": 0.7153, - "step": 36369 - }, - { - "epoch": 0.93, - "learning_rate": 1.614380490273084e-06, - "loss": 1.166, - "step": 36370 - }, - { - "epoch": 0.93, - "learning_rate": 1.6143586577759834e-06, - "loss": 0.8955, - "step": 36371 - }, - { - "epoch": 0.93, - "learning_rate": 1.6143368248084967e-06, - "loss": 0.8682, - "step": 36372 - }, - { - "epoch": 0.93, - "learning_rate": 1.6143149913706409e-06, - "loss": 0.7754, - "step": 36373 - }, - { - "epoch": 0.93, - "learning_rate": 1.614293157462432e-06, - "loss": 1.0127, - "step": 36374 - }, - { - "epoch": 0.93, - "learning_rate": 1.6142713230838872e-06, - "loss": 0.8086, - "step": 36375 - }, - { - "epoch": 0.93, - "learning_rate": 1.6142494882350231e-06, - "loss": 0.7422, - "step": 36376 - }, - { - "epoch": 0.93, - "learning_rate": 1.6142276529158561e-06, - "loss": 0.7734, - "step": 36377 - }, - { - "epoch": 0.93, - "learning_rate": 1.6142058171264035e-06, - "loss": 0.8174, - "step": 36378 - }, - { - "epoch": 0.93, - "learning_rate": 1.6141839808666816e-06, - "loss": 0.9482, - "step": 36379 - }, - { - "epoch": 0.93, - "learning_rate": 1.6141621441367078e-06, - "loss": 0.6279, - "step": 36380 - }, - { - "epoch": 0.93, - "learning_rate": 1.6141403069364979e-06, - "loss": 0.8018, - "step": 36381 - }, - { - "epoch": 0.93, - "learning_rate": 1.6141184692660688e-06, - "loss": 0.9307, - "step": 36382 - }, - { - "epoch": 0.93, - "learning_rate": 1.6140966311254376e-06, - "loss": 0.6909, - "step": 36383 - }, - { - "epoch": 0.93, - "learning_rate": 1.614074792514621e-06, - "loss": 0.8711, - "step": 36384 - }, - { - "epoch": 0.93, - "learning_rate": 1.6140529534336354e-06, - "loss": 0.7896, - "step": 36385 - }, - { - "epoch": 0.93, - "learning_rate": 1.6140311138824978e-06, - "loss": 0.8745, - "step": 36386 - }, - { - "epoch": 0.93, - "learning_rate": 1.6140092738612246e-06, - "loss": 0.9854, - "step": 36387 - }, - { - "epoch": 0.93, - "learning_rate": 1.6139874333698328e-06, - "loss": 0.9551, - "step": 36388 - }, - { - "epoch": 0.93, - "learning_rate": 1.6139655924083392e-06, - "loss": 0.6592, - "step": 36389 - }, - { - "epoch": 0.93, - "learning_rate": 1.61394375097676e-06, - "loss": 0.8872, - "step": 36390 - }, - { - "epoch": 0.93, - "learning_rate": 1.6139219090751128e-06, - "loss": 0.8662, - "step": 36391 - }, - { - "epoch": 0.93, - "learning_rate": 1.6139000667034138e-06, - "loss": 0.7686, - "step": 36392 - }, - { - "epoch": 0.93, - "learning_rate": 1.6138782238616794e-06, - "loss": 0.8496, - "step": 36393 - }, - { - "epoch": 0.93, - "learning_rate": 1.6138563805499267e-06, - "loss": 0.9512, - "step": 36394 - }, - { - "epoch": 0.93, - "learning_rate": 1.6138345367681727e-06, - "loss": 0.6885, - "step": 36395 - }, - { - "epoch": 0.93, - "learning_rate": 1.6138126925164337e-06, - "loss": 0.8662, - "step": 36396 - }, - { - "epoch": 0.93, - "learning_rate": 1.6137908477947264e-06, - "loss": 0.5215, - "step": 36397 - }, - { - "epoch": 0.93, - "learning_rate": 1.6137690026030677e-06, - "loss": 0.792, - "step": 36398 - }, - { - "epoch": 0.93, - "learning_rate": 1.6137471569414744e-06, - "loss": 0.9824, - "step": 36399 - }, - { - "epoch": 0.93, - "learning_rate": 1.6137253108099632e-06, - "loss": 0.8799, - "step": 36400 - }, - { - "epoch": 0.93, - "learning_rate": 1.6137034642085507e-06, - "loss": 0.8506, - "step": 36401 - }, - { - "epoch": 0.93, - "learning_rate": 1.6136816171372535e-06, - "loss": 0.9365, - "step": 36402 - }, - { - "epoch": 0.93, - "learning_rate": 1.6136597695960888e-06, - "loss": 0.8418, - "step": 36403 - }, - { - "epoch": 0.93, - "learning_rate": 1.6136379215850729e-06, - "loss": 0.8848, - "step": 36404 - }, - { - "epoch": 0.93, - "learning_rate": 1.6136160731042226e-06, - "loss": 1.0, - "step": 36405 - }, - { - "epoch": 0.93, - "learning_rate": 1.6135942241535545e-06, - "loss": 0.7598, - "step": 36406 - }, - { - "epoch": 0.93, - "learning_rate": 1.6135723747330859e-06, - "loss": 0.8457, - "step": 36407 - }, - { - "epoch": 0.93, - "learning_rate": 1.6135505248428327e-06, - "loss": 0.8857, - "step": 36408 - }, - { - "epoch": 0.93, - "learning_rate": 1.6135286744828125e-06, - "loss": 0.6611, - "step": 36409 - }, - { - "epoch": 0.93, - "learning_rate": 1.6135068236530414e-06, - "loss": 0.957, - "step": 36410 - }, - { - "epoch": 0.93, - "learning_rate": 1.6134849723535365e-06, - "loss": 0.614, - "step": 36411 - }, - { - "epoch": 0.93, - "learning_rate": 1.6134631205843142e-06, - "loss": 0.9082, - "step": 36412 - }, - { - "epoch": 0.93, - "learning_rate": 1.6134412683453913e-06, - "loss": 0.7598, - "step": 36413 - }, - { - "epoch": 0.93, - "learning_rate": 1.6134194156367849e-06, - "loss": 0.6328, - "step": 36414 - }, - { - "epoch": 0.93, - "learning_rate": 1.6133975624585111e-06, - "loss": 0.6685, - "step": 36415 - }, - { - "epoch": 0.93, - "learning_rate": 1.6133757088105873e-06, - "loss": 0.707, - "step": 36416 - }, - { - "epoch": 0.93, - "learning_rate": 1.6133538546930298e-06, - "loss": 0.7603, - "step": 36417 - }, - { - "epoch": 0.93, - "learning_rate": 1.6133320001058555e-06, - "loss": 0.874, - "step": 36418 - }, - { - "epoch": 0.93, - "learning_rate": 1.613310145049081e-06, - "loss": 0.9385, - "step": 36419 - }, - { - "epoch": 0.93, - "learning_rate": 1.6132882895227234e-06, - "loss": 0.8369, - "step": 36420 - }, - { - "epoch": 0.93, - "learning_rate": 1.6132664335267988e-06, - "loss": 0.8145, - "step": 36421 - }, - { - "epoch": 0.93, - "learning_rate": 1.6132445770613242e-06, - "loss": 1.0977, - "step": 36422 - }, - { - "epoch": 0.93, - "learning_rate": 1.6132227201263169e-06, - "loss": 0.8232, - "step": 36423 - }, - { - "epoch": 0.93, - "learning_rate": 1.613200862721793e-06, - "loss": 0.9912, - "step": 36424 - }, - { - "epoch": 0.93, - "learning_rate": 1.6131790048477694e-06, - "loss": 0.6582, - "step": 36425 - }, - { - "epoch": 0.93, - "learning_rate": 1.6131571465042627e-06, - "loss": 0.9053, - "step": 36426 - }, - { - "epoch": 0.93, - "learning_rate": 1.61313528769129e-06, - "loss": 0.7568, - "step": 36427 - }, - { - "epoch": 0.93, - "learning_rate": 1.6131134284088675e-06, - "loss": 0.959, - "step": 36428 - }, - { - "epoch": 0.93, - "learning_rate": 1.6130915686570123e-06, - "loss": 0.6694, - "step": 36429 - }, - { - "epoch": 0.93, - "learning_rate": 1.6130697084357411e-06, - "loss": 0.9551, - "step": 36430 - }, - { - "epoch": 0.93, - "learning_rate": 1.6130478477450708e-06, - "loss": 0.8779, - "step": 36431 - }, - { - "epoch": 0.93, - "learning_rate": 1.6130259865850178e-06, - "loss": 0.8945, - "step": 36432 - }, - { - "epoch": 0.93, - "learning_rate": 1.6130041249555988e-06, - "loss": 0.8174, - "step": 36433 - }, - { - "epoch": 0.93, - "learning_rate": 1.612982262856831e-06, - "loss": 0.7461, - "step": 36434 - }, - { - "epoch": 0.93, - "learning_rate": 1.6129604002887309e-06, - "loss": 0.8203, - "step": 36435 - }, - { - "epoch": 0.93, - "learning_rate": 1.612938537251315e-06, - "loss": 0.8223, - "step": 36436 - }, - { - "epoch": 0.93, - "learning_rate": 1.6129166737446005e-06, - "loss": 0.8872, - "step": 36437 - }, - { - "epoch": 0.93, - "learning_rate": 1.6128948097686038e-06, - "loss": 0.7358, - "step": 36438 - }, - { - "epoch": 0.93, - "learning_rate": 1.6128729453233415e-06, - "loss": 0.8672, - "step": 36439 - }, - { - "epoch": 0.93, - "learning_rate": 1.6128510804088307e-06, - "loss": 0.812, - "step": 36440 - }, - { - "epoch": 0.93, - "learning_rate": 1.6128292150250879e-06, - "loss": 0.8135, - "step": 36441 - }, - { - "epoch": 0.93, - "learning_rate": 1.6128073491721303e-06, - "loss": 1.0586, - "step": 36442 - }, - { - "epoch": 0.93, - "learning_rate": 1.6127854828499737e-06, - "loss": 0.9297, - "step": 36443 - }, - { - "epoch": 0.93, - "learning_rate": 1.6127636160586363e-06, - "loss": 0.8623, - "step": 36444 - }, - { - "epoch": 0.93, - "learning_rate": 1.6127417487981334e-06, - "loss": 0.793, - "step": 36445 - }, - { - "epoch": 0.93, - "learning_rate": 1.6127198810684822e-06, - "loss": 0.8301, - "step": 36446 - }, - { - "epoch": 0.93, - "learning_rate": 1.6126980128696998e-06, - "loss": 0.792, - "step": 36447 - }, - { - "epoch": 0.93, - "learning_rate": 1.6126761442018027e-06, - "loss": 0.917, - "step": 36448 - }, - { - "epoch": 0.93, - "learning_rate": 1.6126542750648078e-06, - "loss": 0.8066, - "step": 36449 - }, - { - "epoch": 0.93, - "learning_rate": 1.6126324054587314e-06, - "loss": 0.8169, - "step": 36450 - }, - { - "epoch": 0.93, - "learning_rate": 1.6126105353835905e-06, - "loss": 1.0352, - "step": 36451 - }, - { - "epoch": 0.93, - "learning_rate": 1.6125886648394022e-06, - "loss": 0.8613, - "step": 36452 - }, - { - "epoch": 0.93, - "learning_rate": 1.6125667938261828e-06, - "loss": 0.8398, - "step": 36453 - }, - { - "epoch": 0.93, - "learning_rate": 1.612544922343949e-06, - "loss": 0.9414, - "step": 36454 - }, - { - "epoch": 0.93, - "learning_rate": 1.612523050392718e-06, - "loss": 0.7998, - "step": 36455 - }, - { - "epoch": 0.93, - "learning_rate": 1.612501177972506e-06, - "loss": 0.7534, - "step": 36456 - }, - { - "epoch": 0.93, - "learning_rate": 1.61247930508333e-06, - "loss": 1.0186, - "step": 36457 - }, - { - "epoch": 0.93, - "learning_rate": 1.6124574317252068e-06, - "loss": 0.8975, - "step": 36458 - }, - { - "epoch": 0.93, - "learning_rate": 1.6124355578981534e-06, - "loss": 0.5931, - "step": 36459 - }, - { - "epoch": 0.93, - "learning_rate": 1.612413683602186e-06, - "loss": 1.0215, - "step": 36460 - }, - { - "epoch": 0.93, - "learning_rate": 1.6123918088373217e-06, - "loss": 0.8096, - "step": 36461 - }, - { - "epoch": 0.93, - "learning_rate": 1.612369933603577e-06, - "loss": 0.8633, - "step": 36462 - }, - { - "epoch": 0.93, - "learning_rate": 1.6123480579009688e-06, - "loss": 0.8025, - "step": 36463 - }, - { - "epoch": 0.93, - "learning_rate": 1.612326181729514e-06, - "loss": 0.8633, - "step": 36464 - }, - { - "epoch": 0.93, - "learning_rate": 1.6123043050892293e-06, - "loss": 0.8115, - "step": 36465 - }, - { - "epoch": 0.93, - "learning_rate": 1.612282427980131e-06, - "loss": 1.0059, - "step": 36466 - }, - { - "epoch": 0.93, - "learning_rate": 1.6122605504022365e-06, - "loss": 0.792, - "step": 36467 - }, - { - "epoch": 0.93, - "learning_rate": 1.6122386723555619e-06, - "loss": 0.8232, - "step": 36468 - }, - { - "epoch": 0.93, - "learning_rate": 1.6122167938401248e-06, - "loss": 0.9033, - "step": 36469 - }, - { - "epoch": 0.93, - "learning_rate": 1.612194914855941e-06, - "loss": 0.8867, - "step": 36470 - }, - { - "epoch": 0.93, - "learning_rate": 1.612173035403028e-06, - "loss": 0.9072, - "step": 36471 - }, - { - "epoch": 0.93, - "learning_rate": 1.612151155481402e-06, - "loss": 0.7412, - "step": 36472 - }, - { - "epoch": 0.93, - "learning_rate": 1.6121292750910802e-06, - "loss": 0.8389, - "step": 36473 - }, - { - "epoch": 0.93, - "learning_rate": 1.6121073942320793e-06, - "loss": 0.8525, - "step": 36474 - }, - { - "epoch": 0.93, - "learning_rate": 1.6120855129044158e-06, - "loss": 0.7393, - "step": 36475 - }, - { - "epoch": 0.93, - "learning_rate": 1.6120636311081063e-06, - "loss": 1.0225, - "step": 36476 - }, - { - "epoch": 0.93, - "learning_rate": 1.612041748843168e-06, - "loss": 0.7546, - "step": 36477 - }, - { - "epoch": 0.93, - "learning_rate": 1.6120198661096173e-06, - "loss": 0.7568, - "step": 36478 - }, - { - "epoch": 0.93, - "learning_rate": 1.6119979829074714e-06, - "loss": 0.8965, - "step": 36479 - }, - { - "epoch": 0.94, - "learning_rate": 1.6119760992367468e-06, - "loss": 0.8564, - "step": 36480 - }, - { - "epoch": 0.94, - "learning_rate": 1.61195421509746e-06, - "loss": 0.9961, - "step": 36481 - }, - { - "epoch": 0.94, - "learning_rate": 1.6119323304896282e-06, - "loss": 0.7666, - "step": 36482 - }, - { - "epoch": 0.94, - "learning_rate": 1.6119104454132679e-06, - "loss": 1.0234, - "step": 36483 - }, - { - "epoch": 0.94, - "learning_rate": 1.611888559868396e-06, - "loss": 0.8223, - "step": 36484 - }, - { - "epoch": 0.94, - "learning_rate": 1.611866673855029e-06, - "loss": 0.6924, - "step": 36485 - }, - { - "epoch": 0.94, - "learning_rate": 1.611844787373184e-06, - "loss": 0.8252, - "step": 36486 - }, - { - "epoch": 0.94, - "learning_rate": 1.6118229004228772e-06, - "loss": 0.7607, - "step": 36487 - }, - { - "epoch": 0.94, - "learning_rate": 1.6118010130041263e-06, - "loss": 1.1455, - "step": 36488 - }, - { - "epoch": 0.94, - "learning_rate": 1.611779125116947e-06, - "loss": 0.8955, - "step": 36489 - }, - { - "epoch": 0.94, - "learning_rate": 1.6117572367613567e-06, - "loss": 0.8438, - "step": 36490 - }, - { - "epoch": 0.94, - "learning_rate": 1.6117353479373721e-06, - "loss": 0.832, - "step": 36491 - }, - { - "epoch": 0.94, - "learning_rate": 1.61171345864501e-06, - "loss": 0.8848, - "step": 36492 - }, - { - "epoch": 0.94, - "learning_rate": 1.6116915688842868e-06, - "loss": 0.8066, - "step": 36493 - }, - { - "epoch": 0.94, - "learning_rate": 1.6116696786552195e-06, - "loss": 0.6528, - "step": 36494 - }, - { - "epoch": 0.94, - "learning_rate": 1.611647787957825e-06, - "loss": 0.8599, - "step": 36495 - }, - { - "epoch": 0.94, - "learning_rate": 1.6116258967921197e-06, - "loss": 1.0117, - "step": 36496 - }, - { - "epoch": 0.94, - "learning_rate": 1.6116040051581207e-06, - "loss": 0.7578, - "step": 36497 - }, - { - "epoch": 0.94, - "learning_rate": 1.6115821130558449e-06, - "loss": 0.7754, - "step": 36498 - }, - { - "epoch": 0.94, - "learning_rate": 1.6115602204853084e-06, - "loss": 0.7686, - "step": 36499 - }, - { - "epoch": 0.94, - "learning_rate": 1.6115383274465284e-06, - "loss": 0.8447, - "step": 36500 - }, - { - "epoch": 0.94, - "learning_rate": 1.6115164339395217e-06, - "loss": 0.9902, - "step": 36501 - }, - { - "epoch": 0.94, - "learning_rate": 1.611494539964305e-06, - "loss": 0.7695, - "step": 36502 - }, - { - "epoch": 0.94, - "learning_rate": 1.6114726455208951e-06, - "loss": 1.0117, - "step": 36503 - }, - { - "epoch": 0.94, - "learning_rate": 1.6114507506093085e-06, - "loss": 0.8887, - "step": 36504 - }, - { - "epoch": 0.94, - "learning_rate": 1.6114288552295623e-06, - "loss": 0.9053, - "step": 36505 - }, - { - "epoch": 0.94, - "learning_rate": 1.6114069593816733e-06, - "loss": 0.7656, - "step": 36506 - }, - { - "epoch": 0.94, - "learning_rate": 1.6113850630656578e-06, - "loss": 0.8359, - "step": 36507 - }, - { - "epoch": 0.94, - "learning_rate": 1.6113631662815332e-06, - "loss": 0.7705, - "step": 36508 - }, - { - "epoch": 0.94, - "learning_rate": 1.611341269029316e-06, - "loss": 0.7153, - "step": 36509 - }, - { - "epoch": 0.94, - "learning_rate": 1.6113193713090226e-06, - "loss": 0.9111, - "step": 36510 - }, - { - "epoch": 0.94, - "learning_rate": 1.6112974731206702e-06, - "loss": 0.7969, - "step": 36511 - }, - { - "epoch": 0.94, - "learning_rate": 1.6112755744642751e-06, - "loss": 0.6035, - "step": 36512 - }, - { - "epoch": 0.94, - "learning_rate": 1.611253675339855e-06, - "loss": 1.0859, - "step": 36513 - }, - { - "epoch": 0.94, - "learning_rate": 1.6112317757474256e-06, - "loss": 0.7871, - "step": 36514 - }, - { - "epoch": 0.94, - "learning_rate": 1.6112098756870043e-06, - "loss": 0.6855, - "step": 36515 - }, - { - "epoch": 0.94, - "learning_rate": 1.6111879751586078e-06, - "loss": 0.9609, - "step": 36516 - }, - { - "epoch": 0.94, - "learning_rate": 1.6111660741622526e-06, - "loss": 0.7441, - "step": 36517 - }, - { - "epoch": 0.94, - "learning_rate": 1.6111441726979558e-06, - "loss": 0.8223, - "step": 36518 - }, - { - "epoch": 0.94, - "learning_rate": 1.6111222707657337e-06, - "loss": 0.8047, - "step": 36519 - }, - { - "epoch": 0.94, - "learning_rate": 1.6111003683656038e-06, - "loss": 0.8955, - "step": 36520 - }, - { - "epoch": 0.94, - "learning_rate": 1.611078465497582e-06, - "loss": 0.9355, - "step": 36521 - }, - { - "epoch": 0.94, - "learning_rate": 1.6110565621616856e-06, - "loss": 0.9248, - "step": 36522 - }, - { - "epoch": 0.94, - "learning_rate": 1.6110346583579318e-06, - "loss": 0.7515, - "step": 36523 - }, - { - "epoch": 0.94, - "learning_rate": 1.6110127540863364e-06, - "loss": 0.8643, - "step": 36524 - }, - { - "epoch": 0.94, - "learning_rate": 1.6109908493469166e-06, - "loss": 0.8965, - "step": 36525 - }, - { - "epoch": 0.94, - "learning_rate": 1.6109689441396892e-06, - "loss": 0.9834, - "step": 36526 - }, - { - "epoch": 0.94, - "learning_rate": 1.6109470384646713e-06, - "loss": 0.8516, - "step": 36527 - }, - { - "epoch": 0.94, - "learning_rate": 1.610925132321879e-06, - "loss": 0.6544, - "step": 36528 - }, - { - "epoch": 0.94, - "learning_rate": 1.6109032257113294e-06, - "loss": 0.9062, - "step": 36529 - }, - { - "epoch": 0.94, - "learning_rate": 1.6108813186330397e-06, - "loss": 0.7104, - "step": 36530 - }, - { - "epoch": 0.94, - "learning_rate": 1.610859411087026e-06, - "loss": 0.6309, - "step": 36531 - }, - { - "epoch": 0.94, - "learning_rate": 1.6108375030733053e-06, - "loss": 0.8071, - "step": 36532 - }, - { - "epoch": 0.94, - "learning_rate": 1.6108155945918945e-06, - "loss": 0.7695, - "step": 36533 - }, - { - "epoch": 0.94, - "learning_rate": 1.61079368564281e-06, - "loss": 0.6934, - "step": 36534 - }, - { - "epoch": 0.94, - "learning_rate": 1.6107717762260693e-06, - "loss": 0.8555, - "step": 36535 - }, - { - "epoch": 0.94, - "learning_rate": 1.6107498663416886e-06, - "loss": 0.6992, - "step": 36536 - }, - { - "epoch": 0.94, - "learning_rate": 1.6107279559896845e-06, - "loss": 0.9014, - "step": 36537 - }, - { - "epoch": 0.94, - "learning_rate": 1.6107060451700748e-06, - "loss": 1.0371, - "step": 36538 - }, - { - "epoch": 0.94, - "learning_rate": 1.610684133882875e-06, - "loss": 0.8467, - "step": 36539 - }, - { - "epoch": 0.94, - "learning_rate": 1.6106622221281024e-06, - "loss": 0.7715, - "step": 36540 - }, - { - "epoch": 0.94, - "learning_rate": 1.610640309905774e-06, - "loss": 1.0537, - "step": 36541 - }, - { - "epoch": 0.94, - "learning_rate": 1.6106183972159062e-06, - "loss": 0.7109, - "step": 36542 - }, - { - "epoch": 0.94, - "learning_rate": 1.6105964840585163e-06, - "loss": 0.8887, - "step": 36543 - }, - { - "epoch": 0.94, - "learning_rate": 1.6105745704336205e-06, - "loss": 0.8457, - "step": 36544 - }, - { - "epoch": 0.94, - "learning_rate": 1.6105526563412358e-06, - "loss": 0.7256, - "step": 36545 - }, - { - "epoch": 0.94, - "learning_rate": 1.610530741781379e-06, - "loss": 1.0742, - "step": 36546 - }, - { - "epoch": 0.94, - "learning_rate": 1.6105088267540672e-06, - "loss": 0.6411, - "step": 36547 - }, - { - "epoch": 0.94, - "learning_rate": 1.6104869112593167e-06, - "loss": 0.8853, - "step": 36548 - }, - { - "epoch": 0.94, - "learning_rate": 1.610464995297144e-06, - "loss": 0.7915, - "step": 36549 - }, - { - "epoch": 0.94, - "learning_rate": 1.6104430788675668e-06, - "loss": 0.5938, - "step": 36550 - }, - { - "epoch": 0.94, - "learning_rate": 1.6104211619706014e-06, - "loss": 1.0566, - "step": 36551 - }, - { - "epoch": 0.94, - "learning_rate": 1.6103992446062643e-06, - "loss": 1.2383, - "step": 36552 - }, - { - "epoch": 0.94, - "learning_rate": 1.6103773267745729e-06, - "loss": 0.8545, - "step": 36553 - }, - { - "epoch": 0.94, - "learning_rate": 1.6103554084755435e-06, - "loss": 0.6982, - "step": 36554 - }, - { - "epoch": 0.94, - "learning_rate": 1.6103334897091928e-06, - "loss": 0.6545, - "step": 36555 - }, - { - "epoch": 0.94, - "learning_rate": 1.6103115704755384e-06, - "loss": 0.8867, - "step": 36556 - }, - { - "epoch": 0.94, - "learning_rate": 1.610289650774596e-06, - "loss": 0.8193, - "step": 36557 - }, - { - "epoch": 0.94, - "learning_rate": 1.6102677306063832e-06, - "loss": 0.7656, - "step": 36558 - }, - { - "epoch": 0.94, - "learning_rate": 1.6102458099709163e-06, - "loss": 0.8994, - "step": 36559 - }, - { - "epoch": 0.94, - "learning_rate": 1.610223888868212e-06, - "loss": 0.7017, - "step": 36560 - }, - { - "epoch": 0.94, - "learning_rate": 1.6102019672982876e-06, - "loss": 1.0264, - "step": 36561 - }, - { - "epoch": 0.94, - "learning_rate": 1.6101800452611593e-06, - "loss": 0.8643, - "step": 36562 - }, - { - "epoch": 0.94, - "learning_rate": 1.6101581227568449e-06, - "loss": 0.7559, - "step": 36563 - }, - { - "epoch": 0.94, - "learning_rate": 1.61013619978536e-06, - "loss": 0.7031, - "step": 36564 - }, - { - "epoch": 0.94, - "learning_rate": 1.6101142763467217e-06, - "loss": 0.9399, - "step": 36565 - }, - { - "epoch": 0.94, - "learning_rate": 1.6100923524409474e-06, - "loss": 0.7574, - "step": 36566 - }, - { - "epoch": 0.94, - "learning_rate": 1.6100704280680529e-06, - "loss": 0.7783, - "step": 36567 - }, - { - "epoch": 0.94, - "learning_rate": 1.610048503228056e-06, - "loss": 0.8164, - "step": 36568 - }, - { - "epoch": 0.94, - "learning_rate": 1.6100265779209728e-06, - "loss": 0.96, - "step": 36569 - }, - { - "epoch": 0.94, - "learning_rate": 1.6100046521468204e-06, - "loss": 0.9277, - "step": 36570 - }, - { - "epoch": 0.94, - "learning_rate": 1.6099827259056154e-06, - "loss": 0.7808, - "step": 36571 - }, - { - "epoch": 0.94, - "learning_rate": 1.6099607991973744e-06, - "loss": 0.7339, - "step": 36572 - }, - { - "epoch": 0.94, - "learning_rate": 1.609938872022115e-06, - "loss": 0.803, - "step": 36573 - }, - { - "epoch": 0.94, - "learning_rate": 1.609916944379853e-06, - "loss": 0.8701, - "step": 36574 - }, - { - "epoch": 0.94, - "learning_rate": 1.609895016270606e-06, - "loss": 0.833, - "step": 36575 - }, - { - "epoch": 0.94, - "learning_rate": 1.6098730876943903e-06, - "loss": 0.9854, - "step": 36576 - }, - { - "epoch": 0.94, - "learning_rate": 1.6098511586512228e-06, - "loss": 0.8145, - "step": 36577 - }, - { - "epoch": 0.94, - "learning_rate": 1.6098292291411202e-06, - "loss": 0.9766, - "step": 36578 - }, - { - "epoch": 0.94, - "learning_rate": 1.6098072991640996e-06, - "loss": 0.8779, - "step": 36579 - }, - { - "epoch": 0.94, - "learning_rate": 1.6097853687201774e-06, - "loss": 0.9072, - "step": 36580 - }, - { - "epoch": 0.94, - "learning_rate": 1.6097634378093705e-06, - "loss": 0.9937, - "step": 36581 - }, - { - "epoch": 0.94, - "learning_rate": 1.609741506431696e-06, - "loss": 0.8452, - "step": 36582 - }, - { - "epoch": 0.94, - "learning_rate": 1.6097195745871707e-06, - "loss": 0.8408, - "step": 36583 - }, - { - "epoch": 0.94, - "learning_rate": 1.6096976422758108e-06, - "loss": 0.6943, - "step": 36584 - }, - { - "epoch": 0.94, - "learning_rate": 1.6096757094976334e-06, - "loss": 0.8311, - "step": 36585 - }, - { - "epoch": 0.94, - "learning_rate": 1.6096537762526556e-06, - "loss": 0.8184, - "step": 36586 - }, - { - "epoch": 0.94, - "learning_rate": 1.6096318425408938e-06, - "loss": 0.71, - "step": 36587 - }, - { - "epoch": 0.94, - "learning_rate": 1.6096099083623649e-06, - "loss": 0.7852, - "step": 36588 - }, - { - "epoch": 0.94, - "learning_rate": 1.609587973717086e-06, - "loss": 0.8721, - "step": 36589 - }, - { - "epoch": 0.94, - "learning_rate": 1.6095660386050732e-06, - "loss": 0.6183, - "step": 36590 - }, - { - "epoch": 0.94, - "learning_rate": 1.6095441030263438e-06, - "loss": 0.6328, - "step": 36591 - }, - { - "epoch": 0.94, - "learning_rate": 1.6095221669809145e-06, - "loss": 0.9648, - "step": 36592 - }, - { - "epoch": 0.94, - "learning_rate": 1.6095002304688024e-06, - "loss": 0.9092, - "step": 36593 - }, - { - "epoch": 0.94, - "learning_rate": 1.6094782934900235e-06, - "loss": 0.7471, - "step": 36594 - }, - { - "epoch": 0.94, - "learning_rate": 1.6094563560445955e-06, - "loss": 0.9199, - "step": 36595 - }, - { - "epoch": 0.94, - "learning_rate": 1.6094344181325345e-06, - "loss": 0.8066, - "step": 36596 - }, - { - "epoch": 0.94, - "learning_rate": 1.6094124797538577e-06, - "loss": 0.9619, - "step": 36597 - }, - { - "epoch": 0.94, - "learning_rate": 1.6093905409085822e-06, - "loss": 0.7197, - "step": 36598 - }, - { - "epoch": 0.94, - "learning_rate": 1.6093686015967238e-06, - "loss": 0.8809, - "step": 36599 - }, - { - "epoch": 0.94, - "learning_rate": 1.6093466618183003e-06, - "loss": 0.8491, - "step": 36600 - }, - { - "epoch": 0.94, - "learning_rate": 1.6093247215733276e-06, - "loss": 0.7925, - "step": 36601 - }, - { - "epoch": 0.94, - "learning_rate": 1.6093027808618235e-06, - "loss": 0.9189, - "step": 36602 - }, - { - "epoch": 0.94, - "learning_rate": 1.6092808396838042e-06, - "loss": 0.6055, - "step": 36603 - }, - { - "epoch": 0.94, - "learning_rate": 1.6092588980392864e-06, - "loss": 1.0059, - "step": 36604 - }, - { - "epoch": 0.94, - "learning_rate": 1.609236955928287e-06, - "loss": 0.6143, - "step": 36605 - }, - { - "epoch": 0.94, - "learning_rate": 1.609215013350823e-06, - "loss": 0.7993, - "step": 36606 - }, - { - "epoch": 0.94, - "learning_rate": 1.609193070306911e-06, - "loss": 0.79, - "step": 36607 - }, - { - "epoch": 0.94, - "learning_rate": 1.6091711267965683e-06, - "loss": 0.769, - "step": 36608 - }, - { - "epoch": 0.94, - "learning_rate": 1.6091491828198107e-06, - "loss": 0.814, - "step": 36609 - }, - { - "epoch": 0.94, - "learning_rate": 1.6091272383766557e-06, - "loss": 0.4893, - "step": 36610 - }, - { - "epoch": 0.94, - "learning_rate": 1.60910529346712e-06, - "loss": 0.7451, - "step": 36611 - }, - { - "epoch": 0.94, - "learning_rate": 1.6090833480912205e-06, - "loss": 0.3989, - "step": 36612 - }, - { - "epoch": 0.94, - "learning_rate": 1.6090614022489738e-06, - "loss": 0.7778, - "step": 36613 - }, - { - "epoch": 0.94, - "learning_rate": 1.609039455940397e-06, - "loss": 0.7949, - "step": 36614 - }, - { - "epoch": 0.94, - "learning_rate": 1.6090175091655065e-06, - "loss": 0.7178, - "step": 36615 - }, - { - "epoch": 0.94, - "learning_rate": 1.6089955619243193e-06, - "loss": 0.916, - "step": 36616 - }, - { - "epoch": 0.94, - "learning_rate": 1.6089736142168523e-06, - "loss": 0.8428, - "step": 36617 - }, - { - "epoch": 0.94, - "learning_rate": 1.6089516660431222e-06, - "loss": 0.7793, - "step": 36618 - }, - { - "epoch": 0.94, - "learning_rate": 1.6089297174031456e-06, - "loss": 1.0469, - "step": 36619 - }, - { - "epoch": 0.94, - "learning_rate": 1.6089077682969397e-06, - "loss": 1.0537, - "step": 36620 - }, - { - "epoch": 0.94, - "learning_rate": 1.6088858187245208e-06, - "loss": 0.8252, - "step": 36621 - }, - { - "epoch": 0.94, - "learning_rate": 1.6088638686859065e-06, - "loss": 0.958, - "step": 36622 - }, - { - "epoch": 0.94, - "learning_rate": 1.608841918181113e-06, - "loss": 0.8555, - "step": 36623 - }, - { - "epoch": 0.94, - "learning_rate": 1.6088199672101572e-06, - "loss": 0.71, - "step": 36624 - }, - { - "epoch": 0.94, - "learning_rate": 1.608798015773056e-06, - "loss": 0.7476, - "step": 36625 - }, - { - "epoch": 0.94, - "learning_rate": 1.608776063869826e-06, - "loss": 0.9004, - "step": 36626 - }, - { - "epoch": 0.94, - "learning_rate": 1.608754111500484e-06, - "loss": 0.7598, - "step": 36627 - }, - { - "epoch": 0.94, - "learning_rate": 1.6087321586650476e-06, - "loss": 0.8975, - "step": 36628 - }, - { - "epoch": 0.94, - "learning_rate": 1.6087102053635324e-06, - "loss": 0.6021, - "step": 36629 - }, - { - "epoch": 0.94, - "learning_rate": 1.6086882515959559e-06, - "loss": 0.8247, - "step": 36630 - }, - { - "epoch": 0.94, - "learning_rate": 1.6086662973623348e-06, - "loss": 0.8789, - "step": 36631 - }, - { - "epoch": 0.94, - "learning_rate": 1.608644342662686e-06, - "loss": 0.7148, - "step": 36632 - }, - { - "epoch": 0.94, - "learning_rate": 1.6086223874970264e-06, - "loss": 0.8369, - "step": 36633 - }, - { - "epoch": 0.94, - "learning_rate": 1.6086004318653724e-06, - "loss": 0.8047, - "step": 36634 - }, - { - "epoch": 0.94, - "learning_rate": 1.6085784757677408e-06, - "loss": 0.6885, - "step": 36635 - }, - { - "epoch": 0.94, - "learning_rate": 1.608556519204149e-06, - "loss": 0.8848, - "step": 36636 - }, - { - "epoch": 0.94, - "learning_rate": 1.6085345621746132e-06, - "loss": 0.8364, - "step": 36637 - }, - { - "epoch": 0.94, - "learning_rate": 1.6085126046791507e-06, - "loss": 0.7988, - "step": 36638 - }, - { - "epoch": 0.94, - "learning_rate": 1.608490646717778e-06, - "loss": 0.8408, - "step": 36639 - }, - { - "epoch": 0.94, - "learning_rate": 1.6084686882905118e-06, - "loss": 0.9219, - "step": 36640 - }, - { - "epoch": 0.94, - "learning_rate": 1.6084467293973693e-06, - "loss": 0.7549, - "step": 36641 - }, - { - "epoch": 0.94, - "learning_rate": 1.608424770038367e-06, - "loss": 0.7939, - "step": 36642 - }, - { - "epoch": 0.94, - "learning_rate": 1.6084028102135221e-06, - "loss": 0.7041, - "step": 36643 - }, - { - "epoch": 0.94, - "learning_rate": 1.608380849922851e-06, - "loss": 0.6001, - "step": 36644 - }, - { - "epoch": 0.94, - "learning_rate": 1.6083588891663706e-06, - "loss": 0.9277, - "step": 36645 - }, - { - "epoch": 0.94, - "learning_rate": 1.6083369279440976e-06, - "loss": 0.7925, - "step": 36646 - }, - { - "epoch": 0.94, - "learning_rate": 1.6083149662560494e-06, - "loss": 0.7212, - "step": 36647 - }, - { - "epoch": 0.94, - "learning_rate": 1.6082930041022421e-06, - "loss": 0.8271, - "step": 36648 - }, - { - "epoch": 0.94, - "learning_rate": 1.608271041482693e-06, - "loss": 0.9668, - "step": 36649 - }, - { - "epoch": 0.94, - "learning_rate": 1.6082490783974186e-06, - "loss": 0.6892, - "step": 36650 - }, - { - "epoch": 0.94, - "learning_rate": 1.6082271148464358e-06, - "loss": 0.9375, - "step": 36651 - }, - { - "epoch": 0.94, - "learning_rate": 1.6082051508297615e-06, - "loss": 0.8096, - "step": 36652 - }, - { - "epoch": 0.94, - "learning_rate": 1.6081831863474124e-06, - "loss": 0.7368, - "step": 36653 - }, - { - "epoch": 0.94, - "learning_rate": 1.6081612213994058e-06, - "loss": 0.7031, - "step": 36654 - }, - { - "epoch": 0.94, - "learning_rate": 1.6081392559857576e-06, - "loss": 0.876, - "step": 36655 - }, - { - "epoch": 0.94, - "learning_rate": 1.6081172901064855e-06, - "loss": 0.6968, - "step": 36656 - }, - { - "epoch": 0.94, - "learning_rate": 1.6080953237616056e-06, - "loss": 0.9873, - "step": 36657 - }, - { - "epoch": 0.94, - "learning_rate": 1.6080733569511352e-06, - "loss": 0.7666, - "step": 36658 - }, - { - "epoch": 0.94, - "learning_rate": 1.6080513896750913e-06, - "loss": 1.0215, - "step": 36659 - }, - { - "epoch": 0.94, - "learning_rate": 1.6080294219334902e-06, - "loss": 0.7705, - "step": 36660 - }, - { - "epoch": 0.94, - "learning_rate": 1.608007453726349e-06, - "loss": 0.9844, - "step": 36661 - }, - { - "epoch": 0.94, - "learning_rate": 1.6079854850536842e-06, - "loss": 0.771, - "step": 36662 - }, - { - "epoch": 0.94, - "learning_rate": 1.6079635159155132e-06, - "loss": 0.8599, - "step": 36663 - }, - { - "epoch": 0.94, - "learning_rate": 1.6079415463118524e-06, - "loss": 0.8887, - "step": 36664 - }, - { - "epoch": 0.94, - "learning_rate": 1.6079195762427185e-06, - "loss": 0.9824, - "step": 36665 - }, - { - "epoch": 0.94, - "learning_rate": 1.6078976057081288e-06, - "loss": 0.8301, - "step": 36666 - }, - { - "epoch": 0.94, - "learning_rate": 1.6078756347080997e-06, - "loss": 0.6367, - "step": 36667 - }, - { - "epoch": 0.94, - "learning_rate": 1.6078536632426483e-06, - "loss": 1.0039, - "step": 36668 - }, - { - "epoch": 0.94, - "learning_rate": 1.607831691311791e-06, - "loss": 0.8564, - "step": 36669 - }, - { - "epoch": 0.94, - "learning_rate": 1.6078097189155452e-06, - "loss": 0.6245, - "step": 36670 - }, - { - "epoch": 0.94, - "learning_rate": 1.6077877460539273e-06, - "loss": 1.0015, - "step": 36671 - }, - { - "epoch": 0.94, - "learning_rate": 1.6077657727269544e-06, - "loss": 0.8506, - "step": 36672 - }, - { - "epoch": 0.94, - "learning_rate": 1.6077437989346434e-06, - "loss": 0.7358, - "step": 36673 - }, - { - "epoch": 0.94, - "learning_rate": 1.6077218246770104e-06, - "loss": 0.8584, - "step": 36674 - }, - { - "epoch": 0.94, - "learning_rate": 1.607699849954073e-06, - "loss": 0.9551, - "step": 36675 - }, - { - "epoch": 0.94, - "learning_rate": 1.6076778747658479e-06, - "loss": 0.9688, - "step": 36676 - }, - { - "epoch": 0.94, - "learning_rate": 1.6076558991123514e-06, - "loss": 0.8584, - "step": 36677 - }, - { - "epoch": 0.94, - "learning_rate": 1.6076339229936013e-06, - "loss": 0.8662, - "step": 36678 - }, - { - "epoch": 0.94, - "learning_rate": 1.6076119464096137e-06, - "loss": 0.9351, - "step": 36679 - }, - { - "epoch": 0.94, - "learning_rate": 1.6075899693604051e-06, - "loss": 0.9873, - "step": 36680 - }, - { - "epoch": 0.94, - "learning_rate": 1.6075679918459933e-06, - "loss": 0.7842, - "step": 36681 - }, - { - "epoch": 0.94, - "learning_rate": 1.6075460138663942e-06, - "loss": 0.6494, - "step": 36682 - }, - { - "epoch": 0.94, - "learning_rate": 1.6075240354216254e-06, - "loss": 0.9121, - "step": 36683 - }, - { - "epoch": 0.94, - "learning_rate": 1.6075020565117033e-06, - "loss": 0.7881, - "step": 36684 - }, - { - "epoch": 0.94, - "learning_rate": 1.6074800771366445e-06, - "loss": 0.7578, - "step": 36685 - }, - { - "epoch": 0.94, - "learning_rate": 1.6074580972964666e-06, - "loss": 0.8975, - "step": 36686 - }, - { - "epoch": 0.94, - "learning_rate": 1.6074361169911857e-06, - "loss": 0.7451, - "step": 36687 - }, - { - "epoch": 0.94, - "learning_rate": 1.6074141362208188e-06, - "loss": 0.771, - "step": 36688 - }, - { - "epoch": 0.94, - "learning_rate": 1.607392154985383e-06, - "loss": 0.6157, - "step": 36689 - }, - { - "epoch": 0.94, - "learning_rate": 1.6073701732848953e-06, - "loss": 0.8564, - "step": 36690 - }, - { - "epoch": 0.94, - "learning_rate": 1.6073481911193716e-06, - "loss": 0.9326, - "step": 36691 - }, - { - "epoch": 0.94, - "learning_rate": 1.6073262084888295e-06, - "loss": 1.1191, - "step": 36692 - }, - { - "epoch": 0.94, - "learning_rate": 1.6073042253932859e-06, - "loss": 0.9004, - "step": 36693 - }, - { - "epoch": 0.94, - "learning_rate": 1.6072822418327572e-06, - "loss": 0.8833, - "step": 36694 - }, - { - "epoch": 0.94, - "learning_rate": 1.6072602578072603e-06, - "loss": 0.8877, - "step": 36695 - }, - { - "epoch": 0.94, - "learning_rate": 1.6072382733168122e-06, - "loss": 0.7676, - "step": 36696 - }, - { - "epoch": 0.94, - "learning_rate": 1.6072162883614294e-06, - "loss": 0.6724, - "step": 36697 - }, - { - "epoch": 0.94, - "learning_rate": 1.6071943029411298e-06, - "loss": 0.8506, - "step": 36698 - }, - { - "epoch": 0.94, - "learning_rate": 1.6071723170559288e-06, - "loss": 0.7041, - "step": 36699 - }, - { - "epoch": 0.94, - "learning_rate": 1.607150330705844e-06, - "loss": 0.8057, - "step": 36700 - }, - { - "epoch": 0.94, - "learning_rate": 1.607128343890892e-06, - "loss": 0.749, - "step": 36701 - }, - { - "epoch": 0.94, - "learning_rate": 1.60710635661109e-06, - "loss": 0.9736, - "step": 36702 - }, - { - "epoch": 0.94, - "learning_rate": 1.6070843688664546e-06, - "loss": 0.8691, - "step": 36703 - }, - { - "epoch": 0.94, - "learning_rate": 1.6070623806570023e-06, - "loss": 1.082, - "step": 36704 - }, - { - "epoch": 0.94, - "learning_rate": 1.6070403919827506e-06, - "loss": 1.0273, - "step": 36705 - }, - { - "epoch": 0.94, - "learning_rate": 1.6070184028437156e-06, - "loss": 0.8838, - "step": 36706 - }, - { - "epoch": 0.94, - "learning_rate": 1.6069964132399147e-06, - "loss": 0.7666, - "step": 36707 - }, - { - "epoch": 0.94, - "learning_rate": 1.6069744231713646e-06, - "loss": 0.8135, - "step": 36708 - }, - { - "epoch": 0.94, - "learning_rate": 1.6069524326380823e-06, - "loss": 0.7568, - "step": 36709 - }, - { - "epoch": 0.94, - "learning_rate": 1.6069304416400842e-06, - "loss": 0.7734, - "step": 36710 - }, - { - "epoch": 0.94, - "learning_rate": 1.6069084501773873e-06, - "loss": 0.9238, - "step": 36711 - }, - { - "epoch": 0.94, - "learning_rate": 1.6068864582500086e-06, - "loss": 0.5776, - "step": 36712 - }, - { - "epoch": 0.94, - "learning_rate": 1.606864465857965e-06, - "loss": 0.876, - "step": 36713 - }, - { - "epoch": 0.94, - "learning_rate": 1.6068424730012731e-06, - "loss": 0.9404, - "step": 36714 - }, - { - "epoch": 0.94, - "learning_rate": 1.6068204796799494e-06, - "loss": 1.002, - "step": 36715 - }, - { - "epoch": 0.94, - "learning_rate": 1.6067984858940116e-06, - "loss": 0.6699, - "step": 36716 - }, - { - "epoch": 0.94, - "learning_rate": 1.606776491643476e-06, - "loss": 0.7275, - "step": 36717 - }, - { - "epoch": 0.94, - "learning_rate": 1.6067544969283597e-06, - "loss": 0.9316, - "step": 36718 - }, - { - "epoch": 0.94, - "learning_rate": 1.606732501748679e-06, - "loss": 1.0498, - "step": 36719 - }, - { - "epoch": 0.94, - "learning_rate": 1.6067105061044514e-06, - "loss": 0.709, - "step": 36720 - }, - { - "epoch": 0.94, - "learning_rate": 1.6066885099956933e-06, - "loss": 0.9033, - "step": 36721 - }, - { - "epoch": 0.94, - "learning_rate": 1.606666513422422e-06, - "loss": 0.6382, - "step": 36722 - }, - { - "epoch": 0.94, - "learning_rate": 1.6066445163846539e-06, - "loss": 0.7324, - "step": 36723 - }, - { - "epoch": 0.94, - "learning_rate": 1.6066225188824058e-06, - "loss": 0.958, - "step": 36724 - }, - { - "epoch": 0.94, - "learning_rate": 1.606600520915695e-06, - "loss": 0.8828, - "step": 36725 - }, - { - "epoch": 0.94, - "learning_rate": 1.6065785224845378e-06, - "loss": 0.8789, - "step": 36726 - }, - { - "epoch": 0.94, - "learning_rate": 1.6065565235889515e-06, - "loss": 0.7031, - "step": 36727 - }, - { - "epoch": 0.94, - "learning_rate": 1.6065345242289527e-06, - "loss": 0.835, - "step": 36728 - }, - { - "epoch": 0.94, - "learning_rate": 1.6065125244045583e-06, - "loss": 0.6587, - "step": 36729 - }, - { - "epoch": 0.94, - "learning_rate": 1.6064905241157853e-06, - "loss": 0.5886, - "step": 36730 - }, - { - "epoch": 0.94, - "learning_rate": 1.60646852336265e-06, - "loss": 0.9912, - "step": 36731 - }, - { - "epoch": 0.94, - "learning_rate": 1.60644652214517e-06, - "loss": 0.9395, - "step": 36732 - }, - { - "epoch": 0.94, - "learning_rate": 1.6064245204633617e-06, - "loss": 0.8467, - "step": 36733 - }, - { - "epoch": 0.94, - "learning_rate": 1.606402518317242e-06, - "loss": 0.7959, - "step": 36734 - }, - { - "epoch": 0.94, - "learning_rate": 1.606380515706828e-06, - "loss": 0.9189, - "step": 36735 - }, - { - "epoch": 0.94, - "learning_rate": 1.6063585126321359e-06, - "loss": 0.7979, - "step": 36736 - }, - { - "epoch": 0.94, - "learning_rate": 1.6063365090931833e-06, - "loss": 0.8721, - "step": 36737 - }, - { - "epoch": 0.94, - "learning_rate": 1.6063145050899866e-06, - "loss": 0.6851, - "step": 36738 - }, - { - "epoch": 0.94, - "learning_rate": 1.6062925006225627e-06, - "loss": 0.7402, - "step": 36739 - }, - { - "epoch": 0.94, - "learning_rate": 1.6062704956909286e-06, - "loss": 0.8086, - "step": 36740 - }, - { - "epoch": 0.94, - "learning_rate": 1.606248490295101e-06, - "loss": 0.7065, - "step": 36741 - }, - { - "epoch": 0.94, - "learning_rate": 1.6062264844350968e-06, - "loss": 0.8516, - "step": 36742 - }, - { - "epoch": 0.94, - "learning_rate": 1.606204478110933e-06, - "loss": 0.8457, - "step": 36743 - }, - { - "epoch": 0.94, - "learning_rate": 1.6061824713226262e-06, - "loss": 0.9531, - "step": 36744 - }, - { - "epoch": 0.94, - "learning_rate": 1.6061604640701933e-06, - "loss": 0.8525, - "step": 36745 - }, - { - "epoch": 0.94, - "learning_rate": 1.6061384563536512e-06, - "loss": 0.6855, - "step": 36746 - }, - { - "epoch": 0.94, - "learning_rate": 1.606116448173017e-06, - "loss": 0.5852, - "step": 36747 - }, - { - "epoch": 0.94, - "learning_rate": 1.6060944395283072e-06, - "loss": 0.8467, - "step": 36748 - }, - { - "epoch": 0.94, - "learning_rate": 1.6060724304195383e-06, - "loss": 1.0449, - "step": 36749 - }, - { - "epoch": 0.94, - "learning_rate": 1.6060504208467283e-06, - "loss": 0.8496, - "step": 36750 - }, - { - "epoch": 0.94, - "learning_rate": 1.606028410809893e-06, - "loss": 0.5876, - "step": 36751 - }, - { - "epoch": 0.94, - "learning_rate": 1.6060064003090496e-06, - "loss": 0.9053, - "step": 36752 - }, - { - "epoch": 0.94, - "learning_rate": 1.6059843893442149e-06, - "loss": 0.8291, - "step": 36753 - }, - { - "epoch": 0.94, - "learning_rate": 1.6059623779154058e-06, - "loss": 0.9688, - "step": 36754 - }, - { - "epoch": 0.94, - "learning_rate": 1.6059403660226395e-06, - "loss": 0.8379, - "step": 36755 - }, - { - "epoch": 0.94, - "learning_rate": 1.6059183536659324e-06, - "loss": 0.8281, - "step": 36756 - }, - { - "epoch": 0.94, - "learning_rate": 1.6058963408453012e-06, - "loss": 0.7578, - "step": 36757 - }, - { - "epoch": 0.94, - "learning_rate": 1.6058743275607634e-06, - "loss": 0.8101, - "step": 36758 - }, - { - "epoch": 0.94, - "learning_rate": 1.6058523138123352e-06, - "loss": 0.9409, - "step": 36759 - }, - { - "epoch": 0.94, - "learning_rate": 1.605830299600034e-06, - "loss": 0.8242, - "step": 36760 - }, - { - "epoch": 0.94, - "learning_rate": 1.6058082849238761e-06, - "loss": 0.9248, - "step": 36761 - }, - { - "epoch": 0.94, - "learning_rate": 1.6057862697838788e-06, - "loss": 1.0156, - "step": 36762 - }, - { - "epoch": 0.94, - "learning_rate": 1.605764254180059e-06, - "loss": 0.9922, - "step": 36763 - }, - { - "epoch": 0.94, - "learning_rate": 1.605742238112433e-06, - "loss": 0.6904, - "step": 36764 - }, - { - "epoch": 0.94, - "learning_rate": 1.6057202215810183e-06, - "loss": 0.9961, - "step": 36765 - }, - { - "epoch": 0.94, - "learning_rate": 1.6056982045858315e-06, - "loss": 0.7861, - "step": 36766 - }, - { - "epoch": 0.94, - "learning_rate": 1.6056761871268894e-06, - "loss": 0.8516, - "step": 36767 - }, - { - "epoch": 0.94, - "learning_rate": 1.6056541692042086e-06, - "loss": 0.7261, - "step": 36768 - }, - { - "epoch": 0.94, - "learning_rate": 1.6056321508178066e-06, - "loss": 0.7871, - "step": 36769 - }, - { - "epoch": 0.94, - "learning_rate": 1.6056101319676997e-06, - "loss": 0.8682, - "step": 36770 - }, - { - "epoch": 0.94, - "learning_rate": 1.605588112653905e-06, - "loss": 0.9756, - "step": 36771 - }, - { - "epoch": 0.94, - "learning_rate": 1.6055660928764393e-06, - "loss": 0.9844, - "step": 36772 - }, - { - "epoch": 0.94, - "learning_rate": 1.6055440726353195e-06, - "loss": 0.873, - "step": 36773 - }, - { - "epoch": 0.94, - "learning_rate": 1.6055220519305626e-06, - "loss": 0.835, - "step": 36774 - }, - { - "epoch": 0.94, - "learning_rate": 1.6055000307621853e-06, - "loss": 1.001, - "step": 36775 - }, - { - "epoch": 0.94, - "learning_rate": 1.6054780091302043e-06, - "loss": 0.8506, - "step": 36776 - }, - { - "epoch": 0.94, - "learning_rate": 1.6054559870346367e-06, - "loss": 0.8115, - "step": 36777 - }, - { - "epoch": 0.94, - "learning_rate": 1.6054339644754996e-06, - "loss": 0.7075, - "step": 36778 - }, - { - "epoch": 0.94, - "learning_rate": 1.6054119414528091e-06, - "loss": 0.7642, - "step": 36779 - }, - { - "epoch": 0.94, - "learning_rate": 1.6053899179665824e-06, - "loss": 0.9297, - "step": 36780 - }, - { - "epoch": 0.94, - "learning_rate": 1.6053678940168366e-06, - "loss": 0.9375, - "step": 36781 - }, - { - "epoch": 0.94, - "learning_rate": 1.6053458696035889e-06, - "loss": 0.833, - "step": 36782 - }, - { - "epoch": 0.94, - "learning_rate": 1.6053238447268553e-06, - "loss": 0.8701, - "step": 36783 - }, - { - "epoch": 0.94, - "learning_rate": 1.6053018193866532e-06, - "loss": 0.9707, - "step": 36784 - }, - { - "epoch": 0.94, - "learning_rate": 1.6052797935829992e-06, - "loss": 0.7939, - "step": 36785 - }, - { - "epoch": 0.94, - "learning_rate": 1.6052577673159104e-06, - "loss": 0.8198, - "step": 36786 - }, - { - "epoch": 0.94, - "learning_rate": 1.6052357405854035e-06, - "loss": 0.7764, - "step": 36787 - }, - { - "epoch": 0.94, - "learning_rate": 1.6052137133914956e-06, - "loss": 0.9912, - "step": 36788 - }, - { - "epoch": 0.94, - "learning_rate": 1.6051916857342032e-06, - "loss": 0.75, - "step": 36789 - }, - { - "epoch": 0.94, - "learning_rate": 1.6051696576135435e-06, - "loss": 1.0244, - "step": 36790 - }, - { - "epoch": 0.94, - "learning_rate": 1.6051476290295328e-06, - "loss": 0.7441, - "step": 36791 - }, - { - "epoch": 0.94, - "learning_rate": 1.6051255999821888e-06, - "loss": 0.8013, - "step": 36792 - }, - { - "epoch": 0.94, - "learning_rate": 1.605103570471528e-06, - "loss": 0.7422, - "step": 36793 - }, - { - "epoch": 0.94, - "learning_rate": 1.6050815404975671e-06, - "loss": 1.0225, - "step": 36794 - }, - { - "epoch": 0.94, - "learning_rate": 1.6050595100603231e-06, - "loss": 0.6857, - "step": 36795 - }, - { - "epoch": 0.94, - "learning_rate": 1.6050374791598127e-06, - "loss": 0.792, - "step": 36796 - }, - { - "epoch": 0.94, - "learning_rate": 1.6050154477960531e-06, - "loss": 0.8867, - "step": 36797 - }, - { - "epoch": 0.94, - "learning_rate": 1.6049934159690608e-06, - "loss": 0.7871, - "step": 36798 - }, - { - "epoch": 0.94, - "learning_rate": 1.604971383678853e-06, - "loss": 0.6265, - "step": 36799 - }, - { - "epoch": 0.94, - "learning_rate": 1.6049493509254463e-06, - "loss": 0.8262, - "step": 36800 - }, - { - "epoch": 0.94, - "learning_rate": 1.604927317708858e-06, - "loss": 0.9629, - "step": 36801 - }, - { - "epoch": 0.94, - "learning_rate": 1.6049052840291047e-06, - "loss": 0.9238, - "step": 36802 - }, - { - "epoch": 0.94, - "learning_rate": 1.604883249886203e-06, - "loss": 0.8799, - "step": 36803 - }, - { - "epoch": 0.94, - "learning_rate": 1.6048612152801698e-06, - "loss": 0.8721, - "step": 36804 - }, - { - "epoch": 0.94, - "learning_rate": 1.6048391802110223e-06, - "loss": 0.8535, - "step": 36805 - }, - { - "epoch": 0.94, - "learning_rate": 1.6048171446787775e-06, - "loss": 0.7969, - "step": 36806 - }, - { - "epoch": 0.94, - "learning_rate": 1.604795108683452e-06, - "loss": 0.6964, - "step": 36807 - }, - { - "epoch": 0.94, - "learning_rate": 1.6047730722250626e-06, - "loss": 0.7656, - "step": 36808 - }, - { - "epoch": 0.94, - "learning_rate": 1.604751035303626e-06, - "loss": 0.8096, - "step": 36809 - }, - { - "epoch": 0.94, - "learning_rate": 1.6047289979191598e-06, - "loss": 0.6191, - "step": 36810 - }, - { - "epoch": 0.94, - "learning_rate": 1.60470696007168e-06, - "loss": 0.6587, - "step": 36811 - }, - { - "epoch": 0.94, - "learning_rate": 1.6046849217612043e-06, - "loss": 0.9971, - "step": 36812 - }, - { - "epoch": 0.94, - "learning_rate": 1.604662882987749e-06, - "loss": 1.0283, - "step": 36813 - }, - { - "epoch": 0.94, - "learning_rate": 1.6046408437513308e-06, - "loss": 0.7471, - "step": 36814 - }, - { - "epoch": 0.94, - "learning_rate": 1.6046188040519673e-06, - "loss": 0.9785, - "step": 36815 - }, - { - "epoch": 0.94, - "learning_rate": 1.604596763889675e-06, - "loss": 0.7725, - "step": 36816 - }, - { - "epoch": 0.94, - "learning_rate": 1.6045747232644703e-06, - "loss": 0.8447, - "step": 36817 - }, - { - "epoch": 0.94, - "learning_rate": 1.6045526821763708e-06, - "loss": 0.8359, - "step": 36818 - }, - { - "epoch": 0.94, - "learning_rate": 1.6045306406253933e-06, - "loss": 0.8906, - "step": 36819 - }, - { - "epoch": 0.94, - "learning_rate": 1.6045085986115543e-06, - "loss": 1.0557, - "step": 36820 - }, - { - "epoch": 0.94, - "learning_rate": 1.6044865561348711e-06, - "loss": 0.7002, - "step": 36821 - }, - { - "epoch": 0.94, - "learning_rate": 1.60446451319536e-06, - "loss": 0.9922, - "step": 36822 - }, - { - "epoch": 0.94, - "learning_rate": 1.6044424697930382e-06, - "loss": 0.9639, - "step": 36823 - }, - { - "epoch": 0.94, - "learning_rate": 1.604420425927923e-06, - "loss": 0.5459, - "step": 36824 - }, - { - "epoch": 0.94, - "learning_rate": 1.6043983816000305e-06, - "loss": 0.6255, - "step": 36825 - }, - { - "epoch": 0.94, - "learning_rate": 1.604376336809378e-06, - "loss": 0.96, - "step": 36826 - }, - { - "epoch": 0.94, - "learning_rate": 1.6043542915559826e-06, - "loss": 0.8955, - "step": 36827 - }, - { - "epoch": 0.94, - "learning_rate": 1.6043322458398607e-06, - "loss": 0.7725, - "step": 36828 - }, - { - "epoch": 0.94, - "learning_rate": 1.6043101996610293e-06, - "loss": 0.8262, - "step": 36829 - }, - { - "epoch": 0.94, - "learning_rate": 1.6042881530195056e-06, - "loss": 0.9531, - "step": 36830 - }, - { - "epoch": 0.94, - "learning_rate": 1.6042661059153061e-06, - "loss": 0.7095, - "step": 36831 - }, - { - "epoch": 0.94, - "learning_rate": 1.604244058348448e-06, - "loss": 0.9463, - "step": 36832 - }, - { - "epoch": 0.94, - "learning_rate": 1.604222010318948e-06, - "loss": 1.0156, - "step": 36833 - }, - { - "epoch": 0.94, - "learning_rate": 1.6041999618268225e-06, - "loss": 0.8057, - "step": 36834 - }, - { - "epoch": 0.94, - "learning_rate": 1.6041779128720894e-06, - "loss": 0.7979, - "step": 36835 - }, - { - "epoch": 0.94, - "learning_rate": 1.604155863454765e-06, - "loss": 0.8701, - "step": 36836 - }, - { - "epoch": 0.94, - "learning_rate": 1.6041338135748662e-06, - "loss": 0.834, - "step": 36837 - }, - { - "epoch": 0.94, - "learning_rate": 1.6041117632324096e-06, - "loss": 0.9258, - "step": 36838 - }, - { - "epoch": 0.94, - "learning_rate": 1.6040897124274126e-06, - "loss": 0.9775, - "step": 36839 - }, - { - "epoch": 0.94, - "learning_rate": 1.6040676611598918e-06, - "loss": 0.6758, - "step": 36840 - }, - { - "epoch": 0.94, - "learning_rate": 1.6040456094298645e-06, - "loss": 0.9102, - "step": 36841 - }, - { - "epoch": 0.94, - "learning_rate": 1.6040235572373471e-06, - "loss": 0.8223, - "step": 36842 - }, - { - "epoch": 0.94, - "learning_rate": 1.6040015045823565e-06, - "loss": 0.8047, - "step": 36843 - }, - { - "epoch": 0.94, - "learning_rate": 1.6039794514649096e-06, - "loss": 0.6562, - "step": 36844 - }, - { - "epoch": 0.94, - "learning_rate": 1.6039573978850236e-06, - "loss": 0.9961, - "step": 36845 - }, - { - "epoch": 0.94, - "learning_rate": 1.603935343842715e-06, - "loss": 0.8184, - "step": 36846 - }, - { - "epoch": 0.94, - "learning_rate": 1.6039132893380013e-06, - "loss": 0.752, - "step": 36847 - }, - { - "epoch": 0.94, - "learning_rate": 1.6038912343708985e-06, - "loss": 0.9023, - "step": 36848 - }, - { - "epoch": 0.94, - "learning_rate": 1.6038691789414242e-06, - "loss": 0.9316, - "step": 36849 - }, - { - "epoch": 0.94, - "learning_rate": 1.6038471230495952e-06, - "loss": 1.0342, - "step": 36850 - }, - { - "epoch": 0.94, - "learning_rate": 1.603825066695428e-06, - "loss": 0.9771, - "step": 36851 - }, - { - "epoch": 0.94, - "learning_rate": 1.6038030098789398e-06, - "loss": 0.7437, - "step": 36852 - }, - { - "epoch": 0.94, - "learning_rate": 1.6037809526001473e-06, - "loss": 0.6604, - "step": 36853 - }, - { - "epoch": 0.94, - "learning_rate": 1.6037588948590678e-06, - "loss": 0.7939, - "step": 36854 - }, - { - "epoch": 0.94, - "learning_rate": 1.6037368366557174e-06, - "loss": 0.792, - "step": 36855 - }, - { - "epoch": 0.94, - "learning_rate": 1.6037147779901137e-06, - "loss": 0.8369, - "step": 36856 - }, - { - "epoch": 0.94, - "learning_rate": 1.6036927188622732e-06, - "loss": 0.8408, - "step": 36857 - }, - { - "epoch": 0.94, - "learning_rate": 1.603670659272213e-06, - "loss": 0.8857, - "step": 36858 - }, - { - "epoch": 0.94, - "learning_rate": 1.6036485992199503e-06, - "loss": 0.8906, - "step": 36859 - }, - { - "epoch": 0.94, - "learning_rate": 1.6036265387055013e-06, - "loss": 0.835, - "step": 36860 - }, - { - "epoch": 0.94, - "learning_rate": 1.603604477728883e-06, - "loss": 0.7085, - "step": 36861 - }, - { - "epoch": 0.94, - "learning_rate": 1.6035824162901127e-06, - "loss": 0.73, - "step": 36862 - }, - { - "epoch": 0.94, - "learning_rate": 1.6035603543892071e-06, - "loss": 0.9736, - "step": 36863 - }, - { - "epoch": 0.94, - "learning_rate": 1.6035382920261832e-06, - "loss": 0.5967, - "step": 36864 - }, - { - "epoch": 0.94, - "learning_rate": 1.6035162292010578e-06, - "loss": 0.729, - "step": 36865 - }, - { - "epoch": 0.94, - "learning_rate": 1.6034941659138474e-06, - "loss": 0.647, - "step": 36866 - }, - { - "epoch": 0.94, - "learning_rate": 1.6034721021645698e-06, - "loss": 0.8613, - "step": 36867 - }, - { - "epoch": 0.94, - "learning_rate": 1.6034500379532412e-06, - "loss": 0.8281, - "step": 36868 - }, - { - "epoch": 0.94, - "learning_rate": 1.6034279732798784e-06, - "loss": 0.7393, - "step": 36869 - }, - { - "epoch": 0.94, - "learning_rate": 1.6034059081444988e-06, - "loss": 0.8281, - "step": 36870 - }, - { - "epoch": 0.95, - "learning_rate": 1.603383842547119e-06, - "loss": 0.5913, - "step": 36871 - }, - { - "epoch": 0.95, - "learning_rate": 1.6033617764877559e-06, - "loss": 0.7466, - "step": 36872 - }, - { - "epoch": 0.95, - "learning_rate": 1.6033397099664266e-06, - "loss": 0.8008, - "step": 36873 - }, - { - "epoch": 0.95, - "learning_rate": 1.6033176429831473e-06, - "loss": 0.6978, - "step": 36874 - }, - { - "epoch": 0.95, - "learning_rate": 1.6032955755379361e-06, - "loss": 0.7944, - "step": 36875 - }, - { - "epoch": 0.95, - "learning_rate": 1.6032735076308086e-06, - "loss": 0.8018, - "step": 36876 - }, - { - "epoch": 0.95, - "learning_rate": 1.6032514392617826e-06, - "loss": 0.9102, - "step": 36877 - }, - { - "epoch": 0.95, - "learning_rate": 1.603229370430875e-06, - "loss": 0.9385, - "step": 36878 - }, - { - "epoch": 0.95, - "learning_rate": 1.603207301138102e-06, - "loss": 0.9297, - "step": 36879 - }, - { - "epoch": 0.95, - "learning_rate": 1.603185231383481e-06, - "loss": 0.8027, - "step": 36880 - }, - { - "epoch": 0.95, - "learning_rate": 1.6031631611670288e-06, - "loss": 0.8359, - "step": 36881 - }, - { - "epoch": 0.95, - "learning_rate": 1.6031410904887623e-06, - "loss": 0.855, - "step": 36882 - }, - { - "epoch": 0.95, - "learning_rate": 1.6031190193486985e-06, - "loss": 0.8154, - "step": 36883 - }, - { - "epoch": 0.95, - "learning_rate": 1.6030969477468541e-06, - "loss": 0.644, - "step": 36884 - }, - { - "epoch": 0.95, - "learning_rate": 1.6030748756832462e-06, - "loss": 0.4723, - "step": 36885 - }, - { - "epoch": 0.95, - "learning_rate": 1.6030528031578915e-06, - "loss": 0.7651, - "step": 36886 - }, - { - "epoch": 0.95, - "learning_rate": 1.603030730170807e-06, - "loss": 0.9414, - "step": 36887 - }, - { - "epoch": 0.95, - "learning_rate": 1.6030086567220096e-06, - "loss": 0.8838, - "step": 36888 - }, - { - "epoch": 0.95, - "learning_rate": 1.6029865828115164e-06, - "loss": 0.7988, - "step": 36889 - }, - { - "epoch": 0.95, - "learning_rate": 1.6029645084393437e-06, - "loss": 0.9004, - "step": 36890 - }, - { - "epoch": 0.95, - "learning_rate": 1.602942433605509e-06, - "loss": 0.9619, - "step": 36891 - }, - { - "epoch": 0.95, - "learning_rate": 1.6029203583100292e-06, - "loss": 0.8252, - "step": 36892 - }, - { - "epoch": 0.95, - "learning_rate": 1.6028982825529207e-06, - "loss": 1.0684, - "step": 36893 - }, - { - "epoch": 0.95, - "learning_rate": 1.6028762063342009e-06, - "loss": 0.709, - "step": 36894 - }, - { - "epoch": 0.95, - "learning_rate": 1.6028541296538864e-06, - "loss": 0.7715, - "step": 36895 - }, - { - "epoch": 0.95, - "learning_rate": 1.6028320525119943e-06, - "loss": 0.8818, - "step": 36896 - }, - { - "epoch": 0.95, - "learning_rate": 1.6028099749085416e-06, - "loss": 0.6101, - "step": 36897 - }, - { - "epoch": 0.95, - "learning_rate": 1.6027878968435447e-06, - "loss": 0.9248, - "step": 36898 - }, - { - "epoch": 0.95, - "learning_rate": 1.602765818317021e-06, - "loss": 1.082, - "step": 36899 - }, - { - "epoch": 0.95, - "learning_rate": 1.6027437393289868e-06, - "loss": 1.0117, - "step": 36900 - }, - { - "epoch": 0.95, - "learning_rate": 1.6027216598794597e-06, - "loss": 0.9033, - "step": 36901 - }, - { - "epoch": 0.95, - "learning_rate": 1.6026995799684566e-06, - "loss": 0.8828, - "step": 36902 - }, - { - "epoch": 0.95, - "learning_rate": 1.6026774995959941e-06, - "loss": 0.8711, - "step": 36903 - }, - { - "epoch": 0.95, - "learning_rate": 1.6026554187620889e-06, - "loss": 0.8574, - "step": 36904 - }, - { - "epoch": 0.95, - "learning_rate": 1.6026333374667584e-06, - "loss": 0.9961, - "step": 36905 - }, - { - "epoch": 0.95, - "learning_rate": 1.6026112557100188e-06, - "loss": 0.749, - "step": 36906 - }, - { - "epoch": 0.95, - "learning_rate": 1.6025891734918878e-06, - "loss": 0.7681, - "step": 36907 - }, - { - "epoch": 0.95, - "learning_rate": 1.602567090812382e-06, - "loss": 0.9629, - "step": 36908 - }, - { - "epoch": 0.95, - "learning_rate": 1.6025450076715186e-06, - "loss": 0.6606, - "step": 36909 - }, - { - "epoch": 0.95, - "learning_rate": 1.6025229240693136e-06, - "loss": 1.082, - "step": 36910 - }, - { - "epoch": 0.95, - "learning_rate": 1.6025008400057848e-06, - "loss": 0.7183, - "step": 36911 - }, - { - "epoch": 0.95, - "learning_rate": 1.602478755480949e-06, - "loss": 0.7002, - "step": 36912 - }, - { - "epoch": 0.95, - "learning_rate": 1.6024566704948225e-06, - "loss": 0.7344, - "step": 36913 - }, - { - "epoch": 0.95, - "learning_rate": 1.602434585047423e-06, - "loss": 0.7388, - "step": 36914 - }, - { - "epoch": 0.95, - "learning_rate": 1.6024124991387669e-06, - "loss": 0.8162, - "step": 36915 - }, - { - "epoch": 0.95, - "learning_rate": 1.602390412768871e-06, - "loss": 0.6685, - "step": 36916 - }, - { - "epoch": 0.95, - "learning_rate": 1.602368325937753e-06, - "loss": 0.873, - "step": 36917 - }, - { - "epoch": 0.95, - "learning_rate": 1.6023462386454286e-06, - "loss": 1.0195, - "step": 36918 - }, - { - "epoch": 0.95, - "learning_rate": 1.6023241508919158e-06, - "loss": 0.8916, - "step": 36919 - }, - { - "epoch": 0.95, - "learning_rate": 1.602302062677231e-06, - "loss": 0.7959, - "step": 36920 - }, - { - "epoch": 0.95, - "learning_rate": 1.6022799740013913e-06, - "loss": 0.5293, - "step": 36921 - }, - { - "epoch": 0.95, - "learning_rate": 1.6022578848644134e-06, - "loss": 0.832, - "step": 36922 - }, - { - "epoch": 0.95, - "learning_rate": 1.6022357952663144e-06, - "loss": 0.6704, - "step": 36923 - }, - { - "epoch": 0.95, - "learning_rate": 1.6022137052071111e-06, - "loss": 0.9746, - "step": 36924 - }, - { - "epoch": 0.95, - "learning_rate": 1.6021916146868204e-06, - "loss": 0.958, - "step": 36925 - }, - { - "epoch": 0.95, - "learning_rate": 1.6021695237054594e-06, - "loss": 0.709, - "step": 36926 - }, - { - "epoch": 0.95, - "learning_rate": 1.6021474322630448e-06, - "loss": 0.8838, - "step": 36927 - }, - { - "epoch": 0.95, - "learning_rate": 1.6021253403595938e-06, - "loss": 0.7129, - "step": 36928 - }, - { - "epoch": 0.95, - "learning_rate": 1.6021032479951226e-06, - "loss": 0.9561, - "step": 36929 - }, - { - "epoch": 0.95, - "learning_rate": 1.602081155169649e-06, - "loss": 0.8027, - "step": 36930 - }, - { - "epoch": 0.95, - "learning_rate": 1.6020590618831897e-06, - "loss": 0.7109, - "step": 36931 - }, - { - "epoch": 0.95, - "learning_rate": 1.6020369681357613e-06, - "loss": 0.8711, - "step": 36932 - }, - { - "epoch": 0.95, - "learning_rate": 1.6020148739273807e-06, - "loss": 0.4648, - "step": 36933 - }, - { - "epoch": 0.95, - "learning_rate": 1.6019927792580651e-06, - "loss": 0.5925, - "step": 36934 - }, - { - "epoch": 0.95, - "learning_rate": 1.6019706841278313e-06, - "loss": 0.8691, - "step": 36935 - }, - { - "epoch": 0.95, - "learning_rate": 1.6019485885366963e-06, - "loss": 0.8359, - "step": 36936 - }, - { - "epoch": 0.95, - "learning_rate": 1.6019264924846772e-06, - "loss": 0.915, - "step": 36937 - }, - { - "epoch": 0.95, - "learning_rate": 1.6019043959717901e-06, - "loss": 0.5112, - "step": 36938 - }, - { - "epoch": 0.95, - "learning_rate": 1.601882298998053e-06, - "loss": 0.6816, - "step": 36939 - }, - { - "epoch": 0.95, - "learning_rate": 1.601860201563482e-06, - "loss": 0.7905, - "step": 36940 - }, - { - "epoch": 0.95, - "learning_rate": 1.6018381036680944e-06, - "loss": 0.8301, - "step": 36941 - }, - { - "epoch": 0.95, - "learning_rate": 1.6018160053119072e-06, - "loss": 0.7598, - "step": 36942 - }, - { - "epoch": 0.95, - "learning_rate": 1.6017939064949366e-06, - "loss": 0.7134, - "step": 36943 - }, - { - "epoch": 0.95, - "learning_rate": 1.6017718072172006e-06, - "loss": 0.8945, - "step": 36944 - }, - { - "epoch": 0.95, - "learning_rate": 1.6017497074787153e-06, - "loss": 0.9561, - "step": 36945 - }, - { - "epoch": 0.95, - "learning_rate": 1.6017276072794981e-06, - "loss": 1.001, - "step": 36946 - }, - { - "epoch": 0.95, - "learning_rate": 1.6017055066195658e-06, - "loss": 0.6128, - "step": 36947 - }, - { - "epoch": 0.95, - "learning_rate": 1.6016834054989351e-06, - "loss": 0.8828, - "step": 36948 - }, - { - "epoch": 0.95, - "learning_rate": 1.6016613039176232e-06, - "loss": 0.9219, - "step": 36949 - }, - { - "epoch": 0.95, - "learning_rate": 1.6016392018756468e-06, - "loss": 0.9316, - "step": 36950 - }, - { - "epoch": 0.95, - "learning_rate": 1.601617099373023e-06, - "loss": 0.8945, - "step": 36951 - }, - { - "epoch": 0.95, - "learning_rate": 1.6015949964097688e-06, - "loss": 0.8838, - "step": 36952 - }, - { - "epoch": 0.95, - "learning_rate": 1.6015728929859008e-06, - "loss": 0.6816, - "step": 36953 - }, - { - "epoch": 0.95, - "learning_rate": 1.601550789101436e-06, - "loss": 0.9443, - "step": 36954 - }, - { - "epoch": 0.95, - "learning_rate": 1.6015286847563914e-06, - "loss": 0.5864, - "step": 36955 - }, - { - "epoch": 0.95, - "learning_rate": 1.6015065799507842e-06, - "loss": 0.7354, - "step": 36956 - }, - { - "epoch": 0.95, - "learning_rate": 1.6014844746846307e-06, - "loss": 0.5762, - "step": 36957 - }, - { - "epoch": 0.95, - "learning_rate": 1.6014623689579486e-06, - "loss": 1.0107, - "step": 36958 - }, - { - "epoch": 0.95, - "learning_rate": 1.6014402627707542e-06, - "loss": 1.0137, - "step": 36959 - }, - { - "epoch": 0.95, - "learning_rate": 1.6014181561230648e-06, - "loss": 0.8457, - "step": 36960 - }, - { - "epoch": 0.95, - "learning_rate": 1.6013960490148968e-06, - "loss": 0.874, - "step": 36961 - }, - { - "epoch": 0.95, - "learning_rate": 1.601373941446268e-06, - "loss": 0.6431, - "step": 36962 - }, - { - "epoch": 0.95, - "learning_rate": 1.6013518334171945e-06, - "loss": 0.8721, - "step": 36963 - }, - { - "epoch": 0.95, - "learning_rate": 1.6013297249276936e-06, - "loss": 1.04, - "step": 36964 - }, - { - "epoch": 0.95, - "learning_rate": 1.6013076159777822e-06, - "loss": 0.8447, - "step": 36965 - }, - { - "epoch": 0.95, - "learning_rate": 1.6012855065674773e-06, - "loss": 0.8105, - "step": 36966 - }, - { - "epoch": 0.95, - "learning_rate": 1.6012633966967956e-06, - "loss": 0.8721, - "step": 36967 - }, - { - "epoch": 0.95, - "learning_rate": 1.6012412863657544e-06, - "loss": 0.7739, - "step": 36968 - }, - { - "epoch": 0.95, - "learning_rate": 1.60121917557437e-06, - "loss": 0.8516, - "step": 36969 - }, - { - "epoch": 0.95, - "learning_rate": 1.60119706432266e-06, - "loss": 0.7993, - "step": 36970 - }, - { - "epoch": 0.95, - "learning_rate": 1.601174952610641e-06, - "loss": 0.7471, - "step": 36971 - }, - { - "epoch": 0.95, - "learning_rate": 1.60115284043833e-06, - "loss": 0.7302, - "step": 36972 - }, - { - "epoch": 0.95, - "learning_rate": 1.6011307278057439e-06, - "loss": 0.8721, - "step": 36973 - }, - { - "epoch": 0.95, - "learning_rate": 1.6011086147128997e-06, - "loss": 0.7686, - "step": 36974 - }, - { - "epoch": 0.95, - "learning_rate": 1.601086501159814e-06, - "loss": 0.873, - "step": 36975 - }, - { - "epoch": 0.95, - "learning_rate": 1.6010643871465044e-06, - "loss": 0.8516, - "step": 36976 - }, - { - "epoch": 0.95, - "learning_rate": 1.6010422726729874e-06, - "loss": 0.9727, - "step": 36977 - }, - { - "epoch": 0.95, - "learning_rate": 1.6010201577392797e-06, - "loss": 0.7666, - "step": 36978 - }, - { - "epoch": 0.95, - "learning_rate": 1.6009980423453985e-06, - "loss": 0.8423, - "step": 36979 - }, - { - "epoch": 0.95, - "learning_rate": 1.600975926491361e-06, - "loss": 0.8867, - "step": 36980 - }, - { - "epoch": 0.95, - "learning_rate": 1.6009538101771836e-06, - "loss": 0.9297, - "step": 36981 - }, - { - "epoch": 0.95, - "learning_rate": 1.6009316934028837e-06, - "loss": 0.9395, - "step": 36982 - }, - { - "epoch": 0.95, - "learning_rate": 1.6009095761684778e-06, - "loss": 0.8469, - "step": 36983 - }, - { - "epoch": 0.95, - "learning_rate": 1.6008874584739834e-06, - "loss": 0.771, - "step": 36984 - }, - { - "epoch": 0.95, - "learning_rate": 1.6008653403194168e-06, - "loss": 0.9502, - "step": 36985 - }, - { - "epoch": 0.95, - "learning_rate": 1.6008432217047953e-06, - "loss": 0.8203, - "step": 36986 - }, - { - "epoch": 0.95, - "learning_rate": 1.600821102630136e-06, - "loss": 1.0371, - "step": 36987 - }, - { - "epoch": 0.95, - "learning_rate": 1.6007989830954553e-06, - "loss": 0.8936, - "step": 36988 - }, - { - "epoch": 0.95, - "learning_rate": 1.6007768631007705e-06, - "loss": 0.9678, - "step": 36989 - }, - { - "epoch": 0.95, - "learning_rate": 1.6007547426460987e-06, - "loss": 0.7598, - "step": 36990 - }, - { - "epoch": 0.95, - "learning_rate": 1.6007326217314562e-06, - "loss": 0.7393, - "step": 36991 - }, - { - "epoch": 0.95, - "learning_rate": 1.600710500356861e-06, - "loss": 0.8271, - "step": 36992 - }, - { - "epoch": 0.95, - "learning_rate": 1.6006883785223288e-06, - "loss": 0.9668, - "step": 36993 - }, - { - "epoch": 0.95, - "learning_rate": 1.6006662562278775e-06, - "loss": 0.6816, - "step": 36994 - }, - { - "epoch": 0.95, - "learning_rate": 1.6006441334735235e-06, - "loss": 0.8276, - "step": 36995 - }, - { - "epoch": 0.95, - "learning_rate": 1.600622010259284e-06, - "loss": 1.0215, - "step": 36996 - }, - { - "epoch": 0.95, - "learning_rate": 1.6005998865851757e-06, - "loss": 0.7607, - "step": 36997 - }, - { - "epoch": 0.95, - "learning_rate": 1.6005777624512157e-06, - "loss": 0.6421, - "step": 36998 - }, - { - "epoch": 0.95, - "learning_rate": 1.600555637857421e-06, - "loss": 0.7539, - "step": 36999 - }, - { - "epoch": 0.95, - "learning_rate": 1.6005335128038082e-06, - "loss": 0.8047, - "step": 37000 - }, - { - "epoch": 0.95, - "learning_rate": 1.6005113872903947e-06, - "loss": 0.7422, - "step": 37001 - }, - { - "epoch": 0.95, - "learning_rate": 1.6004892613171976e-06, - "loss": 0.7754, - "step": 37002 - }, - { - "epoch": 0.95, - "learning_rate": 1.6004671348842331e-06, - "loss": 0.8169, - "step": 37003 - }, - { - "epoch": 0.95, - "learning_rate": 1.6004450079915186e-06, - "loss": 0.7969, - "step": 37004 - }, - { - "epoch": 0.95, - "learning_rate": 1.6004228806390708e-06, - "loss": 0.7515, - "step": 37005 - }, - { - "epoch": 0.95, - "learning_rate": 1.600400752826907e-06, - "loss": 0.9072, - "step": 37006 - }, - { - "epoch": 0.95, - "learning_rate": 1.600378624555044e-06, - "loss": 0.8022, - "step": 37007 - }, - { - "epoch": 0.95, - "learning_rate": 1.6003564958234988e-06, - "loss": 0.7007, - "step": 37008 - }, - { - "epoch": 0.95, - "learning_rate": 1.600334366632288e-06, - "loss": 0.877, - "step": 37009 - }, - { - "epoch": 0.95, - "learning_rate": 1.6003122369814288e-06, - "loss": 0.9131, - "step": 37010 - }, - { - "epoch": 0.95, - "learning_rate": 1.600290106870938e-06, - "loss": 0.7988, - "step": 37011 - }, - { - "epoch": 0.95, - "learning_rate": 1.6002679763008331e-06, - "loss": 0.8706, - "step": 37012 - }, - { - "epoch": 0.95, - "learning_rate": 1.60024584527113e-06, - "loss": 0.9385, - "step": 37013 - }, - { - "epoch": 0.95, - "learning_rate": 1.6002237137818467e-06, - "loss": 0.959, - "step": 37014 - }, - { - "epoch": 0.95, - "learning_rate": 1.6002015818329998e-06, - "loss": 0.9014, - "step": 37015 - }, - { - "epoch": 0.95, - "learning_rate": 1.6001794494246058e-06, - "loss": 1.0156, - "step": 37016 - }, - { - "epoch": 0.95, - "learning_rate": 1.600157316556682e-06, - "loss": 0.9766, - "step": 37017 - }, - { - "epoch": 0.95, - "learning_rate": 1.6001351832292456e-06, - "loss": 0.7002, - "step": 37018 - }, - { - "epoch": 0.95, - "learning_rate": 1.6001130494423131e-06, - "loss": 0.8052, - "step": 37019 - }, - { - "epoch": 0.95, - "learning_rate": 1.6000909151959015e-06, - "loss": 0.9062, - "step": 37020 - }, - { - "epoch": 0.95, - "learning_rate": 1.6000687804900284e-06, - "loss": 0.6924, - "step": 37021 - }, - { - "epoch": 0.95, - "learning_rate": 1.60004664532471e-06, - "loss": 0.7876, - "step": 37022 - }, - { - "epoch": 0.95, - "learning_rate": 1.600024509699963e-06, - "loss": 0.6509, - "step": 37023 - }, - { - "epoch": 0.95, - "learning_rate": 1.6000023736158052e-06, - "loss": 1.0332, - "step": 37024 - }, - { - "epoch": 0.95, - "learning_rate": 1.5999802370722533e-06, - "loss": 0.9082, - "step": 37025 - }, - { - "epoch": 0.95, - "learning_rate": 1.599958100069324e-06, - "loss": 0.8169, - "step": 37026 - }, - { - "epoch": 0.95, - "learning_rate": 1.5999359626070343e-06, - "loss": 0.874, - "step": 37027 - }, - { - "epoch": 0.95, - "learning_rate": 1.5999138246854012e-06, - "loss": 0.8486, - "step": 37028 - }, - { - "epoch": 0.95, - "learning_rate": 1.5998916863044417e-06, - "loss": 0.6304, - "step": 37029 - }, - { - "epoch": 0.95, - "learning_rate": 1.5998695474641729e-06, - "loss": 0.7261, - "step": 37030 - }, - { - "epoch": 0.95, - "learning_rate": 1.5998474081646115e-06, - "loss": 0.8047, - "step": 37031 - }, - { - "epoch": 0.95, - "learning_rate": 1.5998252684057744e-06, - "loss": 1.1895, - "step": 37032 - }, - { - "epoch": 0.95, - "learning_rate": 1.5998031281876786e-06, - "loss": 0.6655, - "step": 37033 - }, - { - "epoch": 0.95, - "learning_rate": 1.5997809875103412e-06, - "loss": 1.0215, - "step": 37034 - }, - { - "epoch": 0.95, - "learning_rate": 1.599758846373779e-06, - "loss": 0.8398, - "step": 37035 - }, - { - "epoch": 0.95, - "learning_rate": 1.5997367047780094e-06, - "loss": 0.8027, - "step": 37036 - }, - { - "epoch": 0.95, - "learning_rate": 1.5997145627230487e-06, - "loss": 0.689, - "step": 37037 - }, - { - "epoch": 0.95, - "learning_rate": 1.599692420208914e-06, - "loss": 0.6787, - "step": 37038 - }, - { - "epoch": 0.95, - "learning_rate": 1.5996702772356225e-06, - "loss": 0.7278, - "step": 37039 - }, - { - "epoch": 0.95, - "learning_rate": 1.5996481338031913e-06, - "loss": 0.9404, - "step": 37040 - }, - { - "epoch": 0.95, - "learning_rate": 1.5996259899116366e-06, - "loss": 0.8789, - "step": 37041 - }, - { - "epoch": 0.95, - "learning_rate": 1.5996038455609763e-06, - "loss": 0.7661, - "step": 37042 - }, - { - "epoch": 0.95, - "learning_rate": 1.599581700751227e-06, - "loss": 1.2041, - "step": 37043 - }, - { - "epoch": 0.95, - "learning_rate": 1.599559555482405e-06, - "loss": 0.6016, - "step": 37044 - }, - { - "epoch": 0.95, - "learning_rate": 1.5995374097545282e-06, - "loss": 0.873, - "step": 37045 - }, - { - "epoch": 0.95, - "learning_rate": 1.599515263567613e-06, - "loss": 0.6299, - "step": 37046 - }, - { - "epoch": 0.95, - "learning_rate": 1.5994931169216768e-06, - "loss": 0.8477, - "step": 37047 - }, - { - "epoch": 0.95, - "learning_rate": 1.5994709698167362e-06, - "loss": 0.8955, - "step": 37048 - }, - { - "epoch": 0.95, - "learning_rate": 1.599448822252808e-06, - "loss": 0.7988, - "step": 37049 - }, - { - "epoch": 0.95, - "learning_rate": 1.5994266742299094e-06, - "loss": 0.769, - "step": 37050 - }, - { - "epoch": 0.95, - "learning_rate": 1.5994045257480577e-06, - "loss": 0.8877, - "step": 37051 - }, - { - "epoch": 0.95, - "learning_rate": 1.5993823768072693e-06, - "loss": 1.0166, - "step": 37052 - }, - { - "epoch": 0.95, - "learning_rate": 1.5993602274075615e-06, - "loss": 0.8066, - "step": 37053 - }, - { - "epoch": 0.95, - "learning_rate": 1.599338077548951e-06, - "loss": 1.042, - "step": 37054 - }, - { - "epoch": 0.95, - "learning_rate": 1.5993159272314549e-06, - "loss": 0.9238, - "step": 37055 - }, - { - "epoch": 0.95, - "learning_rate": 1.5992937764550902e-06, - "loss": 0.834, - "step": 37056 - }, - { - "epoch": 0.95, - "learning_rate": 1.5992716252198738e-06, - "loss": 0.6201, - "step": 37057 - }, - { - "epoch": 0.95, - "learning_rate": 1.5992494735258229e-06, - "loss": 1.1162, - "step": 37058 - }, - { - "epoch": 0.95, - "learning_rate": 1.5992273213729539e-06, - "loss": 1.1816, - "step": 37059 - }, - { - "epoch": 0.95, - "learning_rate": 1.599205168761284e-06, - "loss": 0.7622, - "step": 37060 - }, - { - "epoch": 0.95, - "learning_rate": 1.5991830156908303e-06, - "loss": 0.7979, - "step": 37061 - }, - { - "epoch": 0.95, - "learning_rate": 1.5991608621616098e-06, - "loss": 1.042, - "step": 37062 - }, - { - "epoch": 0.95, - "learning_rate": 1.5991387081736395e-06, - "loss": 1.0508, - "step": 37063 - }, - { - "epoch": 0.95, - "learning_rate": 1.5991165537269363e-06, - "loss": 0.75, - "step": 37064 - }, - { - "epoch": 0.95, - "learning_rate": 1.599094398821517e-06, - "loss": 0.8047, - "step": 37065 - }, - { - "epoch": 0.95, - "learning_rate": 1.5990722434573987e-06, - "loss": 0.9678, - "step": 37066 - }, - { - "epoch": 0.95, - "learning_rate": 1.5990500876345983e-06, - "loss": 0.8599, - "step": 37067 - }, - { - "epoch": 0.95, - "learning_rate": 1.5990279313531328e-06, - "loss": 0.8462, - "step": 37068 - }, - { - "epoch": 0.95, - "learning_rate": 1.599005774613019e-06, - "loss": 0.8213, - "step": 37069 - }, - { - "epoch": 0.95, - "learning_rate": 1.5989836174142743e-06, - "loss": 0.8555, - "step": 37070 - }, - { - "epoch": 0.95, - "learning_rate": 1.5989614597569151e-06, - "loss": 0.8359, - "step": 37071 - }, - { - "epoch": 0.95, - "learning_rate": 1.598939301640959e-06, - "loss": 0.7104, - "step": 37072 - }, - { - "epoch": 0.95, - "learning_rate": 1.5989171430664223e-06, - "loss": 1.0137, - "step": 37073 - }, - { - "epoch": 0.95, - "learning_rate": 1.5988949840333223e-06, - "loss": 0.9834, - "step": 37074 - }, - { - "epoch": 0.95, - "learning_rate": 1.598872824541676e-06, - "loss": 0.7461, - "step": 37075 - }, - { - "epoch": 0.95, - "learning_rate": 1.5988506645915005e-06, - "loss": 0.7051, - "step": 37076 - }, - { - "epoch": 0.95, - "learning_rate": 1.5988285041828125e-06, - "loss": 0.9482, - "step": 37077 - }, - { - "epoch": 0.95, - "learning_rate": 1.598806343315629e-06, - "loss": 0.832, - "step": 37078 - }, - { - "epoch": 0.95, - "learning_rate": 1.5987841819899667e-06, - "loss": 0.5952, - "step": 37079 - }, - { - "epoch": 0.95, - "learning_rate": 1.5987620202058433e-06, - "loss": 0.8564, - "step": 37080 - }, - { - "epoch": 0.95, - "learning_rate": 1.5987398579632752e-06, - "loss": 0.7583, - "step": 37081 - }, - { - "epoch": 0.95, - "learning_rate": 1.5987176952622797e-06, - "loss": 0.9424, - "step": 37082 - }, - { - "epoch": 0.95, - "learning_rate": 1.5986955321028733e-06, - "loss": 0.7251, - "step": 37083 - }, - { - "epoch": 0.95, - "learning_rate": 1.5986733684850735e-06, - "loss": 0.6357, - "step": 37084 - }, - { - "epoch": 0.95, - "learning_rate": 1.598651204408897e-06, - "loss": 0.9199, - "step": 37085 - }, - { - "epoch": 0.95, - "learning_rate": 1.5986290398743608e-06, - "loss": 0.9297, - "step": 37086 - }, - { - "epoch": 0.95, - "learning_rate": 1.5986068748814815e-06, - "loss": 0.9219, - "step": 37087 - }, - { - "epoch": 0.95, - "learning_rate": 1.5985847094302768e-06, - "loss": 0.7383, - "step": 37088 - }, - { - "epoch": 0.95, - "learning_rate": 1.5985625435207633e-06, - "loss": 0.9443, - "step": 37089 - }, - { - "epoch": 0.95, - "learning_rate": 1.598540377152958e-06, - "loss": 0.6147, - "step": 37090 - }, - { - "epoch": 0.95, - "learning_rate": 1.5985182103268779e-06, - "loss": 0.9521, - "step": 37091 - }, - { - "epoch": 0.95, - "learning_rate": 1.5984960430425399e-06, - "loss": 0.8701, - "step": 37092 - }, - { - "epoch": 0.95, - "learning_rate": 1.5984738752999606e-06, - "loss": 0.833, - "step": 37093 - }, - { - "epoch": 0.95, - "learning_rate": 1.5984517070991576e-06, - "loss": 0.8535, - "step": 37094 - }, - { - "epoch": 0.95, - "learning_rate": 1.5984295384401478e-06, - "loss": 0.918, - "step": 37095 - }, - { - "epoch": 0.95, - "learning_rate": 1.5984073693229482e-06, - "loss": 0.6934, - "step": 37096 - }, - { - "epoch": 0.95, - "learning_rate": 1.5983851997475752e-06, - "loss": 0.7241, - "step": 37097 - }, - { - "epoch": 0.95, - "learning_rate": 1.5983630297140465e-06, - "loss": 0.9395, - "step": 37098 - }, - { - "epoch": 0.95, - "learning_rate": 1.5983408592223784e-06, - "loss": 0.7456, - "step": 37099 - }, - { - "epoch": 0.95, - "learning_rate": 1.5983186882725886e-06, - "loss": 0.835, - "step": 37100 - }, - { - "epoch": 0.95, - "learning_rate": 1.5982965168646937e-06, - "loss": 0.8369, - "step": 37101 - }, - { - "epoch": 0.95, - "learning_rate": 1.5982743449987102e-06, - "loss": 0.7739, - "step": 37102 - }, - { - "epoch": 0.95, - "learning_rate": 1.5982521726746558e-06, - "loss": 0.9814, - "step": 37103 - }, - { - "epoch": 0.95, - "learning_rate": 1.598229999892547e-06, - "loss": 0.9023, - "step": 37104 - }, - { - "epoch": 0.95, - "learning_rate": 1.5982078266524013e-06, - "loss": 0.873, - "step": 37105 - }, - { - "epoch": 0.95, - "learning_rate": 1.5981856529542352e-06, - "loss": 0.8838, - "step": 37106 - }, - { - "epoch": 0.95, - "learning_rate": 1.598163478798066e-06, - "loss": 0.7344, - "step": 37107 - }, - { - "epoch": 0.95, - "learning_rate": 1.5981413041839104e-06, - "loss": 0.7852, - "step": 37108 - }, - { - "epoch": 0.95, - "learning_rate": 1.5981191291117855e-06, - "loss": 0.8066, - "step": 37109 - }, - { - "epoch": 0.95, - "learning_rate": 1.5980969535817082e-06, - "loss": 0.8682, - "step": 37110 - }, - { - "epoch": 0.95, - "learning_rate": 1.598074777593696e-06, - "loss": 0.9473, - "step": 37111 - }, - { - "epoch": 0.95, - "learning_rate": 1.598052601147765e-06, - "loss": 0.8481, - "step": 37112 - }, - { - "epoch": 0.95, - "learning_rate": 1.5980304242439328e-06, - "loss": 0.75, - "step": 37113 - }, - { - "epoch": 0.95, - "learning_rate": 1.598008246882216e-06, - "loss": 0.8418, - "step": 37114 - }, - { - "epoch": 0.95, - "learning_rate": 1.5979860690626321e-06, - "loss": 0.9307, - "step": 37115 - }, - { - "epoch": 0.95, - "learning_rate": 1.5979638907851977e-06, - "loss": 0.9287, - "step": 37116 - }, - { - "epoch": 0.95, - "learning_rate": 1.5979417120499297e-06, - "loss": 0.916, - "step": 37117 - }, - { - "epoch": 0.95, - "learning_rate": 1.5979195328568453e-06, - "loss": 0.8252, - "step": 37118 - }, - { - "epoch": 0.95, - "learning_rate": 1.5978973532059614e-06, - "loss": 1.0967, - "step": 37119 - }, - { - "epoch": 0.95, - "learning_rate": 1.5978751730972949e-06, - "loss": 0.8525, - "step": 37120 - }, - { - "epoch": 0.95, - "learning_rate": 1.5978529925308632e-06, - "loss": 0.7773, - "step": 37121 - }, - { - "epoch": 0.95, - "learning_rate": 1.5978308115066827e-06, - "loss": 0.9463, - "step": 37122 - }, - { - "epoch": 0.95, - "learning_rate": 1.5978086300247706e-06, - "loss": 0.9834, - "step": 37123 - }, - { - "epoch": 0.95, - "learning_rate": 1.5977864480851437e-06, - "loss": 0.6812, - "step": 37124 - }, - { - "epoch": 0.95, - "learning_rate": 1.5977642656878196e-06, - "loss": 0.7002, - "step": 37125 - }, - { - "epoch": 0.95, - "learning_rate": 1.5977420828328148e-06, - "loss": 0.9062, - "step": 37126 - }, - { - "epoch": 0.95, - "learning_rate": 1.5977198995201465e-06, - "loss": 0.9482, - "step": 37127 - }, - { - "epoch": 0.95, - "learning_rate": 1.5976977157498313e-06, - "loss": 0.718, - "step": 37128 - }, - { - "epoch": 0.95, - "learning_rate": 1.5976755315218865e-06, - "loss": 1.0684, - "step": 37129 - }, - { - "epoch": 0.95, - "learning_rate": 1.597653346836329e-06, - "loss": 0.8184, - "step": 37130 - }, - { - "epoch": 0.95, - "learning_rate": 1.597631161693176e-06, - "loss": 0.7246, - "step": 37131 - }, - { - "epoch": 0.95, - "learning_rate": 1.597608976092444e-06, - "loss": 0.7656, - "step": 37132 - }, - { - "epoch": 0.95, - "learning_rate": 1.5975867900341504e-06, - "loss": 0.8105, - "step": 37133 - }, - { - "epoch": 0.95, - "learning_rate": 1.5975646035183122e-06, - "loss": 0.8145, - "step": 37134 - }, - { - "epoch": 0.95, - "learning_rate": 1.5975424165449461e-06, - "loss": 0.5356, - "step": 37135 - }, - { - "epoch": 0.95, - "learning_rate": 1.5975202291140695e-06, - "loss": 0.6787, - "step": 37136 - }, - { - "epoch": 0.95, - "learning_rate": 1.5974980412256989e-06, - "loss": 0.6382, - "step": 37137 - }, - { - "epoch": 0.95, - "learning_rate": 1.5974758528798515e-06, - "loss": 0.7588, - "step": 37138 - }, - { - "epoch": 0.95, - "learning_rate": 1.5974536640765445e-06, - "loss": 0.9482, - "step": 37139 - }, - { - "epoch": 0.95, - "learning_rate": 1.5974314748157944e-06, - "loss": 0.7539, - "step": 37140 - }, - { - "epoch": 0.95, - "learning_rate": 1.5974092850976191e-06, - "loss": 0.8418, - "step": 37141 - }, - { - "epoch": 0.95, - "learning_rate": 1.5973870949220345e-06, - "loss": 1.082, - "step": 37142 - }, - { - "epoch": 0.95, - "learning_rate": 1.597364904289058e-06, - "loss": 0.8203, - "step": 37143 - }, - { - "epoch": 0.95, - "learning_rate": 1.5973427131987067e-06, - "loss": 0.8438, - "step": 37144 - }, - { - "epoch": 0.95, - "learning_rate": 1.5973205216509977e-06, - "loss": 1.0293, - "step": 37145 - }, - { - "epoch": 0.95, - "learning_rate": 1.5972983296459479e-06, - "loss": 0.5304, - "step": 37146 - }, - { - "epoch": 0.95, - "learning_rate": 1.5972761371835742e-06, - "loss": 0.9385, - "step": 37147 - }, - { - "epoch": 0.95, - "learning_rate": 1.5972539442638935e-06, - "loss": 0.9756, - "step": 37148 - }, - { - "epoch": 0.95, - "learning_rate": 1.5972317508869228e-06, - "loss": 0.8184, - "step": 37149 - }, - { - "epoch": 0.95, - "learning_rate": 1.5972095570526793e-06, - "loss": 0.6255, - "step": 37150 - }, - { - "epoch": 0.95, - "learning_rate": 1.59718736276118e-06, - "loss": 0.9795, - "step": 37151 - }, - { - "epoch": 0.95, - "learning_rate": 1.597165168012442e-06, - "loss": 0.5879, - "step": 37152 - }, - { - "epoch": 0.95, - "learning_rate": 1.5971429728064818e-06, - "loss": 0.8945, - "step": 37153 - }, - { - "epoch": 0.95, - "learning_rate": 1.5971207771433167e-06, - "loss": 0.9209, - "step": 37154 - }, - { - "epoch": 0.95, - "learning_rate": 1.5970985810229639e-06, - "loss": 0.8955, - "step": 37155 - }, - { - "epoch": 0.95, - "learning_rate": 1.5970763844454398e-06, - "loss": 0.9131, - "step": 37156 - }, - { - "epoch": 0.95, - "learning_rate": 1.597054187410762e-06, - "loss": 0.9009, - "step": 37157 - }, - { - "epoch": 0.95, - "learning_rate": 1.5970319899189473e-06, - "loss": 0.7939, - "step": 37158 - }, - { - "epoch": 0.95, - "learning_rate": 1.5970097919700126e-06, - "loss": 0.7383, - "step": 37159 - }, - { - "epoch": 0.95, - "learning_rate": 1.5969875935639748e-06, - "loss": 0.8682, - "step": 37160 - }, - { - "epoch": 0.95, - "learning_rate": 1.5969653947008515e-06, - "loss": 0.7432, - "step": 37161 - }, - { - "epoch": 0.95, - "learning_rate": 1.5969431953806587e-06, - "loss": 0.9229, - "step": 37162 - }, - { - "epoch": 0.95, - "learning_rate": 1.5969209956034141e-06, - "loss": 0.8525, - "step": 37163 - }, - { - "epoch": 0.95, - "learning_rate": 1.596898795369135e-06, - "loss": 1.0098, - "step": 37164 - }, - { - "epoch": 0.95, - "learning_rate": 1.5968765946778374e-06, - "loss": 1.001, - "step": 37165 - }, - { - "epoch": 0.95, - "learning_rate": 1.5968543935295391e-06, - "loss": 0.9043, - "step": 37166 - }, - { - "epoch": 0.95, - "learning_rate": 1.5968321919242564e-06, - "loss": 0.8594, - "step": 37167 - }, - { - "epoch": 0.95, - "learning_rate": 1.5968099898620072e-06, - "loss": 0.8125, - "step": 37168 - }, - { - "epoch": 0.95, - "learning_rate": 1.596787787342808e-06, - "loss": 0.5669, - "step": 37169 - }, - { - "epoch": 0.95, - "learning_rate": 1.5967655843666757e-06, - "loss": 1.0059, - "step": 37170 - }, - { - "epoch": 0.95, - "learning_rate": 1.5967433809336276e-06, - "loss": 0.9248, - "step": 37171 - }, - { - "epoch": 0.95, - "learning_rate": 1.5967211770436802e-06, - "loss": 0.647, - "step": 37172 - }, - { - "epoch": 0.95, - "learning_rate": 1.596698972696851e-06, - "loss": 1.083, - "step": 37173 - }, - { - "epoch": 0.95, - "learning_rate": 1.596676767893157e-06, - "loss": 0.833, - "step": 37174 - }, - { - "epoch": 0.95, - "learning_rate": 1.5966545626326146e-06, - "loss": 0.876, - "step": 37175 - }, - { - "epoch": 0.95, - "learning_rate": 1.5966323569152417e-06, - "loss": 0.8779, - "step": 37176 - }, - { - "epoch": 0.95, - "learning_rate": 1.5966101507410548e-06, - "loss": 0.8057, - "step": 37177 - }, - { - "epoch": 0.95, - "learning_rate": 1.5965879441100706e-06, - "loss": 0.8691, - "step": 37178 - }, - { - "epoch": 0.95, - "learning_rate": 1.5965657370223066e-06, - "loss": 0.75, - "step": 37179 - }, - { - "epoch": 0.95, - "learning_rate": 1.5965435294777799e-06, - "loss": 0.6716, - "step": 37180 - }, - { - "epoch": 0.95, - "learning_rate": 1.596521321476507e-06, - "loss": 0.6445, - "step": 37181 - }, - { - "epoch": 0.95, - "learning_rate": 1.5964991130185053e-06, - "loss": 0.9414, - "step": 37182 - }, - { - "epoch": 0.95, - "learning_rate": 1.5964769041037913e-06, - "loss": 1.168, - "step": 37183 - }, - { - "epoch": 0.95, - "learning_rate": 1.5964546947323827e-06, - "loss": 0.9268, - "step": 37184 - }, - { - "epoch": 0.95, - "learning_rate": 1.5964324849042964e-06, - "loss": 0.7979, - "step": 37185 - }, - { - "epoch": 0.95, - "learning_rate": 1.5964102746195488e-06, - "loss": 0.7788, - "step": 37186 - }, - { - "epoch": 0.95, - "learning_rate": 1.5963880638781573e-06, - "loss": 0.8701, - "step": 37187 - }, - { - "epoch": 0.95, - "learning_rate": 1.596365852680139e-06, - "loss": 1.1035, - "step": 37188 - }, - { - "epoch": 0.95, - "learning_rate": 1.5963436410255104e-06, - "loss": 0.5938, - "step": 37189 - }, - { - "epoch": 0.95, - "learning_rate": 1.5963214289142891e-06, - "loss": 0.9238, - "step": 37190 - }, - { - "epoch": 0.95, - "learning_rate": 1.5962992163464924e-06, - "loss": 0.9229, - "step": 37191 - }, - { - "epoch": 0.95, - "learning_rate": 1.5962770033221363e-06, - "loss": 0.9536, - "step": 37192 - }, - { - "epoch": 0.95, - "learning_rate": 1.5962547898412385e-06, - "loss": 0.9111, - "step": 37193 - }, - { - "epoch": 0.95, - "learning_rate": 1.5962325759038155e-06, - "loss": 1.0059, - "step": 37194 - }, - { - "epoch": 0.95, - "learning_rate": 1.5962103615098849e-06, - "loss": 0.8496, - "step": 37195 - }, - { - "epoch": 0.95, - "learning_rate": 1.5961881466594635e-06, - "loss": 0.7549, - "step": 37196 - }, - { - "epoch": 0.95, - "learning_rate": 1.5961659313525682e-06, - "loss": 0.8086, - "step": 37197 - }, - { - "epoch": 0.95, - "learning_rate": 1.596143715589216e-06, - "loss": 1.0557, - "step": 37198 - }, - { - "epoch": 0.95, - "learning_rate": 1.5961214993694241e-06, - "loss": 0.8398, - "step": 37199 - }, - { - "epoch": 0.95, - "learning_rate": 1.596099282693209e-06, - "loss": 0.9375, - "step": 37200 - }, - { - "epoch": 0.95, - "learning_rate": 1.5960770655605886e-06, - "loss": 0.8926, - "step": 37201 - }, - { - "epoch": 0.95, - "learning_rate": 1.5960548479715793e-06, - "loss": 0.8994, - "step": 37202 - }, - { - "epoch": 0.95, - "learning_rate": 1.5960326299261979e-06, - "loss": 0.8057, - "step": 37203 - }, - { - "epoch": 0.95, - "learning_rate": 1.5960104114244618e-06, - "loss": 0.8926, - "step": 37204 - }, - { - "epoch": 0.95, - "learning_rate": 1.595988192466388e-06, - "loss": 0.8496, - "step": 37205 - }, - { - "epoch": 0.95, - "learning_rate": 1.5959659730519936e-06, - "loss": 0.6543, - "step": 37206 - }, - { - "epoch": 0.95, - "learning_rate": 1.5959437531812954e-06, - "loss": 0.564, - "step": 37207 - }, - { - "epoch": 0.95, - "learning_rate": 1.5959215328543102e-06, - "loss": 0.999, - "step": 37208 - }, - { - "epoch": 0.95, - "learning_rate": 1.5958993120710556e-06, - "loss": 0.4927, - "step": 37209 - }, - { - "epoch": 0.95, - "learning_rate": 1.5958770908315483e-06, - "loss": 0.835, - "step": 37210 - }, - { - "epoch": 0.95, - "learning_rate": 1.5958548691358051e-06, - "loss": 0.6656, - "step": 37211 - }, - { - "epoch": 0.95, - "learning_rate": 1.5958326469838435e-06, - "loss": 0.6572, - "step": 37212 - }, - { - "epoch": 0.95, - "learning_rate": 1.59581042437568e-06, - "loss": 0.7925, - "step": 37213 - }, - { - "epoch": 0.95, - "learning_rate": 1.5957882013113317e-06, - "loss": 0.7107, - "step": 37214 - }, - { - "epoch": 0.95, - "learning_rate": 1.595765977790816e-06, - "loss": 0.7688, - "step": 37215 - }, - { - "epoch": 0.95, - "learning_rate": 1.5957437538141499e-06, - "loss": 0.9424, - "step": 37216 - }, - { - "epoch": 0.95, - "learning_rate": 1.59572152938135e-06, - "loss": 0.6423, - "step": 37217 - }, - { - "epoch": 0.95, - "learning_rate": 1.5956993044924334e-06, - "loss": 0.8887, - "step": 37218 - }, - { - "epoch": 0.95, - "learning_rate": 1.5956770791474172e-06, - "loss": 0.8086, - "step": 37219 - }, - { - "epoch": 0.95, - "learning_rate": 1.5956548533463186e-06, - "loss": 0.8682, - "step": 37220 - }, - { - "epoch": 0.95, - "learning_rate": 1.5956326270891546e-06, - "loss": 0.6792, - "step": 37221 - }, - { - "epoch": 0.95, - "learning_rate": 1.5956104003759419e-06, - "loss": 0.7715, - "step": 37222 - }, - { - "epoch": 0.95, - "learning_rate": 1.5955881732066976e-06, - "loss": 0.9561, - "step": 37223 - }, - { - "epoch": 0.95, - "learning_rate": 1.595565945581439e-06, - "loss": 0.8311, - "step": 37224 - }, - { - "epoch": 0.95, - "learning_rate": 1.5955437175001826e-06, - "loss": 0.7793, - "step": 37225 - }, - { - "epoch": 0.95, - "learning_rate": 1.5955214889629463e-06, - "loss": 0.9053, - "step": 37226 - }, - { - "epoch": 0.95, - "learning_rate": 1.5954992599697464e-06, - "loss": 0.918, - "step": 37227 - }, - { - "epoch": 0.95, - "learning_rate": 1.5954770305206e-06, - "loss": 0.8301, - "step": 37228 - }, - { - "epoch": 0.95, - "learning_rate": 1.5954548006155242e-06, - "loss": 0.917, - "step": 37229 - }, - { - "epoch": 0.95, - "learning_rate": 1.595432570254536e-06, - "loss": 0.8105, - "step": 37230 - }, - { - "epoch": 0.95, - "learning_rate": 1.5954103394376527e-06, - "loss": 0.9473, - "step": 37231 - }, - { - "epoch": 0.95, - "learning_rate": 1.595388108164891e-06, - "loss": 0.918, - "step": 37232 - }, - { - "epoch": 0.95, - "learning_rate": 1.5953658764362676e-06, - "loss": 0.7539, - "step": 37233 - }, - { - "epoch": 0.95, - "learning_rate": 1.5953436442518004e-06, - "loss": 0.9297, - "step": 37234 - }, - { - "epoch": 0.95, - "learning_rate": 1.5953214116115058e-06, - "loss": 0.8174, - "step": 37235 - }, - { - "epoch": 0.95, - "learning_rate": 1.595299178515401e-06, - "loss": 0.7363, - "step": 37236 - }, - { - "epoch": 0.95, - "learning_rate": 1.5952769449635032e-06, - "loss": 0.8145, - "step": 37237 - }, - { - "epoch": 0.95, - "learning_rate": 1.5952547109558284e-06, - "loss": 0.6501, - "step": 37238 - }, - { - "epoch": 0.95, - "learning_rate": 1.5952324764923951e-06, - "loss": 0.9141, - "step": 37239 - }, - { - "epoch": 0.95, - "learning_rate": 1.5952102415732198e-06, - "loss": 0.9619, - "step": 37240 - }, - { - "epoch": 0.95, - "learning_rate": 1.5951880061983189e-06, - "loss": 0.915, - "step": 37241 - }, - { - "epoch": 0.95, - "learning_rate": 1.5951657703677105e-06, - "loss": 0.5903, - "step": 37242 - }, - { - "epoch": 0.95, - "learning_rate": 1.5951435340814106e-06, - "loss": 0.917, - "step": 37243 - }, - { - "epoch": 0.95, - "learning_rate": 1.5951212973394369e-06, - "loss": 0.9287, - "step": 37244 - }, - { - "epoch": 0.95, - "learning_rate": 1.5950990601418058e-06, - "loss": 0.7393, - "step": 37245 - }, - { - "epoch": 0.95, - "learning_rate": 1.5950768224885351e-06, - "loss": 0.9551, - "step": 37246 - }, - { - "epoch": 0.95, - "learning_rate": 1.5950545843796412e-06, - "loss": 0.8105, - "step": 37247 - }, - { - "epoch": 0.95, - "learning_rate": 1.5950323458151416e-06, - "loss": 0.7256, - "step": 37248 - }, - { - "epoch": 0.95, - "learning_rate": 1.595010106795053e-06, - "loss": 0.8789, - "step": 37249 - }, - { - "epoch": 0.95, - "learning_rate": 1.5949878673193923e-06, - "loss": 0.8296, - "step": 37250 - }, - { - "epoch": 0.95, - "learning_rate": 1.5949656273881771e-06, - "loss": 0.7139, - "step": 37251 - }, - { - "epoch": 0.95, - "learning_rate": 1.594943387001424e-06, - "loss": 0.917, - "step": 37252 - }, - { - "epoch": 0.95, - "learning_rate": 1.5949211461591499e-06, - "loss": 0.576, - "step": 37253 - }, - { - "epoch": 0.95, - "learning_rate": 1.5948989048613722e-06, - "loss": 0.7783, - "step": 37254 - }, - { - "epoch": 0.95, - "learning_rate": 1.5948766631081076e-06, - "loss": 0.5884, - "step": 37255 - }, - { - "epoch": 0.95, - "learning_rate": 1.5948544208993735e-06, - "loss": 0.8838, - "step": 37256 - }, - { - "epoch": 0.95, - "learning_rate": 1.5948321782351865e-06, - "loss": 0.9141, - "step": 37257 - }, - { - "epoch": 0.95, - "learning_rate": 1.5948099351155642e-06, - "loss": 0.8711, - "step": 37258 - }, - { - "epoch": 0.95, - "learning_rate": 1.5947876915405227e-06, - "loss": 0.8408, - "step": 37259 - }, - { - "epoch": 0.95, - "learning_rate": 1.59476544751008e-06, - "loss": 0.6919, - "step": 37260 - }, - { - "epoch": 0.96, - "learning_rate": 1.5947432030242527e-06, - "loss": 0.9492, - "step": 37261 - }, - { - "epoch": 0.96, - "learning_rate": 1.594720958083058e-06, - "loss": 0.9912, - "step": 37262 - }, - { - "epoch": 0.96, - "learning_rate": 1.5946987126865125e-06, - "loss": 0.8164, - "step": 37263 - }, - { - "epoch": 0.96, - "learning_rate": 1.594676466834634e-06, - "loss": 0.812, - "step": 37264 - }, - { - "epoch": 0.96, - "learning_rate": 1.5946542205274386e-06, - "loss": 0.8447, - "step": 37265 - }, - { - "epoch": 0.96, - "learning_rate": 1.5946319737649442e-06, - "loss": 0.9053, - "step": 37266 - }, - { - "epoch": 0.96, - "learning_rate": 1.5946097265471675e-06, - "loss": 0.8218, - "step": 37267 - }, - { - "epoch": 0.96, - "learning_rate": 1.594587478874125e-06, - "loss": 0.9287, - "step": 37268 - }, - { - "epoch": 0.96, - "learning_rate": 1.5945652307458343e-06, - "loss": 1.0342, - "step": 37269 - }, - { - "epoch": 0.96, - "learning_rate": 1.5945429821623125e-06, - "loss": 1.0381, - "step": 37270 - }, - { - "epoch": 0.96, - "learning_rate": 1.5945207331235767e-06, - "loss": 0.7769, - "step": 37271 - }, - { - "epoch": 0.96, - "learning_rate": 1.5944984836296433e-06, - "loss": 0.6562, - "step": 37272 - }, - { - "epoch": 0.96, - "learning_rate": 1.59447623368053e-06, - "loss": 1.0039, - "step": 37273 - }, - { - "epoch": 0.96, - "learning_rate": 1.5944539832762534e-06, - "loss": 0.8252, - "step": 37274 - }, - { - "epoch": 0.96, - "learning_rate": 1.594431732416831e-06, - "loss": 0.8516, - "step": 37275 - }, - { - "epoch": 0.96, - "learning_rate": 1.5944094811022796e-06, - "loss": 0.4946, - "step": 37276 - }, - { - "epoch": 0.96, - "learning_rate": 1.5943872293326157e-06, - "loss": 1.1133, - "step": 37277 - }, - { - "epoch": 0.96, - "learning_rate": 1.5943649771078572e-06, - "loss": 0.8682, - "step": 37278 - }, - { - "epoch": 0.96, - "learning_rate": 1.5943427244280205e-06, - "loss": 0.9902, - "step": 37279 - }, - { - "epoch": 0.96, - "learning_rate": 1.5943204712931231e-06, - "loss": 0.7974, - "step": 37280 - }, - { - "epoch": 0.96, - "learning_rate": 1.5942982177031819e-06, - "loss": 0.8027, - "step": 37281 - }, - { - "epoch": 0.96, - "learning_rate": 1.5942759636582137e-06, - "loss": 0.7178, - "step": 37282 - }, - { - "epoch": 0.96, - "learning_rate": 1.5942537091582357e-06, - "loss": 0.9399, - "step": 37283 - }, - { - "epoch": 0.96, - "learning_rate": 1.5942314542032653e-06, - "loss": 1.0176, - "step": 37284 - }, - { - "epoch": 0.96, - "learning_rate": 1.5942091987933188e-06, - "loss": 0.9492, - "step": 37285 - }, - { - "epoch": 0.96, - "learning_rate": 1.5941869429284137e-06, - "loss": 0.8086, - "step": 37286 - }, - { - "epoch": 0.96, - "learning_rate": 1.5941646866085675e-06, - "loss": 0.9375, - "step": 37287 - }, - { - "epoch": 0.96, - "learning_rate": 1.594142429833796e-06, - "loss": 0.79, - "step": 37288 - }, - { - "epoch": 0.96, - "learning_rate": 1.5941201726041173e-06, - "loss": 0.7012, - "step": 37289 - }, - { - "epoch": 0.96, - "learning_rate": 1.5940979149195482e-06, - "loss": 1.0664, - "step": 37290 - }, - { - "epoch": 0.96, - "learning_rate": 1.5940756567801054e-06, - "loss": 0.9443, - "step": 37291 - }, - { - "epoch": 0.96, - "learning_rate": 1.5940533981858063e-06, - "loss": 0.9932, - "step": 37292 - }, - { - "epoch": 0.96, - "learning_rate": 1.5940311391366678e-06, - "loss": 0.8779, - "step": 37293 - }, - { - "epoch": 0.96, - "learning_rate": 1.5940088796327072e-06, - "loss": 0.8008, - "step": 37294 - }, - { - "epoch": 0.96, - "learning_rate": 1.5939866196739409e-06, - "loss": 0.8369, - "step": 37295 - }, - { - "epoch": 0.96, - "learning_rate": 1.593964359260387e-06, - "loss": 0.6633, - "step": 37296 - }, - { - "epoch": 0.96, - "learning_rate": 1.5939420983920612e-06, - "loss": 0.4458, - "step": 37297 - }, - { - "epoch": 0.96, - "learning_rate": 1.5939198370689815e-06, - "loss": 0.8174, - "step": 37298 - }, - { - "epoch": 0.96, - "learning_rate": 1.5938975752911645e-06, - "loss": 0.8379, - "step": 37299 - }, - { - "epoch": 0.96, - "learning_rate": 1.5938753130586278e-06, - "loss": 0.5981, - "step": 37300 - }, - { - "epoch": 0.96, - "learning_rate": 1.593853050371388e-06, - "loss": 0.9062, - "step": 37301 - }, - { - "epoch": 0.96, - "learning_rate": 1.5938307872294621e-06, - "loss": 0.957, - "step": 37302 - }, - { - "epoch": 0.96, - "learning_rate": 1.5938085236328674e-06, - "loss": 0.8857, - "step": 37303 - }, - { - "epoch": 0.96, - "learning_rate": 1.5937862595816208e-06, - "loss": 0.917, - "step": 37304 - }, - { - "epoch": 0.96, - "learning_rate": 1.5937639950757392e-06, - "loss": 0.6182, - "step": 37305 - }, - { - "epoch": 0.96, - "learning_rate": 1.5937417301152397e-06, - "loss": 0.9746, - "step": 37306 - }, - { - "epoch": 0.96, - "learning_rate": 1.5937194647001398e-06, - "loss": 0.7461, - "step": 37307 - }, - { - "epoch": 0.96, - "learning_rate": 1.5936971988304562e-06, - "loss": 0.9453, - "step": 37308 - }, - { - "epoch": 0.96, - "learning_rate": 1.5936749325062055e-06, - "loss": 0.7861, - "step": 37309 - }, - { - "epoch": 0.96, - "learning_rate": 1.5936526657274056e-06, - "loss": 0.9629, - "step": 37310 - }, - { - "epoch": 0.96, - "learning_rate": 1.5936303984940733e-06, - "loss": 0.7183, - "step": 37311 - }, - { - "epoch": 0.96, - "learning_rate": 1.5936081308062252e-06, - "loss": 0.8442, - "step": 37312 - }, - { - "epoch": 0.96, - "learning_rate": 1.5935858626638786e-06, - "loss": 0.9385, - "step": 37313 - }, - { - "epoch": 0.96, - "learning_rate": 1.5935635940670506e-06, - "loss": 1.0225, - "step": 37314 - }, - { - "epoch": 0.96, - "learning_rate": 1.5935413250157586e-06, - "loss": 1.042, - "step": 37315 - }, - { - "epoch": 0.96, - "learning_rate": 1.5935190555100193e-06, - "loss": 0.7207, - "step": 37316 - }, - { - "epoch": 0.96, - "learning_rate": 1.5934967855498493e-06, - "loss": 0.9736, - "step": 37317 - }, - { - "epoch": 0.96, - "learning_rate": 1.5934745151352664e-06, - "loss": 0.9844, - "step": 37318 - }, - { - "epoch": 0.96, - "learning_rate": 1.5934522442662873e-06, - "loss": 0.9561, - "step": 37319 - }, - { - "epoch": 0.96, - "learning_rate": 1.593429972942929e-06, - "loss": 0.7617, - "step": 37320 - }, - { - "epoch": 0.96, - "learning_rate": 1.5934077011652089e-06, - "loss": 0.7676, - "step": 37321 - }, - { - "epoch": 0.96, - "learning_rate": 1.5933854289331437e-06, - "loss": 0.6304, - "step": 37322 - }, - { - "epoch": 0.96, - "learning_rate": 1.5933631562467503e-06, - "loss": 0.7363, - "step": 37323 - }, - { - "epoch": 0.96, - "learning_rate": 1.5933408831060464e-06, - "loss": 0.7871, - "step": 37324 - }, - { - "epoch": 0.96, - "learning_rate": 1.5933186095110483e-06, - "loss": 0.793, - "step": 37325 - }, - { - "epoch": 0.96, - "learning_rate": 1.593296335461774e-06, - "loss": 0.5431, - "step": 37326 - }, - { - "epoch": 0.96, - "learning_rate": 1.5932740609582393e-06, - "loss": 0.9307, - "step": 37327 - }, - { - "epoch": 0.96, - "learning_rate": 1.5932517860004623e-06, - "loss": 0.5278, - "step": 37328 - }, - { - "epoch": 0.96, - "learning_rate": 1.5932295105884594e-06, - "loss": 0.7773, - "step": 37329 - }, - { - "epoch": 0.96, - "learning_rate": 1.5932072347222483e-06, - "loss": 0.5449, - "step": 37330 - }, - { - "epoch": 0.96, - "learning_rate": 1.5931849584018455e-06, - "loss": 0.9941, - "step": 37331 - }, - { - "epoch": 0.96, - "learning_rate": 1.5931626816272682e-06, - "loss": 0.6484, - "step": 37332 - }, - { - "epoch": 0.96, - "learning_rate": 1.5931404043985337e-06, - "loss": 0.6228, - "step": 37333 - }, - { - "epoch": 0.96, - "learning_rate": 1.5931181267156587e-06, - "loss": 0.9082, - "step": 37334 - }, - { - "epoch": 0.96, - "learning_rate": 1.5930958485786605e-06, - "loss": 0.8457, - "step": 37335 - }, - { - "epoch": 0.96, - "learning_rate": 1.5930735699875561e-06, - "loss": 0.9775, - "step": 37336 - }, - { - "epoch": 0.96, - "learning_rate": 1.5930512909423626e-06, - "loss": 0.8398, - "step": 37337 - }, - { - "epoch": 0.96, - "learning_rate": 1.593029011443097e-06, - "loss": 0.9014, - "step": 37338 - }, - { - "epoch": 0.96, - "learning_rate": 1.5930067314897763e-06, - "loss": 0.7773, - "step": 37339 - }, - { - "epoch": 0.96, - "learning_rate": 1.5929844510824174e-06, - "loss": 0.7656, - "step": 37340 - }, - { - "epoch": 0.96, - "learning_rate": 1.5929621702210381e-06, - "loss": 0.875, - "step": 37341 - }, - { - "epoch": 0.96, - "learning_rate": 1.5929398889056543e-06, - "loss": 0.8115, - "step": 37342 - }, - { - "epoch": 0.96, - "learning_rate": 1.592917607136284e-06, - "loss": 0.7126, - "step": 37343 - }, - { - "epoch": 0.96, - "learning_rate": 1.592895324912944e-06, - "loss": 0.8389, - "step": 37344 - }, - { - "epoch": 0.96, - "learning_rate": 1.5928730422356512e-06, - "loss": 1.0068, - "step": 37345 - }, - { - "epoch": 0.96, - "learning_rate": 1.5928507591044229e-06, - "loss": 0.8906, - "step": 37346 - }, - { - "epoch": 0.96, - "learning_rate": 1.5928284755192757e-06, - "loss": 0.7285, - "step": 37347 - }, - { - "epoch": 0.96, - "learning_rate": 1.5928061914802276e-06, - "loss": 0.6089, - "step": 37348 - }, - { - "epoch": 0.96, - "learning_rate": 1.5927839069872943e-06, - "loss": 0.8047, - "step": 37349 - }, - { - "epoch": 0.96, - "learning_rate": 1.592761622040494e-06, - "loss": 0.6064, - "step": 37350 - }, - { - "epoch": 0.96, - "learning_rate": 1.5927393366398436e-06, - "loss": 1.0625, - "step": 37351 - }, - { - "epoch": 0.96, - "learning_rate": 1.5927170507853599e-06, - "loss": 0.7812, - "step": 37352 - }, - { - "epoch": 0.96, - "learning_rate": 1.5926947644770596e-06, - "loss": 0.8623, - "step": 37353 - }, - { - "epoch": 0.96, - "learning_rate": 1.5926724777149604e-06, - "loss": 0.9648, - "step": 37354 - }, - { - "epoch": 0.96, - "learning_rate": 1.5926501904990792e-06, - "loss": 0.6694, - "step": 37355 - }, - { - "epoch": 0.96, - "learning_rate": 1.592627902829433e-06, - "loss": 1.0342, - "step": 37356 - }, - { - "epoch": 0.96, - "learning_rate": 1.5926056147060386e-06, - "loss": 0.8418, - "step": 37357 - }, - { - "epoch": 0.96, - "learning_rate": 1.5925833261289138e-06, - "loss": 0.9463, - "step": 37358 - }, - { - "epoch": 0.96, - "learning_rate": 1.5925610370980748e-06, - "loss": 1.0205, - "step": 37359 - }, - { - "epoch": 0.96, - "learning_rate": 1.5925387476135393e-06, - "loss": 0.9375, - "step": 37360 - }, - { - "epoch": 0.96, - "learning_rate": 1.592516457675324e-06, - "loss": 0.6074, - "step": 37361 - }, - { - "epoch": 0.96, - "learning_rate": 1.5924941672834461e-06, - "loss": 0.7803, - "step": 37362 - }, - { - "epoch": 0.96, - "learning_rate": 1.5924718764379229e-06, - "loss": 0.7725, - "step": 37363 - }, - { - "epoch": 0.96, - "learning_rate": 1.5924495851387709e-06, - "loss": 0.9229, - "step": 37364 - }, - { - "epoch": 0.96, - "learning_rate": 1.5924272933860077e-06, - "loss": 0.8838, - "step": 37365 - }, - { - "epoch": 0.96, - "learning_rate": 1.59240500117965e-06, - "loss": 0.7842, - "step": 37366 - }, - { - "epoch": 0.96, - "learning_rate": 1.592382708519715e-06, - "loss": 0.7183, - "step": 37367 - }, - { - "epoch": 0.96, - "learning_rate": 1.59236041540622e-06, - "loss": 0.7979, - "step": 37368 - }, - { - "epoch": 0.96, - "learning_rate": 1.5923381218391817e-06, - "loss": 0.8271, - "step": 37369 - }, - { - "epoch": 0.96, - "learning_rate": 1.5923158278186174e-06, - "loss": 0.8652, - "step": 37370 - }, - { - "epoch": 0.96, - "learning_rate": 1.5922935333445441e-06, - "loss": 0.6436, - "step": 37371 - }, - { - "epoch": 0.96, - "learning_rate": 1.592271238416979e-06, - "loss": 0.8447, - "step": 37372 - }, - { - "epoch": 0.96, - "learning_rate": 1.592248943035939e-06, - "loss": 0.8691, - "step": 37373 - }, - { - "epoch": 0.96, - "learning_rate": 1.592226647201441e-06, - "loss": 0.7832, - "step": 37374 - }, - { - "epoch": 0.96, - "learning_rate": 1.5922043509135025e-06, - "loss": 0.7915, - "step": 37375 - }, - { - "epoch": 0.96, - "learning_rate": 1.5921820541721403e-06, - "loss": 1.0547, - "step": 37376 - }, - { - "epoch": 0.96, - "learning_rate": 1.5921597569773715e-06, - "loss": 0.7063, - "step": 37377 - }, - { - "epoch": 0.96, - "learning_rate": 1.5921374593292131e-06, - "loss": 0.8809, - "step": 37378 - }, - { - "epoch": 0.96, - "learning_rate": 1.5921151612276825e-06, - "loss": 0.833, - "step": 37379 - }, - { - "epoch": 0.96, - "learning_rate": 1.5920928626727965e-06, - "loss": 0.7227, - "step": 37380 - }, - { - "epoch": 0.96, - "learning_rate": 1.5920705636645721e-06, - "loss": 0.8716, - "step": 37381 - }, - { - "epoch": 0.96, - "learning_rate": 1.5920482642030267e-06, - "loss": 0.6411, - "step": 37382 - }, - { - "epoch": 0.96, - "learning_rate": 1.5920259642881768e-06, - "loss": 0.8105, - "step": 37383 - }, - { - "epoch": 0.96, - "learning_rate": 1.5920036639200402e-06, - "loss": 0.6135, - "step": 37384 - }, - { - "epoch": 0.96, - "learning_rate": 1.5919813630986336e-06, - "loss": 0.916, - "step": 37385 - }, - { - "epoch": 0.96, - "learning_rate": 1.591959061823974e-06, - "loss": 0.645, - "step": 37386 - }, - { - "epoch": 0.96, - "learning_rate": 1.5919367600960784e-06, - "loss": 0.8789, - "step": 37387 - }, - { - "epoch": 0.96, - "learning_rate": 1.5919144579149641e-06, - "loss": 0.7617, - "step": 37388 - }, - { - "epoch": 0.96, - "learning_rate": 1.5918921552806483e-06, - "loss": 0.7744, - "step": 37389 - }, - { - "epoch": 0.96, - "learning_rate": 1.591869852193148e-06, - "loss": 0.8271, - "step": 37390 - }, - { - "epoch": 0.96, - "learning_rate": 1.59184754865248e-06, - "loss": 1.3281, - "step": 37391 - }, - { - "epoch": 0.96, - "learning_rate": 1.5918252446586613e-06, - "loss": 1.0967, - "step": 37392 - }, - { - "epoch": 0.96, - "learning_rate": 1.5918029402117093e-06, - "loss": 0.9043, - "step": 37393 - }, - { - "epoch": 0.96, - "learning_rate": 1.5917806353116411e-06, - "loss": 0.8926, - "step": 37394 - }, - { - "epoch": 0.96, - "learning_rate": 1.5917583299584738e-06, - "loss": 0.9009, - "step": 37395 - }, - { - "epoch": 0.96, - "learning_rate": 1.5917360241522243e-06, - "loss": 0.7725, - "step": 37396 - }, - { - "epoch": 0.96, - "learning_rate": 1.5917137178929096e-06, - "loss": 0.7559, - "step": 37397 - }, - { - "epoch": 0.96, - "learning_rate": 1.591691411180547e-06, - "loss": 0.8049, - "step": 37398 - }, - { - "epoch": 0.96, - "learning_rate": 1.5916691040151537e-06, - "loss": 0.7969, - "step": 37399 - }, - { - "epoch": 0.96, - "learning_rate": 1.5916467963967463e-06, - "loss": 0.8643, - "step": 37400 - }, - { - "epoch": 0.96, - "learning_rate": 1.5916244883253422e-06, - "loss": 0.7192, - "step": 37401 - }, - { - "epoch": 0.96, - "learning_rate": 1.5916021798009585e-06, - "loss": 0.6528, - "step": 37402 - }, - { - "epoch": 0.96, - "learning_rate": 1.591579870823612e-06, - "loss": 0.8115, - "step": 37403 - }, - { - "epoch": 0.96, - "learning_rate": 1.59155756139332e-06, - "loss": 0.7617, - "step": 37404 - }, - { - "epoch": 0.96, - "learning_rate": 1.5915352515101002e-06, - "loss": 0.9023, - "step": 37405 - }, - { - "epoch": 0.96, - "learning_rate": 1.5915129411739685e-06, - "loss": 0.8506, - "step": 37406 - }, - { - "epoch": 0.96, - "learning_rate": 1.5914906303849426e-06, - "loss": 0.6753, - "step": 37407 - }, - { - "epoch": 0.96, - "learning_rate": 1.5914683191430396e-06, - "loss": 0.8369, - "step": 37408 - }, - { - "epoch": 0.96, - "learning_rate": 1.5914460074482766e-06, - "loss": 1.0078, - "step": 37409 - }, - { - "epoch": 0.96, - "learning_rate": 1.5914236953006707e-06, - "loss": 0.7319, - "step": 37410 - }, - { - "epoch": 0.96, - "learning_rate": 1.5914013827002384e-06, - "loss": 0.7466, - "step": 37411 - }, - { - "epoch": 0.96, - "learning_rate": 1.5913790696469973e-06, - "loss": 0.9346, - "step": 37412 - }, - { - "epoch": 0.96, - "learning_rate": 1.5913567561409647e-06, - "loss": 0.7881, - "step": 37413 - }, - { - "epoch": 0.96, - "learning_rate": 1.5913344421821573e-06, - "loss": 0.7627, - "step": 37414 - }, - { - "epoch": 0.96, - "learning_rate": 1.5913121277705926e-06, - "loss": 0.9756, - "step": 37415 - }, - { - "epoch": 0.96, - "learning_rate": 1.591289812906287e-06, - "loss": 1.0859, - "step": 37416 - }, - { - "epoch": 0.96, - "learning_rate": 1.591267497589258e-06, - "loss": 0.9473, - "step": 37417 - }, - { - "epoch": 0.96, - "learning_rate": 1.5912451818195228e-06, - "loss": 0.834, - "step": 37418 - }, - { - "epoch": 0.96, - "learning_rate": 1.5912228655970985e-06, - "loss": 0.9121, - "step": 37419 - }, - { - "epoch": 0.96, - "learning_rate": 1.5912005489220017e-06, - "loss": 0.7969, - "step": 37420 - }, - { - "epoch": 0.96, - "learning_rate": 1.5911782317942501e-06, - "loss": 0.8232, - "step": 37421 - }, - { - "epoch": 0.96, - "learning_rate": 1.5911559142138602e-06, - "loss": 0.708, - "step": 37422 - }, - { - "epoch": 0.96, - "learning_rate": 1.5911335961808496e-06, - "loss": 0.8213, - "step": 37423 - }, - { - "epoch": 0.96, - "learning_rate": 1.5911112776952354e-06, - "loss": 0.8574, - "step": 37424 - }, - { - "epoch": 0.96, - "learning_rate": 1.5910889587570343e-06, - "loss": 0.7478, - "step": 37425 - }, - { - "epoch": 0.96, - "learning_rate": 1.5910666393662635e-06, - "loss": 0.8945, - "step": 37426 - }, - { - "epoch": 0.96, - "learning_rate": 1.5910443195229402e-06, - "loss": 1.0225, - "step": 37427 - }, - { - "epoch": 0.96, - "learning_rate": 1.5910219992270814e-06, - "loss": 0.8789, - "step": 37428 - }, - { - "epoch": 0.96, - "learning_rate": 1.5909996784787043e-06, - "loss": 0.8003, - "step": 37429 - }, - { - "epoch": 0.96, - "learning_rate": 1.590977357277826e-06, - "loss": 0.8359, - "step": 37430 - }, - { - "epoch": 0.96, - "learning_rate": 1.5909550356244633e-06, - "loss": 0.8164, - "step": 37431 - }, - { - "epoch": 0.96, - "learning_rate": 1.5909327135186335e-06, - "loss": 0.8208, - "step": 37432 - }, - { - "epoch": 0.96, - "learning_rate": 1.5909103909603538e-06, - "loss": 0.6267, - "step": 37433 - }, - { - "epoch": 0.96, - "learning_rate": 1.590888067949641e-06, - "loss": 0.8442, - "step": 37434 - }, - { - "epoch": 0.96, - "learning_rate": 1.5908657444865128e-06, - "loss": 0.853, - "step": 37435 - }, - { - "epoch": 0.96, - "learning_rate": 1.5908434205709856e-06, - "loss": 0.6709, - "step": 37436 - }, - { - "epoch": 0.96, - "learning_rate": 1.5908210962030767e-06, - "loss": 0.8506, - "step": 37437 - }, - { - "epoch": 0.96, - "learning_rate": 1.5907987713828034e-06, - "loss": 0.7417, - "step": 37438 - }, - { - "epoch": 0.96, - "learning_rate": 1.5907764461101824e-06, - "loss": 0.4043, - "step": 37439 - }, - { - "epoch": 0.96, - "learning_rate": 1.5907541203852315e-06, - "loss": 0.9072, - "step": 37440 - }, - { - "epoch": 0.96, - "learning_rate": 1.5907317942079667e-06, - "loss": 0.9307, - "step": 37441 - }, - { - "epoch": 0.96, - "learning_rate": 1.5907094675784062e-06, - "loss": 0.6919, - "step": 37442 - }, - { - "epoch": 0.96, - "learning_rate": 1.5906871404965665e-06, - "loss": 0.8467, - "step": 37443 - }, - { - "epoch": 0.96, - "learning_rate": 1.5906648129624648e-06, - "loss": 0.783, - "step": 37444 - }, - { - "epoch": 0.96, - "learning_rate": 1.5906424849761185e-06, - "loss": 0.9072, - "step": 37445 - }, - { - "epoch": 0.96, - "learning_rate": 1.5906201565375442e-06, - "loss": 0.793, - "step": 37446 - }, - { - "epoch": 0.96, - "learning_rate": 1.590597827646759e-06, - "loss": 0.793, - "step": 37447 - }, - { - "epoch": 0.96, - "learning_rate": 1.5905754983037802e-06, - "loss": 0.8848, - "step": 37448 - }, - { - "epoch": 0.96, - "learning_rate": 1.590553168508625e-06, - "loss": 0.9854, - "step": 37449 - }, - { - "epoch": 0.96, - "learning_rate": 1.5905308382613108e-06, - "loss": 0.7588, - "step": 37450 - }, - { - "epoch": 0.96, - "learning_rate": 1.5905085075618536e-06, - "loss": 1.0186, - "step": 37451 - }, - { - "epoch": 0.96, - "learning_rate": 1.5904861764102715e-06, - "loss": 0.8828, - "step": 37452 - }, - { - "epoch": 0.96, - "learning_rate": 1.5904638448065812e-06, - "loss": 0.8965, - "step": 37453 - }, - { - "epoch": 0.96, - "learning_rate": 1.5904415127508001e-06, - "loss": 0.6196, - "step": 37454 - }, - { - "epoch": 0.96, - "learning_rate": 1.590419180242945e-06, - "loss": 0.7769, - "step": 37455 - }, - { - "epoch": 0.96, - "learning_rate": 1.590396847283033e-06, - "loss": 0.9238, - "step": 37456 - }, - { - "epoch": 0.96, - "learning_rate": 1.5903745138710813e-06, - "loss": 0.8223, - "step": 37457 - }, - { - "epoch": 0.96, - "learning_rate": 1.590352180007107e-06, - "loss": 0.8613, - "step": 37458 - }, - { - "epoch": 0.96, - "learning_rate": 1.5903298456911272e-06, - "loss": 0.8926, - "step": 37459 - }, - { - "epoch": 0.96, - "learning_rate": 1.590307510923159e-06, - "loss": 0.6538, - "step": 37460 - }, - { - "epoch": 0.96, - "learning_rate": 1.5902851757032196e-06, - "loss": 1.0029, - "step": 37461 - }, - { - "epoch": 0.96, - "learning_rate": 1.5902628400313257e-06, - "loss": 0.698, - "step": 37462 - }, - { - "epoch": 0.96, - "learning_rate": 1.590240503907495e-06, - "loss": 0.9668, - "step": 37463 - }, - { - "epoch": 0.96, - "learning_rate": 1.5902181673317438e-06, - "loss": 0.7705, - "step": 37464 - }, - { - "epoch": 0.96, - "learning_rate": 1.59019583030409e-06, - "loss": 0.8857, - "step": 37465 - }, - { - "epoch": 0.96, - "learning_rate": 1.5901734928245506e-06, - "loss": 0.9766, - "step": 37466 - }, - { - "epoch": 0.96, - "learning_rate": 1.5901511548931421e-06, - "loss": 0.7988, - "step": 37467 - }, - { - "epoch": 0.96, - "learning_rate": 1.5901288165098822e-06, - "loss": 0.7637, - "step": 37468 - }, - { - "epoch": 0.96, - "learning_rate": 1.5901064776747877e-06, - "loss": 1.0781, - "step": 37469 - }, - { - "epoch": 0.96, - "learning_rate": 1.590084138387876e-06, - "loss": 0.6128, - "step": 37470 - }, - { - "epoch": 0.96, - "learning_rate": 1.590061798649164e-06, - "loss": 0.7627, - "step": 37471 - }, - { - "epoch": 0.96, - "learning_rate": 1.5900394584586688e-06, - "loss": 0.9404, - "step": 37472 - }, - { - "epoch": 0.96, - "learning_rate": 1.5900171178164072e-06, - "loss": 0.8936, - "step": 37473 - }, - { - "epoch": 0.96, - "learning_rate": 1.5899947767223968e-06, - "loss": 0.8125, - "step": 37474 - }, - { - "epoch": 0.96, - "learning_rate": 1.5899724351766545e-06, - "loss": 0.7207, - "step": 37475 - }, - { - "epoch": 0.96, - "learning_rate": 1.5899500931791976e-06, - "loss": 0.7754, - "step": 37476 - }, - { - "epoch": 0.96, - "learning_rate": 1.5899277507300428e-06, - "loss": 0.96, - "step": 37477 - }, - { - "epoch": 0.96, - "learning_rate": 1.5899054078292076e-06, - "loss": 0.8994, - "step": 37478 - }, - { - "epoch": 0.96, - "learning_rate": 1.5898830644767089e-06, - "loss": 0.9805, - "step": 37479 - }, - { - "epoch": 0.96, - "learning_rate": 1.5898607206725641e-06, - "loss": 0.6145, - "step": 37480 - }, - { - "epoch": 0.96, - "learning_rate": 1.58983837641679e-06, - "loss": 0.7803, - "step": 37481 - }, - { - "epoch": 0.96, - "learning_rate": 1.5898160317094035e-06, - "loss": 1.0791, - "step": 37482 - }, - { - "epoch": 0.96, - "learning_rate": 1.589793686550422e-06, - "loss": 0.7817, - "step": 37483 - }, - { - "epoch": 0.96, - "learning_rate": 1.5897713409398627e-06, - "loss": 0.9619, - "step": 37484 - }, - { - "epoch": 0.96, - "learning_rate": 1.5897489948777428e-06, - "loss": 0.8818, - "step": 37485 - }, - { - "epoch": 0.96, - "learning_rate": 1.589726648364079e-06, - "loss": 0.8506, - "step": 37486 - }, - { - "epoch": 0.96, - "learning_rate": 1.5897043013988886e-06, - "loss": 1.0469, - "step": 37487 - }, - { - "epoch": 0.96, - "learning_rate": 1.5896819539821888e-06, - "loss": 0.958, - "step": 37488 - }, - { - "epoch": 0.96, - "learning_rate": 1.5896596061139967e-06, - "loss": 0.5791, - "step": 37489 - }, - { - "epoch": 0.96, - "learning_rate": 1.5896372577943294e-06, - "loss": 0.9131, - "step": 37490 - }, - { - "epoch": 0.96, - "learning_rate": 1.5896149090232038e-06, - "loss": 0.7627, - "step": 37491 - }, - { - "epoch": 0.96, - "learning_rate": 1.589592559800637e-06, - "loss": 0.9307, - "step": 37492 - }, - { - "epoch": 0.96, - "learning_rate": 1.5895702101266466e-06, - "loss": 0.8838, - "step": 37493 - }, - { - "epoch": 0.96, - "learning_rate": 1.5895478600012493e-06, - "loss": 0.8701, - "step": 37494 - }, - { - "epoch": 0.96, - "learning_rate": 1.5895255094244627e-06, - "loss": 0.7363, - "step": 37495 - }, - { - "epoch": 0.96, - "learning_rate": 1.5895031583963028e-06, - "loss": 0.9912, - "step": 37496 - }, - { - "epoch": 0.96, - "learning_rate": 1.589480806916788e-06, - "loss": 0.6338, - "step": 37497 - }, - { - "epoch": 0.96, - "learning_rate": 1.5894584549859345e-06, - "loss": 0.8262, - "step": 37498 - }, - { - "epoch": 0.96, - "learning_rate": 1.5894361026037597e-06, - "loss": 0.8457, - "step": 37499 - }, - { - "epoch": 0.96, - "learning_rate": 1.5894137497702814e-06, - "loss": 0.6797, - "step": 37500 - }, - { - "epoch": 0.96, - "learning_rate": 1.5893913964855154e-06, - "loss": 0.6147, - "step": 37501 - }, - { - "epoch": 0.96, - "learning_rate": 1.5893690427494799e-06, - "loss": 0.7104, - "step": 37502 - }, - { - "epoch": 0.96, - "learning_rate": 1.5893466885621916e-06, - "loss": 0.8799, - "step": 37503 - }, - { - "epoch": 0.96, - "learning_rate": 1.5893243339236672e-06, - "loss": 0.7046, - "step": 37504 - }, - { - "epoch": 0.96, - "learning_rate": 1.5893019788339248e-06, - "loss": 0.7607, - "step": 37505 - }, - { - "epoch": 0.96, - "learning_rate": 1.589279623292981e-06, - "loss": 0.8071, - "step": 37506 - }, - { - "epoch": 0.96, - "learning_rate": 1.5892572673008524e-06, - "loss": 0.79, - "step": 37507 - }, - { - "epoch": 0.96, - "learning_rate": 1.5892349108575569e-06, - "loss": 0.9082, - "step": 37508 - }, - { - "epoch": 0.96, - "learning_rate": 1.589212553963111e-06, - "loss": 0.7695, - "step": 37509 - }, - { - "epoch": 0.96, - "learning_rate": 1.5891901966175327e-06, - "loss": 0.9092, - "step": 37510 - }, - { - "epoch": 0.96, - "learning_rate": 1.5891678388208382e-06, - "loss": 0.6772, - "step": 37511 - }, - { - "epoch": 0.96, - "learning_rate": 1.589145480573045e-06, - "loss": 0.8037, - "step": 37512 - }, - { - "epoch": 0.96, - "learning_rate": 1.5891231218741705e-06, - "loss": 0.8232, - "step": 37513 - }, - { - "epoch": 0.96, - "learning_rate": 1.589100762724231e-06, - "loss": 1.1387, - "step": 37514 - }, - { - "epoch": 0.96, - "learning_rate": 1.5890784031232446e-06, - "loss": 0.8799, - "step": 37515 - }, - { - "epoch": 0.96, - "learning_rate": 1.5890560430712277e-06, - "loss": 0.6517, - "step": 37516 - }, - { - "epoch": 0.96, - "learning_rate": 1.589033682568198e-06, - "loss": 0.7627, - "step": 37517 - }, - { - "epoch": 0.96, - "learning_rate": 1.5890113216141718e-06, - "loss": 0.8447, - "step": 37518 - }, - { - "epoch": 0.96, - "learning_rate": 1.5889889602091669e-06, - "loss": 0.7881, - "step": 37519 - }, - { - "epoch": 0.96, - "learning_rate": 1.5889665983532004e-06, - "loss": 0.8955, - "step": 37520 - }, - { - "epoch": 0.96, - "learning_rate": 1.5889442360462892e-06, - "loss": 0.875, - "step": 37521 - }, - { - "epoch": 0.96, - "learning_rate": 1.5889218732884505e-06, - "loss": 0.7871, - "step": 37522 - }, - { - "epoch": 0.96, - "learning_rate": 1.5888995100797012e-06, - "loss": 0.6084, - "step": 37523 - }, - { - "epoch": 0.96, - "learning_rate": 1.5888771464200587e-06, - "loss": 0.8721, - "step": 37524 - }, - { - "epoch": 0.96, - "learning_rate": 1.5888547823095402e-06, - "loss": 0.6357, - "step": 37525 - }, - { - "epoch": 0.96, - "learning_rate": 1.5888324177481625e-06, - "loss": 0.5649, - "step": 37526 - }, - { - "epoch": 0.96, - "learning_rate": 1.5888100527359429e-06, - "loss": 0.6914, - "step": 37527 - }, - { - "epoch": 0.96, - "learning_rate": 1.5887876872728984e-06, - "loss": 0.9443, - "step": 37528 - }, - { - "epoch": 0.96, - "learning_rate": 1.5887653213590465e-06, - "loss": 0.875, - "step": 37529 - }, - { - "epoch": 0.96, - "learning_rate": 1.588742954994404e-06, - "loss": 0.9795, - "step": 37530 - }, - { - "epoch": 0.96, - "learning_rate": 1.588720588178988e-06, - "loss": 0.52, - "step": 37531 - }, - { - "epoch": 0.96, - "learning_rate": 1.5886982209128159e-06, - "loss": 0.9033, - "step": 37532 - }, - { - "epoch": 0.96, - "learning_rate": 1.5886758531959044e-06, - "loss": 0.7383, - "step": 37533 - }, - { - "epoch": 0.96, - "learning_rate": 1.588653485028271e-06, - "loss": 0.9287, - "step": 37534 - }, - { - "epoch": 0.96, - "learning_rate": 1.5886311164099327e-06, - "loss": 0.613, - "step": 37535 - }, - { - "epoch": 0.96, - "learning_rate": 1.5886087473409066e-06, - "loss": 0.7559, - "step": 37536 - }, - { - "epoch": 0.96, - "learning_rate": 1.5885863778212098e-06, - "loss": 0.7644, - "step": 37537 - }, - { - "epoch": 0.96, - "learning_rate": 1.5885640078508595e-06, - "loss": 0.7656, - "step": 37538 - }, - { - "epoch": 0.96, - "learning_rate": 1.5885416374298729e-06, - "loss": 0.7134, - "step": 37539 - }, - { - "epoch": 0.96, - "learning_rate": 1.5885192665582673e-06, - "loss": 0.8486, - "step": 37540 - }, - { - "epoch": 0.96, - "learning_rate": 1.588496895236059e-06, - "loss": 0.7578, - "step": 37541 - }, - { - "epoch": 0.96, - "learning_rate": 1.5884745234632657e-06, - "loss": 0.9941, - "step": 37542 - }, - { - "epoch": 0.96, - "learning_rate": 1.5884521512399048e-06, - "loss": 0.9189, - "step": 37543 - }, - { - "epoch": 0.96, - "learning_rate": 1.588429778565993e-06, - "loss": 0.8682, - "step": 37544 - }, - { - "epoch": 0.96, - "learning_rate": 1.5884074054415479e-06, - "loss": 0.9189, - "step": 37545 - }, - { - "epoch": 0.96, - "learning_rate": 1.588385031866586e-06, - "loss": 0.644, - "step": 37546 - }, - { - "epoch": 0.96, - "learning_rate": 1.5883626578411248e-06, - "loss": 0.9766, - "step": 37547 - }, - { - "epoch": 0.96, - "learning_rate": 1.5883402833651811e-06, - "loss": 0.8135, - "step": 37548 - }, - { - "epoch": 0.96, - "learning_rate": 1.5883179084387727e-06, - "loss": 0.8047, - "step": 37549 - }, - { - "epoch": 0.96, - "learning_rate": 1.588295533061916e-06, - "loss": 0.7188, - "step": 37550 - }, - { - "epoch": 0.96, - "learning_rate": 1.5882731572346288e-06, - "loss": 0.7915, - "step": 37551 - }, - { - "epoch": 0.96, - "learning_rate": 1.5882507809569277e-06, - "loss": 0.7319, - "step": 37552 - }, - { - "epoch": 0.96, - "learning_rate": 1.5882284042288298e-06, - "loss": 0.9189, - "step": 37553 - }, - { - "epoch": 0.96, - "learning_rate": 1.588206027050353e-06, - "loss": 0.8315, - "step": 37554 - }, - { - "epoch": 0.96, - "learning_rate": 1.5881836494215134e-06, - "loss": 0.9824, - "step": 37555 - }, - { - "epoch": 0.96, - "learning_rate": 1.588161271342329e-06, - "loss": 0.6086, - "step": 37556 - }, - { - "epoch": 0.96, - "learning_rate": 1.5881388928128163e-06, - "loss": 0.6714, - "step": 37557 - }, - { - "epoch": 0.96, - "learning_rate": 1.588116513832993e-06, - "loss": 0.6694, - "step": 37558 - }, - { - "epoch": 0.96, - "learning_rate": 1.5880941344028753e-06, - "loss": 0.6255, - "step": 37559 - }, - { - "epoch": 0.96, - "learning_rate": 1.5880717545224816e-06, - "loss": 0.7549, - "step": 37560 - }, - { - "epoch": 0.96, - "learning_rate": 1.5880493741918282e-06, - "loss": 0.7119, - "step": 37561 - }, - { - "epoch": 0.96, - "learning_rate": 1.5880269934109322e-06, - "loss": 0.6895, - "step": 37562 - }, - { - "epoch": 0.96, - "learning_rate": 1.5880046121798114e-06, - "loss": 0.9648, - "step": 37563 - }, - { - "epoch": 0.96, - "learning_rate": 1.5879822304984823e-06, - "loss": 0.834, - "step": 37564 - }, - { - "epoch": 0.96, - "learning_rate": 1.5879598483669621e-06, - "loss": 0.9697, - "step": 37565 - }, - { - "epoch": 0.96, - "learning_rate": 1.5879374657852683e-06, - "loss": 0.8164, - "step": 37566 - }, - { - "epoch": 0.96, - "learning_rate": 1.5879150827534175e-06, - "loss": 0.9756, - "step": 37567 - }, - { - "epoch": 0.96, - "learning_rate": 1.5878926992714274e-06, - "loss": 1.0293, - "step": 37568 - }, - { - "epoch": 0.96, - "learning_rate": 1.5878703153393147e-06, - "loss": 0.749, - "step": 37569 - }, - { - "epoch": 0.96, - "learning_rate": 1.5878479309570971e-06, - "loss": 0.7764, - "step": 37570 - }, - { - "epoch": 0.96, - "learning_rate": 1.5878255461247912e-06, - "loss": 0.9814, - "step": 37571 - }, - { - "epoch": 0.96, - "learning_rate": 1.5878031608424142e-06, - "loss": 0.8037, - "step": 37572 - }, - { - "epoch": 0.96, - "learning_rate": 1.5877807751099835e-06, - "loss": 1.04, - "step": 37573 - }, - { - "epoch": 0.96, - "learning_rate": 1.587758388927516e-06, - "loss": 0.9473, - "step": 37574 - }, - { - "epoch": 0.96, - "learning_rate": 1.587736002295029e-06, - "loss": 0.8418, - "step": 37575 - }, - { - "epoch": 0.96, - "learning_rate": 1.5877136152125394e-06, - "loss": 1.0293, - "step": 37576 - }, - { - "epoch": 0.96, - "learning_rate": 1.5876912276800644e-06, - "loss": 0.9668, - "step": 37577 - }, - { - "epoch": 0.96, - "learning_rate": 1.5876688396976214e-06, - "loss": 0.916, - "step": 37578 - }, - { - "epoch": 0.96, - "learning_rate": 1.5876464512652277e-06, - "loss": 0.8408, - "step": 37579 - }, - { - "epoch": 0.96, - "learning_rate": 1.5876240623829e-06, - "loss": 0.7422, - "step": 37580 - }, - { - "epoch": 0.96, - "learning_rate": 1.5876016730506554e-06, - "loss": 0.7246, - "step": 37581 - }, - { - "epoch": 0.96, - "learning_rate": 1.5875792832685111e-06, - "loss": 0.8384, - "step": 37582 - }, - { - "epoch": 0.96, - "learning_rate": 1.5875568930364845e-06, - "loss": 0.7817, - "step": 37583 - }, - { - "epoch": 0.96, - "learning_rate": 1.5875345023545928e-06, - "loss": 1.0693, - "step": 37584 - }, - { - "epoch": 0.96, - "learning_rate": 1.587512111222853e-06, - "loss": 0.9648, - "step": 37585 - }, - { - "epoch": 0.96, - "learning_rate": 1.5874897196412818e-06, - "loss": 0.7861, - "step": 37586 - }, - { - "epoch": 0.96, - "learning_rate": 1.5874673276098968e-06, - "loss": 0.8047, - "step": 37587 - }, - { - "epoch": 0.96, - "learning_rate": 1.5874449351287152e-06, - "loss": 1.002, - "step": 37588 - }, - { - "epoch": 0.96, - "learning_rate": 1.5874225421977539e-06, - "loss": 0.7769, - "step": 37589 - }, - { - "epoch": 0.96, - "learning_rate": 1.5874001488170303e-06, - "loss": 0.8105, - "step": 37590 - }, - { - "epoch": 0.96, - "learning_rate": 1.5873777549865617e-06, - "loss": 0.7153, - "step": 37591 - }, - { - "epoch": 0.96, - "learning_rate": 1.5873553607063644e-06, - "loss": 0.8652, - "step": 37592 - }, - { - "epoch": 0.96, - "learning_rate": 1.5873329659764565e-06, - "loss": 0.9941, - "step": 37593 - }, - { - "epoch": 0.96, - "learning_rate": 1.5873105707968546e-06, - "loss": 0.7422, - "step": 37594 - }, - { - "epoch": 0.96, - "learning_rate": 1.587288175167576e-06, - "loss": 0.9287, - "step": 37595 - }, - { - "epoch": 0.96, - "learning_rate": 1.5872657790886379e-06, - "loss": 0.7324, - "step": 37596 - }, - { - "epoch": 0.96, - "learning_rate": 1.5872433825600574e-06, - "loss": 0.8262, - "step": 37597 - }, - { - "epoch": 0.96, - "learning_rate": 1.5872209855818515e-06, - "loss": 0.8066, - "step": 37598 - }, - { - "epoch": 0.96, - "learning_rate": 1.5871985881540378e-06, - "loss": 0.8223, - "step": 37599 - }, - { - "epoch": 0.96, - "learning_rate": 1.5871761902766328e-06, - "loss": 0.6763, - "step": 37600 - }, - { - "epoch": 0.96, - "learning_rate": 1.587153791949654e-06, - "loss": 0.7861, - "step": 37601 - }, - { - "epoch": 0.96, - "learning_rate": 1.5871313931731188e-06, - "loss": 0.7354, - "step": 37602 - }, - { - "epoch": 0.96, - "learning_rate": 1.587108993947044e-06, - "loss": 0.9873, - "step": 37603 - }, - { - "epoch": 0.96, - "learning_rate": 1.5870865942714466e-06, - "loss": 0.6523, - "step": 37604 - }, - { - "epoch": 0.96, - "learning_rate": 1.5870641941463446e-06, - "loss": 1.0117, - "step": 37605 - }, - { - "epoch": 0.96, - "learning_rate": 1.5870417935717537e-06, - "loss": 0.9609, - "step": 37606 - }, - { - "epoch": 0.96, - "learning_rate": 1.5870193925476924e-06, - "loss": 0.9336, - "step": 37607 - }, - { - "epoch": 0.96, - "learning_rate": 1.5869969910741774e-06, - "loss": 0.8018, - "step": 37608 - }, - { - "epoch": 0.96, - "learning_rate": 1.5869745891512257e-06, - "loss": 0.8467, - "step": 37609 - }, - { - "epoch": 0.96, - "learning_rate": 1.5869521867788544e-06, - "loss": 0.9219, - "step": 37610 - }, - { - "epoch": 0.96, - "learning_rate": 1.5869297839570809e-06, - "loss": 0.9678, - "step": 37611 - }, - { - "epoch": 0.96, - "learning_rate": 1.5869073806859223e-06, - "loss": 0.9375, - "step": 37612 - }, - { - "epoch": 0.96, - "learning_rate": 1.5868849769653956e-06, - "loss": 0.7051, - "step": 37613 - }, - { - "epoch": 0.96, - "learning_rate": 1.586862572795518e-06, - "loss": 0.8721, - "step": 37614 - }, - { - "epoch": 0.96, - "learning_rate": 1.586840168176307e-06, - "loss": 0.8701, - "step": 37615 - }, - { - "epoch": 0.96, - "learning_rate": 1.5868177631077794e-06, - "loss": 0.8535, - "step": 37616 - }, - { - "epoch": 0.96, - "learning_rate": 1.5867953575899523e-06, - "loss": 0.8027, - "step": 37617 - }, - { - "epoch": 0.96, - "learning_rate": 1.586772951622843e-06, - "loss": 0.9043, - "step": 37618 - }, - { - "epoch": 0.96, - "learning_rate": 1.5867505452064686e-06, - "loss": 0.875, - "step": 37619 - }, - { - "epoch": 0.96, - "learning_rate": 1.5867281383408463e-06, - "loss": 0.7676, - "step": 37620 - }, - { - "epoch": 0.96, - "learning_rate": 1.5867057310259932e-06, - "loss": 0.8105, - "step": 37621 - }, - { - "epoch": 0.96, - "learning_rate": 1.5866833232619265e-06, - "loss": 0.8428, - "step": 37622 - }, - { - "epoch": 0.96, - "learning_rate": 1.5866609150486637e-06, - "loss": 0.7637, - "step": 37623 - }, - { - "epoch": 0.96, - "learning_rate": 1.586638506386221e-06, - "loss": 0.957, - "step": 37624 - }, - { - "epoch": 0.96, - "learning_rate": 1.5866160972746168e-06, - "loss": 0.7773, - "step": 37625 - }, - { - "epoch": 0.96, - "learning_rate": 1.5865936877138674e-06, - "loss": 0.6777, - "step": 37626 - }, - { - "epoch": 0.96, - "learning_rate": 1.58657127770399e-06, - "loss": 0.9424, - "step": 37627 - }, - { - "epoch": 0.96, - "learning_rate": 1.586548867245002e-06, - "loss": 0.8013, - "step": 37628 - }, - { - "epoch": 0.96, - "learning_rate": 1.5865264563369205e-06, - "loss": 0.8447, - "step": 37629 - }, - { - "epoch": 0.96, - "learning_rate": 1.5865040449797628e-06, - "loss": 0.6948, - "step": 37630 - }, - { - "epoch": 0.96, - "learning_rate": 1.586481633173546e-06, - "loss": 0.8955, - "step": 37631 - }, - { - "epoch": 0.96, - "learning_rate": 1.5864592209182867e-06, - "loss": 0.9756, - "step": 37632 - }, - { - "epoch": 0.96, - "learning_rate": 1.586436808214003e-06, - "loss": 0.7529, - "step": 37633 - }, - { - "epoch": 0.96, - "learning_rate": 1.5864143950607115e-06, - "loss": 0.8276, - "step": 37634 - }, - { - "epoch": 0.96, - "learning_rate": 1.5863919814584295e-06, - "loss": 0.916, - "step": 37635 - }, - { - "epoch": 0.96, - "learning_rate": 1.586369567407174e-06, - "loss": 0.9473, - "step": 37636 - }, - { - "epoch": 0.96, - "learning_rate": 1.5863471529069623e-06, - "loss": 0.7949, - "step": 37637 - }, - { - "epoch": 0.96, - "learning_rate": 1.5863247379578115e-06, - "loss": 0.7881, - "step": 37638 - }, - { - "epoch": 0.96, - "learning_rate": 1.586302322559739e-06, - "loss": 0.8359, - "step": 37639 - }, - { - "epoch": 0.96, - "learning_rate": 1.5862799067127616e-06, - "loss": 0.959, - "step": 37640 - }, - { - "epoch": 0.96, - "learning_rate": 1.5862574904168966e-06, - "loss": 0.9463, - "step": 37641 - }, - { - "epoch": 0.96, - "learning_rate": 1.5862350736721615e-06, - "loss": 0.6367, - "step": 37642 - }, - { - "epoch": 0.96, - "learning_rate": 1.5862126564785729e-06, - "loss": 0.6289, - "step": 37643 - }, - { - "epoch": 0.96, - "learning_rate": 1.5861902388361483e-06, - "loss": 0.9014, - "step": 37644 - }, - { - "epoch": 0.96, - "learning_rate": 1.5861678207449048e-06, - "loss": 1.0215, - "step": 37645 - }, - { - "epoch": 0.96, - "learning_rate": 1.5861454022048593e-06, - "loss": 0.6162, - "step": 37646 - }, - { - "epoch": 0.96, - "learning_rate": 1.5861229832160294e-06, - "loss": 1.0273, - "step": 37647 - }, - { - "epoch": 0.96, - "learning_rate": 1.5861005637784321e-06, - "loss": 0.9844, - "step": 37648 - }, - { - "epoch": 0.96, - "learning_rate": 1.5860781438920845e-06, - "loss": 0.9873, - "step": 37649 - }, - { - "epoch": 0.96, - "learning_rate": 1.586055723557004e-06, - "loss": 0.9551, - "step": 37650 - }, - { - "epoch": 0.97, - "learning_rate": 1.5860333027732075e-06, - "loss": 0.7979, - "step": 37651 - }, - { - "epoch": 0.97, - "learning_rate": 1.5860108815407123e-06, - "loss": 0.7822, - "step": 37652 - }, - { - "epoch": 0.97, - "learning_rate": 1.5859884598595353e-06, - "loss": 0.8926, - "step": 37653 - }, - { - "epoch": 0.97, - "learning_rate": 1.585966037729694e-06, - "loss": 0.8843, - "step": 37654 - }, - { - "epoch": 0.97, - "learning_rate": 1.5859436151512056e-06, - "loss": 0.833, - "step": 37655 - }, - { - "epoch": 0.97, - "learning_rate": 1.5859211921240869e-06, - "loss": 0.6255, - "step": 37656 - }, - { - "epoch": 0.97, - "learning_rate": 1.5858987686483553e-06, - "loss": 0.8018, - "step": 37657 - }, - { - "epoch": 0.97, - "learning_rate": 1.585876344724028e-06, - "loss": 1.0098, - "step": 37658 - }, - { - "epoch": 0.97, - "learning_rate": 1.5858539203511221e-06, - "loss": 0.7842, - "step": 37659 - }, - { - "epoch": 0.97, - "learning_rate": 1.5858314955296547e-06, - "loss": 0.7605, - "step": 37660 - }, - { - "epoch": 0.97, - "learning_rate": 1.5858090702596433e-06, - "loss": 0.9473, - "step": 37661 - }, - { - "epoch": 0.97, - "learning_rate": 1.5857866445411047e-06, - "loss": 1.0928, - "step": 37662 - }, - { - "epoch": 0.97, - "learning_rate": 1.5857642183740562e-06, - "loss": 0.7812, - "step": 37663 - }, - { - "epoch": 0.97, - "learning_rate": 1.5857417917585152e-06, - "loss": 1.1113, - "step": 37664 - }, - { - "epoch": 0.97, - "learning_rate": 1.5857193646944983e-06, - "loss": 1.0527, - "step": 37665 - }, - { - "epoch": 0.97, - "learning_rate": 1.585696937182023e-06, - "loss": 0.7979, - "step": 37666 - }, - { - "epoch": 0.97, - "learning_rate": 1.5856745092211066e-06, - "loss": 0.875, - "step": 37667 - }, - { - "epoch": 0.97, - "learning_rate": 1.5856520808117662e-06, - "loss": 0.9203, - "step": 37668 - }, - { - "epoch": 0.97, - "learning_rate": 1.5856296519540191e-06, - "loss": 0.6572, - "step": 37669 - }, - { - "epoch": 0.97, - "learning_rate": 1.585607222647882e-06, - "loss": 0.6187, - "step": 37670 - }, - { - "epoch": 0.97, - "learning_rate": 1.5855847928933726e-06, - "loss": 0.7163, - "step": 37671 - }, - { - "epoch": 0.97, - "learning_rate": 1.5855623626905078e-06, - "loss": 0.7642, - "step": 37672 - }, - { - "epoch": 0.97, - "learning_rate": 1.5855399320393046e-06, - "loss": 0.8848, - "step": 37673 - }, - { - "epoch": 0.97, - "learning_rate": 1.5855175009397806e-06, - "loss": 0.8965, - "step": 37674 - }, - { - "epoch": 0.97, - "learning_rate": 1.585495069391953e-06, - "loss": 0.6675, - "step": 37675 - }, - { - "epoch": 0.97, - "learning_rate": 1.585472637395838e-06, - "loss": 0.7783, - "step": 37676 - }, - { - "epoch": 0.97, - "learning_rate": 1.5854502049514542e-06, - "loss": 0.7417, - "step": 37677 - }, - { - "epoch": 0.97, - "learning_rate": 1.5854277720588178e-06, - "loss": 0.8105, - "step": 37678 - }, - { - "epoch": 0.97, - "learning_rate": 1.5854053387179466e-06, - "loss": 0.9414, - "step": 37679 - }, - { - "epoch": 0.97, - "learning_rate": 1.585382904928857e-06, - "loss": 0.8672, - "step": 37680 - }, - { - "epoch": 0.97, - "learning_rate": 1.585360470691567e-06, - "loss": 0.8828, - "step": 37681 - }, - { - "epoch": 0.97, - "learning_rate": 1.5853380360060933e-06, - "loss": 0.9082, - "step": 37682 - }, - { - "epoch": 0.97, - "learning_rate": 1.5853156008724532e-06, - "loss": 0.6533, - "step": 37683 - }, - { - "epoch": 0.97, - "learning_rate": 1.5852931652906636e-06, - "loss": 0.8013, - "step": 37684 - }, - { - "epoch": 0.97, - "learning_rate": 1.585270729260742e-06, - "loss": 0.8916, - "step": 37685 - }, - { - "epoch": 0.97, - "learning_rate": 1.5852482927827056e-06, - "loss": 0.748, - "step": 37686 - }, - { - "epoch": 0.97, - "learning_rate": 1.5852258558565716e-06, - "loss": 1.0273, - "step": 37687 - }, - { - "epoch": 0.97, - "learning_rate": 1.585203418482357e-06, - "loss": 0.7122, - "step": 37688 - }, - { - "epoch": 0.97, - "learning_rate": 1.5851809806600791e-06, - "loss": 0.8379, - "step": 37689 - }, - { - "epoch": 0.97, - "learning_rate": 1.585158542389755e-06, - "loss": 0.5376, - "step": 37690 - }, - { - "epoch": 0.97, - "learning_rate": 1.585136103671402e-06, - "loss": 0.8071, - "step": 37691 - }, - { - "epoch": 0.97, - "learning_rate": 1.585113664505037e-06, - "loss": 0.7505, - "step": 37692 - }, - { - "epoch": 0.97, - "learning_rate": 1.5850912248906774e-06, - "loss": 0.7769, - "step": 37693 - }, - { - "epoch": 0.97, - "learning_rate": 1.5850687848283405e-06, - "loss": 1.0928, - "step": 37694 - }, - { - "epoch": 0.97, - "learning_rate": 1.5850463443180433e-06, - "loss": 0.6582, - "step": 37695 - }, - { - "epoch": 0.97, - "learning_rate": 1.585023903359803e-06, - "loss": 0.8604, - "step": 37696 - }, - { - "epoch": 0.97, - "learning_rate": 1.5850014619536367e-06, - "loss": 0.9834, - "step": 37697 - }, - { - "epoch": 0.97, - "learning_rate": 1.5849790200995617e-06, - "loss": 0.6455, - "step": 37698 - }, - { - "epoch": 0.97, - "learning_rate": 1.5849565777975952e-06, - "loss": 0.5706, - "step": 37699 - }, - { - "epoch": 0.97, - "learning_rate": 1.5849341350477544e-06, - "loss": 0.8652, - "step": 37700 - }, - { - "epoch": 0.97, - "learning_rate": 1.5849116918500562e-06, - "loss": 1.0039, - "step": 37701 - }, - { - "epoch": 0.97, - "learning_rate": 1.5848892482045182e-06, - "loss": 0.8564, - "step": 37702 - }, - { - "epoch": 0.97, - "learning_rate": 1.5848668041111575e-06, - "loss": 0.9639, - "step": 37703 - }, - { - "epoch": 0.97, - "learning_rate": 1.5848443595699913e-06, - "loss": 0.7578, - "step": 37704 - }, - { - "epoch": 0.97, - "learning_rate": 1.5848219145810364e-06, - "loss": 0.9072, - "step": 37705 - }, - { - "epoch": 0.97, - "learning_rate": 1.58479946914431e-06, - "loss": 0.6245, - "step": 37706 - }, - { - "epoch": 0.97, - "learning_rate": 1.58477702325983e-06, - "loss": 0.8818, - "step": 37707 - }, - { - "epoch": 0.97, - "learning_rate": 1.584754576927613e-06, - "loss": 1.3623, - "step": 37708 - }, - { - "epoch": 0.97, - "learning_rate": 1.584732130147676e-06, - "loss": 0.9512, - "step": 37709 - }, - { - "epoch": 0.97, - "learning_rate": 1.5847096829200368e-06, - "loss": 0.9561, - "step": 37710 - }, - { - "epoch": 0.97, - "learning_rate": 1.5846872352447123e-06, - "loss": 0.7578, - "step": 37711 - }, - { - "epoch": 0.97, - "learning_rate": 1.5846647871217194e-06, - "loss": 0.8438, - "step": 37712 - }, - { - "epoch": 0.97, - "learning_rate": 1.5846423385510757e-06, - "loss": 0.9814, - "step": 37713 - }, - { - "epoch": 0.97, - "learning_rate": 1.5846198895327984e-06, - "loss": 0.8887, - "step": 37714 - }, - { - "epoch": 0.97, - "learning_rate": 1.5845974400669047e-06, - "loss": 0.8066, - "step": 37715 - }, - { - "epoch": 0.97, - "learning_rate": 1.5845749901534112e-06, - "loss": 0.7668, - "step": 37716 - }, - { - "epoch": 0.97, - "learning_rate": 1.5845525397923355e-06, - "loss": 0.7041, - "step": 37717 - }, - { - "epoch": 0.97, - "learning_rate": 1.584530088983695e-06, - "loss": 0.7969, - "step": 37718 - }, - { - "epoch": 0.97, - "learning_rate": 1.5845076377275065e-06, - "loss": 0.9956, - "step": 37719 - }, - { - "epoch": 0.97, - "learning_rate": 1.5844851860237877e-06, - "loss": 0.6997, - "step": 37720 - }, - { - "epoch": 0.97, - "learning_rate": 1.5844627338725554e-06, - "loss": 1.0693, - "step": 37721 - }, - { - "epoch": 0.97, - "learning_rate": 1.5844402812738266e-06, - "loss": 0.696, - "step": 37722 - }, - { - "epoch": 0.97, - "learning_rate": 1.584417828227619e-06, - "loss": 0.6357, - "step": 37723 - }, - { - "epoch": 0.97, - "learning_rate": 1.5843953747339494e-06, - "loss": 0.6619, - "step": 37724 - }, - { - "epoch": 0.97, - "learning_rate": 1.5843729207928354e-06, - "loss": 0.6421, - "step": 37725 - }, - { - "epoch": 0.97, - "learning_rate": 1.5843504664042934e-06, - "loss": 0.7197, - "step": 37726 - }, - { - "epoch": 0.97, - "learning_rate": 1.5843280115683414e-06, - "loss": 0.8242, - "step": 37727 - }, - { - "epoch": 0.97, - "learning_rate": 1.5843055562849964e-06, - "loss": 0.8965, - "step": 37728 - }, - { - "epoch": 0.97, - "learning_rate": 1.5842831005542756e-06, - "loss": 0.7617, - "step": 37729 - }, - { - "epoch": 0.97, - "learning_rate": 1.584260644376196e-06, - "loss": 0.6948, - "step": 37730 - }, - { - "epoch": 0.97, - "learning_rate": 1.5842381877507744e-06, - "loss": 0.7373, - "step": 37731 - }, - { - "epoch": 0.97, - "learning_rate": 1.584215730678029e-06, - "loss": 0.8193, - "step": 37732 - }, - { - "epoch": 0.97, - "learning_rate": 1.5841932731579766e-06, - "loss": 0.7383, - "step": 37733 - }, - { - "epoch": 0.97, - "learning_rate": 1.5841708151906338e-06, - "loss": 0.6143, - "step": 37734 - }, - { - "epoch": 0.97, - "learning_rate": 1.5841483567760186e-06, - "loss": 1.0527, - "step": 37735 - }, - { - "epoch": 0.97, - "learning_rate": 1.5841258979141476e-06, - "loss": 0.8682, - "step": 37736 - }, - { - "epoch": 0.97, - "learning_rate": 1.5841034386050388e-06, - "loss": 0.8711, - "step": 37737 - }, - { - "epoch": 0.97, - "learning_rate": 1.5840809788487082e-06, - "loss": 0.6533, - "step": 37738 - }, - { - "epoch": 0.97, - "learning_rate": 1.584058518645174e-06, - "loss": 0.8613, - "step": 37739 - }, - { - "epoch": 0.97, - "learning_rate": 1.584036057994453e-06, - "loss": 0.7617, - "step": 37740 - }, - { - "epoch": 0.97, - "learning_rate": 1.5840135968965625e-06, - "loss": 0.9277, - "step": 37741 - }, - { - "epoch": 0.97, - "learning_rate": 1.5839911353515194e-06, - "loss": 0.7744, - "step": 37742 - }, - { - "epoch": 0.97, - "learning_rate": 1.5839686733593414e-06, - "loss": 0.7197, - "step": 37743 - }, - { - "epoch": 0.97, - "learning_rate": 1.5839462109200454e-06, - "loss": 0.5415, - "step": 37744 - }, - { - "epoch": 0.97, - "learning_rate": 1.5839237480336488e-06, - "loss": 0.7324, - "step": 37745 - }, - { - "epoch": 0.97, - "learning_rate": 1.5839012847001682e-06, - "loss": 0.8535, - "step": 37746 - }, - { - "epoch": 0.97, - "learning_rate": 1.5838788209196214e-06, - "loss": 0.7874, - "step": 37747 - }, - { - "epoch": 0.97, - "learning_rate": 1.5838563566920256e-06, - "loss": 0.7998, - "step": 37748 - }, - { - "epoch": 0.97, - "learning_rate": 1.583833892017398e-06, - "loss": 0.9736, - "step": 37749 - }, - { - "epoch": 0.97, - "learning_rate": 1.583811426895755e-06, - "loss": 0.7832, - "step": 37750 - }, - { - "epoch": 0.97, - "learning_rate": 1.5837889613271149e-06, - "loss": 0.7776, - "step": 37751 - }, - { - "epoch": 0.97, - "learning_rate": 1.5837664953114941e-06, - "loss": 0.8955, - "step": 37752 - }, - { - "epoch": 0.97, - "learning_rate": 1.5837440288489106e-06, - "loss": 0.7344, - "step": 37753 - }, - { - "epoch": 0.97, - "learning_rate": 1.5837215619393809e-06, - "loss": 0.6343, - "step": 37754 - }, - { - "epoch": 0.97, - "learning_rate": 1.5836990945829224e-06, - "loss": 0.9482, - "step": 37755 - }, - { - "epoch": 0.97, - "learning_rate": 1.5836766267795523e-06, - "loss": 0.813, - "step": 37756 - }, - { - "epoch": 0.97, - "learning_rate": 1.583654158529288e-06, - "loss": 0.73, - "step": 37757 - }, - { - "epoch": 0.97, - "learning_rate": 1.5836316898321464e-06, - "loss": 0.9824, - "step": 37758 - }, - { - "epoch": 0.97, - "learning_rate": 1.583609220688145e-06, - "loss": 0.8228, - "step": 37759 - }, - { - "epoch": 0.97, - "learning_rate": 1.5835867510973009e-06, - "loss": 0.7246, - "step": 37760 - }, - { - "epoch": 0.97, - "learning_rate": 1.583564281059631e-06, - "loss": 0.7568, - "step": 37761 - }, - { - "epoch": 0.97, - "learning_rate": 1.583541810575153e-06, - "loss": 0.8057, - "step": 37762 - }, - { - "epoch": 0.97, - "learning_rate": 1.5835193396438837e-06, - "loss": 1.0527, - "step": 37763 - }, - { - "epoch": 0.97, - "learning_rate": 1.5834968682658407e-06, - "loss": 1.0645, - "step": 37764 - }, - { - "epoch": 0.97, - "learning_rate": 1.5834743964410408e-06, - "loss": 0.8101, - "step": 37765 - }, - { - "epoch": 0.97, - "learning_rate": 1.5834519241695015e-06, - "loss": 0.5063, - "step": 37766 - }, - { - "epoch": 0.97, - "learning_rate": 1.5834294514512396e-06, - "loss": 0.8848, - "step": 37767 - }, - { - "epoch": 0.97, - "learning_rate": 1.5834069782862728e-06, - "loss": 0.7949, - "step": 37768 - }, - { - "epoch": 0.97, - "learning_rate": 1.5833845046746184e-06, - "loss": 0.9453, - "step": 37769 - }, - { - "epoch": 0.97, - "learning_rate": 1.583362030616293e-06, - "loss": 0.7715, - "step": 37770 - }, - { - "epoch": 0.97, - "learning_rate": 1.583339556111314e-06, - "loss": 0.8867, - "step": 37771 - }, - { - "epoch": 0.97, - "learning_rate": 1.583317081159699e-06, - "loss": 0.8652, - "step": 37772 - }, - { - "epoch": 0.97, - "learning_rate": 1.5832946057614644e-06, - "loss": 0.8291, - "step": 37773 - }, - { - "epoch": 0.97, - "learning_rate": 1.5832721299166285e-06, - "loss": 1.0166, - "step": 37774 - }, - { - "epoch": 0.97, - "learning_rate": 1.5832496536252079e-06, - "loss": 1.1689, - "step": 37775 - }, - { - "epoch": 0.97, - "learning_rate": 1.5832271768872196e-06, - "loss": 0.8594, - "step": 37776 - }, - { - "epoch": 0.97, - "learning_rate": 1.5832046997026813e-06, - "loss": 0.6323, - "step": 37777 - }, - { - "epoch": 0.97, - "learning_rate": 1.5831822220716097e-06, - "loss": 0.959, - "step": 37778 - }, - { - "epoch": 0.97, - "learning_rate": 1.5831597439940225e-06, - "loss": 0.6938, - "step": 37779 - }, - { - "epoch": 0.97, - "learning_rate": 1.583137265469937e-06, - "loss": 0.9619, - "step": 37780 - }, - { - "epoch": 0.97, - "learning_rate": 1.5831147864993697e-06, - "loss": 1.0283, - "step": 37781 - }, - { - "epoch": 0.97, - "learning_rate": 1.583092307082338e-06, - "loss": 0.7764, - "step": 37782 - }, - { - "epoch": 0.97, - "learning_rate": 1.5830698272188596e-06, - "loss": 0.8003, - "step": 37783 - }, - { - "epoch": 0.97, - "learning_rate": 1.5830473469089518e-06, - "loss": 0.7373, - "step": 37784 - }, - { - "epoch": 0.97, - "learning_rate": 1.5830248661526308e-06, - "loss": 0.7861, - "step": 37785 - }, - { - "epoch": 0.97, - "learning_rate": 1.583002384949915e-06, - "loss": 0.9023, - "step": 37786 - }, - { - "epoch": 0.97, - "learning_rate": 1.582979903300821e-06, - "loss": 0.8887, - "step": 37787 - }, - { - "epoch": 0.97, - "learning_rate": 1.5829574212053658e-06, - "loss": 0.5959, - "step": 37788 - }, - { - "epoch": 0.97, - "learning_rate": 1.5829349386635671e-06, - "loss": 0.8467, - "step": 37789 - }, - { - "epoch": 0.97, - "learning_rate": 1.5829124556754422e-06, - "loss": 0.8018, - "step": 37790 - }, - { - "epoch": 0.97, - "learning_rate": 1.5828899722410073e-06, - "loss": 0.7969, - "step": 37791 - }, - { - "epoch": 0.97, - "learning_rate": 1.5828674883602807e-06, - "loss": 0.792, - "step": 37792 - }, - { - "epoch": 0.97, - "learning_rate": 1.5828450040332796e-06, - "loss": 0.8096, - "step": 37793 - }, - { - "epoch": 0.97, - "learning_rate": 1.5828225192600209e-06, - "loss": 0.791, - "step": 37794 - }, - { - "epoch": 0.97, - "learning_rate": 1.5828000340405212e-06, - "loss": 0.7808, - "step": 37795 - }, - { - "epoch": 0.97, - "learning_rate": 1.5827775483747987e-06, - "loss": 0.8613, - "step": 37796 - }, - { - "epoch": 0.97, - "learning_rate": 1.58275506226287e-06, - "loss": 1.0361, - "step": 37797 - }, - { - "epoch": 0.97, - "learning_rate": 1.5827325757047528e-06, - "loss": 0.7891, - "step": 37798 - }, - { - "epoch": 0.97, - "learning_rate": 1.5827100887004641e-06, - "loss": 0.5698, - "step": 37799 - }, - { - "epoch": 0.97, - "learning_rate": 1.5826876012500208e-06, - "loss": 0.79, - "step": 37800 - }, - { - "epoch": 0.97, - "learning_rate": 1.5826651133534407e-06, - "loss": 0.7637, - "step": 37801 - }, - { - "epoch": 0.97, - "learning_rate": 1.5826426250107402e-06, - "loss": 0.5571, - "step": 37802 - }, - { - "epoch": 0.97, - "learning_rate": 1.5826201362219375e-06, - "loss": 0.7861, - "step": 37803 - }, - { - "epoch": 0.97, - "learning_rate": 1.5825976469870494e-06, - "loss": 0.7065, - "step": 37804 - }, - { - "epoch": 0.97, - "learning_rate": 1.582575157306093e-06, - "loss": 0.7666, - "step": 37805 - }, - { - "epoch": 0.97, - "learning_rate": 1.5825526671790855e-06, - "loss": 0.998, - "step": 37806 - }, - { - "epoch": 0.97, - "learning_rate": 1.5825301766060441e-06, - "loss": 0.6924, - "step": 37807 - }, - { - "epoch": 0.97, - "learning_rate": 1.5825076855869863e-06, - "loss": 0.8682, - "step": 37808 - }, - { - "epoch": 0.97, - "learning_rate": 1.5824851941219293e-06, - "loss": 0.538, - "step": 37809 - }, - { - "epoch": 0.97, - "learning_rate": 1.58246270221089e-06, - "loss": 0.561, - "step": 37810 - }, - { - "epoch": 0.97, - "learning_rate": 1.5824402098538856e-06, - "loss": 0.7432, - "step": 37811 - }, - { - "epoch": 0.97, - "learning_rate": 1.5824177170509337e-06, - "loss": 0.6426, - "step": 37812 - }, - { - "epoch": 0.97, - "learning_rate": 1.5823952238020513e-06, - "loss": 0.6997, - "step": 37813 - }, - { - "epoch": 0.97, - "learning_rate": 1.5823727301072558e-06, - "loss": 0.8438, - "step": 37814 - }, - { - "epoch": 0.97, - "learning_rate": 1.582350235966564e-06, - "loss": 0.9102, - "step": 37815 - }, - { - "epoch": 0.97, - "learning_rate": 1.5823277413799936e-06, - "loss": 0.9199, - "step": 37816 - }, - { - "epoch": 0.97, - "learning_rate": 1.5823052463475614e-06, - "loss": 0.8779, - "step": 37817 - }, - { - "epoch": 0.97, - "learning_rate": 1.5822827508692851e-06, - "loss": 0.8662, - "step": 37818 - }, - { - "epoch": 0.97, - "learning_rate": 1.5822602549451815e-06, - "loss": 0.7197, - "step": 37819 - }, - { - "epoch": 0.97, - "learning_rate": 1.582237758575268e-06, - "loss": 0.9209, - "step": 37820 - }, - { - "epoch": 0.97, - "learning_rate": 1.582215261759562e-06, - "loss": 0.9141, - "step": 37821 - }, - { - "epoch": 0.97, - "learning_rate": 1.5821927644980804e-06, - "loss": 0.8755, - "step": 37822 - }, - { - "epoch": 0.97, - "learning_rate": 1.5821702667908406e-06, - "loss": 0.8379, - "step": 37823 - }, - { - "epoch": 0.97, - "learning_rate": 1.58214776863786e-06, - "loss": 0.8086, - "step": 37824 - }, - { - "epoch": 0.97, - "learning_rate": 1.5821252700391554e-06, - "loss": 0.7812, - "step": 37825 - }, - { - "epoch": 0.97, - "learning_rate": 1.5821027709947442e-06, - "loss": 0.7251, - "step": 37826 - }, - { - "epoch": 0.97, - "learning_rate": 1.5820802715046438e-06, - "loss": 0.8062, - "step": 37827 - }, - { - "epoch": 0.97, - "learning_rate": 1.5820577715688712e-06, - "loss": 0.7471, - "step": 37828 - }, - { - "epoch": 0.97, - "learning_rate": 1.582035271187444e-06, - "loss": 0.7783, - "step": 37829 - }, - { - "epoch": 0.97, - "learning_rate": 1.5820127703603786e-06, - "loss": 0.7295, - "step": 37830 - }, - { - "epoch": 0.97, - "learning_rate": 1.5819902690876931e-06, - "loss": 0.877, - "step": 37831 - }, - { - "epoch": 0.97, - "learning_rate": 1.5819677673694045e-06, - "loss": 0.7363, - "step": 37832 - }, - { - "epoch": 0.97, - "learning_rate": 1.58194526520553e-06, - "loss": 0.9756, - "step": 37833 - }, - { - "epoch": 0.97, - "learning_rate": 1.5819227625960868e-06, - "loss": 0.9648, - "step": 37834 - }, - { - "epoch": 0.97, - "learning_rate": 1.5819002595410917e-06, - "loss": 0.8911, - "step": 37835 - }, - { - "epoch": 0.97, - "learning_rate": 1.5818777560405628e-06, - "loss": 0.688, - "step": 37836 - }, - { - "epoch": 0.97, - "learning_rate": 1.5818552520945165e-06, - "loss": 0.9609, - "step": 37837 - }, - { - "epoch": 0.97, - "learning_rate": 1.5818327477029706e-06, - "loss": 0.9854, - "step": 37838 - }, - { - "epoch": 0.97, - "learning_rate": 1.5818102428659418e-06, - "loss": 0.8848, - "step": 37839 - }, - { - "epoch": 0.97, - "learning_rate": 1.581787737583448e-06, - "loss": 1.0439, - "step": 37840 - }, - { - "epoch": 0.97, - "learning_rate": 1.581765231855506e-06, - "loss": 1.4229, - "step": 37841 - }, - { - "epoch": 0.97, - "learning_rate": 1.5817427256821331e-06, - "loss": 1.1377, - "step": 37842 - }, - { - "epoch": 0.97, - "learning_rate": 1.5817202190633462e-06, - "loss": 0.9199, - "step": 37843 - }, - { - "epoch": 0.97, - "learning_rate": 1.5816977119991635e-06, - "loss": 0.8936, - "step": 37844 - }, - { - "epoch": 0.97, - "learning_rate": 1.5816752044896014e-06, - "loss": 0.8975, - "step": 37845 - }, - { - "epoch": 0.97, - "learning_rate": 1.581652696534677e-06, - "loss": 0.6406, - "step": 37846 - }, - { - "epoch": 0.97, - "learning_rate": 1.581630188134408e-06, - "loss": 0.9502, - "step": 37847 - }, - { - "epoch": 0.97, - "learning_rate": 1.5816076792888118e-06, - "loss": 0.9492, - "step": 37848 - }, - { - "epoch": 0.97, - "learning_rate": 1.5815851699979055e-06, - "loss": 0.707, - "step": 37849 - }, - { - "epoch": 0.97, - "learning_rate": 1.5815626602617055e-06, - "loss": 0.7175, - "step": 37850 - }, - { - "epoch": 0.97, - "learning_rate": 1.58154015008023e-06, - "loss": 0.563, - "step": 37851 - }, - { - "epoch": 0.97, - "learning_rate": 1.581517639453496e-06, - "loss": 1.1787, - "step": 37852 - }, - { - "epoch": 0.97, - "learning_rate": 1.5814951283815207e-06, - "loss": 0.7109, - "step": 37853 - }, - { - "epoch": 0.97, - "learning_rate": 1.5814726168643215e-06, - "loss": 0.9106, - "step": 37854 - }, - { - "epoch": 0.97, - "learning_rate": 1.5814501049019153e-06, - "loss": 0.7896, - "step": 37855 - }, - { - "epoch": 0.97, - "learning_rate": 1.5814275924943195e-06, - "loss": 0.6836, - "step": 37856 - }, - { - "epoch": 0.97, - "learning_rate": 1.5814050796415511e-06, - "loss": 0.9277, - "step": 37857 - }, - { - "epoch": 0.97, - "learning_rate": 1.5813825663436278e-06, - "loss": 0.8887, - "step": 37858 - }, - { - "epoch": 0.97, - "learning_rate": 1.5813600526005666e-06, - "loss": 0.5684, - "step": 37859 - }, - { - "epoch": 0.97, - "learning_rate": 1.5813375384123848e-06, - "loss": 0.9287, - "step": 37860 - }, - { - "epoch": 0.97, - "learning_rate": 1.5813150237790996e-06, - "loss": 0.9443, - "step": 37861 - }, - { - "epoch": 0.97, - "learning_rate": 1.5812925087007278e-06, - "loss": 0.9111, - "step": 37862 - }, - { - "epoch": 0.97, - "learning_rate": 1.5812699931772873e-06, - "loss": 0.8291, - "step": 37863 - }, - { - "epoch": 0.97, - "learning_rate": 1.5812474772087953e-06, - "loss": 0.8838, - "step": 37864 - }, - { - "epoch": 0.97, - "learning_rate": 1.5812249607952686e-06, - "loss": 1.0664, - "step": 37865 - }, - { - "epoch": 0.97, - "learning_rate": 1.5812024439367247e-06, - "loss": 0.8496, - "step": 37866 - }, - { - "epoch": 0.97, - "learning_rate": 1.5811799266331809e-06, - "loss": 0.792, - "step": 37867 - }, - { - "epoch": 0.97, - "learning_rate": 1.5811574088846542e-06, - "loss": 0.8838, - "step": 37868 - }, - { - "epoch": 0.97, - "learning_rate": 1.581134890691162e-06, - "loss": 0.9717, - "step": 37869 - }, - { - "epoch": 0.97, - "learning_rate": 1.581112372052722e-06, - "loss": 0.8818, - "step": 37870 - }, - { - "epoch": 0.97, - "learning_rate": 1.5810898529693505e-06, - "loss": 0.9707, - "step": 37871 - }, - { - "epoch": 0.97, - "learning_rate": 1.581067333441065e-06, - "loss": 1.0225, - "step": 37872 - }, - { - "epoch": 0.97, - "learning_rate": 1.5810448134678834e-06, - "loss": 0.8359, - "step": 37873 - }, - { - "epoch": 0.97, - "learning_rate": 1.5810222930498225e-06, - "loss": 0.8369, - "step": 37874 - }, - { - "epoch": 0.97, - "learning_rate": 1.5809997721868995e-06, - "loss": 0.8008, - "step": 37875 - }, - { - "epoch": 0.97, - "learning_rate": 1.5809772508791315e-06, - "loss": 0.8623, - "step": 37876 - }, - { - "epoch": 0.97, - "learning_rate": 1.5809547291265361e-06, - "loss": 0.7422, - "step": 37877 - }, - { - "epoch": 0.97, - "learning_rate": 1.5809322069291305e-06, - "loss": 0.7441, - "step": 37878 - }, - { - "epoch": 0.97, - "learning_rate": 1.5809096842869315e-06, - "loss": 0.7124, - "step": 37879 - }, - { - "epoch": 0.97, - "learning_rate": 1.580887161199957e-06, - "loss": 0.8076, - "step": 37880 - }, - { - "epoch": 0.97, - "learning_rate": 1.5808646376682236e-06, - "loss": 0.7542, - "step": 37881 - }, - { - "epoch": 0.97, - "learning_rate": 1.5808421136917489e-06, - "loss": 0.8271, - "step": 37882 - }, - { - "epoch": 0.97, - "learning_rate": 1.5808195892705504e-06, - "loss": 0.9395, - "step": 37883 - }, - { - "epoch": 0.97, - "learning_rate": 1.580797064404645e-06, - "loss": 0.8013, - "step": 37884 - }, - { - "epoch": 0.97, - "learning_rate": 1.5807745390940497e-06, - "loss": 1.1436, - "step": 37885 - }, - { - "epoch": 0.97, - "learning_rate": 1.580752013338782e-06, - "loss": 0.9258, - "step": 37886 - }, - { - "epoch": 0.97, - "learning_rate": 1.5807294871388595e-06, - "loss": 0.8335, - "step": 37887 - }, - { - "epoch": 0.97, - "learning_rate": 1.5807069604942988e-06, - "loss": 0.8203, - "step": 37888 - }, - { - "epoch": 0.97, - "learning_rate": 1.5806844334051178e-06, - "loss": 1.0723, - "step": 37889 - }, - { - "epoch": 0.97, - "learning_rate": 1.5806619058713332e-06, - "loss": 0.7812, - "step": 37890 - }, - { - "epoch": 0.97, - "learning_rate": 1.5806393778929628e-06, - "loss": 0.8301, - "step": 37891 - }, - { - "epoch": 0.97, - "learning_rate": 1.5806168494700232e-06, - "loss": 0.6631, - "step": 37892 - }, - { - "epoch": 0.97, - "learning_rate": 1.5805943206025321e-06, - "loss": 0.9375, - "step": 37893 - }, - { - "epoch": 0.97, - "learning_rate": 1.5805717912905067e-06, - "loss": 0.5706, - "step": 37894 - }, - { - "epoch": 0.97, - "learning_rate": 1.5805492615339639e-06, - "loss": 0.6938, - "step": 37895 - }, - { - "epoch": 0.97, - "learning_rate": 1.5805267313329217e-06, - "loss": 0.9814, - "step": 37896 - }, - { - "epoch": 0.97, - "learning_rate": 1.5805042006873964e-06, - "loss": 1.0332, - "step": 37897 - }, - { - "epoch": 0.97, - "learning_rate": 1.5804816695974056e-06, - "loss": 0.6846, - "step": 37898 - }, - { - "epoch": 0.97, - "learning_rate": 1.5804591380629675e-06, - "loss": 0.7009, - "step": 37899 - }, - { - "epoch": 0.97, - "learning_rate": 1.5804366060840976e-06, - "loss": 0.7549, - "step": 37900 - }, - { - "epoch": 0.97, - "learning_rate": 1.5804140736608147e-06, - "loss": 0.9365, - "step": 37901 - }, - { - "epoch": 0.97, - "learning_rate": 1.5803915407931351e-06, - "loss": 0.8057, - "step": 37902 - }, - { - "epoch": 0.97, - "learning_rate": 1.5803690074810767e-06, - "loss": 0.6455, - "step": 37903 - }, - { - "epoch": 0.97, - "learning_rate": 1.5803464737246564e-06, - "loss": 0.8301, - "step": 37904 - }, - { - "epoch": 0.97, - "learning_rate": 1.5803239395238912e-06, - "loss": 0.7979, - "step": 37905 - }, - { - "epoch": 0.97, - "learning_rate": 1.5803014048787987e-06, - "loss": 0.4968, - "step": 37906 - }, - { - "epoch": 0.97, - "learning_rate": 1.5802788697893962e-06, - "loss": 0.6704, - "step": 37907 - }, - { - "epoch": 0.97, - "learning_rate": 1.5802563342557008e-06, - "loss": 0.7158, - "step": 37908 - }, - { - "epoch": 0.97, - "learning_rate": 1.58023379827773e-06, - "loss": 0.7173, - "step": 37909 - }, - { - "epoch": 0.97, - "learning_rate": 1.5802112618555005e-06, - "loss": 0.835, - "step": 37910 - }, - { - "epoch": 0.97, - "learning_rate": 1.5801887249890303e-06, - "loss": 1.1035, - "step": 37911 - }, - { - "epoch": 0.97, - "learning_rate": 1.5801661876783362e-06, - "loss": 0.7578, - "step": 37912 - }, - { - "epoch": 0.97, - "learning_rate": 1.580143649923435e-06, - "loss": 1.0156, - "step": 37913 - }, - { - "epoch": 0.97, - "learning_rate": 1.5801211117243453e-06, - "loss": 0.8916, - "step": 37914 - }, - { - "epoch": 0.97, - "learning_rate": 1.580098573081083e-06, - "loss": 0.9434, - "step": 37915 - }, - { - "epoch": 0.97, - "learning_rate": 1.5800760339936661e-06, - "loss": 0.9668, - "step": 37916 - }, - { - "epoch": 0.97, - "learning_rate": 1.5800534944621115e-06, - "loss": 0.8447, - "step": 37917 - }, - { - "epoch": 0.97, - "learning_rate": 1.5800309544864366e-06, - "loss": 0.7373, - "step": 37918 - }, - { - "epoch": 0.97, - "learning_rate": 1.5800084140666589e-06, - "loss": 0.8154, - "step": 37919 - }, - { - "epoch": 0.97, - "learning_rate": 1.5799858732027952e-06, - "loss": 0.9238, - "step": 37920 - }, - { - "epoch": 0.97, - "learning_rate": 1.5799633318948632e-06, - "loss": 0.7407, - "step": 37921 - }, - { - "epoch": 0.97, - "learning_rate": 1.5799407901428797e-06, - "loss": 0.8848, - "step": 37922 - }, - { - "epoch": 0.97, - "learning_rate": 1.5799182479468623e-06, - "loss": 0.7485, - "step": 37923 - }, - { - "epoch": 0.97, - "learning_rate": 1.5798957053068285e-06, - "loss": 0.8428, - "step": 37924 - }, - { - "epoch": 0.97, - "learning_rate": 1.5798731622227948e-06, - "loss": 0.8506, - "step": 37925 - }, - { - "epoch": 0.97, - "learning_rate": 1.579850618694779e-06, - "loss": 0.9062, - "step": 37926 - }, - { - "epoch": 0.97, - "learning_rate": 1.579828074722798e-06, - "loss": 0.7759, - "step": 37927 - }, - { - "epoch": 0.97, - "learning_rate": 1.5798055303068695e-06, - "loss": 1.1309, - "step": 37928 - }, - { - "epoch": 0.97, - "learning_rate": 1.5797829854470107e-06, - "loss": 0.8906, - "step": 37929 - }, - { - "epoch": 0.97, - "learning_rate": 1.5797604401432387e-06, - "loss": 0.9014, - "step": 37930 - }, - { - "epoch": 0.97, - "learning_rate": 1.5797378943955707e-06, - "loss": 0.6875, - "step": 37931 - }, - { - "epoch": 0.97, - "learning_rate": 1.579715348204024e-06, - "loss": 0.8574, - "step": 37932 - }, - { - "epoch": 0.97, - "learning_rate": 1.5796928015686159e-06, - "loss": 0.8848, - "step": 37933 - }, - { - "epoch": 0.97, - "learning_rate": 1.579670254489364e-06, - "loss": 0.8682, - "step": 37934 - }, - { - "epoch": 0.97, - "learning_rate": 1.579647706966285e-06, - "loss": 0.5796, - "step": 37935 - }, - { - "epoch": 0.97, - "learning_rate": 1.5796251589993963e-06, - "loss": 0.959, - "step": 37936 - }, - { - "epoch": 0.97, - "learning_rate": 1.5796026105887155e-06, - "loss": 0.7072, - "step": 37937 - }, - { - "epoch": 0.97, - "learning_rate": 1.5795800617342595e-06, - "loss": 0.7129, - "step": 37938 - }, - { - "epoch": 0.97, - "learning_rate": 1.5795575124360457e-06, - "loss": 0.7852, - "step": 37939 - }, - { - "epoch": 0.97, - "learning_rate": 1.5795349626940913e-06, - "loss": 0.9336, - "step": 37940 - }, - { - "epoch": 0.97, - "learning_rate": 1.5795124125084137e-06, - "loss": 0.7502, - "step": 37941 - }, - { - "epoch": 0.97, - "learning_rate": 1.57948986187903e-06, - "loss": 0.917, - "step": 37942 - }, - { - "epoch": 0.97, - "learning_rate": 1.5794673108059574e-06, - "loss": 0.9375, - "step": 37943 - }, - { - "epoch": 0.97, - "learning_rate": 1.579444759289214e-06, - "loss": 1.0684, - "step": 37944 - }, - { - "epoch": 0.97, - "learning_rate": 1.579422207328816e-06, - "loss": 0.7197, - "step": 37945 - }, - { - "epoch": 0.97, - "learning_rate": 1.579399654924781e-06, - "loss": 0.9473, - "step": 37946 - }, - { - "epoch": 0.97, - "learning_rate": 1.5793771020771262e-06, - "loss": 0.7568, - "step": 37947 - }, - { - "epoch": 0.97, - "learning_rate": 1.579354548785869e-06, - "loss": 0.6597, - "step": 37948 - }, - { - "epoch": 0.97, - "learning_rate": 1.5793319950510271e-06, - "loss": 0.7646, - "step": 37949 - }, - { - "epoch": 0.97, - "learning_rate": 1.579309440872617e-06, - "loss": 0.7334, - "step": 37950 - }, - { - "epoch": 0.97, - "learning_rate": 1.579286886250656e-06, - "loss": 0.4927, - "step": 37951 - }, - { - "epoch": 0.97, - "learning_rate": 1.5792643311851622e-06, - "loss": 0.9297, - "step": 37952 - }, - { - "epoch": 0.97, - "learning_rate": 1.5792417756761522e-06, - "loss": 0.9473, - "step": 37953 - }, - { - "epoch": 0.97, - "learning_rate": 1.5792192197236433e-06, - "loss": 0.7397, - "step": 37954 - }, - { - "epoch": 0.97, - "learning_rate": 1.5791966633276528e-06, - "loss": 0.7949, - "step": 37955 - }, - { - "epoch": 0.97, - "learning_rate": 1.5791741064881982e-06, - "loss": 0.7393, - "step": 37956 - }, - { - "epoch": 0.97, - "learning_rate": 1.5791515492052966e-06, - "loss": 0.4741, - "step": 37957 - }, - { - "epoch": 0.97, - "learning_rate": 1.5791289914789654e-06, - "loss": 0.6208, - "step": 37958 - }, - { - "epoch": 0.97, - "learning_rate": 1.5791064333092216e-06, - "loss": 0.7568, - "step": 37959 - }, - { - "epoch": 0.97, - "learning_rate": 1.5790838746960826e-06, - "loss": 0.6938, - "step": 37960 - }, - { - "epoch": 0.97, - "learning_rate": 1.5790613156395658e-06, - "loss": 0.7344, - "step": 37961 - }, - { - "epoch": 0.97, - "learning_rate": 1.5790387561396883e-06, - "loss": 0.8616, - "step": 37962 - }, - { - "epoch": 0.97, - "learning_rate": 1.5790161961964677e-06, - "loss": 0.7607, - "step": 37963 - }, - { - "epoch": 0.97, - "learning_rate": 1.5789936358099208e-06, - "loss": 0.748, - "step": 37964 - }, - { - "epoch": 0.97, - "learning_rate": 1.578971074980065e-06, - "loss": 0.9043, - "step": 37965 - }, - { - "epoch": 0.97, - "learning_rate": 1.5789485137069178e-06, - "loss": 0.6482, - "step": 37966 - }, - { - "epoch": 0.97, - "learning_rate": 1.578925951990496e-06, - "loss": 0.604, - "step": 37967 - }, - { - "epoch": 0.97, - "learning_rate": 1.5789033898308177e-06, - "loss": 0.8691, - "step": 37968 - }, - { - "epoch": 0.97, - "learning_rate": 1.5788808272278998e-06, - "loss": 0.8228, - "step": 37969 - }, - { - "epoch": 0.97, - "learning_rate": 1.578858264181759e-06, - "loss": 0.8467, - "step": 37970 - }, - { - "epoch": 0.97, - "learning_rate": 1.5788357006924132e-06, - "loss": 0.7686, - "step": 37971 - }, - { - "epoch": 0.97, - "learning_rate": 1.5788131367598796e-06, - "loss": 0.8662, - "step": 37972 - }, - { - "epoch": 0.97, - "learning_rate": 1.5787905723841755e-06, - "loss": 0.8408, - "step": 37973 - }, - { - "epoch": 0.97, - "learning_rate": 1.5787680075653177e-06, - "loss": 0.7524, - "step": 37974 - }, - { - "epoch": 0.97, - "learning_rate": 1.578745442303324e-06, - "loss": 0.877, - "step": 37975 - }, - { - "epoch": 0.97, - "learning_rate": 1.578722876598212e-06, - "loss": 0.8535, - "step": 37976 - }, - { - "epoch": 0.97, - "learning_rate": 1.578700310449998e-06, - "loss": 0.8623, - "step": 37977 - }, - { - "epoch": 0.97, - "learning_rate": 1.5786777438586998e-06, - "loss": 0.7051, - "step": 37978 - }, - { - "epoch": 0.97, - "learning_rate": 1.5786551768243348e-06, - "loss": 1.1504, - "step": 37979 - }, - { - "epoch": 0.97, - "learning_rate": 1.5786326093469202e-06, - "loss": 0.7715, - "step": 37980 - }, - { - "epoch": 0.97, - "learning_rate": 1.578610041426473e-06, - "loss": 0.9707, - "step": 37981 - }, - { - "epoch": 0.97, - "learning_rate": 1.5785874730630106e-06, - "loss": 0.957, - "step": 37982 - }, - { - "epoch": 0.97, - "learning_rate": 1.578564904256551e-06, - "loss": 0.9785, - "step": 37983 - }, - { - "epoch": 0.97, - "learning_rate": 1.5785423350071104e-06, - "loss": 0.623, - "step": 37984 - }, - { - "epoch": 0.97, - "learning_rate": 1.5785197653147064e-06, - "loss": 1.0781, - "step": 37985 - }, - { - "epoch": 0.97, - "learning_rate": 1.5784971951793566e-06, - "loss": 0.7056, - "step": 37986 - }, - { - "epoch": 0.97, - "learning_rate": 1.5784746246010782e-06, - "loss": 0.6624, - "step": 37987 - }, - { - "epoch": 0.97, - "learning_rate": 1.5784520535798881e-06, - "loss": 0.8916, - "step": 37988 - }, - { - "epoch": 0.97, - "learning_rate": 1.5784294821158042e-06, - "loss": 1.0273, - "step": 37989 - }, - { - "epoch": 0.97, - "learning_rate": 1.578406910208843e-06, - "loss": 1.0645, - "step": 37990 - }, - { - "epoch": 0.97, - "learning_rate": 1.5783843378590227e-06, - "loss": 0.8184, - "step": 37991 - }, - { - "epoch": 0.97, - "learning_rate": 1.5783617650663596e-06, - "loss": 0.8945, - "step": 37992 - }, - { - "epoch": 0.97, - "learning_rate": 1.5783391918308722e-06, - "loss": 0.4985, - "step": 37993 - }, - { - "epoch": 0.97, - "learning_rate": 1.5783166181525766e-06, - "loss": 0.9199, - "step": 37994 - }, - { - "epoch": 0.97, - "learning_rate": 1.5782940440314906e-06, - "loss": 0.7754, - "step": 37995 - }, - { - "epoch": 0.97, - "learning_rate": 1.5782714694676314e-06, - "loss": 1.1816, - "step": 37996 - }, - { - "epoch": 0.97, - "learning_rate": 1.5782488944610164e-06, - "loss": 0.7202, - "step": 37997 - }, - { - "epoch": 0.97, - "learning_rate": 1.5782263190116626e-06, - "loss": 0.9785, - "step": 37998 - }, - { - "epoch": 0.97, - "learning_rate": 1.5782037431195878e-06, - "loss": 0.7593, - "step": 37999 - }, - { - "epoch": 0.97, - "learning_rate": 1.578181166784809e-06, - "loss": 1.0527, - "step": 38000 - }, - { - "epoch": 0.97, - "learning_rate": 1.5781585900073433e-06, - "loss": 0.7051, - "step": 38001 - }, - { - "epoch": 0.97, - "learning_rate": 1.5781360127872082e-06, - "loss": 0.9062, - "step": 38002 - }, - { - "epoch": 0.97, - "learning_rate": 1.578113435124421e-06, - "loss": 0.8184, - "step": 38003 - }, - { - "epoch": 0.97, - "learning_rate": 1.578090857018999e-06, - "loss": 0.8645, - "step": 38004 - }, - { - "epoch": 0.97, - "learning_rate": 1.578068278470959e-06, - "loss": 0.8647, - "step": 38005 - }, - { - "epoch": 0.97, - "learning_rate": 1.5780456994803188e-06, - "loss": 0.9307, - "step": 38006 - }, - { - "epoch": 0.97, - "learning_rate": 1.5780231200470959e-06, - "loss": 0.7871, - "step": 38007 - }, - { - "epoch": 0.97, - "learning_rate": 1.5780005401713076e-06, - "loss": 0.9639, - "step": 38008 - }, - { - "epoch": 0.97, - "learning_rate": 1.5779779598529702e-06, - "loss": 0.8291, - "step": 38009 - }, - { - "epoch": 0.97, - "learning_rate": 1.577955379092102e-06, - "loss": 0.9697, - "step": 38010 - }, - { - "epoch": 0.97, - "learning_rate": 1.5779327978887195e-06, - "loss": 0.7549, - "step": 38011 - }, - { - "epoch": 0.97, - "learning_rate": 1.5779102162428405e-06, - "loss": 0.874, - "step": 38012 - }, - { - "epoch": 0.97, - "learning_rate": 1.5778876341544827e-06, - "loss": 0.634, - "step": 38013 - }, - { - "epoch": 0.97, - "learning_rate": 1.5778650516236627e-06, - "loss": 0.5605, - "step": 38014 - }, - { - "epoch": 0.97, - "learning_rate": 1.577842468650398e-06, - "loss": 0.8887, - "step": 38015 - }, - { - "epoch": 0.97, - "learning_rate": 1.5778198852347058e-06, - "loss": 0.9189, - "step": 38016 - }, - { - "epoch": 0.97, - "learning_rate": 1.5777973013766036e-06, - "loss": 0.8311, - "step": 38017 - }, - { - "epoch": 0.97, - "learning_rate": 1.5777747170761085e-06, - "loss": 0.7134, - "step": 38018 - }, - { - "epoch": 0.97, - "learning_rate": 1.5777521323332378e-06, - "loss": 0.9004, - "step": 38019 - }, - { - "epoch": 0.97, - "learning_rate": 1.5777295471480087e-06, - "loss": 0.6577, - "step": 38020 - }, - { - "epoch": 0.97, - "learning_rate": 1.577706961520439e-06, - "loss": 0.9854, - "step": 38021 - }, - { - "epoch": 0.97, - "learning_rate": 1.5776843754505454e-06, - "loss": 0.7275, - "step": 38022 - }, - { - "epoch": 0.97, - "learning_rate": 1.5776617889383457e-06, - "loss": 0.6338, - "step": 38023 - }, - { - "epoch": 0.97, - "learning_rate": 1.5776392019838567e-06, - "loss": 0.9316, - "step": 38024 - }, - { - "epoch": 0.97, - "learning_rate": 1.5776166145870962e-06, - "loss": 0.7637, - "step": 38025 - }, - { - "epoch": 0.97, - "learning_rate": 1.577594026748081e-06, - "loss": 0.8369, - "step": 38026 - }, - { - "epoch": 0.97, - "learning_rate": 1.5775714384668283e-06, - "loss": 0.9824, - "step": 38027 - }, - { - "epoch": 0.97, - "learning_rate": 1.5775488497433563e-06, - "loss": 0.6836, - "step": 38028 - }, - { - "epoch": 0.97, - "learning_rate": 1.5775262605776815e-06, - "loss": 0.9824, - "step": 38029 - }, - { - "epoch": 0.97, - "learning_rate": 1.5775036709698213e-06, - "loss": 0.8604, - "step": 38030 - }, - { - "epoch": 0.97, - "learning_rate": 1.5774810809197932e-06, - "loss": 0.7998, - "step": 38031 - }, - { - "epoch": 0.97, - "learning_rate": 1.5774584904276141e-06, - "loss": 0.8965, - "step": 38032 - }, - { - "epoch": 0.97, - "learning_rate": 1.5774358994933018e-06, - "loss": 0.6987, - "step": 38033 - }, - { - "epoch": 0.97, - "learning_rate": 1.5774133081168737e-06, - "loss": 0.6963, - "step": 38034 - }, - { - "epoch": 0.97, - "learning_rate": 1.577390716298346e-06, - "loss": 0.7129, - "step": 38035 - }, - { - "epoch": 0.97, - "learning_rate": 1.5773681240377378e-06, - "loss": 0.752, - "step": 38036 - }, - { - "epoch": 0.97, - "learning_rate": 1.5773455313350644e-06, - "loss": 0.8911, - "step": 38037 - }, - { - "epoch": 0.97, - "learning_rate": 1.5773229381903447e-06, - "loss": 1.04, - "step": 38038 - }, - { - "epoch": 0.97, - "learning_rate": 1.5773003446035951e-06, - "loss": 0.7402, - "step": 38039 - }, - { - "epoch": 0.97, - "learning_rate": 1.5772777505748333e-06, - "loss": 0.8857, - "step": 38040 - }, - { - "epoch": 0.98, - "learning_rate": 1.5772551561040763e-06, - "loss": 0.6836, - "step": 38041 - }, - { - "epoch": 0.98, - "learning_rate": 1.5772325611913417e-06, - "loss": 0.957, - "step": 38042 - }, - { - "epoch": 0.98, - "learning_rate": 1.5772099658366468e-06, - "loss": 1.0156, - "step": 38043 - }, - { - "epoch": 0.98, - "learning_rate": 1.5771873700400086e-06, - "loss": 0.7383, - "step": 38044 - }, - { - "epoch": 0.98, - "learning_rate": 1.5771647738014445e-06, - "loss": 0.7935, - "step": 38045 - }, - { - "epoch": 0.98, - "learning_rate": 1.5771421771209719e-06, - "loss": 0.7656, - "step": 38046 - }, - { - "epoch": 0.98, - "learning_rate": 1.5771195799986083e-06, - "loss": 0.9277, - "step": 38047 - }, - { - "epoch": 0.98, - "learning_rate": 1.5770969824343707e-06, - "loss": 0.9468, - "step": 38048 - }, - { - "epoch": 0.98, - "learning_rate": 1.5770743844282763e-06, - "loss": 0.8779, - "step": 38049 - }, - { - "epoch": 0.98, - "learning_rate": 1.5770517859803428e-06, - "loss": 0.6479, - "step": 38050 - }, - { - "epoch": 0.98, - "learning_rate": 1.577029187090587e-06, - "loss": 0.8184, - "step": 38051 - }, - { - "epoch": 0.98, - "learning_rate": 1.5770065877590266e-06, - "loss": 0.8574, - "step": 38052 - }, - { - "epoch": 0.98, - "learning_rate": 1.576983987985679e-06, - "loss": 0.9375, - "step": 38053 - }, - { - "epoch": 0.98, - "learning_rate": 1.5769613877705612e-06, - "loss": 0.8564, - "step": 38054 - }, - { - "epoch": 0.98, - "learning_rate": 1.5769387871136903e-06, - "loss": 0.7363, - "step": 38055 - }, - { - "epoch": 0.98, - "learning_rate": 1.5769161860150841e-06, - "loss": 0.9648, - "step": 38056 - }, - { - "epoch": 0.98, - "learning_rate": 1.5768935844747598e-06, - "loss": 0.8906, - "step": 38057 - }, - { - "epoch": 0.98, - "learning_rate": 1.5768709824927346e-06, - "loss": 0.7236, - "step": 38058 - }, - { - "epoch": 0.98, - "learning_rate": 1.5768483800690256e-06, - "loss": 0.7856, - "step": 38059 - }, - { - "epoch": 0.98, - "learning_rate": 1.5768257772036505e-06, - "loss": 0.9082, - "step": 38060 - }, - { - "epoch": 0.98, - "learning_rate": 1.5768031738966264e-06, - "loss": 0.8242, - "step": 38061 - }, - { - "epoch": 0.98, - "learning_rate": 1.5767805701479704e-06, - "loss": 0.5286, - "step": 38062 - }, - { - "epoch": 0.98, - "learning_rate": 1.5767579659577003e-06, - "loss": 0.7817, - "step": 38063 - }, - { - "epoch": 0.98, - "learning_rate": 1.5767353613258332e-06, - "loss": 0.8091, - "step": 38064 - }, - { - "epoch": 0.98, - "learning_rate": 1.5767127562523864e-06, - "loss": 0.8467, - "step": 38065 - }, - { - "epoch": 0.98, - "learning_rate": 1.5766901507373768e-06, - "loss": 0.792, - "step": 38066 - }, - { - "epoch": 0.98, - "learning_rate": 1.5766675447808222e-06, - "loss": 0.6138, - "step": 38067 - }, - { - "epoch": 0.98, - "learning_rate": 1.5766449383827401e-06, - "loss": 0.5945, - "step": 38068 - }, - { - "epoch": 0.98, - "learning_rate": 1.576622331543147e-06, - "loss": 0.6875, - "step": 38069 - }, - { - "epoch": 0.98, - "learning_rate": 1.576599724262061e-06, - "loss": 1.04, - "step": 38070 - }, - { - "epoch": 0.98, - "learning_rate": 1.576577116539499e-06, - "loss": 0.9346, - "step": 38071 - }, - { - "epoch": 0.98, - "learning_rate": 1.5765545083754783e-06, - "loss": 0.8184, - "step": 38072 - }, - { - "epoch": 0.98, - "learning_rate": 1.5765318997700167e-06, - "loss": 0.5208, - "step": 38073 - }, - { - "epoch": 0.98, - "learning_rate": 1.576509290723131e-06, - "loss": 0.8555, - "step": 38074 - }, - { - "epoch": 0.98, - "learning_rate": 1.5764866812348383e-06, - "loss": 0.6509, - "step": 38075 - }, - { - "epoch": 0.98, - "learning_rate": 1.5764640713051564e-06, - "loss": 0.8242, - "step": 38076 - }, - { - "epoch": 0.98, - "learning_rate": 1.5764414609341027e-06, - "loss": 0.959, - "step": 38077 - }, - { - "epoch": 0.98, - "learning_rate": 1.5764188501216943e-06, - "loss": 0.9062, - "step": 38078 - }, - { - "epoch": 0.98, - "learning_rate": 1.5763962388679483e-06, - "loss": 1.1338, - "step": 38079 - }, - { - "epoch": 0.98, - "learning_rate": 1.5763736271728822e-06, - "loss": 0.8721, - "step": 38080 - }, - { - "epoch": 0.98, - "learning_rate": 1.5763510150365136e-06, - "loss": 0.8457, - "step": 38081 - }, - { - "epoch": 0.98, - "learning_rate": 1.5763284024588593e-06, - "loss": 0.9717, - "step": 38082 - }, - { - "epoch": 0.98, - "learning_rate": 1.5763057894399368e-06, - "loss": 0.707, - "step": 38083 - }, - { - "epoch": 0.98, - "learning_rate": 1.5762831759797635e-06, - "loss": 0.6724, - "step": 38084 - }, - { - "epoch": 0.98, - "learning_rate": 1.5762605620783566e-06, - "loss": 1.001, - "step": 38085 - }, - { - "epoch": 0.98, - "learning_rate": 1.5762379477357334e-06, - "loss": 0.7305, - "step": 38086 - }, - { - "epoch": 0.98, - "learning_rate": 1.5762153329519115e-06, - "loss": 0.9082, - "step": 38087 - }, - { - "epoch": 0.98, - "learning_rate": 1.5761927177269078e-06, - "loss": 0.8604, - "step": 38088 - }, - { - "epoch": 0.98, - "learning_rate": 1.5761701020607401e-06, - "loss": 0.6562, - "step": 38089 - }, - { - "epoch": 0.98, - "learning_rate": 1.5761474859534254e-06, - "loss": 0.7021, - "step": 38090 - }, - { - "epoch": 0.98, - "learning_rate": 1.576124869404981e-06, - "loss": 0.8115, - "step": 38091 - }, - { - "epoch": 0.98, - "learning_rate": 1.576102252415424e-06, - "loss": 0.9863, - "step": 38092 - }, - { - "epoch": 0.98, - "learning_rate": 1.5760796349847726e-06, - "loss": 0.8506, - "step": 38093 - }, - { - "epoch": 0.98, - "learning_rate": 1.5760570171130432e-06, - "loss": 1.0623, - "step": 38094 - }, - { - "epoch": 0.98, - "learning_rate": 1.5760343988002533e-06, - "loss": 0.957, - "step": 38095 - }, - { - "epoch": 0.98, - "learning_rate": 1.5760117800464206e-06, - "loss": 0.7832, - "step": 38096 - }, - { - "epoch": 0.98, - "learning_rate": 1.575989160851562e-06, - "loss": 0.9922, - "step": 38097 - }, - { - "epoch": 0.98, - "learning_rate": 1.5759665412156951e-06, - "loss": 0.7578, - "step": 38098 - }, - { - "epoch": 0.98, - "learning_rate": 1.5759439211388367e-06, - "loss": 0.9111, - "step": 38099 - }, - { - "epoch": 0.98, - "learning_rate": 1.575921300621005e-06, - "loss": 0.7881, - "step": 38100 - }, - { - "epoch": 0.98, - "learning_rate": 1.5758986796622167e-06, - "loss": 0.9531, - "step": 38101 - }, - { - "epoch": 0.98, - "learning_rate": 1.575876058262489e-06, - "loss": 0.6968, - "step": 38102 - }, - { - "epoch": 0.98, - "learning_rate": 1.57585343642184e-06, - "loss": 0.916, - "step": 38103 - }, - { - "epoch": 0.98, - "learning_rate": 1.5758308141402862e-06, - "loss": 0.7783, - "step": 38104 - }, - { - "epoch": 0.98, - "learning_rate": 1.5758081914178454e-06, - "loss": 0.915, - "step": 38105 - }, - { - "epoch": 0.98, - "learning_rate": 1.5757855682545344e-06, - "loss": 0.9609, - "step": 38106 - }, - { - "epoch": 0.98, - "learning_rate": 1.575762944650371e-06, - "loss": 1.0146, - "step": 38107 - }, - { - "epoch": 0.98, - "learning_rate": 1.5757403206053725e-06, - "loss": 0.7324, - "step": 38108 - }, - { - "epoch": 0.98, - "learning_rate": 1.5757176961195562e-06, - "loss": 0.8574, - "step": 38109 - }, - { - "epoch": 0.98, - "learning_rate": 1.575695071192939e-06, - "loss": 1.1904, - "step": 38110 - }, - { - "epoch": 0.98, - "learning_rate": 1.5756724458255387e-06, - "loss": 0.9482, - "step": 38111 - }, - { - "epoch": 0.98, - "learning_rate": 1.5756498200173727e-06, - "loss": 0.7588, - "step": 38112 - }, - { - "epoch": 0.98, - "learning_rate": 1.575627193768458e-06, - "loss": 0.9854, - "step": 38113 - }, - { - "epoch": 0.98, - "learning_rate": 1.575604567078812e-06, - "loss": 0.9619, - "step": 38114 - }, - { - "epoch": 0.98, - "learning_rate": 1.5755819399484518e-06, - "loss": 0.9082, - "step": 38115 - }, - { - "epoch": 0.98, - "learning_rate": 1.5755593123773951e-06, - "loss": 0.8809, - "step": 38116 - }, - { - "epoch": 0.98, - "learning_rate": 1.5755366843656593e-06, - "loss": 1.0283, - "step": 38117 - }, - { - "epoch": 0.98, - "learning_rate": 1.5755140559132617e-06, - "loss": 0.7173, - "step": 38118 - }, - { - "epoch": 0.98, - "learning_rate": 1.5754914270202188e-06, - "loss": 0.6445, - "step": 38119 - }, - { - "epoch": 0.98, - "learning_rate": 1.575468797686549e-06, - "loss": 0.6992, - "step": 38120 - }, - { - "epoch": 0.98, - "learning_rate": 1.575446167912269e-06, - "loss": 0.8018, - "step": 38121 - }, - { - "epoch": 0.98, - "learning_rate": 1.5754235376973965e-06, - "loss": 0.7393, - "step": 38122 - }, - { - "epoch": 0.98, - "learning_rate": 1.5754009070419487e-06, - "loss": 0.7607, - "step": 38123 - }, - { - "epoch": 0.98, - "learning_rate": 1.5753782759459427e-06, - "loss": 0.7832, - "step": 38124 - }, - { - "epoch": 0.98, - "learning_rate": 1.575355644409396e-06, - "loss": 0.8003, - "step": 38125 - }, - { - "epoch": 0.98, - "learning_rate": 1.5753330124323263e-06, - "loss": 0.7339, - "step": 38126 - }, - { - "epoch": 0.98, - "learning_rate": 1.5753103800147502e-06, - "loss": 0.6381, - "step": 38127 - }, - { - "epoch": 0.98, - "learning_rate": 1.5752877471566857e-06, - "loss": 0.7666, - "step": 38128 - }, - { - "epoch": 0.98, - "learning_rate": 1.5752651138581494e-06, - "loss": 0.6357, - "step": 38129 - }, - { - "epoch": 0.98, - "learning_rate": 1.5752424801191592e-06, - "loss": 0.8164, - "step": 38130 - }, - { - "epoch": 0.98, - "learning_rate": 1.5752198459397325e-06, - "loss": 0.8096, - "step": 38131 - }, - { - "epoch": 0.98, - "learning_rate": 1.5751972113198861e-06, - "loss": 0.7939, - "step": 38132 - }, - { - "epoch": 0.98, - "learning_rate": 1.5751745762596381e-06, - "loss": 0.8877, - "step": 38133 - }, - { - "epoch": 0.98, - "learning_rate": 1.575151940759005e-06, - "loss": 0.9297, - "step": 38134 - }, - { - "epoch": 0.98, - "learning_rate": 1.5751293048180045e-06, - "loss": 0.8091, - "step": 38135 - }, - { - "epoch": 0.98, - "learning_rate": 1.5751066684366542e-06, - "loss": 0.6289, - "step": 38136 - }, - { - "epoch": 0.98, - "learning_rate": 1.5750840316149709e-06, - "loss": 0.6936, - "step": 38137 - }, - { - "epoch": 0.98, - "learning_rate": 1.5750613943529723e-06, - "loss": 0.8262, - "step": 38138 - }, - { - "epoch": 0.98, - "learning_rate": 1.5750387566506758e-06, - "loss": 0.9717, - "step": 38139 - }, - { - "epoch": 0.98, - "learning_rate": 1.5750161185080982e-06, - "loss": 0.6611, - "step": 38140 - }, - { - "epoch": 0.98, - "learning_rate": 1.5749934799252574e-06, - "loss": 0.73, - "step": 38141 - }, - { - "epoch": 0.98, - "learning_rate": 1.5749708409021704e-06, - "loss": 0.6538, - "step": 38142 - }, - { - "epoch": 0.98, - "learning_rate": 1.5749482014388552e-06, - "loss": 0.5938, - "step": 38143 - }, - { - "epoch": 0.98, - "learning_rate": 1.574925561535328e-06, - "loss": 0.7725, - "step": 38144 - }, - { - "epoch": 0.98, - "learning_rate": 1.574902921191607e-06, - "loss": 0.9121, - "step": 38145 - }, - { - "epoch": 0.98, - "learning_rate": 1.5748802804077093e-06, - "loss": 0.8779, - "step": 38146 - }, - { - "epoch": 0.98, - "learning_rate": 1.574857639183652e-06, - "loss": 0.7617, - "step": 38147 - }, - { - "epoch": 0.98, - "learning_rate": 1.5748349975194529e-06, - "loss": 0.9043, - "step": 38148 - }, - { - "epoch": 0.98, - "learning_rate": 1.574812355415129e-06, - "loss": 0.8291, - "step": 38149 - }, - { - "epoch": 0.98, - "learning_rate": 1.5747897128706975e-06, - "loss": 0.8145, - "step": 38150 - }, - { - "epoch": 0.98, - "learning_rate": 1.5747670698861758e-06, - "loss": 0.8027, - "step": 38151 - }, - { - "epoch": 0.98, - "learning_rate": 1.5747444264615819e-06, - "loss": 0.6875, - "step": 38152 - }, - { - "epoch": 0.98, - "learning_rate": 1.5747217825969322e-06, - "loss": 0.7749, - "step": 38153 - }, - { - "epoch": 0.98, - "learning_rate": 1.5746991382922446e-06, - "loss": 0.9678, - "step": 38154 - }, - { - "epoch": 0.98, - "learning_rate": 1.5746764935475366e-06, - "loss": 0.8198, - "step": 38155 - }, - { - "epoch": 0.98, - "learning_rate": 1.5746538483628249e-06, - "loss": 0.8066, - "step": 38156 - }, - { - "epoch": 0.98, - "learning_rate": 1.5746312027381272e-06, - "loss": 0.7705, - "step": 38157 - }, - { - "epoch": 0.98, - "learning_rate": 1.574608556673461e-06, - "loss": 0.6714, - "step": 38158 - }, - { - "epoch": 0.98, - "learning_rate": 1.574585910168843e-06, - "loss": 1.0557, - "step": 38159 - }, - { - "epoch": 0.98, - "learning_rate": 1.5745632632242913e-06, - "loss": 0.8662, - "step": 38160 - }, - { - "epoch": 0.98, - "learning_rate": 1.574540615839823e-06, - "loss": 0.8779, - "step": 38161 - }, - { - "epoch": 0.98, - "learning_rate": 1.574517968015455e-06, - "loss": 0.8379, - "step": 38162 - }, - { - "epoch": 0.98, - "learning_rate": 1.5744953197512056e-06, - "loss": 0.8965, - "step": 38163 - }, - { - "epoch": 0.98, - "learning_rate": 1.5744726710470912e-06, - "loss": 0.9824, - "step": 38164 - }, - { - "epoch": 0.98, - "learning_rate": 1.5744500219031296e-06, - "loss": 0.9453, - "step": 38165 - }, - { - "epoch": 0.98, - "learning_rate": 1.5744273723193377e-06, - "loss": 0.873, - "step": 38166 - }, - { - "epoch": 0.98, - "learning_rate": 1.5744047222957336e-06, - "loss": 1.043, - "step": 38167 - }, - { - "epoch": 0.98, - "learning_rate": 1.5743820718323342e-06, - "loss": 1.1006, - "step": 38168 - }, - { - "epoch": 0.98, - "learning_rate": 1.5743594209291567e-06, - "loss": 0.8613, - "step": 38169 - }, - { - "epoch": 0.98, - "learning_rate": 1.5743367695862184e-06, - "loss": 0.7812, - "step": 38170 - }, - { - "epoch": 0.98, - "learning_rate": 1.5743141178035371e-06, - "loss": 0.918, - "step": 38171 - }, - { - "epoch": 0.98, - "learning_rate": 1.5742914655811298e-06, - "loss": 0.7676, - "step": 38172 - }, - { - "epoch": 0.98, - "learning_rate": 1.574268812919014e-06, - "loss": 0.8501, - "step": 38173 - }, - { - "epoch": 0.98, - "learning_rate": 1.574246159817207e-06, - "loss": 0.7375, - "step": 38174 - }, - { - "epoch": 0.98, - "learning_rate": 1.574223506275726e-06, - "loss": 0.5551, - "step": 38175 - }, - { - "epoch": 0.98, - "learning_rate": 1.5742008522945883e-06, - "loss": 0.9209, - "step": 38176 - }, - { - "epoch": 0.98, - "learning_rate": 1.5741781978738118e-06, - "loss": 0.8296, - "step": 38177 - }, - { - "epoch": 0.98, - "learning_rate": 1.5741555430134135e-06, - "loss": 0.9219, - "step": 38178 - }, - { - "epoch": 0.98, - "learning_rate": 1.5741328877134104e-06, - "loss": 0.7979, - "step": 38179 - }, - { - "epoch": 0.98, - "learning_rate": 1.5741102319738203e-06, - "loss": 0.5811, - "step": 38180 - }, - { - "epoch": 0.98, - "learning_rate": 1.5740875757946603e-06, - "loss": 0.8057, - "step": 38181 - }, - { - "epoch": 0.98, - "learning_rate": 1.5740649191759476e-06, - "loss": 0.8008, - "step": 38182 - }, - { - "epoch": 0.98, - "learning_rate": 1.5740422621177004e-06, - "loss": 1.0225, - "step": 38183 - }, - { - "epoch": 0.98, - "learning_rate": 1.574019604619935e-06, - "loss": 0.71, - "step": 38184 - }, - { - "epoch": 0.98, - "learning_rate": 1.5739969466826692e-06, - "loss": 0.8608, - "step": 38185 - }, - { - "epoch": 0.98, - "learning_rate": 1.5739742883059206e-06, - "loss": 0.8154, - "step": 38186 - }, - { - "epoch": 0.98, - "learning_rate": 1.573951629489706e-06, - "loss": 0.9062, - "step": 38187 - }, - { - "epoch": 0.98, - "learning_rate": 1.5739289702340432e-06, - "loss": 0.7812, - "step": 38188 - }, - { - "epoch": 0.98, - "learning_rate": 1.5739063105389492e-06, - "loss": 0.833, - "step": 38189 - }, - { - "epoch": 0.98, - "learning_rate": 1.5738836504044418e-06, - "loss": 0.9707, - "step": 38190 - }, - { - "epoch": 0.98, - "learning_rate": 1.5738609898305377e-06, - "loss": 0.9219, - "step": 38191 - }, - { - "epoch": 0.98, - "learning_rate": 1.573838328817255e-06, - "loss": 0.874, - "step": 38192 - }, - { - "epoch": 0.98, - "learning_rate": 1.5738156673646103e-06, - "loss": 0.8262, - "step": 38193 - }, - { - "epoch": 0.98, - "learning_rate": 1.5737930054726215e-06, - "loss": 0.8447, - "step": 38194 - }, - { - "epoch": 0.98, - "learning_rate": 1.573770343141306e-06, - "loss": 0.6987, - "step": 38195 - }, - { - "epoch": 0.98, - "learning_rate": 1.5737476803706807e-06, - "loss": 1.0078, - "step": 38196 - }, - { - "epoch": 0.98, - "learning_rate": 1.5737250171607631e-06, - "loss": 0.998, - "step": 38197 - }, - { - "epoch": 0.98, - "learning_rate": 1.573702353511571e-06, - "loss": 0.7588, - "step": 38198 - }, - { - "epoch": 0.98, - "learning_rate": 1.573679689423121e-06, - "loss": 0.9219, - "step": 38199 - }, - { - "epoch": 0.98, - "learning_rate": 1.5736570248954312e-06, - "loss": 0.7739, - "step": 38200 - }, - { - "epoch": 0.98, - "learning_rate": 1.5736343599285182e-06, - "loss": 0.7881, - "step": 38201 - }, - { - "epoch": 0.98, - "learning_rate": 1.5736116945224e-06, - "loss": 0.8926, - "step": 38202 - }, - { - "epoch": 0.98, - "learning_rate": 1.5735890286770936e-06, - "loss": 0.8789, - "step": 38203 - }, - { - "epoch": 0.98, - "learning_rate": 1.5735663623926165e-06, - "loss": 1.123, - "step": 38204 - }, - { - "epoch": 0.98, - "learning_rate": 1.5735436956689858e-06, - "loss": 0.7764, - "step": 38205 - }, - { - "epoch": 0.98, - "learning_rate": 1.5735210285062194e-06, - "loss": 0.959, - "step": 38206 - }, - { - "epoch": 0.98, - "learning_rate": 1.5734983609043341e-06, - "loss": 0.7539, - "step": 38207 - }, - { - "epoch": 0.98, - "learning_rate": 1.5734756928633476e-06, - "loss": 0.5684, - "step": 38208 - }, - { - "epoch": 0.98, - "learning_rate": 1.5734530243832772e-06, - "loss": 0.8362, - "step": 38209 - }, - { - "epoch": 0.98, - "learning_rate": 1.57343035546414e-06, - "loss": 0.9053, - "step": 38210 - }, - { - "epoch": 0.98, - "learning_rate": 1.5734076861059538e-06, - "loss": 0.8086, - "step": 38211 - }, - { - "epoch": 0.98, - "learning_rate": 1.5733850163087352e-06, - "loss": 0.7712, - "step": 38212 - }, - { - "epoch": 0.98, - "learning_rate": 1.5733623460725025e-06, - "loss": 0.7217, - "step": 38213 - }, - { - "epoch": 0.98, - "learning_rate": 1.5733396753972725e-06, - "loss": 0.7058, - "step": 38214 - }, - { - "epoch": 0.98, - "learning_rate": 1.5733170042830628e-06, - "loss": 0.9385, - "step": 38215 - }, - { - "epoch": 0.98, - "learning_rate": 1.5732943327298904e-06, - "loss": 0.8208, - "step": 38216 - }, - { - "epoch": 0.98, - "learning_rate": 1.573271660737773e-06, - "loss": 0.9004, - "step": 38217 - }, - { - "epoch": 0.98, - "learning_rate": 1.5732489883067279e-06, - "loss": 1.001, - "step": 38218 - }, - { - "epoch": 0.98, - "learning_rate": 1.5732263154367724e-06, - "loss": 0.7598, - "step": 38219 - }, - { - "epoch": 0.98, - "learning_rate": 1.5732036421279237e-06, - "loss": 0.7754, - "step": 38220 - }, - { - "epoch": 0.98, - "learning_rate": 1.5731809683801994e-06, - "loss": 0.9287, - "step": 38221 - }, - { - "epoch": 0.98, - "learning_rate": 1.5731582941936168e-06, - "loss": 0.8682, - "step": 38222 - }, - { - "epoch": 0.98, - "learning_rate": 1.5731356195681933e-06, - "loss": 0.9248, - "step": 38223 - }, - { - "epoch": 0.98, - "learning_rate": 1.5731129445039462e-06, - "loss": 1.0645, - "step": 38224 - }, - { - "epoch": 0.98, - "learning_rate": 1.573090269000893e-06, - "loss": 0.9355, - "step": 38225 - }, - { - "epoch": 0.98, - "learning_rate": 1.5730675930590506e-06, - "loss": 0.9434, - "step": 38226 - }, - { - "epoch": 0.98, - "learning_rate": 1.573044916678437e-06, - "loss": 0.6611, - "step": 38227 - }, - { - "epoch": 0.98, - "learning_rate": 1.5730222398590694e-06, - "loss": 0.7656, - "step": 38228 - }, - { - "epoch": 0.98, - "learning_rate": 1.5729995626009647e-06, - "loss": 0.957, - "step": 38229 - }, - { - "epoch": 0.98, - "learning_rate": 1.5729768849041406e-06, - "loss": 0.8379, - "step": 38230 - }, - { - "epoch": 0.98, - "learning_rate": 1.5729542067686143e-06, - "loss": 0.9258, - "step": 38231 - }, - { - "epoch": 0.98, - "learning_rate": 1.5729315281944034e-06, - "loss": 0.8818, - "step": 38232 - }, - { - "epoch": 0.98, - "learning_rate": 1.5729088491815255e-06, - "loss": 1.0537, - "step": 38233 - }, - { - "epoch": 0.98, - "learning_rate": 1.5728861697299975e-06, - "loss": 1.0176, - "step": 38234 - }, - { - "epoch": 0.98, - "learning_rate": 1.5728634898398366e-06, - "loss": 0.6978, - "step": 38235 - }, - { - "epoch": 0.98, - "learning_rate": 1.5728408095110606e-06, - "loss": 0.8105, - "step": 38236 - }, - { - "epoch": 0.98, - "learning_rate": 1.572818128743687e-06, - "loss": 0.9424, - "step": 38237 - }, - { - "epoch": 0.98, - "learning_rate": 1.5727954475377328e-06, - "loss": 0.8896, - "step": 38238 - }, - { - "epoch": 0.98, - "learning_rate": 1.5727727658932153e-06, - "loss": 0.7793, - "step": 38239 - }, - { - "epoch": 0.98, - "learning_rate": 1.5727500838101522e-06, - "loss": 1.0332, - "step": 38240 - }, - { - "epoch": 0.98, - "learning_rate": 1.5727274012885606e-06, - "loss": 0.8223, - "step": 38241 - }, - { - "epoch": 0.98, - "learning_rate": 1.572704718328458e-06, - "loss": 0.9746, - "step": 38242 - }, - { - "epoch": 0.98, - "learning_rate": 1.5726820349298616e-06, - "loss": 0.6729, - "step": 38243 - }, - { - "epoch": 0.98, - "learning_rate": 1.5726593510927889e-06, - "loss": 0.8271, - "step": 38244 - }, - { - "epoch": 0.98, - "learning_rate": 1.5726366668172574e-06, - "loss": 0.8091, - "step": 38245 - }, - { - "epoch": 0.98, - "learning_rate": 1.5726139821032841e-06, - "loss": 0.875, - "step": 38246 - }, - { - "epoch": 0.98, - "learning_rate": 1.572591296950887e-06, - "loss": 0.9736, - "step": 38247 - }, - { - "epoch": 0.98, - "learning_rate": 1.572568611360083e-06, - "loss": 0.8271, - "step": 38248 - }, - { - "epoch": 0.98, - "learning_rate": 1.5725459253308892e-06, - "loss": 0.8242, - "step": 38249 - }, - { - "epoch": 0.98, - "learning_rate": 1.5725232388633235e-06, - "loss": 0.8662, - "step": 38250 - }, - { - "epoch": 0.98, - "learning_rate": 1.572500551957403e-06, - "loss": 0.7988, - "step": 38251 - }, - { - "epoch": 0.98, - "learning_rate": 1.5724778646131453e-06, - "loss": 0.9863, - "step": 38252 - }, - { - "epoch": 0.98, - "learning_rate": 1.5724551768305677e-06, - "loss": 1.0166, - "step": 38253 - }, - { - "epoch": 0.98, - "learning_rate": 1.5724324886096874e-06, - "loss": 0.7153, - "step": 38254 - }, - { - "epoch": 0.98, - "learning_rate": 1.5724097999505218e-06, - "loss": 0.6957, - "step": 38255 - }, - { - "epoch": 0.98, - "learning_rate": 1.5723871108530884e-06, - "loss": 0.5254, - "step": 38256 - }, - { - "epoch": 0.98, - "learning_rate": 1.5723644213174046e-06, - "loss": 0.9502, - "step": 38257 - }, - { - "epoch": 0.98, - "learning_rate": 1.5723417313434874e-06, - "loss": 1.0957, - "step": 38258 - }, - { - "epoch": 0.98, - "learning_rate": 1.5723190409313547e-06, - "loss": 1.1123, - "step": 38259 - }, - { - "epoch": 0.98, - "learning_rate": 1.5722963500810234e-06, - "loss": 0.8545, - "step": 38260 - }, - { - "epoch": 0.98, - "learning_rate": 1.5722736587925113e-06, - "loss": 1.0264, - "step": 38261 - }, - { - "epoch": 0.98, - "learning_rate": 1.5722509670658357e-06, - "loss": 0.9785, - "step": 38262 - }, - { - "epoch": 0.98, - "learning_rate": 1.5722282749010133e-06, - "loss": 0.6809, - "step": 38263 - }, - { - "epoch": 0.98, - "learning_rate": 1.5722055822980625e-06, - "loss": 0.6904, - "step": 38264 - }, - { - "epoch": 0.98, - "learning_rate": 1.5721828892570002e-06, - "loss": 0.7529, - "step": 38265 - }, - { - "epoch": 0.98, - "learning_rate": 1.5721601957778434e-06, - "loss": 1.0059, - "step": 38266 - }, - { - "epoch": 0.98, - "learning_rate": 1.5721375018606104e-06, - "loss": 0.8291, - "step": 38267 - }, - { - "epoch": 0.98, - "learning_rate": 1.5721148075053176e-06, - "loss": 0.835, - "step": 38268 - }, - { - "epoch": 0.98, - "learning_rate": 1.5720921127119828e-06, - "loss": 0.7852, - "step": 38269 - }, - { - "epoch": 0.98, - "learning_rate": 1.5720694174806235e-06, - "loss": 0.7812, - "step": 38270 - }, - { - "epoch": 0.98, - "learning_rate": 1.572046721811257e-06, - "loss": 0.7041, - "step": 38271 - }, - { - "epoch": 0.98, - "learning_rate": 1.5720240257039006e-06, - "loss": 0.8555, - "step": 38272 - }, - { - "epoch": 0.98, - "learning_rate": 1.5720013291585716e-06, - "loss": 0.5342, - "step": 38273 - }, - { - "epoch": 0.98, - "learning_rate": 1.5719786321752877e-06, - "loss": 0.8838, - "step": 38274 - }, - { - "epoch": 0.98, - "learning_rate": 1.5719559347540658e-06, - "loss": 0.832, - "step": 38275 - }, - { - "epoch": 0.98, - "learning_rate": 1.5719332368949236e-06, - "loss": 0.5132, - "step": 38276 - }, - { - "epoch": 0.98, - "learning_rate": 1.5719105385978787e-06, - "loss": 0.6411, - "step": 38277 - }, - { - "epoch": 0.98, - "learning_rate": 1.5718878398629478e-06, - "loss": 0.7764, - "step": 38278 - }, - { - "epoch": 0.98, - "learning_rate": 1.571865140690149e-06, - "loss": 0.8223, - "step": 38279 - }, - { - "epoch": 0.98, - "learning_rate": 1.5718424410794992e-06, - "loss": 0.9131, - "step": 38280 - }, - { - "epoch": 0.98, - "learning_rate": 1.5718197410310159e-06, - "loss": 0.7734, - "step": 38281 - }, - { - "epoch": 0.98, - "learning_rate": 1.5717970405447165e-06, - "loss": 0.6001, - "step": 38282 - }, - { - "epoch": 0.98, - "learning_rate": 1.5717743396206186e-06, - "loss": 0.9551, - "step": 38283 - }, - { - "epoch": 0.98, - "learning_rate": 1.5717516382587392e-06, - "loss": 1.166, - "step": 38284 - }, - { - "epoch": 0.98, - "learning_rate": 1.5717289364590957e-06, - "loss": 0.7588, - "step": 38285 - }, - { - "epoch": 0.98, - "learning_rate": 1.571706234221706e-06, - "loss": 0.96, - "step": 38286 - }, - { - "epoch": 0.98, - "learning_rate": 1.571683531546587e-06, - "loss": 0.8296, - "step": 38287 - }, - { - "epoch": 0.98, - "learning_rate": 1.5716608284337562e-06, - "loss": 0.8105, - "step": 38288 - }, - { - "epoch": 0.98, - "learning_rate": 1.5716381248832308e-06, - "loss": 0.7656, - "step": 38289 - }, - { - "epoch": 0.98, - "learning_rate": 1.5716154208950287e-06, - "loss": 1.0039, - "step": 38290 - }, - { - "epoch": 0.98, - "learning_rate": 1.5715927164691668e-06, - "loss": 0.7861, - "step": 38291 - }, - { - "epoch": 0.98, - "learning_rate": 1.5715700116056627e-06, - "loss": 0.6968, - "step": 38292 - }, - { - "epoch": 0.98, - "learning_rate": 1.5715473063045335e-06, - "loss": 1.0586, - "step": 38293 - }, - { - "epoch": 0.98, - "learning_rate": 1.5715246005657972e-06, - "loss": 0.624, - "step": 38294 - }, - { - "epoch": 0.98, - "learning_rate": 1.5715018943894704e-06, - "loss": 0.8286, - "step": 38295 - }, - { - "epoch": 0.98, - "learning_rate": 1.571479187775571e-06, - "loss": 0.8296, - "step": 38296 - }, - { - "epoch": 0.98, - "learning_rate": 1.5714564807241164e-06, - "loss": 0.6782, - "step": 38297 - }, - { - "epoch": 0.98, - "learning_rate": 1.5714337732351238e-06, - "loss": 0.8896, - "step": 38298 - }, - { - "epoch": 0.98, - "learning_rate": 1.5714110653086104e-06, - "loss": 0.7617, - "step": 38299 - }, - { - "epoch": 0.98, - "learning_rate": 1.571388356944594e-06, - "loss": 0.9727, - "step": 38300 - }, - { - "epoch": 0.98, - "learning_rate": 1.5713656481430916e-06, - "loss": 0.8799, - "step": 38301 - }, - { - "epoch": 0.98, - "learning_rate": 1.5713429389041215e-06, - "loss": 1.0117, - "step": 38302 - }, - { - "epoch": 0.98, - "learning_rate": 1.5713202292276997e-06, - "loss": 1.0713, - "step": 38303 - }, - { - "epoch": 0.98, - "learning_rate": 1.5712975191138445e-06, - "loss": 0.834, - "step": 38304 - }, - { - "epoch": 0.98, - "learning_rate": 1.571274808562573e-06, - "loss": 0.7949, - "step": 38305 - }, - { - "epoch": 0.98, - "learning_rate": 1.5712520975739026e-06, - "loss": 0.5737, - "step": 38306 - }, - { - "epoch": 0.98, - "learning_rate": 1.5712293861478506e-06, - "loss": 0.8936, - "step": 38307 - }, - { - "epoch": 0.98, - "learning_rate": 1.5712066742844349e-06, - "loss": 0.8916, - "step": 38308 - }, - { - "epoch": 0.98, - "learning_rate": 1.5711839619836723e-06, - "loss": 0.8779, - "step": 38309 - }, - { - "epoch": 0.98, - "learning_rate": 1.5711612492455805e-06, - "loss": 0.7656, - "step": 38310 - }, - { - "epoch": 0.98, - "learning_rate": 1.5711385360701768e-06, - "loss": 0.8818, - "step": 38311 - }, - { - "epoch": 0.98, - "learning_rate": 1.5711158224574786e-06, - "loss": 0.7412, - "step": 38312 - }, - { - "epoch": 0.98, - "learning_rate": 1.5710931084075032e-06, - "loss": 1.0312, - "step": 38313 - }, - { - "epoch": 0.98, - "learning_rate": 1.571070393920268e-06, - "loss": 0.9639, - "step": 38314 - }, - { - "epoch": 0.98, - "learning_rate": 1.5710476789957906e-06, - "loss": 1.0225, - "step": 38315 - }, - { - "epoch": 0.98, - "learning_rate": 1.571024963634088e-06, - "loss": 0.6509, - "step": 38316 - }, - { - "epoch": 0.98, - "learning_rate": 1.5710022478351782e-06, - "loss": 0.9189, - "step": 38317 - }, - { - "epoch": 0.98, - "learning_rate": 1.5709795315990779e-06, - "loss": 0.832, - "step": 38318 - }, - { - "epoch": 0.98, - "learning_rate": 1.570956814925805e-06, - "loss": 0.7861, - "step": 38319 - }, - { - "epoch": 0.98, - "learning_rate": 1.5709340978153768e-06, - "loss": 0.7061, - "step": 38320 - }, - { - "epoch": 0.98, - "learning_rate": 1.5709113802678103e-06, - "loss": 1.0, - "step": 38321 - }, - { - "epoch": 0.98, - "learning_rate": 1.5708886622831238e-06, - "loss": 0.8052, - "step": 38322 - }, - { - "epoch": 0.98, - "learning_rate": 1.5708659438613335e-06, - "loss": 0.8008, - "step": 38323 - }, - { - "epoch": 0.98, - "learning_rate": 1.5708432250024575e-06, - "loss": 1.0107, - "step": 38324 - }, - { - "epoch": 0.98, - "learning_rate": 1.5708205057065134e-06, - "loss": 0.6838, - "step": 38325 - }, - { - "epoch": 0.98, - "learning_rate": 1.570797785973518e-06, - "loss": 1.002, - "step": 38326 - }, - { - "epoch": 0.98, - "learning_rate": 1.570775065803489e-06, - "loss": 0.7273, - "step": 38327 - }, - { - "epoch": 0.98, - "learning_rate": 1.570752345196444e-06, - "loss": 0.7148, - "step": 38328 - }, - { - "epoch": 0.98, - "learning_rate": 1.5707296241524e-06, - "loss": 0.7422, - "step": 38329 - }, - { - "epoch": 0.98, - "learning_rate": 1.5707069026713743e-06, - "loss": 0.9385, - "step": 38330 - }, - { - "epoch": 0.98, - "learning_rate": 1.570684180753385e-06, - "loss": 0.9863, - "step": 38331 - }, - { - "epoch": 0.98, - "learning_rate": 1.570661458398449e-06, - "loss": 0.8223, - "step": 38332 - }, - { - "epoch": 0.98, - "learning_rate": 1.5706387356065839e-06, - "loss": 0.7622, - "step": 38333 - }, - { - "epoch": 0.98, - "learning_rate": 1.5706160123778065e-06, - "loss": 0.791, - "step": 38334 - }, - { - "epoch": 0.98, - "learning_rate": 1.570593288712135e-06, - "loss": 0.7979, - "step": 38335 - }, - { - "epoch": 0.98, - "learning_rate": 1.570570564609586e-06, - "loss": 0.6597, - "step": 38336 - }, - { - "epoch": 0.98, - "learning_rate": 1.570547840070178e-06, - "loss": 0.8115, - "step": 38337 - }, - { - "epoch": 0.98, - "learning_rate": 1.5705251150939277e-06, - "loss": 0.8945, - "step": 38338 - }, - { - "epoch": 0.98, - "learning_rate": 1.570502389680852e-06, - "loss": 0.7476, - "step": 38339 - }, - { - "epoch": 0.98, - "learning_rate": 1.5704796638309692e-06, - "loss": 0.7324, - "step": 38340 - }, - { - "epoch": 0.98, - "learning_rate": 1.5704569375442964e-06, - "loss": 0.7393, - "step": 38341 - }, - { - "epoch": 0.98, - "learning_rate": 1.570434210820851e-06, - "loss": 0.769, - "step": 38342 - }, - { - "epoch": 0.98, - "learning_rate": 1.5704114836606502e-06, - "loss": 0.6943, - "step": 38343 - }, - { - "epoch": 0.98, - "learning_rate": 1.5703887560637114e-06, - "loss": 0.79, - "step": 38344 - }, - { - "epoch": 0.98, - "learning_rate": 1.5703660280300523e-06, - "loss": 0.8711, - "step": 38345 - }, - { - "epoch": 0.98, - "learning_rate": 1.5703432995596902e-06, - "loss": 1.0479, - "step": 38346 - }, - { - "epoch": 0.98, - "learning_rate": 1.5703205706526426e-06, - "loss": 0.73, - "step": 38347 - }, - { - "epoch": 0.98, - "learning_rate": 1.5702978413089266e-06, - "loss": 0.8047, - "step": 38348 - }, - { - "epoch": 0.98, - "learning_rate": 1.5702751115285598e-06, - "loss": 1.0039, - "step": 38349 - }, - { - "epoch": 0.98, - "learning_rate": 1.5702523813115597e-06, - "loss": 1.0044, - "step": 38350 - }, - { - "epoch": 0.98, - "learning_rate": 1.5702296506579434e-06, - "loss": 0.8525, - "step": 38351 - }, - { - "epoch": 0.98, - "learning_rate": 1.5702069195677283e-06, - "loss": 0.7026, - "step": 38352 - }, - { - "epoch": 0.98, - "learning_rate": 1.5701841880409323e-06, - "loss": 0.8086, - "step": 38353 - }, - { - "epoch": 0.98, - "learning_rate": 1.5701614560775723e-06, - "loss": 0.6416, - "step": 38354 - }, - { - "epoch": 0.98, - "learning_rate": 1.570138723677666e-06, - "loss": 0.9971, - "step": 38355 - }, - { - "epoch": 0.98, - "learning_rate": 1.5701159908412308e-06, - "loss": 0.6875, - "step": 38356 - }, - { - "epoch": 0.98, - "learning_rate": 1.5700932575682837e-06, - "loss": 0.917, - "step": 38357 - }, - { - "epoch": 0.98, - "learning_rate": 1.5700705238588426e-06, - "loss": 1.0078, - "step": 38358 - }, - { - "epoch": 0.98, - "learning_rate": 1.5700477897129246e-06, - "loss": 0.7783, - "step": 38359 - }, - { - "epoch": 0.98, - "learning_rate": 1.5700250551305474e-06, - "loss": 0.708, - "step": 38360 - }, - { - "epoch": 0.98, - "learning_rate": 1.5700023201117278e-06, - "loss": 0.9551, - "step": 38361 - }, - { - "epoch": 0.98, - "learning_rate": 1.5699795846564843e-06, - "loss": 0.7583, - "step": 38362 - }, - { - "epoch": 0.98, - "learning_rate": 1.5699568487648334e-06, - "loss": 0.8159, - "step": 38363 - }, - { - "epoch": 0.98, - "learning_rate": 1.5699341124367925e-06, - "loss": 1.0186, - "step": 38364 - }, - { - "epoch": 0.98, - "learning_rate": 1.5699113756723793e-06, - "loss": 0.8984, - "step": 38365 - }, - { - "epoch": 0.98, - "learning_rate": 1.5698886384716113e-06, - "loss": 0.8662, - "step": 38366 - }, - { - "epoch": 0.98, - "learning_rate": 1.5698659008345057e-06, - "loss": 0.7686, - "step": 38367 - }, - { - "epoch": 0.98, - "learning_rate": 1.5698431627610801e-06, - "loss": 0.7871, - "step": 38368 - }, - { - "epoch": 0.98, - "learning_rate": 1.5698204242513517e-06, - "loss": 1.0469, - "step": 38369 - }, - { - "epoch": 0.98, - "learning_rate": 1.569797685305338e-06, - "loss": 0.7803, - "step": 38370 - }, - { - "epoch": 0.98, - "learning_rate": 1.5697749459230565e-06, - "loss": 0.9648, - "step": 38371 - }, - { - "epoch": 0.98, - "learning_rate": 1.5697522061045243e-06, - "loss": 0.7451, - "step": 38372 - }, - { - "epoch": 0.98, - "learning_rate": 1.5697294658497594e-06, - "loss": 1.0557, - "step": 38373 - }, - { - "epoch": 0.98, - "learning_rate": 1.5697067251587784e-06, - "loss": 0.6348, - "step": 38374 - }, - { - "epoch": 0.98, - "learning_rate": 1.5696839840315993e-06, - "loss": 0.6748, - "step": 38375 - }, - { - "epoch": 0.98, - "learning_rate": 1.5696612424682396e-06, - "loss": 0.8965, - "step": 38376 - }, - { - "epoch": 0.98, - "learning_rate": 1.5696385004687166e-06, - "loss": 0.7583, - "step": 38377 - }, - { - "epoch": 0.98, - "learning_rate": 1.5696157580330472e-06, - "loss": 0.8779, - "step": 38378 - }, - { - "epoch": 0.98, - "learning_rate": 1.5695930151612492e-06, - "loss": 0.8535, - "step": 38379 - }, - { - "epoch": 0.98, - "learning_rate": 1.5695702718533402e-06, - "loss": 0.9141, - "step": 38380 - }, - { - "epoch": 0.98, - "learning_rate": 1.5695475281093373e-06, - "loss": 1.0098, - "step": 38381 - }, - { - "epoch": 0.98, - "learning_rate": 1.5695247839292582e-06, - "loss": 0.6743, - "step": 38382 - }, - { - "epoch": 0.98, - "learning_rate": 1.5695020393131202e-06, - "loss": 0.9971, - "step": 38383 - }, - { - "epoch": 0.98, - "learning_rate": 1.5694792942609402e-06, - "loss": 0.7417, - "step": 38384 - }, - { - "epoch": 0.98, - "learning_rate": 1.5694565487727366e-06, - "loss": 0.7988, - "step": 38385 - }, - { - "epoch": 0.98, - "learning_rate": 1.569433802848526e-06, - "loss": 0.8047, - "step": 38386 - }, - { - "epoch": 0.98, - "learning_rate": 1.5694110564883266e-06, - "loss": 0.9746, - "step": 38387 - }, - { - "epoch": 0.98, - "learning_rate": 1.5693883096921549e-06, - "loss": 0.9355, - "step": 38388 - }, - { - "epoch": 0.98, - "learning_rate": 1.5693655624600289e-06, - "loss": 0.5088, - "step": 38389 - }, - { - "epoch": 0.98, - "learning_rate": 1.5693428147919657e-06, - "loss": 0.8184, - "step": 38390 - }, - { - "epoch": 0.98, - "learning_rate": 1.569320066687983e-06, - "loss": 0.9277, - "step": 38391 - }, - { - "epoch": 0.98, - "learning_rate": 1.5692973181480982e-06, - "loss": 0.5264, - "step": 38392 - }, - { - "epoch": 0.98, - "learning_rate": 1.5692745691723286e-06, - "loss": 0.8086, - "step": 38393 - }, - { - "epoch": 0.98, - "learning_rate": 1.5692518197606917e-06, - "loss": 0.8359, - "step": 38394 - }, - { - "epoch": 0.98, - "learning_rate": 1.5692290699132045e-06, - "loss": 0.9863, - "step": 38395 - }, - { - "epoch": 0.98, - "learning_rate": 1.569206319629885e-06, - "loss": 0.8828, - "step": 38396 - }, - { - "epoch": 0.98, - "learning_rate": 1.5691835689107506e-06, - "loss": 0.8701, - "step": 38397 - }, - { - "epoch": 0.98, - "learning_rate": 1.5691608177558183e-06, - "loss": 0.7808, - "step": 38398 - }, - { - "epoch": 0.98, - "learning_rate": 1.569138066165106e-06, - "loss": 0.8125, - "step": 38399 - }, - { - "epoch": 0.98, - "learning_rate": 1.5691153141386303e-06, - "loss": 0.7686, - "step": 38400 - }, - { - "epoch": 0.98, - "learning_rate": 1.5690925616764095e-06, - "loss": 0.6494, - "step": 38401 - }, - { - "epoch": 0.98, - "learning_rate": 1.5690698087784609e-06, - "loss": 1.0742, - "step": 38402 - }, - { - "epoch": 0.98, - "learning_rate": 1.5690470554448014e-06, - "loss": 0.5983, - "step": 38403 - }, - { - "epoch": 0.98, - "learning_rate": 1.5690243016754487e-06, - "loss": 0.9248, - "step": 38404 - }, - { - "epoch": 0.98, - "learning_rate": 1.5690015474704204e-06, - "loss": 0.9082, - "step": 38405 - }, - { - "epoch": 0.98, - "learning_rate": 1.5689787928297339e-06, - "loss": 0.7773, - "step": 38406 - }, - { - "epoch": 0.98, - "learning_rate": 1.5689560377534062e-06, - "loss": 0.8423, - "step": 38407 - }, - { - "epoch": 0.98, - "learning_rate": 1.5689332822414552e-06, - "loss": 0.9365, - "step": 38408 - }, - { - "epoch": 0.98, - "learning_rate": 1.568910526293898e-06, - "loss": 0.7803, - "step": 38409 - }, - { - "epoch": 0.98, - "learning_rate": 1.5688877699107524e-06, - "loss": 0.7271, - "step": 38410 - }, - { - "epoch": 0.98, - "learning_rate": 1.5688650130920354e-06, - "loss": 0.915, - "step": 38411 - }, - { - "epoch": 0.98, - "learning_rate": 1.5688422558377647e-06, - "loss": 0.998, - "step": 38412 - }, - { - "epoch": 0.98, - "learning_rate": 1.568819498147958e-06, - "loss": 1.001, - "step": 38413 - }, - { - "epoch": 0.98, - "learning_rate": 1.5687967400226318e-06, - "loss": 0.812, - "step": 38414 - }, - { - "epoch": 0.98, - "learning_rate": 1.5687739814618041e-06, - "loss": 0.9219, - "step": 38415 - }, - { - "epoch": 0.98, - "learning_rate": 1.5687512224654927e-06, - "loss": 0.8408, - "step": 38416 - }, - { - "epoch": 0.98, - "learning_rate": 1.5687284630337146e-06, - "loss": 0.7715, - "step": 38417 - }, - { - "epoch": 0.98, - "learning_rate": 1.568705703166487e-06, - "loss": 0.7324, - "step": 38418 - }, - { - "epoch": 0.98, - "learning_rate": 1.5686829428638278e-06, - "loss": 0.9561, - "step": 38419 - }, - { - "epoch": 0.98, - "learning_rate": 1.568660182125754e-06, - "loss": 0.7686, - "step": 38420 - }, - { - "epoch": 0.98, - "learning_rate": 1.5686374209522835e-06, - "loss": 0.9678, - "step": 38421 - }, - { - "epoch": 0.98, - "learning_rate": 1.5686146593434333e-06, - "loss": 0.8633, - "step": 38422 - }, - { - "epoch": 0.98, - "learning_rate": 1.568591897299221e-06, - "loss": 0.9053, - "step": 38423 - }, - { - "epoch": 0.98, - "learning_rate": 1.568569134819664e-06, - "loss": 0.7866, - "step": 38424 - }, - { - "epoch": 0.98, - "learning_rate": 1.5685463719047797e-06, - "loss": 0.7466, - "step": 38425 - }, - { - "epoch": 0.98, - "learning_rate": 1.568523608554586e-06, - "loss": 0.8428, - "step": 38426 - }, - { - "epoch": 0.98, - "learning_rate": 1.5685008447690998e-06, - "loss": 0.7251, - "step": 38427 - }, - { - "epoch": 0.98, - "learning_rate": 1.5684780805483384e-06, - "loss": 1.2061, - "step": 38428 - }, - { - "epoch": 0.98, - "learning_rate": 1.5684553158923195e-06, - "loss": 0.8682, - "step": 38429 - }, - { - "epoch": 0.98, - "learning_rate": 1.5684325508010602e-06, - "loss": 0.7432, - "step": 38430 - }, - { - "epoch": 0.99, - "learning_rate": 1.5684097852745788e-06, - "loss": 0.9199, - "step": 38431 - }, - { - "epoch": 0.99, - "learning_rate": 1.568387019312892e-06, - "loss": 0.8911, - "step": 38432 - }, - { - "epoch": 0.99, - "learning_rate": 1.5683642529160172e-06, - "loss": 0.8652, - "step": 38433 - }, - { - "epoch": 0.99, - "learning_rate": 1.5683414860839723e-06, - "loss": 0.875, - "step": 38434 - }, - { - "epoch": 0.99, - "learning_rate": 1.5683187188167744e-06, - "loss": 0.8047, - "step": 38435 - }, - { - "epoch": 0.99, - "learning_rate": 1.5682959511144408e-06, - "loss": 0.6816, - "step": 38436 - }, - { - "epoch": 0.99, - "learning_rate": 1.5682731829769896e-06, - "loss": 0.7412, - "step": 38437 - }, - { - "epoch": 0.99, - "learning_rate": 1.5682504144044373e-06, - "loss": 1.0732, - "step": 38438 - }, - { - "epoch": 0.99, - "learning_rate": 1.5682276453968018e-06, - "loss": 0.8916, - "step": 38439 - }, - { - "epoch": 0.99, - "learning_rate": 1.5682048759541005e-06, - "loss": 0.9248, - "step": 38440 - }, - { - "epoch": 0.99, - "learning_rate": 1.5681821060763509e-06, - "loss": 0.748, - "step": 38441 - }, - { - "epoch": 0.99, - "learning_rate": 1.5681593357635708e-06, - "loss": 0.7773, - "step": 38442 - }, - { - "epoch": 0.99, - "learning_rate": 1.5681365650157767e-06, - "loss": 0.8599, - "step": 38443 - }, - { - "epoch": 0.99, - "learning_rate": 1.5681137938329866e-06, - "loss": 1.085, - "step": 38444 - }, - { - "epoch": 0.99, - "learning_rate": 1.5680910222152178e-06, - "loss": 0.9639, - "step": 38445 - }, - { - "epoch": 0.99, - "learning_rate": 1.5680682501624883e-06, - "loss": 0.8867, - "step": 38446 - }, - { - "epoch": 0.99, - "learning_rate": 1.5680454776748148e-06, - "loss": 0.6777, - "step": 38447 - }, - { - "epoch": 0.99, - "learning_rate": 1.568022704752215e-06, - "loss": 0.8232, - "step": 38448 - }, - { - "epoch": 0.99, - "learning_rate": 1.5679999313947063e-06, - "loss": 1.0078, - "step": 38449 - }, - { - "epoch": 0.99, - "learning_rate": 1.5679771576023062e-06, - "loss": 0.6704, - "step": 38450 - }, - { - "epoch": 0.99, - "learning_rate": 1.567954383375032e-06, - "loss": 0.6611, - "step": 38451 - }, - { - "epoch": 0.99, - "learning_rate": 1.5679316087129016e-06, - "loss": 0.835, - "step": 38452 - }, - { - "epoch": 0.99, - "learning_rate": 1.5679088336159319e-06, - "loss": 0.6758, - "step": 38453 - }, - { - "epoch": 0.99, - "learning_rate": 1.5678860580841401e-06, - "loss": 0.9824, - "step": 38454 - }, - { - "epoch": 0.99, - "learning_rate": 1.5678632821175445e-06, - "loss": 0.7949, - "step": 38455 - }, - { - "epoch": 0.99, - "learning_rate": 1.567840505716162e-06, - "loss": 0.9229, - "step": 38456 - }, - { - "epoch": 0.99, - "learning_rate": 1.5678177288800103e-06, - "loss": 0.9492, - "step": 38457 - }, - { - "epoch": 0.99, - "learning_rate": 1.5677949516091065e-06, - "loss": 0.6704, - "step": 38458 - }, - { - "epoch": 0.99, - "learning_rate": 1.5677721739034682e-06, - "loss": 0.9639, - "step": 38459 - }, - { - "epoch": 0.99, - "learning_rate": 1.567749395763113e-06, - "loss": 0.9395, - "step": 38460 - }, - { - "epoch": 0.99, - "learning_rate": 1.567726617188058e-06, - "loss": 0.75, - "step": 38461 - }, - { - "epoch": 0.99, - "learning_rate": 1.567703838178321e-06, - "loss": 0.8057, - "step": 38462 - }, - { - "epoch": 0.99, - "learning_rate": 1.567681058733919e-06, - "loss": 0.8916, - "step": 38463 - }, - { - "epoch": 0.99, - "learning_rate": 1.56765827885487e-06, - "loss": 0.8091, - "step": 38464 - }, - { - "epoch": 0.99, - "learning_rate": 1.567635498541191e-06, - "loss": 0.7349, - "step": 38465 - }, - { - "epoch": 0.99, - "learning_rate": 1.5676127177928998e-06, - "loss": 0.8496, - "step": 38466 - }, - { - "epoch": 0.99, - "learning_rate": 1.5675899366100134e-06, - "loss": 0.8447, - "step": 38467 - }, - { - "epoch": 0.99, - "learning_rate": 1.5675671549925495e-06, - "loss": 0.877, - "step": 38468 - }, - { - "epoch": 0.99, - "learning_rate": 1.5675443729405257e-06, - "loss": 0.8203, - "step": 38469 - }, - { - "epoch": 0.99, - "learning_rate": 1.5675215904539593e-06, - "loss": 0.5381, - "step": 38470 - }, - { - "epoch": 0.99, - "learning_rate": 1.5674988075328674e-06, - "loss": 0.8047, - "step": 38471 - }, - { - "epoch": 0.99, - "learning_rate": 1.567476024177268e-06, - "loss": 0.8779, - "step": 38472 - }, - { - "epoch": 0.99, - "learning_rate": 1.5674532403871781e-06, - "loss": 0.792, - "step": 38473 - }, - { - "epoch": 0.99, - "learning_rate": 1.5674304561626155e-06, - "loss": 0.8223, - "step": 38474 - }, - { - "epoch": 0.99, - "learning_rate": 1.5674076715035975e-06, - "loss": 0.6729, - "step": 38475 - }, - { - "epoch": 0.99, - "learning_rate": 1.5673848864101417e-06, - "loss": 1.0166, - "step": 38476 - }, - { - "epoch": 0.99, - "learning_rate": 1.5673621008822653e-06, - "loss": 0.9136, - "step": 38477 - }, - { - "epoch": 0.99, - "learning_rate": 1.5673393149199857e-06, - "loss": 0.8896, - "step": 38478 - }, - { - "epoch": 0.99, - "learning_rate": 1.5673165285233205e-06, - "loss": 0.6567, - "step": 38479 - }, - { - "epoch": 0.99, - "learning_rate": 1.5672937416922869e-06, - "loss": 0.9805, - "step": 38480 - }, - { - "epoch": 0.99, - "learning_rate": 1.567270954426903e-06, - "loss": 0.9561, - "step": 38481 - }, - { - "epoch": 0.99, - "learning_rate": 1.5672481667271854e-06, - "loss": 0.9385, - "step": 38482 - }, - { - "epoch": 0.99, - "learning_rate": 1.5672253785931523e-06, - "loss": 0.9688, - "step": 38483 - }, - { - "epoch": 0.99, - "learning_rate": 1.5672025900248207e-06, - "loss": 1.0107, - "step": 38484 - }, - { - "epoch": 0.99, - "learning_rate": 1.5671798010222078e-06, - "loss": 0.8418, - "step": 38485 - }, - { - "epoch": 0.99, - "learning_rate": 1.5671570115853322e-06, - "loss": 0.7305, - "step": 38486 - }, - { - "epoch": 0.99, - "learning_rate": 1.5671342217142099e-06, - "loss": 0.9521, - "step": 38487 - }, - { - "epoch": 0.99, - "learning_rate": 1.5671114314088595e-06, - "loss": 0.792, - "step": 38488 - }, - { - "epoch": 0.99, - "learning_rate": 1.5670886406692976e-06, - "loss": 0.5576, - "step": 38489 - }, - { - "epoch": 0.99, - "learning_rate": 1.5670658494955417e-06, - "loss": 0.6206, - "step": 38490 - }, - { - "epoch": 0.99, - "learning_rate": 1.56704305788761e-06, - "loss": 0.8447, - "step": 38491 - }, - { - "epoch": 0.99, - "learning_rate": 1.5670202658455196e-06, - "loss": 1.0352, - "step": 38492 - }, - { - "epoch": 0.99, - "learning_rate": 1.5669974733692876e-06, - "loss": 0.769, - "step": 38493 - }, - { - "epoch": 0.99, - "learning_rate": 1.5669746804589316e-06, - "loss": 0.8105, - "step": 38494 - }, - { - "epoch": 0.99, - "learning_rate": 1.5669518871144694e-06, - "loss": 0.8545, - "step": 38495 - }, - { - "epoch": 0.99, - "learning_rate": 1.566929093335918e-06, - "loss": 0.8438, - "step": 38496 - }, - { - "epoch": 0.99, - "learning_rate": 1.5669062991232952e-06, - "loss": 0.791, - "step": 38497 - }, - { - "epoch": 0.99, - "learning_rate": 1.5668835044766185e-06, - "loss": 0.8018, - "step": 38498 - }, - { - "epoch": 0.99, - "learning_rate": 1.566860709395905e-06, - "loss": 0.8867, - "step": 38499 - }, - { - "epoch": 0.99, - "learning_rate": 1.5668379138811722e-06, - "loss": 0.8525, - "step": 38500 - }, - { - "epoch": 0.99, - "learning_rate": 1.5668151179324379e-06, - "loss": 0.7979, - "step": 38501 - }, - { - "epoch": 0.99, - "learning_rate": 1.5667923215497193e-06, - "loss": 0.9297, - "step": 38502 - }, - { - "epoch": 0.99, - "learning_rate": 1.5667695247330337e-06, - "loss": 0.8162, - "step": 38503 - }, - { - "epoch": 0.99, - "learning_rate": 1.566746727482399e-06, - "loss": 0.9038, - "step": 38504 - }, - { - "epoch": 0.99, - "learning_rate": 1.566723929797832e-06, - "loss": 0.8145, - "step": 38505 - }, - { - "epoch": 0.99, - "learning_rate": 1.5667011316793506e-06, - "loss": 0.8125, - "step": 38506 - }, - { - "epoch": 0.99, - "learning_rate": 1.5666783331269726e-06, - "loss": 0.791, - "step": 38507 - }, - { - "epoch": 0.99, - "learning_rate": 1.5666555341407149e-06, - "loss": 0.6934, - "step": 38508 - }, - { - "epoch": 0.99, - "learning_rate": 1.5666327347205948e-06, - "loss": 1.0039, - "step": 38509 - }, - { - "epoch": 0.99, - "learning_rate": 1.5666099348666303e-06, - "loss": 0.6226, - "step": 38510 - }, - { - "epoch": 0.99, - "learning_rate": 1.5665871345788387e-06, - "loss": 0.8145, - "step": 38511 - }, - { - "epoch": 0.99, - "learning_rate": 1.5665643338572374e-06, - "loss": 0.897, - "step": 38512 - }, - { - "epoch": 0.99, - "learning_rate": 1.5665415327018437e-06, - "loss": 0.9961, - "step": 38513 - }, - { - "epoch": 0.99, - "learning_rate": 1.566518731112675e-06, - "loss": 0.8848, - "step": 38514 - }, - { - "epoch": 0.99, - "learning_rate": 1.5664959290897492e-06, - "loss": 0.6782, - "step": 38515 - }, - { - "epoch": 0.99, - "learning_rate": 1.5664731266330837e-06, - "loss": 0.5479, - "step": 38516 - }, - { - "epoch": 0.99, - "learning_rate": 1.5664503237426955e-06, - "loss": 0.7451, - "step": 38517 - }, - { - "epoch": 0.99, - "learning_rate": 1.5664275204186024e-06, - "loss": 0.6167, - "step": 38518 - }, - { - "epoch": 0.99, - "learning_rate": 1.5664047166608218e-06, - "loss": 0.9746, - "step": 38519 - }, - { - "epoch": 0.99, - "learning_rate": 1.5663819124693714e-06, - "loss": 0.8147, - "step": 38520 - }, - { - "epoch": 0.99, - "learning_rate": 1.566359107844268e-06, - "loss": 0.96, - "step": 38521 - }, - { - "epoch": 0.99, - "learning_rate": 1.5663363027855296e-06, - "loss": 0.9385, - "step": 38522 - }, - { - "epoch": 0.99, - "learning_rate": 1.5663134972931736e-06, - "loss": 0.7959, - "step": 38523 - }, - { - "epoch": 0.99, - "learning_rate": 1.5662906913672175e-06, - "loss": 1.0303, - "step": 38524 - }, - { - "epoch": 0.99, - "learning_rate": 1.5662678850076786e-06, - "loss": 0.7432, - "step": 38525 - }, - { - "epoch": 0.99, - "learning_rate": 1.5662450782145742e-06, - "loss": 0.7871, - "step": 38526 - }, - { - "epoch": 0.99, - "learning_rate": 1.5662222709879225e-06, - "loss": 0.9814, - "step": 38527 - }, - { - "epoch": 0.99, - "learning_rate": 1.5661994633277397e-06, - "loss": 0.8848, - "step": 38528 - }, - { - "epoch": 0.99, - "learning_rate": 1.5661766552340446e-06, - "loss": 0.8477, - "step": 38529 - }, - { - "epoch": 0.99, - "learning_rate": 1.5661538467068539e-06, - "loss": 0.877, - "step": 38530 - }, - { - "epoch": 0.99, - "learning_rate": 1.5661310377461852e-06, - "loss": 0.6816, - "step": 38531 - }, - { - "epoch": 0.99, - "learning_rate": 1.5661082283520558e-06, - "loss": 0.9775, - "step": 38532 - }, - { - "epoch": 0.99, - "learning_rate": 1.5660854185244836e-06, - "loss": 0.7456, - "step": 38533 - }, - { - "epoch": 0.99, - "learning_rate": 1.5660626082634857e-06, - "loss": 0.8359, - "step": 38534 - }, - { - "epoch": 0.99, - "learning_rate": 1.5660397975690797e-06, - "loss": 0.7119, - "step": 38535 - }, - { - "epoch": 0.99, - "learning_rate": 1.5660169864412831e-06, - "loss": 0.791, - "step": 38536 - }, - { - "epoch": 0.99, - "learning_rate": 1.5659941748801136e-06, - "loss": 0.998, - "step": 38537 - }, - { - "epoch": 0.99, - "learning_rate": 1.565971362885588e-06, - "loss": 0.7549, - "step": 38538 - }, - { - "epoch": 0.99, - "learning_rate": 1.5659485504577244e-06, - "loss": 0.7295, - "step": 38539 - }, - { - "epoch": 0.99, - "learning_rate": 1.5659257375965399e-06, - "loss": 0.6475, - "step": 38540 - }, - { - "epoch": 0.99, - "learning_rate": 1.5659029243020519e-06, - "loss": 0.8608, - "step": 38541 - }, - { - "epoch": 0.99, - "learning_rate": 1.5658801105742784e-06, - "loss": 0.6169, - "step": 38542 - }, - { - "epoch": 0.99, - "learning_rate": 1.5658572964132363e-06, - "loss": 0.7083, - "step": 38543 - }, - { - "epoch": 0.99, - "learning_rate": 1.5658344818189432e-06, - "loss": 0.9756, - "step": 38544 - }, - { - "epoch": 0.99, - "learning_rate": 1.5658116667914168e-06, - "loss": 0.7803, - "step": 38545 - }, - { - "epoch": 0.99, - "learning_rate": 1.5657888513306743e-06, - "loss": 0.793, - "step": 38546 - }, - { - "epoch": 0.99, - "learning_rate": 1.5657660354367334e-06, - "loss": 0.9854, - "step": 38547 - }, - { - "epoch": 0.99, - "learning_rate": 1.5657432191096116e-06, - "loss": 1.0713, - "step": 38548 - }, - { - "epoch": 0.99, - "learning_rate": 1.565720402349326e-06, - "loss": 0.9355, - "step": 38549 - }, - { - "epoch": 0.99, - "learning_rate": 1.5656975851558944e-06, - "loss": 0.8467, - "step": 38550 - }, - { - "epoch": 0.99, - "learning_rate": 1.5656747675293343e-06, - "loss": 0.9287, - "step": 38551 - }, - { - "epoch": 0.99, - "learning_rate": 1.5656519494696628e-06, - "loss": 0.8145, - "step": 38552 - }, - { - "epoch": 0.99, - "learning_rate": 1.5656291309768976e-06, - "loss": 1.1738, - "step": 38553 - }, - { - "epoch": 0.99, - "learning_rate": 1.5656063120510563e-06, - "loss": 0.9355, - "step": 38554 - }, - { - "epoch": 0.99, - "learning_rate": 1.5655834926921565e-06, - "loss": 0.8701, - "step": 38555 - }, - { - "epoch": 0.99, - "learning_rate": 1.5655606729002151e-06, - "loss": 0.5642, - "step": 38556 - }, - { - "epoch": 0.99, - "learning_rate": 1.5655378526752498e-06, - "loss": 0.7852, - "step": 38557 - }, - { - "epoch": 0.99, - "learning_rate": 1.5655150320172786e-06, - "loss": 0.7529, - "step": 38558 - }, - { - "epoch": 0.99, - "learning_rate": 1.565492210926318e-06, - "loss": 0.6914, - "step": 38559 - }, - { - "epoch": 0.99, - "learning_rate": 1.5654693894023865e-06, - "loss": 0.8389, - "step": 38560 - }, - { - "epoch": 0.99, - "learning_rate": 1.565446567445501e-06, - "loss": 0.7822, - "step": 38561 - }, - { - "epoch": 0.99, - "learning_rate": 1.5654237450556788e-06, - "loss": 0.8389, - "step": 38562 - }, - { - "epoch": 0.99, - "learning_rate": 1.565400922232938e-06, - "loss": 0.6885, - "step": 38563 - }, - { - "epoch": 0.99, - "learning_rate": 1.565378098977295e-06, - "loss": 1.1318, - "step": 38564 - }, - { - "epoch": 0.99, - "learning_rate": 1.565355275288769e-06, - "loss": 0.8184, - "step": 38565 - }, - { - "epoch": 0.99, - "learning_rate": 1.565332451167376e-06, - "loss": 1.0, - "step": 38566 - }, - { - "epoch": 0.99, - "learning_rate": 1.5653096266131337e-06, - "loss": 0.9111, - "step": 38567 - }, - { - "epoch": 0.99, - "learning_rate": 1.56528680162606e-06, - "loss": 0.9062, - "step": 38568 - }, - { - "epoch": 0.99, - "learning_rate": 1.5652639762061721e-06, - "loss": 0.8721, - "step": 38569 - }, - { - "epoch": 0.99, - "learning_rate": 1.5652411503534876e-06, - "loss": 0.7454, - "step": 38570 - }, - { - "epoch": 0.99, - "learning_rate": 1.5652183240680242e-06, - "loss": 0.8018, - "step": 38571 - }, - { - "epoch": 0.99, - "learning_rate": 1.565195497349799e-06, - "loss": 0.9316, - "step": 38572 - }, - { - "epoch": 0.99, - "learning_rate": 1.5651726701988292e-06, - "loss": 0.7725, - "step": 38573 - }, - { - "epoch": 0.99, - "learning_rate": 1.5651498426151331e-06, - "loss": 0.8408, - "step": 38574 - }, - { - "epoch": 0.99, - "learning_rate": 1.5651270145987276e-06, - "loss": 0.9658, - "step": 38575 - }, - { - "epoch": 0.99, - "learning_rate": 1.5651041861496305e-06, - "loss": 0.6729, - "step": 38576 - }, - { - "epoch": 0.99, - "learning_rate": 1.565081357267859e-06, - "loss": 0.8584, - "step": 38577 - }, - { - "epoch": 0.99, - "learning_rate": 1.5650585279534307e-06, - "loss": 0.8115, - "step": 38578 - }, - { - "epoch": 0.99, - "learning_rate": 1.5650356982063628e-06, - "loss": 0.9619, - "step": 38579 - }, - { - "epoch": 0.99, - "learning_rate": 1.5650128680266734e-06, - "loss": 0.9727, - "step": 38580 - }, - { - "epoch": 0.99, - "learning_rate": 1.5649900374143793e-06, - "loss": 0.7705, - "step": 38581 - }, - { - "epoch": 0.99, - "learning_rate": 1.5649672063694987e-06, - "loss": 0.8799, - "step": 38582 - }, - { - "epoch": 0.99, - "learning_rate": 1.5649443748920486e-06, - "loss": 0.7278, - "step": 38583 - }, - { - "epoch": 0.99, - "learning_rate": 1.5649215429820464e-06, - "loss": 0.6978, - "step": 38584 - }, - { - "epoch": 0.99, - "learning_rate": 1.5648987106395097e-06, - "loss": 0.8701, - "step": 38585 - }, - { - "epoch": 0.99, - "learning_rate": 1.5648758778644563e-06, - "loss": 1.0361, - "step": 38586 - }, - { - "epoch": 0.99, - "learning_rate": 1.5648530446569032e-06, - "loss": 0.8779, - "step": 38587 - }, - { - "epoch": 0.99, - "learning_rate": 1.564830211016868e-06, - "loss": 0.7095, - "step": 38588 - }, - { - "epoch": 0.99, - "learning_rate": 1.5648073769443686e-06, - "loss": 0.7334, - "step": 38589 - }, - { - "epoch": 0.99, - "learning_rate": 1.564784542439422e-06, - "loss": 0.9375, - "step": 38590 - }, - { - "epoch": 0.99, - "learning_rate": 1.564761707502046e-06, - "loss": 1.0703, - "step": 38591 - }, - { - "epoch": 0.99, - "learning_rate": 1.5647388721322576e-06, - "loss": 0.4651, - "step": 38592 - }, - { - "epoch": 0.99, - "learning_rate": 1.564716036330075e-06, - "loss": 0.7324, - "step": 38593 - }, - { - "epoch": 0.99, - "learning_rate": 1.564693200095515e-06, - "loss": 1.083, - "step": 38594 - }, - { - "epoch": 0.99, - "learning_rate": 1.5646703634285953e-06, - "loss": 1.0703, - "step": 38595 - }, - { - "epoch": 0.99, - "learning_rate": 1.5646475263293337e-06, - "loss": 0.874, - "step": 38596 - }, - { - "epoch": 0.99, - "learning_rate": 1.5646246887977475e-06, - "loss": 0.8667, - "step": 38597 - }, - { - "epoch": 0.99, - "learning_rate": 1.5646018508338541e-06, - "loss": 0.9277, - "step": 38598 - }, - { - "epoch": 0.99, - "learning_rate": 1.564579012437671e-06, - "loss": 0.7305, - "step": 38599 - }, - { - "epoch": 0.99, - "learning_rate": 1.5645561736092155e-06, - "loss": 0.9014, - "step": 38600 - }, - { - "epoch": 0.99, - "learning_rate": 1.5645333343485056e-06, - "loss": 0.8291, - "step": 38601 - }, - { - "epoch": 0.99, - "learning_rate": 1.5645104946555581e-06, - "loss": 1.0498, - "step": 38602 - }, - { - "epoch": 0.99, - "learning_rate": 1.5644876545303914e-06, - "loss": 0.9238, - "step": 38603 - }, - { - "epoch": 0.99, - "learning_rate": 1.5644648139730219e-06, - "loss": 1.0674, - "step": 38604 - }, - { - "epoch": 0.99, - "learning_rate": 1.564441972983468e-06, - "loss": 0.8564, - "step": 38605 - }, - { - "epoch": 0.99, - "learning_rate": 1.5644191315617468e-06, - "loss": 0.7646, - "step": 38606 - }, - { - "epoch": 0.99, - "learning_rate": 1.5643962897078758e-06, - "loss": 0.6841, - "step": 38607 - }, - { - "epoch": 0.99, - "learning_rate": 1.5643734474218723e-06, - "loss": 0.8428, - "step": 38608 - }, - { - "epoch": 0.99, - "learning_rate": 1.5643506047037543e-06, - "loss": 0.9023, - "step": 38609 - }, - { - "epoch": 0.99, - "learning_rate": 1.5643277615535388e-06, - "loss": 0.8037, - "step": 38610 - }, - { - "epoch": 0.99, - "learning_rate": 1.5643049179712437e-06, - "loss": 0.7842, - "step": 38611 - }, - { - "epoch": 0.99, - "learning_rate": 1.5642820739568862e-06, - "loss": 0.8428, - "step": 38612 - }, - { - "epoch": 0.99, - "learning_rate": 1.5642592295104837e-06, - "loss": 0.731, - "step": 38613 - }, - { - "epoch": 0.99, - "learning_rate": 1.564236384632054e-06, - "loss": 0.8984, - "step": 38614 - }, - { - "epoch": 0.99, - "learning_rate": 1.5642135393216143e-06, - "loss": 0.8975, - "step": 38615 - }, - { - "epoch": 0.99, - "learning_rate": 1.5641906935791825e-06, - "loss": 0.7798, - "step": 38616 - }, - { - "epoch": 0.99, - "learning_rate": 1.5641678474047754e-06, - "loss": 0.7871, - "step": 38617 - }, - { - "epoch": 0.99, - "learning_rate": 1.5641450007984113e-06, - "loss": 0.7349, - "step": 38618 - }, - { - "epoch": 0.99, - "learning_rate": 1.5641221537601072e-06, - "loss": 0.8594, - "step": 38619 - }, - { - "epoch": 0.99, - "learning_rate": 1.5640993062898807e-06, - "loss": 0.9258, - "step": 38620 - }, - { - "epoch": 0.99, - "learning_rate": 1.5640764583877496e-06, - "loss": 0.9033, - "step": 38621 - }, - { - "epoch": 0.99, - "learning_rate": 1.5640536100537305e-06, - "loss": 0.5669, - "step": 38622 - }, - { - "epoch": 0.99, - "learning_rate": 1.5640307612878418e-06, - "loss": 0.7725, - "step": 38623 - }, - { - "epoch": 0.99, - "learning_rate": 1.5640079120901009e-06, - "loss": 0.7568, - "step": 38624 - }, - { - "epoch": 0.99, - "learning_rate": 1.5639850624605246e-06, - "loss": 0.4331, - "step": 38625 - }, - { - "epoch": 0.99, - "learning_rate": 1.5639622123991311e-06, - "loss": 0.876, - "step": 38626 - }, - { - "epoch": 0.99, - "learning_rate": 1.5639393619059377e-06, - "loss": 0.8037, - "step": 38627 - }, - { - "epoch": 0.99, - "learning_rate": 1.5639165109809617e-06, - "loss": 0.8423, - "step": 38628 - }, - { - "epoch": 0.99, - "learning_rate": 1.5638936596242209e-06, - "loss": 0.7329, - "step": 38629 - }, - { - "epoch": 0.99, - "learning_rate": 1.5638708078357325e-06, - "loss": 0.731, - "step": 38630 - }, - { - "epoch": 0.99, - "learning_rate": 1.5638479556155147e-06, - "loss": 0.8359, - "step": 38631 - }, - { - "epoch": 0.99, - "learning_rate": 1.5638251029635838e-06, - "loss": 0.6528, - "step": 38632 - }, - { - "epoch": 0.99, - "learning_rate": 1.5638022498799584e-06, - "loss": 0.7837, - "step": 38633 - }, - { - "epoch": 0.99, - "learning_rate": 1.563779396364655e-06, - "loss": 0.7617, - "step": 38634 - }, - { - "epoch": 0.99, - "learning_rate": 1.5637565424176921e-06, - "loss": 0.9209, - "step": 38635 - }, - { - "epoch": 0.99, - "learning_rate": 1.5637336880390867e-06, - "loss": 0.6646, - "step": 38636 - }, - { - "epoch": 0.99, - "learning_rate": 1.5637108332288562e-06, - "loss": 0.9062, - "step": 38637 - }, - { - "epoch": 0.99, - "learning_rate": 1.5636879779870183e-06, - "loss": 0.7021, - "step": 38638 - }, - { - "epoch": 0.99, - "learning_rate": 1.5636651223135903e-06, - "loss": 0.7568, - "step": 38639 - }, - { - "epoch": 0.99, - "learning_rate": 1.5636422662085899e-06, - "loss": 0.6958, - "step": 38640 - }, - { - "epoch": 0.99, - "learning_rate": 1.563619409672035e-06, - "loss": 0.9609, - "step": 38641 - }, - { - "epoch": 0.99, - "learning_rate": 1.5635965527039421e-06, - "loss": 0.8262, - "step": 38642 - }, - { - "epoch": 0.99, - "learning_rate": 1.5635736953043293e-06, - "loss": 0.8447, - "step": 38643 - }, - { - "epoch": 0.99, - "learning_rate": 1.563550837473214e-06, - "loss": 0.7207, - "step": 38644 - }, - { - "epoch": 0.99, - "learning_rate": 1.5635279792106138e-06, - "loss": 0.877, - "step": 38645 - }, - { - "epoch": 0.99, - "learning_rate": 1.5635051205165462e-06, - "loss": 0.8447, - "step": 38646 - }, - { - "epoch": 0.99, - "learning_rate": 1.5634822613910286e-06, - "loss": 0.9287, - "step": 38647 - }, - { - "epoch": 0.99, - "learning_rate": 1.5634594018340784e-06, - "loss": 0.8906, - "step": 38648 - }, - { - "epoch": 0.99, - "learning_rate": 1.5634365418457133e-06, - "loss": 0.8027, - "step": 38649 - }, - { - "epoch": 0.99, - "learning_rate": 1.563413681425951e-06, - "loss": 0.9658, - "step": 38650 - }, - { - "epoch": 0.99, - "learning_rate": 1.5633908205748085e-06, - "loss": 0.7349, - "step": 38651 - }, - { - "epoch": 0.99, - "learning_rate": 1.5633679592923037e-06, - "loss": 0.8359, - "step": 38652 - }, - { - "epoch": 0.99, - "learning_rate": 1.563345097578454e-06, - "loss": 0.7441, - "step": 38653 - }, - { - "epoch": 0.99, - "learning_rate": 1.5633222354332766e-06, - "loss": 0.9053, - "step": 38654 - }, - { - "epoch": 0.99, - "learning_rate": 1.5632993728567895e-06, - "loss": 1.0596, - "step": 38655 - }, - { - "epoch": 0.99, - "learning_rate": 1.5632765098490099e-06, - "loss": 0.9072, - "step": 38656 - }, - { - "epoch": 0.99, - "learning_rate": 1.5632536464099552e-06, - "loss": 0.9189, - "step": 38657 - }, - { - "epoch": 0.99, - "learning_rate": 1.5632307825396434e-06, - "loss": 0.7476, - "step": 38658 - }, - { - "epoch": 0.99, - "learning_rate": 1.5632079182380915e-06, - "loss": 0.751, - "step": 38659 - }, - { - "epoch": 0.99, - "learning_rate": 1.5631850535053172e-06, - "loss": 0.7214, - "step": 38660 - }, - { - "epoch": 0.99, - "learning_rate": 1.5631621883413382e-06, - "loss": 0.7881, - "step": 38661 - }, - { - "epoch": 0.99, - "learning_rate": 1.5631393227461715e-06, - "loss": 0.8369, - "step": 38662 - }, - { - "epoch": 0.99, - "learning_rate": 1.5631164567198352e-06, - "loss": 0.79, - "step": 38663 - }, - { - "epoch": 0.99, - "learning_rate": 1.5630935902623464e-06, - "loss": 0.8447, - "step": 38664 - }, - { - "epoch": 0.99, - "learning_rate": 1.5630707233737223e-06, - "loss": 0.8276, - "step": 38665 - }, - { - "epoch": 0.99, - "learning_rate": 1.5630478560539815e-06, - "loss": 0.7627, - "step": 38666 - }, - { - "epoch": 0.99, - "learning_rate": 1.5630249883031405e-06, - "loss": 0.8164, - "step": 38667 - }, - { - "epoch": 0.99, - "learning_rate": 1.5630021201212174e-06, - "loss": 0.8584, - "step": 38668 - }, - { - "epoch": 0.99, - "learning_rate": 1.5629792515082292e-06, - "loss": 0.5271, - "step": 38669 - }, - { - "epoch": 0.99, - "learning_rate": 1.5629563824641938e-06, - "loss": 0.7173, - "step": 38670 - }, - { - "epoch": 0.99, - "learning_rate": 1.5629335129891286e-06, - "loss": 0.7891, - "step": 38671 - }, - { - "epoch": 0.99, - "learning_rate": 1.562910643083051e-06, - "loss": 0.8398, - "step": 38672 - }, - { - "epoch": 0.99, - "learning_rate": 1.5628877727459785e-06, - "loss": 1.1045, - "step": 38673 - }, - { - "epoch": 0.99, - "learning_rate": 1.562864901977929e-06, - "loss": 0.7649, - "step": 38674 - }, - { - "epoch": 0.99, - "learning_rate": 1.5628420307789195e-06, - "loss": 0.9004, - "step": 38675 - }, - { - "epoch": 0.99, - "learning_rate": 1.5628191591489681e-06, - "loss": 0.5166, - "step": 38676 - }, - { - "epoch": 0.99, - "learning_rate": 1.5627962870880915e-06, - "loss": 0.8125, - "step": 38677 - }, - { - "epoch": 0.99, - "learning_rate": 1.5627734145963078e-06, - "loss": 0.7144, - "step": 38678 - }, - { - "epoch": 0.99, - "learning_rate": 1.5627505416736347e-06, - "loss": 1.0791, - "step": 38679 - }, - { - "epoch": 0.99, - "learning_rate": 1.562727668320089e-06, - "loss": 0.79, - "step": 38680 - }, - { - "epoch": 0.99, - "learning_rate": 1.5627047945356887e-06, - "loss": 0.7173, - "step": 38681 - }, - { - "epoch": 0.99, - "learning_rate": 1.5626819203204513e-06, - "loss": 0.627, - "step": 38682 - }, - { - "epoch": 0.99, - "learning_rate": 1.562659045674394e-06, - "loss": 0.7139, - "step": 38683 - }, - { - "epoch": 0.99, - "learning_rate": 1.5626361705975345e-06, - "loss": 0.6406, - "step": 38684 - }, - { - "epoch": 0.99, - "learning_rate": 1.5626132950898907e-06, - "loss": 0.7495, - "step": 38685 - }, - { - "epoch": 0.99, - "learning_rate": 1.5625904191514797e-06, - "loss": 0.6714, - "step": 38686 - }, - { - "epoch": 0.99, - "learning_rate": 1.562567542782319e-06, - "loss": 0.8164, - "step": 38687 - }, - { - "epoch": 0.99, - "learning_rate": 1.5625446659824265e-06, - "loss": 0.7549, - "step": 38688 - }, - { - "epoch": 0.99, - "learning_rate": 1.5625217887518187e-06, - "loss": 0.4487, - "step": 38689 - }, - { - "epoch": 0.99, - "learning_rate": 1.5624989110905142e-06, - "loss": 0.8867, - "step": 38690 - }, - { - "epoch": 0.99, - "learning_rate": 1.5624760329985302e-06, - "loss": 0.7119, - "step": 38691 - }, - { - "epoch": 0.99, - "learning_rate": 1.5624531544758843e-06, - "loss": 1.0234, - "step": 38692 - }, - { - "epoch": 0.99, - "learning_rate": 1.5624302755225938e-06, - "loss": 0.8887, - "step": 38693 - }, - { - "epoch": 0.99, - "learning_rate": 1.562407396138676e-06, - "loss": 0.9521, - "step": 38694 - }, - { - "epoch": 0.99, - "learning_rate": 1.562384516324149e-06, - "loss": 0.8428, - "step": 38695 - }, - { - "epoch": 0.99, - "learning_rate": 1.5623616360790301e-06, - "loss": 0.7524, - "step": 38696 - }, - { - "epoch": 0.99, - "learning_rate": 1.5623387554033367e-06, - "loss": 1.0088, - "step": 38697 - }, - { - "epoch": 0.99, - "learning_rate": 1.5623158742970863e-06, - "loss": 0.9414, - "step": 38698 - }, - { - "epoch": 0.99, - "learning_rate": 1.5622929927602964e-06, - "loss": 0.7744, - "step": 38699 - }, - { - "epoch": 0.99, - "learning_rate": 1.5622701107929847e-06, - "loss": 0.7305, - "step": 38700 - }, - { - "epoch": 0.99, - "learning_rate": 1.5622472283951689e-06, - "loss": 0.7524, - "step": 38701 - }, - { - "epoch": 0.99, - "learning_rate": 1.5622243455668657e-06, - "loss": 0.8027, - "step": 38702 - }, - { - "epoch": 0.99, - "learning_rate": 1.5622014623080937e-06, - "loss": 0.8994, - "step": 38703 - }, - { - "epoch": 0.99, - "learning_rate": 1.5621785786188694e-06, - "loss": 0.7646, - "step": 38704 - }, - { - "epoch": 0.99, - "learning_rate": 1.5621556944992112e-06, - "loss": 0.4609, - "step": 38705 - }, - { - "epoch": 0.99, - "learning_rate": 1.5621328099491361e-06, - "loss": 0.6516, - "step": 38706 - }, - { - "epoch": 0.99, - "learning_rate": 1.562109924968662e-06, - "loss": 0.6338, - "step": 38707 - }, - { - "epoch": 0.99, - "learning_rate": 1.5620870395578059e-06, - "loss": 0.8477, - "step": 38708 - }, - { - "epoch": 0.99, - "learning_rate": 1.5620641537165856e-06, - "loss": 0.8535, - "step": 38709 - }, - { - "epoch": 0.99, - "learning_rate": 1.5620412674450185e-06, - "loss": 0.8491, - "step": 38710 - }, - { - "epoch": 0.99, - "learning_rate": 1.5620183807431223e-06, - "loss": 0.9043, - "step": 38711 - }, - { - "epoch": 0.99, - "learning_rate": 1.5619954936109148e-06, - "loss": 0.8306, - "step": 38712 - }, - { - "epoch": 0.99, - "learning_rate": 1.561972606048413e-06, - "loss": 0.7793, - "step": 38713 - }, - { - "epoch": 0.99, - "learning_rate": 1.5619497180556346e-06, - "loss": 0.8682, - "step": 38714 - }, - { - "epoch": 0.99, - "learning_rate": 1.5619268296325969e-06, - "loss": 0.8091, - "step": 38715 - }, - { - "epoch": 0.99, - "learning_rate": 1.5619039407793179e-06, - "loss": 0.8018, - "step": 38716 - }, - { - "epoch": 0.99, - "learning_rate": 1.561881051495815e-06, - "loss": 0.8613, - "step": 38717 - }, - { - "epoch": 0.99, - "learning_rate": 1.5618581617821053e-06, - "loss": 0.7745, - "step": 38718 - }, - { - "epoch": 0.99, - "learning_rate": 1.5618352716382069e-06, - "loss": 0.668, - "step": 38719 - }, - { - "epoch": 0.99, - "learning_rate": 1.561812381064137e-06, - "loss": 0.6682, - "step": 38720 - }, - { - "epoch": 0.99, - "learning_rate": 1.5617894900599134e-06, - "loss": 0.7769, - "step": 38721 - }, - { - "epoch": 0.99, - "learning_rate": 1.561766598625553e-06, - "loss": 1.0215, - "step": 38722 - }, - { - "epoch": 0.99, - "learning_rate": 1.5617437067610739e-06, - "loss": 0.8613, - "step": 38723 - }, - { - "epoch": 0.99, - "learning_rate": 1.5617208144664936e-06, - "loss": 0.6887, - "step": 38724 - }, - { - "epoch": 0.99, - "learning_rate": 1.5616979217418295e-06, - "loss": 0.8271, - "step": 38725 - }, - { - "epoch": 0.99, - "learning_rate": 1.561675028587099e-06, - "loss": 0.73, - "step": 38726 - }, - { - "epoch": 0.99, - "learning_rate": 1.56165213500232e-06, - "loss": 0.7979, - "step": 38727 - }, - { - "epoch": 0.99, - "learning_rate": 1.5616292409875093e-06, - "loss": 0.8418, - "step": 38728 - }, - { - "epoch": 0.99, - "learning_rate": 1.5616063465426855e-06, - "loss": 1.0039, - "step": 38729 - }, - { - "epoch": 0.99, - "learning_rate": 1.561583451667865e-06, - "loss": 0.8164, - "step": 38730 - }, - { - "epoch": 0.99, - "learning_rate": 1.5615605563630663e-06, - "loss": 0.731, - "step": 38731 - }, - { - "epoch": 0.99, - "learning_rate": 1.5615376606283064e-06, - "loss": 0.9707, - "step": 38732 - }, - { - "epoch": 0.99, - "learning_rate": 1.561514764463603e-06, - "loss": 0.6948, - "step": 38733 - }, - { - "epoch": 0.99, - "learning_rate": 1.5614918678689733e-06, - "loss": 0.9556, - "step": 38734 - }, - { - "epoch": 0.99, - "learning_rate": 1.561468970844435e-06, - "loss": 0.9126, - "step": 38735 - }, - { - "epoch": 0.99, - "learning_rate": 1.561446073390006e-06, - "loss": 0.9297, - "step": 38736 - }, - { - "epoch": 0.99, - "learning_rate": 1.5614231755057038e-06, - "loss": 0.5698, - "step": 38737 - }, - { - "epoch": 0.99, - "learning_rate": 1.5614002771915451e-06, - "loss": 0.7041, - "step": 38738 - }, - { - "epoch": 0.99, - "learning_rate": 1.5613773784475484e-06, - "loss": 0.8086, - "step": 38739 - }, - { - "epoch": 0.99, - "learning_rate": 1.5613544792737305e-06, - "loss": 0.8301, - "step": 38740 - }, - { - "epoch": 0.99, - "learning_rate": 1.5613315796701099e-06, - "loss": 0.7183, - "step": 38741 - }, - { - "epoch": 0.99, - "learning_rate": 1.5613086796367033e-06, - "loss": 0.9199, - "step": 38742 - }, - { - "epoch": 0.99, - "learning_rate": 1.561285779173528e-06, - "loss": 0.8545, - "step": 38743 - }, - { - "epoch": 0.99, - "learning_rate": 1.5612628782806025e-06, - "loss": 0.7959, - "step": 38744 - }, - { - "epoch": 0.99, - "learning_rate": 1.5612399769579434e-06, - "loss": 0.623, - "step": 38745 - }, - { - "epoch": 0.99, - "learning_rate": 1.5612170752055694e-06, - "loss": 0.8213, - "step": 38746 - }, - { - "epoch": 0.99, - "learning_rate": 1.5611941730234966e-06, - "loss": 0.6658, - "step": 38747 - }, - { - "epoch": 0.99, - "learning_rate": 1.5611712704117435e-06, - "loss": 0.6792, - "step": 38748 - }, - { - "epoch": 0.99, - "learning_rate": 1.5611483673703272e-06, - "loss": 0.6658, - "step": 38749 - }, - { - "epoch": 0.99, - "learning_rate": 1.5611254638992653e-06, - "loss": 0.9492, - "step": 38750 - }, - { - "epoch": 0.99, - "learning_rate": 1.5611025599985759e-06, - "loss": 1.0156, - "step": 38751 - }, - { - "epoch": 0.99, - "learning_rate": 1.5610796556682755e-06, - "loss": 0.7266, - "step": 38752 - }, - { - "epoch": 0.99, - "learning_rate": 1.5610567509083827e-06, - "loss": 0.8203, - "step": 38753 - }, - { - "epoch": 0.99, - "learning_rate": 1.5610338457189142e-06, - "loss": 0.7207, - "step": 38754 - }, - { - "epoch": 0.99, - "learning_rate": 1.561010940099888e-06, - "loss": 0.5134, - "step": 38755 - }, - { - "epoch": 0.99, - "learning_rate": 1.5609880340513215e-06, - "loss": 0.8379, - "step": 38756 - }, - { - "epoch": 0.99, - "learning_rate": 1.5609651275732323e-06, - "loss": 0.7632, - "step": 38757 - }, - { - "epoch": 0.99, - "learning_rate": 1.5609422206656379e-06, - "loss": 0.833, - "step": 38758 - }, - { - "epoch": 0.99, - "learning_rate": 1.5609193133285558e-06, - "loss": 0.793, - "step": 38759 - }, - { - "epoch": 0.99, - "learning_rate": 1.5608964055620035e-06, - "loss": 0.833, - "step": 38760 - }, - { - "epoch": 0.99, - "learning_rate": 1.560873497365999e-06, - "loss": 0.957, - "step": 38761 - }, - { - "epoch": 0.99, - "learning_rate": 1.560850588740559e-06, - "loss": 0.9746, - "step": 38762 - }, - { - "epoch": 0.99, - "learning_rate": 1.5608276796857016e-06, - "loss": 0.552, - "step": 38763 - }, - { - "epoch": 0.99, - "learning_rate": 1.5608047702014444e-06, - "loss": 0.6558, - "step": 38764 - }, - { - "epoch": 0.99, - "learning_rate": 1.5607818602878044e-06, - "loss": 0.6611, - "step": 38765 - }, - { - "epoch": 0.99, - "learning_rate": 1.5607589499448e-06, - "loss": 0.9717, - "step": 38766 - }, - { - "epoch": 0.99, - "learning_rate": 1.560736039172448e-06, - "loss": 0.6641, - "step": 38767 - }, - { - "epoch": 0.99, - "learning_rate": 1.560713127970766e-06, - "loss": 0.9736, - "step": 38768 - }, - { - "epoch": 0.99, - "learning_rate": 1.5606902163397723e-06, - "loss": 0.8633, - "step": 38769 - }, - { - "epoch": 0.99, - "learning_rate": 1.5606673042794833e-06, - "loss": 0.4866, - "step": 38770 - }, - { - "epoch": 0.99, - "learning_rate": 1.5606443917899176e-06, - "loss": 0.8662, - "step": 38771 - }, - { - "epoch": 0.99, - "learning_rate": 1.5606214788710918e-06, - "loss": 0.8223, - "step": 38772 - }, - { - "epoch": 0.99, - "learning_rate": 1.5605985655230243e-06, - "loss": 0.9023, - "step": 38773 - }, - { - "epoch": 0.99, - "learning_rate": 1.560575651745732e-06, - "loss": 0.8623, - "step": 38774 - }, - { - "epoch": 0.99, - "learning_rate": 1.560552737539233e-06, - "loss": 0.7778, - "step": 38775 - }, - { - "epoch": 0.99, - "learning_rate": 1.5605298229035443e-06, - "loss": 0.7236, - "step": 38776 - }, - { - "epoch": 0.99, - "learning_rate": 1.5605069078386838e-06, - "loss": 0.812, - "step": 38777 - }, - { - "epoch": 0.99, - "learning_rate": 1.5604839923446686e-06, - "loss": 0.8145, - "step": 38778 - }, - { - "epoch": 0.99, - "learning_rate": 1.5604610764215172e-06, - "loss": 0.7432, - "step": 38779 - }, - { - "epoch": 0.99, - "learning_rate": 1.560438160069246e-06, - "loss": 0.7959, - "step": 38780 - }, - { - "epoch": 0.99, - "learning_rate": 1.5604152432878733e-06, - "loss": 0.9082, - "step": 38781 - }, - { - "epoch": 0.99, - "learning_rate": 1.5603923260774163e-06, - "loss": 0.9492, - "step": 38782 - }, - { - "epoch": 0.99, - "learning_rate": 1.5603694084378926e-06, - "loss": 0.5933, - "step": 38783 - }, - { - "epoch": 0.99, - "learning_rate": 1.56034649036932e-06, - "loss": 1.0645, - "step": 38784 - }, - { - "epoch": 0.99, - "learning_rate": 1.5603235718717159e-06, - "loss": 0.7393, - "step": 38785 - }, - { - "epoch": 0.99, - "learning_rate": 1.5603006529450977e-06, - "loss": 0.623, - "step": 38786 - }, - { - "epoch": 0.99, - "learning_rate": 1.560277733589483e-06, - "loss": 0.8682, - "step": 38787 - }, - { - "epoch": 0.99, - "learning_rate": 1.5602548138048897e-06, - "loss": 0.7444, - "step": 38788 - }, - { - "epoch": 0.99, - "learning_rate": 1.5602318935913345e-06, - "loss": 0.9355, - "step": 38789 - }, - { - "epoch": 0.99, - "learning_rate": 1.560208972948836e-06, - "loss": 0.9229, - "step": 38790 - }, - { - "epoch": 0.99, - "learning_rate": 1.560186051877411e-06, - "loss": 0.8081, - "step": 38791 - }, - { - "epoch": 0.99, - "learning_rate": 1.5601631303770772e-06, - "loss": 0.9082, - "step": 38792 - }, - { - "epoch": 0.99, - "learning_rate": 1.5601402084478526e-06, - "loss": 0.958, - "step": 38793 - }, - { - "epoch": 0.99, - "learning_rate": 1.560117286089754e-06, - "loss": 0.6753, - "step": 38794 - }, - { - "epoch": 0.99, - "learning_rate": 1.5600943633027995e-06, - "loss": 0.7676, - "step": 38795 - }, - { - "epoch": 0.99, - "learning_rate": 1.560071440087007e-06, - "loss": 1.1025, - "step": 38796 - }, - { - "epoch": 0.99, - "learning_rate": 1.560048516442393e-06, - "loss": 0.8906, - "step": 38797 - }, - { - "epoch": 0.99, - "learning_rate": 1.5600255923689756e-06, - "loss": 0.6279, - "step": 38798 - }, - { - "epoch": 0.99, - "learning_rate": 1.5600026678667723e-06, - "loss": 0.8643, - "step": 38799 - }, - { - "epoch": 0.99, - "learning_rate": 1.559979742935801e-06, - "loss": 0.6885, - "step": 38800 - }, - { - "epoch": 0.99, - "learning_rate": 1.5599568175760788e-06, - "loss": 0.9438, - "step": 38801 - }, - { - "epoch": 0.99, - "learning_rate": 1.5599338917876234e-06, - "loss": 0.958, - "step": 38802 - }, - { - "epoch": 0.99, - "learning_rate": 1.5599109655704523e-06, - "loss": 0.96, - "step": 38803 - }, - { - "epoch": 0.99, - "learning_rate": 1.5598880389245834e-06, - "loss": 0.7954, - "step": 38804 - }, - { - "epoch": 0.99, - "learning_rate": 1.5598651118500338e-06, - "loss": 0.7969, - "step": 38805 - }, - { - "epoch": 0.99, - "learning_rate": 1.5598421843468212e-06, - "loss": 0.7417, - "step": 38806 - }, - { - "epoch": 0.99, - "learning_rate": 1.559819256414963e-06, - "loss": 0.8574, - "step": 38807 - }, - { - "epoch": 0.99, - "learning_rate": 1.5597963280544772e-06, - "loss": 0.877, - "step": 38808 - }, - { - "epoch": 0.99, - "learning_rate": 1.559773399265381e-06, - "loss": 0.8281, - "step": 38809 - }, - { - "epoch": 0.99, - "learning_rate": 1.559750470047692e-06, - "loss": 0.9531, - "step": 38810 - }, - { - "epoch": 0.99, - "learning_rate": 1.559727540401428e-06, - "loss": 0.9082, - "step": 38811 - }, - { - "epoch": 0.99, - "learning_rate": 1.5597046103266064e-06, - "loss": 0.8955, - "step": 38812 - }, - { - "epoch": 0.99, - "learning_rate": 1.5596816798232447e-06, - "loss": 0.6003, - "step": 38813 - }, - { - "epoch": 0.99, - "learning_rate": 1.5596587488913602e-06, - "loss": 0.9033, - "step": 38814 - }, - { - "epoch": 0.99, - "learning_rate": 1.5596358175309707e-06, - "loss": 0.8633, - "step": 38815 - }, - { - "epoch": 0.99, - "learning_rate": 1.5596128857420944e-06, - "loss": 0.6421, - "step": 38816 - }, - { - "epoch": 0.99, - "learning_rate": 1.5595899535247474e-06, - "loss": 0.8096, - "step": 38817 - }, - { - "epoch": 0.99, - "learning_rate": 1.5595670208789486e-06, - "loss": 1.0049, - "step": 38818 - }, - { - "epoch": 0.99, - "learning_rate": 1.5595440878047148e-06, - "loss": 0.8682, - "step": 38819 - }, - { - "epoch": 0.99, - "learning_rate": 1.5595211543020642e-06, - "loss": 0.9082, - "step": 38820 - }, - { - "epoch": 1.0, - "learning_rate": 1.559498220371014e-06, - "loss": 1.0254, - "step": 38821 - }, - { - "epoch": 1.0, - "learning_rate": 1.5594752860115813e-06, - "loss": 0.8184, - "step": 38822 - }, - { - "epoch": 1.0, - "learning_rate": 1.559452351223784e-06, - "loss": 0.5039, - "step": 38823 - }, - { - "epoch": 1.0, - "learning_rate": 1.55942941600764e-06, - "loss": 0.7378, - "step": 38824 - }, - { - "epoch": 1.0, - "learning_rate": 1.5594064803631667e-06, - "loss": 0.9668, - "step": 38825 - }, - { - "epoch": 1.0, - "learning_rate": 1.5593835442903816e-06, - "loss": 0.6909, - "step": 38826 - }, - { - "epoch": 1.0, - "learning_rate": 1.5593606077893021e-06, - "loss": 0.9844, - "step": 38827 - }, - { - "epoch": 1.0, - "learning_rate": 1.559337670859946e-06, - "loss": 0.9746, - "step": 38828 - }, - { - "epoch": 1.0, - "learning_rate": 1.5593147335023308e-06, - "loss": 0.7148, - "step": 38829 - }, - { - "epoch": 1.0, - "learning_rate": 1.5592917957164739e-06, - "loss": 0.8311, - "step": 38830 - }, - { - "epoch": 1.0, - "learning_rate": 1.5592688575023933e-06, - "loss": 0.9814, - "step": 38831 - }, - { - "epoch": 1.0, - "learning_rate": 1.559245918860106e-06, - "loss": 1.0566, - "step": 38832 - }, - { - "epoch": 1.0, - "learning_rate": 1.55922297978963e-06, - "loss": 0.9863, - "step": 38833 - }, - { - "epoch": 1.0, - "learning_rate": 1.5592000402909823e-06, - "loss": 0.793, - "step": 38834 - }, - { - "epoch": 1.0, - "learning_rate": 1.559177100364181e-06, - "loss": 0.7163, - "step": 38835 - }, - { - "epoch": 1.0, - "learning_rate": 1.5591541600092439e-06, - "loss": 0.5093, - "step": 38836 - }, - { - "epoch": 1.0, - "learning_rate": 1.5591312192261875e-06, - "loss": 0.8193, - "step": 38837 - }, - { - "epoch": 1.0, - "learning_rate": 1.5591082780150306e-06, - "loss": 0.7988, - "step": 38838 - }, - { - "epoch": 1.0, - "learning_rate": 1.55908533637579e-06, - "loss": 1.0645, - "step": 38839 - }, - { - "epoch": 1.0, - "learning_rate": 1.5590623943084832e-06, - "loss": 0.9541, - "step": 38840 - }, - { - "epoch": 1.0, - "learning_rate": 1.5590394518131284e-06, - "loss": 0.8643, - "step": 38841 - }, - { - "epoch": 1.0, - "learning_rate": 1.5590165088897427e-06, - "loss": 0.8574, - "step": 38842 - }, - { - "epoch": 1.0, - "learning_rate": 1.5589935655383437e-06, - "loss": 0.8662, - "step": 38843 - }, - { - "epoch": 1.0, - "learning_rate": 1.5589706217589492e-06, - "loss": 0.75, - "step": 38844 - }, - { - "epoch": 1.0, - "learning_rate": 1.5589476775515765e-06, - "loss": 0.7969, - "step": 38845 - }, - { - "epoch": 1.0, - "learning_rate": 1.558924732916243e-06, - "loss": 0.8398, - "step": 38846 - }, - { - "epoch": 1.0, - "learning_rate": 1.5589017878529669e-06, - "loss": 0.7419, - "step": 38847 - }, - { - "epoch": 1.0, - "learning_rate": 1.5588788423617652e-06, - "loss": 0.54, - "step": 38848 - }, - { - "epoch": 1.0, - "learning_rate": 1.5588558964426557e-06, - "loss": 0.8096, - "step": 38849 - }, - { - "epoch": 1.0, - "learning_rate": 1.5588329500956562e-06, - "loss": 0.7969, - "step": 38850 - }, - { - "epoch": 1.0, - "learning_rate": 1.5588100033207834e-06, - "loss": 0.9111, - "step": 38851 - }, - { - "epoch": 1.0, - "learning_rate": 1.5587870561180561e-06, - "loss": 0.8096, - "step": 38852 - }, - { - "epoch": 1.0, - "learning_rate": 1.558764108487491e-06, - "loss": 0.6445, - "step": 38853 - }, - { - "epoch": 1.0, - "learning_rate": 1.5587411604291056e-06, - "loss": 0.8232, - "step": 38854 - }, - { - "epoch": 1.0, - "learning_rate": 1.5587182119429182e-06, - "loss": 0.7705, - "step": 38855 - }, - { - "epoch": 1.0, - "learning_rate": 1.5586952630289457e-06, - "loss": 0.575, - "step": 38856 - }, - { - "epoch": 1.0, - "learning_rate": 1.5586723136872061e-06, - "loss": 0.8975, - "step": 38857 - }, - { - "epoch": 1.0, - "learning_rate": 1.5586493639177168e-06, - "loss": 0.6479, - "step": 38858 - }, - { - "epoch": 1.0, - "learning_rate": 1.5586264137204953e-06, - "loss": 0.8877, - "step": 38859 - }, - { - "epoch": 1.0, - "learning_rate": 1.5586034630955592e-06, - "loss": 0.9238, - "step": 38860 - }, - { - "epoch": 1.0, - "learning_rate": 1.5585805120429266e-06, - "loss": 0.9971, - "step": 38861 - }, - { - "epoch": 1.0, - "learning_rate": 1.558557560562614e-06, - "loss": 0.7666, - "step": 38862 - }, - { - "epoch": 1.0, - "learning_rate": 1.5585346086546397e-06, - "loss": 0.7397, - "step": 38863 - }, - { - "epoch": 1.0, - "learning_rate": 1.5585116563190211e-06, - "loss": 0.9297, - "step": 38864 - }, - { - "epoch": 1.0, - "learning_rate": 1.558488703555776e-06, - "loss": 0.7681, - "step": 38865 - }, - { - "epoch": 1.0, - "learning_rate": 1.5584657503649217e-06, - "loss": 0.8994, - "step": 38866 - }, - { - "epoch": 1.0, - "learning_rate": 1.5584427967464757e-06, - "loss": 0.9434, - "step": 38867 - }, - { - "epoch": 1.0, - "learning_rate": 1.5584198427004558e-06, - "loss": 0.8135, - "step": 38868 - }, - { - "epoch": 1.0, - "learning_rate": 1.5583968882268796e-06, - "loss": 0.9639, - "step": 38869 - }, - { - "epoch": 1.0, - "learning_rate": 1.5583739333257646e-06, - "loss": 0.8359, - "step": 38870 - }, - { - "epoch": 1.0, - "learning_rate": 1.5583509779971282e-06, - "loss": 0.9531, - "step": 38871 - }, - { - "epoch": 1.0, - "learning_rate": 1.558328022240988e-06, - "loss": 0.7246, - "step": 38872 - }, - { - "epoch": 1.0, - "learning_rate": 1.558305066057362e-06, - "loss": 0.9238, - "step": 38873 - }, - { - "epoch": 1.0, - "learning_rate": 1.5582821094462673e-06, - "loss": 0.6797, - "step": 38874 - }, - { - "epoch": 1.0, - "learning_rate": 1.558259152407722e-06, - "loss": 0.731, - "step": 38875 - }, - { - "epoch": 1.0, - "learning_rate": 1.558236194941743e-06, - "loss": 0.8545, - "step": 38876 - }, - { - "epoch": 1.0, - "learning_rate": 1.5582132370483482e-06, - "loss": 0.916, - "step": 38877 - }, - { - "epoch": 1.0, - "learning_rate": 1.5581902787275554e-06, - "loss": 0.7898, - "step": 38878 - }, - { - "epoch": 1.0, - "learning_rate": 1.5581673199793817e-06, - "loss": 0.8613, - "step": 38879 - }, - { - "epoch": 1.0, - "learning_rate": 1.5581443608038454e-06, - "loss": 0.71, - "step": 38880 - }, - { - "epoch": 1.0, - "learning_rate": 1.5581214012009634e-06, - "loss": 0.7925, - "step": 38881 - }, - { - "epoch": 1.0, - "learning_rate": 1.5580984411707535e-06, - "loss": 0.7427, - "step": 38882 - }, - { - "epoch": 1.0, - "learning_rate": 1.5580754807132328e-06, - "loss": 0.9673, - "step": 38883 - }, - { - "epoch": 1.0, - "learning_rate": 1.5580525198284198e-06, - "loss": 1.0625, - "step": 38884 - }, - { - "epoch": 1.0, - "learning_rate": 1.5580295585163318e-06, - "loss": 0.8447, - "step": 38885 - }, - { - "epoch": 1.0, - "learning_rate": 1.5580065967769862e-06, - "loss": 0.7485, - "step": 38886 - }, - { - "epoch": 1.0, - "learning_rate": 1.5579836346104002e-06, - "loss": 0.8237, - "step": 38887 - }, - { - "epoch": 1.0, - "learning_rate": 1.5579606720165921e-06, - "loss": 0.7344, - "step": 38888 - }, - { - "epoch": 1.0, - "learning_rate": 1.5579377089955792e-06, - "loss": 0.9062, - "step": 38889 - }, - { - "epoch": 1.0, - "learning_rate": 1.5579147455473791e-06, - "loss": 0.5581, - "step": 38890 - }, - { - "epoch": 1.0, - "learning_rate": 1.557891781672009e-06, - "loss": 0.9746, - "step": 38891 - }, - { - "epoch": 1.0, - "learning_rate": 1.5578688173694872e-06, - "loss": 0.9331, - "step": 38892 - }, - { - "epoch": 1.0, - "learning_rate": 1.5578458526398305e-06, - "loss": 0.6719, - "step": 38893 - }, - { - "epoch": 1.0, - "learning_rate": 1.5578228874830572e-06, - "loss": 0.8477, - "step": 38894 - }, - { - "epoch": 1.0, - "learning_rate": 1.5577999218991847e-06, - "loss": 0.7295, - "step": 38895 - }, - { - "epoch": 1.0, - "learning_rate": 1.5577769558882302e-06, - "loss": 1.0117, - "step": 38896 - }, - { - "epoch": 1.0, - "learning_rate": 1.5577539894502114e-06, - "loss": 0.6494, - "step": 38897 - }, - { - "epoch": 1.0, - "learning_rate": 1.557731022585146e-06, - "loss": 0.7686, - "step": 38898 - }, - { - "epoch": 1.0, - "learning_rate": 1.5577080552930516e-06, - "loss": 0.5503, - "step": 38899 - }, - { - "epoch": 1.0, - "learning_rate": 1.5576850875739465e-06, - "loss": 0.7549, - "step": 38900 - }, - { - "epoch": 1.0, - "learning_rate": 1.5576621194278468e-06, - "loss": 0.6912, - "step": 38901 - }, - { - "epoch": 1.0, - "learning_rate": 1.5576391508547713e-06, - "loss": 0.626, - "step": 38902 - }, - { - "epoch": 1.0, - "learning_rate": 1.5576161818547366e-06, - "loss": 0.9219, - "step": 38903 - }, - { - "epoch": 1.0, - "learning_rate": 1.5575932124277612e-06, - "loss": 0.7236, - "step": 38904 - }, - { - "epoch": 1.0, - "learning_rate": 1.5575702425738625e-06, - "loss": 1.0332, - "step": 38905 - }, - { - "epoch": 1.0, - "learning_rate": 1.5575472722930576e-06, - "loss": 0.5837, - "step": 38906 - }, - { - "epoch": 1.0, - "learning_rate": 1.5575243015853644e-06, - "loss": 0.7754, - "step": 38907 - }, - { - "epoch": 1.0, - "learning_rate": 1.5575013304508008e-06, - "loss": 0.8252, - "step": 38908 - }, - { - "epoch": 1.0, - "learning_rate": 1.5574783588893837e-06, - "loss": 0.9248, - "step": 38909 - }, - { - "epoch": 1.0, - "learning_rate": 1.557455386901131e-06, - "loss": 0.8271, - "step": 38910 - }, - { - "epoch": 1.0, - "learning_rate": 1.5574324144860605e-06, - "loss": 0.9668, - "step": 38911 - }, - { - "epoch": 1.0, - "learning_rate": 1.55740944164419e-06, - "loss": 0.8867, - "step": 38912 - }, - { - "epoch": 1.0, - "learning_rate": 1.557386468375536e-06, - "loss": 1.0098, - "step": 38913 - }, - { - "epoch": 1.0, - "learning_rate": 1.5573634946801173e-06, - "loss": 0.6523, - "step": 38914 - }, - { - "epoch": 1.0, - "learning_rate": 1.557340520557951e-06, - "loss": 1.0098, - "step": 38915 - }, - { - "epoch": 1.0, - "learning_rate": 1.5573175460090542e-06, - "loss": 0.9346, - "step": 38916 - }, - { - "epoch": 1.0, - "learning_rate": 1.5572945710334455e-06, - "loss": 0.8887, - "step": 38917 - }, - { - "epoch": 1.0, - "learning_rate": 1.5572715956311417e-06, - "loss": 0.8252, - "step": 38918 - }, - { - "epoch": 1.0, - "learning_rate": 1.5572486198021607e-06, - "loss": 0.6855, - "step": 38919 - }, - { - "epoch": 1.0, - "learning_rate": 1.5572256435465203e-06, - "loss": 0.8628, - "step": 38920 - }, - { - "epoch": 1.0, - "learning_rate": 1.5572026668642377e-06, - "loss": 0.9092, - "step": 38921 - }, - { - "epoch": 1.0, - "learning_rate": 1.5571796897553306e-06, - "loss": 0.7983, - "step": 38922 - }, - { - "epoch": 1.0, - "learning_rate": 1.5571567122198167e-06, - "loss": 1.0938, - "step": 38923 - }, - { - "epoch": 1.0, - "learning_rate": 1.5571337342577132e-06, - "loss": 0.7959, - "step": 38924 - }, - { - "epoch": 1.0, - "learning_rate": 1.5571107558690387e-06, - "loss": 0.9697, - "step": 38925 - }, - { - "epoch": 1.0, - "learning_rate": 1.5570877770538096e-06, - "loss": 0.9141, - "step": 38926 - }, - { - "epoch": 1.0, - "learning_rate": 1.557064797812044e-06, - "loss": 0.8447, - "step": 38927 - }, - { - "epoch": 1.0, - "learning_rate": 1.5570418181437597e-06, - "loss": 0.8945, - "step": 38928 - }, - { - "epoch": 1.0, - "learning_rate": 1.557018838048974e-06, - "loss": 0.7354, - "step": 38929 - }, - { - "epoch": 1.0, - "learning_rate": 1.5569958575277045e-06, - "loss": 0.7402, - "step": 38930 - }, - { - "epoch": 1.0, - "learning_rate": 1.556972876579969e-06, - "loss": 0.9219, - "step": 38931 - }, - { - "epoch": 1.0, - "learning_rate": 1.5569498952057849e-06, - "loss": 0.8545, - "step": 38932 - }, - { - "epoch": 1.0, - "learning_rate": 1.55692691340517e-06, - "loss": 0.9346, - "step": 38933 - }, - { - "epoch": 1.0, - "learning_rate": 1.5569039311781417e-06, - "loss": 0.832, - "step": 38934 - }, - { - "epoch": 1.0, - "learning_rate": 1.5568809485247174e-06, - "loss": 0.7603, - "step": 38935 - }, - { - "epoch": 1.0, - "learning_rate": 1.5568579654449154e-06, - "loss": 1.0693, - "step": 38936 - }, - { - "epoch": 1.0, - "learning_rate": 1.5568349819387527e-06, - "loss": 0.9473, - "step": 38937 - }, - { - "epoch": 1.0, - "learning_rate": 1.556811998006247e-06, - "loss": 0.7842, - "step": 38938 - }, - { - "epoch": 1.0, - "learning_rate": 1.556789013647416e-06, - "loss": 0.6128, - "step": 38939 - }, - { - "epoch": 1.0, - "learning_rate": 1.5567660288622773e-06, - "loss": 0.8252, - "step": 38940 - }, - { - "epoch": 1.0, - "learning_rate": 1.5567430436508485e-06, - "loss": 0.7295, - "step": 38941 - }, - { - "epoch": 1.0, - "learning_rate": 1.556720058013147e-06, - "loss": 0.9277, - "step": 38942 - }, - { - "epoch": 1.0, - "learning_rate": 1.5566970719491903e-06, - "loss": 0.8887, - "step": 38943 - }, - { - "epoch": 1.0, - "learning_rate": 1.5566740854589967e-06, - "loss": 0.7471, - "step": 38944 - }, - { - "epoch": 1.0, - "learning_rate": 1.5566510985425834e-06, - "loss": 0.6475, - "step": 38945 - }, - { - "epoch": 1.0, - "learning_rate": 1.5566281111999678e-06, - "loss": 0.8242, - "step": 38946 - }, - { - "epoch": 1.0, - "learning_rate": 1.5566051234311674e-06, - "loss": 0.9287, - "step": 38947 - }, - { - "epoch": 1.0, - "learning_rate": 1.5565821352362004e-06, - "loss": 0.5776, - "step": 38948 - }, - { - "epoch": 1.0, - "learning_rate": 1.5565591466150837e-06, - "loss": 0.7651, - "step": 38949 - }, - { - "epoch": 1.0, - "learning_rate": 1.5565361575678355e-06, - "loss": 0.6772, - "step": 38950 - }, - { - "epoch": 1.0, - "learning_rate": 1.5565131680944731e-06, - "loss": 0.9268, - "step": 38951 - }, - { - "epoch": 1.0, - "learning_rate": 1.5564901781950143e-06, - "loss": 0.8066, - "step": 38952 - }, - { - "epoch": 1.0, - "learning_rate": 1.5564671878694765e-06, - "loss": 0.6235, - "step": 38953 - }, - { - "epoch": 1.0, - "learning_rate": 1.556444197117877e-06, - "loss": 0.6943, - "step": 38954 - }, - { - "epoch": 1.0, - "learning_rate": 1.556421205940234e-06, - "loss": 0.6968, - "step": 38955 - }, - { - "epoch": 1.0, - "learning_rate": 1.556398214336565e-06, - "loss": 0.7529, - "step": 38956 - }, - { - "epoch": 1.0, - "learning_rate": 1.5563752223068876e-06, - "loss": 0.6217, - "step": 38957 - }, - { - "epoch": 1.0, - "learning_rate": 1.5563522298512188e-06, - "loss": 0.845, - "step": 38958 - }, - { - "epoch": 1.0, - "learning_rate": 1.556329236969577e-06, - "loss": 0.8364, - "step": 38959 - }, - { - "epoch": 1.0, - "learning_rate": 1.5563062436619797e-06, - "loss": 0.9424, - "step": 38960 - }, - { - "epoch": 1.0, - "learning_rate": 1.5562832499284438e-06, - "loss": 0.707, - "step": 38961 - }, - { - "epoch": 1.0, - "learning_rate": 1.5562602557689877e-06, - "loss": 0.7671, - "step": 38962 - }, - { - "epoch": 1.0, - "learning_rate": 1.5562372611836285e-06, - "loss": 0.6191, - "step": 38963 - }, - { - "epoch": 1.0, - "learning_rate": 1.5562142661723842e-06, - "loss": 0.9873, - "step": 38964 - }, - { - "epoch": 1.0, - "learning_rate": 1.5561912707352722e-06, - "loss": 0.4355, - "step": 38965 - }, - { - "epoch": 1.0, - "learning_rate": 1.5561682748723102e-06, - "loss": 0.958, - "step": 38966 - }, - { - "epoch": 1.0, - "learning_rate": 1.5561452785835154e-06, - "loss": 0.8555, - "step": 38967 - }, - { - "epoch": 1.0, - "learning_rate": 1.5561222818689057e-06, - "loss": 0.5605, - "step": 38968 - }, - { - "epoch": 1.0, - "learning_rate": 1.5560992847284991e-06, - "loss": 1.0469, - "step": 38969 - }, - { - "epoch": 1.0, - "learning_rate": 1.5560762871623128e-06, - "loss": 0.8032, - "step": 38970 - }, - { - "epoch": 1.0, - "learning_rate": 1.5560532891703645e-06, - "loss": 0.6294, - "step": 38971 - }, - { - "epoch": 1.0, - "learning_rate": 1.5560302907526713e-06, - "loss": 0.7207, - "step": 38972 - }, - { - "epoch": 1.0, - "learning_rate": 1.5560072919092514e-06, - "loss": 0.8174, - "step": 38973 - }, - { - "epoch": 1.0, - "learning_rate": 1.5559842926401227e-06, - "loss": 0.7979, - "step": 38974 - }, - { - "epoch": 1.0, - "learning_rate": 1.5559612929453023e-06, - "loss": 0.7676, - "step": 38975 - }, - { - "epoch": 1.0, - "learning_rate": 1.5559382928248076e-06, - "loss": 0.8223, - "step": 38976 - }, - { - "epoch": 1.0, - "learning_rate": 1.5559152922786569e-06, - "loss": 0.915, - "step": 38977 - }, - { - "epoch": 1.0, - "learning_rate": 1.555892291306867e-06, - "loss": 0.8789, - "step": 38978 - }, - { - "epoch": 1.0, - "learning_rate": 1.5558692899094562e-06, - "loss": 1.0479, - "step": 38979 - }, - { - "epoch": 1.0, - "learning_rate": 1.5558462880864418e-06, - "loss": 0.6592, - "step": 38980 - }, - { - "epoch": 1.0, - "learning_rate": 1.5558232858378414e-06, - "loss": 0.7261, - "step": 38981 - }, - { - "epoch": 1.0, - "learning_rate": 1.5558002831636725e-06, - "loss": 0.7463, - "step": 38982 - }, - { - "epoch": 1.0, - "learning_rate": 1.5557772800639533e-06, - "loss": 0.7305, - "step": 38983 - }, - { - "epoch": 1.0, - "learning_rate": 1.5557542765387006e-06, - "loss": 0.8403, - "step": 38984 - }, - { - "epoch": 1.0, - "learning_rate": 1.5557312725879327e-06, - "loss": 0.6982, - "step": 38985 - }, - { - "epoch": 1.0, - "learning_rate": 1.5557082682116667e-06, - "loss": 0.8213, - "step": 38986 - }, - { - "epoch": 1.0, - "learning_rate": 1.5556852634099205e-06, - "loss": 0.8779, - "step": 38987 - }, - { - "epoch": 1.0, - "learning_rate": 1.5556622581827117e-06, - "loss": 0.9658, - "step": 38988 - }, - { - "epoch": 1.0, - "learning_rate": 1.5556392525300578e-06, - "loss": 0.7812, - "step": 38989 - }, - { - "epoch": 1.0, - "learning_rate": 1.5556162464519766e-06, - "loss": 1.0293, - "step": 38990 - }, - { - "epoch": 1.0, - "learning_rate": 1.5555932399484854e-06, - "loss": 0.8198, - "step": 38991 - }, - { - "epoch": 1.0, - "learning_rate": 1.5555702330196021e-06, - "loss": 0.8994, - "step": 38992 - }, - { - "epoch": 1.0, - "learning_rate": 1.5555472256653445e-06, - "loss": 0.9023, - "step": 38993 - }, - { - "epoch": 1.0, - "learning_rate": 1.5555242178857295e-06, - "loss": 0.9492, - "step": 38994 - }, - { - "epoch": 1.0, - "learning_rate": 1.5555012096807754e-06, - "loss": 0.9395, - "step": 38995 - }, - { - "epoch": 1.0, - "learning_rate": 1.5554782010504992e-06, - "loss": 0.6084, - "step": 38996 - }, - { - "epoch": 1.0, - "learning_rate": 1.5554551919949193e-06, - "loss": 0.7036, - "step": 38997 - }, - { - "epoch": 1.0, - "learning_rate": 1.5554321825140529e-06, - "loss": 0.9014, - "step": 38998 - }, - { - "epoch": 1.0, - "learning_rate": 1.5554091726079172e-06, - "loss": 0.8135, - "step": 38999 - }, - { - "epoch": 1.0, - "learning_rate": 1.5553861622765306e-06, - "loss": 0.8291, - "step": 39000 - }, - { - "epoch": 1.0, - "learning_rate": 1.5553631515199101e-06, - "loss": 1.041, - "step": 39001 - }, - { - "epoch": 1.0, - "learning_rate": 1.5553401403380738e-06, - "loss": 0.7168, - "step": 39002 - }, - { - "epoch": 1.0, - "learning_rate": 1.5553171287310392e-06, - "loss": 0.7988, - "step": 39003 - }, - { - "epoch": 1.0, - "learning_rate": 1.5552941166988234e-06, - "loss": 0.7693, - "step": 39004 - }, - { - "epoch": 1.0, - "learning_rate": 1.5552711042414446e-06, - "loss": 0.7959, - "step": 39005 - }, - { - "epoch": 1.0, - "learning_rate": 1.5552480913589205e-06, - "loss": 1.0, - "step": 39006 - }, - { - "epoch": 1.0, - "learning_rate": 1.5552250780512682e-06, - "loss": 0.7466, - "step": 39007 - }, - { - "epoch": 1.0, - "learning_rate": 1.5552020643185056e-06, - "loss": 0.8721, - "step": 39008 - }, - { - "epoch": 1.0, - "learning_rate": 1.5551790501606501e-06, - "loss": 0.877, - "step": 39009 - }, - { - "epoch": 1.0, - "learning_rate": 1.5551560355777201e-06, - "loss": 0.8867, - "step": 39010 - }, - { - "epoch": 1.0, - "learning_rate": 1.5551330205697322e-06, - "loss": 0.7402, - "step": 39011 - }, - { - "epoch": 1.0, - "learning_rate": 1.5551100051367047e-06, - "loss": 0.6943, - "step": 39012 - }, - { - "epoch": 1.0, - "learning_rate": 1.5550869892786549e-06, - "loss": 0.8711, - "step": 39013 - }, - { - "epoch": 1.0, - "learning_rate": 1.5550639729956005e-06, - "loss": 0.8037, - "step": 39014 - }, - { - "epoch": 1.0, - "learning_rate": 1.5550409562875593e-06, - "loss": 0.9434, - "step": 39015 - }, - { - "epoch": 1.0, - "learning_rate": 1.5550179391545487e-06, - "loss": 0.7852, - "step": 39016 - }, - { - "epoch": 1.0, - "learning_rate": 1.554994921596586e-06, - "loss": 0.6829, - "step": 39017 - }, - { - "epoch": 1.0, - "learning_rate": 1.5549719036136897e-06, - "loss": 0.7891, - "step": 39018 - }, - { - "epoch": 1.0, - "learning_rate": 1.5549488852058766e-06, - "loss": 0.7266, - "step": 39019 - }, - { - "epoch": 1.0, - "learning_rate": 1.554925866373165e-06, - "loss": 0.7617, - "step": 39020 - }, - { - "epoch": 1.0, - "learning_rate": 1.554902847115572e-06, - "loss": 0.709, - "step": 39021 - }, - { - "epoch": 1.0, - "learning_rate": 1.5548798274331152e-06, - "loss": 0.6033, - "step": 39022 - }, - { - "epoch": 1.0, - "learning_rate": 1.5548568073258125e-06, - "loss": 0.6326, - "step": 39023 - }, - { - "epoch": 1.0, - "learning_rate": 1.5548337867936816e-06, - "loss": 0.6895, - "step": 39024 - }, - { - "epoch": 1.0, - "learning_rate": 1.55481076583674e-06, - "loss": 0.5718, - "step": 39025 - }, - { - "epoch": 1.0, - "learning_rate": 1.5547877444550053e-06, - "loss": 0.6528, - "step": 39026 - }, - { - "epoch": 1.0, - "learning_rate": 1.554764722648495e-06, - "loss": 0.8047, - "step": 39027 - }, - { - "epoch": 1.0, - "learning_rate": 1.554741700417227e-06, - "loss": 0.7305, - "step": 39028 - }, - { - "epoch": 1.0, - "learning_rate": 1.554718677761219e-06, - "loss": 0.6897, - "step": 39029 - }, - { - "epoch": 1.0, - "learning_rate": 1.5546956546804879e-06, - "loss": 0.5771, - "step": 39030 - }, - { - "epoch": 1.0, - "learning_rate": 1.5546726311750521e-06, - "loss": 0.7178, - "step": 39031 - }, - { - "epoch": 1.0, - "learning_rate": 1.5546496072449289e-06, - "loss": 0.7852, - "step": 39032 - }, - { - "epoch": 1.0, - "learning_rate": 1.5546265828901359e-06, - "loss": 0.6973, - "step": 39033 - }, - { - "epoch": 1.0, - "learning_rate": 1.554603558110691e-06, - "loss": 0.7324, - "step": 39034 - }, - { - "epoch": 1.0, - "learning_rate": 1.554580532906612e-06, - "loss": 0.7305, - "step": 39035 - }, - { - "epoch": 1.0, - "learning_rate": 1.5545575072779158e-06, - "loss": 0.6646, - "step": 39036 - }, - { - "epoch": 1.0, - "learning_rate": 1.5545344812246204e-06, - "loss": 0.7188, - "step": 39037 - }, - { - "epoch": 1.0, - "learning_rate": 1.5545114547467436e-06, - "loss": 0.7012, - "step": 39038 - }, - { - "epoch": 1.0, - "learning_rate": 1.5544884278443027e-06, - "loss": 0.667, - "step": 39039 - }, - { - "epoch": 1.0, - "learning_rate": 1.5544654005173156e-06, - "loss": 0.7207, - "step": 39040 - }, - { - "epoch": 1.0, - "learning_rate": 1.5544423727657998e-06, - "loss": 0.7188, - "step": 39041 - }, - { - "epoch": 1.0, - "learning_rate": 1.554419344589773e-06, - "loss": 0.7803, - "step": 39042 - }, - { - "epoch": 1.0, - "learning_rate": 1.5543963159892525e-06, - "loss": 0.47, - "step": 39043 - }, - { - "epoch": 1.0, - "learning_rate": 1.5543732869642568e-06, - "loss": 0.7314, - "step": 39044 - }, - { - "epoch": 1.0, - "learning_rate": 1.5543502575148027e-06, - "loss": 0.7969, - "step": 39045 - }, - { - "epoch": 1.0, - "learning_rate": 1.554327227640908e-06, - "loss": 0.6709, - "step": 39046 - }, - { - "epoch": 1.0, - "learning_rate": 1.5543041973425905e-06, - "loss": 0.6826, - "step": 39047 - }, - { - "epoch": 1.0, - "learning_rate": 1.5542811666198678e-06, - "loss": 0.6523, - "step": 39048 - }, - { - "epoch": 1.0, - "learning_rate": 1.5542581354727576e-06, - "loss": 0.624, - "step": 39049 - }, - { - "epoch": 1.0, - "learning_rate": 1.5542351039012772e-06, - "loss": 0.9346, - "step": 39050 - }, - { - "epoch": 1.0, - "learning_rate": 1.5542120719054445e-06, - "loss": 0.4854, - "step": 39051 - }, - { - "epoch": 1.0, - "learning_rate": 1.5541890394852773e-06, - "loss": 0.5947, - "step": 39052 - }, - { - "epoch": 1.0, - "learning_rate": 1.5541660066407927e-06, - "loss": 0.4493, - "step": 39053 - }, - { - "epoch": 1.0, - "learning_rate": 1.5541429733720088e-06, - "loss": 0.6431, - "step": 39054 - }, - { - "epoch": 1.0, - "learning_rate": 1.5541199396789436e-06, - "loss": 0.6187, - "step": 39055 - }, - { - "epoch": 1.0, - "learning_rate": 1.5540969055616135e-06, - "loss": 0.6377, - "step": 39056 - }, - { - "epoch": 1.0, - "learning_rate": 1.5540738710200375e-06, - "loss": 0.6558, - "step": 39057 - }, - { - "epoch": 1.0, - "learning_rate": 1.5540508360542322e-06, - "loss": 0.6567, - "step": 39058 - }, - { - "epoch": 1.0, - "learning_rate": 1.5540278006642158e-06, - "loss": 0.7207, - "step": 39059 - }, - { - "epoch": 1.0, - "learning_rate": 1.5540047648500058e-06, - "loss": 0.7651, - "step": 39060 - }, - { - "epoch": 1.0, - "learning_rate": 1.5539817286116197e-06, - "loss": 0.6479, - "step": 39061 - }, - { - "epoch": 1.0, - "learning_rate": 1.5539586919490755e-06, - "loss": 0.5249, - "step": 39062 - }, - { - "epoch": 1.0, - "learning_rate": 1.5539356548623903e-06, - "loss": 0.3691, - "step": 39063 - }, - { - "epoch": 1.0, - "learning_rate": 1.5539126173515822e-06, - "loss": 0.7324, - "step": 39064 - }, - { - "epoch": 1.0, - "learning_rate": 1.5538895794166687e-06, - "loss": 0.4797, - "step": 39065 - }, - { - "epoch": 1.0, - "learning_rate": 1.5538665410576672e-06, - "loss": 0.6865, - "step": 39066 - }, - { - "epoch": 1.0, - "learning_rate": 1.553843502274596e-06, - "loss": 0.7236, - "step": 39067 - }, - { - "epoch": 1.0, - "learning_rate": 1.5538204630674717e-06, - "loss": 0.6904, - "step": 39068 - }, - { - "epoch": 1.0, - "learning_rate": 1.553797423436313e-06, - "loss": 0.6719, - "step": 39069 - }, - { - "epoch": 1.0, - "learning_rate": 1.5537743833811373e-06, - "loss": 0.6592, - "step": 39070 - }, - { - "epoch": 1.0, - "learning_rate": 1.5537513429019615e-06, - "loss": 0.7002, - "step": 39071 - }, - { - "epoch": 1.0, - "learning_rate": 1.5537283019988036e-06, - "loss": 0.7598, - "step": 39072 - }, - { - "epoch": 1.0, - "learning_rate": 1.5537052606716817e-06, - "loss": 0.6465, - "step": 39073 - }, - { - "epoch": 1.0, - "learning_rate": 1.5536822189206133e-06, - "loss": 0.7471, - "step": 39074 - }, - { - "epoch": 1.0, - "learning_rate": 1.553659176745616e-06, - "loss": 0.4812, - "step": 39075 - }, - { - "epoch": 1.0, - "learning_rate": 1.553636134146707e-06, - "loss": 0.5994, - "step": 39076 - }, - { - "epoch": 1.0, - "learning_rate": 1.5536130911239042e-06, - "loss": 0.8574, - "step": 39077 - }, - { - "epoch": 1.0, - "learning_rate": 1.5535900476772255e-06, - "loss": 0.8984, - "step": 39078 - }, - { - "epoch": 1.0, - "learning_rate": 1.5535670038066884e-06, - "loss": 0.7021, - "step": 39079 - }, - { - "epoch": 1.0, - "learning_rate": 1.5535439595123102e-06, - "loss": 0.6157, - "step": 39080 - }, - { - "epoch": 1.0, - "learning_rate": 1.5535209147941094e-06, - "loss": 0.6167, - "step": 39081 - }, - { - "epoch": 1.0, - "learning_rate": 1.5534978696521023e-06, - "loss": 0.7852, - "step": 39082 - }, - { - "epoch": 1.0, - "learning_rate": 1.553474824086308e-06, - "loss": 0.8096, - "step": 39083 - }, - { - "epoch": 1.0, - "learning_rate": 1.5534517780967433e-06, - "loss": 0.541, - "step": 39084 - }, - { - "epoch": 1.0, - "learning_rate": 1.553428731683426e-06, - "loss": 0.8232, - "step": 39085 - }, - { - "epoch": 1.0, - "learning_rate": 1.5534056848463738e-06, - "loss": 0.5557, - "step": 39086 - }, - { - "epoch": 1.0, - "learning_rate": 1.5533826375856043e-06, - "loss": 0.7773, - "step": 39087 - }, - { - "epoch": 1.0, - "learning_rate": 1.553359589901135e-06, - "loss": 0.5508, - "step": 39088 - }, - { - "epoch": 1.0, - "learning_rate": 1.5533365417929835e-06, - "loss": 0.6958, - "step": 39089 - }, - { - "epoch": 1.0, - "learning_rate": 1.5533134932611682e-06, - "loss": 0.6875, - "step": 39090 - }, - { - "epoch": 1.0, - "learning_rate": 1.553290444305706e-06, - "loss": 0.7876, - "step": 39091 - }, - { - "epoch": 1.0, - "learning_rate": 1.5532673949266148e-06, - "loss": 0.6143, - "step": 39092 - }, - { - "epoch": 1.0, - "learning_rate": 1.553244345123912e-06, - "loss": 0.6807, - "step": 39093 - }, - { - "epoch": 1.0, - "learning_rate": 1.5532212948976156e-06, - "loss": 0.6182, - "step": 39094 - }, - { - "epoch": 1.0, - "learning_rate": 1.5531982442477432e-06, - "loss": 0.7139, - "step": 39095 - }, - { - "epoch": 1.0, - "learning_rate": 1.553175193174312e-06, - "loss": 0.7793, - "step": 39096 - }, - { - "epoch": 1.0, - "learning_rate": 1.5531521416773404e-06, - "loss": 0.8223, - "step": 39097 - }, - { - "epoch": 1.0, - "learning_rate": 1.5531290897568453e-06, - "loss": 0.6797, - "step": 39098 - }, - { - "epoch": 1.0, - "learning_rate": 1.553106037412845e-06, - "loss": 0.7207, - "step": 39099 - }, - { - "epoch": 1.0, - "learning_rate": 1.5530829846453566e-06, - "loss": 0.7646, - "step": 39100 - }, - { - "epoch": 1.0, - "learning_rate": 1.553059931454398e-06, - "loss": 0.5913, - "step": 39101 - }, - { - "epoch": 1.0, - "learning_rate": 1.5530368778399867e-06, - "loss": 0.8516, - "step": 39102 - }, - { - "epoch": 1.0, - "learning_rate": 1.5530138238021407e-06, - "loss": 0.8389, - "step": 39103 - }, - { - "epoch": 1.0, - "learning_rate": 1.5529907693408775e-06, - "loss": 0.7383, - "step": 39104 - }, - { - "epoch": 1.0, - "learning_rate": 1.5529677144562147e-06, - "loss": 0.6475, - "step": 39105 - }, - { - "epoch": 1.0, - "learning_rate": 1.5529446591481699e-06, - "loss": 0.5557, - "step": 39106 - }, - { - "epoch": 1.0, - "learning_rate": 1.5529216034167604e-06, - "loss": 0.793, - "step": 39107 - }, - { - "epoch": 1.0, - "learning_rate": 1.5528985472620048e-06, - "loss": 0.5508, - "step": 39108 - }, - { - "epoch": 1.0, - "learning_rate": 1.5528754906839198e-06, - "loss": 0.6016, - "step": 39109 - }, - { - "epoch": 1.0, - "learning_rate": 1.552852433682524e-06, - "loss": 0.6494, - "step": 39110 - }, - { - "epoch": 1.0, - "learning_rate": 1.552829376257834e-06, - "loss": 0.6895, - "step": 39111 - }, - { - "epoch": 1.0, - "learning_rate": 1.5528063184098683e-06, - "loss": 0.5325, - "step": 39112 - }, - { - "epoch": 1.0, - "learning_rate": 1.552783260138644e-06, - "loss": 0.5776, - "step": 39113 - }, - { - "epoch": 1.0, - "learning_rate": 1.5527602014441791e-06, - "loss": 0.7842, - "step": 39114 - }, - { - "epoch": 1.0, - "learning_rate": 1.552737142326491e-06, - "loss": 0.8076, - "step": 39115 - }, - { - "epoch": 1.0, - "learning_rate": 1.5527140827855977e-06, - "loss": 0.7334, - "step": 39116 - }, - { - "epoch": 1.0, - "learning_rate": 1.5526910228215165e-06, - "loss": 0.6416, - "step": 39117 - }, - { - "epoch": 1.0, - "learning_rate": 1.5526679624342651e-06, - "loss": 0.7148, - "step": 39118 - }, - { - "epoch": 1.0, - "learning_rate": 1.5526449016238615e-06, - "loss": 0.6445, - "step": 39119 - }, - { - "epoch": 1.0, - "learning_rate": 1.552621840390323e-06, - "loss": 0.7383, - "step": 39120 - }, - { - "epoch": 1.0, - "learning_rate": 1.552598778733667e-06, - "loss": 0.7622, - "step": 39121 - }, - { - "epoch": 1.0, - "learning_rate": 1.5525757166539122e-06, - "loss": 0.4534, - "step": 39122 - }, - { - "epoch": 1.0, - "learning_rate": 1.5525526541510748e-06, - "loss": 0.7383, - "step": 39123 - }, - { - "epoch": 1.0, - "learning_rate": 1.552529591225174e-06, - "loss": 0.6885, - "step": 39124 - }, - { - "epoch": 1.0, - "learning_rate": 1.5525065278762264e-06, - "loss": 0.5137, - "step": 39125 - }, - { - "epoch": 1.0, - "learning_rate": 1.55248346410425e-06, - "loss": 0.6528, - "step": 39126 - }, - { - "epoch": 1.0, - "learning_rate": 1.5524603999092623e-06, - "loss": 0.4695, - "step": 39127 - }, - { - "epoch": 1.0, - "learning_rate": 1.5524373352912813e-06, - "loss": 0.6782, - "step": 39128 - }, - { - "epoch": 1.0, - "learning_rate": 1.552414270250324e-06, - "loss": 0.8594, - "step": 39129 - }, - { - "epoch": 1.0, - "learning_rate": 1.5523912047864087e-06, - "loss": 0.7427, - "step": 39130 - }, - { - "epoch": 1.0, - "learning_rate": 1.552368138899553e-06, - "loss": 0.562, - "step": 39131 - }, - { - "epoch": 1.0, - "learning_rate": 1.5523450725897744e-06, - "loss": 0.8223, - "step": 39132 - }, - { - "epoch": 1.0, - "learning_rate": 1.5523220058570904e-06, - "loss": 0.5339, - "step": 39133 - }, - { - "epoch": 1.0, - "learning_rate": 1.5522989387015192e-06, - "loss": 0.6919, - "step": 39134 - }, - { - "epoch": 1.0, - "learning_rate": 1.5522758711230775e-06, - "loss": 0.708, - "step": 39135 - }, - { - "epoch": 1.0, - "learning_rate": 1.552252803121784e-06, - "loss": 0.7822, - "step": 39136 - }, - { - "epoch": 1.0, - "learning_rate": 1.5522297346976557e-06, - "loss": 0.6875, - "step": 39137 - }, - { - "epoch": 1.0, - "learning_rate": 1.5522066658507106e-06, - "loss": 0.6006, - "step": 39138 - }, - { - "epoch": 1.0, - "learning_rate": 1.5521835965809663e-06, - "loss": 0.6211, - "step": 39139 - }, - { - "epoch": 1.0, - "learning_rate": 1.5521605268884405e-06, - "loss": 0.2896, - "step": 39140 - }, - { - "epoch": 1.0, - "learning_rate": 1.5521374567731503e-06, - "loss": 0.6982, - "step": 39141 - }, - { - "epoch": 1.0, - "learning_rate": 1.5521143862351146e-06, - "loss": 0.8057, - "step": 39142 - }, - { - "epoch": 1.0, - "learning_rate": 1.5520913152743496e-06, - "loss": 0.5574, - "step": 39143 - }, - { - "epoch": 1.0, - "learning_rate": 1.5520682438908741e-06, - "loss": 0.5356, - "step": 39144 - }, - { - "epoch": 1.0, - "learning_rate": 1.5520451720847053e-06, - "loss": 0.4861, - "step": 39145 - }, - { - "epoch": 1.0, - "learning_rate": 1.5520220998558604e-06, - "loss": 0.7939, - "step": 39146 - }, - { - "epoch": 1.0, - "learning_rate": 1.5519990272043582e-06, - "loss": 0.5903, - "step": 39147 - }, - { - "epoch": 1.0, - "learning_rate": 1.5519759541302154e-06, - "loss": 0.6875, - "step": 39148 - }, - { - "epoch": 1.0, - "learning_rate": 1.55195288063345e-06, - "loss": 0.8525, - "step": 39149 - }, - { - "epoch": 1.0, - "learning_rate": 1.5519298067140797e-06, - "loss": 0.8418, - "step": 39150 - }, - { - "epoch": 1.0, - "learning_rate": 1.5519067323721223e-06, - "loss": 0.6963, - "step": 39151 - }, - { - "epoch": 1.0, - "learning_rate": 1.551883657607595e-06, - "loss": 0.6501, - "step": 39152 - }, - { - "epoch": 1.0, - "learning_rate": 1.5518605824205157e-06, - "loss": 0.6533, - "step": 39153 - }, - { - "epoch": 1.0, - "learning_rate": 1.5518375068109023e-06, - "loss": 0.7803, - "step": 39154 - }, - { - "epoch": 1.0, - "learning_rate": 1.5518144307787724e-06, - "loss": 0.5542, - "step": 39155 - }, - { - "epoch": 1.0, - "learning_rate": 1.5517913543241435e-06, - "loss": 0.6465, - "step": 39156 - }, - { - "epoch": 1.0, - "learning_rate": 1.5517682774470334e-06, - "loss": 0.6675, - "step": 39157 - }, - { - "epoch": 1.0, - "learning_rate": 1.5517452001474593e-06, - "loss": 0.5483, - "step": 39158 - }, - { - "epoch": 1.0, - "learning_rate": 1.5517221224254398e-06, - "loss": 0.5811, - "step": 39159 - }, - { - "epoch": 1.0, - "learning_rate": 1.5516990442809918e-06, - "loss": 0.6963, - "step": 39160 - }, - { - "epoch": 1.0, - "learning_rate": 1.551675965714133e-06, - "loss": 0.5317, - "step": 39161 - }, - { - "epoch": 1.0, - "learning_rate": 1.5516528867248818e-06, - "loss": 0.6846, - "step": 39162 - }, - { - "epoch": 1.0, - "learning_rate": 1.5516298073132547e-06, - "loss": 0.7207, - "step": 39163 - }, - { - "epoch": 1.0, - "learning_rate": 1.5516067274792706e-06, - "loss": 0.6377, - "step": 39164 - }, - { - "epoch": 1.0, - "learning_rate": 1.5515836472229462e-06, - "loss": 0.5239, - "step": 39165 - }, - { - "epoch": 1.0, - "learning_rate": 1.5515605665442998e-06, - "loss": 0.6963, - "step": 39166 - }, - { - "epoch": 1.0, - "learning_rate": 1.5515374854433487e-06, - "loss": 0.5217, - "step": 39167 - }, - { - "epoch": 1.0, - "learning_rate": 1.5515144039201106e-06, - "loss": 0.6904, - "step": 39168 - }, - { - "epoch": 1.0, - "learning_rate": 1.5514913219746038e-06, - "loss": 0.5059, - "step": 39169 - }, - { - "epoch": 1.0, - "learning_rate": 1.551468239606845e-06, - "loss": 0.5059, - "step": 39170 - }, - { - "epoch": 1.0, - "learning_rate": 1.5514451568168525e-06, - "loss": 0.6963, - "step": 39171 - }, - { - "epoch": 1.0, - "learning_rate": 1.5514220736046437e-06, - "loss": 0.6289, - "step": 39172 - }, - { - "epoch": 1.0, - "learning_rate": 1.5513989899702361e-06, - "loss": 0.6553, - "step": 39173 - }, - { - "epoch": 1.0, - "learning_rate": 1.551375905913648e-06, - "loss": 0.6309, - "step": 39174 - }, - { - "epoch": 1.0, - "learning_rate": 1.551352821434897e-06, - "loss": 0.5806, - "step": 39175 - }, - { - "epoch": 1.0, - "learning_rate": 1.5513297365339998e-06, - "loss": 0.7197, - "step": 39176 - }, - { - "epoch": 1.0, - "learning_rate": 1.5513066512109753e-06, - "loss": 0.8525, - "step": 39177 - }, - { - "epoch": 1.0, - "learning_rate": 1.5512835654658405e-06, - "loss": 0.6685, - "step": 39178 - }, - { - "epoch": 1.0, - "learning_rate": 1.5512604792986132e-06, - "loss": 0.5864, - "step": 39179 - }, - { - "epoch": 1.0, - "learning_rate": 1.5512373927093113e-06, - "loss": 0.7119, - "step": 39180 - }, - { - "epoch": 1.0, - "learning_rate": 1.551214305697952e-06, - "loss": 0.792, - "step": 39181 - }, - { - "epoch": 1.0, - "learning_rate": 1.5511912182645531e-06, - "loss": 0.6392, - "step": 39182 - }, - { - "epoch": 1.0, - "learning_rate": 1.5511681304091329e-06, - "loss": 0.3884, - "step": 39183 - }, - { - "epoch": 1.0, - "learning_rate": 1.5511450421317083e-06, - "loss": 0.7363, - "step": 39184 - }, - { - "epoch": 1.0, - "learning_rate": 1.5511219534322972e-06, - "loss": 0.6514, - "step": 39185 - }, - { - "epoch": 1.0, - "learning_rate": 1.5510988643109176e-06, - "loss": 0.5842, - "step": 39186 - }, - { - "epoch": 1.0, - "learning_rate": 1.5510757747675868e-06, - "loss": 0.6792, - "step": 39187 - }, - { - "epoch": 1.0, - "learning_rate": 1.5510526848023227e-06, - "loss": 0.603, - "step": 39188 - }, - { - "epoch": 1.0, - "learning_rate": 1.551029594415143e-06, - "loss": 0.4663, - "step": 39189 - }, - { - "epoch": 1.0, - "learning_rate": 1.551006503606065e-06, - "loss": 0.7393, - "step": 39190 - }, - { - "epoch": 1.0, - "learning_rate": 1.5509834123751069e-06, - "loss": 0.7021, - "step": 39191 - }, - { - "epoch": 1.0, - "learning_rate": 1.5509603207222859e-06, - "loss": 0.6211, - "step": 39192 - }, - { - "epoch": 1.0, - "learning_rate": 1.5509372286476202e-06, - "loss": 0.6055, - "step": 39193 - }, - { - "epoch": 1.0, - "learning_rate": 1.550914136151127e-06, - "loss": 0.5854, - "step": 39194 - }, - { - "epoch": 1.0, - "learning_rate": 1.5508910432328244e-06, - "loss": 0.4395, - "step": 39195 - }, - { - "epoch": 1.0, - "learning_rate": 1.5508679498927295e-06, - "loss": 0.6543, - "step": 39196 - }, - { - "epoch": 1.0, - "learning_rate": 1.5508448561308604e-06, - "loss": 0.5815, - "step": 39197 - }, - { - "epoch": 1.0, - "learning_rate": 1.550821761947235e-06, - "loss": 0.7129, - "step": 39198 - }, - { - "epoch": 1.0, - "learning_rate": 1.5507986673418705e-06, - "loss": 0.7134, - "step": 39199 - }, - { - "epoch": 1.0, - "learning_rate": 1.5507755723147851e-06, - "loss": 0.7881, - "step": 39200 - }, - { - "epoch": 1.0, - "learning_rate": 1.5507524768659957e-06, - "loss": 0.6021, - "step": 39201 - }, - { - "epoch": 1.0, - "learning_rate": 1.5507293809955207e-06, - "loss": 0.574, - "step": 39202 - }, - { - "epoch": 1.0, - "learning_rate": 1.5507062847033774e-06, - "loss": 0.6777, - "step": 39203 - }, - { - "epoch": 1.0, - "learning_rate": 1.5506831879895836e-06, - "loss": 0.5696, - "step": 39204 - }, - { - "epoch": 1.0, - "learning_rate": 1.5506600908541572e-06, - "loss": 0.543, - "step": 39205 - }, - { - "epoch": 1.0, - "learning_rate": 1.5506369932971155e-06, - "loss": 0.625, - "step": 39206 - }, - { - "epoch": 1.0, - "learning_rate": 1.5506138953184765e-06, - "loss": 0.6553, - "step": 39207 - }, - { - "epoch": 1.0, - "learning_rate": 1.5505907969182577e-06, - "loss": 0.709, - "step": 39208 - }, - { - "epoch": 1.0, - "learning_rate": 1.550567698096477e-06, - "loss": 0.6855, - "step": 39209 - }, - { - "epoch": 1.0, - "learning_rate": 1.5505445988531517e-06, - "loss": 0.6265, - "step": 39210 - }, - { - "epoch": 1.0, - "learning_rate": 1.5505214991883e-06, - "loss": 0.6172, - "step": 39211 - }, - { - "epoch": 1.01, - "learning_rate": 1.5504983991019392e-06, - "loss": 0.7666, - "step": 39212 - }, - { - "epoch": 1.01, - "learning_rate": 1.5504752985940867e-06, - "loss": 0.6504, - "step": 39213 - }, - { - "epoch": 1.01, - "learning_rate": 1.5504521976647613e-06, - "loss": 0.8174, - "step": 39214 - }, - { - "epoch": 1.01, - "learning_rate": 1.5504290963139795e-06, - "loss": 0.4951, - "step": 39215 - }, - { - "epoch": 1.01, - "learning_rate": 1.5504059945417593e-06, - "loss": 0.5669, - "step": 39216 - }, - { - "epoch": 1.01, - "learning_rate": 1.5503828923481189e-06, - "loss": 0.6646, - "step": 39217 - }, - { - "epoch": 1.01, - "learning_rate": 1.5503597897330754e-06, - "loss": 0.4766, - "step": 39218 - }, - { - "epoch": 1.01, - "learning_rate": 1.5503366866966468e-06, - "loss": 0.7241, - "step": 39219 - }, - { - "epoch": 1.01, - "learning_rate": 1.5503135832388508e-06, - "loss": 0.7017, - "step": 39220 - }, - { - "epoch": 1.01, - "learning_rate": 1.5502904793597047e-06, - "loss": 0.7393, - "step": 39221 - }, - { - "epoch": 1.01, - "learning_rate": 1.5502673750592268e-06, - "loss": 0.6816, - "step": 39222 - }, - { - "epoch": 1.01, - "learning_rate": 1.5502442703374343e-06, - "loss": 0.625, - "step": 39223 - }, - { - "epoch": 1.01, - "learning_rate": 1.5502211651943452e-06, - "loss": 0.5234, - "step": 39224 - }, - { - "epoch": 1.01, - "learning_rate": 1.5501980596299768e-06, - "loss": 0.5781, - "step": 39225 - }, - { - "epoch": 1.01, - "learning_rate": 1.5501749536443472e-06, - "loss": 0.6362, - "step": 39226 - }, - { - "epoch": 1.01, - "learning_rate": 1.5501518472374739e-06, - "loss": 0.5854, - "step": 39227 - }, - { - "epoch": 1.01, - "learning_rate": 1.5501287404093747e-06, - "loss": 0.4189, - "step": 39228 - }, - { - "epoch": 1.01, - "learning_rate": 1.5501056331600672e-06, - "loss": 0.8506, - "step": 39229 - }, - { - "epoch": 1.01, - "learning_rate": 1.5500825254895692e-06, - "loss": 0.5847, - "step": 39230 - }, - { - "epoch": 1.01, - "learning_rate": 1.550059417397898e-06, - "loss": 0.5999, - "step": 39231 - }, - { - "epoch": 1.01, - "learning_rate": 1.550036308885072e-06, - "loss": 0.8389, - "step": 39232 - }, - { - "epoch": 1.01, - "learning_rate": 1.5500131999511082e-06, - "loss": 0.8057, - "step": 39233 - }, - { - "epoch": 1.01, - "learning_rate": 1.5499900905960245e-06, - "loss": 0.5537, - "step": 39234 - }, - { - "epoch": 1.01, - "learning_rate": 1.549966980819839e-06, - "loss": 0.7744, - "step": 39235 - }, - { - "epoch": 1.01, - "learning_rate": 1.5499438706225689e-06, - "loss": 0.6758, - "step": 39236 - }, - { - "epoch": 1.01, - "learning_rate": 1.549920760004232e-06, - "loss": 0.6299, - "step": 39237 - }, - { - "epoch": 1.01, - "learning_rate": 1.5498976489648463e-06, - "loss": 0.6938, - "step": 39238 - }, - { - "epoch": 1.01, - "learning_rate": 1.5498745375044291e-06, - "loss": 0.7393, - "step": 39239 - }, - { - "epoch": 1.01, - "learning_rate": 1.5498514256229983e-06, - "loss": 0.8008, - "step": 39240 - }, - { - "epoch": 1.01, - "learning_rate": 1.5498283133205713e-06, - "loss": 0.6011, - "step": 39241 - }, - { - "epoch": 1.01, - "learning_rate": 1.5498052005971663e-06, - "loss": 0.6201, - "step": 39242 - }, - { - "epoch": 1.01, - "learning_rate": 1.5497820874528004e-06, - "loss": 0.7168, - "step": 39243 - }, - { - "epoch": 1.01, - "learning_rate": 1.5497589738874922e-06, - "loss": 0.4673, - "step": 39244 - }, - { - "epoch": 1.01, - "learning_rate": 1.5497358599012586e-06, - "loss": 0.4619, - "step": 39245 - }, - { - "epoch": 1.01, - "learning_rate": 1.5497127454941174e-06, - "loss": 0.7754, - "step": 39246 - }, - { - "epoch": 1.01, - "learning_rate": 1.5496896306660864e-06, - "loss": 0.9111, - "step": 39247 - }, - { - "epoch": 1.01, - "learning_rate": 1.5496665154171836e-06, - "loss": 0.6597, - "step": 39248 - }, - { - "epoch": 1.01, - "learning_rate": 1.5496433997474263e-06, - "loss": 0.5396, - "step": 39249 - }, - { - "epoch": 1.01, - "learning_rate": 1.5496202836568323e-06, - "loss": 0.6904, - "step": 39250 - }, - { - "epoch": 1.01, - "learning_rate": 1.5495971671454192e-06, - "loss": 0.5425, - "step": 39251 - }, - { - "epoch": 1.01, - "learning_rate": 1.5495740502132048e-06, - "loss": 0.6436, - "step": 39252 - }, - { - "epoch": 1.01, - "learning_rate": 1.5495509328602067e-06, - "loss": 0.6787, - "step": 39253 - }, - { - "epoch": 1.01, - "learning_rate": 1.5495278150864433e-06, - "loss": 0.7998, - "step": 39254 - }, - { - "epoch": 1.01, - "learning_rate": 1.5495046968919315e-06, - "loss": 0.5234, - "step": 39255 - }, - { - "epoch": 1.01, - "learning_rate": 1.5494815782766889e-06, - "loss": 0.6572, - "step": 39256 - }, - { - "epoch": 1.01, - "learning_rate": 1.5494584592407337e-06, - "loss": 0.7607, - "step": 39257 - }, - { - "epoch": 1.01, - "learning_rate": 1.5494353397840833e-06, - "loss": 0.687, - "step": 39258 - }, - { - "epoch": 1.01, - "learning_rate": 1.5494122199067559e-06, - "loss": 0.7969, - "step": 39259 - }, - { - "epoch": 1.01, - "learning_rate": 1.5493890996087684e-06, - "loss": 0.5337, - "step": 39260 - }, - { - "epoch": 1.01, - "learning_rate": 1.5493659788901393e-06, - "loss": 0.4785, - "step": 39261 - }, - { - "epoch": 1.01, - "learning_rate": 1.5493428577508857e-06, - "loss": 0.7002, - "step": 39262 - }, - { - "epoch": 1.01, - "learning_rate": 1.5493197361910256e-06, - "loss": 0.6338, - "step": 39263 - }, - { - "epoch": 1.01, - "learning_rate": 1.5492966142105766e-06, - "loss": 0.7051, - "step": 39264 - }, - { - "epoch": 1.01, - "learning_rate": 1.5492734918095564e-06, - "loss": 0.646, - "step": 39265 - }, - { - "epoch": 1.01, - "learning_rate": 1.5492503689879827e-06, - "loss": 0.4814, - "step": 39266 - }, - { - "epoch": 1.01, - "learning_rate": 1.5492272457458735e-06, - "loss": 0.6641, - "step": 39267 - }, - { - "epoch": 1.01, - "learning_rate": 1.5492041220832458e-06, - "loss": 0.6729, - "step": 39268 - }, - { - "epoch": 1.01, - "learning_rate": 1.5491809980001182e-06, - "loss": 0.6758, - "step": 39269 - }, - { - "epoch": 1.01, - "learning_rate": 1.5491578734965077e-06, - "loss": 0.5273, - "step": 39270 - }, - { - "epoch": 1.01, - "learning_rate": 1.5491347485724325e-06, - "loss": 0.5884, - "step": 39271 - }, - { - "epoch": 1.01, - "learning_rate": 1.54911162322791e-06, - "loss": 0.646, - "step": 39272 - }, - { - "epoch": 1.01, - "learning_rate": 1.549088497462958e-06, - "loss": 0.5542, - "step": 39273 - }, - { - "epoch": 1.01, - "learning_rate": 1.549065371277594e-06, - "loss": 0.5679, - "step": 39274 - }, - { - "epoch": 1.01, - "learning_rate": 1.549042244671836e-06, - "loss": 0.7373, - "step": 39275 - }, - { - "epoch": 1.01, - "learning_rate": 1.5490191176457014e-06, - "loss": 0.7783, - "step": 39276 - }, - { - "epoch": 1.01, - "learning_rate": 1.5489959901992084e-06, - "loss": 0.6787, - "step": 39277 - }, - { - "epoch": 1.01, - "learning_rate": 1.5489728623323744e-06, - "loss": 0.6113, - "step": 39278 - }, - { - "epoch": 1.01, - "learning_rate": 1.5489497340452173e-06, - "loss": 0.5825, - "step": 39279 - }, - { - "epoch": 1.01, - "learning_rate": 1.5489266053377543e-06, - "loss": 0.7666, - "step": 39280 - }, - { - "epoch": 1.01, - "learning_rate": 1.5489034762100034e-06, - "loss": 0.7539, - "step": 39281 - }, - { - "epoch": 1.01, - "learning_rate": 1.5488803466619825e-06, - "loss": 0.7393, - "step": 39282 - }, - { - "epoch": 1.01, - "learning_rate": 1.548857216693709e-06, - "loss": 0.6562, - "step": 39283 - }, - { - "epoch": 1.01, - "learning_rate": 1.5488340863052009e-06, - "loss": 0.749, - "step": 39284 - }, - { - "epoch": 1.01, - "learning_rate": 1.5488109554964758e-06, - "loss": 0.7734, - "step": 39285 - }, - { - "epoch": 1.01, - "learning_rate": 1.5487878242675514e-06, - "loss": 0.6064, - "step": 39286 - }, - { - "epoch": 1.01, - "learning_rate": 1.5487646926184454e-06, - "loss": 0.6499, - "step": 39287 - }, - { - "epoch": 1.01, - "learning_rate": 1.5487415605491754e-06, - "loss": 0.7539, - "step": 39288 - }, - { - "epoch": 1.01, - "learning_rate": 1.5487184280597595e-06, - "loss": 0.5132, - "step": 39289 - }, - { - "epoch": 1.01, - "learning_rate": 1.5486952951502148e-06, - "loss": 0.6035, - "step": 39290 - }, - { - "epoch": 1.01, - "learning_rate": 1.5486721618205594e-06, - "loss": 0.6533, - "step": 39291 - }, - { - "epoch": 1.01, - "learning_rate": 1.5486490280708112e-06, - "loss": 0.625, - "step": 39292 - }, - { - "epoch": 1.01, - "learning_rate": 1.5486258939009874e-06, - "loss": 0.5879, - "step": 39293 - }, - { - "epoch": 1.01, - "learning_rate": 1.548602759311106e-06, - "loss": 0.709, - "step": 39294 - }, - { - "epoch": 1.01, - "learning_rate": 1.5485796243011847e-06, - "loss": 0.7568, - "step": 39295 - }, - { - "epoch": 1.01, - "learning_rate": 1.5485564888712412e-06, - "loss": 0.7207, - "step": 39296 - }, - { - "epoch": 1.01, - "learning_rate": 1.5485333530212932e-06, - "loss": 0.7695, - "step": 39297 - }, - { - "epoch": 1.01, - "learning_rate": 1.5485102167513583e-06, - "loss": 0.7061, - "step": 39298 - }, - { - "epoch": 1.01, - "learning_rate": 1.5484870800614548e-06, - "loss": 0.7832, - "step": 39299 - }, - { - "epoch": 1.01, - "learning_rate": 1.5484639429515997e-06, - "loss": 0.7031, - "step": 39300 - }, - { - "epoch": 1.01, - "learning_rate": 1.548440805421811e-06, - "loss": 0.5811, - "step": 39301 - }, - { - "epoch": 1.01, - "learning_rate": 1.5484176674721064e-06, - "loss": 0.5823, - "step": 39302 - }, - { - "epoch": 1.01, - "learning_rate": 1.5483945291025035e-06, - "loss": 0.6924, - "step": 39303 - }, - { - "epoch": 1.01, - "learning_rate": 1.5483713903130204e-06, - "loss": 0.4331, - "step": 39304 - }, - { - "epoch": 1.01, - "learning_rate": 1.5483482511036744e-06, - "loss": 0.4541, - "step": 39305 - }, - { - "epoch": 1.01, - "learning_rate": 1.548325111474483e-06, - "loss": 0.5225, - "step": 39306 - }, - { - "epoch": 1.01, - "learning_rate": 1.5483019714254648e-06, - "loss": 0.6797, - "step": 39307 - }, - { - "epoch": 1.01, - "learning_rate": 1.5482788309566366e-06, - "loss": 0.6582, - "step": 39308 - }, - { - "epoch": 1.01, - "learning_rate": 1.548255690068017e-06, - "loss": 0.6787, - "step": 39309 - }, - { - "epoch": 1.01, - "learning_rate": 1.548232548759623e-06, - "loss": 0.7109, - "step": 39310 - }, - { - "epoch": 1.01, - "learning_rate": 1.5482094070314721e-06, - "loss": 0.6982, - "step": 39311 - }, - { - "epoch": 1.01, - "learning_rate": 1.5481862648835828e-06, - "loss": 0.6035, - "step": 39312 - }, - { - "epoch": 1.01, - "learning_rate": 1.5481631223159726e-06, - "loss": 0.5273, - "step": 39313 - }, - { - "epoch": 1.01, - "learning_rate": 1.5481399793286589e-06, - "loss": 0.7852, - "step": 39314 - }, - { - "epoch": 1.01, - "learning_rate": 1.54811683592166e-06, - "loss": 0.8955, - "step": 39315 - }, - { - "epoch": 1.01, - "learning_rate": 1.5480936920949929e-06, - "loss": 0.5042, - "step": 39316 - }, - { - "epoch": 1.01, - "learning_rate": 1.5480705478486758e-06, - "loss": 0.5596, - "step": 39317 - }, - { - "epoch": 1.01, - "learning_rate": 1.5480474031827261e-06, - "loss": 0.7051, - "step": 39318 - }, - { - "epoch": 1.01, - "learning_rate": 1.5480242580971618e-06, - "loss": 0.6309, - "step": 39319 - }, - { - "epoch": 1.01, - "learning_rate": 1.5480011125920007e-06, - "loss": 0.686, - "step": 39320 - }, - { - "epoch": 1.01, - "learning_rate": 1.54797796666726e-06, - "loss": 0.7578, - "step": 39321 - }, - { - "epoch": 1.01, - "learning_rate": 1.547954820322958e-06, - "loss": 0.6953, - "step": 39322 - }, - { - "epoch": 1.01, - "learning_rate": 1.547931673559112e-06, - "loss": 0.7188, - "step": 39323 - }, - { - "epoch": 1.01, - "learning_rate": 1.5479085263757403e-06, - "loss": 0.6406, - "step": 39324 - }, - { - "epoch": 1.01, - "learning_rate": 1.5478853787728601e-06, - "loss": 0.52, - "step": 39325 - }, - { - "epoch": 1.01, - "learning_rate": 1.5478622307504892e-06, - "loss": 0.792, - "step": 39326 - }, - { - "epoch": 1.01, - "learning_rate": 1.5478390823086452e-06, - "loss": 0.4535, - "step": 39327 - }, - { - "epoch": 1.01, - "learning_rate": 1.547815933447346e-06, - "loss": 0.645, - "step": 39328 - }, - { - "epoch": 1.01, - "learning_rate": 1.5477927841666096e-06, - "loss": 0.5908, - "step": 39329 - }, - { - "epoch": 1.01, - "learning_rate": 1.5477696344664532e-06, - "loss": 0.4561, - "step": 39330 - }, - { - "epoch": 1.01, - "learning_rate": 1.547746484346895e-06, - "loss": 0.533, - "step": 39331 - }, - { - "epoch": 1.01, - "learning_rate": 1.5477233338079526e-06, - "loss": 0.748, - "step": 39332 - }, - { - "epoch": 1.01, - "learning_rate": 1.5477001828496431e-06, - "loss": 0.7568, - "step": 39333 - }, - { - "epoch": 1.01, - "learning_rate": 1.5476770314719854e-06, - "loss": 0.6611, - "step": 39334 - }, - { - "epoch": 1.01, - "learning_rate": 1.5476538796749962e-06, - "loss": 0.7285, - "step": 39335 - }, - { - "epoch": 1.01, - "learning_rate": 1.5476307274586937e-06, - "loss": 0.6821, - "step": 39336 - }, - { - "epoch": 1.01, - "learning_rate": 1.5476075748230955e-06, - "loss": 0.5703, - "step": 39337 - }, - { - "epoch": 1.01, - "learning_rate": 1.5475844217682192e-06, - "loss": 0.6489, - "step": 39338 - }, - { - "epoch": 1.01, - "learning_rate": 1.5475612682940828e-06, - "loss": 0.7637, - "step": 39339 - }, - { - "epoch": 1.01, - "learning_rate": 1.5475381144007042e-06, - "loss": 0.8486, - "step": 39340 - }, - { - "epoch": 1.01, - "learning_rate": 1.5475149600881006e-06, - "loss": 0.665, - "step": 39341 - }, - { - "epoch": 1.01, - "learning_rate": 1.54749180535629e-06, - "loss": 0.6729, - "step": 39342 - }, - { - "epoch": 1.01, - "learning_rate": 1.5474686502052899e-06, - "loss": 0.6392, - "step": 39343 - }, - { - "epoch": 1.01, - "learning_rate": 1.5474454946351187e-06, - "loss": 0.8301, - "step": 39344 - }, - { - "epoch": 1.01, - "learning_rate": 1.547422338645793e-06, - "loss": 0.5115, - "step": 39345 - }, - { - "epoch": 1.01, - "learning_rate": 1.5473991822373319e-06, - "loss": 0.6797, - "step": 39346 - }, - { - "epoch": 1.01, - "learning_rate": 1.547376025409752e-06, - "loss": 0.6709, - "step": 39347 - }, - { - "epoch": 1.01, - "learning_rate": 1.5473528681630711e-06, - "loss": 0.5737, - "step": 39348 - }, - { - "epoch": 1.01, - "learning_rate": 1.547329710497308e-06, - "loss": 0.4753, - "step": 39349 - }, - { - "epoch": 1.01, - "learning_rate": 1.5473065524124795e-06, - "loss": 0.7021, - "step": 39350 - }, - { - "epoch": 1.01, - "learning_rate": 1.5472833939086033e-06, - "loss": 0.4125, - "step": 39351 - }, - { - "epoch": 1.01, - "learning_rate": 1.5472602349856975e-06, - "loss": 0.6187, - "step": 39352 - }, - { - "epoch": 1.01, - "learning_rate": 1.5472370756437797e-06, - "loss": 0.5249, - "step": 39353 - }, - { - "epoch": 1.01, - "learning_rate": 1.547213915882868e-06, - "loss": 0.6328, - "step": 39354 - }, - { - "epoch": 1.01, - "learning_rate": 1.5471907557029793e-06, - "loss": 0.6367, - "step": 39355 - }, - { - "epoch": 1.01, - "learning_rate": 1.5471675951041315e-06, - "loss": 0.5332, - "step": 39356 - }, - { - "epoch": 1.01, - "learning_rate": 1.5471444340863434e-06, - "loss": 0.6357, - "step": 39357 - }, - { - "epoch": 1.01, - "learning_rate": 1.5471212726496313e-06, - "loss": 0.5791, - "step": 39358 - }, - { - "epoch": 1.01, - "learning_rate": 1.5470981107940139e-06, - "loss": 0.6606, - "step": 39359 - }, - { - "epoch": 1.01, - "learning_rate": 1.547074948519509e-06, - "loss": 0.7324, - "step": 39360 - }, - { - "epoch": 1.01, - "learning_rate": 1.5470517858261334e-06, - "loss": 0.4526, - "step": 39361 - }, - { - "epoch": 1.01, - "learning_rate": 1.5470286227139059e-06, - "loss": 0.5967, - "step": 39362 - }, - { - "epoch": 1.01, - "learning_rate": 1.5470054591828433e-06, - "loss": 0.6294, - "step": 39363 - }, - { - "epoch": 1.01, - "learning_rate": 1.546982295232964e-06, - "loss": 0.6934, - "step": 39364 - }, - { - "epoch": 1.01, - "learning_rate": 1.5469591308642853e-06, - "loss": 0.6094, - "step": 39365 - }, - { - "epoch": 1.01, - "learning_rate": 1.546935966076825e-06, - "loss": 0.6479, - "step": 39366 - }, - { - "epoch": 1.01, - "learning_rate": 1.5469128008706014e-06, - "loss": 0.625, - "step": 39367 - }, - { - "epoch": 1.01, - "learning_rate": 1.5468896352456317e-06, - "loss": 0.7441, - "step": 39368 - }, - { - "epoch": 1.01, - "learning_rate": 1.5468664692019337e-06, - "loss": 0.8271, - "step": 39369 - }, - { - "epoch": 1.01, - "learning_rate": 1.5468433027395253e-06, - "loss": 0.8135, - "step": 39370 - }, - { - "epoch": 1.01, - "learning_rate": 1.5468201358584239e-06, - "loss": 0.5721, - "step": 39371 - }, - { - "epoch": 1.01, - "learning_rate": 1.5467969685586474e-06, - "loss": 0.7031, - "step": 39372 - }, - { - "epoch": 1.01, - "learning_rate": 1.5467738008402141e-06, - "loss": 0.5121, - "step": 39373 - }, - { - "epoch": 1.01, - "learning_rate": 1.546750632703141e-06, - "loss": 0.5312, - "step": 39374 - }, - { - "epoch": 1.01, - "learning_rate": 1.5467274641474458e-06, - "loss": 0.7559, - "step": 39375 - }, - { - "epoch": 1.01, - "learning_rate": 1.5467042951731468e-06, - "loss": 0.7666, - "step": 39376 - }, - { - "epoch": 1.01, - "learning_rate": 1.5466811257802615e-06, - "loss": 0.8477, - "step": 39377 - }, - { - "epoch": 1.01, - "learning_rate": 1.5466579559688073e-06, - "loss": 0.707, - "step": 39378 - }, - { - "epoch": 1.01, - "learning_rate": 1.546634785738803e-06, - "loss": 0.5469, - "step": 39379 - }, - { - "epoch": 1.01, - "learning_rate": 1.5466116150902647e-06, - "loss": 0.6011, - "step": 39380 - }, - { - "epoch": 1.01, - "learning_rate": 1.5465884440232114e-06, - "loss": 0.7266, - "step": 39381 - }, - { - "epoch": 1.01, - "learning_rate": 1.5465652725376603e-06, - "loss": 0.5845, - "step": 39382 - }, - { - "epoch": 1.01, - "learning_rate": 1.5465421006336295e-06, - "loss": 0.7256, - "step": 39383 - }, - { - "epoch": 1.01, - "learning_rate": 1.5465189283111364e-06, - "loss": 0.6982, - "step": 39384 - }, - { - "epoch": 1.01, - "learning_rate": 1.546495755570199e-06, - "loss": 0.6875, - "step": 39385 - }, - { - "epoch": 1.01, - "learning_rate": 1.5464725824108347e-06, - "loss": 0.707, - "step": 39386 - }, - { - "epoch": 1.01, - "learning_rate": 1.5464494088330616e-06, - "loss": 0.8086, - "step": 39387 - }, - { - "epoch": 1.01, - "learning_rate": 1.5464262348368974e-06, - "loss": 0.6875, - "step": 39388 - }, - { - "epoch": 1.01, - "learning_rate": 1.5464030604223597e-06, - "loss": 0.6646, - "step": 39389 - }, - { - "epoch": 1.01, - "learning_rate": 1.5463798855894664e-06, - "loss": 0.6694, - "step": 39390 - }, - { - "epoch": 1.01, - "learning_rate": 1.546356710338235e-06, - "loss": 0.7637, - "step": 39391 - }, - { - "epoch": 1.01, - "learning_rate": 1.5463335346686834e-06, - "loss": 0.7441, - "step": 39392 - }, - { - "epoch": 1.01, - "learning_rate": 1.5463103585808296e-06, - "loss": 0.4692, - "step": 39393 - }, - { - "epoch": 1.01, - "learning_rate": 1.5462871820746907e-06, - "loss": 0.7168, - "step": 39394 - }, - { - "epoch": 1.01, - "learning_rate": 1.546264005150285e-06, - "loss": 0.7139, - "step": 39395 - }, - { - "epoch": 1.01, - "learning_rate": 1.54624082780763e-06, - "loss": 0.6104, - "step": 39396 - }, - { - "epoch": 1.01, - "learning_rate": 1.5462176500467435e-06, - "loss": 0.7578, - "step": 39397 - }, - { - "epoch": 1.01, - "learning_rate": 1.5461944718676435e-06, - "loss": 0.8701, - "step": 39398 - }, - { - "epoch": 1.01, - "learning_rate": 1.5461712932703471e-06, - "loss": 0.6885, - "step": 39399 - }, - { - "epoch": 1.01, - "learning_rate": 1.546148114254873e-06, - "loss": 0.564, - "step": 39400 - }, - { - "epoch": 1.01, - "learning_rate": 1.546124934821238e-06, - "loss": 0.6982, - "step": 39401 - }, - { - "epoch": 1.01, - "learning_rate": 1.5461017549694605e-06, - "loss": 0.5913, - "step": 39402 - }, - { - "epoch": 1.01, - "learning_rate": 1.5460785746995574e-06, - "loss": 0.7183, - "step": 39403 - }, - { - "epoch": 1.01, - "learning_rate": 1.5460553940115477e-06, - "loss": 0.7158, - "step": 39404 - }, - { - "epoch": 1.01, - "learning_rate": 1.5460322129054482e-06, - "loss": 0.6875, - "step": 39405 - }, - { - "epoch": 1.01, - "learning_rate": 1.546009031381277e-06, - "loss": 0.5244, - "step": 39406 - }, - { - "epoch": 1.01, - "learning_rate": 1.5459858494390518e-06, - "loss": 0.6699, - "step": 39407 - }, - { - "epoch": 1.01, - "learning_rate": 1.5459626670787903e-06, - "loss": 0.6465, - "step": 39408 - }, - { - "epoch": 1.01, - "learning_rate": 1.5459394843005105e-06, - "loss": 0.6865, - "step": 39409 - }, - { - "epoch": 1.01, - "learning_rate": 1.5459163011042296e-06, - "loss": 0.667, - "step": 39410 - }, - { - "epoch": 1.01, - "learning_rate": 1.5458931174899658e-06, - "loss": 0.4849, - "step": 39411 - }, - { - "epoch": 1.01, - "learning_rate": 1.545869933457737e-06, - "loss": 0.5986, - "step": 39412 - }, - { - "epoch": 1.01, - "learning_rate": 1.5458467490075604e-06, - "loss": 0.645, - "step": 39413 - }, - { - "epoch": 1.01, - "learning_rate": 1.545823564139454e-06, - "loss": 0.7344, - "step": 39414 - }, - { - "epoch": 1.01, - "learning_rate": 1.5458003788534359e-06, - "loss": 0.5801, - "step": 39415 - }, - { - "epoch": 1.01, - "learning_rate": 1.5457771931495234e-06, - "loss": 0.6963, - "step": 39416 - }, - { - "epoch": 1.01, - "learning_rate": 1.5457540070277344e-06, - "loss": 0.5781, - "step": 39417 - }, - { - "epoch": 1.01, - "learning_rate": 1.5457308204880865e-06, - "loss": 0.5322, - "step": 39418 - }, - { - "epoch": 1.01, - "learning_rate": 1.5457076335305979e-06, - "loss": 0.8262, - "step": 39419 - }, - { - "epoch": 1.01, - "learning_rate": 1.545684446155286e-06, - "loss": 0.5881, - "step": 39420 - }, - { - "epoch": 1.01, - "learning_rate": 1.5456612583621684e-06, - "loss": 0.8135, - "step": 39421 - }, - { - "epoch": 1.01, - "learning_rate": 1.545638070151263e-06, - "loss": 0.792, - "step": 39422 - }, - { - "epoch": 1.01, - "learning_rate": 1.5456148815225877e-06, - "loss": 0.6465, - "step": 39423 - }, - { - "epoch": 1.01, - "learning_rate": 1.5455916924761604e-06, - "loss": 0.8281, - "step": 39424 - }, - { - "epoch": 1.01, - "learning_rate": 1.5455685030119985e-06, - "loss": 0.6309, - "step": 39425 - }, - { - "epoch": 1.01, - "learning_rate": 1.54554531313012e-06, - "loss": 0.6885, - "step": 39426 - }, - { - "epoch": 1.01, - "learning_rate": 1.5455221228305421e-06, - "loss": 0.5161, - "step": 39427 - }, - { - "epoch": 1.01, - "learning_rate": 1.5454989321132835e-06, - "loss": 0.7617, - "step": 39428 - }, - { - "epoch": 1.01, - "learning_rate": 1.5454757409783613e-06, - "loss": 0.79, - "step": 39429 - }, - { - "epoch": 1.01, - "learning_rate": 1.5454525494257933e-06, - "loss": 0.6787, - "step": 39430 - }, - { - "epoch": 1.01, - "learning_rate": 1.5454293574555974e-06, - "loss": 0.7432, - "step": 39431 - }, - { - "epoch": 1.01, - "learning_rate": 1.5454061650677913e-06, - "loss": 0.3538, - "step": 39432 - }, - { - "epoch": 1.01, - "learning_rate": 1.5453829722623927e-06, - "loss": 0.8047, - "step": 39433 - }, - { - "epoch": 1.01, - "learning_rate": 1.54535977903942e-06, - "loss": 0.5698, - "step": 39434 - }, - { - "epoch": 1.01, - "learning_rate": 1.5453365853988895e-06, - "loss": 0.5312, - "step": 39435 - }, - { - "epoch": 1.01, - "learning_rate": 1.5453133913408205e-06, - "loss": 0.624, - "step": 39436 - }, - { - "epoch": 1.01, - "learning_rate": 1.5452901968652298e-06, - "loss": 0.708, - "step": 39437 - }, - { - "epoch": 1.01, - "learning_rate": 1.5452670019721356e-06, - "loss": 0.6343, - "step": 39438 - }, - { - "epoch": 1.01, - "learning_rate": 1.5452438066615555e-06, - "loss": 0.832, - "step": 39439 - }, - { - "epoch": 1.01, - "learning_rate": 1.5452206109335072e-06, - "loss": 0.603, - "step": 39440 - }, - { - "epoch": 1.01, - "learning_rate": 1.5451974147880087e-06, - "loss": 0.6025, - "step": 39441 - }, - { - "epoch": 1.01, - "learning_rate": 1.5451742182250777e-06, - "loss": 0.7129, - "step": 39442 - }, - { - "epoch": 1.01, - "learning_rate": 1.5451510212447319e-06, - "loss": 0.6211, - "step": 39443 - }, - { - "epoch": 1.01, - "learning_rate": 1.5451278238469888e-06, - "loss": 0.5796, - "step": 39444 - }, - { - "epoch": 1.01, - "learning_rate": 1.5451046260318665e-06, - "loss": 0.6738, - "step": 39445 - }, - { - "epoch": 1.01, - "learning_rate": 1.5450814277993824e-06, - "loss": 0.6519, - "step": 39446 - }, - { - "epoch": 1.01, - "learning_rate": 1.545058229149555e-06, - "loss": 0.6777, - "step": 39447 - }, - { - "epoch": 1.01, - "learning_rate": 1.5450350300824011e-06, - "loss": 0.6265, - "step": 39448 - }, - { - "epoch": 1.01, - "learning_rate": 1.545011830597939e-06, - "loss": 0.5249, - "step": 39449 - }, - { - "epoch": 1.01, - "learning_rate": 1.5449886306961866e-06, - "loss": 0.6992, - "step": 39450 - }, - { - "epoch": 1.01, - "learning_rate": 1.5449654303771613e-06, - "loss": 0.7129, - "step": 39451 - }, - { - "epoch": 1.01, - "learning_rate": 1.5449422296408812e-06, - "loss": 0.7363, - "step": 39452 - }, - { - "epoch": 1.01, - "learning_rate": 1.544919028487364e-06, - "loss": 0.5791, - "step": 39453 - }, - { - "epoch": 1.01, - "learning_rate": 1.544895826916627e-06, - "loss": 0.8135, - "step": 39454 - }, - { - "epoch": 1.01, - "learning_rate": 1.5448726249286884e-06, - "loss": 0.5442, - "step": 39455 - }, - { - "epoch": 1.01, - "learning_rate": 1.544849422523566e-06, - "loss": 0.7881, - "step": 39456 - }, - { - "epoch": 1.01, - "learning_rate": 1.5448262197012774e-06, - "loss": 0.624, - "step": 39457 - }, - { - "epoch": 1.01, - "learning_rate": 1.5448030164618406e-06, - "loss": 0.7163, - "step": 39458 - }, - { - "epoch": 1.01, - "learning_rate": 1.544779812805273e-06, - "loss": 0.666, - "step": 39459 - }, - { - "epoch": 1.01, - "learning_rate": 1.5447566087315927e-06, - "loss": 0.8145, - "step": 39460 - }, - { - "epoch": 1.01, - "learning_rate": 1.5447334042408168e-06, - "loss": 0.6128, - "step": 39461 - }, - { - "epoch": 1.01, - "learning_rate": 1.544710199332964e-06, - "loss": 0.8145, - "step": 39462 - }, - { - "epoch": 1.01, - "learning_rate": 1.5446869940080517e-06, - "loss": 0.3967, - "step": 39463 - }, - { - "epoch": 1.01, - "learning_rate": 1.5446637882660975e-06, - "loss": 0.8828, - "step": 39464 - }, - { - "epoch": 1.01, - "learning_rate": 1.5446405821071194e-06, - "loss": 0.7754, - "step": 39465 - }, - { - "epoch": 1.01, - "learning_rate": 1.544617375531135e-06, - "loss": 0.6655, - "step": 39466 - }, - { - "epoch": 1.01, - "learning_rate": 1.544594168538162e-06, - "loss": 0.5762, - "step": 39467 - }, - { - "epoch": 1.01, - "learning_rate": 1.5445709611282186e-06, - "loss": 0.6401, - "step": 39468 - }, - { - "epoch": 1.01, - "learning_rate": 1.544547753301322e-06, - "loss": 0.5032, - "step": 39469 - }, - { - "epoch": 1.01, - "learning_rate": 1.54452454505749e-06, - "loss": 0.6509, - "step": 39470 - }, - { - "epoch": 1.01, - "learning_rate": 1.5445013363967409e-06, - "loss": 0.7529, - "step": 39471 - }, - { - "epoch": 1.01, - "learning_rate": 1.5444781273190919e-06, - "loss": 0.6104, - "step": 39472 - }, - { - "epoch": 1.01, - "learning_rate": 1.5444549178245614e-06, - "loss": 0.7148, - "step": 39473 - }, - { - "epoch": 1.01, - "learning_rate": 1.5444317079131667e-06, - "loss": 0.6914, - "step": 39474 - }, - { - "epoch": 1.01, - "learning_rate": 1.5444084975849254e-06, - "loss": 0.7207, - "step": 39475 - }, - { - "epoch": 1.01, - "learning_rate": 1.5443852868398558e-06, - "loss": 0.832, - "step": 39476 - }, - { - "epoch": 1.01, - "learning_rate": 1.5443620756779753e-06, - "loss": 0.5659, - "step": 39477 - }, - { - "epoch": 1.01, - "learning_rate": 1.544338864099302e-06, - "loss": 0.6157, - "step": 39478 - }, - { - "epoch": 1.01, - "learning_rate": 1.5443156521038532e-06, - "loss": 0.668, - "step": 39479 - }, - { - "epoch": 1.01, - "learning_rate": 1.544292439691647e-06, - "loss": 0.5029, - "step": 39480 - }, - { - "epoch": 1.01, - "learning_rate": 1.5442692268627013e-06, - "loss": 0.6719, - "step": 39481 - }, - { - "epoch": 1.01, - "learning_rate": 1.5442460136170333e-06, - "loss": 0.7373, - "step": 39482 - }, - { - "epoch": 1.01, - "learning_rate": 1.5442227999546616e-06, - "loss": 0.7402, - "step": 39483 - }, - { - "epoch": 1.01, - "learning_rate": 1.5441995858756034e-06, - "loss": 0.6768, - "step": 39484 - }, - { - "epoch": 1.01, - "learning_rate": 1.5441763713798764e-06, - "loss": 0.6416, - "step": 39485 - }, - { - "epoch": 1.01, - "learning_rate": 1.5441531564674985e-06, - "loss": 0.3284, - "step": 39486 - }, - { - "epoch": 1.01, - "learning_rate": 1.5441299411384878e-06, - "loss": 0.7549, - "step": 39487 - }, - { - "epoch": 1.01, - "learning_rate": 1.5441067253928618e-06, - "loss": 0.6406, - "step": 39488 - }, - { - "epoch": 1.01, - "learning_rate": 1.5440835092306386e-06, - "loss": 0.7476, - "step": 39489 - }, - { - "epoch": 1.01, - "learning_rate": 1.5440602926518352e-06, - "loss": 0.7129, - "step": 39490 - }, - { - "epoch": 1.01, - "learning_rate": 1.5440370756564699e-06, - "loss": 0.4922, - "step": 39491 - }, - { - "epoch": 1.01, - "learning_rate": 1.5440138582445603e-06, - "loss": 0.5835, - "step": 39492 - }, - { - "epoch": 1.01, - "learning_rate": 1.543990640416125e-06, - "loss": 0.583, - "step": 39493 - }, - { - "epoch": 1.01, - "learning_rate": 1.5439674221711804e-06, - "loss": 0.791, - "step": 39494 - }, - { - "epoch": 1.01, - "learning_rate": 1.5439442035097452e-06, - "loss": 0.5361, - "step": 39495 - }, - { - "epoch": 1.01, - "learning_rate": 1.543920984431837e-06, - "loss": 0.5791, - "step": 39496 - }, - { - "epoch": 1.01, - "learning_rate": 1.543897764937473e-06, - "loss": 0.5669, - "step": 39497 - }, - { - "epoch": 1.01, - "learning_rate": 1.543874545026672e-06, - "loss": 0.6694, - "step": 39498 - }, - { - "epoch": 1.01, - "learning_rate": 1.5438513246994514e-06, - "loss": 0.686, - "step": 39499 - }, - { - "epoch": 1.01, - "learning_rate": 1.5438281039558283e-06, - "loss": 0.8086, - "step": 39500 - }, - { - "epoch": 1.01, - "learning_rate": 1.5438048827958214e-06, - "loss": 0.5574, - "step": 39501 - }, - { - "epoch": 1.01, - "learning_rate": 1.543781661219448e-06, - "loss": 0.7158, - "step": 39502 - }, - { - "epoch": 1.01, - "learning_rate": 1.5437584392267262e-06, - "loss": 0.5977, - "step": 39503 - }, - { - "epoch": 1.01, - "learning_rate": 1.5437352168176733e-06, - "loss": 0.5265, - "step": 39504 - }, - { - "epoch": 1.01, - "learning_rate": 1.5437119939923075e-06, - "loss": 0.6089, - "step": 39505 - }, - { - "epoch": 1.01, - "learning_rate": 1.5436887707506464e-06, - "loss": 0.8115, - "step": 39506 - }, - { - "epoch": 1.01, - "learning_rate": 1.5436655470927078e-06, - "loss": 0.6426, - "step": 39507 - }, - { - "epoch": 1.01, - "learning_rate": 1.5436423230185094e-06, - "loss": 0.749, - "step": 39508 - }, - { - "epoch": 1.01, - "learning_rate": 1.5436190985280693e-06, - "loss": 0.6494, - "step": 39509 - }, - { - "epoch": 1.01, - "learning_rate": 1.5435958736214049e-06, - "loss": 0.6074, - "step": 39510 - }, - { - "epoch": 1.01, - "learning_rate": 1.5435726482985338e-06, - "loss": 0.7124, - "step": 39511 - }, - { - "epoch": 1.01, - "learning_rate": 1.5435494225594744e-06, - "loss": 0.2881, - "step": 39512 - }, - { - "epoch": 1.01, - "learning_rate": 1.5435261964042442e-06, - "loss": 0.5088, - "step": 39513 - }, - { - "epoch": 1.01, - "learning_rate": 1.5435029698328612e-06, - "loss": 0.5981, - "step": 39514 - }, - { - "epoch": 1.01, - "learning_rate": 1.543479742845343e-06, - "loss": 0.5273, - "step": 39515 - }, - { - "epoch": 1.01, - "learning_rate": 1.543456515441707e-06, - "loss": 0.6279, - "step": 39516 - }, - { - "epoch": 1.01, - "learning_rate": 1.5434332876219713e-06, - "loss": 0.6772, - "step": 39517 - }, - { - "epoch": 1.01, - "learning_rate": 1.543410059386154e-06, - "loss": 0.7314, - "step": 39518 - }, - { - "epoch": 1.01, - "learning_rate": 1.5433868307342723e-06, - "loss": 0.6797, - "step": 39519 - }, - { - "epoch": 1.01, - "learning_rate": 1.5433636016663444e-06, - "loss": 0.6621, - "step": 39520 - }, - { - "epoch": 1.01, - "learning_rate": 1.543340372182388e-06, - "loss": 0.5708, - "step": 39521 - }, - { - "epoch": 1.01, - "learning_rate": 1.5433171422824212e-06, - "loss": 0.6982, - "step": 39522 - }, - { - "epoch": 1.01, - "learning_rate": 1.5432939119664611e-06, - "loss": 0.748, - "step": 39523 - }, - { - "epoch": 1.01, - "learning_rate": 1.5432706812345262e-06, - "loss": 0.7104, - "step": 39524 - }, - { - "epoch": 1.01, - "learning_rate": 1.5432474500866335e-06, - "loss": 0.6348, - "step": 39525 - }, - { - "epoch": 1.01, - "learning_rate": 1.5432242185228013e-06, - "loss": 0.835, - "step": 39526 - }, - { - "epoch": 1.01, - "learning_rate": 1.5432009865430473e-06, - "loss": 0.4668, - "step": 39527 - }, - { - "epoch": 1.01, - "learning_rate": 1.5431777541473893e-06, - "loss": 0.6484, - "step": 39528 - }, - { - "epoch": 1.01, - "learning_rate": 1.543154521335845e-06, - "loss": 0.5493, - "step": 39529 - }, - { - "epoch": 1.01, - "learning_rate": 1.5431312881084324e-06, - "loss": 0.4585, - "step": 39530 - }, - { - "epoch": 1.01, - "learning_rate": 1.543108054465169e-06, - "loss": 0.5552, - "step": 39531 - }, - { - "epoch": 1.01, - "learning_rate": 1.5430848204060728e-06, - "loss": 0.6245, - "step": 39532 - }, - { - "epoch": 1.01, - "learning_rate": 1.5430615859311617e-06, - "loss": 0.6475, - "step": 39533 - }, - { - "epoch": 1.01, - "learning_rate": 1.5430383510404532e-06, - "loss": 0.6284, - "step": 39534 - }, - { - "epoch": 1.01, - "learning_rate": 1.543015115733965e-06, - "loss": 0.7686, - "step": 39535 - }, - { - "epoch": 1.01, - "learning_rate": 1.5429918800117152e-06, - "loss": 0.6445, - "step": 39536 - }, - { - "epoch": 1.01, - "learning_rate": 1.5429686438737214e-06, - "loss": 0.7578, - "step": 39537 - }, - { - "epoch": 1.01, - "learning_rate": 1.5429454073200018e-06, - "loss": 0.5591, - "step": 39538 - }, - { - "epoch": 1.01, - "learning_rate": 1.5429221703505736e-06, - "loss": 0.709, - "step": 39539 - }, - { - "epoch": 1.01, - "learning_rate": 1.5428989329654552e-06, - "loss": 0.3962, - "step": 39540 - }, - { - "epoch": 1.01, - "learning_rate": 1.5428756951646635e-06, - "loss": 0.5698, - "step": 39541 - }, - { - "epoch": 1.01, - "learning_rate": 1.5428524569482174e-06, - "loss": 0.7568, - "step": 39542 - }, - { - "epoch": 1.01, - "learning_rate": 1.5428292183161338e-06, - "loss": 0.5134, - "step": 39543 - }, - { - "epoch": 1.01, - "learning_rate": 1.5428059792684307e-06, - "loss": 0.6553, - "step": 39544 - }, - { - "epoch": 1.01, - "learning_rate": 1.5427827398051262e-06, - "loss": 0.6494, - "step": 39545 - }, - { - "epoch": 1.01, - "learning_rate": 1.542759499926238e-06, - "loss": 0.4629, - "step": 39546 - }, - { - "epoch": 1.01, - "learning_rate": 1.5427362596317837e-06, - "loss": 0.6479, - "step": 39547 - }, - { - "epoch": 1.01, - "learning_rate": 1.5427130189217813e-06, - "loss": 0.6914, - "step": 39548 - }, - { - "epoch": 1.01, - "learning_rate": 1.5426897777962484e-06, - "loss": 0.6309, - "step": 39549 - }, - { - "epoch": 1.01, - "learning_rate": 1.542666536255203e-06, - "loss": 0.707, - "step": 39550 - }, - { - "epoch": 1.01, - "learning_rate": 1.5426432942986627e-06, - "loss": 0.3663, - "step": 39551 - }, - { - "epoch": 1.01, - "learning_rate": 1.5426200519266452e-06, - "loss": 0.5469, - "step": 39552 - }, - { - "epoch": 1.01, - "learning_rate": 1.542596809139169e-06, - "loss": 0.7959, - "step": 39553 - }, - { - "epoch": 1.01, - "learning_rate": 1.542573565936251e-06, - "loss": 0.6104, - "step": 39554 - }, - { - "epoch": 1.01, - "learning_rate": 1.5425503223179093e-06, - "loss": 0.5142, - "step": 39555 - }, - { - "epoch": 1.01, - "learning_rate": 1.542527078284162e-06, - "loss": 0.7065, - "step": 39556 - }, - { - "epoch": 1.01, - "learning_rate": 1.5425038338350263e-06, - "loss": 0.4905, - "step": 39557 - }, - { - "epoch": 1.01, - "learning_rate": 1.5424805889705206e-06, - "loss": 0.6855, - "step": 39558 - }, - { - "epoch": 1.01, - "learning_rate": 1.5424573436906624e-06, - "loss": 0.6602, - "step": 39559 - }, - { - "epoch": 1.01, - "learning_rate": 1.5424340979954697e-06, - "loss": 0.5728, - "step": 39560 - }, - { - "epoch": 1.01, - "learning_rate": 1.54241085188496e-06, - "loss": 0.6377, - "step": 39561 - }, - { - "epoch": 1.01, - "learning_rate": 1.5423876053591514e-06, - "loss": 0.6758, - "step": 39562 - }, - { - "epoch": 1.01, - "learning_rate": 1.5423643584180615e-06, - "loss": 0.6123, - "step": 39563 - }, - { - "epoch": 1.01, - "learning_rate": 1.5423411110617082e-06, - "loss": 0.7617, - "step": 39564 - }, - { - "epoch": 1.01, - "learning_rate": 1.5423178632901087e-06, - "loss": 0.7148, - "step": 39565 - }, - { - "epoch": 1.01, - "learning_rate": 1.542294615103282e-06, - "loss": 0.9102, - "step": 39566 - }, - { - "epoch": 1.01, - "learning_rate": 1.542271366501245e-06, - "loss": 0.6611, - "step": 39567 - }, - { - "epoch": 1.01, - "learning_rate": 1.542248117484016e-06, - "loss": 0.6592, - "step": 39568 - }, - { - "epoch": 1.01, - "learning_rate": 1.5422248680516123e-06, - "loss": 0.5201, - "step": 39569 - }, - { - "epoch": 1.01, - "learning_rate": 1.5422016182040521e-06, - "loss": 0.7017, - "step": 39570 - }, - { - "epoch": 1.01, - "learning_rate": 1.5421783679413526e-06, - "loss": 0.7246, - "step": 39571 - }, - { - "epoch": 1.01, - "learning_rate": 1.5421551172635327e-06, - "loss": 0.6123, - "step": 39572 - }, - { - "epoch": 1.01, - "learning_rate": 1.5421318661706094e-06, - "loss": 0.5952, - "step": 39573 - }, - { - "epoch": 1.01, - "learning_rate": 1.5421086146626006e-06, - "loss": 0.8311, - "step": 39574 - }, - { - "epoch": 1.01, - "learning_rate": 1.5420853627395238e-06, - "loss": 0.7393, - "step": 39575 - }, - { - "epoch": 1.01, - "learning_rate": 1.5420621104013973e-06, - "loss": 0.5383, - "step": 39576 - }, - { - "epoch": 1.01, - "learning_rate": 1.542038857648239e-06, - "loss": 0.6729, - "step": 39577 - }, - { - "epoch": 1.01, - "learning_rate": 1.5420156044800666e-06, - "loss": 0.6021, - "step": 39578 - }, - { - "epoch": 1.01, - "learning_rate": 1.5419923508968976e-06, - "loss": 0.657, - "step": 39579 - }, - { - "epoch": 1.01, - "learning_rate": 1.5419690968987497e-06, - "loss": 0.8125, - "step": 39580 - }, - { - "epoch": 1.01, - "learning_rate": 1.5419458424856413e-06, - "loss": 0.6108, - "step": 39581 - }, - { - "epoch": 1.01, - "learning_rate": 1.5419225876575897e-06, - "loss": 0.4861, - "step": 39582 - }, - { - "epoch": 1.01, - "learning_rate": 1.541899332414613e-06, - "loss": 0.6226, - "step": 39583 - }, - { - "epoch": 1.01, - "learning_rate": 1.5418760767567291e-06, - "loss": 0.5786, - "step": 39584 - }, - { - "epoch": 1.01, - "learning_rate": 1.5418528206839554e-06, - "loss": 0.7139, - "step": 39585 - }, - { - "epoch": 1.01, - "learning_rate": 1.5418295641963097e-06, - "loss": 0.6182, - "step": 39586 - }, - { - "epoch": 1.01, - "learning_rate": 1.5418063072938104e-06, - "loss": 0.8721, - "step": 39587 - }, - { - "epoch": 1.01, - "learning_rate": 1.5417830499764749e-06, - "loss": 0.5786, - "step": 39588 - }, - { - "epoch": 1.01, - "learning_rate": 1.5417597922443206e-06, - "loss": 0.561, - "step": 39589 - }, - { - "epoch": 1.01, - "learning_rate": 1.541736534097366e-06, - "loss": 0.4556, - "step": 39590 - }, - { - "epoch": 1.01, - "learning_rate": 1.5417132755356287e-06, - "loss": 0.5474, - "step": 39591 - }, - { - "epoch": 1.01, - "learning_rate": 1.5416900165591264e-06, - "loss": 0.6992, - "step": 39592 - }, - { - "epoch": 1.01, - "learning_rate": 1.541666757167877e-06, - "loss": 0.6973, - "step": 39593 - }, - { - "epoch": 1.01, - "learning_rate": 1.5416434973618983e-06, - "loss": 0.7231, - "step": 39594 - }, - { - "epoch": 1.01, - "learning_rate": 1.5416202371412078e-06, - "loss": 0.667, - "step": 39595 - }, - { - "epoch": 1.01, - "learning_rate": 1.541596976505824e-06, - "loss": 0.6196, - "step": 39596 - }, - { - "epoch": 1.01, - "learning_rate": 1.541573715455764e-06, - "loss": 0.5181, - "step": 39597 - }, - { - "epoch": 1.01, - "learning_rate": 1.5415504539910465e-06, - "loss": 0.5696, - "step": 39598 - }, - { - "epoch": 1.01, - "learning_rate": 1.5415271921116882e-06, - "loss": 0.6533, - "step": 39599 - }, - { - "epoch": 1.01, - "learning_rate": 1.5415039298177073e-06, - "loss": 0.6963, - "step": 39600 - }, - { - "epoch": 1.01, - "learning_rate": 1.5414806671091218e-06, - "loss": 0.7129, - "step": 39601 - }, - { - "epoch": 1.02, - "learning_rate": 1.5414574039859497e-06, - "loss": 0.6797, - "step": 39602 - }, - { - "epoch": 1.02, - "learning_rate": 1.5414341404482083e-06, - "loss": 0.6892, - "step": 39603 - }, - { - "epoch": 1.02, - "learning_rate": 1.5414108764959158e-06, - "loss": 0.3457, - "step": 39604 - }, - { - "epoch": 1.02, - "learning_rate": 1.5413876121290899e-06, - "loss": 0.6206, - "step": 39605 - }, - { - "epoch": 1.02, - "learning_rate": 1.5413643473477484e-06, - "loss": 0.7773, - "step": 39606 - }, - { - "epoch": 1.02, - "learning_rate": 1.5413410821519091e-06, - "loss": 0.6655, - "step": 39607 - }, - { - "epoch": 1.02, - "learning_rate": 1.54131781654159e-06, - "loss": 0.7295, - "step": 39608 - }, - { - "epoch": 1.02, - "learning_rate": 1.5412945505168084e-06, - "loss": 0.793, - "step": 39609 - }, - { - "epoch": 1.02, - "learning_rate": 1.5412712840775825e-06, - "loss": 0.6299, - "step": 39610 - }, - { - "epoch": 1.02, - "learning_rate": 1.54124801722393e-06, - "loss": 0.7197, - "step": 39611 - }, - { - "epoch": 1.02, - "learning_rate": 1.5412247499558691e-06, - "loss": 0.7334, - "step": 39612 - }, - { - "epoch": 1.02, - "learning_rate": 1.5412014822734174e-06, - "loss": 0.5918, - "step": 39613 - }, - { - "epoch": 1.02, - "learning_rate": 1.5411782141765923e-06, - "loss": 0.5825, - "step": 39614 - }, - { - "epoch": 1.02, - "learning_rate": 1.5411549456654118e-06, - "loss": 0.7209, - "step": 39615 - }, - { - "epoch": 1.02, - "learning_rate": 1.5411316767398944e-06, - "loss": 0.5947, - "step": 39616 - }, - { - "epoch": 1.02, - "learning_rate": 1.5411084074000567e-06, - "loss": 0.7441, - "step": 39617 - }, - { - "epoch": 1.02, - "learning_rate": 1.5410851376459176e-06, - "loss": 0.5308, - "step": 39618 - }, - { - "epoch": 1.02, - "learning_rate": 1.5410618674774943e-06, - "loss": 0.6836, - "step": 39619 - }, - { - "epoch": 1.02, - "learning_rate": 1.541038596894805e-06, - "loss": 0.7568, - "step": 39620 - }, - { - "epoch": 1.02, - "learning_rate": 1.5410153258978672e-06, - "loss": 0.4019, - "step": 39621 - }, - { - "epoch": 1.02, - "learning_rate": 1.5409920544866987e-06, - "loss": 0.8086, - "step": 39622 - }, - { - "epoch": 1.02, - "learning_rate": 1.5409687826613178e-06, - "loss": 0.7026, - "step": 39623 - }, - { - "epoch": 1.02, - "learning_rate": 1.5409455104217416e-06, - "loss": 0.6052, - "step": 39624 - }, - { - "epoch": 1.02, - "learning_rate": 1.5409222377679885e-06, - "loss": 0.7563, - "step": 39625 - }, - { - "epoch": 1.02, - "learning_rate": 1.5408989647000761e-06, - "loss": 0.686, - "step": 39626 - }, - { - "epoch": 1.02, - "learning_rate": 1.540875691218022e-06, - "loss": 0.6011, - "step": 39627 - }, - { - "epoch": 1.02, - "learning_rate": 1.5408524173218446e-06, - "loss": 0.6538, - "step": 39628 - }, - { - "epoch": 1.02, - "learning_rate": 1.5408291430115612e-06, - "loss": 0.6436, - "step": 39629 - }, - { - "epoch": 1.02, - "learning_rate": 1.5408058682871897e-06, - "loss": 0.6772, - "step": 39630 - }, - { - "epoch": 1.02, - "learning_rate": 1.540782593148748e-06, - "loss": 0.752, - "step": 39631 - }, - { - "epoch": 1.02, - "learning_rate": 1.5407593175962543e-06, - "loss": 0.6709, - "step": 39632 - }, - { - "epoch": 1.02, - "learning_rate": 1.540736041629726e-06, - "loss": 0.5391, - "step": 39633 - }, - { - "epoch": 1.02, - "learning_rate": 1.5407127652491807e-06, - "loss": 0.2876, - "step": 39634 - }, - { - "epoch": 1.02, - "learning_rate": 1.5406894884546366e-06, - "loss": 0.5664, - "step": 39635 - }, - { - "epoch": 1.02, - "learning_rate": 1.5406662112461114e-06, - "loss": 0.5874, - "step": 39636 - }, - { - "epoch": 1.02, - "learning_rate": 1.5406429336236228e-06, - "loss": 0.6865, - "step": 39637 - }, - { - "epoch": 1.02, - "learning_rate": 1.5406196555871892e-06, - "loss": 0.6963, - "step": 39638 - }, - { - "epoch": 1.02, - "learning_rate": 1.5405963771368278e-06, - "loss": 0.71, - "step": 39639 - }, - { - "epoch": 1.02, - "learning_rate": 1.5405730982725565e-06, - "loss": 0.5669, - "step": 39640 - }, - { - "epoch": 1.02, - "learning_rate": 1.5405498189943932e-06, - "loss": 0.478, - "step": 39641 - }, - { - "epoch": 1.02, - "learning_rate": 1.5405265393023558e-06, - "loss": 0.573, - "step": 39642 - }, - { - "epoch": 1.02, - "learning_rate": 1.5405032591964623e-06, - "loss": 0.7383, - "step": 39643 - }, - { - "epoch": 1.02, - "learning_rate": 1.5404799786767299e-06, - "loss": 0.6973, - "step": 39644 - }, - { - "epoch": 1.02, - "learning_rate": 1.5404566977431772e-06, - "loss": 0.7148, - "step": 39645 - }, - { - "epoch": 1.02, - "learning_rate": 1.5404334163958214e-06, - "loss": 0.7012, - "step": 39646 - }, - { - "epoch": 1.02, - "learning_rate": 1.5404101346346808e-06, - "loss": 0.7498, - "step": 39647 - }, - { - "epoch": 1.02, - "learning_rate": 1.5403868524597727e-06, - "loss": 0.4644, - "step": 39648 - }, - { - "epoch": 1.02, - "learning_rate": 1.5403635698711156e-06, - "loss": 0.6348, - "step": 39649 - }, - { - "epoch": 1.02, - "learning_rate": 1.5403402868687266e-06, - "loss": 0.6982, - "step": 39650 - }, - { - "epoch": 1.02, - "learning_rate": 1.5403170034526242e-06, - "loss": 0.624, - "step": 39651 - }, - { - "epoch": 1.02, - "learning_rate": 1.5402937196228255e-06, - "loss": 0.6357, - "step": 39652 - }, - { - "epoch": 1.02, - "learning_rate": 1.5402704353793493e-06, - "loss": 0.6406, - "step": 39653 - }, - { - "epoch": 1.02, - "learning_rate": 1.5402471507222125e-06, - "loss": 0.6235, - "step": 39654 - }, - { - "epoch": 1.02, - "learning_rate": 1.5402238656514337e-06, - "loss": 0.512, - "step": 39655 - }, - { - "epoch": 1.02, - "learning_rate": 1.54020058016703e-06, - "loss": 0.4663, - "step": 39656 - }, - { - "epoch": 1.02, - "learning_rate": 1.5401772942690195e-06, - "loss": 0.688, - "step": 39657 - }, - { - "epoch": 1.02, - "learning_rate": 1.5401540079574202e-06, - "loss": 0.4658, - "step": 39658 - }, - { - "epoch": 1.02, - "learning_rate": 1.54013072123225e-06, - "loss": 0.7373, - "step": 39659 - }, - { - "epoch": 1.02, - "learning_rate": 1.540107434093526e-06, - "loss": 0.9561, - "step": 39660 - }, - { - "epoch": 1.02, - "learning_rate": 1.540084146541267e-06, - "loss": 0.6328, - "step": 39661 - }, - { - "epoch": 1.02, - "learning_rate": 1.5400608585754903e-06, - "loss": 0.6094, - "step": 39662 - }, - { - "epoch": 1.02, - "learning_rate": 1.5400375701962137e-06, - "loss": 0.7441, - "step": 39663 - }, - { - "epoch": 1.02, - "learning_rate": 1.5400142814034555e-06, - "loss": 0.4259, - "step": 39664 - }, - { - "epoch": 1.02, - "learning_rate": 1.5399909921972327e-06, - "loss": 0.5227, - "step": 39665 - }, - { - "epoch": 1.02, - "learning_rate": 1.5399677025775638e-06, - "loss": 0.5308, - "step": 39666 - }, - { - "epoch": 1.02, - "learning_rate": 1.5399444125444667e-06, - "loss": 0.6973, - "step": 39667 - }, - { - "epoch": 1.02, - "learning_rate": 1.5399211220979592e-06, - "loss": 0.7041, - "step": 39668 - }, - { - "epoch": 1.02, - "learning_rate": 1.5398978312380583e-06, - "loss": 0.6187, - "step": 39669 - }, - { - "epoch": 1.02, - "learning_rate": 1.5398745399647827e-06, - "loss": 0.5796, - "step": 39670 - }, - { - "epoch": 1.02, - "learning_rate": 1.53985124827815e-06, - "loss": 0.6128, - "step": 39671 - }, - { - "epoch": 1.02, - "learning_rate": 1.539827956178178e-06, - "loss": 0.7939, - "step": 39672 - }, - { - "epoch": 1.02, - "learning_rate": 1.539804663664885e-06, - "loss": 0.6338, - "step": 39673 - }, - { - "epoch": 1.02, - "learning_rate": 1.5397813707382881e-06, - "loss": 0.6572, - "step": 39674 - }, - { - "epoch": 1.02, - "learning_rate": 1.5397580773984048e-06, - "loss": 0.5439, - "step": 39675 - }, - { - "epoch": 1.02, - "learning_rate": 1.5397347836452546e-06, - "loss": 0.6611, - "step": 39676 - }, - { - "epoch": 1.02, - "learning_rate": 1.5397114894788535e-06, - "loss": 0.5444, - "step": 39677 - }, - { - "epoch": 1.02, - "learning_rate": 1.5396881948992206e-06, - "loss": 0.5586, - "step": 39678 - }, - { - "epoch": 1.02, - "learning_rate": 1.539664899906373e-06, - "loss": 0.8662, - "step": 39679 - }, - { - "epoch": 1.02, - "learning_rate": 1.5396416045003288e-06, - "loss": 0.8799, - "step": 39680 - }, - { - "epoch": 1.02, - "learning_rate": 1.539618308681106e-06, - "loss": 0.7588, - "step": 39681 - }, - { - "epoch": 1.02, - "learning_rate": 1.5395950124487222e-06, - "loss": 0.6182, - "step": 39682 - }, - { - "epoch": 1.02, - "learning_rate": 1.5395717158031954e-06, - "loss": 0.667, - "step": 39683 - }, - { - "epoch": 1.02, - "learning_rate": 1.539548418744543e-06, - "loss": 0.6641, - "step": 39684 - }, - { - "epoch": 1.02, - "learning_rate": 1.5395251212727836e-06, - "loss": 0.9258, - "step": 39685 - }, - { - "epoch": 1.02, - "learning_rate": 1.5395018233879345e-06, - "loss": 0.6572, - "step": 39686 - }, - { - "epoch": 1.02, - "learning_rate": 1.5394785250900135e-06, - "loss": 0.3918, - "step": 39687 - }, - { - "epoch": 1.02, - "learning_rate": 1.5394552263790388e-06, - "loss": 0.8779, - "step": 39688 - }, - { - "epoch": 1.02, - "learning_rate": 1.5394319272550278e-06, - "loss": 0.8486, - "step": 39689 - }, - { - "epoch": 1.02, - "learning_rate": 1.5394086277179988e-06, - "loss": 0.4287, - "step": 39690 - }, - { - "epoch": 1.02, - "learning_rate": 1.5393853277679693e-06, - "loss": 0.7275, - "step": 39691 - }, - { - "epoch": 1.02, - "learning_rate": 1.539362027404957e-06, - "loss": 0.5767, - "step": 39692 - }, - { - "epoch": 1.02, - "learning_rate": 1.5393387266289807e-06, - "loss": 0.9229, - "step": 39693 - }, - { - "epoch": 1.02, - "learning_rate": 1.539315425440057e-06, - "loss": 0.752, - "step": 39694 - }, - { - "epoch": 1.02, - "learning_rate": 1.5392921238382047e-06, - "loss": 0.5923, - "step": 39695 - }, - { - "epoch": 1.02, - "learning_rate": 1.5392688218234406e-06, - "loss": 0.5244, - "step": 39696 - }, - { - "epoch": 1.02, - "learning_rate": 1.5392455193957834e-06, - "loss": 0.5537, - "step": 39697 - }, - { - "epoch": 1.02, - "learning_rate": 1.539222216555251e-06, - "loss": 0.6494, - "step": 39698 - }, - { - "epoch": 1.02, - "learning_rate": 1.5391989133018607e-06, - "loss": 0.7246, - "step": 39699 - }, - { - "epoch": 1.02, - "learning_rate": 1.5391756096356306e-06, - "loss": 0.7119, - "step": 39700 - }, - { - "epoch": 1.02, - "learning_rate": 1.5391523055565787e-06, - "loss": 0.6611, - "step": 39701 - }, - { - "epoch": 1.02, - "learning_rate": 1.5391290010647223e-06, - "loss": 0.7432, - "step": 39702 - }, - { - "epoch": 1.02, - "learning_rate": 1.5391056961600798e-06, - "loss": 0.646, - "step": 39703 - }, - { - "epoch": 1.02, - "learning_rate": 1.539082390842669e-06, - "loss": 0.6313, - "step": 39704 - }, - { - "epoch": 1.02, - "learning_rate": 1.5390590851125075e-06, - "loss": 0.6084, - "step": 39705 - }, - { - "epoch": 1.02, - "learning_rate": 1.5390357789696132e-06, - "loss": 0.7988, - "step": 39706 - }, - { - "epoch": 1.02, - "learning_rate": 1.5390124724140038e-06, - "loss": 0.6045, - "step": 39707 - }, - { - "epoch": 1.02, - "learning_rate": 1.538989165445698e-06, - "loss": 0.6919, - "step": 39708 - }, - { - "epoch": 1.02, - "learning_rate": 1.5389658580647123e-06, - "loss": 0.667, - "step": 39709 - }, - { - "epoch": 1.02, - "learning_rate": 1.5389425502710656e-06, - "loss": 0.4604, - "step": 39710 - }, - { - "epoch": 1.02, - "learning_rate": 1.538919242064775e-06, - "loss": 0.7236, - "step": 39711 - }, - { - "epoch": 1.02, - "learning_rate": 1.5388959334458588e-06, - "loss": 0.6602, - "step": 39712 - }, - { - "epoch": 1.02, - "learning_rate": 1.5388726244143353e-06, - "loss": 0.7939, - "step": 39713 - }, - { - "epoch": 1.02, - "learning_rate": 1.5388493149702213e-06, - "loss": 0.6421, - "step": 39714 - }, - { - "epoch": 1.02, - "learning_rate": 1.538826005113535e-06, - "loss": 0.6479, - "step": 39715 - }, - { - "epoch": 1.02, - "learning_rate": 1.538802694844295e-06, - "loss": 0.6465, - "step": 39716 - }, - { - "epoch": 1.02, - "learning_rate": 1.538779384162518e-06, - "loss": 0.6484, - "step": 39717 - }, - { - "epoch": 1.02, - "learning_rate": 1.5387560730682228e-06, - "loss": 0.6758, - "step": 39718 - }, - { - "epoch": 1.02, - "learning_rate": 1.5387327615614267e-06, - "loss": 0.4387, - "step": 39719 - }, - { - "epoch": 1.02, - "learning_rate": 1.5387094496421478e-06, - "loss": 0.666, - "step": 39720 - }, - { - "epoch": 1.02, - "learning_rate": 1.5386861373104035e-06, - "loss": 0.6787, - "step": 39721 - }, - { - "epoch": 1.02, - "learning_rate": 1.5386628245662121e-06, - "loss": 0.6953, - "step": 39722 - }, - { - "epoch": 1.02, - "learning_rate": 1.5386395114095917e-06, - "loss": 0.6475, - "step": 39723 - }, - { - "epoch": 1.02, - "learning_rate": 1.5386161978405597e-06, - "loss": 0.5549, - "step": 39724 - }, - { - "epoch": 1.02, - "learning_rate": 1.5385928838591338e-06, - "loss": 0.5291, - "step": 39725 - }, - { - "epoch": 1.02, - "learning_rate": 1.538569569465332e-06, - "loss": 0.5413, - "step": 39726 - }, - { - "epoch": 1.02, - "learning_rate": 1.5385462546591725e-06, - "loss": 0.6494, - "step": 39727 - }, - { - "epoch": 1.02, - "learning_rate": 1.5385229394406728e-06, - "loss": 0.5918, - "step": 39728 - }, - { - "epoch": 1.02, - "learning_rate": 1.538499623809851e-06, - "loss": 0.6096, - "step": 39729 - }, - { - "epoch": 1.02, - "learning_rate": 1.5384763077667244e-06, - "loss": 0.5962, - "step": 39730 - }, - { - "epoch": 1.02, - "learning_rate": 1.5384529913113115e-06, - "loss": 0.7227, - "step": 39731 - }, - { - "epoch": 1.02, - "learning_rate": 1.53842967444363e-06, - "loss": 0.5532, - "step": 39732 - }, - { - "epoch": 1.02, - "learning_rate": 1.5384063571636978e-06, - "loss": 0.8193, - "step": 39733 - }, - { - "epoch": 1.02, - "learning_rate": 1.5383830394715322e-06, - "loss": 0.627, - "step": 39734 - }, - { - "epoch": 1.02, - "learning_rate": 1.5383597213671518e-06, - "loss": 0.6807, - "step": 39735 - }, - { - "epoch": 1.02, - "learning_rate": 1.5383364028505738e-06, - "loss": 0.6279, - "step": 39736 - }, - { - "epoch": 1.02, - "learning_rate": 1.5383130839218167e-06, - "loss": 0.7295, - "step": 39737 - }, - { - "epoch": 1.02, - "learning_rate": 1.5382897645808978e-06, - "loss": 0.7871, - "step": 39738 - }, - { - "epoch": 1.02, - "learning_rate": 1.5382664448278354e-06, - "loss": 0.6826, - "step": 39739 - }, - { - "epoch": 1.02, - "learning_rate": 1.5382431246626469e-06, - "loss": 0.7676, - "step": 39740 - }, - { - "epoch": 1.02, - "learning_rate": 1.5382198040853504e-06, - "loss": 0.5527, - "step": 39741 - }, - { - "epoch": 1.02, - "learning_rate": 1.5381964830959637e-06, - "loss": 0.6162, - "step": 39742 - }, - { - "epoch": 1.02, - "learning_rate": 1.538173161694505e-06, - "loss": 0.5879, - "step": 39743 - }, - { - "epoch": 1.02, - "learning_rate": 1.5381498398809915e-06, - "loss": 0.7925, - "step": 39744 - }, - { - "epoch": 1.02, - "learning_rate": 1.5381265176554416e-06, - "loss": 0.749, - "step": 39745 - }, - { - "epoch": 1.02, - "learning_rate": 1.5381031950178728e-06, - "loss": 0.624, - "step": 39746 - }, - { - "epoch": 1.02, - "learning_rate": 1.5380798719683034e-06, - "loss": 0.4929, - "step": 39747 - }, - { - "epoch": 1.02, - "learning_rate": 1.538056548506751e-06, - "loss": 0.7021, - "step": 39748 - }, - { - "epoch": 1.02, - "learning_rate": 1.5380332246332333e-06, - "loss": 0.6641, - "step": 39749 - }, - { - "epoch": 1.02, - "learning_rate": 1.5380099003477683e-06, - "loss": 0.707, - "step": 39750 - }, - { - "epoch": 1.02, - "learning_rate": 1.5379865756503737e-06, - "loss": 0.4799, - "step": 39751 - }, - { - "epoch": 1.02, - "learning_rate": 1.5379632505410677e-06, - "loss": 0.7026, - "step": 39752 - }, - { - "epoch": 1.02, - "learning_rate": 1.537939925019868e-06, - "loss": 0.613, - "step": 39753 - }, - { - "epoch": 1.02, - "learning_rate": 1.5379165990867924e-06, - "loss": 0.7354, - "step": 39754 - }, - { - "epoch": 1.02, - "learning_rate": 1.5378932727418589e-06, - "loss": 0.6504, - "step": 39755 - }, - { - "epoch": 1.02, - "learning_rate": 1.537869945985085e-06, - "loss": 0.8359, - "step": 39756 - }, - { - "epoch": 1.02, - "learning_rate": 1.537846618816489e-06, - "loss": 0.5002, - "step": 39757 - }, - { - "epoch": 1.02, - "learning_rate": 1.5378232912360884e-06, - "loss": 0.5215, - "step": 39758 - }, - { - "epoch": 1.02, - "learning_rate": 1.5377999632439013e-06, - "loss": 0.6191, - "step": 39759 - }, - { - "epoch": 1.02, - "learning_rate": 1.5377766348399457e-06, - "loss": 0.6177, - "step": 39760 - }, - { - "epoch": 1.02, - "learning_rate": 1.5377533060242388e-06, - "loss": 0.6001, - "step": 39761 - }, - { - "epoch": 1.02, - "learning_rate": 1.5377299767967995e-06, - "loss": 0.6094, - "step": 39762 - }, - { - "epoch": 1.02, - "learning_rate": 1.5377066471576447e-06, - "loss": 0.7329, - "step": 39763 - }, - { - "epoch": 1.02, - "learning_rate": 1.537683317106793e-06, - "loss": 0.8447, - "step": 39764 - }, - { - "epoch": 1.02, - "learning_rate": 1.5376599866442615e-06, - "loss": 0.6221, - "step": 39765 - }, - { - "epoch": 1.02, - "learning_rate": 1.5376366557700686e-06, - "loss": 0.6714, - "step": 39766 - }, - { - "epoch": 1.02, - "learning_rate": 1.5376133244842322e-06, - "loss": 0.6235, - "step": 39767 - }, - { - "epoch": 1.02, - "learning_rate": 1.53758999278677e-06, - "loss": 0.5508, - "step": 39768 - }, - { - "epoch": 1.02, - "learning_rate": 1.5375666606776995e-06, - "loss": 0.7393, - "step": 39769 - }, - { - "epoch": 1.02, - "learning_rate": 1.5375433281570392e-06, - "loss": 0.7363, - "step": 39770 - }, - { - "epoch": 1.02, - "learning_rate": 1.5375199952248067e-06, - "loss": 0.6006, - "step": 39771 - }, - { - "epoch": 1.02, - "learning_rate": 1.5374966618810197e-06, - "loss": 0.7109, - "step": 39772 - }, - { - "epoch": 1.02, - "learning_rate": 1.5374733281256964e-06, - "loss": 0.5229, - "step": 39773 - }, - { - "epoch": 1.02, - "learning_rate": 1.5374499939588543e-06, - "loss": 0.5679, - "step": 39774 - }, - { - "epoch": 1.02, - "learning_rate": 1.5374266593805115e-06, - "loss": 0.7305, - "step": 39775 - }, - { - "epoch": 1.02, - "learning_rate": 1.5374033243906862e-06, - "loss": 0.7139, - "step": 39776 - }, - { - "epoch": 1.02, - "learning_rate": 1.5373799889893954e-06, - "loss": 0.666, - "step": 39777 - }, - { - "epoch": 1.02, - "learning_rate": 1.5373566531766575e-06, - "loss": 0.6182, - "step": 39778 - }, - { - "epoch": 1.02, - "learning_rate": 1.5373333169524905e-06, - "loss": 0.5557, - "step": 39779 - }, - { - "epoch": 1.02, - "learning_rate": 1.5373099803169122e-06, - "loss": 0.6694, - "step": 39780 - }, - { - "epoch": 1.02, - "learning_rate": 1.5372866432699399e-06, - "loss": 0.5957, - "step": 39781 - }, - { - "epoch": 1.02, - "learning_rate": 1.5372633058115923e-06, - "loss": 0.6777, - "step": 39782 - }, - { - "epoch": 1.02, - "learning_rate": 1.5372399679418868e-06, - "loss": 0.6182, - "step": 39783 - }, - { - "epoch": 1.02, - "learning_rate": 1.537216629660841e-06, - "loss": 0.6401, - "step": 39784 - }, - { - "epoch": 1.02, - "learning_rate": 1.5371932909684738e-06, - "loss": 0.7803, - "step": 39785 - }, - { - "epoch": 1.02, - "learning_rate": 1.537169951864802e-06, - "loss": 0.7949, - "step": 39786 - }, - { - "epoch": 1.02, - "learning_rate": 1.537146612349844e-06, - "loss": 0.6692, - "step": 39787 - }, - { - "epoch": 1.02, - "learning_rate": 1.5371232724236177e-06, - "loss": 0.6338, - "step": 39788 - }, - { - "epoch": 1.02, - "learning_rate": 1.5370999320861403e-06, - "loss": 0.7607, - "step": 39789 - }, - { - "epoch": 1.02, - "learning_rate": 1.5370765913374304e-06, - "loss": 0.7012, - "step": 39790 - }, - { - "epoch": 1.02, - "learning_rate": 1.537053250177506e-06, - "loss": 0.6396, - "step": 39791 - }, - { - "epoch": 1.02, - "learning_rate": 1.5370299086063842e-06, - "loss": 0.6001, - "step": 39792 - }, - { - "epoch": 1.02, - "learning_rate": 1.5370065666240835e-06, - "loss": 0.6641, - "step": 39793 - }, - { - "epoch": 1.02, - "learning_rate": 1.5369832242306212e-06, - "loss": 0.6865, - "step": 39794 - }, - { - "epoch": 1.02, - "learning_rate": 1.536959881426016e-06, - "loss": 0.7095, - "step": 39795 - }, - { - "epoch": 1.02, - "learning_rate": 1.536936538210285e-06, - "loss": 0.71, - "step": 39796 - }, - { - "epoch": 1.02, - "learning_rate": 1.5369131945834465e-06, - "loss": 0.5776, - "step": 39797 - }, - { - "epoch": 1.02, - "learning_rate": 1.5368898505455183e-06, - "loss": 0.4871, - "step": 39798 - }, - { - "epoch": 1.02, - "learning_rate": 1.5368665060965182e-06, - "loss": 0.7754, - "step": 39799 - }, - { - "epoch": 1.02, - "learning_rate": 1.5368431612364643e-06, - "loss": 0.8975, - "step": 39800 - }, - { - "epoch": 1.02, - "learning_rate": 1.5368198159653739e-06, - "loss": 0.6309, - "step": 39801 - }, - { - "epoch": 1.02, - "learning_rate": 1.5367964702832656e-06, - "loss": 0.688, - "step": 39802 - }, - { - "epoch": 1.02, - "learning_rate": 1.5367731241901567e-06, - "loss": 0.7295, - "step": 39803 - }, - { - "epoch": 1.02, - "learning_rate": 1.5367497776860654e-06, - "loss": 0.7134, - "step": 39804 - }, - { - "epoch": 1.02, - "learning_rate": 1.5367264307710092e-06, - "loss": 0.751, - "step": 39805 - }, - { - "epoch": 1.02, - "learning_rate": 1.5367030834450064e-06, - "loss": 0.8047, - "step": 39806 - }, - { - "epoch": 1.02, - "learning_rate": 1.5366797357080752e-06, - "loss": 0.5901, - "step": 39807 - }, - { - "epoch": 1.02, - "learning_rate": 1.5366563875602326e-06, - "loss": 0.5474, - "step": 39808 - }, - { - "epoch": 1.02, - "learning_rate": 1.5366330390014968e-06, - "loss": 0.6614, - "step": 39809 - }, - { - "epoch": 1.02, - "learning_rate": 1.5366096900318857e-06, - "loss": 0.5698, - "step": 39810 - }, - { - "epoch": 1.02, - "learning_rate": 1.5365863406514175e-06, - "loss": 0.7891, - "step": 39811 - }, - { - "epoch": 1.02, - "learning_rate": 1.53656299086011e-06, - "loss": 0.5918, - "step": 39812 - }, - { - "epoch": 1.02, - "learning_rate": 1.5365396406579803e-06, - "loss": 0.6934, - "step": 39813 - }, - { - "epoch": 1.02, - "learning_rate": 1.5365162900450472e-06, - "loss": 0.6748, - "step": 39814 - }, - { - "epoch": 1.02, - "learning_rate": 1.5364929390213282e-06, - "loss": 0.7158, - "step": 39815 - }, - { - "epoch": 1.02, - "learning_rate": 1.5364695875868413e-06, - "loss": 0.5964, - "step": 39816 - }, - { - "epoch": 1.02, - "learning_rate": 1.5364462357416042e-06, - "loss": 0.6802, - "step": 39817 - }, - { - "epoch": 1.02, - "learning_rate": 1.5364228834856348e-06, - "loss": 0.6289, - "step": 39818 - }, - { - "epoch": 1.02, - "learning_rate": 1.5363995308189513e-06, - "loss": 0.7148, - "step": 39819 - }, - { - "epoch": 1.02, - "learning_rate": 1.5363761777415709e-06, - "loss": 0.6284, - "step": 39820 - }, - { - "epoch": 1.02, - "learning_rate": 1.5363528242535125e-06, - "loss": 0.5759, - "step": 39821 - }, - { - "epoch": 1.02, - "learning_rate": 1.536329470354793e-06, - "loss": 0.6553, - "step": 39822 - }, - { - "epoch": 1.02, - "learning_rate": 1.536306116045431e-06, - "loss": 0.7607, - "step": 39823 - }, - { - "epoch": 1.02, - "learning_rate": 1.5362827613254439e-06, - "loss": 0.6028, - "step": 39824 - }, - { - "epoch": 1.02, - "learning_rate": 1.5362594061948495e-06, - "loss": 0.7529, - "step": 39825 - }, - { - "epoch": 1.02, - "learning_rate": 1.5362360506536662e-06, - "loss": 0.7109, - "step": 39826 - }, - { - "epoch": 1.02, - "learning_rate": 1.5362126947019117e-06, - "loss": 0.6807, - "step": 39827 - }, - { - "epoch": 1.02, - "learning_rate": 1.5361893383396035e-06, - "loss": 0.7119, - "step": 39828 - }, - { - "epoch": 1.02, - "learning_rate": 1.5361659815667603e-06, - "loss": 0.6089, - "step": 39829 - }, - { - "epoch": 1.02, - "learning_rate": 1.5361426243833991e-06, - "loss": 0.6367, - "step": 39830 - }, - { - "epoch": 1.02, - "learning_rate": 1.5361192667895383e-06, - "loss": 0.7227, - "step": 39831 - }, - { - "epoch": 1.02, - "learning_rate": 1.5360959087851955e-06, - "loss": 0.709, - "step": 39832 - }, - { - "epoch": 1.02, - "learning_rate": 1.5360725503703886e-06, - "loss": 0.5898, - "step": 39833 - }, - { - "epoch": 1.02, - "learning_rate": 1.5360491915451354e-06, - "loss": 0.6582, - "step": 39834 - }, - { - "epoch": 1.02, - "learning_rate": 1.5360258323094547e-06, - "loss": 0.6504, - "step": 39835 - }, - { - "epoch": 1.02, - "learning_rate": 1.5360024726633628e-06, - "loss": 0.6865, - "step": 39836 - }, - { - "epoch": 1.02, - "learning_rate": 1.535979112606879e-06, - "loss": 0.9023, - "step": 39837 - }, - { - "epoch": 1.02, - "learning_rate": 1.5359557521400209e-06, - "loss": 0.6975, - "step": 39838 - }, - { - "epoch": 1.02, - "learning_rate": 1.5359323912628058e-06, - "loss": 0.6826, - "step": 39839 - }, - { - "epoch": 1.02, - "learning_rate": 1.5359090299752517e-06, - "loss": 0.5283, - "step": 39840 - }, - { - "epoch": 1.02, - "learning_rate": 1.535885668277377e-06, - "loss": 0.5005, - "step": 39841 - }, - { - "epoch": 1.02, - "learning_rate": 1.5358623061691991e-06, - "loss": 0.7832, - "step": 39842 - }, - { - "epoch": 1.02, - "learning_rate": 1.5358389436507361e-06, - "loss": 0.5991, - "step": 39843 - }, - { - "epoch": 1.02, - "learning_rate": 1.535815580722006e-06, - "loss": 0.7559, - "step": 39844 - }, - { - "epoch": 1.02, - "learning_rate": 1.5357922173830262e-06, - "loss": 0.8691, - "step": 39845 - }, - { - "epoch": 1.02, - "learning_rate": 1.5357688536338152e-06, - "loss": 0.7656, - "step": 39846 - }, - { - "epoch": 1.02, - "learning_rate": 1.5357454894743907e-06, - "loss": 0.7383, - "step": 39847 - }, - { - "epoch": 1.02, - "learning_rate": 1.5357221249047705e-06, - "loss": 0.7637, - "step": 39848 - }, - { - "epoch": 1.02, - "learning_rate": 1.5356987599249723e-06, - "loss": 0.6816, - "step": 39849 - }, - { - "epoch": 1.02, - "learning_rate": 1.5356753945350142e-06, - "loss": 0.834, - "step": 39850 - }, - { - "epoch": 1.02, - "learning_rate": 1.5356520287349142e-06, - "loss": 0.5518, - "step": 39851 - }, - { - "epoch": 1.02, - "learning_rate": 1.5356286625246903e-06, - "loss": 0.8203, - "step": 39852 - }, - { - "epoch": 1.02, - "learning_rate": 1.53560529590436e-06, - "loss": 0.6973, - "step": 39853 - }, - { - "epoch": 1.02, - "learning_rate": 1.5355819288739413e-06, - "loss": 0.6528, - "step": 39854 - }, - { - "epoch": 1.02, - "learning_rate": 1.5355585614334518e-06, - "loss": 0.6592, - "step": 39855 - }, - { - "epoch": 1.02, - "learning_rate": 1.53553519358291e-06, - "loss": 0.6421, - "step": 39856 - }, - { - "epoch": 1.02, - "learning_rate": 1.5355118253223341e-06, - "loss": 0.7949, - "step": 39857 - }, - { - "epoch": 1.02, - "learning_rate": 1.5354884566517408e-06, - "loss": 0.5146, - "step": 39858 - }, - { - "epoch": 1.02, - "learning_rate": 1.5354650875711486e-06, - "loss": 0.7031, - "step": 39859 - }, - { - "epoch": 1.02, - "learning_rate": 1.5354417180805754e-06, - "loss": 0.8262, - "step": 39860 - }, - { - "epoch": 1.02, - "learning_rate": 1.5354183481800394e-06, - "loss": 0.8018, - "step": 39861 - }, - { - "epoch": 1.02, - "learning_rate": 1.535394977869558e-06, - "loss": 0.7148, - "step": 39862 - }, - { - "epoch": 1.02, - "learning_rate": 1.5353716071491491e-06, - "loss": 0.6504, - "step": 39863 - }, - { - "epoch": 1.02, - "learning_rate": 1.535348236018831e-06, - "loss": 0.7983, - "step": 39864 - }, - { - "epoch": 1.02, - "learning_rate": 1.5353248644786212e-06, - "loss": 0.4907, - "step": 39865 - }, - { - "epoch": 1.02, - "learning_rate": 1.5353014925285382e-06, - "loss": 0.6396, - "step": 39866 - }, - { - "epoch": 1.02, - "learning_rate": 1.5352781201685991e-06, - "loss": 0.7568, - "step": 39867 - }, - { - "epoch": 1.02, - "learning_rate": 1.535254747398822e-06, - "loss": 0.749, - "step": 39868 - }, - { - "epoch": 1.02, - "learning_rate": 1.5352313742192253e-06, - "loss": 0.5503, - "step": 39869 - }, - { - "epoch": 1.02, - "learning_rate": 1.5352080006298263e-06, - "loss": 0.6826, - "step": 39870 - }, - { - "epoch": 1.02, - "learning_rate": 1.5351846266306434e-06, - "loss": 0.7217, - "step": 39871 - }, - { - "epoch": 1.02, - "learning_rate": 1.5351612522216941e-06, - "loss": 0.5281, - "step": 39872 - }, - { - "epoch": 1.02, - "learning_rate": 1.5351378774029967e-06, - "loss": 0.751, - "step": 39873 - }, - { - "epoch": 1.02, - "learning_rate": 1.5351145021745682e-06, - "loss": 0.5488, - "step": 39874 - }, - { - "epoch": 1.02, - "learning_rate": 1.5350911265364278e-06, - "loss": 0.5591, - "step": 39875 - }, - { - "epoch": 1.02, - "learning_rate": 1.5350677504885924e-06, - "loss": 0.6875, - "step": 39876 - }, - { - "epoch": 1.02, - "learning_rate": 1.5350443740310803e-06, - "loss": 0.8057, - "step": 39877 - }, - { - "epoch": 1.02, - "learning_rate": 1.5350209971639093e-06, - "loss": 0.6504, - "step": 39878 - }, - { - "epoch": 1.02, - "learning_rate": 1.5349976198870972e-06, - "loss": 0.8184, - "step": 39879 - }, - { - "epoch": 1.02, - "learning_rate": 1.5349742422006622e-06, - "loss": 0.6992, - "step": 39880 - }, - { - "epoch": 1.02, - "learning_rate": 1.5349508641046219e-06, - "loss": 0.439, - "step": 39881 - }, - { - "epoch": 1.02, - "learning_rate": 1.5349274855989944e-06, - "loss": 0.5938, - "step": 39882 - }, - { - "epoch": 1.02, - "learning_rate": 1.5349041066837974e-06, - "loss": 0.6719, - "step": 39883 - }, - { - "epoch": 1.02, - "learning_rate": 1.5348807273590492e-06, - "loss": 0.6079, - "step": 39884 - }, - { - "epoch": 1.02, - "learning_rate": 1.5348573476247674e-06, - "loss": 0.9473, - "step": 39885 - }, - { - "epoch": 1.02, - "learning_rate": 1.5348339674809694e-06, - "loss": 0.7949, - "step": 39886 - }, - { - "epoch": 1.02, - "learning_rate": 1.5348105869276743e-06, - "loss": 0.792, - "step": 39887 - }, - { - "epoch": 1.02, - "learning_rate": 1.5347872059648988e-06, - "loss": 0.687, - "step": 39888 - }, - { - "epoch": 1.02, - "learning_rate": 1.5347638245926615e-06, - "loss": 0.7988, - "step": 39889 - }, - { - "epoch": 1.02, - "learning_rate": 1.5347404428109801e-06, - "loss": 0.4424, - "step": 39890 - }, - { - "epoch": 1.02, - "learning_rate": 1.5347170606198724e-06, - "loss": 0.709, - "step": 39891 - }, - { - "epoch": 1.02, - "learning_rate": 1.5346936780193569e-06, - "loss": 0.689, - "step": 39892 - }, - { - "epoch": 1.02, - "learning_rate": 1.5346702950094508e-06, - "loss": 0.7031, - "step": 39893 - }, - { - "epoch": 1.02, - "learning_rate": 1.534646911590172e-06, - "loss": 0.6973, - "step": 39894 - }, - { - "epoch": 1.02, - "learning_rate": 1.534623527761539e-06, - "loss": 0.5742, - "step": 39895 - }, - { - "epoch": 1.02, - "learning_rate": 1.5346001435235691e-06, - "loss": 0.6748, - "step": 39896 - }, - { - "epoch": 1.02, - "learning_rate": 1.5345767588762808e-06, - "loss": 0.6206, - "step": 39897 - }, - { - "epoch": 1.02, - "learning_rate": 1.5345533738196914e-06, - "loss": 0.6533, - "step": 39898 - }, - { - "epoch": 1.02, - "learning_rate": 1.5345299883538188e-06, - "loss": 0.6084, - "step": 39899 - }, - { - "epoch": 1.02, - "learning_rate": 1.5345066024786815e-06, - "loss": 0.7607, - "step": 39900 - }, - { - "epoch": 1.02, - "learning_rate": 1.5344832161942968e-06, - "loss": 0.5151, - "step": 39901 - }, - { - "epoch": 1.02, - "learning_rate": 1.5344598295006835e-06, - "loss": 0.6392, - "step": 39902 - }, - { - "epoch": 1.02, - "learning_rate": 1.5344364423978583e-06, - "loss": 0.6885, - "step": 39903 - }, - { - "epoch": 1.02, - "learning_rate": 1.53441305488584e-06, - "loss": 0.5474, - "step": 39904 - }, - { - "epoch": 1.02, - "learning_rate": 1.5343896669646459e-06, - "loss": 0.5845, - "step": 39905 - }, - { - "epoch": 1.02, - "learning_rate": 1.5343662786342944e-06, - "loss": 0.6343, - "step": 39906 - }, - { - "epoch": 1.02, - "learning_rate": 1.5343428898948032e-06, - "loss": 0.6787, - "step": 39907 - }, - { - "epoch": 1.02, - "learning_rate": 1.53431950074619e-06, - "loss": 0.7168, - "step": 39908 - }, - { - "epoch": 1.02, - "learning_rate": 1.5342961111884733e-06, - "loss": 0.7129, - "step": 39909 - }, - { - "epoch": 1.02, - "learning_rate": 1.5342727212216703e-06, - "loss": 0.7734, - "step": 39910 - }, - { - "epoch": 1.02, - "learning_rate": 1.5342493308457995e-06, - "loss": 0.6191, - "step": 39911 - }, - { - "epoch": 1.02, - "learning_rate": 1.5342259400608783e-06, - "loss": 0.6465, - "step": 39912 - }, - { - "epoch": 1.02, - "learning_rate": 1.5342025488669253e-06, - "loss": 0.5762, - "step": 39913 - }, - { - "epoch": 1.02, - "learning_rate": 1.5341791572639572e-06, - "loss": 0.6621, - "step": 39914 - }, - { - "epoch": 1.02, - "learning_rate": 1.5341557652519934e-06, - "loss": 0.5371, - "step": 39915 - }, - { - "epoch": 1.02, - "learning_rate": 1.5341323728310509e-06, - "loss": 0.7539, - "step": 39916 - }, - { - "epoch": 1.02, - "learning_rate": 1.534108980001148e-06, - "loss": 0.3804, - "step": 39917 - }, - { - "epoch": 1.02, - "learning_rate": 1.534085586762302e-06, - "loss": 0.5312, - "step": 39918 - }, - { - "epoch": 1.02, - "learning_rate": 1.5340621931145314e-06, - "loss": 0.792, - "step": 39919 - }, - { - "epoch": 1.02, - "learning_rate": 1.534038799057854e-06, - "loss": 0.5249, - "step": 39920 - }, - { - "epoch": 1.02, - "learning_rate": 1.5340154045922874e-06, - "loss": 0.6099, - "step": 39921 - }, - { - "epoch": 1.02, - "learning_rate": 1.53399200971785e-06, - "loss": 0.5615, - "step": 39922 - }, - { - "epoch": 1.02, - "learning_rate": 1.5339686144345594e-06, - "loss": 0.5557, - "step": 39923 - }, - { - "epoch": 1.02, - "learning_rate": 1.5339452187424334e-06, - "loss": 0.6331, - "step": 39924 - }, - { - "epoch": 1.02, - "learning_rate": 1.5339218226414902e-06, - "loss": 0.7031, - "step": 39925 - }, - { - "epoch": 1.02, - "learning_rate": 1.5338984261317478e-06, - "loss": 0.5605, - "step": 39926 - }, - { - "epoch": 1.02, - "learning_rate": 1.5338750292132238e-06, - "loss": 0.6157, - "step": 39927 - }, - { - "epoch": 1.02, - "learning_rate": 1.5338516318859366e-06, - "loss": 0.4756, - "step": 39928 - }, - { - "epoch": 1.02, - "learning_rate": 1.5338282341499032e-06, - "loss": 0.5137, - "step": 39929 - }, - { - "epoch": 1.02, - "learning_rate": 1.5338048360051423e-06, - "loss": 0.7598, - "step": 39930 - }, - { - "epoch": 1.02, - "learning_rate": 1.5337814374516716e-06, - "loss": 0.3391, - "step": 39931 - }, - { - "epoch": 1.02, - "learning_rate": 1.533758038489509e-06, - "loss": 0.5732, - "step": 39932 - }, - { - "epoch": 1.02, - "learning_rate": 1.533734639118672e-06, - "loss": 0.8906, - "step": 39933 - }, - { - "epoch": 1.02, - "learning_rate": 1.5337112393391796e-06, - "loss": 0.7627, - "step": 39934 - }, - { - "epoch": 1.02, - "learning_rate": 1.5336878391510487e-06, - "loss": 0.6836, - "step": 39935 - }, - { - "epoch": 1.02, - "learning_rate": 1.5336644385542977e-06, - "loss": 0.6807, - "step": 39936 - }, - { - "epoch": 1.02, - "learning_rate": 1.5336410375489442e-06, - "loss": 0.6533, - "step": 39937 - }, - { - "epoch": 1.02, - "learning_rate": 1.5336176361350063e-06, - "loss": 0.6245, - "step": 39938 - }, - { - "epoch": 1.02, - "learning_rate": 1.533594234312502e-06, - "loss": 0.7783, - "step": 39939 - }, - { - "epoch": 1.02, - "learning_rate": 1.533570832081449e-06, - "loss": 0.6924, - "step": 39940 - }, - { - "epoch": 1.02, - "learning_rate": 1.5335474294418655e-06, - "loss": 0.6482, - "step": 39941 - }, - { - "epoch": 1.02, - "learning_rate": 1.5335240263937697e-06, - "loss": 0.6465, - "step": 39942 - }, - { - "epoch": 1.02, - "learning_rate": 1.5335006229371784e-06, - "loss": 0.5586, - "step": 39943 - }, - { - "epoch": 1.02, - "learning_rate": 1.5334772190721103e-06, - "loss": 0.5581, - "step": 39944 - }, - { - "epoch": 1.02, - "learning_rate": 1.5334538147985833e-06, - "loss": 0.8262, - "step": 39945 - }, - { - "epoch": 1.02, - "learning_rate": 1.5334304101166153e-06, - "loss": 0.5095, - "step": 39946 - }, - { - "epoch": 1.02, - "learning_rate": 1.5334070050262243e-06, - "loss": 0.6821, - "step": 39947 - }, - { - "epoch": 1.02, - "learning_rate": 1.533383599527428e-06, - "loss": 0.6934, - "step": 39948 - }, - { - "epoch": 1.02, - "learning_rate": 1.5333601936202442e-06, - "loss": 0.5542, - "step": 39949 - }, - { - "epoch": 1.02, - "learning_rate": 1.5333367873046914e-06, - "loss": 0.7803, - "step": 39950 - }, - { - "epoch": 1.02, - "learning_rate": 1.5333133805807866e-06, - "loss": 0.623, - "step": 39951 - }, - { - "epoch": 1.02, - "learning_rate": 1.5332899734485488e-06, - "loss": 0.7168, - "step": 39952 - }, - { - "epoch": 1.02, - "learning_rate": 1.5332665659079951e-06, - "loss": 0.7676, - "step": 39953 - }, - { - "epoch": 1.02, - "learning_rate": 1.5332431579591436e-06, - "loss": 0.7676, - "step": 39954 - }, - { - "epoch": 1.02, - "learning_rate": 1.5332197496020127e-06, - "loss": 0.548, - "step": 39955 - }, - { - "epoch": 1.02, - "learning_rate": 1.5331963408366196e-06, - "loss": 0.6362, - "step": 39956 - }, - { - "epoch": 1.02, - "learning_rate": 1.5331729316629828e-06, - "loss": 0.6045, - "step": 39957 - }, - { - "epoch": 1.02, - "learning_rate": 1.53314952208112e-06, - "loss": 0.5684, - "step": 39958 - }, - { - "epoch": 1.02, - "learning_rate": 1.533126112091049e-06, - "loss": 0.6631, - "step": 39959 - }, - { - "epoch": 1.02, - "learning_rate": 1.5331027016927878e-06, - "loss": 0.7109, - "step": 39960 - }, - { - "epoch": 1.02, - "learning_rate": 1.5330792908863548e-06, - "loss": 0.5767, - "step": 39961 - }, - { - "epoch": 1.02, - "learning_rate": 1.533055879671767e-06, - "loss": 0.7832, - "step": 39962 - }, - { - "epoch": 1.02, - "learning_rate": 1.5330324680490432e-06, - "loss": 0.6934, - "step": 39963 - }, - { - "epoch": 1.02, - "learning_rate": 1.5330090560182006e-06, - "loss": 0.4683, - "step": 39964 - }, - { - "epoch": 1.02, - "learning_rate": 1.5329856435792578e-06, - "loss": 0.708, - "step": 39965 - }, - { - "epoch": 1.02, - "learning_rate": 1.532962230732232e-06, - "loss": 1.0166, - "step": 39966 - }, - { - "epoch": 1.02, - "learning_rate": 1.532938817477142e-06, - "loss": 0.624, - "step": 39967 - }, - { - "epoch": 1.02, - "learning_rate": 1.5329154038140048e-06, - "loss": 0.7012, - "step": 39968 - }, - { - "epoch": 1.02, - "learning_rate": 1.5328919897428392e-06, - "loss": 0.7021, - "step": 39969 - }, - { - "epoch": 1.02, - "learning_rate": 1.5328685752636625e-06, - "loss": 0.5493, - "step": 39970 - }, - { - "epoch": 1.02, - "learning_rate": 1.5328451603764929e-06, - "loss": 0.3893, - "step": 39971 - }, - { - "epoch": 1.02, - "learning_rate": 1.5328217450813482e-06, - "loss": 0.7178, - "step": 39972 - }, - { - "epoch": 1.02, - "learning_rate": 1.532798329378246e-06, - "loss": 0.6191, - "step": 39973 - }, - { - "epoch": 1.02, - "learning_rate": 1.5327749132672051e-06, - "loss": 0.6021, - "step": 39974 - }, - { - "epoch": 1.02, - "learning_rate": 1.532751496748243e-06, - "loss": 0.4719, - "step": 39975 - }, - { - "epoch": 1.02, - "learning_rate": 1.5327280798213774e-06, - "loss": 0.3678, - "step": 39976 - }, - { - "epoch": 1.02, - "learning_rate": 1.5327046624866265e-06, - "loss": 0.7578, - "step": 39977 - }, - { - "epoch": 1.02, - "learning_rate": 1.5326812447440082e-06, - "loss": 0.6382, - "step": 39978 - }, - { - "epoch": 1.02, - "learning_rate": 1.5326578265935402e-06, - "loss": 0.7344, - "step": 39979 - }, - { - "epoch": 1.02, - "learning_rate": 1.5326344080352404e-06, - "loss": 0.6094, - "step": 39980 - }, - { - "epoch": 1.02, - "learning_rate": 1.532610989069127e-06, - "loss": 0.5164, - "step": 39981 - }, - { - "epoch": 1.02, - "learning_rate": 1.5325875696952184e-06, - "loss": 0.6621, - "step": 39982 - }, - { - "epoch": 1.02, - "learning_rate": 1.5325641499135316e-06, - "loss": 0.6401, - "step": 39983 - }, - { - "epoch": 1.02, - "learning_rate": 1.5325407297240848e-06, - "loss": 0.5835, - "step": 39984 - }, - { - "epoch": 1.02, - "learning_rate": 1.5325173091268959e-06, - "loss": 0.6631, - "step": 39985 - }, - { - "epoch": 1.02, - "learning_rate": 1.5324938881219835e-06, - "loss": 0.6211, - "step": 39986 - }, - { - "epoch": 1.02, - "learning_rate": 1.5324704667093648e-06, - "loss": 0.666, - "step": 39987 - }, - { - "epoch": 1.02, - "learning_rate": 1.532447044889058e-06, - "loss": 0.6143, - "step": 39988 - }, - { - "epoch": 1.02, - "learning_rate": 1.5324236226610807e-06, - "loss": 0.5378, - "step": 39989 - }, - { - "epoch": 1.02, - "learning_rate": 1.5324002000254515e-06, - "loss": 0.4078, - "step": 39990 - }, - { - "epoch": 1.02, - "learning_rate": 1.5323767769821876e-06, - "loss": 0.709, - "step": 39991 - }, - { - "epoch": 1.03, - "learning_rate": 1.5323533535313076e-06, - "loss": 0.5715, - "step": 39992 - }, - { - "epoch": 1.03, - "learning_rate": 1.5323299296728287e-06, - "loss": 0.6367, - "step": 39993 - }, - { - "epoch": 1.03, - "learning_rate": 1.5323065054067697e-06, - "loss": 0.574, - "step": 39994 - }, - { - "epoch": 1.03, - "learning_rate": 1.5322830807331476e-06, - "loss": 0.5374, - "step": 39995 - }, - { - "epoch": 1.03, - "learning_rate": 1.5322596556519814e-06, - "loss": 0.5913, - "step": 39996 - }, - { - "epoch": 1.03, - "learning_rate": 1.532236230163288e-06, - "loss": 0.6362, - "step": 39997 - }, - { - "epoch": 1.03, - "learning_rate": 1.5322128042670862e-06, - "loss": 0.6562, - "step": 39998 - }, - { - "epoch": 1.03, - "learning_rate": 1.5321893779633933e-06, - "loss": 0.8408, - "step": 39999 - }, - { - "epoch": 1.03, - "learning_rate": 1.5321659512522271e-06, - "loss": 0.4163, - "step": 40000 - }, - { - "epoch": 1.03, - "learning_rate": 1.5321425241336063e-06, - "loss": 0.6865, - "step": 40001 - }, - { - "epoch": 1.03, - "learning_rate": 1.5321190966075483e-06, - "loss": 0.6602, - "step": 40002 - }, - { - "epoch": 1.03, - "learning_rate": 1.5320956686740716e-06, - "loss": 0.6118, - "step": 40003 - }, - { - "epoch": 1.03, - "learning_rate": 1.5320722403331931e-06, - "loss": 0.7441, - "step": 40004 - }, - { - "epoch": 1.03, - "learning_rate": 1.5320488115849318e-06, - "loss": 0.751, - "step": 40005 - }, - { - "epoch": 1.03, - "learning_rate": 1.5320253824293047e-06, - "loss": 0.7861, - "step": 40006 - }, - { - "epoch": 1.03, - "learning_rate": 1.5320019528663309e-06, - "loss": 0.8857, - "step": 40007 - }, - { - "epoch": 1.03, - "learning_rate": 1.5319785228960272e-06, - "loss": 0.748, - "step": 40008 - }, - { - "epoch": 1.03, - "learning_rate": 1.531955092518412e-06, - "loss": 0.8262, - "step": 40009 - }, - { - "epoch": 1.03, - "learning_rate": 1.5319316617335033e-06, - "loss": 0.605, - "step": 40010 - }, - { - "epoch": 1.03, - "learning_rate": 1.5319082305413192e-06, - "loss": 0.7568, - "step": 40011 - }, - { - "epoch": 1.03, - "learning_rate": 1.5318847989418774e-06, - "loss": 0.7148, - "step": 40012 - }, - { - "epoch": 1.03, - "learning_rate": 1.5318613669351957e-06, - "loss": 0.5557, - "step": 40013 - }, - { - "epoch": 1.03, - "learning_rate": 1.531837934521292e-06, - "loss": 0.5977, - "step": 40014 - }, - { - "epoch": 1.03, - "learning_rate": 1.5318145017001846e-06, - "loss": 0.6162, - "step": 40015 - }, - { - "epoch": 1.03, - "learning_rate": 1.5317910684718913e-06, - "loss": 0.7354, - "step": 40016 - }, - { - "epoch": 1.03, - "learning_rate": 1.5317676348364304e-06, - "loss": 0.7217, - "step": 40017 - }, - { - "epoch": 1.03, - "learning_rate": 1.531744200793819e-06, - "loss": 0.7539, - "step": 40018 - }, - { - "epoch": 1.03, - "learning_rate": 1.5317207663440758e-06, - "loss": 0.7168, - "step": 40019 - }, - { - "epoch": 1.03, - "learning_rate": 1.5316973314872183e-06, - "loss": 0.7676, - "step": 40020 - }, - { - "epoch": 1.03, - "learning_rate": 1.5316738962232648e-06, - "loss": 0.3967, - "step": 40021 - }, - { - "epoch": 1.03, - "learning_rate": 1.5316504605522328e-06, - "loss": 0.6851, - "step": 40022 - }, - { - "epoch": 1.03, - "learning_rate": 1.5316270244741405e-06, - "loss": 0.6279, - "step": 40023 - }, - { - "epoch": 1.03, - "learning_rate": 1.531603587989006e-06, - "loss": 0.749, - "step": 40024 - }, - { - "epoch": 1.03, - "learning_rate": 1.531580151096847e-06, - "loss": 0.6885, - "step": 40025 - }, - { - "epoch": 1.03, - "learning_rate": 1.5315567137976815e-06, - "loss": 0.6621, - "step": 40026 - }, - { - "epoch": 1.03, - "learning_rate": 1.5315332760915273e-06, - "loss": 0.75, - "step": 40027 - }, - { - "epoch": 1.03, - "learning_rate": 1.5315098379784028e-06, - "loss": 0.7656, - "step": 40028 - }, - { - "epoch": 1.03, - "learning_rate": 1.5314863994583257e-06, - "loss": 0.7422, - "step": 40029 - }, - { - "epoch": 1.03, - "learning_rate": 1.5314629605313139e-06, - "loss": 0.7554, - "step": 40030 - }, - { - "epoch": 1.03, - "learning_rate": 1.531439521197385e-06, - "loss": 0.7061, - "step": 40031 - }, - { - "epoch": 1.03, - "learning_rate": 1.5314160814565576e-06, - "loss": 0.5337, - "step": 40032 - }, - { - "epoch": 1.03, - "learning_rate": 1.5313926413088491e-06, - "loss": 0.6836, - "step": 40033 - }, - { - "epoch": 1.03, - "learning_rate": 1.5313692007542777e-06, - "loss": 0.5894, - "step": 40034 - }, - { - "epoch": 1.03, - "learning_rate": 1.5313457597928613e-06, - "loss": 0.6274, - "step": 40035 - }, - { - "epoch": 1.03, - "learning_rate": 1.5313223184246184e-06, - "loss": 0.5244, - "step": 40036 - }, - { - "epoch": 1.03, - "learning_rate": 1.5312988766495663e-06, - "loss": 0.7549, - "step": 40037 - }, - { - "epoch": 1.03, - "learning_rate": 1.5312754344677228e-06, - "loss": 0.6191, - "step": 40038 - }, - { - "epoch": 1.03, - "learning_rate": 1.531251991879106e-06, - "loss": 0.7412, - "step": 40039 - }, - { - "epoch": 1.03, - "learning_rate": 1.5312285488837343e-06, - "loss": 0.6274, - "step": 40040 - }, - { - "epoch": 1.03, - "learning_rate": 1.531205105481625e-06, - "loss": 0.6226, - "step": 40041 - }, - { - "epoch": 1.03, - "learning_rate": 1.5311816616727967e-06, - "loss": 0.5518, - "step": 40042 - }, - { - "epoch": 1.03, - "learning_rate": 1.5311582174572667e-06, - "loss": 0.6279, - "step": 40043 - }, - { - "epoch": 1.03, - "learning_rate": 1.5311347728350533e-06, - "loss": 0.7998, - "step": 40044 - }, - { - "epoch": 1.03, - "learning_rate": 1.5311113278061748e-06, - "loss": 0.4695, - "step": 40045 - }, - { - "epoch": 1.03, - "learning_rate": 1.5310878823706488e-06, - "loss": 0.4496, - "step": 40046 - }, - { - "epoch": 1.03, - "learning_rate": 1.531064436528493e-06, - "loss": 0.6616, - "step": 40047 - }, - { - "epoch": 1.03, - "learning_rate": 1.5310409902797255e-06, - "loss": 0.7847, - "step": 40048 - }, - { - "epoch": 1.03, - "learning_rate": 1.5310175436243643e-06, - "loss": 0.3989, - "step": 40049 - }, - { - "epoch": 1.03, - "learning_rate": 1.5309940965624276e-06, - "loss": 0.7168, - "step": 40050 - }, - { - "epoch": 1.03, - "learning_rate": 1.5309706490939332e-06, - "loss": 0.6265, - "step": 40051 - }, - { - "epoch": 1.03, - "learning_rate": 1.5309472012188986e-06, - "loss": 0.7598, - "step": 40052 - }, - { - "epoch": 1.03, - "learning_rate": 1.5309237529373423e-06, - "loss": 0.7852, - "step": 40053 - }, - { - "epoch": 1.03, - "learning_rate": 1.530900304249282e-06, - "loss": 0.8076, - "step": 40054 - }, - { - "epoch": 1.03, - "learning_rate": 1.5308768551547362e-06, - "loss": 0.6206, - "step": 40055 - }, - { - "epoch": 1.03, - "learning_rate": 1.5308534056537221e-06, - "loss": 0.5889, - "step": 40056 - }, - { - "epoch": 1.03, - "learning_rate": 1.530829955746258e-06, - "loss": 0.5874, - "step": 40057 - }, - { - "epoch": 1.03, - "learning_rate": 1.5308065054323618e-06, - "loss": 0.5835, - "step": 40058 - }, - { - "epoch": 1.03, - "learning_rate": 1.5307830547120512e-06, - "loss": 0.7793, - "step": 40059 - }, - { - "epoch": 1.03, - "learning_rate": 1.5307596035853448e-06, - "loss": 0.4873, - "step": 40060 - }, - { - "epoch": 1.03, - "learning_rate": 1.53073615205226e-06, - "loss": 0.6042, - "step": 40061 - }, - { - "epoch": 1.03, - "learning_rate": 1.530712700112815e-06, - "loss": 0.6704, - "step": 40062 - }, - { - "epoch": 1.03, - "learning_rate": 1.5306892477670274e-06, - "loss": 0.5781, - "step": 40063 - }, - { - "epoch": 1.03, - "learning_rate": 1.530665795014916e-06, - "loss": 0.709, - "step": 40064 - }, - { - "epoch": 1.03, - "learning_rate": 1.530642341856498e-06, - "loss": 0.6172, - "step": 40065 - }, - { - "epoch": 1.03, - "learning_rate": 1.5306188882917913e-06, - "loss": 0.8125, - "step": 40066 - }, - { - "epoch": 1.03, - "learning_rate": 1.5305954343208143e-06, - "loss": 0.5051, - "step": 40067 - }, - { - "epoch": 1.03, - "learning_rate": 1.5305719799435849e-06, - "loss": 0.552, - "step": 40068 - }, - { - "epoch": 1.03, - "learning_rate": 1.5305485251601207e-06, - "loss": 0.5005, - "step": 40069 - }, - { - "epoch": 1.03, - "learning_rate": 1.53052506997044e-06, - "loss": 0.7725, - "step": 40070 - }, - { - "epoch": 1.03, - "learning_rate": 1.5305016143745606e-06, - "loss": 0.6914, - "step": 40071 - }, - { - "epoch": 1.03, - "learning_rate": 1.5304781583725007e-06, - "loss": 0.4951, - "step": 40072 - }, - { - "epoch": 1.03, - "learning_rate": 1.5304547019642777e-06, - "loss": 0.6904, - "step": 40073 - }, - { - "epoch": 1.03, - "learning_rate": 1.5304312451499102e-06, - "loss": 0.6763, - "step": 40074 - }, - { - "epoch": 1.03, - "learning_rate": 1.5304077879294158e-06, - "loss": 0.7197, - "step": 40075 - }, - { - "epoch": 1.03, - "learning_rate": 1.5303843303028127e-06, - "loss": 0.6592, - "step": 40076 - }, - { - "epoch": 1.03, - "learning_rate": 1.5303608722701183e-06, - "loss": 0.5654, - "step": 40077 - }, - { - "epoch": 1.03, - "learning_rate": 1.5303374138313515e-06, - "loss": 0.7197, - "step": 40078 - }, - { - "epoch": 1.03, - "learning_rate": 1.530313954986529e-06, - "loss": 0.8125, - "step": 40079 - }, - { - "epoch": 1.03, - "learning_rate": 1.53029049573567e-06, - "loss": 0.7539, - "step": 40080 - }, - { - "epoch": 1.03, - "learning_rate": 1.5302670360787921e-06, - "loss": 0.7021, - "step": 40081 - }, - { - "epoch": 1.03, - "learning_rate": 1.530243576015913e-06, - "loss": 0.7354, - "step": 40082 - }, - { - "epoch": 1.03, - "learning_rate": 1.5302201155470505e-06, - "loss": 0.7627, - "step": 40083 - }, - { - "epoch": 1.03, - "learning_rate": 1.530196654672223e-06, - "loss": 0.7998, - "step": 40084 - }, - { - "epoch": 1.03, - "learning_rate": 1.5301731933914483e-06, - "loss": 0.6699, - "step": 40085 - }, - { - "epoch": 1.03, - "learning_rate": 1.5301497317047444e-06, - "loss": 0.7012, - "step": 40086 - }, - { - "epoch": 1.03, - "learning_rate": 1.5301262696121294e-06, - "loss": 0.6523, - "step": 40087 - }, - { - "epoch": 1.03, - "learning_rate": 1.5301028071136207e-06, - "loss": 0.5261, - "step": 40088 - }, - { - "epoch": 1.03, - "learning_rate": 1.5300793442092368e-06, - "loss": 0.5742, - "step": 40089 - }, - { - "epoch": 1.03, - "learning_rate": 1.5300558808989957e-06, - "loss": 0.6553, - "step": 40090 - }, - { - "epoch": 1.03, - "learning_rate": 1.530032417182915e-06, - "loss": 0.4331, - "step": 40091 - }, - { - "epoch": 1.03, - "learning_rate": 1.530008953061013e-06, - "loss": 0.323, - "step": 40092 - }, - { - "epoch": 1.03, - "learning_rate": 1.5299854885333075e-06, - "loss": 0.6792, - "step": 40093 - }, - { - "epoch": 1.03, - "learning_rate": 1.5299620235998164e-06, - "loss": 0.8057, - "step": 40094 - }, - { - "epoch": 1.03, - "learning_rate": 1.5299385582605578e-06, - "loss": 0.5281, - "step": 40095 - }, - { - "epoch": 1.03, - "learning_rate": 1.5299150925155494e-06, - "loss": 0.5332, - "step": 40096 - }, - { - "epoch": 1.03, - "learning_rate": 1.5298916263648098e-06, - "loss": 0.6755, - "step": 40097 - }, - { - "epoch": 1.03, - "learning_rate": 1.5298681598083561e-06, - "loss": 0.5093, - "step": 40098 - }, - { - "epoch": 1.03, - "learning_rate": 1.529844692846207e-06, - "loss": 0.7188, - "step": 40099 - }, - { - "epoch": 1.03, - "learning_rate": 1.52982122547838e-06, - "loss": 0.6885, - "step": 40100 - }, - { - "epoch": 1.03, - "learning_rate": 1.5297977577048936e-06, - "loss": 0.8369, - "step": 40101 - }, - { - "epoch": 1.03, - "learning_rate": 1.5297742895257647e-06, - "loss": 0.5625, - "step": 40102 - }, - { - "epoch": 1.03, - "learning_rate": 1.5297508209410128e-06, - "loss": 0.5566, - "step": 40103 - }, - { - "epoch": 1.03, - "learning_rate": 1.5297273519506547e-06, - "loss": 0.5703, - "step": 40104 - }, - { - "epoch": 1.03, - "learning_rate": 1.5297038825547086e-06, - "loss": 0.6631, - "step": 40105 - }, - { - "epoch": 1.03, - "learning_rate": 1.5296804127531927e-06, - "loss": 0.7656, - "step": 40106 - }, - { - "epoch": 1.03, - "learning_rate": 1.5296569425461247e-06, - "loss": 0.6313, - "step": 40107 - }, - { - "epoch": 1.03, - "learning_rate": 1.5296334719335232e-06, - "loss": 0.6567, - "step": 40108 - }, - { - "epoch": 1.03, - "learning_rate": 1.5296100009154054e-06, - "loss": 0.5757, - "step": 40109 - }, - { - "epoch": 1.03, - "learning_rate": 1.5295865294917895e-06, - "loss": 0.5737, - "step": 40110 - }, - { - "epoch": 1.03, - "learning_rate": 1.5295630576626937e-06, - "loss": 0.7334, - "step": 40111 - }, - { - "epoch": 1.03, - "learning_rate": 1.5295395854281358e-06, - "loss": 0.835, - "step": 40112 - }, - { - "epoch": 1.03, - "learning_rate": 1.5295161127881336e-06, - "loss": 0.6582, - "step": 40113 - }, - { - "epoch": 1.03, - "learning_rate": 1.5294926397427052e-06, - "loss": 0.6304, - "step": 40114 - }, - { - "epoch": 1.03, - "learning_rate": 1.5294691662918688e-06, - "loss": 0.5928, - "step": 40115 - }, - { - "epoch": 1.03, - "learning_rate": 1.5294456924356425e-06, - "loss": 0.5762, - "step": 40116 - }, - { - "epoch": 1.03, - "learning_rate": 1.5294222181740437e-06, - "loss": 0.7495, - "step": 40117 - }, - { - "epoch": 1.03, - "learning_rate": 1.5293987435070908e-06, - "loss": 0.5037, - "step": 40118 - }, - { - "epoch": 1.03, - "learning_rate": 1.5293752684348013e-06, - "loss": 0.8096, - "step": 40119 - }, - { - "epoch": 1.03, - "learning_rate": 1.5293517929571938e-06, - "loss": 0.5322, - "step": 40120 - }, - { - "epoch": 1.03, - "learning_rate": 1.5293283170742859e-06, - "loss": 0.647, - "step": 40121 - }, - { - "epoch": 1.03, - "learning_rate": 1.5293048407860956e-06, - "loss": 0.5542, - "step": 40122 - }, - { - "epoch": 1.03, - "learning_rate": 1.529281364092641e-06, - "loss": 0.7148, - "step": 40123 - }, - { - "epoch": 1.03, - "learning_rate": 1.5292578869939398e-06, - "loss": 0.7383, - "step": 40124 - }, - { - "epoch": 1.03, - "learning_rate": 1.52923440949001e-06, - "loss": 0.8379, - "step": 40125 - }, - { - "epoch": 1.03, - "learning_rate": 1.5292109315808703e-06, - "loss": 0.6348, - "step": 40126 - }, - { - "epoch": 1.03, - "learning_rate": 1.5291874532665378e-06, - "loss": 0.7217, - "step": 40127 - }, - { - "epoch": 1.03, - "learning_rate": 1.5291639745470311e-06, - "loss": 0.6802, - "step": 40128 - }, - { - "epoch": 1.03, - "learning_rate": 1.5291404954223674e-06, - "loss": 0.6924, - "step": 40129 - }, - { - "epoch": 1.03, - "learning_rate": 1.5291170158925657e-06, - "loss": 0.5718, - "step": 40130 - }, - { - "epoch": 1.03, - "learning_rate": 1.5290935359576432e-06, - "loss": 0.6719, - "step": 40131 - }, - { - "epoch": 1.03, - "learning_rate": 1.5290700556176177e-06, - "loss": 0.7363, - "step": 40132 - }, - { - "epoch": 1.03, - "learning_rate": 1.529046574872508e-06, - "loss": 0.6514, - "step": 40133 - }, - { - "epoch": 1.03, - "learning_rate": 1.5290230937223316e-06, - "loss": 0.5811, - "step": 40134 - }, - { - "epoch": 1.03, - "learning_rate": 1.5289996121671064e-06, - "loss": 0.6733, - "step": 40135 - }, - { - "epoch": 1.03, - "learning_rate": 1.5289761302068506e-06, - "loss": 0.6104, - "step": 40136 - }, - { - "epoch": 1.03, - "learning_rate": 1.5289526478415825e-06, - "loss": 0.6777, - "step": 40137 - }, - { - "epoch": 1.03, - "learning_rate": 1.528929165071319e-06, - "loss": 0.6885, - "step": 40138 - }, - { - "epoch": 1.03, - "learning_rate": 1.5289056818960792e-06, - "loss": 0.5776, - "step": 40139 - }, - { - "epoch": 1.03, - "learning_rate": 1.5288821983158803e-06, - "loss": 0.8545, - "step": 40140 - }, - { - "epoch": 1.03, - "learning_rate": 1.5288587143307412e-06, - "loss": 0.457, - "step": 40141 - }, - { - "epoch": 1.03, - "learning_rate": 1.5288352299406789e-06, - "loss": 0.6465, - "step": 40142 - }, - { - "epoch": 1.03, - "learning_rate": 1.528811745145712e-06, - "loss": 0.6455, - "step": 40143 - }, - { - "epoch": 1.03, - "learning_rate": 1.5287882599458577e-06, - "loss": 0.7646, - "step": 40144 - }, - { - "epoch": 1.03, - "learning_rate": 1.528764774341135e-06, - "loss": 0.6675, - "step": 40145 - }, - { - "epoch": 1.03, - "learning_rate": 1.5287412883315617e-06, - "loss": 0.6582, - "step": 40146 - }, - { - "epoch": 1.03, - "learning_rate": 1.5287178019171552e-06, - "loss": 0.5874, - "step": 40147 - }, - { - "epoch": 1.03, - "learning_rate": 1.5286943150979334e-06, - "loss": 0.6685, - "step": 40148 - }, - { - "epoch": 1.03, - "learning_rate": 1.528670827873915e-06, - "loss": 0.6104, - "step": 40149 - }, - { - "epoch": 1.03, - "learning_rate": 1.5286473402451176e-06, - "loss": 0.7251, - "step": 40150 - }, - { - "epoch": 1.03, - "learning_rate": 1.5286238522115596e-06, - "loss": 0.7666, - "step": 40151 - }, - { - "epoch": 1.03, - "learning_rate": 1.5286003637732585e-06, - "loss": 0.6807, - "step": 40152 - }, - { - "epoch": 1.03, - "learning_rate": 1.528576874930232e-06, - "loss": 0.5703, - "step": 40153 - }, - { - "epoch": 1.03, - "learning_rate": 1.5285533856824988e-06, - "loss": 0.6128, - "step": 40154 - }, - { - "epoch": 1.03, - "learning_rate": 1.5285298960300765e-06, - "loss": 0.6221, - "step": 40155 - }, - { - "epoch": 1.03, - "learning_rate": 1.5285064059729833e-06, - "loss": 0.8599, - "step": 40156 - }, - { - "epoch": 1.03, - "learning_rate": 1.528482915511237e-06, - "loss": 0.8066, - "step": 40157 - }, - { - "epoch": 1.03, - "learning_rate": 1.5284594246448555e-06, - "loss": 0.5361, - "step": 40158 - }, - { - "epoch": 1.03, - "learning_rate": 1.5284359333738567e-06, - "loss": 0.7178, - "step": 40159 - }, - { - "epoch": 1.03, - "learning_rate": 1.5284124416982592e-06, - "loss": 0.6611, - "step": 40160 - }, - { - "epoch": 1.03, - "learning_rate": 1.5283889496180807e-06, - "loss": 0.606, - "step": 40161 - }, - { - "epoch": 1.03, - "learning_rate": 1.5283654571333387e-06, - "loss": 0.9414, - "step": 40162 - }, - { - "epoch": 1.03, - "learning_rate": 1.5283419642440518e-06, - "loss": 0.5947, - "step": 40163 - }, - { - "epoch": 1.03, - "learning_rate": 1.5283184709502375e-06, - "loss": 0.4712, - "step": 40164 - }, - { - "epoch": 1.03, - "learning_rate": 1.5282949772519143e-06, - "loss": 0.7412, - "step": 40165 - }, - { - "epoch": 1.03, - "learning_rate": 1.5282714831490999e-06, - "loss": 0.5288, - "step": 40166 - }, - { - "epoch": 1.03, - "learning_rate": 1.5282479886418122e-06, - "loss": 0.5126, - "step": 40167 - }, - { - "epoch": 1.03, - "learning_rate": 1.5282244937300694e-06, - "loss": 0.6416, - "step": 40168 - }, - { - "epoch": 1.03, - "learning_rate": 1.5282009984138894e-06, - "loss": 0.5874, - "step": 40169 - }, - { - "epoch": 1.03, - "learning_rate": 1.5281775026932899e-06, - "loss": 0.6611, - "step": 40170 - }, - { - "epoch": 1.03, - "learning_rate": 1.5281540065682897e-06, - "loss": 0.54, - "step": 40171 - }, - { - "epoch": 1.03, - "learning_rate": 1.5281305100389059e-06, - "loss": 0.709, - "step": 40172 - }, - { - "epoch": 1.03, - "learning_rate": 1.5281070131051568e-06, - "loss": 0.8408, - "step": 40173 - }, - { - "epoch": 1.03, - "learning_rate": 1.5280835157670606e-06, - "loss": 0.6865, - "step": 40174 - }, - { - "epoch": 1.03, - "learning_rate": 1.528060018024635e-06, - "loss": 0.6738, - "step": 40175 - }, - { - "epoch": 1.03, - "learning_rate": 1.5280365198778982e-06, - "loss": 0.3823, - "step": 40176 - }, - { - "epoch": 1.03, - "learning_rate": 1.5280130213268682e-06, - "loss": 0.7544, - "step": 40177 - }, - { - "epoch": 1.03, - "learning_rate": 1.5279895223715628e-06, - "loss": 0.5664, - "step": 40178 - }, - { - "epoch": 1.03, - "learning_rate": 1.5279660230120005e-06, - "loss": 0.6162, - "step": 40179 - }, - { - "epoch": 1.03, - "learning_rate": 1.5279425232481982e-06, - "loss": 0.6191, - "step": 40180 - }, - { - "epoch": 1.03, - "learning_rate": 1.5279190230801754e-06, - "loss": 0.5186, - "step": 40181 - }, - { - "epoch": 1.03, - "learning_rate": 1.5278955225079484e-06, - "loss": 0.8008, - "step": 40182 - }, - { - "epoch": 1.03, - "learning_rate": 1.5278720215315363e-06, - "loss": 0.5017, - "step": 40183 - }, - { - "epoch": 1.03, - "learning_rate": 1.527848520150957e-06, - "loss": 0.7334, - "step": 40184 - }, - { - "epoch": 1.03, - "learning_rate": 1.5278250183662284e-06, - "loss": 0.5752, - "step": 40185 - }, - { - "epoch": 1.03, - "learning_rate": 1.5278015161773687e-06, - "loss": 0.6768, - "step": 40186 - }, - { - "epoch": 1.03, - "learning_rate": 1.5277780135843953e-06, - "loss": 0.7422, - "step": 40187 - }, - { - "epoch": 1.03, - "learning_rate": 1.5277545105873269e-06, - "loss": 0.5889, - "step": 40188 - }, - { - "epoch": 1.03, - "learning_rate": 1.5277310071861807e-06, - "loss": 0.6367, - "step": 40189 - }, - { - "epoch": 1.03, - "learning_rate": 1.5277075033809753e-06, - "loss": 0.7256, - "step": 40190 - }, - { - "epoch": 1.03, - "learning_rate": 1.5276839991717288e-06, - "loss": 0.7124, - "step": 40191 - }, - { - "epoch": 1.03, - "learning_rate": 1.5276604945584586e-06, - "loss": 0.6123, - "step": 40192 - }, - { - "epoch": 1.03, - "learning_rate": 1.527636989541183e-06, - "loss": 0.7227, - "step": 40193 - }, - { - "epoch": 1.03, - "learning_rate": 1.52761348411992e-06, - "loss": 0.6694, - "step": 40194 - }, - { - "epoch": 1.03, - "learning_rate": 1.5275899782946877e-06, - "loss": 0.5752, - "step": 40195 - }, - { - "epoch": 1.03, - "learning_rate": 1.5275664720655042e-06, - "loss": 0.6543, - "step": 40196 - }, - { - "epoch": 1.03, - "learning_rate": 1.5275429654323871e-06, - "loss": 0.6265, - "step": 40197 - }, - { - "epoch": 1.03, - "learning_rate": 1.5275194583953548e-06, - "loss": 0.5386, - "step": 40198 - }, - { - "epoch": 1.03, - "learning_rate": 1.527495950954425e-06, - "loss": 0.6895, - "step": 40199 - }, - { - "epoch": 1.03, - "learning_rate": 1.5274724431096155e-06, - "loss": 0.5701, - "step": 40200 - }, - { - "epoch": 1.03, - "learning_rate": 1.5274489348609449e-06, - "loss": 0.5483, - "step": 40201 - }, - { - "epoch": 1.03, - "learning_rate": 1.527425426208431e-06, - "loss": 0.644, - "step": 40202 - }, - { - "epoch": 1.03, - "learning_rate": 1.5274019171520914e-06, - "loss": 0.5747, - "step": 40203 - }, - { - "epoch": 1.03, - "learning_rate": 1.5273784076919447e-06, - "loss": 0.6504, - "step": 40204 - }, - { - "epoch": 1.03, - "learning_rate": 1.5273548978280081e-06, - "loss": 0.7119, - "step": 40205 - }, - { - "epoch": 1.03, - "learning_rate": 1.5273313875603009e-06, - "loss": 0.6074, - "step": 40206 - }, - { - "epoch": 1.03, - "learning_rate": 1.5273078768888397e-06, - "loss": 0.6978, - "step": 40207 - }, - { - "epoch": 1.03, - "learning_rate": 1.5272843658136437e-06, - "loss": 0.5632, - "step": 40208 - }, - { - "epoch": 1.03, - "learning_rate": 1.5272608543347297e-06, - "loss": 0.542, - "step": 40209 - }, - { - "epoch": 1.03, - "learning_rate": 1.5272373424521162e-06, - "loss": 0.7427, - "step": 40210 - }, - { - "epoch": 1.03, - "learning_rate": 1.5272138301658219e-06, - "loss": 0.6611, - "step": 40211 - }, - { - "epoch": 1.03, - "learning_rate": 1.527190317475864e-06, - "loss": 0.7188, - "step": 40212 - }, - { - "epoch": 1.03, - "learning_rate": 1.5271668043822605e-06, - "loss": 0.7275, - "step": 40213 - }, - { - "epoch": 1.03, - "learning_rate": 1.5271432908850299e-06, - "loss": 0.7222, - "step": 40214 - }, - { - "epoch": 1.03, - "learning_rate": 1.5271197769841897e-06, - "loss": 0.6519, - "step": 40215 - }, - { - "epoch": 1.03, - "learning_rate": 1.527096262679758e-06, - "loss": 0.5625, - "step": 40216 - }, - { - "epoch": 1.03, - "learning_rate": 1.5270727479717533e-06, - "loss": 0.5977, - "step": 40217 - }, - { - "epoch": 1.03, - "learning_rate": 1.5270492328601931e-06, - "loss": 0.7637, - "step": 40218 - }, - { - "epoch": 1.03, - "learning_rate": 1.5270257173450956e-06, - "loss": 0.5923, - "step": 40219 - }, - { - "epoch": 1.03, - "learning_rate": 1.5270022014264785e-06, - "loss": 0.6992, - "step": 40220 - }, - { - "epoch": 1.03, - "learning_rate": 1.5269786851043604e-06, - "loss": 0.6003, - "step": 40221 - }, - { - "epoch": 1.03, - "learning_rate": 1.5269551683787586e-06, - "loss": 0.7041, - "step": 40222 - }, - { - "epoch": 1.03, - "learning_rate": 1.5269316512496916e-06, - "loss": 0.6816, - "step": 40223 - }, - { - "epoch": 1.03, - "learning_rate": 1.5269081337171772e-06, - "loss": 0.7109, - "step": 40224 - }, - { - "epoch": 1.03, - "learning_rate": 1.5268846157812337e-06, - "loss": 0.5659, - "step": 40225 - }, - { - "epoch": 1.03, - "learning_rate": 1.5268610974418788e-06, - "loss": 0.5107, - "step": 40226 - }, - { - "epoch": 1.03, - "learning_rate": 1.5268375786991303e-06, - "loss": 0.8135, - "step": 40227 - }, - { - "epoch": 1.03, - "learning_rate": 1.5268140595530069e-06, - "loss": 0.7715, - "step": 40228 - }, - { - "epoch": 1.03, - "learning_rate": 1.526790540003526e-06, - "loss": 0.5854, - "step": 40229 - }, - { - "epoch": 1.03, - "learning_rate": 1.5267670200507055e-06, - "loss": 0.7969, - "step": 40230 - }, - { - "epoch": 1.03, - "learning_rate": 1.5267434996945643e-06, - "loss": 0.8135, - "step": 40231 - }, - { - "epoch": 1.03, - "learning_rate": 1.5267199789351195e-06, - "loss": 0.7178, - "step": 40232 - }, - { - "epoch": 1.03, - "learning_rate": 1.5266964577723895e-06, - "loss": 0.7544, - "step": 40233 - }, - { - "epoch": 1.03, - "learning_rate": 1.5266729362063919e-06, - "loss": 0.6104, - "step": 40234 - }, - { - "epoch": 1.03, - "learning_rate": 1.5266494142371455e-06, - "loss": 0.4678, - "step": 40235 - }, - { - "epoch": 1.03, - "learning_rate": 1.5266258918646677e-06, - "loss": 0.7207, - "step": 40236 - }, - { - "epoch": 1.03, - "learning_rate": 1.5266023690889767e-06, - "loss": 0.5845, - "step": 40237 - }, - { - "epoch": 1.03, - "learning_rate": 1.5265788459100905e-06, - "loss": 0.5396, - "step": 40238 - }, - { - "epoch": 1.03, - "learning_rate": 1.526555322328027e-06, - "loss": 0.7246, - "step": 40239 - }, - { - "epoch": 1.03, - "learning_rate": 1.5265317983428042e-06, - "loss": 0.4397, - "step": 40240 - }, - { - "epoch": 1.03, - "learning_rate": 1.5265082739544405e-06, - "loss": 0.3918, - "step": 40241 - }, - { - "epoch": 1.03, - "learning_rate": 1.5264847491629536e-06, - "loss": 0.6133, - "step": 40242 - }, - { - "epoch": 1.03, - "learning_rate": 1.5264612239683615e-06, - "loss": 0.7148, - "step": 40243 - }, - { - "epoch": 1.03, - "learning_rate": 1.5264376983706822e-06, - "loss": 0.541, - "step": 40244 - }, - { - "epoch": 1.03, - "learning_rate": 1.5264141723699337e-06, - "loss": 0.6196, - "step": 40245 - }, - { - "epoch": 1.03, - "learning_rate": 1.526390645966134e-06, - "loss": 0.7207, - "step": 40246 - }, - { - "epoch": 1.03, - "learning_rate": 1.5263671191593012e-06, - "loss": 0.6348, - "step": 40247 - }, - { - "epoch": 1.03, - "learning_rate": 1.5263435919494536e-06, - "loss": 0.7075, - "step": 40248 - }, - { - "epoch": 1.03, - "learning_rate": 1.5263200643366086e-06, - "loss": 0.7871, - "step": 40249 - }, - { - "epoch": 1.03, - "learning_rate": 1.5262965363207845e-06, - "loss": 0.666, - "step": 40250 - }, - { - "epoch": 1.03, - "learning_rate": 1.5262730079019996e-06, - "loss": 0.4595, - "step": 40251 - }, - { - "epoch": 1.03, - "learning_rate": 1.5262494790802715e-06, - "loss": 0.7446, - "step": 40252 - }, - { - "epoch": 1.03, - "learning_rate": 1.5262259498556182e-06, - "loss": 0.4453, - "step": 40253 - }, - { - "epoch": 1.03, - "learning_rate": 1.5262024202280583e-06, - "loss": 0.5679, - "step": 40254 - }, - { - "epoch": 1.03, - "learning_rate": 1.5261788901976092e-06, - "loss": 0.5522, - "step": 40255 - }, - { - "epoch": 1.03, - "learning_rate": 1.5261553597642891e-06, - "loss": 0.7969, - "step": 40256 - }, - { - "epoch": 1.03, - "learning_rate": 1.5261318289281162e-06, - "loss": 0.7344, - "step": 40257 - }, - { - "epoch": 1.03, - "learning_rate": 1.5261082976891081e-06, - "loss": 0.6357, - "step": 40258 - }, - { - "epoch": 1.03, - "learning_rate": 1.5260847660472832e-06, - "loss": 0.7212, - "step": 40259 - }, - { - "epoch": 1.03, - "learning_rate": 1.5260612340026593e-06, - "loss": 0.6001, - "step": 40260 - }, - { - "epoch": 1.03, - "learning_rate": 1.5260377015552546e-06, - "loss": 0.5586, - "step": 40261 - }, - { - "epoch": 1.03, - "learning_rate": 1.5260141687050872e-06, - "loss": 0.6738, - "step": 40262 - }, - { - "epoch": 1.03, - "learning_rate": 1.5259906354521745e-06, - "loss": 0.7373, - "step": 40263 - }, - { - "epoch": 1.03, - "learning_rate": 1.5259671017965352e-06, - "loss": 0.5457, - "step": 40264 - }, - { - "epoch": 1.03, - "learning_rate": 1.525943567738187e-06, - "loss": 0.5225, - "step": 40265 - }, - { - "epoch": 1.03, - "learning_rate": 1.5259200332771477e-06, - "loss": 0.6738, - "step": 40266 - }, - { - "epoch": 1.03, - "learning_rate": 1.5258964984134362e-06, - "loss": 0.603, - "step": 40267 - }, - { - "epoch": 1.03, - "learning_rate": 1.5258729631470696e-06, - "loss": 0.7588, - "step": 40268 - }, - { - "epoch": 1.03, - "learning_rate": 1.5258494274780664e-06, - "loss": 0.5657, - "step": 40269 - }, - { - "epoch": 1.03, - "learning_rate": 1.5258258914064444e-06, - "loss": 0.6143, - "step": 40270 - }, - { - "epoch": 1.03, - "learning_rate": 1.525802354932222e-06, - "loss": 0.6338, - "step": 40271 - }, - { - "epoch": 1.03, - "learning_rate": 1.5257788180554164e-06, - "loss": 0.5596, - "step": 40272 - }, - { - "epoch": 1.03, - "learning_rate": 1.5257552807760463e-06, - "loss": 0.5576, - "step": 40273 - }, - { - "epoch": 1.03, - "learning_rate": 1.5257317430941294e-06, - "loss": 0.5352, - "step": 40274 - }, - { - "epoch": 1.03, - "learning_rate": 1.5257082050096842e-06, - "loss": 0.7744, - "step": 40275 - }, - { - "epoch": 1.03, - "learning_rate": 1.5256846665227283e-06, - "loss": 0.5674, - "step": 40276 - }, - { - "epoch": 1.03, - "learning_rate": 1.5256611276332797e-06, - "loss": 0.7041, - "step": 40277 - }, - { - "epoch": 1.03, - "learning_rate": 1.5256375883413566e-06, - "loss": 0.4795, - "step": 40278 - }, - { - "epoch": 1.03, - "learning_rate": 1.525614048646977e-06, - "loss": 0.5117, - "step": 40279 - }, - { - "epoch": 1.03, - "learning_rate": 1.525590508550159e-06, - "loss": 0.5342, - "step": 40280 - }, - { - "epoch": 1.03, - "learning_rate": 1.5255669680509207e-06, - "loss": 0.7861, - "step": 40281 - }, - { - "epoch": 1.03, - "learning_rate": 1.5255434271492795e-06, - "loss": 0.6157, - "step": 40282 - }, - { - "epoch": 1.03, - "learning_rate": 1.525519885845254e-06, - "loss": 0.7637, - "step": 40283 - }, - { - "epoch": 1.03, - "learning_rate": 1.5254963441388623e-06, - "loss": 0.5264, - "step": 40284 - }, - { - "epoch": 1.03, - "learning_rate": 1.525472802030122e-06, - "loss": 0.7969, - "step": 40285 - }, - { - "epoch": 1.03, - "learning_rate": 1.525449259519051e-06, - "loss": 0.6885, - "step": 40286 - }, - { - "epoch": 1.03, - "learning_rate": 1.5254257166056683e-06, - "loss": 0.6055, - "step": 40287 - }, - { - "epoch": 1.03, - "learning_rate": 1.5254021732899908e-06, - "loss": 0.5337, - "step": 40288 - }, - { - "epoch": 1.03, - "learning_rate": 1.5253786295720373e-06, - "loss": 0.5103, - "step": 40289 - }, - { - "epoch": 1.03, - "learning_rate": 1.5253550854518254e-06, - "loss": 0.6118, - "step": 40290 - }, - { - "epoch": 1.03, - "learning_rate": 1.5253315409293735e-06, - "loss": 0.6953, - "step": 40291 - }, - { - "epoch": 1.03, - "learning_rate": 1.5253079960046994e-06, - "loss": 0.6436, - "step": 40292 - }, - { - "epoch": 1.03, - "learning_rate": 1.525284450677821e-06, - "loss": 0.5806, - "step": 40293 - }, - { - "epoch": 1.03, - "learning_rate": 1.5252609049487562e-06, - "loss": 0.6138, - "step": 40294 - }, - { - "epoch": 1.03, - "learning_rate": 1.5252373588175234e-06, - "loss": 0.54, - "step": 40295 - }, - { - "epoch": 1.03, - "learning_rate": 1.5252138122841407e-06, - "loss": 0.7461, - "step": 40296 - }, - { - "epoch": 1.03, - "learning_rate": 1.5251902653486258e-06, - "loss": 0.6733, - "step": 40297 - }, - { - "epoch": 1.03, - "learning_rate": 1.5251667180109968e-06, - "loss": 0.6885, - "step": 40298 - }, - { - "epoch": 1.03, - "learning_rate": 1.5251431702712717e-06, - "loss": 0.7227, - "step": 40299 - }, - { - "epoch": 1.03, - "learning_rate": 1.5251196221294688e-06, - "loss": 0.7637, - "step": 40300 - }, - { - "epoch": 1.03, - "learning_rate": 1.5250960735856062e-06, - "loss": 0.7246, - "step": 40301 - }, - { - "epoch": 1.03, - "learning_rate": 1.5250725246397016e-06, - "loss": 0.5972, - "step": 40302 - }, - { - "epoch": 1.03, - "learning_rate": 1.5250489752917725e-06, - "loss": 0.6389, - "step": 40303 - }, - { - "epoch": 1.03, - "learning_rate": 1.5250254255418383e-06, - "loss": 0.5925, - "step": 40304 - }, - { - "epoch": 1.03, - "learning_rate": 1.5250018753899157e-06, - "loss": 0.7173, - "step": 40305 - }, - { - "epoch": 1.03, - "learning_rate": 1.5249783248360238e-06, - "loss": 0.8154, - "step": 40306 - }, - { - "epoch": 1.03, - "learning_rate": 1.5249547738801798e-06, - "loss": 0.6221, - "step": 40307 - }, - { - "epoch": 1.03, - "learning_rate": 1.5249312225224022e-06, - "loss": 0.751, - "step": 40308 - }, - { - "epoch": 1.03, - "learning_rate": 1.5249076707627086e-06, - "loss": 0.6816, - "step": 40309 - }, - { - "epoch": 1.03, - "learning_rate": 1.5248841186011179e-06, - "loss": 0.5701, - "step": 40310 - }, - { - "epoch": 1.03, - "learning_rate": 1.5248605660376473e-06, - "loss": 0.71, - "step": 40311 - }, - { - "epoch": 1.03, - "learning_rate": 1.524837013072315e-06, - "loss": 0.7207, - "step": 40312 - }, - { - "epoch": 1.03, - "learning_rate": 1.5248134597051393e-06, - "loss": 0.7822, - "step": 40313 - }, - { - "epoch": 1.03, - "learning_rate": 1.5247899059361378e-06, - "loss": 0.6758, - "step": 40314 - }, - { - "epoch": 1.03, - "learning_rate": 1.5247663517653288e-06, - "loss": 0.7402, - "step": 40315 - }, - { - "epoch": 1.03, - "learning_rate": 1.5247427971927306e-06, - "loss": 0.6343, - "step": 40316 - }, - { - "epoch": 1.03, - "learning_rate": 1.524719242218361e-06, - "loss": 0.7012, - "step": 40317 - }, - { - "epoch": 1.03, - "learning_rate": 1.5246956868422377e-06, - "loss": 0.7842, - "step": 40318 - }, - { - "epoch": 1.03, - "learning_rate": 1.5246721310643792e-06, - "loss": 0.4756, - "step": 40319 - }, - { - "epoch": 1.03, - "learning_rate": 1.5246485748848032e-06, - "loss": 0.79, - "step": 40320 - }, - { - "epoch": 1.03, - "learning_rate": 1.5246250183035282e-06, - "loss": 0.7021, - "step": 40321 - }, - { - "epoch": 1.03, - "learning_rate": 1.524601461320572e-06, - "loss": 0.4829, - "step": 40322 - }, - { - "epoch": 1.03, - "learning_rate": 1.5245779039359523e-06, - "loss": 0.8398, - "step": 40323 - }, - { - "epoch": 1.03, - "learning_rate": 1.5245543461496874e-06, - "loss": 0.668, - "step": 40324 - }, - { - "epoch": 1.03, - "learning_rate": 1.5245307879617957e-06, - "loss": 0.4725, - "step": 40325 - }, - { - "epoch": 1.03, - "learning_rate": 1.5245072293722947e-06, - "loss": 0.6436, - "step": 40326 - }, - { - "epoch": 1.03, - "learning_rate": 1.5244836703812025e-06, - "loss": 0.6104, - "step": 40327 - }, - { - "epoch": 1.03, - "learning_rate": 1.5244601109885373e-06, - "loss": 0.5908, - "step": 40328 - }, - { - "epoch": 1.03, - "learning_rate": 1.5244365511943173e-06, - "loss": 0.6895, - "step": 40329 - }, - { - "epoch": 1.03, - "learning_rate": 1.5244129909985604e-06, - "loss": 0.6528, - "step": 40330 - }, - { - "epoch": 1.03, - "learning_rate": 1.5243894304012841e-06, - "loss": 0.5469, - "step": 40331 - }, - { - "epoch": 1.03, - "learning_rate": 1.5243658694025074e-06, - "loss": 0.5938, - "step": 40332 - }, - { - "epoch": 1.03, - "learning_rate": 1.5243423080022475e-06, - "loss": 0.71, - "step": 40333 - }, - { - "epoch": 1.03, - "learning_rate": 1.5243187462005232e-06, - "loss": 0.6094, - "step": 40334 - }, - { - "epoch": 1.03, - "learning_rate": 1.5242951839973518e-06, - "loss": 0.4534, - "step": 40335 - }, - { - "epoch": 1.03, - "learning_rate": 1.524271621392752e-06, - "loss": 0.5657, - "step": 40336 - }, - { - "epoch": 1.03, - "learning_rate": 1.5242480583867415e-06, - "loss": 0.5425, - "step": 40337 - }, - { - "epoch": 1.03, - "learning_rate": 1.524224494979338e-06, - "loss": 0.7715, - "step": 40338 - }, - { - "epoch": 1.03, - "learning_rate": 1.52420093117056e-06, - "loss": 0.5151, - "step": 40339 - }, - { - "epoch": 1.03, - "learning_rate": 1.524177366960426e-06, - "loss": 0.4988, - "step": 40340 - }, - { - "epoch": 1.03, - "learning_rate": 1.524153802348953e-06, - "loss": 0.5723, - "step": 40341 - }, - { - "epoch": 1.03, - "learning_rate": 1.5241302373361597e-06, - "loss": 0.7637, - "step": 40342 - }, - { - "epoch": 1.03, - "learning_rate": 1.5241066719220639e-06, - "loss": 0.7871, - "step": 40343 - }, - { - "epoch": 1.03, - "learning_rate": 1.5240831061066837e-06, - "loss": 0.7754, - "step": 40344 - }, - { - "epoch": 1.03, - "learning_rate": 1.5240595398900373e-06, - "loss": 0.8291, - "step": 40345 - }, - { - "epoch": 1.03, - "learning_rate": 1.5240359732721425e-06, - "loss": 0.5913, - "step": 40346 - }, - { - "epoch": 1.03, - "learning_rate": 1.5240124062530173e-06, - "loss": 0.6699, - "step": 40347 - }, - { - "epoch": 1.03, - "learning_rate": 1.5239888388326803e-06, - "loss": 0.5947, - "step": 40348 - }, - { - "epoch": 1.03, - "learning_rate": 1.5239652710111485e-06, - "loss": 0.5684, - "step": 40349 - }, - { - "epoch": 1.03, - "learning_rate": 1.5239417027884411e-06, - "loss": 0.8799, - "step": 40350 - }, - { - "epoch": 1.03, - "learning_rate": 1.5239181341645754e-06, - "loss": 0.7676, - "step": 40351 - }, - { - "epoch": 1.03, - "learning_rate": 1.52389456513957e-06, - "loss": 0.541, - "step": 40352 - }, - { - "epoch": 1.03, - "learning_rate": 1.5238709957134424e-06, - "loss": 0.6797, - "step": 40353 - }, - { - "epoch": 1.03, - "learning_rate": 1.5238474258862107e-06, - "loss": 0.5947, - "step": 40354 - }, - { - "epoch": 1.03, - "learning_rate": 1.5238238556578934e-06, - "loss": 0.5814, - "step": 40355 - }, - { - "epoch": 1.03, - "learning_rate": 1.523800285028508e-06, - "loss": 0.6206, - "step": 40356 - }, - { - "epoch": 1.03, - "learning_rate": 1.5237767139980732e-06, - "loss": 0.5498, - "step": 40357 - }, - { - "epoch": 1.03, - "learning_rate": 1.5237531425666062e-06, - "loss": 0.6699, - "step": 40358 - }, - { - "epoch": 1.03, - "learning_rate": 1.5237295707341256e-06, - "loss": 0.4746, - "step": 40359 - }, - { - "epoch": 1.03, - "learning_rate": 1.5237059985006495e-06, - "loss": 0.6567, - "step": 40360 - }, - { - "epoch": 1.03, - "learning_rate": 1.523682425866196e-06, - "loss": 0.6768, - "step": 40361 - }, - { - "epoch": 1.03, - "learning_rate": 1.5236588528307826e-06, - "loss": 0.6885, - "step": 40362 - }, - { - "epoch": 1.03, - "learning_rate": 1.5236352793944275e-06, - "loss": 0.6006, - "step": 40363 - }, - { - "epoch": 1.03, - "learning_rate": 1.5236117055571494e-06, - "loss": 0.6377, - "step": 40364 - }, - { - "epoch": 1.03, - "learning_rate": 1.5235881313189659e-06, - "loss": 0.5483, - "step": 40365 - }, - { - "epoch": 1.03, - "learning_rate": 1.5235645566798948e-06, - "loss": 0.8823, - "step": 40366 - }, - { - "epoch": 1.03, - "learning_rate": 1.5235409816399544e-06, - "loss": 0.6074, - "step": 40367 - }, - { - "epoch": 1.03, - "learning_rate": 1.5235174061991628e-06, - "loss": 0.7422, - "step": 40368 - }, - { - "epoch": 1.03, - "learning_rate": 1.523493830357538e-06, - "loss": 0.4232, - "step": 40369 - }, - { - "epoch": 1.03, - "learning_rate": 1.5234702541150978e-06, - "loss": 0.7109, - "step": 40370 - }, - { - "epoch": 1.03, - "learning_rate": 1.523446677471861e-06, - "loss": 0.6235, - "step": 40371 - }, - { - "epoch": 1.03, - "learning_rate": 1.5234231004278449e-06, - "loss": 0.7852, - "step": 40372 - }, - { - "epoch": 1.03, - "learning_rate": 1.5233995229830678e-06, - "loss": 0.6987, - "step": 40373 - }, - { - "epoch": 1.03, - "learning_rate": 1.5233759451375473e-06, - "loss": 0.4094, - "step": 40374 - }, - { - "epoch": 1.03, - "learning_rate": 1.5233523668913026e-06, - "loss": 0.5972, - "step": 40375 - }, - { - "epoch": 1.03, - "learning_rate": 1.523328788244351e-06, - "loss": 0.7012, - "step": 40376 - }, - { - "epoch": 1.03, - "learning_rate": 1.5233052091967103e-06, - "loss": 0.5234, - "step": 40377 - }, - { - "epoch": 1.03, - "learning_rate": 1.523281629748399e-06, - "loss": 0.644, - "step": 40378 - }, - { - "epoch": 1.03, - "learning_rate": 1.5232580498994347e-06, - "loss": 0.6631, - "step": 40379 - }, - { - "epoch": 1.03, - "learning_rate": 1.5232344696498363e-06, - "loss": 0.6074, - "step": 40380 - }, - { - "epoch": 1.03, - "learning_rate": 1.523210888999621e-06, - "loss": 0.4011, - "step": 40381 - }, - { - "epoch": 1.04, - "learning_rate": 1.5231873079488074e-06, - "loss": 0.5046, - "step": 40382 - }, - { - "epoch": 1.04, - "learning_rate": 1.5231637264974131e-06, - "loss": 0.6401, - "step": 40383 - }, - { - "epoch": 1.04, - "learning_rate": 1.5231401446454567e-06, - "loss": 0.7139, - "step": 40384 - }, - { - "epoch": 1.04, - "learning_rate": 1.5231165623929555e-06, - "loss": 0.5261, - "step": 40385 - }, - { - "epoch": 1.04, - "learning_rate": 1.5230929797399283e-06, - "loss": 0.6899, - "step": 40386 - }, - { - "epoch": 1.04, - "learning_rate": 1.5230693966863925e-06, - "loss": 0.6279, - "step": 40387 - }, - { - "epoch": 1.04, - "learning_rate": 1.5230458132323669e-06, - "loss": 0.6777, - "step": 40388 - }, - { - "epoch": 1.04, - "learning_rate": 1.5230222293778692e-06, - "loss": 0.627, - "step": 40389 - }, - { - "epoch": 1.04, - "learning_rate": 1.5229986451229175e-06, - "loss": 0.5352, - "step": 40390 - }, - { - "epoch": 1.04, - "learning_rate": 1.5229750604675294e-06, - "loss": 0.7959, - "step": 40391 - }, - { - "epoch": 1.04, - "learning_rate": 1.5229514754117236e-06, - "loss": 0.6255, - "step": 40392 - }, - { - "epoch": 1.04, - "learning_rate": 1.5229278899555179e-06, - "loss": 0.6455, - "step": 40393 - }, - { - "epoch": 1.04, - "learning_rate": 1.5229043040989303e-06, - "loss": 0.6836, - "step": 40394 - }, - { - "epoch": 1.04, - "learning_rate": 1.522880717841979e-06, - "loss": 0.6016, - "step": 40395 - }, - { - "epoch": 1.04, - "learning_rate": 1.5228571311846817e-06, - "loss": 0.6416, - "step": 40396 - }, - { - "epoch": 1.04, - "learning_rate": 1.522833544127057e-06, - "loss": 0.5962, - "step": 40397 - }, - { - "epoch": 1.04, - "learning_rate": 1.5228099566691225e-06, - "loss": 0.6313, - "step": 40398 - }, - { - "epoch": 1.04, - "learning_rate": 1.5227863688108966e-06, - "loss": 0.7266, - "step": 40399 - }, - { - "epoch": 1.04, - "learning_rate": 1.5227627805523973e-06, - "loss": 0.6001, - "step": 40400 - }, - { - "epoch": 1.04, - "learning_rate": 1.5227391918936424e-06, - "loss": 0.5508, - "step": 40401 - }, - { - "epoch": 1.04, - "learning_rate": 1.52271560283465e-06, - "loss": 0.8496, - "step": 40402 - }, - { - "epoch": 1.04, - "learning_rate": 1.5226920133754387e-06, - "loss": 0.7344, - "step": 40403 - }, - { - "epoch": 1.04, - "learning_rate": 1.5226684235160258e-06, - "loss": 0.79, - "step": 40404 - }, - { - "epoch": 1.04, - "learning_rate": 1.52264483325643e-06, - "loss": 0.7139, - "step": 40405 - }, - { - "epoch": 1.04, - "learning_rate": 1.5226212425966689e-06, - "loss": 0.626, - "step": 40406 - }, - { - "epoch": 1.04, - "learning_rate": 1.522597651536761e-06, - "loss": 0.8154, - "step": 40407 - }, - { - "epoch": 1.04, - "learning_rate": 1.5225740600767238e-06, - "loss": 0.6572, - "step": 40408 - }, - { - "epoch": 1.04, - "learning_rate": 1.5225504682165759e-06, - "loss": 0.6587, - "step": 40409 - }, - { - "epoch": 1.04, - "learning_rate": 1.522526875956335e-06, - "loss": 0.5928, - "step": 40410 - }, - { - "epoch": 1.04, - "learning_rate": 1.5225032832960194e-06, - "loss": 0.6729, - "step": 40411 - }, - { - "epoch": 1.04, - "learning_rate": 1.522479690235647e-06, - "loss": 0.604, - "step": 40412 - }, - { - "epoch": 1.04, - "learning_rate": 1.5224560967752357e-06, - "loss": 0.5864, - "step": 40413 - }, - { - "epoch": 1.04, - "learning_rate": 1.5224325029148042e-06, - "loss": 0.709, - "step": 40414 - }, - { - "epoch": 1.04, - "learning_rate": 1.5224089086543702e-06, - "loss": 0.5889, - "step": 40415 - }, - { - "epoch": 1.04, - "learning_rate": 1.522385313993951e-06, - "loss": 0.6445, - "step": 40416 - }, - { - "epoch": 1.04, - "learning_rate": 1.5223617189335661e-06, - "loss": 0.7227, - "step": 40417 - }, - { - "epoch": 1.04, - "learning_rate": 1.5223381234732324e-06, - "loss": 0.7354, - "step": 40418 - }, - { - "epoch": 1.04, - "learning_rate": 1.522314527612969e-06, - "loss": 0.5986, - "step": 40419 - }, - { - "epoch": 1.04, - "learning_rate": 1.5222909313527929e-06, - "loss": 0.6914, - "step": 40420 - }, - { - "epoch": 1.04, - "learning_rate": 1.5222673346927227e-06, - "loss": 0.752, - "step": 40421 - }, - { - "epoch": 1.04, - "learning_rate": 1.5222437376327766e-06, - "loss": 0.5867, - "step": 40422 - }, - { - "epoch": 1.04, - "learning_rate": 1.5222201401729722e-06, - "loss": 0.793, - "step": 40423 - }, - { - "epoch": 1.04, - "learning_rate": 1.522196542313328e-06, - "loss": 0.5144, - "step": 40424 - }, - { - "epoch": 1.04, - "learning_rate": 1.5221729440538619e-06, - "loss": 0.583, - "step": 40425 - }, - { - "epoch": 1.04, - "learning_rate": 1.5221493453945922e-06, - "loss": 0.6421, - "step": 40426 - }, - { - "epoch": 1.04, - "learning_rate": 1.5221257463355364e-06, - "loss": 0.748, - "step": 40427 - }, - { - "epoch": 1.04, - "learning_rate": 1.5221021468767131e-06, - "loss": 0.6304, - "step": 40428 - }, - { - "epoch": 1.04, - "learning_rate": 1.52207854701814e-06, - "loss": 0.6172, - "step": 40429 - }, - { - "epoch": 1.04, - "learning_rate": 1.522054946759836e-06, - "loss": 0.6213, - "step": 40430 - }, - { - "epoch": 1.04, - "learning_rate": 1.522031346101818e-06, - "loss": 0.5044, - "step": 40431 - }, - { - "epoch": 1.04, - "learning_rate": 1.5220077450441044e-06, - "loss": 0.7559, - "step": 40432 - }, - { - "epoch": 1.04, - "learning_rate": 1.5219841435867139e-06, - "loss": 0.6606, - "step": 40433 - }, - { - "epoch": 1.04, - "learning_rate": 1.5219605417296642e-06, - "loss": 0.8555, - "step": 40434 - }, - { - "epoch": 1.04, - "learning_rate": 1.5219369394729729e-06, - "loss": 0.8516, - "step": 40435 - }, - { - "epoch": 1.04, - "learning_rate": 1.521913336816659e-06, - "loss": 0.6143, - "step": 40436 - }, - { - "epoch": 1.04, - "learning_rate": 1.5218897337607395e-06, - "loss": 0.4189, - "step": 40437 - }, - { - "epoch": 1.04, - "learning_rate": 1.5218661303052334e-06, - "loss": 0.7725, - "step": 40438 - }, - { - "epoch": 1.04, - "learning_rate": 1.521842526450158e-06, - "loss": 0.6233, - "step": 40439 - }, - { - "epoch": 1.04, - "learning_rate": 1.5218189221955323e-06, - "loss": 0.5842, - "step": 40440 - }, - { - "epoch": 1.04, - "learning_rate": 1.5217953175413735e-06, - "loss": 0.7676, - "step": 40441 - }, - { - "epoch": 1.04, - "learning_rate": 1.5217717124877e-06, - "loss": 0.7979, - "step": 40442 - }, - { - "epoch": 1.04, - "learning_rate": 1.5217481070345302e-06, - "loss": 0.6738, - "step": 40443 - }, - { - "epoch": 1.04, - "learning_rate": 1.5217245011818815e-06, - "loss": 0.7178, - "step": 40444 - }, - { - "epoch": 1.04, - "learning_rate": 1.5217008949297726e-06, - "loss": 0.7837, - "step": 40445 - }, - { - "epoch": 1.04, - "learning_rate": 1.5216772882782213e-06, - "loss": 0.5835, - "step": 40446 - }, - { - "epoch": 1.04, - "learning_rate": 1.5216536812272456e-06, - "loss": 0.6338, - "step": 40447 - }, - { - "epoch": 1.04, - "learning_rate": 1.5216300737768638e-06, - "loss": 0.7324, - "step": 40448 - }, - { - "epoch": 1.04, - "learning_rate": 1.5216064659270935e-06, - "loss": 0.6895, - "step": 40449 - }, - { - "epoch": 1.04, - "learning_rate": 1.5215828576779535e-06, - "loss": 0.8125, - "step": 40450 - }, - { - "epoch": 1.04, - "learning_rate": 1.5215592490294613e-06, - "loss": 0.7451, - "step": 40451 - }, - { - "epoch": 1.04, - "learning_rate": 1.5215356399816351e-06, - "loss": 0.6187, - "step": 40452 - }, - { - "epoch": 1.04, - "learning_rate": 1.521512030534493e-06, - "loss": 0.6387, - "step": 40453 - }, - { - "epoch": 1.04, - "learning_rate": 1.5214884206880534e-06, - "loss": 0.5664, - "step": 40454 - }, - { - "epoch": 1.04, - "learning_rate": 1.521464810442334e-06, - "loss": 0.603, - "step": 40455 - }, - { - "epoch": 1.04, - "learning_rate": 1.5214411997973528e-06, - "loss": 0.7222, - "step": 40456 - }, - { - "epoch": 1.04, - "learning_rate": 1.5214175887531283e-06, - "loss": 0.5889, - "step": 40457 - }, - { - "epoch": 1.04, - "learning_rate": 1.521393977309678e-06, - "loss": 0.5972, - "step": 40458 - }, - { - "epoch": 1.04, - "learning_rate": 1.5213703654670206e-06, - "loss": 0.6072, - "step": 40459 - }, - { - "epoch": 1.04, - "learning_rate": 1.5213467532251738e-06, - "loss": 0.7725, - "step": 40460 - }, - { - "epoch": 1.04, - "learning_rate": 1.5213231405841559e-06, - "loss": 0.668, - "step": 40461 - }, - { - "epoch": 1.04, - "learning_rate": 1.5212995275439843e-06, - "loss": 0.584, - "step": 40462 - }, - { - "epoch": 1.04, - "learning_rate": 1.5212759141046783e-06, - "loss": 0.6094, - "step": 40463 - }, - { - "epoch": 1.04, - "learning_rate": 1.521252300266255e-06, - "loss": 0.5981, - "step": 40464 - }, - { - "epoch": 1.04, - "learning_rate": 1.5212286860287326e-06, - "loss": 0.7305, - "step": 40465 - }, - { - "epoch": 1.04, - "learning_rate": 1.5212050713921297e-06, - "loss": 0.8506, - "step": 40466 - }, - { - "epoch": 1.04, - "learning_rate": 1.5211814563564639e-06, - "loss": 0.8486, - "step": 40467 - }, - { - "epoch": 1.04, - "learning_rate": 1.5211578409217534e-06, - "loss": 0.7109, - "step": 40468 - }, - { - "epoch": 1.04, - "learning_rate": 1.5211342250880161e-06, - "loss": 0.8027, - "step": 40469 - }, - { - "epoch": 1.04, - "learning_rate": 1.5211106088552708e-06, - "loss": 0.6729, - "step": 40470 - }, - { - "epoch": 1.04, - "learning_rate": 1.5210869922235347e-06, - "loss": 0.5884, - "step": 40471 - }, - { - "epoch": 1.04, - "learning_rate": 1.5210633751928264e-06, - "loss": 0.6777, - "step": 40472 - }, - { - "epoch": 1.04, - "learning_rate": 1.5210397577631636e-06, - "loss": 0.4399, - "step": 40473 - }, - { - "epoch": 1.04, - "learning_rate": 1.5210161399345646e-06, - "loss": 0.7061, - "step": 40474 - }, - { - "epoch": 1.04, - "learning_rate": 1.5209925217070478e-06, - "loss": 0.748, - "step": 40475 - }, - { - "epoch": 1.04, - "learning_rate": 1.520968903080631e-06, - "loss": 0.5837, - "step": 40476 - }, - { - "epoch": 1.04, - "learning_rate": 1.5209452840553319e-06, - "loss": 0.6499, - "step": 40477 - }, - { - "epoch": 1.04, - "learning_rate": 1.5209216646311693e-06, - "loss": 0.6855, - "step": 40478 - }, - { - "epoch": 1.04, - "learning_rate": 1.5208980448081607e-06, - "loss": 0.5562, - "step": 40479 - }, - { - "epoch": 1.04, - "learning_rate": 1.5208744245863248e-06, - "loss": 0.6074, - "step": 40480 - }, - { - "epoch": 1.04, - "learning_rate": 1.5208508039656788e-06, - "loss": 0.7148, - "step": 40481 - }, - { - "epoch": 1.04, - "learning_rate": 1.5208271829462417e-06, - "loss": 0.6978, - "step": 40482 - }, - { - "epoch": 1.04, - "learning_rate": 1.5208035615280308e-06, - "loss": 0.6479, - "step": 40483 - }, - { - "epoch": 1.04, - "learning_rate": 1.5207799397110648e-06, - "loss": 0.71, - "step": 40484 - }, - { - "epoch": 1.04, - "learning_rate": 1.5207563174953615e-06, - "loss": 0.6284, - "step": 40485 - }, - { - "epoch": 1.04, - "learning_rate": 1.5207326948809392e-06, - "loss": 0.5625, - "step": 40486 - }, - { - "epoch": 1.04, - "learning_rate": 1.5207090718678154e-06, - "loss": 0.6055, - "step": 40487 - }, - { - "epoch": 1.04, - "learning_rate": 1.520685448456009e-06, - "loss": 0.7305, - "step": 40488 - }, - { - "epoch": 1.04, - "learning_rate": 1.5206618246455375e-06, - "loss": 0.5854, - "step": 40489 - }, - { - "epoch": 1.04, - "learning_rate": 1.5206382004364193e-06, - "loss": 0.6509, - "step": 40490 - }, - { - "epoch": 1.04, - "learning_rate": 1.5206145758286724e-06, - "loss": 0.386, - "step": 40491 - }, - { - "epoch": 1.04, - "learning_rate": 1.5205909508223145e-06, - "loss": 0.7158, - "step": 40492 - }, - { - "epoch": 1.04, - "learning_rate": 1.5205673254173643e-06, - "loss": 0.8535, - "step": 40493 - }, - { - "epoch": 1.04, - "learning_rate": 1.5205436996138396e-06, - "loss": 0.5479, - "step": 40494 - }, - { - "epoch": 1.04, - "learning_rate": 1.5205200734117588e-06, - "loss": 0.7324, - "step": 40495 - }, - { - "epoch": 1.04, - "learning_rate": 1.5204964468111392e-06, - "loss": 0.563, - "step": 40496 - }, - { - "epoch": 1.04, - "learning_rate": 1.5204728198119997e-06, - "loss": 0.585, - "step": 40497 - }, - { - "epoch": 1.04, - "learning_rate": 1.5204491924143582e-06, - "loss": 0.6235, - "step": 40498 - }, - { - "epoch": 1.04, - "learning_rate": 1.5204255646182325e-06, - "loss": 0.6855, - "step": 40499 - }, - { - "epoch": 1.04, - "learning_rate": 1.520401936423641e-06, - "loss": 0.6653, - "step": 40500 - }, - { - "epoch": 1.04, - "learning_rate": 1.5203783078306018e-06, - "loss": 0.543, - "step": 40501 - }, - { - "epoch": 1.04, - "learning_rate": 1.5203546788391325e-06, - "loss": 0.5723, - "step": 40502 - }, - { - "epoch": 1.04, - "learning_rate": 1.5203310494492518e-06, - "loss": 0.5845, - "step": 40503 - }, - { - "epoch": 1.04, - "learning_rate": 1.5203074196609773e-06, - "loss": 0.7695, - "step": 40504 - }, - { - "epoch": 1.04, - "learning_rate": 1.5202837894743277e-06, - "loss": 0.6367, - "step": 40505 - }, - { - "epoch": 1.04, - "learning_rate": 1.5202601588893202e-06, - "loss": 0.7603, - "step": 40506 - }, - { - "epoch": 1.04, - "learning_rate": 1.5202365279059739e-06, - "loss": 0.8838, - "step": 40507 - }, - { - "epoch": 1.04, - "learning_rate": 1.5202128965243062e-06, - "loss": 0.4742, - "step": 40508 - }, - { - "epoch": 1.04, - "learning_rate": 1.5201892647443356e-06, - "loss": 0.7246, - "step": 40509 - }, - { - "epoch": 1.04, - "learning_rate": 1.5201656325660797e-06, - "loss": 0.8027, - "step": 40510 - }, - { - "epoch": 1.04, - "learning_rate": 1.520141999989557e-06, - "loss": 0.6396, - "step": 40511 - }, - { - "epoch": 1.04, - "learning_rate": 1.5201183670147855e-06, - "loss": 0.5498, - "step": 40512 - }, - { - "epoch": 1.04, - "learning_rate": 1.520094733641783e-06, - "loss": 0.7988, - "step": 40513 - }, - { - "epoch": 1.04, - "learning_rate": 1.5200710998705683e-06, - "loss": 0.708, - "step": 40514 - }, - { - "epoch": 1.04, - "learning_rate": 1.5200474657011592e-06, - "loss": 0.4792, - "step": 40515 - }, - { - "epoch": 1.04, - "learning_rate": 1.5200238311335733e-06, - "loss": 0.6484, - "step": 40516 - }, - { - "epoch": 1.04, - "learning_rate": 1.5200001961678291e-06, - "loss": 0.6699, - "step": 40517 - }, - { - "epoch": 1.04, - "learning_rate": 1.5199765608039447e-06, - "loss": 0.6582, - "step": 40518 - }, - { - "epoch": 1.04, - "learning_rate": 1.5199529250419384e-06, - "loss": 0.7158, - "step": 40519 - }, - { - "epoch": 1.04, - "learning_rate": 1.519929288881828e-06, - "loss": 0.4893, - "step": 40520 - }, - { - "epoch": 1.04, - "learning_rate": 1.5199056523236314e-06, - "loss": 0.6567, - "step": 40521 - }, - { - "epoch": 1.04, - "learning_rate": 1.519882015367367e-06, - "loss": 0.5781, - "step": 40522 - }, - { - "epoch": 1.04, - "learning_rate": 1.519858378013053e-06, - "loss": 0.7354, - "step": 40523 - }, - { - "epoch": 1.04, - "learning_rate": 1.5198347402607073e-06, - "loss": 0.5266, - "step": 40524 - }, - { - "epoch": 1.04, - "learning_rate": 1.519811102110348e-06, - "loss": 0.6797, - "step": 40525 - }, - { - "epoch": 1.04, - "learning_rate": 1.5197874635619932e-06, - "loss": 0.6914, - "step": 40526 - }, - { - "epoch": 1.04, - "learning_rate": 1.5197638246156607e-06, - "loss": 0.792, - "step": 40527 - }, - { - "epoch": 1.04, - "learning_rate": 1.5197401852713695e-06, - "loss": 0.5337, - "step": 40528 - }, - { - "epoch": 1.04, - "learning_rate": 1.5197165455291368e-06, - "loss": 0.6191, - "step": 40529 - }, - { - "epoch": 1.04, - "learning_rate": 1.5196929053889813e-06, - "loss": 0.6255, - "step": 40530 - }, - { - "epoch": 1.04, - "learning_rate": 1.5196692648509205e-06, - "loss": 0.4441, - "step": 40531 - }, - { - "epoch": 1.04, - "learning_rate": 1.5196456239149733e-06, - "loss": 0.6846, - "step": 40532 - }, - { - "epoch": 1.04, - "learning_rate": 1.519621982581157e-06, - "loss": 0.8418, - "step": 40533 - }, - { - "epoch": 1.04, - "learning_rate": 1.5195983408494901e-06, - "loss": 0.6123, - "step": 40534 - }, - { - "epoch": 1.04, - "learning_rate": 1.5195746987199909e-06, - "loss": 0.7637, - "step": 40535 - }, - { - "epoch": 1.04, - "learning_rate": 1.519551056192677e-06, - "loss": 0.6226, - "step": 40536 - }, - { - "epoch": 1.04, - "learning_rate": 1.5195274132675667e-06, - "loss": 0.8047, - "step": 40537 - }, - { - "epoch": 1.04, - "learning_rate": 1.519503769944678e-06, - "loss": 0.5977, - "step": 40538 - }, - { - "epoch": 1.04, - "learning_rate": 1.5194801262240296e-06, - "loss": 0.729, - "step": 40539 - }, - { - "epoch": 1.04, - "learning_rate": 1.519456482105639e-06, - "loss": 0.7217, - "step": 40540 - }, - { - "epoch": 1.04, - "learning_rate": 1.5194328375895244e-06, - "loss": 0.7568, - "step": 40541 - }, - { - "epoch": 1.04, - "learning_rate": 1.5194091926757037e-06, - "loss": 0.8535, - "step": 40542 - }, - { - "epoch": 1.04, - "learning_rate": 1.5193855473641954e-06, - "loss": 0.6567, - "step": 40543 - }, - { - "epoch": 1.04, - "learning_rate": 1.5193619016550175e-06, - "loss": 0.5603, - "step": 40544 - }, - { - "epoch": 1.04, - "learning_rate": 1.5193382555481887e-06, - "loss": 0.7842, - "step": 40545 - }, - { - "epoch": 1.04, - "learning_rate": 1.5193146090437257e-06, - "loss": 0.6572, - "step": 40546 - }, - { - "epoch": 1.04, - "learning_rate": 1.5192909621416477e-06, - "loss": 0.6709, - "step": 40547 - }, - { - "epoch": 1.04, - "learning_rate": 1.5192673148419722e-06, - "loss": 0.6309, - "step": 40548 - }, - { - "epoch": 1.04, - "learning_rate": 1.519243667144718e-06, - "loss": 0.6934, - "step": 40549 - }, - { - "epoch": 1.04, - "learning_rate": 1.5192200190499024e-06, - "loss": 0.6299, - "step": 40550 - }, - { - "epoch": 1.04, - "learning_rate": 1.5191963705575442e-06, - "loss": 0.6904, - "step": 40551 - }, - { - "epoch": 1.04, - "learning_rate": 1.5191727216676608e-06, - "loss": 0.5981, - "step": 40552 - }, - { - "epoch": 1.04, - "learning_rate": 1.5191490723802711e-06, - "loss": 0.5366, - "step": 40553 - }, - { - "epoch": 1.04, - "learning_rate": 1.5191254226953928e-06, - "loss": 0.8164, - "step": 40554 - }, - { - "epoch": 1.04, - "learning_rate": 1.5191017726130442e-06, - "loss": 0.6646, - "step": 40555 - }, - { - "epoch": 1.04, - "learning_rate": 1.519078122133243e-06, - "loss": 0.4154, - "step": 40556 - }, - { - "epoch": 1.04, - "learning_rate": 1.5190544712560073e-06, - "loss": 0.7529, - "step": 40557 - }, - { - "epoch": 1.04, - "learning_rate": 1.519030819981356e-06, - "loss": 0.8037, - "step": 40558 - }, - { - "epoch": 1.04, - "learning_rate": 1.5190071683093063e-06, - "loss": 0.7627, - "step": 40559 - }, - { - "epoch": 1.04, - "learning_rate": 1.5189835162398769e-06, - "loss": 0.5725, - "step": 40560 - }, - { - "epoch": 1.04, - "learning_rate": 1.5189598637730855e-06, - "loss": 0.4363, - "step": 40561 - }, - { - "epoch": 1.04, - "learning_rate": 1.5189362109089502e-06, - "loss": 0.7212, - "step": 40562 - }, - { - "epoch": 1.04, - "learning_rate": 1.5189125576474897e-06, - "loss": 0.8066, - "step": 40563 - }, - { - "epoch": 1.04, - "learning_rate": 1.5188889039887215e-06, - "loss": 0.5254, - "step": 40564 - }, - { - "epoch": 1.04, - "learning_rate": 1.5188652499326642e-06, - "loss": 0.6772, - "step": 40565 - }, - { - "epoch": 1.04, - "learning_rate": 1.5188415954793355e-06, - "loss": 0.7446, - "step": 40566 - }, - { - "epoch": 1.04, - "learning_rate": 1.5188179406287534e-06, - "loss": 0.6738, - "step": 40567 - }, - { - "epoch": 1.04, - "learning_rate": 1.5187942853809364e-06, - "loss": 0.5142, - "step": 40568 - }, - { - "epoch": 1.04, - "learning_rate": 1.5187706297359025e-06, - "loss": 0.5776, - "step": 40569 - }, - { - "epoch": 1.04, - "learning_rate": 1.51874697369367e-06, - "loss": 0.5347, - "step": 40570 - }, - { - "epoch": 1.04, - "learning_rate": 1.5187233172542564e-06, - "loss": 0.584, - "step": 40571 - }, - { - "epoch": 1.04, - "learning_rate": 1.5186996604176804e-06, - "loss": 0.7168, - "step": 40572 - }, - { - "epoch": 1.04, - "learning_rate": 1.51867600318396e-06, - "loss": 0.6387, - "step": 40573 - }, - { - "epoch": 1.04, - "learning_rate": 1.5186523455531131e-06, - "loss": 0.7197, - "step": 40574 - }, - { - "epoch": 1.04, - "learning_rate": 1.5186286875251582e-06, - "loss": 0.7529, - "step": 40575 - }, - { - "epoch": 1.04, - "learning_rate": 1.5186050291001126e-06, - "loss": 0.7148, - "step": 40576 - }, - { - "epoch": 1.04, - "learning_rate": 1.5185813702779955e-06, - "loss": 0.6631, - "step": 40577 - }, - { - "epoch": 1.04, - "learning_rate": 1.5185577110588243e-06, - "loss": 0.5537, - "step": 40578 - }, - { - "epoch": 1.04, - "learning_rate": 1.5185340514426172e-06, - "loss": 0.6113, - "step": 40579 - }, - { - "epoch": 1.04, - "learning_rate": 1.5185103914293926e-06, - "loss": 0.5679, - "step": 40580 - }, - { - "epoch": 1.04, - "learning_rate": 1.5184867310191686e-06, - "loss": 0.7261, - "step": 40581 - }, - { - "epoch": 1.04, - "learning_rate": 1.5184630702119628e-06, - "loss": 0.7031, - "step": 40582 - }, - { - "epoch": 1.04, - "learning_rate": 1.5184394090077936e-06, - "loss": 0.6582, - "step": 40583 - }, - { - "epoch": 1.04, - "learning_rate": 1.5184157474066794e-06, - "loss": 0.6929, - "step": 40584 - }, - { - "epoch": 1.04, - "learning_rate": 1.5183920854086383e-06, - "loss": 0.7725, - "step": 40585 - }, - { - "epoch": 1.04, - "learning_rate": 1.518368423013688e-06, - "loss": 0.709, - "step": 40586 - }, - { - "epoch": 1.04, - "learning_rate": 1.518344760221847e-06, - "loss": 0.7246, - "step": 40587 - }, - { - "epoch": 1.04, - "learning_rate": 1.5183210970331329e-06, - "loss": 0.8008, - "step": 40588 - }, - { - "epoch": 1.04, - "learning_rate": 1.5182974334475644e-06, - "loss": 0.5173, - "step": 40589 - }, - { - "epoch": 1.04, - "learning_rate": 1.5182737694651593e-06, - "loss": 0.6841, - "step": 40590 - }, - { - "epoch": 1.04, - "learning_rate": 1.518250105085936e-06, - "loss": 0.958, - "step": 40591 - }, - { - "epoch": 1.04, - "learning_rate": 1.5182264403099121e-06, - "loss": 0.7412, - "step": 40592 - }, - { - "epoch": 1.04, - "learning_rate": 1.5182027751371062e-06, - "loss": 0.5449, - "step": 40593 - }, - { - "epoch": 1.04, - "learning_rate": 1.5181791095675363e-06, - "loss": 0.5693, - "step": 40594 - }, - { - "epoch": 1.04, - "learning_rate": 1.5181554436012208e-06, - "loss": 0.4109, - "step": 40595 - }, - { - "epoch": 1.04, - "learning_rate": 1.5181317772381767e-06, - "loss": 0.8389, - "step": 40596 - }, - { - "epoch": 1.04, - "learning_rate": 1.5181081104784234e-06, - "loss": 0.6709, - "step": 40597 - }, - { - "epoch": 1.04, - "learning_rate": 1.5180844433219785e-06, - "loss": 0.5879, - "step": 40598 - }, - { - "epoch": 1.04, - "learning_rate": 1.5180607757688603e-06, - "loss": 0.5242, - "step": 40599 - }, - { - "epoch": 1.04, - "learning_rate": 1.5180371078190867e-06, - "loss": 0.5996, - "step": 40600 - }, - { - "epoch": 1.04, - "learning_rate": 1.5180134394726758e-06, - "loss": 0.7129, - "step": 40601 - }, - { - "epoch": 1.04, - "learning_rate": 1.517989770729646e-06, - "loss": 0.6602, - "step": 40602 - }, - { - "epoch": 1.04, - "learning_rate": 1.5179661015900149e-06, - "loss": 0.8359, - "step": 40603 - }, - { - "epoch": 1.04, - "learning_rate": 1.5179424320538015e-06, - "loss": 0.5215, - "step": 40604 - }, - { - "epoch": 1.04, - "learning_rate": 1.517918762121023e-06, - "loss": 0.8633, - "step": 40605 - }, - { - "epoch": 1.04, - "learning_rate": 1.5178950917916984e-06, - "loss": 0.6104, - "step": 40606 - }, - { - "epoch": 1.04, - "learning_rate": 1.5178714210658448e-06, - "loss": 0.7324, - "step": 40607 - }, - { - "epoch": 1.04, - "learning_rate": 1.517847749943481e-06, - "loss": 0.6309, - "step": 40608 - }, - { - "epoch": 1.04, - "learning_rate": 1.517824078424625e-06, - "loss": 0.5833, - "step": 40609 - }, - { - "epoch": 1.04, - "learning_rate": 1.5178004065092952e-06, - "loss": 0.6011, - "step": 40610 - }, - { - "epoch": 1.04, - "learning_rate": 1.517776734197509e-06, - "loss": 0.7578, - "step": 40611 - }, - { - "epoch": 1.04, - "learning_rate": 1.517753061489285e-06, - "loss": 0.5625, - "step": 40612 - }, - { - "epoch": 1.04, - "learning_rate": 1.5177293883846414e-06, - "loss": 0.6104, - "step": 40613 - }, - { - "epoch": 1.04, - "learning_rate": 1.5177057148835965e-06, - "loss": 0.5913, - "step": 40614 - }, - { - "epoch": 1.04, - "learning_rate": 1.517682040986168e-06, - "loss": 0.6514, - "step": 40615 - }, - { - "epoch": 1.04, - "learning_rate": 1.517658366692374e-06, - "loss": 0.4094, - "step": 40616 - }, - { - "epoch": 1.04, - "learning_rate": 1.5176346920022327e-06, - "loss": 0.5706, - "step": 40617 - }, - { - "epoch": 1.04, - "learning_rate": 1.5176110169157625e-06, - "loss": 0.4463, - "step": 40618 - }, - { - "epoch": 1.04, - "learning_rate": 1.5175873414329817e-06, - "loss": 0.873, - "step": 40619 - }, - { - "epoch": 1.04, - "learning_rate": 1.5175636655539076e-06, - "loss": 0.5612, - "step": 40620 - }, - { - "epoch": 1.04, - "learning_rate": 1.5175399892785588e-06, - "loss": 0.5791, - "step": 40621 - }, - { - "epoch": 1.04, - "learning_rate": 1.5175163126069533e-06, - "loss": 0.6953, - "step": 40622 - }, - { - "epoch": 1.04, - "learning_rate": 1.5174926355391095e-06, - "loss": 0.5542, - "step": 40623 - }, - { - "epoch": 1.04, - "learning_rate": 1.5174689580750456e-06, - "loss": 0.666, - "step": 40624 - }, - { - "epoch": 1.04, - "learning_rate": 1.5174452802147794e-06, - "loss": 0.7822, - "step": 40625 - }, - { - "epoch": 1.04, - "learning_rate": 1.517421601958329e-06, - "loss": 0.7017, - "step": 40626 - }, - { - "epoch": 1.04, - "learning_rate": 1.5173979233057129e-06, - "loss": 0.4827, - "step": 40627 - }, - { - "epoch": 1.04, - "learning_rate": 1.5173742442569485e-06, - "loss": 0.6201, - "step": 40628 - }, - { - "epoch": 1.04, - "learning_rate": 1.5173505648120553e-06, - "loss": 0.7764, - "step": 40629 - }, - { - "epoch": 1.04, - "learning_rate": 1.51732688497105e-06, - "loss": 0.7295, - "step": 40630 - }, - { - "epoch": 1.04, - "learning_rate": 1.5173032047339513e-06, - "loss": 0.4941, - "step": 40631 - }, - { - "epoch": 1.04, - "learning_rate": 1.5172795241007771e-06, - "loss": 0.6138, - "step": 40632 - }, - { - "epoch": 1.04, - "learning_rate": 1.5172558430715462e-06, - "loss": 0.6318, - "step": 40633 - }, - { - "epoch": 1.04, - "learning_rate": 1.5172321616462761e-06, - "loss": 0.707, - "step": 40634 - }, - { - "epoch": 1.04, - "learning_rate": 1.5172084798249853e-06, - "loss": 0.6091, - "step": 40635 - }, - { - "epoch": 1.04, - "learning_rate": 1.5171847976076918e-06, - "loss": 0.6162, - "step": 40636 - }, - { - "epoch": 1.04, - "learning_rate": 1.5171611149944133e-06, - "loss": 0.4878, - "step": 40637 - }, - { - "epoch": 1.04, - "learning_rate": 1.5171374319851683e-06, - "loss": 0.6738, - "step": 40638 - }, - { - "epoch": 1.04, - "learning_rate": 1.5171137485799753e-06, - "loss": 0.6689, - "step": 40639 - }, - { - "epoch": 1.04, - "learning_rate": 1.517090064778852e-06, - "loss": 0.6592, - "step": 40640 - }, - { - "epoch": 1.04, - "learning_rate": 1.5170663805818164e-06, - "loss": 0.6792, - "step": 40641 - }, - { - "epoch": 1.04, - "learning_rate": 1.5170426959888868e-06, - "loss": 0.5596, - "step": 40642 - }, - { - "epoch": 1.04, - "learning_rate": 1.5170190110000818e-06, - "loss": 0.6206, - "step": 40643 - }, - { - "epoch": 1.04, - "learning_rate": 1.516995325615419e-06, - "loss": 0.6875, - "step": 40644 - }, - { - "epoch": 1.04, - "learning_rate": 1.5169716398349163e-06, - "loss": 0.5596, - "step": 40645 - }, - { - "epoch": 1.04, - "learning_rate": 1.5169479536585925e-06, - "loss": 0.635, - "step": 40646 - }, - { - "epoch": 1.04, - "learning_rate": 1.5169242670864652e-06, - "loss": 0.7812, - "step": 40647 - }, - { - "epoch": 1.04, - "learning_rate": 1.5169005801185529e-06, - "loss": 0.6138, - "step": 40648 - }, - { - "epoch": 1.04, - "learning_rate": 1.5168768927548737e-06, - "loss": 0.6475, - "step": 40649 - }, - { - "epoch": 1.04, - "learning_rate": 1.5168532049954455e-06, - "loss": 0.8105, - "step": 40650 - }, - { - "epoch": 1.04, - "learning_rate": 1.5168295168402865e-06, - "loss": 0.7295, - "step": 40651 - }, - { - "epoch": 1.04, - "learning_rate": 1.5168058282894148e-06, - "loss": 0.6816, - "step": 40652 - }, - { - "epoch": 1.04, - "learning_rate": 1.5167821393428488e-06, - "loss": 0.5415, - "step": 40653 - }, - { - "epoch": 1.04, - "learning_rate": 1.5167584500006068e-06, - "loss": 0.7202, - "step": 40654 - }, - { - "epoch": 1.04, - "learning_rate": 1.5167347602627061e-06, - "loss": 0.7695, - "step": 40655 - }, - { - "epoch": 1.04, - "learning_rate": 1.516711070129166e-06, - "loss": 0.5864, - "step": 40656 - }, - { - "epoch": 1.04, - "learning_rate": 1.516687379600003e-06, - "loss": 0.7266, - "step": 40657 - }, - { - "epoch": 1.04, - "learning_rate": 1.516663688675237e-06, - "loss": 0.6562, - "step": 40658 - }, - { - "epoch": 1.04, - "learning_rate": 1.5166399973548854e-06, - "loss": 0.5327, - "step": 40659 - }, - { - "epoch": 1.04, - "learning_rate": 1.516616305638966e-06, - "loss": 0.6802, - "step": 40660 - }, - { - "epoch": 1.04, - "learning_rate": 1.5165926135274974e-06, - "loss": 0.5801, - "step": 40661 - }, - { - "epoch": 1.04, - "learning_rate": 1.5165689210204976e-06, - "loss": 0.6855, - "step": 40662 - }, - { - "epoch": 1.04, - "learning_rate": 1.5165452281179842e-06, - "loss": 0.6265, - "step": 40663 - }, - { - "epoch": 1.04, - "learning_rate": 1.5165215348199764e-06, - "loss": 0.6411, - "step": 40664 - }, - { - "epoch": 1.04, - "learning_rate": 1.5164978411264918e-06, - "loss": 0.6924, - "step": 40665 - }, - { - "epoch": 1.04, - "learning_rate": 1.5164741470375485e-06, - "loss": 0.6748, - "step": 40666 - }, - { - "epoch": 1.04, - "learning_rate": 1.5164504525531645e-06, - "loss": 0.603, - "step": 40667 - }, - { - "epoch": 1.04, - "learning_rate": 1.5164267576733586e-06, - "loss": 0.5645, - "step": 40668 - }, - { - "epoch": 1.04, - "learning_rate": 1.5164030623981484e-06, - "loss": 0.6924, - "step": 40669 - }, - { - "epoch": 1.04, - "learning_rate": 1.5163793667275514e-06, - "loss": 0.6157, - "step": 40670 - }, - { - "epoch": 1.04, - "learning_rate": 1.5163556706615873e-06, - "loss": 0.6704, - "step": 40671 - }, - { - "epoch": 1.04, - "learning_rate": 1.5163319742002728e-06, - "loss": 0.468, - "step": 40672 - }, - { - "epoch": 1.04, - "learning_rate": 1.5163082773436271e-06, - "loss": 0.6323, - "step": 40673 - }, - { - "epoch": 1.04, - "learning_rate": 1.5162845800916678e-06, - "loss": 0.3464, - "step": 40674 - }, - { - "epoch": 1.04, - "learning_rate": 1.516260882444413e-06, - "loss": 0.7324, - "step": 40675 - }, - { - "epoch": 1.04, - "learning_rate": 1.516237184401881e-06, - "loss": 0.6392, - "step": 40676 - }, - { - "epoch": 1.04, - "learning_rate": 1.5162134859640898e-06, - "loss": 0.5283, - "step": 40677 - }, - { - "epoch": 1.04, - "learning_rate": 1.516189787131058e-06, - "loss": 0.7129, - "step": 40678 - }, - { - "epoch": 1.04, - "learning_rate": 1.5161660879028034e-06, - "loss": 0.7451, - "step": 40679 - }, - { - "epoch": 1.04, - "learning_rate": 1.5161423882793436e-06, - "loss": 0.7393, - "step": 40680 - }, - { - "epoch": 1.04, - "learning_rate": 1.5161186882606977e-06, - "loss": 0.7754, - "step": 40681 - }, - { - "epoch": 1.04, - "learning_rate": 1.5160949878468836e-06, - "loss": 0.5835, - "step": 40682 - }, - { - "epoch": 1.04, - "learning_rate": 1.5160712870379192e-06, - "loss": 0.7178, - "step": 40683 - }, - { - "epoch": 1.04, - "learning_rate": 1.5160475858338227e-06, - "loss": 0.501, - "step": 40684 - }, - { - "epoch": 1.04, - "learning_rate": 1.5160238842346122e-06, - "loss": 0.7383, - "step": 40685 - }, - { - "epoch": 1.04, - "learning_rate": 1.5160001822403062e-06, - "loss": 0.6548, - "step": 40686 - }, - { - "epoch": 1.04, - "learning_rate": 1.5159764798509222e-06, - "loss": 0.7207, - "step": 40687 - }, - { - "epoch": 1.04, - "learning_rate": 1.515952777066479e-06, - "loss": 0.7793, - "step": 40688 - }, - { - "epoch": 1.04, - "learning_rate": 1.5159290738869946e-06, - "loss": 0.6846, - "step": 40689 - }, - { - "epoch": 1.04, - "learning_rate": 1.515905370312487e-06, - "loss": 0.834, - "step": 40690 - }, - { - "epoch": 1.04, - "learning_rate": 1.515881666342974e-06, - "loss": 0.6602, - "step": 40691 - }, - { - "epoch": 1.04, - "learning_rate": 1.5158579619784743e-06, - "loss": 0.6035, - "step": 40692 - }, - { - "epoch": 1.04, - "learning_rate": 1.515834257219006e-06, - "loss": 0.6626, - "step": 40693 - }, - { - "epoch": 1.04, - "learning_rate": 1.5158105520645874e-06, - "loss": 0.5815, - "step": 40694 - }, - { - "epoch": 1.04, - "learning_rate": 1.5157868465152358e-06, - "loss": 0.7373, - "step": 40695 - }, - { - "epoch": 1.04, - "learning_rate": 1.5157631405709702e-06, - "loss": 0.7004, - "step": 40696 - }, - { - "epoch": 1.04, - "learning_rate": 1.5157394342318084e-06, - "loss": 0.4197, - "step": 40697 - }, - { - "epoch": 1.04, - "learning_rate": 1.5157157274977688e-06, - "loss": 0.6709, - "step": 40698 - }, - { - "epoch": 1.04, - "learning_rate": 1.5156920203688693e-06, - "loss": 0.5474, - "step": 40699 - }, - { - "epoch": 1.04, - "learning_rate": 1.5156683128451282e-06, - "loss": 0.7676, - "step": 40700 - }, - { - "epoch": 1.04, - "learning_rate": 1.5156446049265634e-06, - "loss": 0.4626, - "step": 40701 - }, - { - "epoch": 1.04, - "learning_rate": 1.5156208966131933e-06, - "loss": 0.8271, - "step": 40702 - }, - { - "epoch": 1.04, - "learning_rate": 1.515597187905036e-06, - "loss": 0.6494, - "step": 40703 - }, - { - "epoch": 1.04, - "learning_rate": 1.5155734788021098e-06, - "loss": 0.5923, - "step": 40704 - }, - { - "epoch": 1.04, - "learning_rate": 1.5155497693044325e-06, - "loss": 0.4388, - "step": 40705 - }, - { - "epoch": 1.04, - "learning_rate": 1.5155260594120226e-06, - "loss": 0.6855, - "step": 40706 - }, - { - "epoch": 1.04, - "learning_rate": 1.5155023491248978e-06, - "loss": 0.6699, - "step": 40707 - }, - { - "epoch": 1.04, - "learning_rate": 1.515478638443077e-06, - "loss": 0.8887, - "step": 40708 - }, - { - "epoch": 1.04, - "learning_rate": 1.5154549273665774e-06, - "loss": 0.7793, - "step": 40709 - }, - { - "epoch": 1.04, - "learning_rate": 1.515431215895418e-06, - "loss": 0.6221, - "step": 40710 - }, - { - "epoch": 1.04, - "learning_rate": 1.5154075040296165e-06, - "loss": 0.6196, - "step": 40711 - }, - { - "epoch": 1.04, - "learning_rate": 1.5153837917691911e-06, - "loss": 0.6865, - "step": 40712 - }, - { - "epoch": 1.04, - "learning_rate": 1.5153600791141604e-06, - "loss": 0.77, - "step": 40713 - }, - { - "epoch": 1.04, - "learning_rate": 1.5153363660645417e-06, - "loss": 0.6646, - "step": 40714 - }, - { - "epoch": 1.04, - "learning_rate": 1.5153126526203539e-06, - "loss": 0.6078, - "step": 40715 - }, - { - "epoch": 1.04, - "learning_rate": 1.515288938781615e-06, - "loss": 0.6172, - "step": 40716 - }, - { - "epoch": 1.04, - "learning_rate": 1.5152652245483428e-06, - "loss": 0.6327, - "step": 40717 - }, - { - "epoch": 1.04, - "learning_rate": 1.5152415099205559e-06, - "loss": 0.6963, - "step": 40718 - }, - { - "epoch": 1.04, - "learning_rate": 1.5152177948982724e-06, - "loss": 0.5182, - "step": 40719 - }, - { - "epoch": 1.04, - "learning_rate": 1.51519407948151e-06, - "loss": 0.5972, - "step": 40720 - }, - { - "epoch": 1.04, - "learning_rate": 1.5151703636702873e-06, - "loss": 0.7148, - "step": 40721 - }, - { - "epoch": 1.04, - "learning_rate": 1.5151466474646224e-06, - "loss": 0.7803, - "step": 40722 - }, - { - "epoch": 1.04, - "learning_rate": 1.5151229308645331e-06, - "loss": 0.4995, - "step": 40723 - }, - { - "epoch": 1.04, - "learning_rate": 1.5150992138700383e-06, - "loss": 0.5889, - "step": 40724 - }, - { - "epoch": 1.04, - "learning_rate": 1.5150754964811555e-06, - "loss": 0.6587, - "step": 40725 - }, - { - "epoch": 1.04, - "learning_rate": 1.5150517786979032e-06, - "loss": 0.5825, - "step": 40726 - }, - { - "epoch": 1.04, - "learning_rate": 1.5150280605202993e-06, - "loss": 0.6348, - "step": 40727 - }, - { - "epoch": 1.04, - "learning_rate": 1.515004341948362e-06, - "loss": 0.7324, - "step": 40728 - }, - { - "epoch": 1.04, - "learning_rate": 1.5149806229821098e-06, - "loss": 0.6611, - "step": 40729 - }, - { - "epoch": 1.04, - "learning_rate": 1.5149569036215603e-06, - "loss": 0.7686, - "step": 40730 - }, - { - "epoch": 1.04, - "learning_rate": 1.5149331838667325e-06, - "loss": 0.7441, - "step": 40731 - }, - { - "epoch": 1.04, - "learning_rate": 1.5149094637176436e-06, - "loss": 0.6758, - "step": 40732 - }, - { - "epoch": 1.04, - "learning_rate": 1.5148857431743123e-06, - "loss": 0.6953, - "step": 40733 - }, - { - "epoch": 1.04, - "learning_rate": 1.5148620222367567e-06, - "loss": 0.3719, - "step": 40734 - }, - { - "epoch": 1.04, - "learning_rate": 1.5148383009049947e-06, - "loss": 0.7607, - "step": 40735 - }, - { - "epoch": 1.04, - "learning_rate": 1.514814579179045e-06, - "loss": 0.7256, - "step": 40736 - }, - { - "epoch": 1.04, - "learning_rate": 1.5147908570589252e-06, - "loss": 0.6411, - "step": 40737 - }, - { - "epoch": 1.04, - "learning_rate": 1.514767134544654e-06, - "loss": 0.5889, - "step": 40738 - }, - { - "epoch": 1.04, - "learning_rate": 1.5147434116362491e-06, - "loss": 0.6079, - "step": 40739 - }, - { - "epoch": 1.04, - "learning_rate": 1.514719688333729e-06, - "loss": 0.5657, - "step": 40740 - }, - { - "epoch": 1.04, - "learning_rate": 1.5146959646371116e-06, - "loss": 0.5122, - "step": 40741 - }, - { - "epoch": 1.04, - "learning_rate": 1.5146722405464152e-06, - "loss": 0.5728, - "step": 40742 - }, - { - "epoch": 1.04, - "learning_rate": 1.5146485160616575e-06, - "loss": 0.6924, - "step": 40743 - }, - { - "epoch": 1.04, - "learning_rate": 1.5146247911828578e-06, - "loss": 0.709, - "step": 40744 - }, - { - "epoch": 1.04, - "learning_rate": 1.514601065910033e-06, - "loss": 0.707, - "step": 40745 - }, - { - "epoch": 1.04, - "learning_rate": 1.514577340243202e-06, - "loss": 0.6709, - "step": 40746 - }, - { - "epoch": 1.04, - "learning_rate": 1.5145536141823829e-06, - "loss": 0.6875, - "step": 40747 - }, - { - "epoch": 1.04, - "learning_rate": 1.5145298877275936e-06, - "loss": 0.5759, - "step": 40748 - }, - { - "epoch": 1.04, - "learning_rate": 1.5145061608788528e-06, - "loss": 0.6621, - "step": 40749 - }, - { - "epoch": 1.04, - "learning_rate": 1.514482433636178e-06, - "loss": 0.4368, - "step": 40750 - }, - { - "epoch": 1.04, - "learning_rate": 1.5144587059995875e-06, - "loss": 0.8232, - "step": 40751 - }, - { - "epoch": 1.04, - "learning_rate": 1.5144349779691e-06, - "loss": 0.6914, - "step": 40752 - }, - { - "epoch": 1.04, - "learning_rate": 1.5144112495447327e-06, - "loss": 0.4951, - "step": 40753 - }, - { - "epoch": 1.04, - "learning_rate": 1.514387520726505e-06, - "loss": 0.6914, - "step": 40754 - }, - { - "epoch": 1.04, - "learning_rate": 1.5143637915144343e-06, - "loss": 0.5701, - "step": 40755 - }, - { - "epoch": 1.04, - "learning_rate": 1.5143400619085386e-06, - "loss": 0.541, - "step": 40756 - }, - { - "epoch": 1.04, - "learning_rate": 1.5143163319088364e-06, - "loss": 0.7432, - "step": 40757 - }, - { - "epoch": 1.04, - "learning_rate": 1.514292601515346e-06, - "loss": 0.7446, - "step": 40758 - }, - { - "epoch": 1.04, - "learning_rate": 1.5142688707280856e-06, - "loss": 0.7686, - "step": 40759 - }, - { - "epoch": 1.04, - "learning_rate": 1.5142451395470727e-06, - "loss": 0.6787, - "step": 40760 - }, - { - "epoch": 1.04, - "learning_rate": 1.5142214079723262e-06, - "loss": 0.6958, - "step": 40761 - }, - { - "epoch": 1.04, - "learning_rate": 1.514197676003864e-06, - "loss": 0.5496, - "step": 40762 - }, - { - "epoch": 1.04, - "learning_rate": 1.5141739436417042e-06, - "loss": 0.5255, - "step": 40763 - }, - { - "epoch": 1.04, - "learning_rate": 1.5141502108858652e-06, - "loss": 0.623, - "step": 40764 - }, - { - "epoch": 1.04, - "learning_rate": 1.5141264777363652e-06, - "loss": 0.6895, - "step": 40765 - }, - { - "epoch": 1.04, - "learning_rate": 1.5141027441932214e-06, - "loss": 0.7529, - "step": 40766 - }, - { - "epoch": 1.04, - "learning_rate": 1.5140790102564535e-06, - "loss": 0.7666, - "step": 40767 - }, - { - "epoch": 1.04, - "learning_rate": 1.5140552759260788e-06, - "loss": 0.6069, - "step": 40768 - }, - { - "epoch": 1.04, - "learning_rate": 1.5140315412021156e-06, - "loss": 0.6924, - "step": 40769 - }, - { - "epoch": 1.04, - "learning_rate": 1.514007806084582e-06, - "loss": 0.7178, - "step": 40770 - }, - { - "epoch": 1.04, - "learning_rate": 1.5139840705734966e-06, - "loss": 0.6953, - "step": 40771 - }, - { - "epoch": 1.05, - "learning_rate": 1.5139603346688764e-06, - "loss": 0.4707, - "step": 40772 - }, - { - "epoch": 1.05, - "learning_rate": 1.5139365983707412e-06, - "loss": 0.7373, - "step": 40773 - }, - { - "epoch": 1.05, - "learning_rate": 1.5139128616791084e-06, - "loss": 0.7305, - "step": 40774 - }, - { - "epoch": 1.05, - "learning_rate": 1.5138891245939958e-06, - "loss": 0.5679, - "step": 40775 - }, - { - "epoch": 1.05, - "learning_rate": 1.513865387115422e-06, - "loss": 0.7998, - "step": 40776 - }, - { - "epoch": 1.05, - "learning_rate": 1.5138416492434049e-06, - "loss": 0.5615, - "step": 40777 - }, - { - "epoch": 1.05, - "learning_rate": 1.5138179109779633e-06, - "loss": 0.6079, - "step": 40778 - }, - { - "epoch": 1.05, - "learning_rate": 1.5137941723191146e-06, - "loss": 0.6279, - "step": 40779 - }, - { - "epoch": 1.05, - "learning_rate": 1.5137704332668774e-06, - "loss": 0.4638, - "step": 40780 - }, - { - "epoch": 1.05, - "learning_rate": 1.5137466938212699e-06, - "loss": 0.4717, - "step": 40781 - }, - { - "epoch": 1.05, - "learning_rate": 1.51372295398231e-06, - "loss": 0.5195, - "step": 40782 - }, - { - "epoch": 1.05, - "learning_rate": 1.5136992137500161e-06, - "loss": 0.6592, - "step": 40783 - }, - { - "epoch": 1.05, - "learning_rate": 1.5136754731244068e-06, - "loss": 0.6914, - "step": 40784 - }, - { - "epoch": 1.05, - "learning_rate": 1.513651732105499e-06, - "loss": 0.7231, - "step": 40785 - }, - { - "epoch": 1.05, - "learning_rate": 1.5136279906933125e-06, - "loss": 0.5596, - "step": 40786 - }, - { - "epoch": 1.05, - "learning_rate": 1.513604248887864e-06, - "loss": 0.8047, - "step": 40787 - }, - { - "epoch": 1.05, - "learning_rate": 1.513580506689173e-06, - "loss": 0.647, - "step": 40788 - }, - { - "epoch": 1.05, - "learning_rate": 1.5135567640972564e-06, - "loss": 0.7881, - "step": 40789 - }, - { - "epoch": 1.05, - "learning_rate": 1.5135330211121336e-06, - "loss": 0.5747, - "step": 40790 - }, - { - "epoch": 1.05, - "learning_rate": 1.5135092777338216e-06, - "loss": 0.5747, - "step": 40791 - }, - { - "epoch": 1.05, - "learning_rate": 1.5134855339623393e-06, - "loss": 0.5957, - "step": 40792 - }, - { - "epoch": 1.05, - "learning_rate": 1.513461789797705e-06, - "loss": 0.7725, - "step": 40793 - }, - { - "epoch": 1.05, - "learning_rate": 1.5134380452399365e-06, - "loss": 0.6299, - "step": 40794 - }, - { - "epoch": 1.05, - "learning_rate": 1.5134143002890519e-06, - "loss": 0.6719, - "step": 40795 - }, - { - "epoch": 1.05, - "learning_rate": 1.5133905549450698e-06, - "loss": 0.5684, - "step": 40796 - }, - { - "epoch": 1.05, - "learning_rate": 1.5133668092080082e-06, - "loss": 0.5737, - "step": 40797 - }, - { - "epoch": 1.05, - "learning_rate": 1.513343063077885e-06, - "loss": 0.6768, - "step": 40798 - }, - { - "epoch": 1.05, - "learning_rate": 1.5133193165547187e-06, - "loss": 0.6709, - "step": 40799 - }, - { - "epoch": 1.05, - "learning_rate": 1.5132955696385272e-06, - "loss": 0.4805, - "step": 40800 - }, - { - "epoch": 1.05, - "learning_rate": 1.5132718223293292e-06, - "loss": 0.792, - "step": 40801 - }, - { - "epoch": 1.05, - "learning_rate": 1.5132480746271426e-06, - "loss": 0.8477, - "step": 40802 - }, - { - "epoch": 1.05, - "learning_rate": 1.5132243265319855e-06, - "loss": 0.6421, - "step": 40803 - }, - { - "epoch": 1.05, - "learning_rate": 1.513200578043876e-06, - "loss": 0.6592, - "step": 40804 - }, - { - "epoch": 1.05, - "learning_rate": 1.5131768291628326e-06, - "loss": 0.7969, - "step": 40805 - }, - { - "epoch": 1.05, - "learning_rate": 1.513153079888873e-06, - "loss": 0.3901, - "step": 40806 - }, - { - "epoch": 1.05, - "learning_rate": 1.513129330222016e-06, - "loss": 0.7324, - "step": 40807 - }, - { - "epoch": 1.05, - "learning_rate": 1.5131055801622791e-06, - "loss": 0.7148, - "step": 40808 - }, - { - "epoch": 1.05, - "learning_rate": 1.5130818297096815e-06, - "loss": 0.5369, - "step": 40809 - }, - { - "epoch": 1.05, - "learning_rate": 1.51305807886424e-06, - "loss": 0.561, - "step": 40810 - }, - { - "epoch": 1.05, - "learning_rate": 1.5130343276259741e-06, - "loss": 0.6865, - "step": 40811 - }, - { - "epoch": 1.05, - "learning_rate": 1.513010575994901e-06, - "loss": 0.5791, - "step": 40812 - }, - { - "epoch": 1.05, - "learning_rate": 1.5129868239710395e-06, - "loss": 0.7871, - "step": 40813 - }, - { - "epoch": 1.05, - "learning_rate": 1.5129630715544076e-06, - "loss": 0.4775, - "step": 40814 - }, - { - "epoch": 1.05, - "learning_rate": 1.5129393187450233e-06, - "loss": 0.6206, - "step": 40815 - }, - { - "epoch": 1.05, - "learning_rate": 1.512915565542905e-06, - "loss": 0.5046, - "step": 40816 - }, - { - "epoch": 1.05, - "learning_rate": 1.5128918119480706e-06, - "loss": 0.7822, - "step": 40817 - }, - { - "epoch": 1.05, - "learning_rate": 1.5128680579605388e-06, - "loss": 0.7441, - "step": 40818 - }, - { - "epoch": 1.05, - "learning_rate": 1.5128443035803277e-06, - "loss": 0.5386, - "step": 40819 - }, - { - "epoch": 1.05, - "learning_rate": 1.512820548807455e-06, - "loss": 0.6382, - "step": 40820 - }, - { - "epoch": 1.05, - "learning_rate": 1.5127967936419394e-06, - "loss": 0.6226, - "step": 40821 - }, - { - "epoch": 1.05, - "learning_rate": 1.5127730380837986e-06, - "loss": 0.6172, - "step": 40822 - }, - { - "epoch": 1.05, - "learning_rate": 1.5127492821330515e-06, - "loss": 0.7178, - "step": 40823 - }, - { - "epoch": 1.05, - "learning_rate": 1.5127255257897154e-06, - "loss": 0.7383, - "step": 40824 - }, - { - "epoch": 1.05, - "learning_rate": 1.512701769053809e-06, - "loss": 0.6294, - "step": 40825 - }, - { - "epoch": 1.05, - "learning_rate": 1.5126780119253506e-06, - "loss": 0.6162, - "step": 40826 - }, - { - "epoch": 1.05, - "learning_rate": 1.5126542544043579e-06, - "loss": 0.6016, - "step": 40827 - }, - { - "epoch": 1.05, - "learning_rate": 1.5126304964908499e-06, - "loss": 0.6851, - "step": 40828 - }, - { - "epoch": 1.05, - "learning_rate": 1.5126067381848442e-06, - "loss": 0.7578, - "step": 40829 - }, - { - "epoch": 1.05, - "learning_rate": 1.512582979486359e-06, - "loss": 0.6421, - "step": 40830 - }, - { - "epoch": 1.05, - "learning_rate": 1.5125592203954124e-06, - "loss": 0.6396, - "step": 40831 - }, - { - "epoch": 1.05, - "learning_rate": 1.5125354609120228e-06, - "loss": 0.7324, - "step": 40832 - }, - { - "epoch": 1.05, - "learning_rate": 1.5125117010362084e-06, - "loss": 0.7939, - "step": 40833 - }, - { - "epoch": 1.05, - "learning_rate": 1.5124879407679876e-06, - "loss": 0.5444, - "step": 40834 - }, - { - "epoch": 1.05, - "learning_rate": 1.5124641801073784e-06, - "loss": 0.6562, - "step": 40835 - }, - { - "epoch": 1.05, - "learning_rate": 1.5124404190543985e-06, - "loss": 0.7451, - "step": 40836 - }, - { - "epoch": 1.05, - "learning_rate": 1.5124166576090668e-06, - "loss": 0.7666, - "step": 40837 - }, - { - "epoch": 1.05, - "learning_rate": 1.5123928957714012e-06, - "loss": 0.5361, - "step": 40838 - }, - { - "epoch": 1.05, - "learning_rate": 1.51236913354142e-06, - "loss": 0.5386, - "step": 40839 - }, - { - "epoch": 1.05, - "learning_rate": 1.5123453709191412e-06, - "loss": 0.7012, - "step": 40840 - }, - { - "epoch": 1.05, - "learning_rate": 1.5123216079045832e-06, - "loss": 0.6143, - "step": 40841 - }, - { - "epoch": 1.05, - "learning_rate": 1.512297844497764e-06, - "loss": 0.6479, - "step": 40842 - }, - { - "epoch": 1.05, - "learning_rate": 1.5122740806987015e-06, - "loss": 0.6621, - "step": 40843 - }, - { - "epoch": 1.05, - "learning_rate": 1.5122503165074148e-06, - "loss": 0.5811, - "step": 40844 - }, - { - "epoch": 1.05, - "learning_rate": 1.5122265519239217e-06, - "loss": 0.752, - "step": 40845 - }, - { - "epoch": 1.05, - "learning_rate": 1.5122027869482399e-06, - "loss": 0.6162, - "step": 40846 - }, - { - "epoch": 1.05, - "learning_rate": 1.5121790215803882e-06, - "loss": 0.6821, - "step": 40847 - }, - { - "epoch": 1.05, - "learning_rate": 1.5121552558203848e-06, - "loss": 0.6709, - "step": 40848 - }, - { - "epoch": 1.05, - "learning_rate": 1.5121314896682472e-06, - "loss": 0.7061, - "step": 40849 - }, - { - "epoch": 1.05, - "learning_rate": 1.5121077231239942e-06, - "loss": 0.6328, - "step": 40850 - }, - { - "epoch": 1.05, - "learning_rate": 1.5120839561876442e-06, - "loss": 0.6553, - "step": 40851 - }, - { - "epoch": 1.05, - "learning_rate": 1.5120601888592144e-06, - "loss": 0.6445, - "step": 40852 - }, - { - "epoch": 1.05, - "learning_rate": 1.5120364211387243e-06, - "loss": 0.5884, - "step": 40853 - }, - { - "epoch": 1.05, - "learning_rate": 1.5120126530261913e-06, - "loss": 0.6309, - "step": 40854 - }, - { - "epoch": 1.05, - "learning_rate": 1.5119888845216338e-06, - "loss": 0.4473, - "step": 40855 - }, - { - "epoch": 1.05, - "learning_rate": 1.5119651156250695e-06, - "loss": 0.7188, - "step": 40856 - }, - { - "epoch": 1.05, - "learning_rate": 1.5119413463365174e-06, - "loss": 0.4597, - "step": 40857 - }, - { - "epoch": 1.05, - "learning_rate": 1.5119175766559954e-06, - "loss": 0.6655, - "step": 40858 - }, - { - "epoch": 1.05, - "learning_rate": 1.5118938065835217e-06, - "loss": 0.5879, - "step": 40859 - }, - { - "epoch": 1.05, - "learning_rate": 1.511870036119114e-06, - "loss": 0.584, - "step": 40860 - }, - { - "epoch": 1.05, - "learning_rate": 1.5118462652627914e-06, - "loss": 0.7256, - "step": 40861 - }, - { - "epoch": 1.05, - "learning_rate": 1.5118224940145714e-06, - "loss": 0.5811, - "step": 40862 - }, - { - "epoch": 1.05, - "learning_rate": 1.5117987223744727e-06, - "loss": 0.6885, - "step": 40863 - }, - { - "epoch": 1.05, - "learning_rate": 1.5117749503425133e-06, - "loss": 0.4565, - "step": 40864 - }, - { - "epoch": 1.05, - "learning_rate": 1.511751177918711e-06, - "loss": 0.5044, - "step": 40865 - }, - { - "epoch": 1.05, - "learning_rate": 1.5117274051030844e-06, - "loss": 0.6406, - "step": 40866 - }, - { - "epoch": 1.05, - "learning_rate": 1.511703631895652e-06, - "loss": 0.8564, - "step": 40867 - }, - { - "epoch": 1.05, - "learning_rate": 1.511679858296431e-06, - "loss": 0.7773, - "step": 40868 - }, - { - "epoch": 1.05, - "learning_rate": 1.5116560843054411e-06, - "loss": 0.5156, - "step": 40869 - }, - { - "epoch": 1.05, - "learning_rate": 1.5116323099226993e-06, - "loss": 0.7432, - "step": 40870 - }, - { - "epoch": 1.05, - "learning_rate": 1.511608535148224e-06, - "loss": 0.7021, - "step": 40871 - }, - { - "epoch": 1.05, - "learning_rate": 1.5115847599820336e-06, - "loss": 0.5596, - "step": 40872 - }, - { - "epoch": 1.05, - "learning_rate": 1.5115609844241464e-06, - "loss": 0.6697, - "step": 40873 - }, - { - "epoch": 1.05, - "learning_rate": 1.5115372084745808e-06, - "loss": 0.7168, - "step": 40874 - }, - { - "epoch": 1.05, - "learning_rate": 1.511513432133354e-06, - "loss": 0.6973, - "step": 40875 - }, - { - "epoch": 1.05, - "learning_rate": 1.5114896554004856e-06, - "loss": 0.8262, - "step": 40876 - }, - { - "epoch": 1.05, - "learning_rate": 1.5114658782759923e-06, - "loss": 0.6636, - "step": 40877 - }, - { - "epoch": 1.05, - "learning_rate": 1.5114421007598937e-06, - "loss": 0.7002, - "step": 40878 - }, - { - "epoch": 1.05, - "learning_rate": 1.511418322852207e-06, - "loss": 0.7998, - "step": 40879 - }, - { - "epoch": 1.05, - "learning_rate": 1.5113945445529513e-06, - "loss": 0.5688, - "step": 40880 - }, - { - "epoch": 1.05, - "learning_rate": 1.5113707658621438e-06, - "loss": 0.5159, - "step": 40881 - }, - { - "epoch": 1.05, - "learning_rate": 1.5113469867798037e-06, - "loss": 0.6943, - "step": 40882 - }, - { - "epoch": 1.05, - "learning_rate": 1.5113232073059481e-06, - "loss": 0.7061, - "step": 40883 - }, - { - "epoch": 1.05, - "learning_rate": 1.5112994274405964e-06, - "loss": 0.7158, - "step": 40884 - }, - { - "epoch": 1.05, - "learning_rate": 1.511275647183766e-06, - "loss": 0.6406, - "step": 40885 - }, - { - "epoch": 1.05, - "learning_rate": 1.5112518665354755e-06, - "loss": 0.6514, - "step": 40886 - }, - { - "epoch": 1.05, - "learning_rate": 1.5112280854957427e-06, - "loss": 0.6455, - "step": 40887 - }, - { - "epoch": 1.05, - "learning_rate": 1.511204304064586e-06, - "loss": 0.6699, - "step": 40888 - }, - { - "epoch": 1.05, - "learning_rate": 1.511180522242024e-06, - "loss": 0.7832, - "step": 40889 - }, - { - "epoch": 1.05, - "learning_rate": 1.5111567400280745e-06, - "loss": 0.5317, - "step": 40890 - }, - { - "epoch": 1.05, - "learning_rate": 1.5111329574227557e-06, - "loss": 0.5142, - "step": 40891 - }, - { - "epoch": 1.05, - "learning_rate": 1.5111091744260858e-06, - "loss": 0.6909, - "step": 40892 - }, - { - "epoch": 1.05, - "learning_rate": 1.511085391038083e-06, - "loss": 0.6367, - "step": 40893 - }, - { - "epoch": 1.05, - "learning_rate": 1.511061607258766e-06, - "loss": 0.6299, - "step": 40894 - }, - { - "epoch": 1.05, - "learning_rate": 1.5110378230881527e-06, - "loss": 0.8652, - "step": 40895 - }, - { - "epoch": 1.05, - "learning_rate": 1.5110140385262608e-06, - "loss": 0.6416, - "step": 40896 - }, - { - "epoch": 1.05, - "learning_rate": 1.5109902535731092e-06, - "loss": 0.5952, - "step": 40897 - }, - { - "epoch": 1.05, - "learning_rate": 1.5109664682287158e-06, - "loss": 0.6885, - "step": 40898 - }, - { - "epoch": 1.05, - "learning_rate": 1.5109426824930992e-06, - "loss": 0.6753, - "step": 40899 - }, - { - "epoch": 1.05, - "learning_rate": 1.510918896366277e-06, - "loss": 0.4346, - "step": 40900 - }, - { - "epoch": 1.05, - "learning_rate": 1.5108951098482674e-06, - "loss": 0.7061, - "step": 40901 - }, - { - "epoch": 1.05, - "learning_rate": 1.510871322939089e-06, - "loss": 0.7559, - "step": 40902 - }, - { - "epoch": 1.05, - "learning_rate": 1.5108475356387604e-06, - "loss": 0.5374, - "step": 40903 - }, - { - "epoch": 1.05, - "learning_rate": 1.5108237479472988e-06, - "loss": 0.6313, - "step": 40904 - }, - { - "epoch": 1.05, - "learning_rate": 1.5107999598647234e-06, - "loss": 0.6934, - "step": 40905 - }, - { - "epoch": 1.05, - "learning_rate": 1.5107761713910517e-06, - "loss": 0.6035, - "step": 40906 - }, - { - "epoch": 1.05, - "learning_rate": 1.5107523825263023e-06, - "loss": 0.525, - "step": 40907 - }, - { - "epoch": 1.05, - "learning_rate": 1.510728593270493e-06, - "loss": 0.5938, - "step": 40908 - }, - { - "epoch": 1.05, - "learning_rate": 1.5107048036236426e-06, - "loss": 0.7026, - "step": 40909 - }, - { - "epoch": 1.05, - "learning_rate": 1.5106810135857689e-06, - "loss": 0.6121, - "step": 40910 - }, - { - "epoch": 1.05, - "learning_rate": 1.5106572231568901e-06, - "loss": 0.709, - "step": 40911 - }, - { - "epoch": 1.05, - "learning_rate": 1.5106334323370246e-06, - "loss": 0.7432, - "step": 40912 - }, - { - "epoch": 1.05, - "learning_rate": 1.5106096411261909e-06, - "loss": 0.5933, - "step": 40913 - }, - { - "epoch": 1.05, - "learning_rate": 1.5105858495244066e-06, - "loss": 0.6885, - "step": 40914 - }, - { - "epoch": 1.05, - "learning_rate": 1.5105620575316899e-06, - "loss": 0.3085, - "step": 40915 - }, - { - "epoch": 1.05, - "learning_rate": 1.5105382651480599e-06, - "loss": 0.7354, - "step": 40916 - }, - { - "epoch": 1.05, - "learning_rate": 1.5105144723735337e-06, - "loss": 0.6348, - "step": 40917 - }, - { - "epoch": 1.05, - "learning_rate": 1.5104906792081305e-06, - "loss": 0.4229, - "step": 40918 - }, - { - "epoch": 1.05, - "learning_rate": 1.5104668856518677e-06, - "loss": 0.6953, - "step": 40919 - }, - { - "epoch": 1.05, - "learning_rate": 1.5104430917047641e-06, - "loss": 0.8242, - "step": 40920 - }, - { - "epoch": 1.05, - "learning_rate": 1.5104192973668375e-06, - "loss": 0.603, - "step": 40921 - }, - { - "epoch": 1.05, - "learning_rate": 1.5103955026381065e-06, - "loss": 0.5562, - "step": 40922 - }, - { - "epoch": 1.05, - "learning_rate": 1.510371707518589e-06, - "loss": 0.7109, - "step": 40923 - }, - { - "epoch": 1.05, - "learning_rate": 1.5103479120083034e-06, - "loss": 0.6758, - "step": 40924 - }, - { - "epoch": 1.05, - "learning_rate": 1.510324116107268e-06, - "loss": 0.6587, - "step": 40925 - }, - { - "epoch": 1.05, - "learning_rate": 1.5103003198155006e-06, - "loss": 0.6479, - "step": 40926 - }, - { - "epoch": 1.05, - "learning_rate": 1.5102765231330196e-06, - "loss": 0.5708, - "step": 40927 - }, - { - "epoch": 1.05, - "learning_rate": 1.5102527260598442e-06, - "loss": 0.5444, - "step": 40928 - }, - { - "epoch": 1.05, - "learning_rate": 1.5102289285959909e-06, - "loss": 0.8262, - "step": 40929 - }, - { - "epoch": 1.05, - "learning_rate": 1.510205130741479e-06, - "loss": 0.7402, - "step": 40930 - }, - { - "epoch": 1.05, - "learning_rate": 1.5101813324963264e-06, - "loss": 0.708, - "step": 40931 - }, - { - "epoch": 1.05, - "learning_rate": 1.5101575338605518e-06, - "loss": 0.5061, - "step": 40932 - }, - { - "epoch": 1.05, - "learning_rate": 1.5101337348341728e-06, - "loss": 0.4609, - "step": 40933 - }, - { - "epoch": 1.05, - "learning_rate": 1.5101099354172074e-06, - "loss": 0.5884, - "step": 40934 - }, - { - "epoch": 1.05, - "learning_rate": 1.5100861356096748e-06, - "loss": 0.6357, - "step": 40935 - }, - { - "epoch": 1.05, - "learning_rate": 1.5100623354115926e-06, - "loss": 0.7207, - "step": 40936 - }, - { - "epoch": 1.05, - "learning_rate": 1.510038534822979e-06, - "loss": 0.6924, - "step": 40937 - }, - { - "epoch": 1.05, - "learning_rate": 1.5100147338438527e-06, - "loss": 0.4478, - "step": 40938 - }, - { - "epoch": 1.05, - "learning_rate": 1.5099909324742312e-06, - "loss": 0.4559, - "step": 40939 - }, - { - "epoch": 1.05, - "learning_rate": 1.5099671307141332e-06, - "loss": 0.6191, - "step": 40940 - }, - { - "epoch": 1.05, - "learning_rate": 1.509943328563577e-06, - "loss": 0.6895, - "step": 40941 - }, - { - "epoch": 1.05, - "learning_rate": 1.5099195260225802e-06, - "loss": 0.5986, - "step": 40942 - }, - { - "epoch": 1.05, - "learning_rate": 1.5098957230911621e-06, - "loss": 0.6091, - "step": 40943 - }, - { - "epoch": 1.05, - "learning_rate": 1.5098719197693397e-06, - "loss": 0.623, - "step": 40944 - }, - { - "epoch": 1.05, - "learning_rate": 1.5098481160571321e-06, - "loss": 0.7773, - "step": 40945 - }, - { - "epoch": 1.05, - "learning_rate": 1.5098243119545573e-06, - "loss": 0.7256, - "step": 40946 - }, - { - "epoch": 1.05, - "learning_rate": 1.5098005074616333e-06, - "loss": 0.5786, - "step": 40947 - }, - { - "epoch": 1.05, - "learning_rate": 1.5097767025783786e-06, - "loss": 0.6924, - "step": 40948 - }, - { - "epoch": 1.05, - "learning_rate": 1.5097528973048114e-06, - "loss": 0.6831, - "step": 40949 - }, - { - "epoch": 1.05, - "learning_rate": 1.5097290916409495e-06, - "loss": 0.7363, - "step": 40950 - }, - { - "epoch": 1.05, - "learning_rate": 1.5097052855868119e-06, - "loss": 0.6333, - "step": 40951 - }, - { - "epoch": 1.05, - "learning_rate": 1.5096814791424159e-06, - "loss": 0.4749, - "step": 40952 - }, - { - "epoch": 1.05, - "learning_rate": 1.5096576723077808e-06, - "loss": 0.6616, - "step": 40953 - }, - { - "epoch": 1.05, - "learning_rate": 1.509633865082924e-06, - "loss": 0.6309, - "step": 40954 - }, - { - "epoch": 1.05, - "learning_rate": 1.5096100574678636e-06, - "loss": 0.7285, - "step": 40955 - }, - { - "epoch": 1.05, - "learning_rate": 1.5095862494626188e-06, - "loss": 0.5886, - "step": 40956 - }, - { - "epoch": 1.05, - "learning_rate": 1.509562441067207e-06, - "loss": 0.8682, - "step": 40957 - }, - { - "epoch": 1.05, - "learning_rate": 1.5095386322816468e-06, - "loss": 0.6372, - "step": 40958 - }, - { - "epoch": 1.05, - "learning_rate": 1.509514823105956e-06, - "loss": 0.7188, - "step": 40959 - }, - { - "epoch": 1.05, - "learning_rate": 1.5094910135401536e-06, - "loss": 0.5601, - "step": 40960 - }, - { - "epoch": 1.05, - "learning_rate": 1.509467203584257e-06, - "loss": 0.7085, - "step": 40961 - }, - { - "epoch": 1.05, - "learning_rate": 1.5094433932382846e-06, - "loss": 0.7344, - "step": 40962 - }, - { - "epoch": 1.05, - "learning_rate": 1.5094195825022552e-06, - "loss": 0.5518, - "step": 40963 - }, - { - "epoch": 1.05, - "learning_rate": 1.5093957713761865e-06, - "loss": 0.8359, - "step": 40964 - }, - { - "epoch": 1.05, - "learning_rate": 1.5093719598600969e-06, - "loss": 0.627, - "step": 40965 - }, - { - "epoch": 1.05, - "learning_rate": 1.5093481479540047e-06, - "loss": 0.5254, - "step": 40966 - }, - { - "epoch": 1.05, - "learning_rate": 1.5093243356579277e-06, - "loss": 0.6274, - "step": 40967 - }, - { - "epoch": 1.05, - "learning_rate": 1.5093005229718848e-06, - "loss": 0.5671, - "step": 40968 - }, - { - "epoch": 1.05, - "learning_rate": 1.5092767098958938e-06, - "loss": 0.5879, - "step": 40969 - }, - { - "epoch": 1.05, - "learning_rate": 1.5092528964299733e-06, - "loss": 0.437, - "step": 40970 - }, - { - "epoch": 1.05, - "learning_rate": 1.5092290825741409e-06, - "loss": 0.7026, - "step": 40971 - }, - { - "epoch": 1.05, - "learning_rate": 1.5092052683284156e-06, - "loss": 0.613, - "step": 40972 - }, - { - "epoch": 1.05, - "learning_rate": 1.509181453692815e-06, - "loss": 0.7168, - "step": 40973 - }, - { - "epoch": 1.05, - "learning_rate": 1.5091576386673577e-06, - "loss": 0.4756, - "step": 40974 - }, - { - "epoch": 1.05, - "learning_rate": 1.5091338232520614e-06, - "loss": 0.6602, - "step": 40975 - }, - { - "epoch": 1.05, - "learning_rate": 1.5091100074469448e-06, - "loss": 0.709, - "step": 40976 - }, - { - "epoch": 1.05, - "learning_rate": 1.5090861912520265e-06, - "loss": 0.623, - "step": 40977 - }, - { - "epoch": 1.05, - "learning_rate": 1.509062374667324e-06, - "loss": 0.7412, - "step": 40978 - }, - { - "epoch": 1.05, - "learning_rate": 1.509038557692856e-06, - "loss": 0.7334, - "step": 40979 - }, - { - "epoch": 1.05, - "learning_rate": 1.5090147403286407e-06, - "loss": 0.6323, - "step": 40980 - }, - { - "epoch": 1.05, - "learning_rate": 1.508990922574696e-06, - "loss": 0.6504, - "step": 40981 - }, - { - "epoch": 1.05, - "learning_rate": 1.5089671044310404e-06, - "loss": 0.7188, - "step": 40982 - }, - { - "epoch": 1.05, - "learning_rate": 1.508943285897692e-06, - "loss": 0.5151, - "step": 40983 - }, - { - "epoch": 1.05, - "learning_rate": 1.5089194669746691e-06, - "loss": 0.4414, - "step": 40984 - }, - { - "epoch": 1.05, - "learning_rate": 1.5088956476619906e-06, - "loss": 0.5049, - "step": 40985 - }, - { - "epoch": 1.05, - "learning_rate": 1.5088718279596733e-06, - "loss": 0.3945, - "step": 40986 - }, - { - "epoch": 1.05, - "learning_rate": 1.5088480078677366e-06, - "loss": 0.6167, - "step": 40987 - }, - { - "epoch": 1.05, - "learning_rate": 1.5088241873861981e-06, - "loss": 0.6914, - "step": 40988 - }, - { - "epoch": 1.05, - "learning_rate": 1.5088003665150768e-06, - "loss": 0.426, - "step": 40989 - }, - { - "epoch": 1.05, - "learning_rate": 1.50877654525439e-06, - "loss": 0.7471, - "step": 40990 - }, - { - "epoch": 1.05, - "learning_rate": 1.5087527236041568e-06, - "loss": 0.6914, - "step": 40991 - }, - { - "epoch": 1.05, - "learning_rate": 1.5087289015643947e-06, - "loss": 0.4526, - "step": 40992 - }, - { - "epoch": 1.05, - "learning_rate": 1.5087050791351227e-06, - "loss": 0.7583, - "step": 40993 - }, - { - "epoch": 1.05, - "learning_rate": 1.508681256316358e-06, - "loss": 0.4849, - "step": 40994 - }, - { - "epoch": 1.05, - "learning_rate": 1.5086574331081199e-06, - "loss": 0.8027, - "step": 40995 - }, - { - "epoch": 1.05, - "learning_rate": 1.5086336095104258e-06, - "loss": 0.7261, - "step": 40996 - }, - { - "epoch": 1.05, - "learning_rate": 1.5086097855232947e-06, - "loss": 0.6133, - "step": 40997 - }, - { - "epoch": 1.05, - "learning_rate": 1.5085859611467445e-06, - "loss": 0.6973, - "step": 40998 - }, - { - "epoch": 1.05, - "learning_rate": 1.508562136380793e-06, - "loss": 0.6592, - "step": 40999 - }, - { - "epoch": 1.05, - "learning_rate": 1.5085383112254592e-06, - "loss": 0.7031, - "step": 41000 - }, - { - "epoch": 1.05, - "learning_rate": 1.508514485680761e-06, - "loss": 0.5732, - "step": 41001 - }, - { - "epoch": 1.05, - "learning_rate": 1.5084906597467164e-06, - "loss": 0.7803, - "step": 41002 - }, - { - "epoch": 1.05, - "learning_rate": 1.5084668334233442e-06, - "loss": 0.5349, - "step": 41003 - }, - { - "epoch": 1.05, - "learning_rate": 1.508443006710662e-06, - "loss": 0.7617, - "step": 41004 - }, - { - "epoch": 1.05, - "learning_rate": 1.5084191796086887e-06, - "loss": 0.5884, - "step": 41005 - }, - { - "epoch": 1.05, - "learning_rate": 1.5083953521174419e-06, - "loss": 0.6914, - "step": 41006 - }, - { - "epoch": 1.05, - "learning_rate": 1.5083715242369404e-06, - "loss": 0.665, - "step": 41007 - }, - { - "epoch": 1.05, - "learning_rate": 1.508347695967202e-06, - "loss": 0.8057, - "step": 41008 - }, - { - "epoch": 1.05, - "learning_rate": 1.5083238673082456e-06, - "loss": 0.7939, - "step": 41009 - }, - { - "epoch": 1.05, - "learning_rate": 1.5083000382600886e-06, - "loss": 0.8203, - "step": 41010 - }, - { - "epoch": 1.05, - "learning_rate": 1.5082762088227493e-06, - "loss": 0.8223, - "step": 41011 - }, - { - "epoch": 1.05, - "learning_rate": 1.508252378996247e-06, - "loss": 0.6567, - "step": 41012 - }, - { - "epoch": 1.05, - "learning_rate": 1.5082285487805985e-06, - "loss": 0.6528, - "step": 41013 - }, - { - "epoch": 1.05, - "learning_rate": 1.5082047181758233e-06, - "loss": 0.7461, - "step": 41014 - }, - { - "epoch": 1.05, - "learning_rate": 1.508180887181939e-06, - "loss": 0.6787, - "step": 41015 - }, - { - "epoch": 1.05, - "learning_rate": 1.5081570557989638e-06, - "loss": 0.6924, - "step": 41016 - }, - { - "epoch": 1.05, - "learning_rate": 1.508133224026916e-06, - "loss": 0.6035, - "step": 41017 - }, - { - "epoch": 1.05, - "learning_rate": 1.5081093918658145e-06, - "loss": 0.6855, - "step": 41018 - }, - { - "epoch": 1.05, - "learning_rate": 1.5080855593156767e-06, - "loss": 0.667, - "step": 41019 - }, - { - "epoch": 1.05, - "learning_rate": 1.5080617263765213e-06, - "loss": 0.6904, - "step": 41020 - }, - { - "epoch": 1.05, - "learning_rate": 1.508037893048366e-06, - "loss": 0.6279, - "step": 41021 - }, - { - "epoch": 1.05, - "learning_rate": 1.5080140593312298e-06, - "loss": 0.7021, - "step": 41022 - }, - { - "epoch": 1.05, - "learning_rate": 1.5079902252251304e-06, - "loss": 0.7041, - "step": 41023 - }, - { - "epoch": 1.05, - "learning_rate": 1.5079663907300861e-06, - "loss": 0.7202, - "step": 41024 - }, - { - "epoch": 1.05, - "learning_rate": 1.5079425558461157e-06, - "loss": 0.5457, - "step": 41025 - }, - { - "epoch": 1.05, - "learning_rate": 1.5079187205732367e-06, - "loss": 0.6621, - "step": 41026 - }, - { - "epoch": 1.05, - "learning_rate": 1.5078948849114679e-06, - "loss": 0.601, - "step": 41027 - }, - { - "epoch": 1.05, - "learning_rate": 1.5078710488608273e-06, - "loss": 0.5752, - "step": 41028 - }, - { - "epoch": 1.05, - "learning_rate": 1.5078472124213332e-06, - "loss": 0.8096, - "step": 41029 - }, - { - "epoch": 1.05, - "learning_rate": 1.5078233755930037e-06, - "loss": 0.6265, - "step": 41030 - }, - { - "epoch": 1.05, - "learning_rate": 1.5077995383758575e-06, - "loss": 0.5765, - "step": 41031 - }, - { - "epoch": 1.05, - "learning_rate": 1.5077757007699118e-06, - "loss": 0.6812, - "step": 41032 - }, - { - "epoch": 1.05, - "learning_rate": 1.5077518627751866e-06, - "loss": 0.6875, - "step": 41033 - }, - { - "epoch": 1.05, - "learning_rate": 1.5077280243916985e-06, - "loss": 0.5818, - "step": 41034 - }, - { - "epoch": 1.05, - "learning_rate": 1.5077041856194668e-06, - "loss": 0.6365, - "step": 41035 - }, - { - "epoch": 1.05, - "learning_rate": 1.5076803464585091e-06, - "loss": 0.6299, - "step": 41036 - }, - { - "epoch": 1.05, - "learning_rate": 1.5076565069088439e-06, - "loss": 0.5894, - "step": 41037 - }, - { - "epoch": 1.05, - "learning_rate": 1.5076326669704896e-06, - "loss": 0.5615, - "step": 41038 - }, - { - "epoch": 1.05, - "learning_rate": 1.507608826643464e-06, - "loss": 0.6113, - "step": 41039 - }, - { - "epoch": 1.05, - "learning_rate": 1.507584985927786e-06, - "loss": 0.8296, - "step": 41040 - }, - { - "epoch": 1.05, - "learning_rate": 1.5075611448234732e-06, - "loss": 0.7061, - "step": 41041 - }, - { - "epoch": 1.05, - "learning_rate": 1.5075373033305443e-06, - "loss": 0.7676, - "step": 41042 - }, - { - "epoch": 1.05, - "learning_rate": 1.5075134614490174e-06, - "loss": 0.6885, - "step": 41043 - }, - { - "epoch": 1.05, - "learning_rate": 1.5074896191789108e-06, - "loss": 0.9189, - "step": 41044 - }, - { - "epoch": 1.05, - "learning_rate": 1.5074657765202429e-06, - "loss": 0.5974, - "step": 41045 - }, - { - "epoch": 1.05, - "learning_rate": 1.5074419334730318e-06, - "loss": 0.8115, - "step": 41046 - }, - { - "epoch": 1.05, - "learning_rate": 1.5074180900372954e-06, - "loss": 0.5282, - "step": 41047 - }, - { - "epoch": 1.05, - "learning_rate": 1.5073942462130528e-06, - "loss": 0.7754, - "step": 41048 - }, - { - "epoch": 1.05, - "learning_rate": 1.5073704020003212e-06, - "loss": 0.6499, - "step": 41049 - }, - { - "epoch": 1.05, - "learning_rate": 1.5073465573991198e-06, - "loss": 0.7393, - "step": 41050 - }, - { - "epoch": 1.05, - "learning_rate": 1.5073227124094663e-06, - "loss": 0.7319, - "step": 41051 - }, - { - "epoch": 1.05, - "learning_rate": 1.5072988670313792e-06, - "loss": 0.5659, - "step": 41052 - }, - { - "epoch": 1.05, - "learning_rate": 1.5072750212648766e-06, - "loss": 0.5674, - "step": 41053 - }, - { - "epoch": 1.05, - "learning_rate": 1.507251175109977e-06, - "loss": 0.5842, - "step": 41054 - }, - { - "epoch": 1.05, - "learning_rate": 1.507227328566698e-06, - "loss": 0.5361, - "step": 41055 - }, - { - "epoch": 1.05, - "learning_rate": 1.507203481635059e-06, - "loss": 0.613, - "step": 41056 - }, - { - "epoch": 1.05, - "learning_rate": 1.5071796343150774e-06, - "loss": 0.7017, - "step": 41057 - }, - { - "epoch": 1.05, - "learning_rate": 1.5071557866067717e-06, - "loss": 0.344, - "step": 41058 - }, - { - "epoch": 1.05, - "learning_rate": 1.5071319385101599e-06, - "loss": 0.5216, - "step": 41059 - }, - { - "epoch": 1.05, - "learning_rate": 1.507108090025261e-06, - "loss": 0.7227, - "step": 41060 - }, - { - "epoch": 1.05, - "learning_rate": 1.5070842411520922e-06, - "loss": 0.6914, - "step": 41061 - }, - { - "epoch": 1.05, - "learning_rate": 1.5070603918906727e-06, - "loss": 0.7686, - "step": 41062 - }, - { - "epoch": 1.05, - "learning_rate": 1.5070365422410202e-06, - "loss": 0.8623, - "step": 41063 - }, - { - "epoch": 1.05, - "learning_rate": 1.5070126922031532e-06, - "loss": 0.7178, - "step": 41064 - }, - { - "epoch": 1.05, - "learning_rate": 1.5069888417770898e-06, - "loss": 0.7744, - "step": 41065 - }, - { - "epoch": 1.05, - "learning_rate": 1.5069649909628484e-06, - "loss": 0.7402, - "step": 41066 - }, - { - "epoch": 1.05, - "learning_rate": 1.506941139760447e-06, - "loss": 0.6787, - "step": 41067 - }, - { - "epoch": 1.05, - "learning_rate": 1.5069172881699044e-06, - "loss": 0.7744, - "step": 41068 - }, - { - "epoch": 1.05, - "learning_rate": 1.5068934361912385e-06, - "loss": 0.7178, - "step": 41069 - }, - { - "epoch": 1.05, - "learning_rate": 1.5068695838244674e-06, - "loss": 0.5957, - "step": 41070 - }, - { - "epoch": 1.05, - "learning_rate": 1.50684573106961e-06, - "loss": 0.5835, - "step": 41071 - }, - { - "epoch": 1.05, - "learning_rate": 1.5068218779266834e-06, - "loss": 0.6294, - "step": 41072 - }, - { - "epoch": 1.05, - "learning_rate": 1.5067980243957075e-06, - "loss": 0.5151, - "step": 41073 - }, - { - "epoch": 1.05, - "learning_rate": 1.506774170476699e-06, - "loss": 0.6719, - "step": 41074 - }, - { - "epoch": 1.05, - "learning_rate": 1.506750316169677e-06, - "loss": 0.6025, - "step": 41075 - }, - { - "epoch": 1.05, - "learning_rate": 1.5067264614746593e-06, - "loss": 0.6689, - "step": 41076 - }, - { - "epoch": 1.05, - "learning_rate": 1.5067026063916651e-06, - "loss": 0.5641, - "step": 41077 - }, - { - "epoch": 1.05, - "learning_rate": 1.5066787509207116e-06, - "loss": 0.7139, - "step": 41078 - }, - { - "epoch": 1.05, - "learning_rate": 1.5066548950618174e-06, - "loss": 0.6836, - "step": 41079 - }, - { - "epoch": 1.05, - "learning_rate": 1.506631038815001e-06, - "loss": 0.6929, - "step": 41080 - }, - { - "epoch": 1.05, - "learning_rate": 1.5066071821802803e-06, - "loss": 0.791, - "step": 41081 - }, - { - "epoch": 1.05, - "learning_rate": 1.506583325157674e-06, - "loss": 0.5227, - "step": 41082 - }, - { - "epoch": 1.05, - "learning_rate": 1.5065594677472003e-06, - "loss": 0.5596, - "step": 41083 - }, - { - "epoch": 1.05, - "learning_rate": 1.506535609948877e-06, - "loss": 0.6992, - "step": 41084 - }, - { - "epoch": 1.05, - "learning_rate": 1.5065117517627227e-06, - "loss": 0.7266, - "step": 41085 - }, - { - "epoch": 1.05, - "learning_rate": 1.5064878931887557e-06, - "loss": 0.6738, - "step": 41086 - }, - { - "epoch": 1.05, - "learning_rate": 1.5064640342269943e-06, - "loss": 0.6514, - "step": 41087 - }, - { - "epoch": 1.05, - "learning_rate": 1.5064401748774566e-06, - "loss": 0.7661, - "step": 41088 - }, - { - "epoch": 1.05, - "learning_rate": 1.5064163151401608e-06, - "loss": 0.5529, - "step": 41089 - }, - { - "epoch": 1.05, - "learning_rate": 1.5063924550151254e-06, - "loss": 0.6592, - "step": 41090 - }, - { - "epoch": 1.05, - "learning_rate": 1.5063685945023688e-06, - "loss": 0.7432, - "step": 41091 - }, - { - "epoch": 1.05, - "learning_rate": 1.5063447336019089e-06, - "loss": 0.397, - "step": 41092 - }, - { - "epoch": 1.05, - "learning_rate": 1.506320872313764e-06, - "loss": 0.749, - "step": 41093 - }, - { - "epoch": 1.05, - "learning_rate": 1.5062970106379526e-06, - "loss": 0.6235, - "step": 41094 - }, - { - "epoch": 1.05, - "learning_rate": 1.5062731485744928e-06, - "loss": 0.5415, - "step": 41095 - }, - { - "epoch": 1.05, - "learning_rate": 1.506249286123403e-06, - "loss": 0.7402, - "step": 41096 - }, - { - "epoch": 1.05, - "learning_rate": 1.5062254232847016e-06, - "loss": 0.5063, - "step": 41097 - }, - { - "epoch": 1.05, - "learning_rate": 1.5062015600584065e-06, - "loss": 0.5596, - "step": 41098 - }, - { - "epoch": 1.05, - "learning_rate": 1.506177696444536e-06, - "loss": 0.4576, - "step": 41099 - }, - { - "epoch": 1.05, - "learning_rate": 1.5061538324431087e-06, - "loss": 0.7334, - "step": 41100 - }, - { - "epoch": 1.05, - "learning_rate": 1.5061299680541427e-06, - "loss": 0.4922, - "step": 41101 - }, - { - "epoch": 1.05, - "learning_rate": 1.506106103277656e-06, - "loss": 0.6636, - "step": 41102 - }, - { - "epoch": 1.05, - "learning_rate": 1.5060822381136674e-06, - "loss": 0.6533, - "step": 41103 - }, - { - "epoch": 1.05, - "learning_rate": 1.5060583725621947e-06, - "loss": 0.6541, - "step": 41104 - }, - { - "epoch": 1.05, - "learning_rate": 1.5060345066232562e-06, - "loss": 0.5908, - "step": 41105 - }, - { - "epoch": 1.05, - "learning_rate": 1.5060106402968708e-06, - "loss": 0.6211, - "step": 41106 - }, - { - "epoch": 1.05, - "learning_rate": 1.505986773583056e-06, - "loss": 0.6226, - "step": 41107 - }, - { - "epoch": 1.05, - "learning_rate": 1.5059629064818306e-06, - "loss": 0.583, - "step": 41108 - }, - { - "epoch": 1.05, - "learning_rate": 1.5059390389932126e-06, - "loss": 0.7959, - "step": 41109 - }, - { - "epoch": 1.05, - "learning_rate": 1.5059151711172204e-06, - "loss": 0.5872, - "step": 41110 - }, - { - "epoch": 1.05, - "learning_rate": 1.5058913028538722e-06, - "loss": 0.4971, - "step": 41111 - }, - { - "epoch": 1.05, - "learning_rate": 1.5058674342031861e-06, - "loss": 0.7251, - "step": 41112 - }, - { - "epoch": 1.05, - "learning_rate": 1.5058435651651807e-06, - "loss": 0.6055, - "step": 41113 - }, - { - "epoch": 1.05, - "learning_rate": 1.5058196957398742e-06, - "loss": 0.7344, - "step": 41114 - }, - { - "epoch": 1.05, - "learning_rate": 1.5057958259272847e-06, - "loss": 0.6372, - "step": 41115 - }, - { - "epoch": 1.05, - "learning_rate": 1.5057719557274307e-06, - "loss": 0.7246, - "step": 41116 - }, - { - "epoch": 1.05, - "learning_rate": 1.5057480851403304e-06, - "loss": 0.7324, - "step": 41117 - }, - { - "epoch": 1.05, - "learning_rate": 1.5057242141660017e-06, - "loss": 0.4961, - "step": 41118 - }, - { - "epoch": 1.05, - "learning_rate": 1.5057003428044636e-06, - "loss": 0.6113, - "step": 41119 - }, - { - "epoch": 1.05, - "learning_rate": 1.5056764710557336e-06, - "loss": 0.6631, - "step": 41120 - }, - { - "epoch": 1.05, - "learning_rate": 1.505652598919831e-06, - "loss": 0.7827, - "step": 41121 - }, - { - "epoch": 1.05, - "learning_rate": 1.5056287263967732e-06, - "loss": 0.4956, - "step": 41122 - }, - { - "epoch": 1.05, - "learning_rate": 1.5056048534865787e-06, - "loss": 0.5742, - "step": 41123 - }, - { - "epoch": 1.05, - "learning_rate": 1.5055809801892656e-06, - "loss": 0.4404, - "step": 41124 - }, - { - "epoch": 1.05, - "learning_rate": 1.5055571065048527e-06, - "loss": 0.7598, - "step": 41125 - }, - { - "epoch": 1.05, - "learning_rate": 1.5055332324333576e-06, - "loss": 0.5356, - "step": 41126 - }, - { - "epoch": 1.05, - "learning_rate": 1.5055093579747994e-06, - "loss": 0.6729, - "step": 41127 - }, - { - "epoch": 1.05, - "learning_rate": 1.5054854831291956e-06, - "loss": 0.7168, - "step": 41128 - }, - { - "epoch": 1.05, - "learning_rate": 1.5054616078965649e-06, - "loss": 0.8115, - "step": 41129 - }, - { - "epoch": 1.05, - "learning_rate": 1.5054377322769254e-06, - "loss": 0.6992, - "step": 41130 - }, - { - "epoch": 1.05, - "learning_rate": 1.5054138562702957e-06, - "loss": 0.7529, - "step": 41131 - }, - { - "epoch": 1.05, - "learning_rate": 1.5053899798766935e-06, - "loss": 0.6138, - "step": 41132 - }, - { - "epoch": 1.05, - "learning_rate": 1.5053661030961378e-06, - "loss": 0.875, - "step": 41133 - }, - { - "epoch": 1.05, - "learning_rate": 1.5053422259286467e-06, - "loss": 0.5342, - "step": 41134 - }, - { - "epoch": 1.05, - "learning_rate": 1.5053183483742374e-06, - "loss": 0.7412, - "step": 41135 - }, - { - "epoch": 1.05, - "learning_rate": 1.50529447043293e-06, - "loss": 0.5659, - "step": 41136 - }, - { - "epoch": 1.05, - "learning_rate": 1.5052705921047414e-06, - "loss": 0.7783, - "step": 41137 - }, - { - "epoch": 1.05, - "learning_rate": 1.5052467133896904e-06, - "loss": 0.6328, - "step": 41138 - }, - { - "epoch": 1.05, - "learning_rate": 1.5052228342877954e-06, - "loss": 0.6709, - "step": 41139 - }, - { - "epoch": 1.05, - "learning_rate": 1.5051989547990742e-06, - "loss": 0.7178, - "step": 41140 - }, - { - "epoch": 1.05, - "learning_rate": 1.5051750749235454e-06, - "loss": 0.4744, - "step": 41141 - }, - { - "epoch": 1.05, - "learning_rate": 1.5051511946612276e-06, - "loss": 0.6133, - "step": 41142 - }, - { - "epoch": 1.05, - "learning_rate": 1.5051273140121388e-06, - "loss": 0.5653, - "step": 41143 - }, - { - "epoch": 1.05, - "learning_rate": 1.5051034329762971e-06, - "loss": 0.6482, - "step": 41144 - }, - { - "epoch": 1.05, - "learning_rate": 1.5050795515537205e-06, - "loss": 0.6748, - "step": 41145 - }, - { - "epoch": 1.05, - "learning_rate": 1.505055669744428e-06, - "loss": 0.623, - "step": 41146 - }, - { - "epoch": 1.05, - "learning_rate": 1.5050317875484377e-06, - "loss": 0.8301, - "step": 41147 - }, - { - "epoch": 1.05, - "learning_rate": 1.505007904965768e-06, - "loss": 0.4917, - "step": 41148 - }, - { - "epoch": 1.05, - "learning_rate": 1.5049840219964366e-06, - "loss": 0.6416, - "step": 41149 - }, - { - "epoch": 1.05, - "learning_rate": 1.5049601386404622e-06, - "loss": 0.7949, - "step": 41150 - }, - { - "epoch": 1.05, - "learning_rate": 1.504936254897863e-06, - "loss": 0.6855, - "step": 41151 - }, - { - "epoch": 1.05, - "learning_rate": 1.5049123707686576e-06, - "loss": 0.6709, - "step": 41152 - }, - { - "epoch": 1.05, - "learning_rate": 1.5048884862528638e-06, - "loss": 0.7217, - "step": 41153 - }, - { - "epoch": 1.05, - "learning_rate": 1.5048646013505003e-06, - "loss": 0.6562, - "step": 41154 - }, - { - "epoch": 1.05, - "learning_rate": 1.5048407160615849e-06, - "loss": 0.75, - "step": 41155 - }, - { - "epoch": 1.05, - "learning_rate": 1.5048168303861363e-06, - "loss": 0.5427, - "step": 41156 - }, - { - "epoch": 1.05, - "learning_rate": 1.5047929443241726e-06, - "loss": 0.6992, - "step": 41157 - }, - { - "epoch": 1.05, - "learning_rate": 1.5047690578757123e-06, - "loss": 0.9092, - "step": 41158 - }, - { - "epoch": 1.05, - "learning_rate": 1.5047451710407734e-06, - "loss": 0.6426, - "step": 41159 - }, - { - "epoch": 1.05, - "learning_rate": 1.5047212838193743e-06, - "loss": 0.7197, - "step": 41160 - }, - { - "epoch": 1.05, - "learning_rate": 1.5046973962115334e-06, - "loss": 0.6943, - "step": 41161 - }, - { - "epoch": 1.06, - "learning_rate": 1.504673508217269e-06, - "loss": 0.7139, - "step": 41162 - }, - { - "epoch": 1.06, - "learning_rate": 1.5046496198365995e-06, - "loss": 0.5835, - "step": 41163 - }, - { - "epoch": 1.06, - "learning_rate": 1.5046257310695425e-06, - "loss": 0.6274, - "step": 41164 - }, - { - "epoch": 1.06, - "learning_rate": 1.5046018419161173e-06, - "loss": 0.6758, - "step": 41165 - }, - { - "epoch": 1.06, - "learning_rate": 1.5045779523763412e-06, - "loss": 0.7734, - "step": 41166 - }, - { - "epoch": 1.06, - "learning_rate": 1.5045540624502331e-06, - "loss": 0.6982, - "step": 41167 - }, - { - "epoch": 1.06, - "learning_rate": 1.5045301721378113e-06, - "loss": 0.7363, - "step": 41168 - }, - { - "epoch": 1.06, - "learning_rate": 1.5045062814390938e-06, - "loss": 0.6807, - "step": 41169 - }, - { - "epoch": 1.06, - "learning_rate": 1.504482390354099e-06, - "loss": 0.6348, - "step": 41170 - }, - { - "epoch": 1.06, - "learning_rate": 1.5044584988828453e-06, - "loss": 0.5718, - "step": 41171 - }, - { - "epoch": 1.06, - "learning_rate": 1.5044346070253509e-06, - "loss": 0.6914, - "step": 41172 - }, - { - "epoch": 1.06, - "learning_rate": 1.5044107147816342e-06, - "loss": 0.5442, - "step": 41173 - }, - { - "epoch": 1.06, - "learning_rate": 1.5043868221517136e-06, - "loss": 0.6724, - "step": 41174 - }, - { - "epoch": 1.06, - "learning_rate": 1.5043629291356068e-06, - "loss": 0.7373, - "step": 41175 - }, - { - "epoch": 1.06, - "learning_rate": 1.5043390357333325e-06, - "loss": 0.6865, - "step": 41176 - }, - { - "epoch": 1.06, - "learning_rate": 1.5043151419449092e-06, - "loss": 0.583, - "step": 41177 - }, - { - "epoch": 1.06, - "learning_rate": 1.5042912477703551e-06, - "loss": 0.7676, - "step": 41178 - }, - { - "epoch": 1.06, - "learning_rate": 1.504267353209688e-06, - "loss": 0.4966, - "step": 41179 - }, - { - "epoch": 1.06, - "learning_rate": 1.5042434582629269e-06, - "loss": 0.77, - "step": 41180 - }, - { - "epoch": 1.06, - "learning_rate": 1.5042195629300898e-06, - "loss": 0.5913, - "step": 41181 - }, - { - "epoch": 1.06, - "learning_rate": 1.5041956672111945e-06, - "loss": 0.668, - "step": 41182 - }, - { - "epoch": 1.06, - "learning_rate": 1.5041717711062602e-06, - "loss": 0.6387, - "step": 41183 - }, - { - "epoch": 1.06, - "learning_rate": 1.5041478746153046e-06, - "loss": 0.7275, - "step": 41184 - }, - { - "epoch": 1.06, - "learning_rate": 1.504123977738346e-06, - "loss": 0.4414, - "step": 41185 - }, - { - "epoch": 1.06, - "learning_rate": 1.5041000804754034e-06, - "loss": 0.5537, - "step": 41186 - }, - { - "epoch": 1.06, - "learning_rate": 1.504076182826494e-06, - "loss": 0.6816, - "step": 41187 - }, - { - "epoch": 1.06, - "learning_rate": 1.504052284791637e-06, - "loss": 0.7139, - "step": 41188 - }, - { - "epoch": 1.06, - "learning_rate": 1.5040283863708503e-06, - "loss": 0.562, - "step": 41189 - }, - { - "epoch": 1.06, - "learning_rate": 1.5040044875641519e-06, - "loss": 0.6792, - "step": 41190 - }, - { - "epoch": 1.06, - "learning_rate": 1.5039805883715605e-06, - "loss": 0.6069, - "step": 41191 - }, - { - "epoch": 1.06, - "learning_rate": 1.5039566887930947e-06, - "loss": 0.6992, - "step": 41192 - }, - { - "epoch": 1.06, - "learning_rate": 1.5039327888287722e-06, - "loss": 0.6738, - "step": 41193 - }, - { - "epoch": 1.06, - "learning_rate": 1.5039088884786117e-06, - "loss": 0.5554, - "step": 41194 - }, - { - "epoch": 1.06, - "learning_rate": 1.5038849877426312e-06, - "loss": 0.6074, - "step": 41195 - }, - { - "epoch": 1.06, - "learning_rate": 1.5038610866208493e-06, - "loss": 0.624, - "step": 41196 - }, - { - "epoch": 1.06, - "learning_rate": 1.5038371851132837e-06, - "loss": 0.6572, - "step": 41197 - }, - { - "epoch": 1.06, - "learning_rate": 1.5038132832199536e-06, - "loss": 0.7598, - "step": 41198 - }, - { - "epoch": 1.06, - "learning_rate": 1.5037893809408763e-06, - "loss": 0.7549, - "step": 41199 - }, - { - "epoch": 1.06, - "learning_rate": 1.5037654782760712e-06, - "loss": 0.6069, - "step": 41200 - }, - { - "epoch": 1.06, - "learning_rate": 1.5037415752255558e-06, - "loss": 0.5508, - "step": 41201 - }, - { - "epoch": 1.06, - "learning_rate": 1.5037176717893485e-06, - "loss": 0.6436, - "step": 41202 - }, - { - "epoch": 1.06, - "learning_rate": 1.5036937679674682e-06, - "loss": 0.459, - "step": 41203 - }, - { - "epoch": 1.06, - "learning_rate": 1.5036698637599323e-06, - "loss": 0.748, - "step": 41204 - }, - { - "epoch": 1.06, - "learning_rate": 1.5036459591667597e-06, - "loss": 0.603, - "step": 41205 - }, - { - "epoch": 1.06, - "learning_rate": 1.5036220541879683e-06, - "loss": 0.7891, - "step": 41206 - }, - { - "epoch": 1.06, - "learning_rate": 1.5035981488235769e-06, - "loss": 0.6174, - "step": 41207 - }, - { - "epoch": 1.06, - "learning_rate": 1.5035742430736037e-06, - "loss": 0.6646, - "step": 41208 - }, - { - "epoch": 1.06, - "learning_rate": 1.503550336938067e-06, - "loss": 0.8125, - "step": 41209 - }, - { - "epoch": 1.06, - "learning_rate": 1.5035264304169842e-06, - "loss": 0.6533, - "step": 41210 - }, - { - "epoch": 1.06, - "learning_rate": 1.5035025235103749e-06, - "loss": 0.6313, - "step": 41211 - }, - { - "epoch": 1.06, - "learning_rate": 1.503478616218257e-06, - "loss": 0.6875, - "step": 41212 - }, - { - "epoch": 1.06, - "learning_rate": 1.5034547085406483e-06, - "loss": 0.7607, - "step": 41213 - }, - { - "epoch": 1.06, - "learning_rate": 1.5034308004775676e-06, - "loss": 0.752, - "step": 41214 - }, - { - "epoch": 1.06, - "learning_rate": 1.5034068920290332e-06, - "loss": 0.5107, - "step": 41215 - }, - { - "epoch": 1.06, - "learning_rate": 1.503382983195063e-06, - "loss": 0.5435, - "step": 41216 - }, - { - "epoch": 1.06, - "learning_rate": 1.503359073975676e-06, - "loss": 0.6284, - "step": 41217 - }, - { - "epoch": 1.06, - "learning_rate": 1.50333516437089e-06, - "loss": 0.6455, - "step": 41218 - }, - { - "epoch": 1.06, - "learning_rate": 1.5033112543807231e-06, - "loss": 0.7295, - "step": 41219 - }, - { - "epoch": 1.06, - "learning_rate": 1.5032873440051943e-06, - "loss": 0.5996, - "step": 41220 - }, - { - "epoch": 1.06, - "learning_rate": 1.5032634332443212e-06, - "loss": 0.7402, - "step": 41221 - }, - { - "epoch": 1.06, - "learning_rate": 1.5032395220981227e-06, - "loss": 0.6685, - "step": 41222 - }, - { - "epoch": 1.06, - "learning_rate": 1.5032156105666167e-06, - "loss": 0.5669, - "step": 41223 - }, - { - "epoch": 1.06, - "learning_rate": 1.5031916986498217e-06, - "loss": 0.6196, - "step": 41224 - }, - { - "epoch": 1.06, - "learning_rate": 1.5031677863477556e-06, - "loss": 0.5254, - "step": 41225 - }, - { - "epoch": 1.06, - "learning_rate": 1.5031438736604376e-06, - "loss": 0.8623, - "step": 41226 - }, - { - "epoch": 1.06, - "learning_rate": 1.5031199605878852e-06, - "loss": 0.6689, - "step": 41227 - }, - { - "epoch": 1.06, - "learning_rate": 1.5030960471301172e-06, - "loss": 0.7119, - "step": 41228 - }, - { - "epoch": 1.06, - "learning_rate": 1.5030721332871515e-06, - "loss": 0.5323, - "step": 41229 - }, - { - "epoch": 1.06, - "learning_rate": 1.5030482190590066e-06, - "loss": 0.7119, - "step": 41230 - }, - { - "epoch": 1.06, - "learning_rate": 1.5030243044457008e-06, - "loss": 0.7725, - "step": 41231 - }, - { - "epoch": 1.06, - "learning_rate": 1.5030003894472528e-06, - "loss": 0.6846, - "step": 41232 - }, - { - "epoch": 1.06, - "learning_rate": 1.50297647406368e-06, - "loss": 0.8213, - "step": 41233 - }, - { - "epoch": 1.06, - "learning_rate": 1.5029525582950014e-06, - "loss": 0.5723, - "step": 41234 - }, - { - "epoch": 1.06, - "learning_rate": 1.502928642141235e-06, - "loss": 0.7178, - "step": 41235 - }, - { - "epoch": 1.06, - "learning_rate": 1.5029047256023994e-06, - "loss": 0.5952, - "step": 41236 - }, - { - "epoch": 1.06, - "learning_rate": 1.5028808086785129e-06, - "loss": 0.7764, - "step": 41237 - }, - { - "epoch": 1.06, - "learning_rate": 1.5028568913695936e-06, - "loss": 0.7119, - "step": 41238 - }, - { - "epoch": 1.06, - "learning_rate": 1.5028329736756597e-06, - "loss": 0.6299, - "step": 41239 - }, - { - "epoch": 1.06, - "learning_rate": 1.5028090555967302e-06, - "loss": 0.6201, - "step": 41240 - }, - { - "epoch": 1.06, - "learning_rate": 1.5027851371328226e-06, - "loss": 0.5515, - "step": 41241 - }, - { - "epoch": 1.06, - "learning_rate": 1.5027612182839555e-06, - "loss": 0.5957, - "step": 41242 - }, - { - "epoch": 1.06, - "learning_rate": 1.5027372990501474e-06, - "loss": 0.6748, - "step": 41243 - }, - { - "epoch": 1.06, - "learning_rate": 1.5027133794314165e-06, - "loss": 0.6309, - "step": 41244 - }, - { - "epoch": 1.06, - "learning_rate": 1.5026894594277809e-06, - "loss": 0.5625, - "step": 41245 - }, - { - "epoch": 1.06, - "learning_rate": 1.5026655390392592e-06, - "loss": 0.7441, - "step": 41246 - }, - { - "epoch": 1.06, - "learning_rate": 1.5026416182658697e-06, - "loss": 0.6948, - "step": 41247 - }, - { - "epoch": 1.06, - "learning_rate": 1.5026176971076303e-06, - "loss": 0.7061, - "step": 41248 - }, - { - "epoch": 1.06, - "learning_rate": 1.50259377556456e-06, - "loss": 0.7627, - "step": 41249 - }, - { - "epoch": 1.06, - "learning_rate": 1.5025698536366764e-06, - "loss": 0.749, - "step": 41250 - }, - { - "epoch": 1.06, - "learning_rate": 1.5025459313239982e-06, - "loss": 0.6504, - "step": 41251 - }, - { - "epoch": 1.06, - "learning_rate": 1.5025220086265441e-06, - "loss": 0.5811, - "step": 41252 - }, - { - "epoch": 1.06, - "learning_rate": 1.502498085544332e-06, - "loss": 0.6221, - "step": 41253 - }, - { - "epoch": 1.06, - "learning_rate": 1.5024741620773797e-06, - "loss": 0.708, - "step": 41254 - }, - { - "epoch": 1.06, - "learning_rate": 1.5024502382257065e-06, - "loss": 0.605, - "step": 41255 - }, - { - "epoch": 1.06, - "learning_rate": 1.5024263139893299e-06, - "loss": 0.6211, - "step": 41256 - }, - { - "epoch": 1.06, - "learning_rate": 1.502402389368269e-06, - "loss": 0.6792, - "step": 41257 - }, - { - "epoch": 1.06, - "learning_rate": 1.5023784643625413e-06, - "loss": 0.6108, - "step": 41258 - }, - { - "epoch": 1.06, - "learning_rate": 1.5023545389721658e-06, - "loss": 0.5796, - "step": 41259 - }, - { - "epoch": 1.06, - "learning_rate": 1.5023306131971602e-06, - "loss": 0.7656, - "step": 41260 - }, - { - "epoch": 1.06, - "learning_rate": 1.5023066870375437e-06, - "loss": 0.7334, - "step": 41261 - }, - { - "epoch": 1.06, - "learning_rate": 1.5022827604933335e-06, - "loss": 0.5796, - "step": 41262 - }, - { - "epoch": 1.06, - "learning_rate": 1.5022588335645488e-06, - "loss": 0.7134, - "step": 41263 - }, - { - "epoch": 1.06, - "learning_rate": 1.5022349062512075e-06, - "loss": 0.7969, - "step": 41264 - }, - { - "epoch": 1.06, - "learning_rate": 1.5022109785533279e-06, - "loss": 0.6436, - "step": 41265 - }, - { - "epoch": 1.06, - "learning_rate": 1.5021870504709283e-06, - "loss": 0.7969, - "step": 41266 - }, - { - "epoch": 1.06, - "learning_rate": 1.5021631220040277e-06, - "loss": 0.5903, - "step": 41267 - }, - { - "epoch": 1.06, - "learning_rate": 1.5021391931526438e-06, - "loss": 0.5469, - "step": 41268 - }, - { - "epoch": 1.06, - "learning_rate": 1.5021152639167943e-06, - "loss": 0.7568, - "step": 41269 - }, - { - "epoch": 1.06, - "learning_rate": 1.502091334296499e-06, - "loss": 0.6758, - "step": 41270 - }, - { - "epoch": 1.06, - "learning_rate": 1.5020674042917754e-06, - "loss": 0.6689, - "step": 41271 - }, - { - "epoch": 1.06, - "learning_rate": 1.5020434739026417e-06, - "loss": 0.835, - "step": 41272 - }, - { - "epoch": 1.06, - "learning_rate": 1.5020195431291162e-06, - "loss": 0.6128, - "step": 41273 - }, - { - "epoch": 1.06, - "learning_rate": 1.5019956119712175e-06, - "loss": 0.4376, - "step": 41274 - }, - { - "epoch": 1.06, - "learning_rate": 1.501971680428964e-06, - "loss": 0.6807, - "step": 41275 - }, - { - "epoch": 1.06, - "learning_rate": 1.501947748502374e-06, - "loss": 0.7158, - "step": 41276 - }, - { - "epoch": 1.06, - "learning_rate": 1.5019238161914656e-06, - "loss": 0.4878, - "step": 41277 - }, - { - "epoch": 1.06, - "learning_rate": 1.501899883496257e-06, - "loss": 0.6108, - "step": 41278 - }, - { - "epoch": 1.06, - "learning_rate": 1.5018759504167667e-06, - "loss": 0.6221, - "step": 41279 - }, - { - "epoch": 1.06, - "learning_rate": 1.5018520169530133e-06, - "loss": 0.7578, - "step": 41280 - }, - { - "epoch": 1.06, - "learning_rate": 1.5018280831050148e-06, - "loss": 0.7949, - "step": 41281 - }, - { - "epoch": 1.06, - "learning_rate": 1.50180414887279e-06, - "loss": 0.6133, - "step": 41282 - }, - { - "epoch": 1.06, - "learning_rate": 1.5017802142563562e-06, - "loss": 0.7227, - "step": 41283 - }, - { - "epoch": 1.06, - "learning_rate": 1.5017562792557327e-06, - "loss": 0.7012, - "step": 41284 - }, - { - "epoch": 1.06, - "learning_rate": 1.5017323438709371e-06, - "loss": 0.7227, - "step": 41285 - }, - { - "epoch": 1.06, - "learning_rate": 1.5017084081019884e-06, - "loss": 0.6523, - "step": 41286 - }, - { - "epoch": 1.06, - "learning_rate": 1.5016844719489048e-06, - "loss": 0.7334, - "step": 41287 - }, - { - "epoch": 1.06, - "learning_rate": 1.5016605354117044e-06, - "loss": 0.7881, - "step": 41288 - }, - { - "epoch": 1.06, - "learning_rate": 1.5016365984904053e-06, - "loss": 0.8613, - "step": 41289 - }, - { - "epoch": 1.06, - "learning_rate": 1.5016126611850263e-06, - "loss": 0.6885, - "step": 41290 - }, - { - "epoch": 1.06, - "learning_rate": 1.5015887234955854e-06, - "loss": 0.7578, - "step": 41291 - }, - { - "epoch": 1.06, - "learning_rate": 1.5015647854221017e-06, - "loss": 0.5039, - "step": 41292 - }, - { - "epoch": 1.06, - "learning_rate": 1.5015408469645925e-06, - "loss": 0.3525, - "step": 41293 - }, - { - "epoch": 1.06, - "learning_rate": 1.5015169081230763e-06, - "loss": 0.8584, - "step": 41294 - }, - { - "epoch": 1.06, - "learning_rate": 1.5014929688975719e-06, - "loss": 0.4824, - "step": 41295 - }, - { - "epoch": 1.06, - "learning_rate": 1.5014690292880974e-06, - "loss": 0.7549, - "step": 41296 - }, - { - "epoch": 1.06, - "learning_rate": 1.501445089294671e-06, - "loss": 0.6924, - "step": 41297 - }, - { - "epoch": 1.06, - "learning_rate": 1.5014211489173115e-06, - "loss": 0.7773, - "step": 41298 - }, - { - "epoch": 1.06, - "learning_rate": 1.5013972081560366e-06, - "loss": 0.7852, - "step": 41299 - }, - { - "epoch": 1.06, - "learning_rate": 1.5013732670108647e-06, - "loss": 0.665, - "step": 41300 - }, - { - "epoch": 1.06, - "learning_rate": 1.5013493254818146e-06, - "loss": 0.5952, - "step": 41301 - }, - { - "epoch": 1.06, - "learning_rate": 1.5013253835689046e-06, - "loss": 0.6846, - "step": 41302 - }, - { - "epoch": 1.06, - "learning_rate": 1.5013014412721525e-06, - "loss": 0.6582, - "step": 41303 - }, - { - "epoch": 1.06, - "learning_rate": 1.5012774985915767e-06, - "loss": 0.7529, - "step": 41304 - }, - { - "epoch": 1.06, - "learning_rate": 1.5012535555271964e-06, - "loss": 0.4633, - "step": 41305 - }, - { - "epoch": 1.06, - "learning_rate": 1.5012296120790286e-06, - "loss": 0.8984, - "step": 41306 - }, - { - "epoch": 1.06, - "learning_rate": 1.501205668247093e-06, - "loss": 0.8154, - "step": 41307 - }, - { - "epoch": 1.06, - "learning_rate": 1.5011817240314068e-06, - "loss": 0.6567, - "step": 41308 - }, - { - "epoch": 1.06, - "learning_rate": 1.501157779431989e-06, - "loss": 0.8584, - "step": 41309 - }, - { - "epoch": 1.06, - "learning_rate": 1.5011338344488578e-06, - "loss": 0.6528, - "step": 41310 - }, - { - "epoch": 1.06, - "learning_rate": 1.5011098890820312e-06, - "loss": 0.6016, - "step": 41311 - }, - { - "epoch": 1.06, - "learning_rate": 1.5010859433315281e-06, - "loss": 0.665, - "step": 41312 - }, - { - "epoch": 1.06, - "learning_rate": 1.5010619971973663e-06, - "loss": 0.5742, - "step": 41313 - }, - { - "epoch": 1.06, - "learning_rate": 1.5010380506795644e-06, - "loss": 0.7334, - "step": 41314 - }, - { - "epoch": 1.06, - "learning_rate": 1.5010141037781407e-06, - "loss": 0.6289, - "step": 41315 - }, - { - "epoch": 1.06, - "learning_rate": 1.5009901564931138e-06, - "loss": 0.6396, - "step": 41316 - }, - { - "epoch": 1.06, - "learning_rate": 1.5009662088245016e-06, - "loss": 0.564, - "step": 41317 - }, - { - "epoch": 1.06, - "learning_rate": 1.5009422607723226e-06, - "loss": 0.5542, - "step": 41318 - }, - { - "epoch": 1.06, - "learning_rate": 1.5009183123365948e-06, - "loss": 0.6333, - "step": 41319 - }, - { - "epoch": 1.06, - "learning_rate": 1.5008943635173375e-06, - "loss": 0.748, - "step": 41320 - }, - { - "epoch": 1.06, - "learning_rate": 1.5008704143145679e-06, - "loss": 0.522, - "step": 41321 - }, - { - "epoch": 1.06, - "learning_rate": 1.5008464647283055e-06, - "loss": 0.5845, - "step": 41322 - }, - { - "epoch": 1.06, - "learning_rate": 1.5008225147585674e-06, - "loss": 0.6436, - "step": 41323 - }, - { - "epoch": 1.06, - "learning_rate": 1.5007985644053726e-06, - "loss": 0.4241, - "step": 41324 - }, - { - "epoch": 1.06, - "learning_rate": 1.5007746136687395e-06, - "loss": 0.625, - "step": 41325 - }, - { - "epoch": 1.06, - "learning_rate": 1.5007506625486864e-06, - "loss": 0.7871, - "step": 41326 - }, - { - "epoch": 1.06, - "learning_rate": 1.5007267110452312e-06, - "loss": 0.4075, - "step": 41327 - }, - { - "epoch": 1.06, - "learning_rate": 1.5007027591583929e-06, - "loss": 0.5542, - "step": 41328 - }, - { - "epoch": 1.06, - "learning_rate": 1.5006788068881893e-06, - "loss": 0.6816, - "step": 41329 - }, - { - "epoch": 1.06, - "learning_rate": 1.5006548542346394e-06, - "loss": 0.7373, - "step": 41330 - }, - { - "epoch": 1.06, - "learning_rate": 1.5006309011977604e-06, - "loss": 0.5786, - "step": 41331 - }, - { - "epoch": 1.06, - "learning_rate": 1.5006069477775718e-06, - "loss": 0.6445, - "step": 41332 - }, - { - "epoch": 1.06, - "learning_rate": 1.5005829939740914e-06, - "loss": 0.5735, - "step": 41333 - }, - { - "epoch": 1.06, - "learning_rate": 1.5005590397873377e-06, - "loss": 0.668, - "step": 41334 - }, - { - "epoch": 1.06, - "learning_rate": 1.500535085217329e-06, - "loss": 0.5762, - "step": 41335 - }, - { - "epoch": 1.06, - "learning_rate": 1.5005111302640833e-06, - "loss": 0.4728, - "step": 41336 - }, - { - "epoch": 1.06, - "learning_rate": 1.5004871749276196e-06, - "loss": 0.7871, - "step": 41337 - }, - { - "epoch": 1.06, - "learning_rate": 1.5004632192079556e-06, - "loss": 0.519, - "step": 41338 - }, - { - "epoch": 1.06, - "learning_rate": 1.50043926310511e-06, - "loss": 0.6426, - "step": 41339 - }, - { - "epoch": 1.06, - "learning_rate": 1.500415306619101e-06, - "loss": 0.6953, - "step": 41340 - }, - { - "epoch": 1.06, - "learning_rate": 1.5003913497499472e-06, - "loss": 0.5585, - "step": 41341 - }, - { - "epoch": 1.06, - "learning_rate": 1.5003673924976665e-06, - "loss": 0.7734, - "step": 41342 - }, - { - "epoch": 1.06, - "learning_rate": 1.500343434862278e-06, - "loss": 0.8047, - "step": 41343 - }, - { - "epoch": 1.06, - "learning_rate": 1.5003194768437987e-06, - "loss": 0.7891, - "step": 41344 - }, - { - "epoch": 1.06, - "learning_rate": 1.5002955184422485e-06, - "loss": 0.5605, - "step": 41345 - }, - { - "epoch": 1.06, - "learning_rate": 1.5002715596576448e-06, - "loss": 0.6387, - "step": 41346 - }, - { - "epoch": 1.06, - "learning_rate": 1.5002476004900064e-06, - "loss": 0.6338, - "step": 41347 - }, - { - "epoch": 1.06, - "learning_rate": 1.500223640939351e-06, - "loss": 0.6821, - "step": 41348 - }, - { - "epoch": 1.06, - "learning_rate": 1.5001996810056974e-06, - "loss": 0.5094, - "step": 41349 - }, - { - "epoch": 1.06, - "learning_rate": 1.500175720689064e-06, - "loss": 0.7051, - "step": 41350 - }, - { - "epoch": 1.06, - "learning_rate": 1.5001517599894692e-06, - "loss": 0.749, - "step": 41351 - }, - { - "epoch": 1.06, - "learning_rate": 1.5001277989069312e-06, - "loss": 0.4705, - "step": 41352 - }, - { - "epoch": 1.06, - "learning_rate": 1.5001038374414684e-06, - "loss": 0.582, - "step": 41353 - }, - { - "epoch": 1.06, - "learning_rate": 1.5000798755930986e-06, - "loss": 0.7393, - "step": 41354 - }, - { - "epoch": 1.06, - "learning_rate": 1.500055913361841e-06, - "loss": 0.6465, - "step": 41355 - }, - { - "epoch": 1.06, - "learning_rate": 1.5000319507477134e-06, - "loss": 0.4669, - "step": 41356 - }, - { - "epoch": 1.06, - "learning_rate": 1.5000079877507345e-06, - "loss": 0.7236, - "step": 41357 - }, - { - "epoch": 1.06, - "learning_rate": 1.4999840243709226e-06, - "loss": 0.6362, - "step": 41358 - }, - { - "epoch": 1.06, - "learning_rate": 1.4999600606082957e-06, - "loss": 0.8145, - "step": 41359 - }, - { - "epoch": 1.06, - "learning_rate": 1.4999360964628723e-06, - "loss": 0.7061, - "step": 41360 - }, - { - "epoch": 1.06, - "learning_rate": 1.499912131934671e-06, - "loss": 0.6924, - "step": 41361 - }, - { - "epoch": 1.06, - "learning_rate": 1.49988816702371e-06, - "loss": 0.5386, - "step": 41362 - }, - { - "epoch": 1.06, - "learning_rate": 1.4998642017300074e-06, - "loss": 0.5039, - "step": 41363 - }, - { - "epoch": 1.06, - "learning_rate": 1.4998402360535821e-06, - "loss": 0.5682, - "step": 41364 - }, - { - "epoch": 1.06, - "learning_rate": 1.4998162699944517e-06, - "loss": 0.6338, - "step": 41365 - }, - { - "epoch": 1.06, - "learning_rate": 1.4997923035526352e-06, - "loss": 0.6885, - "step": 41366 - }, - { - "epoch": 1.06, - "learning_rate": 1.4997683367281505e-06, - "loss": 0.6064, - "step": 41367 - }, - { - "epoch": 1.06, - "learning_rate": 1.4997443695210167e-06, - "loss": 0.6265, - "step": 41368 - }, - { - "epoch": 1.06, - "learning_rate": 1.4997204019312511e-06, - "loss": 0.6276, - "step": 41369 - }, - { - "epoch": 1.06, - "learning_rate": 1.4996964339588727e-06, - "loss": 0.7065, - "step": 41370 - }, - { - "epoch": 1.06, - "learning_rate": 1.4996724656038997e-06, - "loss": 0.7197, - "step": 41371 - }, - { - "epoch": 1.06, - "learning_rate": 1.4996484968663508e-06, - "loss": 0.7026, - "step": 41372 - }, - { - "epoch": 1.06, - "learning_rate": 1.4996245277462434e-06, - "loss": 0.5566, - "step": 41373 - }, - { - "epoch": 1.06, - "learning_rate": 1.4996005582435968e-06, - "loss": 0.708, - "step": 41374 - }, - { - "epoch": 1.06, - "learning_rate": 1.499576588358429e-06, - "loss": 0.4985, - "step": 41375 - }, - { - "epoch": 1.06, - "learning_rate": 1.4995526180907586e-06, - "loss": 0.6699, - "step": 41376 - }, - { - "epoch": 1.06, - "learning_rate": 1.4995286474406035e-06, - "loss": 0.6191, - "step": 41377 - }, - { - "epoch": 1.06, - "learning_rate": 1.4995046764079821e-06, - "loss": 0.6265, - "step": 41378 - }, - { - "epoch": 1.06, - "learning_rate": 1.4994807049929133e-06, - "loss": 0.5952, - "step": 41379 - }, - { - "epoch": 1.06, - "learning_rate": 1.499456733195415e-06, - "loss": 0.6895, - "step": 41380 - }, - { - "epoch": 1.06, - "learning_rate": 1.4994327610155055e-06, - "loss": 0.582, - "step": 41381 - }, - { - "epoch": 1.06, - "learning_rate": 1.4994087884532034e-06, - "loss": 0.7285, - "step": 41382 - }, - { - "epoch": 1.06, - "learning_rate": 1.4993848155085269e-06, - "loss": 0.7217, - "step": 41383 - }, - { - "epoch": 1.06, - "learning_rate": 1.4993608421814944e-06, - "loss": 0.6021, - "step": 41384 - }, - { - "epoch": 1.06, - "learning_rate": 1.4993368684721244e-06, - "loss": 0.7363, - "step": 41385 - }, - { - "epoch": 1.06, - "learning_rate": 1.4993128943804349e-06, - "loss": 0.6895, - "step": 41386 - }, - { - "epoch": 1.06, - "learning_rate": 1.4992889199064448e-06, - "loss": 0.5649, - "step": 41387 - }, - { - "epoch": 1.06, - "learning_rate": 1.499264945050172e-06, - "loss": 0.625, - "step": 41388 - }, - { - "epoch": 1.06, - "learning_rate": 1.4992409698116348e-06, - "loss": 0.7744, - "step": 41389 - }, - { - "epoch": 1.06, - "learning_rate": 1.499216994190852e-06, - "loss": 0.6541, - "step": 41390 - }, - { - "epoch": 1.06, - "learning_rate": 1.4991930181878417e-06, - "loss": 0.4128, - "step": 41391 - }, - { - "epoch": 1.06, - "learning_rate": 1.499169041802622e-06, - "loss": 0.6143, - "step": 41392 - }, - { - "epoch": 1.06, - "learning_rate": 1.4991450650352119e-06, - "loss": 0.562, - "step": 41393 - }, - { - "epoch": 1.06, - "learning_rate": 1.4991210878856288e-06, - "loss": 0.7256, - "step": 41394 - }, - { - "epoch": 1.06, - "learning_rate": 1.4990971103538921e-06, - "loss": 0.7676, - "step": 41395 - }, - { - "epoch": 1.06, - "learning_rate": 1.4990731324400193e-06, - "loss": 0.686, - "step": 41396 - }, - { - "epoch": 1.06, - "learning_rate": 1.4990491541440299e-06, - "loss": 0.5718, - "step": 41397 - }, - { - "epoch": 1.06, - "learning_rate": 1.4990251754659409e-06, - "loss": 0.6562, - "step": 41398 - }, - { - "epoch": 1.06, - "learning_rate": 1.4990011964057714e-06, - "loss": 0.5648, - "step": 41399 - }, - { - "epoch": 1.06, - "learning_rate": 1.4989772169635395e-06, - "loss": 0.7812, - "step": 41400 - }, - { - "epoch": 1.06, - "learning_rate": 1.498953237139264e-06, - "loss": 0.6455, - "step": 41401 - }, - { - "epoch": 1.06, - "learning_rate": 1.4989292569329625e-06, - "loss": 0.6865, - "step": 41402 - }, - { - "epoch": 1.06, - "learning_rate": 1.498905276344654e-06, - "loss": 0.5457, - "step": 41403 - }, - { - "epoch": 1.06, - "learning_rate": 1.4988812953743568e-06, - "loss": 0.6084, - "step": 41404 - }, - { - "epoch": 1.06, - "learning_rate": 1.498857314022089e-06, - "loss": 0.6807, - "step": 41405 - }, - { - "epoch": 1.06, - "learning_rate": 1.4988333322878692e-06, - "loss": 0.5271, - "step": 41406 - }, - { - "epoch": 1.06, - "learning_rate": 1.4988093501717156e-06, - "loss": 0.6641, - "step": 41407 - }, - { - "epoch": 1.06, - "learning_rate": 1.498785367673647e-06, - "loss": 0.8018, - "step": 41408 - }, - { - "epoch": 1.06, - "learning_rate": 1.4987613847936807e-06, - "loss": 0.6895, - "step": 41409 - }, - { - "epoch": 1.06, - "learning_rate": 1.4987374015318359e-06, - "loss": 0.3518, - "step": 41410 - }, - { - "epoch": 1.06, - "learning_rate": 1.4987134178881312e-06, - "loss": 0.7314, - "step": 41411 - }, - { - "epoch": 1.06, - "learning_rate": 1.4986894338625843e-06, - "loss": 0.6821, - "step": 41412 - }, - { - "epoch": 1.06, - "learning_rate": 1.4986654494552138e-06, - "loss": 0.7949, - "step": 41413 - }, - { - "epoch": 1.06, - "learning_rate": 1.498641464666038e-06, - "loss": 0.623, - "step": 41414 - }, - { - "epoch": 1.06, - "learning_rate": 1.4986174794950754e-06, - "loss": 0.7124, - "step": 41415 - }, - { - "epoch": 1.06, - "learning_rate": 1.4985934939423446e-06, - "loss": 0.8145, - "step": 41416 - }, - { - "epoch": 1.06, - "learning_rate": 1.4985695080078635e-06, - "loss": 0.6704, - "step": 41417 - }, - { - "epoch": 1.06, - "learning_rate": 1.4985455216916509e-06, - "loss": 0.8018, - "step": 41418 - }, - { - "epoch": 1.06, - "learning_rate": 1.4985215349937246e-06, - "loss": 0.6021, - "step": 41419 - }, - { - "epoch": 1.06, - "learning_rate": 1.4984975479141034e-06, - "loss": 0.5583, - "step": 41420 - }, - { - "epoch": 1.06, - "learning_rate": 1.4984735604528053e-06, - "loss": 0.501, - "step": 41421 - }, - { - "epoch": 1.06, - "learning_rate": 1.498449572609849e-06, - "loss": 0.6636, - "step": 41422 - }, - { - "epoch": 1.06, - "learning_rate": 1.4984255843852532e-06, - "loss": 0.5757, - "step": 41423 - }, - { - "epoch": 1.06, - "learning_rate": 1.4984015957790358e-06, - "loss": 0.8193, - "step": 41424 - }, - { - "epoch": 1.06, - "learning_rate": 1.4983776067912145e-06, - "loss": 0.604, - "step": 41425 - }, - { - "epoch": 1.06, - "learning_rate": 1.498353617421809e-06, - "loss": 0.5515, - "step": 41426 - }, - { - "epoch": 1.06, - "learning_rate": 1.498329627670837e-06, - "loss": 0.8125, - "step": 41427 - }, - { - "epoch": 1.06, - "learning_rate": 1.4983056375383167e-06, - "loss": 0.7617, - "step": 41428 - }, - { - "epoch": 1.06, - "learning_rate": 1.498281647024267e-06, - "loss": 0.4036, - "step": 41429 - }, - { - "epoch": 1.06, - "learning_rate": 1.4982576561287056e-06, - "loss": 0.7412, - "step": 41430 - }, - { - "epoch": 1.06, - "learning_rate": 1.4982336648516514e-06, - "loss": 0.6196, - "step": 41431 - }, - { - "epoch": 1.06, - "learning_rate": 1.4982096731931226e-06, - "loss": 0.6362, - "step": 41432 - }, - { - "epoch": 1.06, - "learning_rate": 1.4981856811531378e-06, - "loss": 0.6621, - "step": 41433 - }, - { - "epoch": 1.06, - "learning_rate": 1.4981616887317148e-06, - "loss": 0.7285, - "step": 41434 - }, - { - "epoch": 1.06, - "learning_rate": 1.4981376959288724e-06, - "loss": 0.8096, - "step": 41435 - }, - { - "epoch": 1.06, - "learning_rate": 1.4981137027446286e-06, - "loss": 0.8066, - "step": 41436 - }, - { - "epoch": 1.06, - "learning_rate": 1.4980897091790026e-06, - "loss": 0.6064, - "step": 41437 - }, - { - "epoch": 1.06, - "learning_rate": 1.4980657152320118e-06, - "loss": 0.7178, - "step": 41438 - }, - { - "epoch": 1.06, - "learning_rate": 1.4980417209036751e-06, - "loss": 0.7451, - "step": 41439 - }, - { - "epoch": 1.06, - "learning_rate": 1.4980177261940106e-06, - "loss": 0.604, - "step": 41440 - }, - { - "epoch": 1.06, - "learning_rate": 1.497993731103037e-06, - "loss": 0.5498, - "step": 41441 - }, - { - "epoch": 1.06, - "learning_rate": 1.4979697356307726e-06, - "loss": 0.5134, - "step": 41442 - }, - { - "epoch": 1.06, - "learning_rate": 1.4979457397772354e-06, - "loss": 0.4766, - "step": 41443 - }, - { - "epoch": 1.06, - "learning_rate": 1.4979217435424442e-06, - "loss": 0.6294, - "step": 41444 - }, - { - "epoch": 1.06, - "learning_rate": 1.497897746926417e-06, - "loss": 0.655, - "step": 41445 - }, - { - "epoch": 1.06, - "learning_rate": 1.4978737499291727e-06, - "loss": 0.7773, - "step": 41446 - }, - { - "epoch": 1.06, - "learning_rate": 1.497849752550729e-06, - "loss": 0.5762, - "step": 41447 - }, - { - "epoch": 1.06, - "learning_rate": 1.4978257547911054e-06, - "loss": 0.5662, - "step": 41448 - }, - { - "epoch": 1.06, - "learning_rate": 1.4978017566503188e-06, - "loss": 0.6509, - "step": 41449 - }, - { - "epoch": 1.06, - "learning_rate": 1.4977777581283887e-06, - "loss": 0.5474, - "step": 41450 - }, - { - "epoch": 1.06, - "learning_rate": 1.4977537592253327e-06, - "loss": 0.5825, - "step": 41451 - }, - { - "epoch": 1.06, - "learning_rate": 1.4977297599411696e-06, - "loss": 0.6924, - "step": 41452 - }, - { - "epoch": 1.06, - "learning_rate": 1.4977057602759178e-06, - "loss": 0.6797, - "step": 41453 - }, - { - "epoch": 1.06, - "learning_rate": 1.4976817602295957e-06, - "loss": 0.6675, - "step": 41454 - }, - { - "epoch": 1.06, - "learning_rate": 1.4976577598022214e-06, - "loss": 0.6094, - "step": 41455 - }, - { - "epoch": 1.06, - "learning_rate": 1.4976337589938133e-06, - "loss": 0.7627, - "step": 41456 - }, - { - "epoch": 1.06, - "learning_rate": 1.4976097578043901e-06, - "loss": 0.5693, - "step": 41457 - }, - { - "epoch": 1.06, - "learning_rate": 1.49758575623397e-06, - "loss": 0.3447, - "step": 41458 - }, - { - "epoch": 1.06, - "learning_rate": 1.497561754282571e-06, - "loss": 0.6089, - "step": 41459 - }, - { - "epoch": 1.06, - "learning_rate": 1.4975377519502127e-06, - "loss": 0.5181, - "step": 41460 - }, - { - "epoch": 1.06, - "learning_rate": 1.4975137492369116e-06, - "loss": 0.7373, - "step": 41461 - }, - { - "epoch": 1.06, - "learning_rate": 1.4974897461426881e-06, - "loss": 0.6055, - "step": 41462 - }, - { - "epoch": 1.06, - "learning_rate": 1.497465742667559e-06, - "loss": 0.6631, - "step": 41463 - }, - { - "epoch": 1.06, - "learning_rate": 1.4974417388115432e-06, - "loss": 0.6172, - "step": 41464 - }, - { - "epoch": 1.06, - "learning_rate": 1.4974177345746593e-06, - "loss": 0.6699, - "step": 41465 - }, - { - "epoch": 1.06, - "learning_rate": 1.4973937299569252e-06, - "loss": 0.7393, - "step": 41466 - }, - { - "epoch": 1.06, - "learning_rate": 1.49736972495836e-06, - "loss": 0.6675, - "step": 41467 - }, - { - "epoch": 1.06, - "learning_rate": 1.4973457195789815e-06, - "loss": 0.7803, - "step": 41468 - }, - { - "epoch": 1.06, - "learning_rate": 1.4973217138188083e-06, - "loss": 0.6973, - "step": 41469 - }, - { - "epoch": 1.06, - "learning_rate": 1.4972977076778588e-06, - "loss": 0.7549, - "step": 41470 - }, - { - "epoch": 1.06, - "learning_rate": 1.4972737011561512e-06, - "loss": 0.6377, - "step": 41471 - }, - { - "epoch": 1.06, - "learning_rate": 1.497249694253704e-06, - "loss": 0.667, - "step": 41472 - }, - { - "epoch": 1.06, - "learning_rate": 1.4972256869705357e-06, - "loss": 0.6982, - "step": 41473 - }, - { - "epoch": 1.06, - "learning_rate": 1.4972016793066641e-06, - "loss": 0.5723, - "step": 41474 - }, - { - "epoch": 1.06, - "learning_rate": 1.4971776712621087e-06, - "loss": 0.5896, - "step": 41475 - }, - { - "epoch": 1.06, - "learning_rate": 1.4971536628368866e-06, - "loss": 0.5933, - "step": 41476 - }, - { - "epoch": 1.06, - "learning_rate": 1.4971296540310175e-06, - "loss": 0.5605, - "step": 41477 - }, - { - "epoch": 1.06, - "learning_rate": 1.4971056448445185e-06, - "loss": 0.5103, - "step": 41478 - }, - { - "epoch": 1.06, - "learning_rate": 1.497081635277409e-06, - "loss": 0.4292, - "step": 41479 - }, - { - "epoch": 1.06, - "learning_rate": 1.4970576253297065e-06, - "loss": 0.5977, - "step": 41480 - }, - { - "epoch": 1.06, - "learning_rate": 1.49703361500143e-06, - "loss": 0.501, - "step": 41481 - }, - { - "epoch": 1.06, - "learning_rate": 1.497009604292598e-06, - "loss": 0.6548, - "step": 41482 - }, - { - "epoch": 1.06, - "learning_rate": 1.4969855932032282e-06, - "loss": 0.7197, - "step": 41483 - }, - { - "epoch": 1.06, - "learning_rate": 1.4969615817333394e-06, - "loss": 0.7988, - "step": 41484 - }, - { - "epoch": 1.06, - "learning_rate": 1.4969375698829501e-06, - "loss": 0.6826, - "step": 41485 - }, - { - "epoch": 1.06, - "learning_rate": 1.4969135576520783e-06, - "loss": 0.5371, - "step": 41486 - }, - { - "epoch": 1.06, - "learning_rate": 1.4968895450407432e-06, - "loss": 0.6899, - "step": 41487 - }, - { - "epoch": 1.06, - "learning_rate": 1.4968655320489622e-06, - "loss": 0.7256, - "step": 41488 - }, - { - "epoch": 1.06, - "learning_rate": 1.4968415186767542e-06, - "loss": 0.6211, - "step": 41489 - }, - { - "epoch": 1.06, - "learning_rate": 1.4968175049241377e-06, - "loss": 0.6128, - "step": 41490 - }, - { - "epoch": 1.06, - "learning_rate": 1.4967934907911306e-06, - "loss": 0.5215, - "step": 41491 - }, - { - "epoch": 1.06, - "learning_rate": 1.4967694762777517e-06, - "loss": 0.6553, - "step": 41492 - }, - { - "epoch": 1.06, - "learning_rate": 1.4967454613840192e-06, - "loss": 0.6057, - "step": 41493 - }, - { - "epoch": 1.06, - "learning_rate": 1.4967214461099515e-06, - "loss": 0.96, - "step": 41494 - }, - { - "epoch": 1.06, - "learning_rate": 1.496697430455567e-06, - "loss": 0.7305, - "step": 41495 - }, - { - "epoch": 1.06, - "learning_rate": 1.4966734144208842e-06, - "loss": 0.645, - "step": 41496 - }, - { - "epoch": 1.06, - "learning_rate": 1.4966493980059216e-06, - "loss": 0.7461, - "step": 41497 - }, - { - "epoch": 1.06, - "learning_rate": 1.496625381210697e-06, - "loss": 0.4624, - "step": 41498 - }, - { - "epoch": 1.06, - "learning_rate": 1.4966013640352294e-06, - "loss": 0.7798, - "step": 41499 - }, - { - "epoch": 1.06, - "learning_rate": 1.496577346479537e-06, - "loss": 0.7295, - "step": 41500 - }, - { - "epoch": 1.06, - "learning_rate": 1.4965533285436381e-06, - "loss": 0.709, - "step": 41501 - }, - { - "epoch": 1.06, - "learning_rate": 1.4965293102275514e-06, - "loss": 0.6772, - "step": 41502 - }, - { - "epoch": 1.06, - "learning_rate": 1.4965052915312947e-06, - "loss": 0.6729, - "step": 41503 - }, - { - "epoch": 1.06, - "learning_rate": 1.4964812724548868e-06, - "loss": 0.7812, - "step": 41504 - }, - { - "epoch": 1.06, - "learning_rate": 1.496457252998346e-06, - "loss": 0.7383, - "step": 41505 - }, - { - "epoch": 1.06, - "learning_rate": 1.496433233161691e-06, - "loss": 0.7031, - "step": 41506 - }, - { - "epoch": 1.06, - "learning_rate": 1.4964092129449393e-06, - "loss": 0.7173, - "step": 41507 - }, - { - "epoch": 1.06, - "learning_rate": 1.4963851923481103e-06, - "loss": 0.3887, - "step": 41508 - }, - { - "epoch": 1.06, - "learning_rate": 1.4963611713712218e-06, - "loss": 0.6064, - "step": 41509 - }, - { - "epoch": 1.06, - "learning_rate": 1.4963371500142925e-06, - "loss": 0.5459, - "step": 41510 - }, - { - "epoch": 1.06, - "learning_rate": 1.496313128277341e-06, - "loss": 0.6689, - "step": 41511 - }, - { - "epoch": 1.06, - "learning_rate": 1.496289106160385e-06, - "loss": 0.7134, - "step": 41512 - }, - { - "epoch": 1.06, - "learning_rate": 1.496265083663443e-06, - "loss": 0.6172, - "step": 41513 - }, - { - "epoch": 1.06, - "learning_rate": 1.4962410607865339e-06, - "loss": 0.7109, - "step": 41514 - }, - { - "epoch": 1.06, - "learning_rate": 1.4962170375296758e-06, - "loss": 0.6411, - "step": 41515 - }, - { - "epoch": 1.06, - "learning_rate": 1.4961930138928874e-06, - "loss": 0.7661, - "step": 41516 - }, - { - "epoch": 1.06, - "learning_rate": 1.4961689898761866e-06, - "loss": 0.7378, - "step": 41517 - }, - { - "epoch": 1.06, - "learning_rate": 1.4961449654795919e-06, - "loss": 0.6108, - "step": 41518 - }, - { - "epoch": 1.06, - "learning_rate": 1.496120940703122e-06, - "loss": 0.7139, - "step": 41519 - }, - { - "epoch": 1.06, - "learning_rate": 1.4960969155467948e-06, - "loss": 0.8672, - "step": 41520 - }, - { - "epoch": 1.06, - "learning_rate": 1.4960728900106297e-06, - "loss": 0.7334, - "step": 41521 - }, - { - "epoch": 1.06, - "learning_rate": 1.4960488640946438e-06, - "loss": 0.5369, - "step": 41522 - }, - { - "epoch": 1.06, - "learning_rate": 1.4960248377988562e-06, - "loss": 0.8369, - "step": 41523 - }, - { - "epoch": 1.06, - "learning_rate": 1.496000811123285e-06, - "loss": 0.7314, - "step": 41524 - }, - { - "epoch": 1.06, - "learning_rate": 1.4959767840679492e-06, - "loss": 0.5894, - "step": 41525 - }, - { - "epoch": 1.06, - "learning_rate": 1.4959527566328667e-06, - "loss": 0.512, - "step": 41526 - }, - { - "epoch": 1.06, - "learning_rate": 1.495928728818056e-06, - "loss": 0.6709, - "step": 41527 - }, - { - "epoch": 1.06, - "learning_rate": 1.495904700623535e-06, - "loss": 0.7456, - "step": 41528 - }, - { - "epoch": 1.06, - "learning_rate": 1.495880672049323e-06, - "loss": 0.6768, - "step": 41529 - }, - { - "epoch": 1.06, - "learning_rate": 1.495856643095438e-06, - "loss": 0.7627, - "step": 41530 - }, - { - "epoch": 1.06, - "learning_rate": 1.4958326137618985e-06, - "loss": 0.7021, - "step": 41531 - }, - { - "epoch": 1.06, - "learning_rate": 1.4958085840487225e-06, - "loss": 0.6216, - "step": 41532 - }, - { - "epoch": 1.06, - "learning_rate": 1.4957845539559287e-06, - "loss": 0.7168, - "step": 41533 - }, - { - "epoch": 1.06, - "learning_rate": 1.4957605234835353e-06, - "loss": 0.7832, - "step": 41534 - }, - { - "epoch": 1.06, - "learning_rate": 1.495736492631561e-06, - "loss": 0.5513, - "step": 41535 - }, - { - "epoch": 1.06, - "learning_rate": 1.4957124614000241e-06, - "loss": 0.6201, - "step": 41536 - }, - { - "epoch": 1.06, - "learning_rate": 1.495688429788943e-06, - "loss": 0.709, - "step": 41537 - }, - { - "epoch": 1.06, - "learning_rate": 1.495664397798336e-06, - "loss": 0.7275, - "step": 41538 - }, - { - "epoch": 1.06, - "learning_rate": 1.4956403654282214e-06, - "loss": 0.7002, - "step": 41539 - }, - { - "epoch": 1.06, - "learning_rate": 1.4956163326786179e-06, - "loss": 0.58, - "step": 41540 - }, - { - "epoch": 1.06, - "learning_rate": 1.495592299549544e-06, - "loss": 0.793, - "step": 41541 - }, - { - "epoch": 1.06, - "learning_rate": 1.4955682660410176e-06, - "loss": 0.5601, - "step": 41542 - }, - { - "epoch": 1.06, - "learning_rate": 1.4955442321530574e-06, - "loss": 0.521, - "step": 41543 - }, - { - "epoch": 1.06, - "learning_rate": 1.495520197885682e-06, - "loss": 0.7471, - "step": 41544 - }, - { - "epoch": 1.06, - "learning_rate": 1.495496163238909e-06, - "loss": 0.665, - "step": 41545 - }, - { - "epoch": 1.06, - "learning_rate": 1.495472128212758e-06, - "loss": 0.7505, - "step": 41546 - }, - { - "epoch": 1.06, - "learning_rate": 1.4954480928072464e-06, - "loss": 0.7783, - "step": 41547 - }, - { - "epoch": 1.06, - "learning_rate": 1.4954240570223933e-06, - "loss": 0.6064, - "step": 41548 - }, - { - "epoch": 1.06, - "learning_rate": 1.4954000208582163e-06, - "loss": 0.489, - "step": 41549 - }, - { - "epoch": 1.06, - "learning_rate": 1.4953759843147346e-06, - "loss": 0.7744, - "step": 41550 - }, - { - "epoch": 1.06, - "learning_rate": 1.4953519473919664e-06, - "loss": 0.6934, - "step": 41551 - }, - { - "epoch": 1.06, - "learning_rate": 1.4953279100899298e-06, - "loss": 0.707, - "step": 41552 - }, - { - "epoch": 1.07, - "learning_rate": 1.4953038724086434e-06, - "loss": 0.6084, - "step": 41553 - }, - { - "epoch": 1.07, - "learning_rate": 1.4952798343481257e-06, - "loss": 0.5947, - "step": 41554 - }, - { - "epoch": 1.07, - "learning_rate": 1.4952557959083947e-06, - "loss": 0.6348, - "step": 41555 - }, - { - "epoch": 1.07, - "learning_rate": 1.4952317570894695e-06, - "loss": 0.7354, - "step": 41556 - }, - { - "epoch": 1.07, - "learning_rate": 1.4952077178913677e-06, - "loss": 0.5366, - "step": 41557 - }, - { - "epoch": 1.07, - "learning_rate": 1.4951836783141086e-06, - "loss": 0.6416, - "step": 41558 - }, - { - "epoch": 1.07, - "learning_rate": 1.4951596383577099e-06, - "loss": 0.5903, - "step": 41559 - }, - { - "epoch": 1.07, - "learning_rate": 1.4951355980221902e-06, - "loss": 0.7217, - "step": 41560 - }, - { - "epoch": 1.07, - "learning_rate": 1.495111557307568e-06, - "loss": 0.52, - "step": 41561 - }, - { - "epoch": 1.07, - "learning_rate": 1.4950875162138615e-06, - "loss": 0.7007, - "step": 41562 - }, - { - "epoch": 1.07, - "learning_rate": 1.4950634747410896e-06, - "loss": 0.7432, - "step": 41563 - }, - { - "epoch": 1.07, - "learning_rate": 1.49503943288927e-06, - "loss": 0.7285, - "step": 41564 - }, - { - "epoch": 1.07, - "learning_rate": 1.4950153906584216e-06, - "loss": 0.7256, - "step": 41565 - }, - { - "epoch": 1.07, - "learning_rate": 1.4949913480485628e-06, - "loss": 0.73, - "step": 41566 - }, - { - "epoch": 1.07, - "learning_rate": 1.4949673050597116e-06, - "loss": 0.6494, - "step": 41567 - }, - { - "epoch": 1.07, - "learning_rate": 1.494943261691887e-06, - "loss": 0.6782, - "step": 41568 - }, - { - "epoch": 1.07, - "learning_rate": 1.4949192179451069e-06, - "loss": 0.5757, - "step": 41569 - }, - { - "epoch": 1.07, - "learning_rate": 1.4948951738193899e-06, - "loss": 0.748, - "step": 41570 - }, - { - "epoch": 1.07, - "learning_rate": 1.4948711293147548e-06, - "loss": 0.7539, - "step": 41571 - }, - { - "epoch": 1.07, - "learning_rate": 1.4948470844312192e-06, - "loss": 0.6777, - "step": 41572 - }, - { - "epoch": 1.07, - "learning_rate": 1.494823039168802e-06, - "loss": 0.5796, - "step": 41573 - }, - { - "epoch": 1.07, - "learning_rate": 1.4947989935275214e-06, - "loss": 0.603, - "step": 41574 - }, - { - "epoch": 1.07, - "learning_rate": 1.4947749475073964e-06, - "loss": 0.6826, - "step": 41575 - }, - { - "epoch": 1.07, - "learning_rate": 1.4947509011084447e-06, - "loss": 0.6638, - "step": 41576 - }, - { - "epoch": 1.07, - "learning_rate": 1.4947268543306851e-06, - "loss": 0.5757, - "step": 41577 - }, - { - "epoch": 1.07, - "learning_rate": 1.4947028071741358e-06, - "loss": 0.5508, - "step": 41578 - }, - { - "epoch": 1.07, - "learning_rate": 1.4946787596388153e-06, - "loss": 0.6494, - "step": 41579 - }, - { - "epoch": 1.07, - "learning_rate": 1.494654711724742e-06, - "loss": 0.6353, - "step": 41580 - }, - { - "epoch": 1.07, - "learning_rate": 1.4946306634319343e-06, - "loss": 0.6689, - "step": 41581 - }, - { - "epoch": 1.07, - "learning_rate": 1.4946066147604108e-06, - "loss": 0.3774, - "step": 41582 - }, - { - "epoch": 1.07, - "learning_rate": 1.4945825657101895e-06, - "loss": 0.7549, - "step": 41583 - }, - { - "epoch": 1.07, - "learning_rate": 1.4945585162812894e-06, - "loss": 0.585, - "step": 41584 - }, - { - "epoch": 1.07, - "learning_rate": 1.4945344664737283e-06, - "loss": 0.6392, - "step": 41585 - }, - { - "epoch": 1.07, - "learning_rate": 1.4945104162875253e-06, - "loss": 0.6904, - "step": 41586 - }, - { - "epoch": 1.07, - "learning_rate": 1.494486365722698e-06, - "loss": 0.5527, - "step": 41587 - }, - { - "epoch": 1.07, - "learning_rate": 1.4944623147792656e-06, - "loss": 0.7002, - "step": 41588 - }, - { - "epoch": 1.07, - "learning_rate": 1.4944382634572458e-06, - "loss": 0.5947, - "step": 41589 - }, - { - "epoch": 1.07, - "learning_rate": 1.4944142117566573e-06, - "loss": 0.6309, - "step": 41590 - }, - { - "epoch": 1.07, - "learning_rate": 1.494390159677519e-06, - "loss": 0.6426, - "step": 41591 - }, - { - "epoch": 1.07, - "learning_rate": 1.4943661072198487e-06, - "loss": 0.6748, - "step": 41592 - }, - { - "epoch": 1.07, - "learning_rate": 1.494342054383665e-06, - "loss": 0.8389, - "step": 41593 - }, - { - "epoch": 1.07, - "learning_rate": 1.4943180011689863e-06, - "loss": 0.6797, - "step": 41594 - }, - { - "epoch": 1.07, - "learning_rate": 1.4942939475758308e-06, - "loss": 0.5854, - "step": 41595 - }, - { - "epoch": 1.07, - "learning_rate": 1.4942698936042176e-06, - "loss": 0.7588, - "step": 41596 - }, - { - "epoch": 1.07, - "learning_rate": 1.494245839254164e-06, - "loss": 0.6553, - "step": 41597 - }, - { - "epoch": 1.07, - "learning_rate": 1.4942217845256897e-06, - "loss": 0.875, - "step": 41598 - }, - { - "epoch": 1.07, - "learning_rate": 1.4941977294188122e-06, - "loss": 0.6904, - "step": 41599 - }, - { - "epoch": 1.07, - "learning_rate": 1.4941736739335505e-06, - "loss": 0.7324, - "step": 41600 - }, - { - "epoch": 1.07, - "learning_rate": 1.4941496180699226e-06, - "loss": 0.5, - "step": 41601 - }, - { - "epoch": 1.07, - "learning_rate": 1.4941255618279469e-06, - "loss": 0.6338, - "step": 41602 - }, - { - "epoch": 1.07, - "learning_rate": 1.4941015052076422e-06, - "loss": 0.7441, - "step": 41603 - }, - { - "epoch": 1.07, - "learning_rate": 1.4940774482090265e-06, - "loss": 0.6875, - "step": 41604 - }, - { - "epoch": 1.07, - "learning_rate": 1.4940533908321187e-06, - "loss": 0.6538, - "step": 41605 - }, - { - "epoch": 1.07, - "learning_rate": 1.4940293330769366e-06, - "loss": 0.7275, - "step": 41606 - }, - { - "epoch": 1.07, - "learning_rate": 1.4940052749434993e-06, - "loss": 0.7148, - "step": 41607 - }, - { - "epoch": 1.07, - "learning_rate": 1.4939812164318247e-06, - "loss": 0.7646, - "step": 41608 - }, - { - "epoch": 1.07, - "learning_rate": 1.4939571575419314e-06, - "loss": 0.5688, - "step": 41609 - }, - { - "epoch": 1.07, - "learning_rate": 1.4939330982738377e-06, - "loss": 0.6279, - "step": 41610 - }, - { - "epoch": 1.07, - "learning_rate": 1.4939090386275624e-06, - "loss": 0.7559, - "step": 41611 - }, - { - "epoch": 1.07, - "learning_rate": 1.4938849786031234e-06, - "loss": 0.5771, - "step": 41612 - }, - { - "epoch": 1.07, - "learning_rate": 1.4938609182005394e-06, - "loss": 0.5469, - "step": 41613 - }, - { - "epoch": 1.07, - "learning_rate": 1.4938368574198289e-06, - "loss": 0.7598, - "step": 41614 - }, - { - "epoch": 1.07, - "learning_rate": 1.4938127962610103e-06, - "loss": 0.645, - "step": 41615 - }, - { - "epoch": 1.07, - "learning_rate": 1.4937887347241018e-06, - "loss": 0.479, - "step": 41616 - }, - { - "epoch": 1.07, - "learning_rate": 1.4937646728091223e-06, - "loss": 0.7031, - "step": 41617 - }, - { - "epoch": 1.07, - "learning_rate": 1.4937406105160895e-06, - "loss": 0.6528, - "step": 41618 - }, - { - "epoch": 1.07, - "learning_rate": 1.4937165478450223e-06, - "loss": 0.4648, - "step": 41619 - }, - { - "epoch": 1.07, - "learning_rate": 1.493692484795939e-06, - "loss": 0.7773, - "step": 41620 - }, - { - "epoch": 1.07, - "learning_rate": 1.4936684213688584e-06, - "loss": 0.8271, - "step": 41621 - }, - { - "epoch": 1.07, - "learning_rate": 1.4936443575637983e-06, - "loss": 0.6289, - "step": 41622 - }, - { - "epoch": 1.07, - "learning_rate": 1.4936202933807773e-06, - "loss": 0.7412, - "step": 41623 - }, - { - "epoch": 1.07, - "learning_rate": 1.493596228819814e-06, - "loss": 0.4797, - "step": 41624 - }, - { - "epoch": 1.07, - "learning_rate": 1.4935721638809269e-06, - "loss": 0.5742, - "step": 41625 - }, - { - "epoch": 1.07, - "learning_rate": 1.4935480985641345e-06, - "loss": 0.7959, - "step": 41626 - }, - { - "epoch": 1.07, - "learning_rate": 1.4935240328694544e-06, - "loss": 0.6431, - "step": 41627 - }, - { - "epoch": 1.07, - "learning_rate": 1.4934999667969062e-06, - "loss": 0.4561, - "step": 41628 - }, - { - "epoch": 1.07, - "learning_rate": 1.4934759003465074e-06, - "loss": 0.624, - "step": 41629 - }, - { - "epoch": 1.07, - "learning_rate": 1.493451833518277e-06, - "loss": 0.7939, - "step": 41630 - }, - { - "epoch": 1.07, - "learning_rate": 1.4934277663122332e-06, - "loss": 0.7793, - "step": 41631 - }, - { - "epoch": 1.07, - "learning_rate": 1.4934036987283946e-06, - "loss": 0.5767, - "step": 41632 - }, - { - "epoch": 1.07, - "learning_rate": 1.493379630766779e-06, - "loss": 0.6611, - "step": 41633 - }, - { - "epoch": 1.07, - "learning_rate": 1.493355562427406e-06, - "loss": 0.5885, - "step": 41634 - }, - { - "epoch": 1.07, - "learning_rate": 1.4933314937102926e-06, - "loss": 0.707, - "step": 41635 - }, - { - "epoch": 1.07, - "learning_rate": 1.4933074246154586e-06, - "loss": 0.666, - "step": 41636 - }, - { - "epoch": 1.07, - "learning_rate": 1.4932833551429214e-06, - "loss": 0.6382, - "step": 41637 - }, - { - "epoch": 1.07, - "learning_rate": 1.4932592852927e-06, - "loss": 0.8574, - "step": 41638 - }, - { - "epoch": 1.07, - "learning_rate": 1.4932352150648125e-06, - "loss": 0.7119, - "step": 41639 - }, - { - "epoch": 1.07, - "learning_rate": 1.4932111444592775e-06, - "loss": 0.7021, - "step": 41640 - }, - { - "epoch": 1.07, - "learning_rate": 1.4931870734761134e-06, - "loss": 0.584, - "step": 41641 - }, - { - "epoch": 1.07, - "learning_rate": 1.4931630021153388e-06, - "loss": 0.6205, - "step": 41642 - }, - { - "epoch": 1.07, - "learning_rate": 1.4931389303769717e-06, - "loss": 0.667, - "step": 41643 - }, - { - "epoch": 1.07, - "learning_rate": 1.4931148582610308e-06, - "loss": 0.7144, - "step": 41644 - }, - { - "epoch": 1.07, - "learning_rate": 1.4930907857675345e-06, - "loss": 0.7754, - "step": 41645 - }, - { - "epoch": 1.07, - "learning_rate": 1.4930667128965015e-06, - "loss": 0.5442, - "step": 41646 - }, - { - "epoch": 1.07, - "learning_rate": 1.49304263964795e-06, - "loss": 0.7764, - "step": 41647 - }, - { - "epoch": 1.07, - "learning_rate": 1.4930185660218983e-06, - "loss": 0.7461, - "step": 41648 - }, - { - "epoch": 1.07, - "learning_rate": 1.492994492018365e-06, - "loss": 0.5488, - "step": 41649 - }, - { - "epoch": 1.07, - "learning_rate": 1.4929704176373685e-06, - "loss": 0.5464, - "step": 41650 - }, - { - "epoch": 1.07, - "learning_rate": 1.4929463428789272e-06, - "loss": 0.4419, - "step": 41651 - }, - { - "epoch": 1.07, - "learning_rate": 1.4929222677430596e-06, - "loss": 0.6641, - "step": 41652 - }, - { - "epoch": 1.07, - "learning_rate": 1.492898192229784e-06, - "loss": 0.636, - "step": 41653 - }, - { - "epoch": 1.07, - "learning_rate": 1.4928741163391188e-06, - "loss": 0.4785, - "step": 41654 - }, - { - "epoch": 1.07, - "learning_rate": 1.4928500400710828e-06, - "loss": 0.7109, - "step": 41655 - }, - { - "epoch": 1.07, - "learning_rate": 1.4928259634256942e-06, - "loss": 0.5408, - "step": 41656 - }, - { - "epoch": 1.07, - "learning_rate": 1.4928018864029713e-06, - "loss": 0.6299, - "step": 41657 - }, - { - "epoch": 1.07, - "learning_rate": 1.4927778090029324e-06, - "loss": 0.646, - "step": 41658 - }, - { - "epoch": 1.07, - "learning_rate": 1.4927537312255967e-06, - "loss": 0.7236, - "step": 41659 - }, - { - "epoch": 1.07, - "learning_rate": 1.4927296530709816e-06, - "loss": 0.8037, - "step": 41660 - }, - { - "epoch": 1.07, - "learning_rate": 1.4927055745391066e-06, - "loss": 0.4487, - "step": 41661 - }, - { - "epoch": 1.07, - "learning_rate": 1.492681495629989e-06, - "loss": 0.5522, - "step": 41662 - }, - { - "epoch": 1.07, - "learning_rate": 1.4926574163436485e-06, - "loss": 0.5688, - "step": 41663 - }, - { - "epoch": 1.07, - "learning_rate": 1.4926333366801024e-06, - "loss": 0.7656, - "step": 41664 - }, - { - "epoch": 1.07, - "learning_rate": 1.4926092566393697e-06, - "loss": 0.6318, - "step": 41665 - }, - { - "epoch": 1.07, - "learning_rate": 1.492585176221469e-06, - "loss": 0.7471, - "step": 41666 - }, - { - "epoch": 1.07, - "learning_rate": 1.4925610954264181e-06, - "loss": 0.6748, - "step": 41667 - }, - { - "epoch": 1.07, - "learning_rate": 1.492537014254236e-06, - "loss": 0.5645, - "step": 41668 - }, - { - "epoch": 1.07, - "learning_rate": 1.4925129327049409e-06, - "loss": 0.8018, - "step": 41669 - }, - { - "epoch": 1.07, - "learning_rate": 1.4924888507785513e-06, - "loss": 0.8936, - "step": 41670 - }, - { - "epoch": 1.07, - "learning_rate": 1.4924647684750857e-06, - "loss": 0.8926, - "step": 41671 - }, - { - "epoch": 1.07, - "learning_rate": 1.4924406857945624e-06, - "loss": 0.6758, - "step": 41672 - }, - { - "epoch": 1.07, - "learning_rate": 1.4924166027369997e-06, - "loss": 0.6958, - "step": 41673 - }, - { - "epoch": 1.07, - "learning_rate": 1.4923925193024168e-06, - "loss": 0.6289, - "step": 41674 - }, - { - "epoch": 1.07, - "learning_rate": 1.492368435490831e-06, - "loss": 0.6816, - "step": 41675 - }, - { - "epoch": 1.07, - "learning_rate": 1.492344351302262e-06, - "loss": 0.6323, - "step": 41676 - }, - { - "epoch": 1.07, - "learning_rate": 1.492320266736727e-06, - "loss": 0.6172, - "step": 41677 - }, - { - "epoch": 1.07, - "learning_rate": 1.4922961817942451e-06, - "loss": 0.6885, - "step": 41678 - }, - { - "epoch": 1.07, - "learning_rate": 1.4922720964748345e-06, - "loss": 0.8594, - "step": 41679 - }, - { - "epoch": 1.07, - "learning_rate": 1.4922480107785143e-06, - "loss": 0.79, - "step": 41680 - }, - { - "epoch": 1.07, - "learning_rate": 1.4922239247053022e-06, - "loss": 0.7051, - "step": 41681 - }, - { - "epoch": 1.07, - "learning_rate": 1.492199838255217e-06, - "loss": 0.6504, - "step": 41682 - }, - { - "epoch": 1.07, - "learning_rate": 1.4921757514282765e-06, - "loss": 0.6978, - "step": 41683 - }, - { - "epoch": 1.07, - "learning_rate": 1.4921516642245002e-06, - "loss": 0.5483, - "step": 41684 - }, - { - "epoch": 1.07, - "learning_rate": 1.4921275766439057e-06, - "loss": 0.7158, - "step": 41685 - }, - { - "epoch": 1.07, - "learning_rate": 1.492103488686512e-06, - "loss": 0.5518, - "step": 41686 - }, - { - "epoch": 1.07, - "learning_rate": 1.492079400352337e-06, - "loss": 0.4708, - "step": 41687 - }, - { - "epoch": 1.07, - "learning_rate": 1.4920553116413997e-06, - "loss": 0.5195, - "step": 41688 - }, - { - "epoch": 1.07, - "learning_rate": 1.492031222553718e-06, - "loss": 0.6548, - "step": 41689 - }, - { - "epoch": 1.07, - "learning_rate": 1.4920071330893107e-06, - "loss": 0.5996, - "step": 41690 - }, - { - "epoch": 1.07, - "learning_rate": 1.4919830432481964e-06, - "loss": 0.6167, - "step": 41691 - }, - { - "epoch": 1.07, - "learning_rate": 1.491958953030393e-06, - "loss": 0.6445, - "step": 41692 - }, - { - "epoch": 1.07, - "learning_rate": 1.4919348624359195e-06, - "loss": 0.5537, - "step": 41693 - }, - { - "epoch": 1.07, - "learning_rate": 1.4919107714647937e-06, - "loss": 0.7063, - "step": 41694 - }, - { - "epoch": 1.07, - "learning_rate": 1.4918866801170346e-06, - "loss": 0.6523, - "step": 41695 - }, - { - "epoch": 1.07, - "learning_rate": 1.4918625883926608e-06, - "loss": 0.5083, - "step": 41696 - }, - { - "epoch": 1.07, - "learning_rate": 1.4918384962916903e-06, - "loss": 0.3982, - "step": 41697 - }, - { - "epoch": 1.07, - "learning_rate": 1.4918144038141413e-06, - "loss": 0.7842, - "step": 41698 - }, - { - "epoch": 1.07, - "learning_rate": 1.4917903109600331e-06, - "loss": 0.8232, - "step": 41699 - }, - { - "epoch": 1.07, - "learning_rate": 1.4917662177293835e-06, - "loss": 0.665, - "step": 41700 - }, - { - "epoch": 1.07, - "learning_rate": 1.4917421241222114e-06, - "loss": 0.6094, - "step": 41701 - }, - { - "epoch": 1.07, - "learning_rate": 1.4917180301385344e-06, - "loss": 0.7148, - "step": 41702 - }, - { - "epoch": 1.07, - "learning_rate": 1.491693935778372e-06, - "loss": 0.7246, - "step": 41703 - }, - { - "epoch": 1.07, - "learning_rate": 1.4916698410417418e-06, - "loss": 0.6582, - "step": 41704 - }, - { - "epoch": 1.07, - "learning_rate": 1.4916457459286629e-06, - "loss": 0.6943, - "step": 41705 - }, - { - "epoch": 1.07, - "learning_rate": 1.4916216504391531e-06, - "loss": 0.7539, - "step": 41706 - }, - { - "epoch": 1.07, - "learning_rate": 1.4915975545732317e-06, - "loss": 0.5225, - "step": 41707 - }, - { - "epoch": 1.07, - "learning_rate": 1.4915734583309164e-06, - "loss": 0.7275, - "step": 41708 - }, - { - "epoch": 1.07, - "learning_rate": 1.4915493617122258e-06, - "loss": 0.6611, - "step": 41709 - }, - { - "epoch": 1.07, - "learning_rate": 1.4915252647171785e-06, - "loss": 0.665, - "step": 41710 - }, - { - "epoch": 1.07, - "learning_rate": 1.491501167345793e-06, - "loss": 0.7246, - "step": 41711 - }, - { - "epoch": 1.07, - "learning_rate": 1.4914770695980876e-06, - "loss": 0.519, - "step": 41712 - }, - { - "epoch": 1.07, - "learning_rate": 1.491452971474081e-06, - "loss": 0.5977, - "step": 41713 - }, - { - "epoch": 1.07, - "learning_rate": 1.4914288729737912e-06, - "loss": 0.5356, - "step": 41714 - }, - { - "epoch": 1.07, - "learning_rate": 1.491404774097237e-06, - "loss": 0.5596, - "step": 41715 - }, - { - "epoch": 1.07, - "learning_rate": 1.4913806748444368e-06, - "loss": 0.8066, - "step": 41716 - }, - { - "epoch": 1.07, - "learning_rate": 1.4913565752154087e-06, - "loss": 0.5991, - "step": 41717 - }, - { - "epoch": 1.07, - "learning_rate": 1.491332475210172e-06, - "loss": 0.6074, - "step": 41718 - }, - { - "epoch": 1.07, - "learning_rate": 1.4913083748287441e-06, - "loss": 0.4719, - "step": 41719 - }, - { - "epoch": 1.07, - "learning_rate": 1.4912842740711441e-06, - "loss": 0.5559, - "step": 41720 - }, - { - "epoch": 1.07, - "learning_rate": 1.4912601729373906e-06, - "loss": 0.5442, - "step": 41721 - }, - { - "epoch": 1.07, - "learning_rate": 1.4912360714275019e-06, - "loss": 0.5618, - "step": 41722 - }, - { - "epoch": 1.07, - "learning_rate": 1.4912119695414958e-06, - "loss": 0.7275, - "step": 41723 - }, - { - "epoch": 1.07, - "learning_rate": 1.4911878672793916e-06, - "loss": 0.7773, - "step": 41724 - }, - { - "epoch": 1.07, - "learning_rate": 1.4911637646412072e-06, - "loss": 0.9468, - "step": 41725 - }, - { - "epoch": 1.07, - "learning_rate": 1.4911396616269615e-06, - "loss": 0.6167, - "step": 41726 - }, - { - "epoch": 1.07, - "learning_rate": 1.4911155582366728e-06, - "loss": 0.5669, - "step": 41727 - }, - { - "epoch": 1.07, - "learning_rate": 1.4910914544703594e-06, - "loss": 0.6309, - "step": 41728 - }, - { - "epoch": 1.07, - "learning_rate": 1.4910673503280395e-06, - "loss": 0.7197, - "step": 41729 - }, - { - "epoch": 1.07, - "learning_rate": 1.4910432458097324e-06, - "loss": 0.5957, - "step": 41730 - }, - { - "epoch": 1.07, - "learning_rate": 1.491019140915456e-06, - "loss": 0.6953, - "step": 41731 - }, - { - "epoch": 1.07, - "learning_rate": 1.4909950356452287e-06, - "loss": 0.6338, - "step": 41732 - }, - { - "epoch": 1.07, - "learning_rate": 1.4909709299990691e-06, - "loss": 0.791, - "step": 41733 - }, - { - "epoch": 1.07, - "learning_rate": 1.4909468239769959e-06, - "loss": 0.7412, - "step": 41734 - }, - { - "epoch": 1.07, - "learning_rate": 1.4909227175790266e-06, - "loss": 0.626, - "step": 41735 - }, - { - "epoch": 1.07, - "learning_rate": 1.490898610805181e-06, - "loss": 0.6621, - "step": 41736 - }, - { - "epoch": 1.07, - "learning_rate": 1.4908745036554766e-06, - "loss": 0.7148, - "step": 41737 - }, - { - "epoch": 1.07, - "learning_rate": 1.4908503961299324e-06, - "loss": 0.6089, - "step": 41738 - }, - { - "epoch": 1.07, - "learning_rate": 1.4908262882285664e-06, - "loss": 0.6401, - "step": 41739 - }, - { - "epoch": 1.07, - "learning_rate": 1.4908021799513975e-06, - "loss": 0.6309, - "step": 41740 - }, - { - "epoch": 1.07, - "learning_rate": 1.4907780712984438e-06, - "loss": 0.6626, - "step": 41741 - }, - { - "epoch": 1.07, - "learning_rate": 1.490753962269724e-06, - "loss": 0.5771, - "step": 41742 - }, - { - "epoch": 1.07, - "learning_rate": 1.490729852865256e-06, - "loss": 0.7539, - "step": 41743 - }, - { - "epoch": 1.07, - "learning_rate": 1.4907057430850592e-06, - "loss": 0.873, - "step": 41744 - }, - { - "epoch": 1.07, - "learning_rate": 1.4906816329291514e-06, - "loss": 0.5703, - "step": 41745 - }, - { - "epoch": 1.07, - "learning_rate": 1.4906575223975516e-06, - "loss": 0.7861, - "step": 41746 - }, - { - "epoch": 1.07, - "learning_rate": 1.4906334114902774e-06, - "loss": 0.6172, - "step": 41747 - }, - { - "epoch": 1.07, - "learning_rate": 1.4906093002073478e-06, - "loss": 0.4729, - "step": 41748 - }, - { - "epoch": 1.07, - "learning_rate": 1.4905851885487814e-06, - "loss": 0.7178, - "step": 41749 - }, - { - "epoch": 1.07, - "learning_rate": 1.4905610765145965e-06, - "loss": 0.665, - "step": 41750 - }, - { - "epoch": 1.07, - "learning_rate": 1.4905369641048116e-06, - "loss": 0.7197, - "step": 41751 - }, - { - "epoch": 1.07, - "learning_rate": 1.4905128513194448e-06, - "loss": 0.6836, - "step": 41752 - }, - { - "epoch": 1.07, - "learning_rate": 1.4904887381585152e-06, - "loss": 0.7153, - "step": 41753 - }, - { - "epoch": 1.07, - "learning_rate": 1.4904646246220404e-06, - "loss": 0.7803, - "step": 41754 - }, - { - "epoch": 1.07, - "learning_rate": 1.49044051071004e-06, - "loss": 0.751, - "step": 41755 - }, - { - "epoch": 1.07, - "learning_rate": 1.4904163964225315e-06, - "loss": 0.6709, - "step": 41756 - }, - { - "epoch": 1.07, - "learning_rate": 1.490392281759534e-06, - "loss": 0.5449, - "step": 41757 - }, - { - "epoch": 1.07, - "learning_rate": 1.4903681667210653e-06, - "loss": 0.5425, - "step": 41758 - }, - { - "epoch": 1.07, - "learning_rate": 1.4903440513071445e-06, - "loss": 0.5708, - "step": 41759 - }, - { - "epoch": 1.07, - "learning_rate": 1.4903199355177895e-06, - "loss": 0.5353, - "step": 41760 - }, - { - "epoch": 1.07, - "learning_rate": 1.4902958193530195e-06, - "loss": 0.7461, - "step": 41761 - }, - { - "epoch": 1.07, - "learning_rate": 1.4902717028128524e-06, - "loss": 0.8672, - "step": 41762 - }, - { - "epoch": 1.07, - "learning_rate": 1.4902475858973068e-06, - "loss": 0.7686, - "step": 41763 - }, - { - "epoch": 1.07, - "learning_rate": 1.490223468606401e-06, - "loss": 0.7188, - "step": 41764 - }, - { - "epoch": 1.07, - "learning_rate": 1.4901993509401535e-06, - "loss": 0.438, - "step": 41765 - }, - { - "epoch": 1.07, - "learning_rate": 1.4901752328985835e-06, - "loss": 0.5953, - "step": 41766 - }, - { - "epoch": 1.07, - "learning_rate": 1.4901511144817085e-06, - "loss": 0.6382, - "step": 41767 - }, - { - "epoch": 1.07, - "learning_rate": 1.4901269956895472e-06, - "loss": 0.5697, - "step": 41768 - }, - { - "epoch": 1.07, - "learning_rate": 1.4901028765221183e-06, - "loss": 0.5781, - "step": 41769 - }, - { - "epoch": 1.07, - "learning_rate": 1.4900787569794402e-06, - "loss": 0.4413, - "step": 41770 - }, - { - "epoch": 1.07, - "learning_rate": 1.4900546370615315e-06, - "loss": 0.7471, - "step": 41771 - }, - { - "epoch": 1.07, - "learning_rate": 1.4900305167684104e-06, - "loss": 0.7373, - "step": 41772 - }, - { - "epoch": 1.07, - "learning_rate": 1.4900063961000952e-06, - "loss": 0.6924, - "step": 41773 - }, - { - "epoch": 1.07, - "learning_rate": 1.489982275056605e-06, - "loss": 0.5596, - "step": 41774 - }, - { - "epoch": 1.07, - "learning_rate": 1.4899581536379575e-06, - "loss": 0.7139, - "step": 41775 - }, - { - "epoch": 1.07, - "learning_rate": 1.489934031844172e-06, - "loss": 0.5732, - "step": 41776 - }, - { - "epoch": 1.07, - "learning_rate": 1.4899099096752663e-06, - "loss": 0.5972, - "step": 41777 - }, - { - "epoch": 1.07, - "learning_rate": 1.4898857871312591e-06, - "loss": 0.7578, - "step": 41778 - }, - { - "epoch": 1.07, - "learning_rate": 1.4898616642121688e-06, - "loss": 0.748, - "step": 41779 - }, - { - "epoch": 1.07, - "learning_rate": 1.4898375409180142e-06, - "loss": 0.6963, - "step": 41780 - }, - { - "epoch": 1.07, - "learning_rate": 1.4898134172488136e-06, - "loss": 0.688, - "step": 41781 - }, - { - "epoch": 1.07, - "learning_rate": 1.4897892932045849e-06, - "loss": 0.7236, - "step": 41782 - }, - { - "epoch": 1.07, - "learning_rate": 1.4897651687853473e-06, - "loss": 0.627, - "step": 41783 - }, - { - "epoch": 1.07, - "learning_rate": 1.4897410439911192e-06, - "loss": 0.6582, - "step": 41784 - }, - { - "epoch": 1.07, - "learning_rate": 1.4897169188219185e-06, - "loss": 0.5158, - "step": 41785 - }, - { - "epoch": 1.07, - "learning_rate": 1.4896927932777645e-06, - "loss": 0.6021, - "step": 41786 - }, - { - "epoch": 1.07, - "learning_rate": 1.489668667358675e-06, - "loss": 0.4599, - "step": 41787 - }, - { - "epoch": 1.07, - "learning_rate": 1.4896445410646688e-06, - "loss": 0.8564, - "step": 41788 - }, - { - "epoch": 1.07, - "learning_rate": 1.4896204143957645e-06, - "loss": 0.708, - "step": 41789 - }, - { - "epoch": 1.07, - "learning_rate": 1.48959628735198e-06, - "loss": 0.7676, - "step": 41790 - }, - { - "epoch": 1.07, - "learning_rate": 1.4895721599333344e-06, - "loss": 0.5881, - "step": 41791 - }, - { - "epoch": 1.07, - "learning_rate": 1.4895480321398456e-06, - "loss": 0.6777, - "step": 41792 - }, - { - "epoch": 1.07, - "learning_rate": 1.489523903971533e-06, - "loss": 0.7793, - "step": 41793 - }, - { - "epoch": 1.07, - "learning_rate": 1.4894997754284138e-06, - "loss": 0.6895, - "step": 41794 - }, - { - "epoch": 1.07, - "learning_rate": 1.4894756465105074e-06, - "loss": 0.7148, - "step": 41795 - }, - { - "epoch": 1.07, - "learning_rate": 1.489451517217832e-06, - "loss": 0.8672, - "step": 41796 - }, - { - "epoch": 1.07, - "learning_rate": 1.489427387550406e-06, - "loss": 0.6826, - "step": 41797 - }, - { - "epoch": 1.07, - "learning_rate": 1.489403257508248e-06, - "loss": 0.5647, - "step": 41798 - }, - { - "epoch": 1.07, - "learning_rate": 1.4893791270913765e-06, - "loss": 0.5542, - "step": 41799 - }, - { - "epoch": 1.07, - "learning_rate": 1.4893549962998097e-06, - "loss": 0.4858, - "step": 41800 - }, - { - "epoch": 1.07, - "learning_rate": 1.4893308651335662e-06, - "loss": 0.6943, - "step": 41801 - }, - { - "epoch": 1.07, - "learning_rate": 1.489306733592665e-06, - "loss": 0.4407, - "step": 41802 - }, - { - "epoch": 1.07, - "learning_rate": 1.489282601677124e-06, - "loss": 0.2802, - "step": 41803 - }, - { - "epoch": 1.07, - "learning_rate": 1.4892584693869616e-06, - "loss": 0.7139, - "step": 41804 - }, - { - "epoch": 1.07, - "learning_rate": 1.4892343367221967e-06, - "loss": 0.6733, - "step": 41805 - }, - { - "epoch": 1.07, - "learning_rate": 1.4892102036828476e-06, - "loss": 0.751, - "step": 41806 - }, - { - "epoch": 1.07, - "learning_rate": 1.4891860702689325e-06, - "loss": 0.4595, - "step": 41807 - }, - { - "epoch": 1.07, - "learning_rate": 1.4891619364804702e-06, - "loss": 0.7134, - "step": 41808 - }, - { - "epoch": 1.07, - "learning_rate": 1.489137802317479e-06, - "loss": 0.6738, - "step": 41809 - }, - { - "epoch": 1.07, - "learning_rate": 1.4891136677799778e-06, - "loss": 0.7979, - "step": 41810 - }, - { - "epoch": 1.07, - "learning_rate": 1.4890895328679845e-06, - "loss": 0.7471, - "step": 41811 - }, - { - "epoch": 1.07, - "learning_rate": 1.489065397581518e-06, - "loss": 0.6904, - "step": 41812 - }, - { - "epoch": 1.07, - "learning_rate": 1.4890412619205964e-06, - "loss": 0.584, - "step": 41813 - }, - { - "epoch": 1.07, - "learning_rate": 1.4890171258852384e-06, - "loss": 0.835, - "step": 41814 - }, - { - "epoch": 1.07, - "learning_rate": 1.4889929894754626e-06, - "loss": 0.7681, - "step": 41815 - }, - { - "epoch": 1.07, - "learning_rate": 1.4889688526912875e-06, - "loss": 0.7705, - "step": 41816 - }, - { - "epoch": 1.07, - "learning_rate": 1.4889447155327311e-06, - "loss": 0.5972, - "step": 41817 - }, - { - "epoch": 1.07, - "learning_rate": 1.4889205779998123e-06, - "loss": 0.7344, - "step": 41818 - }, - { - "epoch": 1.07, - "learning_rate": 1.4888964400925494e-06, - "loss": 0.5732, - "step": 41819 - }, - { - "epoch": 1.07, - "learning_rate": 1.4888723018109615e-06, - "loss": 0.625, - "step": 41820 - }, - { - "epoch": 1.07, - "learning_rate": 1.488848163155066e-06, - "loss": 0.3882, - "step": 41821 - }, - { - "epoch": 1.07, - "learning_rate": 1.4888240241248822e-06, - "loss": 0.6313, - "step": 41822 - }, - { - "epoch": 1.07, - "learning_rate": 1.4887998847204282e-06, - "loss": 0.7354, - "step": 41823 - }, - { - "epoch": 1.07, - "learning_rate": 1.4887757449417227e-06, - "loss": 0.6567, - "step": 41824 - }, - { - "epoch": 1.07, - "learning_rate": 1.488751604788784e-06, - "loss": 0.6836, - "step": 41825 - }, - { - "epoch": 1.07, - "learning_rate": 1.4887274642616308e-06, - "loss": 0.7373, - "step": 41826 - }, - { - "epoch": 1.07, - "learning_rate": 1.4887033233602814e-06, - "loss": 0.7246, - "step": 41827 - }, - { - "epoch": 1.07, - "learning_rate": 1.4886791820847542e-06, - "loss": 0.8145, - "step": 41828 - }, - { - "epoch": 1.07, - "learning_rate": 1.4886550404350679e-06, - "loss": 0.6016, - "step": 41829 - }, - { - "epoch": 1.07, - "learning_rate": 1.488630898411241e-06, - "loss": 0.71, - "step": 41830 - }, - { - "epoch": 1.07, - "learning_rate": 1.4886067560132918e-06, - "loss": 0.8369, - "step": 41831 - }, - { - "epoch": 1.07, - "learning_rate": 1.4885826132412388e-06, - "loss": 0.7285, - "step": 41832 - }, - { - "epoch": 1.07, - "learning_rate": 1.4885584700951008e-06, - "loss": 0.7383, - "step": 41833 - }, - { - "epoch": 1.07, - "learning_rate": 1.4885343265748957e-06, - "loss": 0.5518, - "step": 41834 - }, - { - "epoch": 1.07, - "learning_rate": 1.4885101826806428e-06, - "loss": 0.6016, - "step": 41835 - }, - { - "epoch": 1.07, - "learning_rate": 1.4884860384123596e-06, - "loss": 0.7139, - "step": 41836 - }, - { - "epoch": 1.07, - "learning_rate": 1.4884618937700656e-06, - "loss": 0.7754, - "step": 41837 - }, - { - "epoch": 1.07, - "learning_rate": 1.4884377487537782e-06, - "loss": 0.707, - "step": 41838 - }, - { - "epoch": 1.07, - "learning_rate": 1.4884136033635168e-06, - "loss": 0.7881, - "step": 41839 - }, - { - "epoch": 1.07, - "learning_rate": 1.4883894575993e-06, - "loss": 0.3092, - "step": 41840 - }, - { - "epoch": 1.07, - "learning_rate": 1.4883653114611451e-06, - "loss": 0.7646, - "step": 41841 - }, - { - "epoch": 1.07, - "learning_rate": 1.4883411649490717e-06, - "loss": 0.6406, - "step": 41842 - }, - { - "epoch": 1.07, - "learning_rate": 1.488317018063098e-06, - "loss": 0.584, - "step": 41843 - }, - { - "epoch": 1.07, - "learning_rate": 1.4882928708032422e-06, - "loss": 0.7314, - "step": 41844 - }, - { - "epoch": 1.07, - "learning_rate": 1.488268723169523e-06, - "loss": 0.749, - "step": 41845 - }, - { - "epoch": 1.07, - "learning_rate": 1.488244575161959e-06, - "loss": 0.5767, - "step": 41846 - }, - { - "epoch": 1.07, - "learning_rate": 1.4882204267805688e-06, - "loss": 0.5923, - "step": 41847 - }, - { - "epoch": 1.07, - "learning_rate": 1.4881962780253702e-06, - "loss": 0.7012, - "step": 41848 - }, - { - "epoch": 1.07, - "learning_rate": 1.4881721288963825e-06, - "loss": 0.6514, - "step": 41849 - }, - { - "epoch": 1.07, - "learning_rate": 1.4881479793936235e-06, - "loss": 0.6177, - "step": 41850 - }, - { - "epoch": 1.07, - "learning_rate": 1.4881238295171123e-06, - "loss": 0.665, - "step": 41851 - }, - { - "epoch": 1.07, - "learning_rate": 1.4880996792668673e-06, - "loss": 0.6943, - "step": 41852 - }, - { - "epoch": 1.07, - "learning_rate": 1.4880755286429062e-06, - "loss": 0.5811, - "step": 41853 - }, - { - "epoch": 1.07, - "learning_rate": 1.4880513776452488e-06, - "loss": 0.8086, - "step": 41854 - }, - { - "epoch": 1.07, - "learning_rate": 1.4880272262739127e-06, - "loss": 0.5933, - "step": 41855 - }, - { - "epoch": 1.07, - "learning_rate": 1.4880030745289165e-06, - "loss": 0.6777, - "step": 41856 - }, - { - "epoch": 1.07, - "learning_rate": 1.4879789224102788e-06, - "loss": 0.5605, - "step": 41857 - }, - { - "epoch": 1.07, - "learning_rate": 1.487954769918018e-06, - "loss": 0.7393, - "step": 41858 - }, - { - "epoch": 1.07, - "learning_rate": 1.4879306170521526e-06, - "loss": 0.5464, - "step": 41859 - }, - { - "epoch": 1.07, - "learning_rate": 1.4879064638127017e-06, - "loss": 0.5249, - "step": 41860 - }, - { - "epoch": 1.07, - "learning_rate": 1.4878823101996827e-06, - "loss": 0.6099, - "step": 41861 - }, - { - "epoch": 1.07, - "learning_rate": 1.487858156213115e-06, - "loss": 0.6611, - "step": 41862 - }, - { - "epoch": 1.07, - "learning_rate": 1.4878340018530161e-06, - "loss": 0.7842, - "step": 41863 - }, - { - "epoch": 1.07, - "learning_rate": 1.4878098471194058e-06, - "loss": 0.6885, - "step": 41864 - }, - { - "epoch": 1.07, - "learning_rate": 1.4877856920123018e-06, - "loss": 0.7197, - "step": 41865 - }, - { - "epoch": 1.07, - "learning_rate": 1.4877615365317228e-06, - "loss": 0.4634, - "step": 41866 - }, - { - "epoch": 1.07, - "learning_rate": 1.487737380677687e-06, - "loss": 0.5483, - "step": 41867 - }, - { - "epoch": 1.07, - "learning_rate": 1.4877132244502131e-06, - "loss": 0.625, - "step": 41868 - }, - { - "epoch": 1.07, - "learning_rate": 1.4876890678493195e-06, - "loss": 0.6201, - "step": 41869 - }, - { - "epoch": 1.07, - "learning_rate": 1.4876649108750252e-06, - "loss": 0.709, - "step": 41870 - }, - { - "epoch": 1.07, - "learning_rate": 1.4876407535273482e-06, - "loss": 0.6133, - "step": 41871 - }, - { - "epoch": 1.07, - "learning_rate": 1.4876165958063067e-06, - "loss": 0.7041, - "step": 41872 - }, - { - "epoch": 1.07, - "learning_rate": 1.48759243771192e-06, - "loss": 0.6362, - "step": 41873 - }, - { - "epoch": 1.07, - "learning_rate": 1.487568279244206e-06, - "loss": 0.751, - "step": 41874 - }, - { - "epoch": 1.07, - "learning_rate": 1.4875441204031838e-06, - "loss": 0.5938, - "step": 41875 - }, - { - "epoch": 1.07, - "learning_rate": 1.4875199611888708e-06, - "loss": 0.6616, - "step": 41876 - }, - { - "epoch": 1.07, - "learning_rate": 1.4874958016012865e-06, - "loss": 0.6821, - "step": 41877 - }, - { - "epoch": 1.07, - "learning_rate": 1.4874716416404493e-06, - "loss": 0.7148, - "step": 41878 - }, - { - "epoch": 1.07, - "learning_rate": 1.4874474813063772e-06, - "loss": 0.8066, - "step": 41879 - }, - { - "epoch": 1.07, - "learning_rate": 1.487423320599089e-06, - "loss": 0.6899, - "step": 41880 - }, - { - "epoch": 1.07, - "learning_rate": 1.4873991595186035e-06, - "loss": 0.5864, - "step": 41881 - }, - { - "epoch": 1.07, - "learning_rate": 1.4873749980649385e-06, - "loss": 0.7178, - "step": 41882 - }, - { - "epoch": 1.07, - "learning_rate": 1.4873508362381131e-06, - "loss": 0.6277, - "step": 41883 - }, - { - "epoch": 1.07, - "learning_rate": 1.4873266740381454e-06, - "loss": 0.6597, - "step": 41884 - }, - { - "epoch": 1.07, - "learning_rate": 1.4873025114650544e-06, - "loss": 0.7637, - "step": 41885 - }, - { - "epoch": 1.07, - "learning_rate": 1.4872783485188578e-06, - "loss": 0.5664, - "step": 41886 - }, - { - "epoch": 1.07, - "learning_rate": 1.4872541851995748e-06, - "loss": 0.5452, - "step": 41887 - }, - { - "epoch": 1.07, - "learning_rate": 1.4872300215072235e-06, - "loss": 0.6904, - "step": 41888 - }, - { - "epoch": 1.07, - "learning_rate": 1.4872058574418229e-06, - "loss": 0.3972, - "step": 41889 - }, - { - "epoch": 1.07, - "learning_rate": 1.4871816930033912e-06, - "loss": 0.6895, - "step": 41890 - }, - { - "epoch": 1.07, - "learning_rate": 1.4871575281919464e-06, - "loss": 0.4902, - "step": 41891 - }, - { - "epoch": 1.07, - "learning_rate": 1.487133363007508e-06, - "loss": 0.5049, - "step": 41892 - }, - { - "epoch": 1.07, - "learning_rate": 1.4871091974500938e-06, - "loss": 0.7354, - "step": 41893 - }, - { - "epoch": 1.07, - "learning_rate": 1.4870850315197224e-06, - "loss": 0.4302, - "step": 41894 - }, - { - "epoch": 1.07, - "learning_rate": 1.4870608652164122e-06, - "loss": 0.7803, - "step": 41895 - }, - { - "epoch": 1.07, - "learning_rate": 1.4870366985401824e-06, - "loss": 0.5481, - "step": 41896 - }, - { - "epoch": 1.07, - "learning_rate": 1.4870125314910506e-06, - "loss": 0.6328, - "step": 41897 - }, - { - "epoch": 1.07, - "learning_rate": 1.486988364069036e-06, - "loss": 0.6509, - "step": 41898 - }, - { - "epoch": 1.07, - "learning_rate": 1.4869641962741565e-06, - "loss": 0.6309, - "step": 41899 - }, - { - "epoch": 1.07, - "learning_rate": 1.486940028106431e-06, - "loss": 0.7998, - "step": 41900 - }, - { - "epoch": 1.07, - "learning_rate": 1.4869158595658779e-06, - "loss": 0.6553, - "step": 41901 - }, - { - "epoch": 1.07, - "learning_rate": 1.4868916906525157e-06, - "loss": 0.4331, - "step": 41902 - }, - { - "epoch": 1.07, - "learning_rate": 1.486867521366363e-06, - "loss": 0.8115, - "step": 41903 - }, - { - "epoch": 1.07, - "learning_rate": 1.4868433517074382e-06, - "loss": 0.5479, - "step": 41904 - }, - { - "epoch": 1.07, - "learning_rate": 1.4868191816757598e-06, - "loss": 0.6699, - "step": 41905 - }, - { - "epoch": 1.07, - "learning_rate": 1.4867950112713465e-06, - "loss": 0.5781, - "step": 41906 - }, - { - "epoch": 1.07, - "learning_rate": 1.4867708404942164e-06, - "loss": 0.708, - "step": 41907 - }, - { - "epoch": 1.07, - "learning_rate": 1.4867466693443884e-06, - "loss": 0.7036, - "step": 41908 - }, - { - "epoch": 1.07, - "learning_rate": 1.4867224978218808e-06, - "loss": 0.6748, - "step": 41909 - }, - { - "epoch": 1.07, - "learning_rate": 1.4866983259267123e-06, - "loss": 0.7891, - "step": 41910 - }, - { - "epoch": 1.07, - "learning_rate": 1.486674153658901e-06, - "loss": 0.5693, - "step": 41911 - }, - { - "epoch": 1.07, - "learning_rate": 1.486649981018466e-06, - "loss": 0.7119, - "step": 41912 - }, - { - "epoch": 1.07, - "learning_rate": 1.4866258080054254e-06, - "loss": 0.7773, - "step": 41913 - }, - { - "epoch": 1.07, - "learning_rate": 1.4866016346197976e-06, - "loss": 0.7324, - "step": 41914 - }, - { - "epoch": 1.07, - "learning_rate": 1.4865774608616013e-06, - "loss": 0.6567, - "step": 41915 - }, - { - "epoch": 1.07, - "learning_rate": 1.4865532867308552e-06, - "loss": 0.7095, - "step": 41916 - }, - { - "epoch": 1.07, - "learning_rate": 1.4865291122275777e-06, - "loss": 0.623, - "step": 41917 - }, - { - "epoch": 1.07, - "learning_rate": 1.4865049373517869e-06, - "loss": 0.6055, - "step": 41918 - }, - { - "epoch": 1.07, - "learning_rate": 1.4864807621035019e-06, - "loss": 0.6709, - "step": 41919 - }, - { - "epoch": 1.07, - "learning_rate": 1.4864565864827407e-06, - "loss": 0.8232, - "step": 41920 - }, - { - "epoch": 1.07, - "learning_rate": 1.4864324104895225e-06, - "loss": 0.6414, - "step": 41921 - }, - { - "epoch": 1.07, - "learning_rate": 1.4864082341238649e-06, - "loss": 0.707, - "step": 41922 - }, - { - "epoch": 1.07, - "learning_rate": 1.486384057385787e-06, - "loss": 0.5718, - "step": 41923 - }, - { - "epoch": 1.07, - "learning_rate": 1.4863598802753073e-06, - "loss": 0.8096, - "step": 41924 - }, - { - "epoch": 1.07, - "learning_rate": 1.4863357027924444e-06, - "loss": 0.6094, - "step": 41925 - }, - { - "epoch": 1.07, - "learning_rate": 1.4863115249372163e-06, - "loss": 0.6895, - "step": 41926 - }, - { - "epoch": 1.07, - "learning_rate": 1.4862873467096418e-06, - "loss": 0.5781, - "step": 41927 - }, - { - "epoch": 1.07, - "learning_rate": 1.4862631681097396e-06, - "loss": 0.6777, - "step": 41928 - }, - { - "epoch": 1.07, - "learning_rate": 1.486238989137528e-06, - "loss": 0.5205, - "step": 41929 - }, - { - "epoch": 1.07, - "learning_rate": 1.4862148097930256e-06, - "loss": 0.7627, - "step": 41930 - }, - { - "epoch": 1.07, - "learning_rate": 1.4861906300762507e-06, - "loss": 0.7305, - "step": 41931 - }, - { - "epoch": 1.07, - "learning_rate": 1.4861664499872222e-06, - "loss": 0.7354, - "step": 41932 - }, - { - "epoch": 1.07, - "learning_rate": 1.4861422695259585e-06, - "loss": 0.5077, - "step": 41933 - }, - { - "epoch": 1.07, - "learning_rate": 1.4861180886924776e-06, - "loss": 0.7119, - "step": 41934 - }, - { - "epoch": 1.07, - "learning_rate": 1.4860939074867988e-06, - "loss": 0.8135, - "step": 41935 - }, - { - "epoch": 1.07, - "learning_rate": 1.48606972590894e-06, - "loss": 0.6768, - "step": 41936 - }, - { - "epoch": 1.07, - "learning_rate": 1.4860455439589203e-06, - "loss": 0.7373, - "step": 41937 - }, - { - "epoch": 1.07, - "learning_rate": 1.4860213616367576e-06, - "loss": 0.6255, - "step": 41938 - }, - { - "epoch": 1.07, - "learning_rate": 1.4859971789424709e-06, - "loss": 0.6875, - "step": 41939 - }, - { - "epoch": 1.07, - "learning_rate": 1.4859729958760784e-06, - "loss": 0.6504, - "step": 41940 - }, - { - "epoch": 1.07, - "learning_rate": 1.4859488124375985e-06, - "loss": 0.6162, - "step": 41941 - }, - { - "epoch": 1.07, - "learning_rate": 1.4859246286270502e-06, - "loss": 0.7881, - "step": 41942 - }, - { - "epoch": 1.08, - "learning_rate": 1.4859004444444515e-06, - "loss": 0.6006, - "step": 41943 - }, - { - "epoch": 1.08, - "learning_rate": 1.4858762598898214e-06, - "loss": 0.583, - "step": 41944 - }, - { - "epoch": 1.08, - "learning_rate": 1.4858520749631781e-06, - "loss": 0.4937, - "step": 41945 - }, - { - "epoch": 1.08, - "learning_rate": 1.4858278896645404e-06, - "loss": 0.7861, - "step": 41946 - }, - { - "epoch": 1.08, - "learning_rate": 1.4858037039939265e-06, - "loss": 0.7056, - "step": 41947 - }, - { - "epoch": 1.08, - "learning_rate": 1.485779517951355e-06, - "loss": 0.6709, - "step": 41948 - }, - { - "epoch": 1.08, - "learning_rate": 1.4857553315368443e-06, - "loss": 0.6367, - "step": 41949 - }, - { - "epoch": 1.08, - "learning_rate": 1.4857311447504135e-06, - "loss": 0.769, - "step": 41950 - }, - { - "epoch": 1.08, - "learning_rate": 1.4857069575920804e-06, - "loss": 0.4055, - "step": 41951 - }, - { - "epoch": 1.08, - "learning_rate": 1.4856827700618639e-06, - "loss": 0.582, - "step": 41952 - }, - { - "epoch": 1.08, - "learning_rate": 1.4856585821597823e-06, - "loss": 0.5582, - "step": 41953 - }, - { - "epoch": 1.08, - "learning_rate": 1.4856343938858545e-06, - "loss": 0.7192, - "step": 41954 - }, - { - "epoch": 1.08, - "learning_rate": 1.4856102052400986e-06, - "loss": 0.6763, - "step": 41955 - }, - { - "epoch": 1.08, - "learning_rate": 1.4855860162225332e-06, - "loss": 0.6709, - "step": 41956 - }, - { - "epoch": 1.08, - "learning_rate": 1.485561826833177e-06, - "loss": 0.7031, - "step": 41957 - }, - { - "epoch": 1.08, - "learning_rate": 1.4855376370720487e-06, - "loss": 0.6807, - "step": 41958 - }, - { - "epoch": 1.08, - "learning_rate": 1.485513446939166e-06, - "loss": 0.5718, - "step": 41959 - }, - { - "epoch": 1.08, - "learning_rate": 1.4854892564345484e-06, - "loss": 0.7236, - "step": 41960 - }, - { - "epoch": 1.08, - "learning_rate": 1.485465065558214e-06, - "loss": 0.8721, - "step": 41961 - }, - { - "epoch": 1.08, - "learning_rate": 1.4854408743101812e-06, - "loss": 0.6895, - "step": 41962 - }, - { - "epoch": 1.08, - "learning_rate": 1.4854166826904688e-06, - "loss": 0.6514, - "step": 41963 - }, - { - "epoch": 1.08, - "learning_rate": 1.485392490699095e-06, - "loss": 0.7373, - "step": 41964 - }, - { - "epoch": 1.08, - "learning_rate": 1.4853682983360787e-06, - "loss": 0.563, - "step": 41965 - }, - { - "epoch": 1.08, - "learning_rate": 1.4853441056014376e-06, - "loss": 0.6455, - "step": 41966 - }, - { - "epoch": 1.08, - "learning_rate": 1.4853199124951916e-06, - "loss": 0.4392, - "step": 41967 - }, - { - "epoch": 1.08, - "learning_rate": 1.4852957190173578e-06, - "loss": 0.5444, - "step": 41968 - }, - { - "epoch": 1.08, - "learning_rate": 1.485271525167956e-06, - "loss": 0.5957, - "step": 41969 - }, - { - "epoch": 1.08, - "learning_rate": 1.4852473309470037e-06, - "loss": 0.625, - "step": 41970 - }, - { - "epoch": 1.08, - "learning_rate": 1.4852231363545202e-06, - "loss": 0.7441, - "step": 41971 - }, - { - "epoch": 1.08, - "learning_rate": 1.4851989413905233e-06, - "loss": 0.6733, - "step": 41972 - }, - { - "epoch": 1.08, - "learning_rate": 1.4851747460550322e-06, - "loss": 0.5386, - "step": 41973 - }, - { - "epoch": 1.08, - "learning_rate": 1.4851505503480646e-06, - "loss": 0.7373, - "step": 41974 - }, - { - "epoch": 1.08, - "learning_rate": 1.4851263542696399e-06, - "loss": 0.8125, - "step": 41975 - }, - { - "epoch": 1.08, - "learning_rate": 1.4851021578197761e-06, - "loss": 0.5791, - "step": 41976 - }, - { - "epoch": 1.08, - "learning_rate": 1.4850779609984923e-06, - "loss": 0.4792, - "step": 41977 - }, - { - "epoch": 1.08, - "learning_rate": 1.485053763805806e-06, - "loss": 0.7393, - "step": 41978 - }, - { - "epoch": 1.08, - "learning_rate": 1.4850295662417367e-06, - "loss": 0.6597, - "step": 41979 - }, - { - "epoch": 1.08, - "learning_rate": 1.4850053683063023e-06, - "loss": 0.5229, - "step": 41980 - }, - { - "epoch": 1.08, - "learning_rate": 1.484981169999522e-06, - "loss": 0.5625, - "step": 41981 - }, - { - "epoch": 1.08, - "learning_rate": 1.4849569713214137e-06, - "loss": 0.6738, - "step": 41982 - }, - { - "epoch": 1.08, - "learning_rate": 1.4849327722719963e-06, - "loss": 0.7969, - "step": 41983 - }, - { - "epoch": 1.08, - "learning_rate": 1.4849085728512877e-06, - "loss": 0.6299, - "step": 41984 - }, - { - "epoch": 1.08, - "learning_rate": 1.4848843730593073e-06, - "loss": 0.5039, - "step": 41985 - }, - { - "epoch": 1.08, - "learning_rate": 1.4848601728960733e-06, - "loss": 0.6055, - "step": 41986 - }, - { - "epoch": 1.08, - "learning_rate": 1.4848359723616037e-06, - "loss": 0.5308, - "step": 41987 - }, - { - "epoch": 1.08, - "learning_rate": 1.4848117714559178e-06, - "loss": 0.916, - "step": 41988 - }, - { - "epoch": 1.08, - "learning_rate": 1.4847875701790337e-06, - "loss": 0.7119, - "step": 41989 - }, - { - "epoch": 1.08, - "learning_rate": 1.4847633685309707e-06, - "loss": 0.4678, - "step": 41990 - }, - { - "epoch": 1.08, - "learning_rate": 1.484739166511746e-06, - "loss": 0.6589, - "step": 41991 - }, - { - "epoch": 1.08, - "learning_rate": 1.484714964121379e-06, - "loss": 0.6626, - "step": 41992 - }, - { - "epoch": 1.08, - "learning_rate": 1.4846907613598876e-06, - "loss": 0.5366, - "step": 41993 - }, - { - "epoch": 1.08, - "learning_rate": 1.4846665582272913e-06, - "loss": 0.8652, - "step": 41994 - }, - { - "epoch": 1.08, - "learning_rate": 1.484642354723608e-06, - "loss": 0.5137, - "step": 41995 - }, - { - "epoch": 1.08, - "learning_rate": 1.4846181508488565e-06, - "loss": 0.8223, - "step": 41996 - }, - { - "epoch": 1.08, - "learning_rate": 1.4845939466030548e-06, - "loss": 0.6245, - "step": 41997 - }, - { - "epoch": 1.08, - "learning_rate": 1.484569741986222e-06, - "loss": 0.561, - "step": 41998 - }, - { - "epoch": 1.08, - "learning_rate": 1.484545536998376e-06, - "loss": 0.4436, - "step": 41999 - }, - { - "epoch": 1.08, - "learning_rate": 1.4845213316395367e-06, - "loss": 0.7236, - "step": 42000 - }, - { - "epoch": 1.08, - "learning_rate": 1.484497125909721e-06, - "loss": 0.6636, - "step": 42001 - }, - { - "epoch": 1.08, - "learning_rate": 1.4844729198089483e-06, - "loss": 0.7354, - "step": 42002 - }, - { - "epoch": 1.08, - "learning_rate": 1.4844487133372368e-06, - "loss": 0.6479, - "step": 42003 - }, - { - "epoch": 1.08, - "learning_rate": 1.4844245064946055e-06, - "loss": 0.7495, - "step": 42004 - }, - { - "epoch": 1.08, - "learning_rate": 1.4844002992810725e-06, - "loss": 0.6724, - "step": 42005 - }, - { - "epoch": 1.08, - "learning_rate": 1.4843760916966561e-06, - "loss": 0.6689, - "step": 42006 - }, - { - "epoch": 1.08, - "learning_rate": 1.4843518837413757e-06, - "loss": 0.8955, - "step": 42007 - }, - { - "epoch": 1.08, - "learning_rate": 1.484327675415249e-06, - "loss": 0.7998, - "step": 42008 - }, - { - "epoch": 1.08, - "learning_rate": 1.4843034667182952e-06, - "loss": 0.6401, - "step": 42009 - }, - { - "epoch": 1.08, - "learning_rate": 1.4842792576505323e-06, - "loss": 0.7734, - "step": 42010 - }, - { - "epoch": 1.08, - "learning_rate": 1.484255048211979e-06, - "loss": 0.7725, - "step": 42011 - }, - { - "epoch": 1.08, - "learning_rate": 1.484230838402654e-06, - "loss": 0.5476, - "step": 42012 - }, - { - "epoch": 1.08, - "learning_rate": 1.4842066282225755e-06, - "loss": 0.751, - "step": 42013 - }, - { - "epoch": 1.08, - "learning_rate": 1.4841824176717625e-06, - "loss": 0.8242, - "step": 42014 - }, - { - "epoch": 1.08, - "learning_rate": 1.4841582067502333e-06, - "loss": 0.752, - "step": 42015 - }, - { - "epoch": 1.08, - "learning_rate": 1.4841339954580063e-06, - "loss": 0.6924, - "step": 42016 - }, - { - "epoch": 1.08, - "learning_rate": 1.4841097837951002e-06, - "loss": 0.6143, - "step": 42017 - }, - { - "epoch": 1.08, - "learning_rate": 1.4840855717615334e-06, - "loss": 0.7041, - "step": 42018 - }, - { - "epoch": 1.08, - "learning_rate": 1.4840613593573245e-06, - "loss": 0.6943, - "step": 42019 - }, - { - "epoch": 1.08, - "learning_rate": 1.4840371465824925e-06, - "loss": 0.5537, - "step": 42020 - }, - { - "epoch": 1.08, - "learning_rate": 1.484012933437055e-06, - "loss": 0.5405, - "step": 42021 - }, - { - "epoch": 1.08, - "learning_rate": 1.4839887199210312e-06, - "loss": 0.6116, - "step": 42022 - }, - { - "epoch": 1.08, - "learning_rate": 1.4839645060344396e-06, - "loss": 0.6309, - "step": 42023 - }, - { - "epoch": 1.08, - "learning_rate": 1.4839402917772985e-06, - "loss": 0.6709, - "step": 42024 - }, - { - "epoch": 1.08, - "learning_rate": 1.4839160771496268e-06, - "loss": 0.6973, - "step": 42025 - }, - { - "epoch": 1.08, - "learning_rate": 1.4838918621514427e-06, - "loss": 0.6455, - "step": 42026 - }, - { - "epoch": 1.08, - "learning_rate": 1.4838676467827648e-06, - "loss": 0.6475, - "step": 42027 - }, - { - "epoch": 1.08, - "learning_rate": 1.4838434310436116e-06, - "loss": 0.708, - "step": 42028 - }, - { - "epoch": 1.08, - "learning_rate": 1.483819214934002e-06, - "loss": 0.4229, - "step": 42029 - }, - { - "epoch": 1.08, - "learning_rate": 1.4837949984539541e-06, - "loss": 0.5586, - "step": 42030 - }, - { - "epoch": 1.08, - "learning_rate": 1.4837707816034865e-06, - "loss": 0.6401, - "step": 42031 - }, - { - "epoch": 1.08, - "learning_rate": 1.483746564382618e-06, - "loss": 0.5293, - "step": 42032 - }, - { - "epoch": 1.08, - "learning_rate": 1.4837223467913668e-06, - "loss": 0.7139, - "step": 42033 - }, - { - "epoch": 1.08, - "learning_rate": 1.4836981288297519e-06, - "loss": 0.6265, - "step": 42034 - }, - { - "epoch": 1.08, - "learning_rate": 1.4836739104977916e-06, - "loss": 0.6833, - "step": 42035 - }, - { - "epoch": 1.08, - "learning_rate": 1.4836496917955044e-06, - "loss": 0.6328, - "step": 42036 - }, - { - "epoch": 1.08, - "learning_rate": 1.4836254727229087e-06, - "loss": 0.6831, - "step": 42037 - }, - { - "epoch": 1.08, - "learning_rate": 1.4836012532800232e-06, - "loss": 0.5681, - "step": 42038 - }, - { - "epoch": 1.08, - "learning_rate": 1.4835770334668664e-06, - "loss": 0.5815, - "step": 42039 - }, - { - "epoch": 1.08, - "learning_rate": 1.4835528132834576e-06, - "loss": 0.6621, - "step": 42040 - }, - { - "epoch": 1.08, - "learning_rate": 1.4835285927298138e-06, - "loss": 0.5713, - "step": 42041 - }, - { - "epoch": 1.08, - "learning_rate": 1.4835043718059548e-06, - "loss": 0.5444, - "step": 42042 - }, - { - "epoch": 1.08, - "learning_rate": 1.4834801505118985e-06, - "loss": 0.6719, - "step": 42043 - }, - { - "epoch": 1.08, - "learning_rate": 1.483455928847664e-06, - "loss": 0.4604, - "step": 42044 - }, - { - "epoch": 1.08, - "learning_rate": 1.4834317068132692e-06, - "loss": 0.6011, - "step": 42045 - }, - { - "epoch": 1.08, - "learning_rate": 1.4834074844087335e-06, - "loss": 0.7402, - "step": 42046 - }, - { - "epoch": 1.08, - "learning_rate": 1.4833832616340743e-06, - "loss": 0.6909, - "step": 42047 - }, - { - "epoch": 1.08, - "learning_rate": 1.4833590384893112e-06, - "loss": 0.6289, - "step": 42048 - }, - { - "epoch": 1.08, - "learning_rate": 1.4833348149744618e-06, - "loss": 0.5894, - "step": 42049 - }, - { - "epoch": 1.08, - "learning_rate": 1.4833105910895456e-06, - "loss": 0.7314, - "step": 42050 - }, - { - "epoch": 1.08, - "learning_rate": 1.4832863668345804e-06, - "loss": 0.5645, - "step": 42051 - }, - { - "epoch": 1.08, - "learning_rate": 1.4832621422095853e-06, - "loss": 0.7578, - "step": 42052 - }, - { - "epoch": 1.08, - "learning_rate": 1.4832379172145785e-06, - "loss": 0.7197, - "step": 42053 - }, - { - "epoch": 1.08, - "learning_rate": 1.4832136918495785e-06, - "loss": 0.554, - "step": 42054 - }, - { - "epoch": 1.08, - "learning_rate": 1.4831894661146046e-06, - "loss": 0.4246, - "step": 42055 - }, - { - "epoch": 1.08, - "learning_rate": 1.483165240009674e-06, - "loss": 0.7476, - "step": 42056 - }, - { - "epoch": 1.08, - "learning_rate": 1.4831410135348063e-06, - "loss": 0.7568, - "step": 42057 - }, - { - "epoch": 1.08, - "learning_rate": 1.4831167866900197e-06, - "loss": 0.7168, - "step": 42058 - }, - { - "epoch": 1.08, - "learning_rate": 1.483092559475333e-06, - "loss": 0.7422, - "step": 42059 - }, - { - "epoch": 1.08, - "learning_rate": 1.4830683318907644e-06, - "loss": 0.7275, - "step": 42060 - }, - { - "epoch": 1.08, - "learning_rate": 1.4830441039363327e-06, - "loss": 0.7871, - "step": 42061 - }, - { - "epoch": 1.08, - "learning_rate": 1.4830198756120559e-06, - "loss": 0.6201, - "step": 42062 - }, - { - "epoch": 1.08, - "learning_rate": 1.4829956469179534e-06, - "loss": 0.5591, - "step": 42063 - }, - { - "epoch": 1.08, - "learning_rate": 1.4829714178540432e-06, - "loss": 0.5518, - "step": 42064 - }, - { - "epoch": 1.08, - "learning_rate": 1.4829471884203442e-06, - "loss": 0.5908, - "step": 42065 - }, - { - "epoch": 1.08, - "learning_rate": 1.4829229586168743e-06, - "loss": 0.7529, - "step": 42066 - }, - { - "epoch": 1.08, - "learning_rate": 1.4828987284436528e-06, - "loss": 0.6689, - "step": 42067 - }, - { - "epoch": 1.08, - "learning_rate": 1.4828744979006977e-06, - "loss": 0.7168, - "step": 42068 - }, - { - "epoch": 1.08, - "learning_rate": 1.4828502669880284e-06, - "loss": 0.7227, - "step": 42069 - }, - { - "epoch": 1.08, - "learning_rate": 1.4828260357056624e-06, - "loss": 0.707, - "step": 42070 - }, - { - "epoch": 1.08, - "learning_rate": 1.4828018040536185e-06, - "loss": 0.6108, - "step": 42071 - }, - { - "epoch": 1.08, - "learning_rate": 1.482777572031916e-06, - "loss": 0.479, - "step": 42072 - }, - { - "epoch": 1.08, - "learning_rate": 1.4827533396405727e-06, - "loss": 0.5481, - "step": 42073 - }, - { - "epoch": 1.08, - "learning_rate": 1.482729106879607e-06, - "loss": 0.6455, - "step": 42074 - }, - { - "epoch": 1.08, - "learning_rate": 1.4827048737490382e-06, - "loss": 0.6067, - "step": 42075 - }, - { - "epoch": 1.08, - "learning_rate": 1.4826806402488844e-06, - "loss": 0.668, - "step": 42076 - }, - { - "epoch": 1.08, - "learning_rate": 1.4826564063791642e-06, - "loss": 0.6167, - "step": 42077 - }, - { - "epoch": 1.08, - "learning_rate": 1.4826321721398962e-06, - "loss": 0.5781, - "step": 42078 - }, - { - "epoch": 1.08, - "learning_rate": 1.4826079375310989e-06, - "loss": 0.7344, - "step": 42079 - }, - { - "epoch": 1.08, - "learning_rate": 1.4825837025527912e-06, - "loss": 0.7158, - "step": 42080 - }, - { - "epoch": 1.08, - "learning_rate": 1.4825594672049911e-06, - "loss": 0.5781, - "step": 42081 - }, - { - "epoch": 1.08, - "learning_rate": 1.4825352314877173e-06, - "loss": 0.6982, - "step": 42082 - }, - { - "epoch": 1.08, - "learning_rate": 1.4825109954009885e-06, - "loss": 0.7451, - "step": 42083 - }, - { - "epoch": 1.08, - "learning_rate": 1.4824867589448234e-06, - "loss": 0.6123, - "step": 42084 - }, - { - "epoch": 1.08, - "learning_rate": 1.4824625221192402e-06, - "loss": 0.5974, - "step": 42085 - }, - { - "epoch": 1.08, - "learning_rate": 1.4824382849242575e-06, - "loss": 0.6653, - "step": 42086 - }, - { - "epoch": 1.08, - "learning_rate": 1.4824140473598944e-06, - "loss": 0.8574, - "step": 42087 - }, - { - "epoch": 1.08, - "learning_rate": 1.4823898094261687e-06, - "loss": 0.7417, - "step": 42088 - }, - { - "epoch": 1.08, - "learning_rate": 1.4823655711230994e-06, - "loss": 0.7031, - "step": 42089 - }, - { - "epoch": 1.08, - "learning_rate": 1.482341332450705e-06, - "loss": 0.603, - "step": 42090 - }, - { - "epoch": 1.08, - "learning_rate": 1.482317093409004e-06, - "loss": 0.6875, - "step": 42091 - }, - { - "epoch": 1.08, - "learning_rate": 1.482292853998015e-06, - "loss": 0.6572, - "step": 42092 - }, - { - "epoch": 1.08, - "learning_rate": 1.4822686142177566e-06, - "loss": 0.6924, - "step": 42093 - }, - { - "epoch": 1.08, - "learning_rate": 1.4822443740682471e-06, - "loss": 0.6221, - "step": 42094 - }, - { - "epoch": 1.08, - "learning_rate": 1.4822201335495055e-06, - "loss": 0.5801, - "step": 42095 - }, - { - "epoch": 1.08, - "learning_rate": 1.4821958926615498e-06, - "loss": 0.6938, - "step": 42096 - }, - { - "epoch": 1.08, - "learning_rate": 1.482171651404399e-06, - "loss": 0.6038, - "step": 42097 - }, - { - "epoch": 1.08, - "learning_rate": 1.4821474097780714e-06, - "loss": 0.5703, - "step": 42098 - }, - { - "epoch": 1.08, - "learning_rate": 1.4821231677825863e-06, - "loss": 0.6289, - "step": 42099 - }, - { - "epoch": 1.08, - "learning_rate": 1.4820989254179612e-06, - "loss": 0.6636, - "step": 42100 - }, - { - "epoch": 1.08, - "learning_rate": 1.4820746826842152e-06, - "loss": 0.6084, - "step": 42101 - }, - { - "epoch": 1.08, - "learning_rate": 1.4820504395813666e-06, - "loss": 0.5149, - "step": 42102 - }, - { - "epoch": 1.08, - "learning_rate": 1.4820261961094342e-06, - "loss": 0.5894, - "step": 42103 - }, - { - "epoch": 1.08, - "learning_rate": 1.4820019522684369e-06, - "loss": 0.7715, - "step": 42104 - }, - { - "epoch": 1.08, - "learning_rate": 1.4819777080583925e-06, - "loss": 0.792, - "step": 42105 - }, - { - "epoch": 1.08, - "learning_rate": 1.48195346347932e-06, - "loss": 0.709, - "step": 42106 - }, - { - "epoch": 1.08, - "learning_rate": 1.481929218531238e-06, - "loss": 0.6616, - "step": 42107 - }, - { - "epoch": 1.08, - "learning_rate": 1.4819049732141645e-06, - "loss": 0.6865, - "step": 42108 - }, - { - "epoch": 1.08, - "learning_rate": 1.4818807275281193e-06, - "loss": 0.7334, - "step": 42109 - }, - { - "epoch": 1.08, - "learning_rate": 1.4818564814731195e-06, - "loss": 0.6108, - "step": 42110 - }, - { - "epoch": 1.08, - "learning_rate": 1.4818322350491848e-06, - "loss": 0.6292, - "step": 42111 - }, - { - "epoch": 1.08, - "learning_rate": 1.481807988256333e-06, - "loss": 0.7207, - "step": 42112 - }, - { - "epoch": 1.08, - "learning_rate": 1.481783741094583e-06, - "loss": 0.6963, - "step": 42113 - }, - { - "epoch": 1.08, - "learning_rate": 1.4817594935639538e-06, - "loss": 0.5156, - "step": 42114 - }, - { - "epoch": 1.08, - "learning_rate": 1.481735245664463e-06, - "loss": 0.7393, - "step": 42115 - }, - { - "epoch": 1.08, - "learning_rate": 1.4817109973961297e-06, - "loss": 0.6328, - "step": 42116 - }, - { - "epoch": 1.08, - "learning_rate": 1.4816867487589728e-06, - "loss": 0.5444, - "step": 42117 - }, - { - "epoch": 1.08, - "learning_rate": 1.4816624997530101e-06, - "loss": 0.791, - "step": 42118 - }, - { - "epoch": 1.08, - "learning_rate": 1.4816382503782607e-06, - "loss": 0.75, - "step": 42119 - }, - { - "epoch": 1.08, - "learning_rate": 1.4816140006347433e-06, - "loss": 0.6306, - "step": 42120 - }, - { - "epoch": 1.08, - "learning_rate": 1.4815897505224758e-06, - "loss": 0.5361, - "step": 42121 - }, - { - "epoch": 1.08, - "learning_rate": 1.4815655000414772e-06, - "loss": 0.8086, - "step": 42122 - }, - { - "epoch": 1.08, - "learning_rate": 1.4815412491917663e-06, - "loss": 0.5166, - "step": 42123 - }, - { - "epoch": 1.08, - "learning_rate": 1.4815169979733614e-06, - "loss": 0.6865, - "step": 42124 - }, - { - "epoch": 1.08, - "learning_rate": 1.481492746386281e-06, - "loss": 0.7354, - "step": 42125 - }, - { - "epoch": 1.08, - "learning_rate": 1.4814684944305437e-06, - "loss": 0.5967, - "step": 42126 - }, - { - "epoch": 1.08, - "learning_rate": 1.4814442421061678e-06, - "loss": 0.6152, - "step": 42127 - }, - { - "epoch": 1.08, - "learning_rate": 1.4814199894131726e-06, - "loss": 0.6069, - "step": 42128 - }, - { - "epoch": 1.08, - "learning_rate": 1.4813957363515764e-06, - "loss": 0.4907, - "step": 42129 - }, - { - "epoch": 1.08, - "learning_rate": 1.4813714829213974e-06, - "loss": 0.5889, - "step": 42130 - }, - { - "epoch": 1.08, - "learning_rate": 1.4813472291226542e-06, - "loss": 0.7461, - "step": 42131 - }, - { - "epoch": 1.08, - "learning_rate": 1.481322974955366e-06, - "loss": 0.6357, - "step": 42132 - }, - { - "epoch": 1.08, - "learning_rate": 1.4812987204195504e-06, - "loss": 0.4663, - "step": 42133 - }, - { - "epoch": 1.08, - "learning_rate": 1.4812744655152268e-06, - "loss": 0.5537, - "step": 42134 - }, - { - "epoch": 1.08, - "learning_rate": 1.4812502102424136e-06, - "loss": 0.5271, - "step": 42135 - }, - { - "epoch": 1.08, - "learning_rate": 1.481225954601129e-06, - "loss": 0.6387, - "step": 42136 - }, - { - "epoch": 1.08, - "learning_rate": 1.4812016985913918e-06, - "loss": 0.6602, - "step": 42137 - }, - { - "epoch": 1.08, - "learning_rate": 1.4811774422132209e-06, - "loss": 0.6885, - "step": 42138 - }, - { - "epoch": 1.08, - "learning_rate": 1.4811531854666343e-06, - "loss": 0.6309, - "step": 42139 - }, - { - "epoch": 1.08, - "learning_rate": 1.4811289283516506e-06, - "loss": 0.605, - "step": 42140 - }, - { - "epoch": 1.08, - "learning_rate": 1.4811046708682891e-06, - "loss": 0.7559, - "step": 42141 - }, - { - "epoch": 1.08, - "learning_rate": 1.4810804130165674e-06, - "loss": 0.7227, - "step": 42142 - }, - { - "epoch": 1.08, - "learning_rate": 1.481056154796505e-06, - "loss": 0.9766, - "step": 42143 - }, - { - "epoch": 1.08, - "learning_rate": 1.4810318962081198e-06, - "loss": 0.9121, - "step": 42144 - }, - { - "epoch": 1.08, - "learning_rate": 1.4810076372514307e-06, - "loss": 0.6533, - "step": 42145 - }, - { - "epoch": 1.08, - "learning_rate": 1.480983377926456e-06, - "loss": 0.6104, - "step": 42146 - }, - { - "epoch": 1.08, - "learning_rate": 1.4809591182332147e-06, - "loss": 0.4158, - "step": 42147 - }, - { - "epoch": 1.08, - "learning_rate": 1.4809348581717246e-06, - "loss": 0.6418, - "step": 42148 - }, - { - "epoch": 1.08, - "learning_rate": 1.4809105977420054e-06, - "loss": 0.489, - "step": 42149 - }, - { - "epoch": 1.08, - "learning_rate": 1.4808863369440746e-06, - "loss": 0.4556, - "step": 42150 - }, - { - "epoch": 1.08, - "learning_rate": 1.4808620757779515e-06, - "loss": 0.7446, - "step": 42151 - }, - { - "epoch": 1.08, - "learning_rate": 1.4808378142436543e-06, - "loss": 0.7021, - "step": 42152 - }, - { - "epoch": 1.08, - "learning_rate": 1.4808135523412017e-06, - "loss": 0.5723, - "step": 42153 - }, - { - "epoch": 1.08, - "learning_rate": 1.4807892900706125e-06, - "loss": 0.6263, - "step": 42154 - }, - { - "epoch": 1.08, - "learning_rate": 1.480765027431905e-06, - "loss": 0.7573, - "step": 42155 - }, - { - "epoch": 1.08, - "learning_rate": 1.4807407644250976e-06, - "loss": 0.8369, - "step": 42156 - }, - { - "epoch": 1.08, - "learning_rate": 1.4807165010502093e-06, - "loss": 0.7119, - "step": 42157 - }, - { - "epoch": 1.08, - "learning_rate": 1.4806922373072582e-06, - "loss": 0.6121, - "step": 42158 - }, - { - "epoch": 1.08, - "learning_rate": 1.4806679731962635e-06, - "loss": 0.6416, - "step": 42159 - }, - { - "epoch": 1.08, - "learning_rate": 1.4806437087172432e-06, - "loss": 0.5149, - "step": 42160 - }, - { - "epoch": 1.08, - "learning_rate": 1.480619443870216e-06, - "loss": 0.6069, - "step": 42161 - }, - { - "epoch": 1.08, - "learning_rate": 1.4805951786552009e-06, - "loss": 0.7236, - "step": 42162 - }, - { - "epoch": 1.08, - "learning_rate": 1.4805709130722162e-06, - "loss": 0.5801, - "step": 42163 - }, - { - "epoch": 1.08, - "learning_rate": 1.4805466471212803e-06, - "loss": 0.4141, - "step": 42164 - }, - { - "epoch": 1.08, - "learning_rate": 1.4805223808024118e-06, - "loss": 0.7627, - "step": 42165 - }, - { - "epoch": 1.08, - "learning_rate": 1.4804981141156297e-06, - "loss": 0.6885, - "step": 42166 - }, - { - "epoch": 1.08, - "learning_rate": 1.4804738470609518e-06, - "loss": 0.7578, - "step": 42167 - }, - { - "epoch": 1.08, - "learning_rate": 1.4804495796383975e-06, - "loss": 0.6084, - "step": 42168 - }, - { - "epoch": 1.08, - "learning_rate": 1.4804253118479853e-06, - "loss": 0.6445, - "step": 42169 - }, - { - "epoch": 1.08, - "learning_rate": 1.4804010436897331e-06, - "loss": 0.6973, - "step": 42170 - }, - { - "epoch": 1.08, - "learning_rate": 1.48037677516366e-06, - "loss": 0.7373, - "step": 42171 - }, - { - "epoch": 1.08, - "learning_rate": 1.4803525062697846e-06, - "loss": 0.7144, - "step": 42172 - }, - { - "epoch": 1.08, - "learning_rate": 1.4803282370081255e-06, - "loss": 0.6367, - "step": 42173 - }, - { - "epoch": 1.08, - "learning_rate": 1.480303967378701e-06, - "loss": 0.6143, - "step": 42174 - }, - { - "epoch": 1.08, - "learning_rate": 1.4802796973815297e-06, - "loss": 0.5984, - "step": 42175 - }, - { - "epoch": 1.08, - "learning_rate": 1.4802554270166305e-06, - "loss": 0.8105, - "step": 42176 - }, - { - "epoch": 1.08, - "learning_rate": 1.4802311562840218e-06, - "loss": 0.7783, - "step": 42177 - }, - { - "epoch": 1.08, - "learning_rate": 1.4802068851837222e-06, - "loss": 0.436, - "step": 42178 - }, - { - "epoch": 1.08, - "learning_rate": 1.4801826137157502e-06, - "loss": 0.5981, - "step": 42179 - }, - { - "epoch": 1.08, - "learning_rate": 1.4801583418801244e-06, - "loss": 0.6348, - "step": 42180 - }, - { - "epoch": 1.08, - "learning_rate": 1.4801340696768634e-06, - "loss": 0.6411, - "step": 42181 - }, - { - "epoch": 1.08, - "learning_rate": 1.4801097971059862e-06, - "loss": 0.6855, - "step": 42182 - }, - { - "epoch": 1.08, - "learning_rate": 1.4800855241675105e-06, - "loss": 0.7129, - "step": 42183 - }, - { - "epoch": 1.08, - "learning_rate": 1.4800612508614557e-06, - "loss": 0.6025, - "step": 42184 - }, - { - "epoch": 1.08, - "learning_rate": 1.4800369771878401e-06, - "loss": 0.5432, - "step": 42185 - }, - { - "epoch": 1.08, - "learning_rate": 1.480012703146682e-06, - "loss": 0.501, - "step": 42186 - }, - { - "epoch": 1.08, - "learning_rate": 1.4799884287380005e-06, - "loss": 0.6289, - "step": 42187 - }, - { - "epoch": 1.08, - "learning_rate": 1.4799641539618134e-06, - "loss": 0.708, - "step": 42188 - }, - { - "epoch": 1.08, - "learning_rate": 1.4799398788181407e-06, - "loss": 0.7578, - "step": 42189 - }, - { - "epoch": 1.08, - "learning_rate": 1.4799156033069994e-06, - "loss": 0.7422, - "step": 42190 - }, - { - "epoch": 1.08, - "learning_rate": 1.4798913274284091e-06, - "loss": 0.6006, - "step": 42191 - }, - { - "epoch": 1.08, - "learning_rate": 1.4798670511823878e-06, - "loss": 0.7617, - "step": 42192 - }, - { - "epoch": 1.08, - "learning_rate": 1.4798427745689547e-06, - "loss": 0.6133, - "step": 42193 - }, - { - "epoch": 1.08, - "learning_rate": 1.479818497588128e-06, - "loss": 0.8047, - "step": 42194 - }, - { - "epoch": 1.08, - "learning_rate": 1.4797942202399263e-06, - "loss": 0.6924, - "step": 42195 - }, - { - "epoch": 1.08, - "learning_rate": 1.479769942524368e-06, - "loss": 0.6318, - "step": 42196 - }, - { - "epoch": 1.08, - "learning_rate": 1.4797456644414723e-06, - "loss": 0.7358, - "step": 42197 - }, - { - "epoch": 1.08, - "learning_rate": 1.4797213859912572e-06, - "loss": 0.5391, - "step": 42198 - }, - { - "epoch": 1.08, - "learning_rate": 1.4796971071737417e-06, - "loss": 0.8091, - "step": 42199 - }, - { - "epoch": 1.08, - "learning_rate": 1.4796728279889438e-06, - "loss": 0.5557, - "step": 42200 - }, - { - "epoch": 1.08, - "learning_rate": 1.4796485484368826e-06, - "loss": 0.6768, - "step": 42201 - }, - { - "epoch": 1.08, - "learning_rate": 1.4796242685175767e-06, - "loss": 0.6514, - "step": 42202 - }, - { - "epoch": 1.08, - "learning_rate": 1.4795999882310443e-06, - "loss": 0.5515, - "step": 42203 - }, - { - "epoch": 1.08, - "learning_rate": 1.4795757075773045e-06, - "loss": 0.6561, - "step": 42204 - }, - { - "epoch": 1.08, - "learning_rate": 1.4795514265563755e-06, - "loss": 0.6416, - "step": 42205 - }, - { - "epoch": 1.08, - "learning_rate": 1.479527145168276e-06, - "loss": 0.7686, - "step": 42206 - }, - { - "epoch": 1.08, - "learning_rate": 1.4795028634130246e-06, - "loss": 0.6458, - "step": 42207 - }, - { - "epoch": 1.08, - "learning_rate": 1.47947858129064e-06, - "loss": 0.6138, - "step": 42208 - }, - { - "epoch": 1.08, - "learning_rate": 1.479454298801141e-06, - "loss": 0.7588, - "step": 42209 - }, - { - "epoch": 1.08, - "learning_rate": 1.4794300159445454e-06, - "loss": 0.6748, - "step": 42210 - }, - { - "epoch": 1.08, - "learning_rate": 1.4794057327208725e-06, - "loss": 0.8027, - "step": 42211 - }, - { - "epoch": 1.08, - "learning_rate": 1.4793814491301406e-06, - "loss": 0.509, - "step": 42212 - }, - { - "epoch": 1.08, - "learning_rate": 1.4793571651723682e-06, - "loss": 0.7773, - "step": 42213 - }, - { - "epoch": 1.08, - "learning_rate": 1.4793328808475746e-06, - "loss": 0.6958, - "step": 42214 - }, - { - "epoch": 1.08, - "learning_rate": 1.4793085961557774e-06, - "loss": 0.6196, - "step": 42215 - }, - { - "epoch": 1.08, - "learning_rate": 1.4792843110969958e-06, - "loss": 0.5088, - "step": 42216 - }, - { - "epoch": 1.08, - "learning_rate": 1.4792600256712479e-06, - "loss": 0.5864, - "step": 42217 - }, - { - "epoch": 1.08, - "learning_rate": 1.479235739878553e-06, - "loss": 0.645, - "step": 42218 - }, - { - "epoch": 1.08, - "learning_rate": 1.4792114537189293e-06, - "loss": 0.6924, - "step": 42219 - }, - { - "epoch": 1.08, - "learning_rate": 1.4791871671923956e-06, - "loss": 0.7002, - "step": 42220 - }, - { - "epoch": 1.08, - "learning_rate": 1.47916288029897e-06, - "loss": 0.6084, - "step": 42221 - }, - { - "epoch": 1.08, - "learning_rate": 1.4791385930386716e-06, - "loss": 0.6772, - "step": 42222 - }, - { - "epoch": 1.08, - "learning_rate": 1.4791143054115185e-06, - "loss": 0.5947, - "step": 42223 - }, - { - "epoch": 1.08, - "learning_rate": 1.47909001741753e-06, - "loss": 0.7065, - "step": 42224 - }, - { - "epoch": 1.08, - "learning_rate": 1.4790657290567241e-06, - "loss": 0.6245, - "step": 42225 - }, - { - "epoch": 1.08, - "learning_rate": 1.4790414403291199e-06, - "loss": 0.5791, - "step": 42226 - }, - { - "epoch": 1.08, - "learning_rate": 1.479017151234735e-06, - "loss": 0.5742, - "step": 42227 - }, - { - "epoch": 1.08, - "learning_rate": 1.4789928617735895e-06, - "loss": 0.6465, - "step": 42228 - }, - { - "epoch": 1.08, - "learning_rate": 1.4789685719457008e-06, - "loss": 0.6157, - "step": 42229 - }, - { - "epoch": 1.08, - "learning_rate": 1.4789442817510878e-06, - "loss": 0.3962, - "step": 42230 - }, - { - "epoch": 1.08, - "learning_rate": 1.4789199911897692e-06, - "loss": 0.5757, - "step": 42231 - }, - { - "epoch": 1.08, - "learning_rate": 1.4788957002617637e-06, - "loss": 0.7656, - "step": 42232 - }, - { - "epoch": 1.08, - "learning_rate": 1.4788714089670897e-06, - "loss": 0.7231, - "step": 42233 - }, - { - "epoch": 1.08, - "learning_rate": 1.478847117305766e-06, - "loss": 0.7266, - "step": 42234 - }, - { - "epoch": 1.08, - "learning_rate": 1.478822825277811e-06, - "loss": 0.707, - "step": 42235 - }, - { - "epoch": 1.08, - "learning_rate": 1.4787985328832433e-06, - "loss": 0.6895, - "step": 42236 - }, - { - "epoch": 1.08, - "learning_rate": 1.4787742401220817e-06, - "loss": 0.5552, - "step": 42237 - }, - { - "epoch": 1.08, - "learning_rate": 1.4787499469943447e-06, - "loss": 0.5625, - "step": 42238 - }, - { - "epoch": 1.08, - "learning_rate": 1.4787256535000509e-06, - "loss": 0.7339, - "step": 42239 - }, - { - "epoch": 1.08, - "learning_rate": 1.4787013596392188e-06, - "loss": 0.6396, - "step": 42240 - }, - { - "epoch": 1.08, - "learning_rate": 1.4786770654118673e-06, - "loss": 0.6509, - "step": 42241 - }, - { - "epoch": 1.08, - "learning_rate": 1.4786527708180144e-06, - "loss": 0.6045, - "step": 42242 - }, - { - "epoch": 1.08, - "learning_rate": 1.4786284758576793e-06, - "loss": 0.6523, - "step": 42243 - }, - { - "epoch": 1.08, - "learning_rate": 1.4786041805308803e-06, - "loss": 0.6611, - "step": 42244 - }, - { - "epoch": 1.08, - "learning_rate": 1.4785798848376364e-06, - "loss": 0.9355, - "step": 42245 - }, - { - "epoch": 1.08, - "learning_rate": 1.4785555887779652e-06, - "loss": 0.486, - "step": 42246 - }, - { - "epoch": 1.08, - "learning_rate": 1.4785312923518866e-06, - "loss": 0.5337, - "step": 42247 - }, - { - "epoch": 1.08, - "learning_rate": 1.4785069955594182e-06, - "loss": 0.6396, - "step": 42248 - }, - { - "epoch": 1.08, - "learning_rate": 1.4784826984005793e-06, - "loss": 0.6846, - "step": 42249 - }, - { - "epoch": 1.08, - "learning_rate": 1.4784584008753882e-06, - "loss": 0.6602, - "step": 42250 - }, - { - "epoch": 1.08, - "learning_rate": 1.4784341029838632e-06, - "loss": 0.625, - "step": 42251 - }, - { - "epoch": 1.08, - "learning_rate": 1.4784098047260236e-06, - "loss": 0.6836, - "step": 42252 - }, - { - "epoch": 1.08, - "learning_rate": 1.4783855061018873e-06, - "loss": 0.5625, - "step": 42253 - }, - { - "epoch": 1.08, - "learning_rate": 1.4783612071114734e-06, - "loss": 0.5382, - "step": 42254 - }, - { - "epoch": 1.08, - "learning_rate": 1.4783369077548002e-06, - "loss": 0.6465, - "step": 42255 - }, - { - "epoch": 1.08, - "learning_rate": 1.4783126080318864e-06, - "loss": 0.792, - "step": 42256 - }, - { - "epoch": 1.08, - "learning_rate": 1.4782883079427508e-06, - "loss": 0.7354, - "step": 42257 - }, - { - "epoch": 1.08, - "learning_rate": 1.4782640074874119e-06, - "loss": 0.6758, - "step": 42258 - }, - { - "epoch": 1.08, - "learning_rate": 1.4782397066658879e-06, - "loss": 0.7383, - "step": 42259 - }, - { - "epoch": 1.08, - "learning_rate": 1.4782154054781981e-06, - "loss": 0.7515, - "step": 42260 - }, - { - "epoch": 1.08, - "learning_rate": 1.4781911039243604e-06, - "loss": 0.6494, - "step": 42261 - }, - { - "epoch": 1.08, - "learning_rate": 1.478166802004394e-06, - "loss": 0.5547, - "step": 42262 - }, - { - "epoch": 1.08, - "learning_rate": 1.478142499718317e-06, - "loss": 0.526, - "step": 42263 - }, - { - "epoch": 1.08, - "learning_rate": 1.4781181970661487e-06, - "loss": 0.6289, - "step": 42264 - }, - { - "epoch": 1.08, - "learning_rate": 1.478093894047907e-06, - "loss": 0.5952, - "step": 42265 - }, - { - "epoch": 1.08, - "learning_rate": 1.4780695906636108e-06, - "loss": 0.7935, - "step": 42266 - }, - { - "epoch": 1.08, - "learning_rate": 1.4780452869132786e-06, - "loss": 0.5791, - "step": 42267 - }, - { - "epoch": 1.08, - "learning_rate": 1.4780209827969294e-06, - "loss": 0.8789, - "step": 42268 - }, - { - "epoch": 1.08, - "learning_rate": 1.4779966783145814e-06, - "loss": 0.6328, - "step": 42269 - }, - { - "epoch": 1.08, - "learning_rate": 1.4779723734662534e-06, - "loss": 0.4565, - "step": 42270 - }, - { - "epoch": 1.08, - "learning_rate": 1.4779480682519637e-06, - "loss": 0.5232, - "step": 42271 - }, - { - "epoch": 1.08, - "learning_rate": 1.4779237626717313e-06, - "loss": 0.6069, - "step": 42272 - }, - { - "epoch": 1.08, - "learning_rate": 1.4778994567255746e-06, - "loss": 0.6611, - "step": 42273 - }, - { - "epoch": 1.08, - "learning_rate": 1.4778751504135123e-06, - "loss": 0.6162, - "step": 42274 - }, - { - "epoch": 1.08, - "learning_rate": 1.4778508437355627e-06, - "loss": 0.7686, - "step": 42275 - }, - { - "epoch": 1.08, - "learning_rate": 1.477826536691745e-06, - "loss": 0.5908, - "step": 42276 - }, - { - "epoch": 1.08, - "learning_rate": 1.4778022292820776e-06, - "loss": 0.6821, - "step": 42277 - }, - { - "epoch": 1.08, - "learning_rate": 1.4777779215065786e-06, - "loss": 0.6011, - "step": 42278 - }, - { - "epoch": 1.08, - "learning_rate": 1.4777536133652675e-06, - "loss": 0.6509, - "step": 42279 - }, - { - "epoch": 1.08, - "learning_rate": 1.477729304858162e-06, - "loss": 0.627, - "step": 42280 - }, - { - "epoch": 1.08, - "learning_rate": 1.4777049959852815e-06, - "loss": 0.3833, - "step": 42281 - }, - { - "epoch": 1.08, - "learning_rate": 1.4776806867466437e-06, - "loss": 0.748, - "step": 42282 - }, - { - "epoch": 1.08, - "learning_rate": 1.4776563771422682e-06, - "loss": 0.4172, - "step": 42283 - }, - { - "epoch": 1.08, - "learning_rate": 1.4776320671721732e-06, - "loss": 0.6353, - "step": 42284 - }, - { - "epoch": 1.08, - "learning_rate": 1.477607756836377e-06, - "loss": 0.665, - "step": 42285 - }, - { - "epoch": 1.08, - "learning_rate": 1.4775834461348988e-06, - "loss": 0.6631, - "step": 42286 - }, - { - "epoch": 1.08, - "learning_rate": 1.4775591350677569e-06, - "loss": 0.7471, - "step": 42287 - }, - { - "epoch": 1.08, - "learning_rate": 1.4775348236349696e-06, - "loss": 0.7344, - "step": 42288 - }, - { - "epoch": 1.08, - "learning_rate": 1.4775105118365564e-06, - "loss": 0.564, - "step": 42289 - }, - { - "epoch": 1.08, - "learning_rate": 1.4774861996725347e-06, - "loss": 0.7979, - "step": 42290 - }, - { - "epoch": 1.08, - "learning_rate": 1.4774618871429243e-06, - "loss": 0.4644, - "step": 42291 - }, - { - "epoch": 1.08, - "learning_rate": 1.4774375742477427e-06, - "loss": 0.5474, - "step": 42292 - }, - { - "epoch": 1.08, - "learning_rate": 1.4774132609870097e-06, - "loss": 0.7402, - "step": 42293 - }, - { - "epoch": 1.08, - "learning_rate": 1.4773889473607431e-06, - "loss": 0.6724, - "step": 42294 - }, - { - "epoch": 1.08, - "learning_rate": 1.4773646333689616e-06, - "loss": 0.5525, - "step": 42295 - }, - { - "epoch": 1.08, - "learning_rate": 1.4773403190116842e-06, - "loss": 0.4722, - "step": 42296 - }, - { - "epoch": 1.08, - "learning_rate": 1.477316004288929e-06, - "loss": 0.6006, - "step": 42297 - }, - { - "epoch": 1.08, - "learning_rate": 1.477291689200715e-06, - "loss": 0.6958, - "step": 42298 - }, - { - "epoch": 1.08, - "learning_rate": 1.477267373747061e-06, - "loss": 0.6489, - "step": 42299 - }, - { - "epoch": 1.08, - "learning_rate": 1.4772430579279852e-06, - "loss": 0.6504, - "step": 42300 - }, - { - "epoch": 1.08, - "learning_rate": 1.4772187417435057e-06, - "loss": 0.5977, - "step": 42301 - }, - { - "epoch": 1.08, - "learning_rate": 1.4771944251936423e-06, - "loss": 0.6855, - "step": 42302 - }, - { - "epoch": 1.08, - "learning_rate": 1.477170108278413e-06, - "loss": 0.5869, - "step": 42303 - }, - { - "epoch": 1.08, - "learning_rate": 1.4771457909978367e-06, - "loss": 0.7305, - "step": 42304 - }, - { - "epoch": 1.08, - "learning_rate": 1.4771214733519315e-06, - "loss": 0.5654, - "step": 42305 - }, - { - "epoch": 1.08, - "learning_rate": 1.4770971553407166e-06, - "loss": 0.709, - "step": 42306 - }, - { - "epoch": 1.08, - "learning_rate": 1.47707283696421e-06, - "loss": 0.7949, - "step": 42307 - }, - { - "epoch": 1.08, - "learning_rate": 1.4770485182224309e-06, - "loss": 0.6401, - "step": 42308 - }, - { - "epoch": 1.08, - "learning_rate": 1.4770241991153975e-06, - "loss": 0.6533, - "step": 42309 - }, - { - "epoch": 1.08, - "learning_rate": 1.476999879643129e-06, - "loss": 0.48, - "step": 42310 - }, - { - "epoch": 1.08, - "learning_rate": 1.476975559805643e-06, - "loss": 0.3845, - "step": 42311 - }, - { - "epoch": 1.08, - "learning_rate": 1.4769512396029594e-06, - "loss": 0.5918, - "step": 42312 - }, - { - "epoch": 1.08, - "learning_rate": 1.4769269190350957e-06, - "loss": 0.6382, - "step": 42313 - }, - { - "epoch": 1.08, - "learning_rate": 1.4769025981020712e-06, - "loss": 0.5212, - "step": 42314 - }, - { - "epoch": 1.08, - "learning_rate": 1.4768782768039043e-06, - "loss": 0.6714, - "step": 42315 - }, - { - "epoch": 1.08, - "learning_rate": 1.4768539551406136e-06, - "loss": 0.542, - "step": 42316 - }, - { - "epoch": 1.08, - "learning_rate": 1.4768296331122177e-06, - "loss": 0.6621, - "step": 42317 - }, - { - "epoch": 1.08, - "learning_rate": 1.4768053107187352e-06, - "loss": 0.7266, - "step": 42318 - }, - { - "epoch": 1.08, - "learning_rate": 1.476780987960185e-06, - "loss": 0.5415, - "step": 42319 - }, - { - "epoch": 1.08, - "learning_rate": 1.4767566648365856e-06, - "loss": 0.6289, - "step": 42320 - }, - { - "epoch": 1.08, - "learning_rate": 1.4767323413479553e-06, - "loss": 0.7852, - "step": 42321 - }, - { - "epoch": 1.08, - "learning_rate": 1.476708017494313e-06, - "loss": 0.5659, - "step": 42322 - }, - { - "epoch": 1.08, - "learning_rate": 1.4766836932756773e-06, - "loss": 0.4863, - "step": 42323 - }, - { - "epoch": 1.08, - "learning_rate": 1.4766593686920668e-06, - "loss": 0.6152, - "step": 42324 - }, - { - "epoch": 1.08, - "learning_rate": 1.4766350437435003e-06, - "loss": 0.5269, - "step": 42325 - }, - { - "epoch": 1.08, - "learning_rate": 1.4766107184299962e-06, - "loss": 0.6895, - "step": 42326 - }, - { - "epoch": 1.08, - "learning_rate": 1.4765863927515731e-06, - "loss": 0.6621, - "step": 42327 - }, - { - "epoch": 1.08, - "learning_rate": 1.4765620667082494e-06, - "loss": 0.7109, - "step": 42328 - }, - { - "epoch": 1.08, - "learning_rate": 1.4765377403000448e-06, - "loss": 0.667, - "step": 42329 - }, - { - "epoch": 1.08, - "learning_rate": 1.4765134135269767e-06, - "loss": 0.7686, - "step": 42330 - }, - { - "epoch": 1.08, - "learning_rate": 1.4764890863890642e-06, - "loss": 0.5378, - "step": 42331 - }, - { - "epoch": 1.08, - "learning_rate": 1.476464758886326e-06, - "loss": 0.5464, - "step": 42332 - }, - { - "epoch": 1.09, - "learning_rate": 1.4764404310187806e-06, - "loss": 0.5884, - "step": 42333 - }, - { - "epoch": 1.09, - "learning_rate": 1.4764161027864467e-06, - "loss": 0.6719, - "step": 42334 - }, - { - "epoch": 1.09, - "learning_rate": 1.476391774189343e-06, - "loss": 0.7222, - "step": 42335 - }, - { - "epoch": 1.09, - "learning_rate": 1.4763674452274878e-06, - "loss": 0.5112, - "step": 42336 - }, - { - "epoch": 1.09, - "learning_rate": 1.4763431159009002e-06, - "loss": 0.6421, - "step": 42337 - }, - { - "epoch": 1.09, - "learning_rate": 1.476318786209598e-06, - "loss": 0.7637, - "step": 42338 - }, - { - "epoch": 1.09, - "learning_rate": 1.4762944561536011e-06, - "loss": 0.6309, - "step": 42339 - }, - { - "epoch": 1.09, - "learning_rate": 1.4762701257329271e-06, - "loss": 0.6816, - "step": 42340 - }, - { - "epoch": 1.09, - "learning_rate": 1.4762457949475949e-06, - "loss": 0.5789, - "step": 42341 - }, - { - "epoch": 1.09, - "learning_rate": 1.4762214637976236e-06, - "loss": 0.5991, - "step": 42342 - }, - { - "epoch": 1.09, - "learning_rate": 1.476197132283031e-06, - "loss": 0.7051, - "step": 42343 - }, - { - "epoch": 1.09, - "learning_rate": 1.4761728004038365e-06, - "loss": 0.4785, - "step": 42344 - }, - { - "epoch": 1.09, - "learning_rate": 1.476148468160058e-06, - "loss": 0.7314, - "step": 42345 - }, - { - "epoch": 1.09, - "learning_rate": 1.4761241355517146e-06, - "loss": 0.7969, - "step": 42346 - }, - { - "epoch": 1.09, - "learning_rate": 1.476099802578825e-06, - "loss": 0.4631, - "step": 42347 - }, - { - "epoch": 1.09, - "learning_rate": 1.4760754692414078e-06, - "loss": 0.5002, - "step": 42348 - }, - { - "epoch": 1.09, - "learning_rate": 1.476051135539481e-06, - "loss": 0.6191, - "step": 42349 - }, - { - "epoch": 1.09, - "learning_rate": 1.4760268014730644e-06, - "loss": 0.5791, - "step": 42350 - }, - { - "epoch": 1.09, - "learning_rate": 1.4760024670421753e-06, - "loss": 0.7725, - "step": 42351 - }, - { - "epoch": 1.09, - "learning_rate": 1.4759781322468335e-06, - "loss": 0.7402, - "step": 42352 - }, - { - "epoch": 1.09, - "learning_rate": 1.4759537970870567e-06, - "loss": 0.6763, - "step": 42353 - }, - { - "epoch": 1.09, - "learning_rate": 1.4759294615628646e-06, - "loss": 0.7036, - "step": 42354 - }, - { - "epoch": 1.09, - "learning_rate": 1.4759051256742744e-06, - "loss": 0.6787, - "step": 42355 - }, - { - "epoch": 1.09, - "learning_rate": 1.4758807894213061e-06, - "loss": 0.7197, - "step": 42356 - }, - { - "epoch": 1.09, - "learning_rate": 1.4758564528039776e-06, - "loss": 0.5933, - "step": 42357 - }, - { - "epoch": 1.09, - "learning_rate": 1.4758321158223077e-06, - "loss": 0.5381, - "step": 42358 - }, - { - "epoch": 1.09, - "learning_rate": 1.475807778476315e-06, - "loss": 0.5295, - "step": 42359 - }, - { - "epoch": 1.09, - "learning_rate": 1.4757834407660183e-06, - "loss": 0.4236, - "step": 42360 - }, - { - "epoch": 1.09, - "learning_rate": 1.4757591026914357e-06, - "loss": 0.8574, - "step": 42361 - }, - { - "epoch": 1.09, - "learning_rate": 1.4757347642525867e-06, - "loss": 0.708, - "step": 42362 - }, - { - "epoch": 1.09, - "learning_rate": 1.4757104254494892e-06, - "loss": 0.5554, - "step": 42363 - }, - { - "epoch": 1.09, - "learning_rate": 1.4756860862821624e-06, - "loss": 0.6968, - "step": 42364 - }, - { - "epoch": 1.09, - "learning_rate": 1.4756617467506243e-06, - "loss": 0.7163, - "step": 42365 - }, - { - "epoch": 1.09, - "learning_rate": 1.475637406854894e-06, - "loss": 0.5918, - "step": 42366 - }, - { - "epoch": 1.09, - "learning_rate": 1.47561306659499e-06, - "loss": 0.6621, - "step": 42367 - }, - { - "epoch": 1.09, - "learning_rate": 1.4755887259709305e-06, - "loss": 0.5522, - "step": 42368 - }, - { - "epoch": 1.09, - "learning_rate": 1.4755643849827355e-06, - "loss": 0.6299, - "step": 42369 - }, - { - "epoch": 1.09, - "learning_rate": 1.475540043630422e-06, - "loss": 0.6787, - "step": 42370 - }, - { - "epoch": 1.09, - "learning_rate": 1.4755157019140097e-06, - "loss": 0.7236, - "step": 42371 - }, - { - "epoch": 1.09, - "learning_rate": 1.4754913598335166e-06, - "loss": 0.6821, - "step": 42372 - }, - { - "epoch": 1.09, - "learning_rate": 1.4754670173889618e-06, - "loss": 0.5908, - "step": 42373 - }, - { - "epoch": 1.09, - "learning_rate": 1.4754426745803638e-06, - "loss": 0.5, - "step": 42374 - }, - { - "epoch": 1.09, - "learning_rate": 1.4754183314077413e-06, - "loss": 0.6699, - "step": 42375 - }, - { - "epoch": 1.09, - "learning_rate": 1.4753939878711126e-06, - "loss": 0.4185, - "step": 42376 - }, - { - "epoch": 1.09, - "learning_rate": 1.4753696439704969e-06, - "loss": 0.6963, - "step": 42377 - }, - { - "epoch": 1.09, - "learning_rate": 1.4753452997059122e-06, - "loss": 0.8369, - "step": 42378 - }, - { - "epoch": 1.09, - "learning_rate": 1.4753209550773777e-06, - "loss": 0.4895, - "step": 42379 - }, - { - "epoch": 1.09, - "learning_rate": 1.4752966100849115e-06, - "loss": 0.7178, - "step": 42380 - }, - { - "epoch": 1.09, - "learning_rate": 1.4752722647285329e-06, - "loss": 0.6489, - "step": 42381 - }, - { - "epoch": 1.09, - "learning_rate": 1.4752479190082598e-06, - "loss": 0.7295, - "step": 42382 - }, - { - "epoch": 1.09, - "learning_rate": 1.4752235729241115e-06, - "loss": 0.5669, - "step": 42383 - }, - { - "epoch": 1.09, - "learning_rate": 1.4751992264761064e-06, - "loss": 0.749, - "step": 42384 - }, - { - "epoch": 1.09, - "learning_rate": 1.4751748796642628e-06, - "loss": 0.7627, - "step": 42385 - }, - { - "epoch": 1.09, - "learning_rate": 1.4751505324886e-06, - "loss": 0.7891, - "step": 42386 - }, - { - "epoch": 1.09, - "learning_rate": 1.475126184949136e-06, - "loss": 0.5298, - "step": 42387 - }, - { - "epoch": 1.09, - "learning_rate": 1.4751018370458898e-06, - "loss": 0.6641, - "step": 42388 - }, - { - "epoch": 1.09, - "learning_rate": 1.4750774887788802e-06, - "loss": 0.7734, - "step": 42389 - }, - { - "epoch": 1.09, - "learning_rate": 1.4750531401481254e-06, - "loss": 0.6299, - "step": 42390 - }, - { - "epoch": 1.09, - "learning_rate": 1.4750287911536444e-06, - "loss": 0.7412, - "step": 42391 - }, - { - "epoch": 1.09, - "learning_rate": 1.4750044417954554e-06, - "loss": 0.6377, - "step": 42392 - }, - { - "epoch": 1.09, - "learning_rate": 1.4749800920735776e-06, - "loss": 0.7549, - "step": 42393 - }, - { - "epoch": 1.09, - "learning_rate": 1.4749557419880293e-06, - "loss": 0.7773, - "step": 42394 - }, - { - "epoch": 1.09, - "learning_rate": 1.4749313915388291e-06, - "loss": 0.6475, - "step": 42395 - }, - { - "epoch": 1.09, - "learning_rate": 1.474907040725996e-06, - "loss": 0.5576, - "step": 42396 - }, - { - "epoch": 1.09, - "learning_rate": 1.4748826895495482e-06, - "loss": 0.6265, - "step": 42397 - }, - { - "epoch": 1.09, - "learning_rate": 1.4748583380095049e-06, - "loss": 0.6172, - "step": 42398 - }, - { - "epoch": 1.09, - "learning_rate": 1.474833986105884e-06, - "loss": 0.6689, - "step": 42399 - }, - { - "epoch": 1.09, - "learning_rate": 1.474809633838705e-06, - "loss": 0.626, - "step": 42400 - }, - { - "epoch": 1.09, - "learning_rate": 1.4747852812079855e-06, - "loss": 0.7744, - "step": 42401 - }, - { - "epoch": 1.09, - "learning_rate": 1.4747609282137451e-06, - "loss": 0.606, - "step": 42402 - }, - { - "epoch": 1.09, - "learning_rate": 1.4747365748560023e-06, - "loss": 0.79, - "step": 42403 - }, - { - "epoch": 1.09, - "learning_rate": 1.474712221134775e-06, - "loss": 0.6328, - "step": 42404 - }, - { - "epoch": 1.09, - "learning_rate": 1.474687867050083e-06, - "loss": 0.6875, - "step": 42405 - }, - { - "epoch": 1.09, - "learning_rate": 1.474663512601944e-06, - "loss": 0.8184, - "step": 42406 - }, - { - "epoch": 1.09, - "learning_rate": 1.4746391577903767e-06, - "loss": 0.6001, - "step": 42407 - }, - { - "epoch": 1.09, - "learning_rate": 1.4746148026154003e-06, - "loss": 0.5586, - "step": 42408 - }, - { - "epoch": 1.09, - "learning_rate": 1.4745904470770334e-06, - "loss": 0.8447, - "step": 42409 - }, - { - "epoch": 1.09, - "learning_rate": 1.474566091175294e-06, - "loss": 0.6499, - "step": 42410 - }, - { - "epoch": 1.09, - "learning_rate": 1.4745417349102015e-06, - "loss": 0.8096, - "step": 42411 - }, - { - "epoch": 1.09, - "learning_rate": 1.474517378281774e-06, - "loss": 0.6855, - "step": 42412 - }, - { - "epoch": 1.09, - "learning_rate": 1.4744930212900307e-06, - "loss": 0.5942, - "step": 42413 - }, - { - "epoch": 1.09, - "learning_rate": 1.4744686639349894e-06, - "loss": 0.6377, - "step": 42414 - }, - { - "epoch": 1.09, - "learning_rate": 1.4744443062166693e-06, - "loss": 0.6777, - "step": 42415 - }, - { - "epoch": 1.09, - "learning_rate": 1.4744199481350892e-06, - "loss": 0.5728, - "step": 42416 - }, - { - "epoch": 1.09, - "learning_rate": 1.4743955896902675e-06, - "loss": 0.5243, - "step": 42417 - }, - { - "epoch": 1.09, - "learning_rate": 1.4743712308822232e-06, - "loss": 0.646, - "step": 42418 - }, - { - "epoch": 1.09, - "learning_rate": 1.4743468717109746e-06, - "loss": 0.6357, - "step": 42419 - }, - { - "epoch": 1.09, - "learning_rate": 1.4743225121765402e-06, - "loss": 0.5752, - "step": 42420 - }, - { - "epoch": 1.09, - "learning_rate": 1.4742981522789388e-06, - "loss": 0.5176, - "step": 42421 - }, - { - "epoch": 1.09, - "learning_rate": 1.4742737920181892e-06, - "loss": 0.5011, - "step": 42422 - }, - { - "epoch": 1.09, - "learning_rate": 1.4742494313943102e-06, - "loss": 0.7144, - "step": 42423 - }, - { - "epoch": 1.09, - "learning_rate": 1.4742250704073198e-06, - "loss": 0.75, - "step": 42424 - }, - { - "epoch": 1.09, - "learning_rate": 1.4742007090572375e-06, - "loss": 0.5737, - "step": 42425 - }, - { - "epoch": 1.09, - "learning_rate": 1.474176347344081e-06, - "loss": 0.6875, - "step": 42426 - }, - { - "epoch": 1.09, - "learning_rate": 1.47415198526787e-06, - "loss": 0.6748, - "step": 42427 - }, - { - "epoch": 1.09, - "learning_rate": 1.4741276228286223e-06, - "loss": 0.8887, - "step": 42428 - }, - { - "epoch": 1.09, - "learning_rate": 1.4741032600263567e-06, - "loss": 0.6147, - "step": 42429 - }, - { - "epoch": 1.09, - "learning_rate": 1.4740788968610925e-06, - "loss": 0.627, - "step": 42430 - }, - { - "epoch": 1.09, - "learning_rate": 1.4740545333328477e-06, - "loss": 0.8496, - "step": 42431 - }, - { - "epoch": 1.09, - "learning_rate": 1.4740301694416411e-06, - "loss": 0.6787, - "step": 42432 - }, - { - "epoch": 1.09, - "learning_rate": 1.4740058051874916e-06, - "loss": 0.6094, - "step": 42433 - }, - { - "epoch": 1.09, - "learning_rate": 1.4739814405704174e-06, - "loss": 0.8516, - "step": 42434 - }, - { - "epoch": 1.09, - "learning_rate": 1.4739570755904373e-06, - "loss": 0.7852, - "step": 42435 - }, - { - "epoch": 1.09, - "learning_rate": 1.4739327102475704e-06, - "loss": 0.7178, - "step": 42436 - }, - { - "epoch": 1.09, - "learning_rate": 1.4739083445418347e-06, - "loss": 0.6611, - "step": 42437 - }, - { - "epoch": 1.09, - "learning_rate": 1.4738839784732497e-06, - "loss": 0.6357, - "step": 42438 - }, - { - "epoch": 1.09, - "learning_rate": 1.4738596120418329e-06, - "loss": 0.6504, - "step": 42439 - }, - { - "epoch": 1.09, - "learning_rate": 1.4738352452476039e-06, - "loss": 0.5635, - "step": 42440 - }, - { - "epoch": 1.09, - "learning_rate": 1.473810878090581e-06, - "loss": 0.6184, - "step": 42441 - }, - { - "epoch": 1.09, - "learning_rate": 1.473786510570783e-06, - "loss": 0.603, - "step": 42442 - }, - { - "epoch": 1.09, - "learning_rate": 1.4737621426882283e-06, - "loss": 0.6851, - "step": 42443 - }, - { - "epoch": 1.09, - "learning_rate": 1.4737377744429357e-06, - "loss": 0.4866, - "step": 42444 - }, - { - "epoch": 1.09, - "learning_rate": 1.473713405834924e-06, - "loss": 0.5554, - "step": 42445 - }, - { - "epoch": 1.09, - "learning_rate": 1.4736890368642116e-06, - "loss": 0.6816, - "step": 42446 - }, - { - "epoch": 1.09, - "learning_rate": 1.4736646675308171e-06, - "loss": 0.7007, - "step": 42447 - }, - { - "epoch": 1.09, - "learning_rate": 1.4736402978347598e-06, - "loss": 0.6924, - "step": 42448 - }, - { - "epoch": 1.09, - "learning_rate": 1.4736159277760578e-06, - "loss": 0.6304, - "step": 42449 - }, - { - "epoch": 1.09, - "learning_rate": 1.4735915573547297e-06, - "loss": 0.5864, - "step": 42450 - }, - { - "epoch": 1.09, - "learning_rate": 1.473567186570794e-06, - "loss": 0.6943, - "step": 42451 - }, - { - "epoch": 1.09, - "learning_rate": 1.4735428154242705e-06, - "loss": 0.4619, - "step": 42452 - }, - { - "epoch": 1.09, - "learning_rate": 1.4735184439151764e-06, - "loss": 0.7803, - "step": 42453 - }, - { - "epoch": 1.09, - "learning_rate": 1.4734940720435312e-06, - "loss": 0.6621, - "step": 42454 - }, - { - "epoch": 1.09, - "learning_rate": 1.4734696998093532e-06, - "loss": 0.7061, - "step": 42455 - }, - { - "epoch": 1.09, - "learning_rate": 1.4734453272126615e-06, - "loss": 0.6602, - "step": 42456 - }, - { - "epoch": 1.09, - "learning_rate": 1.4734209542534743e-06, - "loss": 0.665, - "step": 42457 - }, - { - "epoch": 1.09, - "learning_rate": 1.4733965809318106e-06, - "loss": 0.6719, - "step": 42458 - }, - { - "epoch": 1.09, - "learning_rate": 1.4733722072476888e-06, - "loss": 0.6543, - "step": 42459 - }, - { - "epoch": 1.09, - "learning_rate": 1.4733478332011275e-06, - "loss": 0.6113, - "step": 42460 - }, - { - "epoch": 1.09, - "learning_rate": 1.4733234587921458e-06, - "loss": 0.4686, - "step": 42461 - }, - { - "epoch": 1.09, - "learning_rate": 1.4732990840207618e-06, - "loss": 0.5649, - "step": 42462 - }, - { - "epoch": 1.09, - "learning_rate": 1.473274708886995e-06, - "loss": 0.7148, - "step": 42463 - }, - { - "epoch": 1.09, - "learning_rate": 1.473250333390863e-06, - "loss": 0.4263, - "step": 42464 - }, - { - "epoch": 1.09, - "learning_rate": 1.4732259575323852e-06, - "loss": 0.8359, - "step": 42465 - }, - { - "epoch": 1.09, - "learning_rate": 1.4732015813115796e-06, - "loss": 0.7832, - "step": 42466 - }, - { - "epoch": 1.09, - "learning_rate": 1.473177204728466e-06, - "loss": 0.6196, - "step": 42467 - }, - { - "epoch": 1.09, - "learning_rate": 1.473152827783062e-06, - "loss": 0.4861, - "step": 42468 - }, - { - "epoch": 1.09, - "learning_rate": 1.4731284504753869e-06, - "loss": 0.5991, - "step": 42469 - }, - { - "epoch": 1.09, - "learning_rate": 1.4731040728054587e-06, - "loss": 0.6294, - "step": 42470 - }, - { - "epoch": 1.09, - "learning_rate": 1.4730796947732968e-06, - "loss": 0.8447, - "step": 42471 - }, - { - "epoch": 1.09, - "learning_rate": 1.4730553163789192e-06, - "loss": 0.426, - "step": 42472 - }, - { - "epoch": 1.09, - "learning_rate": 1.4730309376223452e-06, - "loss": 0.6646, - "step": 42473 - }, - { - "epoch": 1.09, - "learning_rate": 1.473006558503593e-06, - "loss": 0.5962, - "step": 42474 - }, - { - "epoch": 1.09, - "learning_rate": 1.4729821790226816e-06, - "loss": 0.9072, - "step": 42475 - }, - { - "epoch": 1.09, - "learning_rate": 1.472957799179629e-06, - "loss": 0.7275, - "step": 42476 - }, - { - "epoch": 1.09, - "learning_rate": 1.4729334189744549e-06, - "loss": 0.7354, - "step": 42477 - }, - { - "epoch": 1.09, - "learning_rate": 1.4729090384071773e-06, - "loss": 0.6396, - "step": 42478 - }, - { - "epoch": 1.09, - "learning_rate": 1.472884657477815e-06, - "loss": 0.6436, - "step": 42479 - }, - { - "epoch": 1.09, - "learning_rate": 1.4728602761863867e-06, - "loss": 0.6362, - "step": 42480 - }, - { - "epoch": 1.09, - "learning_rate": 1.4728358945329107e-06, - "loss": 0.7295, - "step": 42481 - }, - { - "epoch": 1.09, - "learning_rate": 1.4728115125174064e-06, - "loss": 0.6914, - "step": 42482 - }, - { - "epoch": 1.09, - "learning_rate": 1.472787130139892e-06, - "loss": 0.6777, - "step": 42483 - }, - { - "epoch": 1.09, - "learning_rate": 1.472762747400386e-06, - "loss": 0.646, - "step": 42484 - }, - { - "epoch": 1.09, - "learning_rate": 1.4727383642989075e-06, - "loss": 0.6138, - "step": 42485 - }, - { - "epoch": 1.09, - "learning_rate": 1.472713980835475e-06, - "loss": 0.8223, - "step": 42486 - }, - { - "epoch": 1.09, - "learning_rate": 1.472689597010107e-06, - "loss": 0.699, - "step": 42487 - }, - { - "epoch": 1.09, - "learning_rate": 1.4726652128228225e-06, - "loss": 0.5913, - "step": 42488 - }, - { - "epoch": 1.09, - "learning_rate": 1.4726408282736395e-06, - "loss": 0.6914, - "step": 42489 - }, - { - "epoch": 1.09, - "learning_rate": 1.4726164433625777e-06, - "loss": 0.7041, - "step": 42490 - }, - { - "epoch": 1.09, - "learning_rate": 1.472592058089655e-06, - "loss": 0.7305, - "step": 42491 - }, - { - "epoch": 1.09, - "learning_rate": 1.4725676724548903e-06, - "loss": 0.4193, - "step": 42492 - }, - { - "epoch": 1.09, - "learning_rate": 1.4725432864583022e-06, - "loss": 0.6123, - "step": 42493 - }, - { - "epoch": 1.09, - "learning_rate": 1.4725189000999095e-06, - "loss": 0.6904, - "step": 42494 - }, - { - "epoch": 1.09, - "learning_rate": 1.4724945133797308e-06, - "loss": 0.7021, - "step": 42495 - }, - { - "epoch": 1.09, - "learning_rate": 1.472470126297785e-06, - "loss": 0.4614, - "step": 42496 - }, - { - "epoch": 1.09, - "learning_rate": 1.47244573885409e-06, - "loss": 0.749, - "step": 42497 - }, - { - "epoch": 1.09, - "learning_rate": 1.4724213510486656e-06, - "loss": 0.6338, - "step": 42498 - }, - { - "epoch": 1.09, - "learning_rate": 1.4723969628815295e-06, - "loss": 0.3422, - "step": 42499 - }, - { - "epoch": 1.09, - "learning_rate": 1.4723725743527008e-06, - "loss": 0.5723, - "step": 42500 - }, - { - "epoch": 1.09, - "learning_rate": 1.4723481854621984e-06, - "loss": 0.5537, - "step": 42501 - }, - { - "epoch": 1.09, - "learning_rate": 1.4723237962100405e-06, - "loss": 0.5674, - "step": 42502 - }, - { - "epoch": 1.09, - "learning_rate": 1.4722994065962464e-06, - "loss": 0.5908, - "step": 42503 - }, - { - "epoch": 1.09, - "learning_rate": 1.4722750166208337e-06, - "loss": 0.6416, - "step": 42504 - }, - { - "epoch": 1.09, - "learning_rate": 1.4722506262838224e-06, - "loss": 0.6113, - "step": 42505 - }, - { - "epoch": 1.09, - "learning_rate": 1.47222623558523e-06, - "loss": 0.6855, - "step": 42506 - }, - { - "epoch": 1.09, - "learning_rate": 1.4722018445250757e-06, - "loss": 0.6719, - "step": 42507 - }, - { - "epoch": 1.09, - "learning_rate": 1.4721774531033784e-06, - "loss": 0.5283, - "step": 42508 - }, - { - "epoch": 1.09, - "learning_rate": 1.4721530613201566e-06, - "loss": 0.5308, - "step": 42509 - }, - { - "epoch": 1.09, - "learning_rate": 1.4721286691754283e-06, - "loss": 0.6597, - "step": 42510 - }, - { - "epoch": 1.09, - "learning_rate": 1.4721042766692135e-06, - "loss": 0.6416, - "step": 42511 - }, - { - "epoch": 1.09, - "learning_rate": 1.4720798838015297e-06, - "loss": 0.5972, - "step": 42512 - }, - { - "epoch": 1.09, - "learning_rate": 1.4720554905723964e-06, - "loss": 0.6445, - "step": 42513 - }, - { - "epoch": 1.09, - "learning_rate": 1.4720310969818319e-06, - "loss": 0.751, - "step": 42514 - }, - { - "epoch": 1.09, - "learning_rate": 1.4720067030298549e-06, - "loss": 0.6533, - "step": 42515 - }, - { - "epoch": 1.09, - "learning_rate": 1.4719823087164838e-06, - "loss": 0.6406, - "step": 42516 - }, - { - "epoch": 1.09, - "learning_rate": 1.4719579140417376e-06, - "loss": 0.5649, - "step": 42517 - }, - { - "epoch": 1.09, - "learning_rate": 1.4719335190056353e-06, - "loss": 0.7363, - "step": 42518 - }, - { - "epoch": 1.09, - "learning_rate": 1.4719091236081946e-06, - "loss": 0.6729, - "step": 42519 - }, - { - "epoch": 1.09, - "learning_rate": 1.4718847278494351e-06, - "loss": 0.7148, - "step": 42520 - }, - { - "epoch": 1.09, - "learning_rate": 1.471860331729375e-06, - "loss": 0.6758, - "step": 42521 - }, - { - "epoch": 1.09, - "learning_rate": 1.4718359352480333e-06, - "loss": 0.6553, - "step": 42522 - }, - { - "epoch": 1.09, - "learning_rate": 1.471811538405429e-06, - "loss": 0.6191, - "step": 42523 - }, - { - "epoch": 1.09, - "learning_rate": 1.4717871412015797e-06, - "loss": 0.7725, - "step": 42524 - }, - { - "epoch": 1.09, - "learning_rate": 1.4717627436365045e-06, - "loss": 0.6768, - "step": 42525 - }, - { - "epoch": 1.09, - "learning_rate": 1.4717383457102226e-06, - "loss": 0.6675, - "step": 42526 - }, - { - "epoch": 1.09, - "learning_rate": 1.4717139474227521e-06, - "loss": 0.5093, - "step": 42527 - }, - { - "epoch": 1.09, - "learning_rate": 1.4716895487741125e-06, - "loss": 0.5569, - "step": 42528 - }, - { - "epoch": 1.09, - "learning_rate": 1.4716651497643214e-06, - "loss": 0.4795, - "step": 42529 - }, - { - "epoch": 1.09, - "learning_rate": 1.4716407503933981e-06, - "loss": 0.769, - "step": 42530 - }, - { - "epoch": 1.09, - "learning_rate": 1.471616350661361e-06, - "loss": 0.6392, - "step": 42531 - }, - { - "epoch": 1.09, - "learning_rate": 1.4715919505682293e-06, - "loss": 0.6172, - "step": 42532 - }, - { - "epoch": 1.09, - "learning_rate": 1.4715675501140213e-06, - "loss": 0.7476, - "step": 42533 - }, - { - "epoch": 1.09, - "learning_rate": 1.4715431492987552e-06, - "loss": 0.7686, - "step": 42534 - }, - { - "epoch": 1.09, - "learning_rate": 1.4715187481224507e-06, - "loss": 0.6489, - "step": 42535 - }, - { - "epoch": 1.09, - "learning_rate": 1.4714943465851257e-06, - "loss": 0.5303, - "step": 42536 - }, - { - "epoch": 1.09, - "learning_rate": 1.4714699446867993e-06, - "loss": 0.6406, - "step": 42537 - }, - { - "epoch": 1.09, - "learning_rate": 1.4714455424274902e-06, - "loss": 0.5889, - "step": 42538 - }, - { - "epoch": 1.09, - "learning_rate": 1.4714211398072168e-06, - "loss": 0.6914, - "step": 42539 - }, - { - "epoch": 1.09, - "learning_rate": 1.4713967368259978e-06, - "loss": 0.6997, - "step": 42540 - }, - { - "epoch": 1.09, - "learning_rate": 1.4713723334838516e-06, - "loss": 0.7236, - "step": 42541 - }, - { - "epoch": 1.09, - "learning_rate": 1.471347929780798e-06, - "loss": 0.7061, - "step": 42542 - }, - { - "epoch": 1.09, - "learning_rate": 1.4713235257168549e-06, - "loss": 0.2991, - "step": 42543 - }, - { - "epoch": 1.09, - "learning_rate": 1.4712991212920405e-06, - "loss": 0.5244, - "step": 42544 - }, - { - "epoch": 1.09, - "learning_rate": 1.4712747165063743e-06, - "loss": 0.5596, - "step": 42545 - }, - { - "epoch": 1.09, - "learning_rate": 1.471250311359875e-06, - "loss": 0.5991, - "step": 42546 - }, - { - "epoch": 1.09, - "learning_rate": 1.4712259058525607e-06, - "loss": 0.7188, - "step": 42547 - }, - { - "epoch": 1.09, - "learning_rate": 1.4712014999844505e-06, - "loss": 0.8076, - "step": 42548 - }, - { - "epoch": 1.09, - "learning_rate": 1.471177093755563e-06, - "loss": 0.7529, - "step": 42549 - }, - { - "epoch": 1.09, - "learning_rate": 1.4711526871659168e-06, - "loss": 0.6719, - "step": 42550 - }, - { - "epoch": 1.09, - "learning_rate": 1.4711282802155308e-06, - "loss": 0.9199, - "step": 42551 - }, - { - "epoch": 1.09, - "learning_rate": 1.471103872904423e-06, - "loss": 0.55, - "step": 42552 - }, - { - "epoch": 1.09, - "learning_rate": 1.4710794652326136e-06, - "loss": 0.5576, - "step": 42553 - }, - { - "epoch": 1.09, - "learning_rate": 1.4710550572001195e-06, - "loss": 0.7324, - "step": 42554 - }, - { - "epoch": 1.09, - "learning_rate": 1.4710306488069606e-06, - "loss": 0.7666, - "step": 42555 - }, - { - "epoch": 1.09, - "learning_rate": 1.4710062400531549e-06, - "loss": 0.5645, - "step": 42556 - }, - { - "epoch": 1.09, - "learning_rate": 1.4709818309387214e-06, - "loss": 0.5645, - "step": 42557 - }, - { - "epoch": 1.09, - "learning_rate": 1.4709574214636792e-06, - "loss": 0.5435, - "step": 42558 - }, - { - "epoch": 1.09, - "learning_rate": 1.4709330116280463e-06, - "loss": 0.7344, - "step": 42559 - }, - { - "epoch": 1.09, - "learning_rate": 1.4709086014318413e-06, - "loss": 0.5947, - "step": 42560 - }, - { - "epoch": 1.09, - "learning_rate": 1.4708841908750837e-06, - "loss": 0.7393, - "step": 42561 - }, - { - "epoch": 1.09, - "learning_rate": 1.4708597799577915e-06, - "loss": 0.5801, - "step": 42562 - }, - { - "epoch": 1.09, - "learning_rate": 1.4708353686799838e-06, - "loss": 0.3936, - "step": 42563 - }, - { - "epoch": 1.09, - "learning_rate": 1.470810957041679e-06, - "loss": 0.6338, - "step": 42564 - }, - { - "epoch": 1.09, - "learning_rate": 1.4707865450428956e-06, - "loss": 0.5845, - "step": 42565 - }, - { - "epoch": 1.09, - "learning_rate": 1.470762132683653e-06, - "loss": 0.5449, - "step": 42566 - }, - { - "epoch": 1.09, - "learning_rate": 1.4707377199639693e-06, - "loss": 0.542, - "step": 42567 - }, - { - "epoch": 1.09, - "learning_rate": 1.4707133068838636e-06, - "loss": 0.5957, - "step": 42568 - }, - { - "epoch": 1.09, - "learning_rate": 1.4706888934433542e-06, - "loss": 0.6299, - "step": 42569 - }, - { - "epoch": 1.09, - "learning_rate": 1.4706644796424598e-06, - "loss": 0.6504, - "step": 42570 - }, - { - "epoch": 1.09, - "learning_rate": 1.4706400654811995e-06, - "loss": 0.7568, - "step": 42571 - }, - { - "epoch": 1.09, - "learning_rate": 1.4706156509595915e-06, - "loss": 0.708, - "step": 42572 - }, - { - "epoch": 1.09, - "learning_rate": 1.4705912360776548e-06, - "loss": 0.509, - "step": 42573 - }, - { - "epoch": 1.09, - "learning_rate": 1.4705668208354083e-06, - "loss": 0.6455, - "step": 42574 - }, - { - "epoch": 1.09, - "learning_rate": 1.4705424052328702e-06, - "loss": 0.6182, - "step": 42575 - }, - { - "epoch": 1.09, - "learning_rate": 1.4705179892700594e-06, - "loss": 0.7666, - "step": 42576 - }, - { - "epoch": 1.09, - "learning_rate": 1.4704935729469948e-06, - "loss": 0.5767, - "step": 42577 - }, - { - "epoch": 1.09, - "learning_rate": 1.4704691562636948e-06, - "loss": 0.6045, - "step": 42578 - }, - { - "epoch": 1.09, - "learning_rate": 1.470444739220178e-06, - "loss": 0.5737, - "step": 42579 - }, - { - "epoch": 1.09, - "learning_rate": 1.4704203218164636e-06, - "loss": 0.3473, - "step": 42580 - }, - { - "epoch": 1.09, - "learning_rate": 1.4703959040525697e-06, - "loss": 0.7314, - "step": 42581 - }, - { - "epoch": 1.09, - "learning_rate": 1.4703714859285158e-06, - "loss": 0.7881, - "step": 42582 - }, - { - "epoch": 1.09, - "learning_rate": 1.4703470674443195e-06, - "loss": 0.7441, - "step": 42583 - }, - { - "epoch": 1.09, - "learning_rate": 1.4703226486000002e-06, - "loss": 0.6719, - "step": 42584 - }, - { - "epoch": 1.09, - "learning_rate": 1.4702982293955766e-06, - "loss": 0.9395, - "step": 42585 - }, - { - "epoch": 1.09, - "learning_rate": 1.4702738098310671e-06, - "loss": 0.7627, - "step": 42586 - }, - { - "epoch": 1.09, - "learning_rate": 1.4702493899064907e-06, - "loss": 0.6523, - "step": 42587 - }, - { - "epoch": 1.09, - "learning_rate": 1.4702249696218664e-06, - "loss": 0.8301, - "step": 42588 - }, - { - "epoch": 1.09, - "learning_rate": 1.4702005489772117e-06, - "loss": 0.5208, - "step": 42589 - }, - { - "epoch": 1.09, - "learning_rate": 1.4701761279725463e-06, - "loss": 0.7793, - "step": 42590 - }, - { - "epoch": 1.09, - "learning_rate": 1.470151706607889e-06, - "loss": 0.752, - "step": 42591 - }, - { - "epoch": 1.09, - "learning_rate": 1.4701272848832576e-06, - "loss": 0.5269, - "step": 42592 - }, - { - "epoch": 1.09, - "learning_rate": 1.470102862798672e-06, - "loss": 0.6094, - "step": 42593 - }, - { - "epoch": 1.09, - "learning_rate": 1.4700784403541498e-06, - "loss": 0.6838, - "step": 42594 - }, - { - "epoch": 1.09, - "learning_rate": 1.4700540175497103e-06, - "loss": 0.4852, - "step": 42595 - }, - { - "epoch": 1.09, - "learning_rate": 1.4700295943853717e-06, - "loss": 0.5752, - "step": 42596 - }, - { - "epoch": 1.09, - "learning_rate": 1.4700051708611536e-06, - "loss": 0.5361, - "step": 42597 - }, - { - "epoch": 1.09, - "learning_rate": 1.469980746977074e-06, - "loss": 0.5928, - "step": 42598 - }, - { - "epoch": 1.09, - "learning_rate": 1.4699563227331518e-06, - "loss": 0.6367, - "step": 42599 - }, - { - "epoch": 1.09, - "learning_rate": 1.4699318981294052e-06, - "loss": 0.6211, - "step": 42600 - }, - { - "epoch": 1.09, - "learning_rate": 1.4699074731658541e-06, - "loss": 0.6211, - "step": 42601 - }, - { - "epoch": 1.09, - "learning_rate": 1.4698830478425156e-06, - "loss": 0.7388, - "step": 42602 - }, - { - "epoch": 1.09, - "learning_rate": 1.46985862215941e-06, - "loss": 0.6738, - "step": 42603 - }, - { - "epoch": 1.09, - "learning_rate": 1.469834196116555e-06, - "loss": 0.5503, - "step": 42604 - }, - { - "epoch": 1.09, - "learning_rate": 1.4698097697139694e-06, - "loss": 0.6191, - "step": 42605 - }, - { - "epoch": 1.09, - "learning_rate": 1.4697853429516723e-06, - "loss": 0.8223, - "step": 42606 - }, - { - "epoch": 1.09, - "learning_rate": 1.469760915829682e-06, - "loss": 0.606, - "step": 42607 - }, - { - "epoch": 1.09, - "learning_rate": 1.4697364883480174e-06, - "loss": 0.5356, - "step": 42608 - }, - { - "epoch": 1.09, - "learning_rate": 1.469712060506697e-06, - "loss": 0.8896, - "step": 42609 - }, - { - "epoch": 1.09, - "learning_rate": 1.4696876323057398e-06, - "loss": 0.6387, - "step": 42610 - }, - { - "epoch": 1.09, - "learning_rate": 1.4696632037451644e-06, - "loss": 0.6245, - "step": 42611 - }, - { - "epoch": 1.09, - "learning_rate": 1.4696387748249897e-06, - "loss": 0.6882, - "step": 42612 - }, - { - "epoch": 1.09, - "learning_rate": 1.4696143455452342e-06, - "loss": 0.6221, - "step": 42613 - }, - { - "epoch": 1.09, - "learning_rate": 1.4695899159059162e-06, - "loss": 0.6589, - "step": 42614 - }, - { - "epoch": 1.09, - "learning_rate": 1.4695654859070547e-06, - "loss": 0.748, - "step": 42615 - }, - { - "epoch": 1.09, - "learning_rate": 1.4695410555486692e-06, - "loss": 0.8232, - "step": 42616 - }, - { - "epoch": 1.09, - "learning_rate": 1.469516624830777e-06, - "loss": 0.4525, - "step": 42617 - }, - { - "epoch": 1.09, - "learning_rate": 1.469492193753398e-06, - "loss": 0.6021, - "step": 42618 - }, - { - "epoch": 1.09, - "learning_rate": 1.4694677623165502e-06, - "loss": 0.5413, - "step": 42619 - }, - { - "epoch": 1.09, - "learning_rate": 1.4694433305202524e-06, - "loss": 0.6904, - "step": 42620 - }, - { - "epoch": 1.09, - "learning_rate": 1.4694188983645234e-06, - "loss": 0.4419, - "step": 42621 - }, - { - "epoch": 1.09, - "learning_rate": 1.4693944658493822e-06, - "loss": 0.7441, - "step": 42622 - }, - { - "epoch": 1.09, - "learning_rate": 1.4693700329748472e-06, - "loss": 0.7295, - "step": 42623 - }, - { - "epoch": 1.09, - "learning_rate": 1.4693455997409372e-06, - "loss": 0.6348, - "step": 42624 - }, - { - "epoch": 1.09, - "learning_rate": 1.4693211661476706e-06, - "loss": 0.6431, - "step": 42625 - }, - { - "epoch": 1.09, - "learning_rate": 1.4692967321950665e-06, - "loss": 0.6416, - "step": 42626 - }, - { - "epoch": 1.09, - "learning_rate": 1.4692722978831433e-06, - "loss": 0.5781, - "step": 42627 - }, - { - "epoch": 1.09, - "learning_rate": 1.4692478632119202e-06, - "loss": 0.7256, - "step": 42628 - }, - { - "epoch": 1.09, - "learning_rate": 1.4692234281814155e-06, - "loss": 0.5469, - "step": 42629 - }, - { - "epoch": 1.09, - "learning_rate": 1.4691989927916478e-06, - "loss": 0.6963, - "step": 42630 - }, - { - "epoch": 1.09, - "learning_rate": 1.4691745570426362e-06, - "loss": 0.751, - "step": 42631 - }, - { - "epoch": 1.09, - "learning_rate": 1.469150120934399e-06, - "loss": 0.7793, - "step": 42632 - }, - { - "epoch": 1.09, - "learning_rate": 1.4691256844669555e-06, - "loss": 0.6587, - "step": 42633 - }, - { - "epoch": 1.09, - "learning_rate": 1.4691012476403235e-06, - "loss": 0.4192, - "step": 42634 - }, - { - "epoch": 1.09, - "learning_rate": 1.4690768104545227e-06, - "loss": 0.6133, - "step": 42635 - }, - { - "epoch": 1.09, - "learning_rate": 1.4690523729095712e-06, - "loss": 0.457, - "step": 42636 - }, - { - "epoch": 1.09, - "learning_rate": 1.4690279350054878e-06, - "loss": 0.6528, - "step": 42637 - }, - { - "epoch": 1.09, - "learning_rate": 1.4690034967422916e-06, - "loss": 0.4824, - "step": 42638 - }, - { - "epoch": 1.09, - "learning_rate": 1.4689790581200007e-06, - "loss": 0.7891, - "step": 42639 - }, - { - "epoch": 1.09, - "learning_rate": 1.468954619138634e-06, - "loss": 0.5083, - "step": 42640 - }, - { - "epoch": 1.09, - "learning_rate": 1.4689301797982103e-06, - "loss": 0.4224, - "step": 42641 - }, - { - "epoch": 1.09, - "learning_rate": 1.4689057400987485e-06, - "loss": 0.7412, - "step": 42642 - }, - { - "epoch": 1.09, - "learning_rate": 1.4688813000402673e-06, - "loss": 0.6445, - "step": 42643 - }, - { - "epoch": 1.09, - "learning_rate": 1.4688568596227851e-06, - "loss": 0.8594, - "step": 42644 - }, - { - "epoch": 1.09, - "learning_rate": 1.4688324188463207e-06, - "loss": 0.5498, - "step": 42645 - }, - { - "epoch": 1.09, - "learning_rate": 1.4688079777108926e-06, - "loss": 0.7495, - "step": 42646 - }, - { - "epoch": 1.09, - "learning_rate": 1.4687835362165203e-06, - "loss": 0.7153, - "step": 42647 - }, - { - "epoch": 1.09, - "learning_rate": 1.4687590943632218e-06, - "loss": 0.6101, - "step": 42648 - }, - { - "epoch": 1.09, - "learning_rate": 1.468734652151016e-06, - "loss": 0.7275, - "step": 42649 - }, - { - "epoch": 1.09, - "learning_rate": 1.4687102095799216e-06, - "loss": 0.6201, - "step": 42650 - }, - { - "epoch": 1.09, - "learning_rate": 1.4686857666499574e-06, - "loss": 0.5278, - "step": 42651 - }, - { - "epoch": 1.09, - "learning_rate": 1.4686613233611418e-06, - "loss": 0.7715, - "step": 42652 - }, - { - "epoch": 1.09, - "learning_rate": 1.468636879713494e-06, - "loss": 0.7759, - "step": 42653 - }, - { - "epoch": 1.09, - "learning_rate": 1.4686124357070327e-06, - "loss": 0.751, - "step": 42654 - }, - { - "epoch": 1.09, - "learning_rate": 1.468587991341776e-06, - "loss": 0.3052, - "step": 42655 - }, - { - "epoch": 1.09, - "learning_rate": 1.4685635466177434e-06, - "loss": 0.7744, - "step": 42656 - }, - { - "epoch": 1.09, - "learning_rate": 1.4685391015349528e-06, - "loss": 0.6411, - "step": 42657 - }, - { - "epoch": 1.09, - "learning_rate": 1.468514656093424e-06, - "loss": 0.6221, - "step": 42658 - }, - { - "epoch": 1.09, - "learning_rate": 1.4684902102931745e-06, - "loss": 0.7148, - "step": 42659 - }, - { - "epoch": 1.09, - "learning_rate": 1.4684657641342237e-06, - "loss": 0.6572, - "step": 42660 - }, - { - "epoch": 1.09, - "learning_rate": 1.4684413176165903e-06, - "loss": 0.4521, - "step": 42661 - }, - { - "epoch": 1.09, - "learning_rate": 1.4684168707402928e-06, - "loss": 0.4071, - "step": 42662 - }, - { - "epoch": 1.09, - "learning_rate": 1.4683924235053502e-06, - "loss": 0.5024, - "step": 42663 - }, - { - "epoch": 1.09, - "learning_rate": 1.4683679759117812e-06, - "loss": 0.6445, - "step": 42664 - }, - { - "epoch": 1.09, - "learning_rate": 1.4683435279596039e-06, - "loss": 0.6807, - "step": 42665 - }, - { - "epoch": 1.09, - "learning_rate": 1.4683190796488379e-06, - "loss": 0.719, - "step": 42666 - }, - { - "epoch": 1.09, - "learning_rate": 1.4682946309795013e-06, - "loss": 0.6719, - "step": 42667 - }, - { - "epoch": 1.09, - "learning_rate": 1.4682701819516133e-06, - "loss": 0.5898, - "step": 42668 - }, - { - "epoch": 1.09, - "learning_rate": 1.4682457325651921e-06, - "loss": 0.7217, - "step": 42669 - }, - { - "epoch": 1.09, - "learning_rate": 1.4682212828202566e-06, - "loss": 0.7354, - "step": 42670 - }, - { - "epoch": 1.09, - "learning_rate": 1.4681968327168257e-06, - "loss": 0.7373, - "step": 42671 - }, - { - "epoch": 1.09, - "learning_rate": 1.4681723822549181e-06, - "loss": 0.6162, - "step": 42672 - }, - { - "epoch": 1.09, - "learning_rate": 1.4681479314345526e-06, - "loss": 0.7012, - "step": 42673 - }, - { - "epoch": 1.09, - "learning_rate": 1.4681234802557474e-06, - "loss": 0.7886, - "step": 42674 - }, - { - "epoch": 1.09, - "learning_rate": 1.4680990287185218e-06, - "loss": 0.7881, - "step": 42675 - }, - { - "epoch": 1.09, - "learning_rate": 1.468074576822894e-06, - "loss": 0.5938, - "step": 42676 - }, - { - "epoch": 1.09, - "learning_rate": 1.4680501245688833e-06, - "loss": 0.7383, - "step": 42677 - }, - { - "epoch": 1.09, - "learning_rate": 1.4680256719565082e-06, - "loss": 0.5376, - "step": 42678 - }, - { - "epoch": 1.09, - "learning_rate": 1.4680012189857873e-06, - "loss": 0.6548, - "step": 42679 - }, - { - "epoch": 1.09, - "learning_rate": 1.467976765656739e-06, - "loss": 0.6758, - "step": 42680 - }, - { - "epoch": 1.09, - "learning_rate": 1.467952311969383e-06, - "loss": 0.7856, - "step": 42681 - }, - { - "epoch": 1.09, - "learning_rate": 1.4679278579237368e-06, - "loss": 0.6575, - "step": 42682 - }, - { - "epoch": 1.09, - "learning_rate": 1.4679034035198206e-06, - "loss": 0.7432, - "step": 42683 - }, - { - "epoch": 1.09, - "learning_rate": 1.4678789487576515e-06, - "loss": 0.5918, - "step": 42684 - }, - { - "epoch": 1.09, - "learning_rate": 1.4678544936372495e-06, - "loss": 0.668, - "step": 42685 - }, - { - "epoch": 1.09, - "learning_rate": 1.4678300381586324e-06, - "loss": 0.7012, - "step": 42686 - }, - { - "epoch": 1.09, - "learning_rate": 1.4678055823218197e-06, - "loss": 0.6777, - "step": 42687 - }, - { - "epoch": 1.09, - "learning_rate": 1.4677811261268295e-06, - "loss": 0.665, - "step": 42688 - }, - { - "epoch": 1.09, - "learning_rate": 1.4677566695736812e-06, - "loss": 0.6421, - "step": 42689 - }, - { - "epoch": 1.09, - "learning_rate": 1.4677322126623928e-06, - "loss": 0.6084, - "step": 42690 - }, - { - "epoch": 1.09, - "learning_rate": 1.4677077553929835e-06, - "loss": 0.5723, - "step": 42691 - }, - { - "epoch": 1.09, - "learning_rate": 1.4676832977654717e-06, - "loss": 0.6807, - "step": 42692 - }, - { - "epoch": 1.09, - "learning_rate": 1.4676588397798766e-06, - "loss": 0.5913, - "step": 42693 - }, - { - "epoch": 1.09, - "learning_rate": 1.4676343814362163e-06, - "loss": 0.5547, - "step": 42694 - }, - { - "epoch": 1.09, - "learning_rate": 1.46760992273451e-06, - "loss": 0.5386, - "step": 42695 - }, - { - "epoch": 1.09, - "learning_rate": 1.4675854636747761e-06, - "loss": 0.563, - "step": 42696 - }, - { - "epoch": 1.09, - "learning_rate": 1.467561004257034e-06, - "loss": 0.6265, - "step": 42697 - }, - { - "epoch": 1.09, - "learning_rate": 1.4675365444813014e-06, - "loss": 0.6758, - "step": 42698 - }, - { - "epoch": 1.09, - "learning_rate": 1.467512084347598e-06, - "loss": 0.8301, - "step": 42699 - }, - { - "epoch": 1.09, - "learning_rate": 1.4674876238559416e-06, - "loss": 0.7305, - "step": 42700 - }, - { - "epoch": 1.09, - "learning_rate": 1.4674631630063517e-06, - "loss": 0.3906, - "step": 42701 - }, - { - "epoch": 1.09, - "learning_rate": 1.467438701798847e-06, - "loss": 0.7383, - "step": 42702 - }, - { - "epoch": 1.09, - "learning_rate": 1.4674142402334458e-06, - "loss": 0.5132, - "step": 42703 - }, - { - "epoch": 1.09, - "learning_rate": 1.4673897783101668e-06, - "loss": 0.5647, - "step": 42704 - }, - { - "epoch": 1.09, - "learning_rate": 1.467365316029029e-06, - "loss": 0.5293, - "step": 42705 - }, - { - "epoch": 1.09, - "learning_rate": 1.467340853390051e-06, - "loss": 0.8896, - "step": 42706 - }, - { - "epoch": 1.09, - "learning_rate": 1.4673163903932518e-06, - "loss": 0.4717, - "step": 42707 - }, - { - "epoch": 1.09, - "learning_rate": 1.46729192703865e-06, - "loss": 0.5479, - "step": 42708 - }, - { - "epoch": 1.09, - "learning_rate": 1.4672674633262641e-06, - "loss": 0.6699, - "step": 42709 - }, - { - "epoch": 1.09, - "learning_rate": 1.467242999256113e-06, - "loss": 0.7725, - "step": 42710 - }, - { - "epoch": 1.09, - "learning_rate": 1.4672185348282153e-06, - "loss": 0.6758, - "step": 42711 - }, - { - "epoch": 1.09, - "learning_rate": 1.4671940700425905e-06, - "loss": 0.7021, - "step": 42712 - }, - { - "epoch": 1.09, - "learning_rate": 1.4671696048992559e-06, - "loss": 0.5923, - "step": 42713 - }, - { - "epoch": 1.09, - "learning_rate": 1.4671451393982315e-06, - "loss": 0.562, - "step": 42714 - }, - { - "epoch": 1.09, - "learning_rate": 1.4671206735395352e-06, - "loss": 0.5356, - "step": 42715 - }, - { - "epoch": 1.09, - "learning_rate": 1.4670962073231863e-06, - "loss": 0.3748, - "step": 42716 - }, - { - "epoch": 1.09, - "learning_rate": 1.4670717407492033e-06, - "loss": 0.5991, - "step": 42717 - }, - { - "epoch": 1.09, - "learning_rate": 1.4670472738176044e-06, - "loss": 0.6226, - "step": 42718 - }, - { - "epoch": 1.09, - "learning_rate": 1.4670228065284097e-06, - "loss": 0.6128, - "step": 42719 - }, - { - "epoch": 1.09, - "learning_rate": 1.4669983388816368e-06, - "loss": 0.7305, - "step": 42720 - }, - { - "epoch": 1.09, - "learning_rate": 1.4669738708773046e-06, - "loss": 0.5967, - "step": 42721 - }, - { - "epoch": 1.09, - "learning_rate": 1.4669494025154322e-06, - "loss": 0.8164, - "step": 42722 - }, - { - "epoch": 1.1, - "learning_rate": 1.466924933796038e-06, - "loss": 0.4971, - "step": 42723 - }, - { - "epoch": 1.1, - "learning_rate": 1.4669004647191408e-06, - "loss": 0.7485, - "step": 42724 - }, - { - "epoch": 1.1, - "learning_rate": 1.4668759952847593e-06, - "loss": 0.9453, - "step": 42725 - }, - { - "epoch": 1.1, - "learning_rate": 1.4668515254929123e-06, - "loss": 0.4524, - "step": 42726 - }, - { - "epoch": 1.1, - "learning_rate": 1.4668270553436191e-06, - "loss": 0.5347, - "step": 42727 - }, - { - "epoch": 1.1, - "learning_rate": 1.4668025848368975e-06, - "loss": 0.5759, - "step": 42728 - }, - { - "epoch": 1.1, - "learning_rate": 1.4667781139727665e-06, - "loss": 0.7046, - "step": 42729 - }, - { - "epoch": 1.1, - "learning_rate": 1.466753642751245e-06, - "loss": 0.7705, - "step": 42730 - }, - { - "epoch": 1.1, - "learning_rate": 1.4667291711723516e-06, - "loss": 0.7412, - "step": 42731 - }, - { - "epoch": 1.1, - "learning_rate": 1.4667046992361056e-06, - "loss": 0.5195, - "step": 42732 - }, - { - "epoch": 1.1, - "learning_rate": 1.4666802269425248e-06, - "loss": 0.6943, - "step": 42733 - }, - { - "epoch": 1.1, - "learning_rate": 1.4666557542916287e-06, - "loss": 0.7852, - "step": 42734 - }, - { - "epoch": 1.1, - "learning_rate": 1.4666312812834356e-06, - "loss": 0.5444, - "step": 42735 - }, - { - "epoch": 1.1, - "learning_rate": 1.4666068079179642e-06, - "loss": 0.6523, - "step": 42736 - }, - { - "epoch": 1.1, - "learning_rate": 1.4665823341952338e-06, - "loss": 0.4487, - "step": 42737 - }, - { - "epoch": 1.1, - "learning_rate": 1.4665578601152629e-06, - "loss": 0.7168, - "step": 42738 - }, - { - "epoch": 1.1, - "learning_rate": 1.4665333856780697e-06, - "loss": 0.6436, - "step": 42739 - }, - { - "epoch": 1.1, - "learning_rate": 1.4665089108836735e-06, - "loss": 0.7607, - "step": 42740 - }, - { - "epoch": 1.1, - "learning_rate": 1.4664844357320927e-06, - "loss": 0.6226, - "step": 42741 - }, - { - "epoch": 1.1, - "learning_rate": 1.4664599602233466e-06, - "loss": 0.8262, - "step": 42742 - }, - { - "epoch": 1.1, - "learning_rate": 1.4664354843574528e-06, - "loss": 0.6729, - "step": 42743 - }, - { - "epoch": 1.1, - "learning_rate": 1.4664110081344317e-06, - "loss": 0.7344, - "step": 42744 - }, - { - "epoch": 1.1, - "learning_rate": 1.4663865315543005e-06, - "loss": 0.5496, - "step": 42745 - }, - { - "epoch": 1.1, - "learning_rate": 1.466362054617079e-06, - "loss": 0.6152, - "step": 42746 - }, - { - "epoch": 1.1, - "learning_rate": 1.4663375773227853e-06, - "loss": 0.7588, - "step": 42747 - }, - { - "epoch": 1.1, - "learning_rate": 1.4663130996714384e-06, - "loss": 0.8438, - "step": 42748 - }, - { - "epoch": 1.1, - "learning_rate": 1.4662886216630567e-06, - "loss": 0.5176, - "step": 42749 - }, - { - "epoch": 1.1, - "learning_rate": 1.4662641432976598e-06, - "loss": 0.6987, - "step": 42750 - }, - { - "epoch": 1.1, - "learning_rate": 1.4662396645752653e-06, - "loss": 0.5643, - "step": 42751 - }, - { - "epoch": 1.1, - "learning_rate": 1.4662151854958933e-06, - "loss": 0.791, - "step": 42752 - }, - { - "epoch": 1.1, - "learning_rate": 1.466190706059561e-06, - "loss": 0.548, - "step": 42753 - }, - { - "epoch": 1.1, - "learning_rate": 1.4661662262662884e-06, - "loss": 0.5142, - "step": 42754 - }, - { - "epoch": 1.1, - "learning_rate": 1.4661417461160933e-06, - "loss": 0.7363, - "step": 42755 - }, - { - "epoch": 1.1, - "learning_rate": 1.4661172656089954e-06, - "loss": 0.6479, - "step": 42756 - }, - { - "epoch": 1.1, - "learning_rate": 1.4660927847450126e-06, - "loss": 0.7666, - "step": 42757 - }, - { - "epoch": 1.1, - "learning_rate": 1.4660683035241642e-06, - "loss": 0.6191, - "step": 42758 - }, - { - "epoch": 1.1, - "learning_rate": 1.4660438219464685e-06, - "loss": 0.6738, - "step": 42759 - }, - { - "epoch": 1.1, - "learning_rate": 1.4660193400119447e-06, - "loss": 0.6973, - "step": 42760 - }, - { - "epoch": 1.1, - "learning_rate": 1.465994857720611e-06, - "loss": 0.8506, - "step": 42761 - }, - { - "epoch": 1.1, - "learning_rate": 1.465970375072487e-06, - "loss": 0.7969, - "step": 42762 - }, - { - "epoch": 1.1, - "learning_rate": 1.4659458920675907e-06, - "loss": 0.4927, - "step": 42763 - }, - { - "epoch": 1.1, - "learning_rate": 1.465921408705941e-06, - "loss": 0.5603, - "step": 42764 - }, - { - "epoch": 1.1, - "learning_rate": 1.4658969249875566e-06, - "loss": 0.6924, - "step": 42765 - }, - { - "epoch": 1.1, - "learning_rate": 1.4658724409124563e-06, - "loss": 0.6777, - "step": 42766 - }, - { - "epoch": 1.1, - "learning_rate": 1.4658479564806591e-06, - "loss": 0.5757, - "step": 42767 - }, - { - "epoch": 1.1, - "learning_rate": 1.4658234716921834e-06, - "loss": 0.603, - "step": 42768 - }, - { - "epoch": 1.1, - "learning_rate": 1.4657989865470481e-06, - "loss": 0.6328, - "step": 42769 - }, - { - "epoch": 1.1, - "learning_rate": 1.4657745010452717e-06, - "loss": 0.7705, - "step": 42770 - }, - { - "epoch": 1.1, - "learning_rate": 1.4657500151868735e-06, - "loss": 0.8018, - "step": 42771 - }, - { - "epoch": 1.1, - "learning_rate": 1.465725528971872e-06, - "loss": 0.6455, - "step": 42772 - }, - { - "epoch": 1.1, - "learning_rate": 1.465701042400286e-06, - "loss": 0.6631, - "step": 42773 - }, - { - "epoch": 1.1, - "learning_rate": 1.4656765554721338e-06, - "loss": 0.6396, - "step": 42774 - }, - { - "epoch": 1.1, - "learning_rate": 1.4656520681874344e-06, - "loss": 0.6768, - "step": 42775 - }, - { - "epoch": 1.1, - "learning_rate": 1.4656275805462065e-06, - "loss": 0.7461, - "step": 42776 - }, - { - "epoch": 1.1, - "learning_rate": 1.4656030925484697e-06, - "loss": 0.6342, - "step": 42777 - }, - { - "epoch": 1.1, - "learning_rate": 1.4655786041942415e-06, - "loss": 0.6558, - "step": 42778 - }, - { - "epoch": 1.1, - "learning_rate": 1.4655541154835413e-06, - "loss": 0.66, - "step": 42779 - }, - { - "epoch": 1.1, - "learning_rate": 1.4655296264163875e-06, - "loss": 0.6655, - "step": 42780 - }, - { - "epoch": 1.1, - "learning_rate": 1.465505136992799e-06, - "loss": 0.7168, - "step": 42781 - }, - { - "epoch": 1.1, - "learning_rate": 1.4654806472127952e-06, - "loss": 0.5083, - "step": 42782 - }, - { - "epoch": 1.1, - "learning_rate": 1.465456157076394e-06, - "loss": 0.8008, - "step": 42783 - }, - { - "epoch": 1.1, - "learning_rate": 1.4654316665836142e-06, - "loss": 0.8652, - "step": 42784 - }, - { - "epoch": 1.1, - "learning_rate": 1.4654071757344748e-06, - "loss": 0.665, - "step": 42785 - }, - { - "epoch": 1.1, - "learning_rate": 1.4653826845289948e-06, - "loss": 0.5708, - "step": 42786 - }, - { - "epoch": 1.1, - "learning_rate": 1.4653581929671926e-06, - "loss": 0.6377, - "step": 42787 - }, - { - "epoch": 1.1, - "learning_rate": 1.465333701049087e-06, - "loss": 0.6992, - "step": 42788 - }, - { - "epoch": 1.1, - "learning_rate": 1.4653092087746965e-06, - "loss": 0.4055, - "step": 42789 - }, - { - "epoch": 1.1, - "learning_rate": 1.4652847161440405e-06, - "loss": 0.7065, - "step": 42790 - }, - { - "epoch": 1.1, - "learning_rate": 1.4652602231571369e-06, - "loss": 0.8213, - "step": 42791 - }, - { - "epoch": 1.1, - "learning_rate": 1.4652357298140057e-06, - "loss": 0.7607, - "step": 42792 - }, - { - "epoch": 1.1, - "learning_rate": 1.4652112361146642e-06, - "loss": 0.7119, - "step": 42793 - }, - { - "epoch": 1.1, - "learning_rate": 1.4651867420591324e-06, - "loss": 0.6411, - "step": 42794 - }, - { - "epoch": 1.1, - "learning_rate": 1.4651622476474279e-06, - "loss": 0.6582, - "step": 42795 - }, - { - "epoch": 1.1, - "learning_rate": 1.4651377528795706e-06, - "loss": 0.7012, - "step": 42796 - }, - { - "epoch": 1.1, - "learning_rate": 1.4651132577555785e-06, - "loss": 0.5624, - "step": 42797 - }, - { - "epoch": 1.1, - "learning_rate": 1.4650887622754706e-06, - "loss": 0.3966, - "step": 42798 - }, - { - "epoch": 1.1, - "learning_rate": 1.4650642664392655e-06, - "loss": 0.623, - "step": 42799 - }, - { - "epoch": 1.1, - "learning_rate": 1.4650397702469821e-06, - "loss": 0.5547, - "step": 42800 - }, - { - "epoch": 1.1, - "learning_rate": 1.465015273698639e-06, - "loss": 0.5732, - "step": 42801 - }, - { - "epoch": 1.1, - "learning_rate": 1.4649907767942558e-06, - "loss": 0.4348, - "step": 42802 - }, - { - "epoch": 1.1, - "learning_rate": 1.4649662795338498e-06, - "loss": 0.6602, - "step": 42803 - }, - { - "epoch": 1.1, - "learning_rate": 1.4649417819174409e-06, - "loss": 0.6152, - "step": 42804 - }, - { - "epoch": 1.1, - "learning_rate": 1.464917283945047e-06, - "loss": 0.7104, - "step": 42805 - }, - { - "epoch": 1.1, - "learning_rate": 1.4648927856166878e-06, - "loss": 0.623, - "step": 42806 - }, - { - "epoch": 1.1, - "learning_rate": 1.4648682869323814e-06, - "loss": 0.6567, - "step": 42807 - }, - { - "epoch": 1.1, - "learning_rate": 1.4648437878921464e-06, - "loss": 0.7949, - "step": 42808 - }, - { - "epoch": 1.1, - "learning_rate": 1.4648192884960022e-06, - "loss": 0.5835, - "step": 42809 - }, - { - "epoch": 1.1, - "learning_rate": 1.4647947887439671e-06, - "loss": 0.6694, - "step": 42810 - }, - { - "epoch": 1.1, - "learning_rate": 1.4647702886360603e-06, - "loss": 0.6841, - "step": 42811 - }, - { - "epoch": 1.1, - "learning_rate": 1.4647457881723e-06, - "loss": 0.6357, - "step": 42812 - }, - { - "epoch": 1.1, - "learning_rate": 1.4647212873527055e-06, - "loss": 0.7002, - "step": 42813 - }, - { - "epoch": 1.1, - "learning_rate": 1.464696786177295e-06, - "loss": 0.5874, - "step": 42814 - }, - { - "epoch": 1.1, - "learning_rate": 1.4646722846460877e-06, - "loss": 0.748, - "step": 42815 - }, - { - "epoch": 1.1, - "learning_rate": 1.4646477827591019e-06, - "loss": 0.8037, - "step": 42816 - }, - { - "epoch": 1.1, - "learning_rate": 1.4646232805163573e-06, - "loss": 0.5713, - "step": 42817 - }, - { - "epoch": 1.1, - "learning_rate": 1.4645987779178712e-06, - "loss": 0.5967, - "step": 42818 - }, - { - "epoch": 1.1, - "learning_rate": 1.4645742749636637e-06, - "loss": 0.5522, - "step": 42819 - }, - { - "epoch": 1.1, - "learning_rate": 1.4645497716537527e-06, - "loss": 0.478, - "step": 42820 - }, - { - "epoch": 1.1, - "learning_rate": 1.4645252679881577e-06, - "loss": 0.5962, - "step": 42821 - }, - { - "epoch": 1.1, - "learning_rate": 1.4645007639668968e-06, - "loss": 0.7734, - "step": 42822 - }, - { - "epoch": 1.1, - "learning_rate": 1.4644762595899892e-06, - "loss": 0.7744, - "step": 42823 - }, - { - "epoch": 1.1, - "learning_rate": 1.4644517548574534e-06, - "loss": 0.6914, - "step": 42824 - }, - { - "epoch": 1.1, - "learning_rate": 1.4644272497693081e-06, - "loss": 0.668, - "step": 42825 - }, - { - "epoch": 1.1, - "learning_rate": 1.4644027443255725e-06, - "loss": 0.5439, - "step": 42826 - }, - { - "epoch": 1.1, - "learning_rate": 1.464378238526265e-06, - "loss": 0.5918, - "step": 42827 - }, - { - "epoch": 1.1, - "learning_rate": 1.464353732371404e-06, - "loss": 0.6504, - "step": 42828 - }, - { - "epoch": 1.1, - "learning_rate": 1.4643292258610091e-06, - "loss": 0.5562, - "step": 42829 - }, - { - "epoch": 1.1, - "learning_rate": 1.4643047189950988e-06, - "loss": 0.708, - "step": 42830 - }, - { - "epoch": 1.1, - "learning_rate": 1.4642802117736913e-06, - "loss": 0.666, - "step": 42831 - }, - { - "epoch": 1.1, - "learning_rate": 1.4642557041968061e-06, - "loss": 0.5688, - "step": 42832 - }, - { - "epoch": 1.1, - "learning_rate": 1.4642311962644617e-06, - "loss": 0.6792, - "step": 42833 - }, - { - "epoch": 1.1, - "learning_rate": 1.4642066879766765e-06, - "loss": 0.7969, - "step": 42834 - }, - { - "epoch": 1.1, - "learning_rate": 1.4641821793334698e-06, - "loss": 0.7935, - "step": 42835 - }, - { - "epoch": 1.1, - "learning_rate": 1.4641576703348602e-06, - "loss": 0.6709, - "step": 42836 - }, - { - "epoch": 1.1, - "learning_rate": 1.4641331609808662e-06, - "loss": 0.7676, - "step": 42837 - }, - { - "epoch": 1.1, - "learning_rate": 1.4641086512715073e-06, - "loss": 0.5276, - "step": 42838 - }, - { - "epoch": 1.1, - "learning_rate": 1.464084141206801e-06, - "loss": 0.5996, - "step": 42839 - }, - { - "epoch": 1.1, - "learning_rate": 1.4640596307867674e-06, - "loss": 0.6826, - "step": 42840 - }, - { - "epoch": 1.1, - "learning_rate": 1.4640351200114244e-06, - "loss": 0.7227, - "step": 42841 - }, - { - "epoch": 1.1, - "learning_rate": 1.4640106088807913e-06, - "loss": 0.7461, - "step": 42842 - }, - { - "epoch": 1.1, - "learning_rate": 1.463986097394886e-06, - "loss": 0.6558, - "step": 42843 - }, - { - "epoch": 1.1, - "learning_rate": 1.4639615855537287e-06, - "loss": 0.6792, - "step": 42844 - }, - { - "epoch": 1.1, - "learning_rate": 1.4639370733573367e-06, - "loss": 0.4608, - "step": 42845 - }, - { - "epoch": 1.1, - "learning_rate": 1.4639125608057296e-06, - "loss": 0.6958, - "step": 42846 - }, - { - "epoch": 1.1, - "learning_rate": 1.4638880478989262e-06, - "loss": 0.6826, - "step": 42847 - }, - { - "epoch": 1.1, - "learning_rate": 1.463863534636945e-06, - "loss": 0.8281, - "step": 42848 - }, - { - "epoch": 1.1, - "learning_rate": 1.4638390210198045e-06, - "loss": 0.6768, - "step": 42849 - }, - { - "epoch": 1.1, - "learning_rate": 1.4638145070475241e-06, - "loss": 0.6152, - "step": 42850 - }, - { - "epoch": 1.1, - "learning_rate": 1.463789992720122e-06, - "loss": 0.7881, - "step": 42851 - }, - { - "epoch": 1.1, - "learning_rate": 1.4637654780376174e-06, - "loss": 0.6074, - "step": 42852 - }, - { - "epoch": 1.1, - "learning_rate": 1.4637409630000291e-06, - "loss": 0.6875, - "step": 42853 - }, - { - "epoch": 1.1, - "learning_rate": 1.4637164476073753e-06, - "loss": 0.7451, - "step": 42854 - }, - { - "epoch": 1.1, - "learning_rate": 1.4636919318596755e-06, - "loss": 0.75, - "step": 42855 - }, - { - "epoch": 1.1, - "learning_rate": 1.463667415756948e-06, - "loss": 0.4863, - "step": 42856 - }, - { - "epoch": 1.1, - "learning_rate": 1.4636428992992116e-06, - "loss": 0.5736, - "step": 42857 - }, - { - "epoch": 1.1, - "learning_rate": 1.463618382486485e-06, - "loss": 0.3523, - "step": 42858 - }, - { - "epoch": 1.1, - "learning_rate": 1.4635938653187871e-06, - "loss": 0.582, - "step": 42859 - }, - { - "epoch": 1.1, - "learning_rate": 1.4635693477961368e-06, - "loss": 0.5579, - "step": 42860 - }, - { - "epoch": 1.1, - "learning_rate": 1.463544829918553e-06, - "loss": 0.6228, - "step": 42861 - }, - { - "epoch": 1.1, - "learning_rate": 1.4635203116860543e-06, - "loss": 0.5052, - "step": 42862 - }, - { - "epoch": 1.1, - "learning_rate": 1.463495793098659e-06, - "loss": 0.6396, - "step": 42863 - }, - { - "epoch": 1.1, - "learning_rate": 1.4634712741563862e-06, - "loss": 0.6477, - "step": 42864 - }, - { - "epoch": 1.1, - "learning_rate": 1.4634467548592552e-06, - "loss": 0.7402, - "step": 42865 - }, - { - "epoch": 1.1, - "learning_rate": 1.4634222352072841e-06, - "loss": 0.6963, - "step": 42866 - }, - { - "epoch": 1.1, - "learning_rate": 1.4633977152004922e-06, - "loss": 0.8154, - "step": 42867 - }, - { - "epoch": 1.1, - "learning_rate": 1.4633731948388974e-06, - "loss": 0.5996, - "step": 42868 - }, - { - "epoch": 1.1, - "learning_rate": 1.4633486741225193e-06, - "loss": 0.7041, - "step": 42869 - }, - { - "epoch": 1.1, - "learning_rate": 1.4633241530513764e-06, - "loss": 0.6729, - "step": 42870 - }, - { - "epoch": 1.1, - "learning_rate": 1.4632996316254877e-06, - "loss": 0.709, - "step": 42871 - }, - { - "epoch": 1.1, - "learning_rate": 1.4632751098448718e-06, - "loss": 0.6709, - "step": 42872 - }, - { - "epoch": 1.1, - "learning_rate": 1.4632505877095473e-06, - "loss": 0.7163, - "step": 42873 - }, - { - "epoch": 1.1, - "learning_rate": 1.4632260652195332e-06, - "loss": 0.583, - "step": 42874 - }, - { - "epoch": 1.1, - "learning_rate": 1.463201542374848e-06, - "loss": 0.5049, - "step": 42875 - }, - { - "epoch": 1.1, - "learning_rate": 1.463177019175511e-06, - "loss": 0.7642, - "step": 42876 - }, - { - "epoch": 1.1, - "learning_rate": 1.4631524956215405e-06, - "loss": 0.5513, - "step": 42877 - }, - { - "epoch": 1.1, - "learning_rate": 1.4631279717129554e-06, - "loss": 0.6562, - "step": 42878 - }, - { - "epoch": 1.1, - "learning_rate": 1.4631034474497744e-06, - "loss": 0.4863, - "step": 42879 - }, - { - "epoch": 1.1, - "learning_rate": 1.4630789228320163e-06, - "loss": 0.6177, - "step": 42880 - }, - { - "epoch": 1.1, - "learning_rate": 1.4630543978597004e-06, - "loss": 0.6035, - "step": 42881 - }, - { - "epoch": 1.1, - "learning_rate": 1.4630298725328449e-06, - "loss": 0.7002, - "step": 42882 - }, - { - "epoch": 1.1, - "learning_rate": 1.4630053468514686e-06, - "loss": 0.3999, - "step": 42883 - }, - { - "epoch": 1.1, - "learning_rate": 1.4629808208155903e-06, - "loss": 0.6045, - "step": 42884 - }, - { - "epoch": 1.1, - "learning_rate": 1.462956294425229e-06, - "loss": 0.5986, - "step": 42885 - }, - { - "epoch": 1.1, - "learning_rate": 1.4629317676804033e-06, - "loss": 0.5093, - "step": 42886 - }, - { - "epoch": 1.1, - "learning_rate": 1.4629072405811322e-06, - "loss": 0.5981, - "step": 42887 - }, - { - "epoch": 1.1, - "learning_rate": 1.462882713127434e-06, - "loss": 0.7227, - "step": 42888 - }, - { - "epoch": 1.1, - "learning_rate": 1.462858185319328e-06, - "loss": 0.7988, - "step": 42889 - }, - { - "epoch": 1.1, - "learning_rate": 1.4628336571568328e-06, - "loss": 0.5225, - "step": 42890 - }, - { - "epoch": 1.1, - "learning_rate": 1.4628091286399671e-06, - "loss": 0.593, - "step": 42891 - }, - { - "epoch": 1.1, - "learning_rate": 1.4627845997687499e-06, - "loss": 0.6501, - "step": 42892 - }, - { - "epoch": 1.1, - "learning_rate": 1.4627600705431995e-06, - "loss": 0.5986, - "step": 42893 - }, - { - "epoch": 1.1, - "learning_rate": 1.4627355409633354e-06, - "loss": 0.6943, - "step": 42894 - }, - { - "epoch": 1.1, - "learning_rate": 1.4627110110291754e-06, - "loss": 0.7607, - "step": 42895 - }, - { - "epoch": 1.1, - "learning_rate": 1.462686480740739e-06, - "loss": 0.6162, - "step": 42896 - }, - { - "epoch": 1.1, - "learning_rate": 1.4626619500980454e-06, - "loss": 0.7646, - "step": 42897 - }, - { - "epoch": 1.1, - "learning_rate": 1.462637419101112e-06, - "loss": 0.7378, - "step": 42898 - }, - { - "epoch": 1.1, - "learning_rate": 1.4626128877499588e-06, - "loss": 0.5435, - "step": 42899 - }, - { - "epoch": 1.1, - "learning_rate": 1.4625883560446042e-06, - "loss": 0.6748, - "step": 42900 - }, - { - "epoch": 1.1, - "learning_rate": 1.462563823985067e-06, - "loss": 0.75, - "step": 42901 - }, - { - "epoch": 1.1, - "learning_rate": 1.4625392915713662e-06, - "loss": 0.6963, - "step": 42902 - }, - { - "epoch": 1.1, - "learning_rate": 1.46251475880352e-06, - "loss": 0.6333, - "step": 42903 - }, - { - "epoch": 1.1, - "learning_rate": 1.4624902256815475e-06, - "loss": 0.8789, - "step": 42904 - }, - { - "epoch": 1.1, - "learning_rate": 1.4624656922054674e-06, - "loss": 0.626, - "step": 42905 - }, - { - "epoch": 1.1, - "learning_rate": 1.4624411583752987e-06, - "loss": 0.7754, - "step": 42906 - }, - { - "epoch": 1.1, - "learning_rate": 1.4624166241910603e-06, - "loss": 0.5952, - "step": 42907 - }, - { - "epoch": 1.1, - "learning_rate": 1.4623920896527703e-06, - "loss": 0.698, - "step": 42908 - }, - { - "epoch": 1.1, - "learning_rate": 1.4623675547604486e-06, - "loss": 0.7305, - "step": 42909 - }, - { - "epoch": 1.1, - "learning_rate": 1.4623430195141126e-06, - "loss": 0.749, - "step": 42910 - }, - { - "epoch": 1.1, - "learning_rate": 1.4623184839137823e-06, - "loss": 0.6294, - "step": 42911 - }, - { - "epoch": 1.1, - "learning_rate": 1.4622939479594759e-06, - "loss": 0.6533, - "step": 42912 - }, - { - "epoch": 1.1, - "learning_rate": 1.4622694116512121e-06, - "loss": 0.5737, - "step": 42913 - }, - { - "epoch": 1.1, - "learning_rate": 1.46224487498901e-06, - "loss": 0.7393, - "step": 42914 - }, - { - "epoch": 1.1, - "learning_rate": 1.4622203379728884e-06, - "loss": 0.6895, - "step": 42915 - }, - { - "epoch": 1.1, - "learning_rate": 1.4621958006028657e-06, - "loss": 0.5347, - "step": 42916 - }, - { - "epoch": 1.1, - "learning_rate": 1.462171262878961e-06, - "loss": 0.5554, - "step": 42917 - }, - { - "epoch": 1.1, - "learning_rate": 1.462146724801193e-06, - "loss": 0.833, - "step": 42918 - }, - { - "epoch": 1.1, - "learning_rate": 1.4621221863695805e-06, - "loss": 0.668, - "step": 42919 - }, - { - "epoch": 1.1, - "learning_rate": 1.4620976475841423e-06, - "loss": 0.6226, - "step": 42920 - }, - { - "epoch": 1.1, - "learning_rate": 1.462073108444897e-06, - "loss": 0.6138, - "step": 42921 - }, - { - "epoch": 1.1, - "learning_rate": 1.462048568951864e-06, - "loss": 0.8682, - "step": 42922 - }, - { - "epoch": 1.1, - "learning_rate": 1.4620240291050615e-06, - "loss": 0.6895, - "step": 42923 - }, - { - "epoch": 1.1, - "learning_rate": 1.4619994889045081e-06, - "loss": 0.6223, - "step": 42924 - }, - { - "epoch": 1.1, - "learning_rate": 1.4619749483502233e-06, - "loss": 0.5752, - "step": 42925 - }, - { - "epoch": 1.1, - "learning_rate": 1.4619504074422252e-06, - "loss": 0.8066, - "step": 42926 - }, - { - "epoch": 1.1, - "learning_rate": 1.4619258661805334e-06, - "loss": 0.6147, - "step": 42927 - }, - { - "epoch": 1.1, - "learning_rate": 1.4619013245651659e-06, - "loss": 0.752, - "step": 42928 - }, - { - "epoch": 1.1, - "learning_rate": 1.4618767825961418e-06, - "loss": 0.7969, - "step": 42929 - }, - { - "epoch": 1.1, - "learning_rate": 1.46185224027348e-06, - "loss": 0.8291, - "step": 42930 - }, - { - "epoch": 1.1, - "learning_rate": 1.4618276975971988e-06, - "loss": 0.6577, - "step": 42931 - }, - { - "epoch": 1.1, - "learning_rate": 1.461803154567318e-06, - "loss": 0.6089, - "step": 42932 - }, - { - "epoch": 1.1, - "learning_rate": 1.4617786111838552e-06, - "loss": 0.7529, - "step": 42933 - }, - { - "epoch": 1.1, - "learning_rate": 1.46175406744683e-06, - "loss": 0.6572, - "step": 42934 - }, - { - "epoch": 1.1, - "learning_rate": 1.461729523356261e-06, - "loss": 0.8398, - "step": 42935 - }, - { - "epoch": 1.1, - "learning_rate": 1.461704978912167e-06, - "loss": 0.6216, - "step": 42936 - }, - { - "epoch": 1.1, - "learning_rate": 1.4616804341145664e-06, - "loss": 0.5586, - "step": 42937 - }, - { - "epoch": 1.1, - "learning_rate": 1.4616558889634788e-06, - "loss": 0.6094, - "step": 42938 - }, - { - "epoch": 1.1, - "learning_rate": 1.4616313434589218e-06, - "loss": 0.7065, - "step": 42939 - }, - { - "epoch": 1.1, - "learning_rate": 1.4616067976009153e-06, - "loss": 0.7773, - "step": 42940 - }, - { - "epoch": 1.1, - "learning_rate": 1.4615822513894778e-06, - "loss": 0.4971, - "step": 42941 - }, - { - "epoch": 1.1, - "learning_rate": 1.4615577048246279e-06, - "loss": 0.6948, - "step": 42942 - }, - { - "epoch": 1.1, - "learning_rate": 1.4615331579063845e-06, - "loss": 0.6523, - "step": 42943 - }, - { - "epoch": 1.1, - "learning_rate": 1.4615086106347663e-06, - "loss": 0.626, - "step": 42944 - }, - { - "epoch": 1.1, - "learning_rate": 1.4614840630097923e-06, - "loss": 0.6826, - "step": 42945 - }, - { - "epoch": 1.1, - "learning_rate": 1.4614595150314811e-06, - "loss": 0.7588, - "step": 42946 - }, - { - "epoch": 1.1, - "learning_rate": 1.4614349666998518e-06, - "loss": 0.5205, - "step": 42947 - }, - { - "epoch": 1.1, - "learning_rate": 1.4614104180149228e-06, - "loss": 0.6621, - "step": 42948 - }, - { - "epoch": 1.1, - "learning_rate": 1.461385868976713e-06, - "loss": 0.6694, - "step": 42949 - }, - { - "epoch": 1.1, - "learning_rate": 1.461361319585241e-06, - "loss": 0.873, - "step": 42950 - }, - { - "epoch": 1.1, - "learning_rate": 1.4613367698405262e-06, - "loss": 0.5923, - "step": 42951 - }, - { - "epoch": 1.1, - "learning_rate": 1.461312219742587e-06, - "loss": 0.6431, - "step": 42952 - }, - { - "epoch": 1.1, - "learning_rate": 1.4612876692914424e-06, - "loss": 0.6401, - "step": 42953 - }, - { - "epoch": 1.1, - "learning_rate": 1.4612631184871108e-06, - "loss": 0.6411, - "step": 42954 - }, - { - "epoch": 1.1, - "learning_rate": 1.4612385673296113e-06, - "loss": 0.644, - "step": 42955 - }, - { - "epoch": 1.1, - "learning_rate": 1.4612140158189625e-06, - "loss": 0.7891, - "step": 42956 - }, - { - "epoch": 1.1, - "learning_rate": 1.4611894639551837e-06, - "loss": 0.584, - "step": 42957 - }, - { - "epoch": 1.1, - "learning_rate": 1.461164911738293e-06, - "loss": 0.6211, - "step": 42958 - }, - { - "epoch": 1.1, - "learning_rate": 1.4611403591683095e-06, - "loss": 0.6152, - "step": 42959 - }, - { - "epoch": 1.1, - "learning_rate": 1.4611158062452523e-06, - "loss": 0.4648, - "step": 42960 - }, - { - "epoch": 1.1, - "learning_rate": 1.4610912529691396e-06, - "loss": 0.6365, - "step": 42961 - }, - { - "epoch": 1.1, - "learning_rate": 1.4610666993399909e-06, - "loss": 0.6523, - "step": 42962 - }, - { - "epoch": 1.1, - "learning_rate": 1.4610421453578244e-06, - "loss": 0.7334, - "step": 42963 - }, - { - "epoch": 1.1, - "learning_rate": 1.4610175910226592e-06, - "loss": 0.7031, - "step": 42964 - }, - { - "epoch": 1.1, - "learning_rate": 1.4609930363345143e-06, - "loss": 0.604, - "step": 42965 - }, - { - "epoch": 1.1, - "learning_rate": 1.4609684812934075e-06, - "loss": 0.8154, - "step": 42966 - }, - { - "epoch": 1.1, - "learning_rate": 1.460943925899359e-06, - "loss": 0.542, - "step": 42967 - }, - { - "epoch": 1.1, - "learning_rate": 1.4609193701523868e-06, - "loss": 0.7856, - "step": 42968 - }, - { - "epoch": 1.1, - "learning_rate": 1.4608948140525096e-06, - "loss": 0.603, - "step": 42969 - }, - { - "epoch": 1.1, - "learning_rate": 1.4608702575997466e-06, - "loss": 0.623, - "step": 42970 - }, - { - "epoch": 1.1, - "learning_rate": 1.4608457007941165e-06, - "loss": 0.7607, - "step": 42971 - }, - { - "epoch": 1.1, - "learning_rate": 1.4608211436356379e-06, - "loss": 0.6685, - "step": 42972 - }, - { - "epoch": 1.1, - "learning_rate": 1.4607965861243296e-06, - "loss": 0.6562, - "step": 42973 - }, - { - "epoch": 1.1, - "learning_rate": 1.4607720282602109e-06, - "loss": 0.6161, - "step": 42974 - }, - { - "epoch": 1.1, - "learning_rate": 1.4607474700433e-06, - "loss": 0.8242, - "step": 42975 - }, - { - "epoch": 1.1, - "learning_rate": 1.4607229114736162e-06, - "loss": 0.7109, - "step": 42976 - }, - { - "epoch": 1.1, - "learning_rate": 1.4606983525511779e-06, - "loss": 0.5647, - "step": 42977 - }, - { - "epoch": 1.1, - "learning_rate": 1.4606737932760037e-06, - "loss": 0.7012, - "step": 42978 - }, - { - "epoch": 1.1, - "learning_rate": 1.4606492336481134e-06, - "loss": 0.6953, - "step": 42979 - }, - { - "epoch": 1.1, - "learning_rate": 1.4606246736675247e-06, - "loss": 0.6836, - "step": 42980 - }, - { - "epoch": 1.1, - "learning_rate": 1.460600113334257e-06, - "loss": 0.5184, - "step": 42981 - }, - { - "epoch": 1.1, - "learning_rate": 1.4605755526483293e-06, - "loss": 0.665, - "step": 42982 - }, - { - "epoch": 1.1, - "learning_rate": 1.4605509916097596e-06, - "loss": 0.75, - "step": 42983 - }, - { - "epoch": 1.1, - "learning_rate": 1.460526430218567e-06, - "loss": 0.6992, - "step": 42984 - }, - { - "epoch": 1.1, - "learning_rate": 1.460501868474771e-06, - "loss": 0.5952, - "step": 42985 - }, - { - "epoch": 1.1, - "learning_rate": 1.4604773063783898e-06, - "loss": 0.6777, - "step": 42986 - }, - { - "epoch": 1.1, - "learning_rate": 1.4604527439294423e-06, - "loss": 0.6858, - "step": 42987 - }, - { - "epoch": 1.1, - "learning_rate": 1.4604281811279472e-06, - "loss": 0.6719, - "step": 42988 - }, - { - "epoch": 1.1, - "learning_rate": 1.4604036179739235e-06, - "loss": 0.7656, - "step": 42989 - }, - { - "epoch": 1.1, - "learning_rate": 1.4603790544673895e-06, - "loss": 0.6099, - "step": 42990 - }, - { - "epoch": 1.1, - "learning_rate": 1.4603544906083652e-06, - "loss": 0.7812, - "step": 42991 - }, - { - "epoch": 1.1, - "learning_rate": 1.4603299263968681e-06, - "loss": 0.7061, - "step": 42992 - }, - { - "epoch": 1.1, - "learning_rate": 1.4603053618329177e-06, - "loss": 0.5762, - "step": 42993 - }, - { - "epoch": 1.1, - "learning_rate": 1.4602807969165325e-06, - "loss": 0.7285, - "step": 42994 - }, - { - "epoch": 1.1, - "learning_rate": 1.4602562316477316e-06, - "loss": 0.7061, - "step": 42995 - }, - { - "epoch": 1.1, - "learning_rate": 1.4602316660265336e-06, - "loss": 0.5737, - "step": 42996 - }, - { - "epoch": 1.1, - "learning_rate": 1.4602071000529575e-06, - "loss": 0.71, - "step": 42997 - }, - { - "epoch": 1.1, - "learning_rate": 1.4601825337270218e-06, - "loss": 0.6694, - "step": 42998 - }, - { - "epoch": 1.1, - "learning_rate": 1.4601579670487456e-06, - "loss": 0.6992, - "step": 42999 - }, - { - "epoch": 1.1, - "learning_rate": 1.4601334000181475e-06, - "loss": 0.4534, - "step": 43000 - }, - { - "epoch": 1.1, - "learning_rate": 1.4601088326352468e-06, - "loss": 0.6143, - "step": 43001 - }, - { - "epoch": 1.1, - "learning_rate": 1.4600842649000615e-06, - "loss": 0.8281, - "step": 43002 - }, - { - "epoch": 1.1, - "learning_rate": 1.4600596968126111e-06, - "loss": 0.6846, - "step": 43003 - }, - { - "epoch": 1.1, - "learning_rate": 1.460035128372914e-06, - "loss": 0.6304, - "step": 43004 - }, - { - "epoch": 1.1, - "learning_rate": 1.460010559580989e-06, - "loss": 0.6611, - "step": 43005 - }, - { - "epoch": 1.1, - "learning_rate": 1.4599859904368555e-06, - "loss": 0.6499, - "step": 43006 - }, - { - "epoch": 1.1, - "learning_rate": 1.4599614209405312e-06, - "loss": 0.4458, - "step": 43007 - }, - { - "epoch": 1.1, - "learning_rate": 1.4599368510920362e-06, - "loss": 0.6099, - "step": 43008 - }, - { - "epoch": 1.1, - "learning_rate": 1.4599122808913885e-06, - "loss": 0.6519, - "step": 43009 - }, - { - "epoch": 1.1, - "learning_rate": 1.4598877103386072e-06, - "loss": 0.4739, - "step": 43010 - }, - { - "epoch": 1.1, - "learning_rate": 1.459863139433711e-06, - "loss": 0.5663, - "step": 43011 - }, - { - "epoch": 1.1, - "learning_rate": 1.4598385681767187e-06, - "loss": 0.606, - "step": 43012 - }, - { - "epoch": 1.1, - "learning_rate": 1.4598139965676488e-06, - "loss": 0.7012, - "step": 43013 - }, - { - "epoch": 1.1, - "learning_rate": 1.459789424606521e-06, - "loss": 0.6152, - "step": 43014 - }, - { - "epoch": 1.1, - "learning_rate": 1.4597648522933533e-06, - "loss": 0.6201, - "step": 43015 - }, - { - "epoch": 1.1, - "learning_rate": 1.459740279628165e-06, - "loss": 0.6689, - "step": 43016 - }, - { - "epoch": 1.1, - "learning_rate": 1.4597157066109746e-06, - "loss": 0.7852, - "step": 43017 - }, - { - "epoch": 1.1, - "learning_rate": 1.459691133241801e-06, - "loss": 0.6313, - "step": 43018 - }, - { - "epoch": 1.1, - "learning_rate": 1.459666559520663e-06, - "loss": 0.874, - "step": 43019 - }, - { - "epoch": 1.1, - "learning_rate": 1.4596419854475795e-06, - "loss": 0.6953, - "step": 43020 - }, - { - "epoch": 1.1, - "learning_rate": 1.4596174110225691e-06, - "loss": 0.751, - "step": 43021 - }, - { - "epoch": 1.1, - "learning_rate": 1.459592836245651e-06, - "loss": 0.7803, - "step": 43022 - }, - { - "epoch": 1.1, - "learning_rate": 1.4595682611168439e-06, - "loss": 0.7852, - "step": 43023 - }, - { - "epoch": 1.1, - "learning_rate": 1.4595436856361664e-06, - "loss": 0.7178, - "step": 43024 - }, - { - "epoch": 1.1, - "learning_rate": 1.459519109803637e-06, - "loss": 0.6963, - "step": 43025 - }, - { - "epoch": 1.1, - "learning_rate": 1.4594945336192757e-06, - "loss": 0.543, - "step": 43026 - }, - { - "epoch": 1.1, - "learning_rate": 1.4594699570831002e-06, - "loss": 0.7139, - "step": 43027 - }, - { - "epoch": 1.1, - "learning_rate": 1.4594453801951297e-06, - "loss": 0.791, - "step": 43028 - }, - { - "epoch": 1.1, - "learning_rate": 1.4594208029553827e-06, - "loss": 0.5742, - "step": 43029 - }, - { - "epoch": 1.1, - "learning_rate": 1.4593962253638787e-06, - "loss": 0.709, - "step": 43030 - }, - { - "epoch": 1.1, - "learning_rate": 1.459371647420636e-06, - "loss": 0.7734, - "step": 43031 - }, - { - "epoch": 1.1, - "learning_rate": 1.4593470691256735e-06, - "loss": 0.4727, - "step": 43032 - }, - { - "epoch": 1.1, - "learning_rate": 1.4593224904790103e-06, - "loss": 0.5889, - "step": 43033 - }, - { - "epoch": 1.1, - "learning_rate": 1.4592979114806644e-06, - "loss": 0.5042, - "step": 43034 - }, - { - "epoch": 1.1, - "learning_rate": 1.4592733321306559e-06, - "loss": 0.5967, - "step": 43035 - }, - { - "epoch": 1.1, - "learning_rate": 1.4592487524290027e-06, - "loss": 0.6807, - "step": 43036 - }, - { - "epoch": 1.1, - "learning_rate": 1.4592241723757239e-06, - "loss": 0.5337, - "step": 43037 - }, - { - "epoch": 1.1, - "learning_rate": 1.459199591970838e-06, - "loss": 0.6445, - "step": 43038 - }, - { - "epoch": 1.1, - "learning_rate": 1.4591750112143644e-06, - "loss": 0.7861, - "step": 43039 - }, - { - "epoch": 1.1, - "learning_rate": 1.4591504301063214e-06, - "loss": 0.7695, - "step": 43040 - }, - { - "epoch": 1.1, - "learning_rate": 1.4591258486467284e-06, - "loss": 0.7007, - "step": 43041 - }, - { - "epoch": 1.1, - "learning_rate": 1.4591012668356034e-06, - "loss": 0.5815, - "step": 43042 - }, - { - "epoch": 1.1, - "learning_rate": 1.4590766846729658e-06, - "loss": 0.6904, - "step": 43043 - }, - { - "epoch": 1.1, - "learning_rate": 1.4590521021588342e-06, - "loss": 0.7881, - "step": 43044 - }, - { - "epoch": 1.1, - "learning_rate": 1.4590275192932277e-06, - "loss": 0.7158, - "step": 43045 - }, - { - "epoch": 1.1, - "learning_rate": 1.4590029360761648e-06, - "loss": 0.5063, - "step": 43046 - }, - { - "epoch": 1.1, - "learning_rate": 1.4589783525076647e-06, - "loss": 0.6572, - "step": 43047 - }, - { - "epoch": 1.1, - "learning_rate": 1.4589537685877457e-06, - "loss": 0.6992, - "step": 43048 - }, - { - "epoch": 1.1, - "learning_rate": 1.458929184316427e-06, - "loss": 0.6777, - "step": 43049 - }, - { - "epoch": 1.1, - "learning_rate": 1.4589045996937272e-06, - "loss": 0.7075, - "step": 43050 - }, - { - "epoch": 1.1, - "learning_rate": 1.4588800147196655e-06, - "loss": 0.6484, - "step": 43051 - }, - { - "epoch": 1.1, - "learning_rate": 1.4588554293942603e-06, - "loss": 0.751, - "step": 43052 - }, - { - "epoch": 1.1, - "learning_rate": 1.4588308437175308e-06, - "loss": 0.709, - "step": 43053 - }, - { - "epoch": 1.1, - "learning_rate": 1.4588062576894952e-06, - "loss": 0.5879, - "step": 43054 - }, - { - "epoch": 1.1, - "learning_rate": 1.4587816713101733e-06, - "loss": 0.6943, - "step": 43055 - }, - { - "epoch": 1.1, - "learning_rate": 1.4587570845795832e-06, - "loss": 0.71, - "step": 43056 - }, - { - "epoch": 1.1, - "learning_rate": 1.4587324974977436e-06, - "loss": 0.5811, - "step": 43057 - }, - { - "epoch": 1.1, - "learning_rate": 1.4587079100646737e-06, - "loss": 0.4819, - "step": 43058 - }, - { - "epoch": 1.1, - "learning_rate": 1.4586833222803922e-06, - "loss": 0.7686, - "step": 43059 - }, - { - "epoch": 1.1, - "learning_rate": 1.4586587341449184e-06, - "loss": 0.6475, - "step": 43060 - }, - { - "epoch": 1.1, - "learning_rate": 1.4586341456582702e-06, - "loss": 0.7363, - "step": 43061 - }, - { - "epoch": 1.1, - "learning_rate": 1.4586095568204673e-06, - "loss": 0.6943, - "step": 43062 - }, - { - "epoch": 1.1, - "learning_rate": 1.4585849676315277e-06, - "loss": 0.6538, - "step": 43063 - }, - { - "epoch": 1.1, - "learning_rate": 1.4585603780914712e-06, - "loss": 0.6211, - "step": 43064 - }, - { - "epoch": 1.1, - "learning_rate": 1.4585357882003158e-06, - "loss": 0.6689, - "step": 43065 - }, - { - "epoch": 1.1, - "learning_rate": 1.4585111979580808e-06, - "loss": 0.7393, - "step": 43066 - }, - { - "epoch": 1.1, - "learning_rate": 1.4584866073647848e-06, - "loss": 0.6396, - "step": 43067 - }, - { - "epoch": 1.1, - "learning_rate": 1.4584620164204466e-06, - "loss": 0.5938, - "step": 43068 - }, - { - "epoch": 1.1, - "learning_rate": 1.458437425125085e-06, - "loss": 0.511, - "step": 43069 - }, - { - "epoch": 1.1, - "learning_rate": 1.458412833478719e-06, - "loss": 0.5962, - "step": 43070 - }, - { - "epoch": 1.1, - "learning_rate": 1.4583882414813677e-06, - "loss": 0.6938, - "step": 43071 - }, - { - "epoch": 1.1, - "learning_rate": 1.4583636491330492e-06, - "loss": 0.5347, - "step": 43072 - }, - { - "epoch": 1.1, - "learning_rate": 1.458339056433783e-06, - "loss": 0.8008, - "step": 43073 - }, - { - "epoch": 1.1, - "learning_rate": 1.4583144633835875e-06, - "loss": 0.6494, - "step": 43074 - }, - { - "epoch": 1.1, - "learning_rate": 1.4582898699824816e-06, - "loss": 0.8926, - "step": 43075 - }, - { - "epoch": 1.1, - "learning_rate": 1.4582652762304846e-06, - "loss": 0.5312, - "step": 43076 - }, - { - "epoch": 1.1, - "learning_rate": 1.4582406821276147e-06, - "loss": 0.459, - "step": 43077 - }, - { - "epoch": 1.1, - "learning_rate": 1.458216087673891e-06, - "loss": 0.6294, - "step": 43078 - }, - { - "epoch": 1.1, - "learning_rate": 1.4581914928693323e-06, - "loss": 0.6475, - "step": 43079 - }, - { - "epoch": 1.1, - "learning_rate": 1.4581668977139572e-06, - "loss": 0.7036, - "step": 43080 - }, - { - "epoch": 1.1, - "learning_rate": 1.4581423022077854e-06, - "loss": 0.7656, - "step": 43081 - }, - { - "epoch": 1.1, - "learning_rate": 1.4581177063508346e-06, - "loss": 0.5913, - "step": 43082 - }, - { - "epoch": 1.1, - "learning_rate": 1.4580931101431243e-06, - "loss": 0.6807, - "step": 43083 - }, - { - "epoch": 1.1, - "learning_rate": 1.458068513584673e-06, - "loss": 0.6182, - "step": 43084 - }, - { - "epoch": 1.1, - "learning_rate": 1.4580439166754998e-06, - "loss": 0.6494, - "step": 43085 - }, - { - "epoch": 1.1, - "learning_rate": 1.4580193194156235e-06, - "loss": 0.7256, - "step": 43086 - }, - { - "epoch": 1.1, - "learning_rate": 1.457994721805063e-06, - "loss": 0.7422, - "step": 43087 - }, - { - "epoch": 1.1, - "learning_rate": 1.4579701238438369e-06, - "loss": 0.7842, - "step": 43088 - }, - { - "epoch": 1.1, - "learning_rate": 1.457945525531964e-06, - "loss": 0.4829, - "step": 43089 - }, - { - "epoch": 1.1, - "learning_rate": 1.4579209268694632e-06, - "loss": 0.75, - "step": 43090 - }, - { - "epoch": 1.1, - "learning_rate": 1.4578963278563539e-06, - "loss": 0.5791, - "step": 43091 - }, - { - "epoch": 1.1, - "learning_rate": 1.4578717284926538e-06, - "loss": 0.7383, - "step": 43092 - }, - { - "epoch": 1.1, - "learning_rate": 1.4578471287783827e-06, - "loss": 0.5801, - "step": 43093 - }, - { - "epoch": 1.1, - "learning_rate": 1.457822528713559e-06, - "loss": 0.4785, - "step": 43094 - }, - { - "epoch": 1.1, - "learning_rate": 1.457797928298202e-06, - "loss": 0.48, - "step": 43095 - }, - { - "epoch": 1.1, - "learning_rate": 1.4577733275323297e-06, - "loss": 0.458, - "step": 43096 - }, - { - "epoch": 1.1, - "learning_rate": 1.4577487264159613e-06, - "loss": 0.5933, - "step": 43097 - }, - { - "epoch": 1.1, - "learning_rate": 1.4577241249491162e-06, - "loss": 0.7227, - "step": 43098 - }, - { - "epoch": 1.1, - "learning_rate": 1.4576995231318128e-06, - "loss": 0.6533, - "step": 43099 - }, - { - "epoch": 1.1, - "learning_rate": 1.4576749209640695e-06, - "loss": 0.7588, - "step": 43100 - }, - { - "epoch": 1.1, - "learning_rate": 1.457650318445906e-06, - "loss": 0.6812, - "step": 43101 - }, - { - "epoch": 1.1, - "learning_rate": 1.4576257155773404e-06, - "loss": 0.5466, - "step": 43102 - }, - { - "epoch": 1.1, - "learning_rate": 1.4576011123583917e-06, - "loss": 0.7236, - "step": 43103 - }, - { - "epoch": 1.1, - "learning_rate": 1.4575765087890793e-06, - "loss": 0.6274, - "step": 43104 - }, - { - "epoch": 1.1, - "learning_rate": 1.4575519048694211e-06, - "loss": 0.5586, - "step": 43105 - }, - { - "epoch": 1.1, - "learning_rate": 1.4575273005994371e-06, - "loss": 0.7549, - "step": 43106 - }, - { - "epoch": 1.1, - "learning_rate": 1.457502695979145e-06, - "loss": 0.6724, - "step": 43107 - }, - { - "epoch": 1.1, - "learning_rate": 1.4574780910085642e-06, - "loss": 0.623, - "step": 43108 - }, - { - "epoch": 1.1, - "learning_rate": 1.4574534856877136e-06, - "loss": 0.7314, - "step": 43109 - }, - { - "epoch": 1.1, - "learning_rate": 1.4574288800166118e-06, - "loss": 0.7949, - "step": 43110 - }, - { - "epoch": 1.1, - "learning_rate": 1.4574042739952779e-06, - "loss": 0.751, - "step": 43111 - }, - { - "epoch": 1.1, - "learning_rate": 1.4573796676237303e-06, - "loss": 0.5382, - "step": 43112 - }, - { - "epoch": 1.11, - "learning_rate": 1.4573550609019883e-06, - "loss": 0.5798, - "step": 43113 - }, - { - "epoch": 1.11, - "learning_rate": 1.4573304538300705e-06, - "loss": 0.7441, - "step": 43114 - }, - { - "epoch": 1.11, - "learning_rate": 1.4573058464079957e-06, - "loss": 0.4563, - "step": 43115 - }, - { - "epoch": 1.11, - "learning_rate": 1.457281238635783e-06, - "loss": 0.772, - "step": 43116 - }, - { - "epoch": 1.11, - "learning_rate": 1.457256630513451e-06, - "loss": 0.623, - "step": 43117 - }, - { - "epoch": 1.11, - "learning_rate": 1.4572320220410187e-06, - "loss": 0.6914, - "step": 43118 - }, - { - "epoch": 1.11, - "learning_rate": 1.4572074132185047e-06, - "loss": 0.5283, - "step": 43119 - }, - { - "epoch": 1.11, - "learning_rate": 1.4571828040459281e-06, - "loss": 0.5957, - "step": 43120 - }, - { - "epoch": 1.11, - "learning_rate": 1.4571581945233077e-06, - "loss": 0.6548, - "step": 43121 - }, - { - "epoch": 1.11, - "learning_rate": 1.4571335846506622e-06, - "loss": 0.7578, - "step": 43122 - }, - { - "epoch": 1.11, - "learning_rate": 1.457108974428011e-06, - "loss": 0.6758, - "step": 43123 - }, - { - "epoch": 1.11, - "learning_rate": 1.457084363855372e-06, - "loss": 0.6674, - "step": 43124 - }, - { - "epoch": 1.11, - "learning_rate": 1.4570597529327644e-06, - "loss": 0.6865, - "step": 43125 - }, - { - "epoch": 1.11, - "learning_rate": 1.4570351416602074e-06, - "loss": 0.4265, - "step": 43126 - }, - { - "epoch": 1.11, - "learning_rate": 1.4570105300377197e-06, - "loss": 0.6914, - "step": 43127 - }, - { - "epoch": 1.11, - "learning_rate": 1.4569859180653197e-06, - "loss": 0.7485, - "step": 43128 - }, - { - "epoch": 1.11, - "learning_rate": 1.456961305743027e-06, - "loss": 0.6289, - "step": 43129 - }, - { - "epoch": 1.11, - "learning_rate": 1.4569366930708596e-06, - "loss": 0.6514, - "step": 43130 - }, - { - "epoch": 1.11, - "learning_rate": 1.4569120800488373e-06, - "loss": 0.749, - "step": 43131 - }, - { - "epoch": 1.11, - "learning_rate": 1.4568874666769782e-06, - "loss": 0.6318, - "step": 43132 - }, - { - "epoch": 1.11, - "learning_rate": 1.4568628529553012e-06, - "loss": 0.6299, - "step": 43133 - }, - { - "epoch": 1.11, - "learning_rate": 1.4568382388838255e-06, - "loss": 0.6787, - "step": 43134 - }, - { - "epoch": 1.11, - "learning_rate": 1.4568136244625698e-06, - "loss": 0.4829, - "step": 43135 - }, - { - "epoch": 1.11, - "learning_rate": 1.4567890096915529e-06, - "loss": 0.4071, - "step": 43136 - }, - { - "epoch": 1.11, - "learning_rate": 1.4567643945707935e-06, - "loss": 0.7344, - "step": 43137 - }, - { - "epoch": 1.11, - "learning_rate": 1.4567397791003107e-06, - "loss": 0.5967, - "step": 43138 - }, - { - "epoch": 1.11, - "learning_rate": 1.4567151632801233e-06, - "loss": 0.8242, - "step": 43139 - }, - { - "epoch": 1.11, - "learning_rate": 1.4566905471102499e-06, - "loss": 0.6172, - "step": 43140 - }, - { - "epoch": 1.11, - "learning_rate": 1.4566659305907098e-06, - "loss": 0.6445, - "step": 43141 - }, - { - "epoch": 1.11, - "learning_rate": 1.4566413137215215e-06, - "loss": 0.7373, - "step": 43142 - }, - { - "epoch": 1.11, - "learning_rate": 1.4566166965027038e-06, - "loss": 0.7061, - "step": 43143 - }, - { - "epoch": 1.11, - "learning_rate": 1.456592078934276e-06, - "loss": 0.5913, - "step": 43144 - }, - { - "epoch": 1.11, - "learning_rate": 1.4565674610162564e-06, - "loss": 0.4614, - "step": 43145 - }, - { - "epoch": 1.11, - "learning_rate": 1.4565428427486644e-06, - "loss": 0.4019, - "step": 43146 - }, - { - "epoch": 1.11, - "learning_rate": 1.4565182241315182e-06, - "loss": 0.6191, - "step": 43147 - }, - { - "epoch": 1.11, - "learning_rate": 1.4564936051648372e-06, - "loss": 0.6357, - "step": 43148 - }, - { - "epoch": 1.11, - "learning_rate": 1.4564689858486395e-06, - "loss": 0.752, - "step": 43149 - }, - { - "epoch": 1.11, - "learning_rate": 1.456444366182945e-06, - "loss": 0.6299, - "step": 43150 - }, - { - "epoch": 1.11, - "learning_rate": 1.456419746167772e-06, - "loss": 0.6309, - "step": 43151 - }, - { - "epoch": 1.11, - "learning_rate": 1.4563951258031394e-06, - "loss": 0.6836, - "step": 43152 - }, - { - "epoch": 1.11, - "learning_rate": 1.456370505089066e-06, - "loss": 0.7842, - "step": 43153 - }, - { - "epoch": 1.11, - "learning_rate": 1.4563458840255706e-06, - "loss": 0.6138, - "step": 43154 - }, - { - "epoch": 1.11, - "learning_rate": 1.4563212626126723e-06, - "loss": 0.8066, - "step": 43155 - }, - { - "epoch": 1.11, - "learning_rate": 1.4562966408503898e-06, - "loss": 0.8438, - "step": 43156 - }, - { - "epoch": 1.11, - "learning_rate": 1.4562720187387418e-06, - "loss": 0.6641, - "step": 43157 - }, - { - "epoch": 1.11, - "learning_rate": 1.4562473962777473e-06, - "loss": 0.6797, - "step": 43158 - }, - { - "epoch": 1.11, - "learning_rate": 1.456222773467425e-06, - "loss": 0.6504, - "step": 43159 - }, - { - "epoch": 1.11, - "learning_rate": 1.4561981503077942e-06, - "loss": 0.7109, - "step": 43160 - }, - { - "epoch": 1.11, - "learning_rate": 1.4561735267988734e-06, - "loss": 0.561, - "step": 43161 - }, - { - "epoch": 1.11, - "learning_rate": 1.4561489029406814e-06, - "loss": 0.7607, - "step": 43162 - }, - { - "epoch": 1.11, - "learning_rate": 1.4561242787332374e-06, - "loss": 0.5938, - "step": 43163 - }, - { - "epoch": 1.11, - "learning_rate": 1.4560996541765595e-06, - "loss": 0.6777, - "step": 43164 - }, - { - "epoch": 1.11, - "learning_rate": 1.4560750292706673e-06, - "loss": 0.6572, - "step": 43165 - }, - { - "epoch": 1.11, - "learning_rate": 1.4560504040155797e-06, - "loss": 0.5825, - "step": 43166 - }, - { - "epoch": 1.11, - "learning_rate": 1.456025778411315e-06, - "loss": 0.4756, - "step": 43167 - }, - { - "epoch": 1.11, - "learning_rate": 1.4560011524578923e-06, - "loss": 0.8066, - "step": 43168 - }, - { - "epoch": 1.11, - "learning_rate": 1.4559765261553307e-06, - "loss": 0.562, - "step": 43169 - }, - { - "epoch": 1.11, - "learning_rate": 1.4559518995036486e-06, - "loss": 0.5105, - "step": 43170 - }, - { - "epoch": 1.11, - "learning_rate": 1.4559272725028656e-06, - "loss": 0.6265, - "step": 43171 - }, - { - "epoch": 1.11, - "learning_rate": 1.4559026451529994e-06, - "loss": 0.6069, - "step": 43172 - }, - { - "epoch": 1.11, - "learning_rate": 1.45587801745407e-06, - "loss": 0.7051, - "step": 43173 - }, - { - "epoch": 1.11, - "learning_rate": 1.4558533894060955e-06, - "loss": 0.6323, - "step": 43174 - }, - { - "epoch": 1.11, - "learning_rate": 1.455828761009095e-06, - "loss": 0.7422, - "step": 43175 - }, - { - "epoch": 1.11, - "learning_rate": 1.4558041322630874e-06, - "loss": 1.04, - "step": 43176 - }, - { - "epoch": 1.11, - "learning_rate": 1.4557795031680918e-06, - "loss": 0.6719, - "step": 43177 - }, - { - "epoch": 1.11, - "learning_rate": 1.4557548737241263e-06, - "loss": 0.7256, - "step": 43178 - }, - { - "epoch": 1.11, - "learning_rate": 1.4557302439312107e-06, - "loss": 0.6152, - "step": 43179 - }, - { - "epoch": 1.11, - "learning_rate": 1.4557056137893632e-06, - "loss": 0.5073, - "step": 43180 - }, - { - "epoch": 1.11, - "learning_rate": 1.455680983298603e-06, - "loss": 0.4922, - "step": 43181 - }, - { - "epoch": 1.11, - "learning_rate": 1.4556563524589484e-06, - "loss": 0.7432, - "step": 43182 - }, - { - "epoch": 1.11, - "learning_rate": 1.4556317212704191e-06, - "loss": 0.79, - "step": 43183 - }, - { - "epoch": 1.11, - "learning_rate": 1.4556070897330334e-06, - "loss": 0.5591, - "step": 43184 - }, - { - "epoch": 1.11, - "learning_rate": 1.4555824578468103e-06, - "loss": 0.7285, - "step": 43185 - }, - { - "epoch": 1.11, - "learning_rate": 1.4555578256117688e-06, - "loss": 0.7188, - "step": 43186 - }, - { - "epoch": 1.11, - "learning_rate": 1.4555331930279276e-06, - "loss": 0.7285, - "step": 43187 - }, - { - "epoch": 1.11, - "learning_rate": 1.4555085600953054e-06, - "loss": 0.457, - "step": 43188 - }, - { - "epoch": 1.11, - "learning_rate": 1.4554839268139214e-06, - "loss": 0.7666, - "step": 43189 - }, - { - "epoch": 1.11, - "learning_rate": 1.4554592931837942e-06, - "loss": 0.6948, - "step": 43190 - }, - { - "epoch": 1.11, - "learning_rate": 1.455434659204943e-06, - "loss": 0.71, - "step": 43191 - }, - { - "epoch": 1.11, - "learning_rate": 1.4554100248773862e-06, - "loss": 0.6064, - "step": 43192 - }, - { - "epoch": 1.11, - "learning_rate": 1.4553853902011426e-06, - "loss": 0.5933, - "step": 43193 - }, - { - "epoch": 1.11, - "learning_rate": 1.4553607551762319e-06, - "loss": 0.5388, - "step": 43194 - }, - { - "epoch": 1.11, - "learning_rate": 1.4553361198026718e-06, - "loss": 0.5454, - "step": 43195 - }, - { - "epoch": 1.11, - "learning_rate": 1.4553114840804825e-06, - "loss": 0.665, - "step": 43196 - }, - { - "epoch": 1.11, - "learning_rate": 1.4552868480096816e-06, - "loss": 0.7144, - "step": 43197 - }, - { - "epoch": 1.11, - "learning_rate": 1.4552622115902889e-06, - "loss": 0.7695, - "step": 43198 - }, - { - "epoch": 1.11, - "learning_rate": 1.4552375748223224e-06, - "loss": 0.6426, - "step": 43199 - }, - { - "epoch": 1.11, - "learning_rate": 1.4552129377058017e-06, - "loss": 0.54, - "step": 43200 - }, - { - "epoch": 1.11, - "learning_rate": 1.4551883002407454e-06, - "loss": 0.502, - "step": 43201 - }, - { - "epoch": 1.11, - "learning_rate": 1.4551636624271724e-06, - "loss": 0.7178, - "step": 43202 - }, - { - "epoch": 1.11, - "learning_rate": 1.4551390242651011e-06, - "loss": 0.6816, - "step": 43203 - }, - { - "epoch": 1.11, - "learning_rate": 1.4551143857545514e-06, - "loss": 0.7109, - "step": 43204 - }, - { - "epoch": 1.11, - "learning_rate": 1.455089746895541e-06, - "loss": 0.6025, - "step": 43205 - }, - { - "epoch": 1.11, - "learning_rate": 1.4550651076880898e-06, - "loss": 0.7783, - "step": 43206 - }, - { - "epoch": 1.11, - "learning_rate": 1.4550404681322158e-06, - "loss": 0.666, - "step": 43207 - }, - { - "epoch": 1.11, - "learning_rate": 1.4550158282279381e-06, - "loss": 0.749, - "step": 43208 - }, - { - "epoch": 1.11, - "learning_rate": 1.4549911879752758e-06, - "loss": 0.7168, - "step": 43209 - }, - { - "epoch": 1.11, - "learning_rate": 1.454966547374248e-06, - "loss": 0.6919, - "step": 43210 - }, - { - "epoch": 1.11, - "learning_rate": 1.4549419064248732e-06, - "loss": 0.792, - "step": 43211 - }, - { - "epoch": 1.11, - "learning_rate": 1.45491726512717e-06, - "loss": 0.6562, - "step": 43212 - }, - { - "epoch": 1.11, - "learning_rate": 1.4548926234811576e-06, - "loss": 0.7192, - "step": 43213 - }, - { - "epoch": 1.11, - "learning_rate": 1.4548679814868549e-06, - "loss": 0.7275, - "step": 43214 - }, - { - "epoch": 1.11, - "learning_rate": 1.4548433391442806e-06, - "loss": 0.5225, - "step": 43215 - }, - { - "epoch": 1.11, - "learning_rate": 1.4548186964534539e-06, - "loss": 0.5889, - "step": 43216 - }, - { - "epoch": 1.11, - "learning_rate": 1.4547940534143935e-06, - "loss": 0.6982, - "step": 43217 - }, - { - "epoch": 1.11, - "learning_rate": 1.454769410027118e-06, - "loss": 0.7266, - "step": 43218 - }, - { - "epoch": 1.11, - "learning_rate": 1.4547447662916466e-06, - "loss": 0.6357, - "step": 43219 - }, - { - "epoch": 1.11, - "learning_rate": 1.4547201222079976e-06, - "loss": 0.623, - "step": 43220 - }, - { - "epoch": 1.11, - "learning_rate": 1.4546954777761912e-06, - "loss": 0.6309, - "step": 43221 - }, - { - "epoch": 1.11, - "learning_rate": 1.4546708329962445e-06, - "loss": 0.6162, - "step": 43222 - }, - { - "epoch": 1.11, - "learning_rate": 1.4546461878681778e-06, - "loss": 0.5232, - "step": 43223 - }, - { - "epoch": 1.11, - "learning_rate": 1.454621542392009e-06, - "loss": 0.7393, - "step": 43224 - }, - { - "epoch": 1.11, - "learning_rate": 1.4545968965677577e-06, - "loss": 0.593, - "step": 43225 - }, - { - "epoch": 1.11, - "learning_rate": 1.4545722503954426e-06, - "loss": 0.6167, - "step": 43226 - }, - { - "epoch": 1.11, - "learning_rate": 1.4545476038750822e-06, - "loss": 0.7412, - "step": 43227 - }, - { - "epoch": 1.11, - "learning_rate": 1.4545229570066955e-06, - "loss": 0.6689, - "step": 43228 - }, - { - "epoch": 1.11, - "learning_rate": 1.4544983097903013e-06, - "loss": 0.5774, - "step": 43229 - }, - { - "epoch": 1.11, - "learning_rate": 1.4544736622259191e-06, - "loss": 0.6411, - "step": 43230 - }, - { - "epoch": 1.11, - "learning_rate": 1.454449014313567e-06, - "loss": 0.7441, - "step": 43231 - }, - { - "epoch": 1.11, - "learning_rate": 1.4544243660532645e-06, - "loss": 0.5542, - "step": 43232 - }, - { - "epoch": 1.11, - "learning_rate": 1.4543997174450298e-06, - "loss": 0.6768, - "step": 43233 - }, - { - "epoch": 1.11, - "learning_rate": 1.4543750684888822e-06, - "loss": 0.5493, - "step": 43234 - }, - { - "epoch": 1.11, - "learning_rate": 1.4543504191848408e-06, - "loss": 0.7158, - "step": 43235 - }, - { - "epoch": 1.11, - "learning_rate": 1.454325769532924e-06, - "loss": 0.8149, - "step": 43236 - }, - { - "epoch": 1.11, - "learning_rate": 1.4543011195331506e-06, - "loss": 0.7222, - "step": 43237 - }, - { - "epoch": 1.11, - "learning_rate": 1.4542764691855403e-06, - "loss": 0.5701, - "step": 43238 - }, - { - "epoch": 1.11, - "learning_rate": 1.454251818490111e-06, - "loss": 0.7832, - "step": 43239 - }, - { - "epoch": 1.11, - "learning_rate": 1.454227167446882e-06, - "loss": 0.3538, - "step": 43240 - }, - { - "epoch": 1.11, - "learning_rate": 1.4542025160558722e-06, - "loss": 0.6855, - "step": 43241 - }, - { - "epoch": 1.11, - "learning_rate": 1.4541778643171003e-06, - "loss": 0.7676, - "step": 43242 - }, - { - "epoch": 1.11, - "learning_rate": 1.4541532122305853e-06, - "loss": 0.7471, - "step": 43243 - }, - { - "epoch": 1.11, - "learning_rate": 1.4541285597963462e-06, - "loss": 0.7251, - "step": 43244 - }, - { - "epoch": 1.11, - "learning_rate": 1.4541039070144017e-06, - "loss": 0.6606, - "step": 43245 - }, - { - "epoch": 1.11, - "learning_rate": 1.4540792538847708e-06, - "loss": 0.5488, - "step": 43246 - }, - { - "epoch": 1.11, - "learning_rate": 1.454054600407472e-06, - "loss": 0.603, - "step": 43247 - }, - { - "epoch": 1.11, - "learning_rate": 1.4540299465825249e-06, - "loss": 0.623, - "step": 43248 - }, - { - "epoch": 1.11, - "learning_rate": 1.4540052924099475e-06, - "loss": 0.4971, - "step": 43249 - }, - { - "epoch": 1.11, - "learning_rate": 1.4539806378897595e-06, - "loss": 0.8608, - "step": 43250 - }, - { - "epoch": 1.11, - "learning_rate": 1.453955983021979e-06, - "loss": 0.6143, - "step": 43251 - }, - { - "epoch": 1.11, - "learning_rate": 1.4539313278066257e-06, - "loss": 0.6807, - "step": 43252 - }, - { - "epoch": 1.11, - "learning_rate": 1.4539066722437179e-06, - "loss": 0.6846, - "step": 43253 - }, - { - "epoch": 1.11, - "learning_rate": 1.4538820163332746e-06, - "loss": 0.5742, - "step": 43254 - }, - { - "epoch": 1.11, - "learning_rate": 1.4538573600753147e-06, - "loss": 0.6836, - "step": 43255 - }, - { - "epoch": 1.11, - "learning_rate": 1.453832703469857e-06, - "loss": 0.5028, - "step": 43256 - }, - { - "epoch": 1.11, - "learning_rate": 1.4538080465169206e-06, - "loss": 0.3142, - "step": 43257 - }, - { - "epoch": 1.11, - "learning_rate": 1.453783389216524e-06, - "loss": 0.6328, - "step": 43258 - }, - { - "epoch": 1.11, - "learning_rate": 1.4537587315686866e-06, - "loss": 0.5645, - "step": 43259 - }, - { - "epoch": 1.11, - "learning_rate": 1.4537340735734269e-06, - "loss": 0.6602, - "step": 43260 - }, - { - "epoch": 1.11, - "learning_rate": 1.4537094152307643e-06, - "loss": 0.5444, - "step": 43261 - }, - { - "epoch": 1.11, - "learning_rate": 1.4536847565407167e-06, - "loss": 0.7305, - "step": 43262 - }, - { - "epoch": 1.11, - "learning_rate": 1.4536600975033037e-06, - "loss": 0.5551, - "step": 43263 - }, - { - "epoch": 1.11, - "learning_rate": 1.453635438118544e-06, - "loss": 0.8408, - "step": 43264 - }, - { - "epoch": 1.11, - "learning_rate": 1.4536107783864565e-06, - "loss": 0.6982, - "step": 43265 - }, - { - "epoch": 1.11, - "learning_rate": 1.4535861183070604e-06, - "loss": 0.5776, - "step": 43266 - }, - { - "epoch": 1.11, - "learning_rate": 1.4535614578803739e-06, - "loss": 0.7129, - "step": 43267 - }, - { - "epoch": 1.11, - "learning_rate": 1.4535367971064162e-06, - "loss": 0.7339, - "step": 43268 - }, - { - "epoch": 1.11, - "learning_rate": 1.4535121359852065e-06, - "loss": 0.6294, - "step": 43269 - }, - { - "epoch": 1.11, - "learning_rate": 1.4534874745167632e-06, - "loss": 0.5767, - "step": 43270 - }, - { - "epoch": 1.11, - "learning_rate": 1.4534628127011056e-06, - "loss": 0.8213, - "step": 43271 - }, - { - "epoch": 1.11, - "learning_rate": 1.4534381505382522e-06, - "loss": 0.6562, - "step": 43272 - }, - { - "epoch": 1.11, - "learning_rate": 1.4534134880282222e-06, - "loss": 0.7168, - "step": 43273 - }, - { - "epoch": 1.11, - "learning_rate": 1.453388825171034e-06, - "loss": 0.7744, - "step": 43274 - }, - { - "epoch": 1.11, - "learning_rate": 1.453364161966707e-06, - "loss": 0.6836, - "step": 43275 - }, - { - "epoch": 1.11, - "learning_rate": 1.4533394984152603e-06, - "loss": 0.4434, - "step": 43276 - }, - { - "epoch": 1.11, - "learning_rate": 1.4533148345167119e-06, - "loss": 0.5762, - "step": 43277 - }, - { - "epoch": 1.11, - "learning_rate": 1.4532901702710815e-06, - "loss": 0.4429, - "step": 43278 - }, - { - "epoch": 1.11, - "learning_rate": 1.4532655056783877e-06, - "loss": 0.5566, - "step": 43279 - }, - { - "epoch": 1.11, - "learning_rate": 1.4532408407386492e-06, - "loss": 0.6465, - "step": 43280 - }, - { - "epoch": 1.11, - "learning_rate": 1.4532161754518847e-06, - "loss": 0.6465, - "step": 43281 - }, - { - "epoch": 1.11, - "learning_rate": 1.4531915098181137e-06, - "loss": 0.6758, - "step": 43282 - }, - { - "epoch": 1.11, - "learning_rate": 1.4531668438373548e-06, - "loss": 0.4976, - "step": 43283 - }, - { - "epoch": 1.11, - "learning_rate": 1.4531421775096268e-06, - "loss": 0.4596, - "step": 43284 - }, - { - "epoch": 1.11, - "learning_rate": 1.4531175108349489e-06, - "loss": 0.584, - "step": 43285 - }, - { - "epoch": 1.11, - "learning_rate": 1.4530928438133398e-06, - "loss": 0.7754, - "step": 43286 - }, - { - "epoch": 1.11, - "learning_rate": 1.4530681764448177e-06, - "loss": 0.4597, - "step": 43287 - }, - { - "epoch": 1.11, - "learning_rate": 1.453043508729403e-06, - "loss": 0.8428, - "step": 43288 - }, - { - "epoch": 1.11, - "learning_rate": 1.453018840667113e-06, - "loss": 0.6709, - "step": 43289 - }, - { - "epoch": 1.11, - "learning_rate": 1.4529941722579678e-06, - "loss": 0.4946, - "step": 43290 - }, - { - "epoch": 1.11, - "learning_rate": 1.4529695035019855e-06, - "loss": 0.6177, - "step": 43291 - }, - { - "epoch": 1.11, - "learning_rate": 1.4529448343991856e-06, - "loss": 0.5996, - "step": 43292 - }, - { - "epoch": 1.11, - "learning_rate": 1.4529201649495862e-06, - "loss": 0.6147, - "step": 43293 - }, - { - "epoch": 1.11, - "learning_rate": 1.452895495153207e-06, - "loss": 0.5522, - "step": 43294 - }, - { - "epoch": 1.11, - "learning_rate": 1.4528708250100666e-06, - "loss": 0.6899, - "step": 43295 - }, - { - "epoch": 1.11, - "learning_rate": 1.4528461545201833e-06, - "loss": 0.4421, - "step": 43296 - }, - { - "epoch": 1.11, - "learning_rate": 1.4528214836835772e-06, - "loss": 0.6377, - "step": 43297 - }, - { - "epoch": 1.11, - "learning_rate": 1.4527968125002663e-06, - "loss": 0.8203, - "step": 43298 - }, - { - "epoch": 1.11, - "learning_rate": 1.4527721409702693e-06, - "loss": 0.6318, - "step": 43299 - }, - { - "epoch": 1.11, - "learning_rate": 1.4527474690936058e-06, - "loss": 0.6309, - "step": 43300 - }, - { - "epoch": 1.11, - "learning_rate": 1.4527227968702946e-06, - "loss": 0.7427, - "step": 43301 - }, - { - "epoch": 1.11, - "learning_rate": 1.452698124300354e-06, - "loss": 0.6265, - "step": 43302 - }, - { - "epoch": 1.11, - "learning_rate": 1.4526734513838036e-06, - "loss": 0.4612, - "step": 43303 - }, - { - "epoch": 1.11, - "learning_rate": 1.4526487781206615e-06, - "loss": 0.6353, - "step": 43304 - }, - { - "epoch": 1.11, - "learning_rate": 1.4526241045109475e-06, - "loss": 0.8379, - "step": 43305 - }, - { - "epoch": 1.11, - "learning_rate": 1.4525994305546799e-06, - "loss": 0.7275, - "step": 43306 - }, - { - "epoch": 1.11, - "learning_rate": 1.4525747562518777e-06, - "loss": 0.5474, - "step": 43307 - }, - { - "epoch": 1.11, - "learning_rate": 1.4525500816025595e-06, - "loss": 0.7803, - "step": 43308 - }, - { - "epoch": 1.11, - "learning_rate": 1.4525254066067448e-06, - "loss": 0.6309, - "step": 43309 - }, - { - "epoch": 1.11, - "learning_rate": 1.4525007312644524e-06, - "loss": 0.6533, - "step": 43310 - }, - { - "epoch": 1.11, - "learning_rate": 1.452476055575701e-06, - "loss": 0.5112, - "step": 43311 - }, - { - "epoch": 1.11, - "learning_rate": 1.452451379540509e-06, - "loss": 0.834, - "step": 43312 - }, - { - "epoch": 1.11, - "learning_rate": 1.4524267031588962e-06, - "loss": 0.6592, - "step": 43313 - }, - { - "epoch": 1.11, - "learning_rate": 1.4524020264308808e-06, - "loss": 0.7012, - "step": 43314 - }, - { - "epoch": 1.11, - "learning_rate": 1.4523773493564824e-06, - "loss": 0.665, - "step": 43315 - }, - { - "epoch": 1.11, - "learning_rate": 1.452352671935719e-06, - "loss": 0.7871, - "step": 43316 - }, - { - "epoch": 1.11, - "learning_rate": 1.4523279941686103e-06, - "loss": 0.6274, - "step": 43317 - }, - { - "epoch": 1.11, - "learning_rate": 1.4523033160551745e-06, - "loss": 0.6475, - "step": 43318 - }, - { - "epoch": 1.11, - "learning_rate": 1.4522786375954313e-06, - "loss": 0.8066, - "step": 43319 - }, - { - "epoch": 1.11, - "learning_rate": 1.4522539587893986e-06, - "loss": 0.6162, - "step": 43320 - }, - { - "epoch": 1.11, - "learning_rate": 1.4522292796370963e-06, - "loss": 0.4448, - "step": 43321 - }, - { - "epoch": 1.11, - "learning_rate": 1.4522046001385426e-06, - "loss": 0.6885, - "step": 43322 - }, - { - "epoch": 1.11, - "learning_rate": 1.4521799202937566e-06, - "loss": 0.7354, - "step": 43323 - }, - { - "epoch": 1.11, - "learning_rate": 1.4521552401027575e-06, - "loss": 0.6709, - "step": 43324 - }, - { - "epoch": 1.11, - "learning_rate": 1.4521305595655637e-06, - "loss": 0.5547, - "step": 43325 - }, - { - "epoch": 1.11, - "learning_rate": 1.4521058786821944e-06, - "loss": 0.7305, - "step": 43326 - }, - { - "epoch": 1.11, - "learning_rate": 1.4520811974526683e-06, - "loss": 0.6826, - "step": 43327 - }, - { - "epoch": 1.11, - "learning_rate": 1.4520565158770045e-06, - "loss": 0.6152, - "step": 43328 - }, - { - "epoch": 1.11, - "learning_rate": 1.4520318339552217e-06, - "loss": 0.6523, - "step": 43329 - }, - { - "epoch": 1.11, - "learning_rate": 1.4520071516873393e-06, - "loss": 0.9326, - "step": 43330 - }, - { - "epoch": 1.11, - "learning_rate": 1.4519824690733756e-06, - "loss": 0.6494, - "step": 43331 - }, - { - "epoch": 1.11, - "learning_rate": 1.4519577861133495e-06, - "loss": 0.5127, - "step": 43332 - }, - { - "epoch": 1.11, - "learning_rate": 1.45193310280728e-06, - "loss": 0.6572, - "step": 43333 - }, - { - "epoch": 1.11, - "learning_rate": 1.4519084191551866e-06, - "loss": 0.7256, - "step": 43334 - }, - { - "epoch": 1.11, - "learning_rate": 1.4518837351570873e-06, - "loss": 0.8135, - "step": 43335 - }, - { - "epoch": 1.11, - "learning_rate": 1.4518590508130018e-06, - "loss": 0.8115, - "step": 43336 - }, - { - "epoch": 1.11, - "learning_rate": 1.4518343661229483e-06, - "loss": 0.6084, - "step": 43337 - }, - { - "epoch": 1.11, - "learning_rate": 1.4518096810869461e-06, - "loss": 0.8896, - "step": 43338 - }, - { - "epoch": 1.11, - "learning_rate": 1.4517849957050136e-06, - "loss": 0.707, - "step": 43339 - }, - { - "epoch": 1.11, - "learning_rate": 1.4517603099771706e-06, - "loss": 0.7549, - "step": 43340 - }, - { - "epoch": 1.11, - "learning_rate": 1.4517356239034356e-06, - "loss": 0.6204, - "step": 43341 - }, - { - "epoch": 1.11, - "learning_rate": 1.4517109374838273e-06, - "loss": 0.7012, - "step": 43342 - }, - { - "epoch": 1.11, - "learning_rate": 1.4516862507183643e-06, - "loss": 0.6045, - "step": 43343 - }, - { - "epoch": 1.11, - "learning_rate": 1.4516615636070662e-06, - "loss": 0.6577, - "step": 43344 - }, - { - "epoch": 1.11, - "learning_rate": 1.4516368761499517e-06, - "loss": 0.6348, - "step": 43345 - }, - { - "epoch": 1.11, - "learning_rate": 1.4516121883470393e-06, - "loss": 0.48, - "step": 43346 - }, - { - "epoch": 1.11, - "learning_rate": 1.4515875001983484e-06, - "loss": 0.6934, - "step": 43347 - }, - { - "epoch": 1.11, - "learning_rate": 1.4515628117038976e-06, - "loss": 0.5889, - "step": 43348 - }, - { - "epoch": 1.11, - "learning_rate": 1.451538122863706e-06, - "loss": 0.752, - "step": 43349 - }, - { - "epoch": 1.11, - "learning_rate": 1.4515134336777925e-06, - "loss": 0.6475, - "step": 43350 - }, - { - "epoch": 1.11, - "learning_rate": 1.4514887441461761e-06, - "loss": 0.6201, - "step": 43351 - }, - { - "epoch": 1.11, - "learning_rate": 1.4514640542688752e-06, - "loss": 0.6772, - "step": 43352 - }, - { - "epoch": 1.11, - "learning_rate": 1.4514393640459092e-06, - "loss": 0.564, - "step": 43353 - }, - { - "epoch": 1.11, - "learning_rate": 1.4514146734772967e-06, - "loss": 0.4103, - "step": 43354 - }, - { - "epoch": 1.11, - "learning_rate": 1.4513899825630572e-06, - "loss": 0.5125, - "step": 43355 - }, - { - "epoch": 1.11, - "learning_rate": 1.4513652913032085e-06, - "loss": 0.6445, - "step": 43356 - }, - { - "epoch": 1.11, - "learning_rate": 1.4513405996977705e-06, - "loss": 0.5894, - "step": 43357 - }, - { - "epoch": 1.11, - "learning_rate": 1.4513159077467616e-06, - "loss": 0.5415, - "step": 43358 - }, - { - "epoch": 1.11, - "learning_rate": 1.451291215450201e-06, - "loss": 0.6855, - "step": 43359 - }, - { - "epoch": 1.11, - "learning_rate": 1.4512665228081074e-06, - "loss": 0.561, - "step": 43360 - }, - { - "epoch": 1.11, - "learning_rate": 1.4512418298204998e-06, - "loss": 0.7285, - "step": 43361 - }, - { - "epoch": 1.11, - "learning_rate": 1.451217136487397e-06, - "loss": 0.6841, - "step": 43362 - }, - { - "epoch": 1.11, - "learning_rate": 1.4511924428088183e-06, - "loss": 0.6982, - "step": 43363 - }, - { - "epoch": 1.11, - "learning_rate": 1.4511677487847818e-06, - "loss": 0.6279, - "step": 43364 - }, - { - "epoch": 1.11, - "learning_rate": 1.4511430544153071e-06, - "loss": 0.7139, - "step": 43365 - }, - { - "epoch": 1.11, - "learning_rate": 1.451118359700413e-06, - "loss": 0.4182, - "step": 43366 - }, - { - "epoch": 1.11, - "learning_rate": 1.4510936646401181e-06, - "loss": 0.5615, - "step": 43367 - }, - { - "epoch": 1.11, - "learning_rate": 1.4510689692344417e-06, - "loss": 0.6211, - "step": 43368 - }, - { - "epoch": 1.11, - "learning_rate": 1.4510442734834027e-06, - "loss": 0.488, - "step": 43369 - }, - { - "epoch": 1.11, - "learning_rate": 1.4510195773870197e-06, - "loss": 0.6943, - "step": 43370 - }, - { - "epoch": 1.11, - "learning_rate": 1.4509948809453117e-06, - "loss": 0.6865, - "step": 43371 - }, - { - "epoch": 1.11, - "learning_rate": 1.4509701841582978e-06, - "loss": 0.7734, - "step": 43372 - }, - { - "epoch": 1.11, - "learning_rate": 1.4509454870259964e-06, - "loss": 0.5435, - "step": 43373 - }, - { - "epoch": 1.11, - "learning_rate": 1.450920789548427e-06, - "loss": 0.4783, - "step": 43374 - }, - { - "epoch": 1.11, - "learning_rate": 1.4508960917256083e-06, - "loss": 0.7017, - "step": 43375 - }, - { - "epoch": 1.11, - "learning_rate": 1.450871393557559e-06, - "loss": 0.7036, - "step": 43376 - }, - { - "epoch": 1.11, - "learning_rate": 1.4508466950442986e-06, - "loss": 0.668, - "step": 43377 - }, - { - "epoch": 1.11, - "learning_rate": 1.4508219961858455e-06, - "loss": 0.5732, - "step": 43378 - }, - { - "epoch": 1.11, - "learning_rate": 1.4507972969822184e-06, - "loss": 0.665, - "step": 43379 - }, - { - "epoch": 1.11, - "learning_rate": 1.450772597433437e-06, - "loss": 0.8369, - "step": 43380 - }, - { - "epoch": 1.11, - "learning_rate": 1.4507478975395193e-06, - "loss": 0.6123, - "step": 43381 - }, - { - "epoch": 1.11, - "learning_rate": 1.4507231973004853e-06, - "loss": 0.6523, - "step": 43382 - }, - { - "epoch": 1.11, - "learning_rate": 1.4506984967163525e-06, - "loss": 0.5049, - "step": 43383 - }, - { - "epoch": 1.11, - "learning_rate": 1.450673795787141e-06, - "loss": 0.668, - "step": 43384 - }, - { - "epoch": 1.11, - "learning_rate": 1.4506490945128693e-06, - "loss": 0.4988, - "step": 43385 - }, - { - "epoch": 1.11, - "learning_rate": 1.4506243928935561e-06, - "loss": 0.7881, - "step": 43386 - }, - { - "epoch": 1.11, - "learning_rate": 1.4505996909292208e-06, - "loss": 0.5918, - "step": 43387 - }, - { - "epoch": 1.11, - "learning_rate": 1.4505749886198818e-06, - "loss": 0.7256, - "step": 43388 - }, - { - "epoch": 1.11, - "learning_rate": 1.4505502859655584e-06, - "loss": 0.5239, - "step": 43389 - }, - { - "epoch": 1.11, - "learning_rate": 1.4505255829662693e-06, - "loss": 0.4097, - "step": 43390 - }, - { - "epoch": 1.11, - "learning_rate": 1.4505008796220335e-06, - "loss": 0.5283, - "step": 43391 - }, - { - "epoch": 1.11, - "learning_rate": 1.4504761759328698e-06, - "loss": 0.6973, - "step": 43392 - }, - { - "epoch": 1.11, - "learning_rate": 1.4504514718987974e-06, - "loss": 0.7949, - "step": 43393 - }, - { - "epoch": 1.11, - "learning_rate": 1.4504267675198346e-06, - "loss": 0.6406, - "step": 43394 - }, - { - "epoch": 1.11, - "learning_rate": 1.4504020627960013e-06, - "loss": 0.563, - "step": 43395 - }, - { - "epoch": 1.11, - "learning_rate": 1.4503773577273155e-06, - "loss": 0.6934, - "step": 43396 - }, - { - "epoch": 1.11, - "learning_rate": 1.4503526523137968e-06, - "loss": 0.6326, - "step": 43397 - }, - { - "epoch": 1.11, - "learning_rate": 1.4503279465554635e-06, - "loss": 0.5283, - "step": 43398 - }, - { - "epoch": 1.11, - "learning_rate": 1.4503032404523347e-06, - "loss": 0.791, - "step": 43399 - }, - { - "epoch": 1.11, - "learning_rate": 1.4502785340044297e-06, - "loss": 0.6326, - "step": 43400 - }, - { - "epoch": 1.11, - "learning_rate": 1.450253827211767e-06, - "loss": 0.4858, - "step": 43401 - }, - { - "epoch": 1.11, - "learning_rate": 1.4502291200743655e-06, - "loss": 0.7495, - "step": 43402 - }, - { - "epoch": 1.11, - "learning_rate": 1.4502044125922446e-06, - "loss": 0.4309, - "step": 43403 - }, - { - "epoch": 1.11, - "learning_rate": 1.4501797047654223e-06, - "loss": 0.7988, - "step": 43404 - }, - { - "epoch": 1.11, - "learning_rate": 1.4501549965939189e-06, - "loss": 0.645, - "step": 43405 - }, - { - "epoch": 1.11, - "learning_rate": 1.450130288077752e-06, - "loss": 0.4819, - "step": 43406 - }, - { - "epoch": 1.11, - "learning_rate": 1.4501055792169411e-06, - "loss": 0.5322, - "step": 43407 - }, - { - "epoch": 1.11, - "learning_rate": 1.450080870011505e-06, - "loss": 0.5029, - "step": 43408 - }, - { - "epoch": 1.11, - "learning_rate": 1.4500561604614628e-06, - "loss": 0.7432, - "step": 43409 - }, - { - "epoch": 1.11, - "learning_rate": 1.4500314505668332e-06, - "loss": 0.6709, - "step": 43410 - }, - { - "epoch": 1.11, - "learning_rate": 1.4500067403276353e-06, - "loss": 0.5615, - "step": 43411 - }, - { - "epoch": 1.11, - "learning_rate": 1.4499820297438879e-06, - "loss": 0.6313, - "step": 43412 - }, - { - "epoch": 1.11, - "learning_rate": 1.4499573188156098e-06, - "loss": 0.6172, - "step": 43413 - }, - { - "epoch": 1.11, - "learning_rate": 1.44993260754282e-06, - "loss": 0.6216, - "step": 43414 - }, - { - "epoch": 1.11, - "learning_rate": 1.449907895925538e-06, - "loss": 0.6006, - "step": 43415 - }, - { - "epoch": 1.11, - "learning_rate": 1.449883183963782e-06, - "loss": 0.6299, - "step": 43416 - }, - { - "epoch": 1.11, - "learning_rate": 1.449858471657571e-06, - "loss": 0.5493, - "step": 43417 - }, - { - "epoch": 1.11, - "learning_rate": 1.4498337590069241e-06, - "loss": 0.6494, - "step": 43418 - }, - { - "epoch": 1.11, - "learning_rate": 1.4498090460118602e-06, - "loss": 0.835, - "step": 43419 - }, - { - "epoch": 1.11, - "learning_rate": 1.4497843326723983e-06, - "loss": 0.6909, - "step": 43420 - }, - { - "epoch": 1.11, - "learning_rate": 1.449759618988557e-06, - "loss": 0.8105, - "step": 43421 - }, - { - "epoch": 1.11, - "learning_rate": 1.4497349049603556e-06, - "loss": 0.8662, - "step": 43422 - }, - { - "epoch": 1.11, - "learning_rate": 1.4497101905878127e-06, - "loss": 0.7393, - "step": 43423 - }, - { - "epoch": 1.11, - "learning_rate": 1.4496854758709477e-06, - "loss": 0.6147, - "step": 43424 - }, - { - "epoch": 1.11, - "learning_rate": 1.4496607608097788e-06, - "loss": 0.4421, - "step": 43425 - }, - { - "epoch": 1.11, - "learning_rate": 1.4496360454043255e-06, - "loss": 0.6807, - "step": 43426 - }, - { - "epoch": 1.11, - "learning_rate": 1.4496113296546067e-06, - "loss": 0.6689, - "step": 43427 - }, - { - "epoch": 1.11, - "learning_rate": 1.4495866135606408e-06, - "loss": 0.7148, - "step": 43428 - }, - { - "epoch": 1.11, - "learning_rate": 1.4495618971224475e-06, - "loss": 0.6709, - "step": 43429 - }, - { - "epoch": 1.11, - "learning_rate": 1.4495371803400452e-06, - "loss": 0.5698, - "step": 43430 - }, - { - "epoch": 1.11, - "learning_rate": 1.449512463213453e-06, - "loss": 0.5945, - "step": 43431 - }, - { - "epoch": 1.11, - "learning_rate": 1.4494877457426897e-06, - "loss": 0.4497, - "step": 43432 - }, - { - "epoch": 1.11, - "learning_rate": 1.4494630279277741e-06, - "loss": 0.6753, - "step": 43433 - }, - { - "epoch": 1.11, - "learning_rate": 1.4494383097687258e-06, - "loss": 0.7441, - "step": 43434 - }, - { - "epoch": 1.11, - "learning_rate": 1.449413591265563e-06, - "loss": 0.8945, - "step": 43435 - }, - { - "epoch": 1.11, - "learning_rate": 1.4493888724183046e-06, - "loss": 0.6406, - "step": 43436 - }, - { - "epoch": 1.11, - "learning_rate": 1.4493641532269702e-06, - "loss": 0.7051, - "step": 43437 - }, - { - "epoch": 1.11, - "learning_rate": 1.449339433691578e-06, - "loss": 0.6104, - "step": 43438 - }, - { - "epoch": 1.11, - "learning_rate": 1.4493147138121476e-06, - "loss": 0.5122, - "step": 43439 - }, - { - "epoch": 1.11, - "learning_rate": 1.4492899935886975e-06, - "loss": 0.4868, - "step": 43440 - }, - { - "epoch": 1.11, - "learning_rate": 1.4492652730212467e-06, - "loss": 0.626, - "step": 43441 - }, - { - "epoch": 1.11, - "learning_rate": 1.449240552109814e-06, - "loss": 0.5557, - "step": 43442 - }, - { - "epoch": 1.11, - "learning_rate": 1.4492158308544187e-06, - "loss": 0.6353, - "step": 43443 - }, - { - "epoch": 1.11, - "learning_rate": 1.449191109255079e-06, - "loss": 0.6633, - "step": 43444 - }, - { - "epoch": 1.11, - "learning_rate": 1.449166387311815e-06, - "loss": 0.5557, - "step": 43445 - }, - { - "epoch": 1.11, - "learning_rate": 1.4491416650246447e-06, - "loss": 0.4902, - "step": 43446 - }, - { - "epoch": 1.11, - "learning_rate": 1.4491169423935873e-06, - "loss": 0.6797, - "step": 43447 - }, - { - "epoch": 1.11, - "learning_rate": 1.4490922194186611e-06, - "loss": 0.7559, - "step": 43448 - }, - { - "epoch": 1.11, - "learning_rate": 1.4490674960998864e-06, - "loss": 0.6323, - "step": 43449 - }, - { - "epoch": 1.11, - "learning_rate": 1.4490427724372811e-06, - "loss": 0.6729, - "step": 43450 - }, - { - "epoch": 1.11, - "learning_rate": 1.4490180484308645e-06, - "loss": 0.7188, - "step": 43451 - }, - { - "epoch": 1.11, - "learning_rate": 1.4489933240806553e-06, - "loss": 0.6616, - "step": 43452 - }, - { - "epoch": 1.11, - "learning_rate": 1.4489685993866728e-06, - "loss": 0.6445, - "step": 43453 - }, - { - "epoch": 1.11, - "learning_rate": 1.4489438743489354e-06, - "loss": 0.6865, - "step": 43454 - }, - { - "epoch": 1.11, - "learning_rate": 1.4489191489674624e-06, - "loss": 0.6572, - "step": 43455 - }, - { - "epoch": 1.11, - "learning_rate": 1.4488944232422726e-06, - "loss": 0.3762, - "step": 43456 - }, - { - "epoch": 1.11, - "learning_rate": 1.448869697173385e-06, - "loss": 0.7476, - "step": 43457 - }, - { - "epoch": 1.11, - "learning_rate": 1.4488449707608186e-06, - "loss": 0.7705, - "step": 43458 - }, - { - "epoch": 1.11, - "learning_rate": 1.448820244004592e-06, - "loss": 0.7217, - "step": 43459 - }, - { - "epoch": 1.11, - "learning_rate": 1.4487955169047248e-06, - "loss": 0.7734, - "step": 43460 - }, - { - "epoch": 1.11, - "learning_rate": 1.448770789461235e-06, - "loss": 0.644, - "step": 43461 - }, - { - "epoch": 1.11, - "learning_rate": 1.4487460616741424e-06, - "loss": 0.542, - "step": 43462 - }, - { - "epoch": 1.11, - "learning_rate": 1.4487213335434654e-06, - "loss": 0.6729, - "step": 43463 - }, - { - "epoch": 1.11, - "learning_rate": 1.4486966050692234e-06, - "loss": 0.6228, - "step": 43464 - }, - { - "epoch": 1.11, - "learning_rate": 1.4486718762514348e-06, - "loss": 0.75, - "step": 43465 - }, - { - "epoch": 1.11, - "learning_rate": 1.448647147090119e-06, - "loss": 0.5933, - "step": 43466 - }, - { - "epoch": 1.11, - "learning_rate": 1.4486224175852941e-06, - "loss": 0.7422, - "step": 43467 - }, - { - "epoch": 1.11, - "learning_rate": 1.4485976877369802e-06, - "loss": 0.7227, - "step": 43468 - }, - { - "epoch": 1.11, - "learning_rate": 1.4485729575451955e-06, - "loss": 0.562, - "step": 43469 - }, - { - "epoch": 1.11, - "learning_rate": 1.4485482270099593e-06, - "loss": 0.7861, - "step": 43470 - }, - { - "epoch": 1.11, - "learning_rate": 1.4485234961312902e-06, - "loss": 0.7056, - "step": 43471 - }, - { - "epoch": 1.11, - "learning_rate": 1.4484987649092072e-06, - "loss": 0.561, - "step": 43472 - }, - { - "epoch": 1.11, - "learning_rate": 1.4484740333437295e-06, - "loss": 0.7715, - "step": 43473 - }, - { - "epoch": 1.11, - "learning_rate": 1.4484493014348758e-06, - "loss": 0.6997, - "step": 43474 - }, - { - "epoch": 1.11, - "learning_rate": 1.448424569182665e-06, - "loss": 0.5601, - "step": 43475 - }, - { - "epoch": 1.11, - "learning_rate": 1.4483998365871162e-06, - "loss": 0.6611, - "step": 43476 - }, - { - "epoch": 1.11, - "learning_rate": 1.448375103648248e-06, - "loss": 0.7051, - "step": 43477 - }, - { - "epoch": 1.11, - "learning_rate": 1.44835037036608e-06, - "loss": 0.6997, - "step": 43478 - }, - { - "epoch": 1.11, - "learning_rate": 1.4483256367406304e-06, - "loss": 0.6504, - "step": 43479 - }, - { - "epoch": 1.11, - "learning_rate": 1.4483009027719188e-06, - "loss": 0.605, - "step": 43480 - }, - { - "epoch": 1.11, - "learning_rate": 1.4482761684599638e-06, - "loss": 0.668, - "step": 43481 - }, - { - "epoch": 1.11, - "learning_rate": 1.448251433804784e-06, - "loss": 0.5635, - "step": 43482 - }, - { - "epoch": 1.11, - "learning_rate": 1.448226698806399e-06, - "loss": 0.7461, - "step": 43483 - }, - { - "epoch": 1.11, - "learning_rate": 1.4482019634648273e-06, - "loss": 0.5959, - "step": 43484 - }, - { - "epoch": 1.11, - "learning_rate": 1.4481772277800882e-06, - "loss": 0.75, - "step": 43485 - }, - { - "epoch": 1.11, - "learning_rate": 1.4481524917522e-06, - "loss": 0.624, - "step": 43486 - }, - { - "epoch": 1.11, - "learning_rate": 1.4481277553811823e-06, - "loss": 0.5664, - "step": 43487 - }, - { - "epoch": 1.11, - "learning_rate": 1.4481030186670536e-06, - "loss": 0.6787, - "step": 43488 - }, - { - "epoch": 1.11, - "learning_rate": 1.448078281609833e-06, - "loss": 0.6401, - "step": 43489 - }, - { - "epoch": 1.11, - "learning_rate": 1.4480535442095398e-06, - "loss": 0.458, - "step": 43490 - }, - { - "epoch": 1.11, - "learning_rate": 1.4480288064661926e-06, - "loss": 0.4121, - "step": 43491 - }, - { - "epoch": 1.11, - "learning_rate": 1.44800406837981e-06, - "loss": 0.5654, - "step": 43492 - }, - { - "epoch": 1.11, - "learning_rate": 1.4479793299504114e-06, - "loss": 0.6475, - "step": 43493 - }, - { - "epoch": 1.11, - "learning_rate": 1.4479545911780155e-06, - "loss": 0.6006, - "step": 43494 - }, - { - "epoch": 1.11, - "learning_rate": 1.447929852062642e-06, - "loss": 0.7861, - "step": 43495 - }, - { - "epoch": 1.11, - "learning_rate": 1.4479051126043085e-06, - "loss": 0.6982, - "step": 43496 - }, - { - "epoch": 1.11, - "learning_rate": 1.4478803728030352e-06, - "loss": 0.6494, - "step": 43497 - }, - { - "epoch": 1.11, - "learning_rate": 1.4478556326588397e-06, - "loss": 0.7617, - "step": 43498 - }, - { - "epoch": 1.11, - "learning_rate": 1.4478308921717425e-06, - "loss": 0.4883, - "step": 43499 - }, - { - "epoch": 1.11, - "learning_rate": 1.4478061513417614e-06, - "loss": 0.6582, - "step": 43500 - }, - { - "epoch": 1.11, - "learning_rate": 1.4477814101689156e-06, - "loss": 0.5845, - "step": 43501 - }, - { - "epoch": 1.11, - "learning_rate": 1.4477566686532245e-06, - "loss": 0.563, - "step": 43502 - }, - { - "epoch": 1.12, - "learning_rate": 1.4477319267947065e-06, - "loss": 0.6445, - "step": 43503 - }, - { - "epoch": 1.12, - "learning_rate": 1.447707184593381e-06, - "loss": 0.5485, - "step": 43504 - }, - { - "epoch": 1.12, - "learning_rate": 1.4476824420492666e-06, - "loss": 0.4941, - "step": 43505 - }, - { - "epoch": 1.12, - "learning_rate": 1.4476576991623822e-06, - "loss": 0.6069, - "step": 43506 - }, - { - "epoch": 1.12, - "learning_rate": 1.4476329559327469e-06, - "loss": 0.6885, - "step": 43507 - }, - { - "epoch": 1.12, - "learning_rate": 1.4476082123603798e-06, - "loss": 0.5491, - "step": 43508 - }, - { - "epoch": 1.12, - "learning_rate": 1.4475834684452995e-06, - "loss": 0.7739, - "step": 43509 - }, - { - "epoch": 1.12, - "learning_rate": 1.4475587241875254e-06, - "loss": 0.5957, - "step": 43510 - }, - { - "epoch": 1.12, - "learning_rate": 1.4475339795870758e-06, - "loss": 0.6938, - "step": 43511 - }, - { - "epoch": 1.12, - "learning_rate": 1.44750923464397e-06, - "loss": 0.5322, - "step": 43512 - }, - { - "epoch": 1.12, - "learning_rate": 1.4474844893582272e-06, - "loss": 0.4863, - "step": 43513 - }, - { - "epoch": 1.12, - "learning_rate": 1.447459743729866e-06, - "loss": 0.7295, - "step": 43514 - }, - { - "epoch": 1.12, - "learning_rate": 1.4474349977589056e-06, - "loss": 0.7695, - "step": 43515 - }, - { - "epoch": 1.12, - "learning_rate": 1.4474102514453645e-06, - "loss": 0.6938, - "step": 43516 - }, - { - "epoch": 1.12, - "learning_rate": 1.447385504789262e-06, - "loss": 0.7627, - "step": 43517 - }, - { - "epoch": 1.12, - "learning_rate": 1.4473607577906173e-06, - "loss": 0.6431, - "step": 43518 - }, - { - "epoch": 1.12, - "learning_rate": 1.4473360104494487e-06, - "loss": 0.6543, - "step": 43519 - }, - { - "epoch": 1.12, - "learning_rate": 1.4473112627657757e-06, - "loss": 0.6904, - "step": 43520 - }, - { - "epoch": 1.12, - "learning_rate": 1.447286514739617e-06, - "loss": 0.6924, - "step": 43521 - }, - { - "epoch": 1.12, - "learning_rate": 1.4472617663709916e-06, - "loss": 0.3418, - "step": 43522 - }, - { - "epoch": 1.12, - "learning_rate": 1.4472370176599183e-06, - "loss": 0.6885, - "step": 43523 - }, - { - "epoch": 1.12, - "learning_rate": 1.447212268606416e-06, - "loss": 0.5415, - "step": 43524 - }, - { - "epoch": 1.12, - "learning_rate": 1.4471875192105042e-06, - "loss": 0.5796, - "step": 43525 - }, - { - "epoch": 1.12, - "learning_rate": 1.4471627694722012e-06, - "loss": 0.6655, - "step": 43526 - }, - { - "epoch": 1.12, - "learning_rate": 1.4471380193915266e-06, - "loss": 0.7383, - "step": 43527 - }, - { - "epoch": 1.12, - "learning_rate": 1.4471132689684987e-06, - "loss": 0.6279, - "step": 43528 - }, - { - "epoch": 1.12, - "learning_rate": 1.4470885182031367e-06, - "loss": 0.6021, - "step": 43529 - }, - { - "epoch": 1.12, - "learning_rate": 1.4470637670954598e-06, - "loss": 0.5139, - "step": 43530 - }, - { - "epoch": 1.12, - "learning_rate": 1.4470390156454866e-06, - "loss": 0.6504, - "step": 43531 - }, - { - "epoch": 1.12, - "learning_rate": 1.447014263853236e-06, - "loss": 0.5454, - "step": 43532 - }, - { - "epoch": 1.12, - "learning_rate": 1.4469895117187274e-06, - "loss": 0.8311, - "step": 43533 - }, - { - "epoch": 1.12, - "learning_rate": 1.4469647592419794e-06, - "loss": 0.707, - "step": 43534 - }, - { - "epoch": 1.12, - "learning_rate": 1.4469400064230111e-06, - "loss": 0.7612, - "step": 43535 - }, - { - "epoch": 1.12, - "learning_rate": 1.4469152532618414e-06, - "loss": 0.7559, - "step": 43536 - }, - { - "epoch": 1.12, - "learning_rate": 1.446890499758489e-06, - "loss": 0.6147, - "step": 43537 - }, - { - "epoch": 1.12, - "learning_rate": 1.4468657459129732e-06, - "loss": 0.6543, - "step": 43538 - }, - { - "epoch": 1.12, - "learning_rate": 1.4468409917253128e-06, - "loss": 0.5835, - "step": 43539 - }, - { - "epoch": 1.12, - "learning_rate": 1.446816237195527e-06, - "loss": 0.7617, - "step": 43540 - }, - { - "epoch": 1.12, - "learning_rate": 1.4467914823236346e-06, - "loss": 0.7295, - "step": 43541 - }, - { - "epoch": 1.12, - "learning_rate": 1.446766727109654e-06, - "loss": 0.5854, - "step": 43542 - }, - { - "epoch": 1.12, - "learning_rate": 1.4467419715536054e-06, - "loss": 0.5977, - "step": 43543 - }, - { - "epoch": 1.12, - "learning_rate": 1.4467172156555062e-06, - "loss": 0.322, - "step": 43544 - }, - { - "epoch": 1.12, - "learning_rate": 1.4466924594153768e-06, - "loss": 0.7471, - "step": 43545 - }, - { - "epoch": 1.12, - "learning_rate": 1.4466677028332354e-06, - "loss": 0.8486, - "step": 43546 - }, - { - "epoch": 1.12, - "learning_rate": 1.446642945909101e-06, - "loss": 0.7031, - "step": 43547 - }, - { - "epoch": 1.12, - "learning_rate": 1.4466181886429926e-06, - "loss": 0.7334, - "step": 43548 - }, - { - "epoch": 1.12, - "learning_rate": 1.446593431034929e-06, - "loss": 0.6621, - "step": 43549 - }, - { - "epoch": 1.12, - "learning_rate": 1.4465686730849301e-06, - "loss": 0.749, - "step": 43550 - }, - { - "epoch": 1.12, - "learning_rate": 1.446543914793013e-06, - "loss": 0.625, - "step": 43551 - }, - { - "epoch": 1.12, - "learning_rate": 1.4465191561591986e-06, - "loss": 0.5874, - "step": 43552 - }, - { - "epoch": 1.12, - "learning_rate": 1.4464943971835045e-06, - "loss": 0.488, - "step": 43553 - }, - { - "epoch": 1.12, - "learning_rate": 1.4464696378659507e-06, - "loss": 0.7305, - "step": 43554 - }, - { - "epoch": 1.12, - "learning_rate": 1.4464448782065553e-06, - "loss": 0.667, - "step": 43555 - }, - { - "epoch": 1.12, - "learning_rate": 1.4464201182053377e-06, - "loss": 0.7646, - "step": 43556 - }, - { - "epoch": 1.12, - "learning_rate": 1.4463953578623164e-06, - "loss": 0.5659, - "step": 43557 - }, - { - "epoch": 1.12, - "learning_rate": 1.446370597177511e-06, - "loss": 0.583, - "step": 43558 - }, - { - "epoch": 1.12, - "learning_rate": 1.44634583615094e-06, - "loss": 0.583, - "step": 43559 - }, - { - "epoch": 1.12, - "learning_rate": 1.446321074782623e-06, - "loss": 0.707, - "step": 43560 - }, - { - "epoch": 1.12, - "learning_rate": 1.4462963130725781e-06, - "loss": 0.6138, - "step": 43561 - }, - { - "epoch": 1.12, - "learning_rate": 1.4462715510208246e-06, - "loss": 0.6196, - "step": 43562 - }, - { - "epoch": 1.12, - "learning_rate": 1.4462467886273815e-06, - "loss": 0.6191, - "step": 43563 - }, - { - "epoch": 1.12, - "learning_rate": 1.4462220258922677e-06, - "loss": 0.5869, - "step": 43564 - }, - { - "epoch": 1.12, - "learning_rate": 1.4461972628155024e-06, - "loss": 0.5791, - "step": 43565 - }, - { - "epoch": 1.12, - "learning_rate": 1.446172499397104e-06, - "loss": 0.5874, - "step": 43566 - }, - { - "epoch": 1.12, - "learning_rate": 1.4461477356370923e-06, - "loss": 0.6841, - "step": 43567 - }, - { - "epoch": 1.12, - "learning_rate": 1.4461229715354858e-06, - "loss": 0.834, - "step": 43568 - }, - { - "epoch": 1.12, - "learning_rate": 1.4460982070923028e-06, - "loss": 0.6001, - "step": 43569 - }, - { - "epoch": 1.12, - "learning_rate": 1.4460734423075636e-06, - "loss": 0.6128, - "step": 43570 - }, - { - "epoch": 1.12, - "learning_rate": 1.4460486771812863e-06, - "loss": 0.748, - "step": 43571 - }, - { - "epoch": 1.12, - "learning_rate": 1.4460239117134898e-06, - "loss": 0.7891, - "step": 43572 - }, - { - "epoch": 1.12, - "learning_rate": 1.4459991459041937e-06, - "loss": 0.8091, - "step": 43573 - }, - { - "epoch": 1.12, - "learning_rate": 1.4459743797534162e-06, - "loss": 0.5488, - "step": 43574 - }, - { - "epoch": 1.12, - "learning_rate": 1.445949613261177e-06, - "loss": 0.5884, - "step": 43575 - }, - { - "epoch": 1.12, - "learning_rate": 1.4459248464274943e-06, - "loss": 0.7002, - "step": 43576 - }, - { - "epoch": 1.12, - "learning_rate": 1.4459000792523876e-06, - "loss": 0.709, - "step": 43577 - }, - { - "epoch": 1.12, - "learning_rate": 1.4458753117358757e-06, - "loss": 0.5532, - "step": 43578 - }, - { - "epoch": 1.12, - "learning_rate": 1.4458505438779779e-06, - "loss": 0.8389, - "step": 43579 - }, - { - "epoch": 1.12, - "learning_rate": 1.4458257756787125e-06, - "loss": 0.6206, - "step": 43580 - }, - { - "epoch": 1.12, - "learning_rate": 1.445801007138099e-06, - "loss": 0.7861, - "step": 43581 - }, - { - "epoch": 1.12, - "learning_rate": 1.4457762382561557e-06, - "loss": 0.7812, - "step": 43582 - }, - { - "epoch": 1.12, - "learning_rate": 1.4457514690329022e-06, - "loss": 0.5543, - "step": 43583 - }, - { - "epoch": 1.12, - "learning_rate": 1.4457266994683575e-06, - "loss": 0.6426, - "step": 43584 - }, - { - "epoch": 1.12, - "learning_rate": 1.4457019295625403e-06, - "loss": 0.5845, - "step": 43585 - }, - { - "epoch": 1.12, - "learning_rate": 1.4456771593154696e-06, - "loss": 0.7422, - "step": 43586 - }, - { - "epoch": 1.12, - "learning_rate": 1.4456523887271645e-06, - "loss": 0.748, - "step": 43587 - }, - { - "epoch": 1.12, - "learning_rate": 1.4456276177976436e-06, - "loss": 0.6665, - "step": 43588 - }, - { - "epoch": 1.12, - "learning_rate": 1.4456028465269264e-06, - "loss": 0.5874, - "step": 43589 - }, - { - "epoch": 1.12, - "learning_rate": 1.4455780749150315e-06, - "loss": 0.6079, - "step": 43590 - }, - { - "epoch": 1.12, - "learning_rate": 1.445553302961978e-06, - "loss": 0.8584, - "step": 43591 - }, - { - "epoch": 1.12, - "learning_rate": 1.4455285306677846e-06, - "loss": 0.6221, - "step": 43592 - }, - { - "epoch": 1.12, - "learning_rate": 1.4455037580324704e-06, - "loss": 0.7627, - "step": 43593 - }, - { - "epoch": 1.12, - "learning_rate": 1.4454789850560552e-06, - "loss": 0.5264, - "step": 43594 - }, - { - "epoch": 1.12, - "learning_rate": 1.4454542117385566e-06, - "loss": 0.6729, - "step": 43595 - }, - { - "epoch": 1.12, - "learning_rate": 1.4454294380799942e-06, - "loss": 0.7354, - "step": 43596 - }, - { - "epoch": 1.12, - "learning_rate": 1.445404664080387e-06, - "loss": 0.6333, - "step": 43597 - }, - { - "epoch": 1.12, - "learning_rate": 1.4453798897397543e-06, - "loss": 0.6953, - "step": 43598 - }, - { - "epoch": 1.12, - "learning_rate": 1.4453551150581142e-06, - "loss": 0.667, - "step": 43599 - }, - { - "epoch": 1.12, - "learning_rate": 1.4453303400354866e-06, - "loss": 0.6602, - "step": 43600 - }, - { - "epoch": 1.12, - "learning_rate": 1.4453055646718896e-06, - "loss": 0.6611, - "step": 43601 - }, - { - "epoch": 1.12, - "learning_rate": 1.445280788967343e-06, - "loss": 0.7578, - "step": 43602 - }, - { - "epoch": 1.12, - "learning_rate": 1.445256012921865e-06, - "loss": 0.7109, - "step": 43603 - }, - { - "epoch": 1.12, - "learning_rate": 1.4452312365354753e-06, - "loss": 0.6436, - "step": 43604 - }, - { - "epoch": 1.12, - "learning_rate": 1.4452064598081924e-06, - "loss": 0.7241, - "step": 43605 - }, - { - "epoch": 1.12, - "learning_rate": 1.4451816827400353e-06, - "loss": 0.6631, - "step": 43606 - }, - { - "epoch": 1.12, - "learning_rate": 1.445156905331023e-06, - "loss": 0.6797, - "step": 43607 - }, - { - "epoch": 1.12, - "learning_rate": 1.4451321275811748e-06, - "loss": 0.6963, - "step": 43608 - }, - { - "epoch": 1.12, - "learning_rate": 1.445107349490509e-06, - "loss": 0.687, - "step": 43609 - }, - { - "epoch": 1.12, - "learning_rate": 1.4450825710590453e-06, - "loss": 0.5273, - "step": 43610 - }, - { - "epoch": 1.12, - "learning_rate": 1.4450577922868021e-06, - "loss": 0.5474, - "step": 43611 - }, - { - "epoch": 1.12, - "learning_rate": 1.4450330131737988e-06, - "loss": 0.5068, - "step": 43612 - }, - { - "epoch": 1.12, - "learning_rate": 1.445008233720054e-06, - "loss": 0.6182, - "step": 43613 - }, - { - "epoch": 1.12, - "learning_rate": 1.4449834539255871e-06, - "loss": 0.5635, - "step": 43614 - }, - { - "epoch": 1.12, - "learning_rate": 1.4449586737904169e-06, - "loss": 0.626, - "step": 43615 - }, - { - "epoch": 1.12, - "learning_rate": 1.444933893314562e-06, - "loss": 0.4861, - "step": 43616 - }, - { - "epoch": 1.12, - "learning_rate": 1.4449091124980418e-06, - "loss": 0.7656, - "step": 43617 - }, - { - "epoch": 1.12, - "learning_rate": 1.444884331340875e-06, - "loss": 0.5908, - "step": 43618 - }, - { - "epoch": 1.12, - "learning_rate": 1.4448595498430812e-06, - "loss": 0.6099, - "step": 43619 - }, - { - "epoch": 1.12, - "learning_rate": 1.4448347680046784e-06, - "loss": 0.6367, - "step": 43620 - }, - { - "epoch": 1.12, - "learning_rate": 1.444809985825686e-06, - "loss": 0.5488, - "step": 43621 - }, - { - "epoch": 1.12, - "learning_rate": 1.4447852033061233e-06, - "loss": 0.6436, - "step": 43622 - }, - { - "epoch": 1.12, - "learning_rate": 1.4447604204460091e-06, - "loss": 0.6992, - "step": 43623 - }, - { - "epoch": 1.12, - "learning_rate": 1.4447356372453623e-06, - "loss": 0.5459, - "step": 43624 - }, - { - "epoch": 1.12, - "learning_rate": 1.4447108537042018e-06, - "loss": 0.6772, - "step": 43625 - }, - { - "epoch": 1.12, - "learning_rate": 1.4446860698225466e-06, - "loss": 0.6729, - "step": 43626 - }, - { - "epoch": 1.12, - "learning_rate": 1.4446612856004157e-06, - "loss": 0.7012, - "step": 43627 - }, - { - "epoch": 1.12, - "learning_rate": 1.4446365010378281e-06, - "loss": 0.6191, - "step": 43628 - }, - { - "epoch": 1.12, - "learning_rate": 1.4446117161348028e-06, - "loss": 0.6436, - "step": 43629 - }, - { - "epoch": 1.12, - "learning_rate": 1.4445869308913587e-06, - "loss": 0.6172, - "step": 43630 - }, - { - "epoch": 1.12, - "learning_rate": 1.4445621453075152e-06, - "loss": 0.6279, - "step": 43631 - }, - { - "epoch": 1.12, - "learning_rate": 1.4445373593832904e-06, - "loss": 0.6289, - "step": 43632 - }, - { - "epoch": 1.12, - "learning_rate": 1.444512573118704e-06, - "loss": 0.6499, - "step": 43633 - }, - { - "epoch": 1.12, - "learning_rate": 1.444487786513775e-06, - "loss": 0.668, - "step": 43634 - }, - { - "epoch": 1.12, - "learning_rate": 1.4444629995685216e-06, - "loss": 0.4231, - "step": 43635 - }, - { - "epoch": 1.12, - "learning_rate": 1.4444382122829636e-06, - "loss": 0.4988, - "step": 43636 - }, - { - "epoch": 1.12, - "learning_rate": 1.4444134246571196e-06, - "loss": 0.6426, - "step": 43637 - }, - { - "epoch": 1.12, - "learning_rate": 1.444388636691009e-06, - "loss": 0.6006, - "step": 43638 - }, - { - "epoch": 1.12, - "learning_rate": 1.4443638483846504e-06, - "loss": 0.7773, - "step": 43639 - }, - { - "epoch": 1.12, - "learning_rate": 1.4443390597380628e-06, - "loss": 0.5815, - "step": 43640 - }, - { - "epoch": 1.12, - "learning_rate": 1.4443142707512648e-06, - "loss": 0.5688, - "step": 43641 - }, - { - "epoch": 1.12, - "learning_rate": 1.444289481424276e-06, - "loss": 0.7065, - "step": 43642 - }, - { - "epoch": 1.12, - "learning_rate": 1.4442646917571153e-06, - "loss": 0.499, - "step": 43643 - }, - { - "epoch": 1.12, - "learning_rate": 1.4442399017498017e-06, - "loss": 0.8125, - "step": 43644 - }, - { - "epoch": 1.12, - "learning_rate": 1.4442151114023537e-06, - "loss": 0.6455, - "step": 43645 - }, - { - "epoch": 1.12, - "learning_rate": 1.4441903207147907e-06, - "loss": 0.5664, - "step": 43646 - }, - { - "epoch": 1.12, - "learning_rate": 1.4441655296871316e-06, - "loss": 0.6084, - "step": 43647 - }, - { - "epoch": 1.12, - "learning_rate": 1.4441407383193956e-06, - "loss": 0.5842, - "step": 43648 - }, - { - "epoch": 1.12, - "learning_rate": 1.4441159466116013e-06, - "loss": 0.3658, - "step": 43649 - }, - { - "epoch": 1.12, - "learning_rate": 1.4440911545637677e-06, - "loss": 0.2881, - "step": 43650 - }, - { - "epoch": 1.12, - "learning_rate": 1.4440663621759142e-06, - "loss": 0.5967, - "step": 43651 - }, - { - "epoch": 1.12, - "learning_rate": 1.4440415694480592e-06, - "loss": 0.5098, - "step": 43652 - }, - { - "epoch": 1.12, - "learning_rate": 1.4440167763802222e-06, - "loss": 0.6729, - "step": 43653 - }, - { - "epoch": 1.12, - "learning_rate": 1.4439919829724218e-06, - "loss": 0.5118, - "step": 43654 - }, - { - "epoch": 1.12, - "learning_rate": 1.4439671892246773e-06, - "loss": 0.4617, - "step": 43655 - }, - { - "epoch": 1.12, - "learning_rate": 1.4439423951370076e-06, - "loss": 0.7739, - "step": 43656 - }, - { - "epoch": 1.12, - "learning_rate": 1.4439176007094313e-06, - "loss": 0.7188, - "step": 43657 - }, - { - "epoch": 1.12, - "learning_rate": 1.443892805941968e-06, - "loss": 0.4492, - "step": 43658 - }, - { - "epoch": 1.12, - "learning_rate": 1.4438680108346367e-06, - "loss": 0.6173, - "step": 43659 - }, - { - "epoch": 1.12, - "learning_rate": 1.4438432153874553e-06, - "loss": 0.5, - "step": 43660 - }, - { - "epoch": 1.12, - "learning_rate": 1.4438184196004441e-06, - "loss": 0.5708, - "step": 43661 - }, - { - "epoch": 1.12, - "learning_rate": 1.4437936234736213e-06, - "loss": 0.7227, - "step": 43662 - }, - { - "epoch": 1.12, - "learning_rate": 1.4437688270070064e-06, - "loss": 0.8242, - "step": 43663 - }, - { - "epoch": 1.12, - "learning_rate": 1.443744030200618e-06, - "loss": 0.7451, - "step": 43664 - }, - { - "epoch": 1.12, - "learning_rate": 1.443719233054475e-06, - "loss": 0.79, - "step": 43665 - }, - { - "epoch": 1.12, - "learning_rate": 1.4436944355685968e-06, - "loss": 0.5947, - "step": 43666 - }, - { - "epoch": 1.12, - "learning_rate": 1.443669637743002e-06, - "loss": 0.5615, - "step": 43667 - }, - { - "epoch": 1.12, - "learning_rate": 1.4436448395777099e-06, - "loss": 0.7441, - "step": 43668 - }, - { - "epoch": 1.12, - "learning_rate": 1.4436200410727396e-06, - "loss": 0.6289, - "step": 43669 - }, - { - "epoch": 1.12, - "learning_rate": 1.4435952422281093e-06, - "loss": 0.5898, - "step": 43670 - }, - { - "epoch": 1.12, - "learning_rate": 1.4435704430438387e-06, - "loss": 0.7207, - "step": 43671 - }, - { - "epoch": 1.12, - "learning_rate": 1.4435456435199464e-06, - "loss": 0.6548, - "step": 43672 - }, - { - "epoch": 1.12, - "learning_rate": 1.4435208436564522e-06, - "loss": 0.5913, - "step": 43673 - }, - { - "epoch": 1.12, - "learning_rate": 1.4434960434533741e-06, - "loss": 0.6328, - "step": 43674 - }, - { - "epoch": 1.12, - "learning_rate": 1.4434712429107316e-06, - "loss": 0.6138, - "step": 43675 - }, - { - "epoch": 1.12, - "learning_rate": 1.4434464420285432e-06, - "loss": 0.7188, - "step": 43676 - }, - { - "epoch": 1.12, - "learning_rate": 1.4434216408068287e-06, - "loss": 0.4454, - "step": 43677 - }, - { - "epoch": 1.12, - "learning_rate": 1.4433968392456064e-06, - "loss": 0.7695, - "step": 43678 - }, - { - "epoch": 1.12, - "learning_rate": 1.4433720373448956e-06, - "loss": 0.6914, - "step": 43679 - }, - { - "epoch": 1.12, - "learning_rate": 1.4433472351047154e-06, - "loss": 0.6479, - "step": 43680 - }, - { - "epoch": 1.12, - "learning_rate": 1.443322432525084e-06, - "loss": 0.4321, - "step": 43681 - }, - { - "epoch": 1.12, - "learning_rate": 1.4432976296060218e-06, - "loss": 0.6099, - "step": 43682 - }, - { - "epoch": 1.12, - "learning_rate": 1.4432728263475462e-06, - "loss": 0.791, - "step": 43683 - }, - { - "epoch": 1.12, - "learning_rate": 1.4432480227496777e-06, - "loss": 0.6406, - "step": 43684 - }, - { - "epoch": 1.12, - "learning_rate": 1.443223218812434e-06, - "loss": 0.6068, - "step": 43685 - }, - { - "epoch": 1.12, - "learning_rate": 1.4431984145358351e-06, - "loss": 0.7256, - "step": 43686 - }, - { - "epoch": 1.12, - "learning_rate": 1.4431736099198993e-06, - "loss": 0.4917, - "step": 43687 - }, - { - "epoch": 1.12, - "learning_rate": 1.4431488049646458e-06, - "loss": 0.8232, - "step": 43688 - }, - { - "epoch": 1.12, - "learning_rate": 1.4431239996700938e-06, - "loss": 0.6553, - "step": 43689 - }, - { - "epoch": 1.12, - "learning_rate": 1.4430991940362622e-06, - "loss": 0.627, - "step": 43690 - }, - { - "epoch": 1.12, - "learning_rate": 1.4430743880631697e-06, - "loss": 0.6294, - "step": 43691 - }, - { - "epoch": 1.12, - "learning_rate": 1.4430495817508356e-06, - "loss": 0.6221, - "step": 43692 - }, - { - "epoch": 1.12, - "learning_rate": 1.4430247750992788e-06, - "loss": 0.4822, - "step": 43693 - }, - { - "epoch": 1.12, - "learning_rate": 1.4429999681085186e-06, - "loss": 0.7012, - "step": 43694 - }, - { - "epoch": 1.12, - "learning_rate": 1.442975160778573e-06, - "loss": 0.667, - "step": 43695 - }, - { - "epoch": 1.12, - "learning_rate": 1.4429503531094625e-06, - "loss": 0.7354, - "step": 43696 - }, - { - "epoch": 1.12, - "learning_rate": 1.4429255451012048e-06, - "loss": 0.6055, - "step": 43697 - }, - { - "epoch": 1.12, - "learning_rate": 1.4429007367538194e-06, - "loss": 0.5664, - "step": 43698 - }, - { - "epoch": 1.12, - "learning_rate": 1.4428759280673255e-06, - "loss": 0.7051, - "step": 43699 - }, - { - "epoch": 1.12, - "learning_rate": 1.4428511190417414e-06, - "loss": 0.5581, - "step": 43700 - }, - { - "epoch": 1.12, - "learning_rate": 1.442826309677087e-06, - "loss": 0.6206, - "step": 43701 - }, - { - "epoch": 1.12, - "learning_rate": 1.4428014999733808e-06, - "loss": 0.7607, - "step": 43702 - }, - { - "epoch": 1.12, - "learning_rate": 1.4427766899306417e-06, - "loss": 0.7157, - "step": 43703 - }, - { - "epoch": 1.12, - "learning_rate": 1.4427518795488888e-06, - "loss": 0.666, - "step": 43704 - }, - { - "epoch": 1.12, - "learning_rate": 1.4427270688281415e-06, - "loss": 0.6284, - "step": 43705 - }, - { - "epoch": 1.12, - "learning_rate": 1.4427022577684181e-06, - "loss": 0.6631, - "step": 43706 - }, - { - "epoch": 1.12, - "learning_rate": 1.442677446369738e-06, - "loss": 0.6162, - "step": 43707 - }, - { - "epoch": 1.12, - "learning_rate": 1.44265263463212e-06, - "loss": 0.6689, - "step": 43708 - }, - { - "epoch": 1.12, - "learning_rate": 1.4426278225555836e-06, - "loss": 0.6069, - "step": 43709 - }, - { - "epoch": 1.12, - "learning_rate": 1.4426030101401472e-06, - "loss": 0.7344, - "step": 43710 - }, - { - "epoch": 1.12, - "learning_rate": 1.44257819738583e-06, - "loss": 0.7959, - "step": 43711 - }, - { - "epoch": 1.12, - "learning_rate": 1.442553384292651e-06, - "loss": 0.7305, - "step": 43712 - }, - { - "epoch": 1.12, - "learning_rate": 1.4425285708606293e-06, - "loss": 0.6797, - "step": 43713 - }, - { - "epoch": 1.12, - "learning_rate": 1.442503757089784e-06, - "loss": 0.4652, - "step": 43714 - }, - { - "epoch": 1.12, - "learning_rate": 1.4424789429801338e-06, - "loss": 0.5029, - "step": 43715 - }, - { - "epoch": 1.12, - "learning_rate": 1.4424541285316976e-06, - "loss": 0.7988, - "step": 43716 - }, - { - "epoch": 1.12, - "learning_rate": 1.442429313744495e-06, - "loss": 0.7192, - "step": 43717 - }, - { - "epoch": 1.12, - "learning_rate": 1.4424044986185443e-06, - "loss": 0.6982, - "step": 43718 - }, - { - "epoch": 1.12, - "learning_rate": 1.4423796831538648e-06, - "loss": 0.666, - "step": 43719 - }, - { - "epoch": 1.12, - "learning_rate": 1.4423548673504758e-06, - "loss": 0.5835, - "step": 43720 - }, - { - "epoch": 1.12, - "learning_rate": 1.4423300512083957e-06, - "loss": 0.7422, - "step": 43721 - }, - { - "epoch": 1.12, - "learning_rate": 1.4423052347276442e-06, - "loss": 0.6523, - "step": 43722 - }, - { - "epoch": 1.12, - "learning_rate": 1.4422804179082395e-06, - "loss": 0.7139, - "step": 43723 - }, - { - "epoch": 1.12, - "learning_rate": 1.4422556007502014e-06, - "loss": 0.6592, - "step": 43724 - }, - { - "epoch": 1.12, - "learning_rate": 1.442230783253548e-06, - "loss": 0.6685, - "step": 43725 - }, - { - "epoch": 1.12, - "learning_rate": 1.4422059654182995e-06, - "loss": 0.7793, - "step": 43726 - }, - { - "epoch": 1.12, - "learning_rate": 1.4421811472444737e-06, - "loss": 0.7422, - "step": 43727 - }, - { - "epoch": 1.12, - "learning_rate": 1.44215632873209e-06, - "loss": 0.6797, - "step": 43728 - }, - { - "epoch": 1.12, - "learning_rate": 1.4421315098811681e-06, - "loss": 0.6562, - "step": 43729 - }, - { - "epoch": 1.12, - "learning_rate": 1.4421066906917263e-06, - "loss": 0.5293, - "step": 43730 - }, - { - "epoch": 1.12, - "learning_rate": 1.4420818711637835e-06, - "loss": 0.4006, - "step": 43731 - }, - { - "epoch": 1.12, - "learning_rate": 1.442057051297359e-06, - "loss": 0.5669, - "step": 43732 - }, - { - "epoch": 1.12, - "learning_rate": 1.4420322310924717e-06, - "loss": 0.6504, - "step": 43733 - }, - { - "epoch": 1.12, - "learning_rate": 1.442007410549141e-06, - "loss": 0.7051, - "step": 43734 - }, - { - "epoch": 1.12, - "learning_rate": 1.4419825896673853e-06, - "loss": 0.8555, - "step": 43735 - }, - { - "epoch": 1.12, - "learning_rate": 1.4419577684472237e-06, - "loss": 0.5437, - "step": 43736 - }, - { - "epoch": 1.12, - "learning_rate": 1.4419329468886754e-06, - "loss": 0.6348, - "step": 43737 - }, - { - "epoch": 1.12, - "learning_rate": 1.4419081249917595e-06, - "loss": 0.6277, - "step": 43738 - }, - { - "epoch": 1.12, - "learning_rate": 1.441883302756495e-06, - "loss": 0.6685, - "step": 43739 - }, - { - "epoch": 1.12, - "learning_rate": 1.4418584801829005e-06, - "loss": 0.6846, - "step": 43740 - }, - { - "epoch": 1.12, - "learning_rate": 1.4418336572709952e-06, - "loss": 0.7031, - "step": 43741 - }, - { - "epoch": 1.12, - "learning_rate": 1.4418088340207987e-06, - "loss": 0.6067, - "step": 43742 - }, - { - "epoch": 1.12, - "learning_rate": 1.441784010432329e-06, - "loss": 0.8193, - "step": 43743 - }, - { - "epoch": 1.12, - "learning_rate": 1.4417591865056057e-06, - "loss": 0.5859, - "step": 43744 - }, - { - "epoch": 1.12, - "learning_rate": 1.441734362240648e-06, - "loss": 0.7305, - "step": 43745 - }, - { - "epoch": 1.12, - "learning_rate": 1.4417095376374741e-06, - "loss": 0.637, - "step": 43746 - }, - { - "epoch": 1.12, - "learning_rate": 1.4416847126961039e-06, - "loss": 0.6699, - "step": 43747 - }, - { - "epoch": 1.12, - "learning_rate": 1.441659887416556e-06, - "loss": 0.5869, - "step": 43748 - }, - { - "epoch": 1.12, - "learning_rate": 1.4416350617988494e-06, - "loss": 0.7363, - "step": 43749 - }, - { - "epoch": 1.12, - "learning_rate": 1.4416102358430028e-06, - "loss": 0.7734, - "step": 43750 - }, - { - "epoch": 1.12, - "learning_rate": 1.4415854095490362e-06, - "loss": 0.6113, - "step": 43751 - }, - { - "epoch": 1.12, - "learning_rate": 1.4415605829169672e-06, - "loss": 0.3911, - "step": 43752 - }, - { - "epoch": 1.12, - "learning_rate": 1.441535755946816e-06, - "loss": 0.5938, - "step": 43753 - }, - { - "epoch": 1.12, - "learning_rate": 1.4415109286386011e-06, - "loss": 0.4639, - "step": 43754 - }, - { - "epoch": 1.12, - "learning_rate": 1.4414861009923417e-06, - "loss": 0.6904, - "step": 43755 - }, - { - "epoch": 1.12, - "learning_rate": 1.4414612730080567e-06, - "loss": 0.6338, - "step": 43756 - }, - { - "epoch": 1.12, - "learning_rate": 1.441436444685765e-06, - "loss": 0.4238, - "step": 43757 - }, - { - "epoch": 1.12, - "learning_rate": 1.4414116160254856e-06, - "loss": 0.7363, - "step": 43758 - }, - { - "epoch": 1.12, - "learning_rate": 1.441386787027238e-06, - "loss": 0.6855, - "step": 43759 - }, - { - "epoch": 1.12, - "learning_rate": 1.4413619576910402e-06, - "loss": 0.6187, - "step": 43760 - }, - { - "epoch": 1.12, - "learning_rate": 1.4413371280169124e-06, - "loss": 0.7695, - "step": 43761 - }, - { - "epoch": 1.12, - "learning_rate": 1.4413122980048728e-06, - "loss": 0.625, - "step": 43762 - }, - { - "epoch": 1.12, - "learning_rate": 1.441287467654941e-06, - "loss": 0.6279, - "step": 43763 - }, - { - "epoch": 1.12, - "learning_rate": 1.4412626369671353e-06, - "loss": 0.7598, - "step": 43764 - }, - { - "epoch": 1.12, - "learning_rate": 1.441237805941475e-06, - "loss": 0.7666, - "step": 43765 - }, - { - "epoch": 1.12, - "learning_rate": 1.4412129745779796e-06, - "loss": 0.6675, - "step": 43766 - }, - { - "epoch": 1.12, - "learning_rate": 1.4411881428766675e-06, - "loss": 0.7607, - "step": 43767 - }, - { - "epoch": 1.12, - "learning_rate": 1.4411633108375578e-06, - "loss": 0.6499, - "step": 43768 - }, - { - "epoch": 1.12, - "learning_rate": 1.4411384784606698e-06, - "loss": 0.4534, - "step": 43769 - }, - { - "epoch": 1.12, - "learning_rate": 1.4411136457460225e-06, - "loss": 0.6631, - "step": 43770 - }, - { - "epoch": 1.12, - "learning_rate": 1.4410888126936341e-06, - "loss": 0.6895, - "step": 43771 - }, - { - "epoch": 1.12, - "learning_rate": 1.441063979303525e-06, - "loss": 0.5791, - "step": 43772 - }, - { - "epoch": 1.12, - "learning_rate": 1.4410391455757131e-06, - "loss": 0.51, - "step": 43773 - }, - { - "epoch": 1.12, - "learning_rate": 1.4410143115102185e-06, - "loss": 0.5608, - "step": 43774 - }, - { - "epoch": 1.12, - "learning_rate": 1.4409894771070587e-06, - "loss": 0.6592, - "step": 43775 - }, - { - "epoch": 1.12, - "learning_rate": 1.440964642366254e-06, - "loss": 0.6743, - "step": 43776 - }, - { - "epoch": 1.12, - "learning_rate": 1.4409398072878226e-06, - "loss": 0.5508, - "step": 43777 - }, - { - "epoch": 1.12, - "learning_rate": 1.4409149718717841e-06, - "loss": 0.665, - "step": 43778 - }, - { - "epoch": 1.12, - "learning_rate": 1.4408901361181571e-06, - "loss": 0.7637, - "step": 43779 - }, - { - "epoch": 1.12, - "learning_rate": 1.440865300026961e-06, - "loss": 0.6587, - "step": 43780 - }, - { - "epoch": 1.12, - "learning_rate": 1.4408404635982144e-06, - "loss": 0.6782, - "step": 43781 - }, - { - "epoch": 1.12, - "learning_rate": 1.4408156268319367e-06, - "loss": 0.3733, - "step": 43782 - }, - { - "epoch": 1.12, - "learning_rate": 1.4407907897281466e-06, - "loss": 0.5415, - "step": 43783 - }, - { - "epoch": 1.12, - "learning_rate": 1.4407659522868636e-06, - "loss": 0.625, - "step": 43784 - }, - { - "epoch": 1.12, - "learning_rate": 1.4407411145081061e-06, - "loss": 0.7153, - "step": 43785 - }, - { - "epoch": 1.12, - "learning_rate": 1.4407162763918933e-06, - "loss": 0.5588, - "step": 43786 - }, - { - "epoch": 1.12, - "learning_rate": 1.4406914379382444e-06, - "loss": 0.8379, - "step": 43787 - }, - { - "epoch": 1.12, - "learning_rate": 1.4406665991471784e-06, - "loss": 0.5264, - "step": 43788 - }, - { - "epoch": 1.12, - "learning_rate": 1.4406417600187144e-06, - "loss": 0.6099, - "step": 43789 - }, - { - "epoch": 1.12, - "learning_rate": 1.4406169205528709e-06, - "loss": 0.75, - "step": 43790 - }, - { - "epoch": 1.12, - "learning_rate": 1.4405920807496674e-06, - "loss": 0.6255, - "step": 43791 - }, - { - "epoch": 1.12, - "learning_rate": 1.440567240609123e-06, - "loss": 0.7344, - "step": 43792 - }, - { - "epoch": 1.12, - "learning_rate": 1.4405424001312563e-06, - "loss": 0.5596, - "step": 43793 - }, - { - "epoch": 1.12, - "learning_rate": 1.4405175593160867e-06, - "loss": 0.5928, - "step": 43794 - }, - { - "epoch": 1.12, - "learning_rate": 1.440492718163633e-06, - "loss": 0.7832, - "step": 43795 - }, - { - "epoch": 1.12, - "learning_rate": 1.4404678766739142e-06, - "loss": 0.7217, - "step": 43796 - }, - { - "epoch": 1.12, - "learning_rate": 1.4404430348469496e-06, - "loss": 0.6836, - "step": 43797 - }, - { - "epoch": 1.12, - "learning_rate": 1.4404181926827576e-06, - "loss": 0.6472, - "step": 43798 - }, - { - "epoch": 1.12, - "learning_rate": 1.4403933501813582e-06, - "loss": 0.582, - "step": 43799 - }, - { - "epoch": 1.12, - "learning_rate": 1.4403685073427697e-06, - "loss": 0.7412, - "step": 43800 - }, - { - "epoch": 1.12, - "learning_rate": 1.440343664167011e-06, - "loss": 0.5474, - "step": 43801 - }, - { - "epoch": 1.12, - "learning_rate": 1.4403188206541016e-06, - "loss": 0.7158, - "step": 43802 - }, - { - "epoch": 1.12, - "learning_rate": 1.4402939768040604e-06, - "loss": 0.5518, - "step": 43803 - }, - { - "epoch": 1.12, - "learning_rate": 1.4402691326169062e-06, - "loss": 0.8018, - "step": 43804 - }, - { - "epoch": 1.12, - "learning_rate": 1.4402442880926583e-06, - "loss": 0.5437, - "step": 43805 - }, - { - "epoch": 1.12, - "learning_rate": 1.4402194432313354e-06, - "loss": 0.6982, - "step": 43806 - }, - { - "epoch": 1.12, - "learning_rate": 1.4401945980329569e-06, - "loss": 0.6061, - "step": 43807 - }, - { - "epoch": 1.12, - "learning_rate": 1.4401697524975414e-06, - "loss": 0.6479, - "step": 43808 - }, - { - "epoch": 1.12, - "learning_rate": 1.4401449066251084e-06, - "loss": 0.7935, - "step": 43809 - }, - { - "epoch": 1.12, - "learning_rate": 1.4401200604156767e-06, - "loss": 0.7188, - "step": 43810 - }, - { - "epoch": 1.12, - "learning_rate": 1.4400952138692653e-06, - "loss": 0.6909, - "step": 43811 - }, - { - "epoch": 1.12, - "learning_rate": 1.4400703669858928e-06, - "loss": 0.4805, - "step": 43812 - }, - { - "epoch": 1.12, - "learning_rate": 1.4400455197655791e-06, - "loss": 0.5132, - "step": 43813 - }, - { - "epoch": 1.12, - "learning_rate": 1.4400206722083428e-06, - "loss": 0.5547, - "step": 43814 - }, - { - "epoch": 1.12, - "learning_rate": 1.4399958243142027e-06, - "loss": 0.6709, - "step": 43815 - }, - { - "epoch": 1.12, - "learning_rate": 1.4399709760831781e-06, - "loss": 0.749, - "step": 43816 - }, - { - "epoch": 1.12, - "learning_rate": 1.439946127515288e-06, - "loss": 0.7085, - "step": 43817 - }, - { - "epoch": 1.12, - "learning_rate": 1.4399212786105514e-06, - "loss": 0.6016, - "step": 43818 - }, - { - "epoch": 1.12, - "learning_rate": 1.4398964293689873e-06, - "loss": 0.708, - "step": 43819 - }, - { - "epoch": 1.12, - "learning_rate": 1.4398715797906147e-06, - "loss": 0.6172, - "step": 43820 - }, - { - "epoch": 1.12, - "learning_rate": 1.4398467298754526e-06, - "loss": 0.5625, - "step": 43821 - }, - { - "epoch": 1.12, - "learning_rate": 1.43982187962352e-06, - "loss": 0.6479, - "step": 43822 - }, - { - "epoch": 1.12, - "learning_rate": 1.439797029034836e-06, - "loss": 0.6694, - "step": 43823 - }, - { - "epoch": 1.12, - "learning_rate": 1.4397721781094202e-06, - "loss": 0.6729, - "step": 43824 - }, - { - "epoch": 1.12, - "learning_rate": 1.4397473268472903e-06, - "loss": 0.6709, - "step": 43825 - }, - { - "epoch": 1.12, - "learning_rate": 1.4397224752484666e-06, - "loss": 0.6729, - "step": 43826 - }, - { - "epoch": 1.12, - "learning_rate": 1.4396976233129674e-06, - "loss": 0.6782, - "step": 43827 - }, - { - "epoch": 1.12, - "learning_rate": 1.439672771040812e-06, - "loss": 0.5425, - "step": 43828 - }, - { - "epoch": 1.12, - "learning_rate": 1.4396479184320193e-06, - "loss": 0.542, - "step": 43829 - }, - { - "epoch": 1.12, - "learning_rate": 1.4396230654866086e-06, - "loss": 0.5144, - "step": 43830 - }, - { - "epoch": 1.12, - "learning_rate": 1.4395982122045985e-06, - "loss": 0.6699, - "step": 43831 - }, - { - "epoch": 1.12, - "learning_rate": 1.4395733585860086e-06, - "loss": 0.7148, - "step": 43832 - }, - { - "epoch": 1.12, - "learning_rate": 1.4395485046308571e-06, - "loss": 0.5571, - "step": 43833 - }, - { - "epoch": 1.12, - "learning_rate": 1.4395236503391638e-06, - "loss": 0.6709, - "step": 43834 - }, - { - "epoch": 1.12, - "learning_rate": 1.4394987957109477e-06, - "loss": 0.6807, - "step": 43835 - }, - { - "epoch": 1.12, - "learning_rate": 1.439473940746227e-06, - "loss": 0.6709, - "step": 43836 - }, - { - "epoch": 1.12, - "learning_rate": 1.4394490854450216e-06, - "loss": 0.8389, - "step": 43837 - }, - { - "epoch": 1.12, - "learning_rate": 1.4394242298073503e-06, - "loss": 0.7002, - "step": 43838 - }, - { - "epoch": 1.12, - "learning_rate": 1.4393993738332321e-06, - "loss": 0.7324, - "step": 43839 - }, - { - "epoch": 1.12, - "learning_rate": 1.439374517522686e-06, - "loss": 0.5957, - "step": 43840 - }, - { - "epoch": 1.12, - "learning_rate": 1.439349660875731e-06, - "loss": 0.5425, - "step": 43841 - }, - { - "epoch": 1.12, - "learning_rate": 1.439324803892386e-06, - "loss": 0.8438, - "step": 43842 - }, - { - "epoch": 1.12, - "learning_rate": 1.4392999465726704e-06, - "loss": 0.5474, - "step": 43843 - }, - { - "epoch": 1.12, - "learning_rate": 1.439275088916603e-06, - "loss": 0.9287, - "step": 43844 - }, - { - "epoch": 1.12, - "learning_rate": 1.439250230924203e-06, - "loss": 0.7588, - "step": 43845 - }, - { - "epoch": 1.12, - "learning_rate": 1.439225372595489e-06, - "loss": 0.5232, - "step": 43846 - }, - { - "epoch": 1.12, - "learning_rate": 1.4392005139304803e-06, - "loss": 0.6895, - "step": 43847 - }, - { - "epoch": 1.12, - "learning_rate": 1.4391756549291963e-06, - "loss": 0.6631, - "step": 43848 - }, - { - "epoch": 1.12, - "learning_rate": 1.4391507955916557e-06, - "loss": 0.7246, - "step": 43849 - }, - { - "epoch": 1.12, - "learning_rate": 1.4391259359178772e-06, - "loss": 0.7549, - "step": 43850 - }, - { - "epoch": 1.12, - "learning_rate": 1.4391010759078803e-06, - "loss": 0.7539, - "step": 43851 - }, - { - "epoch": 1.12, - "learning_rate": 1.4390762155616838e-06, - "loss": 0.7334, - "step": 43852 - }, - { - "epoch": 1.12, - "learning_rate": 1.439051354879307e-06, - "loss": 0.792, - "step": 43853 - }, - { - "epoch": 1.12, - "learning_rate": 1.4390264938607688e-06, - "loss": 0.7432, - "step": 43854 - }, - { - "epoch": 1.12, - "learning_rate": 1.439001632506088e-06, - "loss": 0.6973, - "step": 43855 - }, - { - "epoch": 1.12, - "learning_rate": 1.4389767708152837e-06, - "loss": 0.5479, - "step": 43856 - }, - { - "epoch": 1.12, - "learning_rate": 1.4389519087883754e-06, - "loss": 0.583, - "step": 43857 - }, - { - "epoch": 1.12, - "learning_rate": 1.4389270464253818e-06, - "loss": 0.6206, - "step": 43858 - }, - { - "epoch": 1.12, - "learning_rate": 1.4389021837263217e-06, - "loss": 0.6787, - "step": 43859 - }, - { - "epoch": 1.12, - "learning_rate": 1.4388773206912149e-06, - "loss": 0.6699, - "step": 43860 - }, - { - "epoch": 1.12, - "learning_rate": 1.4388524573200793e-06, - "loss": 0.626, - "step": 43861 - }, - { - "epoch": 1.12, - "learning_rate": 1.4388275936129348e-06, - "loss": 0.5544, - "step": 43862 - }, - { - "epoch": 1.12, - "learning_rate": 1.4388027295698003e-06, - "loss": 0.4041, - "step": 43863 - }, - { - "epoch": 1.12, - "learning_rate": 1.4387778651906948e-06, - "loss": 0.5547, - "step": 43864 - }, - { - "epoch": 1.12, - "learning_rate": 1.438753000475637e-06, - "loss": 0.7349, - "step": 43865 - }, - { - "epoch": 1.12, - "learning_rate": 1.4387281354246464e-06, - "loss": 0.6567, - "step": 43866 - }, - { - "epoch": 1.12, - "learning_rate": 1.4387032700377416e-06, - "loss": 0.7012, - "step": 43867 - }, - { - "epoch": 1.12, - "learning_rate": 1.4386784043149418e-06, - "loss": 0.668, - "step": 43868 - }, - { - "epoch": 1.12, - "learning_rate": 1.4386535382562665e-06, - "loss": 0.6499, - "step": 43869 - }, - { - "epoch": 1.12, - "learning_rate": 1.4386286718617343e-06, - "loss": 0.8408, - "step": 43870 - }, - { - "epoch": 1.12, - "learning_rate": 1.438603805131364e-06, - "loss": 0.6123, - "step": 43871 - }, - { - "epoch": 1.12, - "learning_rate": 1.438578938065175e-06, - "loss": 0.6914, - "step": 43872 - }, - { - "epoch": 1.12, - "learning_rate": 1.4385540706631867e-06, - "loss": 0.7529, - "step": 43873 - }, - { - "epoch": 1.12, - "learning_rate": 1.4385292029254173e-06, - "loss": 0.8809, - "step": 43874 - }, - { - "epoch": 1.12, - "learning_rate": 1.4385043348518862e-06, - "loss": 0.6641, - "step": 43875 - }, - { - "epoch": 1.12, - "learning_rate": 1.4384794664426127e-06, - "loss": 0.4795, - "step": 43876 - }, - { - "epoch": 1.12, - "learning_rate": 1.4384545976976155e-06, - "loss": 0.5559, - "step": 43877 - }, - { - "epoch": 1.12, - "learning_rate": 1.4384297286169141e-06, - "loss": 0.4841, - "step": 43878 - }, - { - "epoch": 1.12, - "learning_rate": 1.4384048592005268e-06, - "loss": 0.4594, - "step": 43879 - }, - { - "epoch": 1.12, - "learning_rate": 1.4383799894484732e-06, - "loss": 0.8701, - "step": 43880 - }, - { - "epoch": 1.12, - "learning_rate": 1.438355119360772e-06, - "loss": 0.8125, - "step": 43881 - }, - { - "epoch": 1.12, - "learning_rate": 1.4383302489374428e-06, - "loss": 0.7012, - "step": 43882 - }, - { - "epoch": 1.12, - "learning_rate": 1.4383053781785044e-06, - "loss": 0.5688, - "step": 43883 - }, - { - "epoch": 1.12, - "learning_rate": 1.4382805070839755e-06, - "loss": 0.7842, - "step": 43884 - }, - { - "epoch": 1.12, - "learning_rate": 1.438255635653875e-06, - "loss": 0.7988, - "step": 43885 - }, - { - "epoch": 1.12, - "learning_rate": 1.4382307638882228e-06, - "loss": 0.6953, - "step": 43886 - }, - { - "epoch": 1.12, - "learning_rate": 1.4382058917870373e-06, - "loss": 0.6807, - "step": 43887 - }, - { - "epoch": 1.12, - "learning_rate": 1.4381810193503378e-06, - "loss": 0.5415, - "step": 43888 - }, - { - "epoch": 1.12, - "learning_rate": 1.4381561465781432e-06, - "loss": 0.6233, - "step": 43889 - }, - { - "epoch": 1.12, - "learning_rate": 1.4381312734704723e-06, - "loss": 0.5354, - "step": 43890 - }, - { - "epoch": 1.12, - "learning_rate": 1.438106400027345e-06, - "loss": 0.6284, - "step": 43891 - }, - { - "epoch": 1.12, - "learning_rate": 1.438081526248779e-06, - "loss": 0.519, - "step": 43892 - }, - { - "epoch": 1.12, - "learning_rate": 1.438056652134795e-06, - "loss": 0.7188, - "step": 43893 - }, - { - "epoch": 1.13, - "learning_rate": 1.4380317776854106e-06, - "loss": 0.6211, - "step": 43894 - }, - { - "epoch": 1.13, - "learning_rate": 1.4380069029006454e-06, - "loss": 0.5021, - "step": 43895 - }, - { - "epoch": 1.13, - "learning_rate": 1.4379820277805186e-06, - "loss": 0.5933, - "step": 43896 - }, - { - "epoch": 1.13, - "learning_rate": 1.4379571523250491e-06, - "loss": 0.7646, - "step": 43897 - }, - { - "epoch": 1.13, - "learning_rate": 1.4379322765342559e-06, - "loss": 0.4951, - "step": 43898 - }, - { - "epoch": 1.13, - "learning_rate": 1.4379074004081583e-06, - "loss": 0.411, - "step": 43899 - }, - { - "epoch": 1.13, - "learning_rate": 1.437882523946775e-06, - "loss": 0.5957, - "step": 43900 - }, - { - "epoch": 1.13, - "learning_rate": 1.437857647150125e-06, - "loss": 0.7314, - "step": 43901 - }, - { - "epoch": 1.13, - "learning_rate": 1.4378327700182276e-06, - "loss": 0.6992, - "step": 43902 - }, - { - "epoch": 1.13, - "learning_rate": 1.437807892551102e-06, - "loss": 0.6348, - "step": 43903 - }, - { - "epoch": 1.13, - "learning_rate": 1.4377830147487668e-06, - "loss": 0.6802, - "step": 43904 - }, - { - "epoch": 1.13, - "learning_rate": 1.4377581366112412e-06, - "loss": 0.5403, - "step": 43905 - }, - { - "epoch": 1.13, - "learning_rate": 1.4377332581385447e-06, - "loss": 0.7441, - "step": 43906 - }, - { - "epoch": 1.13, - "learning_rate": 1.4377083793306955e-06, - "loss": 0.5757, - "step": 43907 - }, - { - "epoch": 1.13, - "learning_rate": 1.4376835001877136e-06, - "loss": 0.6582, - "step": 43908 - }, - { - "epoch": 1.13, - "learning_rate": 1.4376586207096174e-06, - "loss": 0.5825, - "step": 43909 - }, - { - "epoch": 1.13, - "learning_rate": 1.437633740896426e-06, - "loss": 0.5947, - "step": 43910 - }, - { - "epoch": 1.13, - "learning_rate": 1.4376088607481585e-06, - "loss": 0.8027, - "step": 43911 - }, - { - "epoch": 1.13, - "learning_rate": 1.437583980264834e-06, - "loss": 0.3591, - "step": 43912 - }, - { - "epoch": 1.13, - "learning_rate": 1.437559099446472e-06, - "loss": 0.7422, - "step": 43913 - }, - { - "epoch": 1.13, - "learning_rate": 1.437534218293091e-06, - "loss": 0.5415, - "step": 43914 - }, - { - "epoch": 1.13, - "learning_rate": 1.4375093368047097e-06, - "loss": 0.5908, - "step": 43915 - }, - { - "epoch": 1.13, - "learning_rate": 1.4374844549813482e-06, - "loss": 0.5405, - "step": 43916 - }, - { - "epoch": 1.13, - "learning_rate": 1.4374595728230243e-06, - "loss": 0.5605, - "step": 43917 - }, - { - "epoch": 1.13, - "learning_rate": 1.4374346903297584e-06, - "loss": 0.5283, - "step": 43918 - }, - { - "epoch": 1.13, - "learning_rate": 1.4374098075015685e-06, - "loss": 0.6421, - "step": 43919 - }, - { - "epoch": 1.13, - "learning_rate": 1.437384924338474e-06, - "loss": 0.6455, - "step": 43920 - }, - { - "epoch": 1.13, - "learning_rate": 1.437360040840494e-06, - "loss": 0.4819, - "step": 43921 - }, - { - "epoch": 1.13, - "learning_rate": 1.4373351570076478e-06, - "loss": 0.6138, - "step": 43922 - }, - { - "epoch": 1.13, - "learning_rate": 1.437310272839954e-06, - "loss": 0.5288, - "step": 43923 - }, - { - "epoch": 1.13, - "learning_rate": 1.4372853883374316e-06, - "loss": 0.5938, - "step": 43924 - }, - { - "epoch": 1.13, - "learning_rate": 1.4372605035001005e-06, - "loss": 0.6572, - "step": 43925 - }, - { - "epoch": 1.13, - "learning_rate": 1.4372356183279784e-06, - "loss": 0.6826, - "step": 43926 - }, - { - "epoch": 1.13, - "learning_rate": 1.4372107328210853e-06, - "loss": 0.6064, - "step": 43927 - }, - { - "epoch": 1.13, - "learning_rate": 1.4371858469794404e-06, - "loss": 0.6714, - "step": 43928 - }, - { - "epoch": 1.13, - "learning_rate": 1.4371609608030624e-06, - "loss": 0.6147, - "step": 43929 - }, - { - "epoch": 1.13, - "learning_rate": 1.4371360742919699e-06, - "loss": 0.5889, - "step": 43930 - }, - { - "epoch": 1.13, - "learning_rate": 1.4371111874461829e-06, - "loss": 0.751, - "step": 43931 - }, - { - "epoch": 1.13, - "learning_rate": 1.4370863002657191e-06, - "loss": 0.6338, - "step": 43932 - }, - { - "epoch": 1.13, - "learning_rate": 1.4370614127505995e-06, - "loss": 0.7842, - "step": 43933 - }, - { - "epoch": 1.13, - "learning_rate": 1.4370365249008415e-06, - "loss": 0.5171, - "step": 43934 - }, - { - "epoch": 1.13, - "learning_rate": 1.4370116367164648e-06, - "loss": 0.4404, - "step": 43935 - }, - { - "epoch": 1.13, - "learning_rate": 1.4369867481974884e-06, - "loss": 0.5359, - "step": 43936 - }, - { - "epoch": 1.13, - "learning_rate": 1.4369618593439312e-06, - "loss": 0.7363, - "step": 43937 - }, - { - "epoch": 1.13, - "learning_rate": 1.4369369701558128e-06, - "loss": 0.4412, - "step": 43938 - }, - { - "epoch": 1.13, - "learning_rate": 1.4369120806331516e-06, - "loss": 0.6606, - "step": 43939 - }, - { - "epoch": 1.13, - "learning_rate": 1.4368871907759667e-06, - "loss": 0.6738, - "step": 43940 - }, - { - "epoch": 1.13, - "learning_rate": 1.4368623005842776e-06, - "loss": 0.7041, - "step": 43941 - }, - { - "epoch": 1.13, - "learning_rate": 1.4368374100581032e-06, - "loss": 0.7676, - "step": 43942 - }, - { - "epoch": 1.13, - "learning_rate": 1.4368125191974622e-06, - "loss": 0.7129, - "step": 43943 - }, - { - "epoch": 1.13, - "learning_rate": 1.4367876280023742e-06, - "loss": 0.5952, - "step": 43944 - }, - { - "epoch": 1.13, - "learning_rate": 1.4367627364728581e-06, - "loss": 0.6543, - "step": 43945 - }, - { - "epoch": 1.13, - "learning_rate": 1.4367378446089324e-06, - "loss": 0.6826, - "step": 43946 - }, - { - "epoch": 1.13, - "learning_rate": 1.436712952410617e-06, - "loss": 0.6914, - "step": 43947 - }, - { - "epoch": 1.13, - "learning_rate": 1.4366880598779305e-06, - "loss": 0.5537, - "step": 43948 - }, - { - "epoch": 1.13, - "learning_rate": 1.436663167010892e-06, - "loss": 0.8682, - "step": 43949 - }, - { - "epoch": 1.13, - "learning_rate": 1.4366382738095206e-06, - "loss": 0.627, - "step": 43950 - }, - { - "epoch": 1.13, - "learning_rate": 1.4366133802738351e-06, - "loss": 0.6343, - "step": 43951 - }, - { - "epoch": 1.13, - "learning_rate": 1.436588486403855e-06, - "loss": 0.5044, - "step": 43952 - }, - { - "epoch": 1.13, - "learning_rate": 1.4365635921995993e-06, - "loss": 0.7295, - "step": 43953 - }, - { - "epoch": 1.13, - "learning_rate": 1.436538697661087e-06, - "loss": 0.5986, - "step": 43954 - }, - { - "epoch": 1.13, - "learning_rate": 1.4365138027883368e-06, - "loss": 0.7266, - "step": 43955 - }, - { - "epoch": 1.13, - "learning_rate": 1.4364889075813683e-06, - "loss": 0.8623, - "step": 43956 - }, - { - "epoch": 1.13, - "learning_rate": 1.4364640120402e-06, - "loss": 0.5146, - "step": 43957 - }, - { - "epoch": 1.13, - "learning_rate": 1.4364391161648516e-06, - "loss": 0.6055, - "step": 43958 - }, - { - "epoch": 1.13, - "learning_rate": 1.4364142199553417e-06, - "loss": 0.4651, - "step": 43959 - }, - { - "epoch": 1.13, - "learning_rate": 1.4363893234116894e-06, - "loss": 0.626, - "step": 43960 - }, - { - "epoch": 1.13, - "learning_rate": 1.4363644265339141e-06, - "loss": 0.5974, - "step": 43961 - }, - { - "epoch": 1.13, - "learning_rate": 1.4363395293220344e-06, - "loss": 0.6719, - "step": 43962 - }, - { - "epoch": 1.13, - "learning_rate": 1.43631463177607e-06, - "loss": 0.666, - "step": 43963 - }, - { - "epoch": 1.13, - "learning_rate": 1.4362897338960391e-06, - "loss": 0.7959, - "step": 43964 - }, - { - "epoch": 1.13, - "learning_rate": 1.4362648356819614e-06, - "loss": 0.5149, - "step": 43965 - }, - { - "epoch": 1.13, - "learning_rate": 1.4362399371338556e-06, - "loss": 0.6104, - "step": 43966 - }, - { - "epoch": 1.13, - "learning_rate": 1.4362150382517408e-06, - "loss": 0.4878, - "step": 43967 - }, - { - "epoch": 1.13, - "learning_rate": 1.4361901390356366e-06, - "loss": 0.6348, - "step": 43968 - }, - { - "epoch": 1.13, - "learning_rate": 1.4361652394855618e-06, - "loss": 0.6045, - "step": 43969 - }, - { - "epoch": 1.13, - "learning_rate": 1.4361403396015349e-06, - "loss": 0.7002, - "step": 43970 - }, - { - "epoch": 1.13, - "learning_rate": 1.4361154393835756e-06, - "loss": 0.3394, - "step": 43971 - }, - { - "epoch": 1.13, - "learning_rate": 1.4360905388317024e-06, - "loss": 0.6045, - "step": 43972 - }, - { - "epoch": 1.13, - "learning_rate": 1.4360656379459353e-06, - "loss": 0.7441, - "step": 43973 - }, - { - "epoch": 1.13, - "learning_rate": 1.4360407367262925e-06, - "loss": 0.8057, - "step": 43974 - }, - { - "epoch": 1.13, - "learning_rate": 1.4360158351727933e-06, - "loss": 0.7422, - "step": 43975 - }, - { - "epoch": 1.13, - "learning_rate": 1.435990933285457e-06, - "loss": 0.6343, - "step": 43976 - }, - { - "epoch": 1.13, - "learning_rate": 1.4359660310643023e-06, - "loss": 0.5942, - "step": 43977 - }, - { - "epoch": 1.13, - "learning_rate": 1.4359411285093486e-06, - "loss": 0.5869, - "step": 43978 - }, - { - "epoch": 1.13, - "learning_rate": 1.435916225620615e-06, - "loss": 0.6396, - "step": 43979 - }, - { - "epoch": 1.13, - "learning_rate": 1.4358913223981198e-06, - "loss": 0.583, - "step": 43980 - }, - { - "epoch": 1.13, - "learning_rate": 1.4358664188418832e-06, - "loss": 0.5044, - "step": 43981 - }, - { - "epoch": 1.13, - "learning_rate": 1.4358415149519235e-06, - "loss": 0.876, - "step": 43982 - }, - { - "epoch": 1.13, - "learning_rate": 1.4358166107282603e-06, - "loss": 0.7988, - "step": 43983 - }, - { - "epoch": 1.13, - "learning_rate": 1.435791706170912e-06, - "loss": 0.8213, - "step": 43984 - }, - { - "epoch": 1.13, - "learning_rate": 1.435766801279898e-06, - "loss": 0.688, - "step": 43985 - }, - { - "epoch": 1.13, - "learning_rate": 1.4357418960552376e-06, - "loss": 0.7148, - "step": 43986 - }, - { - "epoch": 1.13, - "learning_rate": 1.4357169904969494e-06, - "loss": 0.7256, - "step": 43987 - }, - { - "epoch": 1.13, - "learning_rate": 1.4356920846050532e-06, - "loss": 0.7319, - "step": 43988 - }, - { - "epoch": 1.13, - "learning_rate": 1.4356671783795671e-06, - "loss": 0.7549, - "step": 43989 - }, - { - "epoch": 1.13, - "learning_rate": 1.435642271820511e-06, - "loss": 0.4607, - "step": 43990 - }, - { - "epoch": 1.13, - "learning_rate": 1.4356173649279038e-06, - "loss": 0.5918, - "step": 43991 - }, - { - "epoch": 1.13, - "learning_rate": 1.435592457701764e-06, - "loss": 0.5488, - "step": 43992 - }, - { - "epoch": 1.13, - "learning_rate": 1.4355675501421113e-06, - "loss": 0.6143, - "step": 43993 - }, - { - "epoch": 1.13, - "learning_rate": 1.4355426422489645e-06, - "loss": 0.6128, - "step": 43994 - }, - { - "epoch": 1.13, - "learning_rate": 1.4355177340223426e-06, - "loss": 0.7012, - "step": 43995 - }, - { - "epoch": 1.13, - "learning_rate": 1.435492825462265e-06, - "loss": 0.5085, - "step": 43996 - }, - { - "epoch": 1.13, - "learning_rate": 1.4354679165687504e-06, - "loss": 0.6543, - "step": 43997 - }, - { - "epoch": 1.13, - "learning_rate": 1.4354430073418183e-06, - "loss": 0.6229, - "step": 43998 - }, - { - "epoch": 1.13, - "learning_rate": 1.4354180977814872e-06, - "loss": 0.6577, - "step": 43999 - }, - { - "epoch": 1.13, - "learning_rate": 1.4353931878877767e-06, - "loss": 0.6982, - "step": 44000 - }, - { - "epoch": 1.13, - "learning_rate": 1.4353682776607055e-06, - "loss": 0.8232, - "step": 44001 - }, - { - "epoch": 1.13, - "learning_rate": 1.435343367100293e-06, - "loss": 0.6748, - "step": 44002 - }, - { - "epoch": 1.13, - "learning_rate": 1.4353184562065582e-06, - "loss": 0.7129, - "step": 44003 - }, - { - "epoch": 1.13, - "learning_rate": 1.4352935449795198e-06, - "loss": 0.6094, - "step": 44004 - }, - { - "epoch": 1.13, - "learning_rate": 1.4352686334191973e-06, - "loss": 0.5919, - "step": 44005 - }, - { - "epoch": 1.13, - "learning_rate": 1.4352437215256095e-06, - "loss": 0.6787, - "step": 44006 - }, - { - "epoch": 1.13, - "learning_rate": 1.4352188092987756e-06, - "loss": 0.6611, - "step": 44007 - }, - { - "epoch": 1.13, - "learning_rate": 1.435193896738715e-06, - "loss": 0.6768, - "step": 44008 - }, - { - "epoch": 1.13, - "learning_rate": 1.435168983845446e-06, - "loss": 0.6895, - "step": 44009 - }, - { - "epoch": 1.13, - "learning_rate": 1.4351440706189884e-06, - "loss": 0.7578, - "step": 44010 - }, - { - "epoch": 1.13, - "learning_rate": 1.4351191570593607e-06, - "loss": 0.6313, - "step": 44011 - }, - { - "epoch": 1.13, - "learning_rate": 1.4350942431665824e-06, - "loss": 0.6118, - "step": 44012 - }, - { - "epoch": 1.13, - "learning_rate": 1.4350693289406726e-06, - "loss": 0.5435, - "step": 44013 - }, - { - "epoch": 1.13, - "learning_rate": 1.43504441438165e-06, - "loss": 0.6455, - "step": 44014 - }, - { - "epoch": 1.13, - "learning_rate": 1.4350194994895341e-06, - "loss": 0.6055, - "step": 44015 - }, - { - "epoch": 1.13, - "learning_rate": 1.4349945842643436e-06, - "loss": 0.7119, - "step": 44016 - }, - { - "epoch": 1.13, - "learning_rate": 1.434969668706098e-06, - "loss": 0.7793, - "step": 44017 - }, - { - "epoch": 1.13, - "learning_rate": 1.434944752814816e-06, - "loss": 0.792, - "step": 44018 - }, - { - "epoch": 1.13, - "learning_rate": 1.4349198365905166e-06, - "loss": 0.4829, - "step": 44019 - }, - { - "epoch": 1.13, - "learning_rate": 1.4348949200332192e-06, - "loss": 0.7441, - "step": 44020 - }, - { - "epoch": 1.13, - "learning_rate": 1.4348700031429429e-06, - "loss": 0.835, - "step": 44021 - }, - { - "epoch": 1.13, - "learning_rate": 1.4348450859197062e-06, - "loss": 0.7471, - "step": 44022 - }, - { - "epoch": 1.13, - "learning_rate": 1.4348201683635295e-06, - "loss": 0.8716, - "step": 44023 - }, - { - "epoch": 1.13, - "learning_rate": 1.4347952504744303e-06, - "loss": 0.7568, - "step": 44024 - }, - { - "epoch": 1.13, - "learning_rate": 1.4347703322524285e-06, - "loss": 0.6826, - "step": 44025 - }, - { - "epoch": 1.13, - "learning_rate": 1.4347454136975427e-06, - "loss": 0.585, - "step": 44026 - }, - { - "epoch": 1.13, - "learning_rate": 1.434720494809793e-06, - "loss": 0.6729, - "step": 44027 - }, - { - "epoch": 1.13, - "learning_rate": 1.4346955755891973e-06, - "loss": 0.4553, - "step": 44028 - }, - { - "epoch": 1.13, - "learning_rate": 1.4346706560357756e-06, - "loss": 0.7861, - "step": 44029 - }, - { - "epoch": 1.13, - "learning_rate": 1.434645736149546e-06, - "loss": 0.7578, - "step": 44030 - }, - { - "epoch": 1.13, - "learning_rate": 1.4346208159305286e-06, - "loss": 0.7402, - "step": 44031 - }, - { - "epoch": 1.13, - "learning_rate": 1.434595895378742e-06, - "loss": 0.6006, - "step": 44032 - }, - { - "epoch": 1.13, - "learning_rate": 1.4345709744942051e-06, - "loss": 0.4878, - "step": 44033 - }, - { - "epoch": 1.13, - "learning_rate": 1.4345460532769375e-06, - "loss": 0.7412, - "step": 44034 - }, - { - "epoch": 1.13, - "learning_rate": 1.4345211317269579e-06, - "loss": 0.6465, - "step": 44035 - }, - { - "epoch": 1.13, - "learning_rate": 1.434496209844285e-06, - "loss": 0.6377, - "step": 44036 - }, - { - "epoch": 1.13, - "learning_rate": 1.4344712876289386e-06, - "loss": 0.6836, - "step": 44037 - }, - { - "epoch": 1.13, - "learning_rate": 1.4344463650809377e-06, - "loss": 0.7607, - "step": 44038 - }, - { - "epoch": 1.13, - "learning_rate": 1.4344214422003009e-06, - "loss": 0.6416, - "step": 44039 - }, - { - "epoch": 1.13, - "learning_rate": 1.434396518987048e-06, - "loss": 0.7559, - "step": 44040 - }, - { - "epoch": 1.13, - "learning_rate": 1.4343715954411972e-06, - "loss": 0.6792, - "step": 44041 - }, - { - "epoch": 1.13, - "learning_rate": 1.434346671562768e-06, - "loss": 0.7427, - "step": 44042 - }, - { - "epoch": 1.13, - "learning_rate": 1.4343217473517802e-06, - "loss": 0.5381, - "step": 44043 - }, - { - "epoch": 1.13, - "learning_rate": 1.4342968228082516e-06, - "loss": 0.418, - "step": 44044 - }, - { - "epoch": 1.13, - "learning_rate": 1.434271897932202e-06, - "loss": 0.6445, - "step": 44045 - }, - { - "epoch": 1.13, - "learning_rate": 1.4342469727236506e-06, - "loss": 0.5198, - "step": 44046 - }, - { - "epoch": 1.13, - "learning_rate": 1.4342220471826159e-06, - "loss": 0.7783, - "step": 44047 - }, - { - "epoch": 1.13, - "learning_rate": 1.4341971213091177e-06, - "loss": 0.5786, - "step": 44048 - }, - { - "epoch": 1.13, - "learning_rate": 1.4341721951031745e-06, - "loss": 0.7451, - "step": 44049 - }, - { - "epoch": 1.13, - "learning_rate": 1.4341472685648057e-06, - "loss": 0.7173, - "step": 44050 - }, - { - "epoch": 1.13, - "learning_rate": 1.4341223416940302e-06, - "loss": 0.4885, - "step": 44051 - }, - { - "epoch": 1.13, - "learning_rate": 1.4340974144908673e-06, - "loss": 0.7339, - "step": 44052 - }, - { - "epoch": 1.13, - "learning_rate": 1.434072486955336e-06, - "loss": 0.7539, - "step": 44053 - }, - { - "epoch": 1.13, - "learning_rate": 1.4340475590874555e-06, - "loss": 0.6323, - "step": 44054 - }, - { - "epoch": 1.13, - "learning_rate": 1.4340226308872442e-06, - "loss": 0.624, - "step": 44055 - }, - { - "epoch": 1.13, - "learning_rate": 1.4339977023547222e-06, - "loss": 0.709, - "step": 44056 - }, - { - "epoch": 1.13, - "learning_rate": 1.433972773489908e-06, - "loss": 0.5669, - "step": 44057 - }, - { - "epoch": 1.13, - "learning_rate": 1.4339478442928208e-06, - "loss": 0.5742, - "step": 44058 - }, - { - "epoch": 1.13, - "learning_rate": 1.4339229147634798e-06, - "loss": 0.6367, - "step": 44059 - }, - { - "epoch": 1.13, - "learning_rate": 1.4338979849019036e-06, - "loss": 0.6655, - "step": 44060 - }, - { - "epoch": 1.13, - "learning_rate": 1.433873054708112e-06, - "loss": 0.52, - "step": 44061 - }, - { - "epoch": 1.13, - "learning_rate": 1.4338481241821233e-06, - "loss": 0.5085, - "step": 44062 - }, - { - "epoch": 1.13, - "learning_rate": 1.433823193323958e-06, - "loss": 0.5037, - "step": 44063 - }, - { - "epoch": 1.13, - "learning_rate": 1.4337982621336334e-06, - "loss": 0.3794, - "step": 44064 - }, - { - "epoch": 1.13, - "learning_rate": 1.4337733306111696e-06, - "loss": 0.6201, - "step": 44065 - }, - { - "epoch": 1.13, - "learning_rate": 1.4337483987565854e-06, - "loss": 0.4041, - "step": 44066 - }, - { - "epoch": 1.13, - "learning_rate": 1.4337234665699002e-06, - "loss": 0.8418, - "step": 44067 - }, - { - "epoch": 1.13, - "learning_rate": 1.433698534051133e-06, - "loss": 0.7197, - "step": 44068 - }, - { - "epoch": 1.13, - "learning_rate": 1.4336736012003025e-06, - "loss": 0.584, - "step": 44069 - }, - { - "epoch": 1.13, - "learning_rate": 1.4336486680174282e-06, - "loss": 0.811, - "step": 44070 - }, - { - "epoch": 1.13, - "learning_rate": 1.433623734502529e-06, - "loss": 0.583, - "step": 44071 - }, - { - "epoch": 1.13, - "learning_rate": 1.4335988006556238e-06, - "loss": 0.3262, - "step": 44072 - }, - { - "epoch": 1.13, - "learning_rate": 1.4335738664767328e-06, - "loss": 0.6445, - "step": 44073 - }, - { - "epoch": 1.13, - "learning_rate": 1.4335489319658734e-06, - "loss": 0.5625, - "step": 44074 - }, - { - "epoch": 1.13, - "learning_rate": 1.4335239971230659e-06, - "loss": 0.6206, - "step": 44075 - }, - { - "epoch": 1.13, - "learning_rate": 1.4334990619483288e-06, - "loss": 0.4939, - "step": 44076 - }, - { - "epoch": 1.13, - "learning_rate": 1.4334741264416814e-06, - "loss": 0.6514, - "step": 44077 - }, - { - "epoch": 1.13, - "learning_rate": 1.433449190603143e-06, - "loss": 0.6025, - "step": 44078 - }, - { - "epoch": 1.13, - "learning_rate": 1.4334242544327322e-06, - "loss": 0.7266, - "step": 44079 - }, - { - "epoch": 1.13, - "learning_rate": 1.4333993179304685e-06, - "loss": 0.7617, - "step": 44080 - }, - { - "epoch": 1.13, - "learning_rate": 1.433374381096371e-06, - "loss": 0.5259, - "step": 44081 - }, - { - "epoch": 1.13, - "learning_rate": 1.4333494439304583e-06, - "loss": 0.6567, - "step": 44082 - }, - { - "epoch": 1.13, - "learning_rate": 1.4333245064327503e-06, - "loss": 0.7783, - "step": 44083 - }, - { - "epoch": 1.13, - "learning_rate": 1.4332995686032654e-06, - "loss": 0.7787, - "step": 44084 - }, - { - "epoch": 1.13, - "learning_rate": 1.4332746304420229e-06, - "loss": 0.6958, - "step": 44085 - }, - { - "epoch": 1.13, - "learning_rate": 1.433249691949042e-06, - "loss": 0.7295, - "step": 44086 - }, - { - "epoch": 1.13, - "learning_rate": 1.4332247531243417e-06, - "loss": 0.7451, - "step": 44087 - }, - { - "epoch": 1.13, - "learning_rate": 1.4331998139679416e-06, - "loss": 0.5317, - "step": 44088 - }, - { - "epoch": 1.13, - "learning_rate": 1.4331748744798596e-06, - "loss": 0.5057, - "step": 44089 - }, - { - "epoch": 1.13, - "learning_rate": 1.433149934660116e-06, - "loss": 0.6514, - "step": 44090 - }, - { - "epoch": 1.13, - "learning_rate": 1.4331249945087292e-06, - "loss": 0.8447, - "step": 44091 - }, - { - "epoch": 1.13, - "learning_rate": 1.4331000540257185e-06, - "loss": 0.6553, - "step": 44092 - }, - { - "epoch": 1.13, - "learning_rate": 1.4330751132111032e-06, - "loss": 0.6987, - "step": 44093 - }, - { - "epoch": 1.13, - "learning_rate": 1.4330501720649022e-06, - "loss": 0.5635, - "step": 44094 - }, - { - "epoch": 1.13, - "learning_rate": 1.4330252305871341e-06, - "loss": 0.6123, - "step": 44095 - }, - { - "epoch": 1.13, - "learning_rate": 1.433000288777819e-06, - "loss": 0.7109, - "step": 44096 - }, - { - "epoch": 1.13, - "learning_rate": 1.4329753466369751e-06, - "loss": 0.6855, - "step": 44097 - }, - { - "epoch": 1.13, - "learning_rate": 1.4329504041646225e-06, - "loss": 0.7168, - "step": 44098 - }, - { - "epoch": 1.13, - "learning_rate": 1.4329254613607793e-06, - "loss": 0.6079, - "step": 44099 - }, - { - "epoch": 1.13, - "learning_rate": 1.432900518225465e-06, - "loss": 0.5303, - "step": 44100 - }, - { - "epoch": 1.13, - "learning_rate": 1.4328755747586984e-06, - "loss": 0.6382, - "step": 44101 - }, - { - "epoch": 1.13, - "learning_rate": 1.4328506309604993e-06, - "loss": 0.8174, - "step": 44102 - }, - { - "epoch": 1.13, - "learning_rate": 1.4328256868308862e-06, - "loss": 0.7383, - "step": 44103 - }, - { - "epoch": 1.13, - "learning_rate": 1.4328007423698783e-06, - "loss": 0.6455, - "step": 44104 - }, - { - "epoch": 1.13, - "learning_rate": 1.432775797577495e-06, - "loss": 0.8096, - "step": 44105 - }, - { - "epoch": 1.13, - "learning_rate": 1.4327508524537548e-06, - "loss": 0.8574, - "step": 44106 - }, - { - "epoch": 1.13, - "learning_rate": 1.4327259069986775e-06, - "loss": 0.7061, - "step": 44107 - }, - { - "epoch": 1.13, - "learning_rate": 1.4327009612122818e-06, - "loss": 0.709, - "step": 44108 - }, - { - "epoch": 1.13, - "learning_rate": 1.4326760150945869e-06, - "loss": 0.7979, - "step": 44109 - }, - { - "epoch": 1.13, - "learning_rate": 1.4326510686456117e-06, - "loss": 0.7607, - "step": 44110 - }, - { - "epoch": 1.13, - "learning_rate": 1.4326261218653757e-06, - "loss": 0.6523, - "step": 44111 - }, - { - "epoch": 1.13, - "learning_rate": 1.4326011747538975e-06, - "loss": 0.7422, - "step": 44112 - }, - { - "epoch": 1.13, - "learning_rate": 1.432576227311197e-06, - "loss": 0.6992, - "step": 44113 - }, - { - "epoch": 1.13, - "learning_rate": 1.432551279537292e-06, - "loss": 0.6387, - "step": 44114 - }, - { - "epoch": 1.13, - "learning_rate": 1.4325263314322032e-06, - "loss": 0.5723, - "step": 44115 - }, - { - "epoch": 1.13, - "learning_rate": 1.432501382995948e-06, - "loss": 0.6377, - "step": 44116 - }, - { - "epoch": 1.13, - "learning_rate": 1.4324764342285472e-06, - "loss": 0.6631, - "step": 44117 - }, - { - "epoch": 1.13, - "learning_rate": 1.4324514851300186e-06, - "loss": 0.7148, - "step": 44118 - }, - { - "epoch": 1.13, - "learning_rate": 1.432426535700382e-06, - "loss": 0.7998, - "step": 44119 - }, - { - "epoch": 1.13, - "learning_rate": 1.432401585939656e-06, - "loss": 0.6577, - "step": 44120 - }, - { - "epoch": 1.13, - "learning_rate": 1.4323766358478602e-06, - "loss": 0.7285, - "step": 44121 - }, - { - "epoch": 1.13, - "learning_rate": 1.4323516854250132e-06, - "loss": 0.7617, - "step": 44122 - }, - { - "epoch": 1.13, - "learning_rate": 1.432326734671135e-06, - "loss": 0.5635, - "step": 44123 - }, - { - "epoch": 1.13, - "learning_rate": 1.4323017835862436e-06, - "loss": 0.5353, - "step": 44124 - }, - { - "epoch": 1.13, - "learning_rate": 1.432276832170359e-06, - "loss": 0.7354, - "step": 44125 - }, - { - "epoch": 1.13, - "learning_rate": 1.4322518804234993e-06, - "loss": 0.627, - "step": 44126 - }, - { - "epoch": 1.13, - "learning_rate": 1.4322269283456846e-06, - "loss": 0.8125, - "step": 44127 - }, - { - "epoch": 1.13, - "learning_rate": 1.432201975936934e-06, - "loss": 0.6621, - "step": 44128 - }, - { - "epoch": 1.13, - "learning_rate": 1.4321770231972655e-06, - "loss": 0.4941, - "step": 44129 - }, - { - "epoch": 1.13, - "learning_rate": 1.4321520701266994e-06, - "loss": 0.834, - "step": 44130 - }, - { - "epoch": 1.13, - "learning_rate": 1.4321271167252537e-06, - "loss": 0.7529, - "step": 44131 - }, - { - "epoch": 1.13, - "learning_rate": 1.4321021629929488e-06, - "loss": 0.5182, - "step": 44132 - }, - { - "epoch": 1.13, - "learning_rate": 1.432077208929803e-06, - "loss": 0.6698, - "step": 44133 - }, - { - "epoch": 1.13, - "learning_rate": 1.4320522545358356e-06, - "loss": 0.793, - "step": 44134 - }, - { - "epoch": 1.13, - "learning_rate": 1.4320272998110654e-06, - "loss": 0.6748, - "step": 44135 - }, - { - "epoch": 1.13, - "learning_rate": 1.4320023447555121e-06, - "loss": 0.6738, - "step": 44136 - }, - { - "epoch": 1.13, - "learning_rate": 1.431977389369194e-06, - "loss": 0.5967, - "step": 44137 - }, - { - "epoch": 1.13, - "learning_rate": 1.4319524336521315e-06, - "loss": 0.5518, - "step": 44138 - }, - { - "epoch": 1.13, - "learning_rate": 1.431927477604342e-06, - "loss": 0.5586, - "step": 44139 - }, - { - "epoch": 1.13, - "learning_rate": 1.4319025212258458e-06, - "loss": 0.6465, - "step": 44140 - }, - { - "epoch": 1.13, - "learning_rate": 1.4318775645166617e-06, - "loss": 0.6133, - "step": 44141 - }, - { - "epoch": 1.13, - "learning_rate": 1.431852607476809e-06, - "loss": 0.6689, - "step": 44142 - }, - { - "epoch": 1.13, - "learning_rate": 1.4318276501063062e-06, - "loss": 0.6001, - "step": 44143 - }, - { - "epoch": 1.13, - "learning_rate": 1.4318026924051734e-06, - "loss": 0.5176, - "step": 44144 - }, - { - "epoch": 1.13, - "learning_rate": 1.4317777343734286e-06, - "loss": 0.6455, - "step": 44145 - }, - { - "epoch": 1.13, - "learning_rate": 1.4317527760110917e-06, - "loss": 0.6987, - "step": 44146 - }, - { - "epoch": 1.13, - "learning_rate": 1.4317278173181814e-06, - "loss": 0.6777, - "step": 44147 - }, - { - "epoch": 1.13, - "learning_rate": 1.431702858294717e-06, - "loss": 0.6479, - "step": 44148 - }, - { - "epoch": 1.13, - "learning_rate": 1.4316778989407176e-06, - "loss": 0.6328, - "step": 44149 - }, - { - "epoch": 1.13, - "learning_rate": 1.4316529392562023e-06, - "loss": 0.7148, - "step": 44150 - }, - { - "epoch": 1.13, - "learning_rate": 1.4316279792411902e-06, - "loss": 0.6675, - "step": 44151 - }, - { - "epoch": 1.13, - "learning_rate": 1.4316030188957004e-06, - "loss": 0.7754, - "step": 44152 - }, - { - "epoch": 1.13, - "learning_rate": 1.4315780582197521e-06, - "loss": 0.5217, - "step": 44153 - }, - { - "epoch": 1.13, - "learning_rate": 1.4315530972133642e-06, - "loss": 0.6138, - "step": 44154 - }, - { - "epoch": 1.13, - "learning_rate": 1.4315281358765561e-06, - "loss": 0.5688, - "step": 44155 - }, - { - "epoch": 1.13, - "learning_rate": 1.4315031742093464e-06, - "loss": 0.5968, - "step": 44156 - }, - { - "epoch": 1.13, - "learning_rate": 1.431478212211755e-06, - "loss": 0.6475, - "step": 44157 - }, - { - "epoch": 1.13, - "learning_rate": 1.4314532498838004e-06, - "loss": 0.605, - "step": 44158 - }, - { - "epoch": 1.13, - "learning_rate": 1.431428287225502e-06, - "loss": 0.5669, - "step": 44159 - }, - { - "epoch": 1.13, - "learning_rate": 1.4314033242368784e-06, - "loss": 0.7412, - "step": 44160 - }, - { - "epoch": 1.13, - "learning_rate": 1.4313783609179493e-06, - "loss": 0.5176, - "step": 44161 - }, - { - "epoch": 1.13, - "learning_rate": 1.4313533972687337e-06, - "loss": 0.7646, - "step": 44162 - }, - { - "epoch": 1.13, - "learning_rate": 1.4313284332892508e-06, - "loss": 0.9551, - "step": 44163 - }, - { - "epoch": 1.13, - "learning_rate": 1.4313034689795193e-06, - "loss": 0.697, - "step": 44164 - }, - { - "epoch": 1.13, - "learning_rate": 1.4312785043395587e-06, - "loss": 0.5043, - "step": 44165 - }, - { - "epoch": 1.13, - "learning_rate": 1.4312535393693876e-06, - "loss": 0.6445, - "step": 44166 - }, - { - "epoch": 1.13, - "learning_rate": 1.431228574069026e-06, - "loss": 0.6807, - "step": 44167 - }, - { - "epoch": 1.13, - "learning_rate": 1.4312036084384923e-06, - "loss": 0.2842, - "step": 44168 - }, - { - "epoch": 1.13, - "learning_rate": 1.4311786424778058e-06, - "loss": 0.5378, - "step": 44169 - }, - { - "epoch": 1.13, - "learning_rate": 1.4311536761869857e-06, - "loss": 0.5957, - "step": 44170 - }, - { - "epoch": 1.13, - "learning_rate": 1.4311287095660512e-06, - "loss": 0.7461, - "step": 44171 - }, - { - "epoch": 1.13, - "learning_rate": 1.4311037426150213e-06, - "loss": 0.6143, - "step": 44172 - }, - { - "epoch": 1.13, - "learning_rate": 1.4310787753339147e-06, - "loss": 0.707, - "step": 44173 - }, - { - "epoch": 1.13, - "learning_rate": 1.4310538077227512e-06, - "loss": 0.7783, - "step": 44174 - }, - { - "epoch": 1.13, - "learning_rate": 1.4310288397815493e-06, - "loss": 0.7217, - "step": 44175 - }, - { - "epoch": 1.13, - "learning_rate": 1.4310038715103288e-06, - "loss": 0.7002, - "step": 44176 - }, - { - "epoch": 1.13, - "learning_rate": 1.4309789029091085e-06, - "loss": 0.5928, - "step": 44177 - }, - { - "epoch": 1.13, - "learning_rate": 1.4309539339779072e-06, - "loss": 0.8125, - "step": 44178 - }, - { - "epoch": 1.13, - "learning_rate": 1.4309289647167442e-06, - "loss": 0.6064, - "step": 44179 - }, - { - "epoch": 1.13, - "learning_rate": 1.430903995125639e-06, - "loss": 0.5884, - "step": 44180 - }, - { - "epoch": 1.13, - "learning_rate": 1.43087902520461e-06, - "loss": 0.5439, - "step": 44181 - }, - { - "epoch": 1.13, - "learning_rate": 1.4308540549536775e-06, - "loss": 0.666, - "step": 44182 - }, - { - "epoch": 1.13, - "learning_rate": 1.4308290843728592e-06, - "loss": 0.6826, - "step": 44183 - }, - { - "epoch": 1.13, - "learning_rate": 1.4308041134621752e-06, - "loss": 0.7305, - "step": 44184 - }, - { - "epoch": 1.13, - "learning_rate": 1.430779142221644e-06, - "loss": 0.7041, - "step": 44185 - }, - { - "epoch": 1.13, - "learning_rate": 1.4307541706512854e-06, - "loss": 0.6328, - "step": 44186 - }, - { - "epoch": 1.13, - "learning_rate": 1.4307291987511179e-06, - "loss": 0.5923, - "step": 44187 - }, - { - "epoch": 1.13, - "learning_rate": 1.430704226521161e-06, - "loss": 0.6182, - "step": 44188 - }, - { - "epoch": 1.13, - "learning_rate": 1.4306792539614334e-06, - "loss": 0.6797, - "step": 44189 - }, - { - "epoch": 1.13, - "learning_rate": 1.4306542810719546e-06, - "loss": 0.7627, - "step": 44190 - }, - { - "epoch": 1.13, - "learning_rate": 1.4306293078527437e-06, - "loss": 0.499, - "step": 44191 - }, - { - "epoch": 1.13, - "learning_rate": 1.4306043343038199e-06, - "loss": 0.624, - "step": 44192 - }, - { - "epoch": 1.13, - "learning_rate": 1.4305793604252019e-06, - "loss": 0.6646, - "step": 44193 - }, - { - "epoch": 1.13, - "learning_rate": 1.4305543862169089e-06, - "loss": 0.5522, - "step": 44194 - }, - { - "epoch": 1.13, - "learning_rate": 1.4305294116789608e-06, - "loss": 0.4971, - "step": 44195 - }, - { - "epoch": 1.13, - "learning_rate": 1.4305044368113757e-06, - "loss": 0.7207, - "step": 44196 - }, - { - "epoch": 1.13, - "learning_rate": 1.4304794616141735e-06, - "loss": 0.6177, - "step": 44197 - }, - { - "epoch": 1.13, - "learning_rate": 1.4304544860873727e-06, - "loss": 0.6543, - "step": 44198 - }, - { - "epoch": 1.13, - "learning_rate": 1.4304295102309927e-06, - "loss": 0.7178, - "step": 44199 - }, - { - "epoch": 1.13, - "learning_rate": 1.4304045340450524e-06, - "loss": 0.5107, - "step": 44200 - }, - { - "epoch": 1.13, - "learning_rate": 1.4303795575295713e-06, - "loss": 0.7275, - "step": 44201 - }, - { - "epoch": 1.13, - "learning_rate": 1.4303545806845687e-06, - "loss": 0.6523, - "step": 44202 - }, - { - "epoch": 1.13, - "learning_rate": 1.4303296035100631e-06, - "loss": 0.7314, - "step": 44203 - }, - { - "epoch": 1.13, - "learning_rate": 1.4303046260060738e-06, - "loss": 0.5933, - "step": 44204 - }, - { - "epoch": 1.13, - "learning_rate": 1.4302796481726202e-06, - "loss": 0.6821, - "step": 44205 - }, - { - "epoch": 1.13, - "learning_rate": 1.4302546700097212e-06, - "loss": 0.7188, - "step": 44206 - }, - { - "epoch": 1.13, - "learning_rate": 1.4302296915173962e-06, - "loss": 0.7734, - "step": 44207 - }, - { - "epoch": 1.13, - "learning_rate": 1.4302047126956637e-06, - "loss": 0.5981, - "step": 44208 - }, - { - "epoch": 1.13, - "learning_rate": 1.4301797335445437e-06, - "loss": 0.5488, - "step": 44209 - }, - { - "epoch": 1.13, - "learning_rate": 1.4301547540640544e-06, - "loss": 0.6611, - "step": 44210 - }, - { - "epoch": 1.13, - "learning_rate": 1.4301297742542156e-06, - "loss": 0.709, - "step": 44211 - }, - { - "epoch": 1.13, - "learning_rate": 1.4301047941150465e-06, - "loss": 0.8447, - "step": 44212 - }, - { - "epoch": 1.13, - "learning_rate": 1.4300798136465653e-06, - "loss": 0.6807, - "step": 44213 - }, - { - "epoch": 1.13, - "learning_rate": 1.4300548328487922e-06, - "loss": 0.7197, - "step": 44214 - }, - { - "epoch": 1.13, - "learning_rate": 1.4300298517217458e-06, - "loss": 0.731, - "step": 44215 - }, - { - "epoch": 1.13, - "learning_rate": 1.4300048702654453e-06, - "loss": 0.7051, - "step": 44216 - }, - { - "epoch": 1.13, - "learning_rate": 1.42997988847991e-06, - "loss": 0.5603, - "step": 44217 - }, - { - "epoch": 1.13, - "learning_rate": 1.4299549063651586e-06, - "loss": 0.5225, - "step": 44218 - }, - { - "epoch": 1.13, - "learning_rate": 1.4299299239212105e-06, - "loss": 0.6768, - "step": 44219 - }, - { - "epoch": 1.13, - "learning_rate": 1.429904941148085e-06, - "loss": 0.5557, - "step": 44220 - }, - { - "epoch": 1.13, - "learning_rate": 1.4298799580458008e-06, - "loss": 0.624, - "step": 44221 - }, - { - "epoch": 1.13, - "learning_rate": 1.4298549746143778e-06, - "loss": 0.5713, - "step": 44222 - }, - { - "epoch": 1.13, - "learning_rate": 1.429829990853834e-06, - "loss": 0.7598, - "step": 44223 - }, - { - "epoch": 1.13, - "learning_rate": 1.4298050067641895e-06, - "loss": 0.6982, - "step": 44224 - }, - { - "epoch": 1.13, - "learning_rate": 1.429780022345463e-06, - "loss": 0.6621, - "step": 44225 - }, - { - "epoch": 1.13, - "learning_rate": 1.4297550375976738e-06, - "loss": 0.6108, - "step": 44226 - }, - { - "epoch": 1.13, - "learning_rate": 1.4297300525208406e-06, - "loss": 0.5669, - "step": 44227 - }, - { - "epoch": 1.13, - "learning_rate": 1.4297050671149834e-06, - "loss": 0.574, - "step": 44228 - }, - { - "epoch": 1.13, - "learning_rate": 1.4296800813801201e-06, - "loss": 0.6611, - "step": 44229 - }, - { - "epoch": 1.13, - "learning_rate": 1.4296550953162712e-06, - "loss": 0.5063, - "step": 44230 - }, - { - "epoch": 1.13, - "learning_rate": 1.4296301089234546e-06, - "loss": 0.5537, - "step": 44231 - }, - { - "epoch": 1.13, - "learning_rate": 1.4296051222016902e-06, - "loss": 0.6982, - "step": 44232 - }, - { - "epoch": 1.13, - "learning_rate": 1.429580135150997e-06, - "loss": 0.834, - "step": 44233 - }, - { - "epoch": 1.13, - "learning_rate": 1.429555147771394e-06, - "loss": 0.605, - "step": 44234 - }, - { - "epoch": 1.13, - "learning_rate": 1.4295301600629004e-06, - "loss": 0.625, - "step": 44235 - }, - { - "epoch": 1.13, - "learning_rate": 1.4295051720255352e-06, - "loss": 0.793, - "step": 44236 - }, - { - "epoch": 1.13, - "learning_rate": 1.4294801836593178e-06, - "loss": 0.6089, - "step": 44237 - }, - { - "epoch": 1.13, - "learning_rate": 1.429455194964267e-06, - "loss": 0.5757, - "step": 44238 - }, - { - "epoch": 1.13, - "learning_rate": 1.4294302059404022e-06, - "loss": 0.5209, - "step": 44239 - }, - { - "epoch": 1.13, - "learning_rate": 1.4294052165877423e-06, - "loss": 0.4795, - "step": 44240 - }, - { - "epoch": 1.13, - "learning_rate": 1.4293802269063067e-06, - "loss": 0.7451, - "step": 44241 - }, - { - "epoch": 1.13, - "learning_rate": 1.4293552368961143e-06, - "loss": 0.7881, - "step": 44242 - }, - { - "epoch": 1.13, - "learning_rate": 1.4293302465571847e-06, - "loss": 0.7373, - "step": 44243 - }, - { - "epoch": 1.13, - "learning_rate": 1.4293052558895361e-06, - "loss": 0.5981, - "step": 44244 - }, - { - "epoch": 1.13, - "learning_rate": 1.4292802648931886e-06, - "loss": 0.7222, - "step": 44245 - }, - { - "epoch": 1.13, - "learning_rate": 1.429255273568161e-06, - "loss": 0.4907, - "step": 44246 - }, - { - "epoch": 1.13, - "learning_rate": 1.429230281914472e-06, - "loss": 0.5269, - "step": 44247 - }, - { - "epoch": 1.13, - "learning_rate": 1.4292052899321414e-06, - "loss": 0.5947, - "step": 44248 - }, - { - "epoch": 1.13, - "learning_rate": 1.4291802976211881e-06, - "loss": 0.7393, - "step": 44249 - }, - { - "epoch": 1.13, - "learning_rate": 1.429155304981631e-06, - "loss": 0.7656, - "step": 44250 - }, - { - "epoch": 1.13, - "learning_rate": 1.4291303120134895e-06, - "loss": 0.6465, - "step": 44251 - }, - { - "epoch": 1.13, - "learning_rate": 1.4291053187167826e-06, - "loss": 0.7012, - "step": 44252 - }, - { - "epoch": 1.13, - "learning_rate": 1.4290803250915296e-06, - "loss": 0.5879, - "step": 44253 - }, - { - "epoch": 1.13, - "learning_rate": 1.4290553311377492e-06, - "loss": 0.7578, - "step": 44254 - }, - { - "epoch": 1.13, - "learning_rate": 1.4290303368554613e-06, - "loss": 0.6455, - "step": 44255 - }, - { - "epoch": 1.13, - "learning_rate": 1.4290053422446842e-06, - "loss": 0.6646, - "step": 44256 - }, - { - "epoch": 1.13, - "learning_rate": 1.4289803473054375e-06, - "loss": 0.6165, - "step": 44257 - }, - { - "epoch": 1.13, - "learning_rate": 1.4289553520377406e-06, - "loss": 0.4331, - "step": 44258 - }, - { - "epoch": 1.13, - "learning_rate": 1.428930356441612e-06, - "loss": 0.54, - "step": 44259 - }, - { - "epoch": 1.13, - "learning_rate": 1.4289053605170714e-06, - "loss": 0.5234, - "step": 44260 - }, - { - "epoch": 1.13, - "learning_rate": 1.4288803642641374e-06, - "loss": 0.5591, - "step": 44261 - }, - { - "epoch": 1.13, - "learning_rate": 1.4288553676828297e-06, - "loss": 0.479, - "step": 44262 - }, - { - "epoch": 1.13, - "learning_rate": 1.4288303707731668e-06, - "loss": 0.4382, - "step": 44263 - }, - { - "epoch": 1.13, - "learning_rate": 1.4288053735351686e-06, - "loss": 0.5406, - "step": 44264 - }, - { - "epoch": 1.13, - "learning_rate": 1.4287803759688535e-06, - "loss": 0.5291, - "step": 44265 - }, - { - "epoch": 1.13, - "learning_rate": 1.4287553780742415e-06, - "loss": 0.7832, - "step": 44266 - }, - { - "epoch": 1.13, - "learning_rate": 1.4287303798513507e-06, - "loss": 0.4524, - "step": 44267 - }, - { - "epoch": 1.13, - "learning_rate": 1.428705381300201e-06, - "loss": 0.8389, - "step": 44268 - }, - { - "epoch": 1.13, - "learning_rate": 1.4286803824208112e-06, - "loss": 0.4666, - "step": 44269 - }, - { - "epoch": 1.13, - "learning_rate": 1.4286553832132008e-06, - "loss": 0.627, - "step": 44270 - }, - { - "epoch": 1.13, - "learning_rate": 1.428630383677388e-06, - "loss": 0.6946, - "step": 44271 - }, - { - "epoch": 1.13, - "learning_rate": 1.4286053838133936e-06, - "loss": 0.792, - "step": 44272 - }, - { - "epoch": 1.13, - "learning_rate": 1.428580383621235e-06, - "loss": 0.5703, - "step": 44273 - }, - { - "epoch": 1.13, - "learning_rate": 1.4285553831009325e-06, - "loss": 0.5352, - "step": 44274 - }, - { - "epoch": 1.13, - "learning_rate": 1.4285303822525046e-06, - "loss": 0.6104, - "step": 44275 - }, - { - "epoch": 1.13, - "learning_rate": 1.428505381075971e-06, - "loss": 0.6709, - "step": 44276 - }, - { - "epoch": 1.13, - "learning_rate": 1.4284803795713502e-06, - "loss": 0.7056, - "step": 44277 - }, - { - "epoch": 1.13, - "learning_rate": 1.4284553777386618e-06, - "loss": 0.6367, - "step": 44278 - }, - { - "epoch": 1.13, - "learning_rate": 1.4284303755779248e-06, - "loss": 0.6094, - "step": 44279 - }, - { - "epoch": 1.13, - "learning_rate": 1.4284053730891583e-06, - "loss": 0.7402, - "step": 44280 - }, - { - "epoch": 1.13, - "learning_rate": 1.4283803702723816e-06, - "loss": 0.6523, - "step": 44281 - }, - { - "epoch": 1.13, - "learning_rate": 1.428355367127614e-06, - "loss": 0.6729, - "step": 44282 - }, - { - "epoch": 1.13, - "learning_rate": 1.428330363654874e-06, - "loss": 0.5771, - "step": 44283 - }, - { - "epoch": 1.14, - "learning_rate": 1.428305359854181e-06, - "loss": 0.8066, - "step": 44284 - }, - { - "epoch": 1.14, - "learning_rate": 1.4282803557255548e-06, - "loss": 0.5801, - "step": 44285 - }, - { - "epoch": 1.14, - "learning_rate": 1.4282553512690137e-06, - "loss": 0.6294, - "step": 44286 - }, - { - "epoch": 1.14, - "learning_rate": 1.4282303464845775e-06, - "loss": 0.644, - "step": 44287 - }, - { - "epoch": 1.14, - "learning_rate": 1.4282053413722646e-06, - "loss": 0.7744, - "step": 44288 - }, - { - "epoch": 1.14, - "learning_rate": 1.4281803359320948e-06, - "loss": 0.5835, - "step": 44289 - }, - { - "epoch": 1.14, - "learning_rate": 1.4281553301640867e-06, - "loss": 0.7656, - "step": 44290 - }, - { - "epoch": 1.14, - "learning_rate": 1.42813032406826e-06, - "loss": 0.6602, - "step": 44291 - }, - { - "epoch": 1.14, - "learning_rate": 1.4281053176446336e-06, - "loss": 0.7793, - "step": 44292 - }, - { - "epoch": 1.14, - "learning_rate": 1.4280803108932266e-06, - "loss": 0.6028, - "step": 44293 - }, - { - "epoch": 1.14, - "learning_rate": 1.4280553038140583e-06, - "loss": 0.834, - "step": 44294 - }, - { - "epoch": 1.14, - "learning_rate": 1.4280302964071475e-06, - "loss": 0.5098, - "step": 44295 - }, - { - "epoch": 1.14, - "learning_rate": 1.4280052886725137e-06, - "loss": 0.6533, - "step": 44296 - }, - { - "epoch": 1.14, - "learning_rate": 1.4279802806101762e-06, - "loss": 0.6523, - "step": 44297 - }, - { - "epoch": 1.14, - "learning_rate": 1.4279552722201535e-06, - "loss": 0.8213, - "step": 44298 - }, - { - "epoch": 1.14, - "learning_rate": 1.4279302635024656e-06, - "loss": 0.4563, - "step": 44299 - }, - { - "epoch": 1.14, - "learning_rate": 1.4279052544571305e-06, - "loss": 0.5405, - "step": 44300 - }, - { - "epoch": 1.14, - "learning_rate": 1.4278802450841685e-06, - "loss": 0.5757, - "step": 44301 - }, - { - "epoch": 1.14, - "learning_rate": 1.427855235383598e-06, - "loss": 0.6758, - "step": 44302 - }, - { - "epoch": 1.14, - "learning_rate": 1.4278302253554385e-06, - "loss": 0.4941, - "step": 44303 - }, - { - "epoch": 1.14, - "learning_rate": 1.4278052149997093e-06, - "loss": 0.4082, - "step": 44304 - }, - { - "epoch": 1.14, - "learning_rate": 1.427780204316429e-06, - "loss": 0.5508, - "step": 44305 - }, - { - "epoch": 1.14, - "learning_rate": 1.4277551933056172e-06, - "loss": 0.9014, - "step": 44306 - }, - { - "epoch": 1.14, - "learning_rate": 1.4277301819672928e-06, - "loss": 0.6611, - "step": 44307 - }, - { - "epoch": 1.14, - "learning_rate": 1.4277051703014754e-06, - "loss": 0.7183, - "step": 44308 - }, - { - "epoch": 1.14, - "learning_rate": 1.4276801583081835e-06, - "loss": 0.6128, - "step": 44309 - }, - { - "epoch": 1.14, - "learning_rate": 1.4276551459874366e-06, - "loss": 0.5083, - "step": 44310 - }, - { - "epoch": 1.14, - "learning_rate": 1.4276301333392537e-06, - "loss": 0.6167, - "step": 44311 - }, - { - "epoch": 1.14, - "learning_rate": 1.4276051203636548e-06, - "loss": 0.5935, - "step": 44312 - }, - { - "epoch": 1.14, - "learning_rate": 1.4275801070606576e-06, - "loss": 0.4456, - "step": 44313 - }, - { - "epoch": 1.14, - "learning_rate": 1.427555093430282e-06, - "loss": 0.5576, - "step": 44314 - }, - { - "epoch": 1.14, - "learning_rate": 1.4275300794725472e-06, - "loss": 0.6602, - "step": 44315 - }, - { - "epoch": 1.14, - "learning_rate": 1.4275050651874725e-06, - "loss": 0.7266, - "step": 44316 - }, - { - "epoch": 1.14, - "learning_rate": 1.4274800505750769e-06, - "loss": 0.7021, - "step": 44317 - }, - { - "epoch": 1.14, - "learning_rate": 1.4274550356353793e-06, - "loss": 0.6328, - "step": 44318 - }, - { - "epoch": 1.14, - "learning_rate": 1.4274300203683987e-06, - "loss": 0.6147, - "step": 44319 - }, - { - "epoch": 1.14, - "learning_rate": 1.4274050047741551e-06, - "loss": 0.5063, - "step": 44320 - }, - { - "epoch": 1.14, - "learning_rate": 1.4273799888526665e-06, - "loss": 0.7852, - "step": 44321 - }, - { - "epoch": 1.14, - "learning_rate": 1.4273549726039534e-06, - "loss": 0.707, - "step": 44322 - }, - { - "epoch": 1.14, - "learning_rate": 1.427329956028034e-06, - "loss": 0.8604, - "step": 44323 - }, - { - "epoch": 1.14, - "learning_rate": 1.4273049391249277e-06, - "loss": 0.6592, - "step": 44324 - }, - { - "epoch": 1.14, - "learning_rate": 1.4272799218946533e-06, - "loss": 0.6592, - "step": 44325 - }, - { - "epoch": 1.14, - "learning_rate": 1.427254904337231e-06, - "loss": 0.6279, - "step": 44326 - }, - { - "epoch": 1.14, - "learning_rate": 1.4272298864526788e-06, - "loss": 0.7197, - "step": 44327 - }, - { - "epoch": 1.14, - "learning_rate": 1.4272048682410164e-06, - "loss": 0.728, - "step": 44328 - }, - { - "epoch": 1.14, - "learning_rate": 1.4271798497022629e-06, - "loss": 0.6396, - "step": 44329 - }, - { - "epoch": 1.14, - "learning_rate": 1.4271548308364373e-06, - "loss": 0.603, - "step": 44330 - }, - { - "epoch": 1.14, - "learning_rate": 1.427129811643559e-06, - "loss": 0.6145, - "step": 44331 - }, - { - "epoch": 1.14, - "learning_rate": 1.4271047921236472e-06, - "loss": 0.3169, - "step": 44332 - }, - { - "epoch": 1.14, - "learning_rate": 1.4270797722767208e-06, - "loss": 0.749, - "step": 44333 - }, - { - "epoch": 1.14, - "learning_rate": 1.427054752102799e-06, - "loss": 0.6484, - "step": 44334 - }, - { - "epoch": 1.14, - "learning_rate": 1.427029731601901e-06, - "loss": 0.7871, - "step": 44335 - }, - { - "epoch": 1.14, - "learning_rate": 1.427004710774046e-06, - "loss": 0.4808, - "step": 44336 - }, - { - "epoch": 1.14, - "learning_rate": 1.4269796896192533e-06, - "loss": 0.7134, - "step": 44337 - }, - { - "epoch": 1.14, - "learning_rate": 1.4269546681375416e-06, - "loss": 0.6797, - "step": 44338 - }, - { - "epoch": 1.14, - "learning_rate": 1.4269296463289304e-06, - "loss": 0.4907, - "step": 44339 - }, - { - "epoch": 1.14, - "learning_rate": 1.426904624193439e-06, - "loss": 0.7153, - "step": 44340 - }, - { - "epoch": 1.14, - "learning_rate": 1.426879601731086e-06, - "loss": 0.6611, - "step": 44341 - }, - { - "epoch": 1.14, - "learning_rate": 1.4268545789418914e-06, - "loss": 0.6855, - "step": 44342 - }, - { - "epoch": 1.14, - "learning_rate": 1.4268295558258734e-06, - "loss": 0.8154, - "step": 44343 - }, - { - "epoch": 1.14, - "learning_rate": 1.4268045323830518e-06, - "loss": 0.7305, - "step": 44344 - }, - { - "epoch": 1.14, - "learning_rate": 1.4267795086134459e-06, - "loss": 0.7969, - "step": 44345 - }, - { - "epoch": 1.14, - "learning_rate": 1.4267544845170741e-06, - "loss": 0.8291, - "step": 44346 - }, - { - "epoch": 1.14, - "learning_rate": 1.426729460093956e-06, - "loss": 0.8408, - "step": 44347 - }, - { - "epoch": 1.14, - "learning_rate": 1.426704435344111e-06, - "loss": 0.7334, - "step": 44348 - }, - { - "epoch": 1.14, - "learning_rate": 1.4266794102675581e-06, - "loss": 0.606, - "step": 44349 - }, - { - "epoch": 1.14, - "learning_rate": 1.4266543848643164e-06, - "loss": 0.6943, - "step": 44350 - }, - { - "epoch": 1.14, - "learning_rate": 1.426629359134405e-06, - "loss": 0.626, - "step": 44351 - }, - { - "epoch": 1.14, - "learning_rate": 1.4266043330778431e-06, - "loss": 0.7139, - "step": 44352 - }, - { - "epoch": 1.14, - "learning_rate": 1.4265793066946497e-06, - "loss": 0.5408, - "step": 44353 - }, - { - "epoch": 1.14, - "learning_rate": 1.4265542799848444e-06, - "loss": 0.6455, - "step": 44354 - }, - { - "epoch": 1.14, - "learning_rate": 1.426529252948446e-06, - "loss": 0.5405, - "step": 44355 - }, - { - "epoch": 1.14, - "learning_rate": 1.4265042255854738e-06, - "loss": 0.5854, - "step": 44356 - }, - { - "epoch": 1.14, - "learning_rate": 1.4264791978959468e-06, - "loss": 0.509, - "step": 44357 - }, - { - "epoch": 1.14, - "learning_rate": 1.4264541698798844e-06, - "loss": 0.6328, - "step": 44358 - }, - { - "epoch": 1.14, - "learning_rate": 1.4264291415373056e-06, - "loss": 0.5903, - "step": 44359 - }, - { - "epoch": 1.14, - "learning_rate": 1.4264041128682296e-06, - "loss": 0.5137, - "step": 44360 - }, - { - "epoch": 1.14, - "learning_rate": 1.4263790838726754e-06, - "loss": 0.709, - "step": 44361 - }, - { - "epoch": 1.14, - "learning_rate": 1.426354054550663e-06, - "loss": 0.7246, - "step": 44362 - }, - { - "epoch": 1.14, - "learning_rate": 1.4263290249022104e-06, - "loss": 0.6616, - "step": 44363 - }, - { - "epoch": 1.14, - "learning_rate": 1.4263039949273373e-06, - "loss": 0.7065, - "step": 44364 - }, - { - "epoch": 1.14, - "learning_rate": 1.4262789646260627e-06, - "loss": 0.4616, - "step": 44365 - }, - { - "epoch": 1.14, - "learning_rate": 1.426253933998406e-06, - "loss": 0.7568, - "step": 44366 - }, - { - "epoch": 1.14, - "learning_rate": 1.4262289030443866e-06, - "loss": 0.7295, - "step": 44367 - }, - { - "epoch": 1.14, - "learning_rate": 1.426203871764023e-06, - "loss": 0.4946, - "step": 44368 - }, - { - "epoch": 1.14, - "learning_rate": 1.4261788401573348e-06, - "loss": 0.6875, - "step": 44369 - }, - { - "epoch": 1.14, - "learning_rate": 1.4261538082243409e-06, - "loss": 0.6367, - "step": 44370 - }, - { - "epoch": 1.14, - "learning_rate": 1.4261287759650607e-06, - "loss": 0.6006, - "step": 44371 - }, - { - "epoch": 1.14, - "learning_rate": 1.4261037433795132e-06, - "loss": 0.5771, - "step": 44372 - }, - { - "epoch": 1.14, - "learning_rate": 1.4260787104677179e-06, - "loss": 0.449, - "step": 44373 - }, - { - "epoch": 1.14, - "learning_rate": 1.4260536772296935e-06, - "loss": 0.7656, - "step": 44374 - }, - { - "epoch": 1.14, - "learning_rate": 1.4260286436654596e-06, - "loss": 0.6729, - "step": 44375 - }, - { - "epoch": 1.14, - "learning_rate": 1.426003609775035e-06, - "loss": 0.6484, - "step": 44376 - }, - { - "epoch": 1.14, - "learning_rate": 1.4259785755584392e-06, - "loss": 0.5574, - "step": 44377 - }, - { - "epoch": 1.14, - "learning_rate": 1.4259535410156908e-06, - "loss": 0.7373, - "step": 44378 - }, - { - "epoch": 1.14, - "learning_rate": 1.42592850614681e-06, - "loss": 0.8604, - "step": 44379 - }, - { - "epoch": 1.14, - "learning_rate": 1.4259034709518146e-06, - "loss": 0.7627, - "step": 44380 - }, - { - "epoch": 1.14, - "learning_rate": 1.425878435430725e-06, - "loss": 0.751, - "step": 44381 - }, - { - "epoch": 1.14, - "learning_rate": 1.4258533995835596e-06, - "loss": 0.707, - "step": 44382 - }, - { - "epoch": 1.14, - "learning_rate": 1.4258283634103382e-06, - "loss": 0.5405, - "step": 44383 - }, - { - "epoch": 1.14, - "learning_rate": 1.4258033269110792e-06, - "loss": 0.6279, - "step": 44384 - }, - { - "epoch": 1.14, - "learning_rate": 1.425778290085802e-06, - "loss": 0.4811, - "step": 44385 - }, - { - "epoch": 1.14, - "learning_rate": 1.4257532529345264e-06, - "loss": 0.7725, - "step": 44386 - }, - { - "epoch": 1.14, - "learning_rate": 1.425728215457271e-06, - "loss": 0.7432, - "step": 44387 - }, - { - "epoch": 1.14, - "learning_rate": 1.425703177654055e-06, - "loss": 0.6035, - "step": 44388 - }, - { - "epoch": 1.14, - "learning_rate": 1.4256781395248978e-06, - "loss": 0.8525, - "step": 44389 - }, - { - "epoch": 1.14, - "learning_rate": 1.4256531010698184e-06, - "loss": 0.5005, - "step": 44390 - }, - { - "epoch": 1.14, - "learning_rate": 1.425628062288836e-06, - "loss": 0.6436, - "step": 44391 - }, - { - "epoch": 1.14, - "learning_rate": 1.4256030231819696e-06, - "loss": 0.7959, - "step": 44392 - }, - { - "epoch": 1.14, - "learning_rate": 1.4255779837492386e-06, - "loss": 0.7383, - "step": 44393 - }, - { - "epoch": 1.14, - "learning_rate": 1.4255529439906622e-06, - "loss": 0.6914, - "step": 44394 - }, - { - "epoch": 1.14, - "learning_rate": 1.425527903906259e-06, - "loss": 0.5504, - "step": 44395 - }, - { - "epoch": 1.14, - "learning_rate": 1.425502863496049e-06, - "loss": 0.5854, - "step": 44396 - }, - { - "epoch": 1.14, - "learning_rate": 1.4254778227600515e-06, - "loss": 0.6582, - "step": 44397 - }, - { - "epoch": 1.14, - "learning_rate": 1.4254527816982847e-06, - "loss": 0.6875, - "step": 44398 - }, - { - "epoch": 1.14, - "learning_rate": 1.4254277403107681e-06, - "loss": 0.5049, - "step": 44399 - }, - { - "epoch": 1.14, - "learning_rate": 1.4254026985975214e-06, - "loss": 0.7227, - "step": 44400 - }, - { - "epoch": 1.14, - "learning_rate": 1.4253776565585632e-06, - "loss": 0.5518, - "step": 44401 - }, - { - "epoch": 1.14, - "learning_rate": 1.4253526141939132e-06, - "loss": 0.5903, - "step": 44402 - }, - { - "epoch": 1.14, - "learning_rate": 1.42532757150359e-06, - "loss": 0.468, - "step": 44403 - }, - { - "epoch": 1.14, - "learning_rate": 1.425302528487613e-06, - "loss": 0.4937, - "step": 44404 - }, - { - "epoch": 1.14, - "learning_rate": 1.4252774851460015e-06, - "loss": 0.5916, - "step": 44405 - }, - { - "epoch": 1.14, - "learning_rate": 1.4252524414787745e-06, - "loss": 0.7202, - "step": 44406 - }, - { - "epoch": 1.14, - "learning_rate": 1.4252273974859514e-06, - "loss": 0.7451, - "step": 44407 - }, - { - "epoch": 1.14, - "learning_rate": 1.4252023531675513e-06, - "loss": 0.666, - "step": 44408 - }, - { - "epoch": 1.14, - "learning_rate": 1.425177308523593e-06, - "loss": 0.6367, - "step": 44409 - }, - { - "epoch": 1.14, - "learning_rate": 1.4251522635540962e-06, - "loss": 0.7295, - "step": 44410 - }, - { - "epoch": 1.14, - "learning_rate": 1.4251272182590796e-06, - "loss": 0.5283, - "step": 44411 - }, - { - "epoch": 1.14, - "learning_rate": 1.425102172638563e-06, - "loss": 0.4761, - "step": 44412 - }, - { - "epoch": 1.14, - "learning_rate": 1.4250771266925652e-06, - "loss": 0.6443, - "step": 44413 - }, - { - "epoch": 1.14, - "learning_rate": 1.4250520804211053e-06, - "loss": 0.7588, - "step": 44414 - }, - { - "epoch": 1.14, - "learning_rate": 1.4250270338242023e-06, - "loss": 0.6826, - "step": 44415 - }, - { - "epoch": 1.14, - "learning_rate": 1.425001986901876e-06, - "loss": 0.6943, - "step": 44416 - }, - { - "epoch": 1.14, - "learning_rate": 1.4249769396541451e-06, - "loss": 0.7827, - "step": 44417 - }, - { - "epoch": 1.14, - "learning_rate": 1.4249518920810285e-06, - "loss": 0.9541, - "step": 44418 - }, - { - "epoch": 1.14, - "learning_rate": 1.4249268441825465e-06, - "loss": 0.5547, - "step": 44419 - }, - { - "epoch": 1.14, - "learning_rate": 1.4249017959587172e-06, - "loss": 0.7129, - "step": 44420 - }, - { - "epoch": 1.14, - "learning_rate": 1.42487674740956e-06, - "loss": 0.4912, - "step": 44421 - }, - { - "epoch": 1.14, - "learning_rate": 1.4248516985350945e-06, - "loss": 0.6284, - "step": 44422 - }, - { - "epoch": 1.14, - "learning_rate": 1.4248266493353396e-06, - "loss": 0.6611, - "step": 44423 - }, - { - "epoch": 1.14, - "learning_rate": 1.424801599810314e-06, - "loss": 0.5986, - "step": 44424 - }, - { - "epoch": 1.14, - "learning_rate": 1.4247765499600378e-06, - "loss": 0.7285, - "step": 44425 - }, - { - "epoch": 1.14, - "learning_rate": 1.4247514997845294e-06, - "loss": 0.6416, - "step": 44426 - }, - { - "epoch": 1.14, - "learning_rate": 1.4247264492838088e-06, - "loss": 0.6816, - "step": 44427 - }, - { - "epoch": 1.14, - "learning_rate": 1.4247013984578942e-06, - "loss": 0.7793, - "step": 44428 - }, - { - "epoch": 1.14, - "learning_rate": 1.4246763473068055e-06, - "loss": 0.6934, - "step": 44429 - }, - { - "epoch": 1.14, - "learning_rate": 1.4246512958305615e-06, - "loss": 0.6348, - "step": 44430 - }, - { - "epoch": 1.14, - "learning_rate": 1.4246262440291816e-06, - "loss": 0.7109, - "step": 44431 - }, - { - "epoch": 1.14, - "learning_rate": 1.424601191902685e-06, - "loss": 0.7578, - "step": 44432 - }, - { - "epoch": 1.14, - "learning_rate": 1.4245761394510908e-06, - "loss": 0.75, - "step": 44433 - }, - { - "epoch": 1.14, - "learning_rate": 1.424551086674418e-06, - "loss": 0.5503, - "step": 44434 - }, - { - "epoch": 1.14, - "learning_rate": 1.4245260335726861e-06, - "loss": 0.6016, - "step": 44435 - }, - { - "epoch": 1.14, - "learning_rate": 1.424500980145914e-06, - "loss": 0.4985, - "step": 44436 - }, - { - "epoch": 1.14, - "learning_rate": 1.424475926394121e-06, - "loss": 0.5508, - "step": 44437 - }, - { - "epoch": 1.14, - "learning_rate": 1.4244508723173267e-06, - "loss": 0.6689, - "step": 44438 - }, - { - "epoch": 1.14, - "learning_rate": 1.4244258179155495e-06, - "loss": 0.5837, - "step": 44439 - }, - { - "epoch": 1.14, - "learning_rate": 1.4244007631888091e-06, - "loss": 0.6958, - "step": 44440 - }, - { - "epoch": 1.14, - "learning_rate": 1.4243757081371245e-06, - "loss": 0.6274, - "step": 44441 - }, - { - "epoch": 1.14, - "learning_rate": 1.4243506527605149e-06, - "loss": 0.5225, - "step": 44442 - }, - { - "epoch": 1.14, - "learning_rate": 1.4243255970589995e-06, - "loss": 0.624, - "step": 44443 - }, - { - "epoch": 1.14, - "learning_rate": 1.4243005410325977e-06, - "loss": 0.4739, - "step": 44444 - }, - { - "epoch": 1.14, - "learning_rate": 1.4242754846813282e-06, - "loss": 0.6191, - "step": 44445 - }, - { - "epoch": 1.14, - "learning_rate": 1.4242504280052108e-06, - "loss": 0.6353, - "step": 44446 - }, - { - "epoch": 1.14, - "learning_rate": 1.4242253710042643e-06, - "loss": 0.4824, - "step": 44447 - }, - { - "epoch": 1.14, - "learning_rate": 1.4242003136785077e-06, - "loss": 0.709, - "step": 44448 - }, - { - "epoch": 1.14, - "learning_rate": 1.4241752560279604e-06, - "loss": 0.6777, - "step": 44449 - }, - { - "epoch": 1.14, - "learning_rate": 1.4241501980526419e-06, - "loss": 0.7051, - "step": 44450 - }, - { - "epoch": 1.14, - "learning_rate": 1.4241251397525709e-06, - "loss": 0.5513, - "step": 44451 - }, - { - "epoch": 1.14, - "learning_rate": 1.424100081127767e-06, - "loss": 0.5205, - "step": 44452 - }, - { - "epoch": 1.14, - "learning_rate": 1.4240750221782486e-06, - "loss": 0.6855, - "step": 44453 - }, - { - "epoch": 1.14, - "learning_rate": 1.4240499629040362e-06, - "loss": 0.6807, - "step": 44454 - }, - { - "epoch": 1.14, - "learning_rate": 1.4240249033051477e-06, - "loss": 0.7163, - "step": 44455 - }, - { - "epoch": 1.14, - "learning_rate": 1.423999843381603e-06, - "loss": 0.7754, - "step": 44456 - }, - { - "epoch": 1.14, - "learning_rate": 1.4239747831334212e-06, - "loss": 0.6152, - "step": 44457 - }, - { - "epoch": 1.14, - "learning_rate": 1.4239497225606214e-06, - "loss": 0.6543, - "step": 44458 - }, - { - "epoch": 1.14, - "learning_rate": 1.4239246616632228e-06, - "loss": 0.6235, - "step": 44459 - }, - { - "epoch": 1.14, - "learning_rate": 1.4238996004412445e-06, - "loss": 0.7246, - "step": 44460 - }, - { - "epoch": 1.14, - "learning_rate": 1.4238745388947054e-06, - "loss": 0.6924, - "step": 44461 - }, - { - "epoch": 1.14, - "learning_rate": 1.4238494770236255e-06, - "loss": 0.7148, - "step": 44462 - }, - { - "epoch": 1.14, - "learning_rate": 1.4238244148280237e-06, - "loss": 0.584, - "step": 44463 - }, - { - "epoch": 1.14, - "learning_rate": 1.4237993523079185e-06, - "loss": 0.748, - "step": 44464 - }, - { - "epoch": 1.14, - "learning_rate": 1.4237742894633302e-06, - "loss": 0.4231, - "step": 44465 - }, - { - "epoch": 1.14, - "learning_rate": 1.4237492262942771e-06, - "loss": 0.6357, - "step": 44466 - }, - { - "epoch": 1.14, - "learning_rate": 1.423724162800779e-06, - "loss": 0.5603, - "step": 44467 - }, - { - "epoch": 1.14, - "learning_rate": 1.4236990989828544e-06, - "loss": 0.7598, - "step": 44468 - }, - { - "epoch": 1.14, - "learning_rate": 1.423674034840523e-06, - "loss": 0.7832, - "step": 44469 - }, - { - "epoch": 1.14, - "learning_rate": 1.4236489703738039e-06, - "loss": 0.7998, - "step": 44470 - }, - { - "epoch": 1.14, - "learning_rate": 1.4236239055827163e-06, - "loss": 0.6465, - "step": 44471 - }, - { - "epoch": 1.14, - "learning_rate": 1.4235988404672793e-06, - "loss": 0.7637, - "step": 44472 - }, - { - "epoch": 1.14, - "learning_rate": 1.4235737750275123e-06, - "loss": 0.6569, - "step": 44473 - }, - { - "epoch": 1.14, - "learning_rate": 1.423548709263434e-06, - "loss": 0.6396, - "step": 44474 - }, - { - "epoch": 1.14, - "learning_rate": 1.423523643175064e-06, - "loss": 0.7305, - "step": 44475 - }, - { - "epoch": 1.14, - "learning_rate": 1.4234985767624217e-06, - "loss": 0.5957, - "step": 44476 - }, - { - "epoch": 1.14, - "learning_rate": 1.423473510025526e-06, - "loss": 0.79, - "step": 44477 - }, - { - "epoch": 1.14, - "learning_rate": 1.4234484429643959e-06, - "loss": 0.4849, - "step": 44478 - }, - { - "epoch": 1.14, - "learning_rate": 1.423423375579051e-06, - "loss": 0.7661, - "step": 44479 - }, - { - "epoch": 1.14, - "learning_rate": 1.42339830786951e-06, - "loss": 0.8301, - "step": 44480 - }, - { - "epoch": 1.14, - "learning_rate": 1.4233732398357924e-06, - "loss": 0.4739, - "step": 44481 - }, - { - "epoch": 1.14, - "learning_rate": 1.4233481714779177e-06, - "loss": 0.6763, - "step": 44482 - }, - { - "epoch": 1.14, - "learning_rate": 1.4233231027959045e-06, - "loss": 0.5913, - "step": 44483 - }, - { - "epoch": 1.14, - "learning_rate": 1.4232980337897724e-06, - "loss": 0.6191, - "step": 44484 - }, - { - "epoch": 1.14, - "learning_rate": 1.4232729644595403e-06, - "loss": 0.7607, - "step": 44485 - }, - { - "epoch": 1.14, - "learning_rate": 1.4232478948052277e-06, - "loss": 0.7183, - "step": 44486 - }, - { - "epoch": 1.14, - "learning_rate": 1.4232228248268536e-06, - "loss": 0.7529, - "step": 44487 - }, - { - "epoch": 1.14, - "learning_rate": 1.4231977545244374e-06, - "loss": 0.6904, - "step": 44488 - }, - { - "epoch": 1.14, - "learning_rate": 1.4231726838979978e-06, - "loss": 0.5615, - "step": 44489 - }, - { - "epoch": 1.14, - "learning_rate": 1.4231476129475547e-06, - "loss": 0.5455, - "step": 44490 - }, - { - "epoch": 1.14, - "learning_rate": 1.4231225416731268e-06, - "loss": 0.374, - "step": 44491 - }, - { - "epoch": 1.14, - "learning_rate": 1.4230974700747334e-06, - "loss": 0.7588, - "step": 44492 - }, - { - "epoch": 1.14, - "learning_rate": 1.4230723981523935e-06, - "loss": 0.5371, - "step": 44493 - }, - { - "epoch": 1.14, - "learning_rate": 1.4230473259061268e-06, - "loss": 0.79, - "step": 44494 - }, - { - "epoch": 1.14, - "learning_rate": 1.4230222533359522e-06, - "loss": 0.7871, - "step": 44495 - }, - { - "epoch": 1.14, - "learning_rate": 1.422997180441889e-06, - "loss": 0.5591, - "step": 44496 - }, - { - "epoch": 1.14, - "learning_rate": 1.422972107223956e-06, - "loss": 0.6074, - "step": 44497 - }, - { - "epoch": 1.14, - "learning_rate": 1.422947033682173e-06, - "loss": 0.6777, - "step": 44498 - }, - { - "epoch": 1.14, - "learning_rate": 1.4229219598165585e-06, - "loss": 0.6426, - "step": 44499 - }, - { - "epoch": 1.14, - "learning_rate": 1.4228968856271324e-06, - "loss": 0.749, - "step": 44500 - }, - { - "epoch": 1.14, - "learning_rate": 1.4228718111139137e-06, - "loss": 0.6953, - "step": 44501 - }, - { - "epoch": 1.14, - "learning_rate": 1.4228467362769212e-06, - "loss": 0.52, - "step": 44502 - }, - { - "epoch": 1.14, - "learning_rate": 1.4228216611161745e-06, - "loss": 0.6134, - "step": 44503 - }, - { - "epoch": 1.14, - "learning_rate": 1.422796585631693e-06, - "loss": 0.7144, - "step": 44504 - }, - { - "epoch": 1.14, - "learning_rate": 1.4227715098234952e-06, - "loss": 0.7822, - "step": 44505 - }, - { - "epoch": 1.14, - "learning_rate": 1.4227464336916008e-06, - "loss": 0.4243, - "step": 44506 - }, - { - "epoch": 1.14, - "learning_rate": 1.4227213572360294e-06, - "loss": 0.6592, - "step": 44507 - }, - { - "epoch": 1.14, - "learning_rate": 1.4226962804567987e-06, - "loss": 0.5779, - "step": 44508 - }, - { - "epoch": 1.14, - "learning_rate": 1.4226712033539297e-06, - "loss": 0.5117, - "step": 44509 - }, - { - "epoch": 1.14, - "learning_rate": 1.4226461259274402e-06, - "loss": 0.751, - "step": 44510 - }, - { - "epoch": 1.14, - "learning_rate": 1.4226210481773508e-06, - "loss": 0.6104, - "step": 44511 - }, - { - "epoch": 1.14, - "learning_rate": 1.422595970103679e-06, - "loss": 0.6714, - "step": 44512 - }, - { - "epoch": 1.14, - "learning_rate": 1.4225708917064457e-06, - "loss": 0.5098, - "step": 44513 - }, - { - "epoch": 1.14, - "learning_rate": 1.4225458129856686e-06, - "loss": 0.627, - "step": 44514 - }, - { - "epoch": 1.14, - "learning_rate": 1.4225207339413681e-06, - "loss": 0.7393, - "step": 44515 - }, - { - "epoch": 1.14, - "learning_rate": 1.4224956545735627e-06, - "loss": 0.542, - "step": 44516 - }, - { - "epoch": 1.14, - "learning_rate": 1.4224705748822718e-06, - "loss": 0.748, - "step": 44517 - }, - { - "epoch": 1.14, - "learning_rate": 1.4224454948675146e-06, - "loss": 0.6504, - "step": 44518 - }, - { - "epoch": 1.14, - "learning_rate": 1.4224204145293103e-06, - "loss": 0.646, - "step": 44519 - }, - { - "epoch": 1.14, - "learning_rate": 1.4223953338676781e-06, - "loss": 0.7959, - "step": 44520 - }, - { - "epoch": 1.14, - "learning_rate": 1.4223702528826376e-06, - "loss": 0.7617, - "step": 44521 - }, - { - "epoch": 1.14, - "learning_rate": 1.4223451715742072e-06, - "loss": 0.5753, - "step": 44522 - }, - { - "epoch": 1.14, - "learning_rate": 1.4223200899424066e-06, - "loss": 0.5669, - "step": 44523 - }, - { - "epoch": 1.14, - "learning_rate": 1.422295007987255e-06, - "loss": 0.8174, - "step": 44524 - }, - { - "epoch": 1.14, - "learning_rate": 1.4222699257087713e-06, - "loss": 0.7314, - "step": 44525 - }, - { - "epoch": 1.14, - "learning_rate": 1.422244843106975e-06, - "loss": 0.5649, - "step": 44526 - }, - { - "epoch": 1.14, - "learning_rate": 1.4222197601818853e-06, - "loss": 0.5718, - "step": 44527 - }, - { - "epoch": 1.14, - "learning_rate": 1.4221946769335214e-06, - "loss": 0.8105, - "step": 44528 - }, - { - "epoch": 1.14, - "learning_rate": 1.4221695933619025e-06, - "loss": 0.7471, - "step": 44529 - }, - { - "epoch": 1.14, - "learning_rate": 1.4221445094670477e-06, - "loss": 0.7061, - "step": 44530 - }, - { - "epoch": 1.14, - "learning_rate": 1.4221194252489764e-06, - "loss": 0.6924, - "step": 44531 - }, - { - "epoch": 1.14, - "learning_rate": 1.4220943407077074e-06, - "loss": 0.6885, - "step": 44532 - }, - { - "epoch": 1.14, - "learning_rate": 1.4220692558432601e-06, - "loss": 0.6099, - "step": 44533 - }, - { - "epoch": 1.14, - "learning_rate": 1.4220441706556541e-06, - "loss": 0.7246, - "step": 44534 - }, - { - "epoch": 1.14, - "learning_rate": 1.4220190851449078e-06, - "loss": 0.6162, - "step": 44535 - }, - { - "epoch": 1.14, - "learning_rate": 1.4219939993110418e-06, - "loss": 0.7402, - "step": 44536 - }, - { - "epoch": 1.14, - "learning_rate": 1.4219689131540735e-06, - "loss": 0.6587, - "step": 44537 - }, - { - "epoch": 1.14, - "learning_rate": 1.4219438266740236e-06, - "loss": 0.5862, - "step": 44538 - }, - { - "epoch": 1.14, - "learning_rate": 1.42191873987091e-06, - "loss": 0.6865, - "step": 44539 - }, - { - "epoch": 1.14, - "learning_rate": 1.4218936527447534e-06, - "loss": 0.5752, - "step": 44540 - }, - { - "epoch": 1.14, - "learning_rate": 1.421868565295572e-06, - "loss": 0.7109, - "step": 44541 - }, - { - "epoch": 1.14, - "learning_rate": 1.4218434775233852e-06, - "loss": 0.7812, - "step": 44542 - }, - { - "epoch": 1.14, - "learning_rate": 1.4218183894282118e-06, - "loss": 0.5386, - "step": 44543 - }, - { - "epoch": 1.14, - "learning_rate": 1.421793301010072e-06, - "loss": 0.6191, - "step": 44544 - }, - { - "epoch": 1.14, - "learning_rate": 1.4217682122689842e-06, - "loss": 0.6636, - "step": 44545 - }, - { - "epoch": 1.14, - "learning_rate": 1.4217431232049681e-06, - "loss": 0.6533, - "step": 44546 - }, - { - "epoch": 1.14, - "learning_rate": 1.4217180338180426e-06, - "loss": 0.665, - "step": 44547 - }, - { - "epoch": 1.14, - "learning_rate": 1.4216929441082268e-06, - "loss": 0.6143, - "step": 44548 - }, - { - "epoch": 1.14, - "learning_rate": 1.4216678540755402e-06, - "loss": 0.3352, - "step": 44549 - }, - { - "epoch": 1.14, - "learning_rate": 1.4216427637200022e-06, - "loss": 0.5474, - "step": 44550 - }, - { - "epoch": 1.14, - "learning_rate": 1.4216176730416316e-06, - "loss": 0.7061, - "step": 44551 - }, - { - "epoch": 1.14, - "learning_rate": 1.4215925820404474e-06, - "loss": 0.6836, - "step": 44552 - }, - { - "epoch": 1.14, - "learning_rate": 1.4215674907164695e-06, - "loss": 0.6787, - "step": 44553 - }, - { - "epoch": 1.14, - "learning_rate": 1.4215423990697163e-06, - "loss": 0.4646, - "step": 44554 - }, - { - "epoch": 1.14, - "learning_rate": 1.421517307100208e-06, - "loss": 0.667, - "step": 44555 - }, - { - "epoch": 1.14, - "learning_rate": 1.4214922148079631e-06, - "loss": 0.6191, - "step": 44556 - }, - { - "epoch": 1.14, - "learning_rate": 1.421467122193001e-06, - "loss": 0.5786, - "step": 44557 - }, - { - "epoch": 1.14, - "learning_rate": 1.4214420292553406e-06, - "loss": 0.5615, - "step": 44558 - }, - { - "epoch": 1.14, - "learning_rate": 1.421416935995002e-06, - "loss": 0.6362, - "step": 44559 - }, - { - "epoch": 1.14, - "learning_rate": 1.4213918424120033e-06, - "loss": 0.6152, - "step": 44560 - }, - { - "epoch": 1.14, - "learning_rate": 1.4213667485063647e-06, - "loss": 0.7095, - "step": 44561 - }, - { - "epoch": 1.14, - "learning_rate": 1.4213416542781044e-06, - "loss": 0.7021, - "step": 44562 - }, - { - "epoch": 1.14, - "learning_rate": 1.4213165597272427e-06, - "loss": 0.5376, - "step": 44563 - }, - { - "epoch": 1.14, - "learning_rate": 1.421291464853798e-06, - "loss": 0.6279, - "step": 44564 - }, - { - "epoch": 1.14, - "learning_rate": 1.4212663696577898e-06, - "loss": 0.5603, - "step": 44565 - }, - { - "epoch": 1.14, - "learning_rate": 1.4212412741392377e-06, - "loss": 0.7402, - "step": 44566 - }, - { - "epoch": 1.14, - "learning_rate": 1.42121617829816e-06, - "loss": 0.6265, - "step": 44567 - }, - { - "epoch": 1.14, - "learning_rate": 1.4211910821345767e-06, - "loss": 0.6445, - "step": 44568 - }, - { - "epoch": 1.14, - "learning_rate": 1.4211659856485066e-06, - "loss": 0.8271, - "step": 44569 - }, - { - "epoch": 1.14, - "learning_rate": 1.421140888839969e-06, - "loss": 0.4941, - "step": 44570 - }, - { - "epoch": 1.14, - "learning_rate": 1.4211157917089836e-06, - "loss": 0.8398, - "step": 44571 - }, - { - "epoch": 1.14, - "learning_rate": 1.4210906942555689e-06, - "loss": 0.6562, - "step": 44572 - }, - { - "epoch": 1.14, - "learning_rate": 1.4210655964797442e-06, - "loss": 0.7424, - "step": 44573 - }, - { - "epoch": 1.14, - "learning_rate": 1.4210404983815295e-06, - "loss": 0.5317, - "step": 44574 - }, - { - "epoch": 1.14, - "learning_rate": 1.4210153999609429e-06, - "loss": 0.5747, - "step": 44575 - }, - { - "epoch": 1.14, - "learning_rate": 1.4209903012180046e-06, - "loss": 0.6748, - "step": 44576 - }, - { - "epoch": 1.14, - "learning_rate": 1.4209652021527332e-06, - "loss": 0.6035, - "step": 44577 - }, - { - "epoch": 1.14, - "learning_rate": 1.4209401027651482e-06, - "loss": 0.5112, - "step": 44578 - }, - { - "epoch": 1.14, - "learning_rate": 1.4209150030552684e-06, - "loss": 0.5354, - "step": 44579 - }, - { - "epoch": 1.14, - "learning_rate": 1.4208899030231135e-06, - "loss": 0.5981, - "step": 44580 - }, - { - "epoch": 1.14, - "learning_rate": 1.420864802668703e-06, - "loss": 0.7578, - "step": 44581 - }, - { - "epoch": 1.14, - "learning_rate": 1.4208397019920553e-06, - "loss": 0.5298, - "step": 44582 - }, - { - "epoch": 1.14, - "learning_rate": 1.4208146009931898e-06, - "loss": 0.5747, - "step": 44583 - }, - { - "epoch": 1.14, - "learning_rate": 1.420789499672126e-06, - "loss": 0.5809, - "step": 44584 - }, - { - "epoch": 1.14, - "learning_rate": 1.420764398028883e-06, - "loss": 0.7148, - "step": 44585 - }, - { - "epoch": 1.14, - "learning_rate": 1.4207392960634805e-06, - "loss": 0.5696, - "step": 44586 - }, - { - "epoch": 1.14, - "learning_rate": 1.4207141937759367e-06, - "loss": 0.5629, - "step": 44587 - }, - { - "epoch": 1.14, - "learning_rate": 1.4206890911662719e-06, - "loss": 0.7031, - "step": 44588 - }, - { - "epoch": 1.14, - "learning_rate": 1.4206639882345045e-06, - "loss": 0.5737, - "step": 44589 - }, - { - "epoch": 1.14, - "learning_rate": 1.420638884980654e-06, - "loss": 0.6147, - "step": 44590 - }, - { - "epoch": 1.14, - "learning_rate": 1.4206137814047396e-06, - "loss": 0.5303, - "step": 44591 - }, - { - "epoch": 1.14, - "learning_rate": 1.4205886775067806e-06, - "loss": 0.6279, - "step": 44592 - }, - { - "epoch": 1.14, - "learning_rate": 1.4205635732867964e-06, - "loss": 0.5967, - "step": 44593 - }, - { - "epoch": 1.14, - "learning_rate": 1.4205384687448058e-06, - "loss": 0.542, - "step": 44594 - }, - { - "epoch": 1.14, - "learning_rate": 1.4205133638808282e-06, - "loss": 0.7979, - "step": 44595 - }, - { - "epoch": 1.14, - "learning_rate": 1.420488258694883e-06, - "loss": 0.6235, - "step": 44596 - }, - { - "epoch": 1.14, - "learning_rate": 1.4204631531869896e-06, - "loss": 0.6074, - "step": 44597 - }, - { - "epoch": 1.14, - "learning_rate": 1.4204380473571663e-06, - "loss": 0.6743, - "step": 44598 - }, - { - "epoch": 1.14, - "learning_rate": 1.420412941205433e-06, - "loss": 0.7324, - "step": 44599 - }, - { - "epoch": 1.14, - "learning_rate": 1.4203878347318088e-06, - "loss": 0.8203, - "step": 44600 - }, - { - "epoch": 1.14, - "learning_rate": 1.4203627279363136e-06, - "loss": 0.5957, - "step": 44601 - }, - { - "epoch": 1.14, - "learning_rate": 1.4203376208189655e-06, - "loss": 0.6279, - "step": 44602 - }, - { - "epoch": 1.14, - "learning_rate": 1.4203125133797841e-06, - "loss": 0.834, - "step": 44603 - }, - { - "epoch": 1.14, - "learning_rate": 1.4202874056187888e-06, - "loss": 0.6611, - "step": 44604 - }, - { - "epoch": 1.14, - "learning_rate": 1.420262297535999e-06, - "loss": 0.7021, - "step": 44605 - }, - { - "epoch": 1.14, - "learning_rate": 1.4202371891314336e-06, - "loss": 0.7041, - "step": 44606 - }, - { - "epoch": 1.14, - "learning_rate": 1.4202120804051119e-06, - "loss": 0.5972, - "step": 44607 - }, - { - "epoch": 1.14, - "learning_rate": 1.4201869713570528e-06, - "loss": 0.7627, - "step": 44608 - }, - { - "epoch": 1.14, - "learning_rate": 1.4201618619872762e-06, - "loss": 0.7002, - "step": 44609 - }, - { - "epoch": 1.14, - "learning_rate": 1.4201367522958007e-06, - "loss": 0.6865, - "step": 44610 - }, - { - "epoch": 1.14, - "learning_rate": 1.4201116422826465e-06, - "loss": 0.7041, - "step": 44611 - }, - { - "epoch": 1.14, - "learning_rate": 1.4200865319478315e-06, - "loss": 0.7686, - "step": 44612 - }, - { - "epoch": 1.14, - "learning_rate": 1.4200614212913756e-06, - "loss": 0.8037, - "step": 44613 - }, - { - "epoch": 1.14, - "learning_rate": 1.420036310313298e-06, - "loss": 0.8721, - "step": 44614 - }, - { - "epoch": 1.14, - "learning_rate": 1.4200111990136182e-06, - "loss": 0.627, - "step": 44615 - }, - { - "epoch": 1.14, - "learning_rate": 1.4199860873923548e-06, - "loss": 0.8135, - "step": 44616 - }, - { - "epoch": 1.14, - "learning_rate": 1.4199609754495273e-06, - "loss": 0.6494, - "step": 44617 - }, - { - "epoch": 1.14, - "learning_rate": 1.4199358631851554e-06, - "loss": 0.6201, - "step": 44618 - }, - { - "epoch": 1.14, - "learning_rate": 1.4199107505992576e-06, - "loss": 0.6992, - "step": 44619 - }, - { - "epoch": 1.14, - "learning_rate": 1.4198856376918536e-06, - "loss": 0.5649, - "step": 44620 - }, - { - "epoch": 1.14, - "learning_rate": 1.4198605244629625e-06, - "loss": 0.7324, - "step": 44621 - }, - { - "epoch": 1.14, - "learning_rate": 1.4198354109126033e-06, - "loss": 0.6914, - "step": 44622 - }, - { - "epoch": 1.14, - "learning_rate": 1.4198102970407956e-06, - "loss": 0.5962, - "step": 44623 - }, - { - "epoch": 1.14, - "learning_rate": 1.4197851828475585e-06, - "loss": 0.6113, - "step": 44624 - }, - { - "epoch": 1.14, - "learning_rate": 1.419760068332911e-06, - "loss": 0.6406, - "step": 44625 - }, - { - "epoch": 1.14, - "learning_rate": 1.4197349534968727e-06, - "loss": 0.7227, - "step": 44626 - }, - { - "epoch": 1.14, - "learning_rate": 1.4197098383394625e-06, - "loss": 0.6709, - "step": 44627 - }, - { - "epoch": 1.14, - "learning_rate": 1.4196847228607e-06, - "loss": 0.543, - "step": 44628 - }, - { - "epoch": 1.14, - "learning_rate": 1.419659607060604e-06, - "loss": 0.562, - "step": 44629 - }, - { - "epoch": 1.14, - "learning_rate": 1.419634490939194e-06, - "loss": 0.5542, - "step": 44630 - }, - { - "epoch": 1.14, - "learning_rate": 1.4196093744964893e-06, - "loss": 0.4481, - "step": 44631 - }, - { - "epoch": 1.14, - "learning_rate": 1.4195842577325087e-06, - "loss": 0.5962, - "step": 44632 - }, - { - "epoch": 1.14, - "learning_rate": 1.4195591406472718e-06, - "loss": 0.7314, - "step": 44633 - }, - { - "epoch": 1.14, - "learning_rate": 1.419534023240798e-06, - "loss": 0.6763, - "step": 44634 - }, - { - "epoch": 1.14, - "learning_rate": 1.419508905513106e-06, - "loss": 0.7231, - "step": 44635 - }, - { - "epoch": 1.14, - "learning_rate": 1.4194837874642154e-06, - "loss": 0.6592, - "step": 44636 - }, - { - "epoch": 1.14, - "learning_rate": 1.4194586690941454e-06, - "loss": 0.5723, - "step": 44637 - }, - { - "epoch": 1.14, - "learning_rate": 1.4194335504029152e-06, - "loss": 0.6133, - "step": 44638 - }, - { - "epoch": 1.14, - "learning_rate": 1.419408431390544e-06, - "loss": 0.5598, - "step": 44639 - }, - { - "epoch": 1.14, - "learning_rate": 1.419383312057051e-06, - "loss": 0.959, - "step": 44640 - }, - { - "epoch": 1.14, - "learning_rate": 1.4193581924024555e-06, - "loss": 0.6006, - "step": 44641 - }, - { - "epoch": 1.14, - "learning_rate": 1.419333072426777e-06, - "loss": 0.6426, - "step": 44642 - }, - { - "epoch": 1.14, - "learning_rate": 1.4193079521300341e-06, - "loss": 0.5337, - "step": 44643 - }, - { - "epoch": 1.14, - "learning_rate": 1.4192828315122463e-06, - "loss": 0.6582, - "step": 44644 - }, - { - "epoch": 1.14, - "learning_rate": 1.419257710573433e-06, - "loss": 0.7725, - "step": 44645 - }, - { - "epoch": 1.14, - "learning_rate": 1.4192325893136136e-06, - "loss": 0.6133, - "step": 44646 - }, - { - "epoch": 1.14, - "learning_rate": 1.419207467732807e-06, - "loss": 0.8711, - "step": 44647 - }, - { - "epoch": 1.14, - "learning_rate": 1.4191823458310324e-06, - "loss": 0.6768, - "step": 44648 - }, - { - "epoch": 1.14, - "learning_rate": 1.419157223608309e-06, - "loss": 0.5649, - "step": 44649 - }, - { - "epoch": 1.14, - "learning_rate": 1.4191321010646563e-06, - "loss": 0.3986, - "step": 44650 - }, - { - "epoch": 1.14, - "learning_rate": 1.419106978200094e-06, - "loss": 0.5996, - "step": 44651 - }, - { - "epoch": 1.14, - "learning_rate": 1.41908185501464e-06, - "loss": 0.7461, - "step": 44652 - }, - { - "epoch": 1.14, - "learning_rate": 1.4190567315083146e-06, - "loss": 0.6172, - "step": 44653 - }, - { - "epoch": 1.14, - "learning_rate": 1.4190316076811365e-06, - "loss": 0.6108, - "step": 44654 - }, - { - "epoch": 1.14, - "learning_rate": 1.4190064835331255e-06, - "loss": 0.6787, - "step": 44655 - }, - { - "epoch": 1.14, - "learning_rate": 1.4189813590643005e-06, - "loss": 0.606, - "step": 44656 - }, - { - "epoch": 1.14, - "learning_rate": 1.4189562342746807e-06, - "loss": 0.7129, - "step": 44657 - }, - { - "epoch": 1.14, - "learning_rate": 1.418931109164285e-06, - "loss": 0.5579, - "step": 44658 - }, - { - "epoch": 1.14, - "learning_rate": 1.4189059837331331e-06, - "loss": 0.5898, - "step": 44659 - }, - { - "epoch": 1.14, - "learning_rate": 1.4188808579812443e-06, - "loss": 0.7324, - "step": 44660 - }, - { - "epoch": 1.14, - "learning_rate": 1.4188557319086378e-06, - "loss": 0.3969, - "step": 44661 - }, - { - "epoch": 1.14, - "learning_rate": 1.4188306055153328e-06, - "loss": 0.5024, - "step": 44662 - }, - { - "epoch": 1.14, - "learning_rate": 1.418805478801348e-06, - "loss": 0.5162, - "step": 44663 - }, - { - "epoch": 1.14, - "learning_rate": 1.4187803517667036e-06, - "loss": 0.6646, - "step": 44664 - }, - { - "epoch": 1.14, - "learning_rate": 1.418755224411418e-06, - "loss": 0.5327, - "step": 44665 - }, - { - "epoch": 1.14, - "learning_rate": 1.418730096735511e-06, - "loss": 0.8945, - "step": 44666 - }, - { - "epoch": 1.14, - "learning_rate": 1.4187049687390016e-06, - "loss": 0.7676, - "step": 44667 - }, - { - "epoch": 1.14, - "learning_rate": 1.4186798404219092e-06, - "loss": 0.7295, - "step": 44668 - }, - { - "epoch": 1.14, - "learning_rate": 1.4186547117842524e-06, - "loss": 0.4385, - "step": 44669 - }, - { - "epoch": 1.14, - "learning_rate": 1.4186295828260515e-06, - "loss": 0.6653, - "step": 44670 - }, - { - "epoch": 1.14, - "learning_rate": 1.4186044535473248e-06, - "loss": 0.6177, - "step": 44671 - }, - { - "epoch": 1.14, - "learning_rate": 1.4185793239480922e-06, - "loss": 0.6709, - "step": 44672 - }, - { - "epoch": 1.14, - "learning_rate": 1.4185541940283723e-06, - "loss": 0.6489, - "step": 44673 - }, - { - "epoch": 1.15, - "learning_rate": 1.4185290637881848e-06, - "loss": 0.6094, - "step": 44674 - }, - { - "epoch": 1.15, - "learning_rate": 1.418503933227549e-06, - "loss": 0.3733, - "step": 44675 - }, - { - "epoch": 1.15, - "learning_rate": 1.4184788023464841e-06, - "loss": 0.7129, - "step": 44676 - }, - { - "epoch": 1.15, - "learning_rate": 1.4184536711450089e-06, - "loss": 0.6226, - "step": 44677 - }, - { - "epoch": 1.15, - "learning_rate": 1.4184285396231432e-06, - "loss": 0.6582, - "step": 44678 - }, - { - "epoch": 1.15, - "learning_rate": 1.4184034077809057e-06, - "loss": 0.749, - "step": 44679 - }, - { - "epoch": 1.15, - "learning_rate": 1.4183782756183162e-06, - "loss": 0.4324, - "step": 44680 - }, - { - "epoch": 1.15, - "learning_rate": 1.418353143135394e-06, - "loss": 0.7012, - "step": 44681 - }, - { - "epoch": 1.15, - "learning_rate": 1.4183280103321574e-06, - "loss": 0.8408, - "step": 44682 - }, - { - "epoch": 1.15, - "learning_rate": 1.4183028772086265e-06, - "loss": 0.6084, - "step": 44683 - }, - { - "epoch": 1.15, - "learning_rate": 1.4182777437648207e-06, - "loss": 0.4895, - "step": 44684 - }, - { - "epoch": 1.15, - "learning_rate": 1.4182526100007582e-06, - "loss": 0.6836, - "step": 44685 - }, - { - "epoch": 1.15, - "learning_rate": 1.4182274759164594e-06, - "loss": 0.4919, - "step": 44686 - }, - { - "epoch": 1.15, - "learning_rate": 1.4182023415119429e-06, - "loss": 0.6812, - "step": 44687 - }, - { - "epoch": 1.15, - "learning_rate": 1.418177206787228e-06, - "loss": 0.7188, - "step": 44688 - }, - { - "epoch": 1.15, - "learning_rate": 1.418152071742334e-06, - "loss": 0.3073, - "step": 44689 - }, - { - "epoch": 1.15, - "learning_rate": 1.4181269363772802e-06, - "loss": 0.6865, - "step": 44690 - }, - { - "epoch": 1.15, - "learning_rate": 1.4181018006920865e-06, - "loss": 0.4351, - "step": 44691 - }, - { - "epoch": 1.15, - "learning_rate": 1.4180766646867706e-06, - "loss": 0.689, - "step": 44692 - }, - { - "epoch": 1.15, - "learning_rate": 1.418051528361353e-06, - "loss": 0.6738, - "step": 44693 - }, - { - "epoch": 1.15, - "learning_rate": 1.4180263917158525e-06, - "loss": 0.5063, - "step": 44694 - }, - { - "epoch": 1.15, - "learning_rate": 1.4180012547502884e-06, - "loss": 0.6191, - "step": 44695 - }, - { - "epoch": 1.15, - "learning_rate": 1.41797611746468e-06, - "loss": 0.3837, - "step": 44696 - }, - { - "epoch": 1.15, - "learning_rate": 1.4179509798590468e-06, - "loss": 0.665, - "step": 44697 - }, - { - "epoch": 1.15, - "learning_rate": 1.4179258419334073e-06, - "loss": 0.5234, - "step": 44698 - }, - { - "epoch": 1.15, - "learning_rate": 1.4179007036877813e-06, - "loss": 0.6641, - "step": 44699 - }, - { - "epoch": 1.15, - "learning_rate": 1.4178755651221879e-06, - "loss": 0.6089, - "step": 44700 - }, - { - "epoch": 1.15, - "learning_rate": 1.4178504262366468e-06, - "loss": 0.5596, - "step": 44701 - }, - { - "epoch": 1.15, - "learning_rate": 1.4178252870311765e-06, - "loss": 0.7793, - "step": 44702 - }, - { - "epoch": 1.15, - "learning_rate": 1.4178001475057966e-06, - "loss": 0.5172, - "step": 44703 - }, - { - "epoch": 1.15, - "learning_rate": 1.4177750076605261e-06, - "loss": 0.668, - "step": 44704 - }, - { - "epoch": 1.15, - "learning_rate": 1.417749867495385e-06, - "loss": 0.8926, - "step": 44705 - }, - { - "epoch": 1.15, - "learning_rate": 1.4177247270103918e-06, - "loss": 0.3403, - "step": 44706 - }, - { - "epoch": 1.15, - "learning_rate": 1.4176995862055658e-06, - "loss": 0.7158, - "step": 44707 - }, - { - "epoch": 1.15, - "learning_rate": 1.4176744450809265e-06, - "loss": 0.6428, - "step": 44708 - }, - { - "epoch": 1.15, - "learning_rate": 1.4176493036364932e-06, - "loss": 0.6963, - "step": 44709 - }, - { - "epoch": 1.15, - "learning_rate": 1.417624161872285e-06, - "loss": 0.6953, - "step": 44710 - }, - { - "epoch": 1.15, - "learning_rate": 1.4175990197883214e-06, - "loss": 0.749, - "step": 44711 - }, - { - "epoch": 1.15, - "learning_rate": 1.4175738773846213e-06, - "loss": 0.6914, - "step": 44712 - }, - { - "epoch": 1.15, - "learning_rate": 1.4175487346612038e-06, - "loss": 0.7041, - "step": 44713 - }, - { - "epoch": 1.15, - "learning_rate": 1.4175235916180887e-06, - "loss": 0.8408, - "step": 44714 - }, - { - "epoch": 1.15, - "learning_rate": 1.417498448255295e-06, - "loss": 0.7178, - "step": 44715 - }, - { - "epoch": 1.15, - "learning_rate": 1.417473304572842e-06, - "loss": 0.4995, - "step": 44716 - }, - { - "epoch": 1.15, - "learning_rate": 1.4174481605707488e-06, - "loss": 0.5476, - "step": 44717 - }, - { - "epoch": 1.15, - "learning_rate": 1.4174230162490345e-06, - "loss": 0.791, - "step": 44718 - }, - { - "epoch": 1.15, - "learning_rate": 1.4173978716077186e-06, - "loss": 0.6143, - "step": 44719 - }, - { - "epoch": 1.15, - "learning_rate": 1.4173727266468208e-06, - "loss": 0.6704, - "step": 44720 - }, - { - "epoch": 1.15, - "learning_rate": 1.4173475813663596e-06, - "loss": 0.6313, - "step": 44721 - }, - { - "epoch": 1.15, - "learning_rate": 1.4173224357663547e-06, - "loss": 0.6709, - "step": 44722 - }, - { - "epoch": 1.15, - "learning_rate": 1.417297289846825e-06, - "loss": 0.6313, - "step": 44723 - }, - { - "epoch": 1.15, - "learning_rate": 1.41727214360779e-06, - "loss": 0.6514, - "step": 44724 - }, - { - "epoch": 1.15, - "learning_rate": 1.4172469970492688e-06, - "loss": 0.8662, - "step": 44725 - }, - { - "epoch": 1.15, - "learning_rate": 1.4172218501712809e-06, - "loss": 0.7529, - "step": 44726 - }, - { - "epoch": 1.15, - "learning_rate": 1.4171967029738455e-06, - "loss": 0.6509, - "step": 44727 - }, - { - "epoch": 1.15, - "learning_rate": 1.4171715554569815e-06, - "loss": 0.8652, - "step": 44728 - }, - { - "epoch": 1.15, - "learning_rate": 1.4171464076207088e-06, - "loss": 0.5933, - "step": 44729 - }, - { - "epoch": 1.15, - "learning_rate": 1.4171212594650462e-06, - "loss": 0.6069, - "step": 44730 - }, - { - "epoch": 1.15, - "learning_rate": 1.4170961109900128e-06, - "loss": 0.6465, - "step": 44731 - }, - { - "epoch": 1.15, - "learning_rate": 1.417070962195628e-06, - "loss": 0.6816, - "step": 44732 - }, - { - "epoch": 1.15, - "learning_rate": 1.4170458130819115e-06, - "loss": 0.6929, - "step": 44733 - }, - { - "epoch": 1.15, - "learning_rate": 1.4170206636488817e-06, - "loss": 0.6875, - "step": 44734 - }, - { - "epoch": 1.15, - "learning_rate": 1.4169955138965588e-06, - "loss": 0.7617, - "step": 44735 - }, - { - "epoch": 1.15, - "learning_rate": 1.4169703638249617e-06, - "loss": 0.7578, - "step": 44736 - }, - { - "epoch": 1.15, - "learning_rate": 1.4169452134341094e-06, - "loss": 0.6797, - "step": 44737 - }, - { - "epoch": 1.15, - "learning_rate": 1.416920062724021e-06, - "loss": 0.7148, - "step": 44738 - }, - { - "epoch": 1.15, - "learning_rate": 1.4168949116947165e-06, - "loss": 0.8213, - "step": 44739 - }, - { - "epoch": 1.15, - "learning_rate": 1.4168697603462145e-06, - "loss": 0.625, - "step": 44740 - }, - { - "epoch": 1.15, - "learning_rate": 1.4168446086785348e-06, - "loss": 0.6387, - "step": 44741 - }, - { - "epoch": 1.15, - "learning_rate": 1.416819456691696e-06, - "loss": 0.7354, - "step": 44742 - }, - { - "epoch": 1.15, - "learning_rate": 1.4167943043857179e-06, - "loss": 0.7793, - "step": 44743 - }, - { - "epoch": 1.15, - "learning_rate": 1.4167691517606192e-06, - "loss": 0.5833, - "step": 44744 - }, - { - "epoch": 1.15, - "learning_rate": 1.41674399881642e-06, - "loss": 0.6631, - "step": 44745 - }, - { - "epoch": 1.15, - "learning_rate": 1.416718845553139e-06, - "loss": 0.8682, - "step": 44746 - }, - { - "epoch": 1.15, - "learning_rate": 1.4166936919707955e-06, - "loss": 0.6611, - "step": 44747 - }, - { - "epoch": 1.15, - "learning_rate": 1.4166685380694086e-06, - "loss": 0.5615, - "step": 44748 - }, - { - "epoch": 1.15, - "learning_rate": 1.416643383848998e-06, - "loss": 0.4495, - "step": 44749 - }, - { - "epoch": 1.15, - "learning_rate": 1.4166182293095826e-06, - "loss": 0.6064, - "step": 44750 - }, - { - "epoch": 1.15, - "learning_rate": 1.4165930744511818e-06, - "loss": 0.7969, - "step": 44751 - }, - { - "epoch": 1.15, - "learning_rate": 1.416567919273815e-06, - "loss": 0.9141, - "step": 44752 - }, - { - "epoch": 1.15, - "learning_rate": 1.416542763777501e-06, - "loss": 0.7734, - "step": 44753 - }, - { - "epoch": 1.15, - "learning_rate": 1.4165176079622594e-06, - "loss": 0.6074, - "step": 44754 - }, - { - "epoch": 1.15, - "learning_rate": 1.4164924518281093e-06, - "loss": 0.4822, - "step": 44755 - }, - { - "epoch": 1.15, - "learning_rate": 1.4164672953750708e-06, - "loss": 0.7344, - "step": 44756 - }, - { - "epoch": 1.15, - "learning_rate": 1.4164421386031616e-06, - "loss": 0.7026, - "step": 44757 - }, - { - "epoch": 1.15, - "learning_rate": 1.4164169815124024e-06, - "loss": 0.6143, - "step": 44758 - }, - { - "epoch": 1.15, - "learning_rate": 1.4163918241028115e-06, - "loss": 0.6406, - "step": 44759 - }, - { - "epoch": 1.15, - "learning_rate": 1.416366666374409e-06, - "loss": 0.5439, - "step": 44760 - }, - { - "epoch": 1.15, - "learning_rate": 1.416341508327213e-06, - "loss": 0.6865, - "step": 44761 - }, - { - "epoch": 1.15, - "learning_rate": 1.416316349961244e-06, - "loss": 0.6855, - "step": 44762 - }, - { - "epoch": 1.15, - "learning_rate": 1.41629119127652e-06, - "loss": 0.7334, - "step": 44763 - }, - { - "epoch": 1.15, - "learning_rate": 1.4162660322730617e-06, - "loss": 0.6689, - "step": 44764 - }, - { - "epoch": 1.15, - "learning_rate": 1.4162408729508874e-06, - "loss": 0.708, - "step": 44765 - }, - { - "epoch": 1.15, - "learning_rate": 1.4162157133100168e-06, - "loss": 0.7151, - "step": 44766 - }, - { - "epoch": 1.15, - "learning_rate": 1.4161905533504686e-06, - "loss": 0.5715, - "step": 44767 - }, - { - "epoch": 1.15, - "learning_rate": 1.4161653930722625e-06, - "loss": 0.7061, - "step": 44768 - }, - { - "epoch": 1.15, - "learning_rate": 1.416140232475418e-06, - "loss": 0.6318, - "step": 44769 - }, - { - "epoch": 1.15, - "learning_rate": 1.4161150715599538e-06, - "loss": 0.5518, - "step": 44770 - }, - { - "epoch": 1.15, - "learning_rate": 1.4160899103258897e-06, - "loss": 0.5361, - "step": 44771 - }, - { - "epoch": 1.15, - "learning_rate": 1.4160647487732442e-06, - "loss": 0.5317, - "step": 44772 - }, - { - "epoch": 1.15, - "learning_rate": 1.4160395869020375e-06, - "loss": 0.6533, - "step": 44773 - }, - { - "epoch": 1.15, - "learning_rate": 1.416014424712288e-06, - "loss": 0.7178, - "step": 44774 - }, - { - "epoch": 1.15, - "learning_rate": 1.415989262204016e-06, - "loss": 0.5835, - "step": 44775 - }, - { - "epoch": 1.15, - "learning_rate": 1.4159640993772394e-06, - "loss": 0.5697, - "step": 44776 - }, - { - "epoch": 1.15, - "learning_rate": 1.4159389362319787e-06, - "loss": 0.6821, - "step": 44777 - }, - { - "epoch": 1.15, - "learning_rate": 1.4159137727682526e-06, - "loss": 0.5605, - "step": 44778 - }, - { - "epoch": 1.15, - "learning_rate": 1.4158886089860804e-06, - "loss": 0.7793, - "step": 44779 - }, - { - "epoch": 1.15, - "learning_rate": 1.4158634448854815e-06, - "loss": 0.501, - "step": 44780 - }, - { - "epoch": 1.15, - "learning_rate": 1.415838280466475e-06, - "loss": 0.5723, - "step": 44781 - }, - { - "epoch": 1.15, - "learning_rate": 1.4158131157290803e-06, - "loss": 0.6226, - "step": 44782 - }, - { - "epoch": 1.15, - "learning_rate": 1.4157879506733166e-06, - "loss": 0.7715, - "step": 44783 - }, - { - "epoch": 1.15, - "learning_rate": 1.4157627852992028e-06, - "loss": 0.6025, - "step": 44784 - }, - { - "epoch": 1.15, - "learning_rate": 1.4157376196067594e-06, - "loss": 0.6602, - "step": 44785 - }, - { - "epoch": 1.15, - "learning_rate": 1.4157124535960044e-06, - "loss": 0.749, - "step": 44786 - }, - { - "epoch": 1.15, - "learning_rate": 1.4156872872669575e-06, - "loss": 0.3882, - "step": 44787 - }, - { - "epoch": 1.15, - "learning_rate": 1.4156621206196375e-06, - "loss": 0.6631, - "step": 44788 - }, - { - "epoch": 1.15, - "learning_rate": 1.4156369536540646e-06, - "loss": 0.606, - "step": 44789 - }, - { - "epoch": 1.15, - "learning_rate": 1.4156117863702576e-06, - "loss": 0.7324, - "step": 44790 - }, - { - "epoch": 1.15, - "learning_rate": 1.4155866187682358e-06, - "loss": 0.6973, - "step": 44791 - }, - { - "epoch": 1.15, - "learning_rate": 1.4155614508480182e-06, - "loss": 0.6738, - "step": 44792 - }, - { - "epoch": 1.15, - "learning_rate": 1.4155362826096244e-06, - "loss": 0.6904, - "step": 44793 - }, - { - "epoch": 1.15, - "learning_rate": 1.4155111140530735e-06, - "loss": 0.7354, - "step": 44794 - }, - { - "epoch": 1.15, - "learning_rate": 1.415485945178385e-06, - "loss": 0.6372, - "step": 44795 - }, - { - "epoch": 1.15, - "learning_rate": 1.4154607759855778e-06, - "loss": 0.8086, - "step": 44796 - }, - { - "epoch": 1.15, - "learning_rate": 1.4154356064746718e-06, - "loss": 0.7168, - "step": 44797 - }, - { - "epoch": 1.15, - "learning_rate": 1.4154104366456854e-06, - "loss": 0.7656, - "step": 44798 - }, - { - "epoch": 1.15, - "learning_rate": 1.4153852664986385e-06, - "loss": 0.8057, - "step": 44799 - }, - { - "epoch": 1.15, - "learning_rate": 1.4153600960335505e-06, - "loss": 0.6802, - "step": 44800 - }, - { - "epoch": 1.15, - "learning_rate": 1.4153349252504399e-06, - "loss": 0.7695, - "step": 44801 - }, - { - "epoch": 1.15, - "learning_rate": 1.4153097541493267e-06, - "loss": 0.6758, - "step": 44802 - }, - { - "epoch": 1.15, - "learning_rate": 1.4152845827302299e-06, - "loss": 0.5994, - "step": 44803 - }, - { - "epoch": 1.15, - "learning_rate": 1.4152594109931685e-06, - "loss": 0.606, - "step": 44804 - }, - { - "epoch": 1.15, - "learning_rate": 1.4152342389381626e-06, - "loss": 0.5669, - "step": 44805 - }, - { - "epoch": 1.15, - "learning_rate": 1.4152090665652307e-06, - "loss": 0.7529, - "step": 44806 - }, - { - "epoch": 1.15, - "learning_rate": 1.415183893874392e-06, - "loss": 0.6333, - "step": 44807 - }, - { - "epoch": 1.15, - "learning_rate": 1.4151587208656666e-06, - "loss": 0.6719, - "step": 44808 - }, - { - "epoch": 1.15, - "learning_rate": 1.4151335475390728e-06, - "loss": 0.5396, - "step": 44809 - }, - { - "epoch": 1.15, - "learning_rate": 1.4151083738946307e-06, - "loss": 0.6763, - "step": 44810 - }, - { - "epoch": 1.15, - "learning_rate": 1.4150831999323592e-06, - "loss": 0.6016, - "step": 44811 - }, - { - "epoch": 1.15, - "learning_rate": 1.4150580256522773e-06, - "loss": 0.6423, - "step": 44812 - }, - { - "epoch": 1.15, - "learning_rate": 1.4150328510544048e-06, - "loss": 0.519, - "step": 44813 - }, - { - "epoch": 1.15, - "learning_rate": 1.4150076761387606e-06, - "loss": 0.5471, - "step": 44814 - }, - { - "epoch": 1.15, - "learning_rate": 1.414982500905364e-06, - "loss": 0.6836, - "step": 44815 - }, - { - "epoch": 1.15, - "learning_rate": 1.4149573253542344e-06, - "loss": 0.4561, - "step": 44816 - }, - { - "epoch": 1.15, - "learning_rate": 1.4149321494853912e-06, - "loss": 0.6196, - "step": 44817 - }, - { - "epoch": 1.15, - "learning_rate": 1.4149069732988535e-06, - "loss": 0.5215, - "step": 44818 - }, - { - "epoch": 1.15, - "learning_rate": 1.4148817967946404e-06, - "loss": 0.6406, - "step": 44819 - }, - { - "epoch": 1.15, - "learning_rate": 1.4148566199727719e-06, - "loss": 0.6455, - "step": 44820 - }, - { - "epoch": 1.15, - "learning_rate": 1.4148314428332665e-06, - "loss": 0.6038, - "step": 44821 - }, - { - "epoch": 1.15, - "learning_rate": 1.4148062653761434e-06, - "loss": 0.707, - "step": 44822 - }, - { - "epoch": 1.15, - "learning_rate": 1.4147810876014225e-06, - "loss": 0.7695, - "step": 44823 - }, - { - "epoch": 1.15, - "learning_rate": 1.4147559095091227e-06, - "loss": 0.6279, - "step": 44824 - }, - { - "epoch": 1.15, - "learning_rate": 1.4147307310992638e-06, - "loss": 0.8379, - "step": 44825 - }, - { - "epoch": 1.15, - "learning_rate": 1.414705552371864e-06, - "loss": 0.7559, - "step": 44826 - }, - { - "epoch": 1.15, - "learning_rate": 1.4146803733269437e-06, - "loss": 0.5786, - "step": 44827 - }, - { - "epoch": 1.15, - "learning_rate": 1.4146551939645215e-06, - "loss": 0.6577, - "step": 44828 - }, - { - "epoch": 1.15, - "learning_rate": 1.4146300142846168e-06, - "loss": 0.6104, - "step": 44829 - }, - { - "epoch": 1.15, - "learning_rate": 1.4146048342872491e-06, - "loss": 0.6387, - "step": 44830 - }, - { - "epoch": 1.15, - "learning_rate": 1.4145796539724376e-06, - "loss": 0.6475, - "step": 44831 - }, - { - "epoch": 1.15, - "learning_rate": 1.4145544733402016e-06, - "loss": 0.7305, - "step": 44832 - }, - { - "epoch": 1.15, - "learning_rate": 1.41452929239056e-06, - "loss": 0.7246, - "step": 44833 - }, - { - "epoch": 1.15, - "learning_rate": 1.4145041111235325e-06, - "loss": 0.418, - "step": 44834 - }, - { - "epoch": 1.15, - "learning_rate": 1.4144789295391385e-06, - "loss": 0.447, - "step": 44835 - }, - { - "epoch": 1.15, - "learning_rate": 1.4144537476373967e-06, - "loss": 0.6475, - "step": 44836 - }, - { - "epoch": 1.15, - "learning_rate": 1.414428565418327e-06, - "loss": 0.5347, - "step": 44837 - }, - { - "epoch": 1.15, - "learning_rate": 1.4144033828819482e-06, - "loss": 0.6025, - "step": 44838 - }, - { - "epoch": 1.15, - "learning_rate": 1.4143782000282798e-06, - "loss": 0.4529, - "step": 44839 - }, - { - "epoch": 1.15, - "learning_rate": 1.4143530168573411e-06, - "loss": 0.6343, - "step": 44840 - }, - { - "epoch": 1.15, - "learning_rate": 1.4143278333691514e-06, - "loss": 0.6143, - "step": 44841 - }, - { - "epoch": 1.15, - "learning_rate": 1.41430264956373e-06, - "loss": 0.5972, - "step": 44842 - }, - { - "epoch": 1.15, - "learning_rate": 1.4142774654410958e-06, - "loss": 0.5928, - "step": 44843 - }, - { - "epoch": 1.15, - "learning_rate": 1.4142522810012686e-06, - "loss": 0.7119, - "step": 44844 - }, - { - "epoch": 1.15, - "learning_rate": 1.4142270962442676e-06, - "loss": 0.6992, - "step": 44845 - }, - { - "epoch": 1.15, - "learning_rate": 1.4142019111701117e-06, - "loss": 0.8701, - "step": 44846 - }, - { - "epoch": 1.15, - "learning_rate": 1.4141767257788206e-06, - "loss": 0.709, - "step": 44847 - }, - { - "epoch": 1.15, - "learning_rate": 1.4141515400704136e-06, - "loss": 0.4609, - "step": 44848 - }, - { - "epoch": 1.15, - "learning_rate": 1.4141263540449093e-06, - "loss": 0.6179, - "step": 44849 - }, - { - "epoch": 1.15, - "learning_rate": 1.414101167702328e-06, - "loss": 0.6387, - "step": 44850 - }, - { - "epoch": 1.15, - "learning_rate": 1.4140759810426883e-06, - "loss": 0.7266, - "step": 44851 - }, - { - "epoch": 1.15, - "learning_rate": 1.4140507940660097e-06, - "loss": 0.6436, - "step": 44852 - }, - { - "epoch": 1.15, - "learning_rate": 1.4140256067723112e-06, - "loss": 0.6084, - "step": 44853 - }, - { - "epoch": 1.15, - "learning_rate": 1.4140004191616127e-06, - "loss": 0.5122, - "step": 44854 - }, - { - "epoch": 1.15, - "learning_rate": 1.413975231233933e-06, - "loss": 0.7461, - "step": 44855 - }, - { - "epoch": 1.15, - "learning_rate": 1.4139500429892915e-06, - "loss": 0.521, - "step": 44856 - }, - { - "epoch": 1.15, - "learning_rate": 1.4139248544277073e-06, - "loss": 0.6025, - "step": 44857 - }, - { - "epoch": 1.15, - "learning_rate": 1.4138996655492e-06, - "loss": 0.7109, - "step": 44858 - }, - { - "epoch": 1.15, - "learning_rate": 1.4138744763537884e-06, - "loss": 0.5225, - "step": 44859 - }, - { - "epoch": 1.15, - "learning_rate": 1.4138492868414927e-06, - "loss": 0.6436, - "step": 44860 - }, - { - "epoch": 1.15, - "learning_rate": 1.4138240970123315e-06, - "loss": 0.6074, - "step": 44861 - }, - { - "epoch": 1.15, - "learning_rate": 1.4137989068663239e-06, - "loss": 0.5435, - "step": 44862 - }, - { - "epoch": 1.15, - "learning_rate": 1.4137737164034897e-06, - "loss": 0.5798, - "step": 44863 - }, - { - "epoch": 1.15, - "learning_rate": 1.413748525623848e-06, - "loss": 0.6836, - "step": 44864 - }, - { - "epoch": 1.15, - "learning_rate": 1.4137233345274185e-06, - "loss": 0.6445, - "step": 44865 - }, - { - "epoch": 1.15, - "learning_rate": 1.4136981431142195e-06, - "loss": 0.4985, - "step": 44866 - }, - { - "epoch": 1.15, - "learning_rate": 1.413672951384271e-06, - "loss": 0.603, - "step": 44867 - }, - { - "epoch": 1.15, - "learning_rate": 1.4136477593375922e-06, - "loss": 0.5757, - "step": 44868 - }, - { - "epoch": 1.15, - "learning_rate": 1.4136225669742023e-06, - "loss": 0.5835, - "step": 44869 - }, - { - "epoch": 1.15, - "learning_rate": 1.4135973742941207e-06, - "loss": 0.6582, - "step": 44870 - }, - { - "epoch": 1.15, - "learning_rate": 1.4135721812973667e-06, - "loss": 0.7266, - "step": 44871 - }, - { - "epoch": 1.15, - "learning_rate": 1.413546987983959e-06, - "loss": 0.562, - "step": 44872 - }, - { - "epoch": 1.15, - "learning_rate": 1.4135217943539179e-06, - "loss": 0.6924, - "step": 44873 - }, - { - "epoch": 1.15, - "learning_rate": 1.4134966004072618e-06, - "loss": 0.5381, - "step": 44874 - }, - { - "epoch": 1.15, - "learning_rate": 1.4134714061440108e-06, - "loss": 0.6934, - "step": 44875 - }, - { - "epoch": 1.15, - "learning_rate": 1.4134462115641834e-06, - "loss": 0.6934, - "step": 44876 - }, - { - "epoch": 1.15, - "learning_rate": 1.4134210166677994e-06, - "loss": 0.646, - "step": 44877 - }, - { - "epoch": 1.15, - "learning_rate": 1.4133958214548777e-06, - "loss": 0.5903, - "step": 44878 - }, - { - "epoch": 1.15, - "learning_rate": 1.413370625925438e-06, - "loss": 0.6948, - "step": 44879 - }, - { - "epoch": 1.15, - "learning_rate": 1.4133454300794995e-06, - "loss": 0.6272, - "step": 44880 - }, - { - "epoch": 1.15, - "learning_rate": 1.4133202339170814e-06, - "loss": 0.7607, - "step": 44881 - }, - { - "epoch": 1.15, - "learning_rate": 1.413295037438203e-06, - "loss": 0.7949, - "step": 44882 - }, - { - "epoch": 1.15, - "learning_rate": 1.4132698406428836e-06, - "loss": 0.4907, - "step": 44883 - }, - { - "epoch": 1.15, - "learning_rate": 1.4132446435311423e-06, - "loss": 0.7646, - "step": 44884 - }, - { - "epoch": 1.15, - "learning_rate": 1.4132194461029987e-06, - "loss": 0.6804, - "step": 44885 - }, - { - "epoch": 1.15, - "learning_rate": 1.4131942483584721e-06, - "loss": 0.6172, - "step": 44886 - }, - { - "epoch": 1.15, - "learning_rate": 1.4131690502975816e-06, - "loss": 0.6387, - "step": 44887 - }, - { - "epoch": 1.15, - "learning_rate": 1.4131438519203464e-06, - "loss": 0.6758, - "step": 44888 - }, - { - "epoch": 1.15, - "learning_rate": 1.4131186532267857e-06, - "loss": 0.6489, - "step": 44889 - }, - { - "epoch": 1.15, - "learning_rate": 1.4130934542169199e-06, - "loss": 0.5928, - "step": 44890 - }, - { - "epoch": 1.15, - "learning_rate": 1.4130682548907669e-06, - "loss": 0.6812, - "step": 44891 - }, - { - "epoch": 1.15, - "learning_rate": 1.4130430552483465e-06, - "loss": 0.668, - "step": 44892 - }, - { - "epoch": 1.15, - "learning_rate": 1.413017855289678e-06, - "loss": 0.6514, - "step": 44893 - }, - { - "epoch": 1.15, - "learning_rate": 1.4129926550147807e-06, - "loss": 0.5815, - "step": 44894 - }, - { - "epoch": 1.15, - "learning_rate": 1.4129674544236742e-06, - "loss": 0.8105, - "step": 44895 - }, - { - "epoch": 1.15, - "learning_rate": 1.4129422535163772e-06, - "loss": 0.5151, - "step": 44896 - }, - { - "epoch": 1.15, - "learning_rate": 1.4129170522929094e-06, - "loss": 0.5864, - "step": 44897 - }, - { - "epoch": 1.15, - "learning_rate": 1.4128918507532903e-06, - "loss": 0.7764, - "step": 44898 - }, - { - "epoch": 1.15, - "learning_rate": 1.4128666488975385e-06, - "loss": 0.7812, - "step": 44899 - }, - { - "epoch": 1.15, - "learning_rate": 1.412841446725674e-06, - "loss": 0.585, - "step": 44900 - }, - { - "epoch": 1.15, - "learning_rate": 1.4128162442377157e-06, - "loss": 0.6689, - "step": 44901 - }, - { - "epoch": 1.15, - "learning_rate": 1.4127910414336828e-06, - "loss": 0.752, - "step": 44902 - }, - { - "epoch": 1.15, - "learning_rate": 1.4127658383135947e-06, - "loss": 0.7695, - "step": 44903 - }, - { - "epoch": 1.15, - "learning_rate": 1.412740634877471e-06, - "loss": 0.5869, - "step": 44904 - }, - { - "epoch": 1.15, - "learning_rate": 1.4127154311253308e-06, - "loss": 0.8359, - "step": 44905 - }, - { - "epoch": 1.15, - "learning_rate": 1.4126902270571932e-06, - "loss": 0.6348, - "step": 44906 - }, - { - "epoch": 1.15, - "learning_rate": 1.4126650226730776e-06, - "loss": 0.4883, - "step": 44907 - }, - { - "epoch": 1.15, - "learning_rate": 1.4126398179730034e-06, - "loss": 0.6826, - "step": 44908 - }, - { - "epoch": 1.15, - "learning_rate": 1.4126146129569902e-06, - "loss": 0.6758, - "step": 44909 - }, - { - "epoch": 1.15, - "learning_rate": 1.4125894076250568e-06, - "loss": 0.6885, - "step": 44910 - }, - { - "epoch": 1.15, - "learning_rate": 1.4125642019772226e-06, - "loss": 0.7012, - "step": 44911 - }, - { - "epoch": 1.15, - "learning_rate": 1.412538996013507e-06, - "loss": 0.605, - "step": 44912 - }, - { - "epoch": 1.15, - "learning_rate": 1.4125137897339292e-06, - "loss": 0.5356, - "step": 44913 - }, - { - "epoch": 1.15, - "learning_rate": 1.4124885831385085e-06, - "loss": 0.5957, - "step": 44914 - }, - { - "epoch": 1.15, - "learning_rate": 1.4124633762272646e-06, - "loss": 0.5806, - "step": 44915 - }, - { - "epoch": 1.15, - "learning_rate": 1.4124381690002163e-06, - "loss": 0.6846, - "step": 44916 - }, - { - "epoch": 1.15, - "learning_rate": 1.4124129614573827e-06, - "loss": 0.7397, - "step": 44917 - }, - { - "epoch": 1.15, - "learning_rate": 1.4123877535987839e-06, - "loss": 0.6572, - "step": 44918 - }, - { - "epoch": 1.15, - "learning_rate": 1.4123625454244385e-06, - "loss": 0.6577, - "step": 44919 - }, - { - "epoch": 1.15, - "learning_rate": 1.4123373369343662e-06, - "loss": 0.6489, - "step": 44920 - }, - { - "epoch": 1.15, - "learning_rate": 1.4123121281285863e-06, - "loss": 0.6836, - "step": 44921 - }, - { - "epoch": 1.15, - "learning_rate": 1.4122869190071175e-06, - "loss": 0.5425, - "step": 44922 - }, - { - "epoch": 1.15, - "learning_rate": 1.41226170956998e-06, - "loss": 0.728, - "step": 44923 - }, - { - "epoch": 1.15, - "learning_rate": 1.4122364998171924e-06, - "loss": 0.6113, - "step": 44924 - }, - { - "epoch": 1.15, - "learning_rate": 1.4122112897487744e-06, - "loss": 0.5396, - "step": 44925 - }, - { - "epoch": 1.15, - "learning_rate": 1.412186079364745e-06, - "loss": 0.7715, - "step": 44926 - }, - { - "epoch": 1.15, - "learning_rate": 1.412160868665124e-06, - "loss": 0.6055, - "step": 44927 - }, - { - "epoch": 1.15, - "learning_rate": 1.4121356576499301e-06, - "loss": 0.7568, - "step": 44928 - }, - { - "epoch": 1.15, - "learning_rate": 1.4121104463191832e-06, - "loss": 0.7598, - "step": 44929 - }, - { - "epoch": 1.15, - "learning_rate": 1.412085234672902e-06, - "loss": 0.6138, - "step": 44930 - }, - { - "epoch": 1.15, - "learning_rate": 1.412060022711106e-06, - "loss": 0.623, - "step": 44931 - }, - { - "epoch": 1.15, - "learning_rate": 1.4120348104338148e-06, - "loss": 0.7607, - "step": 44932 - }, - { - "epoch": 1.15, - "learning_rate": 1.4120095978410471e-06, - "loss": 0.4796, - "step": 44933 - }, - { - "epoch": 1.15, - "learning_rate": 1.411984384932823e-06, - "loss": 0.5295, - "step": 44934 - }, - { - "epoch": 1.15, - "learning_rate": 1.4119591717091614e-06, - "loss": 0.7773, - "step": 44935 - }, - { - "epoch": 1.15, - "learning_rate": 1.4119339581700818e-06, - "loss": 0.5801, - "step": 44936 - }, - { - "epoch": 1.15, - "learning_rate": 1.4119087443156027e-06, - "loss": 0.5203, - "step": 44937 - }, - { - "epoch": 1.15, - "learning_rate": 1.4118835301457443e-06, - "loss": 0.6309, - "step": 44938 - }, - { - "epoch": 1.15, - "learning_rate": 1.4118583156605257e-06, - "loss": 0.7578, - "step": 44939 - }, - { - "epoch": 1.15, - "learning_rate": 1.4118331008599663e-06, - "loss": 0.7061, - "step": 44940 - }, - { - "epoch": 1.15, - "learning_rate": 1.4118078857440849e-06, - "loss": 0.6953, - "step": 44941 - }, - { - "epoch": 1.15, - "learning_rate": 1.4117826703129012e-06, - "loss": 0.7441, - "step": 44942 - }, - { - "epoch": 1.15, - "learning_rate": 1.4117574545664344e-06, - "loss": 0.6304, - "step": 44943 - }, - { - "epoch": 1.15, - "learning_rate": 1.4117322385047042e-06, - "loss": 0.6494, - "step": 44944 - }, - { - "epoch": 1.15, - "learning_rate": 1.4117070221277292e-06, - "loss": 0.646, - "step": 44945 - }, - { - "epoch": 1.15, - "learning_rate": 1.4116818054355292e-06, - "loss": 0.7266, - "step": 44946 - }, - { - "epoch": 1.15, - "learning_rate": 1.4116565884281233e-06, - "loss": 0.7422, - "step": 44947 - }, - { - "epoch": 1.15, - "learning_rate": 1.411631371105531e-06, - "loss": 0.6694, - "step": 44948 - }, - { - "epoch": 1.15, - "learning_rate": 1.4116061534677711e-06, - "loss": 0.7627, - "step": 44949 - }, - { - "epoch": 1.15, - "learning_rate": 1.4115809355148638e-06, - "loss": 0.5083, - "step": 44950 - }, - { - "epoch": 1.15, - "learning_rate": 1.4115557172468275e-06, - "loss": 0.7646, - "step": 44951 - }, - { - "epoch": 1.15, - "learning_rate": 1.4115304986636823e-06, - "loss": 0.5598, - "step": 44952 - }, - { - "epoch": 1.15, - "learning_rate": 1.4115052797654467e-06, - "loss": 0.647, - "step": 44953 - }, - { - "epoch": 1.15, - "learning_rate": 1.4114800605521408e-06, - "loss": 0.6875, - "step": 44954 - }, - { - "epoch": 1.15, - "learning_rate": 1.4114548410237833e-06, - "loss": 0.6279, - "step": 44955 - }, - { - "epoch": 1.15, - "learning_rate": 1.411429621180394e-06, - "loss": 0.5518, - "step": 44956 - }, - { - "epoch": 1.15, - "learning_rate": 1.4114044010219917e-06, - "loss": 0.8145, - "step": 44957 - }, - { - "epoch": 1.15, - "learning_rate": 1.411379180548596e-06, - "loss": 0.6182, - "step": 44958 - }, - { - "epoch": 1.15, - "learning_rate": 1.4113539597602264e-06, - "loss": 0.5605, - "step": 44959 - }, - { - "epoch": 1.15, - "learning_rate": 1.411328738656902e-06, - "loss": 0.7637, - "step": 44960 - }, - { - "epoch": 1.15, - "learning_rate": 1.4113035172386419e-06, - "loss": 0.6934, - "step": 44961 - }, - { - "epoch": 1.15, - "learning_rate": 1.4112782955054653e-06, - "loss": 0.6816, - "step": 44962 - }, - { - "epoch": 1.15, - "learning_rate": 1.4112530734573924e-06, - "loss": 0.7354, - "step": 44963 - }, - { - "epoch": 1.15, - "learning_rate": 1.4112278510944415e-06, - "loss": 0.6572, - "step": 44964 - }, - { - "epoch": 1.15, - "learning_rate": 1.4112026284166328e-06, - "loss": 0.5806, - "step": 44965 - }, - { - "epoch": 1.15, - "learning_rate": 1.4111774054239847e-06, - "loss": 0.5698, - "step": 44966 - }, - { - "epoch": 1.15, - "learning_rate": 1.4111521821165173e-06, - "loss": 0.5557, - "step": 44967 - }, - { - "epoch": 1.15, - "learning_rate": 1.4111269584942491e-06, - "loss": 0.7109, - "step": 44968 - }, - { - "epoch": 1.15, - "learning_rate": 1.4111017345572006e-06, - "loss": 0.5967, - "step": 44969 - }, - { - "epoch": 1.15, - "learning_rate": 1.41107651030539e-06, - "loss": 0.5447, - "step": 44970 - }, - { - "epoch": 1.15, - "learning_rate": 1.411051285738837e-06, - "loss": 0.7158, - "step": 44971 - }, - { - "epoch": 1.15, - "learning_rate": 1.4110260608575607e-06, - "loss": 0.8164, - "step": 44972 - }, - { - "epoch": 1.15, - "learning_rate": 1.4110008356615813e-06, - "loss": 0.7266, - "step": 44973 - }, - { - "epoch": 1.15, - "learning_rate": 1.4109756101509169e-06, - "loss": 0.6113, - "step": 44974 - }, - { - "epoch": 1.15, - "learning_rate": 1.4109503843255875e-06, - "loss": 0.5991, - "step": 44975 - }, - { - "epoch": 1.15, - "learning_rate": 1.4109251581856123e-06, - "loss": 0.5947, - "step": 44976 - }, - { - "epoch": 1.15, - "learning_rate": 1.4108999317310106e-06, - "loss": 0.8076, - "step": 44977 - }, - { - "epoch": 1.15, - "learning_rate": 1.410874704961802e-06, - "loss": 0.6582, - "step": 44978 - }, - { - "epoch": 1.15, - "learning_rate": 1.4108494778780048e-06, - "loss": 0.665, - "step": 44979 - }, - { - "epoch": 1.15, - "learning_rate": 1.41082425047964e-06, - "loss": 0.5928, - "step": 44980 - }, - { - "epoch": 1.15, - "learning_rate": 1.4107990227667255e-06, - "loss": 0.5574, - "step": 44981 - }, - { - "epoch": 1.15, - "learning_rate": 1.410773794739281e-06, - "loss": 0.6929, - "step": 44982 - }, - { - "epoch": 1.15, - "learning_rate": 1.4107485663973257e-06, - "loss": 0.5396, - "step": 44983 - }, - { - "epoch": 1.15, - "learning_rate": 1.4107233377408796e-06, - "loss": 0.7217, - "step": 44984 - }, - { - "epoch": 1.15, - "learning_rate": 1.4106981087699614e-06, - "loss": 0.6221, - "step": 44985 - }, - { - "epoch": 1.15, - "learning_rate": 1.4106728794845904e-06, - "loss": 0.7617, - "step": 44986 - }, - { - "epoch": 1.15, - "learning_rate": 1.410647649884786e-06, - "loss": 0.7256, - "step": 44987 - }, - { - "epoch": 1.15, - "learning_rate": 1.4106224199705678e-06, - "loss": 0.5981, - "step": 44988 - }, - { - "epoch": 1.15, - "learning_rate": 1.4105971897419547e-06, - "loss": 0.7051, - "step": 44989 - }, - { - "epoch": 1.15, - "learning_rate": 1.4105719591989665e-06, - "loss": 0.6011, - "step": 44990 - }, - { - "epoch": 1.15, - "learning_rate": 1.410546728341622e-06, - "loss": 0.5747, - "step": 44991 - }, - { - "epoch": 1.15, - "learning_rate": 1.4105214971699407e-06, - "loss": 0.6455, - "step": 44992 - }, - { - "epoch": 1.15, - "learning_rate": 1.4104962656839418e-06, - "loss": 0.7563, - "step": 44993 - }, - { - "epoch": 1.15, - "learning_rate": 1.4104710338836452e-06, - "loss": 0.6841, - "step": 44994 - }, - { - "epoch": 1.15, - "learning_rate": 1.4104458017690696e-06, - "loss": 0.7246, - "step": 44995 - }, - { - "epoch": 1.15, - "learning_rate": 1.4104205693402346e-06, - "loss": 0.5278, - "step": 44996 - }, - { - "epoch": 1.15, - "learning_rate": 1.4103953365971592e-06, - "loss": 0.5007, - "step": 44997 - }, - { - "epoch": 1.15, - "learning_rate": 1.4103701035398632e-06, - "loss": 0.6885, - "step": 44998 - }, - { - "epoch": 1.15, - "learning_rate": 1.4103448701683656e-06, - "loss": 0.6797, - "step": 44999 - }, - { - "epoch": 1.15, - "learning_rate": 1.410319636482686e-06, - "loss": 0.6338, - "step": 45000 - }, - { - "epoch": 1.15, - "learning_rate": 1.4102944024828434e-06, - "loss": 0.6562, - "step": 45001 - }, - { - "epoch": 1.15, - "learning_rate": 1.410269168168857e-06, - "loss": 0.5942, - "step": 45002 - }, - { - "epoch": 1.15, - "learning_rate": 1.4102439335407466e-06, - "loss": 0.6252, - "step": 45003 - }, - { - "epoch": 1.15, - "learning_rate": 1.410218698598531e-06, - "loss": 0.7583, - "step": 45004 - }, - { - "epoch": 1.15, - "learning_rate": 1.4101934633422303e-06, - "loss": 0.5679, - "step": 45005 - }, - { - "epoch": 1.15, - "learning_rate": 1.410168227771863e-06, - "loss": 0.6484, - "step": 45006 - }, - { - "epoch": 1.15, - "learning_rate": 1.410142991887449e-06, - "loss": 0.5605, - "step": 45007 - }, - { - "epoch": 1.15, - "learning_rate": 1.4101177556890069e-06, - "loss": 0.6035, - "step": 45008 - }, - { - "epoch": 1.15, - "learning_rate": 1.410092519176557e-06, - "loss": 0.5923, - "step": 45009 - }, - { - "epoch": 1.15, - "learning_rate": 1.4100672823501179e-06, - "loss": 0.7168, - "step": 45010 - }, - { - "epoch": 1.15, - "learning_rate": 1.410042045209709e-06, - "loss": 0.6016, - "step": 45011 - }, - { - "epoch": 1.15, - "learning_rate": 1.4100168077553498e-06, - "loss": 0.4954, - "step": 45012 - }, - { - "epoch": 1.15, - "learning_rate": 1.4099915699870598e-06, - "loss": 0.5942, - "step": 45013 - }, - { - "epoch": 1.15, - "learning_rate": 1.4099663319048578e-06, - "loss": 0.5781, - "step": 45014 - }, - { - "epoch": 1.15, - "learning_rate": 1.4099410935087637e-06, - "loss": 0.6719, - "step": 45015 - }, - { - "epoch": 1.15, - "learning_rate": 1.4099158547987965e-06, - "loss": 0.7363, - "step": 45016 - }, - { - "epoch": 1.15, - "learning_rate": 1.4098906157749756e-06, - "loss": 0.6924, - "step": 45017 - }, - { - "epoch": 1.15, - "learning_rate": 1.4098653764373204e-06, - "loss": 0.6357, - "step": 45018 - }, - { - "epoch": 1.15, - "learning_rate": 1.4098401367858496e-06, - "loss": 0.6235, - "step": 45019 - }, - { - "epoch": 1.15, - "learning_rate": 1.4098148968205836e-06, - "loss": 0.6738, - "step": 45020 - }, - { - "epoch": 1.15, - "learning_rate": 1.409789656541541e-06, - "loss": 0.6016, - "step": 45021 - }, - { - "epoch": 1.15, - "learning_rate": 1.4097644159487415e-06, - "loss": 0.5259, - "step": 45022 - }, - { - "epoch": 1.15, - "learning_rate": 1.4097391750422038e-06, - "loss": 0.4688, - "step": 45023 - }, - { - "epoch": 1.15, - "learning_rate": 1.409713933821948e-06, - "loss": 0.833, - "step": 45024 - }, - { - "epoch": 1.15, - "learning_rate": 1.409688692287993e-06, - "loss": 0.6904, - "step": 45025 - }, - { - "epoch": 1.15, - "learning_rate": 1.4096634504403582e-06, - "loss": 0.6914, - "step": 45026 - }, - { - "epoch": 1.15, - "learning_rate": 1.4096382082790628e-06, - "loss": 0.6416, - "step": 45027 - }, - { - "epoch": 1.15, - "learning_rate": 1.4096129658041262e-06, - "loss": 0.7256, - "step": 45028 - }, - { - "epoch": 1.15, - "learning_rate": 1.4095877230155679e-06, - "loss": 0.6528, - "step": 45029 - }, - { - "epoch": 1.15, - "learning_rate": 1.4095624799134075e-06, - "loss": 0.5918, - "step": 45030 - }, - { - "epoch": 1.15, - "learning_rate": 1.4095372364976634e-06, - "loss": 0.6865, - "step": 45031 - }, - { - "epoch": 1.15, - "learning_rate": 1.4095119927683558e-06, - "loss": 0.4747, - "step": 45032 - }, - { - "epoch": 1.15, - "learning_rate": 1.4094867487255036e-06, - "loss": 0.7725, - "step": 45033 - }, - { - "epoch": 1.15, - "learning_rate": 1.409461504369126e-06, - "loss": 0.4197, - "step": 45034 - }, - { - "epoch": 1.15, - "learning_rate": 1.4094362596992428e-06, - "loss": 0.6289, - "step": 45035 - }, - { - "epoch": 1.15, - "learning_rate": 1.4094110147158732e-06, - "loss": 0.5137, - "step": 45036 - }, - { - "epoch": 1.15, - "learning_rate": 1.409385769419036e-06, - "loss": 0.5521, - "step": 45037 - }, - { - "epoch": 1.15, - "learning_rate": 1.4093605238087514e-06, - "loss": 0.562, - "step": 45038 - }, - { - "epoch": 1.15, - "learning_rate": 1.4093352778850378e-06, - "loss": 0.4897, - "step": 45039 - }, - { - "epoch": 1.15, - "learning_rate": 1.4093100316479155e-06, - "loss": 0.3964, - "step": 45040 - }, - { - "epoch": 1.15, - "learning_rate": 1.409284785097403e-06, - "loss": 0.6313, - "step": 45041 - }, - { - "epoch": 1.15, - "learning_rate": 1.40925953823352e-06, - "loss": 0.7183, - "step": 45042 - }, - { - "epoch": 1.15, - "learning_rate": 1.4092342910562857e-06, - "loss": 0.533, - "step": 45043 - }, - { - "epoch": 1.15, - "learning_rate": 1.4092090435657196e-06, - "loss": 0.6636, - "step": 45044 - }, - { - "epoch": 1.15, - "learning_rate": 1.4091837957618413e-06, - "loss": 0.748, - "step": 45045 - }, - { - "epoch": 1.15, - "learning_rate": 1.4091585476446694e-06, - "loss": 0.7842, - "step": 45046 - }, - { - "epoch": 1.15, - "learning_rate": 1.4091332992142237e-06, - "loss": 0.5273, - "step": 45047 - }, - { - "epoch": 1.15, - "learning_rate": 1.4091080504705236e-06, - "loss": 0.8467, - "step": 45048 - }, - { - "epoch": 1.15, - "learning_rate": 1.409082801413588e-06, - "loss": 0.5986, - "step": 45049 - }, - { - "epoch": 1.15, - "learning_rate": 1.4090575520434366e-06, - "loss": 0.7549, - "step": 45050 - }, - { - "epoch": 1.15, - "learning_rate": 1.4090323023600888e-06, - "loss": 0.7793, - "step": 45051 - }, - { - "epoch": 1.15, - "learning_rate": 1.4090070523635636e-06, - "loss": 0.667, - "step": 45052 - }, - { - "epoch": 1.15, - "learning_rate": 1.4089818020538804e-06, - "loss": 0.71, - "step": 45053 - }, - { - "epoch": 1.15, - "learning_rate": 1.408956551431059e-06, - "loss": 0.6108, - "step": 45054 - }, - { - "epoch": 1.15, - "learning_rate": 1.4089313004951183e-06, - "loss": 0.4354, - "step": 45055 - }, - { - "epoch": 1.15, - "learning_rate": 1.4089060492460775e-06, - "loss": 0.7607, - "step": 45056 - }, - { - "epoch": 1.15, - "learning_rate": 1.4088807976839561e-06, - "loss": 0.54, - "step": 45057 - }, - { - "epoch": 1.15, - "learning_rate": 1.4088555458087735e-06, - "loss": 0.6904, - "step": 45058 - }, - { - "epoch": 1.15, - "learning_rate": 1.408830293620549e-06, - "loss": 0.7412, - "step": 45059 - }, - { - "epoch": 1.15, - "learning_rate": 1.4088050411193022e-06, - "loss": 0.6089, - "step": 45060 - }, - { - "epoch": 1.15, - "learning_rate": 1.4087797883050518e-06, - "loss": 0.5427, - "step": 45061 - }, - { - "epoch": 1.15, - "learning_rate": 1.408754535177818e-06, - "loss": 0.7285, - "step": 45062 - }, - { - "epoch": 1.15, - "learning_rate": 1.4087292817376193e-06, - "loss": 0.751, - "step": 45063 - }, - { - "epoch": 1.16, - "learning_rate": 1.4087040279844755e-06, - "loss": 0.6296, - "step": 45064 - }, - { - "epoch": 1.16, - "learning_rate": 1.4086787739184058e-06, - "loss": 0.7568, - "step": 45065 - }, - { - "epoch": 1.16, - "learning_rate": 1.4086535195394296e-06, - "loss": 0.6543, - "step": 45066 - }, - { - "epoch": 1.16, - "learning_rate": 1.4086282648475657e-06, - "loss": 0.8018, - "step": 45067 - }, - { - "epoch": 1.16, - "learning_rate": 1.4086030098428346e-06, - "loss": 0.7119, - "step": 45068 - }, - { - "epoch": 1.16, - "learning_rate": 1.4085777545252548e-06, - "loss": 0.7744, - "step": 45069 - }, - { - "epoch": 1.16, - "learning_rate": 1.4085524988948456e-06, - "loss": 0.5093, - "step": 45070 - }, - { - "epoch": 1.16, - "learning_rate": 1.4085272429516266e-06, - "loss": 0.6274, - "step": 45071 - }, - { - "epoch": 1.16, - "learning_rate": 1.4085019866956173e-06, - "loss": 0.7041, - "step": 45072 - }, - { - "epoch": 1.16, - "learning_rate": 1.4084767301268366e-06, - "loss": 0.6558, - "step": 45073 - }, - { - "epoch": 1.16, - "learning_rate": 1.4084514732453041e-06, - "loss": 0.7148, - "step": 45074 - }, - { - "epoch": 1.16, - "learning_rate": 1.4084262160510392e-06, - "loss": 0.7314, - "step": 45075 - }, - { - "epoch": 1.16, - "learning_rate": 1.408400958544061e-06, - "loss": 0.5225, - "step": 45076 - }, - { - "epoch": 1.16, - "learning_rate": 1.4083757007243886e-06, - "loss": 0.6602, - "step": 45077 - }, - { - "epoch": 1.16, - "learning_rate": 1.4083504425920423e-06, - "loss": 0.7168, - "step": 45078 - }, - { - "epoch": 1.16, - "learning_rate": 1.4083251841470407e-06, - "loss": 0.6443, - "step": 45079 - }, - { - "epoch": 1.16, - "learning_rate": 1.4082999253894033e-06, - "loss": 0.6348, - "step": 45080 - }, - { - "epoch": 1.16, - "learning_rate": 1.4082746663191492e-06, - "loss": 0.7334, - "step": 45081 - }, - { - "epoch": 1.16, - "learning_rate": 1.408249406936298e-06, - "loss": 0.666, - "step": 45082 - }, - { - "epoch": 1.16, - "learning_rate": 1.408224147240869e-06, - "loss": 0.6304, - "step": 45083 - }, - { - "epoch": 1.16, - "learning_rate": 1.4081988872328816e-06, - "loss": 0.5162, - "step": 45084 - }, - { - "epoch": 1.16, - "learning_rate": 1.4081736269123552e-06, - "loss": 0.6514, - "step": 45085 - }, - { - "epoch": 1.16, - "learning_rate": 1.4081483662793087e-06, - "loss": 0.6206, - "step": 45086 - }, - { - "epoch": 1.16, - "learning_rate": 1.408123105333762e-06, - "loss": 0.623, - "step": 45087 - }, - { - "epoch": 1.16, - "learning_rate": 1.4080978440757342e-06, - "loss": 0.6392, - "step": 45088 - }, - { - "epoch": 1.16, - "learning_rate": 1.4080725825052448e-06, - "loss": 0.6096, - "step": 45089 - }, - { - "epoch": 1.16, - "learning_rate": 1.4080473206223128e-06, - "loss": 0.6729, - "step": 45090 - }, - { - "epoch": 1.16, - "learning_rate": 1.4080220584269578e-06, - "loss": 0.7305, - "step": 45091 - }, - { - "epoch": 1.16, - "learning_rate": 1.407996795919199e-06, - "loss": 0.6318, - "step": 45092 - }, - { - "epoch": 1.16, - "learning_rate": 1.4079715330990557e-06, - "loss": 0.4385, - "step": 45093 - }, - { - "epoch": 1.16, - "learning_rate": 1.4079462699665477e-06, - "loss": 0.5986, - "step": 45094 - }, - { - "epoch": 1.16, - "learning_rate": 1.4079210065216938e-06, - "loss": 0.7402, - "step": 45095 - }, - { - "epoch": 1.16, - "learning_rate": 1.4078957427645132e-06, - "loss": 0.7148, - "step": 45096 - }, - { - "epoch": 1.16, - "learning_rate": 1.4078704786950263e-06, - "loss": 0.5693, - "step": 45097 - }, - { - "epoch": 1.16, - "learning_rate": 1.407845214313251e-06, - "loss": 0.7041, - "step": 45098 - }, - { - "epoch": 1.16, - "learning_rate": 1.4078199496192081e-06, - "loss": 0.7949, - "step": 45099 - }, - { - "epoch": 1.16, - "learning_rate": 1.4077946846129157e-06, - "loss": 0.6934, - "step": 45100 - }, - { - "epoch": 1.16, - "learning_rate": 1.407769419294394e-06, - "loss": 0.8213, - "step": 45101 - }, - { - "epoch": 1.16, - "learning_rate": 1.4077441536636614e-06, - "loss": 0.6963, - "step": 45102 - }, - { - "epoch": 1.16, - "learning_rate": 1.4077188877207385e-06, - "loss": 0.7139, - "step": 45103 - }, - { - "epoch": 1.16, - "learning_rate": 1.4076936214656438e-06, - "loss": 0.5791, - "step": 45104 - }, - { - "epoch": 1.16, - "learning_rate": 1.4076683548983965e-06, - "loss": 0.748, - "step": 45105 - }, - { - "epoch": 1.16, - "learning_rate": 1.4076430880190166e-06, - "loss": 0.5645, - "step": 45106 - }, - { - "epoch": 1.16, - "learning_rate": 1.4076178208275234e-06, - "loss": 0.5383, - "step": 45107 - }, - { - "epoch": 1.16, - "learning_rate": 1.4075925533239355e-06, - "loss": 0.5645, - "step": 45108 - }, - { - "epoch": 1.16, - "learning_rate": 1.407567285508273e-06, - "loss": 0.6084, - "step": 45109 - }, - { - "epoch": 1.16, - "learning_rate": 1.4075420173805549e-06, - "loss": 0.4785, - "step": 45110 - }, - { - "epoch": 1.16, - "learning_rate": 1.4075167489408004e-06, - "loss": 0.7051, - "step": 45111 - }, - { - "epoch": 1.16, - "learning_rate": 1.4074914801890293e-06, - "loss": 0.7529, - "step": 45112 - }, - { - "epoch": 1.16, - "learning_rate": 1.4074662111252607e-06, - "loss": 0.3707, - "step": 45113 - }, - { - "epoch": 1.16, - "learning_rate": 1.407440941749514e-06, - "loss": 0.6689, - "step": 45114 - }, - { - "epoch": 1.16, - "learning_rate": 1.4074156720618082e-06, - "loss": 0.7178, - "step": 45115 - }, - { - "epoch": 1.16, - "learning_rate": 1.4073904020621635e-06, - "loss": 0.6914, - "step": 45116 - }, - { - "epoch": 1.16, - "learning_rate": 1.4073651317505981e-06, - "loss": 0.624, - "step": 45117 - }, - { - "epoch": 1.16, - "learning_rate": 1.4073398611271324e-06, - "loss": 0.5703, - "step": 45118 - }, - { - "epoch": 1.16, - "learning_rate": 1.407314590191785e-06, - "loss": 0.6777, - "step": 45119 - }, - { - "epoch": 1.16, - "learning_rate": 1.4072893189445758e-06, - "loss": 0.7119, - "step": 45120 - }, - { - "epoch": 1.16, - "learning_rate": 1.4072640473855236e-06, - "loss": 0.7861, - "step": 45121 - }, - { - "epoch": 1.16, - "learning_rate": 1.4072387755146483e-06, - "loss": 0.7949, - "step": 45122 - }, - { - "epoch": 1.16, - "learning_rate": 1.407213503331969e-06, - "loss": 0.6846, - "step": 45123 - }, - { - "epoch": 1.16, - "learning_rate": 1.4071882308375052e-06, - "loss": 0.7373, - "step": 45124 - }, - { - "epoch": 1.16, - "learning_rate": 1.4071629580312756e-06, - "loss": 0.7109, - "step": 45125 - }, - { - "epoch": 1.16, - "learning_rate": 1.4071376849133003e-06, - "loss": 0.4751, - "step": 45126 - }, - { - "epoch": 1.16, - "learning_rate": 1.4071124114835983e-06, - "loss": 0.7168, - "step": 45127 - }, - { - "epoch": 1.16, - "learning_rate": 1.4070871377421894e-06, - "loss": 0.6377, - "step": 45128 - }, - { - "epoch": 1.16, - "learning_rate": 1.4070618636890923e-06, - "loss": 0.562, - "step": 45129 - }, - { - "epoch": 1.16, - "learning_rate": 1.4070365893243265e-06, - "loss": 0.7607, - "step": 45130 - }, - { - "epoch": 1.16, - "learning_rate": 1.4070113146479116e-06, - "loss": 0.6611, - "step": 45131 - }, - { - "epoch": 1.16, - "learning_rate": 1.406986039659867e-06, - "loss": 0.4856, - "step": 45132 - }, - { - "epoch": 1.16, - "learning_rate": 1.4069607643602118e-06, - "loss": 0.707, - "step": 45133 - }, - { - "epoch": 1.16, - "learning_rate": 1.4069354887489656e-06, - "loss": 0.5532, - "step": 45134 - }, - { - "epoch": 1.16, - "learning_rate": 1.4069102128261477e-06, - "loss": 0.6504, - "step": 45135 - }, - { - "epoch": 1.16, - "learning_rate": 1.4068849365917768e-06, - "loss": 0.6426, - "step": 45136 - }, - { - "epoch": 1.16, - "learning_rate": 1.4068596600458732e-06, - "loss": 0.5996, - "step": 45137 - }, - { - "epoch": 1.16, - "learning_rate": 1.4068343831884559e-06, - "loss": 0.6348, - "step": 45138 - }, - { - "epoch": 1.16, - "learning_rate": 1.4068091060195445e-06, - "loss": 0.3792, - "step": 45139 - }, - { - "epoch": 1.16, - "learning_rate": 1.4067838285391575e-06, - "loss": 0.7827, - "step": 45140 - }, - { - "epoch": 1.16, - "learning_rate": 1.4067585507473152e-06, - "loss": 0.4424, - "step": 45141 - }, - { - "epoch": 1.16, - "learning_rate": 1.4067332726440362e-06, - "loss": 0.604, - "step": 45142 - }, - { - "epoch": 1.16, - "learning_rate": 1.4067079942293405e-06, - "loss": 0.5859, - "step": 45143 - }, - { - "epoch": 1.16, - "learning_rate": 1.4066827155032472e-06, - "loss": 0.6279, - "step": 45144 - }, - { - "epoch": 1.16, - "learning_rate": 1.4066574364657758e-06, - "loss": 0.7188, - "step": 45145 - }, - { - "epoch": 1.16, - "learning_rate": 1.4066321571169453e-06, - "loss": 0.5034, - "step": 45146 - }, - { - "epoch": 1.16, - "learning_rate": 1.4066068774567753e-06, - "loss": 0.6729, - "step": 45147 - }, - { - "epoch": 1.16, - "learning_rate": 1.4065815974852847e-06, - "loss": 0.563, - "step": 45148 - }, - { - "epoch": 1.16, - "learning_rate": 1.4065563172024939e-06, - "loss": 0.5864, - "step": 45149 - }, - { - "epoch": 1.16, - "learning_rate": 1.4065310366084214e-06, - "loss": 0.7646, - "step": 45150 - }, - { - "epoch": 1.16, - "learning_rate": 1.4065057557030867e-06, - "loss": 0.5017, - "step": 45151 - }, - { - "epoch": 1.16, - "learning_rate": 1.4064804744865094e-06, - "loss": 0.5679, - "step": 45152 - }, - { - "epoch": 1.16, - "learning_rate": 1.4064551929587086e-06, - "loss": 0.7285, - "step": 45153 - }, - { - "epoch": 1.16, - "learning_rate": 1.4064299111197035e-06, - "loss": 0.5767, - "step": 45154 - }, - { - "epoch": 1.16, - "learning_rate": 1.406404628969514e-06, - "loss": 0.4088, - "step": 45155 - }, - { - "epoch": 1.16, - "learning_rate": 1.406379346508159e-06, - "loss": 0.7183, - "step": 45156 - }, - { - "epoch": 1.16, - "learning_rate": 1.406354063735658e-06, - "loss": 0.4924, - "step": 45157 - }, - { - "epoch": 1.16, - "learning_rate": 1.4063287806520305e-06, - "loss": 0.5747, - "step": 45158 - }, - { - "epoch": 1.16, - "learning_rate": 1.4063034972572959e-06, - "loss": 0.7393, - "step": 45159 - }, - { - "epoch": 1.16, - "learning_rate": 1.4062782135514733e-06, - "loss": 0.7305, - "step": 45160 - }, - { - "epoch": 1.16, - "learning_rate": 1.406252929534582e-06, - "loss": 0.7881, - "step": 45161 - }, - { - "epoch": 1.16, - "learning_rate": 1.4062276452066415e-06, - "loss": 0.6602, - "step": 45162 - }, - { - "epoch": 1.16, - "learning_rate": 1.4062023605676712e-06, - "loss": 0.6914, - "step": 45163 - }, - { - "epoch": 1.16, - "learning_rate": 1.4061770756176907e-06, - "loss": 0.668, - "step": 45164 - }, - { - "epoch": 1.16, - "learning_rate": 1.4061517903567186e-06, - "loss": 0.5327, - "step": 45165 - }, - { - "epoch": 1.16, - "learning_rate": 1.4061265047847752e-06, - "loss": 0.8604, - "step": 45166 - }, - { - "epoch": 1.16, - "learning_rate": 1.4061012189018791e-06, - "loss": 0.6328, - "step": 45167 - }, - { - "epoch": 1.16, - "learning_rate": 1.4060759327080502e-06, - "loss": 0.5225, - "step": 45168 - }, - { - "epoch": 1.16, - "learning_rate": 1.4060506462033075e-06, - "loss": 0.7139, - "step": 45169 - }, - { - "epoch": 1.16, - "learning_rate": 1.4060253593876706e-06, - "loss": 0.707, - "step": 45170 - }, - { - "epoch": 1.16, - "learning_rate": 1.4060000722611585e-06, - "loss": 0.3513, - "step": 45171 - }, - { - "epoch": 1.16, - "learning_rate": 1.405974784823791e-06, - "loss": 0.5635, - "step": 45172 - }, - { - "epoch": 1.16, - "learning_rate": 1.4059494970755871e-06, - "loss": 0.6558, - "step": 45173 - }, - { - "epoch": 1.16, - "learning_rate": 1.4059242090165667e-06, - "loss": 0.53, - "step": 45174 - }, - { - "epoch": 1.16, - "learning_rate": 1.4058989206467487e-06, - "loss": 0.7705, - "step": 45175 - }, - { - "epoch": 1.16, - "learning_rate": 1.4058736319661524e-06, - "loss": 0.6323, - "step": 45176 - }, - { - "epoch": 1.16, - "learning_rate": 1.4058483429747973e-06, - "loss": 0.6875, - "step": 45177 - }, - { - "epoch": 1.16, - "learning_rate": 1.4058230536727028e-06, - "loss": 0.6357, - "step": 45178 - }, - { - "epoch": 1.16, - "learning_rate": 1.4057977640598883e-06, - "loss": 0.6191, - "step": 45179 - }, - { - "epoch": 1.16, - "learning_rate": 1.4057724741363732e-06, - "loss": 0.6963, - "step": 45180 - }, - { - "epoch": 1.16, - "learning_rate": 1.4057471839021768e-06, - "loss": 0.7812, - "step": 45181 - }, - { - "epoch": 1.16, - "learning_rate": 1.4057218933573182e-06, - "loss": 0.6533, - "step": 45182 - }, - { - "epoch": 1.16, - "learning_rate": 1.4056966025018172e-06, - "loss": 0.4683, - "step": 45183 - }, - { - "epoch": 1.16, - "learning_rate": 1.4056713113356929e-06, - "loss": 0.6475, - "step": 45184 - }, - { - "epoch": 1.16, - "learning_rate": 1.4056460198589648e-06, - "loss": 0.7354, - "step": 45185 - }, - { - "epoch": 1.16, - "learning_rate": 1.4056207280716522e-06, - "loss": 0.5444, - "step": 45186 - }, - { - "epoch": 1.16, - "learning_rate": 1.4055954359737743e-06, - "loss": 0.6143, - "step": 45187 - }, - { - "epoch": 1.16, - "learning_rate": 1.4055701435653504e-06, - "loss": 0.5815, - "step": 45188 - }, - { - "epoch": 1.16, - "learning_rate": 1.4055448508464006e-06, - "loss": 0.5795, - "step": 45189 - }, - { - "epoch": 1.16, - "learning_rate": 1.4055195578169436e-06, - "loss": 0.5981, - "step": 45190 - }, - { - "epoch": 1.16, - "learning_rate": 1.4054942644769989e-06, - "loss": 0.4917, - "step": 45191 - }, - { - "epoch": 1.16, - "learning_rate": 1.4054689708265856e-06, - "loss": 0.6514, - "step": 45192 - }, - { - "epoch": 1.16, - "learning_rate": 1.4054436768657237e-06, - "loss": 0.5356, - "step": 45193 - }, - { - "epoch": 1.16, - "learning_rate": 1.4054183825944324e-06, - "loss": 0.7822, - "step": 45194 - }, - { - "epoch": 1.16, - "learning_rate": 1.4053930880127305e-06, - "loss": 0.7656, - "step": 45195 - }, - { - "epoch": 1.16, - "learning_rate": 1.405367793120638e-06, - "loss": 0.8301, - "step": 45196 - }, - { - "epoch": 1.16, - "learning_rate": 1.4053424979181738e-06, - "loss": 0.8926, - "step": 45197 - }, - { - "epoch": 1.16, - "learning_rate": 1.4053172024053574e-06, - "loss": 0.6118, - "step": 45198 - }, - { - "epoch": 1.16, - "learning_rate": 1.4052919065822085e-06, - "loss": 0.5137, - "step": 45199 - }, - { - "epoch": 1.16, - "learning_rate": 1.4052666104487463e-06, - "loss": 0.6904, - "step": 45200 - }, - { - "epoch": 1.16, - "learning_rate": 1.4052413140049897e-06, - "loss": 0.6777, - "step": 45201 - }, - { - "epoch": 1.16, - "learning_rate": 1.4052160172509588e-06, - "loss": 0.6699, - "step": 45202 - }, - { - "epoch": 1.16, - "learning_rate": 1.4051907201866724e-06, - "loss": 0.585, - "step": 45203 - }, - { - "epoch": 1.16, - "learning_rate": 1.4051654228121505e-06, - "loss": 0.6409, - "step": 45204 - }, - { - "epoch": 1.16, - "learning_rate": 1.4051401251274118e-06, - "loss": 0.5038, - "step": 45205 - }, - { - "epoch": 1.16, - "learning_rate": 1.405114827132476e-06, - "loss": 0.6602, - "step": 45206 - }, - { - "epoch": 1.16, - "learning_rate": 1.4050895288273621e-06, - "loss": 0.5537, - "step": 45207 - }, - { - "epoch": 1.16, - "learning_rate": 1.40506423021209e-06, - "loss": 0.6465, - "step": 45208 - }, - { - "epoch": 1.16, - "learning_rate": 1.4050389312866791e-06, - "loss": 0.5903, - "step": 45209 - }, - { - "epoch": 1.16, - "learning_rate": 1.4050136320511483e-06, - "loss": 0.8564, - "step": 45210 - }, - { - "epoch": 1.16, - "learning_rate": 1.404988332505517e-06, - "loss": 0.5503, - "step": 45211 - }, - { - "epoch": 1.16, - "learning_rate": 1.404963032649805e-06, - "loss": 0.7163, - "step": 45212 - }, - { - "epoch": 1.16, - "learning_rate": 1.404937732484031e-06, - "loss": 0.623, - "step": 45213 - }, - { - "epoch": 1.16, - "learning_rate": 1.4049124320082152e-06, - "loss": 0.7578, - "step": 45214 - }, - { - "epoch": 1.16, - "learning_rate": 1.4048871312223767e-06, - "loss": 0.4048, - "step": 45215 - }, - { - "epoch": 1.16, - "learning_rate": 1.4048618301265348e-06, - "loss": 0.6484, - "step": 45216 - }, - { - "epoch": 1.16, - "learning_rate": 1.4048365287207082e-06, - "loss": 0.6265, - "step": 45217 - }, - { - "epoch": 1.16, - "learning_rate": 1.4048112270049175e-06, - "loss": 0.7324, - "step": 45218 - }, - { - "epoch": 1.16, - "learning_rate": 1.4047859249791812e-06, - "loss": 0.7363, - "step": 45219 - }, - { - "epoch": 1.16, - "learning_rate": 1.4047606226435186e-06, - "loss": 0.8291, - "step": 45220 - }, - { - "epoch": 1.16, - "learning_rate": 1.4047353199979498e-06, - "loss": 0.6982, - "step": 45221 - }, - { - "epoch": 1.16, - "learning_rate": 1.4047100170424936e-06, - "loss": 0.6196, - "step": 45222 - }, - { - "epoch": 1.16, - "learning_rate": 1.4046847137771699e-06, - "loss": 0.8574, - "step": 45223 - }, - { - "epoch": 1.16, - "learning_rate": 1.4046594102019975e-06, - "loss": 0.6138, - "step": 45224 - }, - { - "epoch": 1.16, - "learning_rate": 1.404634106316996e-06, - "loss": 0.7188, - "step": 45225 - }, - { - "epoch": 1.16, - "learning_rate": 1.4046088021221847e-06, - "loss": 0.3544, - "step": 45226 - }, - { - "epoch": 1.16, - "learning_rate": 1.404583497617583e-06, - "loss": 0.5675, - "step": 45227 - }, - { - "epoch": 1.16, - "learning_rate": 1.4045581928032105e-06, - "loss": 0.5605, - "step": 45228 - }, - { - "epoch": 1.16, - "learning_rate": 1.4045328876790863e-06, - "loss": 0.6763, - "step": 45229 - }, - { - "epoch": 1.16, - "learning_rate": 1.4045075822452298e-06, - "loss": 0.7412, - "step": 45230 - }, - { - "epoch": 1.16, - "learning_rate": 1.4044822765016607e-06, - "loss": 0.3661, - "step": 45231 - }, - { - "epoch": 1.16, - "learning_rate": 1.4044569704483977e-06, - "loss": 0.6484, - "step": 45232 - }, - { - "epoch": 1.16, - "learning_rate": 1.404431664085461e-06, - "loss": 0.606, - "step": 45233 - }, - { - "epoch": 1.16, - "learning_rate": 1.4044063574128692e-06, - "loss": 0.5452, - "step": 45234 - }, - { - "epoch": 1.16, - "learning_rate": 1.4043810504306425e-06, - "loss": 0.6543, - "step": 45235 - }, - { - "epoch": 1.16, - "learning_rate": 1.4043557431387996e-06, - "loss": 0.5464, - "step": 45236 - }, - { - "epoch": 1.16, - "learning_rate": 1.40433043553736e-06, - "loss": 0.5933, - "step": 45237 - }, - { - "epoch": 1.16, - "learning_rate": 1.404305127626343e-06, - "loss": 0.7139, - "step": 45238 - }, - { - "epoch": 1.16, - "learning_rate": 1.4042798194057686e-06, - "loss": 0.582, - "step": 45239 - }, - { - "epoch": 1.16, - "learning_rate": 1.4042545108756557e-06, - "loss": 0.6855, - "step": 45240 - }, - { - "epoch": 1.16, - "learning_rate": 1.4042292020360233e-06, - "loss": 0.8262, - "step": 45241 - }, - { - "epoch": 1.16, - "learning_rate": 1.4042038928868915e-06, - "loss": 0.6797, - "step": 45242 - }, - { - "epoch": 1.16, - "learning_rate": 1.4041785834282793e-06, - "loss": 0.5569, - "step": 45243 - }, - { - "epoch": 1.16, - "learning_rate": 1.4041532736602061e-06, - "loss": 0.7246, - "step": 45244 - }, - { - "epoch": 1.16, - "learning_rate": 1.4041279635826915e-06, - "loss": 0.7295, - "step": 45245 - }, - { - "epoch": 1.16, - "learning_rate": 1.4041026531957544e-06, - "loss": 0.7275, - "step": 45246 - }, - { - "epoch": 1.16, - "learning_rate": 1.4040773424994147e-06, - "loss": 0.5103, - "step": 45247 - }, - { - "epoch": 1.16, - "learning_rate": 1.4040520314936914e-06, - "loss": 0.6621, - "step": 45248 - }, - { - "epoch": 1.16, - "learning_rate": 1.4040267201786043e-06, - "loss": 0.6899, - "step": 45249 - }, - { - "epoch": 1.16, - "learning_rate": 1.4040014085541724e-06, - "loss": 0.6143, - "step": 45250 - }, - { - "epoch": 1.16, - "learning_rate": 1.4039760966204151e-06, - "loss": 0.6914, - "step": 45251 - }, - { - "epoch": 1.16, - "learning_rate": 1.403950784377352e-06, - "loss": 0.5613, - "step": 45252 - }, - { - "epoch": 1.16, - "learning_rate": 1.4039254718250022e-06, - "loss": 0.6074, - "step": 45253 - }, - { - "epoch": 1.16, - "learning_rate": 1.4039001589633854e-06, - "loss": 0.7197, - "step": 45254 - }, - { - "epoch": 1.16, - "learning_rate": 1.4038748457925206e-06, - "loss": 0.7793, - "step": 45255 - }, - { - "epoch": 1.16, - "learning_rate": 1.4038495323124278e-06, - "loss": 0.5576, - "step": 45256 - }, - { - "epoch": 1.16, - "learning_rate": 1.4038242185231254e-06, - "loss": 0.5693, - "step": 45257 - }, - { - "epoch": 1.16, - "learning_rate": 1.403798904424634e-06, - "loss": 0.6357, - "step": 45258 - }, - { - "epoch": 1.16, - "learning_rate": 1.4037735900169721e-06, - "loss": 0.8887, - "step": 45259 - }, - { - "epoch": 1.16, - "learning_rate": 1.4037482753001594e-06, - "loss": 0.6411, - "step": 45260 - }, - { - "epoch": 1.16, - "learning_rate": 1.403722960274215e-06, - "loss": 0.5966, - "step": 45261 - }, - { - "epoch": 1.16, - "learning_rate": 1.4036976449391585e-06, - "loss": 0.6064, - "step": 45262 - }, - { - "epoch": 1.16, - "learning_rate": 1.4036723292950092e-06, - "loss": 0.6787, - "step": 45263 - }, - { - "epoch": 1.16, - "learning_rate": 1.4036470133417869e-06, - "loss": 0.7339, - "step": 45264 - }, - { - "epoch": 1.16, - "learning_rate": 1.4036216970795104e-06, - "loss": 0.6992, - "step": 45265 - }, - { - "epoch": 1.16, - "learning_rate": 1.4035963805081992e-06, - "loss": 0.8965, - "step": 45266 - }, - { - "epoch": 1.16, - "learning_rate": 1.403571063627873e-06, - "loss": 0.4575, - "step": 45267 - }, - { - "epoch": 1.16, - "learning_rate": 1.403545746438551e-06, - "loss": 0.5488, - "step": 45268 - }, - { - "epoch": 1.16, - "learning_rate": 1.4035204289402527e-06, - "loss": 0.5938, - "step": 45269 - }, - { - "epoch": 1.16, - "learning_rate": 1.403495111132997e-06, - "loss": 0.6157, - "step": 45270 - }, - { - "epoch": 1.16, - "learning_rate": 1.403469793016804e-06, - "loss": 0.626, - "step": 45271 - }, - { - "epoch": 1.16, - "learning_rate": 1.4034444745916925e-06, - "loss": 0.792, - "step": 45272 - }, - { - "epoch": 1.16, - "learning_rate": 1.4034191558576822e-06, - "loss": 0.71, - "step": 45273 - }, - { - "epoch": 1.16, - "learning_rate": 1.4033938368147926e-06, - "loss": 0.7251, - "step": 45274 - }, - { - "epoch": 1.16, - "learning_rate": 1.4033685174630427e-06, - "loss": 0.6611, - "step": 45275 - }, - { - "epoch": 1.16, - "learning_rate": 1.4033431978024522e-06, - "loss": 0.5198, - "step": 45276 - }, - { - "epoch": 1.16, - "learning_rate": 1.40331787783304e-06, - "loss": 0.6714, - "step": 45277 - }, - { - "epoch": 1.16, - "learning_rate": 1.403292557554826e-06, - "loss": 0.8408, - "step": 45278 - }, - { - "epoch": 1.16, - "learning_rate": 1.4032672369678297e-06, - "loss": 0.6211, - "step": 45279 - }, - { - "epoch": 1.16, - "learning_rate": 1.4032419160720702e-06, - "loss": 0.6221, - "step": 45280 - }, - { - "epoch": 1.16, - "learning_rate": 1.4032165948675667e-06, - "loss": 0.7305, - "step": 45281 - }, - { - "epoch": 1.16, - "learning_rate": 1.4031912733543388e-06, - "loss": 0.5921, - "step": 45282 - }, - { - "epoch": 1.16, - "learning_rate": 1.403165951532406e-06, - "loss": 0.835, - "step": 45283 - }, - { - "epoch": 1.16, - "learning_rate": 1.4031406294017874e-06, - "loss": 0.4893, - "step": 45284 - }, - { - "epoch": 1.16, - "learning_rate": 1.4031153069625026e-06, - "loss": 0.3792, - "step": 45285 - }, - { - "epoch": 1.16, - "learning_rate": 1.4030899842145709e-06, - "loss": 0.752, - "step": 45286 - }, - { - "epoch": 1.16, - "learning_rate": 1.4030646611580119e-06, - "loss": 0.5669, - "step": 45287 - }, - { - "epoch": 1.16, - "learning_rate": 1.4030393377928447e-06, - "loss": 0.6318, - "step": 45288 - }, - { - "epoch": 1.16, - "learning_rate": 1.403014014119089e-06, - "loss": 0.6602, - "step": 45289 - }, - { - "epoch": 1.16, - "learning_rate": 1.4029886901367638e-06, - "loss": 0.7217, - "step": 45290 - }, - { - "epoch": 1.16, - "learning_rate": 1.4029633658458885e-06, - "loss": 0.4653, - "step": 45291 - }, - { - "epoch": 1.16, - "learning_rate": 1.4029380412464832e-06, - "loss": 0.5088, - "step": 45292 - }, - { - "epoch": 1.16, - "learning_rate": 1.4029127163385664e-06, - "loss": 0.5913, - "step": 45293 - }, - { - "epoch": 1.16, - "learning_rate": 1.402887391122158e-06, - "loss": 0.5613, - "step": 45294 - }, - { - "epoch": 1.16, - "learning_rate": 1.4028620655972771e-06, - "loss": 0.4177, - "step": 45295 - }, - { - "epoch": 1.16, - "learning_rate": 1.4028367397639436e-06, - "loss": 0.6738, - "step": 45296 - }, - { - "epoch": 1.16, - "learning_rate": 1.4028114136221761e-06, - "loss": 0.6406, - "step": 45297 - }, - { - "epoch": 1.16, - "learning_rate": 1.4027860871719945e-06, - "loss": 0.6221, - "step": 45298 - }, - { - "epoch": 1.16, - "learning_rate": 1.4027607604134185e-06, - "loss": 0.7676, - "step": 45299 - }, - { - "epoch": 1.16, - "learning_rate": 1.4027354333464668e-06, - "loss": 0.689, - "step": 45300 - }, - { - "epoch": 1.16, - "learning_rate": 1.4027101059711591e-06, - "loss": 0.5161, - "step": 45301 - }, - { - "epoch": 1.16, - "learning_rate": 1.4026847782875147e-06, - "loss": 0.7314, - "step": 45302 - }, - { - "epoch": 1.16, - "learning_rate": 1.402659450295553e-06, - "loss": 0.6143, - "step": 45303 - }, - { - "epoch": 1.16, - "learning_rate": 1.4026341219952937e-06, - "loss": 0.5442, - "step": 45304 - }, - { - "epoch": 1.16, - "learning_rate": 1.402608793386756e-06, - "loss": 0.6416, - "step": 45305 - }, - { - "epoch": 1.16, - "learning_rate": 1.4025834644699592e-06, - "loss": 0.8262, - "step": 45306 - }, - { - "epoch": 1.16, - "learning_rate": 1.4025581352449227e-06, - "loss": 0.5027, - "step": 45307 - }, - { - "epoch": 1.16, - "learning_rate": 1.402532805711666e-06, - "loss": 0.6865, - "step": 45308 - }, - { - "epoch": 1.16, - "learning_rate": 1.4025074758702084e-06, - "loss": 0.6406, - "step": 45309 - }, - { - "epoch": 1.16, - "learning_rate": 1.4024821457205693e-06, - "loss": 0.5742, - "step": 45310 - }, - { - "epoch": 1.16, - "learning_rate": 1.4024568152627683e-06, - "loss": 0.7705, - "step": 45311 - }, - { - "epoch": 1.16, - "learning_rate": 1.4024314844968244e-06, - "loss": 0.7168, - "step": 45312 - }, - { - "epoch": 1.16, - "learning_rate": 1.4024061534227574e-06, - "loss": 0.5674, - "step": 45313 - }, - { - "epoch": 1.16, - "learning_rate": 1.4023808220405866e-06, - "loss": 0.6196, - "step": 45314 - }, - { - "epoch": 1.16, - "learning_rate": 1.4023554903503311e-06, - "loss": 0.7212, - "step": 45315 - }, - { - "epoch": 1.16, - "learning_rate": 1.4023301583520104e-06, - "loss": 0.6001, - "step": 45316 - }, - { - "epoch": 1.16, - "learning_rate": 1.4023048260456443e-06, - "loss": 0.6875, - "step": 45317 - }, - { - "epoch": 1.16, - "learning_rate": 1.4022794934312513e-06, - "loss": 0.7148, - "step": 45318 - }, - { - "epoch": 1.16, - "learning_rate": 1.4022541605088523e-06, - "loss": 0.6611, - "step": 45319 - }, - { - "epoch": 1.16, - "learning_rate": 1.4022288272784652e-06, - "loss": 0.7041, - "step": 45320 - }, - { - "epoch": 1.16, - "learning_rate": 1.4022034937401102e-06, - "loss": 0.7275, - "step": 45321 - }, - { - "epoch": 1.16, - "learning_rate": 1.4021781598938063e-06, - "loss": 0.7637, - "step": 45322 - }, - { - "epoch": 1.16, - "learning_rate": 1.4021528257395732e-06, - "loss": 0.8198, - "step": 45323 - }, - { - "epoch": 1.16, - "learning_rate": 1.4021274912774302e-06, - "loss": 0.6016, - "step": 45324 - }, - { - "epoch": 1.16, - "learning_rate": 1.4021021565073965e-06, - "loss": 0.667, - "step": 45325 - }, - { - "epoch": 1.16, - "learning_rate": 1.4020768214294916e-06, - "loss": 0.6934, - "step": 45326 - }, - { - "epoch": 1.16, - "learning_rate": 1.4020514860437351e-06, - "loss": 0.5918, - "step": 45327 - }, - { - "epoch": 1.16, - "learning_rate": 1.4020261503501463e-06, - "loss": 0.6895, - "step": 45328 - }, - { - "epoch": 1.16, - "learning_rate": 1.4020008143487445e-06, - "loss": 0.6387, - "step": 45329 - }, - { - "epoch": 1.16, - "learning_rate": 1.4019754780395493e-06, - "loss": 0.4182, - "step": 45330 - }, - { - "epoch": 1.16, - "learning_rate": 1.4019501414225798e-06, - "loss": 0.7314, - "step": 45331 - }, - { - "epoch": 1.16, - "learning_rate": 1.4019248044978557e-06, - "loss": 0.6846, - "step": 45332 - }, - { - "epoch": 1.16, - "learning_rate": 1.4018994672653963e-06, - "loss": 0.6763, - "step": 45333 - }, - { - "epoch": 1.16, - "learning_rate": 1.4018741297252209e-06, - "loss": 0.7021, - "step": 45334 - }, - { - "epoch": 1.16, - "learning_rate": 1.4018487918773488e-06, - "loss": 0.5869, - "step": 45335 - }, - { - "epoch": 1.16, - "learning_rate": 1.4018234537217997e-06, - "loss": 0.7432, - "step": 45336 - }, - { - "epoch": 1.16, - "learning_rate": 1.4017981152585927e-06, - "loss": 0.749, - "step": 45337 - }, - { - "epoch": 1.16, - "learning_rate": 1.4017727764877474e-06, - "loss": 0.6782, - "step": 45338 - }, - { - "epoch": 1.16, - "learning_rate": 1.4017474374092832e-06, - "loss": 0.626, - "step": 45339 - }, - { - "epoch": 1.16, - "learning_rate": 1.4017220980232197e-06, - "loss": 0.5068, - "step": 45340 - }, - { - "epoch": 1.16, - "learning_rate": 1.4016967583295758e-06, - "loss": 0.5497, - "step": 45341 - }, - { - "epoch": 1.16, - "learning_rate": 1.4016714183283713e-06, - "loss": 0.5142, - "step": 45342 - }, - { - "epoch": 1.16, - "learning_rate": 1.401646078019625e-06, - "loss": 0.5654, - "step": 45343 - }, - { - "epoch": 1.16, - "learning_rate": 1.4016207374033575e-06, - "loss": 0.8232, - "step": 45344 - }, - { - "epoch": 1.16, - "learning_rate": 1.401595396479587e-06, - "loss": 0.707, - "step": 45345 - }, - { - "epoch": 1.16, - "learning_rate": 1.4015700552483335e-06, - "loss": 0.564, - "step": 45346 - }, - { - "epoch": 1.16, - "learning_rate": 1.4015447137096162e-06, - "loss": 0.6514, - "step": 45347 - }, - { - "epoch": 1.16, - "learning_rate": 1.401519371863455e-06, - "loss": 0.4707, - "step": 45348 - }, - { - "epoch": 1.16, - "learning_rate": 1.4014940297098683e-06, - "loss": 0.5083, - "step": 45349 - }, - { - "epoch": 1.16, - "learning_rate": 1.4014686872488763e-06, - "loss": 0.6079, - "step": 45350 - }, - { - "epoch": 1.16, - "learning_rate": 1.4014433444804982e-06, - "loss": 0.668, - "step": 45351 - }, - { - "epoch": 1.16, - "learning_rate": 1.4014180014047534e-06, - "loss": 0.6008, - "step": 45352 - }, - { - "epoch": 1.16, - "learning_rate": 1.4013926580216613e-06, - "loss": 0.5908, - "step": 45353 - }, - { - "epoch": 1.16, - "learning_rate": 1.4013673143312412e-06, - "loss": 0.6289, - "step": 45354 - }, - { - "epoch": 1.16, - "learning_rate": 1.4013419703335127e-06, - "loss": 0.6348, - "step": 45355 - }, - { - "epoch": 1.16, - "learning_rate": 1.401316626028495e-06, - "loss": 0.8374, - "step": 45356 - }, - { - "epoch": 1.16, - "learning_rate": 1.4012912814162077e-06, - "loss": 0.6042, - "step": 45357 - }, - { - "epoch": 1.16, - "learning_rate": 1.4012659364966702e-06, - "loss": 0.6001, - "step": 45358 - }, - { - "epoch": 1.16, - "learning_rate": 1.4012405912699017e-06, - "loss": 0.5889, - "step": 45359 - }, - { - "epoch": 1.16, - "learning_rate": 1.4012152457359217e-06, - "loss": 0.6768, - "step": 45360 - }, - { - "epoch": 1.16, - "learning_rate": 1.4011898998947498e-06, - "loss": 0.7119, - "step": 45361 - }, - { - "epoch": 1.16, - "learning_rate": 1.4011645537464049e-06, - "loss": 0.5259, - "step": 45362 - }, - { - "epoch": 1.16, - "learning_rate": 1.4011392072909072e-06, - "loss": 0.5181, - "step": 45363 - }, - { - "epoch": 1.16, - "learning_rate": 1.4011138605282753e-06, - "loss": 0.8818, - "step": 45364 - }, - { - "epoch": 1.16, - "learning_rate": 1.4010885134585294e-06, - "loss": 0.6318, - "step": 45365 - }, - { - "epoch": 1.16, - "learning_rate": 1.4010631660816879e-06, - "loss": 0.7715, - "step": 45366 - }, - { - "epoch": 1.16, - "learning_rate": 1.401037818397771e-06, - "loss": 0.5645, - "step": 45367 - }, - { - "epoch": 1.16, - "learning_rate": 1.401012470406798e-06, - "loss": 0.4395, - "step": 45368 - }, - { - "epoch": 1.16, - "learning_rate": 1.4009871221087881e-06, - "loss": 0.6846, - "step": 45369 - }, - { - "epoch": 1.16, - "learning_rate": 1.400961773503761e-06, - "loss": 0.6816, - "step": 45370 - }, - { - "epoch": 1.16, - "learning_rate": 1.4009364245917357e-06, - "loss": 0.5776, - "step": 45371 - }, - { - "epoch": 1.16, - "learning_rate": 1.4009110753727316e-06, - "loss": 0.5942, - "step": 45372 - }, - { - "epoch": 1.16, - "learning_rate": 1.4008857258467685e-06, - "loss": 0.5654, - "step": 45373 - }, - { - "epoch": 1.16, - "learning_rate": 1.400860376013866e-06, - "loss": 0.6538, - "step": 45374 - }, - { - "epoch": 1.16, - "learning_rate": 1.4008350258740426e-06, - "loss": 0.8242, - "step": 45375 - }, - { - "epoch": 1.16, - "learning_rate": 1.4008096754273186e-06, - "loss": 0.728, - "step": 45376 - }, - { - "epoch": 1.16, - "learning_rate": 1.4007843246737127e-06, - "loss": 0.5078, - "step": 45377 - }, - { - "epoch": 1.16, - "learning_rate": 1.4007589736132452e-06, - "loss": 0.6055, - "step": 45378 - }, - { - "epoch": 1.16, - "learning_rate": 1.4007336222459345e-06, - "loss": 0.7529, - "step": 45379 - }, - { - "epoch": 1.16, - "learning_rate": 1.4007082705718007e-06, - "loss": 0.6602, - "step": 45380 - }, - { - "epoch": 1.16, - "learning_rate": 1.4006829185908631e-06, - "loss": 0.7295, - "step": 45381 - }, - { - "epoch": 1.16, - "learning_rate": 1.4006575663031408e-06, - "loss": 0.8618, - "step": 45382 - }, - { - "epoch": 1.16, - "learning_rate": 1.4006322137086536e-06, - "loss": 0.7139, - "step": 45383 - }, - { - "epoch": 1.16, - "learning_rate": 1.400606860807421e-06, - "loss": 0.8281, - "step": 45384 - }, - { - "epoch": 1.16, - "learning_rate": 1.4005815075994614e-06, - "loss": 0.5752, - "step": 45385 - }, - { - "epoch": 1.16, - "learning_rate": 1.4005561540847954e-06, - "loss": 0.6621, - "step": 45386 - }, - { - "epoch": 1.16, - "learning_rate": 1.400530800263442e-06, - "loss": 0.6533, - "step": 45387 - }, - { - "epoch": 1.16, - "learning_rate": 1.4005054461354207e-06, - "loss": 0.6982, - "step": 45388 - }, - { - "epoch": 1.16, - "learning_rate": 1.4004800917007504e-06, - "loss": 0.7339, - "step": 45389 - }, - { - "epoch": 1.16, - "learning_rate": 1.4004547369594513e-06, - "loss": 0.5654, - "step": 45390 - }, - { - "epoch": 1.16, - "learning_rate": 1.400429381911542e-06, - "loss": 0.5038, - "step": 45391 - }, - { - "epoch": 1.16, - "learning_rate": 1.4004040265570427e-06, - "loss": 0.75, - "step": 45392 - }, - { - "epoch": 1.16, - "learning_rate": 1.4003786708959725e-06, - "loss": 0.5137, - "step": 45393 - }, - { - "epoch": 1.16, - "learning_rate": 1.4003533149283505e-06, - "loss": 0.6592, - "step": 45394 - }, - { - "epoch": 1.16, - "learning_rate": 1.4003279586541963e-06, - "loss": 0.5684, - "step": 45395 - }, - { - "epoch": 1.16, - "learning_rate": 1.4003026020735297e-06, - "loss": 0.7148, - "step": 45396 - }, - { - "epoch": 1.16, - "learning_rate": 1.4002772451863696e-06, - "loss": 0.604, - "step": 45397 - }, - { - "epoch": 1.16, - "learning_rate": 1.4002518879927356e-06, - "loss": 0.7568, - "step": 45398 - }, - { - "epoch": 1.16, - "learning_rate": 1.4002265304926475e-06, - "loss": 0.835, - "step": 45399 - }, - { - "epoch": 1.16, - "learning_rate": 1.4002011726861238e-06, - "loss": 0.6655, - "step": 45400 - }, - { - "epoch": 1.16, - "learning_rate": 1.4001758145731848e-06, - "loss": 0.7051, - "step": 45401 - }, - { - "epoch": 1.16, - "learning_rate": 1.4001504561538494e-06, - "loss": 0.5015, - "step": 45402 - }, - { - "epoch": 1.16, - "learning_rate": 1.4001250974281375e-06, - "loss": 0.8047, - "step": 45403 - }, - { - "epoch": 1.16, - "learning_rate": 1.400099738396068e-06, - "loss": 0.833, - "step": 45404 - }, - { - "epoch": 1.16, - "learning_rate": 1.4000743790576606e-06, - "loss": 0.5393, - "step": 45405 - }, - { - "epoch": 1.16, - "learning_rate": 1.4000490194129345e-06, - "loss": 0.4946, - "step": 45406 - }, - { - "epoch": 1.16, - "learning_rate": 1.4000236594619092e-06, - "loss": 0.7363, - "step": 45407 - }, - { - "epoch": 1.16, - "learning_rate": 1.3999982992046044e-06, - "loss": 0.7266, - "step": 45408 - }, - { - "epoch": 1.16, - "learning_rate": 1.3999729386410394e-06, - "loss": 0.5439, - "step": 45409 - }, - { - "epoch": 1.16, - "learning_rate": 1.399947577771233e-06, - "loss": 0.7627, - "step": 45410 - }, - { - "epoch": 1.16, - "learning_rate": 1.3999222165952059e-06, - "loss": 0.7783, - "step": 45411 - }, - { - "epoch": 1.16, - "learning_rate": 1.399896855112976e-06, - "loss": 0.6367, - "step": 45412 - }, - { - "epoch": 1.16, - "learning_rate": 1.399871493324564e-06, - "loss": 0.6191, - "step": 45413 - }, - { - "epoch": 1.16, - "learning_rate": 1.3998461312299884e-06, - "loss": 0.7041, - "step": 45414 - }, - { - "epoch": 1.16, - "learning_rate": 1.399820768829269e-06, - "loss": 0.9307, - "step": 45415 - }, - { - "epoch": 1.16, - "learning_rate": 1.3997954061224255e-06, - "loss": 0.6865, - "step": 45416 - }, - { - "epoch": 1.16, - "learning_rate": 1.399770043109477e-06, - "loss": 0.5117, - "step": 45417 - }, - { - "epoch": 1.16, - "learning_rate": 1.3997446797904428e-06, - "loss": 0.7393, - "step": 45418 - }, - { - "epoch": 1.16, - "learning_rate": 1.3997193161653424e-06, - "loss": 0.749, - "step": 45419 - }, - { - "epoch": 1.16, - "learning_rate": 1.3996939522341957e-06, - "loss": 0.7324, - "step": 45420 - }, - { - "epoch": 1.16, - "learning_rate": 1.3996685879970213e-06, - "loss": 0.7715, - "step": 45421 - }, - { - "epoch": 1.16, - "learning_rate": 1.3996432234538393e-06, - "loss": 0.8594, - "step": 45422 - }, - { - "epoch": 1.16, - "learning_rate": 1.3996178586046688e-06, - "loss": 0.6787, - "step": 45423 - }, - { - "epoch": 1.16, - "learning_rate": 1.3995924934495294e-06, - "loss": 0.7744, - "step": 45424 - }, - { - "epoch": 1.16, - "learning_rate": 1.39956712798844e-06, - "loss": 0.6172, - "step": 45425 - }, - { - "epoch": 1.16, - "learning_rate": 1.3995417622214207e-06, - "loss": 0.667, - "step": 45426 - }, - { - "epoch": 1.16, - "learning_rate": 1.3995163961484907e-06, - "loss": 0.6514, - "step": 45427 - }, - { - "epoch": 1.16, - "learning_rate": 1.3994910297696697e-06, - "loss": 0.75, - "step": 45428 - }, - { - "epoch": 1.16, - "learning_rate": 1.399465663084976e-06, - "loss": 0.6206, - "step": 45429 - }, - { - "epoch": 1.16, - "learning_rate": 1.3994402960944304e-06, - "loss": 0.4434, - "step": 45430 - }, - { - "epoch": 1.16, - "learning_rate": 1.3994149287980512e-06, - "loss": 0.7627, - "step": 45431 - }, - { - "epoch": 1.16, - "learning_rate": 1.3993895611958588e-06, - "loss": 0.4473, - "step": 45432 - }, - { - "epoch": 1.16, - "learning_rate": 1.3993641932878721e-06, - "loss": 0.6416, - "step": 45433 - }, - { - "epoch": 1.16, - "learning_rate": 1.3993388250741107e-06, - "loss": 0.6035, - "step": 45434 - }, - { - "epoch": 1.16, - "learning_rate": 1.3993134565545938e-06, - "loss": 0.7129, - "step": 45435 - }, - { - "epoch": 1.16, - "learning_rate": 1.3992880877293407e-06, - "loss": 0.686, - "step": 45436 - }, - { - "epoch": 1.16, - "learning_rate": 1.3992627185983711e-06, - "loss": 0.2832, - "step": 45437 - }, - { - "epoch": 1.16, - "learning_rate": 1.3992373491617047e-06, - "loss": 0.5327, - "step": 45438 - }, - { - "epoch": 1.16, - "learning_rate": 1.3992119794193607e-06, - "loss": 0.7656, - "step": 45439 - }, - { - "epoch": 1.16, - "learning_rate": 1.3991866093713582e-06, - "loss": 0.5737, - "step": 45440 - }, - { - "epoch": 1.16, - "learning_rate": 1.399161239017717e-06, - "loss": 0.5122, - "step": 45441 - }, - { - "epoch": 1.16, - "learning_rate": 1.3991358683584563e-06, - "loss": 0.6401, - "step": 45442 - }, - { - "epoch": 1.16, - "learning_rate": 1.3991104973935956e-06, - "loss": 0.6602, - "step": 45443 - }, - { - "epoch": 1.16, - "learning_rate": 1.3990851261231545e-06, - "loss": 0.6736, - "step": 45444 - }, - { - "epoch": 1.16, - "learning_rate": 1.3990597545471521e-06, - "loss": 0.6362, - "step": 45445 - }, - { - "epoch": 1.16, - "learning_rate": 1.3990343826656079e-06, - "loss": 0.7412, - "step": 45446 - }, - { - "epoch": 1.16, - "learning_rate": 1.3990090104785416e-06, - "loss": 0.6104, - "step": 45447 - }, - { - "epoch": 1.16, - "learning_rate": 1.3989836379859723e-06, - "loss": 0.6582, - "step": 45448 - }, - { - "epoch": 1.16, - "learning_rate": 1.39895826518792e-06, - "loss": 0.5195, - "step": 45449 - }, - { - "epoch": 1.16, - "learning_rate": 1.398932892084403e-06, - "loss": 0.835, - "step": 45450 - }, - { - "epoch": 1.16, - "learning_rate": 1.398907518675442e-06, - "loss": 0.7568, - "step": 45451 - }, - { - "epoch": 1.16, - "learning_rate": 1.3988821449610555e-06, - "loss": 0.6665, - "step": 45452 - }, - { - "epoch": 1.16, - "learning_rate": 1.3988567709412638e-06, - "loss": 0.6704, - "step": 45453 - }, - { - "epoch": 1.17, - "learning_rate": 1.3988313966160852e-06, - "loss": 0.5801, - "step": 45454 - }, - { - "epoch": 1.17, - "learning_rate": 1.3988060219855402e-06, - "loss": 0.6377, - "step": 45455 - }, - { - "epoch": 1.17, - "learning_rate": 1.3987806470496474e-06, - "loss": 0.5771, - "step": 45456 - }, - { - "epoch": 1.17, - "learning_rate": 1.3987552718084268e-06, - "loss": 0.3979, - "step": 45457 - }, - { - "epoch": 1.17, - "learning_rate": 1.3987298962618976e-06, - "loss": 0.4705, - "step": 45458 - }, - { - "epoch": 1.17, - "learning_rate": 1.3987045204100793e-06, - "loss": 0.7441, - "step": 45459 - }, - { - "epoch": 1.17, - "learning_rate": 1.3986791442529914e-06, - "loss": 0.4351, - "step": 45460 - }, - { - "epoch": 1.17, - "learning_rate": 1.398653767790653e-06, - "loss": 0.5762, - "step": 45461 - }, - { - "epoch": 1.17, - "learning_rate": 1.3986283910230836e-06, - "loss": 0.5601, - "step": 45462 - }, - { - "epoch": 1.17, - "learning_rate": 1.3986030139503028e-06, - "loss": 0.7373, - "step": 45463 - }, - { - "epoch": 1.17, - "learning_rate": 1.3985776365723302e-06, - "loss": 0.6396, - "step": 45464 - }, - { - "epoch": 1.17, - "learning_rate": 1.398552258889185e-06, - "loss": 0.5781, - "step": 45465 - }, - { - "epoch": 1.17, - "learning_rate": 1.3985268809008866e-06, - "loss": 0.6587, - "step": 45466 - }, - { - "epoch": 1.17, - "learning_rate": 1.3985015026074545e-06, - "loss": 0.6934, - "step": 45467 - }, - { - "epoch": 1.17, - "learning_rate": 1.3984761240089085e-06, - "loss": 0.7412, - "step": 45468 - }, - { - "epoch": 1.17, - "learning_rate": 1.398450745105267e-06, - "loss": 0.749, - "step": 45469 - }, - { - "epoch": 1.17, - "learning_rate": 1.3984253658965503e-06, - "loss": 0.8057, - "step": 45470 - }, - { - "epoch": 1.17, - "learning_rate": 1.3983999863827778e-06, - "loss": 0.749, - "step": 45471 - }, - { - "epoch": 1.17, - "learning_rate": 1.3983746065639688e-06, - "loss": 0.6812, - "step": 45472 - }, - { - "epoch": 1.17, - "learning_rate": 1.3983492264401423e-06, - "loss": 0.5708, - "step": 45473 - }, - { - "epoch": 1.17, - "learning_rate": 1.3983238460113186e-06, - "loss": 0.6489, - "step": 45474 - }, - { - "epoch": 1.17, - "learning_rate": 1.3982984652775162e-06, - "loss": 0.5903, - "step": 45475 - }, - { - "epoch": 1.17, - "learning_rate": 1.3982730842387553e-06, - "loss": 0.5493, - "step": 45476 - }, - { - "epoch": 1.17, - "learning_rate": 1.3982477028950547e-06, - "loss": 0.5894, - "step": 45477 - }, - { - "epoch": 1.17, - "learning_rate": 1.3982223212464345e-06, - "loss": 0.5923, - "step": 45478 - }, - { - "epoch": 1.17, - "learning_rate": 1.3981969392929135e-06, - "loss": 0.6973, - "step": 45479 - }, - { - "epoch": 1.17, - "learning_rate": 1.3981715570345118e-06, - "loss": 0.7852, - "step": 45480 - }, - { - "epoch": 1.17, - "learning_rate": 1.3981461744712478e-06, - "loss": 0.7383, - "step": 45481 - }, - { - "epoch": 1.17, - "learning_rate": 1.398120791603142e-06, - "loss": 0.5811, - "step": 45482 - }, - { - "epoch": 1.17, - "learning_rate": 1.3980954084302136e-06, - "loss": 0.6396, - "step": 45483 - }, - { - "epoch": 1.17, - "learning_rate": 1.3980700249524815e-06, - "loss": 0.5488, - "step": 45484 - }, - { - "epoch": 1.17, - "learning_rate": 1.3980446411699655e-06, - "loss": 0.6699, - "step": 45485 - }, - { - "epoch": 1.17, - "learning_rate": 1.3980192570826853e-06, - "loss": 0.5737, - "step": 45486 - }, - { - "epoch": 1.17, - "learning_rate": 1.3979938726906597e-06, - "loss": 0.707, - "step": 45487 - }, - { - "epoch": 1.17, - "learning_rate": 1.3979684879939088e-06, - "loss": 0.6162, - "step": 45488 - }, - { - "epoch": 1.17, - "learning_rate": 1.3979431029924518e-06, - "loss": 0.7041, - "step": 45489 - }, - { - "epoch": 1.17, - "learning_rate": 1.3979177176863078e-06, - "loss": 0.6104, - "step": 45490 - }, - { - "epoch": 1.17, - "learning_rate": 1.3978923320754966e-06, - "loss": 0.7061, - "step": 45491 - }, - { - "epoch": 1.17, - "learning_rate": 1.3978669461600373e-06, - "loss": 0.7134, - "step": 45492 - }, - { - "epoch": 1.17, - "learning_rate": 1.39784155993995e-06, - "loss": 0.7969, - "step": 45493 - }, - { - "epoch": 1.17, - "learning_rate": 1.3978161734152533e-06, - "loss": 0.5679, - "step": 45494 - }, - { - "epoch": 1.17, - "learning_rate": 1.3977907865859675e-06, - "loss": 0.5698, - "step": 45495 - }, - { - "epoch": 1.17, - "learning_rate": 1.397765399452111e-06, - "loss": 0.7842, - "step": 45496 - }, - { - "epoch": 1.17, - "learning_rate": 1.3977400120137044e-06, - "loss": 0.647, - "step": 45497 - }, - { - "epoch": 1.17, - "learning_rate": 1.3977146242707662e-06, - "loss": 0.7314, - "step": 45498 - }, - { - "epoch": 1.17, - "learning_rate": 1.3976892362233163e-06, - "loss": 0.5522, - "step": 45499 - }, - { - "epoch": 1.17, - "learning_rate": 1.397663847871374e-06, - "loss": 0.7236, - "step": 45500 - }, - { - "epoch": 1.17, - "learning_rate": 1.397638459214959e-06, - "loss": 0.7393, - "step": 45501 - }, - { - "epoch": 1.17, - "learning_rate": 1.3976130702540903e-06, - "loss": 0.623, - "step": 45502 - }, - { - "epoch": 1.17, - "learning_rate": 1.3975876809887877e-06, - "loss": 0.5688, - "step": 45503 - }, - { - "epoch": 1.17, - "learning_rate": 1.3975622914190703e-06, - "loss": 0.7334, - "step": 45504 - }, - { - "epoch": 1.17, - "learning_rate": 1.3975369015449578e-06, - "loss": 0.5999, - "step": 45505 - }, - { - "epoch": 1.17, - "learning_rate": 1.3975115113664695e-06, - "loss": 0.6343, - "step": 45506 - }, - { - "epoch": 1.17, - "learning_rate": 1.397486120883625e-06, - "loss": 0.6025, - "step": 45507 - }, - { - "epoch": 1.17, - "learning_rate": 1.3974607300964438e-06, - "loss": 0.6685, - "step": 45508 - }, - { - "epoch": 1.17, - "learning_rate": 1.397435339004945e-06, - "loss": 0.541, - "step": 45509 - }, - { - "epoch": 1.17, - "learning_rate": 1.3974099476091483e-06, - "loss": 0.5566, - "step": 45510 - }, - { - "epoch": 1.17, - "learning_rate": 1.397384555909073e-06, - "loss": 0.6494, - "step": 45511 - }, - { - "epoch": 1.17, - "learning_rate": 1.3973591639047387e-06, - "loss": 0.4639, - "step": 45512 - }, - { - "epoch": 1.17, - "learning_rate": 1.3973337715961648e-06, - "loss": 0.7168, - "step": 45513 - }, - { - "epoch": 1.17, - "learning_rate": 1.3973083789833706e-06, - "loss": 0.6831, - "step": 45514 - }, - { - "epoch": 1.17, - "learning_rate": 1.3972829860663757e-06, - "loss": 0.707, - "step": 45515 - }, - { - "epoch": 1.17, - "learning_rate": 1.3972575928451996e-06, - "loss": 0.7188, - "step": 45516 - }, - { - "epoch": 1.17, - "learning_rate": 1.3972321993198612e-06, - "loss": 0.7285, - "step": 45517 - }, - { - "epoch": 1.17, - "learning_rate": 1.3972068054903812e-06, - "loss": 0.7876, - "step": 45518 - }, - { - "epoch": 1.17, - "learning_rate": 1.3971814113567772e-06, - "loss": 0.5796, - "step": 45519 - }, - { - "epoch": 1.17, - "learning_rate": 1.3971560169190704e-06, - "loss": 0.6526, - "step": 45520 - }, - { - "epoch": 1.17, - "learning_rate": 1.3971306221772792e-06, - "loss": 0.6499, - "step": 45521 - }, - { - "epoch": 1.17, - "learning_rate": 1.3971052271314235e-06, - "loss": 0.6519, - "step": 45522 - }, - { - "epoch": 1.17, - "learning_rate": 1.3970798317815225e-06, - "loss": 0.5947, - "step": 45523 - }, - { - "epoch": 1.17, - "learning_rate": 1.3970544361275956e-06, - "loss": 0.5757, - "step": 45524 - }, - { - "epoch": 1.17, - "learning_rate": 1.3970290401696624e-06, - "loss": 0.5381, - "step": 45525 - }, - { - "epoch": 1.17, - "learning_rate": 1.3970036439077425e-06, - "loss": 0.6729, - "step": 45526 - }, - { - "epoch": 1.17, - "learning_rate": 1.396978247341855e-06, - "loss": 0.7334, - "step": 45527 - }, - { - "epoch": 1.17, - "learning_rate": 1.3969528504720197e-06, - "loss": 0.7197, - "step": 45528 - }, - { - "epoch": 1.17, - "learning_rate": 1.3969274532982556e-06, - "loss": 0.5708, - "step": 45529 - }, - { - "epoch": 1.17, - "learning_rate": 1.3969020558205827e-06, - "loss": 0.5249, - "step": 45530 - }, - { - "epoch": 1.17, - "learning_rate": 1.3968766580390198e-06, - "loss": 0.6172, - "step": 45531 - }, - { - "epoch": 1.17, - "learning_rate": 1.396851259953587e-06, - "loss": 0.6758, - "step": 45532 - }, - { - "epoch": 1.17, - "learning_rate": 1.3968258615643031e-06, - "loss": 0.6865, - "step": 45533 - }, - { - "epoch": 1.17, - "learning_rate": 1.3968004628711883e-06, - "loss": 0.582, - "step": 45534 - }, - { - "epoch": 1.17, - "learning_rate": 1.3967750638742612e-06, - "loss": 0.594, - "step": 45535 - }, - { - "epoch": 1.17, - "learning_rate": 1.396749664573542e-06, - "loss": 0.6875, - "step": 45536 - }, - { - "epoch": 1.17, - "learning_rate": 1.3967242649690496e-06, - "loss": 0.5432, - "step": 45537 - }, - { - "epoch": 1.17, - "learning_rate": 1.396698865060804e-06, - "loss": 0.5913, - "step": 45538 - }, - { - "epoch": 1.17, - "learning_rate": 1.396673464848824e-06, - "loss": 0.6382, - "step": 45539 - }, - { - "epoch": 1.17, - "learning_rate": 1.3966480643331296e-06, - "loss": 0.4805, - "step": 45540 - }, - { - "epoch": 1.17, - "learning_rate": 1.3966226635137397e-06, - "loss": 0.7119, - "step": 45541 - }, - { - "epoch": 1.17, - "learning_rate": 1.3965972623906744e-06, - "loss": 0.4362, - "step": 45542 - }, - { - "epoch": 1.17, - "learning_rate": 1.3965718609639528e-06, - "loss": 0.7529, - "step": 45543 - }, - { - "epoch": 1.17, - "learning_rate": 1.396546459233594e-06, - "loss": 0.7773, - "step": 45544 - }, - { - "epoch": 1.17, - "learning_rate": 1.3965210571996183e-06, - "loss": 0.6218, - "step": 45545 - }, - { - "epoch": 1.17, - "learning_rate": 1.396495654862044e-06, - "loss": 0.6855, - "step": 45546 - }, - { - "epoch": 1.17, - "learning_rate": 1.3964702522208918e-06, - "loss": 0.6858, - "step": 45547 - }, - { - "epoch": 1.17, - "learning_rate": 1.3964448492761804e-06, - "loss": 0.4717, - "step": 45548 - }, - { - "epoch": 1.17, - "learning_rate": 1.3964194460279295e-06, - "loss": 0.5479, - "step": 45549 - }, - { - "epoch": 1.17, - "learning_rate": 1.3963940424761582e-06, - "loss": 0.6626, - "step": 45550 - }, - { - "epoch": 1.17, - "learning_rate": 1.3963686386208864e-06, - "loss": 0.6016, - "step": 45551 - }, - { - "epoch": 1.17, - "learning_rate": 1.3963432344621331e-06, - "loss": 0.5146, - "step": 45552 - }, - { - "epoch": 1.17, - "learning_rate": 1.3963178299999182e-06, - "loss": 0.5493, - "step": 45553 - }, - { - "epoch": 1.17, - "learning_rate": 1.3962924252342612e-06, - "loss": 0.6099, - "step": 45554 - }, - { - "epoch": 1.17, - "learning_rate": 1.396267020165181e-06, - "loss": 0.6226, - "step": 45555 - }, - { - "epoch": 1.17, - "learning_rate": 1.3962416147926975e-06, - "loss": 0.7207, - "step": 45556 - }, - { - "epoch": 1.17, - "learning_rate": 1.3962162091168299e-06, - "loss": 0.5981, - "step": 45557 - }, - { - "epoch": 1.17, - "learning_rate": 1.396190803137598e-06, - "loss": 0.6287, - "step": 45558 - }, - { - "epoch": 1.17, - "learning_rate": 1.3961653968550206e-06, - "loss": 0.6816, - "step": 45559 - }, - { - "epoch": 1.17, - "learning_rate": 1.396139990269118e-06, - "loss": 0.6379, - "step": 45560 - }, - { - "epoch": 1.17, - "learning_rate": 1.396114583379909e-06, - "loss": 0.7109, - "step": 45561 - }, - { - "epoch": 1.17, - "learning_rate": 1.3960891761874134e-06, - "loss": 0.6367, - "step": 45562 - }, - { - "epoch": 1.17, - "learning_rate": 1.3960637686916506e-06, - "loss": 0.5977, - "step": 45563 - }, - { - "epoch": 1.17, - "learning_rate": 1.3960383608926398e-06, - "loss": 0.6758, - "step": 45564 - }, - { - "epoch": 1.17, - "learning_rate": 1.3960129527904006e-06, - "loss": 0.5906, - "step": 45565 - }, - { - "epoch": 1.17, - "learning_rate": 1.3959875443849525e-06, - "loss": 0.6167, - "step": 45566 - }, - { - "epoch": 1.17, - "learning_rate": 1.395962135676315e-06, - "loss": 0.5981, - "step": 45567 - }, - { - "epoch": 1.17, - "learning_rate": 1.3959367266645076e-06, - "loss": 0.6675, - "step": 45568 - }, - { - "epoch": 1.17, - "learning_rate": 1.3959113173495497e-06, - "loss": 0.8135, - "step": 45569 - }, - { - "epoch": 1.17, - "learning_rate": 1.3958859077314605e-06, - "loss": 0.6934, - "step": 45570 - }, - { - "epoch": 1.17, - "learning_rate": 1.3958604978102594e-06, - "loss": 0.6353, - "step": 45571 - }, - { - "epoch": 1.17, - "learning_rate": 1.3958350875859668e-06, - "loss": 0.6323, - "step": 45572 - }, - { - "epoch": 1.17, - "learning_rate": 1.395809677058601e-06, - "loss": 0.7031, - "step": 45573 - }, - { - "epoch": 1.17, - "learning_rate": 1.395784266228182e-06, - "loss": 0.4314, - "step": 45574 - }, - { - "epoch": 1.17, - "learning_rate": 1.3957588550947292e-06, - "loss": 0.3771, - "step": 45575 - }, - { - "epoch": 1.17, - "learning_rate": 1.3957334436582625e-06, - "loss": 0.6445, - "step": 45576 - }, - { - "epoch": 1.17, - "learning_rate": 1.3957080319188002e-06, - "loss": 0.5264, - "step": 45577 - }, - { - "epoch": 1.17, - "learning_rate": 1.3956826198763627e-06, - "loss": 0.6797, - "step": 45578 - }, - { - "epoch": 1.17, - "learning_rate": 1.3956572075309693e-06, - "loss": 0.6162, - "step": 45579 - }, - { - "epoch": 1.17, - "learning_rate": 1.3956317948826392e-06, - "loss": 0.6904, - "step": 45580 - }, - { - "epoch": 1.17, - "learning_rate": 1.3956063819313921e-06, - "loss": 0.582, - "step": 45581 - }, - { - "epoch": 1.17, - "learning_rate": 1.3955809686772475e-06, - "loss": 0.6836, - "step": 45582 - }, - { - "epoch": 1.17, - "learning_rate": 1.395555555120225e-06, - "loss": 0.7188, - "step": 45583 - }, - { - "epoch": 1.17, - "learning_rate": 1.3955301412603434e-06, - "loss": 0.6211, - "step": 45584 - }, - { - "epoch": 1.17, - "learning_rate": 1.3955047270976226e-06, - "loss": 0.5752, - "step": 45585 - }, - { - "epoch": 1.17, - "learning_rate": 1.3954793126320818e-06, - "loss": 0.728, - "step": 45586 - }, - { - "epoch": 1.17, - "learning_rate": 1.3954538978637409e-06, - "loss": 0.627, - "step": 45587 - }, - { - "epoch": 1.17, - "learning_rate": 1.3954284827926195e-06, - "loss": 0.5918, - "step": 45588 - }, - { - "epoch": 1.17, - "learning_rate": 1.3954030674187363e-06, - "loss": 0.6104, - "step": 45589 - }, - { - "epoch": 1.17, - "learning_rate": 1.395377651742111e-06, - "loss": 0.6631, - "step": 45590 - }, - { - "epoch": 1.17, - "learning_rate": 1.3953522357627636e-06, - "loss": 0.6123, - "step": 45591 - }, - { - "epoch": 1.17, - "learning_rate": 1.3953268194807128e-06, - "loss": 0.5737, - "step": 45592 - }, - { - "epoch": 1.17, - "learning_rate": 1.395301402895979e-06, - "loss": 0.79, - "step": 45593 - }, - { - "epoch": 1.17, - "learning_rate": 1.3952759860085804e-06, - "loss": 0.6846, - "step": 45594 - }, - { - "epoch": 1.17, - "learning_rate": 1.3952505688185375e-06, - "loss": 0.7246, - "step": 45595 - }, - { - "epoch": 1.17, - "learning_rate": 1.3952251513258693e-06, - "loss": 0.6768, - "step": 45596 - }, - { - "epoch": 1.17, - "learning_rate": 1.3951997335305956e-06, - "loss": 0.6357, - "step": 45597 - }, - { - "epoch": 1.17, - "learning_rate": 1.3951743154327355e-06, - "loss": 0.3943, - "step": 45598 - }, - { - "epoch": 1.17, - "learning_rate": 1.3951488970323084e-06, - "loss": 0.752, - "step": 45599 - }, - { - "epoch": 1.17, - "learning_rate": 1.3951234783293343e-06, - "loss": 0.5776, - "step": 45600 - }, - { - "epoch": 1.17, - "learning_rate": 1.395098059323832e-06, - "loss": 0.6084, - "step": 45601 - }, - { - "epoch": 1.17, - "learning_rate": 1.3950726400158216e-06, - "loss": 0.5137, - "step": 45602 - }, - { - "epoch": 1.17, - "learning_rate": 1.3950472204053222e-06, - "loss": 0.5991, - "step": 45603 - }, - { - "epoch": 1.17, - "learning_rate": 1.395021800492353e-06, - "loss": 0.5083, - "step": 45604 - }, - { - "epoch": 1.17, - "learning_rate": 1.394996380276934e-06, - "loss": 0.7578, - "step": 45605 - }, - { - "epoch": 1.17, - "learning_rate": 1.3949709597590844e-06, - "loss": 0.481, - "step": 45606 - }, - { - "epoch": 1.17, - "learning_rate": 1.3949455389388236e-06, - "loss": 0.585, - "step": 45607 - }, - { - "epoch": 1.17, - "learning_rate": 1.3949201178161715e-06, - "loss": 0.6475, - "step": 45608 - }, - { - "epoch": 1.17, - "learning_rate": 1.394894696391147e-06, - "loss": 0.6406, - "step": 45609 - }, - { - "epoch": 1.17, - "learning_rate": 1.3948692746637699e-06, - "loss": 0.7236, - "step": 45610 - }, - { - "epoch": 1.17, - "learning_rate": 1.3948438526340592e-06, - "loss": 0.6816, - "step": 45611 - }, - { - "epoch": 1.17, - "learning_rate": 1.394818430302035e-06, - "loss": 0.7441, - "step": 45612 - }, - { - "epoch": 1.17, - "learning_rate": 1.3947930076677166e-06, - "loss": 0.5759, - "step": 45613 - }, - { - "epoch": 1.17, - "learning_rate": 1.3947675847311232e-06, - "loss": 0.4761, - "step": 45614 - }, - { - "epoch": 1.17, - "learning_rate": 1.394742161492274e-06, - "loss": 0.7148, - "step": 45615 - }, - { - "epoch": 1.17, - "learning_rate": 1.3947167379511894e-06, - "loss": 0.7959, - "step": 45616 - }, - { - "epoch": 1.17, - "learning_rate": 1.3946913141078883e-06, - "loss": 0.6812, - "step": 45617 - }, - { - "epoch": 1.17, - "learning_rate": 1.39466588996239e-06, - "loss": 0.373, - "step": 45618 - }, - { - "epoch": 1.17, - "learning_rate": 1.3946404655147143e-06, - "loss": 0.6699, - "step": 45619 - }, - { - "epoch": 1.17, - "learning_rate": 1.3946150407648806e-06, - "loss": 0.5039, - "step": 45620 - }, - { - "epoch": 1.17, - "learning_rate": 1.3945896157129083e-06, - "loss": 0.7812, - "step": 45621 - }, - { - "epoch": 1.17, - "learning_rate": 1.3945641903588168e-06, - "loss": 0.6165, - "step": 45622 - }, - { - "epoch": 1.17, - "learning_rate": 1.3945387647026259e-06, - "loss": 0.5657, - "step": 45623 - }, - { - "epoch": 1.17, - "learning_rate": 1.3945133387443542e-06, - "loss": 0.5245, - "step": 45624 - }, - { - "epoch": 1.17, - "learning_rate": 1.3944879124840223e-06, - "loss": 0.6968, - "step": 45625 - }, - { - "epoch": 1.17, - "learning_rate": 1.3944624859216488e-06, - "loss": 0.7178, - "step": 45626 - }, - { - "epoch": 1.17, - "learning_rate": 1.394437059057254e-06, - "loss": 0.4956, - "step": 45627 - }, - { - "epoch": 1.17, - "learning_rate": 1.3944116318908566e-06, - "loss": 0.585, - "step": 45628 - }, - { - "epoch": 1.17, - "learning_rate": 1.3943862044224764e-06, - "loss": 0.5464, - "step": 45629 - }, - { - "epoch": 1.17, - "learning_rate": 1.3943607766521325e-06, - "loss": 0.6084, - "step": 45630 - }, - { - "epoch": 1.17, - "learning_rate": 1.3943353485798451e-06, - "loss": 0.6545, - "step": 45631 - }, - { - "epoch": 1.17, - "learning_rate": 1.3943099202056328e-06, - "loss": 0.5825, - "step": 45632 - }, - { - "epoch": 1.17, - "learning_rate": 1.3942844915295162e-06, - "loss": 0.606, - "step": 45633 - }, - { - "epoch": 1.17, - "learning_rate": 1.3942590625515136e-06, - "loss": 0.6572, - "step": 45634 - }, - { - "epoch": 1.17, - "learning_rate": 1.3942336332716452e-06, - "loss": 0.6289, - "step": 45635 - }, - { - "epoch": 1.17, - "learning_rate": 1.3942082036899299e-06, - "loss": 0.6157, - "step": 45636 - }, - { - "epoch": 1.17, - "learning_rate": 1.3941827738063879e-06, - "loss": 0.6675, - "step": 45637 - }, - { - "epoch": 1.17, - "learning_rate": 1.394157343621038e-06, - "loss": 0.5254, - "step": 45638 - }, - { - "epoch": 1.17, - "learning_rate": 1.3941319131339002e-06, - "loss": 0.7812, - "step": 45639 - }, - { - "epoch": 1.17, - "learning_rate": 1.3941064823449933e-06, - "loss": 0.5996, - "step": 45640 - }, - { - "epoch": 1.17, - "learning_rate": 1.3940810512543374e-06, - "loss": 0.5757, - "step": 45641 - }, - { - "epoch": 1.17, - "learning_rate": 1.3940556198619517e-06, - "loss": 0.5713, - "step": 45642 - }, - { - "epoch": 1.17, - "learning_rate": 1.394030188167856e-06, - "loss": 0.748, - "step": 45643 - }, - { - "epoch": 1.17, - "learning_rate": 1.3940047561720695e-06, - "loss": 0.5156, - "step": 45644 - }, - { - "epoch": 1.17, - "learning_rate": 1.3939793238746115e-06, - "loss": 0.7461, - "step": 45645 - }, - { - "epoch": 1.17, - "learning_rate": 1.3939538912755015e-06, - "loss": 0.7061, - "step": 45646 - }, - { - "epoch": 1.17, - "learning_rate": 1.3939284583747594e-06, - "loss": 0.5596, - "step": 45647 - }, - { - "epoch": 1.17, - "learning_rate": 1.3939030251724044e-06, - "loss": 0.4932, - "step": 45648 - }, - { - "epoch": 1.17, - "learning_rate": 1.3938775916684556e-06, - "loss": 0.5269, - "step": 45649 - }, - { - "epoch": 1.17, - "learning_rate": 1.3938521578629331e-06, - "loss": 0.5435, - "step": 45650 - }, - { - "epoch": 1.17, - "learning_rate": 1.393826723755856e-06, - "loss": 0.6289, - "step": 45651 - }, - { - "epoch": 1.17, - "learning_rate": 1.3938012893472441e-06, - "loss": 0.6455, - "step": 45652 - }, - { - "epoch": 1.17, - "learning_rate": 1.3937758546371166e-06, - "loss": 0.4929, - "step": 45653 - }, - { - "epoch": 1.17, - "learning_rate": 1.393750419625493e-06, - "loss": 0.7153, - "step": 45654 - }, - { - "epoch": 1.17, - "learning_rate": 1.3937249843123926e-06, - "loss": 0.5046, - "step": 45655 - }, - { - "epoch": 1.17, - "learning_rate": 1.3936995486978354e-06, - "loss": 0.6387, - "step": 45656 - }, - { - "epoch": 1.17, - "learning_rate": 1.3936741127818406e-06, - "loss": 0.6172, - "step": 45657 - }, - { - "epoch": 1.17, - "learning_rate": 1.3936486765644272e-06, - "loss": 0.6021, - "step": 45658 - }, - { - "epoch": 1.17, - "learning_rate": 1.3936232400456154e-06, - "loss": 0.6704, - "step": 45659 - }, - { - "epoch": 1.17, - "learning_rate": 1.3935978032254245e-06, - "loss": 0.7036, - "step": 45660 - }, - { - "epoch": 1.17, - "learning_rate": 1.3935723661038734e-06, - "loss": 0.8088, - "step": 45661 - }, - { - "epoch": 1.17, - "learning_rate": 1.3935469286809824e-06, - "loss": 0.6973, - "step": 45662 - }, - { - "epoch": 1.17, - "learning_rate": 1.3935214909567708e-06, - "loss": 0.5098, - "step": 45663 - }, - { - "epoch": 1.17, - "learning_rate": 1.3934960529312574e-06, - "loss": 0.751, - "step": 45664 - }, - { - "epoch": 1.17, - "learning_rate": 1.3934706146044626e-06, - "loss": 0.6465, - "step": 45665 - }, - { - "epoch": 1.17, - "learning_rate": 1.3934451759764053e-06, - "loss": 0.627, - "step": 45666 - }, - { - "epoch": 1.17, - "learning_rate": 1.393419737047105e-06, - "loss": 0.6021, - "step": 45667 - }, - { - "epoch": 1.17, - "learning_rate": 1.3933942978165813e-06, - "loss": 0.3449, - "step": 45668 - }, - { - "epoch": 1.17, - "learning_rate": 1.3933688582848538e-06, - "loss": 0.7666, - "step": 45669 - }, - { - "epoch": 1.17, - "learning_rate": 1.3933434184519416e-06, - "loss": 0.5762, - "step": 45670 - }, - { - "epoch": 1.17, - "learning_rate": 1.3933179783178648e-06, - "loss": 0.6899, - "step": 45671 - }, - { - "epoch": 1.17, - "learning_rate": 1.3932925378826424e-06, - "loss": 0.4536, - "step": 45672 - }, - { - "epoch": 1.17, - "learning_rate": 1.3932670971462939e-06, - "loss": 0.7441, - "step": 45673 - }, - { - "epoch": 1.17, - "learning_rate": 1.3932416561088388e-06, - "loss": 0.6201, - "step": 45674 - }, - { - "epoch": 1.17, - "learning_rate": 1.3932162147702969e-06, - "loss": 0.6538, - "step": 45675 - }, - { - "epoch": 1.17, - "learning_rate": 1.3931907731306872e-06, - "loss": 0.458, - "step": 45676 - }, - { - "epoch": 1.17, - "learning_rate": 1.3931653311900295e-06, - "loss": 0.7207, - "step": 45677 - }, - { - "epoch": 1.17, - "learning_rate": 1.393139888948343e-06, - "loss": 0.5552, - "step": 45678 - }, - { - "epoch": 1.17, - "learning_rate": 1.3931144464056476e-06, - "loss": 0.4907, - "step": 45679 - }, - { - "epoch": 1.17, - "learning_rate": 1.3930890035619624e-06, - "loss": 0.6094, - "step": 45680 - }, - { - "epoch": 1.17, - "learning_rate": 1.393063560417307e-06, - "loss": 0.6934, - "step": 45681 - }, - { - "epoch": 1.17, - "learning_rate": 1.3930381169717012e-06, - "loss": 0.5713, - "step": 45682 - }, - { - "epoch": 1.17, - "learning_rate": 1.3930126732251642e-06, - "loss": 0.7246, - "step": 45683 - }, - { - "epoch": 1.17, - "learning_rate": 1.392987229177715e-06, - "loss": 0.592, - "step": 45684 - }, - { - "epoch": 1.17, - "learning_rate": 1.3929617848293737e-06, - "loss": 0.707, - "step": 45685 - }, - { - "epoch": 1.17, - "learning_rate": 1.3929363401801596e-06, - "loss": 0.7827, - "step": 45686 - }, - { - "epoch": 1.17, - "learning_rate": 1.3929108952300925e-06, - "loss": 0.6016, - "step": 45687 - }, - { - "epoch": 1.17, - "learning_rate": 1.3928854499791916e-06, - "loss": 0.7642, - "step": 45688 - }, - { - "epoch": 1.17, - "learning_rate": 1.392860004427476e-06, - "loss": 0.541, - "step": 45689 - }, - { - "epoch": 1.17, - "learning_rate": 1.392834558574966e-06, - "loss": 0.7266, - "step": 45690 - }, - { - "epoch": 1.17, - "learning_rate": 1.3928091124216802e-06, - "loss": 0.6479, - "step": 45691 - }, - { - "epoch": 1.17, - "learning_rate": 1.3927836659676388e-06, - "loss": 0.6299, - "step": 45692 - }, - { - "epoch": 1.17, - "learning_rate": 1.3927582192128608e-06, - "loss": 0.6001, - "step": 45693 - }, - { - "epoch": 1.17, - "learning_rate": 1.3927327721573661e-06, - "loss": 0.8467, - "step": 45694 - }, - { - "epoch": 1.17, - "learning_rate": 1.3927073248011739e-06, - "loss": 0.624, - "step": 45695 - }, - { - "epoch": 1.17, - "learning_rate": 1.392681877144304e-06, - "loss": 0.6758, - "step": 45696 - }, - { - "epoch": 1.17, - "learning_rate": 1.3926564291867753e-06, - "loss": 0.5371, - "step": 45697 - }, - { - "epoch": 1.17, - "learning_rate": 1.3926309809286077e-06, - "loss": 0.8203, - "step": 45698 - }, - { - "epoch": 1.17, - "learning_rate": 1.3926055323698205e-06, - "loss": 0.6484, - "step": 45699 - }, - { - "epoch": 1.17, - "learning_rate": 1.3925800835104336e-06, - "loss": 0.5555, - "step": 45700 - }, - { - "epoch": 1.17, - "learning_rate": 1.392554634350466e-06, - "loss": 0.5771, - "step": 45701 - }, - { - "epoch": 1.17, - "learning_rate": 1.3925291848899375e-06, - "loss": 0.6494, - "step": 45702 - }, - { - "epoch": 1.17, - "learning_rate": 1.392503735128867e-06, - "loss": 0.5718, - "step": 45703 - }, - { - "epoch": 1.17, - "learning_rate": 1.392478285067275e-06, - "loss": 0.7744, - "step": 45704 - }, - { - "epoch": 1.17, - "learning_rate": 1.3924528347051801e-06, - "loss": 0.6592, - "step": 45705 - }, - { - "epoch": 1.17, - "learning_rate": 1.3924273840426022e-06, - "loss": 0.6567, - "step": 45706 - }, - { - "epoch": 1.17, - "learning_rate": 1.3924019330795609e-06, - "loss": 0.7129, - "step": 45707 - }, - { - "epoch": 1.17, - "learning_rate": 1.392376481816075e-06, - "loss": 0.748, - "step": 45708 - }, - { - "epoch": 1.17, - "learning_rate": 1.392351030252165e-06, - "loss": 0.6035, - "step": 45709 - }, - { - "epoch": 1.17, - "learning_rate": 1.3923255783878496e-06, - "loss": 0.7773, - "step": 45710 - }, - { - "epoch": 1.17, - "learning_rate": 1.3923001262231483e-06, - "loss": 0.6738, - "step": 45711 - }, - { - "epoch": 1.17, - "learning_rate": 1.3922746737580813e-06, - "loss": 0.6875, - "step": 45712 - }, - { - "epoch": 1.17, - "learning_rate": 1.3922492209926676e-06, - "loss": 0.7275, - "step": 45713 - }, - { - "epoch": 1.17, - "learning_rate": 1.3922237679269263e-06, - "loss": 0.749, - "step": 45714 - }, - { - "epoch": 1.17, - "learning_rate": 1.3921983145608775e-06, - "loss": 0.5508, - "step": 45715 - }, - { - "epoch": 1.17, - "learning_rate": 1.3921728608945405e-06, - "loss": 0.6582, - "step": 45716 - }, - { - "epoch": 1.17, - "learning_rate": 1.392147406927935e-06, - "loss": 0.7988, - "step": 45717 - }, - { - "epoch": 1.17, - "learning_rate": 1.39212195266108e-06, - "loss": 0.6836, - "step": 45718 - }, - { - "epoch": 1.17, - "learning_rate": 1.3920964980939952e-06, - "loss": 0.6792, - "step": 45719 - }, - { - "epoch": 1.17, - "learning_rate": 1.3920710432267e-06, - "loss": 0.7344, - "step": 45720 - }, - { - "epoch": 1.17, - "learning_rate": 1.3920455880592143e-06, - "loss": 0.752, - "step": 45721 - }, - { - "epoch": 1.17, - "learning_rate": 1.3920201325915576e-06, - "loss": 0.8096, - "step": 45722 - }, - { - "epoch": 1.17, - "learning_rate": 1.3919946768237488e-06, - "loss": 0.7588, - "step": 45723 - }, - { - "epoch": 1.17, - "learning_rate": 1.3919692207558074e-06, - "loss": 0.3494, - "step": 45724 - }, - { - "epoch": 1.17, - "learning_rate": 1.3919437643877536e-06, - "loss": 0.6479, - "step": 45725 - }, - { - "epoch": 1.17, - "learning_rate": 1.3919183077196061e-06, - "loss": 0.3804, - "step": 45726 - }, - { - "epoch": 1.17, - "learning_rate": 1.3918928507513852e-06, - "loss": 0.7812, - "step": 45727 - }, - { - "epoch": 1.17, - "learning_rate": 1.39186739348311e-06, - "loss": 0.5781, - "step": 45728 - }, - { - "epoch": 1.17, - "learning_rate": 1.3918419359147997e-06, - "loss": 0.7666, - "step": 45729 - }, - { - "epoch": 1.17, - "learning_rate": 1.3918164780464737e-06, - "loss": 0.4678, - "step": 45730 - }, - { - "epoch": 1.17, - "learning_rate": 1.3917910198781526e-06, - "loss": 0.4873, - "step": 45731 - }, - { - "epoch": 1.17, - "learning_rate": 1.391765561409855e-06, - "loss": 0.7617, - "step": 45732 - }, - { - "epoch": 1.17, - "learning_rate": 1.3917401026416e-06, - "loss": 0.6826, - "step": 45733 - }, - { - "epoch": 1.17, - "learning_rate": 1.3917146435734079e-06, - "loss": 0.6924, - "step": 45734 - }, - { - "epoch": 1.17, - "learning_rate": 1.3916891842052978e-06, - "loss": 0.5142, - "step": 45735 - }, - { - "epoch": 1.17, - "learning_rate": 1.3916637245372896e-06, - "loss": 0.7129, - "step": 45736 - }, - { - "epoch": 1.17, - "learning_rate": 1.3916382645694023e-06, - "loss": 0.6797, - "step": 45737 - }, - { - "epoch": 1.17, - "learning_rate": 1.3916128043016558e-06, - "loss": 0.363, - "step": 45738 - }, - { - "epoch": 1.17, - "learning_rate": 1.391587343734069e-06, - "loss": 0.6475, - "step": 45739 - }, - { - "epoch": 1.17, - "learning_rate": 1.391561882866662e-06, - "loss": 0.5591, - "step": 45740 - }, - { - "epoch": 1.17, - "learning_rate": 1.3915364216994538e-06, - "loss": 0.5767, - "step": 45741 - }, - { - "epoch": 1.17, - "learning_rate": 1.3915109602324647e-06, - "loss": 0.6431, - "step": 45742 - }, - { - "epoch": 1.17, - "learning_rate": 1.3914854984657132e-06, - "loss": 0.6064, - "step": 45743 - }, - { - "epoch": 1.17, - "learning_rate": 1.3914600363992196e-06, - "loss": 0.6699, - "step": 45744 - }, - { - "epoch": 1.17, - "learning_rate": 1.3914345740330027e-06, - "loss": 0.4727, - "step": 45745 - }, - { - "epoch": 1.17, - "learning_rate": 1.3914091113670825e-06, - "loss": 0.7207, - "step": 45746 - }, - { - "epoch": 1.17, - "learning_rate": 1.3913836484014785e-06, - "loss": 0.5217, - "step": 45747 - }, - { - "epoch": 1.17, - "learning_rate": 1.3913581851362099e-06, - "loss": 0.7148, - "step": 45748 - }, - { - "epoch": 1.17, - "learning_rate": 1.3913327215712961e-06, - "loss": 0.6729, - "step": 45749 - }, - { - "epoch": 1.17, - "learning_rate": 1.391307257706757e-06, - "loss": 0.8076, - "step": 45750 - }, - { - "epoch": 1.17, - "learning_rate": 1.3912817935426119e-06, - "loss": 0.5205, - "step": 45751 - }, - { - "epoch": 1.17, - "learning_rate": 1.3912563290788806e-06, - "loss": 0.7393, - "step": 45752 - }, - { - "epoch": 1.17, - "learning_rate": 1.391230864315582e-06, - "loss": 0.6055, - "step": 45753 - }, - { - "epoch": 1.17, - "learning_rate": 1.391205399252736e-06, - "loss": 0.7236, - "step": 45754 - }, - { - "epoch": 1.17, - "learning_rate": 1.3911799338903621e-06, - "loss": 0.8398, - "step": 45755 - }, - { - "epoch": 1.17, - "learning_rate": 1.3911544682284796e-06, - "loss": 0.6003, - "step": 45756 - }, - { - "epoch": 1.17, - "learning_rate": 1.3911290022671085e-06, - "loss": 0.5625, - "step": 45757 - }, - { - "epoch": 1.17, - "learning_rate": 1.3911035360062672e-06, - "loss": 0.8428, - "step": 45758 - }, - { - "epoch": 1.17, - "learning_rate": 1.3910780694459765e-06, - "loss": 0.915, - "step": 45759 - }, - { - "epoch": 1.17, - "learning_rate": 1.391052602586255e-06, - "loss": 0.6621, - "step": 45760 - }, - { - "epoch": 1.17, - "learning_rate": 1.3910271354271227e-06, - "loss": 0.5728, - "step": 45761 - }, - { - "epoch": 1.17, - "learning_rate": 1.3910016679685988e-06, - "loss": 0.7197, - "step": 45762 - }, - { - "epoch": 1.17, - "learning_rate": 1.3909762002107028e-06, - "loss": 0.5767, - "step": 45763 - }, - { - "epoch": 1.17, - "learning_rate": 1.3909507321534543e-06, - "loss": 0.6802, - "step": 45764 - }, - { - "epoch": 1.17, - "learning_rate": 1.3909252637968729e-06, - "loss": 0.6973, - "step": 45765 - }, - { - "epoch": 1.17, - "learning_rate": 1.390899795140978e-06, - "loss": 0.7266, - "step": 45766 - }, - { - "epoch": 1.17, - "learning_rate": 1.3908743261857894e-06, - "loss": 0.6035, - "step": 45767 - }, - { - "epoch": 1.17, - "learning_rate": 1.390848856931326e-06, - "loss": 0.5737, - "step": 45768 - }, - { - "epoch": 1.17, - "learning_rate": 1.3908233873776074e-06, - "loss": 0.541, - "step": 45769 - }, - { - "epoch": 1.17, - "learning_rate": 1.3907979175246533e-06, - "loss": 0.6689, - "step": 45770 - }, - { - "epoch": 1.17, - "learning_rate": 1.3907724473724836e-06, - "loss": 0.7012, - "step": 45771 - }, - { - "epoch": 1.17, - "learning_rate": 1.3907469769211172e-06, - "loss": 0.6172, - "step": 45772 - }, - { - "epoch": 1.17, - "learning_rate": 1.390721506170574e-06, - "loss": 0.3445, - "step": 45773 - }, - { - "epoch": 1.17, - "learning_rate": 1.3906960351208729e-06, - "loss": 0.7969, - "step": 45774 - }, - { - "epoch": 1.17, - "learning_rate": 1.3906705637720342e-06, - "loss": 0.8486, - "step": 45775 - }, - { - "epoch": 1.17, - "learning_rate": 1.3906450921240767e-06, - "loss": 0.5977, - "step": 45776 - }, - { - "epoch": 1.17, - "learning_rate": 1.3906196201770205e-06, - "loss": 0.5845, - "step": 45777 - }, - { - "epoch": 1.17, - "learning_rate": 1.3905941479308847e-06, - "loss": 0.7227, - "step": 45778 - }, - { - "epoch": 1.17, - "learning_rate": 1.3905686753856887e-06, - "loss": 0.6357, - "step": 45779 - }, - { - "epoch": 1.17, - "learning_rate": 1.3905432025414526e-06, - "loss": 0.5752, - "step": 45780 - }, - { - "epoch": 1.17, - "learning_rate": 1.3905177293981952e-06, - "loss": 0.5935, - "step": 45781 - }, - { - "epoch": 1.17, - "learning_rate": 1.3904922559559366e-06, - "loss": 0.6016, - "step": 45782 - }, - { - "epoch": 1.17, - "learning_rate": 1.3904667822146958e-06, - "loss": 0.5352, - "step": 45783 - }, - { - "epoch": 1.17, - "learning_rate": 1.3904413081744928e-06, - "loss": 0.7598, - "step": 45784 - }, - { - "epoch": 1.17, - "learning_rate": 1.3904158338353464e-06, - "loss": 0.5986, - "step": 45785 - }, - { - "epoch": 1.17, - "learning_rate": 1.3903903591972773e-06, - "loss": 0.4248, - "step": 45786 - }, - { - "epoch": 1.17, - "learning_rate": 1.3903648842603035e-06, - "loss": 0.6797, - "step": 45787 - }, - { - "epoch": 1.17, - "learning_rate": 1.3903394090244458e-06, - "loss": 0.6924, - "step": 45788 - }, - { - "epoch": 1.17, - "learning_rate": 1.3903139334897228e-06, - "loss": 0.6846, - "step": 45789 - }, - { - "epoch": 1.17, - "learning_rate": 1.3902884576561547e-06, - "loss": 0.7695, - "step": 45790 - }, - { - "epoch": 1.17, - "learning_rate": 1.39026298152376e-06, - "loss": 0.5356, - "step": 45791 - }, - { - "epoch": 1.17, - "learning_rate": 1.3902375050925596e-06, - "loss": 0.7061, - "step": 45792 - }, - { - "epoch": 1.17, - "learning_rate": 1.390212028362572e-06, - "loss": 0.6709, - "step": 45793 - }, - { - "epoch": 1.17, - "learning_rate": 1.390186551333817e-06, - "loss": 0.5413, - "step": 45794 - }, - { - "epoch": 1.17, - "learning_rate": 1.390161074006314e-06, - "loss": 0.551, - "step": 45795 - }, - { - "epoch": 1.17, - "learning_rate": 1.390135596380083e-06, - "loss": 0.6084, - "step": 45796 - }, - { - "epoch": 1.17, - "learning_rate": 1.3901101184551429e-06, - "loss": 0.6943, - "step": 45797 - }, - { - "epoch": 1.17, - "learning_rate": 1.3900846402315132e-06, - "loss": 0.8203, - "step": 45798 - }, - { - "epoch": 1.17, - "learning_rate": 1.390059161709214e-06, - "loss": 0.6787, - "step": 45799 - }, - { - "epoch": 1.17, - "learning_rate": 1.390033682888264e-06, - "loss": 0.7559, - "step": 45800 - }, - { - "epoch": 1.17, - "learning_rate": 1.3900082037686833e-06, - "loss": 0.7217, - "step": 45801 - }, - { - "epoch": 1.17, - "learning_rate": 1.3899827243504913e-06, - "loss": 0.4277, - "step": 45802 - }, - { - "epoch": 1.17, - "learning_rate": 1.3899572446337079e-06, - "loss": 0.7021, - "step": 45803 - }, - { - "epoch": 1.17, - "learning_rate": 1.3899317646183515e-06, - "loss": 0.6221, - "step": 45804 - }, - { - "epoch": 1.17, - "learning_rate": 1.3899062843044424e-06, - "loss": 0.6729, - "step": 45805 - }, - { - "epoch": 1.17, - "learning_rate": 1.389880803692e-06, - "loss": 0.6099, - "step": 45806 - }, - { - "epoch": 1.17, - "learning_rate": 1.3898553227810444e-06, - "loss": 0.5547, - "step": 45807 - }, - { - "epoch": 1.17, - "learning_rate": 1.3898298415715937e-06, - "loss": 0.8008, - "step": 45808 - }, - { - "epoch": 1.17, - "learning_rate": 1.3898043600636687e-06, - "loss": 0.749, - "step": 45809 - }, - { - "epoch": 1.17, - "learning_rate": 1.389778878257288e-06, - "loss": 0.4429, - "step": 45810 - }, - { - "epoch": 1.17, - "learning_rate": 1.3897533961524718e-06, - "loss": 0.5859, - "step": 45811 - }, - { - "epoch": 1.17, - "learning_rate": 1.3897279137492395e-06, - "loss": 0.5083, - "step": 45812 - }, - { - "epoch": 1.17, - "learning_rate": 1.3897024310476103e-06, - "loss": 0.4363, - "step": 45813 - }, - { - "epoch": 1.17, - "learning_rate": 1.3896769480476037e-06, - "loss": 0.5625, - "step": 45814 - }, - { - "epoch": 1.17, - "learning_rate": 1.3896514647492397e-06, - "loss": 0.627, - "step": 45815 - }, - { - "epoch": 1.17, - "learning_rate": 1.389625981152537e-06, - "loss": 0.6353, - "step": 45816 - }, - { - "epoch": 1.17, - "learning_rate": 1.3896004972575162e-06, - "loss": 0.6973, - "step": 45817 - }, - { - "epoch": 1.17, - "learning_rate": 1.3895750130641959e-06, - "loss": 0.6816, - "step": 45818 - }, - { - "epoch": 1.17, - "learning_rate": 1.389549528572596e-06, - "loss": 0.6128, - "step": 45819 - }, - { - "epoch": 1.17, - "learning_rate": 1.3895240437827358e-06, - "loss": 0.5715, - "step": 45820 - }, - { - "epoch": 1.17, - "learning_rate": 1.389498558694635e-06, - "loss": 0.6519, - "step": 45821 - }, - { - "epoch": 1.17, - "learning_rate": 1.3894730733083133e-06, - "loss": 0.5312, - "step": 45822 - }, - { - "epoch": 1.17, - "learning_rate": 1.3894475876237897e-06, - "loss": 0.7266, - "step": 45823 - }, - { - "epoch": 1.17, - "learning_rate": 1.389422101641084e-06, - "loss": 0.7637, - "step": 45824 - }, - { - "epoch": 1.17, - "learning_rate": 1.3893966153602157e-06, - "loss": 0.6074, - "step": 45825 - }, - { - "epoch": 1.17, - "learning_rate": 1.3893711287812046e-06, - "loss": 0.5728, - "step": 45826 - }, - { - "epoch": 1.17, - "learning_rate": 1.3893456419040699e-06, - "loss": 0.5391, - "step": 45827 - }, - { - "epoch": 1.17, - "learning_rate": 1.3893201547288308e-06, - "loss": 0.5376, - "step": 45828 - }, - { - "epoch": 1.17, - "learning_rate": 1.3892946672555073e-06, - "loss": 0.8647, - "step": 45829 - }, - { - "epoch": 1.17, - "learning_rate": 1.389269179484119e-06, - "loss": 0.605, - "step": 45830 - }, - { - "epoch": 1.17, - "learning_rate": 1.3892436914146848e-06, - "loss": 0.667, - "step": 45831 - }, - { - "epoch": 1.17, - "learning_rate": 1.389218203047225e-06, - "loss": 0.6621, - "step": 45832 - }, - { - "epoch": 1.17, - "learning_rate": 1.3891927143817586e-06, - "loss": 0.4666, - "step": 45833 - }, - { - "epoch": 1.17, - "learning_rate": 1.389167225418305e-06, - "loss": 0.6484, - "step": 45834 - }, - { - "epoch": 1.17, - "learning_rate": 1.389141736156884e-06, - "loss": 0.5615, - "step": 45835 - }, - { - "epoch": 1.17, - "learning_rate": 1.3891162465975153e-06, - "loss": 0.7305, - "step": 45836 - }, - { - "epoch": 1.17, - "learning_rate": 1.3890907567402182e-06, - "loss": 0.6763, - "step": 45837 - }, - { - "epoch": 1.17, - "learning_rate": 1.389065266585012e-06, - "loss": 0.6177, - "step": 45838 - }, - { - "epoch": 1.17, - "learning_rate": 1.3890397761319163e-06, - "loss": 0.5869, - "step": 45839 - }, - { - "epoch": 1.17, - "learning_rate": 1.389014285380951e-06, - "loss": 0.6528, - "step": 45840 - }, - { - "epoch": 1.17, - "learning_rate": 1.388988794332135e-06, - "loss": 0.5129, - "step": 45841 - }, - { - "epoch": 1.17, - "learning_rate": 1.3889633029854886e-06, - "loss": 0.6519, - "step": 45842 - }, - { - "epoch": 1.17, - "learning_rate": 1.388937811341031e-06, - "loss": 0.624, - "step": 45843 - }, - { - "epoch": 1.18, - "learning_rate": 1.3889123193987808e-06, - "loss": 0.6426, - "step": 45844 - }, - { - "epoch": 1.18, - "learning_rate": 1.388886827158759e-06, - "loss": 0.5225, - "step": 45845 - }, - { - "epoch": 1.18, - "learning_rate": 1.3888613346209843e-06, - "loss": 0.6326, - "step": 45846 - }, - { - "epoch": 1.18, - "learning_rate": 1.3888358417854764e-06, - "loss": 0.5713, - "step": 45847 - }, - { - "epoch": 1.18, - "learning_rate": 1.3888103486522545e-06, - "loss": 0.8242, - "step": 45848 - }, - { - "epoch": 1.18, - "learning_rate": 1.3887848552213388e-06, - "loss": 0.7998, - "step": 45849 - }, - { - "epoch": 1.18, - "learning_rate": 1.3887593614927479e-06, - "loss": 0.561, - "step": 45850 - }, - { - "epoch": 1.18, - "learning_rate": 1.3887338674665024e-06, - "loss": 0.6626, - "step": 45851 - }, - { - "epoch": 1.18, - "learning_rate": 1.388708373142621e-06, - "loss": 0.5645, - "step": 45852 - }, - { - "epoch": 1.18, - "learning_rate": 1.3886828785211235e-06, - "loss": 0.4171, - "step": 45853 - }, - { - "epoch": 1.18, - "learning_rate": 1.3886573836020291e-06, - "loss": 0.5039, - "step": 45854 - }, - { - "epoch": 1.18, - "learning_rate": 1.3886318883853578e-06, - "loss": 0.4299, - "step": 45855 - }, - { - "epoch": 1.18, - "learning_rate": 1.3886063928711292e-06, - "loss": 0.6221, - "step": 45856 - }, - { - "epoch": 1.18, - "learning_rate": 1.3885808970593624e-06, - "loss": 0.7383, - "step": 45857 - }, - { - "epoch": 1.18, - "learning_rate": 1.3885554009500768e-06, - "loss": 0.6611, - "step": 45858 - }, - { - "epoch": 1.18, - "learning_rate": 1.3885299045432926e-06, - "loss": 0.4666, - "step": 45859 - }, - { - "epoch": 1.18, - "learning_rate": 1.3885044078390286e-06, - "loss": 0.7031, - "step": 45860 - }, - { - "epoch": 1.18, - "learning_rate": 1.3884789108373046e-06, - "loss": 0.6504, - "step": 45861 - }, - { - "epoch": 1.18, - "learning_rate": 1.3884534135381408e-06, - "loss": 0.5596, - "step": 45862 - }, - { - "epoch": 1.18, - "learning_rate": 1.3884279159415555e-06, - "loss": 0.6543, - "step": 45863 - }, - { - "epoch": 1.18, - "learning_rate": 1.388402418047569e-06, - "loss": 0.6309, - "step": 45864 - }, - { - "epoch": 1.18, - "learning_rate": 1.3883769198562005e-06, - "loss": 0.6016, - "step": 45865 - }, - { - "epoch": 1.18, - "learning_rate": 1.3883514213674693e-06, - "loss": 0.573, - "step": 45866 - }, - { - "epoch": 1.18, - "learning_rate": 1.388325922581396e-06, - "loss": 0.5493, - "step": 45867 - }, - { - "epoch": 1.18, - "learning_rate": 1.388300423497999e-06, - "loss": 0.454, - "step": 45868 - }, - { - "epoch": 1.18, - "learning_rate": 1.3882749241172982e-06, - "loss": 0.8516, - "step": 45869 - }, - { - "epoch": 1.18, - "learning_rate": 1.3882494244393132e-06, - "loss": 0.5156, - "step": 45870 - }, - { - "epoch": 1.18, - "learning_rate": 1.3882239244640634e-06, - "loss": 0.5239, - "step": 45871 - }, - { - "epoch": 1.18, - "learning_rate": 1.3881984241915687e-06, - "loss": 0.7295, - "step": 45872 - }, - { - "epoch": 1.18, - "learning_rate": 1.388172923621848e-06, - "loss": 0.7505, - "step": 45873 - }, - { - "epoch": 1.18, - "learning_rate": 1.3881474227549215e-06, - "loss": 0.6543, - "step": 45874 - }, - { - "epoch": 1.18, - "learning_rate": 1.388121921590808e-06, - "loss": 0.709, - "step": 45875 - }, - { - "epoch": 1.18, - "learning_rate": 1.3880964201295275e-06, - "loss": 0.6309, - "step": 45876 - }, - { - "epoch": 1.18, - "learning_rate": 1.3880709183710994e-06, - "loss": 0.6836, - "step": 45877 - }, - { - "epoch": 1.18, - "learning_rate": 1.3880454163155434e-06, - "loss": 0.6289, - "step": 45878 - }, - { - "epoch": 1.18, - "learning_rate": 1.3880199139628785e-06, - "loss": 0.5742, - "step": 45879 - }, - { - "epoch": 1.18, - "learning_rate": 1.387994411313125e-06, - "loss": 0.6755, - "step": 45880 - }, - { - "epoch": 1.18, - "learning_rate": 1.3879689083663015e-06, - "loss": 0.9258, - "step": 45881 - }, - { - "epoch": 1.18, - "learning_rate": 1.3879434051224288e-06, - "loss": 0.5415, - "step": 45882 - }, - { - "epoch": 1.18, - "learning_rate": 1.3879179015815253e-06, - "loss": 0.7402, - "step": 45883 - }, - { - "epoch": 1.18, - "learning_rate": 1.3878923977436108e-06, - "loss": 0.7686, - "step": 45884 - }, - { - "epoch": 1.18, - "learning_rate": 1.3878668936087047e-06, - "loss": 0.5693, - "step": 45885 - }, - { - "epoch": 1.18, - "learning_rate": 1.3878413891768272e-06, - "loss": 0.7627, - "step": 45886 - }, - { - "epoch": 1.18, - "learning_rate": 1.3878158844479973e-06, - "loss": 0.5869, - "step": 45887 - }, - { - "epoch": 1.18, - "learning_rate": 1.3877903794222343e-06, - "loss": 0.5422, - "step": 45888 - }, - { - "epoch": 1.18, - "learning_rate": 1.3877648740995585e-06, - "loss": 0.4636, - "step": 45889 - }, - { - "epoch": 1.18, - "learning_rate": 1.3877393684799885e-06, - "loss": 0.6172, - "step": 45890 - }, - { - "epoch": 1.18, - "learning_rate": 1.3877138625635447e-06, - "loss": 0.666, - "step": 45891 - }, - { - "epoch": 1.18, - "learning_rate": 1.3876883563502462e-06, - "loss": 0.7217, - "step": 45892 - }, - { - "epoch": 1.18, - "learning_rate": 1.3876628498401124e-06, - "loss": 0.7188, - "step": 45893 - }, - { - "epoch": 1.18, - "learning_rate": 1.387637343033163e-06, - "loss": 0.8701, - "step": 45894 - }, - { - "epoch": 1.18, - "learning_rate": 1.3876118359294174e-06, - "loss": 0.5825, - "step": 45895 - }, - { - "epoch": 1.18, - "learning_rate": 1.3875863285288952e-06, - "loss": 0.6763, - "step": 45896 - }, - { - "epoch": 1.18, - "learning_rate": 1.3875608208316163e-06, - "loss": 0.5469, - "step": 45897 - }, - { - "epoch": 1.18, - "learning_rate": 1.3875353128375998e-06, - "loss": 0.6455, - "step": 45898 - }, - { - "epoch": 1.18, - "learning_rate": 1.3875098045468653e-06, - "loss": 0.5049, - "step": 45899 - }, - { - "epoch": 1.18, - "learning_rate": 1.387484295959432e-06, - "loss": 0.5204, - "step": 45900 - }, - { - "epoch": 1.18, - "learning_rate": 1.38745878707532e-06, - "loss": 0.6533, - "step": 45901 - }, - { - "epoch": 1.18, - "learning_rate": 1.387433277894549e-06, - "loss": 0.6611, - "step": 45902 - }, - { - "epoch": 1.18, - "learning_rate": 1.387407768417138e-06, - "loss": 0.6265, - "step": 45903 - }, - { - "epoch": 1.18, - "learning_rate": 1.3873822586431062e-06, - "loss": 0.6357, - "step": 45904 - }, - { - "epoch": 1.18, - "learning_rate": 1.3873567485724743e-06, - "loss": 0.6689, - "step": 45905 - }, - { - "epoch": 1.18, - "learning_rate": 1.3873312382052605e-06, - "loss": 0.7085, - "step": 45906 - }, - { - "epoch": 1.18, - "learning_rate": 1.3873057275414855e-06, - "loss": 0.5869, - "step": 45907 - }, - { - "epoch": 1.18, - "learning_rate": 1.3872802165811682e-06, - "loss": 0.749, - "step": 45908 - }, - { - "epoch": 1.18, - "learning_rate": 1.3872547053243282e-06, - "loss": 0.6548, - "step": 45909 - }, - { - "epoch": 1.18, - "learning_rate": 1.3872291937709848e-06, - "loss": 0.7383, - "step": 45910 - }, - { - "epoch": 1.18, - "learning_rate": 1.387203681921158e-06, - "loss": 0.6729, - "step": 45911 - }, - { - "epoch": 1.18, - "learning_rate": 1.3871781697748674e-06, - "loss": 0.791, - "step": 45912 - }, - { - "epoch": 1.18, - "learning_rate": 1.387152657332132e-06, - "loss": 0.5637, - "step": 45913 - }, - { - "epoch": 1.18, - "learning_rate": 1.3871271445929718e-06, - "loss": 0.6401, - "step": 45914 - }, - { - "epoch": 1.18, - "learning_rate": 1.3871016315574058e-06, - "loss": 0.6436, - "step": 45915 - }, - { - "epoch": 1.18, - "learning_rate": 1.3870761182254541e-06, - "loss": 0.7109, - "step": 45916 - }, - { - "epoch": 1.18, - "learning_rate": 1.3870506045971362e-06, - "loss": 0.8037, - "step": 45917 - }, - { - "epoch": 1.18, - "learning_rate": 1.3870250906724713e-06, - "loss": 0.7246, - "step": 45918 - }, - { - "epoch": 1.18, - "learning_rate": 1.386999576451479e-06, - "loss": 0.7598, - "step": 45919 - }, - { - "epoch": 1.18, - "learning_rate": 1.386974061934179e-06, - "loss": 0.6509, - "step": 45920 - }, - { - "epoch": 1.18, - "learning_rate": 1.3869485471205906e-06, - "loss": 0.7754, - "step": 45921 - }, - { - "epoch": 1.18, - "learning_rate": 1.386923032010734e-06, - "loss": 0.6895, - "step": 45922 - }, - { - "epoch": 1.18, - "learning_rate": 1.3868975166046275e-06, - "loss": 0.5659, - "step": 45923 - }, - { - "epoch": 1.18, - "learning_rate": 1.3868720009022918e-06, - "loss": 0.7441, - "step": 45924 - }, - { - "epoch": 1.18, - "learning_rate": 1.3868464849037457e-06, - "loss": 0.3533, - "step": 45925 - }, - { - "epoch": 1.18, - "learning_rate": 1.3868209686090093e-06, - "loss": 0.8779, - "step": 45926 - }, - { - "epoch": 1.18, - "learning_rate": 1.386795452018102e-06, - "loss": 0.6685, - "step": 45927 - }, - { - "epoch": 1.18, - "learning_rate": 1.386769935131043e-06, - "loss": 0.6689, - "step": 45928 - }, - { - "epoch": 1.18, - "learning_rate": 1.386744417947852e-06, - "loss": 0.7871, - "step": 45929 - }, - { - "epoch": 1.18, - "learning_rate": 1.3867189004685487e-06, - "loss": 0.5449, - "step": 45930 - }, - { - "epoch": 1.18, - "learning_rate": 1.3866933826931524e-06, - "loss": 0.7754, - "step": 45931 - }, - { - "epoch": 1.18, - "learning_rate": 1.3866678646216827e-06, - "loss": 0.6021, - "step": 45932 - }, - { - "epoch": 1.18, - "learning_rate": 1.3866423462541595e-06, - "loss": 0.7256, - "step": 45933 - }, - { - "epoch": 1.18, - "learning_rate": 1.386616827590602e-06, - "loss": 0.626, - "step": 45934 - }, - { - "epoch": 1.18, - "learning_rate": 1.3865913086310294e-06, - "loss": 0.5591, - "step": 45935 - }, - { - "epoch": 1.18, - "learning_rate": 1.3865657893754618e-06, - "loss": 0.7354, - "step": 45936 - }, - { - "epoch": 1.18, - "learning_rate": 1.3865402698239187e-06, - "loss": 0.7549, - "step": 45937 - }, - { - "epoch": 1.18, - "learning_rate": 1.3865147499764194e-06, - "loss": 0.7773, - "step": 45938 - }, - { - "epoch": 1.18, - "learning_rate": 1.3864892298329834e-06, - "loss": 0.9307, - "step": 45939 - }, - { - "epoch": 1.18, - "learning_rate": 1.3864637093936303e-06, - "loss": 0.5386, - "step": 45940 - }, - { - "epoch": 1.18, - "learning_rate": 1.3864381886583803e-06, - "loss": 0.6245, - "step": 45941 - }, - { - "epoch": 1.18, - "learning_rate": 1.3864126676272517e-06, - "loss": 0.6982, - "step": 45942 - }, - { - "epoch": 1.18, - "learning_rate": 1.386387146300265e-06, - "loss": 0.5601, - "step": 45943 - }, - { - "epoch": 1.18, - "learning_rate": 1.3863616246774393e-06, - "loss": 0.5659, - "step": 45944 - }, - { - "epoch": 1.18, - "learning_rate": 1.3863361027587944e-06, - "loss": 0.7256, - "step": 45945 - }, - { - "epoch": 1.18, - "learning_rate": 1.3863105805443496e-06, - "loss": 0.627, - "step": 45946 - }, - { - "epoch": 1.18, - "learning_rate": 1.3862850580341246e-06, - "loss": 0.4199, - "step": 45947 - }, - { - "epoch": 1.18, - "learning_rate": 1.3862595352281388e-06, - "loss": 0.6929, - "step": 45948 - }, - { - "epoch": 1.18, - "learning_rate": 1.386234012126412e-06, - "loss": 0.5891, - "step": 45949 - }, - { - "epoch": 1.18, - "learning_rate": 1.3862084887289634e-06, - "loss": 0.5669, - "step": 45950 - }, - { - "epoch": 1.18, - "learning_rate": 1.3861829650358129e-06, - "loss": 0.6465, - "step": 45951 - }, - { - "epoch": 1.18, - "learning_rate": 1.3861574410469797e-06, - "loss": 0.5771, - "step": 45952 - }, - { - "epoch": 1.18, - "learning_rate": 1.3861319167624837e-06, - "loss": 0.5784, - "step": 45953 - }, - { - "epoch": 1.18, - "learning_rate": 1.386106392182344e-06, - "loss": 0.5991, - "step": 45954 - }, - { - "epoch": 1.18, - "learning_rate": 1.3860808673065805e-06, - "loss": 0.5588, - "step": 45955 - }, - { - "epoch": 1.18, - "learning_rate": 1.3860553421352127e-06, - "loss": 0.7285, - "step": 45956 - }, - { - "epoch": 1.18, - "learning_rate": 1.3860298166682598e-06, - "loss": 0.7018, - "step": 45957 - }, - { - "epoch": 1.18, - "learning_rate": 1.386004290905742e-06, - "loss": 0.6812, - "step": 45958 - }, - { - "epoch": 1.18, - "learning_rate": 1.3859787648476782e-06, - "loss": 0.6553, - "step": 45959 - }, - { - "epoch": 1.18, - "learning_rate": 1.3859532384940882e-06, - "loss": 0.7363, - "step": 45960 - }, - { - "epoch": 1.18, - "learning_rate": 1.3859277118449918e-06, - "loss": 0.5803, - "step": 45961 - }, - { - "epoch": 1.18, - "learning_rate": 1.385902184900408e-06, - "loss": 0.6748, - "step": 45962 - }, - { - "epoch": 1.18, - "learning_rate": 1.385876657660357e-06, - "loss": 0.7852, - "step": 45963 - }, - { - "epoch": 1.18, - "learning_rate": 1.3858511301248576e-06, - "loss": 0.5786, - "step": 45964 - }, - { - "epoch": 1.18, - "learning_rate": 1.3858256022939298e-06, - "loss": 0.5791, - "step": 45965 - }, - { - "epoch": 1.18, - "learning_rate": 1.3858000741675935e-06, - "loss": 0.6338, - "step": 45966 - }, - { - "epoch": 1.18, - "learning_rate": 1.3857745457458672e-06, - "loss": 0.7773, - "step": 45967 - }, - { - "epoch": 1.18, - "learning_rate": 1.3857490170287716e-06, - "loss": 0.5581, - "step": 45968 - }, - { - "epoch": 1.18, - "learning_rate": 1.3857234880163253e-06, - "loss": 0.5811, - "step": 45969 - }, - { - "epoch": 1.18, - "learning_rate": 1.3856979587085485e-06, - "loss": 0.5059, - "step": 45970 - }, - { - "epoch": 1.18, - "learning_rate": 1.3856724291054604e-06, - "loss": 0.748, - "step": 45971 - }, - { - "epoch": 1.18, - "learning_rate": 1.3856468992070808e-06, - "loss": 0.5146, - "step": 45972 - }, - { - "epoch": 1.18, - "learning_rate": 1.385621369013429e-06, - "loss": 0.6333, - "step": 45973 - }, - { - "epoch": 1.18, - "learning_rate": 1.3855958385245248e-06, - "loss": 0.6675, - "step": 45974 - }, - { - "epoch": 1.18, - "learning_rate": 1.3855703077403874e-06, - "loss": 0.6934, - "step": 45975 - }, - { - "epoch": 1.18, - "learning_rate": 1.3855447766610365e-06, - "loss": 0.6162, - "step": 45976 - }, - { - "epoch": 1.18, - "learning_rate": 1.385519245286492e-06, - "loss": 0.7188, - "step": 45977 - }, - { - "epoch": 1.18, - "learning_rate": 1.3854937136167726e-06, - "loss": 0.6543, - "step": 45978 - }, - { - "epoch": 1.18, - "learning_rate": 1.3854681816518988e-06, - "loss": 0.7695, - "step": 45979 - }, - { - "epoch": 1.18, - "learning_rate": 1.3854426493918897e-06, - "loss": 0.7822, - "step": 45980 - }, - { - "epoch": 1.18, - "learning_rate": 1.385417116836765e-06, - "loss": 0.8047, - "step": 45981 - }, - { - "epoch": 1.18, - "learning_rate": 1.3853915839865437e-06, - "loss": 0.6846, - "step": 45982 - }, - { - "epoch": 1.18, - "learning_rate": 1.3853660508412462e-06, - "loss": 0.7295, - "step": 45983 - }, - { - "epoch": 1.18, - "learning_rate": 1.3853405174008914e-06, - "loss": 0.6299, - "step": 45984 - }, - { - "epoch": 1.18, - "learning_rate": 1.3853149836654993e-06, - "loss": 0.6714, - "step": 45985 - }, - { - "epoch": 1.18, - "learning_rate": 1.385289449635089e-06, - "loss": 0.3748, - "step": 45986 - }, - { - "epoch": 1.18, - "learning_rate": 1.3852639153096805e-06, - "loss": 0.7773, - "step": 45987 - }, - { - "epoch": 1.18, - "learning_rate": 1.3852383806892932e-06, - "loss": 0.7715, - "step": 45988 - }, - { - "epoch": 1.18, - "learning_rate": 1.3852128457739463e-06, - "loss": 0.5566, - "step": 45989 - }, - { - "epoch": 1.18, - "learning_rate": 1.3851873105636598e-06, - "loss": 0.7041, - "step": 45990 - }, - { - "epoch": 1.18, - "learning_rate": 1.3851617750584531e-06, - "loss": 0.6016, - "step": 45991 - }, - { - "epoch": 1.18, - "learning_rate": 1.3851362392583456e-06, - "loss": 0.6318, - "step": 45992 - }, - { - "epoch": 1.18, - "learning_rate": 1.3851107031633571e-06, - "loss": 0.45, - "step": 45993 - }, - { - "epoch": 1.18, - "learning_rate": 1.3850851667735072e-06, - "loss": 0.6797, - "step": 45994 - }, - { - "epoch": 1.18, - "learning_rate": 1.385059630088815e-06, - "loss": 0.7256, - "step": 45995 - }, - { - "epoch": 1.18, - "learning_rate": 1.3850340931093005e-06, - "loss": 0.5879, - "step": 45996 - }, - { - "epoch": 1.18, - "learning_rate": 1.385008555834983e-06, - "loss": 0.7422, - "step": 45997 - }, - { - "epoch": 1.18, - "learning_rate": 1.384983018265882e-06, - "loss": 0.7666, - "step": 45998 - }, - { - "epoch": 1.18, - "learning_rate": 1.3849574804020177e-06, - "loss": 0.4695, - "step": 45999 - }, - { - "epoch": 1.18, - "learning_rate": 1.3849319422434088e-06, - "loss": 0.6826, - "step": 46000 - }, - { - "epoch": 1.18, - "learning_rate": 1.3849064037900754e-06, - "loss": 0.6602, - "step": 46001 - }, - { - "epoch": 1.18, - "learning_rate": 1.3848808650420368e-06, - "loss": 0.8262, - "step": 46002 - }, - { - "epoch": 1.18, - "learning_rate": 1.3848553259993122e-06, - "loss": 0.5532, - "step": 46003 - }, - { - "epoch": 1.18, - "learning_rate": 1.384829786661922e-06, - "loss": 0.6797, - "step": 46004 - }, - { - "epoch": 1.18, - "learning_rate": 1.3848042470298853e-06, - "loss": 0.6797, - "step": 46005 - }, - { - "epoch": 1.18, - "learning_rate": 1.384778707103222e-06, - "loss": 0.6602, - "step": 46006 - }, - { - "epoch": 1.18, - "learning_rate": 1.3847531668819508e-06, - "loss": 0.748, - "step": 46007 - }, - { - "epoch": 1.18, - "learning_rate": 1.384727626366092e-06, - "loss": 0.6499, - "step": 46008 - }, - { - "epoch": 1.18, - "learning_rate": 1.3847020855556647e-06, - "loss": 0.563, - "step": 46009 - }, - { - "epoch": 1.18, - "learning_rate": 1.3846765444506892e-06, - "loss": 0.4871, - "step": 46010 - }, - { - "epoch": 1.18, - "learning_rate": 1.3846510030511842e-06, - "loss": 0.625, - "step": 46011 - }, - { - "epoch": 1.18, - "learning_rate": 1.38462546135717e-06, - "loss": 0.5859, - "step": 46012 - }, - { - "epoch": 1.18, - "learning_rate": 1.3845999193686652e-06, - "loss": 0.752, - "step": 46013 - }, - { - "epoch": 1.18, - "learning_rate": 1.3845743770856903e-06, - "loss": 0.5894, - "step": 46014 - }, - { - "epoch": 1.18, - "learning_rate": 1.3845488345082642e-06, - "loss": 0.6846, - "step": 46015 - }, - { - "epoch": 1.18, - "learning_rate": 1.3845232916364071e-06, - "loss": 0.6929, - "step": 46016 - }, - { - "epoch": 1.18, - "learning_rate": 1.384497748470138e-06, - "loss": 0.6221, - "step": 46017 - }, - { - "epoch": 1.18, - "learning_rate": 1.3844722050094765e-06, - "loss": 0.6787, - "step": 46018 - }, - { - "epoch": 1.18, - "learning_rate": 1.3844466612544426e-06, - "loss": 0.3318, - "step": 46019 - }, - { - "epoch": 1.18, - "learning_rate": 1.3844211172050555e-06, - "loss": 0.7002, - "step": 46020 - }, - { - "epoch": 1.18, - "learning_rate": 1.3843955728613347e-06, - "loss": 0.6953, - "step": 46021 - }, - { - "epoch": 1.18, - "learning_rate": 1.3843700282232999e-06, - "loss": 0.6895, - "step": 46022 - }, - { - "epoch": 1.18, - "learning_rate": 1.3843444832909708e-06, - "loss": 0.6797, - "step": 46023 - }, - { - "epoch": 1.18, - "learning_rate": 1.3843189380643666e-06, - "loss": 0.6992, - "step": 46024 - }, - { - "epoch": 1.18, - "learning_rate": 1.3842933925435071e-06, - "loss": 0.7603, - "step": 46025 - }, - { - "epoch": 1.18, - "learning_rate": 1.3842678467284122e-06, - "loss": 0.7144, - "step": 46026 - }, - { - "epoch": 1.18, - "learning_rate": 1.3842423006191006e-06, - "loss": 0.46, - "step": 46027 - }, - { - "epoch": 1.18, - "learning_rate": 1.3842167542155926e-06, - "loss": 0.4443, - "step": 46028 - }, - { - "epoch": 1.18, - "learning_rate": 1.3841912075179073e-06, - "loss": 0.541, - "step": 46029 - }, - { - "epoch": 1.18, - "learning_rate": 1.3841656605260644e-06, - "loss": 0.6582, - "step": 46030 - }, - { - "epoch": 1.18, - "learning_rate": 1.384140113240084e-06, - "loss": 0.6064, - "step": 46031 - }, - { - "epoch": 1.18, - "learning_rate": 1.3841145656599848e-06, - "loss": 0.6514, - "step": 46032 - }, - { - "epoch": 1.18, - "learning_rate": 1.3840890177857868e-06, - "loss": 0.6016, - "step": 46033 - }, - { - "epoch": 1.18, - "learning_rate": 1.3840634696175092e-06, - "loss": 0.7529, - "step": 46034 - }, - { - "epoch": 1.18, - "learning_rate": 1.3840379211551722e-06, - "loss": 0.5181, - "step": 46035 - }, - { - "epoch": 1.18, - "learning_rate": 1.3840123723987952e-06, - "loss": 0.5381, - "step": 46036 - }, - { - "epoch": 1.18, - "learning_rate": 1.3839868233483975e-06, - "loss": 0.566, - "step": 46037 - }, - { - "epoch": 1.18, - "learning_rate": 1.3839612740039983e-06, - "loss": 0.7134, - "step": 46038 - }, - { - "epoch": 1.18, - "learning_rate": 1.3839357243656182e-06, - "loss": 0.4961, - "step": 46039 - }, - { - "epoch": 1.18, - "learning_rate": 1.3839101744332758e-06, - "loss": 0.5344, - "step": 46040 - }, - { - "epoch": 1.18, - "learning_rate": 1.383884624206991e-06, - "loss": 0.7656, - "step": 46041 - }, - { - "epoch": 1.18, - "learning_rate": 1.3838590736867837e-06, - "loss": 0.7559, - "step": 46042 - }, - { - "epoch": 1.18, - "learning_rate": 1.3838335228726729e-06, - "loss": 0.6748, - "step": 46043 - }, - { - "epoch": 1.18, - "learning_rate": 1.3838079717646785e-06, - "loss": 0.6621, - "step": 46044 - }, - { - "epoch": 1.18, - "learning_rate": 1.38378242036282e-06, - "loss": 0.7261, - "step": 46045 - }, - { - "epoch": 1.18, - "learning_rate": 1.3837568686671168e-06, - "loss": 0.5962, - "step": 46046 - }, - { - "epoch": 1.18, - "learning_rate": 1.3837313166775887e-06, - "loss": 0.6523, - "step": 46047 - }, - { - "epoch": 1.18, - "learning_rate": 1.3837057643942554e-06, - "loss": 0.5171, - "step": 46048 - }, - { - "epoch": 1.18, - "learning_rate": 1.3836802118171357e-06, - "loss": 0.5742, - "step": 46049 - }, - { - "epoch": 1.18, - "learning_rate": 1.3836546589462504e-06, - "loss": 0.5635, - "step": 46050 - }, - { - "epoch": 1.18, - "learning_rate": 1.383629105781618e-06, - "loss": 0.7354, - "step": 46051 - }, - { - "epoch": 1.18, - "learning_rate": 1.3836035523232586e-06, - "loss": 0.7393, - "step": 46052 - }, - { - "epoch": 1.18, - "learning_rate": 1.3835779985711914e-06, - "loss": 0.5771, - "step": 46053 - }, - { - "epoch": 1.18, - "learning_rate": 1.383552444525436e-06, - "loss": 0.7158, - "step": 46054 - }, - { - "epoch": 1.18, - "learning_rate": 1.3835268901860121e-06, - "loss": 0.5796, - "step": 46055 - }, - { - "epoch": 1.18, - "learning_rate": 1.38350133555294e-06, - "loss": 0.8086, - "step": 46056 - }, - { - "epoch": 1.18, - "learning_rate": 1.3834757806262381e-06, - "loss": 0.5513, - "step": 46057 - }, - { - "epoch": 1.18, - "learning_rate": 1.3834502254059263e-06, - "loss": 0.832, - "step": 46058 - }, - { - "epoch": 1.18, - "learning_rate": 1.3834246698920241e-06, - "loss": 0.5542, - "step": 46059 - }, - { - "epoch": 1.18, - "learning_rate": 1.3833991140845518e-06, - "loss": 0.5254, - "step": 46060 - }, - { - "epoch": 1.18, - "learning_rate": 1.3833735579835284e-06, - "loss": 0.6699, - "step": 46061 - }, - { - "epoch": 1.18, - "learning_rate": 1.3833480015889733e-06, - "loss": 0.6035, - "step": 46062 - }, - { - "epoch": 1.18, - "learning_rate": 1.3833224449009062e-06, - "loss": 0.5776, - "step": 46063 - }, - { - "epoch": 1.18, - "learning_rate": 1.3832968879193469e-06, - "loss": 0.5693, - "step": 46064 - }, - { - "epoch": 1.18, - "learning_rate": 1.3832713306443144e-06, - "loss": 0.5378, - "step": 46065 - }, - { - "epoch": 1.18, - "learning_rate": 1.3832457730758292e-06, - "loss": 0.7881, - "step": 46066 - }, - { - "epoch": 1.18, - "learning_rate": 1.38322021521391e-06, - "loss": 0.666, - "step": 46067 - }, - { - "epoch": 1.18, - "learning_rate": 1.383194657058577e-06, - "loss": 0.8047, - "step": 46068 - }, - { - "epoch": 1.18, - "learning_rate": 1.3831690986098492e-06, - "loss": 0.7412, - "step": 46069 - }, - { - "epoch": 1.18, - "learning_rate": 1.3831435398677463e-06, - "loss": 0.6523, - "step": 46070 - }, - { - "epoch": 1.18, - "learning_rate": 1.3831179808322886e-06, - "loss": 0.7568, - "step": 46071 - }, - { - "epoch": 1.18, - "learning_rate": 1.3830924215034945e-06, - "loss": 0.8223, - "step": 46072 - }, - { - "epoch": 1.18, - "learning_rate": 1.3830668618813843e-06, - "loss": 0.6797, - "step": 46073 - }, - { - "epoch": 1.18, - "learning_rate": 1.3830413019659775e-06, - "loss": 0.6514, - "step": 46074 - }, - { - "epoch": 1.18, - "learning_rate": 1.3830157417572934e-06, - "loss": 0.5938, - "step": 46075 - }, - { - "epoch": 1.18, - "learning_rate": 1.3829901812553518e-06, - "loss": 0.3806, - "step": 46076 - }, - { - "epoch": 1.18, - "learning_rate": 1.3829646204601726e-06, - "loss": 0.6475, - "step": 46077 - }, - { - "epoch": 1.18, - "learning_rate": 1.3829390593717747e-06, - "loss": 0.4324, - "step": 46078 - }, - { - "epoch": 1.18, - "learning_rate": 1.382913497990178e-06, - "loss": 0.5596, - "step": 46079 - }, - { - "epoch": 1.18, - "learning_rate": 1.382887936315402e-06, - "loss": 0.6494, - "step": 46080 - }, - { - "epoch": 1.18, - "learning_rate": 1.3828623743474665e-06, - "loss": 0.7422, - "step": 46081 - }, - { - "epoch": 1.18, - "learning_rate": 1.3828368120863906e-06, - "loss": 0.7549, - "step": 46082 - }, - { - "epoch": 1.18, - "learning_rate": 1.3828112495321944e-06, - "loss": 0.769, - "step": 46083 - }, - { - "epoch": 1.18, - "learning_rate": 1.382785686684897e-06, - "loss": 0.6084, - "step": 46084 - }, - { - "epoch": 1.18, - "learning_rate": 1.3827601235445183e-06, - "loss": 0.7031, - "step": 46085 - }, - { - "epoch": 1.18, - "learning_rate": 1.3827345601110781e-06, - "loss": 0.7598, - "step": 46086 - }, - { - "epoch": 1.18, - "learning_rate": 1.382708996384595e-06, - "loss": 0.6953, - "step": 46087 - }, - { - "epoch": 1.18, - "learning_rate": 1.3826834323650898e-06, - "loss": 0.6621, - "step": 46088 - }, - { - "epoch": 1.18, - "learning_rate": 1.3826578680525812e-06, - "loss": 0.5112, - "step": 46089 - }, - { - "epoch": 1.18, - "learning_rate": 1.382632303447089e-06, - "loss": 0.8457, - "step": 46090 - }, - { - "epoch": 1.18, - "learning_rate": 1.3826067385486332e-06, - "loss": 0.7251, - "step": 46091 - }, - { - "epoch": 1.18, - "learning_rate": 1.3825811733572329e-06, - "loss": 0.6045, - "step": 46092 - }, - { - "epoch": 1.18, - "learning_rate": 1.3825556078729074e-06, - "loss": 0.6602, - "step": 46093 - }, - { - "epoch": 1.18, - "learning_rate": 1.3825300420956768e-06, - "loss": 0.792, - "step": 46094 - }, - { - "epoch": 1.18, - "learning_rate": 1.3825044760255607e-06, - "loss": 0.7168, - "step": 46095 - }, - { - "epoch": 1.18, - "learning_rate": 1.3824789096625788e-06, - "loss": 0.6646, - "step": 46096 - }, - { - "epoch": 1.18, - "learning_rate": 1.38245334300675e-06, - "loss": 0.5419, - "step": 46097 - }, - { - "epoch": 1.18, - "learning_rate": 1.3824277760580942e-06, - "loss": 0.6763, - "step": 46098 - }, - { - "epoch": 1.18, - "learning_rate": 1.3824022088166309e-06, - "loss": 0.5781, - "step": 46099 - }, - { - "epoch": 1.18, - "learning_rate": 1.3823766412823802e-06, - "loss": 0.4438, - "step": 46100 - }, - { - "epoch": 1.18, - "learning_rate": 1.3823510734553615e-06, - "loss": 0.5898, - "step": 46101 - }, - { - "epoch": 1.18, - "learning_rate": 1.3823255053355938e-06, - "loss": 0.5049, - "step": 46102 - }, - { - "epoch": 1.18, - "learning_rate": 1.3822999369230968e-06, - "loss": 0.6494, - "step": 46103 - }, - { - "epoch": 1.18, - "learning_rate": 1.3822743682178906e-06, - "loss": 0.5463, - "step": 46104 - }, - { - "epoch": 1.18, - "learning_rate": 1.3822487992199943e-06, - "loss": 0.583, - "step": 46105 - }, - { - "epoch": 1.18, - "learning_rate": 1.382223229929428e-06, - "loss": 0.6885, - "step": 46106 - }, - { - "epoch": 1.18, - "learning_rate": 1.3821976603462108e-06, - "loss": 0.7207, - "step": 46107 - }, - { - "epoch": 1.18, - "learning_rate": 1.3821720904703623e-06, - "loss": 0.667, - "step": 46108 - }, - { - "epoch": 1.18, - "learning_rate": 1.3821465203019025e-06, - "loss": 0.6147, - "step": 46109 - }, - { - "epoch": 1.18, - "learning_rate": 1.3821209498408504e-06, - "loss": 0.6255, - "step": 46110 - }, - { - "epoch": 1.18, - "learning_rate": 1.3820953790872261e-06, - "loss": 0.5923, - "step": 46111 - }, - { - "epoch": 1.18, - "learning_rate": 1.3820698080410487e-06, - "loss": 0.4932, - "step": 46112 - }, - { - "epoch": 1.18, - "learning_rate": 1.3820442367023381e-06, - "loss": 0.6426, - "step": 46113 - }, - { - "epoch": 1.18, - "learning_rate": 1.3820186650711136e-06, - "loss": 0.646, - "step": 46114 - }, - { - "epoch": 1.18, - "learning_rate": 1.3819930931473953e-06, - "loss": 0.5297, - "step": 46115 - }, - { - "epoch": 1.18, - "learning_rate": 1.3819675209312026e-06, - "loss": 0.7041, - "step": 46116 - }, - { - "epoch": 1.18, - "learning_rate": 1.3819419484225544e-06, - "loss": 0.6709, - "step": 46117 - }, - { - "epoch": 1.18, - "learning_rate": 1.381916375621471e-06, - "loss": 0.665, - "step": 46118 - }, - { - "epoch": 1.18, - "learning_rate": 1.381890802527972e-06, - "loss": 0.4744, - "step": 46119 - }, - { - "epoch": 1.18, - "learning_rate": 1.3818652291420767e-06, - "loss": 0.6279, - "step": 46120 - }, - { - "epoch": 1.18, - "learning_rate": 1.3818396554638048e-06, - "loss": 0.7002, - "step": 46121 - }, - { - "epoch": 1.18, - "learning_rate": 1.3818140814931756e-06, - "loss": 0.5981, - "step": 46122 - }, - { - "epoch": 1.18, - "learning_rate": 1.3817885072302091e-06, - "loss": 0.666, - "step": 46123 - }, - { - "epoch": 1.18, - "learning_rate": 1.3817629326749246e-06, - "loss": 0.7021, - "step": 46124 - }, - { - "epoch": 1.18, - "learning_rate": 1.381737357827342e-06, - "loss": 0.5532, - "step": 46125 - }, - { - "epoch": 1.18, - "learning_rate": 1.3817117826874803e-06, - "loss": 0.7119, - "step": 46126 - }, - { - "epoch": 1.18, - "learning_rate": 1.3816862072553598e-06, - "loss": 0.6831, - "step": 46127 - }, - { - "epoch": 1.18, - "learning_rate": 1.3816606315309993e-06, - "loss": 0.4307, - "step": 46128 - }, - { - "epoch": 1.18, - "learning_rate": 1.3816350555144192e-06, - "loss": 0.3828, - "step": 46129 - }, - { - "epoch": 1.18, - "learning_rate": 1.3816094792056382e-06, - "loss": 0.4521, - "step": 46130 - }, - { - "epoch": 1.18, - "learning_rate": 1.381583902604677e-06, - "loss": 0.6528, - "step": 46131 - }, - { - "epoch": 1.18, - "learning_rate": 1.3815583257115542e-06, - "loss": 0.8389, - "step": 46132 - }, - { - "epoch": 1.18, - "learning_rate": 1.3815327485262898e-06, - "loss": 0.7021, - "step": 46133 - }, - { - "epoch": 1.18, - "learning_rate": 1.3815071710489033e-06, - "loss": 0.6245, - "step": 46134 - }, - { - "epoch": 1.18, - "learning_rate": 1.3814815932794144e-06, - "loss": 0.7192, - "step": 46135 - }, - { - "epoch": 1.18, - "learning_rate": 1.3814560152178425e-06, - "loss": 0.6797, - "step": 46136 - }, - { - "epoch": 1.18, - "learning_rate": 1.3814304368642069e-06, - "loss": 0.6084, - "step": 46137 - }, - { - "epoch": 1.18, - "learning_rate": 1.381404858218528e-06, - "loss": 0.8994, - "step": 46138 - }, - { - "epoch": 1.18, - "learning_rate": 1.3813792792808248e-06, - "loss": 0.7773, - "step": 46139 - }, - { - "epoch": 1.18, - "learning_rate": 1.3813537000511172e-06, - "loss": 0.4563, - "step": 46140 - }, - { - "epoch": 1.18, - "learning_rate": 1.3813281205294246e-06, - "loss": 0.6416, - "step": 46141 - }, - { - "epoch": 1.18, - "learning_rate": 1.3813025407157663e-06, - "loss": 0.5757, - "step": 46142 - }, - { - "epoch": 1.18, - "learning_rate": 1.3812769606101622e-06, - "loss": 0.8057, - "step": 46143 - }, - { - "epoch": 1.18, - "learning_rate": 1.3812513802126322e-06, - "loss": 0.7344, - "step": 46144 - }, - { - "epoch": 1.18, - "learning_rate": 1.3812257995231952e-06, - "loss": 0.6924, - "step": 46145 - }, - { - "epoch": 1.18, - "learning_rate": 1.3812002185418715e-06, - "loss": 0.6953, - "step": 46146 - }, - { - "epoch": 1.18, - "learning_rate": 1.3811746372686801e-06, - "loss": 0.3853, - "step": 46147 - }, - { - "epoch": 1.18, - "learning_rate": 1.3811490557036406e-06, - "loss": 0.5433, - "step": 46148 - }, - { - "epoch": 1.18, - "learning_rate": 1.381123473846773e-06, - "loss": 0.6855, - "step": 46149 - }, - { - "epoch": 1.18, - "learning_rate": 1.3810978916980969e-06, - "loss": 0.5131, - "step": 46150 - }, - { - "epoch": 1.18, - "learning_rate": 1.3810723092576315e-06, - "loss": 0.5811, - "step": 46151 - }, - { - "epoch": 1.18, - "learning_rate": 1.3810467265253964e-06, - "loss": 0.6719, - "step": 46152 - }, - { - "epoch": 1.18, - "learning_rate": 1.3810211435014115e-06, - "loss": 0.6396, - "step": 46153 - }, - { - "epoch": 1.18, - "learning_rate": 1.3809955601856963e-06, - "loss": 0.686, - "step": 46154 - }, - { - "epoch": 1.18, - "learning_rate": 1.38096997657827e-06, - "loss": 0.6733, - "step": 46155 - }, - { - "epoch": 1.18, - "learning_rate": 1.3809443926791526e-06, - "loss": 0.7852, - "step": 46156 - }, - { - "epoch": 1.18, - "learning_rate": 1.3809188084883639e-06, - "loss": 0.7671, - "step": 46157 - }, - { - "epoch": 1.18, - "learning_rate": 1.3808932240059228e-06, - "loss": 0.5449, - "step": 46158 - }, - { - "epoch": 1.18, - "learning_rate": 1.3808676392318494e-06, - "loss": 0.4705, - "step": 46159 - }, - { - "epoch": 1.18, - "learning_rate": 1.3808420541661631e-06, - "loss": 0.7256, - "step": 46160 - }, - { - "epoch": 1.18, - "learning_rate": 1.380816468808884e-06, - "loss": 0.6177, - "step": 46161 - }, - { - "epoch": 1.18, - "learning_rate": 1.3807908831600308e-06, - "loss": 0.6042, - "step": 46162 - }, - { - "epoch": 1.18, - "learning_rate": 1.3807652972196238e-06, - "loss": 0.5913, - "step": 46163 - }, - { - "epoch": 1.18, - "learning_rate": 1.380739710987682e-06, - "loss": 0.6636, - "step": 46164 - }, - { - "epoch": 1.18, - "learning_rate": 1.3807141244642255e-06, - "loss": 0.7358, - "step": 46165 - }, - { - "epoch": 1.18, - "learning_rate": 1.3806885376492736e-06, - "loss": 0.6484, - "step": 46166 - }, - { - "epoch": 1.18, - "learning_rate": 1.3806629505428463e-06, - "loss": 0.6279, - "step": 46167 - }, - { - "epoch": 1.18, - "learning_rate": 1.3806373631449626e-06, - "loss": 0.6118, - "step": 46168 - }, - { - "epoch": 1.18, - "learning_rate": 1.3806117754556423e-06, - "loss": 0.748, - "step": 46169 - }, - { - "epoch": 1.18, - "learning_rate": 1.3805861874749053e-06, - "loss": 0.6318, - "step": 46170 - }, - { - "epoch": 1.18, - "learning_rate": 1.3805605992027709e-06, - "loss": 0.6943, - "step": 46171 - }, - { - "epoch": 1.18, - "learning_rate": 1.3805350106392586e-06, - "loss": 0.6851, - "step": 46172 - }, - { - "epoch": 1.18, - "learning_rate": 1.3805094217843882e-06, - "loss": 0.6216, - "step": 46173 - }, - { - "epoch": 1.18, - "learning_rate": 1.3804838326381791e-06, - "loss": 0.6318, - "step": 46174 - }, - { - "epoch": 1.18, - "learning_rate": 1.3804582432006513e-06, - "loss": 0.585, - "step": 46175 - }, - { - "epoch": 1.18, - "learning_rate": 1.380432653471824e-06, - "loss": 0.6108, - "step": 46176 - }, - { - "epoch": 1.18, - "learning_rate": 1.3804070634517168e-06, - "loss": 0.7344, - "step": 46177 - }, - { - "epoch": 1.18, - "learning_rate": 1.3803814731403495e-06, - "loss": 0.5537, - "step": 46178 - }, - { - "epoch": 1.18, - "learning_rate": 1.3803558825377416e-06, - "loss": 0.5952, - "step": 46179 - }, - { - "epoch": 1.18, - "learning_rate": 1.3803302916439128e-06, - "loss": 0.6484, - "step": 46180 - }, - { - "epoch": 1.18, - "learning_rate": 1.3803047004588827e-06, - "loss": 0.7231, - "step": 46181 - }, - { - "epoch": 1.18, - "learning_rate": 1.3802791089826704e-06, - "loss": 0.7549, - "step": 46182 - }, - { - "epoch": 1.18, - "learning_rate": 1.380253517215296e-06, - "loss": 0.6416, - "step": 46183 - }, - { - "epoch": 1.18, - "learning_rate": 1.380227925156779e-06, - "loss": 0.4795, - "step": 46184 - }, - { - "epoch": 1.18, - "learning_rate": 1.3802023328071389e-06, - "loss": 0.6587, - "step": 46185 - }, - { - "epoch": 1.18, - "learning_rate": 1.3801767401663956e-06, - "loss": 0.6021, - "step": 46186 - }, - { - "epoch": 1.18, - "learning_rate": 1.3801511472345683e-06, - "loss": 0.7129, - "step": 46187 - }, - { - "epoch": 1.18, - "learning_rate": 1.3801255540116764e-06, - "loss": 0.6396, - "step": 46188 - }, - { - "epoch": 1.18, - "learning_rate": 1.3800999604977403e-06, - "loss": 0.6709, - "step": 46189 - }, - { - "epoch": 1.18, - "learning_rate": 1.380074366692779e-06, - "loss": 0.4937, - "step": 46190 - }, - { - "epoch": 1.18, - "learning_rate": 1.3800487725968122e-06, - "loss": 0.7441, - "step": 46191 - }, - { - "epoch": 1.18, - "learning_rate": 1.3800231782098598e-06, - "loss": 0.6104, - "step": 46192 - }, - { - "epoch": 1.18, - "learning_rate": 1.3799975835319407e-06, - "loss": 0.7114, - "step": 46193 - }, - { - "epoch": 1.18, - "learning_rate": 1.3799719885630753e-06, - "loss": 0.6311, - "step": 46194 - }, - { - "epoch": 1.18, - "learning_rate": 1.3799463933032822e-06, - "loss": 0.5425, - "step": 46195 - }, - { - "epoch": 1.18, - "learning_rate": 1.3799207977525825e-06, - "loss": 0.6934, - "step": 46196 - }, - { - "epoch": 1.18, - "learning_rate": 1.3798952019109945e-06, - "loss": 0.6875, - "step": 46197 - }, - { - "epoch": 1.18, - "learning_rate": 1.379869605778538e-06, - "loss": 0.593, - "step": 46198 - }, - { - "epoch": 1.18, - "learning_rate": 1.379844009355233e-06, - "loss": 0.5986, - "step": 46199 - }, - { - "epoch": 1.18, - "learning_rate": 1.3798184126410987e-06, - "loss": 0.6099, - "step": 46200 - }, - { - "epoch": 1.18, - "learning_rate": 1.3797928156361552e-06, - "loss": 0.4824, - "step": 46201 - }, - { - "epoch": 1.18, - "learning_rate": 1.3797672183404217e-06, - "loss": 0.7959, - "step": 46202 - }, - { - "epoch": 1.18, - "learning_rate": 1.3797416207539179e-06, - "loss": 0.748, - "step": 46203 - }, - { - "epoch": 1.18, - "learning_rate": 1.3797160228766634e-06, - "loss": 0.7295, - "step": 46204 - }, - { - "epoch": 1.18, - "learning_rate": 1.3796904247086776e-06, - "loss": 0.5879, - "step": 46205 - }, - { - "epoch": 1.18, - "learning_rate": 1.3796648262499808e-06, - "loss": 0.6167, - "step": 46206 - }, - { - "epoch": 1.18, - "learning_rate": 1.3796392275005918e-06, - "loss": 0.6797, - "step": 46207 - }, - { - "epoch": 1.18, - "learning_rate": 1.37961362846053e-06, - "loss": 0.6211, - "step": 46208 - }, - { - "epoch": 1.18, - "learning_rate": 1.3795880291298162e-06, - "loss": 0.7129, - "step": 46209 - }, - { - "epoch": 1.18, - "learning_rate": 1.379562429508469e-06, - "loss": 0.4956, - "step": 46210 - }, - { - "epoch": 1.18, - "learning_rate": 1.379536829596509e-06, - "loss": 0.7686, - "step": 46211 - }, - { - "epoch": 1.18, - "learning_rate": 1.3795112293939542e-06, - "loss": 0.7852, - "step": 46212 - }, - { - "epoch": 1.18, - "learning_rate": 1.3794856289008255e-06, - "loss": 0.5259, - "step": 46213 - }, - { - "epoch": 1.18, - "learning_rate": 1.3794600281171418e-06, - "loss": 0.6953, - "step": 46214 - }, - { - "epoch": 1.18, - "learning_rate": 1.3794344270429235e-06, - "loss": 0.7017, - "step": 46215 - }, - { - "epoch": 1.18, - "learning_rate": 1.3794088256781892e-06, - "loss": 0.6621, - "step": 46216 - }, - { - "epoch": 1.18, - "learning_rate": 1.3793832240229595e-06, - "loss": 0.6934, - "step": 46217 - }, - { - "epoch": 1.18, - "learning_rate": 1.3793576220772529e-06, - "loss": 0.8701, - "step": 46218 - }, - { - "epoch": 1.18, - "learning_rate": 1.37933201984109e-06, - "loss": 0.686, - "step": 46219 - }, - { - "epoch": 1.18, - "learning_rate": 1.37930641731449e-06, - "loss": 0.6577, - "step": 46220 - }, - { - "epoch": 1.18, - "learning_rate": 1.3792808144974725e-06, - "loss": 0.6582, - "step": 46221 - }, - { - "epoch": 1.18, - "learning_rate": 1.3792552113900571e-06, - "loss": 0.6797, - "step": 46222 - }, - { - "epoch": 1.18, - "learning_rate": 1.3792296079922633e-06, - "loss": 0.7402, - "step": 46223 - }, - { - "epoch": 1.18, - "learning_rate": 1.379204004304111e-06, - "loss": 0.5576, - "step": 46224 - }, - { - "epoch": 1.18, - "learning_rate": 1.3791784003256196e-06, - "loss": 0.6328, - "step": 46225 - }, - { - "epoch": 1.18, - "learning_rate": 1.3791527960568087e-06, - "loss": 0.833, - "step": 46226 - }, - { - "epoch": 1.18, - "learning_rate": 1.379127191497698e-06, - "loss": 0.7759, - "step": 46227 - }, - { - "epoch": 1.18, - "learning_rate": 1.379101586648307e-06, - "loss": 0.7017, - "step": 46228 - }, - { - "epoch": 1.18, - "learning_rate": 1.3790759815086552e-06, - "loss": 0.5684, - "step": 46229 - }, - { - "epoch": 1.18, - "learning_rate": 1.3790503760787627e-06, - "loss": 0.5352, - "step": 46230 - }, - { - "epoch": 1.18, - "learning_rate": 1.3790247703586487e-06, - "loss": 0.5864, - "step": 46231 - }, - { - "epoch": 1.18, - "learning_rate": 1.3789991643483325e-06, - "loss": 0.7158, - "step": 46232 - }, - { - "epoch": 1.18, - "learning_rate": 1.3789735580478343e-06, - "loss": 0.5815, - "step": 46233 - }, - { - "epoch": 1.19, - "learning_rate": 1.3789479514571736e-06, - "loss": 0.626, - "step": 46234 - }, - { - "epoch": 1.19, - "learning_rate": 1.3789223445763695e-06, - "loss": 0.7549, - "step": 46235 - }, - { - "epoch": 1.19, - "learning_rate": 1.3788967374054424e-06, - "loss": 0.7686, - "step": 46236 - }, - { - "epoch": 1.19, - "learning_rate": 1.3788711299444113e-06, - "loss": 0.603, - "step": 46237 - }, - { - "epoch": 1.19, - "learning_rate": 1.3788455221932959e-06, - "loss": 0.6265, - "step": 46238 - }, - { - "epoch": 1.19, - "learning_rate": 1.378819914152116e-06, - "loss": 0.6689, - "step": 46239 - }, - { - "epoch": 1.19, - "learning_rate": 1.3787943058208912e-06, - "loss": 0.4475, - "step": 46240 - }, - { - "epoch": 1.19, - "learning_rate": 1.378768697199641e-06, - "loss": 0.6807, - "step": 46241 - }, - { - "epoch": 1.19, - "learning_rate": 1.3787430882883851e-06, - "loss": 0.7783, - "step": 46242 - }, - { - "epoch": 1.19, - "learning_rate": 1.3787174790871428e-06, - "loss": 0.668, - "step": 46243 - }, - { - "epoch": 1.19, - "learning_rate": 1.378691869595934e-06, - "loss": 0.6362, - "step": 46244 - }, - { - "epoch": 1.19, - "learning_rate": 1.3786662598147783e-06, - "loss": 0.687, - "step": 46245 - }, - { - "epoch": 1.19, - "learning_rate": 1.3786406497436951e-06, - "loss": 0.5752, - "step": 46246 - }, - { - "epoch": 1.19, - "learning_rate": 1.3786150393827044e-06, - "loss": 0.6992, - "step": 46247 - }, - { - "epoch": 1.19, - "learning_rate": 1.3785894287318255e-06, - "loss": 0.4724, - "step": 46248 - }, - { - "epoch": 1.19, - "learning_rate": 1.378563817791078e-06, - "loss": 0.6177, - "step": 46249 - }, - { - "epoch": 1.19, - "learning_rate": 1.3785382065604816e-06, - "loss": 0.5898, - "step": 46250 - }, - { - "epoch": 1.19, - "learning_rate": 1.378512595040056e-06, - "loss": 0.8047, - "step": 46251 - }, - { - "epoch": 1.19, - "learning_rate": 1.3784869832298205e-06, - "loss": 0.6655, - "step": 46252 - }, - { - "epoch": 1.19, - "learning_rate": 1.3784613711297953e-06, - "loss": 0.666, - "step": 46253 - }, - { - "epoch": 1.19, - "learning_rate": 1.378435758739999e-06, - "loss": 0.5156, - "step": 46254 - }, - { - "epoch": 1.19, - "learning_rate": 1.3784101460604527e-06, - "loss": 0.7432, - "step": 46255 - }, - { - "epoch": 1.19, - "learning_rate": 1.3783845330911745e-06, - "loss": 0.5151, - "step": 46256 - }, - { - "epoch": 1.19, - "learning_rate": 1.378358919832185e-06, - "loss": 0.6177, - "step": 46257 - }, - { - "epoch": 1.19, - "learning_rate": 1.378333306283503e-06, - "loss": 0.6431, - "step": 46258 - }, - { - "epoch": 1.19, - "learning_rate": 1.378307692445149e-06, - "loss": 0.6523, - "step": 46259 - }, - { - "epoch": 1.19, - "learning_rate": 1.3782820783171423e-06, - "loss": 0.583, - "step": 46260 - }, - { - "epoch": 1.19, - "learning_rate": 1.3782564638995021e-06, - "loss": 0.6079, - "step": 46261 - }, - { - "epoch": 1.19, - "learning_rate": 1.3782308491922485e-06, - "loss": 0.5913, - "step": 46262 - }, - { - "epoch": 1.19, - "learning_rate": 1.3782052341954009e-06, - "loss": 0.6006, - "step": 46263 - }, - { - "epoch": 1.19, - "learning_rate": 1.3781796189089788e-06, - "loss": 0.5684, - "step": 46264 - }, - { - "epoch": 1.19, - "learning_rate": 1.3781540033330022e-06, - "loss": 0.5913, - "step": 46265 - }, - { - "epoch": 1.19, - "learning_rate": 1.3781283874674903e-06, - "loss": 0.7725, - "step": 46266 - }, - { - "epoch": 1.19, - "learning_rate": 1.3781027713124628e-06, - "loss": 0.6865, - "step": 46267 - }, - { - "epoch": 1.19, - "learning_rate": 1.3780771548679395e-06, - "loss": 0.6553, - "step": 46268 - }, - { - "epoch": 1.19, - "learning_rate": 1.3780515381339402e-06, - "loss": 0.479, - "step": 46269 - }, - { - "epoch": 1.19, - "learning_rate": 1.3780259211104839e-06, - "loss": 0.6538, - "step": 46270 - }, - { - "epoch": 1.19, - "learning_rate": 1.3780003037975903e-06, - "loss": 0.7021, - "step": 46271 - }, - { - "epoch": 1.19, - "learning_rate": 1.3779746861952797e-06, - "loss": 0.4985, - "step": 46272 - }, - { - "epoch": 1.19, - "learning_rate": 1.3779490683035708e-06, - "loss": 0.665, - "step": 46273 - }, - { - "epoch": 1.19, - "learning_rate": 1.377923450122484e-06, - "loss": 0.6455, - "step": 46274 - }, - { - "epoch": 1.19, - "learning_rate": 1.3778978316520386e-06, - "loss": 0.6382, - "step": 46275 - }, - { - "epoch": 1.19, - "learning_rate": 1.3778722128922545e-06, - "loss": 0.5172, - "step": 46276 - }, - { - "epoch": 1.19, - "learning_rate": 1.3778465938431505e-06, - "loss": 0.6484, - "step": 46277 - }, - { - "epoch": 1.19, - "learning_rate": 1.377820974504747e-06, - "loss": 0.584, - "step": 46278 - }, - { - "epoch": 1.19, - "learning_rate": 1.377795354877063e-06, - "loss": 0.6033, - "step": 46279 - }, - { - "epoch": 1.19, - "learning_rate": 1.377769734960119e-06, - "loss": 0.5352, - "step": 46280 - }, - { - "epoch": 1.19, - "learning_rate": 1.3777441147539338e-06, - "loss": 0.667, - "step": 46281 - }, - { - "epoch": 1.19, - "learning_rate": 1.377718494258527e-06, - "loss": 0.5796, - "step": 46282 - }, - { - "epoch": 1.19, - "learning_rate": 1.377692873473919e-06, - "loss": 0.5571, - "step": 46283 - }, - { - "epoch": 1.19, - "learning_rate": 1.377667252400129e-06, - "loss": 0.7285, - "step": 46284 - }, - { - "epoch": 1.19, - "learning_rate": 1.3776416310371762e-06, - "loss": 0.5615, - "step": 46285 - }, - { - "epoch": 1.19, - "learning_rate": 1.3776160093850808e-06, - "loss": 0.749, - "step": 46286 - }, - { - "epoch": 1.19, - "learning_rate": 1.377590387443862e-06, - "loss": 0.7324, - "step": 46287 - }, - { - "epoch": 1.19, - "learning_rate": 1.3775647652135397e-06, - "loss": 0.7773, - "step": 46288 - }, - { - "epoch": 1.19, - "learning_rate": 1.3775391426941332e-06, - "loss": 0.5967, - "step": 46289 - }, - { - "epoch": 1.19, - "learning_rate": 1.3775135198856625e-06, - "loss": 0.667, - "step": 46290 - }, - { - "epoch": 1.19, - "learning_rate": 1.377487896788147e-06, - "loss": 0.625, - "step": 46291 - }, - { - "epoch": 1.19, - "learning_rate": 1.3774622734016067e-06, - "loss": 0.6436, - "step": 46292 - }, - { - "epoch": 1.19, - "learning_rate": 1.3774366497260605e-06, - "loss": 0.7148, - "step": 46293 - }, - { - "epoch": 1.19, - "learning_rate": 1.3774110257615286e-06, - "loss": 0.834, - "step": 46294 - }, - { - "epoch": 1.19, - "learning_rate": 1.3773854015080307e-06, - "loss": 0.5376, - "step": 46295 - }, - { - "epoch": 1.19, - "learning_rate": 1.3773597769655855e-06, - "loss": 0.585, - "step": 46296 - }, - { - "epoch": 1.19, - "learning_rate": 1.3773341521342138e-06, - "loss": 0.6597, - "step": 46297 - }, - { - "epoch": 1.19, - "learning_rate": 1.3773085270139344e-06, - "loss": 0.7354, - "step": 46298 - }, - { - "epoch": 1.19, - "learning_rate": 1.3772829016047674e-06, - "loss": 0.3857, - "step": 46299 - }, - { - "epoch": 1.19, - "learning_rate": 1.3772572759067323e-06, - "loss": 0.9062, - "step": 46300 - }, - { - "epoch": 1.19, - "learning_rate": 1.3772316499198484e-06, - "loss": 0.5396, - "step": 46301 - }, - { - "epoch": 1.19, - "learning_rate": 1.3772060236441356e-06, - "loss": 0.4641, - "step": 46302 - }, - { - "epoch": 1.19, - "learning_rate": 1.3771803970796135e-06, - "loss": 0.7031, - "step": 46303 - }, - { - "epoch": 1.19, - "learning_rate": 1.3771547702263018e-06, - "loss": 0.7852, - "step": 46304 - }, - { - "epoch": 1.19, - "learning_rate": 1.3771291430842203e-06, - "loss": 0.4868, - "step": 46305 - }, - { - "epoch": 1.19, - "learning_rate": 1.377103515653388e-06, - "loss": 0.6357, - "step": 46306 - }, - { - "epoch": 1.19, - "learning_rate": 1.3770778879338249e-06, - "loss": 0.6533, - "step": 46307 - }, - { - "epoch": 1.19, - "learning_rate": 1.3770522599255504e-06, - "loss": 0.6621, - "step": 46308 - }, - { - "epoch": 1.19, - "learning_rate": 1.377026631628585e-06, - "loss": 0.5723, - "step": 46309 - }, - { - "epoch": 1.19, - "learning_rate": 1.3770010030429472e-06, - "loss": 0.6641, - "step": 46310 - }, - { - "epoch": 1.19, - "learning_rate": 1.3769753741686567e-06, - "loss": 0.5914, - "step": 46311 - }, - { - "epoch": 1.19, - "learning_rate": 1.3769497450057338e-06, - "loss": 0.5479, - "step": 46312 - }, - { - "epoch": 1.19, - "learning_rate": 1.376924115554198e-06, - "loss": 0.4705, - "step": 46313 - }, - { - "epoch": 1.19, - "learning_rate": 1.3768984858140686e-06, - "loss": 0.71, - "step": 46314 - }, - { - "epoch": 1.19, - "learning_rate": 1.3768728557853653e-06, - "loss": 0.6177, - "step": 46315 - }, - { - "epoch": 1.19, - "learning_rate": 1.376847225468108e-06, - "loss": 0.6709, - "step": 46316 - }, - { - "epoch": 1.19, - "learning_rate": 1.3768215948623158e-06, - "loss": 0.613, - "step": 46317 - }, - { - "epoch": 1.19, - "learning_rate": 1.376795963968009e-06, - "loss": 0.8154, - "step": 46318 - }, - { - "epoch": 1.19, - "learning_rate": 1.3767703327852066e-06, - "loss": 0.666, - "step": 46319 - }, - { - "epoch": 1.19, - "learning_rate": 1.3767447013139286e-06, - "loss": 0.8779, - "step": 46320 - }, - { - "epoch": 1.19, - "learning_rate": 1.3767190695541943e-06, - "loss": 0.6494, - "step": 46321 - }, - { - "epoch": 1.19, - "learning_rate": 1.3766934375060237e-06, - "loss": 0.7793, - "step": 46322 - }, - { - "epoch": 1.19, - "learning_rate": 1.3766678051694363e-06, - "loss": 0.3867, - "step": 46323 - }, - { - "epoch": 1.19, - "learning_rate": 1.3766421725444516e-06, - "loss": 0.6082, - "step": 46324 - }, - { - "epoch": 1.19, - "learning_rate": 1.3766165396310894e-06, - "loss": 0.4414, - "step": 46325 - }, - { - "epoch": 1.19, - "learning_rate": 1.376590906429369e-06, - "loss": 0.7344, - "step": 46326 - }, - { - "epoch": 1.19, - "learning_rate": 1.3765652729393105e-06, - "loss": 0.5479, - "step": 46327 - }, - { - "epoch": 1.19, - "learning_rate": 1.3765396391609333e-06, - "loss": 0.6938, - "step": 46328 - }, - { - "epoch": 1.19, - "learning_rate": 1.3765140050942567e-06, - "loss": 0.7188, - "step": 46329 - }, - { - "epoch": 1.19, - "learning_rate": 1.376488370739301e-06, - "loss": 0.499, - "step": 46330 - }, - { - "epoch": 1.19, - "learning_rate": 1.3764627360960853e-06, - "loss": 0.5615, - "step": 46331 - }, - { - "epoch": 1.19, - "learning_rate": 1.3764371011646294e-06, - "loss": 0.6074, - "step": 46332 - }, - { - "epoch": 1.19, - "learning_rate": 1.3764114659449528e-06, - "loss": 0.5171, - "step": 46333 - }, - { - "epoch": 1.19, - "learning_rate": 1.3763858304370755e-06, - "loss": 0.4863, - "step": 46334 - }, - { - "epoch": 1.19, - "learning_rate": 1.3763601946410168e-06, - "loss": 0.708, - "step": 46335 - }, - { - "epoch": 1.19, - "learning_rate": 1.3763345585567963e-06, - "loss": 0.5132, - "step": 46336 - }, - { - "epoch": 1.19, - "learning_rate": 1.3763089221844338e-06, - "loss": 0.6309, - "step": 46337 - }, - { - "epoch": 1.19, - "learning_rate": 1.3762832855239486e-06, - "loss": 0.564, - "step": 46338 - }, - { - "epoch": 1.19, - "learning_rate": 1.376257648575361e-06, - "loss": 0.6611, - "step": 46339 - }, - { - "epoch": 1.19, - "learning_rate": 1.37623201133869e-06, - "loss": 0.464, - "step": 46340 - }, - { - "epoch": 1.19, - "learning_rate": 1.3762063738139554e-06, - "loss": 0.6709, - "step": 46341 - }, - { - "epoch": 1.19, - "learning_rate": 1.376180736001177e-06, - "loss": 0.5986, - "step": 46342 - }, - { - "epoch": 1.19, - "learning_rate": 1.3761550979003743e-06, - "loss": 0.7373, - "step": 46343 - }, - { - "epoch": 1.19, - "learning_rate": 1.376129459511567e-06, - "loss": 0.7666, - "step": 46344 - }, - { - "epoch": 1.19, - "learning_rate": 1.3761038208347748e-06, - "loss": 0.7964, - "step": 46345 - }, - { - "epoch": 1.19, - "learning_rate": 1.376078181870017e-06, - "loss": 0.665, - "step": 46346 - }, - { - "epoch": 1.19, - "learning_rate": 1.3760525426173132e-06, - "loss": 0.7969, - "step": 46347 - }, - { - "epoch": 1.19, - "learning_rate": 1.3760269030766835e-06, - "loss": 0.7539, - "step": 46348 - }, - { - "epoch": 1.19, - "learning_rate": 1.3760012632481473e-06, - "loss": 0.6567, - "step": 46349 - }, - { - "epoch": 1.19, - "learning_rate": 1.3759756231317242e-06, - "loss": 0.6602, - "step": 46350 - }, - { - "epoch": 1.19, - "learning_rate": 1.3759499827274339e-06, - "loss": 0.7217, - "step": 46351 - }, - { - "epoch": 1.19, - "learning_rate": 1.3759243420352959e-06, - "loss": 0.6357, - "step": 46352 - }, - { - "epoch": 1.19, - "learning_rate": 1.37589870105533e-06, - "loss": 0.7148, - "step": 46353 - }, - { - "epoch": 1.19, - "learning_rate": 1.3758730597875556e-06, - "loss": 0.3622, - "step": 46354 - }, - { - "epoch": 1.19, - "learning_rate": 1.3758474182319927e-06, - "loss": 0.8242, - "step": 46355 - }, - { - "epoch": 1.19, - "learning_rate": 1.3758217763886607e-06, - "loss": 0.5908, - "step": 46356 - }, - { - "epoch": 1.19, - "learning_rate": 1.3757961342575789e-06, - "loss": 0.5151, - "step": 46357 - }, - { - "epoch": 1.19, - "learning_rate": 1.3757704918387676e-06, - "loss": 0.5889, - "step": 46358 - }, - { - "epoch": 1.19, - "learning_rate": 1.3757448491322462e-06, - "loss": 0.7725, - "step": 46359 - }, - { - "epoch": 1.19, - "learning_rate": 1.375719206138034e-06, - "loss": 0.5466, - "step": 46360 - }, - { - "epoch": 1.19, - "learning_rate": 1.3756935628561508e-06, - "loss": 0.8428, - "step": 46361 - }, - { - "epoch": 1.19, - "learning_rate": 1.3756679192866165e-06, - "loss": 0.8096, - "step": 46362 - }, - { - "epoch": 1.19, - "learning_rate": 1.3756422754294503e-06, - "loss": 0.6909, - "step": 46363 - }, - { - "epoch": 1.19, - "learning_rate": 1.3756166312846724e-06, - "loss": 0.6143, - "step": 46364 - }, - { - "epoch": 1.19, - "learning_rate": 1.375590986852302e-06, - "loss": 0.667, - "step": 46365 - }, - { - "epoch": 1.19, - "learning_rate": 1.3755653421323591e-06, - "loss": 0.6484, - "step": 46366 - }, - { - "epoch": 1.19, - "learning_rate": 1.3755396971248627e-06, - "loss": 0.7412, - "step": 46367 - }, - { - "epoch": 1.19, - "learning_rate": 1.3755140518298331e-06, - "loss": 0.4711, - "step": 46368 - }, - { - "epoch": 1.19, - "learning_rate": 1.3754884062472894e-06, - "loss": 0.6543, - "step": 46369 - }, - { - "epoch": 1.19, - "learning_rate": 1.375462760377252e-06, - "loss": 0.6279, - "step": 46370 - }, - { - "epoch": 1.19, - "learning_rate": 1.3754371142197394e-06, - "loss": 0.7305, - "step": 46371 - }, - { - "epoch": 1.19, - "learning_rate": 1.3754114677747721e-06, - "loss": 0.5688, - "step": 46372 - }, - { - "epoch": 1.19, - "learning_rate": 1.3753858210423693e-06, - "loss": 0.6875, - "step": 46373 - }, - { - "epoch": 1.19, - "learning_rate": 1.3753601740225514e-06, - "loss": 0.6836, - "step": 46374 - }, - { - "epoch": 1.19, - "learning_rate": 1.3753345267153372e-06, - "loss": 0.6699, - "step": 46375 - }, - { - "epoch": 1.19, - "learning_rate": 1.3753088791207466e-06, - "loss": 0.6748, - "step": 46376 - }, - { - "epoch": 1.19, - "learning_rate": 1.375283231238799e-06, - "loss": 0.7227, - "step": 46377 - }, - { - "epoch": 1.19, - "learning_rate": 1.3752575830695145e-06, - "loss": 0.667, - "step": 46378 - }, - { - "epoch": 1.19, - "learning_rate": 1.3752319346129124e-06, - "loss": 0.6716, - "step": 46379 - }, - { - "epoch": 1.19, - "learning_rate": 1.3752062858690126e-06, - "loss": 0.6538, - "step": 46380 - }, - { - "epoch": 1.19, - "learning_rate": 1.3751806368378346e-06, - "loss": 0.5703, - "step": 46381 - }, - { - "epoch": 1.19, - "learning_rate": 1.375154987519398e-06, - "loss": 0.6641, - "step": 46382 - }, - { - "epoch": 1.19, - "learning_rate": 1.3751293379137226e-06, - "loss": 0.8145, - "step": 46383 - }, - { - "epoch": 1.19, - "learning_rate": 1.3751036880208275e-06, - "loss": 0.7168, - "step": 46384 - }, - { - "epoch": 1.19, - "learning_rate": 1.3750780378407334e-06, - "loss": 0.584, - "step": 46385 - }, - { - "epoch": 1.19, - "learning_rate": 1.3750523873734587e-06, - "loss": 0.5604, - "step": 46386 - }, - { - "epoch": 1.19, - "learning_rate": 1.375026736619024e-06, - "loss": 0.7227, - "step": 46387 - }, - { - "epoch": 1.19, - "learning_rate": 1.3750010855774484e-06, - "loss": 0.5801, - "step": 46388 - }, - { - "epoch": 1.19, - "learning_rate": 1.3749754342487516e-06, - "loss": 0.7168, - "step": 46389 - }, - { - "epoch": 1.19, - "learning_rate": 1.3749497826329538e-06, - "loss": 0.7129, - "step": 46390 - }, - { - "epoch": 1.19, - "learning_rate": 1.3749241307300738e-06, - "loss": 0.5906, - "step": 46391 - }, - { - "epoch": 1.19, - "learning_rate": 1.3748984785401317e-06, - "loss": 0.4727, - "step": 46392 - }, - { - "epoch": 1.19, - "learning_rate": 1.374872826063147e-06, - "loss": 0.749, - "step": 46393 - }, - { - "epoch": 1.19, - "learning_rate": 1.3748471732991393e-06, - "loss": 0.5818, - "step": 46394 - }, - { - "epoch": 1.19, - "learning_rate": 1.374821520248129e-06, - "loss": 0.6768, - "step": 46395 - }, - { - "epoch": 1.19, - "learning_rate": 1.3747958669101346e-06, - "loss": 0.5884, - "step": 46396 - }, - { - "epoch": 1.19, - "learning_rate": 1.3747702132851763e-06, - "loss": 0.7678, - "step": 46397 - }, - { - "epoch": 1.19, - "learning_rate": 1.3747445593732736e-06, - "loss": 0.6084, - "step": 46398 - }, - { - "epoch": 1.19, - "learning_rate": 1.3747189051744462e-06, - "loss": 0.668, - "step": 46399 - }, - { - "epoch": 1.19, - "learning_rate": 1.374693250688714e-06, - "loss": 0.7153, - "step": 46400 - }, - { - "epoch": 1.19, - "learning_rate": 1.3746675959160962e-06, - "loss": 0.6963, - "step": 46401 - }, - { - "epoch": 1.19, - "learning_rate": 1.3746419408566127e-06, - "loss": 0.6079, - "step": 46402 - }, - { - "epoch": 1.19, - "learning_rate": 1.3746162855102832e-06, - "loss": 0.6523, - "step": 46403 - }, - { - "epoch": 1.19, - "learning_rate": 1.3745906298771273e-06, - "loss": 0.7139, - "step": 46404 - }, - { - "epoch": 1.19, - "learning_rate": 1.3745649739571642e-06, - "loss": 0.7705, - "step": 46405 - }, - { - "epoch": 1.19, - "learning_rate": 1.3745393177504144e-06, - "loss": 0.7446, - "step": 46406 - }, - { - "epoch": 1.19, - "learning_rate": 1.3745136612568967e-06, - "loss": 0.6611, - "step": 46407 - }, - { - "epoch": 1.19, - "learning_rate": 1.3744880044766314e-06, - "loss": 0.6255, - "step": 46408 - }, - { - "epoch": 1.19, - "learning_rate": 1.3744623474096374e-06, - "loss": 0.6079, - "step": 46409 - }, - { - "epoch": 1.19, - "learning_rate": 1.3744366900559353e-06, - "loss": 0.6572, - "step": 46410 - }, - { - "epoch": 1.19, - "learning_rate": 1.3744110324155441e-06, - "loss": 0.5571, - "step": 46411 - }, - { - "epoch": 1.19, - "learning_rate": 1.3743853744884835e-06, - "loss": 0.5903, - "step": 46412 - }, - { - "epoch": 1.19, - "learning_rate": 1.3743597162747732e-06, - "loss": 0.6968, - "step": 46413 - }, - { - "epoch": 1.19, - "learning_rate": 1.3743340577744328e-06, - "loss": 0.5469, - "step": 46414 - }, - { - "epoch": 1.19, - "learning_rate": 1.3743083989874823e-06, - "loss": 0.7842, - "step": 46415 - }, - { - "epoch": 1.19, - "learning_rate": 1.3742827399139412e-06, - "loss": 0.6177, - "step": 46416 - }, - { - "epoch": 1.19, - "learning_rate": 1.3742570805538285e-06, - "loss": 0.4458, - "step": 46417 - }, - { - "epoch": 1.19, - "learning_rate": 1.3742314209071646e-06, - "loss": 0.6348, - "step": 46418 - }, - { - "epoch": 1.19, - "learning_rate": 1.3742057609739687e-06, - "loss": 0.6875, - "step": 46419 - }, - { - "epoch": 1.19, - "learning_rate": 1.374180100754261e-06, - "loss": 0.7915, - "step": 46420 - }, - { - "epoch": 1.19, - "learning_rate": 1.3741544402480606e-06, - "loss": 0.8682, - "step": 46421 - }, - { - "epoch": 1.19, - "learning_rate": 1.3741287794553878e-06, - "loss": 0.5703, - "step": 46422 - }, - { - "epoch": 1.19, - "learning_rate": 1.3741031183762611e-06, - "loss": 0.6357, - "step": 46423 - }, - { - "epoch": 1.19, - "learning_rate": 1.3740774570107012e-06, - "loss": 0.708, - "step": 46424 - }, - { - "epoch": 1.19, - "learning_rate": 1.3740517953587274e-06, - "loss": 0.6885, - "step": 46425 - }, - { - "epoch": 1.19, - "learning_rate": 1.3740261334203593e-06, - "loss": 0.5391, - "step": 46426 - }, - { - "epoch": 1.19, - "learning_rate": 1.3740004711956166e-06, - "loss": 0.5996, - "step": 46427 - }, - { - "epoch": 1.19, - "learning_rate": 1.3739748086845189e-06, - "loss": 0.4547, - "step": 46428 - }, - { - "epoch": 1.19, - "learning_rate": 1.373949145887086e-06, - "loss": 0.6958, - "step": 46429 - }, - { - "epoch": 1.19, - "learning_rate": 1.3739234828033372e-06, - "loss": 0.7354, - "step": 46430 - }, - { - "epoch": 1.19, - "learning_rate": 1.3738978194332926e-06, - "loss": 0.6592, - "step": 46431 - }, - { - "epoch": 1.19, - "learning_rate": 1.3738721557769715e-06, - "loss": 0.5762, - "step": 46432 - }, - { - "epoch": 1.19, - "learning_rate": 1.3738464918343938e-06, - "loss": 0.7656, - "step": 46433 - }, - { - "epoch": 1.19, - "learning_rate": 1.373820827605579e-06, - "loss": 0.6304, - "step": 46434 - }, - { - "epoch": 1.19, - "learning_rate": 1.373795163090547e-06, - "loss": 0.6333, - "step": 46435 - }, - { - "epoch": 1.19, - "learning_rate": 1.3737694982893166e-06, - "loss": 0.7476, - "step": 46436 - }, - { - "epoch": 1.19, - "learning_rate": 1.3737438332019085e-06, - "loss": 0.7368, - "step": 46437 - }, - { - "epoch": 1.19, - "learning_rate": 1.373718167828342e-06, - "loss": 0.582, - "step": 46438 - }, - { - "epoch": 1.19, - "learning_rate": 1.3736925021686366e-06, - "loss": 0.9189, - "step": 46439 - }, - { - "epoch": 1.19, - "learning_rate": 1.3736668362228119e-06, - "loss": 0.6172, - "step": 46440 - }, - { - "epoch": 1.19, - "learning_rate": 1.373641169990888e-06, - "loss": 0.6675, - "step": 46441 - }, - { - "epoch": 1.19, - "learning_rate": 1.3736155034728838e-06, - "loss": 0.5894, - "step": 46442 - }, - { - "epoch": 1.19, - "learning_rate": 1.3735898366688196e-06, - "loss": 0.5884, - "step": 46443 - }, - { - "epoch": 1.19, - "learning_rate": 1.3735641695787147e-06, - "loss": 0.5874, - "step": 46444 - }, - { - "epoch": 1.19, - "learning_rate": 1.373538502202589e-06, - "loss": 0.564, - "step": 46445 - }, - { - "epoch": 1.19, - "learning_rate": 1.3735128345404623e-06, - "loss": 0.7559, - "step": 46446 - }, - { - "epoch": 1.19, - "learning_rate": 1.3734871665923537e-06, - "loss": 0.563, - "step": 46447 - }, - { - "epoch": 1.19, - "learning_rate": 1.3734614983582832e-06, - "loss": 0.6323, - "step": 46448 - }, - { - "epoch": 1.19, - "learning_rate": 1.3734358298382707e-06, - "loss": 0.707, - "step": 46449 - }, - { - "epoch": 1.19, - "learning_rate": 1.3734101610323352e-06, - "loss": 0.8271, - "step": 46450 - }, - { - "epoch": 1.19, - "learning_rate": 1.373384491940497e-06, - "loss": 0.6416, - "step": 46451 - }, - { - "epoch": 1.19, - "learning_rate": 1.3733588225627752e-06, - "loss": 0.7939, - "step": 46452 - }, - { - "epoch": 1.19, - "learning_rate": 1.3733331528991897e-06, - "loss": 0.54, - "step": 46453 - }, - { - "epoch": 1.19, - "learning_rate": 1.3733074829497601e-06, - "loss": 0.5542, - "step": 46454 - }, - { - "epoch": 1.19, - "learning_rate": 1.3732818127145065e-06, - "loss": 0.7197, - "step": 46455 - }, - { - "epoch": 1.19, - "learning_rate": 1.3732561421934481e-06, - "loss": 0.6523, - "step": 46456 - }, - { - "epoch": 1.19, - "learning_rate": 1.3732304713866044e-06, - "loss": 0.5643, - "step": 46457 - }, - { - "epoch": 1.19, - "learning_rate": 1.3732048002939953e-06, - "loss": 0.6064, - "step": 46458 - }, - { - "epoch": 1.19, - "learning_rate": 1.3731791289156404e-06, - "loss": 0.7812, - "step": 46459 - }, - { - "epoch": 1.19, - "learning_rate": 1.37315345725156e-06, - "loss": 0.71, - "step": 46460 - }, - { - "epoch": 1.19, - "learning_rate": 1.3731277853017723e-06, - "loss": 0.6846, - "step": 46461 - }, - { - "epoch": 1.19, - "learning_rate": 1.3731021130662983e-06, - "loss": 0.8594, - "step": 46462 - }, - { - "epoch": 1.19, - "learning_rate": 1.3730764405451569e-06, - "loss": 0.7471, - "step": 46463 - }, - { - "epoch": 1.19, - "learning_rate": 1.3730507677383684e-06, - "loss": 0.4617, - "step": 46464 - }, - { - "epoch": 1.19, - "learning_rate": 1.3730250946459518e-06, - "loss": 0.6162, - "step": 46465 - }, - { - "epoch": 1.19, - "learning_rate": 1.372999421267927e-06, - "loss": 0.6816, - "step": 46466 - }, - { - "epoch": 1.19, - "learning_rate": 1.372973747604314e-06, - "loss": 0.5654, - "step": 46467 - }, - { - "epoch": 1.19, - "learning_rate": 1.372948073655132e-06, - "loss": 0.6235, - "step": 46468 - }, - { - "epoch": 1.19, - "learning_rate": 1.3729223994204007e-06, - "loss": 0.5713, - "step": 46469 - }, - { - "epoch": 1.19, - "learning_rate": 1.3728967249001398e-06, - "loss": 0.6167, - "step": 46470 - }, - { - "epoch": 1.19, - "learning_rate": 1.3728710500943695e-06, - "loss": 0.646, - "step": 46471 - }, - { - "epoch": 1.19, - "learning_rate": 1.3728453750031084e-06, - "loss": 0.7607, - "step": 46472 - }, - { - "epoch": 1.19, - "learning_rate": 1.372819699626377e-06, - "loss": 0.7393, - "step": 46473 - }, - { - "epoch": 1.19, - "learning_rate": 1.3727940239641944e-06, - "loss": 0.6182, - "step": 46474 - }, - { - "epoch": 1.19, - "learning_rate": 1.3727683480165813e-06, - "loss": 0.5801, - "step": 46475 - }, - { - "epoch": 1.19, - "learning_rate": 1.372742671783556e-06, - "loss": 0.6743, - "step": 46476 - }, - { - "epoch": 1.19, - "learning_rate": 1.372716995265139e-06, - "loss": 0.6294, - "step": 46477 - }, - { - "epoch": 1.19, - "learning_rate": 1.3726913184613493e-06, - "loss": 0.6953, - "step": 46478 - }, - { - "epoch": 1.19, - "learning_rate": 1.3726656413722074e-06, - "loss": 0.5188, - "step": 46479 - }, - { - "epoch": 1.19, - "learning_rate": 1.3726399639977326e-06, - "loss": 0.7549, - "step": 46480 - }, - { - "epoch": 1.19, - "learning_rate": 1.3726142863379447e-06, - "loss": 0.6953, - "step": 46481 - }, - { - "epoch": 1.19, - "learning_rate": 1.3725886083928625e-06, - "loss": 0.7788, - "step": 46482 - }, - { - "epoch": 1.19, - "learning_rate": 1.372562930162507e-06, - "loss": 0.6875, - "step": 46483 - }, - { - "epoch": 1.19, - "learning_rate": 1.3725372516468968e-06, - "loss": 0.4331, - "step": 46484 - }, - { - "epoch": 1.19, - "learning_rate": 1.3725115728460523e-06, - "loss": 0.6855, - "step": 46485 - }, - { - "epoch": 1.19, - "learning_rate": 1.3724858937599924e-06, - "loss": 0.6938, - "step": 46486 - }, - { - "epoch": 1.19, - "learning_rate": 1.3724602143887376e-06, - "loss": 0.4797, - "step": 46487 - }, - { - "epoch": 1.19, - "learning_rate": 1.3724345347323067e-06, - "loss": 0.6475, - "step": 46488 - }, - { - "epoch": 1.19, - "learning_rate": 1.37240885479072e-06, - "loss": 0.7217, - "step": 46489 - }, - { - "epoch": 1.19, - "learning_rate": 1.372383174563997e-06, - "loss": 0.5977, - "step": 46490 - }, - { - "epoch": 1.19, - "learning_rate": 1.3723574940521575e-06, - "loss": 0.7227, - "step": 46491 - }, - { - "epoch": 1.19, - "learning_rate": 1.3723318132552206e-06, - "loss": 0.5747, - "step": 46492 - }, - { - "epoch": 1.19, - "learning_rate": 1.3723061321732066e-06, - "loss": 0.5688, - "step": 46493 - }, - { - "epoch": 1.19, - "learning_rate": 1.372280450806135e-06, - "loss": 0.6855, - "step": 46494 - }, - { - "epoch": 1.19, - "learning_rate": 1.3722547691540252e-06, - "loss": 0.5981, - "step": 46495 - }, - { - "epoch": 1.19, - "learning_rate": 1.372229087216897e-06, - "loss": 0.6494, - "step": 46496 - }, - { - "epoch": 1.19, - "learning_rate": 1.3722034049947701e-06, - "loss": 0.7354, - "step": 46497 - }, - { - "epoch": 1.19, - "learning_rate": 1.3721777224876642e-06, - "loss": 0.6455, - "step": 46498 - }, - { - "epoch": 1.19, - "learning_rate": 1.372152039695599e-06, - "loss": 0.7773, - "step": 46499 - }, - { - "epoch": 1.19, - "learning_rate": 1.3721263566185944e-06, - "loss": 0.6455, - "step": 46500 - }, - { - "epoch": 1.19, - "learning_rate": 1.3721006732566692e-06, - "loss": 0.7065, - "step": 46501 - }, - { - "epoch": 1.19, - "learning_rate": 1.372074989609844e-06, - "loss": 0.6807, - "step": 46502 - }, - { - "epoch": 1.19, - "learning_rate": 1.372049305678138e-06, - "loss": 0.7764, - "step": 46503 - }, - { - "epoch": 1.19, - "learning_rate": 1.3720236214615709e-06, - "loss": 0.7627, - "step": 46504 - }, - { - "epoch": 1.19, - "learning_rate": 1.3719979369601623e-06, - "loss": 0.875, - "step": 46505 - }, - { - "epoch": 1.19, - "learning_rate": 1.3719722521739324e-06, - "loss": 0.6396, - "step": 46506 - }, - { - "epoch": 1.19, - "learning_rate": 1.3719465671028999e-06, - "loss": 0.4226, - "step": 46507 - }, - { - "epoch": 1.19, - "learning_rate": 1.3719208817470854e-06, - "loss": 0.6357, - "step": 46508 - }, - { - "epoch": 1.19, - "learning_rate": 1.3718951961065077e-06, - "loss": 0.6753, - "step": 46509 - }, - { - "epoch": 1.19, - "learning_rate": 1.3718695101811874e-06, - "loss": 0.624, - "step": 46510 - }, - { - "epoch": 1.19, - "learning_rate": 1.3718438239711438e-06, - "loss": 0.6318, - "step": 46511 - }, - { - "epoch": 1.19, - "learning_rate": 1.3718181374763965e-06, - "loss": 0.8262, - "step": 46512 - }, - { - "epoch": 1.19, - "learning_rate": 1.3717924506969646e-06, - "loss": 0.647, - "step": 46513 - }, - { - "epoch": 1.19, - "learning_rate": 1.3717667636328689e-06, - "loss": 0.6626, - "step": 46514 - }, - { - "epoch": 1.19, - "learning_rate": 1.3717410762841282e-06, - "loss": 0.7109, - "step": 46515 - }, - { - "epoch": 1.19, - "learning_rate": 1.3717153886507623e-06, - "loss": 0.5303, - "step": 46516 - }, - { - "epoch": 1.19, - "learning_rate": 1.3716897007327911e-06, - "loss": 0.7295, - "step": 46517 - }, - { - "epoch": 1.19, - "learning_rate": 1.3716640125302344e-06, - "loss": 0.748, - "step": 46518 - }, - { - "epoch": 1.19, - "learning_rate": 1.3716383240431117e-06, - "loss": 0.6255, - "step": 46519 - }, - { - "epoch": 1.19, - "learning_rate": 1.3716126352714426e-06, - "loss": 0.4932, - "step": 46520 - }, - { - "epoch": 1.19, - "learning_rate": 1.3715869462152467e-06, - "loss": 0.5425, - "step": 46521 - }, - { - "epoch": 1.19, - "learning_rate": 1.3715612568745435e-06, - "loss": 0.7266, - "step": 46522 - }, - { - "epoch": 1.19, - "learning_rate": 1.3715355672493534e-06, - "loss": 0.8799, - "step": 46523 - }, - { - "epoch": 1.19, - "learning_rate": 1.3715098773396952e-06, - "loss": 0.6323, - "step": 46524 - }, - { - "epoch": 1.19, - "learning_rate": 1.3714841871455893e-06, - "loss": 0.5298, - "step": 46525 - }, - { - "epoch": 1.19, - "learning_rate": 1.3714584966670549e-06, - "loss": 0.584, - "step": 46526 - }, - { - "epoch": 1.19, - "learning_rate": 1.3714328059041117e-06, - "loss": 0.5024, - "step": 46527 - }, - { - "epoch": 1.19, - "learning_rate": 1.3714071148567794e-06, - "loss": 0.7393, - "step": 46528 - }, - { - "epoch": 1.19, - "learning_rate": 1.371381423525078e-06, - "loss": 0.6655, - "step": 46529 - }, - { - "epoch": 1.19, - "learning_rate": 1.371355731909027e-06, - "loss": 0.6807, - "step": 46530 - }, - { - "epoch": 1.19, - "learning_rate": 1.371330040008646e-06, - "loss": 0.6074, - "step": 46531 - }, - { - "epoch": 1.19, - "learning_rate": 1.3713043478239542e-06, - "loss": 0.4897, - "step": 46532 - }, - { - "epoch": 1.19, - "learning_rate": 1.371278655354972e-06, - "loss": 0.7061, - "step": 46533 - }, - { - "epoch": 1.19, - "learning_rate": 1.3712529626017188e-06, - "loss": 0.728, - "step": 46534 - }, - { - "epoch": 1.19, - "learning_rate": 1.3712272695642144e-06, - "loss": 0.6699, - "step": 46535 - }, - { - "epoch": 1.19, - "learning_rate": 1.3712015762424783e-06, - "loss": 0.668, - "step": 46536 - }, - { - "epoch": 1.19, - "learning_rate": 1.37117588263653e-06, - "loss": 0.5786, - "step": 46537 - }, - { - "epoch": 1.19, - "learning_rate": 1.3711501887463896e-06, - "loss": 0.4648, - "step": 46538 - }, - { - "epoch": 1.19, - "learning_rate": 1.3711244945720765e-06, - "loss": 0.623, - "step": 46539 - }, - { - "epoch": 1.19, - "learning_rate": 1.3710988001136108e-06, - "loss": 0.8164, - "step": 46540 - }, - { - "epoch": 1.19, - "learning_rate": 1.3710731053710113e-06, - "loss": 0.7285, - "step": 46541 - }, - { - "epoch": 1.19, - "learning_rate": 1.3710474103442985e-06, - "loss": 0.687, - "step": 46542 - }, - { - "epoch": 1.19, - "learning_rate": 1.3710217150334912e-06, - "loss": 0.5708, - "step": 46543 - }, - { - "epoch": 1.19, - "learning_rate": 1.3709960194386105e-06, - "loss": 0.4312, - "step": 46544 - }, - { - "epoch": 1.19, - "learning_rate": 1.3709703235596748e-06, - "loss": 0.6567, - "step": 46545 - }, - { - "epoch": 1.19, - "learning_rate": 1.370944627396704e-06, - "loss": 0.6494, - "step": 46546 - }, - { - "epoch": 1.19, - "learning_rate": 1.370918930949718e-06, - "loss": 0.646, - "step": 46547 - }, - { - "epoch": 1.19, - "learning_rate": 1.3708932342187366e-06, - "loss": 0.6377, - "step": 46548 - }, - { - "epoch": 1.19, - "learning_rate": 1.3708675372037791e-06, - "loss": 0.6167, - "step": 46549 - }, - { - "epoch": 1.19, - "learning_rate": 1.3708418399048657e-06, - "loss": 0.5125, - "step": 46550 - }, - { - "epoch": 1.19, - "learning_rate": 1.3708161423220154e-06, - "loss": 0.4064, - "step": 46551 - }, - { - "epoch": 1.19, - "learning_rate": 1.3707904444552488e-06, - "loss": 0.5664, - "step": 46552 - }, - { - "epoch": 1.19, - "learning_rate": 1.3707647463045845e-06, - "loss": 0.6987, - "step": 46553 - }, - { - "epoch": 1.19, - "learning_rate": 1.3707390478700427e-06, - "loss": 0.6074, - "step": 46554 - }, - { - "epoch": 1.19, - "learning_rate": 1.3707133491516431e-06, - "loss": 0.5466, - "step": 46555 - }, - { - "epoch": 1.19, - "learning_rate": 1.3706876501494053e-06, - "loss": 0.6279, - "step": 46556 - }, - { - "epoch": 1.19, - "learning_rate": 1.3706619508633492e-06, - "loss": 0.6221, - "step": 46557 - }, - { - "epoch": 1.19, - "learning_rate": 1.3706362512934943e-06, - "loss": 0.709, - "step": 46558 - }, - { - "epoch": 1.19, - "learning_rate": 1.3706105514398603e-06, - "loss": 0.7383, - "step": 46559 - }, - { - "epoch": 1.19, - "learning_rate": 1.3705848513024664e-06, - "loss": 0.7314, - "step": 46560 - }, - { - "epoch": 1.19, - "learning_rate": 1.3705591508813332e-06, - "loss": 0.6689, - "step": 46561 - }, - { - "epoch": 1.19, - "learning_rate": 1.3705334501764796e-06, - "loss": 0.5898, - "step": 46562 - }, - { - "epoch": 1.19, - "learning_rate": 1.3705077491879258e-06, - "loss": 0.4801, - "step": 46563 - }, - { - "epoch": 1.19, - "learning_rate": 1.3704820479156911e-06, - "loss": 0.5811, - "step": 46564 - }, - { - "epoch": 1.19, - "learning_rate": 1.3704563463597953e-06, - "loss": 0.5554, - "step": 46565 - }, - { - "epoch": 1.19, - "learning_rate": 1.3704306445202583e-06, - "loss": 0.4849, - "step": 46566 - }, - { - "epoch": 1.19, - "learning_rate": 1.3704049423970994e-06, - "loss": 0.9092, - "step": 46567 - }, - { - "epoch": 1.19, - "learning_rate": 1.3703792399903384e-06, - "loss": 0.6519, - "step": 46568 - }, - { - "epoch": 1.19, - "learning_rate": 1.3703535372999955e-06, - "loss": 0.3479, - "step": 46569 - }, - { - "epoch": 1.19, - "learning_rate": 1.3703278343260895e-06, - "loss": 0.4893, - "step": 46570 - }, - { - "epoch": 1.19, - "learning_rate": 1.3703021310686406e-06, - "loss": 0.6362, - "step": 46571 - }, - { - "epoch": 1.19, - "learning_rate": 1.3702764275276685e-06, - "loss": 0.6494, - "step": 46572 - }, - { - "epoch": 1.19, - "learning_rate": 1.3702507237031925e-06, - "loss": 0.6406, - "step": 46573 - }, - { - "epoch": 1.19, - "learning_rate": 1.3702250195952328e-06, - "loss": 0.4285, - "step": 46574 - }, - { - "epoch": 1.19, - "learning_rate": 1.3701993152038088e-06, - "loss": 0.9062, - "step": 46575 - }, - { - "epoch": 1.19, - "learning_rate": 1.3701736105289401e-06, - "loss": 0.8184, - "step": 46576 - }, - { - "epoch": 1.19, - "learning_rate": 1.3701479055706466e-06, - "loss": 0.707, - "step": 46577 - }, - { - "epoch": 1.19, - "learning_rate": 1.3701222003289474e-06, - "loss": 0.6328, - "step": 46578 - }, - { - "epoch": 1.19, - "learning_rate": 1.3700964948038633e-06, - "loss": 0.8262, - "step": 46579 - }, - { - "epoch": 1.19, - "learning_rate": 1.3700707889954131e-06, - "loss": 0.5933, - "step": 46580 - }, - { - "epoch": 1.19, - "learning_rate": 1.3700450829036165e-06, - "loss": 0.605, - "step": 46581 - }, - { - "epoch": 1.19, - "learning_rate": 1.3700193765284937e-06, - "loss": 0.7646, - "step": 46582 - }, - { - "epoch": 1.19, - "learning_rate": 1.3699936698700638e-06, - "loss": 0.708, - "step": 46583 - }, - { - "epoch": 1.19, - "learning_rate": 1.369967962928347e-06, - "loss": 0.6313, - "step": 46584 - }, - { - "epoch": 1.19, - "learning_rate": 1.369942255703363e-06, - "loss": 0.6631, - "step": 46585 - }, - { - "epoch": 1.19, - "learning_rate": 1.3699165481951307e-06, - "loss": 0.7222, - "step": 46586 - }, - { - "epoch": 1.19, - "learning_rate": 1.3698908404036705e-06, - "loss": 0.4873, - "step": 46587 - }, - { - "epoch": 1.19, - "learning_rate": 1.3698651323290017e-06, - "loss": 0.4934, - "step": 46588 - }, - { - "epoch": 1.19, - "learning_rate": 1.3698394239711446e-06, - "loss": 0.7725, - "step": 46589 - }, - { - "epoch": 1.19, - "learning_rate": 1.3698137153301183e-06, - "loss": 0.6089, - "step": 46590 - }, - { - "epoch": 1.19, - "learning_rate": 1.3697880064059423e-06, - "loss": 0.6973, - "step": 46591 - }, - { - "epoch": 1.19, - "learning_rate": 1.3697622971986372e-06, - "loss": 0.6885, - "step": 46592 - }, - { - "epoch": 1.19, - "learning_rate": 1.3697365877082217e-06, - "loss": 0.7598, - "step": 46593 - }, - { - "epoch": 1.19, - "learning_rate": 1.3697108779347163e-06, - "loss": 0.3716, - "step": 46594 - }, - { - "epoch": 1.19, - "learning_rate": 1.3696851678781397e-06, - "loss": 0.7646, - "step": 46595 - }, - { - "epoch": 1.19, - "learning_rate": 1.3696594575385126e-06, - "loss": 0.7314, - "step": 46596 - }, - { - "epoch": 1.19, - "learning_rate": 1.369633746915854e-06, - "loss": 0.5815, - "step": 46597 - }, - { - "epoch": 1.19, - "learning_rate": 1.3696080360101838e-06, - "loss": 0.7178, - "step": 46598 - }, - { - "epoch": 1.19, - "learning_rate": 1.3695823248215218e-06, - "loss": 0.6089, - "step": 46599 - }, - { - "epoch": 1.19, - "learning_rate": 1.3695566133498877e-06, - "loss": 0.5283, - "step": 46600 - }, - { - "epoch": 1.19, - "learning_rate": 1.3695309015953013e-06, - "loss": 0.9424, - "step": 46601 - }, - { - "epoch": 1.19, - "learning_rate": 1.3695051895577816e-06, - "loss": 0.4424, - "step": 46602 - }, - { - "epoch": 1.19, - "learning_rate": 1.369479477237349e-06, - "loss": 0.8486, - "step": 46603 - }, - { - "epoch": 1.19, - "learning_rate": 1.369453764634023e-06, - "loss": 0.6855, - "step": 46604 - }, - { - "epoch": 1.19, - "learning_rate": 1.3694280517478233e-06, - "loss": 0.6934, - "step": 46605 - }, - { - "epoch": 1.19, - "learning_rate": 1.3694023385787693e-06, - "loss": 0.7383, - "step": 46606 - }, - { - "epoch": 1.19, - "learning_rate": 1.369376625126881e-06, - "loss": 0.6768, - "step": 46607 - }, - { - "epoch": 1.19, - "learning_rate": 1.369350911392178e-06, - "loss": 0.6089, - "step": 46608 - }, - { - "epoch": 1.19, - "learning_rate": 1.3693251973746801e-06, - "loss": 0.5654, - "step": 46609 - }, - { - "epoch": 1.19, - "learning_rate": 1.3692994830744069e-06, - "loss": 0.7324, - "step": 46610 - }, - { - "epoch": 1.19, - "learning_rate": 1.369273768491378e-06, - "loss": 0.6128, - "step": 46611 - }, - { - "epoch": 1.19, - "learning_rate": 1.3692480536256131e-06, - "loss": 0.6895, - "step": 46612 - }, - { - "epoch": 1.19, - "learning_rate": 1.369222338477132e-06, - "loss": 0.6377, - "step": 46613 - }, - { - "epoch": 1.19, - "learning_rate": 1.3691966230459544e-06, - "loss": 0.5249, - "step": 46614 - }, - { - "epoch": 1.19, - "learning_rate": 1.3691709073320998e-06, - "loss": 0.6807, - "step": 46615 - }, - { - "epoch": 1.19, - "learning_rate": 1.3691451913355878e-06, - "loss": 0.7402, - "step": 46616 - }, - { - "epoch": 1.19, - "learning_rate": 1.3691194750564388e-06, - "loss": 0.6494, - "step": 46617 - }, - { - "epoch": 1.19, - "learning_rate": 1.3690937584946716e-06, - "loss": 0.6841, - "step": 46618 - }, - { - "epoch": 1.19, - "learning_rate": 1.3690680416503067e-06, - "loss": 0.793, - "step": 46619 - }, - { - "epoch": 1.19, - "learning_rate": 1.369042324523363e-06, - "loss": 0.5338, - "step": 46620 - }, - { - "epoch": 1.19, - "learning_rate": 1.3690166071138606e-06, - "loss": 0.7852, - "step": 46621 - }, - { - "epoch": 1.19, - "learning_rate": 1.368990889421819e-06, - "loss": 0.6216, - "step": 46622 - }, - { - "epoch": 1.19, - "learning_rate": 1.3689651714472583e-06, - "loss": 0.7168, - "step": 46623 - }, - { - "epoch": 1.19, - "learning_rate": 1.3689394531901979e-06, - "loss": 0.6338, - "step": 46624 - }, - { - "epoch": 1.2, - "learning_rate": 1.3689137346506575e-06, - "loss": 0.7969, - "step": 46625 - }, - { - "epoch": 1.2, - "learning_rate": 1.368888015828657e-06, - "loss": 0.5879, - "step": 46626 - }, - { - "epoch": 1.2, - "learning_rate": 1.3688622967242155e-06, - "loss": 0.5059, - "step": 46627 - }, - { - "epoch": 1.2, - "learning_rate": 1.3688365773373533e-06, - "loss": 0.5491, - "step": 46628 - }, - { - "epoch": 1.2, - "learning_rate": 1.36881085766809e-06, - "loss": 0.6509, - "step": 46629 - }, - { - "epoch": 1.2, - "learning_rate": 1.3687851377164451e-06, - "loss": 0.8428, - "step": 46630 - }, - { - "epoch": 1.2, - "learning_rate": 1.3687594174824384e-06, - "loss": 0.8594, - "step": 46631 - }, - { - "epoch": 1.2, - "learning_rate": 1.3687336969660893e-06, - "loss": 0.5383, - "step": 46632 - }, - { - "epoch": 1.2, - "learning_rate": 1.368707976167418e-06, - "loss": 0.8096, - "step": 46633 - }, - { - "epoch": 1.2, - "learning_rate": 1.3686822550864444e-06, - "loss": 0.647, - "step": 46634 - }, - { - "epoch": 1.2, - "learning_rate": 1.368656533723187e-06, - "loss": 0.7598, - "step": 46635 - }, - { - "epoch": 1.2, - "learning_rate": 1.3686308120776669e-06, - "loss": 0.6328, - "step": 46636 - }, - { - "epoch": 1.2, - "learning_rate": 1.3686050901499028e-06, - "loss": 0.707, - "step": 46637 - }, - { - "epoch": 1.2, - "learning_rate": 1.3685793679399145e-06, - "loss": 0.7725, - "step": 46638 - }, - { - "epoch": 1.2, - "learning_rate": 1.3685536454477221e-06, - "loss": 0.6309, - "step": 46639 - }, - { - "epoch": 1.2, - "learning_rate": 1.3685279226733454e-06, - "loss": 0.6963, - "step": 46640 - }, - { - "epoch": 1.2, - "learning_rate": 1.3685021996168034e-06, - "loss": 0.7168, - "step": 46641 - }, - { - "epoch": 1.2, - "learning_rate": 1.3684764762781164e-06, - "loss": 0.5991, - "step": 46642 - }, - { - "epoch": 1.2, - "learning_rate": 1.368450752657304e-06, - "loss": 0.4997, - "step": 46643 - }, - { - "epoch": 1.2, - "learning_rate": 1.3684250287543858e-06, - "loss": 0.7412, - "step": 46644 - }, - { - "epoch": 1.2, - "learning_rate": 1.3683993045693814e-06, - "loss": 0.6299, - "step": 46645 - }, - { - "epoch": 1.2, - "learning_rate": 1.3683735801023103e-06, - "loss": 0.5947, - "step": 46646 - }, - { - "epoch": 1.2, - "learning_rate": 1.368347855353193e-06, - "loss": 0.5562, - "step": 46647 - }, - { - "epoch": 1.2, - "learning_rate": 1.3683221303220484e-06, - "loss": 0.6565, - "step": 46648 - }, - { - "epoch": 1.2, - "learning_rate": 1.3682964050088967e-06, - "loss": 0.8281, - "step": 46649 - }, - { - "epoch": 1.2, - "learning_rate": 1.368270679413757e-06, - "loss": 0.5488, - "step": 46650 - }, - { - "epoch": 1.2, - "learning_rate": 1.3682449535366498e-06, - "loss": 0.7266, - "step": 46651 - }, - { - "epoch": 1.2, - "learning_rate": 1.3682192273775938e-06, - "loss": 0.6169, - "step": 46652 - }, - { - "epoch": 1.2, - "learning_rate": 1.3681935009366099e-06, - "loss": 0.522, - "step": 46653 - }, - { - "epoch": 1.2, - "learning_rate": 1.368167774213717e-06, - "loss": 0.572, - "step": 46654 - }, - { - "epoch": 1.2, - "learning_rate": 1.368142047208935e-06, - "loss": 0.5627, - "step": 46655 - }, - { - "epoch": 1.2, - "learning_rate": 1.3681163199222832e-06, - "loss": 0.6562, - "step": 46656 - }, - { - "epoch": 1.2, - "learning_rate": 1.368090592353782e-06, - "loss": 0.5376, - "step": 46657 - }, - { - "epoch": 1.2, - "learning_rate": 1.3680648645034504e-06, - "loss": 0.6362, - "step": 46658 - }, - { - "epoch": 1.2, - "learning_rate": 1.3680391363713091e-06, - "loss": 0.6504, - "step": 46659 - }, - { - "epoch": 1.2, - "learning_rate": 1.3680134079573767e-06, - "loss": 0.6772, - "step": 46660 - }, - { - "epoch": 1.2, - "learning_rate": 1.3679876792616734e-06, - "loss": 0.7275, - "step": 46661 - }, - { - "epoch": 1.2, - "learning_rate": 1.3679619502842186e-06, - "loss": 0.6328, - "step": 46662 - }, - { - "epoch": 1.2, - "learning_rate": 1.3679362210250326e-06, - "loss": 0.6699, - "step": 46663 - }, - { - "epoch": 1.2, - "learning_rate": 1.367910491484135e-06, - "loss": 0.7627, - "step": 46664 - }, - { - "epoch": 1.2, - "learning_rate": 1.367884761661545e-06, - "loss": 0.7236, - "step": 46665 - }, - { - "epoch": 1.2, - "learning_rate": 1.3678590315572822e-06, - "loss": 0.6709, - "step": 46666 - }, - { - "epoch": 1.2, - "learning_rate": 1.3678333011713669e-06, - "loss": 0.6187, - "step": 46667 - }, - { - "epoch": 1.2, - "learning_rate": 1.3678075705038186e-06, - "loss": 0.6855, - "step": 46668 - }, - { - "epoch": 1.2, - "learning_rate": 1.367781839554657e-06, - "loss": 0.6709, - "step": 46669 - }, - { - "epoch": 1.2, - "learning_rate": 1.3677561083239017e-06, - "loss": 0.665, - "step": 46670 - }, - { - "epoch": 1.2, - "learning_rate": 1.3677303768115725e-06, - "loss": 0.5366, - "step": 46671 - }, - { - "epoch": 1.2, - "learning_rate": 1.367704645017689e-06, - "loss": 0.5684, - "step": 46672 - }, - { - "epoch": 1.2, - "learning_rate": 1.3676789129422708e-06, - "loss": 0.7637, - "step": 46673 - }, - { - "epoch": 1.2, - "learning_rate": 1.3676531805853381e-06, - "loss": 0.521, - "step": 46674 - }, - { - "epoch": 1.2, - "learning_rate": 1.3676274479469102e-06, - "loss": 0.7729, - "step": 46675 - }, - { - "epoch": 1.2, - "learning_rate": 1.3676017150270068e-06, - "loss": 0.7012, - "step": 46676 - }, - { - "epoch": 1.2, - "learning_rate": 1.3675759818256473e-06, - "loss": 0.7041, - "step": 46677 - }, - { - "epoch": 1.2, - "learning_rate": 1.3675502483428525e-06, - "loss": 0.6621, - "step": 46678 - }, - { - "epoch": 1.2, - "learning_rate": 1.3675245145786408e-06, - "loss": 0.627, - "step": 46679 - }, - { - "epoch": 1.2, - "learning_rate": 1.3674987805330328e-06, - "loss": 0.7227, - "step": 46680 - }, - { - "epoch": 1.2, - "learning_rate": 1.3674730462060478e-06, - "loss": 0.6294, - "step": 46681 - }, - { - "epoch": 1.2, - "learning_rate": 1.3674473115977056e-06, - "loss": 0.6201, - "step": 46682 - }, - { - "epoch": 1.2, - "learning_rate": 1.3674215767080257e-06, - "loss": 0.6389, - "step": 46683 - }, - { - "epoch": 1.2, - "learning_rate": 1.3673958415370283e-06, - "loss": 0.7715, - "step": 46684 - }, - { - "epoch": 1.2, - "learning_rate": 1.3673701060847325e-06, - "loss": 0.5518, - "step": 46685 - }, - { - "epoch": 1.2, - "learning_rate": 1.3673443703511585e-06, - "loss": 0.7598, - "step": 46686 - }, - { - "epoch": 1.2, - "learning_rate": 1.3673186343363257e-06, - "loss": 0.7275, - "step": 46687 - }, - { - "epoch": 1.2, - "learning_rate": 1.367292898040254e-06, - "loss": 0.5459, - "step": 46688 - }, - { - "epoch": 1.2, - "learning_rate": 1.367267161462963e-06, - "loss": 0.6187, - "step": 46689 - }, - { - "epoch": 1.2, - "learning_rate": 1.3672414246044723e-06, - "loss": 0.6924, - "step": 46690 - }, - { - "epoch": 1.2, - "learning_rate": 1.3672156874648018e-06, - "loss": 0.6299, - "step": 46691 - }, - { - "epoch": 1.2, - "learning_rate": 1.3671899500439712e-06, - "loss": 0.8027, - "step": 46692 - }, - { - "epoch": 1.2, - "learning_rate": 1.367164212342e-06, - "loss": 0.6377, - "step": 46693 - }, - { - "epoch": 1.2, - "learning_rate": 1.367138474358908e-06, - "loss": 0.5796, - "step": 46694 - }, - { - "epoch": 1.2, - "learning_rate": 1.3671127360947153e-06, - "loss": 0.6475, - "step": 46695 - }, - { - "epoch": 1.2, - "learning_rate": 1.3670869975494408e-06, - "loss": 0.709, - "step": 46696 - }, - { - "epoch": 1.2, - "learning_rate": 1.3670612587231051e-06, - "loss": 0.7471, - "step": 46697 - }, - { - "epoch": 1.2, - "learning_rate": 1.367035519615727e-06, - "loss": 0.7358, - "step": 46698 - }, - { - "epoch": 1.2, - "learning_rate": 1.3670097802273272e-06, - "loss": 0.7656, - "step": 46699 - }, - { - "epoch": 1.2, - "learning_rate": 1.3669840405579244e-06, - "loss": 0.7119, - "step": 46700 - }, - { - "epoch": 1.2, - "learning_rate": 1.3669583006075394e-06, - "loss": 0.5219, - "step": 46701 - }, - { - "epoch": 1.2, - "learning_rate": 1.3669325603761908e-06, - "loss": 0.6265, - "step": 46702 - }, - { - "epoch": 1.2, - "learning_rate": 1.366906819863899e-06, - "loss": 0.6655, - "step": 46703 - }, - { - "epoch": 1.2, - "learning_rate": 1.3668810790706835e-06, - "loss": 0.3828, - "step": 46704 - }, - { - "epoch": 1.2, - "learning_rate": 1.3668553379965642e-06, - "loss": 0.7061, - "step": 46705 - }, - { - "epoch": 1.2, - "learning_rate": 1.36682959664156e-06, - "loss": 0.7061, - "step": 46706 - }, - { - "epoch": 1.2, - "learning_rate": 1.366803855005692e-06, - "loss": 0.439, - "step": 46707 - }, - { - "epoch": 1.2, - "learning_rate": 1.3667781130889786e-06, - "loss": 0.7505, - "step": 46708 - }, - { - "epoch": 1.2, - "learning_rate": 1.3667523708914406e-06, - "loss": 0.6689, - "step": 46709 - }, - { - "epoch": 1.2, - "learning_rate": 1.3667266284130967e-06, - "loss": 0.708, - "step": 46710 - }, - { - "epoch": 1.2, - "learning_rate": 1.3667008856539671e-06, - "loss": 0.6545, - "step": 46711 - }, - { - "epoch": 1.2, - "learning_rate": 1.3666751426140716e-06, - "loss": 0.6636, - "step": 46712 - }, - { - "epoch": 1.2, - "learning_rate": 1.3666493992934301e-06, - "loss": 0.749, - "step": 46713 - }, - { - "epoch": 1.2, - "learning_rate": 1.3666236556920616e-06, - "loss": 0.6077, - "step": 46714 - }, - { - "epoch": 1.2, - "learning_rate": 1.3665979118099864e-06, - "loss": 0.6021, - "step": 46715 - }, - { - "epoch": 1.2, - "learning_rate": 1.3665721676472241e-06, - "loss": 0.5234, - "step": 46716 - }, - { - "epoch": 1.2, - "learning_rate": 1.3665464232037941e-06, - "loss": 0.585, - "step": 46717 - }, - { - "epoch": 1.2, - "learning_rate": 1.3665206784797165e-06, - "loss": 0.5115, - "step": 46718 - }, - { - "epoch": 1.2, - "learning_rate": 1.366494933475011e-06, - "loss": 0.6328, - "step": 46719 - }, - { - "epoch": 1.2, - "learning_rate": 1.3664691881896973e-06, - "loss": 0.6339, - "step": 46720 - }, - { - "epoch": 1.2, - "learning_rate": 1.3664434426237944e-06, - "loss": 0.4727, - "step": 46721 - }, - { - "epoch": 1.2, - "learning_rate": 1.3664176967773232e-06, - "loss": 0.5259, - "step": 46722 - }, - { - "epoch": 1.2, - "learning_rate": 1.3663919506503025e-06, - "loss": 0.4097, - "step": 46723 - }, - { - "epoch": 1.2, - "learning_rate": 1.3663662042427526e-06, - "loss": 0.708, - "step": 46724 - }, - { - "epoch": 1.2, - "learning_rate": 1.3663404575546927e-06, - "loss": 0.6729, - "step": 46725 - }, - { - "epoch": 1.2, - "learning_rate": 1.3663147105861427e-06, - "loss": 0.436, - "step": 46726 - }, - { - "epoch": 1.2, - "learning_rate": 1.3662889633371223e-06, - "loss": 0.8047, - "step": 46727 - }, - { - "epoch": 1.2, - "learning_rate": 1.3662632158076517e-06, - "loss": 0.5044, - "step": 46728 - }, - { - "epoch": 1.2, - "learning_rate": 1.3662374679977502e-06, - "loss": 0.5986, - "step": 46729 - }, - { - "epoch": 1.2, - "learning_rate": 1.3662117199074372e-06, - "loss": 0.7764, - "step": 46730 - }, - { - "epoch": 1.2, - "learning_rate": 1.3661859715367328e-06, - "loss": 0.6113, - "step": 46731 - }, - { - "epoch": 1.2, - "learning_rate": 1.3661602228856567e-06, - "loss": 0.7119, - "step": 46732 - }, - { - "epoch": 1.2, - "learning_rate": 1.3661344739542285e-06, - "loss": 0.7549, - "step": 46733 - }, - { - "epoch": 1.2, - "learning_rate": 1.3661087247424678e-06, - "loss": 0.7695, - "step": 46734 - }, - { - "epoch": 1.2, - "learning_rate": 1.366082975250395e-06, - "loss": 0.5557, - "step": 46735 - }, - { - "epoch": 1.2, - "learning_rate": 1.3660572254780286e-06, - "loss": 0.6621, - "step": 46736 - }, - { - "epoch": 1.2, - "learning_rate": 1.3660314754253893e-06, - "loss": 0.6943, - "step": 46737 - }, - { - "epoch": 1.2, - "learning_rate": 1.3660057250924969e-06, - "loss": 0.7568, - "step": 46738 - }, - { - "epoch": 1.2, - "learning_rate": 1.3659799744793704e-06, - "loss": 0.7588, - "step": 46739 - }, - { - "epoch": 1.2, - "learning_rate": 1.3659542235860297e-06, - "loss": 0.6123, - "step": 46740 - }, - { - "epoch": 1.2, - "learning_rate": 1.3659284724124952e-06, - "loss": 0.7676, - "step": 46741 - }, - { - "epoch": 1.2, - "learning_rate": 1.3659027209587854e-06, - "loss": 0.5859, - "step": 46742 - }, - { - "epoch": 1.2, - "learning_rate": 1.3658769692249213e-06, - "loss": 0.6709, - "step": 46743 - }, - { - "epoch": 1.2, - "learning_rate": 1.3658512172109219e-06, - "loss": 0.7363, - "step": 46744 - }, - { - "epoch": 1.2, - "learning_rate": 1.3658254649168068e-06, - "loss": 0.7207, - "step": 46745 - }, - { - "epoch": 1.2, - "learning_rate": 1.3657997123425962e-06, - "loss": 0.6128, - "step": 46746 - }, - { - "epoch": 1.2, - "learning_rate": 1.3657739594883096e-06, - "loss": 0.6465, - "step": 46747 - }, - { - "epoch": 1.2, - "learning_rate": 1.3657482063539662e-06, - "loss": 0.5767, - "step": 46748 - }, - { - "epoch": 1.2, - "learning_rate": 1.365722452939587e-06, - "loss": 0.5449, - "step": 46749 - }, - { - "epoch": 1.2, - "learning_rate": 1.3656966992451903e-06, - "loss": 0.5967, - "step": 46750 - }, - { - "epoch": 1.2, - "learning_rate": 1.365670945270797e-06, - "loss": 0.6099, - "step": 46751 - }, - { - "epoch": 1.2, - "learning_rate": 1.3656451910164257e-06, - "loss": 0.5615, - "step": 46752 - }, - { - "epoch": 1.2, - "learning_rate": 1.3656194364820972e-06, - "loss": 0.5693, - "step": 46753 - }, - { - "epoch": 1.2, - "learning_rate": 1.3655936816678304e-06, - "loss": 0.6504, - "step": 46754 - }, - { - "epoch": 1.2, - "learning_rate": 1.3655679265736455e-06, - "loss": 0.6157, - "step": 46755 - }, - { - "epoch": 1.2, - "learning_rate": 1.3655421711995619e-06, - "loss": 0.6279, - "step": 46756 - }, - { - "epoch": 1.2, - "learning_rate": 1.3655164155455996e-06, - "loss": 0.7109, - "step": 46757 - }, - { - "epoch": 1.2, - "learning_rate": 1.3654906596117778e-06, - "loss": 0.6602, - "step": 46758 - }, - { - "epoch": 1.2, - "learning_rate": 1.365464903398117e-06, - "loss": 0.6299, - "step": 46759 - }, - { - "epoch": 1.2, - "learning_rate": 1.3654391469046367e-06, - "loss": 0.5801, - "step": 46760 - }, - { - "epoch": 1.2, - "learning_rate": 1.3654133901313557e-06, - "loss": 0.5645, - "step": 46761 - }, - { - "epoch": 1.2, - "learning_rate": 1.365387633078295e-06, - "loss": 0.6489, - "step": 46762 - }, - { - "epoch": 1.2, - "learning_rate": 1.3653618757454739e-06, - "loss": 0.7139, - "step": 46763 - }, - { - "epoch": 1.2, - "learning_rate": 1.3653361181329122e-06, - "loss": 0.7197, - "step": 46764 - }, - { - "epoch": 1.2, - "learning_rate": 1.365310360240629e-06, - "loss": 0.6177, - "step": 46765 - }, - { - "epoch": 1.2, - "learning_rate": 1.3652846020686445e-06, - "loss": 0.9541, - "step": 46766 - }, - { - "epoch": 1.2, - "learning_rate": 1.3652588436169783e-06, - "loss": 0.4197, - "step": 46767 - }, - { - "epoch": 1.2, - "learning_rate": 1.3652330848856505e-06, - "loss": 0.6912, - "step": 46768 - }, - { - "epoch": 1.2, - "learning_rate": 1.3652073258746804e-06, - "loss": 0.7207, - "step": 46769 - }, - { - "epoch": 1.2, - "learning_rate": 1.3651815665840878e-06, - "loss": 0.6514, - "step": 46770 - }, - { - "epoch": 1.2, - "learning_rate": 1.3651558070138921e-06, - "loss": 0.666, - "step": 46771 - }, - { - "epoch": 1.2, - "learning_rate": 1.365130047164114e-06, - "loss": 0.5088, - "step": 46772 - }, - { - "epoch": 1.2, - "learning_rate": 1.3651042870347722e-06, - "loss": 0.6636, - "step": 46773 - }, - { - "epoch": 1.2, - "learning_rate": 1.3650785266258874e-06, - "loss": 0.7295, - "step": 46774 - }, - { - "epoch": 1.2, - "learning_rate": 1.3650527659374782e-06, - "loss": 0.6528, - "step": 46775 - }, - { - "epoch": 1.2, - "learning_rate": 1.365027004969565e-06, - "loss": 0.604, - "step": 46776 - }, - { - "epoch": 1.2, - "learning_rate": 1.3650012437221672e-06, - "loss": 0.576, - "step": 46777 - }, - { - "epoch": 1.2, - "learning_rate": 1.3649754821953053e-06, - "loss": 0.6089, - "step": 46778 - }, - { - "epoch": 1.2, - "learning_rate": 1.364949720388998e-06, - "loss": 0.7129, - "step": 46779 - }, - { - "epoch": 1.2, - "learning_rate": 1.3649239583032655e-06, - "loss": 0.6147, - "step": 46780 - }, - { - "epoch": 1.2, - "learning_rate": 1.3648981959381277e-06, - "loss": 0.791, - "step": 46781 - }, - { - "epoch": 1.2, - "learning_rate": 1.3648724332936042e-06, - "loss": 0.791, - "step": 46782 - }, - { - "epoch": 1.2, - "learning_rate": 1.3648466703697144e-06, - "loss": 0.5728, - "step": 46783 - }, - { - "epoch": 1.2, - "learning_rate": 1.3648209071664782e-06, - "loss": 0.752, - "step": 46784 - }, - { - "epoch": 1.2, - "learning_rate": 1.364795143683916e-06, - "loss": 0.7148, - "step": 46785 - }, - { - "epoch": 1.2, - "learning_rate": 1.364769379922046e-06, - "loss": 0.7109, - "step": 46786 - }, - { - "epoch": 1.2, - "learning_rate": 1.3647436158808897e-06, - "loss": 0.8301, - "step": 46787 - }, - { - "epoch": 1.2, - "learning_rate": 1.3647178515604653e-06, - "loss": 0.625, - "step": 46788 - }, - { - "epoch": 1.2, - "learning_rate": 1.3646920869607938e-06, - "loss": 0.7188, - "step": 46789 - }, - { - "epoch": 1.2, - "learning_rate": 1.3646663220818942e-06, - "loss": 0.6704, - "step": 46790 - }, - { - "epoch": 1.2, - "learning_rate": 1.3646405569237862e-06, - "loss": 0.8359, - "step": 46791 - }, - { - "epoch": 1.2, - "learning_rate": 1.3646147914864896e-06, - "loss": 0.7075, - "step": 46792 - }, - { - "epoch": 1.2, - "learning_rate": 1.3645890257700244e-06, - "loss": 0.6934, - "step": 46793 - }, - { - "epoch": 1.2, - "learning_rate": 1.3645632597744103e-06, - "loss": 0.6387, - "step": 46794 - }, - { - "epoch": 1.2, - "learning_rate": 1.3645374934996668e-06, - "loss": 0.7222, - "step": 46795 - }, - { - "epoch": 1.2, - "learning_rate": 1.3645117269458135e-06, - "loss": 0.6108, - "step": 46796 - }, - { - "epoch": 1.2, - "learning_rate": 1.3644859601128704e-06, - "loss": 0.6338, - "step": 46797 - }, - { - "epoch": 1.2, - "learning_rate": 1.364460193000857e-06, - "loss": 0.7402, - "step": 46798 - }, - { - "epoch": 1.2, - "learning_rate": 1.3644344256097937e-06, - "loss": 0.7793, - "step": 46799 - }, - { - "epoch": 1.2, - "learning_rate": 1.3644086579396994e-06, - "loss": 0.6265, - "step": 46800 - }, - { - "epoch": 1.2, - "learning_rate": 1.3643828899905941e-06, - "loss": 0.6504, - "step": 46801 - }, - { - "epoch": 1.2, - "learning_rate": 1.3643571217624974e-06, - "loss": 0.6719, - "step": 46802 - }, - { - "epoch": 1.2, - "learning_rate": 1.3643313532554297e-06, - "loss": 0.5928, - "step": 46803 - }, - { - "epoch": 1.2, - "learning_rate": 1.36430558446941e-06, - "loss": 0.6504, - "step": 46804 - }, - { - "epoch": 1.2, - "learning_rate": 1.3642798154044582e-06, - "loss": 0.5654, - "step": 46805 - }, - { - "epoch": 1.2, - "learning_rate": 1.364254046060594e-06, - "loss": 0.6245, - "step": 46806 - }, - { - "epoch": 1.2, - "learning_rate": 1.3642282764378371e-06, - "loss": 0.6802, - "step": 46807 - }, - { - "epoch": 1.2, - "learning_rate": 1.3642025065362078e-06, - "loss": 0.5396, - "step": 46808 - }, - { - "epoch": 1.2, - "learning_rate": 1.3641767363557254e-06, - "loss": 0.6318, - "step": 46809 - }, - { - "epoch": 1.2, - "learning_rate": 1.3641509658964094e-06, - "loss": 0.6104, - "step": 46810 - }, - { - "epoch": 1.2, - "learning_rate": 1.3641251951582798e-06, - "loss": 0.4448, - "step": 46811 - }, - { - "epoch": 1.2, - "learning_rate": 1.364099424141356e-06, - "loss": 0.3718, - "step": 46812 - }, - { - "epoch": 1.2, - "learning_rate": 1.3640736528456581e-06, - "loss": 0.645, - "step": 46813 - }, - { - "epoch": 1.2, - "learning_rate": 1.3640478812712063e-06, - "loss": 0.5898, - "step": 46814 - }, - { - "epoch": 1.2, - "learning_rate": 1.3640221094180193e-06, - "loss": 0.6924, - "step": 46815 - }, - { - "epoch": 1.2, - "learning_rate": 1.3639963372861175e-06, - "loss": 0.6274, - "step": 46816 - }, - { - "epoch": 1.2, - "learning_rate": 1.3639705648755203e-06, - "loss": 0.4985, - "step": 46817 - }, - { - "epoch": 1.2, - "learning_rate": 1.3639447921862476e-06, - "loss": 0.5876, - "step": 46818 - }, - { - "epoch": 1.2, - "learning_rate": 1.363919019218319e-06, - "loss": 0.6943, - "step": 46819 - }, - { - "epoch": 1.2, - "learning_rate": 1.3638932459717547e-06, - "loss": 0.6953, - "step": 46820 - }, - { - "epoch": 1.2, - "learning_rate": 1.3638674724465737e-06, - "loss": 0.7061, - "step": 46821 - }, - { - "epoch": 1.2, - "learning_rate": 1.3638416986427964e-06, - "loss": 0.7285, - "step": 46822 - }, - { - "epoch": 1.2, - "learning_rate": 1.3638159245604416e-06, - "loss": 0.5811, - "step": 46823 - }, - { - "epoch": 1.2, - "learning_rate": 1.3637901501995303e-06, - "loss": 0.5562, - "step": 46824 - }, - { - "epoch": 1.2, - "learning_rate": 1.3637643755600817e-06, - "loss": 0.6602, - "step": 46825 - }, - { - "epoch": 1.2, - "learning_rate": 1.363738600642115e-06, - "loss": 0.5479, - "step": 46826 - }, - { - "epoch": 1.2, - "learning_rate": 1.3637128254456507e-06, - "loss": 0.5669, - "step": 46827 - }, - { - "epoch": 1.2, - "learning_rate": 1.3636870499707081e-06, - "loss": 0.6118, - "step": 46828 - }, - { - "epoch": 1.2, - "learning_rate": 1.363661274217307e-06, - "loss": 0.626, - "step": 46829 - }, - { - "epoch": 1.2, - "learning_rate": 1.3636354981854672e-06, - "loss": 0.5923, - "step": 46830 - }, - { - "epoch": 1.2, - "learning_rate": 1.3636097218752086e-06, - "loss": 0.7354, - "step": 46831 - }, - { - "epoch": 1.2, - "learning_rate": 1.3635839452865505e-06, - "loss": 0.6763, - "step": 46832 - }, - { - "epoch": 1.2, - "learning_rate": 1.3635581684195132e-06, - "loss": 0.6533, - "step": 46833 - }, - { - "epoch": 1.2, - "learning_rate": 1.3635323912741158e-06, - "loss": 0.8633, - "step": 46834 - }, - { - "epoch": 1.2, - "learning_rate": 1.3635066138503786e-06, - "loss": 0.7139, - "step": 46835 - }, - { - "epoch": 1.2, - "learning_rate": 1.3634808361483209e-06, - "loss": 0.5557, - "step": 46836 - }, - { - "epoch": 1.2, - "learning_rate": 1.3634550581679628e-06, - "loss": 0.7437, - "step": 46837 - }, - { - "epoch": 1.2, - "learning_rate": 1.3634292799093237e-06, - "loss": 0.8486, - "step": 46838 - }, - { - "epoch": 1.2, - "learning_rate": 1.3634035013724237e-06, - "loss": 0.6641, - "step": 46839 - }, - { - "epoch": 1.2, - "learning_rate": 1.3633777225572823e-06, - "loss": 0.4103, - "step": 46840 - }, - { - "epoch": 1.2, - "learning_rate": 1.363351943463919e-06, - "loss": 0.751, - "step": 46841 - }, - { - "epoch": 1.2, - "learning_rate": 1.363326164092354e-06, - "loss": 0.7246, - "step": 46842 - }, - { - "epoch": 1.2, - "learning_rate": 1.363300384442607e-06, - "loss": 0.8174, - "step": 46843 - }, - { - "epoch": 1.2, - "learning_rate": 1.3632746045146976e-06, - "loss": 0.5508, - "step": 46844 - }, - { - "epoch": 1.2, - "learning_rate": 1.3632488243086455e-06, - "loss": 0.6362, - "step": 46845 - }, - { - "epoch": 1.2, - "learning_rate": 1.3632230438244703e-06, - "loss": 0.532, - "step": 46846 - }, - { - "epoch": 1.2, - "learning_rate": 1.3631972630621922e-06, - "loss": 0.5852, - "step": 46847 - }, - { - "epoch": 1.2, - "learning_rate": 1.3631714820218308e-06, - "loss": 0.7285, - "step": 46848 - }, - { - "epoch": 1.2, - "learning_rate": 1.363145700703405e-06, - "loss": 0.627, - "step": 46849 - }, - { - "epoch": 1.2, - "learning_rate": 1.3631199191069359e-06, - "loss": 0.5933, - "step": 46850 - }, - { - "epoch": 1.2, - "learning_rate": 1.363094137232442e-06, - "loss": 0.6777, - "step": 46851 - }, - { - "epoch": 1.2, - "learning_rate": 1.3630683550799442e-06, - "loss": 0.6523, - "step": 46852 - }, - { - "epoch": 1.2, - "learning_rate": 1.3630425726494614e-06, - "loss": 0.5942, - "step": 46853 - }, - { - "epoch": 1.2, - "learning_rate": 1.3630167899410137e-06, - "loss": 0.7329, - "step": 46854 - }, - { - "epoch": 1.2, - "learning_rate": 1.3629910069546204e-06, - "loss": 0.7393, - "step": 46855 - }, - { - "epoch": 1.2, - "learning_rate": 1.362965223690302e-06, - "loss": 0.6484, - "step": 46856 - }, - { - "epoch": 1.2, - "learning_rate": 1.3629394401480773e-06, - "loss": 0.6719, - "step": 46857 - }, - { - "epoch": 1.2, - "learning_rate": 1.3629136563279672e-06, - "loss": 0.667, - "step": 46858 - }, - { - "epoch": 1.2, - "learning_rate": 1.3628878722299904e-06, - "loss": 0.584, - "step": 46859 - }, - { - "epoch": 1.2, - "learning_rate": 1.3628620878541672e-06, - "loss": 0.6504, - "step": 46860 - }, - { - "epoch": 1.2, - "learning_rate": 1.362836303200517e-06, - "loss": 0.5942, - "step": 46861 - }, - { - "epoch": 1.2, - "learning_rate": 1.36281051826906e-06, - "loss": 0.6016, - "step": 46862 - }, - { - "epoch": 1.2, - "learning_rate": 1.3627847330598154e-06, - "loss": 0.7119, - "step": 46863 - }, - { - "epoch": 1.2, - "learning_rate": 1.3627589475728034e-06, - "loss": 0.791, - "step": 46864 - }, - { - "epoch": 1.2, - "learning_rate": 1.3627331618080434e-06, - "loss": 0.5581, - "step": 46865 - }, - { - "epoch": 1.2, - "learning_rate": 1.3627073757655554e-06, - "loss": 0.6006, - "step": 46866 - }, - { - "epoch": 1.2, - "learning_rate": 1.362681589445359e-06, - "loss": 0.5942, - "step": 46867 - }, - { - "epoch": 1.2, - "learning_rate": 1.362655802847474e-06, - "loss": 0.707, - "step": 46868 - }, - { - "epoch": 1.2, - "learning_rate": 1.36263001597192e-06, - "loss": 0.7217, - "step": 46869 - }, - { - "epoch": 1.2, - "learning_rate": 1.362604228818717e-06, - "loss": 0.6836, - "step": 46870 - }, - { - "epoch": 1.2, - "learning_rate": 1.3625784413878845e-06, - "loss": 0.7319, - "step": 46871 - }, - { - "epoch": 1.2, - "learning_rate": 1.3625526536794426e-06, - "loss": 0.7637, - "step": 46872 - }, - { - "epoch": 1.2, - "learning_rate": 1.3625268656934108e-06, - "loss": 0.6904, - "step": 46873 - }, - { - "epoch": 1.2, - "learning_rate": 1.3625010774298085e-06, - "loss": 0.6865, - "step": 46874 - }, - { - "epoch": 1.2, - "learning_rate": 1.3624752888886562e-06, - "loss": 0.8066, - "step": 46875 - }, - { - "epoch": 1.2, - "learning_rate": 1.3624495000699728e-06, - "loss": 0.6611, - "step": 46876 - }, - { - "epoch": 1.2, - "learning_rate": 1.3624237109737788e-06, - "loss": 0.7305, - "step": 46877 - }, - { - "epoch": 1.2, - "learning_rate": 1.3623979216000937e-06, - "loss": 0.6821, - "step": 46878 - }, - { - "epoch": 1.2, - "learning_rate": 1.362372131948937e-06, - "loss": 0.5469, - "step": 46879 - }, - { - "epoch": 1.2, - "learning_rate": 1.3623463420203284e-06, - "loss": 0.792, - "step": 46880 - }, - { - "epoch": 1.2, - "learning_rate": 1.3623205518142883e-06, - "loss": 0.6904, - "step": 46881 - }, - { - "epoch": 1.2, - "learning_rate": 1.3622947613308358e-06, - "loss": 0.6797, - "step": 46882 - }, - { - "epoch": 1.2, - "learning_rate": 1.362268970569991e-06, - "loss": 0.772, - "step": 46883 - }, - { - "epoch": 1.2, - "learning_rate": 1.3622431795317733e-06, - "loss": 0.6465, - "step": 46884 - }, - { - "epoch": 1.2, - "learning_rate": 1.3622173882162029e-06, - "loss": 0.5469, - "step": 46885 - }, - { - "epoch": 1.2, - "learning_rate": 1.3621915966232988e-06, - "loss": 0.7476, - "step": 46886 - }, - { - "epoch": 1.2, - "learning_rate": 1.362165804753082e-06, - "loss": 0.7334, - "step": 46887 - }, - { - "epoch": 1.2, - "learning_rate": 1.362140012605571e-06, - "loss": 0.6631, - "step": 46888 - }, - { - "epoch": 1.2, - "learning_rate": 1.362114220180786e-06, - "loss": 0.6714, - "step": 46889 - }, - { - "epoch": 1.2, - "learning_rate": 1.362088427478747e-06, - "loss": 0.7295, - "step": 46890 - }, - { - "epoch": 1.2, - "learning_rate": 1.3620626344994738e-06, - "loss": 0.6694, - "step": 46891 - }, - { - "epoch": 1.2, - "learning_rate": 1.3620368412429853e-06, - "loss": 0.7129, - "step": 46892 - }, - { - "epoch": 1.2, - "learning_rate": 1.362011047709302e-06, - "loss": 0.7061, - "step": 46893 - }, - { - "epoch": 1.2, - "learning_rate": 1.3619852538984438e-06, - "loss": 0.5574, - "step": 46894 - }, - { - "epoch": 1.2, - "learning_rate": 1.3619594598104297e-06, - "loss": 0.6304, - "step": 46895 - }, - { - "epoch": 1.2, - "learning_rate": 1.3619336654452802e-06, - "loss": 0.5562, - "step": 46896 - }, - { - "epoch": 1.2, - "learning_rate": 1.3619078708030146e-06, - "loss": 0.7402, - "step": 46897 - }, - { - "epoch": 1.2, - "learning_rate": 1.361882075883653e-06, - "loss": 0.6025, - "step": 46898 - }, - { - "epoch": 1.2, - "learning_rate": 1.3618562806872146e-06, - "loss": 0.6553, - "step": 46899 - }, - { - "epoch": 1.2, - "learning_rate": 1.3618304852137197e-06, - "loss": 0.7783, - "step": 46900 - }, - { - "epoch": 1.2, - "learning_rate": 1.3618046894631877e-06, - "loss": 0.6948, - "step": 46901 - }, - { - "epoch": 1.2, - "learning_rate": 1.3617788934356386e-06, - "loss": 0.5688, - "step": 46902 - }, - { - "epoch": 1.2, - "learning_rate": 1.3617530971310922e-06, - "loss": 0.5547, - "step": 46903 - }, - { - "epoch": 1.2, - "learning_rate": 1.361727300549568e-06, - "loss": 0.7344, - "step": 46904 - }, - { - "epoch": 1.2, - "learning_rate": 1.3617015036910856e-06, - "loss": 0.4812, - "step": 46905 - }, - { - "epoch": 1.2, - "learning_rate": 1.361675706555665e-06, - "loss": 0.7012, - "step": 46906 - }, - { - "epoch": 1.2, - "learning_rate": 1.361649909143326e-06, - "loss": 0.6345, - "step": 46907 - }, - { - "epoch": 1.2, - "learning_rate": 1.3616241114540886e-06, - "loss": 0.6333, - "step": 46908 - }, - { - "epoch": 1.2, - "learning_rate": 1.3615983134879718e-06, - "loss": 0.6357, - "step": 46909 - }, - { - "epoch": 1.2, - "learning_rate": 1.3615725152449962e-06, - "loss": 0.7002, - "step": 46910 - }, - { - "epoch": 1.2, - "learning_rate": 1.3615467167251805e-06, - "loss": 0.6689, - "step": 46911 - }, - { - "epoch": 1.2, - "learning_rate": 1.3615209179285459e-06, - "loss": 0.6602, - "step": 46912 - }, - { - "epoch": 1.2, - "learning_rate": 1.3614951188551112e-06, - "loss": 0.668, - "step": 46913 - }, - { - "epoch": 1.2, - "learning_rate": 1.3614693195048958e-06, - "loss": 0.667, - "step": 46914 - }, - { - "epoch": 1.2, - "learning_rate": 1.3614435198779204e-06, - "loss": 0.7075, - "step": 46915 - }, - { - "epoch": 1.2, - "learning_rate": 1.3614177199742042e-06, - "loss": 0.5098, - "step": 46916 - }, - { - "epoch": 1.2, - "learning_rate": 1.3613919197937669e-06, - "loss": 0.6638, - "step": 46917 - }, - { - "epoch": 1.2, - "learning_rate": 1.361366119336629e-06, - "loss": 0.575, - "step": 46918 - }, - { - "epoch": 1.2, - "learning_rate": 1.361340318602809e-06, - "loss": 0.6538, - "step": 46919 - }, - { - "epoch": 1.2, - "learning_rate": 1.3613145175923274e-06, - "loss": 0.666, - "step": 46920 - }, - { - "epoch": 1.2, - "learning_rate": 1.3612887163052043e-06, - "loss": 0.7324, - "step": 46921 - }, - { - "epoch": 1.2, - "learning_rate": 1.3612629147414587e-06, - "loss": 0.4885, - "step": 46922 - }, - { - "epoch": 1.2, - "learning_rate": 1.361237112901111e-06, - "loss": 0.488, - "step": 46923 - }, - { - "epoch": 1.2, - "learning_rate": 1.3612113107841805e-06, - "loss": 0.7188, - "step": 46924 - }, - { - "epoch": 1.2, - "learning_rate": 1.361185508390687e-06, - "loss": 0.4207, - "step": 46925 - }, - { - "epoch": 1.2, - "learning_rate": 1.3611597057206504e-06, - "loss": 0.6123, - "step": 46926 - }, - { - "epoch": 1.2, - "learning_rate": 1.3611339027740904e-06, - "loss": 0.8213, - "step": 46927 - }, - { - "epoch": 1.2, - "learning_rate": 1.3611080995510271e-06, - "loss": 0.6035, - "step": 46928 - }, - { - "epoch": 1.2, - "learning_rate": 1.3610822960514796e-06, - "loss": 0.6914, - "step": 46929 - }, - { - "epoch": 1.2, - "learning_rate": 1.361056492275468e-06, - "loss": 0.5552, - "step": 46930 - }, - { - "epoch": 1.2, - "learning_rate": 1.3610306882230122e-06, - "loss": 0.6323, - "step": 46931 - }, - { - "epoch": 1.2, - "learning_rate": 1.3610048838941316e-06, - "loss": 0.6562, - "step": 46932 - }, - { - "epoch": 1.2, - "learning_rate": 1.3609790792888465e-06, - "loss": 0.7246, - "step": 46933 - }, - { - "epoch": 1.2, - "learning_rate": 1.3609532744071758e-06, - "loss": 0.6978, - "step": 46934 - }, - { - "epoch": 1.2, - "learning_rate": 1.3609274692491403e-06, - "loss": 0.5278, - "step": 46935 - }, - { - "epoch": 1.2, - "learning_rate": 1.3609016638147588e-06, - "loss": 0.6846, - "step": 46936 - }, - { - "epoch": 1.2, - "learning_rate": 1.360875858104052e-06, - "loss": 0.7021, - "step": 46937 - }, - { - "epoch": 1.2, - "learning_rate": 1.3608500521170388e-06, - "loss": 0.4946, - "step": 46938 - }, - { - "epoch": 1.2, - "learning_rate": 1.360824245853739e-06, - "loss": 0.6367, - "step": 46939 - }, - { - "epoch": 1.2, - "learning_rate": 1.3607984393141733e-06, - "loss": 0.6372, - "step": 46940 - }, - { - "epoch": 1.2, - "learning_rate": 1.3607726324983603e-06, - "loss": 0.5531, - "step": 46941 - }, - { - "epoch": 1.2, - "learning_rate": 1.3607468254063207e-06, - "loss": 0.6709, - "step": 46942 - }, - { - "epoch": 1.2, - "learning_rate": 1.3607210180380737e-06, - "loss": 0.6621, - "step": 46943 - }, - { - "epoch": 1.2, - "learning_rate": 1.3606952103936392e-06, - "loss": 0.6455, - "step": 46944 - }, - { - "epoch": 1.2, - "learning_rate": 1.360669402473037e-06, - "loss": 0.7725, - "step": 46945 - }, - { - "epoch": 1.2, - "learning_rate": 1.3606435942762868e-06, - "loss": 0.6943, - "step": 46946 - }, - { - "epoch": 1.2, - "learning_rate": 1.360617785803408e-06, - "loss": 0.7188, - "step": 46947 - }, - { - "epoch": 1.2, - "learning_rate": 1.3605919770544214e-06, - "loss": 0.7578, - "step": 46948 - }, - { - "epoch": 1.2, - "learning_rate": 1.360566168029346e-06, - "loss": 0.624, - "step": 46949 - }, - { - "epoch": 1.2, - "learning_rate": 1.3605403587282012e-06, - "loss": 0.6367, - "step": 46950 - }, - { - "epoch": 1.2, - "learning_rate": 1.3605145491510074e-06, - "loss": 0.5203, - "step": 46951 - }, - { - "epoch": 1.2, - "learning_rate": 1.3604887392977844e-06, - "loss": 0.8994, - "step": 46952 - }, - { - "epoch": 1.2, - "learning_rate": 1.3604629291685518e-06, - "loss": 0.6436, - "step": 46953 - }, - { - "epoch": 1.2, - "learning_rate": 1.360437118763329e-06, - "loss": 0.6846, - "step": 46954 - }, - { - "epoch": 1.2, - "learning_rate": 1.360411308082136e-06, - "loss": 0.6514, - "step": 46955 - }, - { - "epoch": 1.2, - "learning_rate": 1.360385497124993e-06, - "loss": 0.7546, - "step": 46956 - }, - { - "epoch": 1.2, - "learning_rate": 1.360359685891919e-06, - "loss": 0.647, - "step": 46957 - }, - { - "epoch": 1.2, - "learning_rate": 1.3603338743829345e-06, - "loss": 0.5474, - "step": 46958 - }, - { - "epoch": 1.2, - "learning_rate": 1.360308062598059e-06, - "loss": 0.6582, - "step": 46959 - }, - { - "epoch": 1.2, - "learning_rate": 1.3602822505373117e-06, - "loss": 0.6787, - "step": 46960 - }, - { - "epoch": 1.2, - "learning_rate": 1.3602564382007132e-06, - "loss": 0.6343, - "step": 46961 - }, - { - "epoch": 1.2, - "learning_rate": 1.360230625588283e-06, - "loss": 0.6445, - "step": 46962 - }, - { - "epoch": 1.2, - "learning_rate": 1.3602048127000405e-06, - "loss": 0.7959, - "step": 46963 - }, - { - "epoch": 1.2, - "learning_rate": 1.3601789995360057e-06, - "loss": 0.626, - "step": 46964 - }, - { - "epoch": 1.2, - "learning_rate": 1.3601531860961987e-06, - "loss": 0.6055, - "step": 46965 - }, - { - "epoch": 1.2, - "learning_rate": 1.3601273723806387e-06, - "loss": 0.4773, - "step": 46966 - }, - { - "epoch": 1.2, - "learning_rate": 1.360101558389346e-06, - "loss": 0.5835, - "step": 46967 - }, - { - "epoch": 1.2, - "learning_rate": 1.3600757441223402e-06, - "loss": 0.7969, - "step": 46968 - }, - { - "epoch": 1.2, - "learning_rate": 1.3600499295796406e-06, - "loss": 0.625, - "step": 46969 - }, - { - "epoch": 1.2, - "learning_rate": 1.3600241147612672e-06, - "loss": 0.6694, - "step": 46970 - }, - { - "epoch": 1.2, - "learning_rate": 1.3599982996672404e-06, - "loss": 0.6919, - "step": 46971 - }, - { - "epoch": 1.2, - "learning_rate": 1.3599724842975788e-06, - "loss": 0.5168, - "step": 46972 - }, - { - "epoch": 1.2, - "learning_rate": 1.3599466686523037e-06, - "loss": 0.7607, - "step": 46973 - }, - { - "epoch": 1.2, - "learning_rate": 1.3599208527314332e-06, - "loss": 0.6914, - "step": 46974 - }, - { - "epoch": 1.2, - "learning_rate": 1.3598950365349882e-06, - "loss": 0.7266, - "step": 46975 - }, - { - "epoch": 1.2, - "learning_rate": 1.359869220062988e-06, - "loss": 0.5884, - "step": 46976 - }, - { - "epoch": 1.2, - "learning_rate": 1.3598434033154527e-06, - "loss": 0.5507, - "step": 46977 - }, - { - "epoch": 1.2, - "learning_rate": 1.3598175862924016e-06, - "loss": 0.5356, - "step": 46978 - }, - { - "epoch": 1.2, - "learning_rate": 1.3597917689938548e-06, - "loss": 0.6768, - "step": 46979 - }, - { - "epoch": 1.2, - "learning_rate": 1.3597659514198318e-06, - "loss": 0.6074, - "step": 46980 - }, - { - "epoch": 1.2, - "learning_rate": 1.359740133570353e-06, - "loss": 0.6445, - "step": 46981 - }, - { - "epoch": 1.2, - "learning_rate": 1.3597143154454373e-06, - "loss": 0.5713, - "step": 46982 - }, - { - "epoch": 1.2, - "learning_rate": 1.3596884970451053e-06, - "loss": 0.6763, - "step": 46983 - }, - { - "epoch": 1.2, - "learning_rate": 1.3596626783693758e-06, - "loss": 0.5283, - "step": 46984 - }, - { - "epoch": 1.2, - "learning_rate": 1.3596368594182694e-06, - "loss": 0.7803, - "step": 46985 - }, - { - "epoch": 1.2, - "learning_rate": 1.3596110401918058e-06, - "loss": 0.7588, - "step": 46986 - }, - { - "epoch": 1.2, - "learning_rate": 1.3595852206900043e-06, - "loss": 0.676, - "step": 46987 - }, - { - "epoch": 1.2, - "learning_rate": 1.3595594009128853e-06, - "loss": 0.7227, - "step": 46988 - }, - { - "epoch": 1.2, - "learning_rate": 1.3595335808604679e-06, - "loss": 0.6377, - "step": 46989 - }, - { - "epoch": 1.2, - "learning_rate": 1.3595077605327721e-06, - "loss": 0.4775, - "step": 46990 - }, - { - "epoch": 1.2, - "learning_rate": 1.3594819399298176e-06, - "loss": 0.8164, - "step": 46991 - }, - { - "epoch": 1.2, - "learning_rate": 1.3594561190516248e-06, - "loss": 0.7246, - "step": 46992 - }, - { - "epoch": 1.2, - "learning_rate": 1.3594302978982128e-06, - "loss": 0.6123, - "step": 46993 - }, - { - "epoch": 1.2, - "learning_rate": 1.3594044764696016e-06, - "loss": 0.6929, - "step": 46994 - }, - { - "epoch": 1.2, - "learning_rate": 1.3593786547658107e-06, - "loss": 0.5942, - "step": 46995 - }, - { - "epoch": 1.2, - "learning_rate": 1.3593528327868602e-06, - "loss": 0.8545, - "step": 46996 - }, - { - "epoch": 1.2, - "learning_rate": 1.3593270105327695e-06, - "loss": 0.5234, - "step": 46997 - }, - { - "epoch": 1.2, - "learning_rate": 1.3593011880035592e-06, - "loss": 0.4441, - "step": 46998 - }, - { - "epoch": 1.2, - "learning_rate": 1.359275365199248e-06, - "loss": 0.7852, - "step": 46999 - }, - { - "epoch": 1.2, - "learning_rate": 1.3592495421198562e-06, - "loss": 0.7559, - "step": 47000 - }, - { - "epoch": 1.2, - "learning_rate": 1.3592237187654036e-06, - "loss": 0.6914, - "step": 47001 - }, - { - "epoch": 1.2, - "learning_rate": 1.3591978951359102e-06, - "loss": 0.7178, - "step": 47002 - }, - { - "epoch": 1.2, - "learning_rate": 1.3591720712313955e-06, - "loss": 0.7744, - "step": 47003 - }, - { - "epoch": 1.2, - "learning_rate": 1.3591462470518788e-06, - "loss": 0.6797, - "step": 47004 - }, - { - "epoch": 1.2, - "learning_rate": 1.3591204225973804e-06, - "loss": 0.6289, - "step": 47005 - }, - { - "epoch": 1.2, - "learning_rate": 1.3590945978679202e-06, - "loss": 0.6753, - "step": 47006 - }, - { - "epoch": 1.2, - "learning_rate": 1.3590687728635177e-06, - "loss": 0.6997, - "step": 47007 - }, - { - "epoch": 1.2, - "learning_rate": 1.359042947584193e-06, - "loss": 0.6108, - "step": 47008 - }, - { - "epoch": 1.2, - "learning_rate": 1.3590171220299656e-06, - "loss": 0.563, - "step": 47009 - }, - { - "epoch": 1.2, - "learning_rate": 1.358991296200855e-06, - "loss": 0.6289, - "step": 47010 - }, - { - "epoch": 1.2, - "learning_rate": 1.3589654700968814e-06, - "loss": 0.6914, - "step": 47011 - }, - { - "epoch": 1.2, - "learning_rate": 1.3589396437180645e-06, - "loss": 0.833, - "step": 47012 - }, - { - "epoch": 1.2, - "learning_rate": 1.3589138170644241e-06, - "loss": 0.5352, - "step": 47013 - }, - { - "epoch": 1.2, - "learning_rate": 1.3588879901359796e-06, - "loss": 0.5586, - "step": 47014 - }, - { - "epoch": 1.21, - "learning_rate": 1.3588621629327514e-06, - "loss": 0.708, - "step": 47015 - }, - { - "epoch": 1.21, - "learning_rate": 1.3588363354547584e-06, - "loss": 0.5698, - "step": 47016 - }, - { - "epoch": 1.21, - "learning_rate": 1.3588105077020215e-06, - "loss": 0.6875, - "step": 47017 - }, - { - "epoch": 1.21, - "learning_rate": 1.3587846796745597e-06, - "loss": 0.5615, - "step": 47018 - }, - { - "epoch": 1.21, - "learning_rate": 1.358758851372393e-06, - "loss": 0.7754, - "step": 47019 - }, - { - "epoch": 1.21, - "learning_rate": 1.3587330227955411e-06, - "loss": 0.6763, - "step": 47020 - }, - { - "epoch": 1.21, - "learning_rate": 1.3587071939440237e-06, - "loss": 0.5547, - "step": 47021 - }, - { - "epoch": 1.21, - "learning_rate": 1.3586813648178609e-06, - "loss": 0.6724, - "step": 47022 - }, - { - "epoch": 1.21, - "learning_rate": 1.3586555354170722e-06, - "loss": 0.7588, - "step": 47023 - }, - { - "epoch": 1.21, - "learning_rate": 1.3586297057416776e-06, - "loss": 0.7246, - "step": 47024 - }, - { - "epoch": 1.21, - "learning_rate": 1.3586038757916965e-06, - "loss": 0.5735, - "step": 47025 - }, - { - "epoch": 1.21, - "learning_rate": 1.3585780455671488e-06, - "loss": 0.4934, - "step": 47026 - }, - { - "epoch": 1.21, - "learning_rate": 1.3585522150680546e-06, - "loss": 0.7471, - "step": 47027 - }, - { - "epoch": 1.21, - "learning_rate": 1.3585263842944335e-06, - "loss": 0.6387, - "step": 47028 - }, - { - "epoch": 1.21, - "learning_rate": 1.3585005532463049e-06, - "loss": 0.4403, - "step": 47029 - }, - { - "epoch": 1.21, - "learning_rate": 1.3584747219236893e-06, - "loss": 0.7129, - "step": 47030 - }, - { - "epoch": 1.21, - "learning_rate": 1.3584488903266058e-06, - "loss": 0.6177, - "step": 47031 - }, - { - "epoch": 1.21, - "learning_rate": 1.3584230584550746e-06, - "loss": 0.7197, - "step": 47032 - }, - { - "epoch": 1.21, - "learning_rate": 1.3583972263091154e-06, - "loss": 0.5186, - "step": 47033 - }, - { - "epoch": 1.21, - "learning_rate": 1.358371393888748e-06, - "loss": 0.4417, - "step": 47034 - }, - { - "epoch": 1.21, - "learning_rate": 1.3583455611939917e-06, - "loss": 0.7139, - "step": 47035 - }, - { - "epoch": 1.21, - "learning_rate": 1.358319728224867e-06, - "loss": 0.6826, - "step": 47036 - }, - { - "epoch": 1.21, - "learning_rate": 1.3582938949813934e-06, - "loss": 0.7314, - "step": 47037 - }, - { - "epoch": 1.21, - "learning_rate": 1.358268061463591e-06, - "loss": 0.5228, - "step": 47038 - }, - { - "epoch": 1.21, - "learning_rate": 1.3582422276714783e-06, - "loss": 0.749, - "step": 47039 - }, - { - "epoch": 1.21, - "learning_rate": 1.3582163936050765e-06, - "loss": 0.6084, - "step": 47040 - }, - { - "epoch": 1.21, - "learning_rate": 1.3581905592644046e-06, - "loss": 0.5762, - "step": 47041 - }, - { - "epoch": 1.21, - "learning_rate": 1.3581647246494832e-06, - "loss": 0.5703, - "step": 47042 - }, - { - "epoch": 1.21, - "learning_rate": 1.3581388897603312e-06, - "loss": 0.6533, - "step": 47043 - }, - { - "epoch": 1.21, - "learning_rate": 1.358113054596969e-06, - "loss": 0.4531, - "step": 47044 - }, - { - "epoch": 1.21, - "learning_rate": 1.3580872191594157e-06, - "loss": 0.7227, - "step": 47045 - }, - { - "epoch": 1.21, - "learning_rate": 1.3580613834476916e-06, - "loss": 0.6797, - "step": 47046 - }, - { - "epoch": 1.21, - "learning_rate": 1.3580355474618164e-06, - "loss": 0.665, - "step": 47047 - }, - { - "epoch": 1.21, - "learning_rate": 1.3580097112018098e-06, - "loss": 0.6621, - "step": 47048 - }, - { - "epoch": 1.21, - "learning_rate": 1.3579838746676916e-06, - "loss": 0.564, - "step": 47049 - }, - { - "epoch": 1.21, - "learning_rate": 1.3579580378594817e-06, - "loss": 0.3911, - "step": 47050 - }, - { - "epoch": 1.21, - "learning_rate": 1.3579322007771998e-06, - "loss": 0.749, - "step": 47051 - }, - { - "epoch": 1.21, - "learning_rate": 1.3579063634208655e-06, - "loss": 0.5708, - "step": 47052 - }, - { - "epoch": 1.21, - "learning_rate": 1.3578805257904994e-06, - "loss": 0.5405, - "step": 47053 - }, - { - "epoch": 1.21, - "learning_rate": 1.3578546878861197e-06, - "loss": 0.7578, - "step": 47054 - }, - { - "epoch": 1.21, - "learning_rate": 1.3578288497077478e-06, - "loss": 0.6025, - "step": 47055 - }, - { - "epoch": 1.21, - "learning_rate": 1.3578030112554024e-06, - "loss": 0.7285, - "step": 47056 - }, - { - "epoch": 1.21, - "learning_rate": 1.357777172529104e-06, - "loss": 0.6709, - "step": 47057 - }, - { - "epoch": 1.21, - "learning_rate": 1.357751333528872e-06, - "loss": 0.5142, - "step": 47058 - }, - { - "epoch": 1.21, - "learning_rate": 1.357725494254726e-06, - "loss": 0.6396, - "step": 47059 - }, - { - "epoch": 1.21, - "learning_rate": 1.357699654706686e-06, - "loss": 0.7383, - "step": 47060 - }, - { - "epoch": 1.21, - "learning_rate": 1.357673814884772e-06, - "loss": 0.791, - "step": 47061 - }, - { - "epoch": 1.21, - "learning_rate": 1.3576479747890037e-06, - "loss": 0.6689, - "step": 47062 - }, - { - "epoch": 1.21, - "learning_rate": 1.357622134419401e-06, - "loss": 0.7861, - "step": 47063 - }, - { - "epoch": 1.21, - "learning_rate": 1.3575962937759831e-06, - "loss": 0.5149, - "step": 47064 - }, - { - "epoch": 1.21, - "learning_rate": 1.3575704528587704e-06, - "loss": 0.5942, - "step": 47065 - }, - { - "epoch": 1.21, - "learning_rate": 1.357544611667782e-06, - "loss": 0.5305, - "step": 47066 - }, - { - "epoch": 1.21, - "learning_rate": 1.3575187702030387e-06, - "loss": 0.6553, - "step": 47067 - }, - { - "epoch": 1.21, - "learning_rate": 1.3574929284645596e-06, - "loss": 0.6816, - "step": 47068 - }, - { - "epoch": 1.21, - "learning_rate": 1.357467086452364e-06, - "loss": 0.499, - "step": 47069 - }, - { - "epoch": 1.21, - "learning_rate": 1.357441244166473e-06, - "loss": 0.6504, - "step": 47070 - }, - { - "epoch": 1.21, - "learning_rate": 1.3574154016069054e-06, - "loss": 0.5835, - "step": 47071 - }, - { - "epoch": 1.21, - "learning_rate": 1.3573895587736813e-06, - "loss": 0.5366, - "step": 47072 - }, - { - "epoch": 1.21, - "learning_rate": 1.3573637156668202e-06, - "loss": 0.7588, - "step": 47073 - }, - { - "epoch": 1.21, - "learning_rate": 1.3573378722863427e-06, - "loss": 0.6016, - "step": 47074 - }, - { - "epoch": 1.21, - "learning_rate": 1.3573120286322674e-06, - "loss": 0.7598, - "step": 47075 - }, - { - "epoch": 1.21, - "learning_rate": 1.3572861847046151e-06, - "loss": 0.7607, - "step": 47076 - }, - { - "epoch": 1.21, - "learning_rate": 1.357260340503405e-06, - "loss": 0.6802, - "step": 47077 - }, - { - "epoch": 1.21, - "learning_rate": 1.3572344960286575e-06, - "loss": 0.7129, - "step": 47078 - }, - { - "epoch": 1.21, - "learning_rate": 1.3572086512803915e-06, - "loss": 0.6479, - "step": 47079 - }, - { - "epoch": 1.21, - "learning_rate": 1.3571828062586275e-06, - "loss": 0.5781, - "step": 47080 - }, - { - "epoch": 1.21, - "learning_rate": 1.3571569609633846e-06, - "loss": 0.5933, - "step": 47081 - }, - { - "epoch": 1.21, - "learning_rate": 1.3571311153946837e-06, - "loss": 0.5835, - "step": 47082 - }, - { - "epoch": 1.21, - "learning_rate": 1.3571052695525436e-06, - "loss": 0.6704, - "step": 47083 - }, - { - "epoch": 1.21, - "learning_rate": 1.3570794234369844e-06, - "loss": 0.6543, - "step": 47084 - }, - { - "epoch": 1.21, - "learning_rate": 1.3570535770480259e-06, - "loss": 0.4556, - "step": 47085 - }, - { - "epoch": 1.21, - "learning_rate": 1.357027730385688e-06, - "loss": 0.5669, - "step": 47086 - }, - { - "epoch": 1.21, - "learning_rate": 1.3570018834499903e-06, - "loss": 0.6123, - "step": 47087 - }, - { - "epoch": 1.21, - "learning_rate": 1.356976036240953e-06, - "loss": 0.4368, - "step": 47088 - }, - { - "epoch": 1.21, - "learning_rate": 1.3569501887585951e-06, - "loss": 0.4926, - "step": 47089 - }, - { - "epoch": 1.21, - "learning_rate": 1.356924341002937e-06, - "loss": 0.6777, - "step": 47090 - }, - { - "epoch": 1.21, - "learning_rate": 1.3568984929739982e-06, - "loss": 0.4597, - "step": 47091 - }, - { - "epoch": 1.21, - "learning_rate": 1.356872644671799e-06, - "loss": 0.7173, - "step": 47092 - }, - { - "epoch": 1.21, - "learning_rate": 1.3568467960963585e-06, - "loss": 0.6299, - "step": 47093 - }, - { - "epoch": 1.21, - "learning_rate": 1.3568209472476967e-06, - "loss": 0.7354, - "step": 47094 - }, - { - "epoch": 1.21, - "learning_rate": 1.356795098125834e-06, - "loss": 0.6982, - "step": 47095 - }, - { - "epoch": 1.21, - "learning_rate": 1.3567692487307892e-06, - "loss": 0.6631, - "step": 47096 - }, - { - "epoch": 1.21, - "learning_rate": 1.3567433990625829e-06, - "loss": 0.6069, - "step": 47097 - }, - { - "epoch": 1.21, - "learning_rate": 1.3567175491212347e-06, - "loss": 0.707, - "step": 47098 - }, - { - "epoch": 1.21, - "learning_rate": 1.356691698906764e-06, - "loss": 0.4517, - "step": 47099 - }, - { - "epoch": 1.21, - "learning_rate": 1.356665848419191e-06, - "loss": 0.7822, - "step": 47100 - }, - { - "epoch": 1.21, - "learning_rate": 1.3566399976585353e-06, - "loss": 0.6501, - "step": 47101 - }, - { - "epoch": 1.21, - "learning_rate": 1.3566141466248167e-06, - "loss": 0.4916, - "step": 47102 - }, - { - "epoch": 1.21, - "learning_rate": 1.3565882953180552e-06, - "loss": 0.5762, - "step": 47103 - }, - { - "epoch": 1.21, - "learning_rate": 1.3565624437382704e-06, - "loss": 0.6338, - "step": 47104 - }, - { - "epoch": 1.21, - "learning_rate": 1.356536591885482e-06, - "loss": 0.5742, - "step": 47105 - }, - { - "epoch": 1.21, - "learning_rate": 1.35651073975971e-06, - "loss": 0.4518, - "step": 47106 - }, - { - "epoch": 1.21, - "learning_rate": 1.356484887360974e-06, - "loss": 0.6797, - "step": 47107 - }, - { - "epoch": 1.21, - "learning_rate": 1.3564590346892941e-06, - "loss": 0.5532, - "step": 47108 - }, - { - "epoch": 1.21, - "learning_rate": 1.35643318174469e-06, - "loss": 0.7734, - "step": 47109 - }, - { - "epoch": 1.21, - "learning_rate": 1.3564073285271812e-06, - "loss": 0.6006, - "step": 47110 - }, - { - "epoch": 1.21, - "learning_rate": 1.3563814750367878e-06, - "loss": 0.6431, - "step": 47111 - }, - { - "epoch": 1.21, - "learning_rate": 1.3563556212735293e-06, - "loss": 0.5144, - "step": 47112 - }, - { - "epoch": 1.21, - "learning_rate": 1.3563297672374258e-06, - "loss": 0.6514, - "step": 47113 - }, - { - "epoch": 1.21, - "learning_rate": 1.3563039129284972e-06, - "loss": 0.4938, - "step": 47114 - }, - { - "epoch": 1.21, - "learning_rate": 1.3562780583467629e-06, - "loss": 0.7632, - "step": 47115 - }, - { - "epoch": 1.21, - "learning_rate": 1.3562522034922426e-06, - "loss": 0.7183, - "step": 47116 - }, - { - "epoch": 1.21, - "learning_rate": 1.3562263483649567e-06, - "loss": 0.6318, - "step": 47117 - }, - { - "epoch": 1.21, - "learning_rate": 1.3562004929649246e-06, - "loss": 0.5854, - "step": 47118 - }, - { - "epoch": 1.21, - "learning_rate": 1.356174637292166e-06, - "loss": 0.7598, - "step": 47119 - }, - { - "epoch": 1.21, - "learning_rate": 1.3561487813467012e-06, - "loss": 0.6855, - "step": 47120 - }, - { - "epoch": 1.21, - "learning_rate": 1.3561229251285494e-06, - "loss": 0.5201, - "step": 47121 - }, - { - "epoch": 1.21, - "learning_rate": 1.3560970686377307e-06, - "loss": 0.877, - "step": 47122 - }, - { - "epoch": 1.21, - "learning_rate": 1.356071211874265e-06, - "loss": 0.6904, - "step": 47123 - }, - { - "epoch": 1.21, - "learning_rate": 1.356045354838172e-06, - "loss": 0.5317, - "step": 47124 - }, - { - "epoch": 1.21, - "learning_rate": 1.3560194975294709e-06, - "loss": 0.7197, - "step": 47125 - }, - { - "epoch": 1.21, - "learning_rate": 1.3559936399481826e-06, - "loss": 0.6113, - "step": 47126 - }, - { - "epoch": 1.21, - "learning_rate": 1.355967782094326e-06, - "loss": 0.7014, - "step": 47127 - }, - { - "epoch": 1.21, - "learning_rate": 1.3559419239679214e-06, - "loss": 0.5869, - "step": 47128 - }, - { - "epoch": 1.21, - "learning_rate": 1.3559160655689886e-06, - "loss": 0.7949, - "step": 47129 - }, - { - "epoch": 1.21, - "learning_rate": 1.3558902068975469e-06, - "loss": 0.5298, - "step": 47130 - }, - { - "epoch": 1.21, - "learning_rate": 1.3558643479536165e-06, - "loss": 0.6025, - "step": 47131 - }, - { - "epoch": 1.21, - "learning_rate": 1.3558384887372173e-06, - "loss": 0.8848, - "step": 47132 - }, - { - "epoch": 1.21, - "learning_rate": 1.3558126292483687e-06, - "loss": 0.6729, - "step": 47133 - }, - { - "epoch": 1.21, - "learning_rate": 1.355786769487091e-06, - "loss": 0.7168, - "step": 47134 - }, - { - "epoch": 1.21, - "learning_rate": 1.3557609094534036e-06, - "loss": 0.4663, - "step": 47135 - }, - { - "epoch": 1.21, - "learning_rate": 1.3557350491473263e-06, - "loss": 0.6304, - "step": 47136 - }, - { - "epoch": 1.21, - "learning_rate": 1.3557091885688795e-06, - "loss": 0.6113, - "step": 47137 - }, - { - "epoch": 1.21, - "learning_rate": 1.355683327718082e-06, - "loss": 0.7637, - "step": 47138 - }, - { - "epoch": 1.21, - "learning_rate": 1.3556574665949543e-06, - "loss": 0.5059, - "step": 47139 - }, - { - "epoch": 1.21, - "learning_rate": 1.3556316051995158e-06, - "loss": 0.7104, - "step": 47140 - }, - { - "epoch": 1.21, - "learning_rate": 1.355605743531787e-06, - "loss": 0.7949, - "step": 47141 - }, - { - "epoch": 1.21, - "learning_rate": 1.355579881591787e-06, - "loss": 0.6782, - "step": 47142 - }, - { - "epoch": 1.21, - "learning_rate": 1.355554019379536e-06, - "loss": 0.5762, - "step": 47143 - }, - { - "epoch": 1.21, - "learning_rate": 1.3555281568950532e-06, - "loss": 0.6724, - "step": 47144 - }, - { - "epoch": 1.21, - "learning_rate": 1.355502294138359e-06, - "loss": 0.5684, - "step": 47145 - }, - { - "epoch": 1.21, - "learning_rate": 1.3554764311094732e-06, - "loss": 0.5034, - "step": 47146 - }, - { - "epoch": 1.21, - "learning_rate": 1.3554505678084156e-06, - "loss": 0.7827, - "step": 47147 - }, - { - "epoch": 1.21, - "learning_rate": 1.3554247042352056e-06, - "loss": 0.6899, - "step": 47148 - }, - { - "epoch": 1.21, - "learning_rate": 1.3553988403898634e-06, - "loss": 0.667, - "step": 47149 - }, - { - "epoch": 1.21, - "learning_rate": 1.3553729762724083e-06, - "loss": 0.5884, - "step": 47150 - }, - { - "epoch": 1.21, - "learning_rate": 1.3553471118828608e-06, - "loss": 0.6592, - "step": 47151 - }, - { - "epoch": 1.21, - "learning_rate": 1.3553212472212402e-06, - "loss": 0.5728, - "step": 47152 - }, - { - "epoch": 1.21, - "learning_rate": 1.3552953822875668e-06, - "loss": 0.717, - "step": 47153 - }, - { - "epoch": 1.21, - "learning_rate": 1.3552695170818596e-06, - "loss": 0.6602, - "step": 47154 - }, - { - "epoch": 1.21, - "learning_rate": 1.3552436516041393e-06, - "loss": 0.6284, - "step": 47155 - }, - { - "epoch": 1.21, - "learning_rate": 1.3552177858544248e-06, - "loss": 0.624, - "step": 47156 - }, - { - "epoch": 1.21, - "learning_rate": 1.3551919198327367e-06, - "loss": 0.6191, - "step": 47157 - }, - { - "epoch": 1.21, - "learning_rate": 1.3551660535390943e-06, - "loss": 0.6372, - "step": 47158 - }, - { - "epoch": 1.21, - "learning_rate": 1.3551401869735174e-06, - "loss": 0.572, - "step": 47159 - }, - { - "epoch": 1.21, - "learning_rate": 1.3551143201360265e-06, - "loss": 0.6362, - "step": 47160 - }, - { - "epoch": 1.21, - "learning_rate": 1.3550884530266403e-06, - "loss": 0.7012, - "step": 47161 - }, - { - "epoch": 1.21, - "learning_rate": 1.3550625856453799e-06, - "loss": 0.8115, - "step": 47162 - }, - { - "epoch": 1.21, - "learning_rate": 1.355036717992264e-06, - "loss": 0.5994, - "step": 47163 - }, - { - "epoch": 1.21, - "learning_rate": 1.3550108500673128e-06, - "loss": 0.5446, - "step": 47164 - }, - { - "epoch": 1.21, - "learning_rate": 1.3549849818705461e-06, - "loss": 0.8359, - "step": 47165 - }, - { - "epoch": 1.21, - "learning_rate": 1.3549591134019838e-06, - "loss": 0.6768, - "step": 47166 - }, - { - "epoch": 1.21, - "learning_rate": 1.3549332446616454e-06, - "loss": 0.5354, - "step": 47167 - }, - { - "epoch": 1.21, - "learning_rate": 1.3549073756495516e-06, - "loss": 0.7168, - "step": 47168 - }, - { - "epoch": 1.21, - "learning_rate": 1.3548815063657209e-06, - "loss": 0.6348, - "step": 47169 - }, - { - "epoch": 1.21, - "learning_rate": 1.354855636810174e-06, - "loss": 0.5312, - "step": 47170 - }, - { - "epoch": 1.21, - "learning_rate": 1.35482976698293e-06, - "loss": 0.6328, - "step": 47171 - }, - { - "epoch": 1.21, - "learning_rate": 1.35480389688401e-06, - "loss": 0.4346, - "step": 47172 - }, - { - "epoch": 1.21, - "learning_rate": 1.3547780265134322e-06, - "loss": 0.5049, - "step": 47173 - }, - { - "epoch": 1.21, - "learning_rate": 1.3547521558712176e-06, - "loss": 0.7158, - "step": 47174 - }, - { - "epoch": 1.21, - "learning_rate": 1.3547262849573854e-06, - "loss": 0.5918, - "step": 47175 - }, - { - "epoch": 1.21, - "learning_rate": 1.3547004137719558e-06, - "loss": 0.7061, - "step": 47176 - }, - { - "epoch": 1.21, - "learning_rate": 1.3546745423149483e-06, - "loss": 0.7954, - "step": 47177 - }, - { - "epoch": 1.21, - "learning_rate": 1.354648670586383e-06, - "loss": 0.8486, - "step": 47178 - }, - { - "epoch": 1.21, - "learning_rate": 1.354622798586279e-06, - "loss": 0.5283, - "step": 47179 - }, - { - "epoch": 1.21, - "learning_rate": 1.354596926314657e-06, - "loss": 0.707, - "step": 47180 - }, - { - "epoch": 1.21, - "learning_rate": 1.3545710537715365e-06, - "loss": 0.7617, - "step": 47181 - }, - { - "epoch": 1.21, - "learning_rate": 1.354545180956937e-06, - "loss": 0.6519, - "step": 47182 - }, - { - "epoch": 1.21, - "learning_rate": 1.3545193078708788e-06, - "loss": 0.7793, - "step": 47183 - }, - { - "epoch": 1.21, - "learning_rate": 1.3544934345133812e-06, - "loss": 0.6724, - "step": 47184 - }, - { - "epoch": 1.21, - "learning_rate": 1.3544675608844646e-06, - "loss": 0.7119, - "step": 47185 - }, - { - "epoch": 1.21, - "learning_rate": 1.3544416869841482e-06, - "loss": 0.6621, - "step": 47186 - }, - { - "epoch": 1.21, - "learning_rate": 1.3544158128124523e-06, - "loss": 0.8545, - "step": 47187 - }, - { - "epoch": 1.21, - "learning_rate": 1.3543899383693964e-06, - "loss": 0.6514, - "step": 47188 - }, - { - "epoch": 1.21, - "learning_rate": 1.3543640636550005e-06, - "loss": 0.7559, - "step": 47189 - }, - { - "epoch": 1.21, - "learning_rate": 1.3543381886692843e-06, - "loss": 0.5964, - "step": 47190 - }, - { - "epoch": 1.21, - "learning_rate": 1.3543123134122676e-06, - "loss": 0.7861, - "step": 47191 - }, - { - "epoch": 1.21, - "learning_rate": 1.3542864378839703e-06, - "loss": 0.6895, - "step": 47192 - }, - { - "epoch": 1.21, - "learning_rate": 1.3542605620844123e-06, - "loss": 0.543, - "step": 47193 - }, - { - "epoch": 1.21, - "learning_rate": 1.3542346860136128e-06, - "loss": 0.668, - "step": 47194 - }, - { - "epoch": 1.21, - "learning_rate": 1.3542088096715925e-06, - "loss": 0.6455, - "step": 47195 - }, - { - "epoch": 1.21, - "learning_rate": 1.3541829330583706e-06, - "loss": 0.6616, - "step": 47196 - }, - { - "epoch": 1.21, - "learning_rate": 1.3541570561739674e-06, - "loss": 0.6904, - "step": 47197 - }, - { - "epoch": 1.21, - "learning_rate": 1.3541311790184022e-06, - "loss": 0.752, - "step": 47198 - }, - { - "epoch": 1.21, - "learning_rate": 1.3541053015916952e-06, - "loss": 0.7402, - "step": 47199 - }, - { - "epoch": 1.21, - "learning_rate": 1.3540794238938657e-06, - "loss": 0.5176, - "step": 47200 - }, - { - "epoch": 1.21, - "learning_rate": 1.3540535459249342e-06, - "loss": 0.6074, - "step": 47201 - }, - { - "epoch": 1.21, - "learning_rate": 1.3540276676849201e-06, - "loss": 0.709, - "step": 47202 - }, - { - "epoch": 1.21, - "learning_rate": 1.3540017891738432e-06, - "loss": 0.5273, - "step": 47203 - }, - { - "epoch": 1.21, - "learning_rate": 1.3539759103917235e-06, - "loss": 0.6289, - "step": 47204 - }, - { - "epoch": 1.21, - "learning_rate": 1.3539500313385809e-06, - "loss": 0.563, - "step": 47205 - }, - { - "epoch": 1.21, - "learning_rate": 1.3539241520144347e-06, - "loss": 0.6895, - "step": 47206 - }, - { - "epoch": 1.21, - "learning_rate": 1.3538982724193054e-06, - "loss": 0.6802, - "step": 47207 - }, - { - "epoch": 1.21, - "learning_rate": 1.3538723925532121e-06, - "loss": 0.6357, - "step": 47208 - }, - { - "epoch": 1.21, - "learning_rate": 1.353846512416175e-06, - "loss": 0.5571, - "step": 47209 - }, - { - "epoch": 1.21, - "learning_rate": 1.3538206320082143e-06, - "loss": 0.6602, - "step": 47210 - }, - { - "epoch": 1.21, - "learning_rate": 1.3537947513293488e-06, - "loss": 0.5371, - "step": 47211 - }, - { - "epoch": 1.21, - "learning_rate": 1.3537688703795995e-06, - "loss": 0.5542, - "step": 47212 - }, - { - "epoch": 1.21, - "learning_rate": 1.3537429891589854e-06, - "loss": 0.6514, - "step": 47213 - }, - { - "epoch": 1.21, - "learning_rate": 1.3537171076675267e-06, - "loss": 0.7207, - "step": 47214 - }, - { - "epoch": 1.21, - "learning_rate": 1.3536912259052426e-06, - "loss": 0.6494, - "step": 47215 - }, - { - "epoch": 1.21, - "learning_rate": 1.3536653438721538e-06, - "loss": 0.3652, - "step": 47216 - }, - { - "epoch": 1.21, - "learning_rate": 1.3536394615682799e-06, - "loss": 0.749, - "step": 47217 - }, - { - "epoch": 1.21, - "learning_rate": 1.3536135789936403e-06, - "loss": 0.561, - "step": 47218 - }, - { - "epoch": 1.21, - "learning_rate": 1.3535876961482548e-06, - "loss": 0.6006, - "step": 47219 - }, - { - "epoch": 1.21, - "learning_rate": 1.3535618130321438e-06, - "loss": 0.5864, - "step": 47220 - }, - { - "epoch": 1.21, - "learning_rate": 1.3535359296453265e-06, - "loss": 0.5703, - "step": 47221 - }, - { - "epoch": 1.21, - "learning_rate": 1.3535100459878233e-06, - "loss": 0.5713, - "step": 47222 - }, - { - "epoch": 1.21, - "learning_rate": 1.3534841620596535e-06, - "loss": 0.6387, - "step": 47223 - }, - { - "epoch": 1.21, - "learning_rate": 1.3534582778608372e-06, - "loss": 0.7402, - "step": 47224 - }, - { - "epoch": 1.21, - "learning_rate": 1.3534323933913944e-06, - "loss": 0.5723, - "step": 47225 - }, - { - "epoch": 1.21, - "learning_rate": 1.3534065086513441e-06, - "loss": 0.75, - "step": 47226 - }, - { - "epoch": 1.21, - "learning_rate": 1.353380623640707e-06, - "loss": 0.7485, - "step": 47227 - }, - { - "epoch": 1.21, - "learning_rate": 1.3533547383595026e-06, - "loss": 0.5532, - "step": 47228 - }, - { - "epoch": 1.21, - "learning_rate": 1.3533288528077508e-06, - "loss": 0.6465, - "step": 47229 - }, - { - "epoch": 1.21, - "learning_rate": 1.3533029669854712e-06, - "loss": 0.8955, - "step": 47230 - }, - { - "epoch": 1.21, - "learning_rate": 1.353277080892684e-06, - "loss": 0.7007, - "step": 47231 - }, - { - "epoch": 1.21, - "learning_rate": 1.3532511945294085e-06, - "loss": 0.7949, - "step": 47232 - }, - { - "epoch": 1.21, - "learning_rate": 1.353225307895665e-06, - "loss": 0.6753, - "step": 47233 - }, - { - "epoch": 1.21, - "learning_rate": 1.3531994209914729e-06, - "loss": 0.6504, - "step": 47234 - }, - { - "epoch": 1.21, - "learning_rate": 1.3531735338168524e-06, - "loss": 0.6768, - "step": 47235 - }, - { - "epoch": 1.21, - "learning_rate": 1.353147646371823e-06, - "loss": 0.6909, - "step": 47236 - }, - { - "epoch": 1.21, - "learning_rate": 1.3531217586564052e-06, - "loss": 0.646, - "step": 47237 - }, - { - "epoch": 1.21, - "learning_rate": 1.3530958706706176e-06, - "loss": 0.5923, - "step": 47238 - }, - { - "epoch": 1.21, - "learning_rate": 1.3530699824144814e-06, - "loss": 0.5652, - "step": 47239 - }, - { - "epoch": 1.21, - "learning_rate": 1.3530440938880151e-06, - "loss": 0.6357, - "step": 47240 - }, - { - "epoch": 1.21, - "learning_rate": 1.3530182050912395e-06, - "loss": 0.6489, - "step": 47241 - }, - { - "epoch": 1.21, - "learning_rate": 1.3529923160241742e-06, - "loss": 0.6719, - "step": 47242 - }, - { - "epoch": 1.21, - "learning_rate": 1.352966426686839e-06, - "loss": 0.5923, - "step": 47243 - }, - { - "epoch": 1.21, - "learning_rate": 1.3529405370792533e-06, - "loss": 0.8174, - "step": 47244 - }, - { - "epoch": 1.21, - "learning_rate": 1.3529146472014374e-06, - "loss": 0.5869, - "step": 47245 - }, - { - "epoch": 1.21, - "learning_rate": 1.352888757053411e-06, - "loss": 0.7305, - "step": 47246 - }, - { - "epoch": 1.21, - "learning_rate": 1.3528628666351938e-06, - "loss": 0.6963, - "step": 47247 - }, - { - "epoch": 1.21, - "learning_rate": 1.352836975946806e-06, - "loss": 0.4856, - "step": 47248 - }, - { - "epoch": 1.21, - "learning_rate": 1.3528110849882665e-06, - "loss": 0.4458, - "step": 47249 - }, - { - "epoch": 1.21, - "learning_rate": 1.3527851937595964e-06, - "loss": 0.6621, - "step": 47250 - }, - { - "epoch": 1.21, - "learning_rate": 1.3527593022608147e-06, - "loss": 0.4629, - "step": 47251 - }, - { - "epoch": 1.21, - "learning_rate": 1.3527334104919418e-06, - "loss": 0.4685, - "step": 47252 - }, - { - "epoch": 1.21, - "learning_rate": 1.3527075184529965e-06, - "loss": 0.6494, - "step": 47253 - }, - { - "epoch": 1.21, - "learning_rate": 1.3526816261439997e-06, - "loss": 0.6387, - "step": 47254 - }, - { - "epoch": 1.21, - "learning_rate": 1.3526557335649704e-06, - "loss": 0.6055, - "step": 47255 - }, - { - "epoch": 1.21, - "learning_rate": 1.3526298407159294e-06, - "loss": 0.479, - "step": 47256 - }, - { - "epoch": 1.21, - "learning_rate": 1.3526039475968956e-06, - "loss": 0.5815, - "step": 47257 - }, - { - "epoch": 1.21, - "learning_rate": 1.3525780542078892e-06, - "loss": 0.5942, - "step": 47258 - }, - { - "epoch": 1.21, - "learning_rate": 1.35255216054893e-06, - "loss": 0.7637, - "step": 47259 - }, - { - "epoch": 1.21, - "learning_rate": 1.3525262666200378e-06, - "loss": 0.5747, - "step": 47260 - }, - { - "epoch": 1.21, - "learning_rate": 1.3525003724212323e-06, - "loss": 0.5918, - "step": 47261 - }, - { - "epoch": 1.21, - "learning_rate": 1.3524744779525339e-06, - "loss": 0.7207, - "step": 47262 - }, - { - "epoch": 1.21, - "learning_rate": 1.3524485832139617e-06, - "loss": 0.5685, - "step": 47263 - }, - { - "epoch": 1.21, - "learning_rate": 1.3524226882055358e-06, - "loss": 0.7217, - "step": 47264 - }, - { - "epoch": 1.21, - "learning_rate": 1.3523967929272762e-06, - "loss": 0.646, - "step": 47265 - }, - { - "epoch": 1.21, - "learning_rate": 1.3523708973792024e-06, - "loss": 0.5083, - "step": 47266 - }, - { - "epoch": 1.21, - "learning_rate": 1.3523450015613347e-06, - "loss": 0.7285, - "step": 47267 - }, - { - "epoch": 1.21, - "learning_rate": 1.3523191054736925e-06, - "loss": 0.5603, - "step": 47268 - }, - { - "epoch": 1.21, - "learning_rate": 1.3522932091162955e-06, - "loss": 0.7046, - "step": 47269 - }, - { - "epoch": 1.21, - "learning_rate": 1.3522673124891642e-06, - "loss": 0.572, - "step": 47270 - }, - { - "epoch": 1.21, - "learning_rate": 1.3522414155923176e-06, - "loss": 0.6309, - "step": 47271 - }, - { - "epoch": 1.21, - "learning_rate": 1.3522155184257763e-06, - "loss": 0.605, - "step": 47272 - }, - { - "epoch": 1.21, - "learning_rate": 1.3521896209895596e-06, - "loss": 0.5378, - "step": 47273 - }, - { - "epoch": 1.21, - "learning_rate": 1.3521637232836874e-06, - "loss": 0.7617, - "step": 47274 - }, - { - "epoch": 1.21, - "learning_rate": 1.3521378253081796e-06, - "loss": 0.6455, - "step": 47275 - }, - { - "epoch": 1.21, - "learning_rate": 1.3521119270630564e-06, - "loss": 0.6436, - "step": 47276 - }, - { - "epoch": 1.21, - "learning_rate": 1.3520860285483372e-06, - "loss": 0.8193, - "step": 47277 - }, - { - "epoch": 1.21, - "learning_rate": 1.3520601297640418e-06, - "loss": 0.6816, - "step": 47278 - }, - { - "epoch": 1.21, - "learning_rate": 1.3520342307101901e-06, - "loss": 0.7188, - "step": 47279 - }, - { - "epoch": 1.21, - "learning_rate": 1.3520083313868018e-06, - "loss": 0.5571, - "step": 47280 - }, - { - "epoch": 1.21, - "learning_rate": 1.3519824317938973e-06, - "loss": 0.626, - "step": 47281 - }, - { - "epoch": 1.21, - "learning_rate": 1.351956531931496e-06, - "loss": 0.752, - "step": 47282 - }, - { - "epoch": 1.21, - "learning_rate": 1.3519306317996177e-06, - "loss": 0.7803, - "step": 47283 - }, - { - "epoch": 1.21, - "learning_rate": 1.3519047313982821e-06, - "loss": 0.7246, - "step": 47284 - }, - { - "epoch": 1.21, - "learning_rate": 1.3518788307275096e-06, - "loss": 0.606, - "step": 47285 - }, - { - "epoch": 1.21, - "learning_rate": 1.3518529297873192e-06, - "loss": 0.5508, - "step": 47286 - }, - { - "epoch": 1.21, - "learning_rate": 1.3518270285777317e-06, - "loss": 0.5342, - "step": 47287 - }, - { - "epoch": 1.21, - "learning_rate": 1.3518011270987658e-06, - "loss": 0.6479, - "step": 47288 - }, - { - "epoch": 1.21, - "learning_rate": 1.3517752253504427e-06, - "loss": 0.6943, - "step": 47289 - }, - { - "epoch": 1.21, - "learning_rate": 1.3517493233327808e-06, - "loss": 0.7441, - "step": 47290 - }, - { - "epoch": 1.21, - "learning_rate": 1.3517234210458008e-06, - "loss": 0.6367, - "step": 47291 - }, - { - "epoch": 1.21, - "learning_rate": 1.3516975184895226e-06, - "loss": 0.7412, - "step": 47292 - }, - { - "epoch": 1.21, - "learning_rate": 1.3516716156639656e-06, - "loss": 0.6914, - "step": 47293 - }, - { - "epoch": 1.21, - "learning_rate": 1.3516457125691497e-06, - "loss": 0.5273, - "step": 47294 - }, - { - "epoch": 1.21, - "learning_rate": 1.3516198092050951e-06, - "loss": 0.7217, - "step": 47295 - }, - { - "epoch": 1.21, - "learning_rate": 1.3515939055718213e-06, - "loss": 0.6841, - "step": 47296 - }, - { - "epoch": 1.21, - "learning_rate": 1.3515680016693483e-06, - "loss": 0.6958, - "step": 47297 - }, - { - "epoch": 1.21, - "learning_rate": 1.3515420974976956e-06, - "loss": 0.7178, - "step": 47298 - }, - { - "epoch": 1.21, - "learning_rate": 1.3515161930568834e-06, - "loss": 0.5942, - "step": 47299 - }, - { - "epoch": 1.21, - "learning_rate": 1.3514902883469314e-06, - "loss": 0.5842, - "step": 47300 - }, - { - "epoch": 1.21, - "learning_rate": 1.3514643833678594e-06, - "loss": 0.5293, - "step": 47301 - }, - { - "epoch": 1.21, - "learning_rate": 1.3514384781196878e-06, - "loss": 0.6846, - "step": 47302 - }, - { - "epoch": 1.21, - "learning_rate": 1.3514125726024352e-06, - "loss": 0.5327, - "step": 47303 - }, - { - "epoch": 1.21, - "learning_rate": 1.3513866668161224e-06, - "loss": 0.6719, - "step": 47304 - }, - { - "epoch": 1.21, - "learning_rate": 1.3513607607607688e-06, - "loss": 0.6758, - "step": 47305 - }, - { - "epoch": 1.21, - "learning_rate": 1.3513348544363949e-06, - "loss": 0.9121, - "step": 47306 - }, - { - "epoch": 1.21, - "learning_rate": 1.3513089478430197e-06, - "loss": 0.8076, - "step": 47307 - }, - { - "epoch": 1.21, - "learning_rate": 1.3512830409806638e-06, - "loss": 0.7549, - "step": 47308 - }, - { - "epoch": 1.21, - "learning_rate": 1.3512571338493461e-06, - "loss": 0.6963, - "step": 47309 - }, - { - "epoch": 1.21, - "learning_rate": 1.3512312264490872e-06, - "loss": 0.7178, - "step": 47310 - }, - { - "epoch": 1.21, - "learning_rate": 1.3512053187799065e-06, - "loss": 0.708, - "step": 47311 - }, - { - "epoch": 1.21, - "learning_rate": 1.3511794108418243e-06, - "loss": 0.5747, - "step": 47312 - }, - { - "epoch": 1.21, - "learning_rate": 1.3511535026348603e-06, - "loss": 0.7798, - "step": 47313 - }, - { - "epoch": 1.21, - "learning_rate": 1.3511275941590338e-06, - "loss": 0.6265, - "step": 47314 - }, - { - "epoch": 1.21, - "learning_rate": 1.351101685414365e-06, - "loss": 0.6758, - "step": 47315 - }, - { - "epoch": 1.21, - "learning_rate": 1.3510757764008745e-06, - "loss": 0.8125, - "step": 47316 - }, - { - "epoch": 1.21, - "learning_rate": 1.3510498671185808e-06, - "loss": 0.5757, - "step": 47317 - }, - { - "epoch": 1.21, - "learning_rate": 1.3510239575675045e-06, - "loss": 0.6353, - "step": 47318 - }, - { - "epoch": 1.21, - "learning_rate": 1.3509980477476653e-06, - "loss": 0.8291, - "step": 47319 - }, - { - "epoch": 1.21, - "learning_rate": 1.3509721376590828e-06, - "loss": 0.6719, - "step": 47320 - }, - { - "epoch": 1.21, - "learning_rate": 1.3509462273017772e-06, - "loss": 0.7861, - "step": 47321 - }, - { - "epoch": 1.21, - "learning_rate": 1.3509203166757685e-06, - "loss": 0.7109, - "step": 47322 - }, - { - "epoch": 1.21, - "learning_rate": 1.3508944057810762e-06, - "loss": 0.6245, - "step": 47323 - }, - { - "epoch": 1.21, - "learning_rate": 1.35086849461772e-06, - "loss": 0.7705, - "step": 47324 - }, - { - "epoch": 1.21, - "learning_rate": 1.35084258318572e-06, - "loss": 0.6025, - "step": 47325 - }, - { - "epoch": 1.21, - "learning_rate": 1.3508166714850958e-06, - "loss": 0.6895, - "step": 47326 - }, - { - "epoch": 1.21, - "learning_rate": 1.350790759515868e-06, - "loss": 0.7148, - "step": 47327 - }, - { - "epoch": 1.21, - "learning_rate": 1.350764847278055e-06, - "loss": 0.4709, - "step": 47328 - }, - { - "epoch": 1.21, - "learning_rate": 1.350738934771678e-06, - "loss": 0.6016, - "step": 47329 - }, - { - "epoch": 1.21, - "learning_rate": 1.3507130219967561e-06, - "loss": 0.6846, - "step": 47330 - }, - { - "epoch": 1.21, - "learning_rate": 1.3506871089533096e-06, - "loss": 0.8291, - "step": 47331 - }, - { - "epoch": 1.21, - "learning_rate": 1.350661195641358e-06, - "loss": 0.8213, - "step": 47332 - }, - { - "epoch": 1.21, - "learning_rate": 1.3506352820609213e-06, - "loss": 0.5308, - "step": 47333 - }, - { - "epoch": 1.21, - "learning_rate": 1.350609368212019e-06, - "loss": 0.6787, - "step": 47334 - }, - { - "epoch": 1.21, - "learning_rate": 1.3505834540946718e-06, - "loss": 0.5518, - "step": 47335 - }, - { - "epoch": 1.21, - "learning_rate": 1.3505575397088982e-06, - "loss": 0.8291, - "step": 47336 - }, - { - "epoch": 1.21, - "learning_rate": 1.3505316250547195e-06, - "loss": 0.8252, - "step": 47337 - }, - { - "epoch": 1.21, - "learning_rate": 1.3505057101321545e-06, - "loss": 0.7979, - "step": 47338 - }, - { - "epoch": 1.21, - "learning_rate": 1.3504797949412234e-06, - "loss": 0.7139, - "step": 47339 - }, - { - "epoch": 1.21, - "learning_rate": 1.3504538794819462e-06, - "loss": 0.6094, - "step": 47340 - }, - { - "epoch": 1.21, - "learning_rate": 1.3504279637543425e-06, - "loss": 0.6362, - "step": 47341 - }, - { - "epoch": 1.21, - "learning_rate": 1.3504020477584322e-06, - "loss": 0.7725, - "step": 47342 - }, - { - "epoch": 1.21, - "learning_rate": 1.350376131494235e-06, - "loss": 0.6641, - "step": 47343 - }, - { - "epoch": 1.21, - "learning_rate": 1.3503502149617712e-06, - "loss": 0.605, - "step": 47344 - }, - { - "epoch": 1.21, - "learning_rate": 1.35032429816106e-06, - "loss": 0.7783, - "step": 47345 - }, - { - "epoch": 1.21, - "learning_rate": 1.350298381092122e-06, - "loss": 0.8047, - "step": 47346 - }, - { - "epoch": 1.21, - "learning_rate": 1.3502724637549765e-06, - "loss": 0.6421, - "step": 47347 - }, - { - "epoch": 1.21, - "learning_rate": 1.3502465461496435e-06, - "loss": 0.6572, - "step": 47348 - }, - { - "epoch": 1.21, - "learning_rate": 1.3502206282761426e-06, - "loss": 0.6982, - "step": 47349 - }, - { - "epoch": 1.21, - "learning_rate": 1.350194710134494e-06, - "loss": 0.6909, - "step": 47350 - }, - { - "epoch": 1.21, - "learning_rate": 1.3501687917247173e-06, - "loss": 0.4829, - "step": 47351 - }, - { - "epoch": 1.21, - "learning_rate": 1.3501428730468329e-06, - "loss": 0.6855, - "step": 47352 - }, - { - "epoch": 1.21, - "learning_rate": 1.35011695410086e-06, - "loss": 0.5479, - "step": 47353 - }, - { - "epoch": 1.21, - "learning_rate": 1.3500910348868184e-06, - "loss": 0.5417, - "step": 47354 - }, - { - "epoch": 1.21, - "learning_rate": 1.3500651154047282e-06, - "loss": 0.6025, - "step": 47355 - }, - { - "epoch": 1.21, - "learning_rate": 1.3500391956546095e-06, - "loss": 0.7939, - "step": 47356 - }, - { - "epoch": 1.21, - "learning_rate": 1.350013275636482e-06, - "loss": 0.6924, - "step": 47357 - }, - { - "epoch": 1.21, - "learning_rate": 1.3499873553503652e-06, - "loss": 0.6489, - "step": 47358 - }, - { - "epoch": 1.21, - "learning_rate": 1.3499614347962788e-06, - "loss": 0.7266, - "step": 47359 - }, - { - "epoch": 1.21, - "learning_rate": 1.3499355139742437e-06, - "loss": 0.7314, - "step": 47360 - }, - { - "epoch": 1.21, - "learning_rate": 1.3499095928842785e-06, - "loss": 0.6699, - "step": 47361 - }, - { - "epoch": 1.21, - "learning_rate": 1.349883671526404e-06, - "loss": 0.6802, - "step": 47362 - }, - { - "epoch": 1.21, - "learning_rate": 1.3498577499006397e-06, - "loss": 0.667, - "step": 47363 - }, - { - "epoch": 1.21, - "learning_rate": 1.349831828007005e-06, - "loss": 0.6292, - "step": 47364 - }, - { - "epoch": 1.21, - "learning_rate": 1.3498059058455205e-06, - "loss": 0.5076, - "step": 47365 - }, - { - "epoch": 1.21, - "learning_rate": 1.3497799834162054e-06, - "loss": 0.5469, - "step": 47366 - }, - { - "epoch": 1.21, - "learning_rate": 1.3497540607190803e-06, - "loss": 0.5933, - "step": 47367 - }, - { - "epoch": 1.21, - "learning_rate": 1.3497281377541643e-06, - "loss": 0.6216, - "step": 47368 - }, - { - "epoch": 1.21, - "learning_rate": 1.3497022145214777e-06, - "loss": 0.5342, - "step": 47369 - }, - { - "epoch": 1.21, - "learning_rate": 1.3496762910210397e-06, - "loss": 0.6436, - "step": 47370 - }, - { - "epoch": 1.21, - "learning_rate": 1.3496503672528711e-06, - "loss": 0.7422, - "step": 47371 - }, - { - "epoch": 1.21, - "learning_rate": 1.3496244432169914e-06, - "loss": 0.7178, - "step": 47372 - }, - { - "epoch": 1.21, - "learning_rate": 1.3495985189134203e-06, - "loss": 0.4924, - "step": 47373 - }, - { - "epoch": 1.21, - "learning_rate": 1.3495725943421775e-06, - "loss": 0.6548, - "step": 47374 - }, - { - "epoch": 1.21, - "learning_rate": 1.3495466695032828e-06, - "loss": 0.6497, - "step": 47375 - }, - { - "epoch": 1.21, - "learning_rate": 1.3495207443967566e-06, - "loss": 0.6973, - "step": 47376 - }, - { - "epoch": 1.21, - "learning_rate": 1.3494948190226184e-06, - "loss": 0.7842, - "step": 47377 - }, - { - "epoch": 1.21, - "learning_rate": 1.3494688933808881e-06, - "loss": 0.6509, - "step": 47378 - }, - { - "epoch": 1.21, - "learning_rate": 1.3494429674715857e-06, - "loss": 0.585, - "step": 47379 - }, - { - "epoch": 1.21, - "learning_rate": 1.3494170412947307e-06, - "loss": 0.6729, - "step": 47380 - }, - { - "epoch": 1.21, - "learning_rate": 1.3493911148503433e-06, - "loss": 0.77, - "step": 47381 - }, - { - "epoch": 1.21, - "learning_rate": 1.349365188138443e-06, - "loss": 0.6904, - "step": 47382 - }, - { - "epoch": 1.21, - "learning_rate": 1.3493392611590497e-06, - "loss": 0.751, - "step": 47383 - }, - { - "epoch": 1.21, - "learning_rate": 1.3493133339121837e-06, - "loss": 0.6572, - "step": 47384 - }, - { - "epoch": 1.21, - "learning_rate": 1.349287406397864e-06, - "loss": 0.6416, - "step": 47385 - }, - { - "epoch": 1.21, - "learning_rate": 1.3492614786161116e-06, - "loss": 0.7417, - "step": 47386 - }, - { - "epoch": 1.21, - "learning_rate": 1.3492355505669458e-06, - "loss": 0.6621, - "step": 47387 - }, - { - "epoch": 1.21, - "learning_rate": 1.3492096222503862e-06, - "loss": 0.6787, - "step": 47388 - }, - { - "epoch": 1.21, - "learning_rate": 1.3491836936664527e-06, - "loss": 0.7705, - "step": 47389 - }, - { - "epoch": 1.21, - "learning_rate": 1.3491577648151653e-06, - "loss": 0.4617, - "step": 47390 - }, - { - "epoch": 1.21, - "learning_rate": 1.3491318356965437e-06, - "loss": 0.5, - "step": 47391 - }, - { - "epoch": 1.21, - "learning_rate": 1.3491059063106086e-06, - "loss": 0.5928, - "step": 47392 - }, - { - "epoch": 1.21, - "learning_rate": 1.3490799766573786e-06, - "loss": 0.7061, - "step": 47393 - }, - { - "epoch": 1.21, - "learning_rate": 1.3490540467368743e-06, - "loss": 0.561, - "step": 47394 - }, - { - "epoch": 1.21, - "learning_rate": 1.3490281165491152e-06, - "loss": 0.4934, - "step": 47395 - }, - { - "epoch": 1.21, - "learning_rate": 1.3490021860941215e-06, - "loss": 0.7354, - "step": 47396 - }, - { - "epoch": 1.21, - "learning_rate": 1.3489762553719128e-06, - "loss": 0.8457, - "step": 47397 - }, - { - "epoch": 1.21, - "learning_rate": 1.3489503243825092e-06, - "loss": 0.6133, - "step": 47398 - }, - { - "epoch": 1.21, - "learning_rate": 1.34892439312593e-06, - "loss": 0.6494, - "step": 47399 - }, - { - "epoch": 1.21, - "learning_rate": 1.3488984616021957e-06, - "loss": 0.7666, - "step": 47400 - }, - { - "epoch": 1.21, - "learning_rate": 1.3488725298113257e-06, - "loss": 0.7129, - "step": 47401 - }, - { - "epoch": 1.21, - "learning_rate": 1.3488465977533404e-06, - "loss": 0.5168, - "step": 47402 - }, - { - "epoch": 1.21, - "learning_rate": 1.348820665428259e-06, - "loss": 0.8516, - "step": 47403 - }, - { - "epoch": 1.21, - "learning_rate": 1.3487947328361018e-06, - "loss": 0.7012, - "step": 47404 - }, - { - "epoch": 1.22, - "learning_rate": 1.3487687999768885e-06, - "loss": 0.5303, - "step": 47405 - }, - { - "epoch": 1.22, - "learning_rate": 1.348742866850639e-06, - "loss": 0.7852, - "step": 47406 - }, - { - "epoch": 1.22, - "learning_rate": 1.3487169334573728e-06, - "loss": 0.7607, - "step": 47407 - }, - { - "epoch": 1.22, - "learning_rate": 1.3486909997971103e-06, - "loss": 0.6943, - "step": 47408 - }, - { - "epoch": 1.22, - "learning_rate": 1.3486650658698712e-06, - "loss": 0.5093, - "step": 47409 - }, - { - "epoch": 1.22, - "learning_rate": 1.348639131675675e-06, - "loss": 0.7402, - "step": 47410 - }, - { - "epoch": 1.22, - "learning_rate": 1.3486131972145422e-06, - "loss": 0.7354, - "step": 47411 - }, - { - "epoch": 1.22, - "learning_rate": 1.3485872624864922e-06, - "loss": 0.54, - "step": 47412 - }, - { - "epoch": 1.22, - "learning_rate": 1.3485613274915452e-06, - "loss": 0.7012, - "step": 47413 - }, - { - "epoch": 1.22, - "learning_rate": 1.3485353922297204e-06, - "loss": 0.7158, - "step": 47414 - }, - { - "epoch": 1.22, - "learning_rate": 1.3485094567010384e-06, - "loss": 0.6182, - "step": 47415 - }, - { - "epoch": 1.22, - "learning_rate": 1.3484835209055185e-06, - "loss": 0.6958, - "step": 47416 - }, - { - "epoch": 1.22, - "learning_rate": 1.3484575848431812e-06, - "loss": 0.6206, - "step": 47417 - }, - { - "epoch": 1.22, - "learning_rate": 1.3484316485140451e-06, - "loss": 0.7178, - "step": 47418 - }, - { - "epoch": 1.22, - "learning_rate": 1.3484057119181318e-06, - "loss": 0.6689, - "step": 47419 - }, - { - "epoch": 1.22, - "learning_rate": 1.3483797750554598e-06, - "loss": 0.5825, - "step": 47420 - }, - { - "epoch": 1.22, - "learning_rate": 1.3483538379260497e-06, - "loss": 0.4431, - "step": 47421 - }, - { - "epoch": 1.22, - "learning_rate": 1.3483279005299208e-06, - "loss": 0.6543, - "step": 47422 - }, - { - "epoch": 1.22, - "learning_rate": 1.3483019628670932e-06, - "loss": 0.645, - "step": 47423 - }, - { - "epoch": 1.22, - "learning_rate": 1.348276024937587e-06, - "loss": 0.7305, - "step": 47424 - }, - { - "epoch": 1.22, - "learning_rate": 1.348250086741422e-06, - "loss": 0.7383, - "step": 47425 - }, - { - "epoch": 1.22, - "learning_rate": 1.3482241482786177e-06, - "loss": 0.5647, - "step": 47426 - }, - { - "epoch": 1.22, - "learning_rate": 1.3481982095491942e-06, - "loss": 0.5081, - "step": 47427 - }, - { - "epoch": 1.22, - "learning_rate": 1.3481722705531712e-06, - "loss": 0.7222, - "step": 47428 - }, - { - "epoch": 1.22, - "learning_rate": 1.348146331290569e-06, - "loss": 0.5591, - "step": 47429 - }, - { - "epoch": 1.22, - "learning_rate": 1.348120391761407e-06, - "loss": 0.7471, - "step": 47430 - }, - { - "epoch": 1.22, - "learning_rate": 1.3480944519657054e-06, - "loss": 0.6846, - "step": 47431 - }, - { - "epoch": 1.22, - "learning_rate": 1.3480685119034835e-06, - "loss": 0.6313, - "step": 47432 - }, - { - "epoch": 1.22, - "learning_rate": 1.3480425715747618e-06, - "loss": 0.6963, - "step": 47433 - }, - { - "epoch": 1.22, - "learning_rate": 1.34801663097956e-06, - "loss": 0.6992, - "step": 47434 - }, - { - "epoch": 1.22, - "learning_rate": 1.3479906901178976e-06, - "loss": 0.3842, - "step": 47435 - }, - { - "epoch": 1.22, - "learning_rate": 1.3479647489897951e-06, - "loss": 0.6831, - "step": 47436 - }, - { - "epoch": 1.22, - "learning_rate": 1.3479388075952716e-06, - "loss": 0.7061, - "step": 47437 - }, - { - "epoch": 1.22, - "learning_rate": 1.3479128659343477e-06, - "loss": 0.7363, - "step": 47438 - }, - { - "epoch": 1.22, - "learning_rate": 1.3478869240070425e-06, - "loss": 0.6582, - "step": 47439 - }, - { - "epoch": 1.22, - "learning_rate": 1.3478609818133766e-06, - "loss": 0.79, - "step": 47440 - }, - { - "epoch": 1.22, - "learning_rate": 1.3478350393533694e-06, - "loss": 0.7803, - "step": 47441 - }, - { - "epoch": 1.22, - "learning_rate": 1.3478090966270411e-06, - "loss": 0.4846, - "step": 47442 - }, - { - "epoch": 1.22, - "learning_rate": 1.3477831536344112e-06, - "loss": 0.6958, - "step": 47443 - }, - { - "epoch": 1.22, - "learning_rate": 1.3477572103754997e-06, - "loss": 0.7529, - "step": 47444 - }, - { - "epoch": 1.22, - "learning_rate": 1.3477312668503266e-06, - "loss": 0.7246, - "step": 47445 - }, - { - "epoch": 1.22, - "learning_rate": 1.3477053230589117e-06, - "loss": 0.7002, - "step": 47446 - }, - { - "epoch": 1.22, - "learning_rate": 1.3476793790012749e-06, - "loss": 0.5586, - "step": 47447 - }, - { - "epoch": 1.22, - "learning_rate": 1.3476534346774357e-06, - "loss": 0.6602, - "step": 47448 - }, - { - "epoch": 1.22, - "learning_rate": 1.3476274900874142e-06, - "loss": 0.6519, - "step": 47449 - }, - { - "epoch": 1.22, - "learning_rate": 1.3476015452312307e-06, - "loss": 0.7324, - "step": 47450 - }, - { - "epoch": 1.22, - "learning_rate": 1.3475756001089045e-06, - "loss": 0.5347, - "step": 47451 - }, - { - "epoch": 1.22, - "learning_rate": 1.3475496547204554e-06, - "loss": 0.709, - "step": 47452 - }, - { - "epoch": 1.22, - "learning_rate": 1.347523709065904e-06, - "loss": 0.479, - "step": 47453 - }, - { - "epoch": 1.22, - "learning_rate": 1.3474977631452692e-06, - "loss": 0.6533, - "step": 47454 - }, - { - "epoch": 1.22, - "learning_rate": 1.3474718169585716e-06, - "loss": 0.5874, - "step": 47455 - }, - { - "epoch": 1.22, - "learning_rate": 1.3474458705058307e-06, - "loss": 0.5566, - "step": 47456 - }, - { - "epoch": 1.22, - "learning_rate": 1.3474199237870668e-06, - "loss": 0.5864, - "step": 47457 - }, - { - "epoch": 1.22, - "learning_rate": 1.3473939768022988e-06, - "loss": 0.5188, - "step": 47458 - }, - { - "epoch": 1.22, - "learning_rate": 1.3473680295515478e-06, - "loss": 0.6523, - "step": 47459 - }, - { - "epoch": 1.22, - "learning_rate": 1.3473420820348327e-06, - "loss": 0.6963, - "step": 47460 - }, - { - "epoch": 1.22, - "learning_rate": 1.347316134252174e-06, - "loss": 0.8037, - "step": 47461 - }, - { - "epoch": 1.22, - "learning_rate": 1.3472901862035913e-06, - "loss": 0.6313, - "step": 47462 - }, - { - "epoch": 1.22, - "learning_rate": 1.3472642378891044e-06, - "loss": 0.502, - "step": 47463 - }, - { - "epoch": 1.22, - "learning_rate": 1.3472382893087328e-06, - "loss": 0.8955, - "step": 47464 - }, - { - "epoch": 1.22, - "learning_rate": 1.3472123404624972e-06, - "loss": 0.7524, - "step": 47465 - }, - { - "epoch": 1.22, - "learning_rate": 1.3471863913504174e-06, - "loss": 0.667, - "step": 47466 - }, - { - "epoch": 1.22, - "learning_rate": 1.3471604419725126e-06, - "loss": 0.793, - "step": 47467 - }, - { - "epoch": 1.22, - "learning_rate": 1.3471344923288031e-06, - "loss": 0.5996, - "step": 47468 - }, - { - "epoch": 1.22, - "learning_rate": 1.3471085424193085e-06, - "loss": 0.5537, - "step": 47469 - }, - { - "epoch": 1.22, - "learning_rate": 1.3470825922440488e-06, - "loss": 0.7134, - "step": 47470 - }, - { - "epoch": 1.22, - "learning_rate": 1.3470566418030443e-06, - "loss": 0.6914, - "step": 47471 - }, - { - "epoch": 1.22, - "learning_rate": 1.3470306910963142e-06, - "loss": 0.5293, - "step": 47472 - }, - { - "epoch": 1.22, - "learning_rate": 1.3470047401238786e-06, - "loss": 0.6631, - "step": 47473 - }, - { - "epoch": 1.22, - "learning_rate": 1.3469787888857575e-06, - "loss": 0.5215, - "step": 47474 - }, - { - "epoch": 1.22, - "learning_rate": 1.3469528373819707e-06, - "loss": 0.6709, - "step": 47475 - }, - { - "epoch": 1.22, - "learning_rate": 1.3469268856125384e-06, - "loss": 0.5007, - "step": 47476 - }, - { - "epoch": 1.22, - "learning_rate": 1.3469009335774798e-06, - "loss": 0.6182, - "step": 47477 - }, - { - "epoch": 1.22, - "learning_rate": 1.3468749812768152e-06, - "loss": 0.7656, - "step": 47478 - }, - { - "epoch": 1.22, - "learning_rate": 1.3468490287105642e-06, - "loss": 0.6235, - "step": 47479 - }, - { - "epoch": 1.22, - "learning_rate": 1.346823075878747e-06, - "loss": 0.5405, - "step": 47480 - }, - { - "epoch": 1.22, - "learning_rate": 1.3467971227813836e-06, - "loss": 0.4829, - "step": 47481 - }, - { - "epoch": 1.22, - "learning_rate": 1.3467711694184932e-06, - "loss": 0.5459, - "step": 47482 - }, - { - "epoch": 1.22, - "learning_rate": 1.346745215790096e-06, - "loss": 0.6582, - "step": 47483 - }, - { - "epoch": 1.22, - "learning_rate": 1.3467192618962122e-06, - "loss": 0.7383, - "step": 47484 - }, - { - "epoch": 1.22, - "learning_rate": 1.3466933077368612e-06, - "loss": 0.5869, - "step": 47485 - }, - { - "epoch": 1.22, - "learning_rate": 1.3466673533120635e-06, - "loss": 0.5957, - "step": 47486 - }, - { - "epoch": 1.22, - "learning_rate": 1.3466413986218382e-06, - "loss": 0.5154, - "step": 47487 - }, - { - "epoch": 1.22, - "learning_rate": 1.3466154436662053e-06, - "loss": 0.8252, - "step": 47488 - }, - { - "epoch": 1.22, - "learning_rate": 1.346589488445185e-06, - "loss": 0.5625, - "step": 47489 - }, - { - "epoch": 1.22, - "learning_rate": 1.3465635329587973e-06, - "loss": 0.5713, - "step": 47490 - }, - { - "epoch": 1.22, - "learning_rate": 1.3465375772070616e-06, - "loss": 0.6357, - "step": 47491 - }, - { - "epoch": 1.22, - "learning_rate": 1.3465116211899982e-06, - "loss": 0.6089, - "step": 47492 - }, - { - "epoch": 1.22, - "learning_rate": 1.3464856649076267e-06, - "loss": 0.627, - "step": 47493 - }, - { - "epoch": 1.22, - "learning_rate": 1.3464597083599673e-06, - "loss": 0.5679, - "step": 47494 - }, - { - "epoch": 1.22, - "learning_rate": 1.3464337515470392e-06, - "loss": 0.584, - "step": 47495 - }, - { - "epoch": 1.22, - "learning_rate": 1.346407794468863e-06, - "loss": 0.646, - "step": 47496 - }, - { - "epoch": 1.22, - "learning_rate": 1.3463818371254583e-06, - "loss": 0.5332, - "step": 47497 - }, - { - "epoch": 1.22, - "learning_rate": 1.3463558795168448e-06, - "loss": 0.5571, - "step": 47498 - }, - { - "epoch": 1.22, - "learning_rate": 1.3463299216430426e-06, - "loss": 0.5625, - "step": 47499 - }, - { - "epoch": 1.22, - "learning_rate": 1.3463039635040714e-06, - "loss": 0.6455, - "step": 47500 - }, - { - "epoch": 1.22, - "learning_rate": 1.3462780050999514e-06, - "loss": 0.9385, - "step": 47501 - }, - { - "epoch": 1.22, - "learning_rate": 1.346252046430702e-06, - "loss": 0.5225, - "step": 47502 - }, - { - "epoch": 1.22, - "learning_rate": 1.3462260874963435e-06, - "loss": 0.686, - "step": 47503 - }, - { - "epoch": 1.22, - "learning_rate": 1.3462001282968956e-06, - "loss": 0.562, - "step": 47504 - }, - { - "epoch": 1.22, - "learning_rate": 1.3461741688323782e-06, - "loss": 0.6069, - "step": 47505 - }, - { - "epoch": 1.22, - "learning_rate": 1.3461482091028111e-06, - "loss": 0.4933, - "step": 47506 - }, - { - "epoch": 1.22, - "learning_rate": 1.3461222491082142e-06, - "loss": 0.6074, - "step": 47507 - }, - { - "epoch": 1.22, - "learning_rate": 1.3460962888486074e-06, - "loss": 0.8037, - "step": 47508 - }, - { - "epoch": 1.22, - "learning_rate": 1.3460703283240107e-06, - "loss": 0.583, - "step": 47509 - }, - { - "epoch": 1.22, - "learning_rate": 1.3460443675344437e-06, - "loss": 0.583, - "step": 47510 - }, - { - "epoch": 1.22, - "learning_rate": 1.3460184064799267e-06, - "loss": 0.8223, - "step": 47511 - }, - { - "epoch": 1.22, - "learning_rate": 1.345992445160479e-06, - "loss": 0.7114, - "step": 47512 - }, - { - "epoch": 1.22, - "learning_rate": 1.345966483576121e-06, - "loss": 0.5825, - "step": 47513 - }, - { - "epoch": 1.22, - "learning_rate": 1.3459405217268722e-06, - "loss": 0.6875, - "step": 47514 - }, - { - "epoch": 1.22, - "learning_rate": 1.3459145596127528e-06, - "loss": 0.7275, - "step": 47515 - }, - { - "epoch": 1.22, - "learning_rate": 1.3458885972337825e-06, - "loss": 0.7109, - "step": 47516 - }, - { - "epoch": 1.22, - "learning_rate": 1.345862634589981e-06, - "loss": 0.6162, - "step": 47517 - }, - { - "epoch": 1.22, - "learning_rate": 1.3458366716813688e-06, - "loss": 0.5308, - "step": 47518 - }, - { - "epoch": 1.22, - "learning_rate": 1.3458107085079648e-06, - "loss": 0.5967, - "step": 47519 - }, - { - "epoch": 1.22, - "learning_rate": 1.34578474506979e-06, - "loss": 0.8008, - "step": 47520 - }, - { - "epoch": 1.22, - "learning_rate": 1.3457587813668637e-06, - "loss": 0.7539, - "step": 47521 - }, - { - "epoch": 1.22, - "learning_rate": 1.3457328173992056e-06, - "loss": 0.6118, - "step": 47522 - }, - { - "epoch": 1.22, - "learning_rate": 1.3457068531668357e-06, - "loss": 0.7168, - "step": 47523 - }, - { - "epoch": 1.22, - "learning_rate": 1.345680888669774e-06, - "loss": 0.5405, - "step": 47524 - }, - { - "epoch": 1.22, - "learning_rate": 1.3456549239080402e-06, - "loss": 0.6267, - "step": 47525 - }, - { - "epoch": 1.22, - "learning_rate": 1.3456289588816547e-06, - "loss": 0.6157, - "step": 47526 - }, - { - "epoch": 1.22, - "learning_rate": 1.3456029935906365e-06, - "loss": 0.4988, - "step": 47527 - }, - { - "epoch": 1.22, - "learning_rate": 1.3455770280350066e-06, - "loss": 0.668, - "step": 47528 - }, - { - "epoch": 1.22, - "learning_rate": 1.3455510622147836e-06, - "loss": 0.5237, - "step": 47529 - }, - { - "epoch": 1.22, - "learning_rate": 1.3455250961299885e-06, - "loss": 0.312, - "step": 47530 - }, - { - "epoch": 1.22, - "learning_rate": 1.3454991297806406e-06, - "loss": 0.6851, - "step": 47531 - }, - { - "epoch": 1.22, - "learning_rate": 1.34547316316676e-06, - "loss": 0.7217, - "step": 47532 - }, - { - "epoch": 1.22, - "learning_rate": 1.3454471962883662e-06, - "loss": 0.6978, - "step": 47533 - }, - { - "epoch": 1.22, - "learning_rate": 1.3454212291454797e-06, - "loss": 0.7363, - "step": 47534 - }, - { - "epoch": 1.22, - "learning_rate": 1.3453952617381197e-06, - "loss": 0.7441, - "step": 47535 - }, - { - "epoch": 1.22, - "learning_rate": 1.3453692940663067e-06, - "loss": 0.5156, - "step": 47536 - }, - { - "epoch": 1.22, - "learning_rate": 1.3453433261300603e-06, - "loss": 0.5654, - "step": 47537 - }, - { - "epoch": 1.22, - "learning_rate": 1.3453173579294004e-06, - "loss": 0.5342, - "step": 47538 - }, - { - "epoch": 1.22, - "learning_rate": 1.3452913894643465e-06, - "loss": 0.5679, - "step": 47539 - }, - { - "epoch": 1.22, - "learning_rate": 1.3452654207349192e-06, - "loss": 0.7109, - "step": 47540 - }, - { - "epoch": 1.22, - "learning_rate": 1.3452394517411383e-06, - "loss": 0.5972, - "step": 47541 - }, - { - "epoch": 1.22, - "learning_rate": 1.3452134824830231e-06, - "loss": 0.7207, - "step": 47542 - }, - { - "epoch": 1.22, - "learning_rate": 1.3451875129605937e-06, - "loss": 0.7559, - "step": 47543 - }, - { - "epoch": 1.22, - "learning_rate": 1.34516154317387e-06, - "loss": 0.707, - "step": 47544 - }, - { - "epoch": 1.22, - "learning_rate": 1.3451355731228723e-06, - "loss": 0.4878, - "step": 47545 - }, - { - "epoch": 1.22, - "learning_rate": 1.3451096028076202e-06, - "loss": 0.6099, - "step": 47546 - }, - { - "epoch": 1.22, - "learning_rate": 1.3450836322281337e-06, - "loss": 0.5679, - "step": 47547 - }, - { - "epoch": 1.22, - "learning_rate": 1.345057661384432e-06, - "loss": 0.436, - "step": 47548 - }, - { - "epoch": 1.22, - "learning_rate": 1.3450316902765357e-06, - "loss": 0.7344, - "step": 47549 - }, - { - "epoch": 1.22, - "learning_rate": 1.3450057189044644e-06, - "loss": 0.7188, - "step": 47550 - }, - { - "epoch": 1.22, - "learning_rate": 1.3449797472682388e-06, - "loss": 0.666, - "step": 47551 - }, - { - "epoch": 1.22, - "learning_rate": 1.3449537753678772e-06, - "loss": 0.6406, - "step": 47552 - }, - { - "epoch": 1.22, - "learning_rate": 1.3449278032034008e-06, - "loss": 0.6956, - "step": 47553 - }, - { - "epoch": 1.22, - "learning_rate": 1.3449018307748288e-06, - "loss": 0.7803, - "step": 47554 - }, - { - "epoch": 1.22, - "learning_rate": 1.3448758580821814e-06, - "loss": 0.6191, - "step": 47555 - }, - { - "epoch": 1.22, - "learning_rate": 1.3448498851254786e-06, - "loss": 0.7021, - "step": 47556 - }, - { - "epoch": 1.22, - "learning_rate": 1.34482391190474e-06, - "loss": 0.6118, - "step": 47557 - }, - { - "epoch": 1.22, - "learning_rate": 1.3447979384199854e-06, - "loss": 0.6572, - "step": 47558 - }, - { - "epoch": 1.22, - "learning_rate": 1.344771964671235e-06, - "loss": 0.5342, - "step": 47559 - }, - { - "epoch": 1.22, - "learning_rate": 1.3447459906585086e-06, - "loss": 0.6274, - "step": 47560 - }, - { - "epoch": 1.22, - "learning_rate": 1.344720016381826e-06, - "loss": 0.6694, - "step": 47561 - }, - { - "epoch": 1.22, - "learning_rate": 1.3446940418412072e-06, - "loss": 0.6133, - "step": 47562 - }, - { - "epoch": 1.22, - "learning_rate": 1.3446680670366718e-06, - "loss": 0.6807, - "step": 47563 - }, - { - "epoch": 1.22, - "learning_rate": 1.34464209196824e-06, - "loss": 0.6001, - "step": 47564 - }, - { - "epoch": 1.22, - "learning_rate": 1.3446161166359318e-06, - "loss": 0.5615, - "step": 47565 - }, - { - "epoch": 1.22, - "learning_rate": 1.344590141039767e-06, - "loss": 0.6494, - "step": 47566 - }, - { - "epoch": 1.22, - "learning_rate": 1.344564165179765e-06, - "loss": 0.6357, - "step": 47567 - }, - { - "epoch": 1.22, - "learning_rate": 1.3445381890559463e-06, - "loss": 0.6963, - "step": 47568 - }, - { - "epoch": 1.22, - "learning_rate": 1.3445122126683304e-06, - "loss": 0.5884, - "step": 47569 - }, - { - "epoch": 1.22, - "learning_rate": 1.3444862360169373e-06, - "loss": 0.6133, - "step": 47570 - }, - { - "epoch": 1.22, - "learning_rate": 1.344460259101787e-06, - "loss": 0.627, - "step": 47571 - }, - { - "epoch": 1.22, - "learning_rate": 1.3444342819228995e-06, - "loss": 0.6982, - "step": 47572 - }, - { - "epoch": 1.22, - "learning_rate": 1.3444083044802942e-06, - "loss": 0.7334, - "step": 47573 - }, - { - "epoch": 1.22, - "learning_rate": 1.3443823267739916e-06, - "loss": 0.7324, - "step": 47574 - }, - { - "epoch": 1.22, - "learning_rate": 1.344356348804011e-06, - "loss": 0.6968, - "step": 47575 - }, - { - "epoch": 1.22, - "learning_rate": 1.3443303705703728e-06, - "loss": 0.6184, - "step": 47576 - }, - { - "epoch": 1.22, - "learning_rate": 1.3443043920730964e-06, - "loss": 0.5089, - "step": 47577 - }, - { - "epoch": 1.22, - "learning_rate": 1.3442784133122023e-06, - "loss": 0.5269, - "step": 47578 - }, - { - "epoch": 1.22, - "learning_rate": 1.3442524342877098e-06, - "loss": 0.7402, - "step": 47579 - }, - { - "epoch": 1.22, - "learning_rate": 1.344226454999639e-06, - "loss": 0.6934, - "step": 47580 - }, - { - "epoch": 1.22, - "learning_rate": 1.3442004754480102e-06, - "loss": 0.5771, - "step": 47581 - }, - { - "epoch": 1.22, - "learning_rate": 1.3441744956328426e-06, - "loss": 0.6812, - "step": 47582 - }, - { - "epoch": 1.22, - "learning_rate": 1.3441485155541566e-06, - "loss": 0.5767, - "step": 47583 - }, - { - "epoch": 1.22, - "learning_rate": 1.3441225352119718e-06, - "loss": 0.6836, - "step": 47584 - }, - { - "epoch": 1.22, - "learning_rate": 1.344096554606308e-06, - "loss": 0.5659, - "step": 47585 - }, - { - "epoch": 1.22, - "learning_rate": 1.3440705737371855e-06, - "loss": 0.6375, - "step": 47586 - }, - { - "epoch": 1.22, - "learning_rate": 1.3440445926046241e-06, - "loss": 0.5491, - "step": 47587 - }, - { - "epoch": 1.22, - "learning_rate": 1.3440186112086433e-06, - "loss": 0.7349, - "step": 47588 - }, - { - "epoch": 1.22, - "learning_rate": 1.3439926295492636e-06, - "loss": 0.5776, - "step": 47589 - }, - { - "epoch": 1.22, - "learning_rate": 1.343966647626504e-06, - "loss": 0.6504, - "step": 47590 - }, - { - "epoch": 1.22, - "learning_rate": 1.3439406654403857e-06, - "loss": 0.6406, - "step": 47591 - }, - { - "epoch": 1.22, - "learning_rate": 1.3439146829909276e-06, - "loss": 0.7329, - "step": 47592 - }, - { - "epoch": 1.22, - "learning_rate": 1.3438887002781496e-06, - "loss": 0.7695, - "step": 47593 - }, - { - "epoch": 1.22, - "learning_rate": 1.3438627173020718e-06, - "loss": 0.6089, - "step": 47594 - }, - { - "epoch": 1.22, - "learning_rate": 1.3438367340627143e-06, - "loss": 0.728, - "step": 47595 - }, - { - "epoch": 1.22, - "learning_rate": 1.3438107505600971e-06, - "loss": 0.7656, - "step": 47596 - }, - { - "epoch": 1.22, - "learning_rate": 1.3437847667942395e-06, - "loss": 0.7144, - "step": 47597 - }, - { - "epoch": 1.22, - "learning_rate": 1.3437587827651614e-06, - "loss": 0.6992, - "step": 47598 - }, - { - "epoch": 1.22, - "learning_rate": 1.3437327984728834e-06, - "loss": 0.5791, - "step": 47599 - }, - { - "epoch": 1.22, - "learning_rate": 1.343706813917425e-06, - "loss": 0.6855, - "step": 47600 - }, - { - "epoch": 1.22, - "learning_rate": 1.3436808290988061e-06, - "loss": 0.5059, - "step": 47601 - }, - { - "epoch": 1.22, - "learning_rate": 1.3436548440170466e-06, - "loss": 0.6821, - "step": 47602 - }, - { - "epoch": 1.22, - "learning_rate": 1.3436288586721664e-06, - "loss": 0.7002, - "step": 47603 - }, - { - "epoch": 1.22, - "learning_rate": 1.343602873064185e-06, - "loss": 0.7021, - "step": 47604 - }, - { - "epoch": 1.22, - "learning_rate": 1.3435768871931231e-06, - "loss": 0.5928, - "step": 47605 - }, - { - "epoch": 1.22, - "learning_rate": 1.3435509010590003e-06, - "loss": 0.7227, - "step": 47606 - }, - { - "epoch": 1.22, - "learning_rate": 1.3435249146618359e-06, - "loss": 0.666, - "step": 47607 - }, - { - "epoch": 1.22, - "learning_rate": 1.3434989280016505e-06, - "loss": 0.5293, - "step": 47608 - }, - { - "epoch": 1.22, - "learning_rate": 1.3434729410784638e-06, - "loss": 0.5815, - "step": 47609 - }, - { - "epoch": 1.22, - "learning_rate": 1.3434469538922955e-06, - "loss": 0.6631, - "step": 47610 - }, - { - "epoch": 1.22, - "learning_rate": 1.343420966443166e-06, - "loss": 0.6748, - "step": 47611 - }, - { - "epoch": 1.22, - "learning_rate": 1.3433949787310946e-06, - "loss": 0.7412, - "step": 47612 - }, - { - "epoch": 1.22, - "learning_rate": 1.3433689907561015e-06, - "loss": 0.5986, - "step": 47613 - }, - { - "epoch": 1.22, - "learning_rate": 1.3433430025182063e-06, - "loss": 0.6611, - "step": 47614 - }, - { - "epoch": 1.22, - "learning_rate": 1.3433170140174294e-06, - "loss": 0.7656, - "step": 47615 - }, - { - "epoch": 1.22, - "learning_rate": 1.3432910252537908e-06, - "loss": 0.6069, - "step": 47616 - }, - { - "epoch": 1.22, - "learning_rate": 1.3432650362273095e-06, - "loss": 0.6758, - "step": 47617 - }, - { - "epoch": 1.22, - "learning_rate": 1.343239046938006e-06, - "loss": 0.6387, - "step": 47618 - }, - { - "epoch": 1.22, - "learning_rate": 1.3432130573859003e-06, - "loss": 0.7314, - "step": 47619 - }, - { - "epoch": 1.22, - "learning_rate": 1.3431870675710121e-06, - "loss": 0.5708, - "step": 47620 - }, - { - "epoch": 1.22, - "learning_rate": 1.3431610774933618e-06, - "loss": 0.8008, - "step": 47621 - }, - { - "epoch": 1.22, - "learning_rate": 1.3431350871529682e-06, - "loss": 0.7729, - "step": 47622 - }, - { - "epoch": 1.22, - "learning_rate": 1.343109096549852e-06, - "loss": 0.625, - "step": 47623 - }, - { - "epoch": 1.22, - "learning_rate": 1.343083105684033e-06, - "loss": 0.5093, - "step": 47624 - }, - { - "epoch": 1.22, - "learning_rate": 1.343057114555531e-06, - "loss": 0.9043, - "step": 47625 - }, - { - "epoch": 1.22, - "learning_rate": 1.3430311231643661e-06, - "loss": 0.7188, - "step": 47626 - }, - { - "epoch": 1.22, - "learning_rate": 1.343005131510558e-06, - "loss": 0.6406, - "step": 47627 - }, - { - "epoch": 1.22, - "learning_rate": 1.3429791395941266e-06, - "loss": 0.5864, - "step": 47628 - }, - { - "epoch": 1.22, - "learning_rate": 1.3429531474150918e-06, - "loss": 0.5857, - "step": 47629 - }, - { - "epoch": 1.22, - "learning_rate": 1.3429271549734733e-06, - "loss": 0.7012, - "step": 47630 - }, - { - "epoch": 1.22, - "learning_rate": 1.3429011622692915e-06, - "loss": 0.5464, - "step": 47631 - }, - { - "epoch": 1.22, - "learning_rate": 1.342875169302566e-06, - "loss": 0.5054, - "step": 47632 - }, - { - "epoch": 1.22, - "learning_rate": 1.342849176073317e-06, - "loss": 0.6738, - "step": 47633 - }, - { - "epoch": 1.22, - "learning_rate": 1.3428231825815636e-06, - "loss": 0.6279, - "step": 47634 - }, - { - "epoch": 1.22, - "learning_rate": 1.3427971888273268e-06, - "loss": 0.6416, - "step": 47635 - }, - { - "epoch": 1.22, - "learning_rate": 1.3427711948106258e-06, - "loss": 0.7554, - "step": 47636 - }, - { - "epoch": 1.22, - "learning_rate": 1.3427452005314805e-06, - "loss": 0.834, - "step": 47637 - }, - { - "epoch": 1.22, - "learning_rate": 1.342719205989911e-06, - "loss": 0.7627, - "step": 47638 - }, - { - "epoch": 1.22, - "learning_rate": 1.3426932111859372e-06, - "loss": 0.5801, - "step": 47639 - }, - { - "epoch": 1.22, - "learning_rate": 1.3426672161195792e-06, - "loss": 0.6758, - "step": 47640 - }, - { - "epoch": 1.22, - "learning_rate": 1.3426412207908565e-06, - "loss": 0.6602, - "step": 47641 - }, - { - "epoch": 1.22, - "learning_rate": 1.3426152251997892e-06, - "loss": 0.5342, - "step": 47642 - }, - { - "epoch": 1.22, - "learning_rate": 1.342589229346397e-06, - "loss": 0.5525, - "step": 47643 - }, - { - "epoch": 1.22, - "learning_rate": 1.3425632332307e-06, - "loss": 0.5334, - "step": 47644 - }, - { - "epoch": 1.22, - "learning_rate": 1.3425372368527183e-06, - "loss": 0.6313, - "step": 47645 - }, - { - "epoch": 1.22, - "learning_rate": 1.3425112402124714e-06, - "loss": 0.5317, - "step": 47646 - }, - { - "epoch": 1.22, - "learning_rate": 1.3424852433099795e-06, - "loss": 0.7529, - "step": 47647 - }, - { - "epoch": 1.22, - "learning_rate": 1.3424592461452622e-06, - "loss": 0.8477, - "step": 47648 - }, - { - "epoch": 1.22, - "learning_rate": 1.3424332487183398e-06, - "loss": 0.644, - "step": 47649 - }, - { - "epoch": 1.22, - "learning_rate": 1.342407251029232e-06, - "loss": 0.5557, - "step": 47650 - }, - { - "epoch": 1.22, - "learning_rate": 1.3423812530779585e-06, - "loss": 0.6484, - "step": 47651 - }, - { - "epoch": 1.22, - "learning_rate": 1.3423552548645398e-06, - "loss": 0.7148, - "step": 47652 - }, - { - "epoch": 1.22, - "learning_rate": 1.342329256388995e-06, - "loss": 0.5259, - "step": 47653 - }, - { - "epoch": 1.22, - "learning_rate": 1.342303257651345e-06, - "loss": 0.5342, - "step": 47654 - }, - { - "epoch": 1.22, - "learning_rate": 1.3422772586516084e-06, - "loss": 0.5923, - "step": 47655 - }, - { - "epoch": 1.22, - "learning_rate": 1.3422512593898066e-06, - "loss": 0.7227, - "step": 47656 - }, - { - "epoch": 1.22, - "learning_rate": 1.3422252598659583e-06, - "loss": 0.6006, - "step": 47657 - }, - { - "epoch": 1.22, - "learning_rate": 1.342199260080084e-06, - "loss": 0.4448, - "step": 47658 - }, - { - "epoch": 1.22, - "learning_rate": 1.3421732600322032e-06, - "loss": 0.7148, - "step": 47659 - }, - { - "epoch": 1.22, - "learning_rate": 1.3421472597223362e-06, - "loss": 0.5291, - "step": 47660 - }, - { - "epoch": 1.22, - "learning_rate": 1.342121259150503e-06, - "loss": 0.6943, - "step": 47661 - }, - { - "epoch": 1.22, - "learning_rate": 1.3420952583167232e-06, - "loss": 0.71, - "step": 47662 - }, - { - "epoch": 1.22, - "learning_rate": 1.3420692572210163e-06, - "loss": 0.8076, - "step": 47663 - }, - { - "epoch": 1.22, - "learning_rate": 1.3420432558634035e-06, - "loss": 0.4449, - "step": 47664 - }, - { - "epoch": 1.22, - "learning_rate": 1.3420172542439033e-06, - "loss": 0.6392, - "step": 47665 - }, - { - "epoch": 1.22, - "learning_rate": 1.3419912523625365e-06, - "loss": 0.5742, - "step": 47666 - }, - { - "epoch": 1.22, - "learning_rate": 1.3419652502193226e-06, - "loss": 0.7617, - "step": 47667 - }, - { - "epoch": 1.22, - "learning_rate": 1.3419392478142818e-06, - "loss": 0.6548, - "step": 47668 - }, - { - "epoch": 1.22, - "learning_rate": 1.3419132451474336e-06, - "loss": 0.7246, - "step": 47669 - }, - { - "epoch": 1.22, - "learning_rate": 1.341887242218798e-06, - "loss": 0.6997, - "step": 47670 - }, - { - "epoch": 1.22, - "learning_rate": 1.3418612390283956e-06, - "loss": 0.8535, - "step": 47671 - }, - { - "epoch": 1.22, - "learning_rate": 1.3418352355762454e-06, - "loss": 0.4897, - "step": 47672 - }, - { - "epoch": 1.22, - "learning_rate": 1.341809231862368e-06, - "loss": 0.6572, - "step": 47673 - }, - { - "epoch": 1.22, - "learning_rate": 1.3417832278867828e-06, - "loss": 0.5825, - "step": 47674 - }, - { - "epoch": 1.22, - "learning_rate": 1.3417572236495097e-06, - "loss": 0.8179, - "step": 47675 - }, - { - "epoch": 1.22, - "learning_rate": 1.341731219150569e-06, - "loss": 0.6787, - "step": 47676 - }, - { - "epoch": 1.22, - "learning_rate": 1.3417052143899804e-06, - "loss": 0.7236, - "step": 47677 - }, - { - "epoch": 1.22, - "learning_rate": 1.3416792093677636e-06, - "loss": 0.5474, - "step": 47678 - }, - { - "epoch": 1.22, - "learning_rate": 1.341653204083939e-06, - "loss": 0.7578, - "step": 47679 - }, - { - "epoch": 1.22, - "learning_rate": 1.3416271985385262e-06, - "loss": 0.5967, - "step": 47680 - }, - { - "epoch": 1.22, - "learning_rate": 1.3416011927315454e-06, - "loss": 0.728, - "step": 47681 - }, - { - "epoch": 1.22, - "learning_rate": 1.3415751866630159e-06, - "loss": 0.7568, - "step": 47682 - }, - { - "epoch": 1.22, - "learning_rate": 1.3415491803329582e-06, - "loss": 0.6021, - "step": 47683 - }, - { - "epoch": 1.22, - "learning_rate": 1.3415231737413917e-06, - "loss": 0.668, - "step": 47684 - }, - { - "epoch": 1.22, - "learning_rate": 1.341497166888337e-06, - "loss": 0.6111, - "step": 47685 - }, - { - "epoch": 1.22, - "learning_rate": 1.3414711597738136e-06, - "loss": 0.7959, - "step": 47686 - }, - { - "epoch": 1.22, - "learning_rate": 1.341445152397841e-06, - "loss": 0.7217, - "step": 47687 - }, - { - "epoch": 1.22, - "learning_rate": 1.3414191447604399e-06, - "loss": 0.752, - "step": 47688 - }, - { - "epoch": 1.22, - "learning_rate": 1.3413931368616297e-06, - "loss": 0.8281, - "step": 47689 - }, - { - "epoch": 1.22, - "learning_rate": 1.3413671287014305e-06, - "loss": 0.5454, - "step": 47690 - }, - { - "epoch": 1.22, - "learning_rate": 1.3413411202798625e-06, - "loss": 0.6475, - "step": 47691 - }, - { - "epoch": 1.22, - "learning_rate": 1.341315111596945e-06, - "loss": 0.6047, - "step": 47692 - }, - { - "epoch": 1.22, - "learning_rate": 1.3412891026526984e-06, - "loss": 0.7559, - "step": 47693 - }, - { - "epoch": 1.22, - "learning_rate": 1.3412630934471422e-06, - "loss": 0.7744, - "step": 47694 - }, - { - "epoch": 1.22, - "learning_rate": 1.3412370839802968e-06, - "loss": 0.6208, - "step": 47695 - }, - { - "epoch": 1.22, - "learning_rate": 1.3412110742521815e-06, - "loss": 0.7451, - "step": 47696 - }, - { - "epoch": 1.22, - "learning_rate": 1.3411850642628165e-06, - "loss": 0.519, - "step": 47697 - }, - { - "epoch": 1.22, - "learning_rate": 1.3411590540122224e-06, - "loss": 0.4883, - "step": 47698 - }, - { - "epoch": 1.22, - "learning_rate": 1.341133043500418e-06, - "loss": 0.5957, - "step": 47699 - }, - { - "epoch": 1.22, - "learning_rate": 1.341107032727424e-06, - "loss": 0.7236, - "step": 47700 - }, - { - "epoch": 1.22, - "learning_rate": 1.3410810216932597e-06, - "loss": 0.7139, - "step": 47701 - }, - { - "epoch": 1.22, - "learning_rate": 1.3410550103979456e-06, - "loss": 0.8838, - "step": 47702 - }, - { - "epoch": 1.22, - "learning_rate": 1.3410289988415013e-06, - "loss": 0.2537, - "step": 47703 - }, - { - "epoch": 1.22, - "learning_rate": 1.3410029870239468e-06, - "loss": 0.6123, - "step": 47704 - }, - { - "epoch": 1.22, - "learning_rate": 1.340976974945302e-06, - "loss": 0.6182, - "step": 47705 - }, - { - "epoch": 1.22, - "learning_rate": 1.340950962605587e-06, - "loss": 0.6626, - "step": 47706 - }, - { - "epoch": 1.22, - "learning_rate": 1.3409249500048211e-06, - "loss": 0.6377, - "step": 47707 - }, - { - "epoch": 1.22, - "learning_rate": 1.340898937143025e-06, - "loss": 0.623, - "step": 47708 - }, - { - "epoch": 1.22, - "learning_rate": 1.3408729240202178e-06, - "loss": 0.6689, - "step": 47709 - }, - { - "epoch": 1.22, - "learning_rate": 1.3408469106364202e-06, - "loss": 0.6865, - "step": 47710 - }, - { - "epoch": 1.22, - "learning_rate": 1.3408208969916519e-06, - "loss": 0.7842, - "step": 47711 - }, - { - "epoch": 1.22, - "learning_rate": 1.3407948830859327e-06, - "loss": 0.6289, - "step": 47712 - }, - { - "epoch": 1.22, - "learning_rate": 1.3407688689192822e-06, - "loss": 0.6724, - "step": 47713 - }, - { - "epoch": 1.22, - "learning_rate": 1.340742854491721e-06, - "loss": 0.4648, - "step": 47714 - }, - { - "epoch": 1.22, - "learning_rate": 1.3407168398032684e-06, - "loss": 0.6606, - "step": 47715 - }, - { - "epoch": 1.22, - "learning_rate": 1.3406908248539446e-06, - "loss": 0.6611, - "step": 47716 - }, - { - "epoch": 1.22, - "learning_rate": 1.3406648096437699e-06, - "loss": 0.5879, - "step": 47717 - }, - { - "epoch": 1.22, - "learning_rate": 1.3406387941727632e-06, - "loss": 0.5698, - "step": 47718 - }, - { - "epoch": 1.22, - "learning_rate": 1.3406127784409456e-06, - "loss": 0.5986, - "step": 47719 - }, - { - "epoch": 1.22, - "learning_rate": 1.340586762448336e-06, - "loss": 0.877, - "step": 47720 - }, - { - "epoch": 1.22, - "learning_rate": 1.340560746194955e-06, - "loss": 0.7017, - "step": 47721 - }, - { - "epoch": 1.22, - "learning_rate": 1.3405347296808222e-06, - "loss": 0.6875, - "step": 47722 - }, - { - "epoch": 1.22, - "learning_rate": 1.340508712905958e-06, - "loss": 0.6699, - "step": 47723 - }, - { - "epoch": 1.22, - "learning_rate": 1.3404826958703813e-06, - "loss": 0.6611, - "step": 47724 - }, - { - "epoch": 1.22, - "learning_rate": 1.3404566785741133e-06, - "loss": 0.645, - "step": 47725 - }, - { - "epoch": 1.22, - "learning_rate": 1.340430661017173e-06, - "loss": 0.4539, - "step": 47726 - }, - { - "epoch": 1.22, - "learning_rate": 1.3404046431995806e-06, - "loss": 0.6646, - "step": 47727 - }, - { - "epoch": 1.22, - "learning_rate": 1.3403786251213559e-06, - "loss": 0.5815, - "step": 47728 - }, - { - "epoch": 1.22, - "learning_rate": 1.340352606782519e-06, - "loss": 0.6943, - "step": 47729 - }, - { - "epoch": 1.22, - "learning_rate": 1.3403265881830898e-06, - "loss": 0.7637, - "step": 47730 - }, - { - "epoch": 1.22, - "learning_rate": 1.3403005693230882e-06, - "loss": 0.6714, - "step": 47731 - }, - { - "epoch": 1.22, - "learning_rate": 1.340274550202534e-06, - "loss": 0.6318, - "step": 47732 - }, - { - "epoch": 1.22, - "learning_rate": 1.3402485308214472e-06, - "loss": 0.6216, - "step": 47733 - }, - { - "epoch": 1.22, - "learning_rate": 1.3402225111798477e-06, - "loss": 0.7744, - "step": 47734 - }, - { - "epoch": 1.22, - "learning_rate": 1.3401964912777556e-06, - "loss": 0.6172, - "step": 47735 - }, - { - "epoch": 1.22, - "learning_rate": 1.3401704711151908e-06, - "loss": 0.5933, - "step": 47736 - }, - { - "epoch": 1.22, - "learning_rate": 1.3401444506921733e-06, - "loss": 0.6289, - "step": 47737 - }, - { - "epoch": 1.22, - "learning_rate": 1.3401184300087224e-06, - "loss": 0.8311, - "step": 47738 - }, - { - "epoch": 1.22, - "learning_rate": 1.3400924090648586e-06, - "loss": 0.6553, - "step": 47739 - }, - { - "epoch": 1.22, - "learning_rate": 1.3400663878606016e-06, - "loss": 0.7178, - "step": 47740 - }, - { - "epoch": 1.22, - "learning_rate": 1.3400403663959714e-06, - "loss": 0.6294, - "step": 47741 - }, - { - "epoch": 1.22, - "learning_rate": 1.3400143446709882e-06, - "loss": 0.5378, - "step": 47742 - }, - { - "epoch": 1.22, - "learning_rate": 1.3399883226856711e-06, - "loss": 0.6885, - "step": 47743 - }, - { - "epoch": 1.22, - "learning_rate": 1.3399623004400412e-06, - "loss": 0.6785, - "step": 47744 - }, - { - "epoch": 1.22, - "learning_rate": 1.3399362779341175e-06, - "loss": 0.4929, - "step": 47745 - }, - { - "epoch": 1.22, - "learning_rate": 1.3399102551679202e-06, - "loss": 0.6641, - "step": 47746 - }, - { - "epoch": 1.22, - "learning_rate": 1.3398842321414692e-06, - "loss": 0.6865, - "step": 47747 - }, - { - "epoch": 1.22, - "learning_rate": 1.3398582088547847e-06, - "loss": 0.709, - "step": 47748 - }, - { - "epoch": 1.22, - "learning_rate": 1.339832185307886e-06, - "loss": 0.7686, - "step": 47749 - }, - { - "epoch": 1.22, - "learning_rate": 1.3398061615007941e-06, - "loss": 0.6821, - "step": 47750 - }, - { - "epoch": 1.22, - "learning_rate": 1.3397801374335277e-06, - "loss": 0.5898, - "step": 47751 - }, - { - "epoch": 1.22, - "learning_rate": 1.3397541131061073e-06, - "loss": 0.6846, - "step": 47752 - }, - { - "epoch": 1.22, - "learning_rate": 1.3397280885185528e-06, - "loss": 0.6475, - "step": 47753 - }, - { - "epoch": 1.22, - "learning_rate": 1.3397020636708844e-06, - "loss": 0.6616, - "step": 47754 - }, - { - "epoch": 1.22, - "learning_rate": 1.3396760385631217e-06, - "loss": 0.7393, - "step": 47755 - }, - { - "epoch": 1.22, - "learning_rate": 1.3396500131952846e-06, - "loss": 0.6953, - "step": 47756 - }, - { - "epoch": 1.22, - "learning_rate": 1.3396239875673928e-06, - "loss": 0.8008, - "step": 47757 - }, - { - "epoch": 1.22, - "learning_rate": 1.3395979616794667e-06, - "loss": 0.5342, - "step": 47758 - }, - { - "epoch": 1.22, - "learning_rate": 1.3395719355315263e-06, - "loss": 0.636, - "step": 47759 - }, - { - "epoch": 1.22, - "learning_rate": 1.339545909123591e-06, - "loss": 0.6372, - "step": 47760 - }, - { - "epoch": 1.22, - "learning_rate": 1.3395198824556812e-06, - "loss": 0.6172, - "step": 47761 - }, - { - "epoch": 1.22, - "learning_rate": 1.3394938555278166e-06, - "loss": 0.6509, - "step": 47762 - }, - { - "epoch": 1.22, - "learning_rate": 1.3394678283400168e-06, - "loss": 0.5488, - "step": 47763 - }, - { - "epoch": 1.22, - "learning_rate": 1.3394418008923027e-06, - "loss": 0.6865, - "step": 47764 - }, - { - "epoch": 1.22, - "learning_rate": 1.3394157731846934e-06, - "loss": 0.8228, - "step": 47765 - }, - { - "epoch": 1.22, - "learning_rate": 1.339389745217209e-06, - "loss": 0.6182, - "step": 47766 - }, - { - "epoch": 1.22, - "learning_rate": 1.3393637169898695e-06, - "loss": 0.5708, - "step": 47767 - }, - { - "epoch": 1.22, - "learning_rate": 1.3393376885026945e-06, - "loss": 0.6543, - "step": 47768 - }, - { - "epoch": 1.22, - "learning_rate": 1.3393116597557047e-06, - "loss": 0.7314, - "step": 47769 - }, - { - "epoch": 1.22, - "learning_rate": 1.3392856307489196e-06, - "loss": 0.5785, - "step": 47770 - }, - { - "epoch": 1.22, - "learning_rate": 1.3392596014823587e-06, - "loss": 0.6763, - "step": 47771 - }, - { - "epoch": 1.22, - "learning_rate": 1.3392335719560424e-06, - "loss": 0.833, - "step": 47772 - }, - { - "epoch": 1.22, - "learning_rate": 1.3392075421699907e-06, - "loss": 0.6377, - "step": 47773 - }, - { - "epoch": 1.22, - "learning_rate": 1.3391815121242232e-06, - "loss": 0.5469, - "step": 47774 - }, - { - "epoch": 1.22, - "learning_rate": 1.3391554818187605e-06, - "loss": 0.6685, - "step": 47775 - }, - { - "epoch": 1.22, - "learning_rate": 1.3391294512536216e-06, - "loss": 0.6206, - "step": 47776 - }, - { - "epoch": 1.22, - "learning_rate": 1.3391034204288269e-06, - "loss": 0.6123, - "step": 47777 - }, - { - "epoch": 1.22, - "learning_rate": 1.3390773893443962e-06, - "loss": 0.7246, - "step": 47778 - }, - { - "epoch": 1.22, - "learning_rate": 1.3390513580003498e-06, - "loss": 0.5771, - "step": 47779 - }, - { - "epoch": 1.22, - "learning_rate": 1.3390253263967072e-06, - "loss": 0.8062, - "step": 47780 - }, - { - "epoch": 1.22, - "learning_rate": 1.3389992945334887e-06, - "loss": 0.604, - "step": 47781 - }, - { - "epoch": 1.22, - "learning_rate": 1.3389732624107138e-06, - "loss": 0.5923, - "step": 47782 - }, - { - "epoch": 1.22, - "learning_rate": 1.3389472300284027e-06, - "loss": 0.7383, - "step": 47783 - }, - { - "epoch": 1.22, - "learning_rate": 1.3389211973865752e-06, - "loss": 0.7803, - "step": 47784 - }, - { - "epoch": 1.22, - "learning_rate": 1.3388951644852514e-06, - "loss": 0.6768, - "step": 47785 - }, - { - "epoch": 1.22, - "learning_rate": 1.3388691313244515e-06, - "loss": 0.625, - "step": 47786 - }, - { - "epoch": 1.22, - "learning_rate": 1.3388430979041947e-06, - "loss": 0.6768, - "step": 47787 - }, - { - "epoch": 1.22, - "learning_rate": 1.3388170642245013e-06, - "loss": 0.7646, - "step": 47788 - }, - { - "epoch": 1.22, - "learning_rate": 1.3387910302853913e-06, - "loss": 0.8066, - "step": 47789 - }, - { - "epoch": 1.22, - "learning_rate": 1.338764996086885e-06, - "loss": 0.6299, - "step": 47790 - }, - { - "epoch": 1.22, - "learning_rate": 1.3387389616290016e-06, - "loss": 0.6318, - "step": 47791 - }, - { - "epoch": 1.22, - "learning_rate": 1.3387129269117612e-06, - "loss": 0.7783, - "step": 47792 - }, - { - "epoch": 1.22, - "learning_rate": 1.3386868919351839e-06, - "loss": 0.6475, - "step": 47793 - }, - { - "epoch": 1.22, - "learning_rate": 1.33866085669929e-06, - "loss": 0.5759, - "step": 47794 - }, - { - "epoch": 1.23, - "learning_rate": 1.3386348212040987e-06, - "loss": 0.7578, - "step": 47795 - }, - { - "epoch": 1.23, - "learning_rate": 1.3386087854496305e-06, - "loss": 0.6504, - "step": 47796 - }, - { - "epoch": 1.23, - "learning_rate": 1.3385827494359047e-06, - "loss": 0.6108, - "step": 47797 - }, - { - "epoch": 1.23, - "learning_rate": 1.338556713162942e-06, - "loss": 0.7148, - "step": 47798 - }, - { - "epoch": 1.23, - "learning_rate": 1.338530676630762e-06, - "loss": 0.6206, - "step": 47799 - }, - { - "epoch": 1.23, - "learning_rate": 1.3385046398393848e-06, - "loss": 0.5034, - "step": 47800 - }, - { - "epoch": 1.23, - "learning_rate": 1.3384786027888298e-06, - "loss": 0.6201, - "step": 47801 - }, - { - "epoch": 1.23, - "learning_rate": 1.3384525654791174e-06, - "loss": 0.7188, - "step": 47802 - }, - { - "epoch": 1.23, - "learning_rate": 1.3384265279102675e-06, - "loss": 0.5347, - "step": 47803 - }, - { - "epoch": 1.23, - "learning_rate": 1.3384004900823e-06, - "loss": 0.5781, - "step": 47804 - }, - { - "epoch": 1.23, - "learning_rate": 1.3383744519952346e-06, - "loss": 0.6724, - "step": 47805 - }, - { - "epoch": 1.23, - "learning_rate": 1.3383484136490916e-06, - "loss": 0.5522, - "step": 47806 - }, - { - "epoch": 1.23, - "learning_rate": 1.3383223750438908e-06, - "loss": 0.7529, - "step": 47807 - }, - { - "epoch": 1.23, - "learning_rate": 1.3382963361796519e-06, - "loss": 0.7588, - "step": 47808 - }, - { - "epoch": 1.23, - "learning_rate": 1.3382702970563953e-06, - "loss": 0.7715, - "step": 47809 - }, - { - "epoch": 1.23, - "learning_rate": 1.3382442576741407e-06, - "loss": 0.6562, - "step": 47810 - }, - { - "epoch": 1.23, - "learning_rate": 1.338218218032908e-06, - "loss": 0.646, - "step": 47811 - }, - { - "epoch": 1.23, - "learning_rate": 1.338192178132717e-06, - "loss": 0.8008, - "step": 47812 - }, - { - "epoch": 1.23, - "learning_rate": 1.338166137973588e-06, - "loss": 0.5906, - "step": 47813 - }, - { - "epoch": 1.23, - "learning_rate": 1.3381400975555406e-06, - "loss": 0.7383, - "step": 47814 - }, - { - "epoch": 1.23, - "learning_rate": 1.3381140568785952e-06, - "loss": 0.707, - "step": 47815 - }, - { - "epoch": 1.23, - "learning_rate": 1.338088015942771e-06, - "loss": 0.5522, - "step": 47816 - }, - { - "epoch": 1.23, - "learning_rate": 1.3380619747480883e-06, - "loss": 0.5986, - "step": 47817 - }, - { - "epoch": 1.23, - "learning_rate": 1.3380359332945673e-06, - "loss": 0.604, - "step": 47818 - }, - { - "epoch": 1.23, - "learning_rate": 1.3380098915822277e-06, - "loss": 0.7432, - "step": 47819 - }, - { - "epoch": 1.23, - "learning_rate": 1.3379838496110895e-06, - "loss": 0.6296, - "step": 47820 - }, - { - "epoch": 1.23, - "learning_rate": 1.3379578073811728e-06, - "loss": 0.7471, - "step": 47821 - }, - { - "epoch": 1.23, - "learning_rate": 1.3379317648924968e-06, - "loss": 0.6396, - "step": 47822 - }, - { - "epoch": 1.23, - "learning_rate": 1.3379057221450825e-06, - "loss": 0.4263, - "step": 47823 - }, - { - "epoch": 1.23, - "learning_rate": 1.337879679138949e-06, - "loss": 0.5232, - "step": 47824 - }, - { - "epoch": 1.23, - "learning_rate": 1.3378536358741168e-06, - "loss": 0.6504, - "step": 47825 - }, - { - "epoch": 1.23, - "learning_rate": 1.3378275923506054e-06, - "loss": 0.7153, - "step": 47826 - }, - { - "epoch": 1.23, - "learning_rate": 1.3378015485684354e-06, - "loss": 0.5132, - "step": 47827 - }, - { - "epoch": 1.23, - "learning_rate": 1.3377755045276255e-06, - "loss": 0.6807, - "step": 47828 - }, - { - "epoch": 1.23, - "learning_rate": 1.337749460228197e-06, - "loss": 0.6973, - "step": 47829 - }, - { - "epoch": 1.23, - "learning_rate": 1.3377234156701693e-06, - "loss": 0.4907, - "step": 47830 - }, - { - "epoch": 1.23, - "learning_rate": 1.337697370853562e-06, - "loss": 0.6616, - "step": 47831 - }, - { - "epoch": 1.23, - "learning_rate": 1.3376713257783955e-06, - "loss": 0.748, - "step": 47832 - }, - { - "epoch": 1.23, - "learning_rate": 1.3376452804446894e-06, - "loss": 0.5129, - "step": 47833 - }, - { - "epoch": 1.23, - "learning_rate": 1.3376192348524641e-06, - "loss": 0.7119, - "step": 47834 - }, - { - "epoch": 1.23, - "learning_rate": 1.3375931890017393e-06, - "loss": 0.708, - "step": 47835 - }, - { - "epoch": 1.23, - "learning_rate": 1.3375671428925349e-06, - "loss": 0.6221, - "step": 47836 - }, - { - "epoch": 1.23, - "learning_rate": 1.3375410965248706e-06, - "loss": 0.6533, - "step": 47837 - }, - { - "epoch": 1.23, - "learning_rate": 1.337515049898767e-06, - "loss": 0.6533, - "step": 47838 - }, - { - "epoch": 1.23, - "learning_rate": 1.3374890030142432e-06, - "loss": 0.7876, - "step": 47839 - }, - { - "epoch": 1.23, - "learning_rate": 1.33746295587132e-06, - "loss": 0.6914, - "step": 47840 - }, - { - "epoch": 1.23, - "learning_rate": 1.3374369084700166e-06, - "loss": 0.7705, - "step": 47841 - }, - { - "epoch": 1.23, - "learning_rate": 1.3374108608103536e-06, - "loss": 0.5605, - "step": 47842 - }, - { - "epoch": 1.23, - "learning_rate": 1.3373848128923501e-06, - "loss": 0.7139, - "step": 47843 - }, - { - "epoch": 1.23, - "learning_rate": 1.3373587647160273e-06, - "loss": 0.7754, - "step": 47844 - }, - { - "epoch": 1.23, - "learning_rate": 1.3373327162814038e-06, - "loss": 0.5366, - "step": 47845 - }, - { - "epoch": 1.23, - "learning_rate": 1.3373066675885005e-06, - "loss": 0.6177, - "step": 47846 - }, - { - "epoch": 1.23, - "learning_rate": 1.3372806186373367e-06, - "loss": 0.8486, - "step": 47847 - }, - { - "epoch": 1.23, - "learning_rate": 1.3372545694279328e-06, - "loss": 0.7109, - "step": 47848 - }, - { - "epoch": 1.23, - "learning_rate": 1.3372285199603087e-06, - "loss": 0.5869, - "step": 47849 - }, - { - "epoch": 1.23, - "learning_rate": 1.3372024702344839e-06, - "loss": 0.6489, - "step": 47850 - }, - { - "epoch": 1.23, - "learning_rate": 1.337176420250479e-06, - "loss": 0.8379, - "step": 47851 - }, - { - "epoch": 1.23, - "learning_rate": 1.3371503700083133e-06, - "loss": 0.6455, - "step": 47852 - }, - { - "epoch": 1.23, - "learning_rate": 1.3371243195080073e-06, - "loss": 0.7842, - "step": 47853 - }, - { - "epoch": 1.23, - "learning_rate": 1.337098268749581e-06, - "loss": 0.5139, - "step": 47854 - }, - { - "epoch": 1.23, - "learning_rate": 1.3370722177330536e-06, - "loss": 0.7227, - "step": 47855 - }, - { - "epoch": 1.23, - "learning_rate": 1.3370461664584456e-06, - "loss": 0.4407, - "step": 47856 - }, - { - "epoch": 1.23, - "learning_rate": 1.3370201149257767e-06, - "loss": 0.5625, - "step": 47857 - }, - { - "epoch": 1.23, - "learning_rate": 1.336994063135067e-06, - "loss": 0.5251, - "step": 47858 - }, - { - "epoch": 1.23, - "learning_rate": 1.3369680110863368e-06, - "loss": 0.6138, - "step": 47859 - }, - { - "epoch": 1.23, - "learning_rate": 1.3369419587796055e-06, - "loss": 0.752, - "step": 47860 - }, - { - "epoch": 1.23, - "learning_rate": 1.3369159062148933e-06, - "loss": 0.7461, - "step": 47861 - }, - { - "epoch": 1.23, - "learning_rate": 1.3368898533922199e-06, - "loss": 0.6758, - "step": 47862 - }, - { - "epoch": 1.23, - "learning_rate": 1.3368638003116057e-06, - "loss": 0.6768, - "step": 47863 - }, - { - "epoch": 1.23, - "learning_rate": 1.3368377469730702e-06, - "loss": 0.6431, - "step": 47864 - }, - { - "epoch": 1.23, - "learning_rate": 1.3368116933766339e-06, - "loss": 0.7227, - "step": 47865 - }, - { - "epoch": 1.23, - "learning_rate": 1.3367856395223158e-06, - "loss": 0.666, - "step": 47866 - }, - { - "epoch": 1.23, - "learning_rate": 1.3367595854101366e-06, - "loss": 0.834, - "step": 47867 - }, - { - "epoch": 1.23, - "learning_rate": 1.336733531040116e-06, - "loss": 0.6475, - "step": 47868 - }, - { - "epoch": 1.23, - "learning_rate": 1.336707476412274e-06, - "loss": 0.7957, - "step": 47869 - }, - { - "epoch": 1.23, - "learning_rate": 1.336681421526631e-06, - "loss": 0.6465, - "step": 47870 - }, - { - "epoch": 1.23, - "learning_rate": 1.3366553663832063e-06, - "loss": 0.6123, - "step": 47871 - }, - { - "epoch": 1.23, - "learning_rate": 1.3366293109820198e-06, - "loss": 0.46, - "step": 47872 - }, - { - "epoch": 1.23, - "learning_rate": 1.336603255323092e-06, - "loss": 0.7617, - "step": 47873 - }, - { - "epoch": 1.23, - "learning_rate": 1.3365771994064422e-06, - "loss": 0.5649, - "step": 47874 - }, - { - "epoch": 1.23, - "learning_rate": 1.336551143232091e-06, - "loss": 0.8428, - "step": 47875 - }, - { - "epoch": 1.23, - "learning_rate": 1.3365250868000582e-06, - "loss": 0.6265, - "step": 47876 - }, - { - "epoch": 1.23, - "learning_rate": 1.3364990301103634e-06, - "loss": 0.7168, - "step": 47877 - }, - { - "epoch": 1.23, - "learning_rate": 1.3364729731630269e-06, - "loss": 0.6084, - "step": 47878 - }, - { - "epoch": 1.23, - "learning_rate": 1.3364469159580682e-06, - "loss": 0.79, - "step": 47879 - }, - { - "epoch": 1.23, - "learning_rate": 1.336420858495508e-06, - "loss": 0.6514, - "step": 47880 - }, - { - "epoch": 1.23, - "learning_rate": 1.3363948007753655e-06, - "loss": 0.6855, - "step": 47881 - }, - { - "epoch": 1.23, - "learning_rate": 1.3363687427976612e-06, - "loss": 0.6479, - "step": 47882 - }, - { - "epoch": 1.23, - "learning_rate": 1.3363426845624147e-06, - "loss": 0.6281, - "step": 47883 - }, - { - "epoch": 1.23, - "learning_rate": 1.3363166260696462e-06, - "loss": 0.5923, - "step": 47884 - }, - { - "epoch": 1.23, - "learning_rate": 1.3362905673193755e-06, - "loss": 0.9531, - "step": 47885 - }, - { - "epoch": 1.23, - "learning_rate": 1.3362645083116224e-06, - "loss": 0.7344, - "step": 47886 - }, - { - "epoch": 1.23, - "learning_rate": 1.3362384490464069e-06, - "loss": 0.6401, - "step": 47887 - }, - { - "epoch": 1.23, - "learning_rate": 1.3362123895237494e-06, - "loss": 0.6982, - "step": 47888 - }, - { - "epoch": 1.23, - "learning_rate": 1.3361863297436694e-06, - "loss": 0.7588, - "step": 47889 - }, - { - "epoch": 1.23, - "learning_rate": 1.336160269706187e-06, - "loss": 0.7295, - "step": 47890 - }, - { - "epoch": 1.23, - "learning_rate": 1.336134209411322e-06, - "loss": 0.7285, - "step": 47891 - }, - { - "epoch": 1.23, - "learning_rate": 1.3361081488590948e-06, - "loss": 0.5039, - "step": 47892 - }, - { - "epoch": 1.23, - "learning_rate": 1.3360820880495248e-06, - "loss": 0.6147, - "step": 47893 - }, - { - "epoch": 1.23, - "learning_rate": 1.3360560269826325e-06, - "loss": 0.8154, - "step": 47894 - }, - { - "epoch": 1.23, - "learning_rate": 1.3360299656584372e-06, - "loss": 0.7168, - "step": 47895 - }, - { - "epoch": 1.23, - "learning_rate": 1.3360039040769593e-06, - "loss": 0.5345, - "step": 47896 - }, - { - "epoch": 1.23, - "learning_rate": 1.3359778422382188e-06, - "loss": 0.6426, - "step": 47897 - }, - { - "epoch": 1.23, - "learning_rate": 1.3359517801422352e-06, - "loss": 0.4607, - "step": 47898 - }, - { - "epoch": 1.23, - "learning_rate": 1.335925717789029e-06, - "loss": 0.7705, - "step": 47899 - }, - { - "epoch": 1.23, - "learning_rate": 1.33589965517862e-06, - "loss": 0.8408, - "step": 47900 - }, - { - "epoch": 1.23, - "learning_rate": 1.335873592311028e-06, - "loss": 0.2503, - "step": 47901 - }, - { - "epoch": 1.23, - "learning_rate": 1.335847529186273e-06, - "loss": 0.5664, - "step": 47902 - }, - { - "epoch": 1.23, - "learning_rate": 1.3358214658043751e-06, - "loss": 0.7061, - "step": 47903 - }, - { - "epoch": 1.23, - "learning_rate": 1.335795402165354e-06, - "loss": 0.6738, - "step": 47904 - }, - { - "epoch": 1.23, - "learning_rate": 1.3357693382692302e-06, - "loss": 0.8096, - "step": 47905 - }, - { - "epoch": 1.23, - "learning_rate": 1.3357432741160226e-06, - "loss": 0.7402, - "step": 47906 - }, - { - "epoch": 1.23, - "learning_rate": 1.3357172097057521e-06, - "loss": 0.6748, - "step": 47907 - }, - { - "epoch": 1.23, - "learning_rate": 1.3356911450384383e-06, - "loss": 0.7554, - "step": 47908 - }, - { - "epoch": 1.23, - "learning_rate": 1.3356650801141014e-06, - "loss": 0.6729, - "step": 47909 - }, - { - "epoch": 1.23, - "learning_rate": 1.3356390149327612e-06, - "loss": 0.5745, - "step": 47910 - }, - { - "epoch": 1.23, - "learning_rate": 1.3356129494944377e-06, - "loss": 0.6904, - "step": 47911 - }, - { - "epoch": 1.23, - "learning_rate": 1.3355868837991503e-06, - "loss": 0.6489, - "step": 47912 - }, - { - "epoch": 1.23, - "learning_rate": 1.33556081784692e-06, - "loss": 0.6699, - "step": 47913 - }, - { - "epoch": 1.23, - "learning_rate": 1.3355347516377658e-06, - "loss": 0.6787, - "step": 47914 - }, - { - "epoch": 1.23, - "learning_rate": 1.3355086851717084e-06, - "loss": 0.646, - "step": 47915 - }, - { - "epoch": 1.23, - "learning_rate": 1.3354826184487674e-06, - "loss": 0.71, - "step": 47916 - }, - { - "epoch": 1.23, - "learning_rate": 1.3354565514689625e-06, - "loss": 0.7031, - "step": 47917 - }, - { - "epoch": 1.23, - "learning_rate": 1.3354304842323142e-06, - "loss": 0.7036, - "step": 47918 - }, - { - "epoch": 1.23, - "learning_rate": 1.3354044167388424e-06, - "loss": 0.7109, - "step": 47919 - }, - { - "epoch": 1.23, - "learning_rate": 1.3353783489885664e-06, - "loss": 0.6836, - "step": 47920 - }, - { - "epoch": 1.23, - "learning_rate": 1.3353522809815067e-06, - "loss": 0.7544, - "step": 47921 - }, - { - "epoch": 1.23, - "learning_rate": 1.3353262127176833e-06, - "loss": 0.6299, - "step": 47922 - }, - { - "epoch": 1.23, - "learning_rate": 1.335300144197116e-06, - "loss": 0.7324, - "step": 47923 - }, - { - "epoch": 1.23, - "learning_rate": 1.335274075419825e-06, - "loss": 0.6479, - "step": 47924 - }, - { - "epoch": 1.23, - "learning_rate": 1.3352480063858299e-06, - "loss": 0.5059, - "step": 47925 - }, - { - "epoch": 1.23, - "learning_rate": 1.3352219370951508e-06, - "loss": 0.6582, - "step": 47926 - }, - { - "epoch": 1.23, - "learning_rate": 1.3351958675478074e-06, - "loss": 0.7197, - "step": 47927 - }, - { - "epoch": 1.23, - "learning_rate": 1.3351697977438203e-06, - "loss": 0.7354, - "step": 47928 - }, - { - "epoch": 1.23, - "learning_rate": 1.335143727683209e-06, - "loss": 0.5642, - "step": 47929 - }, - { - "epoch": 1.23, - "learning_rate": 1.335117657365994e-06, - "loss": 0.5176, - "step": 47930 - }, - { - "epoch": 1.23, - "learning_rate": 1.335091586792194e-06, - "loss": 0.7197, - "step": 47931 - }, - { - "epoch": 1.23, - "learning_rate": 1.3350655159618304e-06, - "loss": 0.5596, - "step": 47932 - }, - { - "epoch": 1.23, - "learning_rate": 1.335039444874922e-06, - "loss": 0.7314, - "step": 47933 - }, - { - "epoch": 1.23, - "learning_rate": 1.3350133735314897e-06, - "loss": 0.5508, - "step": 47934 - }, - { - "epoch": 1.23, - "learning_rate": 1.3349873019315532e-06, - "loss": 0.5557, - "step": 47935 - }, - { - "epoch": 1.23, - "learning_rate": 1.3349612300751321e-06, - "loss": 0.7422, - "step": 47936 - }, - { - "epoch": 1.23, - "learning_rate": 1.3349351579622464e-06, - "loss": 0.5918, - "step": 47937 - }, - { - "epoch": 1.23, - "learning_rate": 1.3349090855929167e-06, - "loss": 0.6704, - "step": 47938 - }, - { - "epoch": 1.23, - "learning_rate": 1.334883012967162e-06, - "loss": 0.7134, - "step": 47939 - }, - { - "epoch": 1.23, - "learning_rate": 1.334856940085003e-06, - "loss": 0.7002, - "step": 47940 - }, - { - "epoch": 1.23, - "learning_rate": 1.3348308669464596e-06, - "loss": 0.4358, - "step": 47941 - }, - { - "epoch": 1.23, - "learning_rate": 1.3348047935515513e-06, - "loss": 0.7207, - "step": 47942 - }, - { - "epoch": 1.23, - "learning_rate": 1.3347787199002987e-06, - "loss": 0.8242, - "step": 47943 - }, - { - "epoch": 1.23, - "learning_rate": 1.334752645992721e-06, - "loss": 0.4603, - "step": 47944 - }, - { - "epoch": 1.23, - "learning_rate": 1.3347265718288391e-06, - "loss": 0.668, - "step": 47945 - }, - { - "epoch": 1.23, - "learning_rate": 1.3347004974086721e-06, - "loss": 0.4412, - "step": 47946 - }, - { - "epoch": 1.23, - "learning_rate": 1.3346744227322404e-06, - "loss": 0.752, - "step": 47947 - }, - { - "epoch": 1.23, - "learning_rate": 1.3346483477995638e-06, - "loss": 0.5725, - "step": 47948 - }, - { - "epoch": 1.23, - "learning_rate": 1.3346222726106627e-06, - "loss": 0.6738, - "step": 47949 - }, - { - "epoch": 1.23, - "learning_rate": 1.3345961971655564e-06, - "loss": 0.6133, - "step": 47950 - }, - { - "epoch": 1.23, - "learning_rate": 1.3345701214642654e-06, - "loss": 0.4146, - "step": 47951 - }, - { - "epoch": 1.23, - "learning_rate": 1.3345440455068091e-06, - "loss": 0.5581, - "step": 47952 - }, - { - "epoch": 1.23, - "learning_rate": 1.334517969293208e-06, - "loss": 0.7559, - "step": 47953 - }, - { - "epoch": 1.23, - "learning_rate": 1.334491892823482e-06, - "loss": 0.7061, - "step": 47954 - }, - { - "epoch": 1.23, - "learning_rate": 1.334465816097651e-06, - "loss": 0.6157, - "step": 47955 - }, - { - "epoch": 1.23, - "learning_rate": 1.3344397391157345e-06, - "loss": 0.7104, - "step": 47956 - }, - { - "epoch": 1.23, - "learning_rate": 1.3344136618777531e-06, - "loss": 0.7559, - "step": 47957 - }, - { - "epoch": 1.23, - "learning_rate": 1.3343875843837262e-06, - "loss": 0.5698, - "step": 47958 - }, - { - "epoch": 1.23, - "learning_rate": 1.3343615066336747e-06, - "loss": 0.6421, - "step": 47959 - }, - { - "epoch": 1.23, - "learning_rate": 1.3343354286276176e-06, - "loss": 0.6299, - "step": 47960 - }, - { - "epoch": 1.23, - "learning_rate": 1.3343093503655753e-06, - "loss": 0.6934, - "step": 47961 - }, - { - "epoch": 1.23, - "learning_rate": 1.3342832718475677e-06, - "loss": 0.6768, - "step": 47962 - }, - { - "epoch": 1.23, - "learning_rate": 1.334257193073615e-06, - "loss": 0.7373, - "step": 47963 - }, - { - "epoch": 1.23, - "learning_rate": 1.3342311140437366e-06, - "loss": 0.5352, - "step": 47964 - }, - { - "epoch": 1.23, - "learning_rate": 1.3342050347579527e-06, - "loss": 0.6611, - "step": 47965 - }, - { - "epoch": 1.23, - "learning_rate": 1.3341789552162838e-06, - "loss": 0.708, - "step": 47966 - }, - { - "epoch": 1.23, - "learning_rate": 1.3341528754187493e-06, - "loss": 0.5266, - "step": 47967 - }, - { - "epoch": 1.23, - "learning_rate": 1.3341267953653691e-06, - "loss": 0.4386, - "step": 47968 - }, - { - "epoch": 1.23, - "learning_rate": 1.3341007150561634e-06, - "loss": 0.7085, - "step": 47969 - }, - { - "epoch": 1.23, - "learning_rate": 1.3340746344911526e-06, - "loss": 0.6914, - "step": 47970 - }, - { - "epoch": 1.23, - "learning_rate": 1.3340485536703557e-06, - "loss": 0.7383, - "step": 47971 - }, - { - "epoch": 1.23, - "learning_rate": 1.3340224725937934e-06, - "loss": 0.7295, - "step": 47972 - }, - { - "epoch": 1.23, - "learning_rate": 1.3339963912614854e-06, - "loss": 0.5806, - "step": 47973 - }, - { - "epoch": 1.23, - "learning_rate": 1.3339703096734518e-06, - "loss": 0.6689, - "step": 47974 - }, - { - "epoch": 1.23, - "learning_rate": 1.3339442278297127e-06, - "loss": 0.5256, - "step": 47975 - }, - { - "epoch": 1.23, - "learning_rate": 1.3339181457302876e-06, - "loss": 0.4756, - "step": 47976 - }, - { - "epoch": 1.23, - "learning_rate": 1.3338920633751964e-06, - "loss": 0.6543, - "step": 47977 - }, - { - "epoch": 1.23, - "learning_rate": 1.3338659807644598e-06, - "loss": 0.4434, - "step": 47978 - }, - { - "epoch": 1.23, - "learning_rate": 1.3338398978980972e-06, - "loss": 0.7314, - "step": 47979 - }, - { - "epoch": 1.23, - "learning_rate": 1.333813814776129e-06, - "loss": 0.6084, - "step": 47980 - }, - { - "epoch": 1.23, - "learning_rate": 1.3337877313985746e-06, - "loss": 0.5676, - "step": 47981 - }, - { - "epoch": 1.23, - "learning_rate": 1.3337616477654545e-06, - "loss": 0.7803, - "step": 47982 - }, - { - "epoch": 1.23, - "learning_rate": 1.3337355638767881e-06, - "loss": 0.5623, - "step": 47983 - }, - { - "epoch": 1.23, - "learning_rate": 1.3337094797325963e-06, - "loss": 0.6294, - "step": 47984 - }, - { - "epoch": 1.23, - "learning_rate": 1.3336833953328984e-06, - "loss": 0.71, - "step": 47985 - }, - { - "epoch": 1.23, - "learning_rate": 1.333657310677714e-06, - "loss": 0.7119, - "step": 47986 - }, - { - "epoch": 1.23, - "learning_rate": 1.3336312257670638e-06, - "loss": 0.6455, - "step": 47987 - }, - { - "epoch": 1.23, - "learning_rate": 1.3336051406009674e-06, - "loss": 0.6582, - "step": 47988 - }, - { - "epoch": 1.23, - "learning_rate": 1.333579055179445e-06, - "loss": 0.4951, - "step": 47989 - }, - { - "epoch": 1.23, - "learning_rate": 1.3335529695025165e-06, - "loss": 0.532, - "step": 47990 - }, - { - "epoch": 1.23, - "learning_rate": 1.3335268835702019e-06, - "loss": 0.6807, - "step": 47991 - }, - { - "epoch": 1.23, - "learning_rate": 1.333500797382521e-06, - "loss": 0.5803, - "step": 47992 - }, - { - "epoch": 1.23, - "learning_rate": 1.3334747109394938e-06, - "loss": 0.6719, - "step": 47993 - }, - { - "epoch": 1.23, - "learning_rate": 1.3334486242411403e-06, - "loss": 0.5967, - "step": 47994 - }, - { - "epoch": 1.23, - "learning_rate": 1.3334225372874808e-06, - "loss": 0.5586, - "step": 47995 - }, - { - "epoch": 1.23, - "learning_rate": 1.3333964500785348e-06, - "loss": 0.6719, - "step": 47996 - }, - { - "epoch": 1.23, - "learning_rate": 1.3333703626143224e-06, - "loss": 0.4644, - "step": 47997 - }, - { - "epoch": 1.23, - "learning_rate": 1.3333442748948637e-06, - "loss": 0.7168, - "step": 47998 - }, - { - "epoch": 1.23, - "learning_rate": 1.3333181869201786e-06, - "loss": 0.6025, - "step": 47999 - }, - { - "epoch": 1.23, - "learning_rate": 1.3332920986902873e-06, - "loss": 0.4795, - "step": 48000 - }, - { - "epoch": 1.23, - "learning_rate": 1.3332660102052096e-06, - "loss": 0.4429, - "step": 48001 - }, - { - "epoch": 1.23, - "learning_rate": 1.333239921464965e-06, - "loss": 0.5771, - "step": 48002 - }, - { - "epoch": 1.23, - "learning_rate": 1.3332138324695743e-06, - "loss": 0.5076, - "step": 48003 - }, - { - "epoch": 1.23, - "learning_rate": 1.3331877432190568e-06, - "loss": 0.6621, - "step": 48004 - }, - { - "epoch": 1.23, - "learning_rate": 1.333161653713433e-06, - "loss": 0.645, - "step": 48005 - }, - { - "epoch": 1.23, - "learning_rate": 1.3331355639527227e-06, - "loss": 0.5466, - "step": 48006 - }, - { - "epoch": 1.23, - "learning_rate": 1.3331094739369454e-06, - "loss": 0.7637, - "step": 48007 - }, - { - "epoch": 1.23, - "learning_rate": 1.3330833836661217e-06, - "loss": 0.5864, - "step": 48008 - }, - { - "epoch": 1.23, - "learning_rate": 1.3330572931402718e-06, - "loss": 0.7305, - "step": 48009 - }, - { - "epoch": 1.23, - "learning_rate": 1.3330312023594148e-06, - "loss": 0.5913, - "step": 48010 - }, - { - "epoch": 1.23, - "learning_rate": 1.333005111323571e-06, - "loss": 0.7734, - "step": 48011 - }, - { - "epoch": 1.23, - "learning_rate": 1.3329790200327608e-06, - "loss": 0.5488, - "step": 48012 - }, - { - "epoch": 1.23, - "learning_rate": 1.3329529284870036e-06, - "loss": 0.6289, - "step": 48013 - }, - { - "epoch": 1.23, - "learning_rate": 1.3329268366863202e-06, - "loss": 0.8311, - "step": 48014 - }, - { - "epoch": 1.23, - "learning_rate": 1.3329007446307295e-06, - "loss": 0.4629, - "step": 48015 - }, - { - "epoch": 1.23, - "learning_rate": 1.332874652320252e-06, - "loss": 0.7031, - "step": 48016 - }, - { - "epoch": 1.23, - "learning_rate": 1.332848559754908e-06, - "loss": 0.3967, - "step": 48017 - }, - { - "epoch": 1.23, - "learning_rate": 1.332822466934717e-06, - "loss": 0.6509, - "step": 48018 - }, - { - "epoch": 1.23, - "learning_rate": 1.3327963738596993e-06, - "loss": 0.5166, - "step": 48019 - }, - { - "epoch": 1.23, - "learning_rate": 1.3327702805298743e-06, - "loss": 0.728, - "step": 48020 - }, - { - "epoch": 1.23, - "learning_rate": 1.3327441869452627e-06, - "loss": 0.5691, - "step": 48021 - }, - { - "epoch": 1.23, - "learning_rate": 1.332718093105884e-06, - "loss": 0.7295, - "step": 48022 - }, - { - "epoch": 1.23, - "learning_rate": 1.3326919990117586e-06, - "loss": 0.7031, - "step": 48023 - }, - { - "epoch": 1.23, - "learning_rate": 1.3326659046629064e-06, - "loss": 0.6914, - "step": 48024 - }, - { - "epoch": 1.23, - "learning_rate": 1.3326398100593469e-06, - "loss": 0.6143, - "step": 48025 - }, - { - "epoch": 1.23, - "learning_rate": 1.3326137152011003e-06, - "loss": 0.5919, - "step": 48026 - }, - { - "epoch": 1.23, - "learning_rate": 1.3325876200881867e-06, - "loss": 0.8198, - "step": 48027 - }, - { - "epoch": 1.23, - "learning_rate": 1.3325615247206263e-06, - "loss": 0.6597, - "step": 48028 - }, - { - "epoch": 1.23, - "learning_rate": 1.3325354290984388e-06, - "loss": 0.7588, - "step": 48029 - }, - { - "epoch": 1.23, - "learning_rate": 1.332509333221644e-06, - "loss": 0.75, - "step": 48030 - }, - { - "epoch": 1.23, - "learning_rate": 1.3324832370902624e-06, - "loss": 0.5684, - "step": 48031 - }, - { - "epoch": 1.23, - "learning_rate": 1.3324571407043133e-06, - "loss": 0.6973, - "step": 48032 - }, - { - "epoch": 1.23, - "learning_rate": 1.332431044063817e-06, - "loss": 0.5669, - "step": 48033 - }, - { - "epoch": 1.23, - "learning_rate": 1.332404947168794e-06, - "loss": 0.48, - "step": 48034 - }, - { - "epoch": 1.23, - "learning_rate": 1.3323788500192637e-06, - "loss": 0.6597, - "step": 48035 - }, - { - "epoch": 1.23, - "learning_rate": 1.3323527526152458e-06, - "loss": 0.5735, - "step": 48036 - }, - { - "epoch": 1.23, - "learning_rate": 1.332326654956761e-06, - "loss": 0.5488, - "step": 48037 - }, - { - "epoch": 1.23, - "learning_rate": 1.3323005570438288e-06, - "loss": 0.7461, - "step": 48038 - }, - { - "epoch": 1.23, - "learning_rate": 1.33227445887647e-06, - "loss": 0.5083, - "step": 48039 - }, - { - "epoch": 1.23, - "learning_rate": 1.332248360454703e-06, - "loss": 0.6807, - "step": 48040 - }, - { - "epoch": 1.23, - "learning_rate": 1.3322222617785492e-06, - "loss": 0.6025, - "step": 48041 - }, - { - "epoch": 1.23, - "learning_rate": 1.3321961628480278e-06, - "loss": 0.6602, - "step": 48042 - }, - { - "epoch": 1.23, - "learning_rate": 1.332170063663159e-06, - "loss": 0.7266, - "step": 48043 - }, - { - "epoch": 1.23, - "learning_rate": 1.3321439642239635e-06, - "loss": 0.7539, - "step": 48044 - }, - { - "epoch": 1.23, - "learning_rate": 1.3321178645304602e-06, - "loss": 0.5908, - "step": 48045 - }, - { - "epoch": 1.23, - "learning_rate": 1.3320917645826694e-06, - "loss": 0.5146, - "step": 48046 - }, - { - "epoch": 1.23, - "learning_rate": 1.3320656643806116e-06, - "loss": 0.6064, - "step": 48047 - }, - { - "epoch": 1.23, - "learning_rate": 1.332039563924306e-06, - "loss": 0.7002, - "step": 48048 - }, - { - "epoch": 1.23, - "learning_rate": 1.3320134632137733e-06, - "loss": 0.7163, - "step": 48049 - }, - { - "epoch": 1.23, - "learning_rate": 1.331987362249033e-06, - "loss": 0.6626, - "step": 48050 - }, - { - "epoch": 1.23, - "learning_rate": 1.3319612610301051e-06, - "loss": 0.5933, - "step": 48051 - }, - { - "epoch": 1.23, - "learning_rate": 1.3319351595570098e-06, - "loss": 0.5098, - "step": 48052 - }, - { - "epoch": 1.23, - "learning_rate": 1.331909057829767e-06, - "loss": 0.4561, - "step": 48053 - }, - { - "epoch": 1.23, - "learning_rate": 1.331882955848397e-06, - "loss": 0.5938, - "step": 48054 - }, - { - "epoch": 1.23, - "learning_rate": 1.3318568536129192e-06, - "loss": 0.6001, - "step": 48055 - }, - { - "epoch": 1.23, - "learning_rate": 1.331830751123354e-06, - "loss": 0.5532, - "step": 48056 - }, - { - "epoch": 1.23, - "learning_rate": 1.3318046483797209e-06, - "loss": 0.7676, - "step": 48057 - }, - { - "epoch": 1.23, - "learning_rate": 1.3317785453820408e-06, - "loss": 0.5425, - "step": 48058 - }, - { - "epoch": 1.23, - "learning_rate": 1.3317524421303327e-06, - "loss": 0.751, - "step": 48059 - }, - { - "epoch": 1.23, - "learning_rate": 1.3317263386246173e-06, - "loss": 0.748, - "step": 48060 - }, - { - "epoch": 1.23, - "learning_rate": 1.331700234864914e-06, - "loss": 0.5284, - "step": 48061 - }, - { - "epoch": 1.23, - "learning_rate": 1.3316741308512434e-06, - "loss": 0.4646, - "step": 48062 - }, - { - "epoch": 1.23, - "learning_rate": 1.3316480265836248e-06, - "loss": 0.7266, - "step": 48063 - }, - { - "epoch": 1.23, - "learning_rate": 1.331621922062079e-06, - "loss": 0.7188, - "step": 48064 - }, - { - "epoch": 1.23, - "learning_rate": 1.331595817286625e-06, - "loss": 0.6621, - "step": 48065 - }, - { - "epoch": 1.23, - "learning_rate": 1.3315697122572838e-06, - "loss": 0.6992, - "step": 48066 - }, - { - "epoch": 1.23, - "learning_rate": 1.3315436069740746e-06, - "loss": 0.6069, - "step": 48067 - }, - { - "epoch": 1.23, - "learning_rate": 1.331517501437018e-06, - "loss": 0.6133, - "step": 48068 - }, - { - "epoch": 1.23, - "learning_rate": 1.3314913956461336e-06, - "loss": 0.6157, - "step": 48069 - }, - { - "epoch": 1.23, - "learning_rate": 1.3314652896014413e-06, - "loss": 0.7144, - "step": 48070 - }, - { - "epoch": 1.23, - "learning_rate": 1.3314391833029613e-06, - "loss": 0.7168, - "step": 48071 - }, - { - "epoch": 1.23, - "learning_rate": 1.3314130767507137e-06, - "loss": 0.7197, - "step": 48072 - }, - { - "epoch": 1.23, - "learning_rate": 1.3313869699447182e-06, - "loss": 0.707, - "step": 48073 - }, - { - "epoch": 1.23, - "learning_rate": 1.331360862884995e-06, - "loss": 0.6167, - "step": 48074 - }, - { - "epoch": 1.23, - "learning_rate": 1.3313347555715641e-06, - "loss": 0.7002, - "step": 48075 - }, - { - "epoch": 1.23, - "learning_rate": 1.3313086480044453e-06, - "loss": 0.6831, - "step": 48076 - }, - { - "epoch": 1.23, - "learning_rate": 1.331282540183659e-06, - "loss": 0.6807, - "step": 48077 - }, - { - "epoch": 1.23, - "learning_rate": 1.3312564321092243e-06, - "loss": 0.7285, - "step": 48078 - }, - { - "epoch": 1.23, - "learning_rate": 1.3312303237811624e-06, - "loss": 0.8096, - "step": 48079 - }, - { - "epoch": 1.23, - "learning_rate": 1.3312042151994924e-06, - "loss": 0.6128, - "step": 48080 - }, - { - "epoch": 1.23, - "learning_rate": 1.3311781063642346e-06, - "loss": 0.8462, - "step": 48081 - }, - { - "epoch": 1.23, - "learning_rate": 1.3311519972754086e-06, - "loss": 0.6616, - "step": 48082 - }, - { - "epoch": 1.23, - "learning_rate": 1.3311258879330352e-06, - "loss": 0.7598, - "step": 48083 - }, - { - "epoch": 1.23, - "learning_rate": 1.3310997783371338e-06, - "loss": 0.6855, - "step": 48084 - }, - { - "epoch": 1.23, - "learning_rate": 1.3310736684877246e-06, - "loss": 0.833, - "step": 48085 - }, - { - "epoch": 1.23, - "learning_rate": 1.3310475583848276e-06, - "loss": 0.7085, - "step": 48086 - }, - { - "epoch": 1.23, - "learning_rate": 1.3310214480284626e-06, - "loss": 0.6396, - "step": 48087 - }, - { - "epoch": 1.23, - "learning_rate": 1.3309953374186494e-06, - "loss": 0.6299, - "step": 48088 - }, - { - "epoch": 1.23, - "learning_rate": 1.3309692265554086e-06, - "loss": 0.6226, - "step": 48089 - }, - { - "epoch": 1.23, - "learning_rate": 1.3309431154387597e-06, - "loss": 0.6465, - "step": 48090 - }, - { - "epoch": 1.23, - "learning_rate": 1.3309170040687233e-06, - "loss": 0.6406, - "step": 48091 - }, - { - "epoch": 1.23, - "learning_rate": 1.3308908924453183e-06, - "loss": 0.7041, - "step": 48092 - }, - { - "epoch": 1.23, - "learning_rate": 1.3308647805685658e-06, - "loss": 0.8477, - "step": 48093 - }, - { - "epoch": 1.23, - "learning_rate": 1.3308386684384854e-06, - "loss": 0.5391, - "step": 48094 - }, - { - "epoch": 1.23, - "learning_rate": 1.3308125560550966e-06, - "loss": 0.7979, - "step": 48095 - }, - { - "epoch": 1.23, - "learning_rate": 1.3307864434184204e-06, - "loss": 0.4949, - "step": 48096 - }, - { - "epoch": 1.23, - "learning_rate": 1.3307603305284758e-06, - "loss": 0.8525, - "step": 48097 - }, - { - "epoch": 1.23, - "learning_rate": 1.3307342173852833e-06, - "loss": 0.5361, - "step": 48098 - }, - { - "epoch": 1.23, - "learning_rate": 1.330708103988863e-06, - "loss": 0.5391, - "step": 48099 - }, - { - "epoch": 1.23, - "learning_rate": 1.3306819903392347e-06, - "loss": 0.6396, - "step": 48100 - }, - { - "epoch": 1.23, - "learning_rate": 1.3306558764364181e-06, - "loss": 0.5918, - "step": 48101 - }, - { - "epoch": 1.23, - "learning_rate": 1.330629762280434e-06, - "loss": 0.7002, - "step": 48102 - }, - { - "epoch": 1.23, - "learning_rate": 1.3306036478713015e-06, - "loss": 0.5566, - "step": 48103 - }, - { - "epoch": 1.23, - "learning_rate": 1.330577533209041e-06, - "loss": 0.5786, - "step": 48104 - }, - { - "epoch": 1.23, - "learning_rate": 1.3305514182936729e-06, - "loss": 0.455, - "step": 48105 - }, - { - "epoch": 1.23, - "learning_rate": 1.3305253031252165e-06, - "loss": 0.5171, - "step": 48106 - }, - { - "epoch": 1.23, - "learning_rate": 1.3304991877036918e-06, - "loss": 0.6328, - "step": 48107 - }, - { - "epoch": 1.23, - "learning_rate": 1.3304730720291192e-06, - "loss": 0.6396, - "step": 48108 - }, - { - "epoch": 1.23, - "learning_rate": 1.330446956101519e-06, - "loss": 0.6523, - "step": 48109 - }, - { - "epoch": 1.23, - "learning_rate": 1.3304208399209104e-06, - "loss": 0.6748, - "step": 48110 - }, - { - "epoch": 1.23, - "learning_rate": 1.3303947234873135e-06, - "loss": 0.6787, - "step": 48111 - }, - { - "epoch": 1.23, - "learning_rate": 1.3303686068007492e-06, - "loss": 0.6914, - "step": 48112 - }, - { - "epoch": 1.23, - "learning_rate": 1.3303424898612363e-06, - "loss": 0.5142, - "step": 48113 - }, - { - "epoch": 1.23, - "learning_rate": 1.3303163726687955e-06, - "loss": 0.5137, - "step": 48114 - }, - { - "epoch": 1.23, - "learning_rate": 1.3302902552234468e-06, - "loss": 0.7422, - "step": 48115 - }, - { - "epoch": 1.23, - "learning_rate": 1.33026413752521e-06, - "loss": 0.5513, - "step": 48116 - }, - { - "epoch": 1.23, - "learning_rate": 1.330238019574105e-06, - "loss": 0.5874, - "step": 48117 - }, - { - "epoch": 1.23, - "learning_rate": 1.330211901370152e-06, - "loss": 0.7559, - "step": 48118 - }, - { - "epoch": 1.23, - "learning_rate": 1.330185782913371e-06, - "loss": 0.6226, - "step": 48119 - }, - { - "epoch": 1.23, - "learning_rate": 1.3301596642037815e-06, - "loss": 0.6934, - "step": 48120 - }, - { - "epoch": 1.23, - "learning_rate": 1.3301335452414044e-06, - "loss": 0.5776, - "step": 48121 - }, - { - "epoch": 1.23, - "learning_rate": 1.330107426026259e-06, - "loss": 0.7578, - "step": 48122 - }, - { - "epoch": 1.23, - "learning_rate": 1.3300813065583655e-06, - "loss": 0.7998, - "step": 48123 - }, - { - "epoch": 1.23, - "learning_rate": 1.3300551868377442e-06, - "loss": 0.7529, - "step": 48124 - }, - { - "epoch": 1.23, - "learning_rate": 1.3300290668644147e-06, - "loss": 0.9248, - "step": 48125 - }, - { - "epoch": 1.23, - "learning_rate": 1.3300029466383972e-06, - "loss": 0.6821, - "step": 48126 - }, - { - "epoch": 1.23, - "learning_rate": 1.3299768261597114e-06, - "loss": 0.5786, - "step": 48127 - }, - { - "epoch": 1.23, - "learning_rate": 1.3299507054283776e-06, - "loss": 0.5952, - "step": 48128 - }, - { - "epoch": 1.23, - "learning_rate": 1.329924584444416e-06, - "loss": 0.752, - "step": 48129 - }, - { - "epoch": 1.23, - "learning_rate": 1.3298984632078458e-06, - "loss": 0.5386, - "step": 48130 - }, - { - "epoch": 1.23, - "learning_rate": 1.3298723417186879e-06, - "loss": 0.6479, - "step": 48131 - }, - { - "epoch": 1.23, - "learning_rate": 1.3298462199769615e-06, - "loss": 0.6382, - "step": 48132 - }, - { - "epoch": 1.23, - "learning_rate": 1.3298200979826875e-06, - "loss": 0.6196, - "step": 48133 - }, - { - "epoch": 1.23, - "learning_rate": 1.329793975735885e-06, - "loss": 0.6133, - "step": 48134 - }, - { - "epoch": 1.23, - "learning_rate": 1.3297678532365747e-06, - "loss": 0.7002, - "step": 48135 - }, - { - "epoch": 1.23, - "learning_rate": 1.3297417304847761e-06, - "loss": 0.7852, - "step": 48136 - }, - { - "epoch": 1.23, - "learning_rate": 1.3297156074805099e-06, - "loss": 0.6099, - "step": 48137 - }, - { - "epoch": 1.23, - "learning_rate": 1.3296894842237951e-06, - "loss": 0.6885, - "step": 48138 - }, - { - "epoch": 1.23, - "learning_rate": 1.3296633607146523e-06, - "loss": 0.6562, - "step": 48139 - }, - { - "epoch": 1.23, - "learning_rate": 1.3296372369531017e-06, - "loss": 0.6211, - "step": 48140 - }, - { - "epoch": 1.23, - "learning_rate": 1.3296111129391628e-06, - "loss": 0.6509, - "step": 48141 - }, - { - "epoch": 1.23, - "learning_rate": 1.3295849886728558e-06, - "loss": 0.6758, - "step": 48142 - }, - { - "epoch": 1.23, - "learning_rate": 1.329558864154201e-06, - "loss": 0.668, - "step": 48143 - }, - { - "epoch": 1.23, - "learning_rate": 1.329532739383218e-06, - "loss": 0.9385, - "step": 48144 - }, - { - "epoch": 1.23, - "learning_rate": 1.3295066143599267e-06, - "loss": 0.6709, - "step": 48145 - }, - { - "epoch": 1.23, - "learning_rate": 1.3294804890843475e-06, - "loss": 0.5469, - "step": 48146 - }, - { - "epoch": 1.23, - "learning_rate": 1.3294543635565e-06, - "loss": 0.7373, - "step": 48147 - }, - { - "epoch": 1.23, - "learning_rate": 1.329428237776405e-06, - "loss": 0.6929, - "step": 48148 - }, - { - "epoch": 1.23, - "learning_rate": 1.3294021117440817e-06, - "loss": 0.7236, - "step": 48149 - }, - { - "epoch": 1.23, - "learning_rate": 1.3293759854595503e-06, - "loss": 0.6504, - "step": 48150 - }, - { - "epoch": 1.23, - "learning_rate": 1.3293498589228307e-06, - "loss": 0.7764, - "step": 48151 - }, - { - "epoch": 1.23, - "learning_rate": 1.3293237321339433e-06, - "loss": 0.573, - "step": 48152 - }, - { - "epoch": 1.23, - "learning_rate": 1.3292976050929077e-06, - "loss": 0.6416, - "step": 48153 - }, - { - "epoch": 1.23, - "learning_rate": 1.3292714777997443e-06, - "loss": 0.5337, - "step": 48154 - }, - { - "epoch": 1.23, - "learning_rate": 1.3292453502544725e-06, - "loss": 0.5669, - "step": 48155 - }, - { - "epoch": 1.23, - "learning_rate": 1.329219222457113e-06, - "loss": 0.9121, - "step": 48156 - }, - { - "epoch": 1.23, - "learning_rate": 1.3291930944076853e-06, - "loss": 0.7354, - "step": 48157 - }, - { - "epoch": 1.23, - "learning_rate": 1.3291669661062094e-06, - "loss": 0.6602, - "step": 48158 - }, - { - "epoch": 1.23, - "learning_rate": 1.329140837552706e-06, - "loss": 0.5757, - "step": 48159 - }, - { - "epoch": 1.23, - "learning_rate": 1.3291147087471943e-06, - "loss": 0.5754, - "step": 48160 - }, - { - "epoch": 1.23, - "learning_rate": 1.3290885796896945e-06, - "loss": 0.6436, - "step": 48161 - }, - { - "epoch": 1.23, - "learning_rate": 1.3290624503802268e-06, - "loss": 0.6055, - "step": 48162 - }, - { - "epoch": 1.23, - "learning_rate": 1.329036320818811e-06, - "loss": 0.7207, - "step": 48163 - }, - { - "epoch": 1.23, - "learning_rate": 1.3290101910054677e-06, - "loss": 0.6611, - "step": 48164 - }, - { - "epoch": 1.23, - "learning_rate": 1.328984060940216e-06, - "loss": 0.8027, - "step": 48165 - }, - { - "epoch": 1.23, - "learning_rate": 1.3289579306230763e-06, - "loss": 0.9043, - "step": 48166 - }, - { - "epoch": 1.23, - "learning_rate": 1.3289318000540687e-06, - "loss": 0.7578, - "step": 48167 - }, - { - "epoch": 1.23, - "learning_rate": 1.328905669233213e-06, - "loss": 0.5898, - "step": 48168 - }, - { - "epoch": 1.23, - "learning_rate": 1.32887953816053e-06, - "loss": 0.6445, - "step": 48169 - }, - { - "epoch": 1.23, - "learning_rate": 1.3288534068360383e-06, - "loss": 0.6523, - "step": 48170 - }, - { - "epoch": 1.23, - "learning_rate": 1.3288272752597592e-06, - "loss": 0.6279, - "step": 48171 - }, - { - "epoch": 1.23, - "learning_rate": 1.3288011434317116e-06, - "loss": 0.5586, - "step": 48172 - }, - { - "epoch": 1.23, - "learning_rate": 1.3287750113519168e-06, - "loss": 0.7559, - "step": 48173 - }, - { - "epoch": 1.23, - "learning_rate": 1.3287488790203936e-06, - "loss": 0.6582, - "step": 48174 - }, - { - "epoch": 1.23, - "learning_rate": 1.3287227464371626e-06, - "loss": 0.5737, - "step": 48175 - }, - { - "epoch": 1.23, - "learning_rate": 1.3286966136022438e-06, - "loss": 0.5557, - "step": 48176 - }, - { - "epoch": 1.23, - "learning_rate": 1.328670480515657e-06, - "loss": 0.6484, - "step": 48177 - }, - { - "epoch": 1.23, - "learning_rate": 1.3286443471774222e-06, - "loss": 0.5081, - "step": 48178 - }, - { - "epoch": 1.23, - "learning_rate": 1.32861821358756e-06, - "loss": 0.7275, - "step": 48179 - }, - { - "epoch": 1.23, - "learning_rate": 1.3285920797460897e-06, - "loss": 0.5913, - "step": 48180 - }, - { - "epoch": 1.23, - "learning_rate": 1.3285659456530314e-06, - "loss": 0.4437, - "step": 48181 - }, - { - "epoch": 1.23, - "learning_rate": 1.3285398113084053e-06, - "loss": 0.4731, - "step": 48182 - }, - { - "epoch": 1.23, - "learning_rate": 1.3285136767122316e-06, - "loss": 0.5879, - "step": 48183 - }, - { - "epoch": 1.23, - "learning_rate": 1.3284875418645298e-06, - "loss": 0.6123, - "step": 48184 - }, - { - "epoch": 1.24, - "learning_rate": 1.3284614067653204e-06, - "loss": 0.4252, - "step": 48185 - }, - { - "epoch": 1.24, - "learning_rate": 1.328435271414623e-06, - "loss": 0.6641, - "step": 48186 - }, - { - "epoch": 1.24, - "learning_rate": 1.328409135812458e-06, - "loss": 0.6045, - "step": 48187 - }, - { - "epoch": 1.24, - "learning_rate": 1.328382999958845e-06, - "loss": 0.4954, - "step": 48188 - }, - { - "epoch": 1.24, - "learning_rate": 1.3283568638538045e-06, - "loss": 0.5015, - "step": 48189 - }, - { - "epoch": 1.24, - "learning_rate": 1.3283307274973564e-06, - "loss": 0.5273, - "step": 48190 - }, - { - "epoch": 1.24, - "learning_rate": 1.32830459088952e-06, - "loss": 0.6113, - "step": 48191 - }, - { - "epoch": 1.24, - "learning_rate": 1.3282784540303162e-06, - "loss": 0.7637, - "step": 48192 - }, - { - "epoch": 1.24, - "learning_rate": 1.3282523169197646e-06, - "loss": 0.6875, - "step": 48193 - }, - { - "epoch": 1.24, - "learning_rate": 1.3282261795578858e-06, - "loss": 0.6436, - "step": 48194 - }, - { - "epoch": 1.24, - "learning_rate": 1.3282000419446987e-06, - "loss": 0.7827, - "step": 48195 - }, - { - "epoch": 1.24, - "learning_rate": 1.328173904080224e-06, - "loss": 0.5181, - "step": 48196 - }, - { - "epoch": 1.24, - "learning_rate": 1.3281477659644815e-06, - "loss": 0.8447, - "step": 48197 - }, - { - "epoch": 1.24, - "learning_rate": 1.3281216275974916e-06, - "loss": 0.7158, - "step": 48198 - }, - { - "epoch": 1.24, - "learning_rate": 1.3280954889792743e-06, - "loss": 0.4353, - "step": 48199 - }, - { - "epoch": 1.24, - "learning_rate": 1.328069350109849e-06, - "loss": 0.6104, - "step": 48200 - }, - { - "epoch": 1.24, - "learning_rate": 1.328043210989236e-06, - "loss": 0.6245, - "step": 48201 - }, - { - "epoch": 1.24, - "learning_rate": 1.3280170716174557e-06, - "loss": 0.7559, - "step": 48202 - }, - { - "epoch": 1.24, - "learning_rate": 1.3279909319945275e-06, - "loss": 0.626, - "step": 48203 - }, - { - "epoch": 1.24, - "learning_rate": 1.3279647921204722e-06, - "loss": 0.5037, - "step": 48204 - }, - { - "epoch": 1.24, - "learning_rate": 1.3279386519953088e-06, - "loss": 0.7402, - "step": 48205 - }, - { - "epoch": 1.24, - "learning_rate": 1.3279125116190583e-06, - "loss": 0.7773, - "step": 48206 - }, - { - "epoch": 1.24, - "learning_rate": 1.3278863709917398e-06, - "loss": 0.6421, - "step": 48207 - }, - { - "epoch": 1.24, - "learning_rate": 1.327860230113374e-06, - "loss": 0.6489, - "step": 48208 - }, - { - "epoch": 1.24, - "learning_rate": 1.327834088983981e-06, - "loss": 0.441, - "step": 48209 - }, - { - "epoch": 1.24, - "learning_rate": 1.32780794760358e-06, - "loss": 0.6885, - "step": 48210 - }, - { - "epoch": 1.24, - "learning_rate": 1.327781805972192e-06, - "loss": 0.5615, - "step": 48211 - }, - { - "epoch": 1.24, - "learning_rate": 1.3277556640898362e-06, - "loss": 0.5322, - "step": 48212 - }, - { - "epoch": 1.24, - "learning_rate": 1.327729521956533e-06, - "loss": 0.5513, - "step": 48213 - }, - { - "epoch": 1.24, - "learning_rate": 1.3277033795723026e-06, - "loss": 0.6296, - "step": 48214 - }, - { - "epoch": 1.24, - "learning_rate": 1.3276772369371647e-06, - "loss": 0.6758, - "step": 48215 - }, - { - "epoch": 1.24, - "learning_rate": 1.3276510940511392e-06, - "loss": 0.7109, - "step": 48216 - }, - { - "epoch": 1.24, - "learning_rate": 1.3276249509142466e-06, - "loss": 0.7412, - "step": 48217 - }, - { - "epoch": 1.24, - "learning_rate": 1.3275988075265064e-06, - "loss": 0.6582, - "step": 48218 - }, - { - "epoch": 1.24, - "learning_rate": 1.3275726638879392e-06, - "loss": 0.5535, - "step": 48219 - }, - { - "epoch": 1.24, - "learning_rate": 1.3275465199985643e-06, - "loss": 0.7275, - "step": 48220 - }, - { - "epoch": 1.24, - "learning_rate": 1.3275203758584024e-06, - "loss": 0.7178, - "step": 48221 - }, - { - "epoch": 1.24, - "learning_rate": 1.327494231467473e-06, - "loss": 0.5657, - "step": 48222 - }, - { - "epoch": 1.24, - "learning_rate": 1.3274680868257962e-06, - "loss": 0.7383, - "step": 48223 - }, - { - "epoch": 1.24, - "learning_rate": 1.3274419419333924e-06, - "loss": 0.7268, - "step": 48224 - }, - { - "epoch": 1.24, - "learning_rate": 1.3274157967902812e-06, - "loss": 0.543, - "step": 48225 - }, - { - "epoch": 1.24, - "learning_rate": 1.3273896513964828e-06, - "loss": 0.6401, - "step": 48226 - }, - { - "epoch": 1.24, - "learning_rate": 1.3273635057520173e-06, - "loss": 0.6821, - "step": 48227 - }, - { - "epoch": 1.24, - "learning_rate": 1.3273373598569043e-06, - "loss": 0.8086, - "step": 48228 - }, - { - "epoch": 1.24, - "learning_rate": 1.3273112137111645e-06, - "loss": 0.481, - "step": 48229 - }, - { - "epoch": 1.24, - "learning_rate": 1.3272850673148177e-06, - "loss": 0.6294, - "step": 48230 - }, - { - "epoch": 1.24, - "learning_rate": 1.3272589206678832e-06, - "loss": 0.7085, - "step": 48231 - }, - { - "epoch": 1.24, - "learning_rate": 1.3272327737703821e-06, - "loss": 0.8604, - "step": 48232 - }, - { - "epoch": 1.24, - "learning_rate": 1.3272066266223338e-06, - "loss": 0.5605, - "step": 48233 - }, - { - "epoch": 1.24, - "learning_rate": 1.3271804792237584e-06, - "loss": 0.627, - "step": 48234 - }, - { - "epoch": 1.24, - "learning_rate": 1.3271543315746759e-06, - "loss": 0.5566, - "step": 48235 - }, - { - "epoch": 1.24, - "learning_rate": 1.3271281836751062e-06, - "loss": 0.606, - "step": 48236 - }, - { - "epoch": 1.24, - "learning_rate": 1.3271020355250696e-06, - "loss": 0.5962, - "step": 48237 - }, - { - "epoch": 1.24, - "learning_rate": 1.3270758871245861e-06, - "loss": 0.6948, - "step": 48238 - }, - { - "epoch": 1.24, - "learning_rate": 1.3270497384736758e-06, - "loss": 0.6426, - "step": 48239 - }, - { - "epoch": 1.24, - "learning_rate": 1.3270235895723585e-06, - "loss": 0.6011, - "step": 48240 - }, - { - "epoch": 1.24, - "learning_rate": 1.3269974404206541e-06, - "loss": 0.6484, - "step": 48241 - }, - { - "epoch": 1.24, - "learning_rate": 1.326971291018583e-06, - "loss": 0.7314, - "step": 48242 - }, - { - "epoch": 1.24, - "learning_rate": 1.3269451413661646e-06, - "loss": 0.5327, - "step": 48243 - }, - { - "epoch": 1.24, - "learning_rate": 1.3269189914634197e-06, - "loss": 0.5972, - "step": 48244 - }, - { - "epoch": 1.24, - "learning_rate": 1.326892841310368e-06, - "loss": 0.6768, - "step": 48245 - }, - { - "epoch": 1.24, - "learning_rate": 1.3268666909070292e-06, - "loss": 0.5625, - "step": 48246 - }, - { - "epoch": 1.24, - "learning_rate": 1.3268405402534236e-06, - "loss": 0.561, - "step": 48247 - }, - { - "epoch": 1.24, - "learning_rate": 1.3268143893495713e-06, - "loss": 0.6328, - "step": 48248 - }, - { - "epoch": 1.24, - "learning_rate": 1.3267882381954927e-06, - "loss": 0.7422, - "step": 48249 - }, - { - "epoch": 1.24, - "learning_rate": 1.326762086791207e-06, - "loss": 0.4951, - "step": 48250 - }, - { - "epoch": 1.24, - "learning_rate": 1.3267359351367344e-06, - "loss": 0.5393, - "step": 48251 - }, - { - "epoch": 1.24, - "learning_rate": 1.3267097832320952e-06, - "loss": 0.4546, - "step": 48252 - }, - { - "epoch": 1.24, - "learning_rate": 1.3266836310773095e-06, - "loss": 0.7686, - "step": 48253 - }, - { - "epoch": 1.24, - "learning_rate": 1.3266574786723973e-06, - "loss": 0.3999, - "step": 48254 - }, - { - "epoch": 1.24, - "learning_rate": 1.3266313260173782e-06, - "loss": 0.665, - "step": 48255 - }, - { - "epoch": 1.24, - "learning_rate": 1.3266051731122725e-06, - "loss": 0.6357, - "step": 48256 - }, - { - "epoch": 1.24, - "learning_rate": 1.3265790199571006e-06, - "loss": 0.6616, - "step": 48257 - }, - { - "epoch": 1.24, - "learning_rate": 1.3265528665518816e-06, - "loss": 0.8867, - "step": 48258 - }, - { - "epoch": 1.24, - "learning_rate": 1.3265267128966367e-06, - "loss": 0.4722, - "step": 48259 - }, - { - "epoch": 1.24, - "learning_rate": 1.326500558991385e-06, - "loss": 0.5122, - "step": 48260 - }, - { - "epoch": 1.24, - "learning_rate": 1.3264744048361467e-06, - "loss": 0.7158, - "step": 48261 - }, - { - "epoch": 1.24, - "learning_rate": 1.326448250430942e-06, - "loss": 0.6514, - "step": 48262 - }, - { - "epoch": 1.24, - "learning_rate": 1.326422095775791e-06, - "loss": 0.6484, - "step": 48263 - }, - { - "epoch": 1.24, - "learning_rate": 1.3263959408707137e-06, - "loss": 0.5796, - "step": 48264 - }, - { - "epoch": 1.24, - "learning_rate": 1.32636978571573e-06, - "loss": 0.6221, - "step": 48265 - }, - { - "epoch": 1.24, - "learning_rate": 1.32634363031086e-06, - "loss": 0.5092, - "step": 48266 - }, - { - "epoch": 1.24, - "learning_rate": 1.3263174746561233e-06, - "loss": 0.592, - "step": 48267 - }, - { - "epoch": 1.24, - "learning_rate": 1.3262913187515405e-06, - "loss": 0.8154, - "step": 48268 - }, - { - "epoch": 1.24, - "learning_rate": 1.326265162597132e-06, - "loss": 0.6426, - "step": 48269 - }, - { - "epoch": 1.24, - "learning_rate": 1.3262390061929166e-06, - "loss": 0.5088, - "step": 48270 - }, - { - "epoch": 1.24, - "learning_rate": 1.3262128495389154e-06, - "loss": 0.7793, - "step": 48271 - }, - { - "epoch": 1.24, - "learning_rate": 1.3261866926351476e-06, - "loss": 0.7681, - "step": 48272 - }, - { - "epoch": 1.24, - "learning_rate": 1.326160535481634e-06, - "loss": 0.7529, - "step": 48273 - }, - { - "epoch": 1.24, - "learning_rate": 1.326134378078394e-06, - "loss": 0.5874, - "step": 48274 - }, - { - "epoch": 1.24, - "learning_rate": 1.3261082204254482e-06, - "loss": 0.6489, - "step": 48275 - }, - { - "epoch": 1.24, - "learning_rate": 1.326082062522816e-06, - "loss": 0.8223, - "step": 48276 - }, - { - "epoch": 1.24, - "learning_rate": 1.3260559043705183e-06, - "loss": 0.7295, - "step": 48277 - }, - { - "epoch": 1.24, - "learning_rate": 1.3260297459685738e-06, - "loss": 0.6953, - "step": 48278 - }, - { - "epoch": 1.24, - "learning_rate": 1.3260035873170039e-06, - "loss": 0.7393, - "step": 48279 - }, - { - "epoch": 1.24, - "learning_rate": 1.325977428415828e-06, - "loss": 0.7432, - "step": 48280 - }, - { - "epoch": 1.24, - "learning_rate": 1.3259512692650659e-06, - "loss": 0.6699, - "step": 48281 - }, - { - "epoch": 1.24, - "learning_rate": 1.3259251098647378e-06, - "loss": 0.6992, - "step": 48282 - }, - { - "epoch": 1.24, - "learning_rate": 1.3258989502148642e-06, - "loss": 0.6611, - "step": 48283 - }, - { - "epoch": 1.24, - "learning_rate": 1.325872790315465e-06, - "loss": 0.6631, - "step": 48284 - }, - { - "epoch": 1.24, - "learning_rate": 1.3258466301665593e-06, - "loss": 0.4667, - "step": 48285 - }, - { - "epoch": 1.24, - "learning_rate": 1.3258204697681684e-06, - "loss": 0.7104, - "step": 48286 - }, - { - "epoch": 1.24, - "learning_rate": 1.3257943091203112e-06, - "loss": 0.8486, - "step": 48287 - }, - { - "epoch": 1.24, - "learning_rate": 1.3257681482230087e-06, - "loss": 0.623, - "step": 48288 - }, - { - "epoch": 1.24, - "learning_rate": 1.3257419870762804e-06, - "loss": 0.4692, - "step": 48289 - }, - { - "epoch": 1.24, - "learning_rate": 1.3257158256801467e-06, - "loss": 0.7573, - "step": 48290 - }, - { - "epoch": 1.24, - "learning_rate": 1.325689664034627e-06, - "loss": 0.707, - "step": 48291 - }, - { - "epoch": 1.24, - "learning_rate": 1.3256635021397418e-06, - "loss": 0.6104, - "step": 48292 - }, - { - "epoch": 1.24, - "learning_rate": 1.3256373399955107e-06, - "loss": 0.5054, - "step": 48293 - }, - { - "epoch": 1.24, - "learning_rate": 1.3256111776019548e-06, - "loss": 0.5364, - "step": 48294 - }, - { - "epoch": 1.24, - "learning_rate": 1.3255850149590928e-06, - "loss": 0.4692, - "step": 48295 - }, - { - "epoch": 1.24, - "learning_rate": 1.3255588520669453e-06, - "loss": 0.6807, - "step": 48296 - }, - { - "epoch": 1.24, - "learning_rate": 1.3255326889255324e-06, - "loss": 0.6299, - "step": 48297 - }, - { - "epoch": 1.24, - "learning_rate": 1.3255065255348745e-06, - "loss": 0.8086, - "step": 48298 - }, - { - "epoch": 1.24, - "learning_rate": 1.325480361894991e-06, - "loss": 0.6675, - "step": 48299 - }, - { - "epoch": 1.24, - "learning_rate": 1.325454198005902e-06, - "loss": 0.5801, - "step": 48300 - }, - { - "epoch": 1.24, - "learning_rate": 1.325428033867628e-06, - "loss": 0.4958, - "step": 48301 - }, - { - "epoch": 1.24, - "learning_rate": 1.3254018694801882e-06, - "loss": 0.6426, - "step": 48302 - }, - { - "epoch": 1.24, - "learning_rate": 1.3253757048436035e-06, - "loss": 0.6621, - "step": 48303 - }, - { - "epoch": 1.24, - "learning_rate": 1.3253495399578937e-06, - "loss": 0.6367, - "step": 48304 - }, - { - "epoch": 1.24, - "learning_rate": 1.3253233748230788e-06, - "loss": 0.8623, - "step": 48305 - }, - { - "epoch": 1.24, - "learning_rate": 1.3252972094391783e-06, - "loss": 0.5547, - "step": 48306 - }, - { - "epoch": 1.24, - "learning_rate": 1.3252710438062129e-06, - "loss": 0.4512, - "step": 48307 - }, - { - "epoch": 1.24, - "learning_rate": 1.3252448779242026e-06, - "loss": 0.6621, - "step": 48308 - }, - { - "epoch": 1.24, - "learning_rate": 1.325218711793167e-06, - "loss": 0.6719, - "step": 48309 - }, - { - "epoch": 1.24, - "learning_rate": 1.3251925454131265e-06, - "loss": 0.5635, - "step": 48310 - }, - { - "epoch": 1.24, - "learning_rate": 1.325166378784101e-06, - "loss": 0.4644, - "step": 48311 - }, - { - "epoch": 1.24, - "learning_rate": 1.3251402119061104e-06, - "loss": 0.5212, - "step": 48312 - }, - { - "epoch": 1.24, - "learning_rate": 1.3251140447791754e-06, - "loss": 0.7178, - "step": 48313 - }, - { - "epoch": 1.24, - "learning_rate": 1.325087877403315e-06, - "loss": 0.6001, - "step": 48314 - }, - { - "epoch": 1.24, - "learning_rate": 1.3250617097785498e-06, - "loss": 0.5017, - "step": 48315 - }, - { - "epoch": 1.24, - "learning_rate": 1.3250355419049e-06, - "loss": 0.6875, - "step": 48316 - }, - { - "epoch": 1.24, - "learning_rate": 1.3250093737823853e-06, - "loss": 0.6992, - "step": 48317 - }, - { - "epoch": 1.24, - "learning_rate": 1.3249832054110259e-06, - "loss": 0.7754, - "step": 48318 - }, - { - "epoch": 1.24, - "learning_rate": 1.3249570367908419e-06, - "loss": 0.6719, - "step": 48319 - }, - { - "epoch": 1.24, - "learning_rate": 1.3249308679218531e-06, - "loss": 0.6343, - "step": 48320 - }, - { - "epoch": 1.24, - "learning_rate": 1.3249046988040796e-06, - "loss": 0.5771, - "step": 48321 - }, - { - "epoch": 1.24, - "learning_rate": 1.3248785294375418e-06, - "loss": 0.8311, - "step": 48322 - }, - { - "epoch": 1.24, - "learning_rate": 1.3248523598222592e-06, - "loss": 0.7983, - "step": 48323 - }, - { - "epoch": 1.24, - "learning_rate": 1.3248261899582522e-06, - "loss": 0.606, - "step": 48324 - }, - { - "epoch": 1.24, - "learning_rate": 1.3248000198455407e-06, - "loss": 0.7227, - "step": 48325 - }, - { - "epoch": 1.24, - "learning_rate": 1.3247738494841447e-06, - "loss": 0.6416, - "step": 48326 - }, - { - "epoch": 1.24, - "learning_rate": 1.3247476788740844e-06, - "loss": 0.7231, - "step": 48327 - }, - { - "epoch": 1.24, - "learning_rate": 1.3247215080153797e-06, - "loss": 0.6211, - "step": 48328 - }, - { - "epoch": 1.24, - "learning_rate": 1.3246953369080507e-06, - "loss": 0.4946, - "step": 48329 - }, - { - "epoch": 1.24, - "learning_rate": 1.3246691655521173e-06, - "loss": 0.5518, - "step": 48330 - }, - { - "epoch": 1.24, - "learning_rate": 1.3246429939475997e-06, - "loss": 0.708, - "step": 48331 - }, - { - "epoch": 1.24, - "learning_rate": 1.3246168220945179e-06, - "loss": 0.7256, - "step": 48332 - }, - { - "epoch": 1.24, - "learning_rate": 1.324590649992892e-06, - "loss": 0.3894, - "step": 48333 - }, - { - "epoch": 1.24, - "learning_rate": 1.3245644776427421e-06, - "loss": 0.5703, - "step": 48334 - }, - { - "epoch": 1.24, - "learning_rate": 1.3245383050440878e-06, - "loss": 0.5269, - "step": 48335 - }, - { - "epoch": 1.24, - "learning_rate": 1.3245121321969495e-06, - "loss": 0.5371, - "step": 48336 - }, - { - "epoch": 1.24, - "learning_rate": 1.324485959101347e-06, - "loss": 0.4856, - "step": 48337 - }, - { - "epoch": 1.24, - "learning_rate": 1.324459785757301e-06, - "loss": 0.708, - "step": 48338 - }, - { - "epoch": 1.24, - "learning_rate": 1.3244336121648306e-06, - "loss": 0.542, - "step": 48339 - }, - { - "epoch": 1.24, - "learning_rate": 1.3244074383239567e-06, - "loss": 0.7168, - "step": 48340 - }, - { - "epoch": 1.24, - "learning_rate": 1.3243812642346988e-06, - "loss": 0.6709, - "step": 48341 - }, - { - "epoch": 1.24, - "learning_rate": 1.324355089897077e-06, - "loss": 0.6382, - "step": 48342 - }, - { - "epoch": 1.24, - "learning_rate": 1.3243289153111115e-06, - "loss": 0.6455, - "step": 48343 - }, - { - "epoch": 1.24, - "learning_rate": 1.324302740476822e-06, - "loss": 0.6958, - "step": 48344 - }, - { - "epoch": 1.24, - "learning_rate": 1.3242765653942292e-06, - "loss": 0.4833, - "step": 48345 - }, - { - "epoch": 1.24, - "learning_rate": 1.3242503900633523e-06, - "loss": 0.666, - "step": 48346 - }, - { - "epoch": 1.24, - "learning_rate": 1.3242242144842122e-06, - "loss": 0.6011, - "step": 48347 - }, - { - "epoch": 1.24, - "learning_rate": 1.3241980386568284e-06, - "loss": 0.5591, - "step": 48348 - }, - { - "epoch": 1.24, - "learning_rate": 1.324171862581221e-06, - "loss": 0.606, - "step": 48349 - }, - { - "epoch": 1.24, - "learning_rate": 1.32414568625741e-06, - "loss": 0.6694, - "step": 48350 - }, - { - "epoch": 1.24, - "learning_rate": 1.3241195096854158e-06, - "loss": 0.6968, - "step": 48351 - }, - { - "epoch": 1.24, - "learning_rate": 1.3240933328652578e-06, - "loss": 0.5645, - "step": 48352 - }, - { - "epoch": 1.24, - "learning_rate": 1.3240671557969573e-06, - "loss": 0.4745, - "step": 48353 - }, - { - "epoch": 1.24, - "learning_rate": 1.3240409784805327e-06, - "loss": 0.6875, - "step": 48354 - }, - { - "epoch": 1.24, - "learning_rate": 1.324014800916005e-06, - "loss": 0.6455, - "step": 48355 - }, - { - "epoch": 1.24, - "learning_rate": 1.323988623103394e-06, - "loss": 0.4712, - "step": 48356 - }, - { - "epoch": 1.24, - "learning_rate": 1.32396244504272e-06, - "loss": 0.5073, - "step": 48357 - }, - { - "epoch": 1.24, - "learning_rate": 1.323936266734003e-06, - "loss": 0.7178, - "step": 48358 - }, - { - "epoch": 1.24, - "learning_rate": 1.3239100881772627e-06, - "loss": 0.7314, - "step": 48359 - }, - { - "epoch": 1.24, - "learning_rate": 1.323883909372519e-06, - "loss": 0.647, - "step": 48360 - }, - { - "epoch": 1.24, - "learning_rate": 1.323857730319793e-06, - "loss": 0.5396, - "step": 48361 - }, - { - "epoch": 1.24, - "learning_rate": 1.3238315510191033e-06, - "loss": 0.8525, - "step": 48362 - }, - { - "epoch": 1.24, - "learning_rate": 1.323805371470471e-06, - "loss": 0.472, - "step": 48363 - }, - { - "epoch": 1.24, - "learning_rate": 1.3237791916739159e-06, - "loss": 0.6597, - "step": 48364 - }, - { - "epoch": 1.24, - "learning_rate": 1.3237530116294578e-06, - "loss": 0.6396, - "step": 48365 - }, - { - "epoch": 1.24, - "learning_rate": 1.323726831337117e-06, - "loss": 0.7256, - "step": 48366 - }, - { - "epoch": 1.24, - "learning_rate": 1.3237006507969133e-06, - "loss": 0.5425, - "step": 48367 - }, - { - "epoch": 1.24, - "learning_rate": 1.3236744700088674e-06, - "loss": 0.7246, - "step": 48368 - }, - { - "epoch": 1.24, - "learning_rate": 1.3236482889729981e-06, - "loss": 0.5762, - "step": 48369 - }, - { - "epoch": 1.24, - "learning_rate": 1.3236221076893266e-06, - "loss": 0.6768, - "step": 48370 - }, - { - "epoch": 1.24, - "learning_rate": 1.3235959261578725e-06, - "loss": 0.5464, - "step": 48371 - }, - { - "epoch": 1.24, - "learning_rate": 1.3235697443786558e-06, - "loss": 0.5959, - "step": 48372 - }, - { - "epoch": 1.24, - "learning_rate": 1.3235435623516967e-06, - "loss": 0.7119, - "step": 48373 - }, - { - "epoch": 1.24, - "learning_rate": 1.3235173800770153e-06, - "loss": 0.479, - "step": 48374 - }, - { - "epoch": 1.24, - "learning_rate": 1.3234911975546313e-06, - "loss": 0.665, - "step": 48375 - }, - { - "epoch": 1.24, - "learning_rate": 1.323465014784565e-06, - "loss": 0.7578, - "step": 48376 - }, - { - "epoch": 1.24, - "learning_rate": 1.3234388317668361e-06, - "loss": 0.7017, - "step": 48377 - }, - { - "epoch": 1.24, - "learning_rate": 1.3234126485014656e-06, - "loss": 0.6294, - "step": 48378 - }, - { - "epoch": 1.24, - "learning_rate": 1.3233864649884728e-06, - "loss": 0.4189, - "step": 48379 - }, - { - "epoch": 1.24, - "learning_rate": 1.3233602812278774e-06, - "loss": 0.5696, - "step": 48380 - }, - { - "epoch": 1.24, - "learning_rate": 1.3233340972197002e-06, - "loss": 0.5552, - "step": 48381 - }, - { - "epoch": 1.24, - "learning_rate": 1.323307912963961e-06, - "loss": 0.6228, - "step": 48382 - }, - { - "epoch": 1.24, - "learning_rate": 1.3232817284606797e-06, - "loss": 0.7559, - "step": 48383 - }, - { - "epoch": 1.24, - "learning_rate": 1.3232555437098764e-06, - "loss": 0.7529, - "step": 48384 - }, - { - "epoch": 1.24, - "learning_rate": 1.3232293587115713e-06, - "loss": 0.7881, - "step": 48385 - }, - { - "epoch": 1.24, - "learning_rate": 1.3232031734657843e-06, - "loss": 0.7158, - "step": 48386 - }, - { - "epoch": 1.24, - "learning_rate": 1.3231769879725354e-06, - "loss": 0.6504, - "step": 48387 - }, - { - "epoch": 1.24, - "learning_rate": 1.323150802231845e-06, - "loss": 0.7197, - "step": 48388 - }, - { - "epoch": 1.24, - "learning_rate": 1.3231246162437327e-06, - "loss": 0.6021, - "step": 48389 - }, - { - "epoch": 1.24, - "learning_rate": 1.3230984300082187e-06, - "loss": 0.5129, - "step": 48390 - }, - { - "epoch": 1.24, - "learning_rate": 1.323072243525323e-06, - "loss": 0.6787, - "step": 48391 - }, - { - "epoch": 1.24, - "learning_rate": 1.3230460567950656e-06, - "loss": 0.6357, - "step": 48392 - }, - { - "epoch": 1.24, - "learning_rate": 1.3230198698174673e-06, - "loss": 0.6416, - "step": 48393 - }, - { - "epoch": 1.24, - "learning_rate": 1.3229936825925472e-06, - "loss": 0.5806, - "step": 48394 - }, - { - "epoch": 1.24, - "learning_rate": 1.3229674951203257e-06, - "loss": 0.7246, - "step": 48395 - }, - { - "epoch": 1.24, - "learning_rate": 1.3229413074008227e-06, - "loss": 0.6162, - "step": 48396 - }, - { - "epoch": 1.24, - "learning_rate": 1.3229151194340586e-06, - "loss": 0.6438, - "step": 48397 - }, - { - "epoch": 1.24, - "learning_rate": 1.3228889312200533e-06, - "loss": 0.6904, - "step": 48398 - }, - { - "epoch": 1.24, - "learning_rate": 1.3228627427588266e-06, - "loss": 0.6318, - "step": 48399 - }, - { - "epoch": 1.24, - "learning_rate": 1.3228365540503988e-06, - "loss": 0.5708, - "step": 48400 - }, - { - "epoch": 1.24, - "learning_rate": 1.3228103650947898e-06, - "loss": 0.5649, - "step": 48401 - }, - { - "epoch": 1.24, - "learning_rate": 1.3227841758920197e-06, - "loss": 0.7754, - "step": 48402 - }, - { - "epoch": 1.24, - "learning_rate": 1.322757986442109e-06, - "loss": 0.7695, - "step": 48403 - }, - { - "epoch": 1.24, - "learning_rate": 1.322731796745077e-06, - "loss": 0.5765, - "step": 48404 - }, - { - "epoch": 1.24, - "learning_rate": 1.3227056068009443e-06, - "loss": 0.5244, - "step": 48405 - }, - { - "epoch": 1.24, - "learning_rate": 1.3226794166097307e-06, - "loss": 0.6885, - "step": 48406 - }, - { - "epoch": 1.24, - "learning_rate": 1.322653226171456e-06, - "loss": 0.708, - "step": 48407 - }, - { - "epoch": 1.24, - "learning_rate": 1.322627035486141e-06, - "loss": 0.5552, - "step": 48408 - }, - { - "epoch": 1.24, - "learning_rate": 1.3226008445538051e-06, - "loss": 0.6787, - "step": 48409 - }, - { - "epoch": 1.24, - "learning_rate": 1.3225746533744685e-06, - "loss": 0.6504, - "step": 48410 - }, - { - "epoch": 1.24, - "learning_rate": 1.3225484619481513e-06, - "loss": 0.6533, - "step": 48411 - }, - { - "epoch": 1.24, - "learning_rate": 1.3225222702748738e-06, - "loss": 0.7085, - "step": 48412 - }, - { - "epoch": 1.24, - "learning_rate": 1.3224960783546557e-06, - "loss": 0.5872, - "step": 48413 - }, - { - "epoch": 1.24, - "learning_rate": 1.3224698861875175e-06, - "loss": 0.5591, - "step": 48414 - }, - { - "epoch": 1.24, - "learning_rate": 1.3224436937734783e-06, - "loss": 0.6484, - "step": 48415 - }, - { - "epoch": 1.24, - "learning_rate": 1.3224175011125593e-06, - "loss": 0.6035, - "step": 48416 - }, - { - "epoch": 1.24, - "learning_rate": 1.3223913082047798e-06, - "loss": 0.6768, - "step": 48417 - }, - { - "epoch": 1.24, - "learning_rate": 1.3223651150501605e-06, - "loss": 0.7158, - "step": 48418 - }, - { - "epoch": 1.24, - "learning_rate": 1.3223389216487204e-06, - "loss": 0.5535, - "step": 48419 - }, - { - "epoch": 1.24, - "learning_rate": 1.3223127280004807e-06, - "loss": 0.7656, - "step": 48420 - }, - { - "epoch": 1.24, - "learning_rate": 1.3222865341054606e-06, - "loss": 0.7832, - "step": 48421 - }, - { - "epoch": 1.24, - "learning_rate": 1.3222603399636807e-06, - "loss": 0.7324, - "step": 48422 - }, - { - "epoch": 1.24, - "learning_rate": 1.322234145575161e-06, - "loss": 0.5796, - "step": 48423 - }, - { - "epoch": 1.24, - "learning_rate": 1.3222079509399216e-06, - "loss": 0.6982, - "step": 48424 - }, - { - "epoch": 1.24, - "learning_rate": 1.3221817560579819e-06, - "loss": 0.7686, - "step": 48425 - }, - { - "epoch": 1.24, - "learning_rate": 1.3221555609293626e-06, - "loss": 0.5298, - "step": 48426 - }, - { - "epoch": 1.24, - "learning_rate": 1.3221293655540836e-06, - "loss": 0.6533, - "step": 48427 - }, - { - "epoch": 1.24, - "learning_rate": 1.322103169932165e-06, - "loss": 0.6548, - "step": 48428 - }, - { - "epoch": 1.24, - "learning_rate": 1.322076974063627e-06, - "loss": 0.6714, - "step": 48429 - }, - { - "epoch": 1.24, - "learning_rate": 1.3220507779484894e-06, - "loss": 0.5193, - "step": 48430 - }, - { - "epoch": 1.24, - "learning_rate": 1.3220245815867718e-06, - "loss": 0.6294, - "step": 48431 - }, - { - "epoch": 1.24, - "learning_rate": 1.3219983849784955e-06, - "loss": 0.6465, - "step": 48432 - }, - { - "epoch": 1.24, - "learning_rate": 1.3219721881236796e-06, - "loss": 0.6445, - "step": 48433 - }, - { - "epoch": 1.24, - "learning_rate": 1.321945991022344e-06, - "loss": 0.5669, - "step": 48434 - }, - { - "epoch": 1.24, - "learning_rate": 1.3219197936745096e-06, - "loss": 0.6187, - "step": 48435 - }, - { - "epoch": 1.24, - "learning_rate": 1.321893596080196e-06, - "loss": 0.6899, - "step": 48436 - }, - { - "epoch": 1.24, - "learning_rate": 1.3218673982394233e-06, - "loss": 0.5508, - "step": 48437 - }, - { - "epoch": 1.24, - "learning_rate": 1.3218412001522116e-06, - "loss": 0.6191, - "step": 48438 - }, - { - "epoch": 1.24, - "learning_rate": 1.3218150018185806e-06, - "loss": 0.835, - "step": 48439 - }, - { - "epoch": 1.24, - "learning_rate": 1.3217888032385507e-06, - "loss": 0.8096, - "step": 48440 - }, - { - "epoch": 1.24, - "learning_rate": 1.321762604412142e-06, - "loss": 0.5991, - "step": 48441 - }, - { - "epoch": 1.24, - "learning_rate": 1.3217364053393743e-06, - "loss": 0.5051, - "step": 48442 - }, - { - "epoch": 1.24, - "learning_rate": 1.3217102060202682e-06, - "loss": 0.4775, - "step": 48443 - }, - { - "epoch": 1.24, - "learning_rate": 1.3216840064548431e-06, - "loss": 0.9229, - "step": 48444 - }, - { - "epoch": 1.24, - "learning_rate": 1.3216578066431195e-06, - "loss": 0.7295, - "step": 48445 - }, - { - "epoch": 1.24, - "learning_rate": 1.321631606585117e-06, - "loss": 0.5776, - "step": 48446 - }, - { - "epoch": 1.24, - "learning_rate": 1.3216054062808563e-06, - "loss": 0.5718, - "step": 48447 - }, - { - "epoch": 1.24, - "learning_rate": 1.321579205730357e-06, - "loss": 0.7222, - "step": 48448 - }, - { - "epoch": 1.24, - "learning_rate": 1.3215530049336395e-06, - "loss": 0.3511, - "step": 48449 - }, - { - "epoch": 1.24, - "learning_rate": 1.3215268038907232e-06, - "loss": 0.5806, - "step": 48450 - }, - { - "epoch": 1.24, - "learning_rate": 1.3215006026016291e-06, - "loss": 0.5093, - "step": 48451 - }, - { - "epoch": 1.24, - "learning_rate": 1.3214744010663762e-06, - "loss": 0.4346, - "step": 48452 - }, - { - "epoch": 1.24, - "learning_rate": 1.3214481992849857e-06, - "loss": 0.5269, - "step": 48453 - }, - { - "epoch": 1.24, - "learning_rate": 1.3214219972574769e-06, - "loss": 0.6104, - "step": 48454 - }, - { - "epoch": 1.24, - "learning_rate": 1.3213957949838698e-06, - "loss": 0.6387, - "step": 48455 - }, - { - "epoch": 1.24, - "learning_rate": 1.321369592464185e-06, - "loss": 0.5781, - "step": 48456 - }, - { - "epoch": 1.24, - "learning_rate": 1.3213433896984425e-06, - "loss": 0.6064, - "step": 48457 - }, - { - "epoch": 1.24, - "learning_rate": 1.321317186686662e-06, - "loss": 0.7773, - "step": 48458 - }, - { - "epoch": 1.24, - "learning_rate": 1.3212909834288633e-06, - "loss": 0.7236, - "step": 48459 - }, - { - "epoch": 1.24, - "learning_rate": 1.3212647799250671e-06, - "loss": 0.6533, - "step": 48460 - }, - { - "epoch": 1.24, - "learning_rate": 1.3212385761752934e-06, - "loss": 0.5194, - "step": 48461 - }, - { - "epoch": 1.24, - "learning_rate": 1.3212123721795618e-06, - "loss": 0.7764, - "step": 48462 - }, - { - "epoch": 1.24, - "learning_rate": 1.3211861679378927e-06, - "loss": 0.5518, - "step": 48463 - }, - { - "epoch": 1.24, - "learning_rate": 1.3211599634503065e-06, - "loss": 0.7319, - "step": 48464 - }, - { - "epoch": 1.24, - "learning_rate": 1.3211337587168226e-06, - "loss": 0.605, - "step": 48465 - }, - { - "epoch": 1.24, - "learning_rate": 1.3211075537374613e-06, - "loss": 0.7793, - "step": 48466 - }, - { - "epoch": 1.24, - "learning_rate": 1.3210813485122428e-06, - "loss": 0.7124, - "step": 48467 - }, - { - "epoch": 1.24, - "learning_rate": 1.3210551430411871e-06, - "loss": 0.752, - "step": 48468 - }, - { - "epoch": 1.24, - "learning_rate": 1.3210289373243143e-06, - "loss": 0.7109, - "step": 48469 - }, - { - "epoch": 1.24, - "learning_rate": 1.3210027313616443e-06, - "loss": 0.7358, - "step": 48470 - }, - { - "epoch": 1.24, - "learning_rate": 1.320976525153197e-06, - "loss": 0.6245, - "step": 48471 - }, - { - "epoch": 1.24, - "learning_rate": 1.320950318698993e-06, - "loss": 0.6699, - "step": 48472 - }, - { - "epoch": 1.24, - "learning_rate": 1.3209241119990523e-06, - "loss": 0.5859, - "step": 48473 - }, - { - "epoch": 1.24, - "learning_rate": 1.3208979050533945e-06, - "loss": 0.7715, - "step": 48474 - }, - { - "epoch": 1.24, - "learning_rate": 1.32087169786204e-06, - "loss": 0.6274, - "step": 48475 - }, - { - "epoch": 1.24, - "learning_rate": 1.320845490425009e-06, - "loss": 0.6782, - "step": 48476 - }, - { - "epoch": 1.24, - "learning_rate": 1.3208192827423208e-06, - "loss": 0.7773, - "step": 48477 - }, - { - "epoch": 1.24, - "learning_rate": 1.3207930748139963e-06, - "loss": 0.3983, - "step": 48478 - }, - { - "epoch": 1.24, - "learning_rate": 1.3207668666400556e-06, - "loss": 0.6187, - "step": 48479 - }, - { - "epoch": 1.24, - "learning_rate": 1.320740658220518e-06, - "loss": 0.7334, - "step": 48480 - }, - { - "epoch": 1.24, - "learning_rate": 1.3207144495554045e-06, - "loss": 0.6699, - "step": 48481 - }, - { - "epoch": 1.24, - "learning_rate": 1.3206882406447342e-06, - "loss": 0.6353, - "step": 48482 - }, - { - "epoch": 1.24, - "learning_rate": 1.320662031488528e-06, - "loss": 0.7812, - "step": 48483 - }, - { - "epoch": 1.24, - "learning_rate": 1.3206358220868057e-06, - "loss": 0.6699, - "step": 48484 - }, - { - "epoch": 1.24, - "learning_rate": 1.320609612439587e-06, - "loss": 0.7051, - "step": 48485 - }, - { - "epoch": 1.24, - "learning_rate": 1.3205834025468924e-06, - "loss": 0.7754, - "step": 48486 - }, - { - "epoch": 1.24, - "learning_rate": 1.3205571924087417e-06, - "loss": 0.6523, - "step": 48487 - }, - { - "epoch": 1.24, - "learning_rate": 1.3205309820251552e-06, - "loss": 0.7627, - "step": 48488 - }, - { - "epoch": 1.24, - "learning_rate": 1.3205047713961532e-06, - "loss": 0.665, - "step": 48489 - }, - { - "epoch": 1.24, - "learning_rate": 1.320478560521755e-06, - "loss": 0.6338, - "step": 48490 - }, - { - "epoch": 1.24, - "learning_rate": 1.3204523494019812e-06, - "loss": 0.7061, - "step": 48491 - }, - { - "epoch": 1.24, - "learning_rate": 1.3204261380368515e-06, - "loss": 0.6719, - "step": 48492 - }, - { - "epoch": 1.24, - "learning_rate": 1.320399926426387e-06, - "loss": 0.8164, - "step": 48493 - }, - { - "epoch": 1.24, - "learning_rate": 1.3203737145706063e-06, - "loss": 0.7603, - "step": 48494 - }, - { - "epoch": 1.24, - "learning_rate": 1.3203475024695305e-06, - "loss": 0.709, - "step": 48495 - }, - { - "epoch": 1.24, - "learning_rate": 1.3203212901231792e-06, - "loss": 0.7051, - "step": 48496 - }, - { - "epoch": 1.24, - "learning_rate": 1.3202950775315726e-06, - "loss": 0.6372, - "step": 48497 - }, - { - "epoch": 1.24, - "learning_rate": 1.3202688646947311e-06, - "loss": 0.6895, - "step": 48498 - }, - { - "epoch": 1.24, - "learning_rate": 1.3202426516126739e-06, - "loss": 0.6855, - "step": 48499 - }, - { - "epoch": 1.24, - "learning_rate": 1.3202164382854221e-06, - "loss": 0.4741, - "step": 48500 - }, - { - "epoch": 1.24, - "learning_rate": 1.320190224712995e-06, - "loss": 0.7725, - "step": 48501 - }, - { - "epoch": 1.24, - "learning_rate": 1.3201640108954133e-06, - "loss": 0.6514, - "step": 48502 - }, - { - "epoch": 1.24, - "learning_rate": 1.3201377968326965e-06, - "loss": 0.6826, - "step": 48503 - }, - { - "epoch": 1.24, - "learning_rate": 1.320111582524865e-06, - "loss": 0.4556, - "step": 48504 - }, - { - "epoch": 1.24, - "learning_rate": 1.3200853679719388e-06, - "loss": 0.748, - "step": 48505 - }, - { - "epoch": 1.24, - "learning_rate": 1.3200591531739378e-06, - "loss": 0.5835, - "step": 48506 - }, - { - "epoch": 1.24, - "learning_rate": 1.3200329381308822e-06, - "loss": 0.793, - "step": 48507 - }, - { - "epoch": 1.24, - "learning_rate": 1.3200067228427924e-06, - "loss": 0.75, - "step": 48508 - }, - { - "epoch": 1.24, - "learning_rate": 1.319980507309688e-06, - "loss": 0.6953, - "step": 48509 - }, - { - "epoch": 1.24, - "learning_rate": 1.3199542915315892e-06, - "loss": 0.7119, - "step": 48510 - }, - { - "epoch": 1.24, - "learning_rate": 1.319928075508516e-06, - "loss": 0.7119, - "step": 48511 - }, - { - "epoch": 1.24, - "learning_rate": 1.3199018592404887e-06, - "loss": 0.7173, - "step": 48512 - }, - { - "epoch": 1.24, - "learning_rate": 1.3198756427275274e-06, - "loss": 0.7295, - "step": 48513 - }, - { - "epoch": 1.24, - "learning_rate": 1.319849425969652e-06, - "loss": 0.6816, - "step": 48514 - }, - { - "epoch": 1.24, - "learning_rate": 1.3198232089668824e-06, - "loss": 0.5649, - "step": 48515 - }, - { - "epoch": 1.24, - "learning_rate": 1.3197969917192388e-06, - "loss": 0.665, - "step": 48516 - }, - { - "epoch": 1.24, - "learning_rate": 1.3197707742267415e-06, - "loss": 0.7559, - "step": 48517 - }, - { - "epoch": 1.24, - "learning_rate": 1.3197445564894104e-06, - "loss": 0.6514, - "step": 48518 - }, - { - "epoch": 1.24, - "learning_rate": 1.3197183385072659e-06, - "loss": 0.7285, - "step": 48519 - }, - { - "epoch": 1.24, - "learning_rate": 1.3196921202803275e-06, - "loss": 0.6621, - "step": 48520 - }, - { - "epoch": 1.24, - "learning_rate": 1.3196659018086155e-06, - "loss": 0.5938, - "step": 48521 - }, - { - "epoch": 1.24, - "learning_rate": 1.31963968309215e-06, - "loss": 0.6553, - "step": 48522 - }, - { - "epoch": 1.24, - "learning_rate": 1.3196134641309513e-06, - "loss": 0.7207, - "step": 48523 - }, - { - "epoch": 1.24, - "learning_rate": 1.319587244925039e-06, - "loss": 0.5845, - "step": 48524 - }, - { - "epoch": 1.24, - "learning_rate": 1.3195610254744335e-06, - "loss": 0.5977, - "step": 48525 - }, - { - "epoch": 1.24, - "learning_rate": 1.3195348057791549e-06, - "loss": 0.6221, - "step": 48526 - }, - { - "epoch": 1.24, - "learning_rate": 1.3195085858392232e-06, - "loss": 0.4696, - "step": 48527 - }, - { - "epoch": 1.24, - "learning_rate": 1.3194823656546585e-06, - "loss": 0.4653, - "step": 48528 - }, - { - "epoch": 1.24, - "learning_rate": 1.3194561452254809e-06, - "loss": 0.5582, - "step": 48529 - }, - { - "epoch": 1.24, - "learning_rate": 1.3194299245517102e-06, - "loss": 0.7393, - "step": 48530 - }, - { - "epoch": 1.24, - "learning_rate": 1.319403703633367e-06, - "loss": 0.7998, - "step": 48531 - }, - { - "epoch": 1.24, - "learning_rate": 1.3193774824704703e-06, - "loss": 0.5552, - "step": 48532 - }, - { - "epoch": 1.24, - "learning_rate": 1.319351261063042e-06, - "loss": 0.7617, - "step": 48533 - }, - { - "epoch": 1.24, - "learning_rate": 1.3193250394111006e-06, - "loss": 0.6738, - "step": 48534 - }, - { - "epoch": 1.24, - "learning_rate": 1.3192988175146668e-06, - "loss": 0.7163, - "step": 48535 - }, - { - "epoch": 1.24, - "learning_rate": 1.3192725953737603e-06, - "loss": 0.5396, - "step": 48536 - }, - { - "epoch": 1.24, - "learning_rate": 1.3192463729884018e-06, - "loss": 0.6719, - "step": 48537 - }, - { - "epoch": 1.24, - "learning_rate": 1.319220150358611e-06, - "loss": 0.449, - "step": 48538 - }, - { - "epoch": 1.24, - "learning_rate": 1.3191939274844079e-06, - "loss": 0.6128, - "step": 48539 - }, - { - "epoch": 1.24, - "learning_rate": 1.3191677043658125e-06, - "loss": 0.7339, - "step": 48540 - }, - { - "epoch": 1.24, - "learning_rate": 1.3191414810028454e-06, - "loss": 0.6484, - "step": 48541 - }, - { - "epoch": 1.24, - "learning_rate": 1.3191152573955262e-06, - "loss": 0.6313, - "step": 48542 - }, - { - "epoch": 1.24, - "learning_rate": 1.3190890335438751e-06, - "loss": 0.8506, - "step": 48543 - }, - { - "epoch": 1.24, - "learning_rate": 1.3190628094479124e-06, - "loss": 0.6797, - "step": 48544 - }, - { - "epoch": 1.24, - "learning_rate": 1.3190365851076575e-06, - "loss": 0.5576, - "step": 48545 - }, - { - "epoch": 1.24, - "learning_rate": 1.3190103605231312e-06, - "loss": 0.7466, - "step": 48546 - }, - { - "epoch": 1.24, - "learning_rate": 1.3189841356943537e-06, - "loss": 0.7539, - "step": 48547 - }, - { - "epoch": 1.24, - "learning_rate": 1.3189579106213444e-06, - "loss": 0.8506, - "step": 48548 - }, - { - "epoch": 1.24, - "learning_rate": 1.3189316853041236e-06, - "loss": 0.6465, - "step": 48549 - }, - { - "epoch": 1.24, - "learning_rate": 1.3189054597427115e-06, - "loss": 0.6743, - "step": 48550 - }, - { - "epoch": 1.24, - "learning_rate": 1.3188792339371282e-06, - "loss": 0.5601, - "step": 48551 - }, - { - "epoch": 1.24, - "learning_rate": 1.318853007887394e-06, - "loss": 0.6748, - "step": 48552 - }, - { - "epoch": 1.24, - "learning_rate": 1.3188267815935283e-06, - "loss": 0.7344, - "step": 48553 - }, - { - "epoch": 1.24, - "learning_rate": 1.3188005550555518e-06, - "loss": 0.4763, - "step": 48554 - }, - { - "epoch": 1.24, - "learning_rate": 1.3187743282734843e-06, - "loss": 0.8262, - "step": 48555 - }, - { - "epoch": 1.24, - "learning_rate": 1.318748101247346e-06, - "loss": 0.7842, - "step": 48556 - }, - { - "epoch": 1.24, - "learning_rate": 1.318721873977157e-06, - "loss": 0.5503, - "step": 48557 - }, - { - "epoch": 1.24, - "learning_rate": 1.3186956464629372e-06, - "loss": 0.6436, - "step": 48558 - }, - { - "epoch": 1.24, - "learning_rate": 1.3186694187047068e-06, - "loss": 0.6377, - "step": 48559 - }, - { - "epoch": 1.24, - "learning_rate": 1.318643190702486e-06, - "loss": 0.5073, - "step": 48560 - }, - { - "epoch": 1.24, - "learning_rate": 1.3186169624562946e-06, - "loss": 0.7734, - "step": 48561 - }, - { - "epoch": 1.24, - "learning_rate": 1.318590733966153e-06, - "loss": 0.6025, - "step": 48562 - }, - { - "epoch": 1.24, - "learning_rate": 1.3185645052320812e-06, - "loss": 0.7598, - "step": 48563 - }, - { - "epoch": 1.24, - "learning_rate": 1.3185382762540988e-06, - "loss": 0.667, - "step": 48564 - }, - { - "epoch": 1.24, - "learning_rate": 1.3185120470322266e-06, - "loss": 0.7246, - "step": 48565 - }, - { - "epoch": 1.24, - "learning_rate": 1.3184858175664845e-06, - "loss": 0.5588, - "step": 48566 - }, - { - "epoch": 1.24, - "learning_rate": 1.318459587856892e-06, - "loss": 0.4885, - "step": 48567 - }, - { - "epoch": 1.24, - "learning_rate": 1.31843335790347e-06, - "loss": 0.7402, - "step": 48568 - }, - { - "epoch": 1.24, - "learning_rate": 1.3184071277062384e-06, - "loss": 0.5933, - "step": 48569 - }, - { - "epoch": 1.24, - "learning_rate": 1.3183808972652166e-06, - "loss": 0.5811, - "step": 48570 - }, - { - "epoch": 1.24, - "learning_rate": 1.3183546665804255e-06, - "loss": 0.6421, - "step": 48571 - }, - { - "epoch": 1.24, - "learning_rate": 1.3183284356518847e-06, - "loss": 0.5625, - "step": 48572 - }, - { - "epoch": 1.24, - "learning_rate": 1.3183022044796145e-06, - "loss": 0.7373, - "step": 48573 - }, - { - "epoch": 1.24, - "learning_rate": 1.318275973063635e-06, - "loss": 0.6772, - "step": 48574 - }, - { - "epoch": 1.25, - "learning_rate": 1.3182497414039664e-06, - "loss": 0.6758, - "step": 48575 - }, - { - "epoch": 1.25, - "learning_rate": 1.3182235095006282e-06, - "loss": 0.6113, - "step": 48576 - }, - { - "epoch": 1.25, - "learning_rate": 1.3181972773536412e-06, - "loss": 0.5178, - "step": 48577 - }, - { - "epoch": 1.25, - "learning_rate": 1.3181710449630251e-06, - "loss": 0.6729, - "step": 48578 - }, - { - "epoch": 1.25, - "learning_rate": 1.3181448123288003e-06, - "loss": 0.6973, - "step": 48579 - }, - { - "epoch": 1.25, - "learning_rate": 1.3181185794509858e-06, - "loss": 0.6128, - "step": 48580 - }, - { - "epoch": 1.25, - "learning_rate": 1.3180923463296035e-06, - "loss": 0.792, - "step": 48581 - }, - { - "epoch": 1.25, - "learning_rate": 1.3180661129646719e-06, - "loss": 0.6553, - "step": 48582 - }, - { - "epoch": 1.25, - "learning_rate": 1.3180398793562121e-06, - "loss": 0.6206, - "step": 48583 - }, - { - "epoch": 1.25, - "learning_rate": 1.3180136455042436e-06, - "loss": 0.6475, - "step": 48584 - }, - { - "epoch": 1.25, - "learning_rate": 1.3179874114087869e-06, - "loss": 0.6821, - "step": 48585 - }, - { - "epoch": 1.25, - "learning_rate": 1.3179611770698614e-06, - "loss": 0.7632, - "step": 48586 - }, - { - "epoch": 1.25, - "learning_rate": 1.317934942487488e-06, - "loss": 0.665, - "step": 48587 - }, - { - "epoch": 1.25, - "learning_rate": 1.3179087076616863e-06, - "loss": 0.6709, - "step": 48588 - }, - { - "epoch": 1.25, - "learning_rate": 1.3178824725924763e-06, - "loss": 0.5054, - "step": 48589 - }, - { - "epoch": 1.25, - "learning_rate": 1.3178562372798786e-06, - "loss": 0.6367, - "step": 48590 - }, - { - "epoch": 1.25, - "learning_rate": 1.317830001723913e-06, - "loss": 0.7012, - "step": 48591 - }, - { - "epoch": 1.25, - "learning_rate": 1.3178037659245997e-06, - "loss": 0.6904, - "step": 48592 - }, - { - "epoch": 1.25, - "learning_rate": 1.3177775298819587e-06, - "loss": 0.4622, - "step": 48593 - }, - { - "epoch": 1.25, - "learning_rate": 1.3177512935960098e-06, - "loss": 0.6406, - "step": 48594 - }, - { - "epoch": 1.25, - "learning_rate": 1.3177250570667734e-06, - "loss": 0.7959, - "step": 48595 - }, - { - "epoch": 1.25, - "learning_rate": 1.3176988202942695e-06, - "loss": 0.5688, - "step": 48596 - }, - { - "epoch": 1.25, - "learning_rate": 1.317672583278518e-06, - "loss": 0.6982, - "step": 48597 - }, - { - "epoch": 1.25, - "learning_rate": 1.3176463460195399e-06, - "loss": 0.6582, - "step": 48598 - }, - { - "epoch": 1.25, - "learning_rate": 1.317620108517354e-06, - "loss": 0.6162, - "step": 48599 - }, - { - "epoch": 1.25, - "learning_rate": 1.317593870771981e-06, - "loss": 0.7451, - "step": 48600 - }, - { - "epoch": 1.25, - "learning_rate": 1.317567632783441e-06, - "loss": 0.4327, - "step": 48601 - }, - { - "epoch": 1.25, - "learning_rate": 1.3175413945517546e-06, - "loss": 0.5898, - "step": 48602 - }, - { - "epoch": 1.25, - "learning_rate": 1.3175151560769409e-06, - "loss": 0.6484, - "step": 48603 - }, - { - "epoch": 1.25, - "learning_rate": 1.3174889173590206e-06, - "loss": 0.6724, - "step": 48604 - }, - { - "epoch": 1.25, - "learning_rate": 1.3174626783980134e-06, - "loss": 0.5508, - "step": 48605 - }, - { - "epoch": 1.25, - "learning_rate": 1.3174364391939399e-06, - "loss": 0.6621, - "step": 48606 - }, - { - "epoch": 1.25, - "learning_rate": 1.3174101997468198e-06, - "loss": 0.6738, - "step": 48607 - }, - { - "epoch": 1.25, - "learning_rate": 1.3173839600566732e-06, - "loss": 0.6406, - "step": 48608 - }, - { - "epoch": 1.25, - "learning_rate": 1.3173577201235205e-06, - "loss": 0.6895, - "step": 48609 - }, - { - "epoch": 1.25, - "learning_rate": 1.3173314799473814e-06, - "loss": 0.7354, - "step": 48610 - }, - { - "epoch": 1.25, - "learning_rate": 1.317305239528276e-06, - "loss": 0.5493, - "step": 48611 - }, - { - "epoch": 1.25, - "learning_rate": 1.317278998866225e-06, - "loss": 0.6299, - "step": 48612 - }, - { - "epoch": 1.25, - "learning_rate": 1.3172527579612478e-06, - "loss": 0.6724, - "step": 48613 - }, - { - "epoch": 1.25, - "learning_rate": 1.3172265168133648e-06, - "loss": 0.8135, - "step": 48614 - }, - { - "epoch": 1.25, - "learning_rate": 1.317200275422596e-06, - "loss": 0.5236, - "step": 48615 - }, - { - "epoch": 1.25, - "learning_rate": 1.3171740337889616e-06, - "loss": 0.5723, - "step": 48616 - }, - { - "epoch": 1.25, - "learning_rate": 1.3171477919124818e-06, - "loss": 0.6943, - "step": 48617 - }, - { - "epoch": 1.25, - "learning_rate": 1.3171215497931762e-06, - "loss": 0.509, - "step": 48618 - }, - { - "epoch": 1.25, - "learning_rate": 1.3170953074310655e-06, - "loss": 0.8379, - "step": 48619 - }, - { - "epoch": 1.25, - "learning_rate": 1.3170690648261693e-06, - "loss": 0.6867, - "step": 48620 - }, - { - "epoch": 1.25, - "learning_rate": 1.317042821978508e-06, - "loss": 0.418, - "step": 48621 - }, - { - "epoch": 1.25, - "learning_rate": 1.3170165788881016e-06, - "loss": 0.625, - "step": 48622 - }, - { - "epoch": 1.25, - "learning_rate": 1.31699033555497e-06, - "loss": 0.6073, - "step": 48623 - }, - { - "epoch": 1.25, - "learning_rate": 1.3169640919791336e-06, - "loss": 0.667, - "step": 48624 - }, - { - "epoch": 1.25, - "learning_rate": 1.3169378481606124e-06, - "loss": 0.5664, - "step": 48625 - }, - { - "epoch": 1.25, - "learning_rate": 1.3169116040994264e-06, - "loss": 0.6743, - "step": 48626 - }, - { - "epoch": 1.25, - "learning_rate": 1.316885359795596e-06, - "loss": 0.7402, - "step": 48627 - }, - { - "epoch": 1.25, - "learning_rate": 1.3168591152491406e-06, - "loss": 0.6836, - "step": 48628 - }, - { - "epoch": 1.25, - "learning_rate": 1.316832870460081e-06, - "loss": 0.8105, - "step": 48629 - }, - { - "epoch": 1.25, - "learning_rate": 1.3168066254284371e-06, - "loss": 0.2849, - "step": 48630 - }, - { - "epoch": 1.25, - "learning_rate": 1.316780380154229e-06, - "loss": 0.7207, - "step": 48631 - }, - { - "epoch": 1.25, - "learning_rate": 1.3167541346374767e-06, - "loss": 0.6943, - "step": 48632 - }, - { - "epoch": 1.25, - "learning_rate": 1.3167278888782e-06, - "loss": 0.6855, - "step": 48633 - }, - { - "epoch": 1.25, - "learning_rate": 1.3167016428764195e-06, - "loss": 0.6458, - "step": 48634 - }, - { - "epoch": 1.25, - "learning_rate": 1.316675396632155e-06, - "loss": 0.75, - "step": 48635 - }, - { - "epoch": 1.25, - "learning_rate": 1.3166491501454269e-06, - "loss": 0.5869, - "step": 48636 - }, - { - "epoch": 1.25, - "learning_rate": 1.3166229034162553e-06, - "loss": 0.7295, - "step": 48637 - }, - { - "epoch": 1.25, - "learning_rate": 1.3165966564446599e-06, - "loss": 0.6597, - "step": 48638 - }, - { - "epoch": 1.25, - "learning_rate": 1.3165704092306606e-06, - "loss": 0.7061, - "step": 48639 - }, - { - "epoch": 1.25, - "learning_rate": 1.3165441617742783e-06, - "loss": 0.5977, - "step": 48640 - }, - { - "epoch": 1.25, - "learning_rate": 1.3165179140755327e-06, - "loss": 0.6826, - "step": 48641 - }, - { - "epoch": 1.25, - "learning_rate": 1.316491666134444e-06, - "loss": 0.7402, - "step": 48642 - }, - { - "epoch": 1.25, - "learning_rate": 1.316465417951032e-06, - "loss": 0.752, - "step": 48643 - }, - { - "epoch": 1.25, - "learning_rate": 1.316439169525317e-06, - "loss": 0.4702, - "step": 48644 - }, - { - "epoch": 1.25, - "learning_rate": 1.316412920857319e-06, - "loss": 0.6562, - "step": 48645 - }, - { - "epoch": 1.25, - "learning_rate": 1.3163866719470583e-06, - "loss": 0.6357, - "step": 48646 - }, - { - "epoch": 1.25, - "learning_rate": 1.3163604227945548e-06, - "loss": 0.5603, - "step": 48647 - }, - { - "epoch": 1.25, - "learning_rate": 1.3163341733998288e-06, - "loss": 0.5505, - "step": 48648 - }, - { - "epoch": 1.25, - "learning_rate": 1.3163079237629e-06, - "loss": 0.5532, - "step": 48649 - }, - { - "epoch": 1.25, - "learning_rate": 1.316281673883789e-06, - "loss": 0.5981, - "step": 48650 - }, - { - "epoch": 1.25, - "learning_rate": 1.3162554237625153e-06, - "loss": 0.5757, - "step": 48651 - }, - { - "epoch": 1.25, - "learning_rate": 1.3162291733990997e-06, - "loss": 0.7031, - "step": 48652 - }, - { - "epoch": 1.25, - "learning_rate": 1.316202922793562e-06, - "loss": 0.7793, - "step": 48653 - }, - { - "epoch": 1.25, - "learning_rate": 1.316176671945922e-06, - "loss": 0.6963, - "step": 48654 - }, - { - "epoch": 1.25, - "learning_rate": 1.3161504208562005e-06, - "loss": 0.5942, - "step": 48655 - }, - { - "epoch": 1.25, - "learning_rate": 1.316124169524417e-06, - "loss": 0.585, - "step": 48656 - }, - { - "epoch": 1.25, - "learning_rate": 1.3160979179505918e-06, - "loss": 0.7568, - "step": 48657 - }, - { - "epoch": 1.25, - "learning_rate": 1.3160716661347446e-06, - "loss": 0.7559, - "step": 48658 - }, - { - "epoch": 1.25, - "learning_rate": 1.3160454140768962e-06, - "loss": 0.541, - "step": 48659 - }, - { - "epoch": 1.25, - "learning_rate": 1.3160191617770663e-06, - "loss": 0.5762, - "step": 48660 - }, - { - "epoch": 1.25, - "learning_rate": 1.3159929092352748e-06, - "loss": 0.7334, - "step": 48661 - }, - { - "epoch": 1.25, - "learning_rate": 1.3159666564515424e-06, - "loss": 0.7559, - "step": 48662 - }, - { - "epoch": 1.25, - "learning_rate": 1.3159404034258887e-06, - "loss": 0.5828, - "step": 48663 - }, - { - "epoch": 1.25, - "learning_rate": 1.315914150158334e-06, - "loss": 0.749, - "step": 48664 - }, - { - "epoch": 1.25, - "learning_rate": 1.3158878966488983e-06, - "loss": 0.7051, - "step": 48665 - }, - { - "epoch": 1.25, - "learning_rate": 1.3158616428976016e-06, - "loss": 0.6191, - "step": 48666 - }, - { - "epoch": 1.25, - "learning_rate": 1.3158353889044648e-06, - "loss": 0.7012, - "step": 48667 - }, - { - "epoch": 1.25, - "learning_rate": 1.3158091346695066e-06, - "loss": 0.7998, - "step": 48668 - }, - { - "epoch": 1.25, - "learning_rate": 1.3157828801927484e-06, - "loss": 0.4409, - "step": 48669 - }, - { - "epoch": 1.25, - "learning_rate": 1.3157566254742093e-06, - "loss": 0.6904, - "step": 48670 - }, - { - "epoch": 1.25, - "learning_rate": 1.3157303705139101e-06, - "loss": 0.4756, - "step": 48671 - }, - { - "epoch": 1.25, - "learning_rate": 1.315704115311871e-06, - "loss": 0.5881, - "step": 48672 - }, - { - "epoch": 1.25, - "learning_rate": 1.3156778598681116e-06, - "loss": 0.6328, - "step": 48673 - }, - { - "epoch": 1.25, - "learning_rate": 1.3156516041826518e-06, - "loss": 0.6182, - "step": 48674 - }, - { - "epoch": 1.25, - "learning_rate": 1.3156253482555124e-06, - "loss": 0.6152, - "step": 48675 - }, - { - "epoch": 1.25, - "learning_rate": 1.3155990920867131e-06, - "loss": 0.4816, - "step": 48676 - }, - { - "epoch": 1.25, - "learning_rate": 1.315572835676274e-06, - "loss": 0.6377, - "step": 48677 - }, - { - "epoch": 1.25, - "learning_rate": 1.3155465790242154e-06, - "loss": 0.5483, - "step": 48678 - }, - { - "epoch": 1.25, - "learning_rate": 1.3155203221305574e-06, - "loss": 0.7764, - "step": 48679 - }, - { - "epoch": 1.25, - "learning_rate": 1.3154940649953198e-06, - "loss": 0.7422, - "step": 48680 - }, - { - "epoch": 1.25, - "learning_rate": 1.315467807618523e-06, - "loss": 0.5481, - "step": 48681 - }, - { - "epoch": 1.25, - "learning_rate": 1.3154415500001873e-06, - "loss": 0.5801, - "step": 48682 - }, - { - "epoch": 1.25, - "learning_rate": 1.3154152921403321e-06, - "loss": 0.6335, - "step": 48683 - }, - { - "epoch": 1.25, - "learning_rate": 1.3153890340389779e-06, - "loss": 0.5703, - "step": 48684 - }, - { - "epoch": 1.25, - "learning_rate": 1.315362775696145e-06, - "loss": 0.4458, - "step": 48685 - }, - { - "epoch": 1.25, - "learning_rate": 1.3153365171118532e-06, - "loss": 0.7178, - "step": 48686 - }, - { - "epoch": 1.25, - "learning_rate": 1.315310258286123e-06, - "loss": 0.5352, - "step": 48687 - }, - { - "epoch": 1.25, - "learning_rate": 1.315283999218974e-06, - "loss": 0.6406, - "step": 48688 - }, - { - "epoch": 1.25, - "learning_rate": 1.3152577399104264e-06, - "loss": 0.5762, - "step": 48689 - }, - { - "epoch": 1.25, - "learning_rate": 1.3152314803605006e-06, - "loss": 0.6289, - "step": 48690 - }, - { - "epoch": 1.25, - "learning_rate": 1.3152052205692163e-06, - "loss": 0.5122, - "step": 48691 - }, - { - "epoch": 1.25, - "learning_rate": 1.3151789605365946e-06, - "loss": 0.7705, - "step": 48692 - }, - { - "epoch": 1.25, - "learning_rate": 1.3151527002626544e-06, - "loss": 0.7383, - "step": 48693 - }, - { - "epoch": 1.25, - "learning_rate": 1.315126439747416e-06, - "loss": 0.5715, - "step": 48694 - }, - { - "epoch": 1.25, - "learning_rate": 1.3151001789909e-06, - "loss": 0.8496, - "step": 48695 - }, - { - "epoch": 1.25, - "learning_rate": 1.3150739179931263e-06, - "loss": 0.4954, - "step": 48696 - }, - { - "epoch": 1.25, - "learning_rate": 1.3150476567541151e-06, - "loss": 0.623, - "step": 48697 - }, - { - "epoch": 1.25, - "learning_rate": 1.3150213952738863e-06, - "loss": 0.6206, - "step": 48698 - }, - { - "epoch": 1.25, - "learning_rate": 1.31499513355246e-06, - "loss": 0.5952, - "step": 48699 - }, - { - "epoch": 1.25, - "learning_rate": 1.3149688715898565e-06, - "loss": 0.6211, - "step": 48700 - }, - { - "epoch": 1.25, - "learning_rate": 1.3149426093860958e-06, - "loss": 0.6074, - "step": 48701 - }, - { - "epoch": 1.25, - "learning_rate": 1.3149163469411981e-06, - "loss": 0.566, - "step": 48702 - }, - { - "epoch": 1.25, - "learning_rate": 1.3148900842551834e-06, - "loss": 0.6865, - "step": 48703 - }, - { - "epoch": 1.25, - "learning_rate": 1.3148638213280716e-06, - "loss": 0.7217, - "step": 48704 - }, - { - "epoch": 1.25, - "learning_rate": 1.3148375581598834e-06, - "loss": 0.8154, - "step": 48705 - }, - { - "epoch": 1.25, - "learning_rate": 1.3148112947506383e-06, - "loss": 0.4521, - "step": 48706 - }, - { - "epoch": 1.25, - "learning_rate": 1.3147850311003572e-06, - "loss": 0.5483, - "step": 48707 - }, - { - "epoch": 1.25, - "learning_rate": 1.3147587672090593e-06, - "loss": 0.7236, - "step": 48708 - }, - { - "epoch": 1.25, - "learning_rate": 1.3147325030767648e-06, - "loss": 0.4595, - "step": 48709 - }, - { - "epoch": 1.25, - "learning_rate": 1.3147062387034944e-06, - "loss": 0.707, - "step": 48710 - }, - { - "epoch": 1.25, - "learning_rate": 1.3146799740892678e-06, - "loss": 0.6182, - "step": 48711 - }, - { - "epoch": 1.25, - "learning_rate": 1.3146537092341055e-06, - "loss": 0.5332, - "step": 48712 - }, - { - "epoch": 1.25, - "learning_rate": 1.3146274441380269e-06, - "loss": 0.603, - "step": 48713 - }, - { - "epoch": 1.25, - "learning_rate": 1.3146011788010527e-06, - "loss": 0.7656, - "step": 48714 - }, - { - "epoch": 1.25, - "learning_rate": 1.314574913223203e-06, - "loss": 0.645, - "step": 48715 - }, - { - "epoch": 1.25, - "learning_rate": 1.3145486474044972e-06, - "loss": 0.7871, - "step": 48716 - }, - { - "epoch": 1.25, - "learning_rate": 1.3145223813449568e-06, - "loss": 0.6416, - "step": 48717 - }, - { - "epoch": 1.25, - "learning_rate": 1.3144961150446006e-06, - "loss": 0.7178, - "step": 48718 - }, - { - "epoch": 1.25, - "learning_rate": 1.3144698485034492e-06, - "loss": 0.647, - "step": 48719 - }, - { - "epoch": 1.25, - "learning_rate": 1.3144435817215227e-06, - "loss": 0.5206, - "step": 48720 - }, - { - "epoch": 1.25, - "learning_rate": 1.3144173146988413e-06, - "loss": 0.5869, - "step": 48721 - }, - { - "epoch": 1.25, - "learning_rate": 1.314391047435425e-06, - "loss": 0.5557, - "step": 48722 - }, - { - "epoch": 1.25, - "learning_rate": 1.3143647799312938e-06, - "loss": 0.7041, - "step": 48723 - }, - { - "epoch": 1.25, - "learning_rate": 1.3143385121864682e-06, - "loss": 0.8066, - "step": 48724 - }, - { - "epoch": 1.25, - "learning_rate": 1.3143122442009677e-06, - "loss": 0.5337, - "step": 48725 - }, - { - "epoch": 1.25, - "learning_rate": 1.314285975974813e-06, - "loss": 0.5942, - "step": 48726 - }, - { - "epoch": 1.25, - "learning_rate": 1.314259707508024e-06, - "loss": 0.5349, - "step": 48727 - }, - { - "epoch": 1.25, - "learning_rate": 1.3142334388006208e-06, - "loss": 0.7188, - "step": 48728 - }, - { - "epoch": 1.25, - "learning_rate": 1.3142071698526233e-06, - "loss": 0.6406, - "step": 48729 - }, - { - "epoch": 1.25, - "learning_rate": 1.314180900664052e-06, - "loss": 0.4556, - "step": 48730 - }, - { - "epoch": 1.25, - "learning_rate": 1.3141546312349268e-06, - "loss": 0.6562, - "step": 48731 - }, - { - "epoch": 1.25, - "learning_rate": 1.314128361565268e-06, - "loss": 0.5859, - "step": 48732 - }, - { - "epoch": 1.25, - "learning_rate": 1.3141020916550954e-06, - "loss": 0.6519, - "step": 48733 - }, - { - "epoch": 1.25, - "learning_rate": 1.3140758215044292e-06, - "loss": 0.4675, - "step": 48734 - }, - { - "epoch": 1.25, - "learning_rate": 1.3140495511132895e-06, - "loss": 0.6611, - "step": 48735 - }, - { - "epoch": 1.25, - "learning_rate": 1.3140232804816966e-06, - "loss": 0.7217, - "step": 48736 - }, - { - "epoch": 1.25, - "learning_rate": 1.313997009609671e-06, - "loss": 0.6309, - "step": 48737 - }, - { - "epoch": 1.25, - "learning_rate": 1.3139707384972316e-06, - "loss": 0.6436, - "step": 48738 - }, - { - "epoch": 1.25, - "learning_rate": 1.3139444671443995e-06, - "loss": 0.7168, - "step": 48739 - }, - { - "epoch": 1.25, - "learning_rate": 1.3139181955511947e-06, - "loss": 0.6445, - "step": 48740 - }, - { - "epoch": 1.25, - "learning_rate": 1.3138919237176369e-06, - "loss": 0.5649, - "step": 48741 - }, - { - "epoch": 1.25, - "learning_rate": 1.3138656516437468e-06, - "loss": 0.6577, - "step": 48742 - }, - { - "epoch": 1.25, - "learning_rate": 1.313839379329544e-06, - "loss": 0.5864, - "step": 48743 - }, - { - "epoch": 1.25, - "learning_rate": 1.3138131067750486e-06, - "loss": 0.6743, - "step": 48744 - }, - { - "epoch": 1.25, - "learning_rate": 1.3137868339802814e-06, - "loss": 0.624, - "step": 48745 - }, - { - "epoch": 1.25, - "learning_rate": 1.313760560945262e-06, - "loss": 0.6025, - "step": 48746 - }, - { - "epoch": 1.25, - "learning_rate": 1.3137342876700105e-06, - "loss": 0.5688, - "step": 48747 - }, - { - "epoch": 1.25, - "learning_rate": 1.3137080141545467e-06, - "loss": 0.7949, - "step": 48748 - }, - { - "epoch": 1.25, - "learning_rate": 1.3136817403988916e-06, - "loss": 0.6445, - "step": 48749 - }, - { - "epoch": 1.25, - "learning_rate": 1.3136554664030643e-06, - "loss": 0.6323, - "step": 48750 - }, - { - "epoch": 1.25, - "learning_rate": 1.313629192167086e-06, - "loss": 0.6553, - "step": 48751 - }, - { - "epoch": 1.25, - "learning_rate": 1.313602917690976e-06, - "loss": 0.5918, - "step": 48752 - }, - { - "epoch": 1.25, - "learning_rate": 1.3135766429747545e-06, - "loss": 0.5181, - "step": 48753 - }, - { - "epoch": 1.25, - "learning_rate": 1.3135503680184418e-06, - "loss": 0.6191, - "step": 48754 - }, - { - "epoch": 1.25, - "learning_rate": 1.3135240928220583e-06, - "loss": 0.6689, - "step": 48755 - }, - { - "epoch": 1.25, - "learning_rate": 1.3134978173856234e-06, - "loss": 0.5649, - "step": 48756 - }, - { - "epoch": 1.25, - "learning_rate": 1.3134715417091584e-06, - "loss": 0.6096, - "step": 48757 - }, - { - "epoch": 1.25, - "learning_rate": 1.313445265792682e-06, - "loss": 0.6558, - "step": 48758 - }, - { - "epoch": 1.25, - "learning_rate": 1.313418989636215e-06, - "loss": 0.7275, - "step": 48759 - }, - { - "epoch": 1.25, - "learning_rate": 1.3133927132397778e-06, - "loss": 0.521, - "step": 48760 - }, - { - "epoch": 1.25, - "learning_rate": 1.3133664366033899e-06, - "loss": 0.6743, - "step": 48761 - }, - { - "epoch": 1.25, - "learning_rate": 1.313340159727072e-06, - "loss": 0.7012, - "step": 48762 - }, - { - "epoch": 1.25, - "learning_rate": 1.313313882610844e-06, - "loss": 0.4312, - "step": 48763 - }, - { - "epoch": 1.25, - "learning_rate": 1.3132876052547253e-06, - "loss": 0.6758, - "step": 48764 - }, - { - "epoch": 1.25, - "learning_rate": 1.3132613276587373e-06, - "loss": 0.6343, - "step": 48765 - }, - { - "epoch": 1.25, - "learning_rate": 1.3132350498228992e-06, - "loss": 0.7705, - "step": 48766 - }, - { - "epoch": 1.25, - "learning_rate": 1.3132087717472319e-06, - "loss": 0.7695, - "step": 48767 - }, - { - "epoch": 1.25, - "learning_rate": 1.3131824934317546e-06, - "loss": 0.6309, - "step": 48768 - }, - { - "epoch": 1.25, - "learning_rate": 1.3131562148764878e-06, - "loss": 0.6191, - "step": 48769 - }, - { - "epoch": 1.25, - "learning_rate": 1.3131299360814519e-06, - "loss": 0.5728, - "step": 48770 - }, - { - "epoch": 1.25, - "learning_rate": 1.3131036570466666e-06, - "loss": 0.8135, - "step": 48771 - }, - { - "epoch": 1.25, - "learning_rate": 1.3130773777721529e-06, - "loss": 0.4854, - "step": 48772 - }, - { - "epoch": 1.25, - "learning_rate": 1.3130510982579294e-06, - "loss": 0.6865, - "step": 48773 - }, - { - "epoch": 1.25, - "learning_rate": 1.3130248185040176e-06, - "loss": 0.5771, - "step": 48774 - }, - { - "epoch": 1.25, - "learning_rate": 1.3129985385104368e-06, - "loss": 0.3909, - "step": 48775 - }, - { - "epoch": 1.25, - "learning_rate": 1.3129722582772075e-06, - "loss": 0.7451, - "step": 48776 - }, - { - "epoch": 1.25, - "learning_rate": 1.3129459778043499e-06, - "loss": 0.5083, - "step": 48777 - }, - { - "epoch": 1.25, - "learning_rate": 1.312919697091884e-06, - "loss": 0.7988, - "step": 48778 - }, - { - "epoch": 1.25, - "learning_rate": 1.3128934161398295e-06, - "loss": 0.7646, - "step": 48779 - }, - { - "epoch": 1.25, - "learning_rate": 1.312867134948207e-06, - "loss": 0.7568, - "step": 48780 - }, - { - "epoch": 1.25, - "learning_rate": 1.3128408535170366e-06, - "loss": 0.6484, - "step": 48781 - }, - { - "epoch": 1.25, - "learning_rate": 1.3128145718463386e-06, - "loss": 0.7324, - "step": 48782 - }, - { - "epoch": 1.25, - "learning_rate": 1.3127882899361325e-06, - "loss": 0.6455, - "step": 48783 - }, - { - "epoch": 1.25, - "learning_rate": 1.312762007786439e-06, - "loss": 0.6162, - "step": 48784 - }, - { - "epoch": 1.25, - "learning_rate": 1.3127357253972778e-06, - "loss": 0.7031, - "step": 48785 - }, - { - "epoch": 1.25, - "learning_rate": 1.3127094427686694e-06, - "loss": 0.6416, - "step": 48786 - }, - { - "epoch": 1.25, - "learning_rate": 1.3126831599006338e-06, - "loss": 0.6401, - "step": 48787 - }, - { - "epoch": 1.25, - "learning_rate": 1.3126568767931907e-06, - "loss": 0.6836, - "step": 48788 - }, - { - "epoch": 1.25, - "learning_rate": 1.312630593446361e-06, - "loss": 0.5884, - "step": 48789 - }, - { - "epoch": 1.25, - "learning_rate": 1.3126043098601645e-06, - "loss": 0.6934, - "step": 48790 - }, - { - "epoch": 1.25, - "learning_rate": 1.3125780260346208e-06, - "loss": 0.6758, - "step": 48791 - }, - { - "epoch": 1.25, - "learning_rate": 1.312551741969751e-06, - "loss": 0.6118, - "step": 48792 - }, - { - "epoch": 1.25, - "learning_rate": 1.3125254576655744e-06, - "loss": 0.6509, - "step": 48793 - }, - { - "epoch": 1.25, - "learning_rate": 1.3124991731221112e-06, - "loss": 0.7666, - "step": 48794 - }, - { - "epoch": 1.25, - "learning_rate": 1.3124728883393822e-06, - "loss": 0.5217, - "step": 48795 - }, - { - "epoch": 1.25, - "learning_rate": 1.3124466033174068e-06, - "loss": 0.5742, - "step": 48796 - }, - { - "epoch": 1.25, - "learning_rate": 1.3124203180562059e-06, - "loss": 0.6719, - "step": 48797 - }, - { - "epoch": 1.25, - "learning_rate": 1.3123940325557987e-06, - "loss": 0.4382, - "step": 48798 - }, - { - "epoch": 1.25, - "learning_rate": 1.3123677468162058e-06, - "loss": 0.604, - "step": 48799 - }, - { - "epoch": 1.25, - "learning_rate": 1.3123414608374472e-06, - "loss": 0.7275, - "step": 48800 - }, - { - "epoch": 1.25, - "learning_rate": 1.312315174619543e-06, - "loss": 0.4717, - "step": 48801 - }, - { - "epoch": 1.25, - "learning_rate": 1.312288888162514e-06, - "loss": 0.5552, - "step": 48802 - }, - { - "epoch": 1.25, - "learning_rate": 1.3122626014663794e-06, - "loss": 0.569, - "step": 48803 - }, - { - "epoch": 1.25, - "learning_rate": 1.3122363145311595e-06, - "loss": 0.6538, - "step": 48804 - }, - { - "epoch": 1.25, - "learning_rate": 1.3122100273568748e-06, - "loss": 0.6531, - "step": 48805 - }, - { - "epoch": 1.25, - "learning_rate": 1.312183739943545e-06, - "loss": 0.4962, - "step": 48806 - }, - { - "epoch": 1.25, - "learning_rate": 1.3121574522911906e-06, - "loss": 0.5679, - "step": 48807 - }, - { - "epoch": 1.25, - "learning_rate": 1.3121311643998318e-06, - "loss": 0.7812, - "step": 48808 - }, - { - "epoch": 1.25, - "learning_rate": 1.3121048762694886e-06, - "loss": 0.6592, - "step": 48809 - }, - { - "epoch": 1.25, - "learning_rate": 1.3120785879001805e-06, - "loss": 0.4205, - "step": 48810 - }, - { - "epoch": 1.25, - "learning_rate": 1.3120522992919288e-06, - "loss": 0.5941, - "step": 48811 - }, - { - "epoch": 1.25, - "learning_rate": 1.3120260104447527e-06, - "loss": 0.8066, - "step": 48812 - }, - { - "epoch": 1.25, - "learning_rate": 1.3119997213586723e-06, - "loss": 0.6104, - "step": 48813 - }, - { - "epoch": 1.25, - "learning_rate": 1.3119734320337088e-06, - "loss": 0.708, - "step": 48814 - }, - { - "epoch": 1.25, - "learning_rate": 1.311947142469881e-06, - "loss": 0.7139, - "step": 48815 - }, - { - "epoch": 1.25, - "learning_rate": 1.31192085266721e-06, - "loss": 0.439, - "step": 48816 - }, - { - "epoch": 1.25, - "learning_rate": 1.3118945626257154e-06, - "loss": 0.6299, - "step": 48817 - }, - { - "epoch": 1.25, - "learning_rate": 1.3118682723454173e-06, - "loss": 0.5156, - "step": 48818 - }, - { - "epoch": 1.25, - "learning_rate": 1.311841981826336e-06, - "loss": 0.6147, - "step": 48819 - }, - { - "epoch": 1.25, - "learning_rate": 1.3118156910684919e-06, - "loss": 0.5679, - "step": 48820 - }, - { - "epoch": 1.25, - "learning_rate": 1.3117894000719046e-06, - "loss": 0.5327, - "step": 48821 - }, - { - "epoch": 1.25, - "learning_rate": 1.3117631088365948e-06, - "loss": 0.6924, - "step": 48822 - }, - { - "epoch": 1.25, - "learning_rate": 1.311736817362582e-06, - "loss": 0.6167, - "step": 48823 - }, - { - "epoch": 1.25, - "learning_rate": 1.311710525649887e-06, - "loss": 0.7764, - "step": 48824 - }, - { - "epoch": 1.25, - "learning_rate": 1.3116842336985292e-06, - "loss": 0.6035, - "step": 48825 - }, - { - "epoch": 1.25, - "learning_rate": 1.3116579415085294e-06, - "loss": 0.7603, - "step": 48826 - }, - { - "epoch": 1.25, - "learning_rate": 1.3116316490799074e-06, - "loss": 0.5654, - "step": 48827 - }, - { - "epoch": 1.25, - "learning_rate": 1.3116053564126834e-06, - "loss": 0.7578, - "step": 48828 - }, - { - "epoch": 1.25, - "learning_rate": 1.3115790635068773e-06, - "loss": 0.5459, - "step": 48829 - }, - { - "epoch": 1.25, - "learning_rate": 1.3115527703625096e-06, - "loss": 0.6475, - "step": 48830 - }, - { - "epoch": 1.25, - "learning_rate": 1.3115264769796e-06, - "loss": 0.7725, - "step": 48831 - }, - { - "epoch": 1.25, - "learning_rate": 1.3115001833581691e-06, - "loss": 0.5991, - "step": 48832 - }, - { - "epoch": 1.25, - "learning_rate": 1.3114738894982372e-06, - "loss": 0.6924, - "step": 48833 - }, - { - "epoch": 1.25, - "learning_rate": 1.3114475953998235e-06, - "loss": 0.4938, - "step": 48834 - }, - { - "epoch": 1.25, - "learning_rate": 1.3114213010629489e-06, - "loss": 0.6279, - "step": 48835 - }, - { - "epoch": 1.25, - "learning_rate": 1.3113950064876336e-06, - "loss": 0.6509, - "step": 48836 - }, - { - "epoch": 1.25, - "learning_rate": 1.3113687116738972e-06, - "loss": 0.6357, - "step": 48837 - }, - { - "epoch": 1.25, - "learning_rate": 1.3113424166217598e-06, - "loss": 0.7148, - "step": 48838 - }, - { - "epoch": 1.25, - "learning_rate": 1.3113161213312424e-06, - "loss": 0.7188, - "step": 48839 - }, - { - "epoch": 1.25, - "learning_rate": 1.3112898258023641e-06, - "loss": 0.7163, - "step": 48840 - }, - { - "epoch": 1.25, - "learning_rate": 1.3112635300351458e-06, - "loss": 0.7065, - "step": 48841 - }, - { - "epoch": 1.25, - "learning_rate": 1.3112372340296072e-06, - "loss": 0.5742, - "step": 48842 - }, - { - "epoch": 1.25, - "learning_rate": 1.3112109377857688e-06, - "loss": 0.6538, - "step": 48843 - }, - { - "epoch": 1.25, - "learning_rate": 1.31118464130365e-06, - "loss": 0.8057, - "step": 48844 - }, - { - "epoch": 1.25, - "learning_rate": 1.3111583445832719e-06, - "loss": 0.6709, - "step": 48845 - }, - { - "epoch": 1.25, - "learning_rate": 1.3111320476246537e-06, - "loss": 0.8223, - "step": 48846 - }, - { - "epoch": 1.25, - "learning_rate": 1.3111057504278166e-06, - "loss": 0.5249, - "step": 48847 - }, - { - "epoch": 1.25, - "learning_rate": 1.3110794529927796e-06, - "loss": 0.6787, - "step": 48848 - }, - { - "epoch": 1.25, - "learning_rate": 1.3110531553195635e-06, - "loss": 0.7158, - "step": 48849 - }, - { - "epoch": 1.25, - "learning_rate": 1.3110268574081885e-06, - "loss": 0.5566, - "step": 48850 - }, - { - "epoch": 1.25, - "learning_rate": 1.3110005592586744e-06, - "loss": 0.6431, - "step": 48851 - }, - { - "epoch": 1.25, - "learning_rate": 1.3109742608710415e-06, - "loss": 0.6831, - "step": 48852 - }, - { - "epoch": 1.25, - "learning_rate": 1.31094796224531e-06, - "loss": 0.6777, - "step": 48853 - }, - { - "epoch": 1.25, - "learning_rate": 1.3109216633814998e-06, - "loss": 0.6357, - "step": 48854 - }, - { - "epoch": 1.25, - "learning_rate": 1.3108953642796311e-06, - "loss": 0.7837, - "step": 48855 - }, - { - "epoch": 1.25, - "learning_rate": 1.310869064939724e-06, - "loss": 0.5615, - "step": 48856 - }, - { - "epoch": 1.25, - "learning_rate": 1.3108427653617991e-06, - "loss": 0.8135, - "step": 48857 - }, - { - "epoch": 1.25, - "learning_rate": 1.3108164655458762e-06, - "loss": 0.7666, - "step": 48858 - }, - { - "epoch": 1.25, - "learning_rate": 1.3107901654919752e-06, - "loss": 0.6328, - "step": 48859 - }, - { - "epoch": 1.25, - "learning_rate": 1.3107638652001165e-06, - "loss": 0.7246, - "step": 48860 - }, - { - "epoch": 1.25, - "learning_rate": 1.31073756467032e-06, - "loss": 0.8008, - "step": 48861 - }, - { - "epoch": 1.25, - "learning_rate": 1.3107112639026069e-06, - "loss": 0.5371, - "step": 48862 - }, - { - "epoch": 1.25, - "learning_rate": 1.3106849628969953e-06, - "loss": 0.6846, - "step": 48863 - }, - { - "epoch": 1.25, - "learning_rate": 1.3106586616535072e-06, - "loss": 0.7051, - "step": 48864 - }, - { - "epoch": 1.25, - "learning_rate": 1.3106323601721618e-06, - "loss": 0.7529, - "step": 48865 - }, - { - "epoch": 1.25, - "learning_rate": 1.3106060584529796e-06, - "loss": 0.4922, - "step": 48866 - }, - { - "epoch": 1.25, - "learning_rate": 1.3105797564959808e-06, - "loss": 0.5425, - "step": 48867 - }, - { - "epoch": 1.25, - "learning_rate": 1.3105534543011851e-06, - "loss": 0.7764, - "step": 48868 - }, - { - "epoch": 1.25, - "learning_rate": 1.310527151868613e-06, - "loss": 0.7334, - "step": 48869 - }, - { - "epoch": 1.25, - "learning_rate": 1.3105008491982845e-06, - "loss": 0.5664, - "step": 48870 - }, - { - "epoch": 1.25, - "learning_rate": 1.3104745462902195e-06, - "loss": 0.6177, - "step": 48871 - }, - { - "epoch": 1.25, - "learning_rate": 1.3104482431444392e-06, - "loss": 0.6348, - "step": 48872 - }, - { - "epoch": 1.25, - "learning_rate": 1.3104219397609622e-06, - "loss": 0.749, - "step": 48873 - }, - { - "epoch": 1.25, - "learning_rate": 1.3103956361398098e-06, - "loss": 0.7295, - "step": 48874 - }, - { - "epoch": 1.25, - "learning_rate": 1.3103693322810014e-06, - "loss": 0.7295, - "step": 48875 - }, - { - "epoch": 1.25, - "learning_rate": 1.3103430281845577e-06, - "loss": 0.5049, - "step": 48876 - }, - { - "epoch": 1.25, - "learning_rate": 1.3103167238504986e-06, - "loss": 0.6689, - "step": 48877 - }, - { - "epoch": 1.25, - "learning_rate": 1.3102904192788441e-06, - "loss": 0.6606, - "step": 48878 - }, - { - "epoch": 1.25, - "learning_rate": 1.3102641144696148e-06, - "loss": 0.5693, - "step": 48879 - }, - { - "epoch": 1.25, - "learning_rate": 1.3102378094228304e-06, - "loss": 0.4746, - "step": 48880 - }, - { - "epoch": 1.25, - "learning_rate": 1.310211504138511e-06, - "loss": 0.708, - "step": 48881 - }, - { - "epoch": 1.25, - "learning_rate": 1.3101851986166769e-06, - "loss": 0.6738, - "step": 48882 - }, - { - "epoch": 1.25, - "learning_rate": 1.3101588928573487e-06, - "loss": 0.6279, - "step": 48883 - }, - { - "epoch": 1.25, - "learning_rate": 1.3101325868605457e-06, - "loss": 0.7695, - "step": 48884 - }, - { - "epoch": 1.25, - "learning_rate": 1.3101062806262886e-06, - "loss": 0.6719, - "step": 48885 - }, - { - "epoch": 1.25, - "learning_rate": 1.3100799741545972e-06, - "loss": 0.7852, - "step": 48886 - }, - { - "epoch": 1.25, - "learning_rate": 1.310053667445492e-06, - "loss": 0.6504, - "step": 48887 - }, - { - "epoch": 1.25, - "learning_rate": 1.310027360498993e-06, - "loss": 0.4548, - "step": 48888 - }, - { - "epoch": 1.25, - "learning_rate": 1.31000105331512e-06, - "loss": 0.5161, - "step": 48889 - }, - { - "epoch": 1.25, - "learning_rate": 1.3099747458938937e-06, - "loss": 0.5354, - "step": 48890 - }, - { - "epoch": 1.25, - "learning_rate": 1.309948438235334e-06, - "loss": 0.6553, - "step": 48891 - }, - { - "epoch": 1.25, - "learning_rate": 1.309922130339461e-06, - "loss": 0.5371, - "step": 48892 - }, - { - "epoch": 1.25, - "learning_rate": 1.3098958222062951e-06, - "loss": 0.7378, - "step": 48893 - }, - { - "epoch": 1.25, - "learning_rate": 1.3098695138358555e-06, - "loss": 0.834, - "step": 48894 - }, - { - "epoch": 1.25, - "learning_rate": 1.3098432052281638e-06, - "loss": 0.5231, - "step": 48895 - }, - { - "epoch": 1.25, - "learning_rate": 1.309816896383239e-06, - "loss": 0.6914, - "step": 48896 - }, - { - "epoch": 1.25, - "learning_rate": 1.309790587301102e-06, - "loss": 0.8125, - "step": 48897 - }, - { - "epoch": 1.25, - "learning_rate": 1.3097642779817722e-06, - "loss": 0.7559, - "step": 48898 - }, - { - "epoch": 1.25, - "learning_rate": 1.3097379684252703e-06, - "loss": 0.5884, - "step": 48899 - }, - { - "epoch": 1.25, - "learning_rate": 1.3097116586316165e-06, - "loss": 0.7168, - "step": 48900 - }, - { - "epoch": 1.25, - "learning_rate": 1.3096853486008303e-06, - "loss": 0.4878, - "step": 48901 - }, - { - "epoch": 1.25, - "learning_rate": 1.3096590383329326e-06, - "loss": 0.8184, - "step": 48902 - }, - { - "epoch": 1.25, - "learning_rate": 1.3096327278279429e-06, - "loss": 0.6145, - "step": 48903 - }, - { - "epoch": 1.25, - "learning_rate": 1.309606417085882e-06, - "loss": 0.6523, - "step": 48904 - }, - { - "epoch": 1.25, - "learning_rate": 1.3095801061067695e-06, - "loss": 1.0234, - "step": 48905 - }, - { - "epoch": 1.25, - "learning_rate": 1.309553794890626e-06, - "loss": 0.4172, - "step": 48906 - }, - { - "epoch": 1.25, - "learning_rate": 1.3095274834374709e-06, - "loss": 0.4716, - "step": 48907 - }, - { - "epoch": 1.25, - "learning_rate": 1.3095011717473251e-06, - "loss": 0.6279, - "step": 48908 - }, - { - "epoch": 1.25, - "learning_rate": 1.3094748598202086e-06, - "loss": 0.5059, - "step": 48909 - }, - { - "epoch": 1.25, - "learning_rate": 1.3094485476561415e-06, - "loss": 0.5952, - "step": 48910 - }, - { - "epoch": 1.25, - "learning_rate": 1.3094222352551439e-06, - "loss": 0.603, - "step": 48911 - }, - { - "epoch": 1.25, - "learning_rate": 1.3093959226172358e-06, - "loss": 0.4216, - "step": 48912 - }, - { - "epoch": 1.25, - "learning_rate": 1.3093696097424372e-06, - "loss": 0.7412, - "step": 48913 - }, - { - "epoch": 1.25, - "learning_rate": 1.3093432966307687e-06, - "loss": 0.6133, - "step": 48914 - }, - { - "epoch": 1.25, - "learning_rate": 1.3093169832822502e-06, - "loss": 0.5854, - "step": 48915 - }, - { - "epoch": 1.25, - "learning_rate": 1.3092906696969021e-06, - "loss": 0.6133, - "step": 48916 - }, - { - "epoch": 1.25, - "learning_rate": 1.3092643558747444e-06, - "loss": 0.5535, - "step": 48917 - }, - { - "epoch": 1.25, - "learning_rate": 1.309238041815797e-06, - "loss": 0.6333, - "step": 48918 - }, - { - "epoch": 1.25, - "learning_rate": 1.3092117275200803e-06, - "loss": 0.5234, - "step": 48919 - }, - { - "epoch": 1.25, - "learning_rate": 1.3091854129876143e-06, - "loss": 0.5669, - "step": 48920 - }, - { - "epoch": 1.25, - "learning_rate": 1.3091590982184195e-06, - "loss": 0.8091, - "step": 48921 - }, - { - "epoch": 1.25, - "learning_rate": 1.3091327832125154e-06, - "loss": 0.6824, - "step": 48922 - }, - { - "epoch": 1.25, - "learning_rate": 1.3091064679699228e-06, - "loss": 0.6514, - "step": 48923 - }, - { - "epoch": 1.25, - "learning_rate": 1.3090801524906617e-06, - "loss": 0.5774, - "step": 48924 - }, - { - "epoch": 1.25, - "learning_rate": 1.309053836774752e-06, - "loss": 0.6504, - "step": 48925 - }, - { - "epoch": 1.25, - "learning_rate": 1.3090275208222142e-06, - "loss": 0.6265, - "step": 48926 - }, - { - "epoch": 1.25, - "learning_rate": 1.309001204633068e-06, - "loss": 0.668, - "step": 48927 - }, - { - "epoch": 1.25, - "learning_rate": 1.3089748882073338e-06, - "loss": 0.6968, - "step": 48928 - }, - { - "epoch": 1.25, - "learning_rate": 1.3089485715450316e-06, - "loss": 0.6841, - "step": 48929 - }, - { - "epoch": 1.25, - "learning_rate": 1.3089222546461819e-06, - "loss": 0.7744, - "step": 48930 - }, - { - "epoch": 1.25, - "learning_rate": 1.3088959375108045e-06, - "loss": 0.5298, - "step": 48931 - }, - { - "epoch": 1.25, - "learning_rate": 1.3088696201389197e-06, - "loss": 0.6763, - "step": 48932 - }, - { - "epoch": 1.25, - "learning_rate": 1.3088433025305478e-06, - "loss": 0.8066, - "step": 48933 - }, - { - "epoch": 1.25, - "learning_rate": 1.3088169846857086e-06, - "loss": 0.6646, - "step": 48934 - }, - { - "epoch": 1.25, - "learning_rate": 1.3087906666044227e-06, - "loss": 0.6123, - "step": 48935 - }, - { - "epoch": 1.25, - "learning_rate": 1.30876434828671e-06, - "loss": 0.6851, - "step": 48936 - }, - { - "epoch": 1.25, - "learning_rate": 1.3087380297325904e-06, - "loss": 0.5574, - "step": 48937 - }, - { - "epoch": 1.25, - "learning_rate": 1.3087117109420842e-06, - "loss": 0.7646, - "step": 48938 - }, - { - "epoch": 1.25, - "learning_rate": 1.3086853919152118e-06, - "loss": 0.7598, - "step": 48939 - }, - { - "epoch": 1.25, - "learning_rate": 1.308659072651993e-06, - "loss": 0.708, - "step": 48940 - }, - { - "epoch": 1.25, - "learning_rate": 1.3086327531524483e-06, - "loss": 0.6299, - "step": 48941 - }, - { - "epoch": 1.25, - "learning_rate": 1.308606433416598e-06, - "loss": 0.5396, - "step": 48942 - }, - { - "epoch": 1.25, - "learning_rate": 1.3085801134444615e-06, - "loss": 0.6655, - "step": 48943 - }, - { - "epoch": 1.25, - "learning_rate": 1.3085537932360592e-06, - "loss": 0.7432, - "step": 48944 - }, - { - "epoch": 1.25, - "learning_rate": 1.3085274727914119e-06, - "loss": 0.6396, - "step": 48945 - }, - { - "epoch": 1.25, - "learning_rate": 1.3085011521105393e-06, - "loss": 0.9316, - "step": 48946 - }, - { - "epoch": 1.25, - "learning_rate": 1.3084748311934614e-06, - "loss": 0.5493, - "step": 48947 - }, - { - "epoch": 1.25, - "learning_rate": 1.3084485100401987e-06, - "loss": 0.5723, - "step": 48948 - }, - { - "epoch": 1.25, - "learning_rate": 1.3084221886507706e-06, - "loss": 0.5859, - "step": 48949 - }, - { - "epoch": 1.25, - "learning_rate": 1.3083958670251984e-06, - "loss": 0.7725, - "step": 48950 - }, - { - "epoch": 1.25, - "learning_rate": 1.3083695451635015e-06, - "loss": 0.7676, - "step": 48951 - }, - { - "epoch": 1.25, - "learning_rate": 1.3083432230657003e-06, - "loss": 0.6079, - "step": 48952 - }, - { - "epoch": 1.25, - "learning_rate": 1.3083169007318146e-06, - "loss": 0.6108, - "step": 48953 - }, - { - "epoch": 1.25, - "learning_rate": 1.3082905781618652e-06, - "loss": 0.5938, - "step": 48954 - }, - { - "epoch": 1.25, - "learning_rate": 1.3082642553558714e-06, - "loss": 0.6689, - "step": 48955 - }, - { - "epoch": 1.25, - "learning_rate": 1.3082379323138543e-06, - "loss": 0.7178, - "step": 48956 - }, - { - "epoch": 1.25, - "learning_rate": 1.3082116090358332e-06, - "loss": 0.5535, - "step": 48957 - }, - { - "epoch": 1.25, - "learning_rate": 1.3081852855218292e-06, - "loss": 0.7393, - "step": 48958 - }, - { - "epoch": 1.25, - "learning_rate": 1.3081589617718614e-06, - "loss": 0.5488, - "step": 48959 - }, - { - "epoch": 1.25, - "learning_rate": 1.3081326377859506e-06, - "loss": 0.7773, - "step": 48960 - }, - { - "epoch": 1.25, - "learning_rate": 1.308106313564117e-06, - "loss": 0.8652, - "step": 48961 - }, - { - "epoch": 1.25, - "learning_rate": 1.3080799891063803e-06, - "loss": 0.6367, - "step": 48962 - }, - { - "epoch": 1.25, - "learning_rate": 1.308053664412761e-06, - "loss": 0.5012, - "step": 48963 - }, - { - "epoch": 1.25, - "learning_rate": 1.308027339483279e-06, - "loss": 0.5879, - "step": 48964 - }, - { - "epoch": 1.25, - "learning_rate": 1.3080010143179547e-06, - "loss": 0.6699, - "step": 48965 - }, - { - "epoch": 1.26, - "learning_rate": 1.3079746889168082e-06, - "loss": 0.7275, - "step": 48966 - }, - { - "epoch": 1.26, - "learning_rate": 1.30794836327986e-06, - "loss": 0.8213, - "step": 48967 - }, - { - "epoch": 1.26, - "learning_rate": 1.3079220374071294e-06, - "loss": 0.5771, - "step": 48968 - }, - { - "epoch": 1.26, - "learning_rate": 1.3078957112986371e-06, - "loss": 0.6074, - "step": 48969 - }, - { - "epoch": 1.26, - "learning_rate": 1.3078693849544034e-06, - "loss": 0.5801, - "step": 48970 - }, - { - "epoch": 1.26, - "learning_rate": 1.3078430583744484e-06, - "loss": 0.6611, - "step": 48971 - }, - { - "epoch": 1.26, - "learning_rate": 1.3078167315587919e-06, - "loss": 0.4805, - "step": 48972 - }, - { - "epoch": 1.26, - "learning_rate": 1.3077904045074544e-06, - "loss": 0.7056, - "step": 48973 - }, - { - "epoch": 1.26, - "learning_rate": 1.3077640772204556e-06, - "loss": 0.5977, - "step": 48974 - }, - { - "epoch": 1.26, - "learning_rate": 1.3077377496978167e-06, - "loss": 0.626, - "step": 48975 - }, - { - "epoch": 1.26, - "learning_rate": 1.3077114219395565e-06, - "loss": 0.8574, - "step": 48976 - }, - { - "epoch": 1.26, - "learning_rate": 1.3076850939456962e-06, - "loss": 0.6274, - "step": 48977 - }, - { - "epoch": 1.26, - "learning_rate": 1.3076587657162553e-06, - "loss": 0.5859, - "step": 48978 - }, - { - "epoch": 1.26, - "learning_rate": 1.3076324372512543e-06, - "loss": 0.6489, - "step": 48979 - }, - { - "epoch": 1.26, - "learning_rate": 1.3076061085507132e-06, - "loss": 0.7207, - "step": 48980 - }, - { - "epoch": 1.26, - "learning_rate": 1.3075797796146529e-06, - "loss": 0.8145, - "step": 48981 - }, - { - "epoch": 1.26, - "learning_rate": 1.3075534504430921e-06, - "loss": 0.6826, - "step": 48982 - }, - { - "epoch": 1.26, - "learning_rate": 1.307527121036052e-06, - "loss": 1.043, - "step": 48983 - }, - { - "epoch": 1.26, - "learning_rate": 1.3075007913935525e-06, - "loss": 0.6035, - "step": 48984 - }, - { - "epoch": 1.26, - "learning_rate": 1.307474461515614e-06, - "loss": 0.8184, - "step": 48985 - }, - { - "epoch": 1.26, - "learning_rate": 1.3074481314022563e-06, - "loss": 0.7646, - "step": 48986 - }, - { - "epoch": 1.26, - "learning_rate": 1.3074218010534996e-06, - "loss": 0.5103, - "step": 48987 - }, - { - "epoch": 1.26, - "learning_rate": 1.3073954704693643e-06, - "loss": 0.7427, - "step": 48988 - }, - { - "epoch": 1.26, - "learning_rate": 1.3073691396498705e-06, - "loss": 0.6177, - "step": 48989 - }, - { - "epoch": 1.26, - "learning_rate": 1.307342808595038e-06, - "loss": 0.6494, - "step": 48990 - }, - { - "epoch": 1.26, - "learning_rate": 1.3073164773048875e-06, - "loss": 0.5024, - "step": 48991 - }, - { - "epoch": 1.26, - "learning_rate": 1.307290145779439e-06, - "loss": 0.5342, - "step": 48992 - }, - { - "epoch": 1.26, - "learning_rate": 1.3072638140187122e-06, - "loss": 0.6104, - "step": 48993 - }, - { - "epoch": 1.26, - "learning_rate": 1.307237482022728e-06, - "loss": 0.6836, - "step": 48994 - }, - { - "epoch": 1.26, - "learning_rate": 1.3072111497915058e-06, - "loss": 0.7197, - "step": 48995 - }, - { - "epoch": 1.26, - "learning_rate": 1.3071848173250665e-06, - "loss": 0.6338, - "step": 48996 - }, - { - "epoch": 1.26, - "learning_rate": 1.3071584846234295e-06, - "loss": 0.6104, - "step": 48997 - }, - { - "epoch": 1.26, - "learning_rate": 1.307132151686616e-06, - "loss": 0.6772, - "step": 48998 - }, - { - "epoch": 1.26, - "learning_rate": 1.3071058185146448e-06, - "loss": 0.7017, - "step": 48999 - }, - { - "epoch": 1.26, - "learning_rate": 1.3070794851075374e-06, - "loss": 0.7676, - "step": 49000 - }, - { - "epoch": 1.26, - "learning_rate": 1.307053151465313e-06, - "loss": 0.71, - "step": 49001 - }, - { - "epoch": 1.26, - "learning_rate": 1.3070268175879924e-06, - "loss": 0.6519, - "step": 49002 - }, - { - "epoch": 1.26, - "learning_rate": 1.3070004834755951e-06, - "loss": 0.6768, - "step": 49003 - }, - { - "epoch": 1.26, - "learning_rate": 1.306974149128142e-06, - "loss": 0.6416, - "step": 49004 - }, - { - "epoch": 1.26, - "learning_rate": 1.3069478145456526e-06, - "loss": 0.8984, - "step": 49005 - }, - { - "epoch": 1.26, - "learning_rate": 1.3069214797281479e-06, - "loss": 0.8594, - "step": 49006 - }, - { - "epoch": 1.26, - "learning_rate": 1.3068951446756472e-06, - "loss": 0.6182, - "step": 49007 - }, - { - "epoch": 1.26, - "learning_rate": 1.3068688093881708e-06, - "loss": 0.5327, - "step": 49008 - }, - { - "epoch": 1.26, - "learning_rate": 1.3068424738657392e-06, - "loss": 0.7373, - "step": 49009 - }, - { - "epoch": 1.26, - "learning_rate": 1.3068161381083726e-06, - "loss": 0.5738, - "step": 49010 - }, - { - "epoch": 1.26, - "learning_rate": 1.306789802116091e-06, - "loss": 0.6582, - "step": 49011 - }, - { - "epoch": 1.26, - "learning_rate": 1.3067634658889141e-06, - "loss": 0.7373, - "step": 49012 - }, - { - "epoch": 1.26, - "learning_rate": 1.306737129426863e-06, - "loss": 0.582, - "step": 49013 - }, - { - "epoch": 1.26, - "learning_rate": 1.306710792729957e-06, - "loss": 0.5459, - "step": 49014 - }, - { - "epoch": 1.26, - "learning_rate": 1.3066844557982171e-06, - "loss": 0.5178, - "step": 49015 - }, - { - "epoch": 1.26, - "learning_rate": 1.3066581186316628e-06, - "loss": 0.6152, - "step": 49016 - }, - { - "epoch": 1.26, - "learning_rate": 1.3066317812303145e-06, - "loss": 0.6255, - "step": 49017 - }, - { - "epoch": 1.26, - "learning_rate": 1.3066054435941922e-06, - "loss": 0.7412, - "step": 49018 - }, - { - "epoch": 1.26, - "learning_rate": 1.3065791057233164e-06, - "loss": 0.6006, - "step": 49019 - }, - { - "epoch": 1.26, - "learning_rate": 1.3065527676177068e-06, - "loss": 0.4966, - "step": 49020 - }, - { - "epoch": 1.26, - "learning_rate": 1.3065264292773844e-06, - "loss": 0.4592, - "step": 49021 - }, - { - "epoch": 1.26, - "learning_rate": 1.3065000907023682e-06, - "loss": 0.7002, - "step": 49022 - }, - { - "epoch": 1.26, - "learning_rate": 1.3064737518926794e-06, - "loss": 0.584, - "step": 49023 - }, - { - "epoch": 1.26, - "learning_rate": 1.3064474128483373e-06, - "loss": 0.5449, - "step": 49024 - }, - { - "epoch": 1.26, - "learning_rate": 1.3064210735693628e-06, - "loss": 0.5728, - "step": 49025 - }, - { - "epoch": 1.26, - "learning_rate": 1.306394734055776e-06, - "loss": 0.5132, - "step": 49026 - }, - { - "epoch": 1.26, - "learning_rate": 1.3063683943075964e-06, - "loss": 0.6143, - "step": 49027 - }, - { - "epoch": 1.26, - "learning_rate": 1.306342054324845e-06, - "loss": 0.6768, - "step": 49028 - }, - { - "epoch": 1.26, - "learning_rate": 1.3063157141075411e-06, - "loss": 0.6318, - "step": 49029 - }, - { - "epoch": 1.26, - "learning_rate": 1.3062893736557056e-06, - "loss": 0.623, - "step": 49030 - }, - { - "epoch": 1.26, - "learning_rate": 1.3062630329693585e-06, - "loss": 0.7168, - "step": 49031 - }, - { - "epoch": 1.26, - "learning_rate": 1.30623669204852e-06, - "loss": 0.7373, - "step": 49032 - }, - { - "epoch": 1.26, - "learning_rate": 1.30621035089321e-06, - "loss": 1.0176, - "step": 49033 - }, - { - "epoch": 1.26, - "learning_rate": 1.3061840095034484e-06, - "loss": 0.5513, - "step": 49034 - }, - { - "epoch": 1.26, - "learning_rate": 1.3061576678792564e-06, - "loss": 0.6089, - "step": 49035 - }, - { - "epoch": 1.26, - "learning_rate": 1.3061313260206532e-06, - "loss": 0.7139, - "step": 49036 - }, - { - "epoch": 1.26, - "learning_rate": 1.3061049839276593e-06, - "loss": 0.6541, - "step": 49037 - }, - { - "epoch": 1.26, - "learning_rate": 1.3060786416002952e-06, - "loss": 0.709, - "step": 49038 - }, - { - "epoch": 1.26, - "learning_rate": 1.3060522990385802e-06, - "loss": 0.6973, - "step": 49039 - }, - { - "epoch": 1.26, - "learning_rate": 1.3060259562425356e-06, - "loss": 0.7129, - "step": 49040 - }, - { - "epoch": 1.26, - "learning_rate": 1.305999613212181e-06, - "loss": 0.6406, - "step": 49041 - }, - { - "epoch": 1.26, - "learning_rate": 1.3059732699475361e-06, - "loss": 0.7021, - "step": 49042 - }, - { - "epoch": 1.26, - "learning_rate": 1.3059469264486217e-06, - "loss": 0.6536, - "step": 49043 - }, - { - "epoch": 1.26, - "learning_rate": 1.305920582715458e-06, - "loss": 0.4204, - "step": 49044 - }, - { - "epoch": 1.26, - "learning_rate": 1.3058942387480647e-06, - "loss": 0.5911, - "step": 49045 - }, - { - "epoch": 1.26, - "learning_rate": 1.3058678945464627e-06, - "loss": 0.7598, - "step": 49046 - }, - { - "epoch": 1.26, - "learning_rate": 1.3058415501106712e-06, - "loss": 0.623, - "step": 49047 - }, - { - "epoch": 1.26, - "learning_rate": 1.3058152054407113e-06, - "loss": 0.5908, - "step": 49048 - }, - { - "epoch": 1.26, - "learning_rate": 1.3057888605366025e-06, - "loss": 0.7959, - "step": 49049 - }, - { - "epoch": 1.26, - "learning_rate": 1.3057625153983654e-06, - "loss": 0.7852, - "step": 49050 - }, - { - "epoch": 1.26, - "learning_rate": 1.30573617002602e-06, - "loss": 0.7349, - "step": 49051 - }, - { - "epoch": 1.26, - "learning_rate": 1.3057098244195864e-06, - "loss": 0.5991, - "step": 49052 - }, - { - "epoch": 1.26, - "learning_rate": 1.3056834785790845e-06, - "loss": 0.5908, - "step": 49053 - }, - { - "epoch": 1.26, - "learning_rate": 1.3056571325045354e-06, - "loss": 0.5037, - "step": 49054 - }, - { - "epoch": 1.26, - "learning_rate": 1.305630786195958e-06, - "loss": 0.6641, - "step": 49055 - }, - { - "epoch": 1.26, - "learning_rate": 1.3056044396533738e-06, - "loss": 0.6523, - "step": 49056 - }, - { - "epoch": 1.26, - "learning_rate": 1.3055780928768023e-06, - "loss": 0.6621, - "step": 49057 - }, - { - "epoch": 1.26, - "learning_rate": 1.3055517458662634e-06, - "loss": 0.791, - "step": 49058 - }, - { - "epoch": 1.26, - "learning_rate": 1.3055253986217775e-06, - "loss": 0.5498, - "step": 49059 - }, - { - "epoch": 1.26, - "learning_rate": 1.3054990511433653e-06, - "loss": 0.5801, - "step": 49060 - }, - { - "epoch": 1.26, - "learning_rate": 1.3054727034310464e-06, - "loss": 0.7246, - "step": 49061 - }, - { - "epoch": 1.26, - "learning_rate": 1.3054463554848408e-06, - "loss": 0.6393, - "step": 49062 - }, - { - "epoch": 1.26, - "learning_rate": 1.305420007304769e-06, - "loss": 0.6611, - "step": 49063 - }, - { - "epoch": 1.26, - "learning_rate": 1.3053936588908513e-06, - "loss": 0.6294, - "step": 49064 - }, - { - "epoch": 1.26, - "learning_rate": 1.3053673102431078e-06, - "loss": 0.7725, - "step": 49065 - }, - { - "epoch": 1.26, - "learning_rate": 1.3053409613615584e-06, - "loss": 0.5132, - "step": 49066 - }, - { - "epoch": 1.26, - "learning_rate": 1.3053146122462239e-06, - "loss": 0.6826, - "step": 49067 - }, - { - "epoch": 1.26, - "learning_rate": 1.3052882628971235e-06, - "loss": 0.6411, - "step": 49068 - }, - { - "epoch": 1.26, - "learning_rate": 1.305261913314278e-06, - "loss": 0.4893, - "step": 49069 - }, - { - "epoch": 1.26, - "learning_rate": 1.3052355634977076e-06, - "loss": 0.6196, - "step": 49070 - }, - { - "epoch": 1.26, - "learning_rate": 1.3052092134474325e-06, - "loss": 0.7246, - "step": 49071 - }, - { - "epoch": 1.26, - "learning_rate": 1.3051828631634727e-06, - "loss": 0.7695, - "step": 49072 - }, - { - "epoch": 1.26, - "learning_rate": 1.3051565126458485e-06, - "loss": 0.6206, - "step": 49073 - }, - { - "epoch": 1.26, - "learning_rate": 1.3051301618945795e-06, - "loss": 0.6846, - "step": 49074 - }, - { - "epoch": 1.26, - "learning_rate": 1.3051038109096868e-06, - "loss": 0.626, - "step": 49075 - }, - { - "epoch": 1.26, - "learning_rate": 1.3050774596911902e-06, - "loss": 0.707, - "step": 49076 - }, - { - "epoch": 1.26, - "learning_rate": 1.3050511082391095e-06, - "loss": 0.3888, - "step": 49077 - }, - { - "epoch": 1.26, - "learning_rate": 1.3050247565534653e-06, - "loss": 0.6421, - "step": 49078 - }, - { - "epoch": 1.26, - "learning_rate": 1.3049984046342777e-06, - "loss": 0.7354, - "step": 49079 - }, - { - "epoch": 1.26, - "learning_rate": 1.3049720524815669e-06, - "loss": 0.5632, - "step": 49080 - }, - { - "epoch": 1.26, - "learning_rate": 1.304945700095353e-06, - "loss": 0.7422, - "step": 49081 - }, - { - "epoch": 1.26, - "learning_rate": 1.3049193474756562e-06, - "loss": 0.6013, - "step": 49082 - }, - { - "epoch": 1.26, - "learning_rate": 1.3048929946224966e-06, - "loss": 0.748, - "step": 49083 - }, - { - "epoch": 1.26, - "learning_rate": 1.3048666415358945e-06, - "loss": 0.7129, - "step": 49084 - }, - { - "epoch": 1.26, - "learning_rate": 1.3048402882158698e-06, - "loss": 0.5762, - "step": 49085 - }, - { - "epoch": 1.26, - "learning_rate": 1.3048139346624434e-06, - "loss": 0.6934, - "step": 49086 - }, - { - "epoch": 1.26, - "learning_rate": 1.3047875808756345e-06, - "loss": 0.6553, - "step": 49087 - }, - { - "epoch": 1.26, - "learning_rate": 1.3047612268554643e-06, - "loss": 0.7793, - "step": 49088 - }, - { - "epoch": 1.26, - "learning_rate": 1.3047348726019519e-06, - "loss": 0.5293, - "step": 49089 - }, - { - "epoch": 1.26, - "learning_rate": 1.3047085181151183e-06, - "loss": 0.5693, - "step": 49090 - }, - { - "epoch": 1.26, - "learning_rate": 1.3046821633949833e-06, - "loss": 0.5615, - "step": 49091 - }, - { - "epoch": 1.26, - "learning_rate": 1.3046558084415674e-06, - "loss": 0.6538, - "step": 49092 - }, - { - "epoch": 1.26, - "learning_rate": 1.3046294532548902e-06, - "loss": 0.6758, - "step": 49093 - }, - { - "epoch": 1.26, - "learning_rate": 1.3046030978349726e-06, - "loss": 0.54, - "step": 49094 - }, - { - "epoch": 1.26, - "learning_rate": 1.3045767421818341e-06, - "loss": 0.522, - "step": 49095 - }, - { - "epoch": 1.26, - "learning_rate": 1.3045503862954955e-06, - "loss": 0.8721, - "step": 49096 - }, - { - "epoch": 1.26, - "learning_rate": 1.3045240301759763e-06, - "loss": 0.7012, - "step": 49097 - }, - { - "epoch": 1.26, - "learning_rate": 1.3044976738232973e-06, - "loss": 0.6611, - "step": 49098 - }, - { - "epoch": 1.26, - "learning_rate": 1.3044713172374784e-06, - "loss": 0.6729, - "step": 49099 - }, - { - "epoch": 1.26, - "learning_rate": 1.30444496041854e-06, - "loss": 0.7344, - "step": 49100 - }, - { - "epoch": 1.26, - "learning_rate": 1.3044186033665016e-06, - "loss": 0.5771, - "step": 49101 - }, - { - "epoch": 1.26, - "learning_rate": 1.3043922460813842e-06, - "loss": 0.5332, - "step": 49102 - }, - { - "epoch": 1.26, - "learning_rate": 1.3043658885632075e-06, - "loss": 0.8291, - "step": 49103 - }, - { - "epoch": 1.26, - "learning_rate": 1.304339530811992e-06, - "loss": 0.645, - "step": 49104 - }, - { - "epoch": 1.26, - "learning_rate": 1.3043131728277577e-06, - "loss": 0.7227, - "step": 49105 - }, - { - "epoch": 1.26, - "learning_rate": 1.3042868146105248e-06, - "loss": 0.7373, - "step": 49106 - }, - { - "epoch": 1.26, - "learning_rate": 1.3042604561603133e-06, - "loss": 0.6816, - "step": 49107 - }, - { - "epoch": 1.26, - "learning_rate": 1.3042340974771437e-06, - "loss": 0.7471, - "step": 49108 - }, - { - "epoch": 1.26, - "learning_rate": 1.3042077385610361e-06, - "loss": 0.4557, - "step": 49109 - }, - { - "epoch": 1.26, - "learning_rate": 1.3041813794120104e-06, - "loss": 0.6572, - "step": 49110 - }, - { - "epoch": 1.26, - "learning_rate": 1.3041550200300875e-06, - "loss": 0.5918, - "step": 49111 - }, - { - "epoch": 1.26, - "learning_rate": 1.3041286604152866e-06, - "loss": 0.6523, - "step": 49112 - }, - { - "epoch": 1.26, - "learning_rate": 1.3041023005676286e-06, - "loss": 0.5869, - "step": 49113 - }, - { - "epoch": 1.26, - "learning_rate": 1.304075940487133e-06, - "loss": 0.7031, - "step": 49114 - }, - { - "epoch": 1.26, - "learning_rate": 1.304049580173821e-06, - "loss": 0.8184, - "step": 49115 - }, - { - "epoch": 1.26, - "learning_rate": 1.3040232196277122e-06, - "loss": 0.9551, - "step": 49116 - }, - { - "epoch": 1.26, - "learning_rate": 1.303996858848827e-06, - "loss": 0.6685, - "step": 49117 - }, - { - "epoch": 1.26, - "learning_rate": 1.3039704978371847e-06, - "loss": 0.6289, - "step": 49118 - }, - { - "epoch": 1.26, - "learning_rate": 1.3039441365928063e-06, - "loss": 0.6675, - "step": 49119 - }, - { - "epoch": 1.26, - "learning_rate": 1.303917775115712e-06, - "loss": 0.6143, - "step": 49120 - }, - { - "epoch": 1.26, - "learning_rate": 1.3038914134059221e-06, - "loss": 0.4495, - "step": 49121 - }, - { - "epoch": 1.26, - "learning_rate": 1.303865051463456e-06, - "loss": 0.6401, - "step": 49122 - }, - { - "epoch": 1.26, - "learning_rate": 1.3038386892883348e-06, - "loss": 0.7529, - "step": 49123 - }, - { - "epoch": 1.26, - "learning_rate": 1.3038123268805781e-06, - "loss": 0.5856, - "step": 49124 - }, - { - "epoch": 1.26, - "learning_rate": 1.3037859642402063e-06, - "loss": 0.4905, - "step": 49125 - }, - { - "epoch": 1.26, - "learning_rate": 1.3037596013672398e-06, - "loss": 0.7021, - "step": 49126 - }, - { - "epoch": 1.26, - "learning_rate": 1.3037332382616982e-06, - "loss": 0.645, - "step": 49127 - }, - { - "epoch": 1.26, - "learning_rate": 1.3037068749236022e-06, - "loss": 0.5691, - "step": 49128 - }, - { - "epoch": 1.26, - "learning_rate": 1.3036805113529716e-06, - "loss": 0.6768, - "step": 49129 - }, - { - "epoch": 1.26, - "learning_rate": 1.303654147549827e-06, - "loss": 0.5083, - "step": 49130 - }, - { - "epoch": 1.26, - "learning_rate": 1.3036277835141884e-06, - "loss": 0.5393, - "step": 49131 - }, - { - "epoch": 1.26, - "learning_rate": 1.303601419246076e-06, - "loss": 0.5767, - "step": 49132 - }, - { - "epoch": 1.26, - "learning_rate": 1.3035750547455097e-06, - "loss": 0.527, - "step": 49133 - }, - { - "epoch": 1.26, - "learning_rate": 1.3035486900125104e-06, - "loss": 0.6543, - "step": 49134 - }, - { - "epoch": 1.26, - "learning_rate": 1.3035223250470972e-06, - "loss": 0.4976, - "step": 49135 - }, - { - "epoch": 1.26, - "learning_rate": 1.3034959598492913e-06, - "loss": 0.5813, - "step": 49136 - }, - { - "epoch": 1.26, - "learning_rate": 1.3034695944191125e-06, - "loss": 0.7178, - "step": 49137 - }, - { - "epoch": 1.26, - "learning_rate": 1.3034432287565808e-06, - "loss": 0.7168, - "step": 49138 - }, - { - "epoch": 1.26, - "learning_rate": 1.3034168628617167e-06, - "loss": 0.4937, - "step": 49139 - }, - { - "epoch": 1.26, - "learning_rate": 1.3033904967345403e-06, - "loss": 0.5552, - "step": 49140 - }, - { - "epoch": 1.26, - "learning_rate": 1.3033641303750717e-06, - "loss": 0.6348, - "step": 49141 - }, - { - "epoch": 1.26, - "learning_rate": 1.3033377637833314e-06, - "loss": 0.8076, - "step": 49142 - }, - { - "epoch": 1.26, - "learning_rate": 1.303311396959339e-06, - "loss": 0.6309, - "step": 49143 - }, - { - "epoch": 1.26, - "learning_rate": 1.303285029903115e-06, - "loss": 0.6934, - "step": 49144 - }, - { - "epoch": 1.26, - "learning_rate": 1.3032586626146796e-06, - "loss": 0.6252, - "step": 49145 - }, - { - "epoch": 1.26, - "learning_rate": 1.303232295094053e-06, - "loss": 0.8584, - "step": 49146 - }, - { - "epoch": 1.26, - "learning_rate": 1.3032059273412555e-06, - "loss": 0.666, - "step": 49147 - }, - { - "epoch": 1.26, - "learning_rate": 1.303179559356307e-06, - "loss": 0.665, - "step": 49148 - }, - { - "epoch": 1.26, - "learning_rate": 1.3031531911392279e-06, - "loss": 0.6465, - "step": 49149 - }, - { - "epoch": 1.26, - "learning_rate": 1.3031268226900385e-06, - "loss": 0.6064, - "step": 49150 - }, - { - "epoch": 1.26, - "learning_rate": 1.303100454008759e-06, - "loss": 0.7578, - "step": 49151 - }, - { - "epoch": 1.26, - "learning_rate": 1.303074085095409e-06, - "loss": 0.7852, - "step": 49152 - }, - { - "epoch": 1.26, - "learning_rate": 1.3030477159500093e-06, - "loss": 0.5923, - "step": 49153 - }, - { - "epoch": 1.26, - "learning_rate": 1.3030213465725797e-06, - "loss": 0.4659, - "step": 49154 - }, - { - "epoch": 1.26, - "learning_rate": 1.3029949769631405e-06, - "loss": 0.6768, - "step": 49155 - }, - { - "epoch": 1.26, - "learning_rate": 1.3029686071217123e-06, - "loss": 0.6436, - "step": 49156 - }, - { - "epoch": 1.26, - "learning_rate": 1.302942237048315e-06, - "loss": 0.7598, - "step": 49157 - }, - { - "epoch": 1.26, - "learning_rate": 1.3029158667429684e-06, - "loss": 0.6377, - "step": 49158 - }, - { - "epoch": 1.26, - "learning_rate": 1.3028894962056935e-06, - "loss": 0.6104, - "step": 49159 - }, - { - "epoch": 1.26, - "learning_rate": 1.3028631254365098e-06, - "loss": 0.585, - "step": 49160 - }, - { - "epoch": 1.26, - "learning_rate": 1.302836754435438e-06, - "loss": 0.7139, - "step": 49161 - }, - { - "epoch": 1.26, - "learning_rate": 1.3028103832024977e-06, - "loss": 0.5264, - "step": 49162 - }, - { - "epoch": 1.26, - "learning_rate": 1.3027840117377093e-06, - "loss": 0.7412, - "step": 49163 - }, - { - "epoch": 1.26, - "learning_rate": 1.3027576400410933e-06, - "loss": 0.7363, - "step": 49164 - }, - { - "epoch": 1.26, - "learning_rate": 1.30273126811267e-06, - "loss": 0.5425, - "step": 49165 - }, - { - "epoch": 1.26, - "learning_rate": 1.3027048959524586e-06, - "loss": 0.7725, - "step": 49166 - }, - { - "epoch": 1.26, - "learning_rate": 1.3026785235604804e-06, - "loss": 0.6367, - "step": 49167 - }, - { - "epoch": 1.26, - "learning_rate": 1.3026521509367552e-06, - "loss": 0.5938, - "step": 49168 - }, - { - "epoch": 1.26, - "learning_rate": 1.3026257780813032e-06, - "loss": 0.6362, - "step": 49169 - }, - { - "epoch": 1.26, - "learning_rate": 1.3025994049941441e-06, - "loss": 0.5361, - "step": 49170 - }, - { - "epoch": 1.26, - "learning_rate": 1.3025730316752993e-06, - "loss": 0.7285, - "step": 49171 - }, - { - "epoch": 1.26, - "learning_rate": 1.3025466581247877e-06, - "loss": 0.6826, - "step": 49172 - }, - { - "epoch": 1.26, - "learning_rate": 1.3025202843426302e-06, - "loss": 0.7109, - "step": 49173 - }, - { - "epoch": 1.26, - "learning_rate": 1.3024939103288467e-06, - "loss": 0.6934, - "step": 49174 - }, - { - "epoch": 1.26, - "learning_rate": 1.3024675360834575e-06, - "loss": 0.6416, - "step": 49175 - }, - { - "epoch": 1.26, - "learning_rate": 1.3024411616064831e-06, - "loss": 0.874, - "step": 49176 - }, - { - "epoch": 1.26, - "learning_rate": 1.3024147868979433e-06, - "loss": 0.6538, - "step": 49177 - }, - { - "epoch": 1.26, - "learning_rate": 1.3023884119578585e-06, - "loss": 0.6235, - "step": 49178 - }, - { - "epoch": 1.26, - "learning_rate": 1.3023620367862485e-06, - "loss": 0.5862, - "step": 49179 - }, - { - "epoch": 1.26, - "learning_rate": 1.302335661383134e-06, - "loss": 0.7231, - "step": 49180 - }, - { - "epoch": 1.26, - "learning_rate": 1.302309285748535e-06, - "loss": 0.666, - "step": 49181 - }, - { - "epoch": 1.26, - "learning_rate": 1.3022829098824717e-06, - "loss": 0.396, - "step": 49182 - }, - { - "epoch": 1.26, - "learning_rate": 1.302256533784964e-06, - "loss": 0.5596, - "step": 49183 - }, - { - "epoch": 1.26, - "learning_rate": 1.3022301574560326e-06, - "loss": 0.7832, - "step": 49184 - }, - { - "epoch": 1.26, - "learning_rate": 1.3022037808956975e-06, - "loss": 0.6104, - "step": 49185 - }, - { - "epoch": 1.26, - "learning_rate": 1.3021774041039788e-06, - "loss": 0.7686, - "step": 49186 - }, - { - "epoch": 1.26, - "learning_rate": 1.3021510270808966e-06, - "loss": 0.7285, - "step": 49187 - }, - { - "epoch": 1.26, - "learning_rate": 1.3021246498264716e-06, - "loss": 0.7705, - "step": 49188 - }, - { - "epoch": 1.26, - "learning_rate": 1.3020982723407233e-06, - "loss": 0.668, - "step": 49189 - }, - { - "epoch": 1.26, - "learning_rate": 1.3020718946236724e-06, - "loss": 0.5425, - "step": 49190 - }, - { - "epoch": 1.26, - "learning_rate": 1.302045516675339e-06, - "loss": 0.6504, - "step": 49191 - }, - { - "epoch": 1.26, - "learning_rate": 1.302019138495743e-06, - "loss": 0.6548, - "step": 49192 - }, - { - "epoch": 1.26, - "learning_rate": 1.301992760084905e-06, - "loss": 0.498, - "step": 49193 - }, - { - "epoch": 1.26, - "learning_rate": 1.301966381442845e-06, - "loss": 0.6729, - "step": 49194 - }, - { - "epoch": 1.26, - "learning_rate": 1.3019400025695835e-06, - "loss": 0.7197, - "step": 49195 - }, - { - "epoch": 1.26, - "learning_rate": 1.30191362346514e-06, - "loss": 0.561, - "step": 49196 - }, - { - "epoch": 1.26, - "learning_rate": 1.3018872441295353e-06, - "loss": 0.6309, - "step": 49197 - }, - { - "epoch": 1.26, - "learning_rate": 1.3018608645627893e-06, - "loss": 0.8154, - "step": 49198 - }, - { - "epoch": 1.26, - "learning_rate": 1.3018344847649225e-06, - "loss": 0.5786, - "step": 49199 - }, - { - "epoch": 1.26, - "learning_rate": 1.3018081047359549e-06, - "loss": 0.6084, - "step": 49200 - }, - { - "epoch": 1.26, - "learning_rate": 1.301781724475907e-06, - "loss": 0.7207, - "step": 49201 - }, - { - "epoch": 1.26, - "learning_rate": 1.3017553439847979e-06, - "loss": 0.7529, - "step": 49202 - }, - { - "epoch": 1.26, - "learning_rate": 1.3017289632626491e-06, - "loss": 0.5541, - "step": 49203 - }, - { - "epoch": 1.26, - "learning_rate": 1.3017025823094802e-06, - "loss": 0.7393, - "step": 49204 - }, - { - "epoch": 1.26, - "learning_rate": 1.3016762011253119e-06, - "loss": 0.7344, - "step": 49205 - }, - { - "epoch": 1.26, - "learning_rate": 1.3016498197101636e-06, - "loss": 0.6816, - "step": 49206 - }, - { - "epoch": 1.26, - "learning_rate": 1.301623438064056e-06, - "loss": 0.4802, - "step": 49207 - }, - { - "epoch": 1.26, - "learning_rate": 1.301597056187009e-06, - "loss": 0.6006, - "step": 49208 - }, - { - "epoch": 1.26, - "learning_rate": 1.3015706740790433e-06, - "loss": 0.6172, - "step": 49209 - }, - { - "epoch": 1.26, - "learning_rate": 1.3015442917401789e-06, - "loss": 0.5605, - "step": 49210 - }, - { - "epoch": 1.26, - "learning_rate": 1.3015179091704353e-06, - "loss": 0.6997, - "step": 49211 - }, - { - "epoch": 1.26, - "learning_rate": 1.3014915263698338e-06, - "loss": 0.4829, - "step": 49212 - }, - { - "epoch": 1.26, - "learning_rate": 1.3014651433383941e-06, - "loss": 0.7637, - "step": 49213 - }, - { - "epoch": 1.26, - "learning_rate": 1.3014387600761363e-06, - "loss": 0.6445, - "step": 49214 - }, - { - "epoch": 1.26, - "learning_rate": 1.3014123765830807e-06, - "loss": 0.6675, - "step": 49215 - }, - { - "epoch": 1.26, - "learning_rate": 1.3013859928592475e-06, - "loss": 0.751, - "step": 49216 - }, - { - "epoch": 1.26, - "learning_rate": 1.3013596089046568e-06, - "loss": 0.7734, - "step": 49217 - }, - { - "epoch": 1.26, - "learning_rate": 1.3013332247193291e-06, - "loss": 0.5808, - "step": 49218 - }, - { - "epoch": 1.26, - "learning_rate": 1.3013068403032841e-06, - "loss": 0.8223, - "step": 49219 - }, - { - "epoch": 1.26, - "learning_rate": 1.301280455656543e-06, - "loss": 0.7285, - "step": 49220 - }, - { - "epoch": 1.26, - "learning_rate": 1.3012540707791246e-06, - "loss": 0.6768, - "step": 49221 - }, - { - "epoch": 1.26, - "learning_rate": 1.30122768567105e-06, - "loss": 0.6211, - "step": 49222 - }, - { - "epoch": 1.26, - "learning_rate": 1.3012013003323393e-06, - "loss": 0.5146, - "step": 49223 - }, - { - "epoch": 1.26, - "learning_rate": 1.3011749147630123e-06, - "loss": 0.6377, - "step": 49224 - }, - { - "epoch": 1.26, - "learning_rate": 1.3011485289630902e-06, - "loss": 0.5137, - "step": 49225 - }, - { - "epoch": 1.26, - "learning_rate": 1.301122142932592e-06, - "loss": 0.428, - "step": 49226 - }, - { - "epoch": 1.26, - "learning_rate": 1.3010957566715383e-06, - "loss": 0.7441, - "step": 49227 - }, - { - "epoch": 1.26, - "learning_rate": 1.3010693701799498e-06, - "loss": 0.6416, - "step": 49228 - }, - { - "epoch": 1.26, - "learning_rate": 1.301042983457846e-06, - "loss": 0.7168, - "step": 49229 - }, - { - "epoch": 1.26, - "learning_rate": 1.3010165965052477e-06, - "loss": 0.7266, - "step": 49230 - }, - { - "epoch": 1.26, - "learning_rate": 1.300990209322175e-06, - "loss": 0.6846, - "step": 49231 - }, - { - "epoch": 1.26, - "learning_rate": 1.3009638219086477e-06, - "loss": 0.4612, - "step": 49232 - }, - { - "epoch": 1.26, - "learning_rate": 1.300937434264686e-06, - "loss": 0.6973, - "step": 49233 - }, - { - "epoch": 1.26, - "learning_rate": 1.3009110463903106e-06, - "loss": 0.7627, - "step": 49234 - }, - { - "epoch": 1.26, - "learning_rate": 1.3008846582855415e-06, - "loss": 0.6572, - "step": 49235 - }, - { - "epoch": 1.26, - "learning_rate": 1.3008582699503987e-06, - "loss": 0.6396, - "step": 49236 - }, - { - "epoch": 1.26, - "learning_rate": 1.3008318813849026e-06, - "loss": 0.7754, - "step": 49237 - }, - { - "epoch": 1.26, - "learning_rate": 1.3008054925890732e-06, - "loss": 0.7207, - "step": 49238 - }, - { - "epoch": 1.26, - "learning_rate": 1.3007791035629311e-06, - "loss": 0.7568, - "step": 49239 - }, - { - "epoch": 1.26, - "learning_rate": 1.3007527143064962e-06, - "loss": 0.7471, - "step": 49240 - }, - { - "epoch": 1.26, - "learning_rate": 1.300726324819789e-06, - "loss": 0.5903, - "step": 49241 - }, - { - "epoch": 1.26, - "learning_rate": 1.3006999351028291e-06, - "loss": 0.7051, - "step": 49242 - }, - { - "epoch": 1.26, - "learning_rate": 1.3006735451556374e-06, - "loss": 0.6719, - "step": 49243 - }, - { - "epoch": 1.26, - "learning_rate": 1.3006471549782333e-06, - "loss": 0.8047, - "step": 49244 - }, - { - "epoch": 1.26, - "learning_rate": 1.3006207645706383e-06, - "loss": 0.5334, - "step": 49245 - }, - { - "epoch": 1.26, - "learning_rate": 1.3005943739328712e-06, - "loss": 0.6582, - "step": 49246 - }, - { - "epoch": 1.26, - "learning_rate": 1.300567983064953e-06, - "loss": 0.6062, - "step": 49247 - }, - { - "epoch": 1.26, - "learning_rate": 1.3005415919669036e-06, - "loss": 0.7354, - "step": 49248 - }, - { - "epoch": 1.26, - "learning_rate": 1.3005152006387435e-06, - "loss": 0.6494, - "step": 49249 - }, - { - "epoch": 1.26, - "learning_rate": 1.3004888090804927e-06, - "loss": 0.5303, - "step": 49250 - }, - { - "epoch": 1.26, - "learning_rate": 1.3004624172921713e-06, - "loss": 0.5918, - "step": 49251 - }, - { - "epoch": 1.26, - "learning_rate": 1.3004360252737996e-06, - "loss": 0.668, - "step": 49252 - }, - { - "epoch": 1.26, - "learning_rate": 1.300409633025398e-06, - "loss": 0.5615, - "step": 49253 - }, - { - "epoch": 1.26, - "learning_rate": 1.3003832405469864e-06, - "loss": 0.6592, - "step": 49254 - }, - { - "epoch": 1.26, - "learning_rate": 1.3003568478385854e-06, - "loss": 0.6489, - "step": 49255 - }, - { - "epoch": 1.26, - "learning_rate": 1.300330454900215e-06, - "loss": 0.8018, - "step": 49256 - }, - { - "epoch": 1.26, - "learning_rate": 1.300304061731895e-06, - "loss": 0.6514, - "step": 49257 - }, - { - "epoch": 1.26, - "learning_rate": 1.3002776683336462e-06, - "loss": 0.6133, - "step": 49258 - }, - { - "epoch": 1.26, - "learning_rate": 1.3002512747054888e-06, - "loss": 0.6187, - "step": 49259 - }, - { - "epoch": 1.26, - "learning_rate": 1.3002248808474426e-06, - "loss": 0.564, - "step": 49260 - }, - { - "epoch": 1.26, - "learning_rate": 1.300198486759528e-06, - "loss": 0.6436, - "step": 49261 - }, - { - "epoch": 1.26, - "learning_rate": 1.3001720924417652e-06, - "loss": 0.6904, - "step": 49262 - }, - { - "epoch": 1.26, - "learning_rate": 1.3001456978941745e-06, - "loss": 0.6377, - "step": 49263 - }, - { - "epoch": 1.26, - "learning_rate": 1.300119303116776e-06, - "loss": 0.6802, - "step": 49264 - }, - { - "epoch": 1.26, - "learning_rate": 1.30009290810959e-06, - "loss": 0.7646, - "step": 49265 - }, - { - "epoch": 1.26, - "learning_rate": 1.3000665128726368e-06, - "loss": 0.5098, - "step": 49266 - }, - { - "epoch": 1.26, - "learning_rate": 1.300040117405936e-06, - "loss": 0.6245, - "step": 49267 - }, - { - "epoch": 1.26, - "learning_rate": 1.3000137217095088e-06, - "loss": 0.4888, - "step": 49268 - }, - { - "epoch": 1.26, - "learning_rate": 1.2999873257833745e-06, - "loss": 0.6611, - "step": 49269 - }, - { - "epoch": 1.26, - "learning_rate": 1.299960929627554e-06, - "loss": 0.6074, - "step": 49270 - }, - { - "epoch": 1.26, - "learning_rate": 1.299934533242067e-06, - "loss": 0.4646, - "step": 49271 - }, - { - "epoch": 1.26, - "learning_rate": 1.299908136626934e-06, - "loss": 0.437, - "step": 49272 - }, - { - "epoch": 1.26, - "learning_rate": 1.2998817397821752e-06, - "loss": 0.7705, - "step": 49273 - }, - { - "epoch": 1.26, - "learning_rate": 1.2998553427078104e-06, - "loss": 0.8574, - "step": 49274 - }, - { - "epoch": 1.26, - "learning_rate": 1.2998289454038608e-06, - "loss": 0.6904, - "step": 49275 - }, - { - "epoch": 1.26, - "learning_rate": 1.2998025478703457e-06, - "loss": 0.7354, - "step": 49276 - }, - { - "epoch": 1.26, - "learning_rate": 1.2997761501072853e-06, - "loss": 0.5972, - "step": 49277 - }, - { - "epoch": 1.26, - "learning_rate": 1.2997497521147e-06, - "loss": 0.5825, - "step": 49278 - }, - { - "epoch": 1.26, - "learning_rate": 1.2997233538926104e-06, - "loss": 0.4094, - "step": 49279 - }, - { - "epoch": 1.26, - "learning_rate": 1.2996969554410364e-06, - "loss": 0.7168, - "step": 49280 - }, - { - "epoch": 1.26, - "learning_rate": 1.2996705567599981e-06, - "loss": 0.668, - "step": 49281 - }, - { - "epoch": 1.26, - "learning_rate": 1.2996441578495158e-06, - "loss": 0.6782, - "step": 49282 - }, - { - "epoch": 1.26, - "learning_rate": 1.29961775870961e-06, - "loss": 0.5396, - "step": 49283 - }, - { - "epoch": 1.26, - "learning_rate": 1.2995913593403003e-06, - "loss": 0.6895, - "step": 49284 - }, - { - "epoch": 1.26, - "learning_rate": 1.299564959741608e-06, - "loss": 0.8135, - "step": 49285 - }, - { - "epoch": 1.26, - "learning_rate": 1.2995385599135517e-06, - "loss": 0.7031, - "step": 49286 - }, - { - "epoch": 1.26, - "learning_rate": 1.299512159856153e-06, - "loss": 0.6201, - "step": 49287 - }, - { - "epoch": 1.26, - "learning_rate": 1.2994857595694314e-06, - "loss": 0.6484, - "step": 49288 - }, - { - "epoch": 1.26, - "learning_rate": 1.2994593590534074e-06, - "loss": 0.6504, - "step": 49289 - }, - { - "epoch": 1.26, - "learning_rate": 1.2994329583081012e-06, - "loss": 0.575, - "step": 49290 - }, - { - "epoch": 1.26, - "learning_rate": 1.299406557333533e-06, - "loss": 0.8252, - "step": 49291 - }, - { - "epoch": 1.26, - "learning_rate": 1.2993801561297227e-06, - "loss": 0.6992, - "step": 49292 - }, - { - "epoch": 1.26, - "learning_rate": 1.299353754696691e-06, - "loss": 0.6226, - "step": 49293 - }, - { - "epoch": 1.26, - "learning_rate": 1.2993273530344577e-06, - "loss": 0.6655, - "step": 49294 - }, - { - "epoch": 1.26, - "learning_rate": 1.2993009511430435e-06, - "loss": 0.5718, - "step": 49295 - }, - { - "epoch": 1.26, - "learning_rate": 1.299274549022468e-06, - "loss": 0.6924, - "step": 49296 - }, - { - "epoch": 1.26, - "learning_rate": 1.299248146672752e-06, - "loss": 0.7007, - "step": 49297 - }, - { - "epoch": 1.26, - "learning_rate": 1.2992217440939153e-06, - "loss": 0.6455, - "step": 49298 - }, - { - "epoch": 1.26, - "learning_rate": 1.2991953412859784e-06, - "loss": 0.6777, - "step": 49299 - }, - { - "epoch": 1.26, - "learning_rate": 1.2991689382489614e-06, - "loss": 0.5281, - "step": 49300 - }, - { - "epoch": 1.26, - "learning_rate": 1.2991425349828842e-06, - "loss": 0.6689, - "step": 49301 - }, - { - "epoch": 1.26, - "learning_rate": 1.2991161314877677e-06, - "loss": 0.8564, - "step": 49302 - }, - { - "epoch": 1.26, - "learning_rate": 1.2990897277636314e-06, - "loss": 0.7168, - "step": 49303 - }, - { - "epoch": 1.26, - "learning_rate": 1.299063323810496e-06, - "loss": 0.6484, - "step": 49304 - }, - { - "epoch": 1.26, - "learning_rate": 1.2990369196283817e-06, - "loss": 0.5469, - "step": 49305 - }, - { - "epoch": 1.26, - "learning_rate": 1.2990105152173085e-06, - "loss": 0.6055, - "step": 49306 - }, - { - "epoch": 1.26, - "learning_rate": 1.2989841105772965e-06, - "loss": 0.6294, - "step": 49307 - }, - { - "epoch": 1.26, - "learning_rate": 1.2989577057083662e-06, - "loss": 0.6758, - "step": 49308 - }, - { - "epoch": 1.26, - "learning_rate": 1.2989313006105378e-06, - "loss": 0.6934, - "step": 49309 - }, - { - "epoch": 1.26, - "learning_rate": 1.2989048952838317e-06, - "loss": 0.5049, - "step": 49310 - }, - { - "epoch": 1.26, - "learning_rate": 1.2988784897282675e-06, - "loss": 0.5552, - "step": 49311 - }, - { - "epoch": 1.26, - "learning_rate": 1.2988520839438659e-06, - "loss": 0.8555, - "step": 49312 - }, - { - "epoch": 1.26, - "learning_rate": 1.2988256779306468e-06, - "loss": 0.7109, - "step": 49313 - }, - { - "epoch": 1.26, - "learning_rate": 1.298799271688631e-06, - "loss": 0.6279, - "step": 49314 - }, - { - "epoch": 1.26, - "learning_rate": 1.2987728652178383e-06, - "loss": 0.6973, - "step": 49315 - }, - { - "epoch": 1.26, - "learning_rate": 1.2987464585182888e-06, - "loss": 0.6104, - "step": 49316 - }, - { - "epoch": 1.26, - "learning_rate": 1.2987200515900027e-06, - "loss": 0.4702, - "step": 49317 - }, - { - "epoch": 1.26, - "learning_rate": 1.2986936444330005e-06, - "loss": 0.6006, - "step": 49318 - }, - { - "epoch": 1.26, - "learning_rate": 1.2986672370473023e-06, - "loss": 0.4835, - "step": 49319 - }, - { - "epoch": 1.26, - "learning_rate": 1.2986408294329284e-06, - "loss": 0.3215, - "step": 49320 - }, - { - "epoch": 1.26, - "learning_rate": 1.298614421589899e-06, - "loss": 0.5972, - "step": 49321 - }, - { - "epoch": 1.26, - "learning_rate": 1.2985880135182346e-06, - "loss": 0.833, - "step": 49322 - }, - { - "epoch": 1.26, - "learning_rate": 1.2985616052179544e-06, - "loss": 0.5291, - "step": 49323 - }, - { - "epoch": 1.26, - "learning_rate": 1.2985351966890796e-06, - "loss": 0.6055, - "step": 49324 - }, - { - "epoch": 1.26, - "learning_rate": 1.2985087879316303e-06, - "loss": 0.7832, - "step": 49325 - }, - { - "epoch": 1.26, - "learning_rate": 1.2984823789456263e-06, - "loss": 0.501, - "step": 49326 - }, - { - "epoch": 1.26, - "learning_rate": 1.298455969731088e-06, - "loss": 0.5913, - "step": 49327 - }, - { - "epoch": 1.26, - "learning_rate": 1.2984295602880359e-06, - "loss": 0.5083, - "step": 49328 - }, - { - "epoch": 1.26, - "learning_rate": 1.29840315061649e-06, - "loss": 0.6357, - "step": 49329 - }, - { - "epoch": 1.26, - "learning_rate": 1.2983767407164705e-06, - "loss": 0.7295, - "step": 49330 - }, - { - "epoch": 1.26, - "learning_rate": 1.2983503305879977e-06, - "loss": 0.5782, - "step": 49331 - }, - { - "epoch": 1.26, - "learning_rate": 1.2983239202310916e-06, - "loss": 0.8652, - "step": 49332 - }, - { - "epoch": 1.26, - "learning_rate": 1.298297509645773e-06, - "loss": 0.7461, - "step": 49333 - }, - { - "epoch": 1.26, - "learning_rate": 1.2982710988320611e-06, - "loss": 0.7266, - "step": 49334 - }, - { - "epoch": 1.26, - "learning_rate": 1.2982446877899774e-06, - "loss": 0.667, - "step": 49335 - }, - { - "epoch": 1.26, - "learning_rate": 1.298218276519541e-06, - "loss": 0.6782, - "step": 49336 - }, - { - "epoch": 1.26, - "learning_rate": 1.2981918650207726e-06, - "loss": 0.7534, - "step": 49337 - }, - { - "epoch": 1.26, - "learning_rate": 1.2981654532936922e-06, - "loss": 0.665, - "step": 49338 - }, - { - "epoch": 1.26, - "learning_rate": 1.2981390413383206e-06, - "loss": 0.5073, - "step": 49339 - }, - { - "epoch": 1.26, - "learning_rate": 1.2981126291546778e-06, - "loss": 0.647, - "step": 49340 - }, - { - "epoch": 1.26, - "learning_rate": 1.2980862167427836e-06, - "loss": 0.7886, - "step": 49341 - }, - { - "epoch": 1.26, - "learning_rate": 1.2980598041026585e-06, - "loss": 0.7578, - "step": 49342 - }, - { - "epoch": 1.26, - "learning_rate": 1.2980333912343226e-06, - "loss": 0.7461, - "step": 49343 - }, - { - "epoch": 1.26, - "learning_rate": 1.2980069781377962e-06, - "loss": 0.7676, - "step": 49344 - }, - { - "epoch": 1.26, - "learning_rate": 1.2979805648130997e-06, - "loss": 0.6621, - "step": 49345 - }, - { - "epoch": 1.26, - "learning_rate": 1.2979541512602533e-06, - "loss": 0.564, - "step": 49346 - }, - { - "epoch": 1.26, - "learning_rate": 1.2979277374792769e-06, - "loss": 0.7676, - "step": 49347 - }, - { - "epoch": 1.26, - "learning_rate": 1.2979013234701913e-06, - "loss": 0.7334, - "step": 49348 - }, - { - "epoch": 1.26, - "learning_rate": 1.297874909233016e-06, - "loss": 0.7363, - "step": 49349 - }, - { - "epoch": 1.26, - "learning_rate": 1.2978484947677717e-06, - "loss": 0.5068, - "step": 49350 - }, - { - "epoch": 1.26, - "learning_rate": 1.2978220800744783e-06, - "loss": 0.5142, - "step": 49351 - }, - { - "epoch": 1.26, - "learning_rate": 1.2977956651531566e-06, - "loss": 0.4229, - "step": 49352 - }, - { - "epoch": 1.26, - "learning_rate": 1.297769250003826e-06, - "loss": 0.5293, - "step": 49353 - }, - { - "epoch": 1.26, - "learning_rate": 1.2977428346265075e-06, - "loss": 0.7471, - "step": 49354 - }, - { - "epoch": 1.26, - "learning_rate": 1.2977164190212212e-06, - "loss": 0.7275, - "step": 49355 - }, - { - "epoch": 1.27, - "learning_rate": 1.2976900031879868e-06, - "loss": 0.7988, - "step": 49356 - }, - { - "epoch": 1.27, - "learning_rate": 1.2976635871268246e-06, - "loss": 0.6592, - "step": 49357 - }, - { - "epoch": 1.27, - "learning_rate": 1.2976371708377556e-06, - "loss": 0.4094, - "step": 49358 - }, - { - "epoch": 1.27, - "learning_rate": 1.297610754320799e-06, - "loss": 0.7241, - "step": 49359 - }, - { - "epoch": 1.27, - "learning_rate": 1.2975843375759762e-06, - "loss": 0.5532, - "step": 49360 - }, - { - "epoch": 1.27, - "learning_rate": 1.2975579206033063e-06, - "loss": 0.708, - "step": 49361 - }, - { - "epoch": 1.27, - "learning_rate": 1.29753150340281e-06, - "loss": 0.8125, - "step": 49362 - }, - { - "epoch": 1.27, - "learning_rate": 1.2975050859745076e-06, - "loss": 0.7607, - "step": 49363 - }, - { - "epoch": 1.27, - "learning_rate": 1.2974786683184191e-06, - "loss": 0.709, - "step": 49364 - }, - { - "epoch": 1.27, - "learning_rate": 1.297452250434565e-06, - "loss": 0.5603, - "step": 49365 - }, - { - "epoch": 1.27, - "learning_rate": 1.2974258323229656e-06, - "loss": 0.7104, - "step": 49366 - }, - { - "epoch": 1.27, - "learning_rate": 1.2973994139836405e-06, - "loss": 0.3921, - "step": 49367 - }, - { - "epoch": 1.27, - "learning_rate": 1.2973729954166107e-06, - "loss": 0.6846, - "step": 49368 - }, - { - "epoch": 1.27, - "learning_rate": 1.2973465766218956e-06, - "loss": 0.8145, - "step": 49369 - }, - { - "epoch": 1.27, - "learning_rate": 1.2973201575995164e-06, - "loss": 0.7402, - "step": 49370 - }, - { - "epoch": 1.27, - "learning_rate": 1.2972937383494924e-06, - "loss": 0.5532, - "step": 49371 - }, - { - "epoch": 1.27, - "learning_rate": 1.2972673188718443e-06, - "loss": 0.3977, - "step": 49372 - }, - { - "epoch": 1.27, - "learning_rate": 1.2972408991665926e-06, - "loss": 0.5698, - "step": 49373 - }, - { - "epoch": 1.27, - "learning_rate": 1.297214479233757e-06, - "loss": 0.4995, - "step": 49374 - }, - { - "epoch": 1.27, - "learning_rate": 1.2971880590733582e-06, - "loss": 0.6357, - "step": 49375 - }, - { - "epoch": 1.27, - "learning_rate": 1.297161638685416e-06, - "loss": 0.5918, - "step": 49376 - }, - { - "epoch": 1.27, - "learning_rate": 1.2971352180699506e-06, - "loss": 0.6484, - "step": 49377 - }, - { - "epoch": 1.27, - "learning_rate": 1.2971087972269825e-06, - "loss": 0.7812, - "step": 49378 - }, - { - "epoch": 1.27, - "learning_rate": 1.2970823761565322e-06, - "loss": 0.5962, - "step": 49379 - }, - { - "epoch": 1.27, - "learning_rate": 1.2970559548586192e-06, - "loss": 0.6914, - "step": 49380 - }, - { - "epoch": 1.27, - "learning_rate": 1.2970295333332644e-06, - "loss": 0.7822, - "step": 49381 - }, - { - "epoch": 1.27, - "learning_rate": 1.2970031115804873e-06, - "loss": 0.6543, - "step": 49382 - }, - { - "epoch": 1.27, - "learning_rate": 1.2969766896003088e-06, - "loss": 0.5508, - "step": 49383 - }, - { - "epoch": 1.27, - "learning_rate": 1.296950267392749e-06, - "loss": 0.7505, - "step": 49384 - }, - { - "epoch": 1.27, - "learning_rate": 1.2969238449578284e-06, - "loss": 0.5796, - "step": 49385 - }, - { - "epoch": 1.27, - "learning_rate": 1.2968974222955662e-06, - "loss": 0.7471, - "step": 49386 - }, - { - "epoch": 1.27, - "learning_rate": 1.2968709994059837e-06, - "loss": 0.6768, - "step": 49387 - }, - { - "epoch": 1.27, - "learning_rate": 1.2968445762891005e-06, - "loss": 0.424, - "step": 49388 - }, - { - "epoch": 1.27, - "learning_rate": 1.296818152944937e-06, - "loss": 0.6348, - "step": 49389 - }, - { - "epoch": 1.27, - "learning_rate": 1.2967917293735138e-06, - "loss": 0.543, - "step": 49390 - }, - { - "epoch": 1.27, - "learning_rate": 1.2967653055748504e-06, - "loss": 0.7163, - "step": 49391 - }, - { - "epoch": 1.27, - "learning_rate": 1.296738881548968e-06, - "loss": 0.7422, - "step": 49392 - }, - { - "epoch": 1.27, - "learning_rate": 1.2967124572958857e-06, - "loss": 0.6533, - "step": 49393 - }, - { - "epoch": 1.27, - "learning_rate": 1.2966860328156247e-06, - "loss": 0.6154, - "step": 49394 - }, - { - "epoch": 1.27, - "learning_rate": 1.2966596081082049e-06, - "loss": 0.6514, - "step": 49395 - }, - { - "epoch": 1.27, - "learning_rate": 1.2966331831736464e-06, - "loss": 0.603, - "step": 49396 - }, - { - "epoch": 1.27, - "learning_rate": 1.2966067580119694e-06, - "loss": 0.79, - "step": 49397 - }, - { - "epoch": 1.27, - "learning_rate": 1.2965803326231941e-06, - "loss": 0.6592, - "step": 49398 - }, - { - "epoch": 1.27, - "learning_rate": 1.296553907007341e-06, - "loss": 0.582, - "step": 49399 - }, - { - "epoch": 1.27, - "learning_rate": 1.2965274811644305e-06, - "loss": 0.749, - "step": 49400 - }, - { - "epoch": 1.27, - "learning_rate": 1.2965010550944822e-06, - "loss": 0.605, - "step": 49401 - }, - { - "epoch": 1.27, - "learning_rate": 1.2964746287975167e-06, - "loss": 0.5776, - "step": 49402 - }, - { - "epoch": 1.27, - "learning_rate": 1.2964482022735543e-06, - "loss": 0.5586, - "step": 49403 - }, - { - "epoch": 1.27, - "learning_rate": 1.2964217755226152e-06, - "loss": 0.6304, - "step": 49404 - }, - { - "epoch": 1.27, - "learning_rate": 1.2963953485447197e-06, - "loss": 0.5664, - "step": 49405 - }, - { - "epoch": 1.27, - "learning_rate": 1.2963689213398877e-06, - "loss": 0.7734, - "step": 49406 - }, - { - "epoch": 1.27, - "learning_rate": 1.2963424939081395e-06, - "loss": 0.7617, - "step": 49407 - }, - { - "epoch": 1.27, - "learning_rate": 1.2963160662494957e-06, - "loss": 0.5745, - "step": 49408 - }, - { - "epoch": 1.27, - "learning_rate": 1.296289638363976e-06, - "loss": 0.7617, - "step": 49409 - }, - { - "epoch": 1.27, - "learning_rate": 1.2962632102516013e-06, - "loss": 0.7686, - "step": 49410 - }, - { - "epoch": 1.27, - "learning_rate": 1.2962367819123916e-06, - "loss": 0.667, - "step": 49411 - }, - { - "epoch": 1.27, - "learning_rate": 1.296210353346367e-06, - "loss": 0.5186, - "step": 49412 - }, - { - "epoch": 1.27, - "learning_rate": 1.2961839245535471e-06, - "loss": 0.4419, - "step": 49413 - }, - { - "epoch": 1.27, - "learning_rate": 1.2961574955339533e-06, - "loss": 0.752, - "step": 49414 - }, - { - "epoch": 1.27, - "learning_rate": 1.2961310662876056e-06, - "loss": 0.748, - "step": 49415 - }, - { - "epoch": 1.27, - "learning_rate": 1.2961046368145235e-06, - "loss": 0.7192, - "step": 49416 - }, - { - "epoch": 1.27, - "learning_rate": 1.2960782071147279e-06, - "loss": 0.6167, - "step": 49417 - }, - { - "epoch": 1.27, - "learning_rate": 1.2960517771882385e-06, - "loss": 0.6504, - "step": 49418 - }, - { - "epoch": 1.27, - "learning_rate": 1.2960253470350762e-06, - "loss": 0.7725, - "step": 49419 - }, - { - "epoch": 1.27, - "learning_rate": 1.295998916655261e-06, - "loss": 0.533, - "step": 49420 - }, - { - "epoch": 1.27, - "learning_rate": 1.295972486048813e-06, - "loss": 0.6006, - "step": 49421 - }, - { - "epoch": 1.27, - "learning_rate": 1.295946055215752e-06, - "loss": 0.6631, - "step": 49422 - }, - { - "epoch": 1.27, - "learning_rate": 1.295919624156099e-06, - "loss": 0.5465, - "step": 49423 - }, - { - "epoch": 1.27, - "learning_rate": 1.295893192869874e-06, - "loss": 0.5757, - "step": 49424 - }, - { - "epoch": 1.27, - "learning_rate": 1.2958667613570974e-06, - "loss": 0.8027, - "step": 49425 - }, - { - "epoch": 1.27, - "learning_rate": 1.2958403296177888e-06, - "loss": 0.6816, - "step": 49426 - }, - { - "epoch": 1.27, - "learning_rate": 1.2958138976519692e-06, - "loss": 0.7231, - "step": 49427 - }, - { - "epoch": 1.27, - "learning_rate": 1.2957874654596584e-06, - "loss": 0.6445, - "step": 49428 - }, - { - "epoch": 1.27, - "learning_rate": 1.2957610330408765e-06, - "loss": 0.6475, - "step": 49429 - }, - { - "epoch": 1.27, - "learning_rate": 1.2957346003956445e-06, - "loss": 0.6621, - "step": 49430 - }, - { - "epoch": 1.27, - "learning_rate": 1.2957081675239818e-06, - "loss": 0.8262, - "step": 49431 - }, - { - "epoch": 1.27, - "learning_rate": 1.2956817344259089e-06, - "loss": 0.4218, - "step": 49432 - }, - { - "epoch": 1.27, - "learning_rate": 1.295655301101446e-06, - "loss": 0.5883, - "step": 49433 - }, - { - "epoch": 1.27, - "learning_rate": 1.2956288675506135e-06, - "loss": 0.7207, - "step": 49434 - }, - { - "epoch": 1.27, - "learning_rate": 1.2956024337734319e-06, - "loss": 0.6362, - "step": 49435 - }, - { - "epoch": 1.27, - "learning_rate": 1.295575999769921e-06, - "loss": 0.626, - "step": 49436 - }, - { - "epoch": 1.27, - "learning_rate": 1.2955495655401009e-06, - "loss": 0.6445, - "step": 49437 - }, - { - "epoch": 1.27, - "learning_rate": 1.295523131083992e-06, - "loss": 0.4246, - "step": 49438 - }, - { - "epoch": 1.27, - "learning_rate": 1.295496696401615e-06, - "loss": 0.5693, - "step": 49439 - }, - { - "epoch": 1.27, - "learning_rate": 1.2954702614929898e-06, - "loss": 0.7061, - "step": 49440 - }, - { - "epoch": 1.27, - "learning_rate": 1.2954438263581362e-06, - "loss": 0.6885, - "step": 49441 - }, - { - "epoch": 1.27, - "learning_rate": 1.2954173909970752e-06, - "loss": 0.7324, - "step": 49442 - }, - { - "epoch": 1.27, - "learning_rate": 1.2953909554098261e-06, - "loss": 0.5144, - "step": 49443 - }, - { - "epoch": 1.27, - "learning_rate": 1.2953645195964106e-06, - "loss": 0.5293, - "step": 49444 - }, - { - "epoch": 1.27, - "learning_rate": 1.2953380835568474e-06, - "loss": 0.6406, - "step": 49445 - }, - { - "epoch": 1.27, - "learning_rate": 1.2953116472911577e-06, - "loss": 0.6807, - "step": 49446 - }, - { - "epoch": 1.27, - "learning_rate": 1.2952852107993613e-06, - "loss": 0.4824, - "step": 49447 - }, - { - "epoch": 1.27, - "learning_rate": 1.2952587740814787e-06, - "loss": 0.5308, - "step": 49448 - }, - { - "epoch": 1.27, - "learning_rate": 1.2952323371375298e-06, - "loss": 0.4717, - "step": 49449 - }, - { - "epoch": 1.27, - "learning_rate": 1.2952058999675357e-06, - "loss": 0.6082, - "step": 49450 - }, - { - "epoch": 1.27, - "learning_rate": 1.2951794625715153e-06, - "loss": 0.8018, - "step": 49451 - }, - { - "epoch": 1.27, - "learning_rate": 1.29515302494949e-06, - "loss": 0.6143, - "step": 49452 - }, - { - "epoch": 1.27, - "learning_rate": 1.2951265871014793e-06, - "loss": 0.624, - "step": 49453 - }, - { - "epoch": 1.27, - "learning_rate": 1.2951001490275041e-06, - "loss": 0.626, - "step": 49454 - }, - { - "epoch": 1.27, - "learning_rate": 1.2950737107275842e-06, - "loss": 0.7598, - "step": 49455 - }, - { - "epoch": 1.27, - "learning_rate": 1.2950472722017398e-06, - "loss": 0.772, - "step": 49456 - }, - { - "epoch": 1.27, - "learning_rate": 1.2950208334499913e-06, - "loss": 0.7842, - "step": 49457 - }, - { - "epoch": 1.27, - "learning_rate": 1.294994394472359e-06, - "loss": 0.7783, - "step": 49458 - }, - { - "epoch": 1.27, - "learning_rate": 1.2949679552688627e-06, - "loss": 0.5583, - "step": 49459 - }, - { - "epoch": 1.27, - "learning_rate": 1.2949415158395232e-06, - "loss": 0.5422, - "step": 49460 - }, - { - "epoch": 1.27, - "learning_rate": 1.2949150761843609e-06, - "loss": 0.6704, - "step": 49461 - }, - { - "epoch": 1.27, - "learning_rate": 1.294888636303395e-06, - "loss": 0.647, - "step": 49462 - }, - { - "epoch": 1.27, - "learning_rate": 1.2948621961966471e-06, - "loss": 0.6548, - "step": 49463 - }, - { - "epoch": 1.27, - "learning_rate": 1.2948357558641363e-06, - "loss": 0.5269, - "step": 49464 - }, - { - "epoch": 1.27, - "learning_rate": 1.2948093153058836e-06, - "loss": 0.6982, - "step": 49465 - }, - { - "epoch": 1.27, - "learning_rate": 1.2947828745219089e-06, - "loss": 0.6299, - "step": 49466 - }, - { - "epoch": 1.27, - "learning_rate": 1.2947564335122325e-06, - "loss": 0.8164, - "step": 49467 - }, - { - "epoch": 1.27, - "learning_rate": 1.2947299922768746e-06, - "loss": 0.5, - "step": 49468 - }, - { - "epoch": 1.27, - "learning_rate": 1.2947035508158554e-06, - "loss": 0.6807, - "step": 49469 - }, - { - "epoch": 1.27, - "learning_rate": 1.2946771091291955e-06, - "loss": 0.6602, - "step": 49470 - }, - { - "epoch": 1.27, - "learning_rate": 1.294650667216915e-06, - "loss": 0.6377, - "step": 49471 - }, - { - "epoch": 1.27, - "learning_rate": 1.2946242250790336e-06, - "loss": 0.6016, - "step": 49472 - }, - { - "epoch": 1.27, - "learning_rate": 1.2945977827155722e-06, - "loss": 0.8271, - "step": 49473 - }, - { - "epoch": 1.27, - "learning_rate": 1.2945713401265506e-06, - "loss": 0.6816, - "step": 49474 - }, - { - "epoch": 1.27, - "learning_rate": 1.2945448973119897e-06, - "loss": 0.6602, - "step": 49475 - }, - { - "epoch": 1.27, - "learning_rate": 1.2945184542719089e-06, - "loss": 0.7588, - "step": 49476 - }, - { - "epoch": 1.27, - "learning_rate": 1.294492011006329e-06, - "loss": 0.665, - "step": 49477 - }, - { - "epoch": 1.27, - "learning_rate": 1.2944655675152702e-06, - "loss": 0.5972, - "step": 49478 - }, - { - "epoch": 1.27, - "learning_rate": 1.2944391237987527e-06, - "loss": 0.7056, - "step": 49479 - }, - { - "epoch": 1.27, - "learning_rate": 1.2944126798567967e-06, - "loss": 0.5708, - "step": 49480 - }, - { - "epoch": 1.27, - "learning_rate": 1.2943862356894221e-06, - "loss": 0.6074, - "step": 49481 - }, - { - "epoch": 1.27, - "learning_rate": 1.29435979129665e-06, - "loss": 0.4777, - "step": 49482 - }, - { - "epoch": 1.27, - "learning_rate": 1.2943333466784995e-06, - "loss": 0.5825, - "step": 49483 - }, - { - "epoch": 1.27, - "learning_rate": 1.2943069018349921e-06, - "loss": 0.7212, - "step": 49484 - }, - { - "epoch": 1.27, - "learning_rate": 1.294280456766147e-06, - "loss": 0.7412, - "step": 49485 - }, - { - "epoch": 1.27, - "learning_rate": 1.2942540114719856e-06, - "loss": 0.5298, - "step": 49486 - }, - { - "epoch": 1.27, - "learning_rate": 1.2942275659525268e-06, - "loss": 0.6162, - "step": 49487 - }, - { - "epoch": 1.27, - "learning_rate": 1.2942011202077917e-06, - "loss": 0.5215, - "step": 49488 - }, - { - "epoch": 1.27, - "learning_rate": 1.2941746742378001e-06, - "loss": 0.7451, - "step": 49489 - }, - { - "epoch": 1.27, - "learning_rate": 1.2941482280425728e-06, - "loss": 0.5647, - "step": 49490 - }, - { - "epoch": 1.27, - "learning_rate": 1.2941217816221296e-06, - "loss": 0.7979, - "step": 49491 - }, - { - "epoch": 1.27, - "learning_rate": 1.2940953349764908e-06, - "loss": 0.6865, - "step": 49492 - }, - { - "epoch": 1.27, - "learning_rate": 1.2940688881056765e-06, - "loss": 0.7686, - "step": 49493 - }, - { - "epoch": 1.27, - "learning_rate": 1.2940424410097078e-06, - "loss": 0.324, - "step": 49494 - }, - { - "epoch": 1.27, - "learning_rate": 1.2940159936886036e-06, - "loss": 0.6548, - "step": 49495 - }, - { - "epoch": 1.27, - "learning_rate": 1.2939895461423854e-06, - "loss": 0.5107, - "step": 49496 - }, - { - "epoch": 1.27, - "learning_rate": 1.2939630983710728e-06, - "loss": 0.6509, - "step": 49497 - }, - { - "epoch": 1.27, - "learning_rate": 1.293936650374686e-06, - "loss": 0.5732, - "step": 49498 - }, - { - "epoch": 1.27, - "learning_rate": 1.2939102021532456e-06, - "loss": 0.8467, - "step": 49499 - }, - { - "epoch": 1.27, - "learning_rate": 1.2938837537067715e-06, - "loss": 0.6182, - "step": 49500 - }, - { - "epoch": 1.27, - "learning_rate": 1.2938573050352843e-06, - "loss": 0.6353, - "step": 49501 - }, - { - "epoch": 1.27, - "learning_rate": 1.293830856138804e-06, - "loss": 0.6055, - "step": 49502 - }, - { - "epoch": 1.27, - "learning_rate": 1.293804407017351e-06, - "loss": 0.7742, - "step": 49503 - }, - { - "epoch": 1.27, - "learning_rate": 1.2937779576709456e-06, - "loss": 0.834, - "step": 49504 - }, - { - "epoch": 1.27, - "learning_rate": 1.2937515080996075e-06, - "loss": 0.7461, - "step": 49505 - }, - { - "epoch": 1.27, - "learning_rate": 1.2937250583033577e-06, - "loss": 0.7109, - "step": 49506 - }, - { - "epoch": 1.27, - "learning_rate": 1.2936986082822162e-06, - "loss": 0.7432, - "step": 49507 - }, - { - "epoch": 1.27, - "learning_rate": 1.2936721580362026e-06, - "loss": 0.4458, - "step": 49508 - }, - { - "epoch": 1.27, - "learning_rate": 1.2936457075653385e-06, - "loss": 0.5781, - "step": 49509 - }, - { - "epoch": 1.27, - "learning_rate": 1.293619256869643e-06, - "loss": 0.6196, - "step": 49510 - }, - { - "epoch": 1.27, - "learning_rate": 1.2935928059491369e-06, - "loss": 0.7021, - "step": 49511 - }, - { - "epoch": 1.27, - "learning_rate": 1.29356635480384e-06, - "loss": 0.5996, - "step": 49512 - }, - { - "epoch": 1.27, - "learning_rate": 1.293539903433773e-06, - "loss": 0.6812, - "step": 49513 - }, - { - "epoch": 1.27, - "learning_rate": 1.293513451838956e-06, - "loss": 0.625, - "step": 49514 - }, - { - "epoch": 1.27, - "learning_rate": 1.2934870000194094e-06, - "loss": 0.54, - "step": 49515 - }, - { - "epoch": 1.27, - "learning_rate": 1.293460547975153e-06, - "loss": 0.7051, - "step": 49516 - }, - { - "epoch": 1.27, - "learning_rate": 1.2934340957062075e-06, - "loss": 0.7246, - "step": 49517 - }, - { - "epoch": 1.27, - "learning_rate": 1.2934076432125928e-06, - "loss": 0.532, - "step": 49518 - }, - { - "epoch": 1.27, - "learning_rate": 1.2933811904943298e-06, - "loss": 0.8604, - "step": 49519 - }, - { - "epoch": 1.27, - "learning_rate": 1.293354737551438e-06, - "loss": 0.5762, - "step": 49520 - }, - { - "epoch": 1.27, - "learning_rate": 1.293328284383938e-06, - "loss": 0.8115, - "step": 49521 - }, - { - "epoch": 1.27, - "learning_rate": 1.29330183099185e-06, - "loss": 0.7861, - "step": 49522 - }, - { - "epoch": 1.27, - "learning_rate": 1.2932753773751946e-06, - "loss": 0.7695, - "step": 49523 - }, - { - "epoch": 1.27, - "learning_rate": 1.2932489235339915e-06, - "loss": 0.6074, - "step": 49524 - }, - { - "epoch": 1.27, - "learning_rate": 1.293222469468261e-06, - "loss": 0.5693, - "step": 49525 - }, - { - "epoch": 1.27, - "learning_rate": 1.2931960151780237e-06, - "loss": 0.8359, - "step": 49526 - }, - { - "epoch": 1.27, - "learning_rate": 1.2931695606632995e-06, - "loss": 0.667, - "step": 49527 - }, - { - "epoch": 1.27, - "learning_rate": 1.293143105924109e-06, - "loss": 0.4868, - "step": 49528 - }, - { - "epoch": 1.27, - "learning_rate": 1.2931166509604725e-06, - "loss": 0.7529, - "step": 49529 - }, - { - "epoch": 1.27, - "learning_rate": 1.29309019577241e-06, - "loss": 0.7363, - "step": 49530 - }, - { - "epoch": 1.27, - "learning_rate": 1.2930637403599415e-06, - "loss": 0.6306, - "step": 49531 - }, - { - "epoch": 1.27, - "learning_rate": 1.293037284723088e-06, - "loss": 0.7861, - "step": 49532 - }, - { - "epoch": 1.27, - "learning_rate": 1.2930108288618688e-06, - "loss": 0.5513, - "step": 49533 - }, - { - "epoch": 1.27, - "learning_rate": 1.2929843727763053e-06, - "loss": 0.7432, - "step": 49534 - }, - { - "epoch": 1.27, - "learning_rate": 1.2929579164664165e-06, - "loss": 0.623, - "step": 49535 - }, - { - "epoch": 1.27, - "learning_rate": 1.292931459932224e-06, - "loss": 0.6826, - "step": 49536 - }, - { - "epoch": 1.27, - "learning_rate": 1.2929050031737468e-06, - "loss": 0.6631, - "step": 49537 - }, - { - "epoch": 1.27, - "learning_rate": 1.2928785461910058e-06, - "loss": 0.5223, - "step": 49538 - }, - { - "epoch": 1.27, - "learning_rate": 1.2928520889840212e-06, - "loss": 0.6514, - "step": 49539 - }, - { - "epoch": 1.27, - "learning_rate": 1.2928256315528134e-06, - "loss": 0.3564, - "step": 49540 - }, - { - "epoch": 1.27, - "learning_rate": 1.2927991738974022e-06, - "loss": 0.6343, - "step": 49541 - }, - { - "epoch": 1.27, - "learning_rate": 1.2927727160178083e-06, - "loss": 0.4607, - "step": 49542 - }, - { - "epoch": 1.27, - "learning_rate": 1.2927462579140516e-06, - "loss": 0.625, - "step": 49543 - }, - { - "epoch": 1.27, - "learning_rate": 1.2927197995861528e-06, - "loss": 0.7939, - "step": 49544 - }, - { - "epoch": 1.27, - "learning_rate": 1.2926933410341318e-06, - "loss": 0.7422, - "step": 49545 - }, - { - "epoch": 1.27, - "learning_rate": 1.292666882258009e-06, - "loss": 0.5332, - "step": 49546 - }, - { - "epoch": 1.27, - "learning_rate": 1.2926404232578048e-06, - "loss": 0.585, - "step": 49547 - }, - { - "epoch": 1.27, - "learning_rate": 1.2926139640335389e-06, - "loss": 0.5479, - "step": 49548 - }, - { - "epoch": 1.27, - "learning_rate": 1.2925875045852323e-06, - "loss": 0.5505, - "step": 49549 - }, - { - "epoch": 1.27, - "learning_rate": 1.2925610449129044e-06, - "loss": 0.6768, - "step": 49550 - }, - { - "epoch": 1.27, - "learning_rate": 1.2925345850165765e-06, - "loss": 0.6665, - "step": 49551 - }, - { - "epoch": 1.27, - "learning_rate": 1.2925081248962682e-06, - "loss": 0.6553, - "step": 49552 - }, - { - "epoch": 1.27, - "learning_rate": 1.2924816645519996e-06, - "loss": 0.6304, - "step": 49553 - }, - { - "epoch": 1.27, - "learning_rate": 1.2924552039837914e-06, - "loss": 0.6631, - "step": 49554 - }, - { - "epoch": 1.27, - "learning_rate": 1.2924287431916642e-06, - "loss": 0.6895, - "step": 49555 - }, - { - "epoch": 1.27, - "learning_rate": 1.292402282175637e-06, - "loss": 0.5752, - "step": 49556 - }, - { - "epoch": 1.27, - "learning_rate": 1.2923758209357311e-06, - "loss": 0.6201, - "step": 49557 - }, - { - "epoch": 1.27, - "learning_rate": 1.2923493594719662e-06, - "loss": 0.625, - "step": 49558 - }, - { - "epoch": 1.27, - "learning_rate": 1.2923228977843636e-06, - "loss": 0.4032, - "step": 49559 - }, - { - "epoch": 1.27, - "learning_rate": 1.2922964358729422e-06, - "loss": 0.7588, - "step": 49560 - }, - { - "epoch": 1.27, - "learning_rate": 1.292269973737723e-06, - "loss": 0.6843, - "step": 49561 - }, - { - "epoch": 1.27, - "learning_rate": 1.292243511378726e-06, - "loss": 0.5923, - "step": 49562 - }, - { - "epoch": 1.27, - "learning_rate": 1.2922170487959716e-06, - "loss": 0.5894, - "step": 49563 - }, - { - "epoch": 1.27, - "learning_rate": 1.2921905859894803e-06, - "loss": 0.5356, - "step": 49564 - }, - { - "epoch": 1.27, - "learning_rate": 1.2921641229592722e-06, - "loss": 0.7754, - "step": 49565 - }, - { - "epoch": 1.27, - "learning_rate": 1.292137659705367e-06, - "loss": 0.6025, - "step": 49566 - }, - { - "epoch": 1.27, - "learning_rate": 1.2921111962277856e-06, - "loss": 0.4844, - "step": 49567 - }, - { - "epoch": 1.27, - "learning_rate": 1.2920847325265478e-06, - "loss": 0.5339, - "step": 49568 - }, - { - "epoch": 1.27, - "learning_rate": 1.2920582686016745e-06, - "loss": 0.6372, - "step": 49569 - }, - { - "epoch": 1.27, - "learning_rate": 1.292031804453186e-06, - "loss": 0.6387, - "step": 49570 - }, - { - "epoch": 1.27, - "learning_rate": 1.2920053400811015e-06, - "loss": 0.5137, - "step": 49571 - }, - { - "epoch": 1.27, - "learning_rate": 1.2919788754854422e-06, - "loss": 0.6787, - "step": 49572 - }, - { - "epoch": 1.27, - "learning_rate": 1.2919524106662279e-06, - "loss": 0.8047, - "step": 49573 - }, - { - "epoch": 1.27, - "learning_rate": 1.2919259456234794e-06, - "loss": 0.5825, - "step": 49574 - }, - { - "epoch": 1.27, - "learning_rate": 1.2918994803572165e-06, - "loss": 0.4768, - "step": 49575 - }, - { - "epoch": 1.27, - "learning_rate": 1.2918730148674594e-06, - "loss": 0.5962, - "step": 49576 - }, - { - "epoch": 1.27, - "learning_rate": 1.2918465491542287e-06, - "loss": 0.6772, - "step": 49577 - }, - { - "epoch": 1.27, - "learning_rate": 1.2918200832175447e-06, - "loss": 0.6309, - "step": 49578 - }, - { - "epoch": 1.27, - "learning_rate": 1.2917936170574275e-06, - "loss": 0.6211, - "step": 49579 - }, - { - "epoch": 1.27, - "learning_rate": 1.291767150673897e-06, - "loss": 0.6367, - "step": 49580 - }, - { - "epoch": 1.27, - "learning_rate": 1.291740684066974e-06, - "loss": 0.6562, - "step": 49581 - }, - { - "epoch": 1.27, - "learning_rate": 1.2917142172366786e-06, - "loss": 0.5259, - "step": 49582 - }, - { - "epoch": 1.27, - "learning_rate": 1.2916877501830308e-06, - "loss": 0.6968, - "step": 49583 - }, - { - "epoch": 1.27, - "learning_rate": 1.2916612829060517e-06, - "loss": 0.6802, - "step": 49584 - }, - { - "epoch": 1.27, - "learning_rate": 1.2916348154057604e-06, - "loss": 0.6572, - "step": 49585 - }, - { - "epoch": 1.27, - "learning_rate": 1.2916083476821778e-06, - "loss": 0.7061, - "step": 49586 - }, - { - "epoch": 1.27, - "learning_rate": 1.291581879735324e-06, - "loss": 0.5869, - "step": 49587 - }, - { - "epoch": 1.27, - "learning_rate": 1.2915554115652196e-06, - "loss": 0.8262, - "step": 49588 - }, - { - "epoch": 1.27, - "learning_rate": 1.2915289431718845e-06, - "loss": 0.6748, - "step": 49589 - }, - { - "epoch": 1.27, - "learning_rate": 1.291502474555339e-06, - "loss": 0.7871, - "step": 49590 - }, - { - "epoch": 1.27, - "learning_rate": 1.2914760057156039e-06, - "loss": 0.8096, - "step": 49591 - }, - { - "epoch": 1.27, - "learning_rate": 1.2914495366526988e-06, - "loss": 0.6184, - "step": 49592 - }, - { - "epoch": 1.27, - "learning_rate": 1.2914230673666439e-06, - "loss": 0.7666, - "step": 49593 - }, - { - "epoch": 1.27, - "learning_rate": 1.2913965978574602e-06, - "loss": 0.4758, - "step": 49594 - }, - { - "epoch": 1.27, - "learning_rate": 1.2913701281251674e-06, - "loss": 0.5889, - "step": 49595 - }, - { - "epoch": 1.27, - "learning_rate": 1.2913436581697856e-06, - "loss": 0.6904, - "step": 49596 - }, - { - "epoch": 1.27, - "learning_rate": 1.2913171879913356e-06, - "loss": 0.5649, - "step": 49597 - }, - { - "epoch": 1.27, - "learning_rate": 1.2912907175898372e-06, - "loss": 0.5459, - "step": 49598 - }, - { - "epoch": 1.27, - "learning_rate": 1.2912642469653115e-06, - "loss": 0.5215, - "step": 49599 - }, - { - "epoch": 1.27, - "learning_rate": 1.2912377761177774e-06, - "loss": 0.8408, - "step": 49600 - }, - { - "epoch": 1.27, - "learning_rate": 1.2912113050472564e-06, - "loss": 0.4722, - "step": 49601 - }, - { - "epoch": 1.27, - "learning_rate": 1.291184833753768e-06, - "loss": 0.686, - "step": 49602 - }, - { - "epoch": 1.27, - "learning_rate": 1.291158362237333e-06, - "loss": 0.5918, - "step": 49603 - }, - { - "epoch": 1.27, - "learning_rate": 1.2911318904979714e-06, - "loss": 0.7891, - "step": 49604 - }, - { - "epoch": 1.27, - "learning_rate": 1.2911054185357036e-06, - "loss": 0.6357, - "step": 49605 - }, - { - "epoch": 1.27, - "learning_rate": 1.2910789463505493e-06, - "loss": 0.5343, - "step": 49606 - }, - { - "epoch": 1.27, - "learning_rate": 1.2910524739425296e-06, - "loss": 0.6367, - "step": 49607 - }, - { - "epoch": 1.27, - "learning_rate": 1.2910260013116645e-06, - "loss": 0.5679, - "step": 49608 - }, - { - "epoch": 1.27, - "learning_rate": 1.2909995284579742e-06, - "loss": 0.6406, - "step": 49609 - }, - { - "epoch": 1.27, - "learning_rate": 1.2909730553814786e-06, - "loss": 0.603, - "step": 49610 - }, - { - "epoch": 1.27, - "learning_rate": 1.2909465820821986e-06, - "loss": 0.604, - "step": 49611 - }, - { - "epoch": 1.27, - "learning_rate": 1.290920108560154e-06, - "loss": 0.564, - "step": 49612 - }, - { - "epoch": 1.27, - "learning_rate": 1.2908936348153651e-06, - "loss": 0.7471, - "step": 49613 - }, - { - "epoch": 1.27, - "learning_rate": 1.2908671608478528e-06, - "loss": 0.543, - "step": 49614 - }, - { - "epoch": 1.27, - "learning_rate": 1.2908406866576364e-06, - "loss": 0.7344, - "step": 49615 - }, - { - "epoch": 1.27, - "learning_rate": 1.290814212244737e-06, - "loss": 0.6304, - "step": 49616 - }, - { - "epoch": 1.27, - "learning_rate": 1.2907877376091743e-06, - "loss": 0.665, - "step": 49617 - }, - { - "epoch": 1.27, - "learning_rate": 1.290761262750969e-06, - "loss": 0.5669, - "step": 49618 - }, - { - "epoch": 1.27, - "learning_rate": 1.2907347876701412e-06, - "loss": 0.7412, - "step": 49619 - }, - { - "epoch": 1.27, - "learning_rate": 1.290708312366711e-06, - "loss": 0.6699, - "step": 49620 - }, - { - "epoch": 1.27, - "learning_rate": 1.2906818368406986e-06, - "loss": 0.731, - "step": 49621 - }, - { - "epoch": 1.27, - "learning_rate": 1.2906553610921247e-06, - "loss": 0.6406, - "step": 49622 - }, - { - "epoch": 1.27, - "learning_rate": 1.2906288851210093e-06, - "loss": 0.5339, - "step": 49623 - }, - { - "epoch": 1.27, - "learning_rate": 1.290602408927373e-06, - "loss": 0.627, - "step": 49624 - }, - { - "epoch": 1.27, - "learning_rate": 1.2905759325112355e-06, - "loss": 0.5972, - "step": 49625 - }, - { - "epoch": 1.27, - "learning_rate": 1.2905494558726175e-06, - "loss": 0.7227, - "step": 49626 - }, - { - "epoch": 1.27, - "learning_rate": 1.2905229790115391e-06, - "loss": 0.5972, - "step": 49627 - }, - { - "epoch": 1.27, - "learning_rate": 1.2904965019280206e-06, - "loss": 0.6406, - "step": 49628 - }, - { - "epoch": 1.27, - "learning_rate": 1.2904700246220822e-06, - "loss": 0.7041, - "step": 49629 - }, - { - "epoch": 1.27, - "learning_rate": 1.2904435470937448e-06, - "loss": 0.7244, - "step": 49630 - }, - { - "epoch": 1.27, - "learning_rate": 1.2904170693430273e-06, - "loss": 0.7129, - "step": 49631 - }, - { - "epoch": 1.27, - "learning_rate": 1.2903905913699514e-06, - "loss": 0.6021, - "step": 49632 - }, - { - "epoch": 1.27, - "learning_rate": 1.2903641131745363e-06, - "loss": 0.8164, - "step": 49633 - }, - { - "epoch": 1.27, - "learning_rate": 1.290337634756803e-06, - "loss": 0.667, - "step": 49634 - }, - { - "epoch": 1.27, - "learning_rate": 1.290311156116772e-06, - "loss": 0.5796, - "step": 49635 - }, - { - "epoch": 1.27, - "learning_rate": 1.2902846772544622e-06, - "loss": 0.7119, - "step": 49636 - }, - { - "epoch": 1.27, - "learning_rate": 1.2902581981698953e-06, - "loss": 0.751, - "step": 49637 - }, - { - "epoch": 1.27, - "learning_rate": 1.2902317188630912e-06, - "loss": 0.5562, - "step": 49638 - }, - { - "epoch": 1.27, - "learning_rate": 1.2902052393340696e-06, - "loss": 0.6816, - "step": 49639 - }, - { - "epoch": 1.27, - "learning_rate": 1.2901787595828513e-06, - "loss": 0.5078, - "step": 49640 - }, - { - "epoch": 1.27, - "learning_rate": 1.2901522796094567e-06, - "loss": 0.5015, - "step": 49641 - }, - { - "epoch": 1.27, - "learning_rate": 1.2901257994139054e-06, - "loss": 0.6914, - "step": 49642 - }, - { - "epoch": 1.27, - "learning_rate": 1.2900993189962183e-06, - "loss": 0.5132, - "step": 49643 - }, - { - "epoch": 1.27, - "learning_rate": 1.2900728383564159e-06, - "loss": 0.5107, - "step": 49644 - }, - { - "epoch": 1.27, - "learning_rate": 1.2900463574945178e-06, - "loss": 0.6279, - "step": 49645 - }, - { - "epoch": 1.27, - "learning_rate": 1.2900198764105444e-06, - "loss": 0.7222, - "step": 49646 - }, - { - "epoch": 1.27, - "learning_rate": 1.289993395104516e-06, - "loss": 0.8701, - "step": 49647 - }, - { - "epoch": 1.27, - "learning_rate": 1.2899669135764532e-06, - "loss": 0.5366, - "step": 49648 - }, - { - "epoch": 1.27, - "learning_rate": 1.2899404318263765e-06, - "loss": 0.6172, - "step": 49649 - }, - { - "epoch": 1.27, - "learning_rate": 1.289913949854305e-06, - "loss": 0.7568, - "step": 49650 - }, - { - "epoch": 1.27, - "learning_rate": 1.28988746766026e-06, - "loss": 0.71, - "step": 49651 - }, - { - "epoch": 1.27, - "learning_rate": 1.2898609852442614e-06, - "loss": 0.6763, - "step": 49652 - }, - { - "epoch": 1.27, - "learning_rate": 1.2898345026063298e-06, - "loss": 0.447, - "step": 49653 - }, - { - "epoch": 1.27, - "learning_rate": 1.2898080197464854e-06, - "loss": 0.4778, - "step": 49654 - }, - { - "epoch": 1.27, - "learning_rate": 1.289781536664748e-06, - "loss": 0.7646, - "step": 49655 - }, - { - "epoch": 1.27, - "learning_rate": 1.289755053361138e-06, - "loss": 0.6582, - "step": 49656 - }, - { - "epoch": 1.27, - "learning_rate": 1.2897285698356765e-06, - "loss": 0.478, - "step": 49657 - }, - { - "epoch": 1.27, - "learning_rate": 1.2897020860883824e-06, - "loss": 0.5825, - "step": 49658 - }, - { - "epoch": 1.27, - "learning_rate": 1.2896756021192774e-06, - "loss": 0.4797, - "step": 49659 - }, - { - "epoch": 1.27, - "learning_rate": 1.2896491179283808e-06, - "loss": 0.6191, - "step": 49660 - }, - { - "epoch": 1.27, - "learning_rate": 1.2896226335157132e-06, - "loss": 0.3131, - "step": 49661 - }, - { - "epoch": 1.27, - "learning_rate": 1.2895961488812947e-06, - "loss": 0.6387, - "step": 49662 - }, - { - "epoch": 1.27, - "learning_rate": 1.289569664025146e-06, - "loss": 0.6787, - "step": 49663 - }, - { - "epoch": 1.27, - "learning_rate": 1.2895431789472872e-06, - "loss": 0.4617, - "step": 49664 - }, - { - "epoch": 1.27, - "learning_rate": 1.2895166936477384e-06, - "loss": 0.6035, - "step": 49665 - }, - { - "epoch": 1.27, - "learning_rate": 1.28949020812652e-06, - "loss": 0.7207, - "step": 49666 - }, - { - "epoch": 1.27, - "learning_rate": 1.289463722383652e-06, - "loss": 0.6028, - "step": 49667 - }, - { - "epoch": 1.27, - "learning_rate": 1.2894372364191552e-06, - "loss": 0.7812, - "step": 49668 - }, - { - "epoch": 1.27, - "learning_rate": 1.2894107502330496e-06, - "loss": 0.6807, - "step": 49669 - }, - { - "epoch": 1.27, - "learning_rate": 1.2893842638253555e-06, - "loss": 0.5029, - "step": 49670 - }, - { - "epoch": 1.27, - "learning_rate": 1.2893577771960931e-06, - "loss": 0.6938, - "step": 49671 - }, - { - "epoch": 1.27, - "learning_rate": 1.289331290345283e-06, - "loss": 0.3943, - "step": 49672 - }, - { - "epoch": 1.27, - "learning_rate": 1.2893048032729448e-06, - "loss": 0.6602, - "step": 49673 - }, - { - "epoch": 1.27, - "learning_rate": 1.2892783159790997e-06, - "loss": 0.6055, - "step": 49674 - }, - { - "epoch": 1.27, - "learning_rate": 1.289251828463767e-06, - "loss": 0.6738, - "step": 49675 - }, - { - "epoch": 1.27, - "learning_rate": 1.2892253407269678e-06, - "loss": 0.7314, - "step": 49676 - }, - { - "epoch": 1.27, - "learning_rate": 1.289198852768722e-06, - "loss": 0.4062, - "step": 49677 - }, - { - "epoch": 1.27, - "learning_rate": 1.2891723645890498e-06, - "loss": 0.6562, - "step": 49678 - }, - { - "epoch": 1.27, - "learning_rate": 1.289145876187972e-06, - "loss": 0.7383, - "step": 49679 - }, - { - "epoch": 1.27, - "learning_rate": 1.289119387565508e-06, - "loss": 0.7549, - "step": 49680 - }, - { - "epoch": 1.27, - "learning_rate": 1.2890928987216788e-06, - "loss": 0.6091, - "step": 49681 - }, - { - "epoch": 1.27, - "learning_rate": 1.2890664096565044e-06, - "loss": 0.6689, - "step": 49682 - }, - { - "epoch": 1.27, - "learning_rate": 1.289039920370005e-06, - "loss": 0.4302, - "step": 49683 - }, - { - "epoch": 1.27, - "learning_rate": 1.2890134308622015e-06, - "loss": 0.5381, - "step": 49684 - }, - { - "epoch": 1.27, - "learning_rate": 1.2889869411331134e-06, - "loss": 0.6157, - "step": 49685 - }, - { - "epoch": 1.27, - "learning_rate": 1.2889604511827612e-06, - "loss": 0.7178, - "step": 49686 - }, - { - "epoch": 1.27, - "learning_rate": 1.2889339610111653e-06, - "loss": 0.7969, - "step": 49687 - }, - { - "epoch": 1.27, - "learning_rate": 1.288907470618346e-06, - "loss": 0.7881, - "step": 49688 - }, - { - "epoch": 1.27, - "learning_rate": 1.2888809800043238e-06, - "loss": 0.5476, - "step": 49689 - }, - { - "epoch": 1.27, - "learning_rate": 1.2888544891691184e-06, - "loss": 0.6826, - "step": 49690 - }, - { - "epoch": 1.27, - "learning_rate": 1.2888279981127506e-06, - "loss": 0.708, - "step": 49691 - }, - { - "epoch": 1.27, - "learning_rate": 1.2888015068352404e-06, - "loss": 0.7373, - "step": 49692 - }, - { - "epoch": 1.27, - "learning_rate": 1.2887750153366079e-06, - "loss": 0.7646, - "step": 49693 - }, - { - "epoch": 1.27, - "learning_rate": 1.288748523616874e-06, - "loss": 0.6641, - "step": 49694 - }, - { - "epoch": 1.27, - "learning_rate": 1.2887220316760585e-06, - "loss": 0.7598, - "step": 49695 - }, - { - "epoch": 1.27, - "learning_rate": 1.2886955395141819e-06, - "loss": 0.6611, - "step": 49696 - }, - { - "epoch": 1.27, - "learning_rate": 1.2886690471312642e-06, - "loss": 0.6953, - "step": 49697 - }, - { - "epoch": 1.27, - "learning_rate": 1.2886425545273261e-06, - "loss": 0.5742, - "step": 49698 - }, - { - "epoch": 1.27, - "learning_rate": 1.2886160617023878e-06, - "loss": 0.7126, - "step": 49699 - }, - { - "epoch": 1.27, - "learning_rate": 1.2885895686564688e-06, - "loss": 0.7197, - "step": 49700 - }, - { - "epoch": 1.27, - "learning_rate": 1.288563075389591e-06, - "loss": 0.7607, - "step": 49701 - }, - { - "epoch": 1.27, - "learning_rate": 1.288536581901773e-06, - "loss": 0.7466, - "step": 49702 - }, - { - "epoch": 1.27, - "learning_rate": 1.288510088193036e-06, - "loss": 0.6616, - "step": 49703 - }, - { - "epoch": 1.27, - "learning_rate": 1.2884835942634e-06, - "loss": 0.6416, - "step": 49704 - }, - { - "epoch": 1.27, - "learning_rate": 1.2884571001128854e-06, - "loss": 0.5771, - "step": 49705 - }, - { - "epoch": 1.27, - "learning_rate": 1.2884306057415127e-06, - "loss": 0.7158, - "step": 49706 - }, - { - "epoch": 1.27, - "learning_rate": 1.2884041111493016e-06, - "loss": 0.7363, - "step": 49707 - }, - { - "epoch": 1.27, - "learning_rate": 1.2883776163362729e-06, - "loss": 0.8809, - "step": 49708 - }, - { - "epoch": 1.27, - "learning_rate": 1.2883511213024467e-06, - "loss": 0.6084, - "step": 49709 - }, - { - "epoch": 1.27, - "learning_rate": 1.2883246260478436e-06, - "loss": 0.5723, - "step": 49710 - }, - { - "epoch": 1.27, - "learning_rate": 1.2882981305724831e-06, - "loss": 0.793, - "step": 49711 - }, - { - "epoch": 1.27, - "learning_rate": 1.2882716348763863e-06, - "loss": 0.7373, - "step": 49712 - }, - { - "epoch": 1.27, - "learning_rate": 1.288245138959573e-06, - "loss": 0.6377, - "step": 49713 - }, - { - "epoch": 1.27, - "learning_rate": 1.2882186428220638e-06, - "loss": 0.5889, - "step": 49714 - }, - { - "epoch": 1.27, - "learning_rate": 1.2881921464638788e-06, - "loss": 0.7451, - "step": 49715 - }, - { - "epoch": 1.27, - "learning_rate": 1.2881656498850383e-06, - "loss": 0.6963, - "step": 49716 - }, - { - "epoch": 1.27, - "learning_rate": 1.2881391530855622e-06, - "loss": 0.6099, - "step": 49717 - }, - { - "epoch": 1.27, - "learning_rate": 1.2881126560654718e-06, - "loss": 0.7178, - "step": 49718 - }, - { - "epoch": 1.27, - "learning_rate": 1.2880861588247867e-06, - "loss": 0.6621, - "step": 49719 - }, - { - "epoch": 1.27, - "learning_rate": 1.2880596613635274e-06, - "loss": 0.6724, - "step": 49720 - }, - { - "epoch": 1.27, - "learning_rate": 1.2880331636817134e-06, - "loss": 0.5742, - "step": 49721 - }, - { - "epoch": 1.27, - "learning_rate": 1.2880066657793662e-06, - "loss": 0.6631, - "step": 49722 - }, - { - "epoch": 1.27, - "learning_rate": 1.2879801676565051e-06, - "loss": 0.7344, - "step": 49723 - }, - { - "epoch": 1.27, - "learning_rate": 1.2879536693131514e-06, - "loss": 0.6738, - "step": 49724 - }, - { - "epoch": 1.27, - "learning_rate": 1.2879271707493246e-06, - "loss": 0.593, - "step": 49725 - }, - { - "epoch": 1.27, - "learning_rate": 1.287900671965045e-06, - "loss": 0.7969, - "step": 49726 - }, - { - "epoch": 1.27, - "learning_rate": 1.2878741729603332e-06, - "loss": 0.792, - "step": 49727 - }, - { - "epoch": 1.27, - "learning_rate": 1.2878476737352096e-06, - "loss": 0.6572, - "step": 49728 - }, - { - "epoch": 1.27, - "learning_rate": 1.2878211742896943e-06, - "loss": 0.7041, - "step": 49729 - }, - { - "epoch": 1.27, - "learning_rate": 1.287794674623807e-06, - "loss": 0.6675, - "step": 49730 - }, - { - "epoch": 1.27, - "learning_rate": 1.2877681747375691e-06, - "loss": 0.7412, - "step": 49731 - }, - { - "epoch": 1.27, - "learning_rate": 1.2877416746309999e-06, - "loss": 0.5791, - "step": 49732 - }, - { - "epoch": 1.27, - "learning_rate": 1.2877151743041206e-06, - "loss": 0.5928, - "step": 49733 - }, - { - "epoch": 1.27, - "learning_rate": 1.2876886737569508e-06, - "loss": 0.7656, - "step": 49734 - }, - { - "epoch": 1.27, - "learning_rate": 1.2876621729895113e-06, - "loss": 0.7637, - "step": 49735 - }, - { - "epoch": 1.27, - "learning_rate": 1.2876356720018215e-06, - "loss": 0.6108, - "step": 49736 - }, - { - "epoch": 1.27, - "learning_rate": 1.2876091707939028e-06, - "loss": 0.8789, - "step": 49737 - }, - { - "epoch": 1.27, - "learning_rate": 1.2875826693657745e-06, - "loss": 0.707, - "step": 49738 - }, - { - "epoch": 1.27, - "learning_rate": 1.287556167717458e-06, - "loss": 0.4795, - "step": 49739 - }, - { - "epoch": 1.27, - "learning_rate": 1.2875296658489725e-06, - "loss": 0.7422, - "step": 49740 - }, - { - "epoch": 1.27, - "learning_rate": 1.2875031637603388e-06, - "loss": 0.6218, - "step": 49741 - }, - { - "epoch": 1.27, - "learning_rate": 1.2874766614515773e-06, - "loss": 0.5718, - "step": 49742 - }, - { - "epoch": 1.27, - "learning_rate": 1.287450158922708e-06, - "loss": 0.5576, - "step": 49743 - }, - { - "epoch": 1.27, - "learning_rate": 1.2874236561737514e-06, - "loss": 0.5449, - "step": 49744 - }, - { - "epoch": 1.27, - "learning_rate": 1.2873971532047278e-06, - "loss": 0.6826, - "step": 49745 - }, - { - "epoch": 1.28, - "learning_rate": 1.2873706500156574e-06, - "loss": 0.7773, - "step": 49746 - }, - { - "epoch": 1.28, - "learning_rate": 1.2873441466065605e-06, - "loss": 0.75, - "step": 49747 - }, - { - "epoch": 1.28, - "learning_rate": 1.2873176429774572e-06, - "loss": 0.6318, - "step": 49748 - }, - { - "epoch": 1.28, - "learning_rate": 1.2872911391283681e-06, - "loss": 0.7598, - "step": 49749 - }, - { - "epoch": 1.28, - "learning_rate": 1.2872646350593136e-06, - "loss": 0.5991, - "step": 49750 - }, - { - "epoch": 1.28, - "learning_rate": 1.2872381307703135e-06, - "loss": 0.4819, - "step": 49751 - }, - { - "epoch": 1.28, - "learning_rate": 1.2872116262613886e-06, - "loss": 0.5859, - "step": 49752 - }, - { - "epoch": 1.28, - "learning_rate": 1.2871851215325587e-06, - "loss": 0.7891, - "step": 49753 - }, - { - "epoch": 1.28, - "learning_rate": 1.2871586165838445e-06, - "loss": 0.666, - "step": 49754 - }, - { - "epoch": 1.28, - "learning_rate": 1.287132111415266e-06, - "loss": 0.6582, - "step": 49755 - }, - { - "epoch": 1.28, - "learning_rate": 1.2871056060268439e-06, - "loss": 0.6025, - "step": 49756 - }, - { - "epoch": 1.28, - "learning_rate": 1.287079100418598e-06, - "loss": 0.7744, - "step": 49757 - }, - { - "epoch": 1.28, - "learning_rate": 1.287052594590549e-06, - "loss": 0.5859, - "step": 49758 - }, - { - "epoch": 1.28, - "learning_rate": 1.2870260885427172e-06, - "loss": 0.6421, - "step": 49759 - }, - { - "epoch": 1.28, - "learning_rate": 1.2869995822751225e-06, - "loss": 0.8018, - "step": 49760 - }, - { - "epoch": 1.28, - "learning_rate": 1.2869730757877853e-06, - "loss": 0.6431, - "step": 49761 - }, - { - "epoch": 1.28, - "learning_rate": 1.2869465690807262e-06, - "loss": 0.75, - "step": 49762 - }, - { - "epoch": 1.28, - "learning_rate": 1.286920062153965e-06, - "loss": 0.7363, - "step": 49763 - }, - { - "epoch": 1.28, - "learning_rate": 1.286893555007523e-06, - "loss": 0.625, - "step": 49764 - }, - { - "epoch": 1.28, - "learning_rate": 1.2868670476414192e-06, - "loss": 0.6636, - "step": 49765 - }, - { - "epoch": 1.28, - "learning_rate": 1.2868405400556746e-06, - "loss": 0.7002, - "step": 49766 - }, - { - "epoch": 1.28, - "learning_rate": 1.2868140322503094e-06, - "loss": 0.5559, - "step": 49767 - }, - { - "epoch": 1.28, - "learning_rate": 1.286787524225344e-06, - "loss": 0.6738, - "step": 49768 - }, - { - "epoch": 1.28, - "learning_rate": 1.2867610159807986e-06, - "loss": 0.6934, - "step": 49769 - }, - { - "epoch": 1.28, - "learning_rate": 1.286734507516693e-06, - "loss": 0.54, - "step": 49770 - }, - { - "epoch": 1.28, - "learning_rate": 1.2867079988330485e-06, - "loss": 0.6631, - "step": 49771 - }, - { - "epoch": 1.28, - "learning_rate": 1.2866814899298848e-06, - "loss": 0.6289, - "step": 49772 - }, - { - "epoch": 1.28, - "learning_rate": 1.286654980807222e-06, - "loss": 0.5378, - "step": 49773 - }, - { - "epoch": 1.28, - "learning_rate": 1.2866284714650807e-06, - "loss": 0.5537, - "step": 49774 - }, - { - "epoch": 1.28, - "learning_rate": 1.2866019619034817e-06, - "loss": 0.8145, - "step": 49775 - }, - { - "epoch": 1.28, - "learning_rate": 1.286575452122444e-06, - "loss": 0.6689, - "step": 49776 - }, - { - "epoch": 1.28, - "learning_rate": 1.286548942121989e-06, - "loss": 0.6719, - "step": 49777 - }, - { - "epoch": 1.28, - "learning_rate": 1.2865224319021365e-06, - "loss": 0.4871, - "step": 49778 - }, - { - "epoch": 1.28, - "learning_rate": 1.2864959214629073e-06, - "loss": 0.6719, - "step": 49779 - }, - { - "epoch": 1.28, - "learning_rate": 1.286469410804321e-06, - "loss": 0.6685, - "step": 49780 - }, - { - "epoch": 1.28, - "learning_rate": 1.2864428999263988e-06, - "loss": 0.6738, - "step": 49781 - }, - { - "epoch": 1.28, - "learning_rate": 1.2864163888291597e-06, - "loss": 0.5723, - "step": 49782 - }, - { - "epoch": 1.28, - "learning_rate": 1.286389877512625e-06, - "loss": 0.5361, - "step": 49783 - }, - { - "epoch": 1.28, - "learning_rate": 1.2863633659768152e-06, - "loss": 0.4668, - "step": 49784 - }, - { - "epoch": 1.28, - "learning_rate": 1.2863368542217496e-06, - "loss": 0.5688, - "step": 49785 - }, - { - "epoch": 1.28, - "learning_rate": 1.2863103422474491e-06, - "loss": 0.8076, - "step": 49786 - }, - { - "epoch": 1.28, - "learning_rate": 1.286283830053934e-06, - "loss": 0.6357, - "step": 49787 - }, - { - "epoch": 1.28, - "learning_rate": 1.2862573176412248e-06, - "loss": 0.6621, - "step": 49788 - }, - { - "epoch": 1.28, - "learning_rate": 1.2862308050093414e-06, - "loss": 0.6963, - "step": 49789 - }, - { - "epoch": 1.28, - "learning_rate": 1.2862042921583039e-06, - "loss": 0.4126, - "step": 49790 - }, - { - "epoch": 1.28, - "learning_rate": 1.2861777790881332e-06, - "loss": 0.6396, - "step": 49791 - }, - { - "epoch": 1.28, - "learning_rate": 1.286151265798849e-06, - "loss": 0.5747, - "step": 49792 - }, - { - "epoch": 1.28, - "learning_rate": 1.2861247522904724e-06, - "loss": 0.4932, - "step": 49793 - }, - { - "epoch": 1.28, - "learning_rate": 1.286098238563023e-06, - "loss": 0.752, - "step": 49794 - }, - { - "epoch": 1.28, - "learning_rate": 1.2860717246165214e-06, - "loss": 0.7275, - "step": 49795 - }, - { - "epoch": 1.28, - "learning_rate": 1.2860452104509878e-06, - "loss": 0.6875, - "step": 49796 - }, - { - "epoch": 1.28, - "learning_rate": 1.2860186960664424e-06, - "loss": 0.6084, - "step": 49797 - }, - { - "epoch": 1.28, - "learning_rate": 1.2859921814629062e-06, - "loss": 0.6357, - "step": 49798 - }, - { - "epoch": 1.28, - "learning_rate": 1.2859656666403984e-06, - "loss": 0.6064, - "step": 49799 - }, - { - "epoch": 1.28, - "learning_rate": 1.28593915159894e-06, - "loss": 0.5889, - "step": 49800 - }, - { - "epoch": 1.28, - "learning_rate": 1.285912636338551e-06, - "loss": 0.7715, - "step": 49801 - }, - { - "epoch": 1.28, - "learning_rate": 1.285886120859252e-06, - "loss": 0.5679, - "step": 49802 - }, - { - "epoch": 1.28, - "learning_rate": 1.2858596051610633e-06, - "loss": 0.7705, - "step": 49803 - }, - { - "epoch": 1.28, - "learning_rate": 1.2858330892440049e-06, - "loss": 0.6284, - "step": 49804 - }, - { - "epoch": 1.28, - "learning_rate": 1.285806573108097e-06, - "loss": 0.8154, - "step": 49805 - }, - { - "epoch": 1.28, - "learning_rate": 1.2857800567533603e-06, - "loss": 0.5837, - "step": 49806 - }, - { - "epoch": 1.28, - "learning_rate": 1.2857535401798148e-06, - "loss": 0.6807, - "step": 49807 - }, - { - "epoch": 1.28, - "learning_rate": 1.2857270233874815e-06, - "loss": 0.4802, - "step": 49808 - }, - { - "epoch": 1.28, - "learning_rate": 1.2857005063763797e-06, - "loss": 0.6543, - "step": 49809 - }, - { - "epoch": 1.28, - "learning_rate": 1.2856739891465302e-06, - "loss": 0.7222, - "step": 49810 - }, - { - "epoch": 1.28, - "learning_rate": 1.2856474716979532e-06, - "loss": 0.6914, - "step": 49811 - }, - { - "epoch": 1.28, - "learning_rate": 1.2856209540306694e-06, - "loss": 0.7461, - "step": 49812 - }, - { - "epoch": 1.28, - "learning_rate": 1.2855944361446984e-06, - "loss": 0.6636, - "step": 49813 - }, - { - "epoch": 1.28, - "learning_rate": 1.285567918040061e-06, - "loss": 0.6221, - "step": 49814 - }, - { - "epoch": 1.28, - "learning_rate": 1.2855413997167774e-06, - "loss": 0.4624, - "step": 49815 - }, - { - "epoch": 1.28, - "learning_rate": 1.2855148811748677e-06, - "loss": 0.5581, - "step": 49816 - }, - { - "epoch": 1.28, - "learning_rate": 1.2854883624143526e-06, - "loss": 0.6094, - "step": 49817 - }, - { - "epoch": 1.28, - "learning_rate": 1.2854618434352525e-06, - "loss": 0.7402, - "step": 49818 - }, - { - "epoch": 1.28, - "learning_rate": 1.285435324237587e-06, - "loss": 0.6216, - "step": 49819 - }, - { - "epoch": 1.28, - "learning_rate": 1.2854088048213767e-06, - "loss": 0.6816, - "step": 49820 - }, - { - "epoch": 1.28, - "learning_rate": 1.285382285186642e-06, - "loss": 0.5857, - "step": 49821 - }, - { - "epoch": 1.28, - "learning_rate": 1.2853557653334033e-06, - "loss": 0.6709, - "step": 49822 - }, - { - "epoch": 1.28, - "learning_rate": 1.285329245261681e-06, - "loss": 0.6147, - "step": 49823 - }, - { - "epoch": 1.28, - "learning_rate": 1.2853027249714953e-06, - "loss": 0.4081, - "step": 49824 - }, - { - "epoch": 1.28, - "learning_rate": 1.2852762044628663e-06, - "loss": 0.5205, - "step": 49825 - }, - { - "epoch": 1.28, - "learning_rate": 1.285249683735814e-06, - "loss": 0.7876, - "step": 49826 - }, - { - "epoch": 1.28, - "learning_rate": 1.2852231627903596e-06, - "loss": 0.7324, - "step": 49827 - }, - { - "epoch": 1.28, - "learning_rate": 1.2851966416265227e-06, - "loss": 0.4612, - "step": 49828 - }, - { - "epoch": 1.28, - "learning_rate": 1.2851701202443241e-06, - "loss": 0.3921, - "step": 49829 - }, - { - "epoch": 1.28, - "learning_rate": 1.2851435986437835e-06, - "loss": 0.7734, - "step": 49830 - }, - { - "epoch": 1.28, - "learning_rate": 1.2851170768249219e-06, - "loss": 0.5693, - "step": 49831 - }, - { - "epoch": 1.28, - "learning_rate": 1.2850905547877589e-06, - "loss": 0.6699, - "step": 49832 - }, - { - "epoch": 1.28, - "learning_rate": 1.2850640325323155e-06, - "loss": 0.394, - "step": 49833 - }, - { - "epoch": 1.28, - "learning_rate": 1.2850375100586118e-06, - "loss": 0.5972, - "step": 49834 - }, - { - "epoch": 1.28, - "learning_rate": 1.2850109873666678e-06, - "loss": 0.5542, - "step": 49835 - }, - { - "epoch": 1.28, - "learning_rate": 1.2849844644565035e-06, - "loss": 0.6157, - "step": 49836 - }, - { - "epoch": 1.28, - "learning_rate": 1.2849579413281403e-06, - "loss": 0.6855, - "step": 49837 - }, - { - "epoch": 1.28, - "learning_rate": 1.284931417981598e-06, - "loss": 0.6787, - "step": 49838 - }, - { - "epoch": 1.28, - "learning_rate": 1.2849048944168962e-06, - "loss": 0.6121, - "step": 49839 - }, - { - "epoch": 1.28, - "learning_rate": 1.2848783706340563e-06, - "loss": 0.5029, - "step": 49840 - }, - { - "epoch": 1.28, - "learning_rate": 1.284851846633098e-06, - "loss": 0.6777, - "step": 49841 - }, - { - "epoch": 1.28, - "learning_rate": 1.2848253224140417e-06, - "loss": 0.5457, - "step": 49842 - }, - { - "epoch": 1.28, - "learning_rate": 1.284798797976908e-06, - "loss": 0.6792, - "step": 49843 - }, - { - "epoch": 1.28, - "learning_rate": 1.2847722733217167e-06, - "loss": 0.6387, - "step": 49844 - }, - { - "epoch": 1.28, - "learning_rate": 1.2847457484484882e-06, - "loss": 0.7607, - "step": 49845 - }, - { - "epoch": 1.28, - "learning_rate": 1.2847192233572433e-06, - "loss": 0.666, - "step": 49846 - }, - { - "epoch": 1.28, - "learning_rate": 1.2846926980480017e-06, - "loss": 0.6318, - "step": 49847 - }, - { - "epoch": 1.28, - "learning_rate": 1.2846661725207845e-06, - "loss": 0.7119, - "step": 49848 - }, - { - "epoch": 1.28, - "learning_rate": 1.2846396467756111e-06, - "loss": 0.5203, - "step": 49849 - }, - { - "epoch": 1.28, - "learning_rate": 1.2846131208125025e-06, - "loss": 0.5244, - "step": 49850 - }, - { - "epoch": 1.28, - "learning_rate": 1.2845865946314783e-06, - "loss": 0.5896, - "step": 49851 - }, - { - "epoch": 1.28, - "learning_rate": 1.2845600682325594e-06, - "loss": 0.6904, - "step": 49852 - }, - { - "epoch": 1.28, - "learning_rate": 1.284533541615766e-06, - "loss": 0.5938, - "step": 49853 - }, - { - "epoch": 1.28, - "learning_rate": 1.2845070147811185e-06, - "loss": 0.6582, - "step": 49854 - }, - { - "epoch": 1.28, - "learning_rate": 1.2844804877286368e-06, - "loss": 0.5713, - "step": 49855 - }, - { - "epoch": 1.28, - "learning_rate": 1.2844539604583416e-06, - "loss": 0.5635, - "step": 49856 - }, - { - "epoch": 1.28, - "learning_rate": 1.2844274329702529e-06, - "loss": 0.7539, - "step": 49857 - }, - { - "epoch": 1.28, - "learning_rate": 1.2844009052643913e-06, - "loss": 0.7617, - "step": 49858 - }, - { - "epoch": 1.28, - "learning_rate": 1.284374377340777e-06, - "loss": 0.5737, - "step": 49859 - }, - { - "epoch": 1.28, - "learning_rate": 1.2843478491994305e-06, - "loss": 0.6855, - "step": 49860 - }, - { - "epoch": 1.28, - "learning_rate": 1.2843213208403716e-06, - "loss": 0.6768, - "step": 49861 - }, - { - "epoch": 1.28, - "learning_rate": 1.2842947922636213e-06, - "loss": 0.8887, - "step": 49862 - }, - { - "epoch": 1.28, - "learning_rate": 1.2842682634691992e-06, - "loss": 0.5845, - "step": 49863 - }, - { - "epoch": 1.28, - "learning_rate": 1.2842417344571262e-06, - "loss": 0.5557, - "step": 49864 - }, - { - "epoch": 1.28, - "learning_rate": 1.2842152052274221e-06, - "loss": 0.7861, - "step": 49865 - }, - { - "epoch": 1.28, - "learning_rate": 1.2841886757801076e-06, - "loss": 0.4514, - "step": 49866 - }, - { - "epoch": 1.28, - "learning_rate": 1.2841621461152033e-06, - "loss": 0.4895, - "step": 49867 - }, - { - "epoch": 1.28, - "learning_rate": 1.2841356162327288e-06, - "loss": 0.7759, - "step": 49868 - }, - { - "epoch": 1.28, - "learning_rate": 1.284109086132705e-06, - "loss": 0.627, - "step": 49869 - }, - { - "epoch": 1.28, - "learning_rate": 1.2840825558151513e-06, - "loss": 0.7148, - "step": 49870 - }, - { - "epoch": 1.28, - "learning_rate": 1.2840560252800892e-06, - "loss": 0.7725, - "step": 49871 - }, - { - "epoch": 1.28, - "learning_rate": 1.284029494527538e-06, - "loss": 0.5452, - "step": 49872 - }, - { - "epoch": 1.28, - "learning_rate": 1.2840029635575192e-06, - "loss": 0.8066, - "step": 49873 - }, - { - "epoch": 1.28, - "learning_rate": 1.2839764323700517e-06, - "loss": 0.7764, - "step": 49874 - }, - { - "epoch": 1.28, - "learning_rate": 1.2839499009651566e-06, - "loss": 0.6753, - "step": 49875 - }, - { - "epoch": 1.28, - "learning_rate": 1.2839233693428542e-06, - "loss": 0.5427, - "step": 49876 - }, - { - "epoch": 1.28, - "learning_rate": 1.2838968375031649e-06, - "loss": 0.7754, - "step": 49877 - }, - { - "epoch": 1.28, - "learning_rate": 1.2838703054461086e-06, - "loss": 0.5815, - "step": 49878 - }, - { - "epoch": 1.28, - "learning_rate": 1.2838437731717062e-06, - "loss": 0.5015, - "step": 49879 - }, - { - "epoch": 1.28, - "learning_rate": 1.2838172406799773e-06, - "loss": 0.47, - "step": 49880 - }, - { - "epoch": 1.28, - "learning_rate": 1.2837907079709428e-06, - "loss": 0.4756, - "step": 49881 - }, - { - "epoch": 1.28, - "learning_rate": 1.2837641750446226e-06, - "loss": 0.6943, - "step": 49882 - }, - { - "epoch": 1.28, - "learning_rate": 1.2837376419010376e-06, - "loss": 0.5991, - "step": 49883 - }, - { - "epoch": 1.28, - "learning_rate": 1.2837111085402075e-06, - "loss": 0.6172, - "step": 49884 - }, - { - "epoch": 1.28, - "learning_rate": 1.2836845749621528e-06, - "loss": 0.8359, - "step": 49885 - }, - { - "epoch": 1.28, - "learning_rate": 1.283658041166894e-06, - "loss": 0.5288, - "step": 49886 - }, - { - "epoch": 1.28, - "learning_rate": 1.283631507154451e-06, - "loss": 0.6914, - "step": 49887 - }, - { - "epoch": 1.28, - "learning_rate": 1.283604972924845e-06, - "loss": 0.6387, - "step": 49888 - }, - { - "epoch": 1.28, - "learning_rate": 1.283578438478095e-06, - "loss": 0.5308, - "step": 49889 - }, - { - "epoch": 1.28, - "learning_rate": 1.2835519038142225e-06, - "loss": 0.6431, - "step": 49890 - }, - { - "epoch": 1.28, - "learning_rate": 1.2835253689332471e-06, - "loss": 0.6768, - "step": 49891 - }, - { - "epoch": 1.28, - "learning_rate": 1.2834988338351895e-06, - "loss": 0.6968, - "step": 49892 - }, - { - "epoch": 1.28, - "learning_rate": 1.28347229852007e-06, - "loss": 0.6943, - "step": 49893 - }, - { - "epoch": 1.28, - "learning_rate": 1.2834457629879086e-06, - "loss": 0.7607, - "step": 49894 - }, - { - "epoch": 1.28, - "learning_rate": 1.2834192272387257e-06, - "loss": 0.7256, - "step": 49895 - }, - { - "epoch": 1.28, - "learning_rate": 1.2833926912725419e-06, - "loss": 0.5615, - "step": 49896 - }, - { - "epoch": 1.28, - "learning_rate": 1.283366155089377e-06, - "loss": 0.6772, - "step": 49897 - }, - { - "epoch": 1.28, - "learning_rate": 1.2833396186892525e-06, - "loss": 0.6592, - "step": 49898 - }, - { - "epoch": 1.28, - "learning_rate": 1.2833130820721872e-06, - "loss": 0.5435, - "step": 49899 - }, - { - "epoch": 1.28, - "learning_rate": 1.2832865452382022e-06, - "loss": 0.7461, - "step": 49900 - }, - { - "epoch": 1.28, - "learning_rate": 1.2832600081873178e-06, - "loss": 0.6357, - "step": 49901 - }, - { - "epoch": 1.28, - "learning_rate": 1.2832334709195541e-06, - "loss": 0.7031, - "step": 49902 - }, - { - "epoch": 1.28, - "learning_rate": 1.2832069334349318e-06, - "loss": 0.7686, - "step": 49903 - }, - { - "epoch": 1.28, - "learning_rate": 1.2831803957334706e-06, - "loss": 0.5229, - "step": 49904 - }, - { - "epoch": 1.28, - "learning_rate": 1.2831538578151918e-06, - "loss": 0.6611, - "step": 49905 - }, - { - "epoch": 1.28, - "learning_rate": 1.2831273196801145e-06, - "loss": 0.5488, - "step": 49906 - }, - { - "epoch": 1.28, - "learning_rate": 1.28310078132826e-06, - "loss": 0.6577, - "step": 49907 - }, - { - "epoch": 1.28, - "learning_rate": 1.283074242759648e-06, - "loss": 0.5508, - "step": 49908 - }, - { - "epoch": 1.28, - "learning_rate": 1.2830477039742992e-06, - "loss": 0.8721, - "step": 49909 - }, - { - "epoch": 1.28, - "learning_rate": 1.2830211649722337e-06, - "loss": 0.6919, - "step": 49910 - }, - { - "epoch": 1.28, - "learning_rate": 1.2829946257534721e-06, - "loss": 0.8428, - "step": 49911 - }, - { - "epoch": 1.28, - "learning_rate": 1.2829680863180343e-06, - "loss": 0.5513, - "step": 49912 - }, - { - "epoch": 1.28, - "learning_rate": 1.2829415466659413e-06, - "loss": 0.6396, - "step": 49913 - }, - { - "epoch": 1.28, - "learning_rate": 1.2829150067972124e-06, - "loss": 0.5923, - "step": 49914 - }, - { - "epoch": 1.28, - "learning_rate": 1.2828884667118688e-06, - "loss": 0.6934, - "step": 49915 - }, - { - "epoch": 1.28, - "learning_rate": 1.2828619264099303e-06, - "loss": 0.5366, - "step": 49916 - }, - { - "epoch": 1.28, - "learning_rate": 1.2828353858914176e-06, - "loss": 0.455, - "step": 49917 - }, - { - "epoch": 1.28, - "learning_rate": 1.2828088451563509e-06, - "loss": 0.623, - "step": 49918 - }, - { - "epoch": 1.28, - "learning_rate": 1.2827823042047503e-06, - "loss": 0.71, - "step": 49919 - }, - { - "epoch": 1.28, - "learning_rate": 1.2827557630366363e-06, - "loss": 0.7852, - "step": 49920 - }, - { - "epoch": 1.28, - "learning_rate": 1.2827292216520293e-06, - "loss": 0.6753, - "step": 49921 - }, - { - "epoch": 1.28, - "learning_rate": 1.2827026800509495e-06, - "loss": 0.7461, - "step": 49922 - }, - { - "epoch": 1.28, - "learning_rate": 1.2826761382334171e-06, - "loss": 0.6675, - "step": 49923 - }, - { - "epoch": 1.28, - "learning_rate": 1.282649596199453e-06, - "loss": 0.748, - "step": 49924 - }, - { - "epoch": 1.28, - "learning_rate": 1.282623053949077e-06, - "loss": 0.5815, - "step": 49925 - }, - { - "epoch": 1.28, - "learning_rate": 1.2825965114823092e-06, - "loss": 0.708, - "step": 49926 - }, - { - "epoch": 1.28, - "learning_rate": 1.2825699687991704e-06, - "loss": 0.5786, - "step": 49927 - }, - { - "epoch": 1.28, - "learning_rate": 1.282543425899681e-06, - "loss": 0.4429, - "step": 49928 - }, - { - "epoch": 1.28, - "learning_rate": 1.2825168827838609e-06, - "loss": 0.7998, - "step": 49929 - }, - { - "epoch": 1.28, - "learning_rate": 1.2824903394517303e-06, - "loss": 0.8447, - "step": 49930 - }, - { - "epoch": 1.28, - "learning_rate": 1.2824637959033103e-06, - "loss": 0.5669, - "step": 49931 - }, - { - "epoch": 1.28, - "learning_rate": 1.2824372521386204e-06, - "loss": 0.5723, - "step": 49932 - }, - { - "epoch": 1.28, - "learning_rate": 1.2824107081576816e-06, - "loss": 0.8623, - "step": 49933 - }, - { - "epoch": 1.28, - "learning_rate": 1.282384163960514e-06, - "loss": 0.7285, - "step": 49934 - }, - { - "epoch": 1.28, - "learning_rate": 1.2823576195471372e-06, - "loss": 0.4231, - "step": 49935 - }, - { - "epoch": 1.28, - "learning_rate": 1.2823310749175728e-06, - "loss": 0.6484, - "step": 49936 - }, - { - "epoch": 1.28, - "learning_rate": 1.28230453007184e-06, - "loss": 0.5164, - "step": 49937 - }, - { - "epoch": 1.28, - "learning_rate": 1.2822779850099603e-06, - "loss": 0.6992, - "step": 49938 - }, - { - "epoch": 1.28, - "learning_rate": 1.2822514397319526e-06, - "loss": 0.7793, - "step": 49939 - }, - { - "epoch": 1.28, - "learning_rate": 1.2822248942378385e-06, - "loss": 0.4881, - "step": 49940 - }, - { - "epoch": 1.28, - "learning_rate": 1.282198348527637e-06, - "loss": 0.5269, - "step": 49941 - }, - { - "epoch": 1.28, - "learning_rate": 1.2821718026013699e-06, - "loss": 0.6719, - "step": 49942 - }, - { - "epoch": 1.28, - "learning_rate": 1.2821452564590567e-06, - "loss": 0.6318, - "step": 49943 - }, - { - "epoch": 1.28, - "learning_rate": 1.2821187101007178e-06, - "loss": 0.7061, - "step": 49944 - }, - { - "epoch": 1.28, - "learning_rate": 1.2820921635263734e-06, - "loss": 0.6992, - "step": 49945 - }, - { - "epoch": 1.28, - "learning_rate": 1.2820656167360445e-06, - "loss": 0.6565, - "step": 49946 - }, - { - "epoch": 1.28, - "learning_rate": 1.2820390697297504e-06, - "loss": 0.6592, - "step": 49947 - }, - { - "epoch": 1.28, - "learning_rate": 1.282012522507512e-06, - "loss": 0.6597, - "step": 49948 - }, - { - "epoch": 1.28, - "learning_rate": 1.2819859750693498e-06, - "loss": 0.6982, - "step": 49949 - }, - { - "epoch": 1.28, - "learning_rate": 1.2819594274152836e-06, - "loss": 0.645, - "step": 49950 - }, - { - "epoch": 1.28, - "learning_rate": 1.2819328795453345e-06, - "loss": 0.7402, - "step": 49951 - }, - { - "epoch": 1.28, - "learning_rate": 1.2819063314595223e-06, - "loss": 0.8701, - "step": 49952 - }, - { - "epoch": 1.28, - "learning_rate": 1.2818797831578672e-06, - "loss": 0.6465, - "step": 49953 - }, - { - "epoch": 1.28, - "learning_rate": 1.2818532346403895e-06, - "loss": 0.5757, - "step": 49954 - }, - { - "epoch": 1.28, - "learning_rate": 1.28182668590711e-06, - "loss": 0.6147, - "step": 49955 - }, - { - "epoch": 1.28, - "learning_rate": 1.2818001369580485e-06, - "loss": 0.8213, - "step": 49956 - }, - { - "epoch": 1.28, - "learning_rate": 1.2817735877932258e-06, - "loss": 0.8105, - "step": 49957 - }, - { - "epoch": 1.28, - "learning_rate": 1.281747038412662e-06, - "loss": 0.605, - "step": 49958 - }, - { - "epoch": 1.28, - "learning_rate": 1.2817204888163777e-06, - "loss": 0.6611, - "step": 49959 - }, - { - "epoch": 1.28, - "learning_rate": 1.2816939390043926e-06, - "loss": 0.7173, - "step": 49960 - }, - { - "epoch": 1.28, - "learning_rate": 1.2816673889767275e-06, - "loss": 0.8154, - "step": 49961 - }, - { - "epoch": 1.28, - "learning_rate": 1.2816408387334025e-06, - "loss": 0.7832, - "step": 49962 - }, - { - "epoch": 1.28, - "learning_rate": 1.2816142882744388e-06, - "loss": 0.5881, - "step": 49963 - }, - { - "epoch": 1.28, - "learning_rate": 1.2815877375998552e-06, - "loss": 0.7051, - "step": 49964 - }, - { - "epoch": 1.28, - "learning_rate": 1.281561186709673e-06, - "loss": 0.8047, - "step": 49965 - }, - { - "epoch": 1.28, - "learning_rate": 1.2815346356039124e-06, - "loss": 0.6016, - "step": 49966 - }, - { - "epoch": 1.28, - "learning_rate": 1.2815080842825935e-06, - "loss": 0.7529, - "step": 49967 - }, - { - "epoch": 1.28, - "learning_rate": 1.2814815327457372e-06, - "loss": 0.7275, - "step": 49968 - }, - { - "epoch": 1.28, - "learning_rate": 1.2814549809933633e-06, - "loss": 0.4721, - "step": 49969 - }, - { - "epoch": 1.28, - "learning_rate": 1.281428429025492e-06, - "loss": 0.7812, - "step": 49970 - }, - { - "epoch": 1.28, - "learning_rate": 1.281401876842144e-06, - "loss": 0.6235, - "step": 49971 - }, - { - "epoch": 1.28, - "learning_rate": 1.2813753244433394e-06, - "loss": 0.8057, - "step": 49972 - }, - { - "epoch": 1.28, - "learning_rate": 1.281348771829099e-06, - "loss": 0.5473, - "step": 49973 - }, - { - "epoch": 1.28, - "learning_rate": 1.2813222189994426e-06, - "loss": 0.5754, - "step": 49974 - }, - { - "epoch": 1.28, - "learning_rate": 1.2812956659543905e-06, - "loss": 0.4833, - "step": 49975 - }, - { - "epoch": 1.28, - "learning_rate": 1.2812691126939636e-06, - "loss": 0.6782, - "step": 49976 - }, - { - "epoch": 1.28, - "learning_rate": 1.2812425592181817e-06, - "loss": 0.6738, - "step": 49977 - }, - { - "epoch": 1.28, - "learning_rate": 1.2812160055270655e-06, - "loss": 0.5659, - "step": 49978 - }, - { - "epoch": 1.28, - "learning_rate": 1.2811894516206349e-06, - "loss": 0.623, - "step": 49979 - }, - { - "epoch": 1.28, - "learning_rate": 1.2811628974989106e-06, - "loss": 0.8408, - "step": 49980 - }, - { - "epoch": 1.28, - "learning_rate": 1.2811363431619126e-06, - "loss": 0.8096, - "step": 49981 - }, - { - "epoch": 1.28, - "learning_rate": 1.2811097886096617e-06, - "loss": 0.8076, - "step": 49982 - }, - { - "epoch": 1.28, - "learning_rate": 1.2810832338421777e-06, - "loss": 0.6675, - "step": 49983 - }, - { - "epoch": 1.28, - "learning_rate": 1.2810566788594815e-06, - "loss": 0.543, - "step": 49984 - }, - { - "epoch": 1.28, - "learning_rate": 1.2810301236615929e-06, - "loss": 0.8611, - "step": 49985 - }, - { - "epoch": 1.28, - "learning_rate": 1.2810035682485325e-06, - "loss": 0.7012, - "step": 49986 - }, - { - "epoch": 1.28, - "learning_rate": 1.2809770126203205e-06, - "loss": 0.6611, - "step": 49987 - }, - { - "epoch": 1.28, - "learning_rate": 1.2809504567769778e-06, - "loss": 0.6826, - "step": 49988 - }, - { - "epoch": 1.28, - "learning_rate": 1.2809239007185236e-06, - "loss": 0.7729, - "step": 49989 - }, - { - "epoch": 1.28, - "learning_rate": 1.280897344444979e-06, - "loss": 0.7529, - "step": 49990 - }, - { - "epoch": 1.28, - "learning_rate": 1.2808707879563645e-06, - "loss": 0.6372, - "step": 49991 - }, - { - "epoch": 1.28, - "learning_rate": 1.2808442312527001e-06, - "loss": 0.5225, - "step": 49992 - }, - { - "epoch": 1.28, - "learning_rate": 1.2808176743340063e-06, - "loss": 0.7949, - "step": 49993 - }, - { - "epoch": 1.28, - "learning_rate": 1.2807911172003027e-06, - "loss": 0.7002, - "step": 49994 - }, - { - "epoch": 1.28, - "learning_rate": 1.280764559851611e-06, - "loss": 0.5776, - "step": 49995 - }, - { - "epoch": 1.28, - "learning_rate": 1.2807380022879502e-06, - "loss": 0.8691, - "step": 49996 - }, - { - "epoch": 1.28, - "learning_rate": 1.2807114445093413e-06, - "loss": 0.6455, - "step": 49997 - }, - { - "epoch": 1.28, - "learning_rate": 1.280684886515805e-06, - "loss": 0.6733, - "step": 49998 - }, - { - "epoch": 1.28, - "learning_rate": 1.280658328307361e-06, - "loss": 0.6438, - "step": 49999 - }, - { - "epoch": 1.28, - "learning_rate": 1.2806317698840297e-06, - "loss": 0.4318, - "step": 50000 - }, - { - "epoch": 1.28, - "learning_rate": 1.2806052112458316e-06, - "loss": 0.6055, - "step": 50001 - }, - { - "epoch": 1.28, - "learning_rate": 1.2805786523927869e-06, - "loss": 0.6123, - "step": 50002 - }, - { - "epoch": 1.28, - "learning_rate": 1.2805520933249164e-06, - "loss": 0.5898, - "step": 50003 - }, - { - "epoch": 1.28, - "learning_rate": 1.2805255340422396e-06, - "loss": 0.5688, - "step": 50004 - }, - { - "epoch": 1.28, - "learning_rate": 1.2804989745447777e-06, - "loss": 0.7178, - "step": 50005 - }, - { - "epoch": 1.28, - "learning_rate": 1.2804724148325503e-06, - "loss": 0.6289, - "step": 50006 - }, - { - "epoch": 1.28, - "learning_rate": 1.2804458549055781e-06, - "loss": 0.564, - "step": 50007 - }, - { - "epoch": 1.28, - "learning_rate": 1.2804192947638816e-06, - "loss": 0.5579, - "step": 50008 - }, - { - "epoch": 1.28, - "learning_rate": 1.280392734407481e-06, - "loss": 0.6895, - "step": 50009 - }, - { - "epoch": 1.28, - "learning_rate": 1.2803661738363962e-06, - "loss": 0.6567, - "step": 50010 - }, - { - "epoch": 1.28, - "learning_rate": 1.2803396130506484e-06, - "loss": 0.7397, - "step": 50011 - }, - { - "epoch": 1.28, - "learning_rate": 1.280313052050257e-06, - "loss": 0.6379, - "step": 50012 - }, - { - "epoch": 1.28, - "learning_rate": 1.2802864908352428e-06, - "loss": 0.7109, - "step": 50013 - }, - { - "epoch": 1.28, - "learning_rate": 1.2802599294056264e-06, - "loss": 0.7236, - "step": 50014 - }, - { - "epoch": 1.28, - "learning_rate": 1.2802333677614278e-06, - "loss": 0.4922, - "step": 50015 - }, - { - "epoch": 1.28, - "learning_rate": 1.2802068059026674e-06, - "loss": 0.7051, - "step": 50016 - }, - { - "epoch": 1.28, - "learning_rate": 1.2801802438293654e-06, - "loss": 0.7998, - "step": 50017 - }, - { - "epoch": 1.28, - "learning_rate": 1.2801536815415423e-06, - "loss": 0.6426, - "step": 50018 - }, - { - "epoch": 1.28, - "learning_rate": 1.2801271190392185e-06, - "loss": 0.5845, - "step": 50019 - }, - { - "epoch": 1.28, - "learning_rate": 1.2801005563224141e-06, - "loss": 0.7568, - "step": 50020 - }, - { - "epoch": 1.28, - "learning_rate": 1.2800739933911495e-06, - "loss": 0.6973, - "step": 50021 - }, - { - "epoch": 1.28, - "learning_rate": 1.2800474302454455e-06, - "loss": 0.7236, - "step": 50022 - }, - { - "epoch": 1.28, - "learning_rate": 1.280020866885322e-06, - "loss": 0.8506, - "step": 50023 - }, - { - "epoch": 1.28, - "learning_rate": 1.2799943033107993e-06, - "loss": 0.8008, - "step": 50024 - }, - { - "epoch": 1.28, - "learning_rate": 1.2799677395218974e-06, - "loss": 0.603, - "step": 50025 - }, - { - "epoch": 1.28, - "learning_rate": 1.2799411755186378e-06, - "loss": 0.6621, - "step": 50026 - }, - { - "epoch": 1.28, - "learning_rate": 1.2799146113010395e-06, - "loss": 0.6377, - "step": 50027 - }, - { - "epoch": 1.28, - "learning_rate": 1.279888046869124e-06, - "loss": 0.6543, - "step": 50028 - }, - { - "epoch": 1.28, - "learning_rate": 1.2798614822229108e-06, - "loss": 0.5801, - "step": 50029 - }, - { - "epoch": 1.28, - "learning_rate": 1.2798349173624206e-06, - "loss": 0.5425, - "step": 50030 - }, - { - "epoch": 1.28, - "learning_rate": 1.2798083522876734e-06, - "loss": 0.709, - "step": 50031 - }, - { - "epoch": 1.28, - "learning_rate": 1.2797817869986902e-06, - "loss": 0.4893, - "step": 50032 - }, - { - "epoch": 1.28, - "learning_rate": 1.2797552214954907e-06, - "loss": 0.6509, - "step": 50033 - }, - { - "epoch": 1.28, - "learning_rate": 1.2797286557780958e-06, - "loss": 0.7119, - "step": 50034 - }, - { - "epoch": 1.28, - "learning_rate": 1.2797020898465252e-06, - "loss": 0.583, - "step": 50035 - }, - { - "epoch": 1.28, - "learning_rate": 1.2796755237007997e-06, - "loss": 0.708, - "step": 50036 - }, - { - "epoch": 1.28, - "learning_rate": 1.2796489573409393e-06, - "loss": 0.6382, - "step": 50037 - }, - { - "epoch": 1.28, - "learning_rate": 1.2796223907669647e-06, - "loss": 0.6763, - "step": 50038 - }, - { - "epoch": 1.28, - "learning_rate": 1.2795958239788965e-06, - "loss": 0.5918, - "step": 50039 - }, - { - "epoch": 1.28, - "learning_rate": 1.279569256976754e-06, - "loss": 0.7559, - "step": 50040 - }, - { - "epoch": 1.28, - "learning_rate": 1.2795426897605587e-06, - "loss": 0.5422, - "step": 50041 - }, - { - "epoch": 1.28, - "learning_rate": 1.27951612233033e-06, - "loss": 0.6523, - "step": 50042 - }, - { - "epoch": 1.28, - "learning_rate": 1.2794895546860889e-06, - "loss": 0.6226, - "step": 50043 - }, - { - "epoch": 1.28, - "learning_rate": 1.2794629868278553e-06, - "loss": 0.7617, - "step": 50044 - }, - { - "epoch": 1.28, - "learning_rate": 1.27943641875565e-06, - "loss": 0.6875, - "step": 50045 - }, - { - "epoch": 1.28, - "learning_rate": 1.2794098504694927e-06, - "loss": 0.79, - "step": 50046 - }, - { - "epoch": 1.28, - "learning_rate": 1.2793832819694044e-06, - "loss": 0.7734, - "step": 50047 - }, - { - "epoch": 1.28, - "learning_rate": 1.2793567132554052e-06, - "loss": 0.7744, - "step": 50048 - }, - { - "epoch": 1.28, - "learning_rate": 1.2793301443275155e-06, - "loss": 0.4707, - "step": 50049 - }, - { - "epoch": 1.28, - "learning_rate": 1.2793035751857553e-06, - "loss": 0.7441, - "step": 50050 - }, - { - "epoch": 1.28, - "learning_rate": 1.2792770058301451e-06, - "loss": 0.7266, - "step": 50051 - }, - { - "epoch": 1.28, - "learning_rate": 1.2792504362607055e-06, - "loss": 0.7637, - "step": 50052 - }, - { - "epoch": 1.28, - "learning_rate": 1.2792238664774572e-06, - "loss": 0.4741, - "step": 50053 - }, - { - "epoch": 1.28, - "learning_rate": 1.2791972964804192e-06, - "loss": 0.792, - "step": 50054 - }, - { - "epoch": 1.28, - "learning_rate": 1.2791707262696132e-06, - "loss": 0.7295, - "step": 50055 - }, - { - "epoch": 1.28, - "learning_rate": 1.2791441558450587e-06, - "loss": 0.6138, - "step": 50056 - }, - { - "epoch": 1.28, - "learning_rate": 1.2791175852067765e-06, - "loss": 0.7197, - "step": 50057 - }, - { - "epoch": 1.28, - "learning_rate": 1.279091014354787e-06, - "loss": 0.5908, - "step": 50058 - }, - { - "epoch": 1.28, - "learning_rate": 1.2790644432891098e-06, - "loss": 0.6147, - "step": 50059 - }, - { - "epoch": 1.28, - "learning_rate": 1.2790378720097662e-06, - "loss": 0.7842, - "step": 50060 - }, - { - "epoch": 1.28, - "learning_rate": 1.279011300516776e-06, - "loss": 0.6582, - "step": 50061 - }, - { - "epoch": 1.28, - "learning_rate": 1.2789847288101595e-06, - "loss": 0.7891, - "step": 50062 - }, - { - "epoch": 1.28, - "learning_rate": 1.2789581568899377e-06, - "loss": 0.5898, - "step": 50063 - }, - { - "epoch": 1.28, - "learning_rate": 1.2789315847561302e-06, - "loss": 0.7461, - "step": 50064 - }, - { - "epoch": 1.28, - "learning_rate": 1.2789050124087575e-06, - "loss": 0.6641, - "step": 50065 - }, - { - "epoch": 1.28, - "learning_rate": 1.2788784398478404e-06, - "loss": 0.498, - "step": 50066 - }, - { - "epoch": 1.28, - "learning_rate": 1.2788518670733983e-06, - "loss": 0.7939, - "step": 50067 - }, - { - "epoch": 1.28, - "learning_rate": 1.2788252940854527e-06, - "loss": 0.7988, - "step": 50068 - }, - { - "epoch": 1.28, - "learning_rate": 1.2787987208840233e-06, - "loss": 0.4325, - "step": 50069 - }, - { - "epoch": 1.28, - "learning_rate": 1.2787721474691305e-06, - "loss": 0.7939, - "step": 50070 - }, - { - "epoch": 1.28, - "learning_rate": 1.2787455738407943e-06, - "loss": 0.8105, - "step": 50071 - }, - { - "epoch": 1.28, - "learning_rate": 1.278718999999036e-06, - "loss": 0.6348, - "step": 50072 - }, - { - "epoch": 1.28, - "learning_rate": 1.2786924259438752e-06, - "loss": 0.7617, - "step": 50073 - }, - { - "epoch": 1.28, - "learning_rate": 1.2786658516753324e-06, - "loss": 0.7773, - "step": 50074 - }, - { - "epoch": 1.28, - "learning_rate": 1.2786392771934278e-06, - "loss": 0.7295, - "step": 50075 - }, - { - "epoch": 1.28, - "learning_rate": 1.278612702498182e-06, - "loss": 0.8125, - "step": 50076 - }, - { - "epoch": 1.28, - "learning_rate": 1.2785861275896153e-06, - "loss": 0.6606, - "step": 50077 - }, - { - "epoch": 1.28, - "learning_rate": 1.2785595524677485e-06, - "loss": 0.8027, - "step": 50078 - }, - { - "epoch": 1.28, - "learning_rate": 1.2785329771326005e-06, - "loss": 0.7734, - "step": 50079 - }, - { - "epoch": 1.28, - "learning_rate": 1.2785064015841933e-06, - "loss": 0.7319, - "step": 50080 - }, - { - "epoch": 1.28, - "learning_rate": 1.2784798258225462e-06, - "loss": 0.6514, - "step": 50081 - }, - { - "epoch": 1.28, - "learning_rate": 1.2784532498476801e-06, - "loss": 0.4204, - "step": 50082 - }, - { - "epoch": 1.28, - "learning_rate": 1.2784266736596153e-06, - "loss": 0.752, - "step": 50083 - }, - { - "epoch": 1.28, - "learning_rate": 1.2784000972583715e-06, - "loss": 0.549, - "step": 50084 - }, - { - "epoch": 1.28, - "learning_rate": 1.27837352064397e-06, - "loss": 0.5698, - "step": 50085 - }, - { - "epoch": 1.28, - "learning_rate": 1.2783469438164303e-06, - "loss": 0.6758, - "step": 50086 - }, - { - "epoch": 1.28, - "learning_rate": 1.2783203667757736e-06, - "loss": 0.5828, - "step": 50087 - }, - { - "epoch": 1.28, - "learning_rate": 1.2782937895220193e-06, - "loss": 0.7695, - "step": 50088 - }, - { - "epoch": 1.28, - "learning_rate": 1.2782672120551888e-06, - "loss": 0.6943, - "step": 50089 - }, - { - "epoch": 1.28, - "learning_rate": 1.2782406343753014e-06, - "loss": 0.5405, - "step": 50090 - }, - { - "epoch": 1.28, - "learning_rate": 1.2782140564823783e-06, - "loss": 0.5186, - "step": 50091 - }, - { - "epoch": 1.28, - "learning_rate": 1.2781874783764394e-06, - "loss": 0.6074, - "step": 50092 - }, - { - "epoch": 1.28, - "learning_rate": 1.278160900057505e-06, - "loss": 0.4954, - "step": 50093 - }, - { - "epoch": 1.28, - "learning_rate": 1.2781343215255958e-06, - "loss": 0.7197, - "step": 50094 - }, - { - "epoch": 1.28, - "learning_rate": 1.2781077427807319e-06, - "loss": 0.6704, - "step": 50095 - }, - { - "epoch": 1.28, - "learning_rate": 1.2780811638229332e-06, - "loss": 0.6201, - "step": 50096 - }, - { - "epoch": 1.28, - "learning_rate": 1.2780545846522212e-06, - "loss": 0.6602, - "step": 50097 - }, - { - "epoch": 1.28, - "learning_rate": 1.2780280052686152e-06, - "loss": 0.6426, - "step": 50098 - }, - { - "epoch": 1.28, - "learning_rate": 1.2780014256721364e-06, - "loss": 0.7034, - "step": 50099 - }, - { - "epoch": 1.28, - "learning_rate": 1.277974845862804e-06, - "loss": 0.6387, - "step": 50100 - }, - { - "epoch": 1.28, - "learning_rate": 1.2779482658406395e-06, - "loss": 0.6216, - "step": 50101 - }, - { - "epoch": 1.28, - "learning_rate": 1.2779216856056627e-06, - "loss": 0.7217, - "step": 50102 - }, - { - "epoch": 1.28, - "learning_rate": 1.277895105157894e-06, - "loss": 0.6807, - "step": 50103 - }, - { - "epoch": 1.28, - "learning_rate": 1.2778685244973539e-06, - "loss": 0.7227, - "step": 50104 - }, - { - "epoch": 1.28, - "learning_rate": 1.2778419436240626e-06, - "loss": 0.6191, - "step": 50105 - }, - { - "epoch": 1.28, - "learning_rate": 1.2778153625380403e-06, - "loss": 0.7598, - "step": 50106 - }, - { - "epoch": 1.28, - "learning_rate": 1.277788781239308e-06, - "loss": 0.7578, - "step": 50107 - }, - { - "epoch": 1.28, - "learning_rate": 1.2777621997278853e-06, - "loss": 0.5713, - "step": 50108 - }, - { - "epoch": 1.28, - "learning_rate": 1.277735618003793e-06, - "loss": 0.5518, - "step": 50109 - }, - { - "epoch": 1.28, - "learning_rate": 1.2777090360670511e-06, - "loss": 0.7539, - "step": 50110 - }, - { - "epoch": 1.28, - "learning_rate": 1.27768245391768e-06, - "loss": 0.8125, - "step": 50111 - }, - { - "epoch": 1.28, - "learning_rate": 1.2776558715557006e-06, - "loss": 0.6304, - "step": 50112 - }, - { - "epoch": 1.28, - "learning_rate": 1.2776292889811329e-06, - "loss": 0.7949, - "step": 50113 - }, - { - "epoch": 1.28, - "learning_rate": 1.277602706193997e-06, - "loss": 0.7241, - "step": 50114 - }, - { - "epoch": 1.28, - "learning_rate": 1.2775761231943133e-06, - "loss": 0.5693, - "step": 50115 - }, - { - "epoch": 1.28, - "learning_rate": 1.2775495399821026e-06, - "loss": 0.5967, - "step": 50116 - }, - { - "epoch": 1.28, - "learning_rate": 1.277522956557385e-06, - "loss": 0.7822, - "step": 50117 - }, - { - "epoch": 1.28, - "learning_rate": 1.2774963729201808e-06, - "loss": 0.5371, - "step": 50118 - }, - { - "epoch": 1.28, - "learning_rate": 1.2774697890705105e-06, - "loss": 0.7236, - "step": 50119 - }, - { - "epoch": 1.28, - "learning_rate": 1.277443205008394e-06, - "loss": 0.561, - "step": 50120 - }, - { - "epoch": 1.28, - "learning_rate": 1.2774166207338522e-06, - "loss": 0.6504, - "step": 50121 - }, - { - "epoch": 1.28, - "learning_rate": 1.2773900362469053e-06, - "loss": 0.6826, - "step": 50122 - }, - { - "epoch": 1.28, - "learning_rate": 1.2773634515475735e-06, - "loss": 0.5867, - "step": 50123 - }, - { - "epoch": 1.28, - "learning_rate": 1.2773368666358775e-06, - "loss": 0.6113, - "step": 50124 - }, - { - "epoch": 1.28, - "learning_rate": 1.277310281511837e-06, - "loss": 0.7539, - "step": 50125 - }, - { - "epoch": 1.28, - "learning_rate": 1.277283696175473e-06, - "loss": 0.6289, - "step": 50126 - }, - { - "epoch": 1.28, - "learning_rate": 1.2772571106268057e-06, - "loss": 0.5815, - "step": 50127 - }, - { - "epoch": 1.28, - "learning_rate": 1.2772305248658553e-06, - "loss": 0.6099, - "step": 50128 - }, - { - "epoch": 1.28, - "learning_rate": 1.2772039388926422e-06, - "loss": 0.5891, - "step": 50129 - }, - { - "epoch": 1.28, - "learning_rate": 1.2771773527071866e-06, - "loss": 0.7188, - "step": 50130 - }, - { - "epoch": 1.28, - "learning_rate": 1.2771507663095094e-06, - "loss": 0.6128, - "step": 50131 - }, - { - "epoch": 1.28, - "learning_rate": 1.2771241796996303e-06, - "loss": 0.6304, - "step": 50132 - }, - { - "epoch": 1.28, - "learning_rate": 1.2770975928775704e-06, - "loss": 0.6904, - "step": 50133 - }, - { - "epoch": 1.28, - "learning_rate": 1.2770710058433492e-06, - "loss": 0.7842, - "step": 50134 - }, - { - "epoch": 1.28, - "learning_rate": 1.2770444185969878e-06, - "loss": 0.7861, - "step": 50135 - }, - { - "epoch": 1.29, - "learning_rate": 1.2770178311385058e-06, - "loss": 0.7988, - "step": 50136 - }, - { - "epoch": 1.29, - "learning_rate": 1.2769912434679244e-06, - "loss": 0.8018, - "step": 50137 - }, - { - "epoch": 1.29, - "learning_rate": 1.2769646555852634e-06, - "loss": 0.7393, - "step": 50138 - }, - { - "epoch": 1.29, - "learning_rate": 1.2769380674905432e-06, - "loss": 0.5547, - "step": 50139 - }, - { - "epoch": 1.29, - "learning_rate": 1.2769114791837842e-06, - "loss": 0.7412, - "step": 50140 - }, - { - "epoch": 1.29, - "learning_rate": 1.2768848906650069e-06, - "loss": 0.6223, - "step": 50141 - }, - { - "epoch": 1.29, - "learning_rate": 1.2768583019342316e-06, - "loss": 0.5791, - "step": 50142 - }, - { - "epoch": 1.29, - "learning_rate": 1.2768317129914788e-06, - "loss": 0.6196, - "step": 50143 - }, - { - "epoch": 1.29, - "learning_rate": 1.2768051238367682e-06, - "loss": 0.7148, - "step": 50144 - }, - { - "epoch": 1.29, - "learning_rate": 1.2767785344701211e-06, - "loss": 0.627, - "step": 50145 - }, - { - "epoch": 1.29, - "learning_rate": 1.2767519448915572e-06, - "loss": 0.6008, - "step": 50146 - }, - { - "epoch": 1.29, - "learning_rate": 1.2767253551010972e-06, - "loss": 0.7031, - "step": 50147 - }, - { - "epoch": 1.29, - "learning_rate": 1.2766987650987614e-06, - "loss": 0.5928, - "step": 50148 - }, - { - "epoch": 1.29, - "learning_rate": 1.2766721748845697e-06, - "loss": 0.8047, - "step": 50149 - }, - { - "epoch": 1.29, - "learning_rate": 1.2766455844585431e-06, - "loss": 0.8359, - "step": 50150 - }, - { - "epoch": 1.29, - "learning_rate": 1.2766189938207016e-06, - "loss": 0.8164, - "step": 50151 - }, - { - "epoch": 1.29, - "learning_rate": 1.2765924029710658e-06, - "loss": 0.665, - "step": 50152 - }, - { - "epoch": 1.29, - "learning_rate": 1.2765658119096555e-06, - "loss": 0.707, - "step": 50153 - }, - { - "epoch": 1.29, - "learning_rate": 1.2765392206364923e-06, - "loss": 0.606, - "step": 50154 - }, - { - "epoch": 1.29, - "learning_rate": 1.276512629151595e-06, - "loss": 0.438, - "step": 50155 - }, - { - "epoch": 1.29, - "learning_rate": 1.2764860374549848e-06, - "loss": 0.7949, - "step": 50156 - }, - { - "epoch": 1.29, - "learning_rate": 1.2764594455466822e-06, - "loss": 0.6123, - "step": 50157 - }, - { - "epoch": 1.29, - "learning_rate": 1.2764328534267073e-06, - "loss": 0.7568, - "step": 50158 - }, - { - "epoch": 1.29, - "learning_rate": 1.2764062610950802e-06, - "loss": 0.6143, - "step": 50159 - }, - { - "epoch": 1.29, - "learning_rate": 1.2763796685518218e-06, - "loss": 0.6641, - "step": 50160 - }, - { - "epoch": 1.29, - "learning_rate": 1.276353075796952e-06, - "loss": 0.8994, - "step": 50161 - }, - { - "epoch": 1.29, - "learning_rate": 1.2763264828304915e-06, - "loss": 0.6277, - "step": 50162 - }, - { - "epoch": 1.29, - "learning_rate": 1.2762998896524605e-06, - "loss": 0.6616, - "step": 50163 - }, - { - "epoch": 1.29, - "learning_rate": 1.2762732962628795e-06, - "loss": 0.7451, - "step": 50164 - }, - { - "epoch": 1.29, - "learning_rate": 1.2762467026617682e-06, - "loss": 0.4626, - "step": 50165 - }, - { - "epoch": 1.29, - "learning_rate": 1.2762201088491483e-06, - "loss": 0.4655, - "step": 50166 - }, - { - "epoch": 1.29, - "learning_rate": 1.2761935148250388e-06, - "loss": 0.7285, - "step": 50167 - }, - { - "epoch": 1.29, - "learning_rate": 1.276166920589461e-06, - "loss": 0.4392, - "step": 50168 - }, - { - "epoch": 1.29, - "learning_rate": 1.2761403261424344e-06, - "loss": 0.7871, - "step": 50169 - }, - { - "epoch": 1.29, - "learning_rate": 1.2761137314839803e-06, - "loss": 0.6079, - "step": 50170 - }, - { - "epoch": 1.29, - "learning_rate": 1.2760871366141182e-06, - "loss": 0.8057, - "step": 50171 - }, - { - "epoch": 1.29, - "learning_rate": 1.2760605415328691e-06, - "loss": 0.5923, - "step": 50172 - }, - { - "epoch": 1.29, - "learning_rate": 1.276033946240253e-06, - "loss": 0.8232, - "step": 50173 - }, - { - "epoch": 1.29, - "learning_rate": 1.2760073507362907e-06, - "loss": 0.7383, - "step": 50174 - }, - { - "epoch": 1.29, - "learning_rate": 1.2759807550210023e-06, - "loss": 0.7285, - "step": 50175 - }, - { - "epoch": 1.29, - "learning_rate": 1.2759541590944075e-06, - "loss": 0.7734, - "step": 50176 - }, - { - "epoch": 1.29, - "learning_rate": 1.2759275629565282e-06, - "loss": 0.7158, - "step": 50177 - }, - { - "epoch": 1.29, - "learning_rate": 1.2759009666073832e-06, - "loss": 0.5654, - "step": 50178 - }, - { - "epoch": 1.29, - "learning_rate": 1.2758743700469937e-06, - "loss": 0.5413, - "step": 50179 - }, - { - "epoch": 1.29, - "learning_rate": 1.2758477732753798e-06, - "loss": 0.6724, - "step": 50180 - }, - { - "epoch": 1.29, - "learning_rate": 1.275821176292562e-06, - "loss": 0.6484, - "step": 50181 - }, - { - "epoch": 1.29, - "learning_rate": 1.2757945790985606e-06, - "loss": 0.8008, - "step": 50182 - }, - { - "epoch": 1.29, - "learning_rate": 1.2757679816933961e-06, - "loss": 0.6543, - "step": 50183 - }, - { - "epoch": 1.29, - "learning_rate": 1.2757413840770886e-06, - "loss": 0.75, - "step": 50184 - }, - { - "epoch": 1.29, - "learning_rate": 1.2757147862496587e-06, - "loss": 0.6025, - "step": 50185 - }, - { - "epoch": 1.29, - "learning_rate": 1.2756881882111264e-06, - "loss": 0.7979, - "step": 50186 - }, - { - "epoch": 1.29, - "learning_rate": 1.2756615899615129e-06, - "loss": 0.8086, - "step": 50187 - }, - { - "epoch": 1.29, - "learning_rate": 1.2756349915008376e-06, - "loss": 0.7832, - "step": 50188 - }, - { - "epoch": 1.29, - "learning_rate": 1.2756083928291212e-06, - "loss": 0.6226, - "step": 50189 - }, - { - "epoch": 1.29, - "learning_rate": 1.275581793946384e-06, - "loss": 0.5832, - "step": 50190 - }, - { - "epoch": 1.29, - "learning_rate": 1.2755551948526469e-06, - "loss": 0.5776, - "step": 50191 - }, - { - "epoch": 1.29, - "learning_rate": 1.2755285955479295e-06, - "loss": 0.6484, - "step": 50192 - }, - { - "epoch": 1.29, - "learning_rate": 1.2755019960322528e-06, - "loss": 0.644, - "step": 50193 - }, - { - "epoch": 1.29, - "learning_rate": 1.2754753963056368e-06, - "loss": 0.7744, - "step": 50194 - }, - { - "epoch": 1.29, - "learning_rate": 1.275448796368102e-06, - "loss": 0.6396, - "step": 50195 - }, - { - "epoch": 1.29, - "learning_rate": 1.2754221962196684e-06, - "loss": 0.6523, - "step": 50196 - }, - { - "epoch": 1.29, - "learning_rate": 1.275395595860357e-06, - "loss": 0.668, - "step": 50197 - }, - { - "epoch": 1.29, - "learning_rate": 1.2753689952901877e-06, - "loss": 0.6143, - "step": 50198 - }, - { - "epoch": 1.29, - "learning_rate": 1.2753423945091813e-06, - "loss": 0.7588, - "step": 50199 - }, - { - "epoch": 1.29, - "learning_rate": 1.2753157935173577e-06, - "loss": 0.5815, - "step": 50200 - }, - { - "epoch": 1.29, - "learning_rate": 1.2752891923147374e-06, - "loss": 0.6211, - "step": 50201 - }, - { - "epoch": 1.29, - "learning_rate": 1.275262590901341e-06, - "loss": 0.7393, - "step": 50202 - }, - { - "epoch": 1.29, - "learning_rate": 1.2752359892771884e-06, - "loss": 0.6074, - "step": 50203 - }, - { - "epoch": 1.29, - "learning_rate": 1.2752093874423006e-06, - "loss": 0.793, - "step": 50204 - }, - { - "epoch": 1.29, - "learning_rate": 1.2751827853966975e-06, - "loss": 0.5811, - "step": 50205 - }, - { - "epoch": 1.29, - "learning_rate": 1.2751561831403994e-06, - "loss": 0.7285, - "step": 50206 - }, - { - "epoch": 1.29, - "learning_rate": 1.2751295806734272e-06, - "loss": 0.6748, - "step": 50207 - }, - { - "epoch": 1.29, - "learning_rate": 1.2751029779958007e-06, - "loss": 0.5376, - "step": 50208 - }, - { - "epoch": 1.29, - "learning_rate": 1.2750763751075404e-06, - "loss": 0.6631, - "step": 50209 - }, - { - "epoch": 1.29, - "learning_rate": 1.275049772008667e-06, - "loss": 0.7559, - "step": 50210 - }, - { - "epoch": 1.29, - "learning_rate": 1.2750231686992003e-06, - "loss": 0.7109, - "step": 50211 - }, - { - "epoch": 1.29, - "learning_rate": 1.2749965651791617e-06, - "loss": 0.6816, - "step": 50212 - }, - { - "epoch": 1.29, - "learning_rate": 1.2749699614485703e-06, - "loss": 0.4856, - "step": 50213 - }, - { - "epoch": 1.29, - "learning_rate": 1.2749433575074474e-06, - "loss": 0.5747, - "step": 50214 - }, - { - "epoch": 1.29, - "learning_rate": 1.2749167533558125e-06, - "loss": 0.5449, - "step": 50215 - }, - { - "epoch": 1.29, - "learning_rate": 1.2748901489936867e-06, - "loss": 0.6548, - "step": 50216 - }, - { - "epoch": 1.29, - "learning_rate": 1.2748635444210905e-06, - "loss": 0.7617, - "step": 50217 - }, - { - "epoch": 1.29, - "learning_rate": 1.2748369396380434e-06, - "loss": 0.6963, - "step": 50218 - }, - { - "epoch": 1.29, - "learning_rate": 1.2748103346445667e-06, - "loss": 0.7412, - "step": 50219 - }, - { - "epoch": 1.29, - "learning_rate": 1.2747837294406801e-06, - "loss": 0.6528, - "step": 50220 - }, - { - "epoch": 1.29, - "learning_rate": 1.2747571240264043e-06, - "loss": 0.603, - "step": 50221 - }, - { - "epoch": 1.29, - "learning_rate": 1.2747305184017598e-06, - "loss": 0.6704, - "step": 50222 - }, - { - "epoch": 1.29, - "learning_rate": 1.2747039125667667e-06, - "loss": 0.5771, - "step": 50223 - }, - { - "epoch": 1.29, - "learning_rate": 1.274677306521445e-06, - "loss": 0.7627, - "step": 50224 - }, - { - "epoch": 1.29, - "learning_rate": 1.2746507002658162e-06, - "loss": 0.7588, - "step": 50225 - }, - { - "epoch": 1.29, - "learning_rate": 1.2746240937998995e-06, - "loss": 0.647, - "step": 50226 - }, - { - "epoch": 1.29, - "learning_rate": 1.274597487123716e-06, - "loss": 0.6602, - "step": 50227 - }, - { - "epoch": 1.29, - "learning_rate": 1.2745708802372858e-06, - "loss": 0.5898, - "step": 50228 - }, - { - "epoch": 1.29, - "learning_rate": 1.2745442731406293e-06, - "loss": 0.6807, - "step": 50229 - }, - { - "epoch": 1.29, - "learning_rate": 1.2745176658337666e-06, - "loss": 0.8564, - "step": 50230 - }, - { - "epoch": 1.29, - "learning_rate": 1.2744910583167187e-06, - "loss": 0.6777, - "step": 50231 - }, - { - "epoch": 1.29, - "learning_rate": 1.2744644505895057e-06, - "loss": 0.8066, - "step": 50232 - }, - { - "epoch": 1.29, - "learning_rate": 1.2744378426521477e-06, - "loss": 0.425, - "step": 50233 - }, - { - "epoch": 1.29, - "learning_rate": 1.2744112345046651e-06, - "loss": 0.749, - "step": 50234 - }, - { - "epoch": 1.29, - "learning_rate": 1.2743846261470785e-06, - "loss": 0.467, - "step": 50235 - }, - { - "epoch": 1.29, - "learning_rate": 1.2743580175794081e-06, - "loss": 0.6533, - "step": 50236 - }, - { - "epoch": 1.29, - "learning_rate": 1.2743314088016748e-06, - "loss": 0.5273, - "step": 50237 - }, - { - "epoch": 1.29, - "learning_rate": 1.2743047998138985e-06, - "loss": 0.2727, - "step": 50238 - }, - { - "epoch": 1.29, - "learning_rate": 1.274278190616099e-06, - "loss": 0.5203, - "step": 50239 - }, - { - "epoch": 1.29, - "learning_rate": 1.2742515812082981e-06, - "loss": 0.7844, - "step": 50240 - }, - { - "epoch": 1.29, - "learning_rate": 1.274224971590515e-06, - "loss": 0.7002, - "step": 50241 - }, - { - "epoch": 1.29, - "learning_rate": 1.2741983617627704e-06, - "loss": 0.8262, - "step": 50242 - }, - { - "epoch": 1.29, - "learning_rate": 1.2741717517250847e-06, - "loss": 0.6978, - "step": 50243 - }, - { - "epoch": 1.29, - "learning_rate": 1.2741451414774786e-06, - "loss": 0.5404, - "step": 50244 - }, - { - "epoch": 1.29, - "learning_rate": 1.2741185310199718e-06, - "loss": 0.6904, - "step": 50245 - }, - { - "epoch": 1.29, - "learning_rate": 1.2740919203525852e-06, - "loss": 0.689, - "step": 50246 - }, - { - "epoch": 1.29, - "learning_rate": 1.2740653094753393e-06, - "loss": 0.7598, - "step": 50247 - }, - { - "epoch": 1.29, - "learning_rate": 1.2740386983882538e-06, - "loss": 0.8125, - "step": 50248 - }, - { - "epoch": 1.29, - "learning_rate": 1.2740120870913497e-06, - "loss": 0.708, - "step": 50249 - }, - { - "epoch": 1.29, - "learning_rate": 1.273985475584647e-06, - "loss": 0.6338, - "step": 50250 - }, - { - "epoch": 1.29, - "learning_rate": 1.2739588638681662e-06, - "loss": 0.5239, - "step": 50251 - }, - { - "epoch": 1.29, - "learning_rate": 1.273932251941928e-06, - "loss": 0.5146, - "step": 50252 - }, - { - "epoch": 1.29, - "learning_rate": 1.273905639805952e-06, - "loss": 0.4871, - "step": 50253 - }, - { - "epoch": 1.29, - "learning_rate": 1.2738790274602593e-06, - "loss": 0.748, - "step": 50254 - }, - { - "epoch": 1.29, - "learning_rate": 1.27385241490487e-06, - "loss": 0.5288, - "step": 50255 - }, - { - "epoch": 1.29, - "learning_rate": 1.2738258021398045e-06, - "loss": 0.5288, - "step": 50256 - }, - { - "epoch": 1.29, - "learning_rate": 1.2737991891650832e-06, - "loss": 0.6641, - "step": 50257 - }, - { - "epoch": 1.29, - "learning_rate": 1.2737725759807264e-06, - "loss": 0.644, - "step": 50258 - }, - { - "epoch": 1.29, - "learning_rate": 1.2737459625867546e-06, - "loss": 0.7871, - "step": 50259 - }, - { - "epoch": 1.29, - "learning_rate": 1.273719348983188e-06, - "loss": 0.709, - "step": 50260 - }, - { - "epoch": 1.29, - "learning_rate": 1.2736927351700471e-06, - "loss": 0.5037, - "step": 50261 - }, - { - "epoch": 1.29, - "learning_rate": 1.2736661211473522e-06, - "loss": 0.6592, - "step": 50262 - }, - { - "epoch": 1.29, - "learning_rate": 1.273639506915124e-06, - "loss": 0.4792, - "step": 50263 - }, - { - "epoch": 1.29, - "learning_rate": 1.2736128924733823e-06, - "loss": 0.6113, - "step": 50264 - }, - { - "epoch": 1.29, - "learning_rate": 1.273586277822148e-06, - "loss": 0.5505, - "step": 50265 - }, - { - "epoch": 1.29, - "learning_rate": 1.2735596629614408e-06, - "loss": 0.6406, - "step": 50266 - }, - { - "epoch": 1.29, - "learning_rate": 1.2735330478912825e-06, - "loss": 0.9561, - "step": 50267 - }, - { - "epoch": 1.29, - "learning_rate": 1.2735064326116918e-06, - "loss": 0.6631, - "step": 50268 - }, - { - "epoch": 1.29, - "learning_rate": 1.2734798171226899e-06, - "loss": 0.6074, - "step": 50269 - }, - { - "epoch": 1.29, - "learning_rate": 1.2734532014242971e-06, - "loss": 0.9258, - "step": 50270 - }, - { - "epoch": 1.29, - "learning_rate": 1.2734265855165338e-06, - "loss": 0.521, - "step": 50271 - }, - { - "epoch": 1.29, - "learning_rate": 1.2733999693994205e-06, - "loss": 0.5356, - "step": 50272 - }, - { - "epoch": 1.29, - "learning_rate": 1.2733733530729774e-06, - "loss": 0.5977, - "step": 50273 - }, - { - "epoch": 1.29, - "learning_rate": 1.2733467365372246e-06, - "loss": 0.541, - "step": 50274 - }, - { - "epoch": 1.29, - "learning_rate": 1.2733201197921829e-06, - "loss": 0.6543, - "step": 50275 - }, - { - "epoch": 1.29, - "learning_rate": 1.2732935028378724e-06, - "loss": 0.7158, - "step": 50276 - }, - { - "epoch": 1.29, - "learning_rate": 1.273266885674314e-06, - "loss": 0.501, - "step": 50277 - }, - { - "epoch": 1.29, - "learning_rate": 1.2732402683015273e-06, - "loss": 0.5537, - "step": 50278 - }, - { - "epoch": 1.29, - "learning_rate": 1.2732136507195334e-06, - "loss": 0.7241, - "step": 50279 - }, - { - "epoch": 1.29, - "learning_rate": 1.273187032928352e-06, - "loss": 0.7402, - "step": 50280 - }, - { - "epoch": 1.29, - "learning_rate": 1.2731604149280043e-06, - "loss": 0.5576, - "step": 50281 - }, - { - "epoch": 1.29, - "learning_rate": 1.2731337967185102e-06, - "loss": 0.7261, - "step": 50282 - }, - { - "epoch": 1.29, - "learning_rate": 1.2731071782998898e-06, - "loss": 0.6523, - "step": 50283 - }, - { - "epoch": 1.29, - "learning_rate": 1.2730805596721639e-06, - "loss": 0.6685, - "step": 50284 - }, - { - "epoch": 1.29, - "learning_rate": 1.2730539408353531e-06, - "loss": 0.4866, - "step": 50285 - }, - { - "epoch": 1.29, - "learning_rate": 1.2730273217894769e-06, - "loss": 0.6211, - "step": 50286 - }, - { - "epoch": 1.29, - "learning_rate": 1.2730007025345567e-06, - "loss": 0.6094, - "step": 50287 - }, - { - "epoch": 1.29, - "learning_rate": 1.272974083070612e-06, - "loss": 0.4849, - "step": 50288 - }, - { - "epoch": 1.29, - "learning_rate": 1.2729474633976638e-06, - "loss": 0.5723, - "step": 50289 - }, - { - "epoch": 1.29, - "learning_rate": 1.2729208435157323e-06, - "loss": 0.5791, - "step": 50290 - }, - { - "epoch": 1.29, - "learning_rate": 1.2728942234248379e-06, - "loss": 0.6064, - "step": 50291 - }, - { - "epoch": 1.29, - "learning_rate": 1.2728676031250011e-06, - "loss": 0.7139, - "step": 50292 - }, - { - "epoch": 1.29, - "learning_rate": 1.2728409826162418e-06, - "loss": 0.6675, - "step": 50293 - }, - { - "epoch": 1.29, - "learning_rate": 1.2728143618985808e-06, - "loss": 0.5735, - "step": 50294 - }, - { - "epoch": 1.29, - "learning_rate": 1.2727877409720384e-06, - "loss": 0.5576, - "step": 50295 - }, - { - "epoch": 1.29, - "learning_rate": 1.272761119836635e-06, - "loss": 0.7393, - "step": 50296 - }, - { - "epoch": 1.29, - "learning_rate": 1.2727344984923912e-06, - "loss": 0.729, - "step": 50297 - }, - { - "epoch": 1.29, - "learning_rate": 1.2727078769393266e-06, - "loss": 0.5591, - "step": 50298 - }, - { - "epoch": 1.29, - "learning_rate": 1.2726812551774625e-06, - "loss": 0.7017, - "step": 50299 - }, - { - "epoch": 1.29, - "learning_rate": 1.2726546332068187e-06, - "loss": 0.549, - "step": 50300 - }, - { - "epoch": 1.29, - "learning_rate": 1.2726280110274159e-06, - "loss": 0.6377, - "step": 50301 - }, - { - "epoch": 1.29, - "learning_rate": 1.2726013886392747e-06, - "loss": 0.5862, - "step": 50302 - }, - { - "epoch": 1.29, - "learning_rate": 1.2725747660424144e-06, - "loss": 0.7246, - "step": 50303 - }, - { - "epoch": 1.29, - "learning_rate": 1.2725481432368566e-06, - "loss": 0.6294, - "step": 50304 - }, - { - "epoch": 1.29, - "learning_rate": 1.2725215202226212e-06, - "loss": 0.5479, - "step": 50305 - }, - { - "epoch": 1.29, - "learning_rate": 1.2724948969997284e-06, - "loss": 0.7051, - "step": 50306 - }, - { - "epoch": 1.29, - "learning_rate": 1.2724682735681991e-06, - "loss": 0.6567, - "step": 50307 - }, - { - "epoch": 1.29, - "learning_rate": 1.272441649928053e-06, - "loss": 0.6758, - "step": 50308 - }, - { - "epoch": 1.29, - "learning_rate": 1.2724150260793113e-06, - "loss": 0.6484, - "step": 50309 - }, - { - "epoch": 1.29, - "learning_rate": 1.2723884020219936e-06, - "loss": 0.75, - "step": 50310 - }, - { - "epoch": 1.29, - "learning_rate": 1.2723617777561207e-06, - "loss": 0.6011, - "step": 50311 - }, - { - "epoch": 1.29, - "learning_rate": 1.272335153281713e-06, - "loss": 0.7168, - "step": 50312 - }, - { - "epoch": 1.29, - "learning_rate": 1.2723085285987908e-06, - "loss": 0.6963, - "step": 50313 - }, - { - "epoch": 1.29, - "learning_rate": 1.2722819037073741e-06, - "loss": 0.8184, - "step": 50314 - }, - { - "epoch": 1.29, - "learning_rate": 1.272255278607484e-06, - "loss": 0.6748, - "step": 50315 - }, - { - "epoch": 1.29, - "learning_rate": 1.2722286532991406e-06, - "loss": 0.488, - "step": 50316 - }, - { - "epoch": 1.29, - "learning_rate": 1.2722020277823644e-06, - "loss": 0.5146, - "step": 50317 - }, - { - "epoch": 1.29, - "learning_rate": 1.2721754020571754e-06, - "loss": 0.8145, - "step": 50318 - }, - { - "epoch": 1.29, - "learning_rate": 1.2721487761235944e-06, - "loss": 0.71, - "step": 50319 - }, - { - "epoch": 1.29, - "learning_rate": 1.272122149981641e-06, - "loss": 0.7407, - "step": 50320 - }, - { - "epoch": 1.29, - "learning_rate": 1.2720955236313367e-06, - "loss": 0.7139, - "step": 50321 - }, - { - "epoch": 1.29, - "learning_rate": 1.2720688970727015e-06, - "loss": 0.6748, - "step": 50322 - }, - { - "epoch": 1.29, - "learning_rate": 1.2720422703057553e-06, - "loss": 0.5571, - "step": 50323 - }, - { - "epoch": 1.29, - "learning_rate": 1.2720156433305188e-06, - "loss": 0.6006, - "step": 50324 - }, - { - "epoch": 1.29, - "learning_rate": 1.2719890161470125e-06, - "loss": 0.6592, - "step": 50325 - }, - { - "epoch": 1.29, - "learning_rate": 1.2719623887552567e-06, - "loss": 0.6091, - "step": 50326 - }, - { - "epoch": 1.29, - "learning_rate": 1.2719357611552722e-06, - "loss": 0.6099, - "step": 50327 - }, - { - "epoch": 1.29, - "learning_rate": 1.2719091333470786e-06, - "loss": 0.6963, - "step": 50328 - }, - { - "epoch": 1.29, - "learning_rate": 1.2718825053306965e-06, - "loss": 0.6172, - "step": 50329 - }, - { - "epoch": 1.29, - "learning_rate": 1.271855877106147e-06, - "loss": 0.6162, - "step": 50330 - }, - { - "epoch": 1.29, - "learning_rate": 1.2718292486734497e-06, - "loss": 0.4771, - "step": 50331 - }, - { - "epoch": 1.29, - "learning_rate": 1.2718026200326252e-06, - "loss": 0.6484, - "step": 50332 - }, - { - "epoch": 1.29, - "learning_rate": 1.271775991183694e-06, - "loss": 0.5708, - "step": 50333 - }, - { - "epoch": 1.29, - "learning_rate": 1.2717493621266765e-06, - "loss": 0.5317, - "step": 50334 - }, - { - "epoch": 1.29, - "learning_rate": 1.2717227328615927e-06, - "loss": 0.7061, - "step": 50335 - }, - { - "epoch": 1.29, - "learning_rate": 1.2716961033884635e-06, - "loss": 0.7227, - "step": 50336 - }, - { - "epoch": 1.29, - "learning_rate": 1.271669473707309e-06, - "loss": 0.7012, - "step": 50337 - }, - { - "epoch": 1.29, - "learning_rate": 1.2716428438181499e-06, - "loss": 0.5513, - "step": 50338 - }, - { - "epoch": 1.29, - "learning_rate": 1.271616213721006e-06, - "loss": 0.4846, - "step": 50339 - }, - { - "epoch": 1.29, - "learning_rate": 1.2715895834158985e-06, - "loss": 0.6299, - "step": 50340 - }, - { - "epoch": 1.29, - "learning_rate": 1.271562952902847e-06, - "loss": 0.668, - "step": 50341 - }, - { - "epoch": 1.29, - "learning_rate": 1.2715363221818727e-06, - "loss": 0.6558, - "step": 50342 - }, - { - "epoch": 1.29, - "learning_rate": 1.2715096912529951e-06, - "loss": 0.6304, - "step": 50343 - }, - { - "epoch": 1.29, - "learning_rate": 1.271483060116235e-06, - "loss": 0.5044, - "step": 50344 - }, - { - "epoch": 1.29, - "learning_rate": 1.2714564287716126e-06, - "loss": 0.7422, - "step": 50345 - }, - { - "epoch": 1.29, - "learning_rate": 1.271429797219149e-06, - "loss": 0.6357, - "step": 50346 - }, - { - "epoch": 1.29, - "learning_rate": 1.271403165458864e-06, - "loss": 0.6602, - "step": 50347 - }, - { - "epoch": 1.29, - "learning_rate": 1.271376533490778e-06, - "loss": 0.6309, - "step": 50348 - }, - { - "epoch": 1.29, - "learning_rate": 1.2713499013149115e-06, - "loss": 0.8652, - "step": 50349 - }, - { - "epoch": 1.29, - "learning_rate": 1.2713232689312845e-06, - "loss": 0.8281, - "step": 50350 - }, - { - "epoch": 1.29, - "learning_rate": 1.271296636339918e-06, - "loss": 0.4961, - "step": 50351 - }, - { - "epoch": 1.29, - "learning_rate": 1.2712700035408322e-06, - "loss": 0.6875, - "step": 50352 - }, - { - "epoch": 1.29, - "learning_rate": 1.2712433705340475e-06, - "loss": 0.6836, - "step": 50353 - }, - { - "epoch": 1.29, - "learning_rate": 1.2712167373195839e-06, - "loss": 0.6953, - "step": 50354 - }, - { - "epoch": 1.29, - "learning_rate": 1.2711901038974623e-06, - "loss": 0.7227, - "step": 50355 - }, - { - "epoch": 1.29, - "learning_rate": 1.271163470267703e-06, - "loss": 0.4905, - "step": 50356 - }, - { - "epoch": 1.29, - "learning_rate": 1.2711368364303266e-06, - "loss": 0.7676, - "step": 50357 - }, - { - "epoch": 1.29, - "learning_rate": 1.2711102023853525e-06, - "loss": 0.7134, - "step": 50358 - }, - { - "epoch": 1.29, - "learning_rate": 1.2710835681328022e-06, - "loss": 0.5762, - "step": 50359 - }, - { - "epoch": 1.29, - "learning_rate": 1.2710569336726955e-06, - "loss": 0.6899, - "step": 50360 - }, - { - "epoch": 1.29, - "learning_rate": 1.2710302990050533e-06, - "loss": 0.4231, - "step": 50361 - }, - { - "epoch": 1.29, - "learning_rate": 1.2710036641298954e-06, - "loss": 0.6895, - "step": 50362 - }, - { - "epoch": 1.29, - "learning_rate": 1.2709770290472426e-06, - "loss": 0.7725, - "step": 50363 - }, - { - "epoch": 1.29, - "learning_rate": 1.2709503937571146e-06, - "loss": 0.7656, - "step": 50364 - }, - { - "epoch": 1.29, - "learning_rate": 1.270923758259533e-06, - "loss": 0.5115, - "step": 50365 - }, - { - "epoch": 1.29, - "learning_rate": 1.270897122554517e-06, - "loss": 0.6685, - "step": 50366 - }, - { - "epoch": 1.29, - "learning_rate": 1.2708704866420883e-06, - "loss": 0.6689, - "step": 50367 - }, - { - "epoch": 1.29, - "learning_rate": 1.270843850522266e-06, - "loss": 0.4001, - "step": 50368 - }, - { - "epoch": 1.29, - "learning_rate": 1.270817214195071e-06, - "loss": 0.6978, - "step": 50369 - }, - { - "epoch": 1.29, - "learning_rate": 1.2707905776605237e-06, - "loss": 0.7207, - "step": 50370 - }, - { - "epoch": 1.29, - "learning_rate": 1.2707639409186445e-06, - "loss": 0.553, - "step": 50371 - }, - { - "epoch": 1.29, - "learning_rate": 1.270737303969454e-06, - "loss": 0.5249, - "step": 50372 - }, - { - "epoch": 1.29, - "learning_rate": 1.2707106668129722e-06, - "loss": 0.5806, - "step": 50373 - }, - { - "epoch": 1.29, - "learning_rate": 1.2706840294492198e-06, - "loss": 0.623, - "step": 50374 - }, - { - "epoch": 1.29, - "learning_rate": 1.2706573918782174e-06, - "loss": 0.6138, - "step": 50375 - }, - { - "epoch": 1.29, - "learning_rate": 1.2706307540999845e-06, - "loss": 0.7109, - "step": 50376 - }, - { - "epoch": 1.29, - "learning_rate": 1.2706041161145422e-06, - "loss": 0.8008, - "step": 50377 - }, - { - "epoch": 1.29, - "learning_rate": 1.2705774779219112e-06, - "loss": 0.5798, - "step": 50378 - }, - { - "epoch": 1.29, - "learning_rate": 1.270550839522111e-06, - "loss": 0.7646, - "step": 50379 - }, - { - "epoch": 1.29, - "learning_rate": 1.2705242009151626e-06, - "loss": 0.6523, - "step": 50380 - }, - { - "epoch": 1.29, - "learning_rate": 1.2704975621010862e-06, - "loss": 0.6475, - "step": 50381 - }, - { - "epoch": 1.29, - "learning_rate": 1.2704709230799023e-06, - "loss": 0.7061, - "step": 50382 - }, - { - "epoch": 1.29, - "learning_rate": 1.2704442838516314e-06, - "loss": 0.7705, - "step": 50383 - }, - { - "epoch": 1.29, - "learning_rate": 1.2704176444162938e-06, - "loss": 0.7368, - "step": 50384 - }, - { - "epoch": 1.29, - "learning_rate": 1.2703910047739094e-06, - "loss": 0.7715, - "step": 50385 - }, - { - "epoch": 1.29, - "learning_rate": 1.2703643649244995e-06, - "loss": 0.5881, - "step": 50386 - }, - { - "epoch": 1.29, - "learning_rate": 1.2703377248680838e-06, - "loss": 0.6338, - "step": 50387 - }, - { - "epoch": 1.29, - "learning_rate": 1.2703110846046832e-06, - "loss": 0.5913, - "step": 50388 - }, - { - "epoch": 1.29, - "learning_rate": 1.2702844441343172e-06, - "loss": 0.6562, - "step": 50389 - }, - { - "epoch": 1.29, - "learning_rate": 1.2702578034570076e-06, - "loss": 0.6123, - "step": 50390 - }, - { - "epoch": 1.29, - "learning_rate": 1.2702311625727735e-06, - "loss": 0.5123, - "step": 50391 - }, - { - "epoch": 1.29, - "learning_rate": 1.270204521481636e-06, - "loss": 0.5513, - "step": 50392 - }, - { - "epoch": 1.29, - "learning_rate": 1.2701778801836153e-06, - "loss": 0.5552, - "step": 50393 - }, - { - "epoch": 1.29, - "learning_rate": 1.2701512386787318e-06, - "loss": 0.4775, - "step": 50394 - }, - { - "epoch": 1.29, - "learning_rate": 1.270124596967006e-06, - "loss": 0.5536, - "step": 50395 - }, - { - "epoch": 1.29, - "learning_rate": 1.2700979550484583e-06, - "loss": 0.6445, - "step": 50396 - }, - { - "epoch": 1.29, - "learning_rate": 1.2700713129231088e-06, - "loss": 0.7598, - "step": 50397 - }, - { - "epoch": 1.29, - "learning_rate": 1.2700446705909782e-06, - "loss": 0.6099, - "step": 50398 - }, - { - "epoch": 1.29, - "learning_rate": 1.2700180280520867e-06, - "loss": 0.7256, - "step": 50399 - }, - { - "epoch": 1.29, - "learning_rate": 1.2699913853064547e-06, - "loss": 0.6919, - "step": 50400 - }, - { - "epoch": 1.29, - "learning_rate": 1.2699647423541033e-06, - "loss": 0.7024, - "step": 50401 - }, - { - "epoch": 1.29, - "learning_rate": 1.269938099195052e-06, - "loss": 0.6904, - "step": 50402 - }, - { - "epoch": 1.29, - "learning_rate": 1.2699114558293213e-06, - "loss": 0.6714, - "step": 50403 - }, - { - "epoch": 1.29, - "learning_rate": 1.269884812256932e-06, - "loss": 0.7119, - "step": 50404 - }, - { - "epoch": 1.29, - "learning_rate": 1.2698581684779044e-06, - "loss": 0.6611, - "step": 50405 - }, - { - "epoch": 1.29, - "learning_rate": 1.2698315244922586e-06, - "loss": 0.6216, - "step": 50406 - }, - { - "epoch": 1.29, - "learning_rate": 1.2698048803000155e-06, - "loss": 0.7988, - "step": 50407 - }, - { - "epoch": 1.29, - "learning_rate": 1.2697782359011948e-06, - "loss": 0.6475, - "step": 50408 - }, - { - "epoch": 1.29, - "learning_rate": 1.2697515912958177e-06, - "loss": 0.5466, - "step": 50409 - }, - { - "epoch": 1.29, - "learning_rate": 1.2697249464839037e-06, - "loss": 0.6455, - "step": 50410 - }, - { - "epoch": 1.29, - "learning_rate": 1.2696983014654742e-06, - "loss": 0.6797, - "step": 50411 - }, - { - "epoch": 1.29, - "learning_rate": 1.2696716562405489e-06, - "loss": 0.7764, - "step": 50412 - }, - { - "epoch": 1.29, - "learning_rate": 1.2696450108091484e-06, - "loss": 0.6494, - "step": 50413 - }, - { - "epoch": 1.29, - "learning_rate": 1.2696183651712933e-06, - "loss": 0.5178, - "step": 50414 - }, - { - "epoch": 1.29, - "learning_rate": 1.2695917193270039e-06, - "loss": 0.6738, - "step": 50415 - }, - { - "epoch": 1.29, - "learning_rate": 1.2695650732763002e-06, - "loss": 0.6074, - "step": 50416 - }, - { - "epoch": 1.29, - "learning_rate": 1.269538427019203e-06, - "loss": 0.6519, - "step": 50417 - }, - { - "epoch": 1.29, - "learning_rate": 1.2695117805557324e-06, - "loss": 0.7354, - "step": 50418 - }, - { - "epoch": 1.29, - "learning_rate": 1.2694851338859095e-06, - "loss": 0.4683, - "step": 50419 - }, - { - "epoch": 1.29, - "learning_rate": 1.269458487009754e-06, - "loss": 0.708, - "step": 50420 - }, - { - "epoch": 1.29, - "learning_rate": 1.2694318399272866e-06, - "loss": 0.7686, - "step": 50421 - }, - { - "epoch": 1.29, - "learning_rate": 1.2694051926385274e-06, - "loss": 0.7266, - "step": 50422 - }, - { - "epoch": 1.29, - "learning_rate": 1.269378545143497e-06, - "loss": 0.7666, - "step": 50423 - }, - { - "epoch": 1.29, - "learning_rate": 1.2693518974422162e-06, - "loss": 0.6621, - "step": 50424 - }, - { - "epoch": 1.29, - "learning_rate": 1.2693252495347047e-06, - "loss": 0.4697, - "step": 50425 - }, - { - "epoch": 1.29, - "learning_rate": 1.2692986014209836e-06, - "loss": 0.8301, - "step": 50426 - }, - { - "epoch": 1.29, - "learning_rate": 1.2692719531010727e-06, - "loss": 0.5586, - "step": 50427 - }, - { - "epoch": 1.29, - "learning_rate": 1.2692453045749927e-06, - "loss": 0.6865, - "step": 50428 - }, - { - "epoch": 1.29, - "learning_rate": 1.2692186558427638e-06, - "loss": 0.813, - "step": 50429 - }, - { - "epoch": 1.29, - "learning_rate": 1.2691920069044066e-06, - "loss": 0.7617, - "step": 50430 - }, - { - "epoch": 1.29, - "learning_rate": 1.2691653577599417e-06, - "loss": 0.7217, - "step": 50431 - }, - { - "epoch": 1.29, - "learning_rate": 1.269138708409389e-06, - "loss": 0.583, - "step": 50432 - }, - { - "epoch": 1.29, - "learning_rate": 1.2691120588527692e-06, - "loss": 0.5945, - "step": 50433 - }, - { - "epoch": 1.29, - "learning_rate": 1.269085409090103e-06, - "loss": 0.5693, - "step": 50434 - }, - { - "epoch": 1.29, - "learning_rate": 1.26905875912141e-06, - "loss": 0.5391, - "step": 50435 - }, - { - "epoch": 1.29, - "learning_rate": 1.2690321089467114e-06, - "loss": 0.7441, - "step": 50436 - }, - { - "epoch": 1.29, - "learning_rate": 1.2690054585660272e-06, - "loss": 0.6572, - "step": 50437 - }, - { - "epoch": 1.29, - "learning_rate": 1.268978807979378e-06, - "loss": 0.4841, - "step": 50438 - }, - { - "epoch": 1.29, - "learning_rate": 1.268952157186784e-06, - "loss": 0.7178, - "step": 50439 - }, - { - "epoch": 1.29, - "learning_rate": 1.2689255061882656e-06, - "loss": 0.611, - "step": 50440 - }, - { - "epoch": 1.29, - "learning_rate": 1.2688988549838433e-06, - "loss": 0.6768, - "step": 50441 - }, - { - "epoch": 1.29, - "learning_rate": 1.2688722035735376e-06, - "loss": 0.563, - "step": 50442 - }, - { - "epoch": 1.29, - "learning_rate": 1.268845551957369e-06, - "loss": 0.6445, - "step": 50443 - }, - { - "epoch": 1.29, - "learning_rate": 1.2688189001353571e-06, - "loss": 0.7061, - "step": 50444 - }, - { - "epoch": 1.29, - "learning_rate": 1.2687922481075235e-06, - "loss": 0.6445, - "step": 50445 - }, - { - "epoch": 1.29, - "learning_rate": 1.268765595873888e-06, - "loss": 0.6343, - "step": 50446 - }, - { - "epoch": 1.29, - "learning_rate": 1.2687389434344709e-06, - "loss": 0.6387, - "step": 50447 - }, - { - "epoch": 1.29, - "learning_rate": 1.2687122907892928e-06, - "loss": 0.626, - "step": 50448 - }, - { - "epoch": 1.29, - "learning_rate": 1.268685637938374e-06, - "loss": 0.5562, - "step": 50449 - }, - { - "epoch": 1.29, - "learning_rate": 1.268658984881735e-06, - "loss": 0.6357, - "step": 50450 - }, - { - "epoch": 1.29, - "learning_rate": 1.2686323316193963e-06, - "loss": 0.5608, - "step": 50451 - }, - { - "epoch": 1.29, - "learning_rate": 1.2686056781513778e-06, - "loss": 0.6572, - "step": 50452 - }, - { - "epoch": 1.29, - "learning_rate": 1.2685790244777007e-06, - "loss": 0.6545, - "step": 50453 - }, - { - "epoch": 1.29, - "learning_rate": 1.2685523705983846e-06, - "loss": 0.5879, - "step": 50454 - }, - { - "epoch": 1.29, - "learning_rate": 1.2685257165134507e-06, - "loss": 0.4255, - "step": 50455 - }, - { - "epoch": 1.29, - "learning_rate": 1.2684990622229187e-06, - "loss": 0.5488, - "step": 50456 - }, - { - "epoch": 1.29, - "learning_rate": 1.2684724077268097e-06, - "loss": 0.7637, - "step": 50457 - }, - { - "epoch": 1.29, - "learning_rate": 1.2684457530251432e-06, - "loss": 0.613, - "step": 50458 - }, - { - "epoch": 1.29, - "learning_rate": 1.2684190981179403e-06, - "loss": 0.7715, - "step": 50459 - }, - { - "epoch": 1.29, - "learning_rate": 1.2683924430052213e-06, - "loss": 0.5693, - "step": 50460 - }, - { - "epoch": 1.29, - "learning_rate": 1.2683657876870067e-06, - "loss": 0.6897, - "step": 50461 - }, - { - "epoch": 1.29, - "learning_rate": 1.2683391321633165e-06, - "loss": 0.5952, - "step": 50462 - }, - { - "epoch": 1.29, - "learning_rate": 1.2683124764341714e-06, - "loss": 0.5889, - "step": 50463 - }, - { - "epoch": 1.29, - "learning_rate": 1.268285820499592e-06, - "loss": 0.7266, - "step": 50464 - }, - { - "epoch": 1.29, - "learning_rate": 1.2682591643595984e-06, - "loss": 0.5304, - "step": 50465 - }, - { - "epoch": 1.29, - "learning_rate": 1.268232508014211e-06, - "loss": 0.6416, - "step": 50466 - }, - { - "epoch": 1.29, - "learning_rate": 1.2682058514634504e-06, - "loss": 0.8398, - "step": 50467 - }, - { - "epoch": 1.29, - "learning_rate": 1.2681791947073368e-06, - "loss": 0.5999, - "step": 50468 - }, - { - "epoch": 1.29, - "learning_rate": 1.2681525377458905e-06, - "loss": 0.7275, - "step": 50469 - }, - { - "epoch": 1.29, - "learning_rate": 1.2681258805791326e-06, - "loss": 0.5732, - "step": 50470 - }, - { - "epoch": 1.29, - "learning_rate": 1.2680992232070828e-06, - "loss": 0.8291, - "step": 50471 - }, - { - "epoch": 1.29, - "learning_rate": 1.2680725656297619e-06, - "loss": 0.4656, - "step": 50472 - }, - { - "epoch": 1.29, - "learning_rate": 1.26804590784719e-06, - "loss": 0.6724, - "step": 50473 - }, - { - "epoch": 1.29, - "learning_rate": 1.2680192498593878e-06, - "loss": 0.543, - "step": 50474 - }, - { - "epoch": 1.29, - "learning_rate": 1.2679925916663753e-06, - "loss": 0.6133, - "step": 50475 - }, - { - "epoch": 1.29, - "learning_rate": 1.2679659332681738e-06, - "loss": 0.6353, - "step": 50476 - }, - { - "epoch": 1.29, - "learning_rate": 1.2679392746648026e-06, - "loss": 0.5774, - "step": 50477 - }, - { - "epoch": 1.29, - "learning_rate": 1.2679126158562826e-06, - "loss": 0.4004, - "step": 50478 - }, - { - "epoch": 1.29, - "learning_rate": 1.2678859568426344e-06, - "loss": 0.5854, - "step": 50479 - }, - { - "epoch": 1.29, - "learning_rate": 1.2678592976238783e-06, - "loss": 0.6924, - "step": 50480 - }, - { - "epoch": 1.29, - "learning_rate": 1.2678326382000346e-06, - "loss": 0.6494, - "step": 50481 - }, - { - "epoch": 1.29, - "learning_rate": 1.2678059785711237e-06, - "loss": 0.6128, - "step": 50482 - }, - { - "epoch": 1.29, - "learning_rate": 1.267779318737166e-06, - "loss": 0.5361, - "step": 50483 - }, - { - "epoch": 1.29, - "learning_rate": 1.2677526586981821e-06, - "loss": 0.6777, - "step": 50484 - }, - { - "epoch": 1.29, - "learning_rate": 1.2677259984541922e-06, - "loss": 0.7295, - "step": 50485 - }, - { - "epoch": 1.29, - "learning_rate": 1.267699338005217e-06, - "loss": 0.6387, - "step": 50486 - }, - { - "epoch": 1.29, - "learning_rate": 1.2676726773512767e-06, - "loss": 0.7129, - "step": 50487 - }, - { - "epoch": 1.29, - "learning_rate": 1.2676460164923915e-06, - "loss": 0.8672, - "step": 50488 - }, - { - "epoch": 1.29, - "learning_rate": 1.2676193554285823e-06, - "loss": 0.6484, - "step": 50489 - }, - { - "epoch": 1.29, - "learning_rate": 1.2675926941598691e-06, - "loss": 0.6982, - "step": 50490 - }, - { - "epoch": 1.29, - "learning_rate": 1.2675660326862726e-06, - "loss": 0.6152, - "step": 50491 - }, - { - "epoch": 1.29, - "learning_rate": 1.267539371007813e-06, - "loss": 0.7144, - "step": 50492 - }, - { - "epoch": 1.29, - "learning_rate": 1.267512709124511e-06, - "loss": 0.6748, - "step": 50493 - }, - { - "epoch": 1.29, - "learning_rate": 1.2674860470363867e-06, - "loss": 0.4336, - "step": 50494 - }, - { - "epoch": 1.29, - "learning_rate": 1.2674593847434607e-06, - "loss": 0.7725, - "step": 50495 - }, - { - "epoch": 1.29, - "learning_rate": 1.2674327222457533e-06, - "loss": 0.7998, - "step": 50496 - }, - { - "epoch": 1.29, - "learning_rate": 1.267406059543285e-06, - "loss": 0.6738, - "step": 50497 - }, - { - "epoch": 1.29, - "learning_rate": 1.267379396636076e-06, - "loss": 0.5049, - "step": 50498 - }, - { - "epoch": 1.29, - "learning_rate": 1.267352733524147e-06, - "loss": 0.7754, - "step": 50499 - }, - { - "epoch": 1.29, - "learning_rate": 1.267326070207518e-06, - "loss": 0.645, - "step": 50500 - }, - { - "epoch": 1.29, - "learning_rate": 1.2672994066862103e-06, - "loss": 0.584, - "step": 50501 - }, - { - "epoch": 1.29, - "learning_rate": 1.2672727429602435e-06, - "loss": 0.5985, - "step": 50502 - }, - { - "epoch": 1.29, - "learning_rate": 1.2672460790296382e-06, - "loss": 0.645, - "step": 50503 - }, - { - "epoch": 1.29, - "learning_rate": 1.2672194148944147e-06, - "loss": 0.8408, - "step": 50504 - }, - { - "epoch": 1.29, - "learning_rate": 1.2671927505545938e-06, - "loss": 0.6001, - "step": 50505 - }, - { - "epoch": 1.29, - "learning_rate": 1.2671660860101959e-06, - "loss": 0.5146, - "step": 50506 - }, - { - "epoch": 1.29, - "learning_rate": 1.2671394212612407e-06, - "loss": 0.5103, - "step": 50507 - }, - { - "epoch": 1.29, - "learning_rate": 1.2671127563077493e-06, - "loss": 0.7236, - "step": 50508 - }, - { - "epoch": 1.29, - "learning_rate": 1.2670860911497418e-06, - "loss": 0.7783, - "step": 50509 - }, - { - "epoch": 1.29, - "learning_rate": 1.2670594257872394e-06, - "loss": 0.5986, - "step": 50510 - }, - { - "epoch": 1.29, - "learning_rate": 1.2670327602202613e-06, - "loss": 0.6245, - "step": 50511 - }, - { - "epoch": 1.29, - "learning_rate": 1.2670060944488288e-06, - "loss": 0.5947, - "step": 50512 - }, - { - "epoch": 1.29, - "learning_rate": 1.2669794284729616e-06, - "loss": 0.7363, - "step": 50513 - }, - { - "epoch": 1.29, - "learning_rate": 1.266952762292681e-06, - "loss": 0.7266, - "step": 50514 - }, - { - "epoch": 1.29, - "learning_rate": 1.2669260959080066e-06, - "loss": 0.7725, - "step": 50515 - }, - { - "epoch": 1.29, - "learning_rate": 1.2668994293189594e-06, - "loss": 0.7549, - "step": 50516 - }, - { - "epoch": 1.29, - "learning_rate": 1.2668727625255596e-06, - "loss": 0.4727, - "step": 50517 - }, - { - "epoch": 1.29, - "learning_rate": 1.2668460955278274e-06, - "loss": 0.7236, - "step": 50518 - }, - { - "epoch": 1.29, - "learning_rate": 1.2668194283257833e-06, - "loss": 0.792, - "step": 50519 - }, - { - "epoch": 1.29, - "learning_rate": 1.2667927609194482e-06, - "loss": 0.7363, - "step": 50520 - }, - { - "epoch": 1.29, - "learning_rate": 1.266766093308842e-06, - "loss": 0.5232, - "step": 50521 - }, - { - "epoch": 1.29, - "learning_rate": 1.2667394254939854e-06, - "loss": 0.4951, - "step": 50522 - }, - { - "epoch": 1.29, - "learning_rate": 1.2667127574748984e-06, - "loss": 0.6201, - "step": 50523 - }, - { - "epoch": 1.29, - "learning_rate": 1.2666860892516017e-06, - "loss": 0.7017, - "step": 50524 - }, - { - "epoch": 1.29, - "learning_rate": 1.2666594208241159e-06, - "loss": 0.7891, - "step": 50525 - }, - { - "epoch": 1.3, - "learning_rate": 1.2666327521924612e-06, - "loss": 0.751, - "step": 50526 - }, - { - "epoch": 1.3, - "learning_rate": 1.2666060833566583e-06, - "loss": 0.6255, - "step": 50527 - }, - { - "epoch": 1.3, - "learning_rate": 1.2665794143167272e-06, - "loss": 0.6895, - "step": 50528 - }, - { - "epoch": 1.3, - "learning_rate": 1.2665527450726882e-06, - "loss": 0.5703, - "step": 50529 - }, - { - "epoch": 1.3, - "learning_rate": 1.2665260756245624e-06, - "loss": 0.6729, - "step": 50530 - }, - { - "epoch": 1.3, - "learning_rate": 1.2664994059723696e-06, - "loss": 0.4368, - "step": 50531 - }, - { - "epoch": 1.3, - "learning_rate": 1.2664727361161304e-06, - "loss": 0.7285, - "step": 50532 - }, - { - "epoch": 1.3, - "learning_rate": 1.2664460660558657e-06, - "loss": 0.624, - "step": 50533 - }, - { - "epoch": 1.3, - "learning_rate": 1.2664193957915949e-06, - "loss": 0.668, - "step": 50534 - }, - { - "epoch": 1.3, - "learning_rate": 1.2663927253233398e-06, - "loss": 0.5796, - "step": 50535 - }, - { - "epoch": 1.3, - "learning_rate": 1.2663660546511195e-06, - "loss": 0.6318, - "step": 50536 - }, - { - "epoch": 1.3, - "learning_rate": 1.2663393837749552e-06, - "loss": 0.6768, - "step": 50537 - }, - { - "epoch": 1.3, - "learning_rate": 1.2663127126948667e-06, - "loss": 0.3779, - "step": 50538 - }, - { - "epoch": 1.3, - "learning_rate": 1.266286041410875e-06, - "loss": 0.6992, - "step": 50539 - }, - { - "epoch": 1.3, - "learning_rate": 1.2662593699230005e-06, - "loss": 0.6855, - "step": 50540 - }, - { - "epoch": 1.3, - "learning_rate": 1.2662326982312634e-06, - "loss": 0.5371, - "step": 50541 - }, - { - "epoch": 1.3, - "learning_rate": 1.266206026335684e-06, - "loss": 0.5234, - "step": 50542 - }, - { - "epoch": 1.3, - "learning_rate": 1.2661793542362831e-06, - "loss": 0.6814, - "step": 50543 - }, - { - "epoch": 1.3, - "learning_rate": 1.2661526819330805e-06, - "loss": 0.7637, - "step": 50544 - }, - { - "epoch": 1.3, - "learning_rate": 1.2661260094260974e-06, - "loss": 0.6348, - "step": 50545 - }, - { - "epoch": 1.3, - "learning_rate": 1.2660993367153538e-06, - "loss": 0.5022, - "step": 50546 - }, - { - "epoch": 1.3, - "learning_rate": 1.2660726638008702e-06, - "loss": 0.4722, - "step": 50547 - }, - { - "epoch": 1.3, - "learning_rate": 1.2660459906826668e-06, - "loss": 0.7324, - "step": 50548 - }, - { - "epoch": 1.3, - "learning_rate": 1.2660193173607644e-06, - "loss": 0.6797, - "step": 50549 - }, - { - "epoch": 1.3, - "learning_rate": 1.265992643835183e-06, - "loss": 0.8184, - "step": 50550 - }, - { - "epoch": 1.3, - "learning_rate": 1.2659659701059435e-06, - "loss": 0.6025, - "step": 50551 - }, - { - "epoch": 1.3, - "learning_rate": 1.2659392961730663e-06, - "loss": 0.4937, - "step": 50552 - }, - { - "epoch": 1.3, - "learning_rate": 1.265912622036571e-06, - "loss": 0.4854, - "step": 50553 - }, - { - "epoch": 1.3, - "learning_rate": 1.265885947696479e-06, - "loss": 0.7588, - "step": 50554 - }, - { - "epoch": 1.3, - "learning_rate": 1.2658592731528102e-06, - "loss": 0.7354, - "step": 50555 - }, - { - "epoch": 1.3, - "learning_rate": 1.2658325984055855e-06, - "loss": 0.7129, - "step": 50556 - }, - { - "epoch": 1.3, - "learning_rate": 1.265805923454825e-06, - "loss": 0.7383, - "step": 50557 - }, - { - "epoch": 1.3, - "learning_rate": 1.2657792483005488e-06, - "loss": 0.6274, - "step": 50558 - }, - { - "epoch": 1.3, - "learning_rate": 1.2657525729427777e-06, - "loss": 0.6807, - "step": 50559 - }, - { - "epoch": 1.3, - "learning_rate": 1.265725897381532e-06, - "loss": 0.751, - "step": 50560 - }, - { - "epoch": 1.3, - "learning_rate": 1.2656992216168325e-06, - "loss": 0.6416, - "step": 50561 - }, - { - "epoch": 1.3, - "learning_rate": 1.2656725456486994e-06, - "loss": 0.5779, - "step": 50562 - }, - { - "epoch": 1.3, - "learning_rate": 1.2656458694771526e-06, - "loss": 0.5469, - "step": 50563 - }, - { - "epoch": 1.3, - "learning_rate": 1.2656191931022132e-06, - "loss": 0.5129, - "step": 50564 - }, - { - "epoch": 1.3, - "learning_rate": 1.2655925165239013e-06, - "loss": 0.7441, - "step": 50565 - }, - { - "epoch": 1.3, - "learning_rate": 1.2655658397422377e-06, - "loss": 0.8076, - "step": 50566 - }, - { - "epoch": 1.3, - "learning_rate": 1.2655391627572423e-06, - "loss": 0.6074, - "step": 50567 - }, - { - "epoch": 1.3, - "learning_rate": 1.2655124855689358e-06, - "loss": 0.6665, - "step": 50568 - }, - { - "epoch": 1.3, - "learning_rate": 1.2654858081773388e-06, - "loss": 0.5918, - "step": 50569 - }, - { - "epoch": 1.3, - "learning_rate": 1.2654591305824713e-06, - "loss": 0.6177, - "step": 50570 - }, - { - "epoch": 1.3, - "learning_rate": 1.265432452784354e-06, - "loss": 0.5288, - "step": 50571 - }, - { - "epoch": 1.3, - "learning_rate": 1.2654057747830072e-06, - "loss": 0.7119, - "step": 50572 - }, - { - "epoch": 1.3, - "learning_rate": 1.2653790965784517e-06, - "loss": 0.3145, - "step": 50573 - }, - { - "epoch": 1.3, - "learning_rate": 1.2653524181707074e-06, - "loss": 0.5366, - "step": 50574 - }, - { - "epoch": 1.3, - "learning_rate": 1.2653257395597946e-06, - "loss": 0.7266, - "step": 50575 - }, - { - "epoch": 1.3, - "learning_rate": 1.2652990607457348e-06, - "loss": 0.6514, - "step": 50576 - }, - { - "epoch": 1.3, - "learning_rate": 1.2652723817285473e-06, - "loss": 0.5879, - "step": 50577 - }, - { - "epoch": 1.3, - "learning_rate": 1.2652457025082528e-06, - "loss": 0.6499, - "step": 50578 - }, - { - "epoch": 1.3, - "learning_rate": 1.2652190230848723e-06, - "loss": 0.7676, - "step": 50579 - }, - { - "epoch": 1.3, - "learning_rate": 1.2651923434584253e-06, - "loss": 0.5728, - "step": 50580 - }, - { - "epoch": 1.3, - "learning_rate": 1.2651656636289332e-06, - "loss": 0.626, - "step": 50581 - }, - { - "epoch": 1.3, - "learning_rate": 1.2651389835964156e-06, - "loss": 0.5157, - "step": 50582 - }, - { - "epoch": 1.3, - "learning_rate": 1.2651123033608934e-06, - "loss": 0.6157, - "step": 50583 - }, - { - "epoch": 1.3, - "learning_rate": 1.2650856229223868e-06, - "loss": 0.6768, - "step": 50584 - }, - { - "epoch": 1.3, - "learning_rate": 1.2650589422809165e-06, - "loss": 0.5918, - "step": 50585 - }, - { - "epoch": 1.3, - "learning_rate": 1.2650322614365027e-06, - "loss": 0.8799, - "step": 50586 - }, - { - "epoch": 1.3, - "learning_rate": 1.265005580389166e-06, - "loss": 0.6777, - "step": 50587 - }, - { - "epoch": 1.3, - "learning_rate": 1.2649788991389263e-06, - "loss": 0.5126, - "step": 50588 - }, - { - "epoch": 1.3, - "learning_rate": 1.2649522176858048e-06, - "loss": 0.6493, - "step": 50589 - }, - { - "epoch": 1.3, - "learning_rate": 1.2649255360298213e-06, - "loss": 0.5625, - "step": 50590 - }, - { - "epoch": 1.3, - "learning_rate": 1.2648988541709971e-06, - "loss": 0.6514, - "step": 50591 - }, - { - "epoch": 1.3, - "learning_rate": 1.2648721721093511e-06, - "loss": 0.4382, - "step": 50592 - }, - { - "epoch": 1.3, - "learning_rate": 1.2648454898449055e-06, - "loss": 0.594, - "step": 50593 - }, - { - "epoch": 1.3, - "learning_rate": 1.2648188073776794e-06, - "loss": 0.7158, - "step": 50594 - }, - { - "epoch": 1.3, - "learning_rate": 1.2647921247076939e-06, - "loss": 0.5151, - "step": 50595 - }, - { - "epoch": 1.3, - "learning_rate": 1.2647654418349691e-06, - "loss": 0.6602, - "step": 50596 - }, - { - "epoch": 1.3, - "learning_rate": 1.2647387587595257e-06, - "loss": 0.7109, - "step": 50597 - }, - { - "epoch": 1.3, - "learning_rate": 1.264712075481384e-06, - "loss": 0.6543, - "step": 50598 - }, - { - "epoch": 1.3, - "learning_rate": 1.2646853920005642e-06, - "loss": 0.748, - "step": 50599 - }, - { - "epoch": 1.3, - "learning_rate": 1.2646587083170875e-06, - "loss": 0.6875, - "step": 50600 - }, - { - "epoch": 1.3, - "learning_rate": 1.2646320244309734e-06, - "loss": 0.6105, - "step": 50601 - }, - { - "epoch": 1.3, - "learning_rate": 1.2646053403422428e-06, - "loss": 0.7217, - "step": 50602 - }, - { - "epoch": 1.3, - "learning_rate": 1.264578656050916e-06, - "loss": 0.5803, - "step": 50603 - }, - { - "epoch": 1.3, - "learning_rate": 1.2645519715570134e-06, - "loss": 0.5093, - "step": 50604 - }, - { - "epoch": 1.3, - "learning_rate": 1.2645252868605556e-06, - "loss": 0.7344, - "step": 50605 - }, - { - "epoch": 1.3, - "learning_rate": 1.2644986019615633e-06, - "loss": 0.7109, - "step": 50606 - }, - { - "epoch": 1.3, - "learning_rate": 1.2644719168600562e-06, - "loss": 0.6484, - "step": 50607 - }, - { - "epoch": 1.3, - "learning_rate": 1.2644452315560555e-06, - "loss": 0.8389, - "step": 50608 - }, - { - "epoch": 1.3, - "learning_rate": 1.2644185460495807e-06, - "loss": 0.6934, - "step": 50609 - }, - { - "epoch": 1.3, - "learning_rate": 1.2643918603406532e-06, - "loss": 0.5457, - "step": 50610 - }, - { - "epoch": 1.3, - "learning_rate": 1.2643651744292928e-06, - "loss": 0.7871, - "step": 50611 - }, - { - "epoch": 1.3, - "learning_rate": 1.2643384883155204e-06, - "loss": 0.6758, - "step": 50612 - }, - { - "epoch": 1.3, - "learning_rate": 1.2643118019993558e-06, - "loss": 0.7314, - "step": 50613 - }, - { - "epoch": 1.3, - "learning_rate": 1.2642851154808197e-06, - "loss": 0.6162, - "step": 50614 - }, - { - "epoch": 1.3, - "learning_rate": 1.2642584287599328e-06, - "loss": 0.7344, - "step": 50615 - }, - { - "epoch": 1.3, - "learning_rate": 1.2642317418367156e-06, - "loss": 0.6602, - "step": 50616 - }, - { - "epoch": 1.3, - "learning_rate": 1.2642050547111884e-06, - "loss": 0.7998, - "step": 50617 - }, - { - "epoch": 1.3, - "learning_rate": 1.2641783673833714e-06, - "loss": 0.4782, - "step": 50618 - }, - { - "epoch": 1.3, - "learning_rate": 1.264151679853285e-06, - "loss": 0.6108, - "step": 50619 - }, - { - "epoch": 1.3, - "learning_rate": 1.26412499212095e-06, - "loss": 0.7979, - "step": 50620 - }, - { - "epoch": 1.3, - "learning_rate": 1.2640983041863865e-06, - "loss": 0.8135, - "step": 50621 - }, - { - "epoch": 1.3, - "learning_rate": 1.264071616049615e-06, - "loss": 0.618, - "step": 50622 - }, - { - "epoch": 1.3, - "learning_rate": 1.264044927710656e-06, - "loss": 0.6055, - "step": 50623 - }, - { - "epoch": 1.3, - "learning_rate": 1.26401823916953e-06, - "loss": 0.7188, - "step": 50624 - }, - { - "epoch": 1.3, - "learning_rate": 1.2639915504262576e-06, - "loss": 0.531, - "step": 50625 - }, - { - "epoch": 1.3, - "learning_rate": 1.263964861480859e-06, - "loss": 0.707, - "step": 50626 - }, - { - "epoch": 1.3, - "learning_rate": 1.2639381723333543e-06, - "loss": 0.4424, - "step": 50627 - }, - { - "epoch": 1.3, - "learning_rate": 1.2639114829837644e-06, - "loss": 0.5132, - "step": 50628 - }, - { - "epoch": 1.3, - "learning_rate": 1.2638847934321097e-06, - "loss": 0.6523, - "step": 50629 - }, - { - "epoch": 1.3, - "learning_rate": 1.2638581036784105e-06, - "loss": 0.6904, - "step": 50630 - }, - { - "epoch": 1.3, - "learning_rate": 1.2638314137226877e-06, - "loss": 0.5146, - "step": 50631 - }, - { - "epoch": 1.3, - "learning_rate": 1.2638047235649608e-06, - "loss": 0.6836, - "step": 50632 - }, - { - "epoch": 1.3, - "learning_rate": 1.2637780332052508e-06, - "loss": 0.9482, - "step": 50633 - }, - { - "epoch": 1.3, - "learning_rate": 1.263751342643578e-06, - "loss": 0.79, - "step": 50634 - }, - { - "epoch": 1.3, - "learning_rate": 1.263724651879963e-06, - "loss": 0.7544, - "step": 50635 - }, - { - "epoch": 1.3, - "learning_rate": 1.2636979609144266e-06, - "loss": 0.6826, - "step": 50636 - }, - { - "epoch": 1.3, - "learning_rate": 1.2636712697469885e-06, - "loss": 0.6611, - "step": 50637 - }, - { - "epoch": 1.3, - "learning_rate": 1.2636445783776693e-06, - "loss": 0.4753, - "step": 50638 - }, - { - "epoch": 1.3, - "learning_rate": 1.2636178868064894e-06, - "loss": 0.8496, - "step": 50639 - }, - { - "epoch": 1.3, - "learning_rate": 1.2635911950334697e-06, - "loss": 0.6953, - "step": 50640 - }, - { - "epoch": 1.3, - "learning_rate": 1.2635645030586303e-06, - "loss": 0.7598, - "step": 50641 - }, - { - "epoch": 1.3, - "learning_rate": 1.263537810881992e-06, - "loss": 0.834, - "step": 50642 - }, - { - "epoch": 1.3, - "learning_rate": 1.2635111185035744e-06, - "loss": 0.8252, - "step": 50643 - }, - { - "epoch": 1.3, - "learning_rate": 1.2634844259233985e-06, - "loss": 0.8496, - "step": 50644 - }, - { - "epoch": 1.3, - "learning_rate": 1.263457733141485e-06, - "loss": 0.623, - "step": 50645 - }, - { - "epoch": 1.3, - "learning_rate": 1.2634310401578541e-06, - "loss": 0.7749, - "step": 50646 - }, - { - "epoch": 1.3, - "learning_rate": 1.2634043469725257e-06, - "loss": 0.5986, - "step": 50647 - }, - { - "epoch": 1.3, - "learning_rate": 1.263377653585521e-06, - "loss": 0.6387, - "step": 50648 - }, - { - "epoch": 1.3, - "learning_rate": 1.2633509599968599e-06, - "loss": 0.6104, - "step": 50649 - }, - { - "epoch": 1.3, - "learning_rate": 1.2633242662065634e-06, - "loss": 0.6602, - "step": 50650 - }, - { - "epoch": 1.3, - "learning_rate": 1.2632975722146514e-06, - "loss": 0.6475, - "step": 50651 - }, - { - "epoch": 1.3, - "learning_rate": 1.2632708780211448e-06, - "loss": 0.6963, - "step": 50652 - }, - { - "epoch": 1.3, - "learning_rate": 1.2632441836260633e-06, - "loss": 0.7383, - "step": 50653 - }, - { - "epoch": 1.3, - "learning_rate": 1.2632174890294283e-06, - "loss": 0.6733, - "step": 50654 - }, - { - "epoch": 1.3, - "learning_rate": 1.2631907942312596e-06, - "loss": 0.7461, - "step": 50655 - }, - { - "epoch": 1.3, - "learning_rate": 1.2631640992315779e-06, - "loss": 0.5879, - "step": 50656 - }, - { - "epoch": 1.3, - "learning_rate": 1.2631374040304034e-06, - "loss": 0.7119, - "step": 50657 - }, - { - "epoch": 1.3, - "learning_rate": 1.2631107086277568e-06, - "loss": 0.8174, - "step": 50658 - }, - { - "epoch": 1.3, - "learning_rate": 1.2630840130236584e-06, - "loss": 0.5454, - "step": 50659 - }, - { - "epoch": 1.3, - "learning_rate": 1.2630573172181287e-06, - "loss": 0.6055, - "step": 50660 - }, - { - "epoch": 1.3, - "learning_rate": 1.263030621211188e-06, - "loss": 0.6826, - "step": 50661 - }, - { - "epoch": 1.3, - "learning_rate": 1.2630039250028568e-06, - "loss": 0.6909, - "step": 50662 - }, - { - "epoch": 1.3, - "learning_rate": 1.262977228593156e-06, - "loss": 0.5112, - "step": 50663 - }, - { - "epoch": 1.3, - "learning_rate": 1.2629505319821055e-06, - "loss": 0.7285, - "step": 50664 - }, - { - "epoch": 1.3, - "learning_rate": 1.2629238351697253e-06, - "loss": 0.8047, - "step": 50665 - }, - { - "epoch": 1.3, - "learning_rate": 1.262897138156037e-06, - "loss": 0.7744, - "step": 50666 - }, - { - "epoch": 1.3, - "learning_rate": 1.2628704409410605e-06, - "loss": 0.6729, - "step": 50667 - }, - { - "epoch": 1.3, - "learning_rate": 1.2628437435248157e-06, - "loss": 0.7256, - "step": 50668 - }, - { - "epoch": 1.3, - "learning_rate": 1.2628170459073238e-06, - "loss": 0.666, - "step": 50669 - }, - { - "epoch": 1.3, - "learning_rate": 1.2627903480886049e-06, - "loss": 0.7754, - "step": 50670 - }, - { - "epoch": 1.3, - "learning_rate": 1.2627636500686798e-06, - "loss": 0.603, - "step": 50671 - }, - { - "epoch": 1.3, - "learning_rate": 1.2627369518475682e-06, - "loss": 0.6016, - "step": 50672 - }, - { - "epoch": 1.3, - "learning_rate": 1.2627102534252915e-06, - "loss": 0.5757, - "step": 50673 - }, - { - "epoch": 1.3, - "learning_rate": 1.262683554801869e-06, - "loss": 0.6216, - "step": 50674 - }, - { - "epoch": 1.3, - "learning_rate": 1.2626568559773226e-06, - "loss": 0.5913, - "step": 50675 - }, - { - "epoch": 1.3, - "learning_rate": 1.2626301569516713e-06, - "loss": 0.6553, - "step": 50676 - }, - { - "epoch": 1.3, - "learning_rate": 1.2626034577249365e-06, - "loss": 0.7041, - "step": 50677 - }, - { - "epoch": 1.3, - "learning_rate": 1.2625767582971378e-06, - "loss": 0.6436, - "step": 50678 - }, - { - "epoch": 1.3, - "learning_rate": 1.2625500586682966e-06, - "loss": 0.6592, - "step": 50679 - }, - { - "epoch": 1.3, - "learning_rate": 1.262523358838433e-06, - "loss": 0.5879, - "step": 50680 - }, - { - "epoch": 1.3, - "learning_rate": 1.262496658807567e-06, - "loss": 0.7104, - "step": 50681 - }, - { - "epoch": 1.3, - "learning_rate": 1.2624699585757195e-06, - "loss": 0.8682, - "step": 50682 - }, - { - "epoch": 1.3, - "learning_rate": 1.2624432581429107e-06, - "loss": 0.6226, - "step": 50683 - }, - { - "epoch": 1.3, - "learning_rate": 1.2624165575091612e-06, - "loss": 0.7764, - "step": 50684 - }, - { - "epoch": 1.3, - "learning_rate": 1.2623898566744915e-06, - "loss": 0.7383, - "step": 50685 - }, - { - "epoch": 1.3, - "learning_rate": 1.262363155638922e-06, - "loss": 0.7627, - "step": 50686 - }, - { - "epoch": 1.3, - "learning_rate": 1.262336454402473e-06, - "loss": 0.6826, - "step": 50687 - }, - { - "epoch": 1.3, - "learning_rate": 1.2623097529651652e-06, - "loss": 0.7271, - "step": 50688 - }, - { - "epoch": 1.3, - "learning_rate": 1.2622830513270187e-06, - "loss": 0.8447, - "step": 50689 - }, - { - "epoch": 1.3, - "learning_rate": 1.2622563494880542e-06, - "loss": 0.4371, - "step": 50690 - }, - { - "epoch": 1.3, - "learning_rate": 1.262229647448292e-06, - "loss": 0.397, - "step": 50691 - }, - { - "epoch": 1.3, - "learning_rate": 1.2622029452077528e-06, - "loss": 0.5619, - "step": 50692 - }, - { - "epoch": 1.3, - "learning_rate": 1.2621762427664566e-06, - "loss": 0.7373, - "step": 50693 - }, - { - "epoch": 1.3, - "learning_rate": 1.2621495401244244e-06, - "loss": 0.6138, - "step": 50694 - }, - { - "epoch": 1.3, - "learning_rate": 1.262122837281676e-06, - "loss": 0.6392, - "step": 50695 - }, - { - "epoch": 1.3, - "learning_rate": 1.2620961342382326e-06, - "loss": 0.7676, - "step": 50696 - }, - { - "epoch": 1.3, - "learning_rate": 1.262069430994114e-06, - "loss": 0.4292, - "step": 50697 - }, - { - "epoch": 1.3, - "learning_rate": 1.262042727549341e-06, - "loss": 0.5288, - "step": 50698 - }, - { - "epoch": 1.3, - "learning_rate": 1.2620160239039336e-06, - "loss": 0.5557, - "step": 50699 - }, - { - "epoch": 1.3, - "learning_rate": 1.2619893200579133e-06, - "loss": 0.7023, - "step": 50700 - }, - { - "epoch": 1.3, - "learning_rate": 1.261962616011299e-06, - "loss": 0.5977, - "step": 50701 - }, - { - "epoch": 1.3, - "learning_rate": 1.2619359117641123e-06, - "loss": 0.5684, - "step": 50702 - }, - { - "epoch": 1.3, - "learning_rate": 1.2619092073163736e-06, - "loss": 0.6768, - "step": 50703 - }, - { - "epoch": 1.3, - "learning_rate": 1.2618825026681025e-06, - "loss": 0.7949, - "step": 50704 - }, - { - "epoch": 1.3, - "learning_rate": 1.2618557978193206e-06, - "loss": 0.4624, - "step": 50705 - }, - { - "epoch": 1.3, - "learning_rate": 1.2618290927700472e-06, - "loss": 0.5527, - "step": 50706 - }, - { - "epoch": 1.3, - "learning_rate": 1.2618023875203036e-06, - "loss": 0.7363, - "step": 50707 - }, - { - "epoch": 1.3, - "learning_rate": 1.2617756820701102e-06, - "loss": 0.5586, - "step": 50708 - }, - { - "epoch": 1.3, - "learning_rate": 1.2617489764194868e-06, - "loss": 0.6758, - "step": 50709 - }, - { - "epoch": 1.3, - "learning_rate": 1.2617222705684544e-06, - "loss": 0.667, - "step": 50710 - }, - { - "epoch": 1.3, - "learning_rate": 1.2616955645170333e-06, - "loss": 0.7422, - "step": 50711 - }, - { - "epoch": 1.3, - "learning_rate": 1.2616688582652437e-06, - "loss": 0.6987, - "step": 50712 - }, - { - "epoch": 1.3, - "learning_rate": 1.2616421518131066e-06, - "loss": 0.7148, - "step": 50713 - }, - { - "epoch": 1.3, - "learning_rate": 1.261615445160642e-06, - "loss": 0.5798, - "step": 50714 - }, - { - "epoch": 1.3, - "learning_rate": 1.2615887383078708e-06, - "loss": 0.5874, - "step": 50715 - }, - { - "epoch": 1.3, - "learning_rate": 1.2615620312548124e-06, - "loss": 0.5767, - "step": 50716 - }, - { - "epoch": 1.3, - "learning_rate": 1.2615353240014886e-06, - "loss": 0.8008, - "step": 50717 - }, - { - "epoch": 1.3, - "learning_rate": 1.261508616547919e-06, - "loss": 0.5562, - "step": 50718 - }, - { - "epoch": 1.3, - "learning_rate": 1.2614819088941243e-06, - "loss": 0.5288, - "step": 50719 - }, - { - "epoch": 1.3, - "learning_rate": 1.2614552010401251e-06, - "loss": 0.7024, - "step": 50720 - }, - { - "epoch": 1.3, - "learning_rate": 1.2614284929859416e-06, - "loss": 0.6206, - "step": 50721 - }, - { - "epoch": 1.3, - "learning_rate": 1.261401784731594e-06, - "loss": 0.6357, - "step": 50722 - }, - { - "epoch": 1.3, - "learning_rate": 1.2613750762771033e-06, - "loss": 0.6577, - "step": 50723 - }, - { - "epoch": 1.3, - "learning_rate": 1.2613483676224897e-06, - "loss": 0.8184, - "step": 50724 - }, - { - "epoch": 1.3, - "learning_rate": 1.2613216587677736e-06, - "loss": 0.5674, - "step": 50725 - }, - { - "epoch": 1.3, - "learning_rate": 1.261294949712976e-06, - "loss": 0.6567, - "step": 50726 - }, - { - "epoch": 1.3, - "learning_rate": 1.2612682404581166e-06, - "loss": 0.8291, - "step": 50727 - }, - { - "epoch": 1.3, - "learning_rate": 1.2612415310032156e-06, - "loss": 0.592, - "step": 50728 - }, - { - "epoch": 1.3, - "learning_rate": 1.2612148213482944e-06, - "loss": 0.8555, - "step": 50729 - }, - { - "epoch": 1.3, - "learning_rate": 1.2611881114933732e-06, - "loss": 0.5913, - "step": 50730 - }, - { - "epoch": 1.3, - "learning_rate": 1.261161401438472e-06, - "loss": 0.6279, - "step": 50731 - }, - { - "epoch": 1.3, - "learning_rate": 1.2611346911836118e-06, - "loss": 0.5986, - "step": 50732 - }, - { - "epoch": 1.3, - "learning_rate": 1.2611079807288124e-06, - "loss": 0.6748, - "step": 50733 - }, - { - "epoch": 1.3, - "learning_rate": 1.261081270074095e-06, - "loss": 0.5793, - "step": 50734 - }, - { - "epoch": 1.3, - "learning_rate": 1.2610545592194795e-06, - "loss": 0.7949, - "step": 50735 - }, - { - "epoch": 1.3, - "learning_rate": 1.2610278481649864e-06, - "loss": 0.5864, - "step": 50736 - }, - { - "epoch": 1.3, - "learning_rate": 1.2610011369106364e-06, - "loss": 0.8076, - "step": 50737 - }, - { - "epoch": 1.3, - "learning_rate": 1.26097442545645e-06, - "loss": 0.6689, - "step": 50738 - }, - { - "epoch": 1.3, - "learning_rate": 1.260947713802447e-06, - "loss": 0.7109, - "step": 50739 - }, - { - "epoch": 1.3, - "learning_rate": 1.2609210019486489e-06, - "loss": 0.5571, - "step": 50740 - }, - { - "epoch": 1.3, - "learning_rate": 1.2608942898950752e-06, - "loss": 0.6855, - "step": 50741 - }, - { - "epoch": 1.3, - "learning_rate": 1.260867577641747e-06, - "loss": 0.5916, - "step": 50742 - }, - { - "epoch": 1.3, - "learning_rate": 1.2608408651886842e-06, - "loss": 0.8525, - "step": 50743 - }, - { - "epoch": 1.3, - "learning_rate": 1.2608141525359077e-06, - "loss": 0.4844, - "step": 50744 - }, - { - "epoch": 1.3, - "learning_rate": 1.260787439683438e-06, - "loss": 0.5688, - "step": 50745 - }, - { - "epoch": 1.3, - "learning_rate": 1.2607607266312953e-06, - "loss": 0.5139, - "step": 50746 - }, - { - "epoch": 1.3, - "learning_rate": 1.2607340133794997e-06, - "loss": 0.4103, - "step": 50747 - }, - { - "epoch": 1.3, - "learning_rate": 1.2607072999280724e-06, - "loss": 0.7007, - "step": 50748 - }, - { - "epoch": 1.3, - "learning_rate": 1.2606805862770333e-06, - "loss": 0.6138, - "step": 50749 - }, - { - "epoch": 1.3, - "learning_rate": 1.2606538724264032e-06, - "loss": 0.5413, - "step": 50750 - }, - { - "epoch": 1.3, - "learning_rate": 1.2606271583762026e-06, - "loss": 0.6099, - "step": 50751 - }, - { - "epoch": 1.3, - "learning_rate": 1.2606004441264512e-06, - "loss": 0.7031, - "step": 50752 - }, - { - "epoch": 1.3, - "learning_rate": 1.2605737296771706e-06, - "loss": 0.7173, - "step": 50753 - }, - { - "epoch": 1.3, - "learning_rate": 1.2605470150283805e-06, - "loss": 0.6016, - "step": 50754 - }, - { - "epoch": 1.3, - "learning_rate": 1.2605203001801014e-06, - "loss": 0.7461, - "step": 50755 - }, - { - "epoch": 1.3, - "learning_rate": 1.260493585132354e-06, - "loss": 0.6436, - "step": 50756 - }, - { - "epoch": 1.3, - "learning_rate": 1.2604668698851586e-06, - "loss": 0.6807, - "step": 50757 - }, - { - "epoch": 1.3, - "learning_rate": 1.2604401544385356e-06, - "loss": 0.5488, - "step": 50758 - }, - { - "epoch": 1.3, - "learning_rate": 1.2604134387925057e-06, - "loss": 0.6709, - "step": 50759 - }, - { - "epoch": 1.3, - "learning_rate": 1.2603867229470893e-06, - "loss": 0.6372, - "step": 50760 - }, - { - "epoch": 1.3, - "learning_rate": 1.2603600069023065e-06, - "loss": 0.5532, - "step": 50761 - }, - { - "epoch": 1.3, - "learning_rate": 1.2603332906581781e-06, - "loss": 0.5591, - "step": 50762 - }, - { - "epoch": 1.3, - "learning_rate": 1.2603065742147245e-06, - "loss": 0.5884, - "step": 50763 - }, - { - "epoch": 1.3, - "learning_rate": 1.260279857571966e-06, - "loss": 0.6914, - "step": 50764 - }, - { - "epoch": 1.3, - "learning_rate": 1.2602531407299237e-06, - "loss": 0.5601, - "step": 50765 - }, - { - "epoch": 1.3, - "learning_rate": 1.2602264236886169e-06, - "loss": 0.6807, - "step": 50766 - }, - { - "epoch": 1.3, - "learning_rate": 1.260199706448067e-06, - "loss": 0.6895, - "step": 50767 - }, - { - "epoch": 1.3, - "learning_rate": 1.2601729890082941e-06, - "loss": 0.7773, - "step": 50768 - }, - { - "epoch": 1.3, - "learning_rate": 1.2601462713693187e-06, - "loss": 0.4268, - "step": 50769 - }, - { - "epoch": 1.3, - "learning_rate": 1.2601195535311613e-06, - "loss": 0.6587, - "step": 50770 - }, - { - "epoch": 1.3, - "learning_rate": 1.2600928354938422e-06, - "loss": 0.583, - "step": 50771 - }, - { - "epoch": 1.3, - "learning_rate": 1.260066117257382e-06, - "loss": 0.6123, - "step": 50772 - }, - { - "epoch": 1.3, - "learning_rate": 1.2600393988218013e-06, - "loss": 0.6831, - "step": 50773 - }, - { - "epoch": 1.3, - "learning_rate": 1.26001268018712e-06, - "loss": 0.7031, - "step": 50774 - }, - { - "epoch": 1.3, - "learning_rate": 1.2599859613533595e-06, - "loss": 0.6626, - "step": 50775 - }, - { - "epoch": 1.3, - "learning_rate": 1.2599592423205395e-06, - "loss": 0.635, - "step": 50776 - }, - { - "epoch": 1.3, - "learning_rate": 1.2599325230886805e-06, - "loss": 0.5278, - "step": 50777 - }, - { - "epoch": 1.3, - "learning_rate": 1.2599058036578032e-06, - "loss": 0.6255, - "step": 50778 - }, - { - "epoch": 1.3, - "learning_rate": 1.2598790840279279e-06, - "loss": 0.5347, - "step": 50779 - }, - { - "epoch": 1.3, - "learning_rate": 1.2598523641990752e-06, - "loss": 0.5168, - "step": 50780 - }, - { - "epoch": 1.3, - "learning_rate": 1.2598256441712657e-06, - "loss": 0.748, - "step": 50781 - }, - { - "epoch": 1.3, - "learning_rate": 1.2597989239445195e-06, - "loss": 0.6533, - "step": 50782 - }, - { - "epoch": 1.3, - "learning_rate": 1.2597722035188569e-06, - "loss": 0.6572, - "step": 50783 - }, - { - "epoch": 1.3, - "learning_rate": 1.259745482894299e-06, - "loss": 0.6572, - "step": 50784 - }, - { - "epoch": 1.3, - "learning_rate": 1.259718762070866e-06, - "loss": 0.7422, - "step": 50785 - }, - { - "epoch": 1.3, - "learning_rate": 1.259692041048578e-06, - "loss": 0.6211, - "step": 50786 - }, - { - "epoch": 1.3, - "learning_rate": 1.259665319827456e-06, - "loss": 0.6182, - "step": 50787 - }, - { - "epoch": 1.3, - "learning_rate": 1.2596385984075203e-06, - "loss": 0.585, - "step": 50788 - }, - { - "epoch": 1.3, - "learning_rate": 1.2596118767887906e-06, - "loss": 0.7344, - "step": 50789 - }, - { - "epoch": 1.3, - "learning_rate": 1.259585154971289e-06, - "loss": 0.6099, - "step": 50790 - }, - { - "epoch": 1.3, - "learning_rate": 1.2595584329550343e-06, - "loss": 0.7412, - "step": 50791 - }, - { - "epoch": 1.3, - "learning_rate": 1.2595317107400478e-06, - "loss": 0.5796, - "step": 50792 - }, - { - "epoch": 1.3, - "learning_rate": 1.2595049883263498e-06, - "loss": 0.5483, - "step": 50793 - }, - { - "epoch": 1.3, - "learning_rate": 1.2594782657139607e-06, - "loss": 0.751, - "step": 50794 - }, - { - "epoch": 1.3, - "learning_rate": 1.259451542902901e-06, - "loss": 0.6187, - "step": 50795 - }, - { - "epoch": 1.3, - "learning_rate": 1.2594248198931915e-06, - "loss": 0.4541, - "step": 50796 - }, - { - "epoch": 1.3, - "learning_rate": 1.259398096684852e-06, - "loss": 0.7139, - "step": 50797 - }, - { - "epoch": 1.3, - "learning_rate": 1.2593713732779034e-06, - "loss": 0.6421, - "step": 50798 - }, - { - "epoch": 1.3, - "learning_rate": 1.259344649672366e-06, - "loss": 0.6777, - "step": 50799 - }, - { - "epoch": 1.3, - "learning_rate": 1.2593179258682605e-06, - "loss": 0.7129, - "step": 50800 - }, - { - "epoch": 1.3, - "learning_rate": 1.2592912018656072e-06, - "loss": 0.5869, - "step": 50801 - }, - { - "epoch": 1.3, - "learning_rate": 1.2592644776644264e-06, - "loss": 0.6709, - "step": 50802 - }, - { - "epoch": 1.3, - "learning_rate": 1.2592377532647389e-06, - "loss": 0.6074, - "step": 50803 - }, - { - "epoch": 1.3, - "learning_rate": 1.2592110286665647e-06, - "loss": 0.7588, - "step": 50804 - }, - { - "epoch": 1.3, - "learning_rate": 1.259184303869925e-06, - "loss": 0.5977, - "step": 50805 - }, - { - "epoch": 1.3, - "learning_rate": 1.2591575788748391e-06, - "loss": 0.4714, - "step": 50806 - }, - { - "epoch": 1.3, - "learning_rate": 1.2591308536813287e-06, - "loss": 0.5967, - "step": 50807 - }, - { - "epoch": 1.3, - "learning_rate": 1.2591041282894135e-06, - "loss": 0.5371, - "step": 50808 - }, - { - "epoch": 1.3, - "learning_rate": 1.2590774026991142e-06, - "loss": 0.6558, - "step": 50809 - }, - { - "epoch": 1.3, - "learning_rate": 1.2590506769104513e-06, - "loss": 0.7705, - "step": 50810 - }, - { - "epoch": 1.3, - "learning_rate": 1.2590239509234453e-06, - "loss": 0.5308, - "step": 50811 - }, - { - "epoch": 1.3, - "learning_rate": 1.2589972247381164e-06, - "loss": 0.6361, - "step": 50812 - }, - { - "epoch": 1.3, - "learning_rate": 1.2589704983544853e-06, - "loss": 0.71, - "step": 50813 - }, - { - "epoch": 1.3, - "learning_rate": 1.2589437717725724e-06, - "loss": 0.6675, - "step": 50814 - }, - { - "epoch": 1.3, - "learning_rate": 1.2589170449923981e-06, - "loss": 0.5933, - "step": 50815 - }, - { - "epoch": 1.3, - "learning_rate": 1.2588903180139832e-06, - "loss": 0.7666, - "step": 50816 - }, - { - "epoch": 1.3, - "learning_rate": 1.2588635908373477e-06, - "loss": 0.6553, - "step": 50817 - }, - { - "epoch": 1.3, - "learning_rate": 1.2588368634625119e-06, - "loss": 0.5845, - "step": 50818 - }, - { - "epoch": 1.3, - "learning_rate": 1.2588101358894972e-06, - "loss": 0.5825, - "step": 50819 - }, - { - "epoch": 1.3, - "learning_rate": 1.2587834081183234e-06, - "loss": 0.6885, - "step": 50820 - }, - { - "epoch": 1.3, - "learning_rate": 1.2587566801490104e-06, - "loss": 0.7646, - "step": 50821 - }, - { - "epoch": 1.3, - "learning_rate": 1.25872995198158e-06, - "loss": 0.6914, - "step": 50822 - }, - { - "epoch": 1.3, - "learning_rate": 1.2587032236160516e-06, - "loss": 0.6758, - "step": 50823 - }, - { - "epoch": 1.3, - "learning_rate": 1.2586764950524463e-06, - "loss": 0.5283, - "step": 50824 - }, - { - "epoch": 1.3, - "learning_rate": 1.2586497662907843e-06, - "loss": 0.7314, - "step": 50825 - }, - { - "epoch": 1.3, - "learning_rate": 1.2586230373310858e-06, - "loss": 0.7812, - "step": 50826 - }, - { - "epoch": 1.3, - "learning_rate": 1.2585963081733714e-06, - "loss": 0.6143, - "step": 50827 - }, - { - "epoch": 1.3, - "learning_rate": 1.2585695788176622e-06, - "loss": 0.6626, - "step": 50828 - }, - { - "epoch": 1.3, - "learning_rate": 1.2585428492639778e-06, - "loss": 0.5752, - "step": 50829 - }, - { - "epoch": 1.3, - "learning_rate": 1.2585161195123396e-06, - "loss": 0.6064, - "step": 50830 - }, - { - "epoch": 1.3, - "learning_rate": 1.2584893895627668e-06, - "loss": 0.6484, - "step": 50831 - }, - { - "epoch": 1.3, - "learning_rate": 1.2584626594152806e-06, - "loss": 0.6284, - "step": 50832 - }, - { - "epoch": 1.3, - "learning_rate": 1.258435929069902e-06, - "loss": 0.707, - "step": 50833 - }, - { - "epoch": 1.3, - "learning_rate": 1.2584091985266504e-06, - "loss": 0.7451, - "step": 50834 - }, - { - "epoch": 1.3, - "learning_rate": 1.2583824677855467e-06, - "loss": 0.8379, - "step": 50835 - }, - { - "epoch": 1.3, - "learning_rate": 1.258355736846612e-06, - "loss": 0.5146, - "step": 50836 - }, - { - "epoch": 1.3, - "learning_rate": 1.2583290057098657e-06, - "loss": 0.71, - "step": 50837 - }, - { - "epoch": 1.3, - "learning_rate": 1.2583022743753289e-06, - "loss": 0.5288, - "step": 50838 - }, - { - "epoch": 1.3, - "learning_rate": 1.2582755428430217e-06, - "loss": 0.6465, - "step": 50839 - }, - { - "epoch": 1.3, - "learning_rate": 1.258248811112965e-06, - "loss": 0.54, - "step": 50840 - }, - { - "epoch": 1.3, - "learning_rate": 1.2582220791851792e-06, - "loss": 0.5947, - "step": 50841 - }, - { - "epoch": 1.3, - "learning_rate": 1.2581953470596843e-06, - "loss": 0.7144, - "step": 50842 - }, - { - "epoch": 1.3, - "learning_rate": 1.2581686147365014e-06, - "loss": 0.667, - "step": 50843 - }, - { - "epoch": 1.3, - "learning_rate": 1.2581418822156505e-06, - "loss": 0.7295, - "step": 50844 - }, - { - "epoch": 1.3, - "learning_rate": 1.2581151494971525e-06, - "loss": 0.7344, - "step": 50845 - }, - { - "epoch": 1.3, - "learning_rate": 1.258088416581027e-06, - "loss": 0.627, - "step": 50846 - }, - { - "epoch": 1.3, - "learning_rate": 1.2580616834672957e-06, - "loss": 0.6943, - "step": 50847 - }, - { - "epoch": 1.3, - "learning_rate": 1.258034950155978e-06, - "loss": 0.8076, - "step": 50848 - }, - { - "epoch": 1.3, - "learning_rate": 1.2580082166470949e-06, - "loss": 0.6602, - "step": 50849 - }, - { - "epoch": 1.3, - "learning_rate": 1.257981482940667e-06, - "loss": 0.5625, - "step": 50850 - }, - { - "epoch": 1.3, - "learning_rate": 1.2579547490367144e-06, - "loss": 0.8555, - "step": 50851 - }, - { - "epoch": 1.3, - "learning_rate": 1.2579280149352576e-06, - "loss": 0.5483, - "step": 50852 - }, - { - "epoch": 1.3, - "learning_rate": 1.2579012806363172e-06, - "loss": 0.8086, - "step": 50853 - }, - { - "epoch": 1.3, - "learning_rate": 1.2578745461399136e-06, - "loss": 0.5698, - "step": 50854 - }, - { - "epoch": 1.3, - "learning_rate": 1.2578478114460678e-06, - "loss": 0.7725, - "step": 50855 - }, - { - "epoch": 1.3, - "learning_rate": 1.2578210765547992e-06, - "loss": 0.533, - "step": 50856 - }, - { - "epoch": 1.3, - "learning_rate": 1.2577943414661292e-06, - "loss": 0.5801, - "step": 50857 - }, - { - "epoch": 1.3, - "learning_rate": 1.2577676061800778e-06, - "loss": 0.8379, - "step": 50858 - }, - { - "epoch": 1.3, - "learning_rate": 1.2577408706966654e-06, - "loss": 0.6133, - "step": 50859 - }, - { - "epoch": 1.3, - "learning_rate": 1.257714135015913e-06, - "loss": 0.6978, - "step": 50860 - }, - { - "epoch": 1.3, - "learning_rate": 1.2576873991378408e-06, - "loss": 0.7607, - "step": 50861 - }, - { - "epoch": 1.3, - "learning_rate": 1.2576606630624689e-06, - "loss": 0.5496, - "step": 50862 - }, - { - "epoch": 1.3, - "learning_rate": 1.257633926789818e-06, - "loss": 0.5898, - "step": 50863 - }, - { - "epoch": 1.3, - "learning_rate": 1.2576071903199087e-06, - "loss": 0.6486, - "step": 50864 - }, - { - "epoch": 1.3, - "learning_rate": 1.2575804536527619e-06, - "loss": 0.6768, - "step": 50865 - }, - { - "epoch": 1.3, - "learning_rate": 1.2575537167883972e-06, - "loss": 0.6382, - "step": 50866 - }, - { - "epoch": 1.3, - "learning_rate": 1.2575269797268353e-06, - "loss": 0.6201, - "step": 50867 - }, - { - "epoch": 1.3, - "learning_rate": 1.2575002424680971e-06, - "loss": 0.6797, - "step": 50868 - }, - { - "epoch": 1.3, - "learning_rate": 1.2574735050122027e-06, - "loss": 0.5925, - "step": 50869 - }, - { - "epoch": 1.3, - "learning_rate": 1.2574467673591728e-06, - "loss": 0.543, - "step": 50870 - }, - { - "epoch": 1.3, - "learning_rate": 1.2574200295090278e-06, - "loss": 0.6631, - "step": 50871 - }, - { - "epoch": 1.3, - "learning_rate": 1.257393291461788e-06, - "loss": 0.6665, - "step": 50872 - }, - { - "epoch": 1.3, - "learning_rate": 1.2573665532174737e-06, - "loss": 0.5552, - "step": 50873 - }, - { - "epoch": 1.3, - "learning_rate": 1.257339814776106e-06, - "loss": 0.5508, - "step": 50874 - }, - { - "epoch": 1.3, - "learning_rate": 1.2573130761377053e-06, - "loss": 0.7363, - "step": 50875 - }, - { - "epoch": 1.3, - "learning_rate": 1.2572863373022916e-06, - "loss": 0.8516, - "step": 50876 - }, - { - "epoch": 1.3, - "learning_rate": 1.2572595982698852e-06, - "loss": 0.7427, - "step": 50877 - }, - { - "epoch": 1.3, - "learning_rate": 1.2572328590405073e-06, - "loss": 0.6553, - "step": 50878 - }, - { - "epoch": 1.3, - "learning_rate": 1.2572061196141777e-06, - "loss": 0.5015, - "step": 50879 - }, - { - "epoch": 1.3, - "learning_rate": 1.2571793799909179e-06, - "loss": 0.6001, - "step": 50880 - }, - { - "epoch": 1.3, - "learning_rate": 1.257152640170747e-06, - "loss": 0.5664, - "step": 50881 - }, - { - "epoch": 1.3, - "learning_rate": 1.2571259001536864e-06, - "loss": 0.4287, - "step": 50882 - }, - { - "epoch": 1.3, - "learning_rate": 1.2570991599397562e-06, - "loss": 0.5984, - "step": 50883 - }, - { - "epoch": 1.3, - "learning_rate": 1.2570724195289772e-06, - "loss": 0.5229, - "step": 50884 - }, - { - "epoch": 1.3, - "learning_rate": 1.2570456789213697e-06, - "loss": 0.584, - "step": 50885 - }, - { - "epoch": 1.3, - "learning_rate": 1.2570189381169537e-06, - "loss": 0.6909, - "step": 50886 - }, - { - "epoch": 1.3, - "learning_rate": 1.2569921971157506e-06, - "loss": 0.708, - "step": 50887 - }, - { - "epoch": 1.3, - "learning_rate": 1.25696545591778e-06, - "loss": 0.6929, - "step": 50888 - }, - { - "epoch": 1.3, - "learning_rate": 1.2569387145230632e-06, - "loss": 0.6694, - "step": 50889 - }, - { - "epoch": 1.3, - "learning_rate": 1.25691197293162e-06, - "loss": 0.4186, - "step": 50890 - }, - { - "epoch": 1.3, - "learning_rate": 1.2568852311434712e-06, - "loss": 0.4822, - "step": 50891 - }, - { - "epoch": 1.3, - "learning_rate": 1.2568584891586368e-06, - "loss": 0.6602, - "step": 50892 - }, - { - "epoch": 1.3, - "learning_rate": 1.2568317469771384e-06, - "loss": 0.644, - "step": 50893 - }, - { - "epoch": 1.3, - "learning_rate": 1.2568050045989951e-06, - "loss": 0.5615, - "step": 50894 - }, - { - "epoch": 1.3, - "learning_rate": 1.2567782620242284e-06, - "loss": 0.915, - "step": 50895 - }, - { - "epoch": 1.3, - "learning_rate": 1.2567515192528582e-06, - "loss": 0.564, - "step": 50896 - }, - { - "epoch": 1.3, - "learning_rate": 1.2567247762849053e-06, - "loss": 0.4686, - "step": 50897 - }, - { - "epoch": 1.3, - "learning_rate": 1.2566980331203898e-06, - "loss": 0.7988, - "step": 50898 - }, - { - "epoch": 1.3, - "learning_rate": 1.2566712897593325e-06, - "loss": 0.6318, - "step": 50899 - }, - { - "epoch": 1.3, - "learning_rate": 1.2566445462017541e-06, - "loss": 0.365, - "step": 50900 - }, - { - "epoch": 1.3, - "learning_rate": 1.2566178024476747e-06, - "loss": 0.6777, - "step": 50901 - }, - { - "epoch": 1.3, - "learning_rate": 1.2565910584971145e-06, - "loss": 0.6465, - "step": 50902 - }, - { - "epoch": 1.3, - "learning_rate": 1.2565643143500945e-06, - "loss": 0.7568, - "step": 50903 - }, - { - "epoch": 1.3, - "learning_rate": 1.2565375700066349e-06, - "loss": 0.5383, - "step": 50904 - }, - { - "epoch": 1.3, - "learning_rate": 1.2565108254667564e-06, - "loss": 0.5977, - "step": 50905 - }, - { - "epoch": 1.3, - "learning_rate": 1.2564840807304795e-06, - "loss": 0.6587, - "step": 50906 - }, - { - "epoch": 1.3, - "learning_rate": 1.2564573357978242e-06, - "loss": 0.6943, - "step": 50907 - }, - { - "epoch": 1.3, - "learning_rate": 1.2564305906688114e-06, - "loss": 0.6333, - "step": 50908 - }, - { - "epoch": 1.3, - "learning_rate": 1.2564038453434617e-06, - "loss": 0.7012, - "step": 50909 - }, - { - "epoch": 1.3, - "learning_rate": 1.2563770998217954e-06, - "loss": 0.7017, - "step": 50910 - }, - { - "epoch": 1.3, - "learning_rate": 1.2563503541038328e-06, - "loss": 0.6152, - "step": 50911 - }, - { - "epoch": 1.3, - "learning_rate": 1.2563236081895946e-06, - "loss": 0.7222, - "step": 50912 - }, - { - "epoch": 1.3, - "learning_rate": 1.2562968620791008e-06, - "loss": 0.6626, - "step": 50913 - }, - { - "epoch": 1.3, - "learning_rate": 1.2562701157723728e-06, - "loss": 0.6201, - "step": 50914 - }, - { - "epoch": 1.3, - "learning_rate": 1.2562433692694304e-06, - "loss": 0.7363, - "step": 50915 - }, - { - "epoch": 1.31, - "learning_rate": 1.2562166225702942e-06, - "loss": 0.5227, - "step": 50916 - }, - { - "epoch": 1.31, - "learning_rate": 1.2561898756749844e-06, - "loss": 0.6072, - "step": 50917 - }, - { - "epoch": 1.31, - "learning_rate": 1.2561631285835223e-06, - "loss": 0.4697, - "step": 50918 - }, - { - "epoch": 1.31, - "learning_rate": 1.2561363812959273e-06, - "loss": 0.6455, - "step": 50919 - }, - { - "epoch": 1.31, - "learning_rate": 1.2561096338122212e-06, - "loss": 0.6533, - "step": 50920 - }, - { - "epoch": 1.31, - "learning_rate": 1.2560828861324231e-06, - "loss": 0.6797, - "step": 50921 - }, - { - "epoch": 1.31, - "learning_rate": 1.2560561382565547e-06, - "loss": 0.7061, - "step": 50922 - }, - { - "epoch": 1.31, - "learning_rate": 1.2560293901846352e-06, - "loss": 0.7695, - "step": 50923 - }, - { - "epoch": 1.31, - "learning_rate": 1.2560026419166862e-06, - "loss": 0.5615, - "step": 50924 - }, - { - "epoch": 1.31, - "learning_rate": 1.2559758934527275e-06, - "loss": 0.6553, - "step": 50925 - }, - { - "epoch": 1.31, - "learning_rate": 1.2559491447927802e-06, - "loss": 0.4731, - "step": 50926 - }, - { - "epoch": 1.31, - "learning_rate": 1.2559223959368641e-06, - "loss": 0.6387, - "step": 50927 - }, - { - "epoch": 1.31, - "learning_rate": 1.2558956468850001e-06, - "loss": 0.6382, - "step": 50928 - }, - { - "epoch": 1.31, - "learning_rate": 1.2558688976372085e-06, - "loss": 0.6631, - "step": 50929 - }, - { - "epoch": 1.31, - "learning_rate": 1.2558421481935099e-06, - "loss": 0.7695, - "step": 50930 - }, - { - "epoch": 1.31, - "learning_rate": 1.2558153985539249e-06, - "loss": 0.6826, - "step": 50931 - }, - { - "epoch": 1.31, - "learning_rate": 1.2557886487184735e-06, - "loss": 0.6582, - "step": 50932 - }, - { - "epoch": 1.31, - "learning_rate": 1.2557618986871766e-06, - "loss": 0.6284, - "step": 50933 - }, - { - "epoch": 1.31, - "learning_rate": 1.2557351484600546e-06, - "loss": 0.4844, - "step": 50934 - }, - { - "epoch": 1.31, - "learning_rate": 1.255708398037128e-06, - "loss": 0.538, - "step": 50935 - }, - { - "epoch": 1.31, - "learning_rate": 1.255681647418417e-06, - "loss": 0.6992, - "step": 50936 - }, - { - "epoch": 1.31, - "learning_rate": 1.255654896603943e-06, - "loss": 0.5034, - "step": 50937 - }, - { - "epoch": 1.31, - "learning_rate": 1.255628145593725e-06, - "loss": 0.7598, - "step": 50938 - }, - { - "epoch": 1.31, - "learning_rate": 1.2556013943877845e-06, - "loss": 0.7139, - "step": 50939 - }, - { - "epoch": 1.31, - "learning_rate": 1.255574642986142e-06, - "loss": 0.5381, - "step": 50940 - }, - { - "epoch": 1.31, - "learning_rate": 1.2555478913888178e-06, - "loss": 0.6567, - "step": 50941 - }, - { - "epoch": 1.31, - "learning_rate": 1.2555211395958318e-06, - "loss": 0.7012, - "step": 50942 - }, - { - "epoch": 1.31, - "learning_rate": 1.2554943876072055e-06, - "loss": 0.7266, - "step": 50943 - }, - { - "epoch": 1.31, - "learning_rate": 1.2554676354229586e-06, - "loss": 0.5962, - "step": 50944 - }, - { - "epoch": 1.31, - "learning_rate": 1.2554408830431125e-06, - "loss": 0.5359, - "step": 50945 - }, - { - "epoch": 1.31, - "learning_rate": 1.2554141304676864e-06, - "loss": 0.5752, - "step": 50946 - }, - { - "epoch": 1.31, - "learning_rate": 1.2553873776967017e-06, - "loss": 0.5901, - "step": 50947 - }, - { - "epoch": 1.31, - "learning_rate": 1.2553606247301782e-06, - "loss": 0.7139, - "step": 50948 - }, - { - "epoch": 1.31, - "learning_rate": 1.2553338715681374e-06, - "loss": 0.5391, - "step": 50949 - }, - { - "epoch": 1.31, - "learning_rate": 1.255307118210599e-06, - "loss": 0.6685, - "step": 50950 - }, - { - "epoch": 1.31, - "learning_rate": 1.2552803646575839e-06, - "loss": 0.4702, - "step": 50951 - }, - { - "epoch": 1.31, - "learning_rate": 1.255253610909112e-06, - "loss": 0.6104, - "step": 50952 - }, - { - "epoch": 1.31, - "learning_rate": 1.255226856965204e-06, - "loss": 0.4739, - "step": 50953 - }, - { - "epoch": 1.31, - "learning_rate": 1.2552001028258806e-06, - "loss": 0.708, - "step": 50954 - }, - { - "epoch": 1.31, - "learning_rate": 1.2551733484911626e-06, - "loss": 0.7373, - "step": 50955 - }, - { - "epoch": 1.31, - "learning_rate": 1.2551465939610698e-06, - "loss": 0.6641, - "step": 50956 - }, - { - "epoch": 1.31, - "learning_rate": 1.2551198392356233e-06, - "loss": 0.6304, - "step": 50957 - }, - { - "epoch": 1.31, - "learning_rate": 1.2550930843148432e-06, - "loss": 0.6904, - "step": 50958 - }, - { - "epoch": 1.31, - "learning_rate": 1.2550663291987495e-06, - "loss": 0.7383, - "step": 50959 - }, - { - "epoch": 1.31, - "learning_rate": 1.2550395738873641e-06, - "loss": 0.6963, - "step": 50960 - }, - { - "epoch": 1.31, - "learning_rate": 1.2550128183807061e-06, - "loss": 0.6123, - "step": 50961 - }, - { - "epoch": 1.31, - "learning_rate": 1.2549860626787964e-06, - "loss": 0.6777, - "step": 50962 - }, - { - "epoch": 1.31, - "learning_rate": 1.2549593067816558e-06, - "loss": 0.7676, - "step": 50963 - }, - { - "epoch": 1.31, - "learning_rate": 1.2549325506893046e-06, - "loss": 0.8955, - "step": 50964 - }, - { - "epoch": 1.31, - "learning_rate": 1.2549057944017633e-06, - "loss": 0.6348, - "step": 50965 - }, - { - "epoch": 1.31, - "learning_rate": 1.2548790379190523e-06, - "loss": 0.6357, - "step": 50966 - }, - { - "epoch": 1.31, - "learning_rate": 1.254852281241192e-06, - "loss": 0.668, - "step": 50967 - }, - { - "epoch": 1.31, - "learning_rate": 1.2548255243682034e-06, - "loss": 0.6328, - "step": 50968 - }, - { - "epoch": 1.31, - "learning_rate": 1.2547987673001064e-06, - "loss": 0.604, - "step": 50969 - }, - { - "epoch": 1.31, - "learning_rate": 1.2547720100369217e-06, - "loss": 0.6689, - "step": 50970 - }, - { - "epoch": 1.31, - "learning_rate": 1.2547452525786697e-06, - "loss": 0.7412, - "step": 50971 - }, - { - "epoch": 1.31, - "learning_rate": 1.254718494925371e-06, - "loss": 0.665, - "step": 50972 - }, - { - "epoch": 1.31, - "learning_rate": 1.254691737077046e-06, - "loss": 0.8184, - "step": 50973 - }, - { - "epoch": 1.31, - "learning_rate": 1.2546649790337155e-06, - "loss": 0.8271, - "step": 50974 - }, - { - "epoch": 1.31, - "learning_rate": 1.2546382207953997e-06, - "loss": 0.5869, - "step": 50975 - }, - { - "epoch": 1.31, - "learning_rate": 1.2546114623621188e-06, - "loss": 0.5996, - "step": 50976 - }, - { - "epoch": 1.31, - "learning_rate": 1.2545847037338936e-06, - "loss": 0.7007, - "step": 50977 - }, - { - "epoch": 1.31, - "learning_rate": 1.2545579449107448e-06, - "loss": 0.583, - "step": 50978 - }, - { - "epoch": 1.31, - "learning_rate": 1.254531185892693e-06, - "loss": 0.7461, - "step": 50979 - }, - { - "epoch": 1.31, - "learning_rate": 1.254504426679758e-06, - "loss": 0.7754, - "step": 50980 - }, - { - "epoch": 1.31, - "learning_rate": 1.2544776672719609e-06, - "loss": 0.8428, - "step": 50981 - }, - { - "epoch": 1.31, - "learning_rate": 1.2544509076693215e-06, - "loss": 0.7568, - "step": 50982 - }, - { - "epoch": 1.31, - "learning_rate": 1.2544241478718612e-06, - "loss": 0.7402, - "step": 50983 - }, - { - "epoch": 1.31, - "learning_rate": 1.2543973878795996e-06, - "loss": 0.5547, - "step": 50984 - }, - { - "epoch": 1.31, - "learning_rate": 1.2543706276925581e-06, - "loss": 0.7295, - "step": 50985 - }, - { - "epoch": 1.31, - "learning_rate": 1.2543438673107565e-06, - "loss": 0.7979, - "step": 50986 - }, - { - "epoch": 1.31, - "learning_rate": 1.2543171067342154e-06, - "loss": 0.646, - "step": 50987 - }, - { - "epoch": 1.31, - "learning_rate": 1.2542903459629551e-06, - "loss": 0.7539, - "step": 50988 - }, - { - "epoch": 1.31, - "learning_rate": 1.2542635849969972e-06, - "loss": 0.6257, - "step": 50989 - }, - { - "epoch": 1.31, - "learning_rate": 1.2542368238363608e-06, - "loss": 0.8135, - "step": 50990 - }, - { - "epoch": 1.31, - "learning_rate": 1.254210062481067e-06, - "loss": 0.6729, - "step": 50991 - }, - { - "epoch": 1.31, - "learning_rate": 1.2541833009311363e-06, - "loss": 0.6943, - "step": 50992 - }, - { - "epoch": 1.31, - "learning_rate": 1.254156539186589e-06, - "loss": 0.7646, - "step": 50993 - }, - { - "epoch": 1.31, - "learning_rate": 1.2541297772474462e-06, - "loss": 0.6641, - "step": 50994 - }, - { - "epoch": 1.31, - "learning_rate": 1.2541030151137273e-06, - "loss": 0.5991, - "step": 50995 - }, - { - "epoch": 1.31, - "learning_rate": 1.2540762527854539e-06, - "loss": 0.5466, - "step": 50996 - }, - { - "epoch": 1.31, - "learning_rate": 1.2540494902626458e-06, - "loss": 0.6289, - "step": 50997 - }, - { - "epoch": 1.31, - "learning_rate": 1.2540227275453234e-06, - "loss": 0.6592, - "step": 50998 - }, - { - "epoch": 1.31, - "learning_rate": 1.253995964633508e-06, - "loss": 0.7275, - "step": 50999 - }, - { - "epoch": 1.31, - "learning_rate": 1.253969201527219e-06, - "loss": 0.4639, - "step": 51000 - }, - { - "epoch": 1.31, - "learning_rate": 1.2539424382264777e-06, - "loss": 0.7148, - "step": 51001 - }, - { - "epoch": 1.31, - "learning_rate": 1.2539156747313046e-06, - "loss": 0.6873, - "step": 51002 - }, - { - "epoch": 1.31, - "learning_rate": 1.2538889110417196e-06, - "loss": 0.5999, - "step": 51003 - }, - { - "epoch": 1.31, - "learning_rate": 1.253862147157744e-06, - "loss": 0.5867, - "step": 51004 - }, - { - "epoch": 1.31, - "learning_rate": 1.2538353830793974e-06, - "loss": 0.6572, - "step": 51005 - }, - { - "epoch": 1.31, - "learning_rate": 1.2538086188067007e-06, - "loss": 0.709, - "step": 51006 - }, - { - "epoch": 1.31, - "learning_rate": 1.2537818543396746e-06, - "loss": 0.7598, - "step": 51007 - }, - { - "epoch": 1.31, - "learning_rate": 1.2537550896783393e-06, - "loss": 0.6016, - "step": 51008 - }, - { - "epoch": 1.31, - "learning_rate": 1.2537283248227155e-06, - "loss": 0.7676, - "step": 51009 - }, - { - "epoch": 1.31, - "learning_rate": 1.2537015597728238e-06, - "loss": 0.5947, - "step": 51010 - }, - { - "epoch": 1.31, - "learning_rate": 1.2536747945286839e-06, - "loss": 0.4133, - "step": 51011 - }, - { - "epoch": 1.31, - "learning_rate": 1.2536480290903172e-06, - "loss": 0.605, - "step": 51012 - }, - { - "epoch": 1.31, - "learning_rate": 1.253621263457744e-06, - "loss": 0.7246, - "step": 51013 - }, - { - "epoch": 1.31, - "learning_rate": 1.2535944976309847e-06, - "loss": 0.5793, - "step": 51014 - }, - { - "epoch": 1.31, - "learning_rate": 1.2535677316100595e-06, - "loss": 0.6592, - "step": 51015 - }, - { - "epoch": 1.31, - "learning_rate": 1.2535409653949892e-06, - "loss": 0.752, - "step": 51016 - }, - { - "epoch": 1.31, - "learning_rate": 1.253514198985794e-06, - "loss": 0.3582, - "step": 51017 - }, - { - "epoch": 1.31, - "learning_rate": 1.2534874323824952e-06, - "loss": 0.6396, - "step": 51018 - }, - { - "epoch": 1.31, - "learning_rate": 1.2534606655851122e-06, - "loss": 0.6934, - "step": 51019 - }, - { - "epoch": 1.31, - "learning_rate": 1.2534338985936664e-06, - "loss": 0.5317, - "step": 51020 - }, - { - "epoch": 1.31, - "learning_rate": 1.2534071314081778e-06, - "loss": 0.6157, - "step": 51021 - }, - { - "epoch": 1.31, - "learning_rate": 1.2533803640286666e-06, - "loss": 0.6689, - "step": 51022 - }, - { - "epoch": 1.31, - "learning_rate": 1.2533535964551542e-06, - "loss": 0.52, - "step": 51023 - }, - { - "epoch": 1.31, - "learning_rate": 1.2533268286876606e-06, - "loss": 0.7039, - "step": 51024 - }, - { - "epoch": 1.31, - "learning_rate": 1.2533000607262064e-06, - "loss": 0.8018, - "step": 51025 - }, - { - "epoch": 1.31, - "learning_rate": 1.2532732925708115e-06, - "loss": 0.7324, - "step": 51026 - }, - { - "epoch": 1.31, - "learning_rate": 1.2532465242214971e-06, - "loss": 0.5781, - "step": 51027 - }, - { - "epoch": 1.31, - "learning_rate": 1.2532197556782836e-06, - "loss": 0.8125, - "step": 51028 - }, - { - "epoch": 1.31, - "learning_rate": 1.2531929869411916e-06, - "loss": 0.7891, - "step": 51029 - }, - { - "epoch": 1.31, - "learning_rate": 1.2531662180102408e-06, - "loss": 0.7861, - "step": 51030 - }, - { - "epoch": 1.31, - "learning_rate": 1.2531394488854527e-06, - "loss": 0.5791, - "step": 51031 - }, - { - "epoch": 1.31, - "learning_rate": 1.253112679566847e-06, - "loss": 0.6709, - "step": 51032 - }, - { - "epoch": 1.31, - "learning_rate": 1.2530859100544448e-06, - "loss": 0.6182, - "step": 51033 - }, - { - "epoch": 1.31, - "learning_rate": 1.2530591403482666e-06, - "loss": 0.6211, - "step": 51034 - }, - { - "epoch": 1.31, - "learning_rate": 1.2530323704483322e-06, - "loss": 0.6367, - "step": 51035 - }, - { - "epoch": 1.31, - "learning_rate": 1.2530056003546627e-06, - "loss": 0.4634, - "step": 51036 - }, - { - "epoch": 1.31, - "learning_rate": 1.2529788300672785e-06, - "loss": 0.8945, - "step": 51037 - }, - { - "epoch": 1.31, - "learning_rate": 1.2529520595862e-06, - "loss": 0.6631, - "step": 51038 - }, - { - "epoch": 1.31, - "learning_rate": 1.2529252889114478e-06, - "loss": 0.5938, - "step": 51039 - }, - { - "epoch": 1.31, - "learning_rate": 1.2528985180430422e-06, - "loss": 0.7292, - "step": 51040 - }, - { - "epoch": 1.31, - "learning_rate": 1.2528717469810042e-06, - "loss": 0.5214, - "step": 51041 - }, - { - "epoch": 1.31, - "learning_rate": 1.2528449757253534e-06, - "loss": 0.7686, - "step": 51042 - }, - { - "epoch": 1.31, - "learning_rate": 1.2528182042761112e-06, - "loss": 0.6431, - "step": 51043 - }, - { - "epoch": 1.31, - "learning_rate": 1.2527914326332979e-06, - "loss": 0.4917, - "step": 51044 - }, - { - "epoch": 1.31, - "learning_rate": 1.252764660796933e-06, - "loss": 0.605, - "step": 51045 - }, - { - "epoch": 1.31, - "learning_rate": 1.2527378887670388e-06, - "loss": 0.6763, - "step": 51046 - }, - { - "epoch": 1.31, - "learning_rate": 1.2527111165436342e-06, - "loss": 0.4868, - "step": 51047 - }, - { - "epoch": 1.31, - "learning_rate": 1.2526843441267405e-06, - "loss": 0.34, - "step": 51048 - }, - { - "epoch": 1.31, - "learning_rate": 1.252657571516378e-06, - "loss": 0.5769, - "step": 51049 - }, - { - "epoch": 1.31, - "learning_rate": 1.2526307987125673e-06, - "loss": 0.7207, - "step": 51050 - }, - { - "epoch": 1.31, - "learning_rate": 1.2526040257153288e-06, - "loss": 0.6357, - "step": 51051 - }, - { - "epoch": 1.31, - "learning_rate": 1.2525772525246829e-06, - "loss": 0.7148, - "step": 51052 - }, - { - "epoch": 1.31, - "learning_rate": 1.25255047914065e-06, - "loss": 0.8545, - "step": 51053 - }, - { - "epoch": 1.31, - "learning_rate": 1.2525237055632513e-06, - "loss": 0.6406, - "step": 51054 - }, - { - "epoch": 1.31, - "learning_rate": 1.2524969317925065e-06, - "loss": 0.5552, - "step": 51055 - }, - { - "epoch": 1.31, - "learning_rate": 1.2524701578284367e-06, - "loss": 0.6592, - "step": 51056 - }, - { - "epoch": 1.31, - "learning_rate": 1.2524433836710616e-06, - "loss": 0.6982, - "step": 51057 - }, - { - "epoch": 1.31, - "learning_rate": 1.2524166093204028e-06, - "loss": 0.6826, - "step": 51058 - }, - { - "epoch": 1.31, - "learning_rate": 1.2523898347764798e-06, - "loss": 0.79, - "step": 51059 - }, - { - "epoch": 1.31, - "learning_rate": 1.2523630600393139e-06, - "loss": 0.6182, - "step": 51060 - }, - { - "epoch": 1.31, - "learning_rate": 1.2523362851089247e-06, - "loss": 0.6431, - "step": 51061 - }, - { - "epoch": 1.31, - "learning_rate": 1.2523095099853337e-06, - "loss": 0.7002, - "step": 51062 - }, - { - "epoch": 1.31, - "learning_rate": 1.2522827346685603e-06, - "loss": 0.626, - "step": 51063 - }, - { - "epoch": 1.31, - "learning_rate": 1.252255959158626e-06, - "loss": 0.3822, - "step": 51064 - }, - { - "epoch": 1.31, - "learning_rate": 1.252229183455551e-06, - "loss": 0.6431, - "step": 51065 - }, - { - "epoch": 1.31, - "learning_rate": 1.2522024075593556e-06, - "loss": 0.6338, - "step": 51066 - }, - { - "epoch": 1.31, - "learning_rate": 1.2521756314700604e-06, - "loss": 0.6104, - "step": 51067 - }, - { - "epoch": 1.31, - "learning_rate": 1.2521488551876857e-06, - "loss": 0.7539, - "step": 51068 - }, - { - "epoch": 1.31, - "learning_rate": 1.2521220787122525e-06, - "loss": 0.6665, - "step": 51069 - }, - { - "epoch": 1.31, - "learning_rate": 1.252095302043781e-06, - "loss": 0.7036, - "step": 51070 - }, - { - "epoch": 1.31, - "learning_rate": 1.2520685251822918e-06, - "loss": 0.5215, - "step": 51071 - }, - { - "epoch": 1.31, - "learning_rate": 1.252041748127805e-06, - "loss": 0.5435, - "step": 51072 - }, - { - "epoch": 1.31, - "learning_rate": 1.2520149708803418e-06, - "loss": 0.8154, - "step": 51073 - }, - { - "epoch": 1.31, - "learning_rate": 1.2519881934399221e-06, - "loss": 0.6904, - "step": 51074 - }, - { - "epoch": 1.31, - "learning_rate": 1.2519614158065667e-06, - "loss": 0.562, - "step": 51075 - }, - { - "epoch": 1.31, - "learning_rate": 1.251934637980296e-06, - "loss": 0.7246, - "step": 51076 - }, - { - "epoch": 1.31, - "learning_rate": 1.2519078599611307e-06, - "loss": 0.3274, - "step": 51077 - }, - { - "epoch": 1.31, - "learning_rate": 1.2518810817490906e-06, - "loss": 0.7217, - "step": 51078 - }, - { - "epoch": 1.31, - "learning_rate": 1.2518543033441975e-06, - "loss": 0.7539, - "step": 51079 - }, - { - "epoch": 1.31, - "learning_rate": 1.2518275247464704e-06, - "loss": 0.5037, - "step": 51080 - }, - { - "epoch": 1.31, - "learning_rate": 1.251800745955931e-06, - "loss": 0.5776, - "step": 51081 - }, - { - "epoch": 1.31, - "learning_rate": 1.2517739669725993e-06, - "loss": 0.6001, - "step": 51082 - }, - { - "epoch": 1.31, - "learning_rate": 1.2517471877964956e-06, - "loss": 0.623, - "step": 51083 - }, - { - "epoch": 1.31, - "learning_rate": 1.2517204084276412e-06, - "loss": 0.748, - "step": 51084 - }, - { - "epoch": 1.31, - "learning_rate": 1.2516936288660554e-06, - "loss": 0.6992, - "step": 51085 - }, - { - "epoch": 1.31, - "learning_rate": 1.2516668491117596e-06, - "loss": 0.5522, - "step": 51086 - }, - { - "epoch": 1.31, - "learning_rate": 1.2516400691647744e-06, - "loss": 0.5835, - "step": 51087 - }, - { - "epoch": 1.31, - "learning_rate": 1.2516132890251194e-06, - "loss": 0.6411, - "step": 51088 - }, - { - "epoch": 1.31, - "learning_rate": 1.2515865086928162e-06, - "loss": 0.626, - "step": 51089 - }, - { - "epoch": 1.31, - "learning_rate": 1.2515597281678845e-06, - "loss": 0.6699, - "step": 51090 - }, - { - "epoch": 1.31, - "learning_rate": 1.251532947450345e-06, - "loss": 0.7012, - "step": 51091 - }, - { - "epoch": 1.31, - "learning_rate": 1.2515061665402185e-06, - "loss": 0.7793, - "step": 51092 - }, - { - "epoch": 1.31, - "learning_rate": 1.251479385437525e-06, - "loss": 0.6514, - "step": 51093 - }, - { - "epoch": 1.31, - "learning_rate": 1.2514526041422859e-06, - "loss": 0.7441, - "step": 51094 - }, - { - "epoch": 1.31, - "learning_rate": 1.2514258226545204e-06, - "loss": 0.7017, - "step": 51095 - }, - { - "epoch": 1.31, - "learning_rate": 1.25139904097425e-06, - "loss": 0.7617, - "step": 51096 - }, - { - "epoch": 1.31, - "learning_rate": 1.2513722591014947e-06, - "loss": 0.6494, - "step": 51097 - }, - { - "epoch": 1.31, - "learning_rate": 1.2513454770362758e-06, - "loss": 0.7085, - "step": 51098 - }, - { - "epoch": 1.31, - "learning_rate": 1.251318694778613e-06, - "loss": 0.5645, - "step": 51099 - }, - { - "epoch": 1.31, - "learning_rate": 1.251291912328527e-06, - "loss": 0.4541, - "step": 51100 - }, - { - "epoch": 1.31, - "learning_rate": 1.2512651296860378e-06, - "loss": 0.7285, - "step": 51101 - }, - { - "epoch": 1.31, - "learning_rate": 1.251238346851167e-06, - "loss": 0.521, - "step": 51102 - }, - { - "epoch": 1.31, - "learning_rate": 1.2512115638239345e-06, - "loss": 0.6123, - "step": 51103 - }, - { - "epoch": 1.31, - "learning_rate": 1.251184780604361e-06, - "loss": 0.625, - "step": 51104 - }, - { - "epoch": 1.31, - "learning_rate": 1.2511579971924664e-06, - "loss": 0.6797, - "step": 51105 - }, - { - "epoch": 1.31, - "learning_rate": 1.251131213588272e-06, - "loss": 0.7061, - "step": 51106 - }, - { - "epoch": 1.31, - "learning_rate": 1.2511044297917978e-06, - "loss": 0.6885, - "step": 51107 - }, - { - "epoch": 1.31, - "learning_rate": 1.2510776458030648e-06, - "loss": 0.6875, - "step": 51108 - }, - { - "epoch": 1.31, - "learning_rate": 1.2510508616220929e-06, - "loss": 0.6211, - "step": 51109 - }, - { - "epoch": 1.31, - "learning_rate": 1.251024077248903e-06, - "loss": 0.6431, - "step": 51110 - }, - { - "epoch": 1.31, - "learning_rate": 1.2509972926835154e-06, - "loss": 0.668, - "step": 51111 - }, - { - "epoch": 1.31, - "learning_rate": 1.2509705079259508e-06, - "loss": 0.5649, - "step": 51112 - }, - { - "epoch": 1.31, - "learning_rate": 1.2509437229762296e-06, - "loss": 0.603, - "step": 51113 - }, - { - "epoch": 1.31, - "learning_rate": 1.2509169378343724e-06, - "loss": 0.7529, - "step": 51114 - }, - { - "epoch": 1.31, - "learning_rate": 1.2508901525003996e-06, - "loss": 0.6914, - "step": 51115 - }, - { - "epoch": 1.31, - "learning_rate": 1.2508633669743317e-06, - "loss": 0.6982, - "step": 51116 - }, - { - "epoch": 1.31, - "learning_rate": 1.2508365812561893e-06, - "loss": 0.6719, - "step": 51117 - }, - { - "epoch": 1.31, - "learning_rate": 1.2508097953459929e-06, - "loss": 0.6042, - "step": 51118 - }, - { - "epoch": 1.31, - "learning_rate": 1.250783009243763e-06, - "loss": 0.5728, - "step": 51119 - }, - { - "epoch": 1.31, - "learning_rate": 1.2507562229495199e-06, - "loss": 0.6904, - "step": 51120 - }, - { - "epoch": 1.31, - "learning_rate": 1.2507294364632845e-06, - "loss": 0.6992, - "step": 51121 - }, - { - "epoch": 1.31, - "learning_rate": 1.2507026497850769e-06, - "loss": 0.7217, - "step": 51122 - }, - { - "epoch": 1.31, - "learning_rate": 1.2506758629149178e-06, - "loss": 0.6323, - "step": 51123 - }, - { - "epoch": 1.31, - "learning_rate": 1.2506490758528281e-06, - "loss": 0.6729, - "step": 51124 - }, - { - "epoch": 1.31, - "learning_rate": 1.2506222885988278e-06, - "loss": 0.7832, - "step": 51125 - }, - { - "epoch": 1.31, - "learning_rate": 1.250595501152937e-06, - "loss": 0.5483, - "step": 51126 - }, - { - "epoch": 1.31, - "learning_rate": 1.2505687135151771e-06, - "loss": 0.4705, - "step": 51127 - }, - { - "epoch": 1.31, - "learning_rate": 1.2505419256855682e-06, - "loss": 0.7793, - "step": 51128 - }, - { - "epoch": 1.31, - "learning_rate": 1.250515137664131e-06, - "loss": 0.7217, - "step": 51129 - }, - { - "epoch": 1.31, - "learning_rate": 1.2504883494508861e-06, - "loss": 0.5432, - "step": 51130 - }, - { - "epoch": 1.31, - "learning_rate": 1.2504615610458536e-06, - "loss": 0.6895, - "step": 51131 - }, - { - "epoch": 1.31, - "learning_rate": 1.250434772449054e-06, - "loss": 0.6843, - "step": 51132 - }, - { - "epoch": 1.31, - "learning_rate": 1.2504079836605082e-06, - "loss": 0.7705, - "step": 51133 - }, - { - "epoch": 1.31, - "learning_rate": 1.2503811946802366e-06, - "loss": 0.7568, - "step": 51134 - }, - { - "epoch": 1.31, - "learning_rate": 1.2503544055082594e-06, - "loss": 0.7168, - "step": 51135 - }, - { - "epoch": 1.31, - "learning_rate": 1.2503276161445976e-06, - "loss": 0.6001, - "step": 51136 - }, - { - "epoch": 1.31, - "learning_rate": 1.250300826589271e-06, - "loss": 0.5425, - "step": 51137 - }, - { - "epoch": 1.31, - "learning_rate": 1.2502740368423007e-06, - "loss": 0.4839, - "step": 51138 - }, - { - "epoch": 1.31, - "learning_rate": 1.2502472469037075e-06, - "loss": 0.7278, - "step": 51139 - }, - { - "epoch": 1.31, - "learning_rate": 1.2502204567735113e-06, - "loss": 0.7622, - "step": 51140 - }, - { - "epoch": 1.31, - "learning_rate": 1.2501936664517324e-06, - "loss": 0.3378, - "step": 51141 - }, - { - "epoch": 1.31, - "learning_rate": 1.2501668759383924e-06, - "loss": 0.832, - "step": 51142 - }, - { - "epoch": 1.31, - "learning_rate": 1.2501400852335104e-06, - "loss": 0.5518, - "step": 51143 - }, - { - "epoch": 1.31, - "learning_rate": 1.2501132943371082e-06, - "loss": 0.626, - "step": 51144 - }, - { - "epoch": 1.31, - "learning_rate": 1.2500865032492055e-06, - "loss": 0.6895, - "step": 51145 - }, - { - "epoch": 1.31, - "learning_rate": 1.2500597119698233e-06, - "loss": 0.5996, - "step": 51146 - }, - { - "epoch": 1.31, - "learning_rate": 1.2500329204989815e-06, - "loss": 0.425, - "step": 51147 - }, - { - "epoch": 1.31, - "learning_rate": 1.2500061288367011e-06, - "loss": 0.7715, - "step": 51148 - }, - { - "epoch": 1.31, - "learning_rate": 1.2499793369830028e-06, - "loss": 0.624, - "step": 51149 - }, - { - "epoch": 1.31, - "learning_rate": 1.2499525449379068e-06, - "loss": 0.686, - "step": 51150 - }, - { - "epoch": 1.31, - "learning_rate": 1.249925752701433e-06, - "loss": 0.6372, - "step": 51151 - }, - { - "epoch": 1.31, - "learning_rate": 1.2498989602736032e-06, - "loss": 0.6377, - "step": 51152 - }, - { - "epoch": 1.31, - "learning_rate": 1.2498721676544367e-06, - "loss": 0.668, - "step": 51153 - }, - { - "epoch": 1.31, - "learning_rate": 1.2498453748439552e-06, - "loss": 0.7822, - "step": 51154 - }, - { - "epoch": 1.31, - "learning_rate": 1.2498185818421782e-06, - "loss": 0.4944, - "step": 51155 - }, - { - "epoch": 1.31, - "learning_rate": 1.2497917886491266e-06, - "loss": 0.645, - "step": 51156 - }, - { - "epoch": 1.31, - "learning_rate": 1.249764995264821e-06, - "loss": 0.5229, - "step": 51157 - }, - { - "epoch": 1.31, - "learning_rate": 1.2497382016892818e-06, - "loss": 0.7632, - "step": 51158 - }, - { - "epoch": 1.31, - "learning_rate": 1.24971140792253e-06, - "loss": 0.4893, - "step": 51159 - }, - { - "epoch": 1.31, - "learning_rate": 1.2496846139645849e-06, - "loss": 0.6191, - "step": 51160 - }, - { - "epoch": 1.31, - "learning_rate": 1.2496578198154681e-06, - "loss": 0.4551, - "step": 51161 - }, - { - "epoch": 1.31, - "learning_rate": 1.2496310254751997e-06, - "loss": 0.7959, - "step": 51162 - }, - { - "epoch": 1.31, - "learning_rate": 1.2496042309438007e-06, - "loss": 0.6592, - "step": 51163 - }, - { - "epoch": 1.31, - "learning_rate": 1.2495774362212907e-06, - "loss": 0.7539, - "step": 51164 - }, - { - "epoch": 1.31, - "learning_rate": 1.2495506413076911e-06, - "loss": 0.3979, - "step": 51165 - }, - { - "epoch": 1.31, - "learning_rate": 1.2495238462030217e-06, - "loss": 0.5103, - "step": 51166 - }, - { - "epoch": 1.31, - "learning_rate": 1.2494970509073037e-06, - "loss": 0.4592, - "step": 51167 - }, - { - "epoch": 1.31, - "learning_rate": 1.249470255420557e-06, - "loss": 0.8022, - "step": 51168 - }, - { - "epoch": 1.31, - "learning_rate": 1.2494434597428028e-06, - "loss": 0.6277, - "step": 51169 - }, - { - "epoch": 1.31, - "learning_rate": 1.249416663874061e-06, - "loss": 0.5474, - "step": 51170 - }, - { - "epoch": 1.31, - "learning_rate": 1.2493898678143521e-06, - "loss": 0.6611, - "step": 51171 - }, - { - "epoch": 1.31, - "learning_rate": 1.2493630715636969e-06, - "loss": 0.6074, - "step": 51172 - }, - { - "epoch": 1.31, - "learning_rate": 1.2493362751221161e-06, - "loss": 0.4633, - "step": 51173 - }, - { - "epoch": 1.31, - "learning_rate": 1.2493094784896299e-06, - "loss": 0.6152, - "step": 51174 - }, - { - "epoch": 1.31, - "learning_rate": 1.2492826816662588e-06, - "loss": 0.5752, - "step": 51175 - }, - { - "epoch": 1.31, - "learning_rate": 1.2492558846520234e-06, - "loss": 0.4756, - "step": 51176 - }, - { - "epoch": 1.31, - "learning_rate": 1.2492290874469443e-06, - "loss": 0.6045, - "step": 51177 - }, - { - "epoch": 1.31, - "learning_rate": 1.2492022900510419e-06, - "loss": 0.5752, - "step": 51178 - }, - { - "epoch": 1.31, - "learning_rate": 1.249175492464337e-06, - "loss": 0.266, - "step": 51179 - }, - { - "epoch": 1.31, - "learning_rate": 1.2491486946868498e-06, - "loss": 0.7666, - "step": 51180 - }, - { - "epoch": 1.31, - "learning_rate": 1.2491218967186004e-06, - "loss": 0.7314, - "step": 51181 - }, - { - "epoch": 1.31, - "learning_rate": 1.2490950985596104e-06, - "loss": 0.5315, - "step": 51182 - }, - { - "epoch": 1.31, - "learning_rate": 1.2490683002098995e-06, - "loss": 0.7754, - "step": 51183 - }, - { - "epoch": 1.31, - "learning_rate": 1.2490415016694886e-06, - "loss": 0.8027, - "step": 51184 - }, - { - "epoch": 1.31, - "learning_rate": 1.249014702938398e-06, - "loss": 0.6279, - "step": 51185 - }, - { - "epoch": 1.31, - "learning_rate": 1.2489879040166482e-06, - "loss": 0.6084, - "step": 51186 - }, - { - "epoch": 1.31, - "learning_rate": 1.2489611049042597e-06, - "loss": 0.7607, - "step": 51187 - }, - { - "epoch": 1.31, - "learning_rate": 1.2489343056012533e-06, - "loss": 0.7078, - "step": 51188 - }, - { - "epoch": 1.31, - "learning_rate": 1.2489075061076496e-06, - "loss": 0.6724, - "step": 51189 - }, - { - "epoch": 1.31, - "learning_rate": 1.2488807064234685e-06, - "loss": 0.3514, - "step": 51190 - }, - { - "epoch": 1.31, - "learning_rate": 1.248853906548731e-06, - "loss": 0.7705, - "step": 51191 - }, - { - "epoch": 1.31, - "learning_rate": 1.2488271064834575e-06, - "loss": 0.7451, - "step": 51192 - }, - { - "epoch": 1.31, - "learning_rate": 1.2488003062276683e-06, - "loss": 0.5742, - "step": 51193 - }, - { - "epoch": 1.31, - "learning_rate": 1.2487735057813849e-06, - "loss": 0.6592, - "step": 51194 - }, - { - "epoch": 1.31, - "learning_rate": 1.2487467051446263e-06, - "loss": 0.7593, - "step": 51195 - }, - { - "epoch": 1.31, - "learning_rate": 1.2487199043174142e-06, - "loss": 0.5234, - "step": 51196 - }, - { - "epoch": 1.31, - "learning_rate": 1.2486931032997682e-06, - "loss": 0.7051, - "step": 51197 - }, - { - "epoch": 1.31, - "learning_rate": 1.24866630209171e-06, - "loss": 0.7148, - "step": 51198 - }, - { - "epoch": 1.31, - "learning_rate": 1.2486395006932591e-06, - "loss": 0.6113, - "step": 51199 - }, - { - "epoch": 1.31, - "learning_rate": 1.2486126991044362e-06, - "loss": 0.5952, - "step": 51200 - }, - { - "epoch": 1.31, - "learning_rate": 1.2485858973252623e-06, - "loss": 0.7373, - "step": 51201 - }, - { - "epoch": 1.31, - "learning_rate": 1.2485590953557572e-06, - "loss": 0.6914, - "step": 51202 - }, - { - "epoch": 1.31, - "learning_rate": 1.2485322931959424e-06, - "loss": 0.7217, - "step": 51203 - }, - { - "epoch": 1.31, - "learning_rate": 1.2485054908458374e-06, - "loss": 0.6826, - "step": 51204 - }, - { - "epoch": 1.31, - "learning_rate": 1.2484786883054633e-06, - "loss": 0.5371, - "step": 51205 - }, - { - "epoch": 1.31, - "learning_rate": 1.2484518855748407e-06, - "loss": 0.6465, - "step": 51206 - }, - { - "epoch": 1.31, - "learning_rate": 1.2484250826539898e-06, - "loss": 0.6592, - "step": 51207 - }, - { - "epoch": 1.31, - "learning_rate": 1.248398279542931e-06, - "loss": 0.584, - "step": 51208 - }, - { - "epoch": 1.31, - "learning_rate": 1.2483714762416855e-06, - "loss": 0.7861, - "step": 51209 - }, - { - "epoch": 1.31, - "learning_rate": 1.2483446727502728e-06, - "loss": 0.644, - "step": 51210 - }, - { - "epoch": 1.31, - "learning_rate": 1.2483178690687146e-06, - "loss": 0.6016, - "step": 51211 - }, - { - "epoch": 1.31, - "learning_rate": 1.2482910651970305e-06, - "loss": 0.6943, - "step": 51212 - }, - { - "epoch": 1.31, - "learning_rate": 1.2482642611352411e-06, - "loss": 0.5315, - "step": 51213 - }, - { - "epoch": 1.31, - "learning_rate": 1.2482374568833678e-06, - "loss": 0.6205, - "step": 51214 - }, - { - "epoch": 1.31, - "learning_rate": 1.2482106524414302e-06, - "loss": 0.6765, - "step": 51215 - }, - { - "epoch": 1.31, - "learning_rate": 1.2481838478094487e-06, - "loss": 0.4043, - "step": 51216 - }, - { - "epoch": 1.31, - "learning_rate": 1.2481570429874447e-06, - "loss": 0.5939, - "step": 51217 - }, - { - "epoch": 1.31, - "learning_rate": 1.2481302379754381e-06, - "loss": 0.6436, - "step": 51218 - }, - { - "epoch": 1.31, - "learning_rate": 1.2481034327734498e-06, - "loss": 0.7832, - "step": 51219 - }, - { - "epoch": 1.31, - "learning_rate": 1.2480766273815002e-06, - "loss": 0.5859, - "step": 51220 - }, - { - "epoch": 1.31, - "learning_rate": 1.2480498217996096e-06, - "loss": 0.75, - "step": 51221 - }, - { - "epoch": 1.31, - "learning_rate": 1.2480230160277981e-06, - "loss": 0.5251, - "step": 51222 - }, - { - "epoch": 1.31, - "learning_rate": 1.2479962100660874e-06, - "loss": 0.4683, - "step": 51223 - }, - { - "epoch": 1.31, - "learning_rate": 1.2479694039144975e-06, - "loss": 0.6572, - "step": 51224 - }, - { - "epoch": 1.31, - "learning_rate": 1.2479425975730485e-06, - "loss": 0.6299, - "step": 51225 - }, - { - "epoch": 1.31, - "learning_rate": 1.2479157910417612e-06, - "loss": 0.7788, - "step": 51226 - }, - { - "epoch": 1.31, - "learning_rate": 1.2478889843206562e-06, - "loss": 0.752, - "step": 51227 - }, - { - "epoch": 1.31, - "learning_rate": 1.2478621774097542e-06, - "loss": 0.4456, - "step": 51228 - }, - { - "epoch": 1.31, - "learning_rate": 1.2478353703090757e-06, - "loss": 0.7559, - "step": 51229 - }, - { - "epoch": 1.31, - "learning_rate": 1.2478085630186408e-06, - "loss": 0.5879, - "step": 51230 - }, - { - "epoch": 1.31, - "learning_rate": 1.24778175553847e-06, - "loss": 0.5234, - "step": 51231 - }, - { - "epoch": 1.31, - "learning_rate": 1.2477549478685845e-06, - "loss": 0.7979, - "step": 51232 - }, - { - "epoch": 1.31, - "learning_rate": 1.2477281400090043e-06, - "loss": 0.7305, - "step": 51233 - }, - { - "epoch": 1.31, - "learning_rate": 1.2477013319597502e-06, - "loss": 0.5022, - "step": 51234 - }, - { - "epoch": 1.31, - "learning_rate": 1.2476745237208423e-06, - "loss": 0.6064, - "step": 51235 - }, - { - "epoch": 1.31, - "learning_rate": 1.2476477152923014e-06, - "loss": 0.5781, - "step": 51236 - }, - { - "epoch": 1.31, - "learning_rate": 1.2476209066741484e-06, - "loss": 0.5308, - "step": 51237 - }, - { - "epoch": 1.31, - "learning_rate": 1.2475940978664033e-06, - "loss": 0.4844, - "step": 51238 - }, - { - "epoch": 1.31, - "learning_rate": 1.2475672888690868e-06, - "loss": 0.5132, - "step": 51239 - }, - { - "epoch": 1.31, - "learning_rate": 1.2475404796822193e-06, - "loss": 0.5605, - "step": 51240 - }, - { - "epoch": 1.31, - "learning_rate": 1.2475136703058214e-06, - "loss": 0.668, - "step": 51241 - }, - { - "epoch": 1.31, - "learning_rate": 1.2474868607399137e-06, - "loss": 0.6123, - "step": 51242 - }, - { - "epoch": 1.31, - "learning_rate": 1.2474600509845166e-06, - "loss": 0.5571, - "step": 51243 - }, - { - "epoch": 1.31, - "learning_rate": 1.2474332410396508e-06, - "loss": 0.6439, - "step": 51244 - }, - { - "epoch": 1.31, - "learning_rate": 1.247406430905337e-06, - "loss": 0.6675, - "step": 51245 - }, - { - "epoch": 1.31, - "learning_rate": 1.247379620581595e-06, - "loss": 0.6699, - "step": 51246 - }, - { - "epoch": 1.31, - "learning_rate": 1.247352810068446e-06, - "loss": 0.624, - "step": 51247 - }, - { - "epoch": 1.31, - "learning_rate": 1.2473259993659105e-06, - "loss": 0.5854, - "step": 51248 - }, - { - "epoch": 1.31, - "learning_rate": 1.2472991884740089e-06, - "loss": 0.5913, - "step": 51249 - }, - { - "epoch": 1.31, - "learning_rate": 1.2472723773927613e-06, - "loss": 0.6577, - "step": 51250 - }, - { - "epoch": 1.31, - "learning_rate": 1.247245566122189e-06, - "loss": 0.6196, - "step": 51251 - }, - { - "epoch": 1.31, - "learning_rate": 1.247218754662312e-06, - "loss": 0.6797, - "step": 51252 - }, - { - "epoch": 1.31, - "learning_rate": 1.2471919430131508e-06, - "loss": 0.6152, - "step": 51253 - }, - { - "epoch": 1.31, - "learning_rate": 1.2471651311747263e-06, - "loss": 0.7363, - "step": 51254 - }, - { - "epoch": 1.31, - "learning_rate": 1.2471383191470588e-06, - "loss": 0.6196, - "step": 51255 - }, - { - "epoch": 1.31, - "learning_rate": 1.2471115069301687e-06, - "loss": 0.6289, - "step": 51256 - }, - { - "epoch": 1.31, - "learning_rate": 1.247084694524077e-06, - "loss": 0.5747, - "step": 51257 - }, - { - "epoch": 1.31, - "learning_rate": 1.2470578819288033e-06, - "loss": 0.5942, - "step": 51258 - }, - { - "epoch": 1.31, - "learning_rate": 1.2470310691443696e-06, - "loss": 0.6514, - "step": 51259 - }, - { - "epoch": 1.31, - "learning_rate": 1.247004256170795e-06, - "loss": 0.6494, - "step": 51260 - }, - { - "epoch": 1.31, - "learning_rate": 1.2469774430081005e-06, - "loss": 0.6689, - "step": 51261 - }, - { - "epoch": 1.31, - "learning_rate": 1.246950629656307e-06, - "loss": 0.7197, - "step": 51262 - }, - { - "epoch": 1.31, - "learning_rate": 1.2469238161154348e-06, - "loss": 0.8047, - "step": 51263 - }, - { - "epoch": 1.31, - "learning_rate": 1.2468970023855044e-06, - "loss": 0.7627, - "step": 51264 - }, - { - "epoch": 1.31, - "learning_rate": 1.246870188466536e-06, - "loss": 0.6519, - "step": 51265 - }, - { - "epoch": 1.31, - "learning_rate": 1.2468433743585506e-06, - "loss": 0.4253, - "step": 51266 - }, - { - "epoch": 1.31, - "learning_rate": 1.2468165600615687e-06, - "loss": 0.6831, - "step": 51267 - }, - { - "epoch": 1.31, - "learning_rate": 1.2467897455756106e-06, - "loss": 0.6025, - "step": 51268 - }, - { - "epoch": 1.31, - "learning_rate": 1.2467629309006968e-06, - "loss": 0.4841, - "step": 51269 - }, - { - "epoch": 1.31, - "learning_rate": 1.2467361160368483e-06, - "loss": 0.7612, - "step": 51270 - }, - { - "epoch": 1.31, - "learning_rate": 1.246709300984085e-06, - "loss": 0.5791, - "step": 51271 - }, - { - "epoch": 1.31, - "learning_rate": 1.2466824857424281e-06, - "loss": 0.6709, - "step": 51272 - }, - { - "epoch": 1.31, - "learning_rate": 1.2466556703118976e-06, - "loss": 0.7305, - "step": 51273 - }, - { - "epoch": 1.31, - "learning_rate": 1.2466288546925141e-06, - "loss": 0.6514, - "step": 51274 - }, - { - "epoch": 1.31, - "learning_rate": 1.2466020388842982e-06, - "loss": 0.6914, - "step": 51275 - }, - { - "epoch": 1.31, - "learning_rate": 1.2465752228872706e-06, - "loss": 0.5811, - "step": 51276 - }, - { - "epoch": 1.31, - "learning_rate": 1.2465484067014514e-06, - "loss": 0.5259, - "step": 51277 - }, - { - "epoch": 1.31, - "learning_rate": 1.246521590326862e-06, - "loss": 0.7783, - "step": 51278 - }, - { - "epoch": 1.31, - "learning_rate": 1.2464947737635219e-06, - "loss": 0.6416, - "step": 51279 - }, - { - "epoch": 1.31, - "learning_rate": 1.246467957011452e-06, - "loss": 0.7559, - "step": 51280 - }, - { - "epoch": 1.31, - "learning_rate": 1.2464411400706732e-06, - "loss": 0.4675, - "step": 51281 - }, - { - "epoch": 1.31, - "learning_rate": 1.2464143229412053e-06, - "loss": 0.4624, - "step": 51282 - }, - { - "epoch": 1.31, - "learning_rate": 1.24638750562307e-06, - "loss": 0.6431, - "step": 51283 - }, - { - "epoch": 1.31, - "learning_rate": 1.2463606881162868e-06, - "loss": 0.8027, - "step": 51284 - }, - { - "epoch": 1.31, - "learning_rate": 1.2463338704208764e-06, - "loss": 0.6289, - "step": 51285 - }, - { - "epoch": 1.31, - "learning_rate": 1.2463070525368594e-06, - "loss": 0.7046, - "step": 51286 - }, - { - "epoch": 1.31, - "learning_rate": 1.2462802344642566e-06, - "loss": 0.752, - "step": 51287 - }, - { - "epoch": 1.31, - "learning_rate": 1.2462534162030885e-06, - "loss": 0.5752, - "step": 51288 - }, - { - "epoch": 1.31, - "learning_rate": 1.2462265977533753e-06, - "loss": 0.8662, - "step": 51289 - }, - { - "epoch": 1.31, - "learning_rate": 1.2461997791151376e-06, - "loss": 0.7246, - "step": 51290 - }, - { - "epoch": 1.31, - "learning_rate": 1.246172960288396e-06, - "loss": 0.7148, - "step": 51291 - }, - { - "epoch": 1.31, - "learning_rate": 1.2461461412731713e-06, - "loss": 0.7871, - "step": 51292 - }, - { - "epoch": 1.31, - "learning_rate": 1.246119322069484e-06, - "loss": 0.7354, - "step": 51293 - }, - { - "epoch": 1.31, - "learning_rate": 1.2460925026773542e-06, - "loss": 0.6904, - "step": 51294 - }, - { - "epoch": 1.31, - "learning_rate": 1.2460656830968029e-06, - "loss": 0.625, - "step": 51295 - }, - { - "epoch": 1.31, - "learning_rate": 1.24603886332785e-06, - "loss": 0.5781, - "step": 51296 - }, - { - "epoch": 1.31, - "learning_rate": 1.2460120433705167e-06, - "loss": 0.6172, - "step": 51297 - }, - { - "epoch": 1.31, - "learning_rate": 1.2459852232248234e-06, - "loss": 0.5444, - "step": 51298 - }, - { - "epoch": 1.31, - "learning_rate": 1.2459584028907903e-06, - "loss": 0.7139, - "step": 51299 - }, - { - "epoch": 1.31, - "learning_rate": 1.2459315823684382e-06, - "loss": 0.6143, - "step": 51300 - }, - { - "epoch": 1.31, - "learning_rate": 1.2459047616577878e-06, - "loss": 0.6309, - "step": 51301 - }, - { - "epoch": 1.31, - "learning_rate": 1.2458779407588592e-06, - "loss": 0.5161, - "step": 51302 - }, - { - "epoch": 1.31, - "learning_rate": 1.2458511196716734e-06, - "loss": 0.446, - "step": 51303 - }, - { - "epoch": 1.31, - "learning_rate": 1.2458242983962505e-06, - "loss": 0.5433, - "step": 51304 - }, - { - "epoch": 1.31, - "learning_rate": 1.2457974769326114e-06, - "loss": 0.7578, - "step": 51305 - }, - { - "epoch": 1.31, - "learning_rate": 1.2457706552807763e-06, - "loss": 0.5645, - "step": 51306 - }, - { - "epoch": 1.32, - "learning_rate": 1.245743833440766e-06, - "loss": 0.707, - "step": 51307 - }, - { - "epoch": 1.32, - "learning_rate": 1.245717011412601e-06, - "loss": 0.5664, - "step": 51308 - }, - { - "epoch": 1.32, - "learning_rate": 1.2456901891963017e-06, - "loss": 0.6875, - "step": 51309 - }, - { - "epoch": 1.32, - "learning_rate": 1.2456633667918889e-06, - "loss": 0.7212, - "step": 51310 - }, - { - "epoch": 1.32, - "learning_rate": 1.2456365441993826e-06, - "loss": 0.4624, - "step": 51311 - }, - { - "epoch": 1.32, - "learning_rate": 1.2456097214188038e-06, - "loss": 0.6958, - "step": 51312 - }, - { - "epoch": 1.32, - "learning_rate": 1.245582898450173e-06, - "loss": 0.7119, - "step": 51313 - }, - { - "epoch": 1.32, - "learning_rate": 1.2455560752935109e-06, - "loss": 0.6733, - "step": 51314 - }, - { - "epoch": 1.32, - "learning_rate": 1.2455292519488373e-06, - "loss": 0.6313, - "step": 51315 - }, - { - "epoch": 1.32, - "learning_rate": 1.2455024284161736e-06, - "loss": 0.5364, - "step": 51316 - }, - { - "epoch": 1.32, - "learning_rate": 1.2454756046955398e-06, - "loss": 0.7578, - "step": 51317 - }, - { - "epoch": 1.32, - "learning_rate": 1.2454487807869572e-06, - "loss": 0.6338, - "step": 51318 - }, - { - "epoch": 1.32, - "learning_rate": 1.245421956690445e-06, - "loss": 0.709, - "step": 51319 - }, - { - "epoch": 1.32, - "learning_rate": 1.2453951324060247e-06, - "loss": 0.7197, - "step": 51320 - }, - { - "epoch": 1.32, - "learning_rate": 1.2453683079337167e-06, - "loss": 0.5542, - "step": 51321 - }, - { - "epoch": 1.32, - "learning_rate": 1.2453414832735417e-06, - "loss": 0.6689, - "step": 51322 - }, - { - "epoch": 1.32, - "learning_rate": 1.2453146584255197e-06, - "loss": 0.6362, - "step": 51323 - }, - { - "epoch": 1.32, - "learning_rate": 1.2452878333896718e-06, - "loss": 0.5752, - "step": 51324 - }, - { - "epoch": 1.32, - "learning_rate": 1.2452610081660178e-06, - "loss": 0.7051, - "step": 51325 - }, - { - "epoch": 1.32, - "learning_rate": 1.2452341827545792e-06, - "loss": 0.7012, - "step": 51326 - }, - { - "epoch": 1.32, - "learning_rate": 1.2452073571553756e-06, - "loss": 0.563, - "step": 51327 - }, - { - "epoch": 1.32, - "learning_rate": 1.2451805313684286e-06, - "loss": 0.7036, - "step": 51328 - }, - { - "epoch": 1.32, - "learning_rate": 1.2451537053937577e-06, - "loss": 0.6943, - "step": 51329 - }, - { - "epoch": 1.32, - "learning_rate": 1.2451268792313843e-06, - "loss": 0.6846, - "step": 51330 - }, - { - "epoch": 1.32, - "learning_rate": 1.245100052881328e-06, - "loss": 0.7446, - "step": 51331 - }, - { - "epoch": 1.32, - "learning_rate": 1.2450732263436102e-06, - "loss": 0.6116, - "step": 51332 - }, - { - "epoch": 1.32, - "learning_rate": 1.245046399618251e-06, - "loss": 0.7432, - "step": 51333 - }, - { - "epoch": 1.32, - "learning_rate": 1.2450195727052708e-06, - "loss": 0.6338, - "step": 51334 - }, - { - "epoch": 1.32, - "learning_rate": 1.2449927456046907e-06, - "loss": 0.606, - "step": 51335 - }, - { - "epoch": 1.32, - "learning_rate": 1.2449659183165309e-06, - "loss": 0.748, - "step": 51336 - }, - { - "epoch": 1.32, - "learning_rate": 1.2449390908408118e-06, - "loss": 0.5378, - "step": 51337 - }, - { - "epoch": 1.32, - "learning_rate": 1.2449122631775545e-06, - "loss": 0.5757, - "step": 51338 - }, - { - "epoch": 1.32, - "learning_rate": 1.2448854353267789e-06, - "loss": 0.606, - "step": 51339 - }, - { - "epoch": 1.32, - "learning_rate": 1.2448586072885054e-06, - "loss": 0.7373, - "step": 51340 - }, - { - "epoch": 1.32, - "learning_rate": 1.2448317790627553e-06, - "loss": 0.5503, - "step": 51341 - }, - { - "epoch": 1.32, - "learning_rate": 1.2448049506495486e-06, - "loss": 0.7656, - "step": 51342 - }, - { - "epoch": 1.32, - "learning_rate": 1.2447781220489064e-06, - "loss": 0.6992, - "step": 51343 - }, - { - "epoch": 1.32, - "learning_rate": 1.2447512932608484e-06, - "loss": 0.7012, - "step": 51344 - }, - { - "epoch": 1.32, - "learning_rate": 1.2447244642853958e-06, - "loss": 0.668, - "step": 51345 - }, - { - "epoch": 1.32, - "learning_rate": 1.2446976351225685e-06, - "loss": 0.7339, - "step": 51346 - }, - { - "epoch": 1.32, - "learning_rate": 1.2446708057723882e-06, - "loss": 0.5015, - "step": 51347 - }, - { - "epoch": 1.32, - "learning_rate": 1.2446439762348744e-06, - "loss": 0.6016, - "step": 51348 - }, - { - "epoch": 1.32, - "learning_rate": 1.244617146510048e-06, - "loss": 0.4619, - "step": 51349 - }, - { - "epoch": 1.32, - "learning_rate": 1.2445903165979292e-06, - "loss": 0.6123, - "step": 51350 - }, - { - "epoch": 1.32, - "learning_rate": 1.2445634864985393e-06, - "loss": 0.6763, - "step": 51351 - }, - { - "epoch": 1.32, - "learning_rate": 1.2445366562118979e-06, - "loss": 0.582, - "step": 51352 - }, - { - "epoch": 1.32, - "learning_rate": 1.2445098257380264e-06, - "loss": 0.6724, - "step": 51353 - }, - { - "epoch": 1.32, - "learning_rate": 1.2444829950769448e-06, - "loss": 0.79, - "step": 51354 - }, - { - "epoch": 1.32, - "learning_rate": 1.2444561642286738e-06, - "loss": 0.4578, - "step": 51355 - }, - { - "epoch": 1.32, - "learning_rate": 1.2444293331932342e-06, - "loss": 0.6973, - "step": 51356 - }, - { - "epoch": 1.32, - "learning_rate": 1.2444025019706461e-06, - "loss": 0.8447, - "step": 51357 - }, - { - "epoch": 1.32, - "learning_rate": 1.2443756705609304e-06, - "loss": 0.3235, - "step": 51358 - }, - { - "epoch": 1.32, - "learning_rate": 1.244348838964107e-06, - "loss": 0.5938, - "step": 51359 - }, - { - "epoch": 1.32, - "learning_rate": 1.2443220071801974e-06, - "loss": 0.5444, - "step": 51360 - }, - { - "epoch": 1.32, - "learning_rate": 1.2442951752092214e-06, - "loss": 0.5522, - "step": 51361 - }, - { - "epoch": 1.32, - "learning_rate": 1.2442683430512e-06, - "loss": 0.6367, - "step": 51362 - }, - { - "epoch": 1.32, - "learning_rate": 1.2442415107061537e-06, - "loss": 0.7754, - "step": 51363 - }, - { - "epoch": 1.32, - "learning_rate": 1.2442146781741027e-06, - "loss": 0.6543, - "step": 51364 - }, - { - "epoch": 1.32, - "learning_rate": 1.2441878454550675e-06, - "loss": 0.4639, - "step": 51365 - }, - { - "epoch": 1.32, - "learning_rate": 1.2441610125490693e-06, - "loss": 0.5352, - "step": 51366 - }, - { - "epoch": 1.32, - "learning_rate": 1.244134179456128e-06, - "loss": 0.7422, - "step": 51367 - }, - { - "epoch": 1.32, - "learning_rate": 1.2441073461762649e-06, - "loss": 0.6406, - "step": 51368 - }, - { - "epoch": 1.32, - "learning_rate": 1.2440805127094993e-06, - "loss": 0.5933, - "step": 51369 - }, - { - "epoch": 1.32, - "learning_rate": 1.2440536790558528e-06, - "loss": 0.5627, - "step": 51370 - }, - { - "epoch": 1.32, - "learning_rate": 1.2440268452153456e-06, - "loss": 0.6289, - "step": 51371 - }, - { - "epoch": 1.32, - "learning_rate": 1.2440000111879983e-06, - "loss": 0.6172, - "step": 51372 - }, - { - "epoch": 1.32, - "learning_rate": 1.2439731769738316e-06, - "loss": 0.6797, - "step": 51373 - }, - { - "epoch": 1.32, - "learning_rate": 1.2439463425728656e-06, - "loss": 0.5037, - "step": 51374 - }, - { - "epoch": 1.32, - "learning_rate": 1.2439195079851211e-06, - "loss": 0.5479, - "step": 51375 - }, - { - "epoch": 1.32, - "learning_rate": 1.2438926732106188e-06, - "loss": 0.4956, - "step": 51376 - }, - { - "epoch": 1.32, - "learning_rate": 1.2438658382493788e-06, - "loss": 0.573, - "step": 51377 - }, - { - "epoch": 1.32, - "learning_rate": 1.243839003101422e-06, - "loss": 0.6855, - "step": 51378 - }, - { - "epoch": 1.32, - "learning_rate": 1.2438121677667692e-06, - "loss": 0.7383, - "step": 51379 - }, - { - "epoch": 1.32, - "learning_rate": 1.2437853322454403e-06, - "loss": 0.7832, - "step": 51380 - }, - { - "epoch": 1.32, - "learning_rate": 1.2437584965374567e-06, - "loss": 0.5247, - "step": 51381 - }, - { - "epoch": 1.32, - "learning_rate": 1.2437316606428376e-06, - "loss": 0.688, - "step": 51382 - }, - { - "epoch": 1.32, - "learning_rate": 1.2437048245616053e-06, - "loss": 0.6104, - "step": 51383 - }, - { - "epoch": 1.32, - "learning_rate": 1.2436779882937786e-06, - "loss": 0.6631, - "step": 51384 - }, - { - "epoch": 1.32, - "learning_rate": 1.2436511518393796e-06, - "loss": 0.5151, - "step": 51385 - }, - { - "epoch": 1.32, - "learning_rate": 1.2436243151984275e-06, - "loss": 0.3661, - "step": 51386 - }, - { - "epoch": 1.32, - "learning_rate": 1.2435974783709437e-06, - "loss": 0.7695, - "step": 51387 - }, - { - "epoch": 1.32, - "learning_rate": 1.2435706413569487e-06, - "loss": 0.6392, - "step": 51388 - }, - { - "epoch": 1.32, - "learning_rate": 1.2435438041564628e-06, - "loss": 0.7119, - "step": 51389 - }, - { - "epoch": 1.32, - "learning_rate": 1.2435169667695063e-06, - "loss": 0.416, - "step": 51390 - }, - { - "epoch": 1.32, - "learning_rate": 1.2434901291961001e-06, - "loss": 0.667, - "step": 51391 - }, - { - "epoch": 1.32, - "learning_rate": 1.243463291436265e-06, - "loss": 0.7871, - "step": 51392 - }, - { - "epoch": 1.32, - "learning_rate": 1.2434364534900213e-06, - "loss": 0.4519, - "step": 51393 - }, - { - "epoch": 1.32, - "learning_rate": 1.2434096153573891e-06, - "loss": 0.6797, - "step": 51394 - }, - { - "epoch": 1.32, - "learning_rate": 1.2433827770383896e-06, - "loss": 0.6499, - "step": 51395 - }, - { - "epoch": 1.32, - "learning_rate": 1.243355938533043e-06, - "loss": 0.6143, - "step": 51396 - }, - { - "epoch": 1.32, - "learning_rate": 1.24332909984137e-06, - "loss": 0.6104, - "step": 51397 - }, - { - "epoch": 1.32, - "learning_rate": 1.243302260963391e-06, - "loss": 0.814, - "step": 51398 - }, - { - "epoch": 1.32, - "learning_rate": 1.2432754218991269e-06, - "loss": 0.6475, - "step": 51399 - }, - { - "epoch": 1.32, - "learning_rate": 1.2432485826485978e-06, - "loss": 0.7529, - "step": 51400 - }, - { - "epoch": 1.32, - "learning_rate": 1.2432217432118243e-06, - "loss": 0.5707, - "step": 51401 - }, - { - "epoch": 1.32, - "learning_rate": 1.2431949035888273e-06, - "loss": 0.7246, - "step": 51402 - }, - { - "epoch": 1.32, - "learning_rate": 1.2431680637796272e-06, - "loss": 0.7803, - "step": 51403 - }, - { - "epoch": 1.32, - "learning_rate": 1.2431412237842444e-06, - "loss": 0.6958, - "step": 51404 - }, - { - "epoch": 1.32, - "learning_rate": 1.2431143836026995e-06, - "loss": 0.8662, - "step": 51405 - }, - { - "epoch": 1.32, - "learning_rate": 1.2430875432350131e-06, - "loss": 0.71, - "step": 51406 - }, - { - "epoch": 1.32, - "learning_rate": 1.2430607026812059e-06, - "loss": 0.7832, - "step": 51407 - }, - { - "epoch": 1.32, - "learning_rate": 1.2430338619412983e-06, - "loss": 0.6699, - "step": 51408 - }, - { - "epoch": 1.32, - "learning_rate": 1.2430070210153107e-06, - "loss": 0.7236, - "step": 51409 - }, - { - "epoch": 1.32, - "learning_rate": 1.242980179903264e-06, - "loss": 0.5288, - "step": 51410 - }, - { - "epoch": 1.32, - "learning_rate": 1.2429533386051783e-06, - "loss": 0.563, - "step": 51411 - }, - { - "epoch": 1.32, - "learning_rate": 1.2429264971210745e-06, - "loss": 0.5854, - "step": 51412 - }, - { - "epoch": 1.32, - "learning_rate": 1.242899655450973e-06, - "loss": 0.7168, - "step": 51413 - }, - { - "epoch": 1.32, - "learning_rate": 1.2428728135948945e-06, - "loss": 0.637, - "step": 51414 - }, - { - "epoch": 1.32, - "learning_rate": 1.2428459715528594e-06, - "loss": 0.6082, - "step": 51415 - }, - { - "epoch": 1.32, - "learning_rate": 1.2428191293248884e-06, - "loss": 0.7002, - "step": 51416 - }, - { - "epoch": 1.32, - "learning_rate": 1.2427922869110017e-06, - "loss": 0.6899, - "step": 51417 - }, - { - "epoch": 1.32, - "learning_rate": 1.2427654443112202e-06, - "loss": 0.7529, - "step": 51418 - }, - { - "epoch": 1.32, - "learning_rate": 1.2427386015255646e-06, - "loss": 0.7744, - "step": 51419 - }, - { - "epoch": 1.32, - "learning_rate": 1.2427117585540551e-06, - "loss": 0.5957, - "step": 51420 - }, - { - "epoch": 1.32, - "learning_rate": 1.2426849153967123e-06, - "loss": 0.6348, - "step": 51421 - }, - { - "epoch": 1.32, - "learning_rate": 1.242658072053557e-06, - "loss": 0.7402, - "step": 51422 - }, - { - "epoch": 1.32, - "learning_rate": 1.2426312285246092e-06, - "loss": 0.8174, - "step": 51423 - }, - { - "epoch": 1.32, - "learning_rate": 1.24260438480989e-06, - "loss": 0.5542, - "step": 51424 - }, - { - "epoch": 1.32, - "learning_rate": 1.24257754090942e-06, - "loss": 0.7334, - "step": 51425 - }, - { - "epoch": 1.32, - "learning_rate": 1.242550696823219e-06, - "loss": 0.4849, - "step": 51426 - }, - { - "epoch": 1.32, - "learning_rate": 1.2425238525513084e-06, - "loss": 0.6104, - "step": 51427 - }, - { - "epoch": 1.32, - "learning_rate": 1.2424970080937086e-06, - "loss": 0.6562, - "step": 51428 - }, - { - "epoch": 1.32, - "learning_rate": 1.2424701634504399e-06, - "loss": 0.6279, - "step": 51429 - }, - { - "epoch": 1.32, - "learning_rate": 1.2424433186215229e-06, - "loss": 0.502, - "step": 51430 - }, - { - "epoch": 1.32, - "learning_rate": 1.2424164736069782e-06, - "loss": 0.6074, - "step": 51431 - }, - { - "epoch": 1.32, - "learning_rate": 1.2423896284068263e-06, - "loss": 0.668, - "step": 51432 - }, - { - "epoch": 1.32, - "learning_rate": 1.242362783021088e-06, - "loss": 0.6191, - "step": 51433 - }, - { - "epoch": 1.32, - "learning_rate": 1.2423359374497836e-06, - "loss": 0.6514, - "step": 51434 - }, - { - "epoch": 1.32, - "learning_rate": 1.2423090916929335e-06, - "loss": 0.5923, - "step": 51435 - }, - { - "epoch": 1.32, - "learning_rate": 1.2422822457505585e-06, - "loss": 0.7246, - "step": 51436 - }, - { - "epoch": 1.32, - "learning_rate": 1.2422553996226792e-06, - "loss": 0.5557, - "step": 51437 - }, - { - "epoch": 1.32, - "learning_rate": 1.2422285533093162e-06, - "loss": 0.5356, - "step": 51438 - }, - { - "epoch": 1.32, - "learning_rate": 1.24220170681049e-06, - "loss": 0.6108, - "step": 51439 - }, - { - "epoch": 1.32, - "learning_rate": 1.2421748601262208e-06, - "loss": 0.593, - "step": 51440 - }, - { - "epoch": 1.32, - "learning_rate": 1.2421480132565296e-06, - "loss": 0.5503, - "step": 51441 - }, - { - "epoch": 1.32, - "learning_rate": 1.2421211662014366e-06, - "loss": 0.9531, - "step": 51442 - }, - { - "epoch": 1.32, - "learning_rate": 1.242094318960963e-06, - "loss": 0.7471, - "step": 51443 - }, - { - "epoch": 1.32, - "learning_rate": 1.2420674715351287e-06, - "loss": 0.7534, - "step": 51444 - }, - { - "epoch": 1.32, - "learning_rate": 1.2420406239239541e-06, - "loss": 0.6111, - "step": 51445 - }, - { - "epoch": 1.32, - "learning_rate": 1.2420137761274606e-06, - "loss": 0.5789, - "step": 51446 - }, - { - "epoch": 1.32, - "learning_rate": 1.241986928145668e-06, - "loss": 0.5347, - "step": 51447 - }, - { - "epoch": 1.32, - "learning_rate": 1.2419600799785973e-06, - "loss": 0.6924, - "step": 51448 - }, - { - "epoch": 1.32, - "learning_rate": 1.241933231626269e-06, - "loss": 0.6201, - "step": 51449 - }, - { - "epoch": 1.32, - "learning_rate": 1.2419063830887033e-06, - "loss": 0.6992, - "step": 51450 - }, - { - "epoch": 1.32, - "learning_rate": 1.241879534365921e-06, - "loss": 0.75, - "step": 51451 - }, - { - "epoch": 1.32, - "learning_rate": 1.2418526854579428e-06, - "loss": 0.793, - "step": 51452 - }, - { - "epoch": 1.32, - "learning_rate": 1.2418258363647892e-06, - "loss": 0.793, - "step": 51453 - }, - { - "epoch": 1.32, - "learning_rate": 1.2417989870864807e-06, - "loss": 0.5591, - "step": 51454 - }, - { - "epoch": 1.32, - "learning_rate": 1.2417721376230374e-06, - "loss": 0.7275, - "step": 51455 - }, - { - "epoch": 1.32, - "learning_rate": 1.2417452879744807e-06, - "loss": 0.4626, - "step": 51456 - }, - { - "epoch": 1.32, - "learning_rate": 1.2417184381408305e-06, - "loss": 0.7427, - "step": 51457 - }, - { - "epoch": 1.32, - "learning_rate": 1.241691588122108e-06, - "loss": 0.6055, - "step": 51458 - }, - { - "epoch": 1.32, - "learning_rate": 1.241664737918333e-06, - "loss": 0.6382, - "step": 51459 - }, - { - "epoch": 1.32, - "learning_rate": 1.2416378875295267e-06, - "loss": 0.7075, - "step": 51460 - }, - { - "epoch": 1.32, - "learning_rate": 1.2416110369557089e-06, - "loss": 0.7744, - "step": 51461 - }, - { - "epoch": 1.32, - "learning_rate": 1.241584186196901e-06, - "loss": 0.7217, - "step": 51462 - }, - { - "epoch": 1.32, - "learning_rate": 1.2415573352531233e-06, - "loss": 0.5659, - "step": 51463 - }, - { - "epoch": 1.32, - "learning_rate": 1.241530484124396e-06, - "loss": 0.7822, - "step": 51464 - }, - { - "epoch": 1.32, - "learning_rate": 1.24150363281074e-06, - "loss": 0.7529, - "step": 51465 - }, - { - "epoch": 1.32, - "learning_rate": 1.2414767813121757e-06, - "loss": 0.7939, - "step": 51466 - }, - { - "epoch": 1.32, - "learning_rate": 1.2414499296287238e-06, - "loss": 0.4503, - "step": 51467 - }, - { - "epoch": 1.32, - "learning_rate": 1.2414230777604048e-06, - "loss": 0.6123, - "step": 51468 - }, - { - "epoch": 1.32, - "learning_rate": 1.2413962257072395e-06, - "loss": 0.6006, - "step": 51469 - }, - { - "epoch": 1.32, - "learning_rate": 1.2413693734692476e-06, - "loss": 0.5166, - "step": 51470 - }, - { - "epoch": 1.32, - "learning_rate": 1.2413425210464507e-06, - "loss": 0.6372, - "step": 51471 - }, - { - "epoch": 1.32, - "learning_rate": 1.241315668438869e-06, - "loss": 0.7197, - "step": 51472 - }, - { - "epoch": 1.32, - "learning_rate": 1.2412888156465232e-06, - "loss": 0.4402, - "step": 51473 - }, - { - "epoch": 1.32, - "learning_rate": 1.241261962669433e-06, - "loss": 0.6255, - "step": 51474 - }, - { - "epoch": 1.32, - "learning_rate": 1.24123510950762e-06, - "loss": 0.5332, - "step": 51475 - }, - { - "epoch": 1.32, - "learning_rate": 1.2412082561611041e-06, - "loss": 0.6553, - "step": 51476 - }, - { - "epoch": 1.32, - "learning_rate": 1.2411814026299064e-06, - "loss": 0.6343, - "step": 51477 - }, - { - "epoch": 1.32, - "learning_rate": 1.2411545489140472e-06, - "loss": 0.5964, - "step": 51478 - }, - { - "epoch": 1.32, - "learning_rate": 1.241127695013547e-06, - "loss": 0.4475, - "step": 51479 - }, - { - "epoch": 1.32, - "learning_rate": 1.2411008409284262e-06, - "loss": 0.8018, - "step": 51480 - }, - { - "epoch": 1.32, - "learning_rate": 1.241073986658706e-06, - "loss": 0.6494, - "step": 51481 - }, - { - "epoch": 1.32, - "learning_rate": 1.241047132204406e-06, - "loss": 0.6533, - "step": 51482 - }, - { - "epoch": 1.32, - "learning_rate": 1.2410202775655478e-06, - "loss": 0.6626, - "step": 51483 - }, - { - "epoch": 1.32, - "learning_rate": 1.240993422742151e-06, - "loss": 0.573, - "step": 51484 - }, - { - "epoch": 1.32, - "learning_rate": 1.240966567734237e-06, - "loss": 0.6714, - "step": 51485 - }, - { - "epoch": 1.32, - "learning_rate": 1.2409397125418255e-06, - "loss": 0.6431, - "step": 51486 - }, - { - "epoch": 1.32, - "learning_rate": 1.240912857164938e-06, - "loss": 0.792, - "step": 51487 - }, - { - "epoch": 1.32, - "learning_rate": 1.2408860016035944e-06, - "loss": 0.6768, - "step": 51488 - }, - { - "epoch": 1.32, - "learning_rate": 1.2408591458578154e-06, - "loss": 0.4924, - "step": 51489 - }, - { - "epoch": 1.32, - "learning_rate": 1.240832289927622e-06, - "loss": 0.7832, - "step": 51490 - }, - { - "epoch": 1.32, - "learning_rate": 1.240805433813034e-06, - "loss": 0.7173, - "step": 51491 - }, - { - "epoch": 1.32, - "learning_rate": 1.2407785775140725e-06, - "loss": 0.6309, - "step": 51492 - }, - { - "epoch": 1.32, - "learning_rate": 1.240751721030758e-06, - "loss": 0.6953, - "step": 51493 - }, - { - "epoch": 1.32, - "learning_rate": 1.240724864363111e-06, - "loss": 0.6836, - "step": 51494 - }, - { - "epoch": 1.32, - "learning_rate": 1.2406980075111517e-06, - "loss": 0.4932, - "step": 51495 - }, - { - "epoch": 1.32, - "learning_rate": 1.2406711504749013e-06, - "loss": 0.7119, - "step": 51496 - }, - { - "epoch": 1.32, - "learning_rate": 1.24064429325438e-06, - "loss": 0.6875, - "step": 51497 - }, - { - "epoch": 1.32, - "learning_rate": 1.2406174358496086e-06, - "loss": 0.4922, - "step": 51498 - }, - { - "epoch": 1.32, - "learning_rate": 1.2405905782606072e-06, - "loss": 0.8066, - "step": 51499 - }, - { - "epoch": 1.32, - "learning_rate": 1.2405637204873967e-06, - "loss": 0.4535, - "step": 51500 - }, - { - "epoch": 1.32, - "learning_rate": 1.2405368625299977e-06, - "loss": 0.667, - "step": 51501 - }, - { - "epoch": 1.32, - "learning_rate": 1.2405100043884308e-06, - "loss": 0.5518, - "step": 51502 - }, - { - "epoch": 1.32, - "learning_rate": 1.2404831460627163e-06, - "loss": 0.6465, - "step": 51503 - }, - { - "epoch": 1.32, - "learning_rate": 1.240456287552875e-06, - "loss": 0.6377, - "step": 51504 - }, - { - "epoch": 1.32, - "learning_rate": 1.2404294288589272e-06, - "loss": 0.5913, - "step": 51505 - }, - { - "epoch": 1.32, - "learning_rate": 1.2404025699808937e-06, - "loss": 0.6699, - "step": 51506 - }, - { - "epoch": 1.32, - "learning_rate": 1.2403757109187948e-06, - "loss": 0.7402, - "step": 51507 - }, - { - "epoch": 1.32, - "learning_rate": 1.2403488516726518e-06, - "loss": 0.5615, - "step": 51508 - }, - { - "epoch": 1.32, - "learning_rate": 1.2403219922424845e-06, - "loss": 0.6406, - "step": 51509 - }, - { - "epoch": 1.32, - "learning_rate": 1.2402951326283137e-06, - "loss": 0.623, - "step": 51510 - }, - { - "epoch": 1.32, - "learning_rate": 1.24026827283016e-06, - "loss": 0.5122, - "step": 51511 - }, - { - "epoch": 1.32, - "learning_rate": 1.2402414128480438e-06, - "loss": 0.6985, - "step": 51512 - }, - { - "epoch": 1.32, - "learning_rate": 1.2402145526819859e-06, - "loss": 0.8213, - "step": 51513 - }, - { - "epoch": 1.32, - "learning_rate": 1.2401876923320067e-06, - "loss": 0.6572, - "step": 51514 - }, - { - "epoch": 1.32, - "learning_rate": 1.2401608317981269e-06, - "loss": 0.5596, - "step": 51515 - }, - { - "epoch": 1.32, - "learning_rate": 1.2401339710803666e-06, - "loss": 0.6216, - "step": 51516 - }, - { - "epoch": 1.32, - "learning_rate": 1.2401071101787472e-06, - "loss": 0.458, - "step": 51517 - }, - { - "epoch": 1.32, - "learning_rate": 1.2400802490932888e-06, - "loss": 0.2642, - "step": 51518 - }, - { - "epoch": 1.32, - "learning_rate": 1.240053387824012e-06, - "loss": 0.8389, - "step": 51519 - }, - { - "epoch": 1.32, - "learning_rate": 1.2400265263709374e-06, - "loss": 0.5579, - "step": 51520 - }, - { - "epoch": 1.32, - "learning_rate": 1.2399996647340854e-06, - "loss": 0.6973, - "step": 51521 - }, - { - "epoch": 1.32, - "learning_rate": 1.2399728029134765e-06, - "loss": 0.5464, - "step": 51522 - }, - { - "epoch": 1.32, - "learning_rate": 1.2399459409091319e-06, - "loss": 0.6934, - "step": 51523 - }, - { - "epoch": 1.32, - "learning_rate": 1.2399190787210715e-06, - "loss": 0.8115, - "step": 51524 - }, - { - "epoch": 1.32, - "learning_rate": 1.2398922163493159e-06, - "loss": 0.7295, - "step": 51525 - }, - { - "epoch": 1.32, - "learning_rate": 1.239865353793886e-06, - "loss": 0.7451, - "step": 51526 - }, - { - "epoch": 1.32, - "learning_rate": 1.2398384910548023e-06, - "loss": 0.6367, - "step": 51527 - }, - { - "epoch": 1.32, - "learning_rate": 1.2398116281320855e-06, - "loss": 0.7871, - "step": 51528 - }, - { - "epoch": 1.32, - "learning_rate": 1.2397847650257558e-06, - "loss": 0.6384, - "step": 51529 - }, - { - "epoch": 1.32, - "learning_rate": 1.2397579017358337e-06, - "loss": 0.4697, - "step": 51530 - }, - { - "epoch": 1.32, - "learning_rate": 1.2397310382623402e-06, - "loss": 0.6479, - "step": 51531 - }, - { - "epoch": 1.32, - "learning_rate": 1.2397041746052953e-06, - "loss": 0.5708, - "step": 51532 - }, - { - "epoch": 1.32, - "learning_rate": 1.2396773107647204e-06, - "loss": 0.5825, - "step": 51533 - }, - { - "epoch": 1.32, - "learning_rate": 1.2396504467406356e-06, - "loss": 0.6213, - "step": 51534 - }, - { - "epoch": 1.32, - "learning_rate": 1.2396235825330613e-06, - "loss": 0.7998, - "step": 51535 - }, - { - "epoch": 1.32, - "learning_rate": 1.2395967181420183e-06, - "loss": 0.7422, - "step": 51536 - }, - { - "epoch": 1.32, - "learning_rate": 1.2395698535675273e-06, - "loss": 0.5571, - "step": 51537 - }, - { - "epoch": 1.32, - "learning_rate": 1.2395429888096083e-06, - "loss": 0.8027, - "step": 51538 - }, - { - "epoch": 1.32, - "learning_rate": 1.2395161238682823e-06, - "loss": 0.5688, - "step": 51539 - }, - { - "epoch": 1.32, - "learning_rate": 1.2394892587435701e-06, - "loss": 0.6436, - "step": 51540 - }, - { - "epoch": 1.32, - "learning_rate": 1.2394623934354918e-06, - "loss": 0.5181, - "step": 51541 - }, - { - "epoch": 1.32, - "learning_rate": 1.239435527944068e-06, - "loss": 0.5088, - "step": 51542 - }, - { - "epoch": 1.32, - "learning_rate": 1.2394086622693199e-06, - "loss": 0.5093, - "step": 51543 - }, - { - "epoch": 1.32, - "learning_rate": 1.239381796411267e-06, - "loss": 0.6309, - "step": 51544 - }, - { - "epoch": 1.32, - "learning_rate": 1.239354930369931e-06, - "loss": 0.5581, - "step": 51545 - }, - { - "epoch": 1.32, - "learning_rate": 1.2393280641453317e-06, - "loss": 0.6875, - "step": 51546 - }, - { - "epoch": 1.32, - "learning_rate": 1.2393011977374897e-06, - "loss": 0.7207, - "step": 51547 - }, - { - "epoch": 1.32, - "learning_rate": 1.2392743311464263e-06, - "loss": 0.791, - "step": 51548 - }, - { - "epoch": 1.32, - "learning_rate": 1.239247464372161e-06, - "loss": 0.6514, - "step": 51549 - }, - { - "epoch": 1.32, - "learning_rate": 1.2392205974147152e-06, - "loss": 0.4048, - "step": 51550 - }, - { - "epoch": 1.32, - "learning_rate": 1.2391937302741088e-06, - "loss": 0.6353, - "step": 51551 - }, - { - "epoch": 1.32, - "learning_rate": 1.2391668629503633e-06, - "loss": 0.6133, - "step": 51552 - }, - { - "epoch": 1.32, - "learning_rate": 1.2391399954434987e-06, - "loss": 0.6465, - "step": 51553 - }, - { - "epoch": 1.32, - "learning_rate": 1.2391131277535353e-06, - "loss": 0.5796, - "step": 51554 - }, - { - "epoch": 1.32, - "learning_rate": 1.239086259880494e-06, - "loss": 0.7139, - "step": 51555 - }, - { - "epoch": 1.32, - "learning_rate": 1.2390593918243957e-06, - "loss": 0.7285, - "step": 51556 - }, - { - "epoch": 1.32, - "learning_rate": 1.2390325235852602e-06, - "loss": 0.7471, - "step": 51557 - }, - { - "epoch": 1.32, - "learning_rate": 1.2390056551631087e-06, - "loss": 0.7666, - "step": 51558 - }, - { - "epoch": 1.32, - "learning_rate": 1.2389787865579616e-06, - "loss": 0.6689, - "step": 51559 - }, - { - "epoch": 1.32, - "learning_rate": 1.2389519177698391e-06, - "loss": 0.6484, - "step": 51560 - }, - { - "epoch": 1.32, - "learning_rate": 1.2389250487987624e-06, - "loss": 0.6406, - "step": 51561 - }, - { - "epoch": 1.32, - "learning_rate": 1.2388981796447517e-06, - "loss": 0.8379, - "step": 51562 - }, - { - "epoch": 1.32, - "learning_rate": 1.2388713103078279e-06, - "loss": 0.7061, - "step": 51563 - }, - { - "epoch": 1.32, - "learning_rate": 1.2388444407880108e-06, - "loss": 0.6116, - "step": 51564 - }, - { - "epoch": 1.32, - "learning_rate": 1.2388175710853218e-06, - "loss": 0.7593, - "step": 51565 - }, - { - "epoch": 1.32, - "learning_rate": 1.2387907011997811e-06, - "loss": 0.5311, - "step": 51566 - }, - { - "epoch": 1.32, - "learning_rate": 1.2387638311314096e-06, - "loss": 0.8506, - "step": 51567 - }, - { - "epoch": 1.32, - "learning_rate": 1.2387369608802275e-06, - "loss": 0.7031, - "step": 51568 - }, - { - "epoch": 1.32, - "learning_rate": 1.2387100904462554e-06, - "loss": 0.7207, - "step": 51569 - }, - { - "epoch": 1.32, - "learning_rate": 1.2386832198295137e-06, - "loss": 0.708, - "step": 51570 - }, - { - "epoch": 1.32, - "learning_rate": 1.2386563490300238e-06, - "loss": 0.7129, - "step": 51571 - }, - { - "epoch": 1.32, - "learning_rate": 1.2386294780478054e-06, - "loss": 0.708, - "step": 51572 - }, - { - "epoch": 1.32, - "learning_rate": 1.2386026068828792e-06, - "loss": 0.6709, - "step": 51573 - }, - { - "epoch": 1.32, - "learning_rate": 1.238575735535266e-06, - "loss": 0.6758, - "step": 51574 - }, - { - "epoch": 1.32, - "learning_rate": 1.2385488640049866e-06, - "loss": 0.7266, - "step": 51575 - }, - { - "epoch": 1.32, - "learning_rate": 1.2385219922920608e-06, - "loss": 0.7505, - "step": 51576 - }, - { - "epoch": 1.32, - "learning_rate": 1.2384951203965105e-06, - "loss": 0.7393, - "step": 51577 - }, - { - "epoch": 1.32, - "learning_rate": 1.2384682483183549e-06, - "loss": 0.6294, - "step": 51578 - }, - { - "epoch": 1.32, - "learning_rate": 1.2384413760576152e-06, - "loss": 0.6738, - "step": 51579 - }, - { - "epoch": 1.32, - "learning_rate": 1.238414503614312e-06, - "loss": 0.5791, - "step": 51580 - }, - { - "epoch": 1.32, - "learning_rate": 1.2383876309884653e-06, - "loss": 0.6855, - "step": 51581 - }, - { - "epoch": 1.32, - "learning_rate": 1.238360758180097e-06, - "loss": 0.8916, - "step": 51582 - }, - { - "epoch": 1.32, - "learning_rate": 1.2383338851892262e-06, - "loss": 0.5635, - "step": 51583 - }, - { - "epoch": 1.32, - "learning_rate": 1.2383070120158743e-06, - "loss": 0.7207, - "step": 51584 - }, - { - "epoch": 1.32, - "learning_rate": 1.2382801386600615e-06, - "loss": 0.5361, - "step": 51585 - }, - { - "epoch": 1.32, - "learning_rate": 1.2382532651218087e-06, - "loss": 0.7332, - "step": 51586 - }, - { - "epoch": 1.32, - "learning_rate": 1.2382263914011364e-06, - "loss": 0.5366, - "step": 51587 - }, - { - "epoch": 1.32, - "learning_rate": 1.238199517498065e-06, - "loss": 0.7485, - "step": 51588 - }, - { - "epoch": 1.32, - "learning_rate": 1.2381726434126152e-06, - "loss": 0.6377, - "step": 51589 - }, - { - "epoch": 1.32, - "learning_rate": 1.2381457691448077e-06, - "loss": 0.6343, - "step": 51590 - }, - { - "epoch": 1.32, - "learning_rate": 1.2381188946946627e-06, - "loss": 0.6211, - "step": 51591 - }, - { - "epoch": 1.32, - "learning_rate": 1.2380920200622013e-06, - "loss": 0.4485, - "step": 51592 - }, - { - "epoch": 1.32, - "learning_rate": 1.2380651452474435e-06, - "loss": 0.7393, - "step": 51593 - }, - { - "epoch": 1.32, - "learning_rate": 1.2380382702504104e-06, - "loss": 0.4858, - "step": 51594 - }, - { - "epoch": 1.32, - "learning_rate": 1.2380113950711222e-06, - "loss": 0.5029, - "step": 51595 - }, - { - "epoch": 1.32, - "learning_rate": 1.2379845197095996e-06, - "loss": 0.4689, - "step": 51596 - }, - { - "epoch": 1.32, - "learning_rate": 1.2379576441658634e-06, - "loss": 0.5076, - "step": 51597 - }, - { - "epoch": 1.32, - "learning_rate": 1.2379307684399335e-06, - "loss": 0.7891, - "step": 51598 - }, - { - "epoch": 1.32, - "learning_rate": 1.2379038925318314e-06, - "loss": 0.4154, - "step": 51599 - }, - { - "epoch": 1.32, - "learning_rate": 1.2378770164415772e-06, - "loss": 0.7896, - "step": 51600 - }, - { - "epoch": 1.32, - "learning_rate": 1.2378501401691912e-06, - "loss": 0.6514, - "step": 51601 - }, - { - "epoch": 1.32, - "learning_rate": 1.2378232637146947e-06, - "loss": 0.7559, - "step": 51602 - }, - { - "epoch": 1.32, - "learning_rate": 1.2377963870781076e-06, - "loss": 0.6367, - "step": 51603 - }, - { - "epoch": 1.32, - "learning_rate": 1.2377695102594508e-06, - "loss": 0.6455, - "step": 51604 - }, - { - "epoch": 1.32, - "learning_rate": 1.2377426332587448e-06, - "loss": 0.8008, - "step": 51605 - }, - { - "epoch": 1.32, - "learning_rate": 1.23771575607601e-06, - "loss": 0.7178, - "step": 51606 - }, - { - "epoch": 1.32, - "learning_rate": 1.2376888787112677e-06, - "loss": 0.6768, - "step": 51607 - }, - { - "epoch": 1.32, - "learning_rate": 1.2376620011645376e-06, - "loss": 0.7549, - "step": 51608 - }, - { - "epoch": 1.32, - "learning_rate": 1.2376351234358406e-06, - "loss": 0.5552, - "step": 51609 - }, - { - "epoch": 1.32, - "learning_rate": 1.2376082455251972e-06, - "loss": 0.6294, - "step": 51610 - }, - { - "epoch": 1.32, - "learning_rate": 1.2375813674326283e-06, - "loss": 0.5825, - "step": 51611 - }, - { - "epoch": 1.32, - "learning_rate": 1.2375544891581544e-06, - "loss": 0.7012, - "step": 51612 - }, - { - "epoch": 1.32, - "learning_rate": 1.2375276107017958e-06, - "loss": 0.5776, - "step": 51613 - }, - { - "epoch": 1.32, - "learning_rate": 1.2375007320635731e-06, - "loss": 0.5349, - "step": 51614 - }, - { - "epoch": 1.32, - "learning_rate": 1.237473853243507e-06, - "loss": 0.6357, - "step": 51615 - }, - { - "epoch": 1.32, - "learning_rate": 1.2374469742416182e-06, - "loss": 0.729, - "step": 51616 - }, - { - "epoch": 1.32, - "learning_rate": 1.2374200950579277e-06, - "loss": 0.6626, - "step": 51617 - }, - { - "epoch": 1.32, - "learning_rate": 1.237393215692455e-06, - "loss": 0.6826, - "step": 51618 - }, - { - "epoch": 1.32, - "learning_rate": 1.2373663361452211e-06, - "loss": 0.6365, - "step": 51619 - }, - { - "epoch": 1.32, - "learning_rate": 1.237339456416247e-06, - "loss": 0.6172, - "step": 51620 - }, - { - "epoch": 1.32, - "learning_rate": 1.2373125765055528e-06, - "loss": 0.6021, - "step": 51621 - }, - { - "epoch": 1.32, - "learning_rate": 1.2372856964131596e-06, - "loss": 0.791, - "step": 51622 - }, - { - "epoch": 1.32, - "learning_rate": 1.2372588161390871e-06, - "loss": 0.8066, - "step": 51623 - }, - { - "epoch": 1.32, - "learning_rate": 1.2372319356833566e-06, - "loss": 0.6562, - "step": 51624 - }, - { - "epoch": 1.32, - "learning_rate": 1.2372050550459888e-06, - "loss": 0.5859, - "step": 51625 - }, - { - "epoch": 1.32, - "learning_rate": 1.2371781742270038e-06, - "loss": 0.6553, - "step": 51626 - }, - { - "epoch": 1.32, - "learning_rate": 1.2371512932264225e-06, - "loss": 0.7021, - "step": 51627 - }, - { - "epoch": 1.32, - "learning_rate": 1.2371244120442653e-06, - "loss": 0.6865, - "step": 51628 - }, - { - "epoch": 1.32, - "learning_rate": 1.2370975306805528e-06, - "loss": 0.5908, - "step": 51629 - }, - { - "epoch": 1.32, - "learning_rate": 1.2370706491353056e-06, - "loss": 0.6582, - "step": 51630 - }, - { - "epoch": 1.32, - "learning_rate": 1.2370437674085443e-06, - "loss": 0.6963, - "step": 51631 - }, - { - "epoch": 1.32, - "learning_rate": 1.2370168855002898e-06, - "loss": 0.697, - "step": 51632 - }, - { - "epoch": 1.32, - "learning_rate": 1.236990003410562e-06, - "loss": 0.5049, - "step": 51633 - }, - { - "epoch": 1.32, - "learning_rate": 1.2369631211393822e-06, - "loss": 0.645, - "step": 51634 - }, - { - "epoch": 1.32, - "learning_rate": 1.2369362386867702e-06, - "loss": 0.5796, - "step": 51635 - }, - { - "epoch": 1.32, - "learning_rate": 1.236909356052747e-06, - "loss": 0.4384, - "step": 51636 - }, - { - "epoch": 1.32, - "learning_rate": 1.2368824732373336e-06, - "loss": 0.6826, - "step": 51637 - }, - { - "epoch": 1.32, - "learning_rate": 1.23685559024055e-06, - "loss": 0.498, - "step": 51638 - }, - { - "epoch": 1.32, - "learning_rate": 1.2368287070624168e-06, - "loss": 0.446, - "step": 51639 - }, - { - "epoch": 1.32, - "learning_rate": 1.2368018237029549e-06, - "loss": 0.6353, - "step": 51640 - }, - { - "epoch": 1.32, - "learning_rate": 1.2367749401621847e-06, - "loss": 0.708, - "step": 51641 - }, - { - "epoch": 1.32, - "learning_rate": 1.236748056440127e-06, - "loss": 0.5427, - "step": 51642 - }, - { - "epoch": 1.32, - "learning_rate": 1.2367211725368021e-06, - "loss": 0.4436, - "step": 51643 - }, - { - "epoch": 1.32, - "learning_rate": 1.2366942884522304e-06, - "loss": 0.71, - "step": 51644 - }, - { - "epoch": 1.32, - "learning_rate": 1.236667404186433e-06, - "loss": 0.493, - "step": 51645 - }, - { - "epoch": 1.32, - "learning_rate": 1.2366405197394306e-06, - "loss": 0.6553, - "step": 51646 - }, - { - "epoch": 1.32, - "learning_rate": 1.2366136351112431e-06, - "loss": 0.6909, - "step": 51647 - }, - { - "epoch": 1.32, - "learning_rate": 1.2365867503018912e-06, - "loss": 0.6631, - "step": 51648 - }, - { - "epoch": 1.32, - "learning_rate": 1.236559865311396e-06, - "loss": 0.6299, - "step": 51649 - }, - { - "epoch": 1.32, - "learning_rate": 1.2365329801397775e-06, - "loss": 0.7471, - "step": 51650 - }, - { - "epoch": 1.32, - "learning_rate": 1.2365060947870569e-06, - "loss": 0.5723, - "step": 51651 - }, - { - "epoch": 1.32, - "learning_rate": 1.2364792092532544e-06, - "loss": 0.5605, - "step": 51652 - }, - { - "epoch": 1.32, - "learning_rate": 1.2364523235383905e-06, - "loss": 0.436, - "step": 51653 - }, - { - "epoch": 1.32, - "learning_rate": 1.2364254376424861e-06, - "loss": 0.6675, - "step": 51654 - }, - { - "epoch": 1.32, - "learning_rate": 1.2363985515655614e-06, - "loss": 0.7842, - "step": 51655 - }, - { - "epoch": 1.32, - "learning_rate": 1.2363716653076372e-06, - "loss": 0.5801, - "step": 51656 - }, - { - "epoch": 1.32, - "learning_rate": 1.2363447788687347e-06, - "loss": 0.6836, - "step": 51657 - }, - { - "epoch": 1.32, - "learning_rate": 1.2363178922488731e-06, - "loss": 0.708, - "step": 51658 - }, - { - "epoch": 1.32, - "learning_rate": 1.2362910054480739e-06, - "loss": 0.7339, - "step": 51659 - }, - { - "epoch": 1.32, - "learning_rate": 1.236264118466358e-06, - "loss": 0.6309, - "step": 51660 - }, - { - "epoch": 1.32, - "learning_rate": 1.236237231303745e-06, - "loss": 0.6587, - "step": 51661 - }, - { - "epoch": 1.32, - "learning_rate": 1.2362103439602563e-06, - "loss": 0.7236, - "step": 51662 - }, - { - "epoch": 1.32, - "learning_rate": 1.2361834564359122e-06, - "loss": 0.6035, - "step": 51663 - }, - { - "epoch": 1.32, - "learning_rate": 1.236156568730733e-06, - "loss": 0.6035, - "step": 51664 - }, - { - "epoch": 1.32, - "learning_rate": 1.2361296808447398e-06, - "loss": 0.5635, - "step": 51665 - }, - { - "epoch": 1.32, - "learning_rate": 1.2361027927779528e-06, - "loss": 0.7725, - "step": 51666 - }, - { - "epoch": 1.32, - "learning_rate": 1.236075904530393e-06, - "loss": 0.5823, - "step": 51667 - }, - { - "epoch": 1.32, - "learning_rate": 1.2360490161020806e-06, - "loss": 0.623, - "step": 51668 - }, - { - "epoch": 1.32, - "learning_rate": 1.2360221274930363e-06, - "loss": 0.6025, - "step": 51669 - }, - { - "epoch": 1.32, - "learning_rate": 1.2359952387032809e-06, - "loss": 0.4585, - "step": 51670 - }, - { - "epoch": 1.32, - "learning_rate": 1.2359683497328344e-06, - "loss": 0.7695, - "step": 51671 - }, - { - "epoch": 1.32, - "learning_rate": 1.2359414605817182e-06, - "loss": 0.6196, - "step": 51672 - }, - { - "epoch": 1.32, - "learning_rate": 1.2359145712499523e-06, - "loss": 0.7129, - "step": 51673 - }, - { - "epoch": 1.32, - "learning_rate": 1.2358876817375573e-06, - "loss": 0.6611, - "step": 51674 - }, - { - "epoch": 1.32, - "learning_rate": 1.2358607920445541e-06, - "loss": 0.4663, - "step": 51675 - }, - { - "epoch": 1.32, - "learning_rate": 1.2358339021709633e-06, - "loss": 0.7021, - "step": 51676 - }, - { - "epoch": 1.32, - "learning_rate": 1.2358070121168051e-06, - "loss": 0.6035, - "step": 51677 - }, - { - "epoch": 1.32, - "learning_rate": 1.2357801218821006e-06, - "loss": 0.6182, - "step": 51678 - }, - { - "epoch": 1.32, - "learning_rate": 1.2357532314668697e-06, - "loss": 0.7549, - "step": 51679 - }, - { - "epoch": 1.32, - "learning_rate": 1.2357263408711335e-06, - "loss": 0.5908, - "step": 51680 - }, - { - "epoch": 1.32, - "learning_rate": 1.2356994500949128e-06, - "loss": 0.7241, - "step": 51681 - }, - { - "epoch": 1.32, - "learning_rate": 1.2356725591382277e-06, - "loss": 0.5874, - "step": 51682 - }, - { - "epoch": 1.32, - "learning_rate": 1.2356456680010987e-06, - "loss": 0.5684, - "step": 51683 - }, - { - "epoch": 1.32, - "learning_rate": 1.235618776683547e-06, - "loss": 0.6504, - "step": 51684 - }, - { - "epoch": 1.32, - "learning_rate": 1.2355918851855925e-06, - "loss": 0.8232, - "step": 51685 - }, - { - "epoch": 1.32, - "learning_rate": 1.2355649935072563e-06, - "loss": 0.7822, - "step": 51686 - }, - { - "epoch": 1.32, - "learning_rate": 1.2355381016485588e-06, - "loss": 0.7188, - "step": 51687 - }, - { - "epoch": 1.32, - "learning_rate": 1.2355112096095206e-06, - "loss": 0.7705, - "step": 51688 - }, - { - "epoch": 1.32, - "learning_rate": 1.2354843173901623e-06, - "loss": 0.7139, - "step": 51689 - }, - { - "epoch": 1.32, - "learning_rate": 1.2354574249905047e-06, - "loss": 0.5459, - "step": 51690 - }, - { - "epoch": 1.32, - "learning_rate": 1.2354305324105677e-06, - "loss": 0.7969, - "step": 51691 - }, - { - "epoch": 1.32, - "learning_rate": 1.2354036396503729e-06, - "loss": 0.603, - "step": 51692 - }, - { - "epoch": 1.32, - "learning_rate": 1.23537674670994e-06, - "loss": 0.6294, - "step": 51693 - }, - { - "epoch": 1.32, - "learning_rate": 1.23534985358929e-06, - "loss": 0.625, - "step": 51694 - }, - { - "epoch": 1.32, - "learning_rate": 1.2353229602884436e-06, - "loss": 0.7349, - "step": 51695 - }, - { - "epoch": 1.32, - "learning_rate": 1.235296066807421e-06, - "loss": 0.8477, - "step": 51696 - }, - { - "epoch": 1.33, - "learning_rate": 1.2352691731462436e-06, - "loss": 0.6729, - "step": 51697 - }, - { - "epoch": 1.33, - "learning_rate": 1.2352422793049306e-06, - "loss": 0.7739, - "step": 51698 - }, - { - "epoch": 1.33, - "learning_rate": 1.2352153852835039e-06, - "loss": 0.6396, - "step": 51699 - }, - { - "epoch": 1.33, - "learning_rate": 1.2351884910819832e-06, - "loss": 0.6724, - "step": 51700 - }, - { - "epoch": 1.33, - "learning_rate": 1.2351615967003898e-06, - "loss": 0.7783, - "step": 51701 - }, - { - "epoch": 1.33, - "learning_rate": 1.235134702138744e-06, - "loss": 0.7832, - "step": 51702 - }, - { - "epoch": 1.33, - "learning_rate": 1.2351078073970665e-06, - "loss": 0.6543, - "step": 51703 - }, - { - "epoch": 1.33, - "learning_rate": 1.2350809124753774e-06, - "loss": 0.8154, - "step": 51704 - }, - { - "epoch": 1.33, - "learning_rate": 1.2350540173736978e-06, - "loss": 0.7754, - "step": 51705 - }, - { - "epoch": 1.33, - "learning_rate": 1.235027122092048e-06, - "loss": 0.6436, - "step": 51706 - }, - { - "epoch": 1.33, - "learning_rate": 1.2350002266304492e-06, - "loss": 0.8145, - "step": 51707 - }, - { - "epoch": 1.33, - "learning_rate": 1.234973330988921e-06, - "loss": 0.6416, - "step": 51708 - }, - { - "epoch": 1.33, - "learning_rate": 1.2349464351674847e-06, - "loss": 0.7451, - "step": 51709 - }, - { - "epoch": 1.33, - "learning_rate": 1.2349195391661606e-06, - "loss": 0.6052, - "step": 51710 - }, - { - "epoch": 1.33, - "learning_rate": 1.2348926429849697e-06, - "loss": 0.6953, - "step": 51711 - }, - { - "epoch": 1.33, - "learning_rate": 1.2348657466239324e-06, - "loss": 0.7734, - "step": 51712 - }, - { - "epoch": 1.33, - "learning_rate": 1.2348388500830689e-06, - "loss": 0.5371, - "step": 51713 - }, - { - "epoch": 1.33, - "learning_rate": 1.2348119533624002e-06, - "loss": 0.5444, - "step": 51714 - }, - { - "epoch": 1.33, - "learning_rate": 1.2347850564619466e-06, - "loss": 0.6963, - "step": 51715 - }, - { - "epoch": 1.33, - "learning_rate": 1.2347581593817291e-06, - "loss": 0.6797, - "step": 51716 - }, - { - "epoch": 1.33, - "learning_rate": 1.234731262121768e-06, - "loss": 0.6006, - "step": 51717 - }, - { - "epoch": 1.33, - "learning_rate": 1.234704364682084e-06, - "loss": 0.6216, - "step": 51718 - }, - { - "epoch": 1.33, - "learning_rate": 1.2346774670626975e-06, - "loss": 0.6525, - "step": 51719 - }, - { - "epoch": 1.33, - "learning_rate": 1.2346505692636296e-06, - "loss": 0.7539, - "step": 51720 - }, - { - "epoch": 1.33, - "learning_rate": 1.2346236712849002e-06, - "loss": 0.4746, - "step": 51721 - }, - { - "epoch": 1.33, - "learning_rate": 1.2345967731265305e-06, - "loss": 0.5469, - "step": 51722 - }, - { - "epoch": 1.33, - "learning_rate": 1.2345698747885407e-06, - "loss": 0.625, - "step": 51723 - }, - { - "epoch": 1.33, - "learning_rate": 1.2345429762709515e-06, - "loss": 0.6025, - "step": 51724 - }, - { - "epoch": 1.33, - "learning_rate": 1.2345160775737835e-06, - "loss": 0.707, - "step": 51725 - }, - { - "epoch": 1.33, - "learning_rate": 1.2344891786970574e-06, - "loss": 0.5791, - "step": 51726 - }, - { - "epoch": 1.33, - "learning_rate": 1.2344622796407938e-06, - "loss": 0.7959, - "step": 51727 - }, - { - "epoch": 1.33, - "learning_rate": 1.2344353804050133e-06, - "loss": 0.6807, - "step": 51728 - }, - { - "epoch": 1.33, - "learning_rate": 1.234408480989736e-06, - "loss": 0.6943, - "step": 51729 - }, - { - "epoch": 1.33, - "learning_rate": 1.234381581394983e-06, - "loss": 0.6426, - "step": 51730 - }, - { - "epoch": 1.33, - "learning_rate": 1.234354681620775e-06, - "loss": 0.6758, - "step": 51731 - }, - { - "epoch": 1.33, - "learning_rate": 1.2343277816671323e-06, - "loss": 0.5957, - "step": 51732 - }, - { - "epoch": 1.33, - "learning_rate": 1.2343008815340756e-06, - "loss": 0.6035, - "step": 51733 - }, - { - "epoch": 1.33, - "learning_rate": 1.2342739812216257e-06, - "loss": 0.7568, - "step": 51734 - }, - { - "epoch": 1.33, - "learning_rate": 1.2342470807298026e-06, - "loss": 0.5935, - "step": 51735 - }, - { - "epoch": 1.33, - "learning_rate": 1.2342201800586275e-06, - "loss": 0.646, - "step": 51736 - }, - { - "epoch": 1.33, - "learning_rate": 1.234193279208121e-06, - "loss": 0.6699, - "step": 51737 - }, - { - "epoch": 1.33, - "learning_rate": 1.2341663781783032e-06, - "loss": 0.5527, - "step": 51738 - }, - { - "epoch": 1.33, - "learning_rate": 1.2341394769691948e-06, - "loss": 0.6572, - "step": 51739 - }, - { - "epoch": 1.33, - "learning_rate": 1.2341125755808168e-06, - "loss": 0.7002, - "step": 51740 - }, - { - "epoch": 1.33, - "learning_rate": 1.2340856740131895e-06, - "loss": 0.4956, - "step": 51741 - }, - { - "epoch": 1.33, - "learning_rate": 1.2340587722663338e-06, - "loss": 0.5908, - "step": 51742 - }, - { - "epoch": 1.33, - "learning_rate": 1.2340318703402698e-06, - "loss": 0.748, - "step": 51743 - }, - { - "epoch": 1.33, - "learning_rate": 1.2340049682350184e-06, - "loss": 0.6738, - "step": 51744 - }, - { - "epoch": 1.33, - "learning_rate": 1.2339780659506002e-06, - "loss": 0.6543, - "step": 51745 - }, - { - "epoch": 1.33, - "learning_rate": 1.2339511634870356e-06, - "loss": 0.6479, - "step": 51746 - }, - { - "epoch": 1.33, - "learning_rate": 1.2339242608443456e-06, - "loss": 0.6406, - "step": 51747 - }, - { - "epoch": 1.33, - "learning_rate": 1.2338973580225505e-06, - "loss": 0.5459, - "step": 51748 - }, - { - "epoch": 1.33, - "learning_rate": 1.233870455021671e-06, - "loss": 0.606, - "step": 51749 - }, - { - "epoch": 1.33, - "learning_rate": 1.2338435518417272e-06, - "loss": 0.5908, - "step": 51750 - }, - { - "epoch": 1.33, - "learning_rate": 1.2338166484827406e-06, - "loss": 0.7285, - "step": 51751 - }, - { - "epoch": 1.33, - "learning_rate": 1.2337897449447314e-06, - "loss": 0.8574, - "step": 51752 - }, - { - "epoch": 1.33, - "learning_rate": 1.2337628412277199e-06, - "loss": 0.8032, - "step": 51753 - }, - { - "epoch": 1.33, - "learning_rate": 1.2337359373317269e-06, - "loss": 0.7139, - "step": 51754 - }, - { - "epoch": 1.33, - "learning_rate": 1.2337090332567732e-06, - "loss": 0.5596, - "step": 51755 - }, - { - "epoch": 1.33, - "learning_rate": 1.2336821290028789e-06, - "loss": 0.6484, - "step": 51756 - }, - { - "epoch": 1.33, - "learning_rate": 1.2336552245700654e-06, - "loss": 0.6309, - "step": 51757 - }, - { - "epoch": 1.33, - "learning_rate": 1.2336283199583528e-06, - "loss": 0.7432, - "step": 51758 - }, - { - "epoch": 1.33, - "learning_rate": 1.2336014151677613e-06, - "loss": 0.5942, - "step": 51759 - }, - { - "epoch": 1.33, - "learning_rate": 1.2335745101983124e-06, - "loss": 0.7291, - "step": 51760 - }, - { - "epoch": 1.33, - "learning_rate": 1.233547605050026e-06, - "loss": 0.5896, - "step": 51761 - }, - { - "epoch": 1.33, - "learning_rate": 1.2335206997229233e-06, - "loss": 0.7236, - "step": 51762 - }, - { - "epoch": 1.33, - "learning_rate": 1.233493794217024e-06, - "loss": 0.6113, - "step": 51763 - }, - { - "epoch": 1.33, - "learning_rate": 1.2334668885323495e-06, - "loss": 0.5737, - "step": 51764 - }, - { - "epoch": 1.33, - "learning_rate": 1.2334399826689202e-06, - "loss": 0.6396, - "step": 51765 - }, - { - "epoch": 1.33, - "learning_rate": 1.2334130766267564e-06, - "loss": 0.5444, - "step": 51766 - }, - { - "epoch": 1.33, - "learning_rate": 1.2333861704058793e-06, - "loss": 0.6982, - "step": 51767 - }, - { - "epoch": 1.33, - "learning_rate": 1.2333592640063089e-06, - "loss": 0.4624, - "step": 51768 - }, - { - "epoch": 1.33, - "learning_rate": 1.2333323574280662e-06, - "loss": 0.708, - "step": 51769 - }, - { - "epoch": 1.33, - "learning_rate": 1.2333054506711713e-06, - "loss": 0.7822, - "step": 51770 - }, - { - "epoch": 1.33, - "learning_rate": 1.2332785437356453e-06, - "loss": 0.6895, - "step": 51771 - }, - { - "epoch": 1.33, - "learning_rate": 1.233251636621509e-06, - "loss": 0.6289, - "step": 51772 - }, - { - "epoch": 1.33, - "learning_rate": 1.2332247293287821e-06, - "loss": 0.6362, - "step": 51773 - }, - { - "epoch": 1.33, - "learning_rate": 1.2331978218574861e-06, - "loss": 0.6982, - "step": 51774 - }, - { - "epoch": 1.33, - "learning_rate": 1.2331709142076409e-06, - "loss": 0.708, - "step": 51775 - }, - { - "epoch": 1.33, - "learning_rate": 1.233144006379268e-06, - "loss": 0.6484, - "step": 51776 - }, - { - "epoch": 1.33, - "learning_rate": 1.233117098372387e-06, - "loss": 0.7188, - "step": 51777 - }, - { - "epoch": 1.33, - "learning_rate": 1.2330901901870193e-06, - "loss": 0.7041, - "step": 51778 - }, - { - "epoch": 1.33, - "learning_rate": 1.233063281823185e-06, - "loss": 0.6963, - "step": 51779 - }, - { - "epoch": 1.33, - "learning_rate": 1.2330363732809047e-06, - "loss": 0.4473, - "step": 51780 - }, - { - "epoch": 1.33, - "learning_rate": 1.2330094645601993e-06, - "loss": 0.626, - "step": 51781 - }, - { - "epoch": 1.33, - "learning_rate": 1.2329825556610893e-06, - "loss": 0.8105, - "step": 51782 - }, - { - "epoch": 1.33, - "learning_rate": 1.2329556465835953e-06, - "loss": 0.5928, - "step": 51783 - }, - { - "epoch": 1.33, - "learning_rate": 1.2329287373277376e-06, - "loss": 0.7773, - "step": 51784 - }, - { - "epoch": 1.33, - "learning_rate": 1.2329018278935374e-06, - "loss": 0.6494, - "step": 51785 - }, - { - "epoch": 1.33, - "learning_rate": 1.2328749182810148e-06, - "loss": 0.4871, - "step": 51786 - }, - { - "epoch": 1.33, - "learning_rate": 1.2328480084901908e-06, - "loss": 0.6284, - "step": 51787 - }, - { - "epoch": 1.33, - "learning_rate": 1.2328210985210855e-06, - "loss": 0.6504, - "step": 51788 - }, - { - "epoch": 1.33, - "learning_rate": 1.2327941883737202e-06, - "loss": 0.5479, - "step": 51789 - }, - { - "epoch": 1.33, - "learning_rate": 1.2327672780481146e-06, - "loss": 0.7402, - "step": 51790 - }, - { - "epoch": 1.33, - "learning_rate": 1.2327403675442903e-06, - "loss": 0.8652, - "step": 51791 - }, - { - "epoch": 1.33, - "learning_rate": 1.232713456862267e-06, - "loss": 0.6196, - "step": 51792 - }, - { - "epoch": 1.33, - "learning_rate": 1.2326865460020659e-06, - "loss": 0.7305, - "step": 51793 - }, - { - "epoch": 1.33, - "learning_rate": 1.2326596349637073e-06, - "loss": 0.7715, - "step": 51794 - }, - { - "epoch": 1.33, - "learning_rate": 1.232632723747212e-06, - "loss": 0.6934, - "step": 51795 - }, - { - "epoch": 1.33, - "learning_rate": 1.2326058123526005e-06, - "loss": 0.7217, - "step": 51796 - }, - { - "epoch": 1.33, - "learning_rate": 1.2325789007798935e-06, - "loss": 0.6533, - "step": 51797 - }, - { - "epoch": 1.33, - "learning_rate": 1.2325519890291113e-06, - "loss": 0.392, - "step": 51798 - }, - { - "epoch": 1.33, - "learning_rate": 1.2325250771002748e-06, - "loss": 0.7051, - "step": 51799 - }, - { - "epoch": 1.33, - "learning_rate": 1.2324981649934044e-06, - "loss": 0.5073, - "step": 51800 - }, - { - "epoch": 1.33, - "learning_rate": 1.2324712527085212e-06, - "loss": 0.9043, - "step": 51801 - }, - { - "epoch": 1.33, - "learning_rate": 1.2324443402456454e-06, - "loss": 0.5459, - "step": 51802 - }, - { - "epoch": 1.33, - "learning_rate": 1.2324174276047977e-06, - "loss": 0.5664, - "step": 51803 - }, - { - "epoch": 1.33, - "learning_rate": 1.2323905147859982e-06, - "loss": 0.5703, - "step": 51804 - }, - { - "epoch": 1.33, - "learning_rate": 1.2323636017892685e-06, - "loss": 0.6919, - "step": 51805 - }, - { - "epoch": 1.33, - "learning_rate": 1.2323366886146284e-06, - "loss": 0.52, - "step": 51806 - }, - { - "epoch": 1.33, - "learning_rate": 1.232309775262099e-06, - "loss": 0.46, - "step": 51807 - }, - { - "epoch": 1.33, - "learning_rate": 1.2322828617317005e-06, - "loss": 0.6406, - "step": 51808 - }, - { - "epoch": 1.33, - "learning_rate": 1.2322559480234536e-06, - "loss": 0.6289, - "step": 51809 - }, - { - "epoch": 1.33, - "learning_rate": 1.2322290341373793e-06, - "loss": 0.7275, - "step": 51810 - }, - { - "epoch": 1.33, - "learning_rate": 1.2322021200734976e-06, - "loss": 0.6943, - "step": 51811 - }, - { - "epoch": 1.33, - "learning_rate": 1.2321752058318297e-06, - "loss": 0.4422, - "step": 51812 - }, - { - "epoch": 1.33, - "learning_rate": 1.2321482914123958e-06, - "loss": 0.5732, - "step": 51813 - }, - { - "epoch": 1.33, - "learning_rate": 1.2321213768152165e-06, - "loss": 0.6865, - "step": 51814 - }, - { - "epoch": 1.33, - "learning_rate": 1.2320944620403127e-06, - "loss": 0.623, - "step": 51815 - }, - { - "epoch": 1.33, - "learning_rate": 1.2320675470877047e-06, - "loss": 0.6934, - "step": 51816 - }, - { - "epoch": 1.33, - "learning_rate": 1.2320406319574135e-06, - "loss": 0.6514, - "step": 51817 - }, - { - "epoch": 1.33, - "learning_rate": 1.2320137166494593e-06, - "loss": 0.461, - "step": 51818 - }, - { - "epoch": 1.33, - "learning_rate": 1.2319868011638629e-06, - "loss": 0.6082, - "step": 51819 - }, - { - "epoch": 1.33, - "learning_rate": 1.2319598855006446e-06, - "loss": 0.748, - "step": 51820 - }, - { - "epoch": 1.33, - "learning_rate": 1.2319329696598254e-06, - "loss": 0.7549, - "step": 51821 - }, - { - "epoch": 1.33, - "learning_rate": 1.231906053641426e-06, - "loss": 0.5791, - "step": 51822 - }, - { - "epoch": 1.33, - "learning_rate": 1.2318791374454667e-06, - "loss": 0.4188, - "step": 51823 - }, - { - "epoch": 1.33, - "learning_rate": 1.2318522210719682e-06, - "loss": 0.7402, - "step": 51824 - }, - { - "epoch": 1.33, - "learning_rate": 1.231825304520951e-06, - "loss": 0.7324, - "step": 51825 - }, - { - "epoch": 1.33, - "learning_rate": 1.2317983877924361e-06, - "loss": 0.5757, - "step": 51826 - }, - { - "epoch": 1.33, - "learning_rate": 1.2317714708864438e-06, - "loss": 0.6143, - "step": 51827 - }, - { - "epoch": 1.33, - "learning_rate": 1.2317445538029944e-06, - "loss": 0.6211, - "step": 51828 - }, - { - "epoch": 1.33, - "learning_rate": 1.2317176365421092e-06, - "loss": 0.7734, - "step": 51829 - }, - { - "epoch": 1.33, - "learning_rate": 1.2316907191038082e-06, - "loss": 0.5811, - "step": 51830 - }, - { - "epoch": 1.33, - "learning_rate": 1.2316638014881123e-06, - "loss": 0.4929, - "step": 51831 - }, - { - "epoch": 1.33, - "learning_rate": 1.2316368836950425e-06, - "loss": 0.6782, - "step": 51832 - }, - { - "epoch": 1.33, - "learning_rate": 1.2316099657246187e-06, - "loss": 0.5217, - "step": 51833 - }, - { - "epoch": 1.33, - "learning_rate": 1.2315830475768614e-06, - "loss": 0.7441, - "step": 51834 - }, - { - "epoch": 1.33, - "learning_rate": 1.2315561292517922e-06, - "loss": 0.4978, - "step": 51835 - }, - { - "epoch": 1.33, - "learning_rate": 1.2315292107494307e-06, - "loss": 0.7139, - "step": 51836 - }, - { - "epoch": 1.33, - "learning_rate": 1.2315022920697983e-06, - "loss": 0.6694, - "step": 51837 - }, - { - "epoch": 1.33, - "learning_rate": 1.231475373212915e-06, - "loss": 0.624, - "step": 51838 - }, - { - "epoch": 1.33, - "learning_rate": 1.2314484541788016e-06, - "loss": 0.5735, - "step": 51839 - }, - { - "epoch": 1.33, - "learning_rate": 1.2314215349674789e-06, - "loss": 0.7031, - "step": 51840 - }, - { - "epoch": 1.33, - "learning_rate": 1.2313946155789674e-06, - "loss": 0.748, - "step": 51841 - }, - { - "epoch": 1.33, - "learning_rate": 1.2313676960132877e-06, - "loss": 0.623, - "step": 51842 - }, - { - "epoch": 1.33, - "learning_rate": 1.2313407762704604e-06, - "loss": 0.6123, - "step": 51843 - }, - { - "epoch": 1.33, - "learning_rate": 1.2313138563505059e-06, - "loss": 0.5737, - "step": 51844 - }, - { - "epoch": 1.33, - "learning_rate": 1.2312869362534452e-06, - "loss": 0.5469, - "step": 51845 - }, - { - "epoch": 1.33, - "learning_rate": 1.2312600159792985e-06, - "loss": 0.5504, - "step": 51846 - }, - { - "epoch": 1.33, - "learning_rate": 1.2312330955280868e-06, - "loss": 0.5244, - "step": 51847 - }, - { - "epoch": 1.33, - "learning_rate": 1.2312061748998308e-06, - "loss": 0.4705, - "step": 51848 - }, - { - "epoch": 1.33, - "learning_rate": 1.2311792540945504e-06, - "loss": 0.7041, - "step": 51849 - }, - { - "epoch": 1.33, - "learning_rate": 1.2311523331122668e-06, - "loss": 0.6875, - "step": 51850 - }, - { - "epoch": 1.33, - "learning_rate": 1.2311254119530005e-06, - "loss": 0.5675, - "step": 51851 - }, - { - "epoch": 1.33, - "learning_rate": 1.2310984906167725e-06, - "loss": 0.6333, - "step": 51852 - }, - { - "epoch": 1.33, - "learning_rate": 1.2310715691036026e-06, - "loss": 0.5999, - "step": 51853 - }, - { - "epoch": 1.33, - "learning_rate": 1.231044647413512e-06, - "loss": 0.7363, - "step": 51854 - }, - { - "epoch": 1.33, - "learning_rate": 1.2310177255465209e-06, - "loss": 0.8066, - "step": 51855 - }, - { - "epoch": 1.33, - "learning_rate": 1.2309908035026507e-06, - "loss": 0.6943, - "step": 51856 - }, - { - "epoch": 1.33, - "learning_rate": 1.2309638812819208e-06, - "loss": 0.6943, - "step": 51857 - }, - { - "epoch": 1.33, - "learning_rate": 1.2309369588843528e-06, - "loss": 0.6548, - "step": 51858 - }, - { - "epoch": 1.33, - "learning_rate": 1.2309100363099668e-06, - "loss": 0.5151, - "step": 51859 - }, - { - "epoch": 1.33, - "learning_rate": 1.2308831135587838e-06, - "loss": 0.6743, - "step": 51860 - }, - { - "epoch": 1.33, - "learning_rate": 1.2308561906308242e-06, - "loss": 0.665, - "step": 51861 - }, - { - "epoch": 1.33, - "learning_rate": 1.2308292675261088e-06, - "loss": 0.6504, - "step": 51862 - }, - { - "epoch": 1.33, - "learning_rate": 1.2308023442446576e-06, - "loss": 0.6714, - "step": 51863 - }, - { - "epoch": 1.33, - "learning_rate": 1.230775420786492e-06, - "loss": 0.7285, - "step": 51864 - }, - { - "epoch": 1.33, - "learning_rate": 1.230748497151632e-06, - "loss": 0.5532, - "step": 51865 - }, - { - "epoch": 1.33, - "learning_rate": 1.2307215733400987e-06, - "loss": 0.709, - "step": 51866 - }, - { - "epoch": 1.33, - "learning_rate": 1.2306946493519124e-06, - "loss": 0.7109, - "step": 51867 - }, - { - "epoch": 1.33, - "learning_rate": 1.2306677251870937e-06, - "loss": 0.4124, - "step": 51868 - }, - { - "epoch": 1.33, - "learning_rate": 1.2306408008456636e-06, - "loss": 0.3708, - "step": 51869 - }, - { - "epoch": 1.33, - "learning_rate": 1.2306138763276424e-06, - "loss": 0.6733, - "step": 51870 - }, - { - "epoch": 1.33, - "learning_rate": 1.2305869516330507e-06, - "loss": 0.7051, - "step": 51871 - }, - { - "epoch": 1.33, - "learning_rate": 1.2305600267619093e-06, - "loss": 0.791, - "step": 51872 - }, - { - "epoch": 1.33, - "learning_rate": 1.2305331017142383e-06, - "loss": 0.5637, - "step": 51873 - }, - { - "epoch": 1.33, - "learning_rate": 1.230506176490059e-06, - "loss": 0.5371, - "step": 51874 - }, - { - "epoch": 1.33, - "learning_rate": 1.2304792510893918e-06, - "loss": 0.9038, - "step": 51875 - }, - { - "epoch": 1.33, - "learning_rate": 1.230452325512257e-06, - "loss": 0.6929, - "step": 51876 - }, - { - "epoch": 1.33, - "learning_rate": 1.2304253997586758e-06, - "loss": 0.4978, - "step": 51877 - }, - { - "epoch": 1.33, - "learning_rate": 1.230398473828668e-06, - "loss": 0.6865, - "step": 51878 - }, - { - "epoch": 1.33, - "learning_rate": 1.230371547722255e-06, - "loss": 0.6875, - "step": 51879 - }, - { - "epoch": 1.33, - "learning_rate": 1.2303446214394569e-06, - "loss": 0.6094, - "step": 51880 - }, - { - "epoch": 1.33, - "learning_rate": 1.2303176949802949e-06, - "loss": 0.8096, - "step": 51881 - }, - { - "epoch": 1.33, - "learning_rate": 1.2302907683447886e-06, - "loss": 0.4673, - "step": 51882 - }, - { - "epoch": 1.33, - "learning_rate": 1.2302638415329598e-06, - "loss": 0.6748, - "step": 51883 - }, - { - "epoch": 1.33, - "learning_rate": 1.230236914544828e-06, - "loss": 0.6992, - "step": 51884 - }, - { - "epoch": 1.33, - "learning_rate": 1.230209987380415e-06, - "loss": 0.7148, - "step": 51885 - }, - { - "epoch": 1.33, - "learning_rate": 1.2301830600397407e-06, - "loss": 0.4826, - "step": 51886 - }, - { - "epoch": 1.33, - "learning_rate": 1.2301561325228258e-06, - "loss": 0.5703, - "step": 51887 - }, - { - "epoch": 1.33, - "learning_rate": 1.2301292048296905e-06, - "loss": 0.7451, - "step": 51888 - }, - { - "epoch": 1.33, - "learning_rate": 1.230102276960356e-06, - "loss": 0.4819, - "step": 51889 - }, - { - "epoch": 1.33, - "learning_rate": 1.230075348914843e-06, - "loss": 0.6072, - "step": 51890 - }, - { - "epoch": 1.33, - "learning_rate": 1.230048420693172e-06, - "loss": 0.4675, - "step": 51891 - }, - { - "epoch": 1.33, - "learning_rate": 1.2300214922953633e-06, - "loss": 0.6206, - "step": 51892 - }, - { - "epoch": 1.33, - "learning_rate": 1.2299945637214376e-06, - "loss": 0.7544, - "step": 51893 - }, - { - "epoch": 1.33, - "learning_rate": 1.2299676349714157e-06, - "loss": 0.7451, - "step": 51894 - }, - { - "epoch": 1.33, - "learning_rate": 1.229940706045318e-06, - "loss": 0.5957, - "step": 51895 - }, - { - "epoch": 1.33, - "learning_rate": 1.229913776943166e-06, - "loss": 0.5493, - "step": 51896 - }, - { - "epoch": 1.33, - "learning_rate": 1.2298868476649788e-06, - "loss": 0.626, - "step": 51897 - }, - { - "epoch": 1.33, - "learning_rate": 1.2298599182107784e-06, - "loss": 0.5977, - "step": 51898 - }, - { - "epoch": 1.33, - "learning_rate": 1.229832988580584e-06, - "loss": 0.5874, - "step": 51899 - }, - { - "epoch": 1.33, - "learning_rate": 1.2298060587744177e-06, - "loss": 0.4788, - "step": 51900 - }, - { - "epoch": 1.33, - "learning_rate": 1.2297791287922995e-06, - "loss": 0.7822, - "step": 51901 - }, - { - "epoch": 1.33, - "learning_rate": 1.22975219863425e-06, - "loss": 0.5991, - "step": 51902 - }, - { - "epoch": 1.33, - "learning_rate": 1.2297252683002895e-06, - "loss": 0.6069, - "step": 51903 - }, - { - "epoch": 1.33, - "learning_rate": 1.2296983377904391e-06, - "loss": 0.8447, - "step": 51904 - }, - { - "epoch": 1.33, - "learning_rate": 1.2296714071047189e-06, - "loss": 0.7734, - "step": 51905 - }, - { - "epoch": 1.33, - "learning_rate": 1.2296444762431506e-06, - "loss": 0.8398, - "step": 51906 - }, - { - "epoch": 1.33, - "learning_rate": 1.2296175452057533e-06, - "loss": 0.5698, - "step": 51907 - }, - { - "epoch": 1.33, - "learning_rate": 1.229590613992549e-06, - "loss": 0.7109, - "step": 51908 - }, - { - "epoch": 1.33, - "learning_rate": 1.2295636826035574e-06, - "loss": 0.5703, - "step": 51909 - }, - { - "epoch": 1.33, - "learning_rate": 1.2295367510387995e-06, - "loss": 0.7539, - "step": 51910 - }, - { - "epoch": 1.33, - "learning_rate": 1.229509819298296e-06, - "loss": 0.5859, - "step": 51911 - }, - { - "epoch": 1.33, - "learning_rate": 1.229482887382067e-06, - "loss": 0.7334, - "step": 51912 - }, - { - "epoch": 1.33, - "learning_rate": 1.2294559552901338e-06, - "loss": 0.3345, - "step": 51913 - }, - { - "epoch": 1.33, - "learning_rate": 1.2294290230225166e-06, - "loss": 0.7529, - "step": 51914 - }, - { - "epoch": 1.33, - "learning_rate": 1.2294020905792365e-06, - "loss": 0.6042, - "step": 51915 - }, - { - "epoch": 1.33, - "learning_rate": 1.2293751579603133e-06, - "loss": 0.7432, - "step": 51916 - }, - { - "epoch": 1.33, - "learning_rate": 1.2293482251657685e-06, - "loss": 0.6362, - "step": 51917 - }, - { - "epoch": 1.33, - "learning_rate": 1.229321292195622e-06, - "loss": 0.7656, - "step": 51918 - }, - { - "epoch": 1.33, - "learning_rate": 1.2292943590498947e-06, - "loss": 0.7363, - "step": 51919 - }, - { - "epoch": 1.33, - "learning_rate": 1.2292674257286073e-06, - "loss": 0.5181, - "step": 51920 - }, - { - "epoch": 1.33, - "learning_rate": 1.229240492231781e-06, - "loss": 0.6025, - "step": 51921 - }, - { - "epoch": 1.33, - "learning_rate": 1.229213558559435e-06, - "loss": 0.5656, - "step": 51922 - }, - { - "epoch": 1.33, - "learning_rate": 1.2291866247115909e-06, - "loss": 0.7432, - "step": 51923 - }, - { - "epoch": 1.33, - "learning_rate": 1.229159690688269e-06, - "loss": 0.6528, - "step": 51924 - }, - { - "epoch": 1.33, - "learning_rate": 1.2291327564894904e-06, - "loss": 0.8027, - "step": 51925 - }, - { - "epoch": 1.33, - "learning_rate": 1.2291058221152754e-06, - "loss": 0.6694, - "step": 51926 - }, - { - "epoch": 1.33, - "learning_rate": 1.2290788875656446e-06, - "loss": 0.7129, - "step": 51927 - }, - { - "epoch": 1.33, - "learning_rate": 1.2290519528406184e-06, - "loss": 0.6587, - "step": 51928 - }, - { - "epoch": 1.33, - "learning_rate": 1.2290250179402178e-06, - "loss": 0.7163, - "step": 51929 - }, - { - "epoch": 1.33, - "learning_rate": 1.228998082864463e-06, - "loss": 0.8184, - "step": 51930 - }, - { - "epoch": 1.33, - "learning_rate": 1.2289711476133754e-06, - "loss": 0.6602, - "step": 51931 - }, - { - "epoch": 1.33, - "learning_rate": 1.2289442121869748e-06, - "loss": 0.6826, - "step": 51932 - }, - { - "epoch": 1.33, - "learning_rate": 1.2289172765852822e-06, - "loss": 0.6406, - "step": 51933 - }, - { - "epoch": 1.33, - "learning_rate": 1.228890340808318e-06, - "loss": 0.7822, - "step": 51934 - }, - { - "epoch": 1.33, - "learning_rate": 1.2288634048561032e-06, - "loss": 0.4639, - "step": 51935 - }, - { - "epoch": 1.33, - "learning_rate": 1.2288364687286583e-06, - "loss": 0.7314, - "step": 51936 - }, - { - "epoch": 1.33, - "learning_rate": 1.2288095324260034e-06, - "loss": 0.7324, - "step": 51937 - }, - { - "epoch": 1.33, - "learning_rate": 1.22878259594816e-06, - "loss": 0.6636, - "step": 51938 - }, - { - "epoch": 1.33, - "learning_rate": 1.228755659295148e-06, - "loss": 0.7676, - "step": 51939 - }, - { - "epoch": 1.33, - "learning_rate": 1.2287287224669887e-06, - "loss": 0.6289, - "step": 51940 - }, - { - "epoch": 1.33, - "learning_rate": 1.228701785463702e-06, - "loss": 0.7842, - "step": 51941 - }, - { - "epoch": 1.33, - "learning_rate": 1.228674848285309e-06, - "loss": 0.7617, - "step": 51942 - }, - { - "epoch": 1.33, - "learning_rate": 1.22864791093183e-06, - "loss": 0.6294, - "step": 51943 - }, - { - "epoch": 1.33, - "learning_rate": 1.2286209734032863e-06, - "loss": 0.3983, - "step": 51944 - }, - { - "epoch": 1.33, - "learning_rate": 1.2285940356996973e-06, - "loss": 0.6572, - "step": 51945 - }, - { - "epoch": 1.33, - "learning_rate": 1.2285670978210849e-06, - "loss": 0.7725, - "step": 51946 - }, - { - "epoch": 1.33, - "learning_rate": 1.2285401597674689e-06, - "loss": 0.4485, - "step": 51947 - }, - { - "epoch": 1.33, - "learning_rate": 1.2285132215388705e-06, - "loss": 0.6562, - "step": 51948 - }, - { - "epoch": 1.33, - "learning_rate": 1.2284862831353098e-06, - "loss": 0.5981, - "step": 51949 - }, - { - "epoch": 1.33, - "learning_rate": 1.2284593445568076e-06, - "loss": 0.5347, - "step": 51950 - }, - { - "epoch": 1.33, - "learning_rate": 1.2284324058033848e-06, - "loss": 0.6841, - "step": 51951 - }, - { - "epoch": 1.33, - "learning_rate": 1.2284054668750618e-06, - "loss": 0.5258, - "step": 51952 - }, - { - "epoch": 1.33, - "learning_rate": 1.228378527771859e-06, - "loss": 0.75, - "step": 51953 - }, - { - "epoch": 1.33, - "learning_rate": 1.2283515884937977e-06, - "loss": 0.436, - "step": 51954 - }, - { - "epoch": 1.33, - "learning_rate": 1.2283246490408976e-06, - "loss": 0.7402, - "step": 51955 - }, - { - "epoch": 1.33, - "learning_rate": 1.22829770941318e-06, - "loss": 0.7725, - "step": 51956 - }, - { - "epoch": 1.33, - "learning_rate": 1.2282707696106653e-06, - "loss": 0.8018, - "step": 51957 - }, - { - "epoch": 1.33, - "learning_rate": 1.2282438296333742e-06, - "loss": 0.7441, - "step": 51958 - }, - { - "epoch": 1.33, - "learning_rate": 1.2282168894813274e-06, - "loss": 0.5083, - "step": 51959 - }, - { - "epoch": 1.33, - "learning_rate": 1.2281899491545454e-06, - "loss": 0.5947, - "step": 51960 - }, - { - "epoch": 1.33, - "learning_rate": 1.2281630086530489e-06, - "loss": 0.666, - "step": 51961 - }, - { - "epoch": 1.33, - "learning_rate": 1.2281360679768581e-06, - "loss": 0.6387, - "step": 51962 - }, - { - "epoch": 1.33, - "learning_rate": 1.2281091271259944e-06, - "loss": 0.7871, - "step": 51963 - }, - { - "epoch": 1.33, - "learning_rate": 1.2280821861004777e-06, - "loss": 0.7881, - "step": 51964 - }, - { - "epoch": 1.33, - "learning_rate": 1.2280552449003291e-06, - "loss": 0.6606, - "step": 51965 - }, - { - "epoch": 1.33, - "learning_rate": 1.2280283035255693e-06, - "loss": 0.5974, - "step": 51966 - }, - { - "epoch": 1.33, - "learning_rate": 1.2280013619762187e-06, - "loss": 0.7275, - "step": 51967 - }, - { - "epoch": 1.33, - "learning_rate": 1.2279744202522978e-06, - "loss": 0.9072, - "step": 51968 - }, - { - "epoch": 1.33, - "learning_rate": 1.2279474783538273e-06, - "loss": 0.6826, - "step": 51969 - }, - { - "epoch": 1.33, - "learning_rate": 1.2279205362808277e-06, - "loss": 0.6543, - "step": 51970 - }, - { - "epoch": 1.33, - "learning_rate": 1.2278935940333204e-06, - "loss": 0.7295, - "step": 51971 - }, - { - "epoch": 1.33, - "learning_rate": 1.227866651611325e-06, - "loss": 0.5308, - "step": 51972 - }, - { - "epoch": 1.33, - "learning_rate": 1.227839709014863e-06, - "loss": 0.5264, - "step": 51973 - }, - { - "epoch": 1.33, - "learning_rate": 1.2278127662439542e-06, - "loss": 0.7871, - "step": 51974 - }, - { - "epoch": 1.33, - "learning_rate": 1.2277858232986198e-06, - "loss": 0.6523, - "step": 51975 - }, - { - "epoch": 1.33, - "learning_rate": 1.22775888017888e-06, - "loss": 0.6245, - "step": 51976 - }, - { - "epoch": 1.33, - "learning_rate": 1.2277319368847561e-06, - "loss": 0.5828, - "step": 51977 - }, - { - "epoch": 1.33, - "learning_rate": 1.2277049934162681e-06, - "loss": 0.707, - "step": 51978 - }, - { - "epoch": 1.33, - "learning_rate": 1.227678049773437e-06, - "loss": 0.5806, - "step": 51979 - }, - { - "epoch": 1.33, - "learning_rate": 1.2276511059562831e-06, - "loss": 0.7285, - "step": 51980 - }, - { - "epoch": 1.33, - "learning_rate": 1.2276241619648273e-06, - "loss": 0.7969, - "step": 51981 - }, - { - "epoch": 1.33, - "learning_rate": 1.2275972177990903e-06, - "loss": 0.6294, - "step": 51982 - }, - { - "epoch": 1.33, - "learning_rate": 1.2275702734590922e-06, - "loss": 0.4729, - "step": 51983 - }, - { - "epoch": 1.33, - "learning_rate": 1.2275433289448544e-06, - "loss": 0.7656, - "step": 51984 - }, - { - "epoch": 1.33, - "learning_rate": 1.227516384256397e-06, - "loss": 0.573, - "step": 51985 - }, - { - "epoch": 1.33, - "learning_rate": 1.227489439393741e-06, - "loss": 0.7461, - "step": 51986 - }, - { - "epoch": 1.33, - "learning_rate": 1.2274624943569062e-06, - "loss": 0.6206, - "step": 51987 - }, - { - "epoch": 1.33, - "learning_rate": 1.2274355491459143e-06, - "loss": 0.7793, - "step": 51988 - }, - { - "epoch": 1.33, - "learning_rate": 1.2274086037607854e-06, - "loss": 0.585, - "step": 51989 - }, - { - "epoch": 1.33, - "learning_rate": 1.2273816582015401e-06, - "loss": 0.7725, - "step": 51990 - }, - { - "epoch": 1.33, - "learning_rate": 1.227354712468199e-06, - "loss": 0.7871, - "step": 51991 - }, - { - "epoch": 1.33, - "learning_rate": 1.2273277665607833e-06, - "loss": 0.7822, - "step": 51992 - }, - { - "epoch": 1.33, - "learning_rate": 1.2273008204793128e-06, - "loss": 0.6895, - "step": 51993 - }, - { - "epoch": 1.33, - "learning_rate": 1.2272738742238085e-06, - "loss": 0.7285, - "step": 51994 - }, - { - "epoch": 1.33, - "learning_rate": 1.227246927794291e-06, - "loss": 0.6782, - "step": 51995 - }, - { - "epoch": 1.33, - "learning_rate": 1.2272199811907813e-06, - "loss": 0.6851, - "step": 51996 - }, - { - "epoch": 1.33, - "learning_rate": 1.2271930344132994e-06, - "loss": 0.7578, - "step": 51997 - }, - { - "epoch": 1.33, - "learning_rate": 1.2271660874618665e-06, - "loss": 0.6079, - "step": 51998 - }, - { - "epoch": 1.33, - "learning_rate": 1.2271391403365029e-06, - "loss": 0.5635, - "step": 51999 - }, - { - "epoch": 1.33, - "learning_rate": 1.227112193037229e-06, - "loss": 0.7236, - "step": 52000 - }, - { - "epoch": 1.33, - "learning_rate": 1.2270852455640662e-06, - "loss": 0.6504, - "step": 52001 - }, - { - "epoch": 1.33, - "learning_rate": 1.2270582979170344e-06, - "loss": 0.5835, - "step": 52002 - }, - { - "epoch": 1.33, - "learning_rate": 1.2270313500961544e-06, - "loss": 0.792, - "step": 52003 - }, - { - "epoch": 1.33, - "learning_rate": 1.227004402101447e-06, - "loss": 0.5269, - "step": 52004 - }, - { - "epoch": 1.33, - "learning_rate": 1.226977453932933e-06, - "loss": 0.5938, - "step": 52005 - }, - { - "epoch": 1.33, - "learning_rate": 1.2269505055906327e-06, - "loss": 0.6191, - "step": 52006 - }, - { - "epoch": 1.33, - "learning_rate": 1.226923557074567e-06, - "loss": 0.7051, - "step": 52007 - }, - { - "epoch": 1.33, - "learning_rate": 1.2268966083847559e-06, - "loss": 0.522, - "step": 52008 - }, - { - "epoch": 1.33, - "learning_rate": 1.2268696595212207e-06, - "loss": 0.7998, - "step": 52009 - }, - { - "epoch": 1.33, - "learning_rate": 1.226842710483982e-06, - "loss": 0.7451, - "step": 52010 - }, - { - "epoch": 1.33, - "learning_rate": 1.22681576127306e-06, - "loss": 0.5908, - "step": 52011 - }, - { - "epoch": 1.33, - "learning_rate": 1.2267888118884757e-06, - "loss": 0.6758, - "step": 52012 - }, - { - "epoch": 1.33, - "learning_rate": 1.2267618623302499e-06, - "loss": 0.6777, - "step": 52013 - }, - { - "epoch": 1.33, - "learning_rate": 1.2267349125984026e-06, - "loss": 0.6562, - "step": 52014 - }, - { - "epoch": 1.33, - "learning_rate": 1.2267079626929548e-06, - "loss": 0.5693, - "step": 52015 - }, - { - "epoch": 1.33, - "learning_rate": 1.2266810126139276e-06, - "loss": 0.4524, - "step": 52016 - }, - { - "epoch": 1.33, - "learning_rate": 1.226654062361341e-06, - "loss": 0.7617, - "step": 52017 - }, - { - "epoch": 1.33, - "learning_rate": 1.2266271119352155e-06, - "loss": 0.5396, - "step": 52018 - }, - { - "epoch": 1.33, - "learning_rate": 1.226600161335572e-06, - "loss": 0.5625, - "step": 52019 - }, - { - "epoch": 1.33, - "learning_rate": 1.2265732105624314e-06, - "loss": 0.8691, - "step": 52020 - }, - { - "epoch": 1.33, - "learning_rate": 1.226546259615814e-06, - "loss": 0.7744, - "step": 52021 - }, - { - "epoch": 1.33, - "learning_rate": 1.2265193084957408e-06, - "loss": 0.6592, - "step": 52022 - }, - { - "epoch": 1.33, - "learning_rate": 1.226492357202232e-06, - "loss": 0.6914, - "step": 52023 - }, - { - "epoch": 1.33, - "learning_rate": 1.2264654057353085e-06, - "loss": 0.4208, - "step": 52024 - }, - { - "epoch": 1.33, - "learning_rate": 1.226438454094991e-06, - "loss": 0.4604, - "step": 52025 - }, - { - "epoch": 1.33, - "learning_rate": 1.2264115022812997e-06, - "loss": 0.6318, - "step": 52026 - }, - { - "epoch": 1.33, - "learning_rate": 1.2263845502942553e-06, - "loss": 0.7461, - "step": 52027 - }, - { - "epoch": 1.33, - "learning_rate": 1.2263575981338792e-06, - "loss": 0.7705, - "step": 52028 - }, - { - "epoch": 1.33, - "learning_rate": 1.2263306458001909e-06, - "loss": 0.7773, - "step": 52029 - }, - { - "epoch": 1.33, - "learning_rate": 1.2263036932932123e-06, - "loss": 0.5903, - "step": 52030 - }, - { - "epoch": 1.33, - "learning_rate": 1.2262767406129631e-06, - "loss": 0.7061, - "step": 52031 - }, - { - "epoch": 1.33, - "learning_rate": 1.2262497877594642e-06, - "loss": 0.5767, - "step": 52032 - }, - { - "epoch": 1.33, - "learning_rate": 1.2262228347327358e-06, - "loss": 0.6982, - "step": 52033 - }, - { - "epoch": 1.33, - "learning_rate": 1.2261958815327998e-06, - "loss": 0.6812, - "step": 52034 - }, - { - "epoch": 1.33, - "learning_rate": 1.2261689281596752e-06, - "loss": 0.6172, - "step": 52035 - }, - { - "epoch": 1.33, - "learning_rate": 1.2261419746133842e-06, - "loss": 0.605, - "step": 52036 - }, - { - "epoch": 1.33, - "learning_rate": 1.2261150208939461e-06, - "loss": 0.5776, - "step": 52037 - }, - { - "epoch": 1.33, - "learning_rate": 1.2260880670013824e-06, - "loss": 0.6167, - "step": 52038 - }, - { - "epoch": 1.33, - "learning_rate": 1.2260611129357135e-06, - "loss": 0.6592, - "step": 52039 - }, - { - "epoch": 1.33, - "learning_rate": 1.22603415869696e-06, - "loss": 0.6943, - "step": 52040 - }, - { - "epoch": 1.33, - "learning_rate": 1.2260072042851423e-06, - "loss": 0.5617, - "step": 52041 - }, - { - "epoch": 1.33, - "learning_rate": 1.2259802497002816e-06, - "loss": 0.7285, - "step": 52042 - }, - { - "epoch": 1.33, - "learning_rate": 1.2259532949423978e-06, - "loss": 0.7783, - "step": 52043 - }, - { - "epoch": 1.33, - "learning_rate": 1.2259263400115125e-06, - "loss": 0.7871, - "step": 52044 - }, - { - "epoch": 1.33, - "learning_rate": 1.2258993849076452e-06, - "loss": 0.6594, - "step": 52045 - }, - { - "epoch": 1.33, - "learning_rate": 1.2258724296308177e-06, - "loss": 0.5889, - "step": 52046 - }, - { - "epoch": 1.33, - "learning_rate": 1.2258454741810499e-06, - "loss": 0.7715, - "step": 52047 - }, - { - "epoch": 1.33, - "learning_rate": 1.225818518558362e-06, - "loss": 0.5569, - "step": 52048 - }, - { - "epoch": 1.33, - "learning_rate": 1.225791562762776e-06, - "loss": 0.6367, - "step": 52049 - }, - { - "epoch": 1.33, - "learning_rate": 1.2257646067943114e-06, - "loss": 0.5774, - "step": 52050 - }, - { - "epoch": 1.33, - "learning_rate": 1.2257376506529895e-06, - "loss": 0.6592, - "step": 52051 - }, - { - "epoch": 1.33, - "learning_rate": 1.2257106943388306e-06, - "loss": 0.6885, - "step": 52052 - }, - { - "epoch": 1.33, - "learning_rate": 1.2256837378518553e-06, - "loss": 0.6514, - "step": 52053 - }, - { - "epoch": 1.33, - "learning_rate": 1.2256567811920842e-06, - "loss": 0.7285, - "step": 52054 - }, - { - "epoch": 1.33, - "learning_rate": 1.2256298243595381e-06, - "loss": 0.6396, - "step": 52055 - }, - { - "epoch": 1.33, - "learning_rate": 1.2256028673542377e-06, - "loss": 0.7168, - "step": 52056 - }, - { - "epoch": 1.33, - "learning_rate": 1.2255759101762039e-06, - "loss": 0.3921, - "step": 52057 - }, - { - "epoch": 1.33, - "learning_rate": 1.2255489528254566e-06, - "loss": 0.583, - "step": 52058 - }, - { - "epoch": 1.33, - "learning_rate": 1.2255219953020168e-06, - "loss": 0.6953, - "step": 52059 - }, - { - "epoch": 1.33, - "learning_rate": 1.2254950376059052e-06, - "loss": 0.5688, - "step": 52060 - }, - { - "epoch": 1.33, - "learning_rate": 1.2254680797371428e-06, - "loss": 0.6725, - "step": 52061 - }, - { - "epoch": 1.33, - "learning_rate": 1.2254411216957494e-06, - "loss": 0.5503, - "step": 52062 - }, - { - "epoch": 1.33, - "learning_rate": 1.2254141634817464e-06, - "loss": 0.4736, - "step": 52063 - }, - { - "epoch": 1.33, - "learning_rate": 1.225387205095154e-06, - "loss": 0.5679, - "step": 52064 - }, - { - "epoch": 1.33, - "learning_rate": 1.2253602465359929e-06, - "loss": 0.8252, - "step": 52065 - }, - { - "epoch": 1.33, - "learning_rate": 1.2253332878042841e-06, - "loss": 0.5625, - "step": 52066 - }, - { - "epoch": 1.33, - "learning_rate": 1.2253063289000475e-06, - "loss": 0.554, - "step": 52067 - }, - { - "epoch": 1.33, - "learning_rate": 1.2252793698233045e-06, - "loss": 0.7168, - "step": 52068 - }, - { - "epoch": 1.33, - "learning_rate": 1.2252524105740756e-06, - "loss": 0.5684, - "step": 52069 - }, - { - "epoch": 1.33, - "learning_rate": 1.225225451152381e-06, - "loss": 0.6968, - "step": 52070 - }, - { - "epoch": 1.33, - "learning_rate": 1.2251984915582418e-06, - "loss": 0.668, - "step": 52071 - }, - { - "epoch": 1.33, - "learning_rate": 1.2251715317916786e-06, - "loss": 0.541, - "step": 52072 - }, - { - "epoch": 1.33, - "learning_rate": 1.2251445718527116e-06, - "loss": 0.6514, - "step": 52073 - }, - { - "epoch": 1.33, - "learning_rate": 1.225117611741362e-06, - "loss": 0.6631, - "step": 52074 - }, - { - "epoch": 1.33, - "learning_rate": 1.2250906514576498e-06, - "loss": 0.7295, - "step": 52075 - }, - { - "epoch": 1.33, - "learning_rate": 1.2250636910015965e-06, - "loss": 0.6934, - "step": 52076 - }, - { - "epoch": 1.33, - "learning_rate": 1.2250367303732222e-06, - "loss": 0.7178, - "step": 52077 - }, - { - "epoch": 1.33, - "learning_rate": 1.2250097695725474e-06, - "loss": 0.7803, - "step": 52078 - }, - { - "epoch": 1.33, - "learning_rate": 1.224982808599593e-06, - "loss": 0.7666, - "step": 52079 - }, - { - "epoch": 1.33, - "learning_rate": 1.2249558474543798e-06, - "loss": 0.627, - "step": 52080 - }, - { - "epoch": 1.33, - "learning_rate": 1.2249288861369283e-06, - "loss": 0.7822, - "step": 52081 - }, - { - "epoch": 1.33, - "learning_rate": 1.2249019246472589e-06, - "loss": 0.7646, - "step": 52082 - }, - { - "epoch": 1.33, - "learning_rate": 1.2248749629853923e-06, - "loss": 0.7285, - "step": 52083 - }, - { - "epoch": 1.33, - "learning_rate": 1.2248480011513496e-06, - "loss": 0.624, - "step": 52084 - }, - { - "epoch": 1.33, - "learning_rate": 1.2248210391451508e-06, - "loss": 0.481, - "step": 52085 - }, - { - "epoch": 1.33, - "learning_rate": 1.2247940769668174e-06, - "loss": 0.7983, - "step": 52086 - }, - { - "epoch": 1.34, - "learning_rate": 1.224767114616369e-06, - "loss": 0.6255, - "step": 52087 - }, - { - "epoch": 1.34, - "learning_rate": 1.224740152093827e-06, - "loss": 0.7852, - "step": 52088 - }, - { - "epoch": 1.34, - "learning_rate": 1.2247131893992115e-06, - "loss": 0.606, - "step": 52089 - }, - { - "epoch": 1.34, - "learning_rate": 1.2246862265325437e-06, - "loss": 0.5791, - "step": 52090 - }, - { - "epoch": 1.34, - "learning_rate": 1.2246592634938442e-06, - "loss": 0.5605, - "step": 52091 - }, - { - "epoch": 1.34, - "learning_rate": 1.224632300283133e-06, - "loss": 0.6255, - "step": 52092 - }, - { - "epoch": 1.34, - "learning_rate": 1.2246053369004314e-06, - "loss": 0.604, - "step": 52093 - }, - { - "epoch": 1.34, - "learning_rate": 1.2245783733457596e-06, - "loss": 0.792, - "step": 52094 - }, - { - "epoch": 1.34, - "learning_rate": 1.2245514096191386e-06, - "loss": 0.7334, - "step": 52095 - }, - { - "epoch": 1.34, - "learning_rate": 1.2245244457205893e-06, - "loss": 0.668, - "step": 52096 - }, - { - "epoch": 1.34, - "learning_rate": 1.2244974816501314e-06, - "loss": 0.4081, - "step": 52097 - }, - { - "epoch": 1.34, - "learning_rate": 1.2244705174077862e-06, - "loss": 0.6494, - "step": 52098 - }, - { - "epoch": 1.34, - "learning_rate": 1.2244435529935746e-06, - "loss": 0.7773, - "step": 52099 - }, - { - "epoch": 1.34, - "learning_rate": 1.2244165884075164e-06, - "loss": 0.7773, - "step": 52100 - }, - { - "epoch": 1.34, - "learning_rate": 1.2243896236496334e-06, - "loss": 0.8467, - "step": 52101 - }, - { - "epoch": 1.34, - "learning_rate": 1.224362658719945e-06, - "loss": 0.6978, - "step": 52102 - }, - { - "epoch": 1.34, - "learning_rate": 1.2243356936184726e-06, - "loss": 0.5728, - "step": 52103 - }, - { - "epoch": 1.34, - "learning_rate": 1.2243087283452364e-06, - "loss": 0.625, - "step": 52104 - }, - { - "epoch": 1.34, - "learning_rate": 1.2242817629002577e-06, - "loss": 0.5156, - "step": 52105 - }, - { - "epoch": 1.34, - "learning_rate": 1.2242547972835569e-06, - "loss": 0.6069, - "step": 52106 - }, - { - "epoch": 1.34, - "learning_rate": 1.2242278314951542e-06, - "loss": 0.7529, - "step": 52107 - }, - { - "epoch": 1.34, - "learning_rate": 1.2242008655350706e-06, - "loss": 0.7412, - "step": 52108 - }, - { - "epoch": 1.34, - "learning_rate": 1.2241738994033267e-06, - "loss": 0.6934, - "step": 52109 - }, - { - "epoch": 1.34, - "learning_rate": 1.2241469330999433e-06, - "loss": 0.5872, - "step": 52110 - }, - { - "epoch": 1.34, - "learning_rate": 1.2241199666249408e-06, - "loss": 0.6572, - "step": 52111 - }, - { - "epoch": 1.34, - "learning_rate": 1.2240929999783398e-06, - "loss": 0.3173, - "step": 52112 - }, - { - "epoch": 1.34, - "learning_rate": 1.2240660331601614e-06, - "loss": 0.5632, - "step": 52113 - }, - { - "epoch": 1.34, - "learning_rate": 1.2240390661704257e-06, - "loss": 0.4365, - "step": 52114 - }, - { - "epoch": 1.34, - "learning_rate": 1.2240120990091537e-06, - "loss": 0.5957, - "step": 52115 - }, - { - "epoch": 1.34, - "learning_rate": 1.2239851316763658e-06, - "loss": 0.5698, - "step": 52116 - }, - { - "epoch": 1.34, - "learning_rate": 1.223958164172083e-06, - "loss": 0.6406, - "step": 52117 - }, - { - "epoch": 1.34, - "learning_rate": 1.2239311964963254e-06, - "loss": 0.6523, - "step": 52118 - }, - { - "epoch": 1.34, - "learning_rate": 1.223904228649114e-06, - "loss": 0.7139, - "step": 52119 - }, - { - "epoch": 1.34, - "learning_rate": 1.2238772606304698e-06, - "loss": 0.6279, - "step": 52120 - }, - { - "epoch": 1.34, - "learning_rate": 1.223850292440413e-06, - "loss": 0.7236, - "step": 52121 - }, - { - "epoch": 1.34, - "learning_rate": 1.2238233240789644e-06, - "loss": 0.6738, - "step": 52122 - }, - { - "epoch": 1.34, - "learning_rate": 1.223796355546144e-06, - "loss": 0.7051, - "step": 52123 - }, - { - "epoch": 1.34, - "learning_rate": 1.2237693868419738e-06, - "loss": 0.6289, - "step": 52124 - }, - { - "epoch": 1.34, - "learning_rate": 1.2237424179664731e-06, - "loss": 0.6675, - "step": 52125 - }, - { - "epoch": 1.34, - "learning_rate": 1.2237154489196634e-06, - "loss": 0.6338, - "step": 52126 - }, - { - "epoch": 1.34, - "learning_rate": 1.223688479701565e-06, - "loss": 0.6313, - "step": 52127 - }, - { - "epoch": 1.34, - "learning_rate": 1.2236615103121985e-06, - "loss": 0.6111, - "step": 52128 - }, - { - "epoch": 1.34, - "learning_rate": 1.2236345407515846e-06, - "loss": 0.606, - "step": 52129 - }, - { - "epoch": 1.34, - "learning_rate": 1.2236075710197444e-06, - "loss": 0.6509, - "step": 52130 - }, - { - "epoch": 1.34, - "learning_rate": 1.2235806011166981e-06, - "loss": 0.5195, - "step": 52131 - }, - { - "epoch": 1.34, - "learning_rate": 1.223553631042466e-06, - "loss": 0.5151, - "step": 52132 - }, - { - "epoch": 1.34, - "learning_rate": 1.2235266607970696e-06, - "loss": 0.6875, - "step": 52133 - }, - { - "epoch": 1.34, - "learning_rate": 1.2234996903805289e-06, - "loss": 0.6992, - "step": 52134 - }, - { - "epoch": 1.34, - "learning_rate": 1.2234727197928646e-06, - "loss": 0.585, - "step": 52135 - }, - { - "epoch": 1.34, - "learning_rate": 1.2234457490340978e-06, - "loss": 0.6787, - "step": 52136 - }, - { - "epoch": 1.34, - "learning_rate": 1.223418778104249e-06, - "loss": 0.5825, - "step": 52137 - }, - { - "epoch": 1.34, - "learning_rate": 1.2233918070033382e-06, - "loss": 0.5085, - "step": 52138 - }, - { - "epoch": 1.34, - "learning_rate": 1.2233648357313867e-06, - "loss": 0.6138, - "step": 52139 - }, - { - "epoch": 1.34, - "learning_rate": 1.223337864288415e-06, - "loss": 0.7441, - "step": 52140 - }, - { - "epoch": 1.34, - "learning_rate": 1.2233108926744444e-06, - "loss": 0.7524, - "step": 52141 - }, - { - "epoch": 1.34, - "learning_rate": 1.2232839208894942e-06, - "loss": 0.6279, - "step": 52142 - }, - { - "epoch": 1.34, - "learning_rate": 1.2232569489335863e-06, - "loss": 0.7725, - "step": 52143 - }, - { - "epoch": 1.34, - "learning_rate": 1.2232299768067403e-06, - "loss": 0.8242, - "step": 52144 - }, - { - "epoch": 1.34, - "learning_rate": 1.2232030045089775e-06, - "loss": 0.6777, - "step": 52145 - }, - { - "epoch": 1.34, - "learning_rate": 1.2231760320403189e-06, - "loss": 0.4377, - "step": 52146 - }, - { - "epoch": 1.34, - "learning_rate": 1.2231490594007842e-06, - "loss": 0.4834, - "step": 52147 - }, - { - "epoch": 1.34, - "learning_rate": 1.2231220865903945e-06, - "loss": 0.7471, - "step": 52148 - }, - { - "epoch": 1.34, - "learning_rate": 1.2230951136091708e-06, - "loss": 0.7817, - "step": 52149 - }, - { - "epoch": 1.34, - "learning_rate": 1.2230681404571333e-06, - "loss": 0.5791, - "step": 52150 - }, - { - "epoch": 1.34, - "learning_rate": 1.223041167134303e-06, - "loss": 0.6543, - "step": 52151 - }, - { - "epoch": 1.34, - "learning_rate": 1.2230141936406996e-06, - "loss": 0.6216, - "step": 52152 - }, - { - "epoch": 1.34, - "learning_rate": 1.2229872199763451e-06, - "loss": 0.6797, - "step": 52153 - }, - { - "epoch": 1.34, - "learning_rate": 1.2229602461412592e-06, - "loss": 0.6021, - "step": 52154 - }, - { - "epoch": 1.34, - "learning_rate": 1.222933272135463e-06, - "loss": 0.6099, - "step": 52155 - }, - { - "epoch": 1.34, - "learning_rate": 1.2229062979589773e-06, - "loss": 0.4802, - "step": 52156 - }, - { - "epoch": 1.34, - "learning_rate": 1.2228793236118223e-06, - "loss": 0.667, - "step": 52157 - }, - { - "epoch": 1.34, - "learning_rate": 1.2228523490940188e-06, - "loss": 0.7295, - "step": 52158 - }, - { - "epoch": 1.34, - "learning_rate": 1.2228253744055876e-06, - "loss": 0.5552, - "step": 52159 - }, - { - "epoch": 1.34, - "learning_rate": 1.2227983995465495e-06, - "loss": 0.7197, - "step": 52160 - }, - { - "epoch": 1.34, - "learning_rate": 1.2227714245169244e-06, - "loss": 0.7539, - "step": 52161 - }, - { - "epoch": 1.34, - "learning_rate": 1.2227444493167335e-06, - "loss": 0.8057, - "step": 52162 - }, - { - "epoch": 1.34, - "learning_rate": 1.2227174739459979e-06, - "loss": 0.6063, - "step": 52163 - }, - { - "epoch": 1.34, - "learning_rate": 1.2226904984047373e-06, - "loss": 0.5376, - "step": 52164 - }, - { - "epoch": 1.34, - "learning_rate": 1.222663522692973e-06, - "loss": 0.6445, - "step": 52165 - }, - { - "epoch": 1.34, - "learning_rate": 1.2226365468107257e-06, - "loss": 0.6602, - "step": 52166 - }, - { - "epoch": 1.34, - "learning_rate": 1.2226095707580154e-06, - "loss": 0.6436, - "step": 52167 - }, - { - "epoch": 1.34, - "learning_rate": 1.2225825945348635e-06, - "loss": 0.7285, - "step": 52168 - }, - { - "epoch": 1.34, - "learning_rate": 1.22255561814129e-06, - "loss": 0.5247, - "step": 52169 - }, - { - "epoch": 1.34, - "learning_rate": 1.2225286415773167e-06, - "loss": 0.427, - "step": 52170 - }, - { - "epoch": 1.34, - "learning_rate": 1.2225016648429628e-06, - "loss": 0.7871, - "step": 52171 - }, - { - "epoch": 1.34, - "learning_rate": 1.2224746879382494e-06, - "loss": 0.5757, - "step": 52172 - }, - { - "epoch": 1.34, - "learning_rate": 1.2224477108631977e-06, - "loss": 0.5671, - "step": 52173 - }, - { - "epoch": 1.34, - "learning_rate": 1.222420733617828e-06, - "loss": 0.5088, - "step": 52174 - }, - { - "epoch": 1.34, - "learning_rate": 1.222393756202161e-06, - "loss": 0.605, - "step": 52175 - }, - { - "epoch": 1.34, - "learning_rate": 1.2223667786162174e-06, - "loss": 0.7998, - "step": 52176 - }, - { - "epoch": 1.34, - "learning_rate": 1.2223398008600176e-06, - "loss": 0.5728, - "step": 52177 - }, - { - "epoch": 1.34, - "learning_rate": 1.2223128229335826e-06, - "loss": 0.626, - "step": 52178 - }, - { - "epoch": 1.34, - "learning_rate": 1.2222858448369327e-06, - "loss": 0.7295, - "step": 52179 - }, - { - "epoch": 1.34, - "learning_rate": 1.2222588665700888e-06, - "loss": 0.7002, - "step": 52180 - }, - { - "epoch": 1.34, - "learning_rate": 1.2222318881330716e-06, - "loss": 0.3877, - "step": 52181 - }, - { - "epoch": 1.34, - "learning_rate": 1.2222049095259014e-06, - "loss": 0.5464, - "step": 52182 - }, - { - "epoch": 1.34, - "learning_rate": 1.2221779307485996e-06, - "loss": 0.7676, - "step": 52183 - }, - { - "epoch": 1.34, - "learning_rate": 1.2221509518011858e-06, - "loss": 0.6738, - "step": 52184 - }, - { - "epoch": 1.34, - "learning_rate": 1.2221239726836818e-06, - "loss": 0.7124, - "step": 52185 - }, - { - "epoch": 1.34, - "learning_rate": 1.2220969933961075e-06, - "loss": 0.6406, - "step": 52186 - }, - { - "epoch": 1.34, - "learning_rate": 1.2220700139384836e-06, - "loss": 0.6997, - "step": 52187 - }, - { - "epoch": 1.34, - "learning_rate": 1.2220430343108308e-06, - "loss": 0.6328, - "step": 52188 - }, - { - "epoch": 1.34, - "learning_rate": 1.2220160545131702e-06, - "loss": 0.7222, - "step": 52189 - }, - { - "epoch": 1.34, - "learning_rate": 1.221989074545522e-06, - "loss": 0.751, - "step": 52190 - }, - { - "epoch": 1.34, - "learning_rate": 1.221962094407907e-06, - "loss": 0.6782, - "step": 52191 - }, - { - "epoch": 1.34, - "learning_rate": 1.2219351141003455e-06, - "loss": 0.7832, - "step": 52192 - }, - { - "epoch": 1.34, - "learning_rate": 1.2219081336228588e-06, - "loss": 0.5928, - "step": 52193 - }, - { - "epoch": 1.34, - "learning_rate": 1.2218811529754672e-06, - "loss": 0.6294, - "step": 52194 - }, - { - "epoch": 1.34, - "learning_rate": 1.2218541721581913e-06, - "loss": 0.6758, - "step": 52195 - }, - { - "epoch": 1.34, - "learning_rate": 1.2218271911710521e-06, - "loss": 0.5713, - "step": 52196 - }, - { - "epoch": 1.34, - "learning_rate": 1.2218002100140699e-06, - "loss": 0.5928, - "step": 52197 - }, - { - "epoch": 1.34, - "learning_rate": 1.2217732286872654e-06, - "loss": 0.7285, - "step": 52198 - }, - { - "epoch": 1.34, - "learning_rate": 1.2217462471906593e-06, - "loss": 0.4734, - "step": 52199 - }, - { - "epoch": 1.34, - "learning_rate": 1.2217192655242725e-06, - "loss": 0.3972, - "step": 52200 - }, - { - "epoch": 1.34, - "learning_rate": 1.221692283688125e-06, - "loss": 0.5317, - "step": 52201 - }, - { - "epoch": 1.34, - "learning_rate": 1.2216653016822386e-06, - "loss": 0.5051, - "step": 52202 - }, - { - "epoch": 1.34, - "learning_rate": 1.221638319506633e-06, - "loss": 0.7725, - "step": 52203 - }, - { - "epoch": 1.34, - "learning_rate": 1.2216113371613289e-06, - "loss": 0.6436, - "step": 52204 - }, - { - "epoch": 1.34, - "learning_rate": 1.2215843546463472e-06, - "loss": 0.793, - "step": 52205 - }, - { - "epoch": 1.34, - "learning_rate": 1.2215573719617086e-06, - "loss": 0.6577, - "step": 52206 - }, - { - "epoch": 1.34, - "learning_rate": 1.2215303891074337e-06, - "loss": 0.6372, - "step": 52207 - }, - { - "epoch": 1.34, - "learning_rate": 1.2215034060835434e-06, - "loss": 0.7578, - "step": 52208 - }, - { - "epoch": 1.34, - "learning_rate": 1.2214764228900579e-06, - "loss": 0.5449, - "step": 52209 - }, - { - "epoch": 1.34, - "learning_rate": 1.2214494395269982e-06, - "loss": 0.6055, - "step": 52210 - }, - { - "epoch": 1.34, - "learning_rate": 1.2214224559943848e-06, - "loss": 0.481, - "step": 52211 - }, - { - "epoch": 1.34, - "learning_rate": 1.2213954722922386e-06, - "loss": 0.6201, - "step": 52212 - }, - { - "epoch": 1.34, - "learning_rate": 1.2213684884205797e-06, - "loss": 0.6846, - "step": 52213 - }, - { - "epoch": 1.34, - "learning_rate": 1.2213415043794293e-06, - "loss": 0.7051, - "step": 52214 - }, - { - "epoch": 1.34, - "learning_rate": 1.221314520168808e-06, - "loss": 0.6851, - "step": 52215 - }, - { - "epoch": 1.34, - "learning_rate": 1.2212875357887362e-06, - "loss": 0.666, - "step": 52216 - }, - { - "epoch": 1.34, - "learning_rate": 1.2212605512392347e-06, - "loss": 0.7959, - "step": 52217 - }, - { - "epoch": 1.34, - "learning_rate": 1.2212335665203243e-06, - "loss": 0.6064, - "step": 52218 - }, - { - "epoch": 1.34, - "learning_rate": 1.2212065816320254e-06, - "loss": 0.606, - "step": 52219 - }, - { - "epoch": 1.34, - "learning_rate": 1.221179596574359e-06, - "loss": 0.5181, - "step": 52220 - }, - { - "epoch": 1.34, - "learning_rate": 1.2211526113473453e-06, - "loss": 0.668, - "step": 52221 - }, - { - "epoch": 1.34, - "learning_rate": 1.2211256259510053e-06, - "loss": 0.6621, - "step": 52222 - }, - { - "epoch": 1.34, - "learning_rate": 1.2210986403853595e-06, - "loss": 0.5796, - "step": 52223 - }, - { - "epoch": 1.34, - "learning_rate": 1.221071654650429e-06, - "loss": 0.3679, - "step": 52224 - }, - { - "epoch": 1.34, - "learning_rate": 1.221044668746234e-06, - "loss": 0.5488, - "step": 52225 - }, - { - "epoch": 1.34, - "learning_rate": 1.2210176826727947e-06, - "loss": 0.6504, - "step": 52226 - }, - { - "epoch": 1.34, - "learning_rate": 1.2209906964301328e-06, - "loss": 0.7021, - "step": 52227 - }, - { - "epoch": 1.34, - "learning_rate": 1.2209637100182683e-06, - "loss": 0.6826, - "step": 52228 - }, - { - "epoch": 1.34, - "learning_rate": 1.220936723437222e-06, - "loss": 0.7383, - "step": 52229 - }, - { - "epoch": 1.34, - "learning_rate": 1.220909736687015e-06, - "loss": 0.7114, - "step": 52230 - }, - { - "epoch": 1.34, - "learning_rate": 1.2208827497676675e-06, - "loss": 0.7363, - "step": 52231 - }, - { - "epoch": 1.34, - "learning_rate": 1.2208557626791998e-06, - "loss": 0.5483, - "step": 52232 - }, - { - "epoch": 1.34, - "learning_rate": 1.2208287754216332e-06, - "loss": 0.5337, - "step": 52233 - }, - { - "epoch": 1.34, - "learning_rate": 1.2208017879949883e-06, - "loss": 0.7275, - "step": 52234 - }, - { - "epoch": 1.34, - "learning_rate": 1.2207748003992857e-06, - "loss": 0.7415, - "step": 52235 - }, - { - "epoch": 1.34, - "learning_rate": 1.2207478126345459e-06, - "loss": 0.6377, - "step": 52236 - }, - { - "epoch": 1.34, - "learning_rate": 1.2207208247007895e-06, - "loss": 0.5918, - "step": 52237 - }, - { - "epoch": 1.34, - "learning_rate": 1.2206938365980373e-06, - "loss": 0.5579, - "step": 52238 - }, - { - "epoch": 1.34, - "learning_rate": 1.2206668483263102e-06, - "loss": 0.6187, - "step": 52239 - }, - { - "epoch": 1.34, - "learning_rate": 1.2206398598856285e-06, - "loss": 0.564, - "step": 52240 - }, - { - "epoch": 1.34, - "learning_rate": 1.220612871276013e-06, - "loss": 0.6633, - "step": 52241 - }, - { - "epoch": 1.34, - "learning_rate": 1.2205858824974843e-06, - "loss": 0.5962, - "step": 52242 - }, - { - "epoch": 1.34, - "learning_rate": 1.2205588935500633e-06, - "loss": 0.6621, - "step": 52243 - }, - { - "epoch": 1.34, - "learning_rate": 1.2205319044337703e-06, - "loss": 0.55, - "step": 52244 - }, - { - "epoch": 1.34, - "learning_rate": 1.2205049151486265e-06, - "loss": 0.791, - "step": 52245 - }, - { - "epoch": 1.34, - "learning_rate": 1.2204779256946518e-06, - "loss": 0.5737, - "step": 52246 - }, - { - "epoch": 1.34, - "learning_rate": 1.2204509360718675e-06, - "loss": 0.626, - "step": 52247 - }, - { - "epoch": 1.34, - "learning_rate": 1.220423946280294e-06, - "loss": 0.5234, - "step": 52248 - }, - { - "epoch": 1.34, - "learning_rate": 1.220396956319952e-06, - "loss": 0.5986, - "step": 52249 - }, - { - "epoch": 1.34, - "learning_rate": 1.2203699661908627e-06, - "loss": 0.561, - "step": 52250 - }, - { - "epoch": 1.34, - "learning_rate": 1.2203429758930454e-06, - "loss": 0.7412, - "step": 52251 - }, - { - "epoch": 1.34, - "learning_rate": 1.2203159854265222e-06, - "loss": 0.7598, - "step": 52252 - }, - { - "epoch": 1.34, - "learning_rate": 1.2202889947913129e-06, - "loss": 0.7451, - "step": 52253 - }, - { - "epoch": 1.34, - "learning_rate": 1.2202620039874385e-06, - "loss": 0.3427, - "step": 52254 - }, - { - "epoch": 1.34, - "learning_rate": 1.2202350130149197e-06, - "loss": 0.6035, - "step": 52255 - }, - { - "epoch": 1.34, - "learning_rate": 1.2202080218737771e-06, - "loss": 0.7568, - "step": 52256 - }, - { - "epoch": 1.34, - "learning_rate": 1.2201810305640312e-06, - "loss": 0.7266, - "step": 52257 - }, - { - "epoch": 1.34, - "learning_rate": 1.220154039085703e-06, - "loss": 0.5464, - "step": 52258 - }, - { - "epoch": 1.34, - "learning_rate": 1.2201270474388126e-06, - "loss": 0.8105, - "step": 52259 - }, - { - "epoch": 1.34, - "learning_rate": 1.2201000556233816e-06, - "loss": 0.6265, - "step": 52260 - }, - { - "epoch": 1.34, - "learning_rate": 1.2200730636394296e-06, - "loss": 0.5537, - "step": 52261 - }, - { - "epoch": 1.34, - "learning_rate": 1.2200460714869782e-06, - "loss": 0.6147, - "step": 52262 - }, - { - "epoch": 1.34, - "learning_rate": 1.220019079166047e-06, - "loss": 0.8047, - "step": 52263 - }, - { - "epoch": 1.34, - "learning_rate": 1.219992086676658e-06, - "loss": 0.7471, - "step": 52264 - }, - { - "epoch": 1.34, - "learning_rate": 1.219965094018831e-06, - "loss": 0.5015, - "step": 52265 - }, - { - "epoch": 1.34, - "learning_rate": 1.219938101192587e-06, - "loss": 0.5278, - "step": 52266 - }, - { - "epoch": 1.34, - "learning_rate": 1.219911108197946e-06, - "loss": 0.4126, - "step": 52267 - }, - { - "epoch": 1.34, - "learning_rate": 1.2198841150349296e-06, - "loss": 0.7344, - "step": 52268 - }, - { - "epoch": 1.34, - "learning_rate": 1.2198571217035576e-06, - "loss": 0.707, - "step": 52269 - }, - { - "epoch": 1.34, - "learning_rate": 1.2198301282038514e-06, - "loss": 0.6274, - "step": 52270 - }, - { - "epoch": 1.34, - "learning_rate": 1.2198031345358314e-06, - "loss": 0.6406, - "step": 52271 - }, - { - "epoch": 1.34, - "learning_rate": 1.2197761406995181e-06, - "loss": 0.4661, - "step": 52272 - }, - { - "epoch": 1.34, - "learning_rate": 1.2197491466949326e-06, - "loss": 0.668, - "step": 52273 - }, - { - "epoch": 1.34, - "learning_rate": 1.2197221525220948e-06, - "loss": 0.7129, - "step": 52274 - }, - { - "epoch": 1.34, - "learning_rate": 1.2196951581810266e-06, - "loss": 0.6992, - "step": 52275 - }, - { - "epoch": 1.34, - "learning_rate": 1.2196681636717475e-06, - "loss": 0.6816, - "step": 52276 - }, - { - "epoch": 1.34, - "learning_rate": 1.2196411689942786e-06, - "loss": 0.605, - "step": 52277 - }, - { - "epoch": 1.34, - "learning_rate": 1.2196141741486404e-06, - "loss": 0.5787, - "step": 52278 - }, - { - "epoch": 1.34, - "learning_rate": 1.2195871791348537e-06, - "loss": 0.751, - "step": 52279 - }, - { - "epoch": 1.34, - "learning_rate": 1.2195601839529394e-06, - "loss": 0.5942, - "step": 52280 - }, - { - "epoch": 1.34, - "learning_rate": 1.219533188602918e-06, - "loss": 0.6572, - "step": 52281 - }, - { - "epoch": 1.34, - "learning_rate": 1.2195061930848099e-06, - "loss": 0.6021, - "step": 52282 - }, - { - "epoch": 1.34, - "learning_rate": 1.2194791973986363e-06, - "loss": 0.4277, - "step": 52283 - }, - { - "epoch": 1.34, - "learning_rate": 1.2194522015444174e-06, - "loss": 0.6235, - "step": 52284 - }, - { - "epoch": 1.34, - "learning_rate": 1.2194252055221742e-06, - "loss": 0.6699, - "step": 52285 - }, - { - "epoch": 1.34, - "learning_rate": 1.219398209331927e-06, - "loss": 0.668, - "step": 52286 - }, - { - "epoch": 1.34, - "learning_rate": 1.2193712129736967e-06, - "loss": 0.5601, - "step": 52287 - }, - { - "epoch": 1.34, - "learning_rate": 1.2193442164475038e-06, - "loss": 0.6758, - "step": 52288 - }, - { - "epoch": 1.34, - "learning_rate": 1.2193172197533693e-06, - "loss": 0.7446, - "step": 52289 - }, - { - "epoch": 1.34, - "learning_rate": 1.2192902228913137e-06, - "loss": 0.7412, - "step": 52290 - }, - { - "epoch": 1.34, - "learning_rate": 1.2192632258613578e-06, - "loss": 0.4156, - "step": 52291 - }, - { - "epoch": 1.34, - "learning_rate": 1.2192362286635218e-06, - "loss": 0.6851, - "step": 52292 - }, - { - "epoch": 1.34, - "learning_rate": 1.219209231297827e-06, - "loss": 0.4758, - "step": 52293 - }, - { - "epoch": 1.34, - "learning_rate": 1.2191822337642936e-06, - "loss": 0.7168, - "step": 52294 - }, - { - "epoch": 1.34, - "learning_rate": 1.2191552360629427e-06, - "loss": 0.6177, - "step": 52295 - }, - { - "epoch": 1.34, - "learning_rate": 1.2191282381937944e-06, - "loss": 0.6655, - "step": 52296 - }, - { - "epoch": 1.34, - "learning_rate": 1.2191012401568696e-06, - "loss": 0.7007, - "step": 52297 - }, - { - "epoch": 1.34, - "learning_rate": 1.2190742419521893e-06, - "loss": 0.5493, - "step": 52298 - }, - { - "epoch": 1.34, - "learning_rate": 1.2190472435797738e-06, - "loss": 0.8281, - "step": 52299 - }, - { - "epoch": 1.34, - "learning_rate": 1.2190202450396443e-06, - "loss": 0.6743, - "step": 52300 - }, - { - "epoch": 1.34, - "learning_rate": 1.2189932463318207e-06, - "loss": 0.6758, - "step": 52301 - }, - { - "epoch": 1.34, - "learning_rate": 1.2189662474563241e-06, - "loss": 0.6797, - "step": 52302 - }, - { - "epoch": 1.34, - "learning_rate": 1.2189392484131748e-06, - "loss": 0.7578, - "step": 52303 - }, - { - "epoch": 1.34, - "learning_rate": 1.2189122492023942e-06, - "loss": 0.6738, - "step": 52304 - }, - { - "epoch": 1.34, - "learning_rate": 1.2188852498240026e-06, - "loss": 0.6895, - "step": 52305 - }, - { - "epoch": 1.34, - "learning_rate": 1.2188582502780204e-06, - "loss": 0.7939, - "step": 52306 - }, - { - "epoch": 1.34, - "learning_rate": 1.2188312505644684e-06, - "loss": 0.8149, - "step": 52307 - }, - { - "epoch": 1.34, - "learning_rate": 1.2188042506833678e-06, - "loss": 0.7612, - "step": 52308 - }, - { - "epoch": 1.34, - "learning_rate": 1.2187772506347385e-06, - "loss": 0.7432, - "step": 52309 - }, - { - "epoch": 1.34, - "learning_rate": 1.2187502504186016e-06, - "loss": 0.6499, - "step": 52310 - }, - { - "epoch": 1.34, - "learning_rate": 1.2187232500349777e-06, - "loss": 0.6206, - "step": 52311 - }, - { - "epoch": 1.34, - "learning_rate": 1.2186962494838878e-06, - "loss": 0.4639, - "step": 52312 - }, - { - "epoch": 1.34, - "learning_rate": 1.2186692487653516e-06, - "loss": 0.7246, - "step": 52313 - }, - { - "epoch": 1.34, - "learning_rate": 1.2186422478793908e-06, - "loss": 0.7383, - "step": 52314 - }, - { - "epoch": 1.34, - "learning_rate": 1.2186152468260256e-06, - "loss": 0.4672, - "step": 52315 - }, - { - "epoch": 1.34, - "learning_rate": 1.2185882456052765e-06, - "loss": 0.5693, - "step": 52316 - }, - { - "epoch": 1.34, - "learning_rate": 1.218561244217165e-06, - "loss": 0.7622, - "step": 52317 - }, - { - "epoch": 1.34, - "learning_rate": 1.2185342426617106e-06, - "loss": 0.4612, - "step": 52318 - }, - { - "epoch": 1.34, - "learning_rate": 1.218507240938935e-06, - "loss": 0.7539, - "step": 52319 - }, - { - "epoch": 1.34, - "learning_rate": 1.2184802390488584e-06, - "loss": 0.7793, - "step": 52320 - }, - { - "epoch": 1.34, - "learning_rate": 1.2184532369915015e-06, - "loss": 0.6709, - "step": 52321 - }, - { - "epoch": 1.34, - "learning_rate": 1.2184262347668847e-06, - "loss": 0.4741, - "step": 52322 - }, - { - "epoch": 1.34, - "learning_rate": 1.2183992323750294e-06, - "loss": 0.8066, - "step": 52323 - }, - { - "epoch": 1.34, - "learning_rate": 1.2183722298159555e-06, - "loss": 0.6182, - "step": 52324 - }, - { - "epoch": 1.34, - "learning_rate": 1.2183452270896846e-06, - "loss": 0.667, - "step": 52325 - }, - { - "epoch": 1.34, - "learning_rate": 1.2183182241962362e-06, - "loss": 0.5845, - "step": 52326 - }, - { - "epoch": 1.34, - "learning_rate": 1.2182912211356319e-06, - "loss": 0.7363, - "step": 52327 - }, - { - "epoch": 1.34, - "learning_rate": 1.2182642179078918e-06, - "loss": 0.6411, - "step": 52328 - }, - { - "epoch": 1.34, - "learning_rate": 1.2182372145130368e-06, - "loss": 0.6846, - "step": 52329 - }, - { - "epoch": 1.34, - "learning_rate": 1.2182102109510878e-06, - "loss": 0.4487, - "step": 52330 - }, - { - "epoch": 1.34, - "learning_rate": 1.2181832072220654e-06, - "loss": 0.626, - "step": 52331 - }, - { - "epoch": 1.34, - "learning_rate": 1.2181562033259898e-06, - "loss": 0.5757, - "step": 52332 - }, - { - "epoch": 1.34, - "learning_rate": 1.2181291992628824e-06, - "loss": 0.6396, - "step": 52333 - }, - { - "epoch": 1.34, - "learning_rate": 1.218102195032763e-06, - "loss": 0.7471, - "step": 52334 - }, - { - "epoch": 1.34, - "learning_rate": 1.2180751906356532e-06, - "loss": 0.5513, - "step": 52335 - }, - { - "epoch": 1.34, - "learning_rate": 1.2180481860715731e-06, - "loss": 0.6641, - "step": 52336 - }, - { - "epoch": 1.34, - "learning_rate": 1.2180211813405433e-06, - "loss": 0.7344, - "step": 52337 - }, - { - "epoch": 1.34, - "learning_rate": 1.2179941764425852e-06, - "loss": 0.752, - "step": 52338 - }, - { - "epoch": 1.34, - "learning_rate": 1.217967171377719e-06, - "loss": 0.7871, - "step": 52339 - }, - { - "epoch": 1.34, - "learning_rate": 1.217940166145965e-06, - "loss": 0.7256, - "step": 52340 - }, - { - "epoch": 1.34, - "learning_rate": 1.2179131607473443e-06, - "loss": 0.7656, - "step": 52341 - }, - { - "epoch": 1.34, - "learning_rate": 1.2178861551818775e-06, - "loss": 0.6055, - "step": 52342 - }, - { - "epoch": 1.34, - "learning_rate": 1.2178591494495854e-06, - "loss": 0.6167, - "step": 52343 - }, - { - "epoch": 1.34, - "learning_rate": 1.2178321435504887e-06, - "loss": 0.7383, - "step": 52344 - }, - { - "epoch": 1.34, - "learning_rate": 1.2178051374846076e-06, - "loss": 0.6836, - "step": 52345 - }, - { - "epoch": 1.34, - "learning_rate": 1.2177781312519635e-06, - "loss": 0.5974, - "step": 52346 - }, - { - "epoch": 1.34, - "learning_rate": 1.2177511248525763e-06, - "loss": 0.6416, - "step": 52347 - }, - { - "epoch": 1.34, - "learning_rate": 1.2177241182864672e-06, - "loss": 0.4988, - "step": 52348 - }, - { - "epoch": 1.34, - "learning_rate": 1.2176971115536567e-06, - "loss": 0.6611, - "step": 52349 - }, - { - "epoch": 1.34, - "learning_rate": 1.217670104654166e-06, - "loss": 0.4407, - "step": 52350 - }, - { - "epoch": 1.34, - "learning_rate": 1.2176430975880147e-06, - "loss": 0.7676, - "step": 52351 - }, - { - "epoch": 1.34, - "learning_rate": 1.2176160903552244e-06, - "loss": 0.5033, - "step": 52352 - }, - { - "epoch": 1.34, - "learning_rate": 1.2175890829558153e-06, - "loss": 0.8174, - "step": 52353 - }, - { - "epoch": 1.34, - "learning_rate": 1.2175620753898083e-06, - "loss": 0.7168, - "step": 52354 - }, - { - "epoch": 1.34, - "learning_rate": 1.2175350676572243e-06, - "loss": 0.6484, - "step": 52355 - }, - { - "epoch": 1.34, - "learning_rate": 1.2175080597580836e-06, - "loss": 0.7529, - "step": 52356 - }, - { - "epoch": 1.34, - "learning_rate": 1.2174810516924066e-06, - "loss": 0.5842, - "step": 52357 - }, - { - "epoch": 1.34, - "learning_rate": 1.2174540434602146e-06, - "loss": 0.4377, - "step": 52358 - }, - { - "epoch": 1.34, - "learning_rate": 1.2174270350615282e-06, - "loss": 0.6865, - "step": 52359 - }, - { - "epoch": 1.34, - "learning_rate": 1.2174000264963677e-06, - "loss": 0.6924, - "step": 52360 - }, - { - "epoch": 1.34, - "learning_rate": 1.2173730177647541e-06, - "loss": 0.3939, - "step": 52361 - }, - { - "epoch": 1.34, - "learning_rate": 1.2173460088667078e-06, - "loss": 0.5503, - "step": 52362 - }, - { - "epoch": 1.34, - "learning_rate": 1.2173189998022499e-06, - "loss": 0.5215, - "step": 52363 - }, - { - "epoch": 1.34, - "learning_rate": 1.2172919905714005e-06, - "loss": 0.4844, - "step": 52364 - }, - { - "epoch": 1.34, - "learning_rate": 1.217264981174181e-06, - "loss": 0.5737, - "step": 52365 - }, - { - "epoch": 1.34, - "learning_rate": 1.2172379716106116e-06, - "loss": 0.521, - "step": 52366 - }, - { - "epoch": 1.34, - "learning_rate": 1.217210961880713e-06, - "loss": 0.4507, - "step": 52367 - }, - { - "epoch": 1.34, - "learning_rate": 1.2171839519845056e-06, - "loss": 0.5227, - "step": 52368 - }, - { - "epoch": 1.34, - "learning_rate": 1.2171569419220112e-06, - "loss": 0.6309, - "step": 52369 - }, - { - "epoch": 1.34, - "learning_rate": 1.2171299316932493e-06, - "loss": 0.6274, - "step": 52370 - }, - { - "epoch": 1.34, - "learning_rate": 1.217102921298241e-06, - "loss": 0.7588, - "step": 52371 - }, - { - "epoch": 1.34, - "learning_rate": 1.217075910737007e-06, - "loss": 0.5532, - "step": 52372 - }, - { - "epoch": 1.34, - "learning_rate": 1.2170489000095678e-06, - "loss": 0.6816, - "step": 52373 - }, - { - "epoch": 1.34, - "learning_rate": 1.2170218891159443e-06, - "loss": 0.4741, - "step": 52374 - }, - { - "epoch": 1.34, - "learning_rate": 1.2169948780561577e-06, - "loss": 0.7578, - "step": 52375 - }, - { - "epoch": 1.34, - "learning_rate": 1.2169678668302272e-06, - "loss": 0.6582, - "step": 52376 - }, - { - "epoch": 1.34, - "learning_rate": 1.216940855438175e-06, - "loss": 0.6982, - "step": 52377 - }, - { - "epoch": 1.34, - "learning_rate": 1.2169138438800207e-06, - "loss": 0.6094, - "step": 52378 - }, - { - "epoch": 1.34, - "learning_rate": 1.2168868321557857e-06, - "loss": 0.6221, - "step": 52379 - }, - { - "epoch": 1.34, - "learning_rate": 1.2168598202654905e-06, - "loss": 0.5449, - "step": 52380 - }, - { - "epoch": 1.34, - "learning_rate": 1.2168328082091555e-06, - "loss": 0.6953, - "step": 52381 - }, - { - "epoch": 1.34, - "learning_rate": 1.216805795986802e-06, - "loss": 0.6958, - "step": 52382 - }, - { - "epoch": 1.34, - "learning_rate": 1.2167787835984497e-06, - "loss": 0.6553, - "step": 52383 - }, - { - "epoch": 1.34, - "learning_rate": 1.2167517710441203e-06, - "loss": 0.5728, - "step": 52384 - }, - { - "epoch": 1.34, - "learning_rate": 1.2167247583238338e-06, - "loss": 0.5972, - "step": 52385 - }, - { - "epoch": 1.34, - "learning_rate": 1.2166977454376112e-06, - "loss": 0.4932, - "step": 52386 - }, - { - "epoch": 1.34, - "learning_rate": 1.2166707323854731e-06, - "loss": 0.5112, - "step": 52387 - }, - { - "epoch": 1.34, - "learning_rate": 1.2166437191674402e-06, - "loss": 0.4392, - "step": 52388 - }, - { - "epoch": 1.34, - "learning_rate": 1.2166167057835329e-06, - "loss": 0.5708, - "step": 52389 - }, - { - "epoch": 1.34, - "learning_rate": 1.2165896922337726e-06, - "loss": 0.6265, - "step": 52390 - }, - { - "epoch": 1.34, - "learning_rate": 1.2165626785181792e-06, - "loss": 0.7314, - "step": 52391 - }, - { - "epoch": 1.34, - "learning_rate": 1.2165356646367739e-06, - "loss": 0.6948, - "step": 52392 - }, - { - "epoch": 1.34, - "learning_rate": 1.216508650589577e-06, - "loss": 0.6123, - "step": 52393 - }, - { - "epoch": 1.34, - "learning_rate": 1.2164816363766095e-06, - "loss": 0.6484, - "step": 52394 - }, - { - "epoch": 1.34, - "learning_rate": 1.2164546219978922e-06, - "loss": 0.3704, - "step": 52395 - }, - { - "epoch": 1.34, - "learning_rate": 1.2164276074534451e-06, - "loss": 0.7168, - "step": 52396 - }, - { - "epoch": 1.34, - "learning_rate": 1.2164005927432896e-06, - "loss": 0.6528, - "step": 52397 - }, - { - "epoch": 1.34, - "learning_rate": 1.2163735778674461e-06, - "loss": 0.7754, - "step": 52398 - }, - { - "epoch": 1.34, - "learning_rate": 1.216346562825935e-06, - "loss": 0.7412, - "step": 52399 - }, - { - "epoch": 1.34, - "learning_rate": 1.2163195476187777e-06, - "loss": 0.7202, - "step": 52400 - }, - { - "epoch": 1.34, - "learning_rate": 1.2162925322459946e-06, - "loss": 0.7129, - "step": 52401 - }, - { - "epoch": 1.34, - "learning_rate": 1.216265516707606e-06, - "loss": 0.6445, - "step": 52402 - }, - { - "epoch": 1.34, - "learning_rate": 1.2162385010036324e-06, - "loss": 0.6875, - "step": 52403 - }, - { - "epoch": 1.34, - "learning_rate": 1.2162114851340956e-06, - "loss": 0.6201, - "step": 52404 - }, - { - "epoch": 1.34, - "learning_rate": 1.2161844690990154e-06, - "loss": 0.7383, - "step": 52405 - }, - { - "epoch": 1.34, - "learning_rate": 1.2161574528984124e-06, - "loss": 0.6392, - "step": 52406 - }, - { - "epoch": 1.34, - "learning_rate": 1.2161304365323079e-06, - "loss": 0.793, - "step": 52407 - }, - { - "epoch": 1.34, - "learning_rate": 1.216103420000722e-06, - "loss": 0.585, - "step": 52408 - }, - { - "epoch": 1.34, - "learning_rate": 1.2160764033036759e-06, - "loss": 0.6416, - "step": 52409 - }, - { - "epoch": 1.34, - "learning_rate": 1.2160493864411901e-06, - "loss": 0.521, - "step": 52410 - }, - { - "epoch": 1.34, - "learning_rate": 1.2160223694132852e-06, - "loss": 0.625, - "step": 52411 - }, - { - "epoch": 1.34, - "learning_rate": 1.2159953522199814e-06, - "loss": 0.5977, - "step": 52412 - }, - { - "epoch": 1.34, - "learning_rate": 1.2159683348613006e-06, - "loss": 0.5684, - "step": 52413 - }, - { - "epoch": 1.34, - "learning_rate": 1.2159413173372624e-06, - "loss": 0.6499, - "step": 52414 - }, - { - "epoch": 1.34, - "learning_rate": 1.2159142996478878e-06, - "loss": 0.6084, - "step": 52415 - }, - { - "epoch": 1.34, - "learning_rate": 1.2158872817931979e-06, - "loss": 0.6421, - "step": 52416 - }, - { - "epoch": 1.34, - "learning_rate": 1.2158602637732128e-06, - "loss": 0.667, - "step": 52417 - }, - { - "epoch": 1.34, - "learning_rate": 1.2158332455879532e-06, - "loss": 0.7217, - "step": 52418 - }, - { - "epoch": 1.34, - "learning_rate": 1.2158062272374404e-06, - "loss": 0.7515, - "step": 52419 - }, - { - "epoch": 1.34, - "learning_rate": 1.2157792087216946e-06, - "loss": 0.5613, - "step": 52420 - }, - { - "epoch": 1.34, - "learning_rate": 1.2157521900407366e-06, - "loss": 0.6113, - "step": 52421 - }, - { - "epoch": 1.34, - "learning_rate": 1.2157251711945866e-06, - "loss": 0.6826, - "step": 52422 - }, - { - "epoch": 1.34, - "learning_rate": 1.2156981521832663e-06, - "loss": 0.5391, - "step": 52423 - }, - { - "epoch": 1.34, - "learning_rate": 1.2156711330067954e-06, - "loss": 0.6133, - "step": 52424 - }, - { - "epoch": 1.34, - "learning_rate": 1.2156441136651956e-06, - "loss": 0.5591, - "step": 52425 - }, - { - "epoch": 1.34, - "learning_rate": 1.2156170941584867e-06, - "loss": 0.7212, - "step": 52426 - }, - { - "epoch": 1.34, - "learning_rate": 1.2155900744866895e-06, - "loss": 0.6094, - "step": 52427 - }, - { - "epoch": 1.34, - "learning_rate": 1.2155630546498251e-06, - "loss": 0.6548, - "step": 52428 - }, - { - "epoch": 1.34, - "learning_rate": 1.2155360346479142e-06, - "loss": 0.7422, - "step": 52429 - }, - { - "epoch": 1.34, - "learning_rate": 1.2155090144809772e-06, - "loss": 0.6343, - "step": 52430 - }, - { - "epoch": 1.34, - "learning_rate": 1.2154819941490346e-06, - "loss": 0.75, - "step": 52431 - }, - { - "epoch": 1.34, - "learning_rate": 1.2154549736521075e-06, - "loss": 0.7295, - "step": 52432 - }, - { - "epoch": 1.34, - "learning_rate": 1.2154279529902163e-06, - "loss": 0.7363, - "step": 52433 - }, - { - "epoch": 1.34, - "learning_rate": 1.2154009321633819e-06, - "loss": 0.7158, - "step": 52434 - }, - { - "epoch": 1.34, - "learning_rate": 1.215373911171625e-06, - "loss": 0.7295, - "step": 52435 - }, - { - "epoch": 1.34, - "learning_rate": 1.215346890014966e-06, - "loss": 0.5154, - "step": 52436 - }, - { - "epoch": 1.34, - "learning_rate": 1.215319868693426e-06, - "loss": 0.5552, - "step": 52437 - }, - { - "epoch": 1.34, - "learning_rate": 1.2152928472070255e-06, - "loss": 0.6851, - "step": 52438 - }, - { - "epoch": 1.34, - "learning_rate": 1.2152658255557847e-06, - "loss": 0.7349, - "step": 52439 - }, - { - "epoch": 1.34, - "learning_rate": 1.2152388037397256e-06, - "loss": 0.6021, - "step": 52440 - }, - { - "epoch": 1.34, - "learning_rate": 1.2152117817588675e-06, - "loss": 0.6699, - "step": 52441 - }, - { - "epoch": 1.34, - "learning_rate": 1.2151847596132316e-06, - "loss": 0.6562, - "step": 52442 - }, - { - "epoch": 1.34, - "learning_rate": 1.2151577373028386e-06, - "loss": 0.6177, - "step": 52443 - }, - { - "epoch": 1.34, - "learning_rate": 1.2151307148277094e-06, - "loss": 0.8857, - "step": 52444 - }, - { - "epoch": 1.34, - "learning_rate": 1.2151036921878646e-06, - "loss": 0.5781, - "step": 52445 - }, - { - "epoch": 1.34, - "learning_rate": 1.2150766693833247e-06, - "loss": 0.6709, - "step": 52446 - }, - { - "epoch": 1.34, - "learning_rate": 1.2150496464141103e-06, - "loss": 0.647, - "step": 52447 - }, - { - "epoch": 1.34, - "learning_rate": 1.2150226232802424e-06, - "loss": 0.751, - "step": 52448 - }, - { - "epoch": 1.34, - "learning_rate": 1.2149955999817417e-06, - "loss": 0.5489, - "step": 52449 - }, - { - "epoch": 1.34, - "learning_rate": 1.2149685765186285e-06, - "loss": 0.6279, - "step": 52450 - }, - { - "epoch": 1.34, - "learning_rate": 1.2149415528909236e-06, - "loss": 0.7959, - "step": 52451 - }, - { - "epoch": 1.34, - "learning_rate": 1.2149145290986483e-06, - "loss": 0.6597, - "step": 52452 - }, - { - "epoch": 1.34, - "learning_rate": 1.2148875051418226e-06, - "loss": 0.4551, - "step": 52453 - }, - { - "epoch": 1.34, - "learning_rate": 1.2148604810204674e-06, - "loss": 0.7656, - "step": 52454 - }, - { - "epoch": 1.34, - "learning_rate": 1.2148334567346035e-06, - "loss": 0.6558, - "step": 52455 - }, - { - "epoch": 1.34, - "learning_rate": 1.2148064322842514e-06, - "loss": 0.7227, - "step": 52456 - }, - { - "epoch": 1.34, - "learning_rate": 1.2147794076694319e-06, - "loss": 0.7861, - "step": 52457 - }, - { - "epoch": 1.34, - "learning_rate": 1.2147523828901656e-06, - "loss": 0.5322, - "step": 52458 - }, - { - "epoch": 1.34, - "learning_rate": 1.2147253579464737e-06, - "loss": 0.6943, - "step": 52459 - }, - { - "epoch": 1.34, - "learning_rate": 1.2146983328383761e-06, - "loss": 0.5083, - "step": 52460 - }, - { - "epoch": 1.34, - "learning_rate": 1.214671307565894e-06, - "loss": 0.7578, - "step": 52461 - }, - { - "epoch": 1.34, - "learning_rate": 1.2146442821290477e-06, - "loss": 0.7075, - "step": 52462 - }, - { - "epoch": 1.34, - "learning_rate": 1.2146172565278586e-06, - "loss": 0.4963, - "step": 52463 - }, - { - "epoch": 1.34, - "learning_rate": 1.2145902307623465e-06, - "loss": 0.7002, - "step": 52464 - }, - { - "epoch": 1.34, - "learning_rate": 1.2145632048325327e-06, - "loss": 0.6934, - "step": 52465 - }, - { - "epoch": 1.34, - "learning_rate": 1.2145361787384375e-06, - "loss": 0.6519, - "step": 52466 - }, - { - "epoch": 1.34, - "learning_rate": 1.2145091524800821e-06, - "loss": 0.665, - "step": 52467 - }, - { - "epoch": 1.34, - "learning_rate": 1.2144821260574866e-06, - "loss": 0.5032, - "step": 52468 - }, - { - "epoch": 1.34, - "learning_rate": 1.2144550994706723e-06, - "loss": 0.5811, - "step": 52469 - }, - { - "epoch": 1.34, - "learning_rate": 1.2144280727196599e-06, - "loss": 0.6982, - "step": 52470 - }, - { - "epoch": 1.34, - "learning_rate": 1.2144010458044692e-06, - "loss": 0.4561, - "step": 52471 - }, - { - "epoch": 1.34, - "learning_rate": 1.2143740187251218e-06, - "loss": 0.6406, - "step": 52472 - }, - { - "epoch": 1.34, - "learning_rate": 1.2143469914816376e-06, - "loss": 0.5088, - "step": 52473 - }, - { - "epoch": 1.34, - "learning_rate": 1.2143199640740385e-06, - "loss": 0.6064, - "step": 52474 - }, - { - "epoch": 1.34, - "learning_rate": 1.2142929365023439e-06, - "loss": 0.7002, - "step": 52475 - }, - { - "epoch": 1.34, - "learning_rate": 1.2142659087665752e-06, - "loss": 0.6973, - "step": 52476 - }, - { - "epoch": 1.35, - "learning_rate": 1.2142388808667527e-06, - "loss": 0.7251, - "step": 52477 - }, - { - "epoch": 1.35, - "learning_rate": 1.2142118528028978e-06, - "loss": 0.6239, - "step": 52478 - }, - { - "epoch": 1.35, - "learning_rate": 1.2141848245750305e-06, - "loss": 0.5638, - "step": 52479 - }, - { - "epoch": 1.35, - "learning_rate": 1.2141577961831719e-06, - "loss": 0.6426, - "step": 52480 - }, - { - "epoch": 1.35, - "learning_rate": 1.2141307676273423e-06, - "loss": 0.5417, - "step": 52481 - }, - { - "epoch": 1.35, - "learning_rate": 1.2141037389075627e-06, - "loss": 0.6455, - "step": 52482 - }, - { - "epoch": 1.35, - "learning_rate": 1.2140767100238537e-06, - "loss": 0.5771, - "step": 52483 - }, - { - "epoch": 1.35, - "learning_rate": 1.2140496809762361e-06, - "loss": 0.5182, - "step": 52484 - }, - { - "epoch": 1.35, - "learning_rate": 1.2140226517647304e-06, - "loss": 0.7549, - "step": 52485 - }, - { - "epoch": 1.35, - "learning_rate": 1.2139956223893575e-06, - "loss": 0.7178, - "step": 52486 - }, - { - "epoch": 1.35, - "learning_rate": 1.2139685928501377e-06, - "loss": 0.6343, - "step": 52487 - }, - { - "epoch": 1.35, - "learning_rate": 1.2139415631470924e-06, - "loss": 0.6338, - "step": 52488 - }, - { - "epoch": 1.35, - "learning_rate": 1.2139145332802417e-06, - "loss": 0.6841, - "step": 52489 - }, - { - "epoch": 1.35, - "learning_rate": 1.2138875032496062e-06, - "loss": 0.5713, - "step": 52490 - }, - { - "epoch": 1.35, - "learning_rate": 1.2138604730552073e-06, - "loss": 0.5991, - "step": 52491 - }, - { - "epoch": 1.35, - "learning_rate": 1.213833442697065e-06, - "loss": 0.7046, - "step": 52492 - }, - { - "epoch": 1.35, - "learning_rate": 1.2138064121752004e-06, - "loss": 0.5713, - "step": 52493 - }, - { - "epoch": 1.35, - "learning_rate": 1.213779381489634e-06, - "loss": 0.8574, - "step": 52494 - }, - { - "epoch": 1.35, - "learning_rate": 1.2137523506403868e-06, - "loss": 0.7979, - "step": 52495 - }, - { - "epoch": 1.35, - "learning_rate": 1.2137253196274788e-06, - "loss": 0.7383, - "step": 52496 - }, - { - "epoch": 1.35, - "learning_rate": 1.2136982884509314e-06, - "loss": 0.5266, - "step": 52497 - }, - { - "epoch": 1.35, - "learning_rate": 1.213671257110765e-06, - "loss": 0.71, - "step": 52498 - }, - { - "epoch": 1.35, - "learning_rate": 1.2136442256070005e-06, - "loss": 0.647, - "step": 52499 - }, - { - "epoch": 1.35, - "learning_rate": 1.2136171939396582e-06, - "loss": 0.6919, - "step": 52500 - }, - { - "epoch": 1.35, - "learning_rate": 1.2135901621087595e-06, - "loss": 0.3462, - "step": 52501 - }, - { - "epoch": 1.35, - "learning_rate": 1.2135631301143238e-06, - "loss": 0.6367, - "step": 52502 - }, - { - "epoch": 1.35, - "learning_rate": 1.2135360979563733e-06, - "loss": 0.5938, - "step": 52503 - }, - { - "epoch": 1.35, - "learning_rate": 1.2135090656349281e-06, - "loss": 0.5248, - "step": 52504 - }, - { - "epoch": 1.35, - "learning_rate": 1.2134820331500085e-06, - "loss": 0.7559, - "step": 52505 - }, - { - "epoch": 1.35, - "learning_rate": 1.2134550005016355e-06, - "loss": 0.708, - "step": 52506 - }, - { - "epoch": 1.35, - "learning_rate": 1.21342796768983e-06, - "loss": 0.5938, - "step": 52507 - }, - { - "epoch": 1.35, - "learning_rate": 1.2134009347146124e-06, - "loss": 0.7598, - "step": 52508 - }, - { - "epoch": 1.35, - "learning_rate": 1.2133739015760038e-06, - "loss": 0.5767, - "step": 52509 - }, - { - "epoch": 1.35, - "learning_rate": 1.2133468682740241e-06, - "loss": 0.4258, - "step": 52510 - }, - { - "epoch": 1.35, - "learning_rate": 1.2133198348086948e-06, - "loss": 0.5483, - "step": 52511 - }, - { - "epoch": 1.35, - "learning_rate": 1.2132928011800364e-06, - "loss": 0.6455, - "step": 52512 - }, - { - "epoch": 1.35, - "learning_rate": 1.2132657673880693e-06, - "loss": 0.4917, - "step": 52513 - }, - { - "epoch": 1.35, - "learning_rate": 1.2132387334328147e-06, - "loss": 0.71, - "step": 52514 - }, - { - "epoch": 1.35, - "learning_rate": 1.2132116993142925e-06, - "loss": 0.7051, - "step": 52515 - }, - { - "epoch": 1.35, - "learning_rate": 1.2131846650325244e-06, - "loss": 0.7148, - "step": 52516 - }, - { - "epoch": 1.35, - "learning_rate": 1.2131576305875301e-06, - "loss": 0.5408, - "step": 52517 - }, - { - "epoch": 1.35, - "learning_rate": 1.2131305959793314e-06, - "loss": 0.627, - "step": 52518 - }, - { - "epoch": 1.35, - "learning_rate": 1.213103561207948e-06, - "loss": 0.8662, - "step": 52519 - }, - { - "epoch": 1.35, - "learning_rate": 1.2130765262734013e-06, - "loss": 0.6777, - "step": 52520 - }, - { - "epoch": 1.35, - "learning_rate": 1.2130494911757114e-06, - "loss": 0.6127, - "step": 52521 - }, - { - "epoch": 1.35, - "learning_rate": 1.2130224559148997e-06, - "loss": 0.4995, - "step": 52522 - }, - { - "epoch": 1.35, - "learning_rate": 1.212995420490986e-06, - "loss": 0.6221, - "step": 52523 - }, - { - "epoch": 1.35, - "learning_rate": 1.212968384903992e-06, - "loss": 0.6519, - "step": 52524 - }, - { - "epoch": 1.35, - "learning_rate": 1.2129413491539375e-06, - "loss": 0.6846, - "step": 52525 - }, - { - "epoch": 1.35, - "learning_rate": 1.2129143132408439e-06, - "loss": 0.6729, - "step": 52526 - }, - { - "epoch": 1.35, - "learning_rate": 1.2128872771647312e-06, - "loss": 0.7803, - "step": 52527 - }, - { - "epoch": 1.35, - "learning_rate": 1.2128602409256207e-06, - "loss": 0.6191, - "step": 52528 - }, - { - "epoch": 1.35, - "learning_rate": 1.2128332045235333e-06, - "loss": 0.6846, - "step": 52529 - }, - { - "epoch": 1.35, - "learning_rate": 1.2128061679584888e-06, - "loss": 0.7119, - "step": 52530 - }, - { - "epoch": 1.35, - "learning_rate": 1.2127791312305084e-06, - "loss": 0.5791, - "step": 52531 - }, - { - "epoch": 1.35, - "learning_rate": 1.212752094339613e-06, - "loss": 0.5249, - "step": 52532 - }, - { - "epoch": 1.35, - "learning_rate": 1.212725057285823e-06, - "loss": 0.6592, - "step": 52533 - }, - { - "epoch": 1.35, - "learning_rate": 1.2126980200691593e-06, - "loss": 0.6768, - "step": 52534 - }, - { - "epoch": 1.35, - "learning_rate": 1.2126709826896426e-06, - "loss": 0.689, - "step": 52535 - }, - { - "epoch": 1.35, - "learning_rate": 1.2126439451472934e-06, - "loss": 0.7646, - "step": 52536 - }, - { - "epoch": 1.35, - "learning_rate": 1.2126169074421324e-06, - "loss": 0.7168, - "step": 52537 - }, - { - "epoch": 1.35, - "learning_rate": 1.2125898695741806e-06, - "loss": 0.6299, - "step": 52538 - }, - { - "epoch": 1.35, - "learning_rate": 1.2125628315434585e-06, - "loss": 0.5493, - "step": 52539 - }, - { - "epoch": 1.35, - "learning_rate": 1.2125357933499864e-06, - "loss": 0.5576, - "step": 52540 - }, - { - "epoch": 1.35, - "learning_rate": 1.2125087549937859e-06, - "loss": 0.5405, - "step": 52541 - }, - { - "epoch": 1.35, - "learning_rate": 1.212481716474877e-06, - "loss": 0.7588, - "step": 52542 - }, - { - "epoch": 1.35, - "learning_rate": 1.2124546777932805e-06, - "loss": 0.5908, - "step": 52543 - }, - { - "epoch": 1.35, - "learning_rate": 1.2124276389490175e-06, - "loss": 0.8638, - "step": 52544 - }, - { - "epoch": 1.35, - "learning_rate": 1.2124005999421086e-06, - "loss": 0.5994, - "step": 52545 - }, - { - "epoch": 1.35, - "learning_rate": 1.2123735607725737e-06, - "loss": 0.2734, - "step": 52546 - }, - { - "epoch": 1.35, - "learning_rate": 1.2123465214404344e-06, - "loss": 0.7148, - "step": 52547 - }, - { - "epoch": 1.35, - "learning_rate": 1.2123194819457113e-06, - "loss": 0.7041, - "step": 52548 - }, - { - "epoch": 1.35, - "learning_rate": 1.212292442288425e-06, - "loss": 0.7061, - "step": 52549 - }, - { - "epoch": 1.35, - "learning_rate": 1.2122654024685959e-06, - "loss": 0.7139, - "step": 52550 - }, - { - "epoch": 1.35, - "learning_rate": 1.212238362486245e-06, - "loss": 0.6768, - "step": 52551 - }, - { - "epoch": 1.35, - "learning_rate": 1.212211322341393e-06, - "loss": 0.5469, - "step": 52552 - }, - { - "epoch": 1.35, - "learning_rate": 1.2121842820340604e-06, - "loss": 0.6172, - "step": 52553 - }, - { - "epoch": 1.35, - "learning_rate": 1.2121572415642682e-06, - "loss": 0.792, - "step": 52554 - }, - { - "epoch": 1.35, - "learning_rate": 1.212130200932037e-06, - "loss": 0.7412, - "step": 52555 - }, - { - "epoch": 1.35, - "learning_rate": 1.2121031601373873e-06, - "loss": 0.5048, - "step": 52556 - }, - { - "epoch": 1.35, - "learning_rate": 1.2120761191803402e-06, - "loss": 0.5547, - "step": 52557 - }, - { - "epoch": 1.35, - "learning_rate": 1.2120490780609158e-06, - "loss": 0.6104, - "step": 52558 - }, - { - "epoch": 1.35, - "learning_rate": 1.2120220367791353e-06, - "loss": 0.6577, - "step": 52559 - }, - { - "epoch": 1.35, - "learning_rate": 1.2119949953350197e-06, - "loss": 0.6543, - "step": 52560 - }, - { - "epoch": 1.35, - "learning_rate": 1.2119679537285886e-06, - "loss": 0.5464, - "step": 52561 - }, - { - "epoch": 1.35, - "learning_rate": 1.2119409119598637e-06, - "loss": 0.4226, - "step": 52562 - }, - { - "epoch": 1.35, - "learning_rate": 1.2119138700288653e-06, - "loss": 0.7803, - "step": 52563 - }, - { - "epoch": 1.35, - "learning_rate": 1.2118868279356148e-06, - "loss": 0.5566, - "step": 52564 - }, - { - "epoch": 1.35, - "learning_rate": 1.2118597856801316e-06, - "loss": 0.4297, - "step": 52565 - }, - { - "epoch": 1.35, - "learning_rate": 1.2118327432624373e-06, - "loss": 0.5272, - "step": 52566 - }, - { - "epoch": 1.35, - "learning_rate": 1.2118057006825524e-06, - "loss": 0.5483, - "step": 52567 - }, - { - "epoch": 1.35, - "learning_rate": 1.2117786579404977e-06, - "loss": 0.7236, - "step": 52568 - }, - { - "epoch": 1.35, - "learning_rate": 1.2117516150362938e-06, - "loss": 0.6555, - "step": 52569 - }, - { - "epoch": 1.35, - "learning_rate": 1.2117245719699614e-06, - "loss": 0.8018, - "step": 52570 - }, - { - "epoch": 1.35, - "learning_rate": 1.2116975287415211e-06, - "loss": 0.7471, - "step": 52571 - }, - { - "epoch": 1.35, - "learning_rate": 1.2116704853509939e-06, - "loss": 0.7285, - "step": 52572 - }, - { - "epoch": 1.35, - "learning_rate": 1.2116434417984e-06, - "loss": 0.6699, - "step": 52573 - }, - { - "epoch": 1.35, - "learning_rate": 1.2116163980837613e-06, - "loss": 0.8066, - "step": 52574 - }, - { - "epoch": 1.35, - "learning_rate": 1.2115893542070967e-06, - "loss": 0.4863, - "step": 52575 - }, - { - "epoch": 1.35, - "learning_rate": 1.2115623101684285e-06, - "loss": 0.626, - "step": 52576 - }, - { - "epoch": 1.35, - "learning_rate": 1.2115352659677763e-06, - "loss": 0.5344, - "step": 52577 - }, - { - "epoch": 1.35, - "learning_rate": 1.2115082216051615e-06, - "loss": 0.6355, - "step": 52578 - }, - { - "epoch": 1.35, - "learning_rate": 1.2114811770806047e-06, - "loss": 0.7236, - "step": 52579 - }, - { - "epoch": 1.35, - "learning_rate": 1.2114541323941261e-06, - "loss": 0.6423, - "step": 52580 - }, - { - "epoch": 1.35, - "learning_rate": 1.211427087545747e-06, - "loss": 0.7168, - "step": 52581 - }, - { - "epoch": 1.35, - "learning_rate": 1.2114000425354882e-06, - "loss": 0.6709, - "step": 52582 - }, - { - "epoch": 1.35, - "learning_rate": 1.2113729973633697e-06, - "loss": 0.6074, - "step": 52583 - }, - { - "epoch": 1.35, - "learning_rate": 1.211345952029413e-06, - "loss": 0.6436, - "step": 52584 - }, - { - "epoch": 1.35, - "learning_rate": 1.2113189065336383e-06, - "loss": 0.625, - "step": 52585 - }, - { - "epoch": 1.35, - "learning_rate": 1.2112918608760661e-06, - "loss": 0.6572, - "step": 52586 - }, - { - "epoch": 1.35, - "learning_rate": 1.2112648150567176e-06, - "loss": 0.6621, - "step": 52587 - }, - { - "epoch": 1.35, - "learning_rate": 1.2112377690756132e-06, - "loss": 0.6748, - "step": 52588 - }, - { - "epoch": 1.35, - "learning_rate": 1.2112107229327744e-06, - "loss": 0.4443, - "step": 52589 - }, - { - "epoch": 1.35, - "learning_rate": 1.2111836766282206e-06, - "loss": 0.5156, - "step": 52590 - }, - { - "epoch": 1.35, - "learning_rate": 1.2111566301619736e-06, - "loss": 0.6709, - "step": 52591 - }, - { - "epoch": 1.35, - "learning_rate": 1.2111295835340532e-06, - "loss": 0.6748, - "step": 52592 - }, - { - "epoch": 1.35, - "learning_rate": 1.211102536744481e-06, - "loss": 0.6694, - "step": 52593 - }, - { - "epoch": 1.35, - "learning_rate": 1.2110754897932771e-06, - "loss": 0.6802, - "step": 52594 - }, - { - "epoch": 1.35, - "learning_rate": 1.2110484426804625e-06, - "loss": 0.5137, - "step": 52595 - }, - { - "epoch": 1.35, - "learning_rate": 1.2110213954060578e-06, - "loss": 0.5669, - "step": 52596 - }, - { - "epoch": 1.35, - "learning_rate": 1.2109943479700836e-06, - "loss": 0.7178, - "step": 52597 - }, - { - "epoch": 1.35, - "learning_rate": 1.2109673003725608e-06, - "loss": 0.8369, - "step": 52598 - }, - { - "epoch": 1.35, - "learning_rate": 1.2109402526135102e-06, - "loss": 0.4404, - "step": 52599 - }, - { - "epoch": 1.35, - "learning_rate": 1.210913204692952e-06, - "loss": 0.6523, - "step": 52600 - }, - { - "epoch": 1.35, - "learning_rate": 1.2108861566109076e-06, - "loss": 0.5713, - "step": 52601 - }, - { - "epoch": 1.35, - "learning_rate": 1.2108591083673972e-06, - "loss": 0.6753, - "step": 52602 - }, - { - "epoch": 1.35, - "learning_rate": 1.2108320599624417e-06, - "loss": 0.7173, - "step": 52603 - }, - { - "epoch": 1.35, - "learning_rate": 1.210805011396062e-06, - "loss": 0.6318, - "step": 52604 - }, - { - "epoch": 1.35, - "learning_rate": 1.210777962668278e-06, - "loss": 0.6426, - "step": 52605 - }, - { - "epoch": 1.35, - "learning_rate": 1.2107509137791113e-06, - "loss": 0.8105, - "step": 52606 - }, - { - "epoch": 1.35, - "learning_rate": 1.2107238647285824e-06, - "loss": 0.6191, - "step": 52607 - }, - { - "epoch": 1.35, - "learning_rate": 1.210696815516712e-06, - "loss": 0.6982, - "step": 52608 - }, - { - "epoch": 1.35, - "learning_rate": 1.2106697661435208e-06, - "loss": 0.365, - "step": 52609 - }, - { - "epoch": 1.35, - "learning_rate": 1.2106427166090294e-06, - "loss": 0.6309, - "step": 52610 - }, - { - "epoch": 1.35, - "learning_rate": 1.2106156669132584e-06, - "loss": 0.7031, - "step": 52611 - }, - { - "epoch": 1.35, - "learning_rate": 1.2105886170562288e-06, - "loss": 0.665, - "step": 52612 - }, - { - "epoch": 1.35, - "learning_rate": 1.210561567037961e-06, - "loss": 0.6416, - "step": 52613 - }, - { - "epoch": 1.35, - "learning_rate": 1.210534516858476e-06, - "loss": 0.4758, - "step": 52614 - }, - { - "epoch": 1.35, - "learning_rate": 1.2105074665177945e-06, - "loss": 0.5767, - "step": 52615 - }, - { - "epoch": 1.35, - "learning_rate": 1.210480416015937e-06, - "loss": 0.6851, - "step": 52616 - }, - { - "epoch": 1.35, - "learning_rate": 1.2104533653529243e-06, - "loss": 0.8125, - "step": 52617 - }, - { - "epoch": 1.35, - "learning_rate": 1.210426314528777e-06, - "loss": 0.6787, - "step": 52618 - }, - { - "epoch": 1.35, - "learning_rate": 1.2103992635435165e-06, - "loss": 0.6519, - "step": 52619 - }, - { - "epoch": 1.35, - "learning_rate": 1.2103722123971624e-06, - "loss": 0.6338, - "step": 52620 - }, - { - "epoch": 1.35, - "learning_rate": 1.2103451610897363e-06, - "loss": 0.7783, - "step": 52621 - }, - { - "epoch": 1.35, - "learning_rate": 1.2103181096212585e-06, - "loss": 0.6299, - "step": 52622 - }, - { - "epoch": 1.35, - "learning_rate": 1.2102910579917493e-06, - "loss": 0.7168, - "step": 52623 - }, - { - "epoch": 1.35, - "learning_rate": 1.2102640062012306e-06, - "loss": 0.4712, - "step": 52624 - }, - { - "epoch": 1.35, - "learning_rate": 1.2102369542497221e-06, - "loss": 0.6689, - "step": 52625 - }, - { - "epoch": 1.35, - "learning_rate": 1.2102099021372452e-06, - "loss": 0.6318, - "step": 52626 - }, - { - "epoch": 1.35, - "learning_rate": 1.2101828498638197e-06, - "loss": 0.4614, - "step": 52627 - }, - { - "epoch": 1.35, - "learning_rate": 1.2101557974294672e-06, - "loss": 0.3591, - "step": 52628 - }, - { - "epoch": 1.35, - "learning_rate": 1.210128744834208e-06, - "loss": 0.6138, - "step": 52629 - }, - { - "epoch": 1.35, - "learning_rate": 1.2101016920780626e-06, - "loss": 0.6318, - "step": 52630 - }, - { - "epoch": 1.35, - "learning_rate": 1.2100746391610524e-06, - "loss": 0.5215, - "step": 52631 - }, - { - "epoch": 1.35, - "learning_rate": 1.2100475860831974e-06, - "loss": 0.626, - "step": 52632 - }, - { - "epoch": 1.35, - "learning_rate": 1.2100205328445187e-06, - "loss": 0.5759, - "step": 52633 - }, - { - "epoch": 1.35, - "learning_rate": 1.209993479445037e-06, - "loss": 0.6484, - "step": 52634 - }, - { - "epoch": 1.35, - "learning_rate": 1.2099664258847733e-06, - "loss": 0.6992, - "step": 52635 - }, - { - "epoch": 1.35, - "learning_rate": 1.2099393721637473e-06, - "loss": 0.9102, - "step": 52636 - }, - { - "epoch": 1.35, - "learning_rate": 1.2099123182819807e-06, - "loss": 0.6855, - "step": 52637 - }, - { - "epoch": 1.35, - "learning_rate": 1.2098852642394939e-06, - "loss": 0.5356, - "step": 52638 - }, - { - "epoch": 1.35, - "learning_rate": 1.2098582100363077e-06, - "loss": 0.6094, - "step": 52639 - }, - { - "epoch": 1.35, - "learning_rate": 1.2098311556724426e-06, - "loss": 0.6396, - "step": 52640 - }, - { - "epoch": 1.35, - "learning_rate": 1.2098041011479195e-06, - "loss": 0.8057, - "step": 52641 - }, - { - "epoch": 1.35, - "learning_rate": 1.2097770464627589e-06, - "loss": 0.8545, - "step": 52642 - }, - { - "epoch": 1.35, - "learning_rate": 1.2097499916169818e-06, - "loss": 0.5979, - "step": 52643 - }, - { - "epoch": 1.35, - "learning_rate": 1.2097229366106087e-06, - "loss": 0.6611, - "step": 52644 - }, - { - "epoch": 1.35, - "learning_rate": 1.2096958814436604e-06, - "loss": 0.5608, - "step": 52645 - }, - { - "epoch": 1.35, - "learning_rate": 1.2096688261161575e-06, - "loss": 0.4512, - "step": 52646 - }, - { - "epoch": 1.35, - "learning_rate": 1.209641770628121e-06, - "loss": 0.5425, - "step": 52647 - }, - { - "epoch": 1.35, - "learning_rate": 1.2096147149795712e-06, - "loss": 0.6523, - "step": 52648 - }, - { - "epoch": 1.35, - "learning_rate": 1.2095876591705292e-06, - "loss": 0.6187, - "step": 52649 - }, - { - "epoch": 1.35, - "learning_rate": 1.2095606032010157e-06, - "loss": 0.6143, - "step": 52650 - }, - { - "epoch": 1.35, - "learning_rate": 1.209533547071051e-06, - "loss": 0.7324, - "step": 52651 - }, - { - "epoch": 1.35, - "learning_rate": 1.2095064907806565e-06, - "loss": 0.6089, - "step": 52652 - }, - { - "epoch": 1.35, - "learning_rate": 1.209479434329852e-06, - "loss": 0.645, - "step": 52653 - }, - { - "epoch": 1.35, - "learning_rate": 1.2094523777186593e-06, - "loss": 0.7324, - "step": 52654 - }, - { - "epoch": 1.35, - "learning_rate": 1.2094253209470982e-06, - "loss": 0.5, - "step": 52655 - }, - { - "epoch": 1.35, - "learning_rate": 1.20939826401519e-06, - "loss": 0.6602, - "step": 52656 - }, - { - "epoch": 1.35, - "learning_rate": 1.2093712069229546e-06, - "loss": 0.4984, - "step": 52657 - }, - { - "epoch": 1.35, - "learning_rate": 1.2093441496704138e-06, - "loss": 0.7119, - "step": 52658 - }, - { - "epoch": 1.35, - "learning_rate": 1.2093170922575878e-06, - "loss": 0.8335, - "step": 52659 - }, - { - "epoch": 1.35, - "learning_rate": 1.2092900346844971e-06, - "loss": 0.5879, - "step": 52660 - }, - { - "epoch": 1.35, - "learning_rate": 1.209262976951163e-06, - "loss": 0.627, - "step": 52661 - }, - { - "epoch": 1.35, - "learning_rate": 1.2092359190576056e-06, - "loss": 0.7227, - "step": 52662 - }, - { - "epoch": 1.35, - "learning_rate": 1.2092088610038456e-06, - "loss": 0.5483, - "step": 52663 - }, - { - "epoch": 1.35, - "learning_rate": 1.2091818027899047e-06, - "loss": 0.6606, - "step": 52664 - }, - { - "epoch": 1.35, - "learning_rate": 1.2091547444158023e-06, - "loss": 0.542, - "step": 52665 - }, - { - "epoch": 1.35, - "learning_rate": 1.20912768588156e-06, - "loss": 0.5527, - "step": 52666 - }, - { - "epoch": 1.35, - "learning_rate": 1.209100627187198e-06, - "loss": 0.5742, - "step": 52667 - }, - { - "epoch": 1.35, - "learning_rate": 1.2090735683327375e-06, - "loss": 0.7334, - "step": 52668 - }, - { - "epoch": 1.35, - "learning_rate": 1.209046509318199e-06, - "loss": 1.0098, - "step": 52669 - }, - { - "epoch": 1.35, - "learning_rate": 1.209019450143603e-06, - "loss": 0.6216, - "step": 52670 - }, - { - "epoch": 1.35, - "learning_rate": 1.2089923908089708e-06, - "loss": 0.6807, - "step": 52671 - }, - { - "epoch": 1.35, - "learning_rate": 1.2089653313143224e-06, - "loss": 0.5388, - "step": 52672 - }, - { - "epoch": 1.35, - "learning_rate": 1.2089382716596788e-06, - "loss": 0.7656, - "step": 52673 - }, - { - "epoch": 1.35, - "learning_rate": 1.2089112118450611e-06, - "loss": 0.6152, - "step": 52674 - }, - { - "epoch": 1.35, - "learning_rate": 1.2088841518704896e-06, - "loss": 0.6846, - "step": 52675 - }, - { - "epoch": 1.35, - "learning_rate": 1.2088570917359849e-06, - "loss": 0.6213, - "step": 52676 - }, - { - "epoch": 1.35, - "learning_rate": 1.208830031441568e-06, - "loss": 0.6357, - "step": 52677 - }, - { - "epoch": 1.35, - "learning_rate": 1.2088029709872594e-06, - "loss": 0.6885, - "step": 52678 - }, - { - "epoch": 1.35, - "learning_rate": 1.2087759103730806e-06, - "loss": 0.6582, - "step": 52679 - }, - { - "epoch": 1.35, - "learning_rate": 1.208748849599051e-06, - "loss": 0.5359, - "step": 52680 - }, - { - "epoch": 1.35, - "learning_rate": 1.2087217886651924e-06, - "loss": 0.6538, - "step": 52681 - }, - { - "epoch": 1.35, - "learning_rate": 1.2086947275715247e-06, - "loss": 0.5889, - "step": 52682 - }, - { - "epoch": 1.35, - "learning_rate": 1.2086676663180695e-06, - "loss": 0.4463, - "step": 52683 - }, - { - "epoch": 1.35, - "learning_rate": 1.2086406049048468e-06, - "loss": 0.5859, - "step": 52684 - }, - { - "epoch": 1.35, - "learning_rate": 1.2086135433318777e-06, - "loss": 0.6934, - "step": 52685 - }, - { - "epoch": 1.35, - "learning_rate": 1.2085864815991826e-06, - "loss": 0.5199, - "step": 52686 - }, - { - "epoch": 1.35, - "learning_rate": 1.2085594197067827e-06, - "loss": 0.3151, - "step": 52687 - }, - { - "epoch": 1.35, - "learning_rate": 1.2085323576546981e-06, - "loss": 0.7773, - "step": 52688 - }, - { - "epoch": 1.35, - "learning_rate": 1.2085052954429504e-06, - "loss": 0.6953, - "step": 52689 - }, - { - "epoch": 1.35, - "learning_rate": 1.2084782330715595e-06, - "loss": 0.6406, - "step": 52690 - }, - { - "epoch": 1.35, - "learning_rate": 1.2084511705405462e-06, - "loss": 0.6826, - "step": 52691 - }, - { - "epoch": 1.35, - "learning_rate": 1.2084241078499315e-06, - "loss": 0.7002, - "step": 52692 - }, - { - "epoch": 1.35, - "learning_rate": 1.2083970449997363e-06, - "loss": 0.6592, - "step": 52693 - }, - { - "epoch": 1.35, - "learning_rate": 1.208369981989981e-06, - "loss": 0.5149, - "step": 52694 - }, - { - "epoch": 1.35, - "learning_rate": 1.2083429188206862e-06, - "loss": 0.6069, - "step": 52695 - }, - { - "epoch": 1.35, - "learning_rate": 1.2083158554918728e-06, - "loss": 0.6978, - "step": 52696 - }, - { - "epoch": 1.35, - "learning_rate": 1.2082887920035615e-06, - "loss": 0.8301, - "step": 52697 - }, - { - "epoch": 1.35, - "learning_rate": 1.2082617283557731e-06, - "loss": 0.6138, - "step": 52698 - }, - { - "epoch": 1.35, - "learning_rate": 1.2082346645485287e-06, - "loss": 0.6338, - "step": 52699 - }, - { - "epoch": 1.35, - "learning_rate": 1.2082076005818483e-06, - "loss": 0.5593, - "step": 52700 - }, - { - "epoch": 1.35, - "learning_rate": 1.2081805364557527e-06, - "loss": 0.5198, - "step": 52701 - }, - { - "epoch": 1.35, - "learning_rate": 1.208153472170263e-06, - "loss": 0.5259, - "step": 52702 - }, - { - "epoch": 1.35, - "learning_rate": 1.2081264077253995e-06, - "loss": 0.5933, - "step": 52703 - }, - { - "epoch": 1.35, - "learning_rate": 1.208099343121184e-06, - "loss": 0.5572, - "step": 52704 - }, - { - "epoch": 1.35, - "learning_rate": 1.2080722783576357e-06, - "loss": 0.6494, - "step": 52705 - }, - { - "epoch": 1.35, - "learning_rate": 1.208045213434776e-06, - "loss": 0.6245, - "step": 52706 - }, - { - "epoch": 1.35, - "learning_rate": 1.2080181483526256e-06, - "loss": 0.6558, - "step": 52707 - }, - { - "epoch": 1.35, - "learning_rate": 1.2079910831112058e-06, - "loss": 0.7808, - "step": 52708 - }, - { - "epoch": 1.35, - "learning_rate": 1.2079640177105363e-06, - "loss": 0.6562, - "step": 52709 - }, - { - "epoch": 1.35, - "learning_rate": 1.2079369521506386e-06, - "loss": 0.5542, - "step": 52710 - }, - { - "epoch": 1.35, - "learning_rate": 1.207909886431533e-06, - "loss": 0.7588, - "step": 52711 - }, - { - "epoch": 1.35, - "learning_rate": 1.2078828205532403e-06, - "loss": 0.605, - "step": 52712 - }, - { - "epoch": 1.35, - "learning_rate": 1.2078557545157814e-06, - "loss": 0.7402, - "step": 52713 - }, - { - "epoch": 1.35, - "learning_rate": 1.2078286883191768e-06, - "loss": 0.6748, - "step": 52714 - }, - { - "epoch": 1.35, - "learning_rate": 1.2078016219634474e-06, - "loss": 0.6396, - "step": 52715 - }, - { - "epoch": 1.35, - "learning_rate": 1.2077745554486139e-06, - "loss": 0.6514, - "step": 52716 - }, - { - "epoch": 1.35, - "learning_rate": 1.2077474887746967e-06, - "loss": 0.6816, - "step": 52717 - }, - { - "epoch": 1.35, - "learning_rate": 1.2077204219417172e-06, - "loss": 0.6348, - "step": 52718 - }, - { - "epoch": 1.35, - "learning_rate": 1.2076933549496958e-06, - "loss": 0.5283, - "step": 52719 - }, - { - "epoch": 1.35, - "learning_rate": 1.2076662877986526e-06, - "loss": 0.6548, - "step": 52720 - }, - { - "epoch": 1.35, - "learning_rate": 1.2076392204886093e-06, - "loss": 0.7061, - "step": 52721 - }, - { - "epoch": 1.35, - "learning_rate": 1.2076121530195858e-06, - "loss": 0.5352, - "step": 52722 - }, - { - "epoch": 1.35, - "learning_rate": 1.2075850853916033e-06, - "loss": 0.7998, - "step": 52723 - }, - { - "epoch": 1.35, - "learning_rate": 1.207558017604683e-06, - "loss": 0.7397, - "step": 52724 - }, - { - "epoch": 1.35, - "learning_rate": 1.2075309496588447e-06, - "loss": 0.5942, - "step": 52725 - }, - { - "epoch": 1.35, - "learning_rate": 1.2075038815541091e-06, - "loss": 0.5024, - "step": 52726 - }, - { - "epoch": 1.35, - "learning_rate": 1.207476813290498e-06, - "loss": 0.6211, - "step": 52727 - }, - { - "epoch": 1.35, - "learning_rate": 1.207449744868031e-06, - "loss": 0.792, - "step": 52728 - }, - { - "epoch": 1.35, - "learning_rate": 1.2074226762867297e-06, - "loss": 0.4819, - "step": 52729 - }, - { - "epoch": 1.35, - "learning_rate": 1.207395607546614e-06, - "loss": 0.7295, - "step": 52730 - }, - { - "epoch": 1.35, - "learning_rate": 1.2073685386477052e-06, - "loss": 0.5566, - "step": 52731 - }, - { - "epoch": 1.35, - "learning_rate": 1.2073414695900237e-06, - "loss": 0.8271, - "step": 52732 - }, - { - "epoch": 1.35, - "learning_rate": 1.2073144003735904e-06, - "loss": 0.5581, - "step": 52733 - }, - { - "epoch": 1.35, - "learning_rate": 1.2072873309984262e-06, - "loss": 0.6309, - "step": 52734 - }, - { - "epoch": 1.35, - "learning_rate": 1.2072602614645514e-06, - "loss": 0.4832, - "step": 52735 - }, - { - "epoch": 1.35, - "learning_rate": 1.207233191771987e-06, - "loss": 0.5791, - "step": 52736 - }, - { - "epoch": 1.35, - "learning_rate": 1.2072061219207538e-06, - "loss": 0.4927, - "step": 52737 - }, - { - "epoch": 1.35, - "learning_rate": 1.207179051910872e-06, - "loss": 0.5142, - "step": 52738 - }, - { - "epoch": 1.35, - "learning_rate": 1.2071519817423632e-06, - "loss": 0.5059, - "step": 52739 - }, - { - "epoch": 1.35, - "learning_rate": 1.2071249114152476e-06, - "loss": 0.5869, - "step": 52740 - }, - { - "epoch": 1.35, - "learning_rate": 1.2070978409295457e-06, - "loss": 0.4834, - "step": 52741 - }, - { - "epoch": 1.35, - "learning_rate": 1.2070707702852787e-06, - "loss": 0.5093, - "step": 52742 - }, - { - "epoch": 1.35, - "learning_rate": 1.207043699482467e-06, - "loss": 0.666, - "step": 52743 - }, - { - "epoch": 1.35, - "learning_rate": 1.2070166285211315e-06, - "loss": 0.8164, - "step": 52744 - }, - { - "epoch": 1.35, - "learning_rate": 1.2069895574012928e-06, - "loss": 0.7148, - "step": 52745 - }, - { - "epoch": 1.35, - "learning_rate": 1.2069624861229722e-06, - "loss": 0.5708, - "step": 52746 - }, - { - "epoch": 1.35, - "learning_rate": 1.2069354146861894e-06, - "loss": 0.583, - "step": 52747 - }, - { - "epoch": 1.35, - "learning_rate": 1.2069083430909662e-06, - "loss": 0.7949, - "step": 52748 - }, - { - "epoch": 1.35, - "learning_rate": 1.2068812713373222e-06, - "loss": 0.6436, - "step": 52749 - }, - { - "epoch": 1.35, - "learning_rate": 1.206854199425279e-06, - "loss": 0.7734, - "step": 52750 - }, - { - "epoch": 1.35, - "learning_rate": 1.206827127354857e-06, - "loss": 0.6274, - "step": 52751 - }, - { - "epoch": 1.35, - "learning_rate": 1.2068000551260772e-06, - "loss": 0.6729, - "step": 52752 - }, - { - "epoch": 1.35, - "learning_rate": 1.2067729827389599e-06, - "loss": 0.624, - "step": 52753 - }, - { - "epoch": 1.35, - "learning_rate": 1.206745910193526e-06, - "loss": 0.583, - "step": 52754 - }, - { - "epoch": 1.35, - "learning_rate": 1.206718837489796e-06, - "loss": 0.6738, - "step": 52755 - }, - { - "epoch": 1.35, - "learning_rate": 1.2066917646277914e-06, - "loss": 0.7109, - "step": 52756 - }, - { - "epoch": 1.35, - "learning_rate": 1.206664691607532e-06, - "loss": 0.6357, - "step": 52757 - }, - { - "epoch": 1.35, - "learning_rate": 1.2066376184290392e-06, - "loss": 0.7412, - "step": 52758 - }, - { - "epoch": 1.35, - "learning_rate": 1.2066105450923336e-06, - "loss": 0.6777, - "step": 52759 - }, - { - "epoch": 1.35, - "learning_rate": 1.2065834715974355e-06, - "loss": 0.7979, - "step": 52760 - }, - { - "epoch": 1.35, - "learning_rate": 1.2065563979443663e-06, - "loss": 0.8174, - "step": 52761 - }, - { - "epoch": 1.35, - "learning_rate": 1.2065293241331462e-06, - "loss": 0.6396, - "step": 52762 - }, - { - "epoch": 1.35, - "learning_rate": 1.206502250163796e-06, - "loss": 0.6084, - "step": 52763 - }, - { - "epoch": 1.35, - "learning_rate": 1.2064751760363366e-06, - "loss": 0.5874, - "step": 52764 - }, - { - "epoch": 1.35, - "learning_rate": 1.2064481017507885e-06, - "loss": 0.6416, - "step": 52765 - }, - { - "epoch": 1.35, - "learning_rate": 1.2064210273071726e-06, - "loss": 0.6094, - "step": 52766 - }, - { - "epoch": 1.35, - "learning_rate": 1.2063939527055097e-06, - "loss": 0.5996, - "step": 52767 - }, - { - "epoch": 1.35, - "learning_rate": 1.2063668779458205e-06, - "loss": 0.6279, - "step": 52768 - }, - { - "epoch": 1.35, - "learning_rate": 1.2063398030281258e-06, - "loss": 0.6924, - "step": 52769 - }, - { - "epoch": 1.35, - "learning_rate": 1.2063127279524459e-06, - "loss": 0.5068, - "step": 52770 - }, - { - "epoch": 1.35, - "learning_rate": 1.206285652718802e-06, - "loss": 0.6836, - "step": 52771 - }, - { - "epoch": 1.35, - "learning_rate": 1.2062585773272145e-06, - "loss": 0.5615, - "step": 52772 - }, - { - "epoch": 1.35, - "learning_rate": 1.2062315017777046e-06, - "loss": 0.7432, - "step": 52773 - }, - { - "epoch": 1.35, - "learning_rate": 1.2062044260702925e-06, - "loss": 0.7388, - "step": 52774 - }, - { - "epoch": 1.35, - "learning_rate": 1.2061773502049993e-06, - "loss": 0.7373, - "step": 52775 - }, - { - "epoch": 1.35, - "learning_rate": 1.2061502741818453e-06, - "loss": 0.6719, - "step": 52776 - }, - { - "epoch": 1.35, - "learning_rate": 1.2061231980008515e-06, - "loss": 0.5889, - "step": 52777 - }, - { - "epoch": 1.35, - "learning_rate": 1.2060961216620388e-06, - "loss": 0.5063, - "step": 52778 - }, - { - "epoch": 1.35, - "learning_rate": 1.206069045165428e-06, - "loss": 0.6694, - "step": 52779 - }, - { - "epoch": 1.35, - "learning_rate": 1.2060419685110393e-06, - "loss": 0.5234, - "step": 52780 - }, - { - "epoch": 1.35, - "learning_rate": 1.206014891698894e-06, - "loss": 0.7246, - "step": 52781 - }, - { - "epoch": 1.35, - "learning_rate": 1.205987814729012e-06, - "loss": 0.79, - "step": 52782 - }, - { - "epoch": 1.35, - "learning_rate": 1.2059607376014152e-06, - "loss": 0.5396, - "step": 52783 - }, - { - "epoch": 1.35, - "learning_rate": 1.2059336603161236e-06, - "loss": 0.7061, - "step": 52784 - }, - { - "epoch": 1.35, - "learning_rate": 1.205906582873158e-06, - "loss": 0.6226, - "step": 52785 - }, - { - "epoch": 1.35, - "learning_rate": 1.2058795052725393e-06, - "loss": 0.5557, - "step": 52786 - }, - { - "epoch": 1.35, - "learning_rate": 1.2058524275142878e-06, - "loss": 0.6348, - "step": 52787 - }, - { - "epoch": 1.35, - "learning_rate": 1.2058253495984253e-06, - "loss": 0.5742, - "step": 52788 - }, - { - "epoch": 1.35, - "learning_rate": 1.205798271524971e-06, - "loss": 0.6045, - "step": 52789 - }, - { - "epoch": 1.35, - "learning_rate": 1.2057711932939467e-06, - "loss": 0.6196, - "step": 52790 - }, - { - "epoch": 1.35, - "learning_rate": 1.2057441149053729e-06, - "loss": 0.5493, - "step": 52791 - }, - { - "epoch": 1.35, - "learning_rate": 1.2057170363592702e-06, - "loss": 0.7539, - "step": 52792 - }, - { - "epoch": 1.35, - "learning_rate": 1.2056899576556597e-06, - "loss": 0.5085, - "step": 52793 - }, - { - "epoch": 1.35, - "learning_rate": 1.2056628787945618e-06, - "loss": 0.7012, - "step": 52794 - }, - { - "epoch": 1.35, - "learning_rate": 1.2056357997759968e-06, - "loss": 0.5505, - "step": 52795 - }, - { - "epoch": 1.35, - "learning_rate": 1.2056087205999863e-06, - "loss": 0.6572, - "step": 52796 - }, - { - "epoch": 1.35, - "learning_rate": 1.2055816412665504e-06, - "loss": 0.7764, - "step": 52797 - }, - { - "epoch": 1.35, - "learning_rate": 1.2055545617757108e-06, - "loss": 0.6733, - "step": 52798 - }, - { - "epoch": 1.35, - "learning_rate": 1.2055274821274868e-06, - "loss": 0.7832, - "step": 52799 - }, - { - "epoch": 1.35, - "learning_rate": 1.2055004023219002e-06, - "loss": 0.4985, - "step": 52800 - }, - { - "epoch": 1.35, - "learning_rate": 1.205473322358971e-06, - "loss": 0.3915, - "step": 52801 - }, - { - "epoch": 1.35, - "learning_rate": 1.2054462422387207e-06, - "loss": 0.5244, - "step": 52802 - }, - { - "epoch": 1.35, - "learning_rate": 1.2054191619611699e-06, - "loss": 0.6377, - "step": 52803 - }, - { - "epoch": 1.35, - "learning_rate": 1.2053920815263385e-06, - "loss": 0.7837, - "step": 52804 - }, - { - "epoch": 1.35, - "learning_rate": 1.2053650009342481e-06, - "loss": 0.6982, - "step": 52805 - }, - { - "epoch": 1.35, - "learning_rate": 1.2053379201849192e-06, - "loss": 0.8516, - "step": 52806 - }, - { - "epoch": 1.35, - "learning_rate": 1.2053108392783725e-06, - "loss": 0.709, - "step": 52807 - }, - { - "epoch": 1.35, - "learning_rate": 1.2052837582146287e-06, - "loss": 0.5088, - "step": 52808 - }, - { - "epoch": 1.35, - "learning_rate": 1.2052566769937084e-06, - "loss": 0.666, - "step": 52809 - }, - { - "epoch": 1.35, - "learning_rate": 1.2052295956156327e-06, - "loss": 0.6377, - "step": 52810 - }, - { - "epoch": 1.35, - "learning_rate": 1.205202514080422e-06, - "loss": 0.5959, - "step": 52811 - }, - { - "epoch": 1.35, - "learning_rate": 1.205175432388097e-06, - "loss": 0.6787, - "step": 52812 - }, - { - "epoch": 1.35, - "learning_rate": 1.2051483505386792e-06, - "loss": 0.7188, - "step": 52813 - }, - { - "epoch": 1.35, - "learning_rate": 1.2051212685321882e-06, - "loss": 0.6738, - "step": 52814 - }, - { - "epoch": 1.35, - "learning_rate": 1.2050941863686457e-06, - "loss": 0.6294, - "step": 52815 - }, - { - "epoch": 1.35, - "learning_rate": 1.2050671040480715e-06, - "loss": 0.4299, - "step": 52816 - }, - { - "epoch": 1.35, - "learning_rate": 1.2050400215704874e-06, - "loss": 0.6357, - "step": 52817 - }, - { - "epoch": 1.35, - "learning_rate": 1.2050129389359134e-06, - "loss": 0.6504, - "step": 52818 - }, - { - "epoch": 1.35, - "learning_rate": 1.2049858561443705e-06, - "loss": 0.5239, - "step": 52819 - }, - { - "epoch": 1.35, - "learning_rate": 1.2049587731958789e-06, - "loss": 0.5789, - "step": 52820 - }, - { - "epoch": 1.35, - "learning_rate": 1.2049316900904602e-06, - "loss": 0.9365, - "step": 52821 - }, - { - "epoch": 1.35, - "learning_rate": 1.2049046068281342e-06, - "loss": 0.6431, - "step": 52822 - }, - { - "epoch": 1.35, - "learning_rate": 1.2048775234089227e-06, - "loss": 0.7109, - "step": 52823 - }, - { - "epoch": 1.35, - "learning_rate": 1.204850439832846e-06, - "loss": 0.564, - "step": 52824 - }, - { - "epoch": 1.35, - "learning_rate": 1.2048233560999246e-06, - "loss": 0.5605, - "step": 52825 - }, - { - "epoch": 1.35, - "learning_rate": 1.2047962722101793e-06, - "loss": 0.4993, - "step": 52826 - }, - { - "epoch": 1.35, - "learning_rate": 1.2047691881636308e-06, - "loss": 0.6274, - "step": 52827 - }, - { - "epoch": 1.35, - "learning_rate": 1.2047421039603001e-06, - "loss": 0.6846, - "step": 52828 - }, - { - "epoch": 1.35, - "learning_rate": 1.2047150196002076e-06, - "loss": 0.7124, - "step": 52829 - }, - { - "epoch": 1.35, - "learning_rate": 1.2046879350833746e-06, - "loss": 0.6357, - "step": 52830 - }, - { - "epoch": 1.35, - "learning_rate": 1.2046608504098207e-06, - "loss": 0.7373, - "step": 52831 - }, - { - "epoch": 1.35, - "learning_rate": 1.2046337655795682e-06, - "loss": 0.8271, - "step": 52832 - }, - { - "epoch": 1.35, - "learning_rate": 1.204606680592637e-06, - "loss": 0.5295, - "step": 52833 - }, - { - "epoch": 1.35, - "learning_rate": 1.2045795954490474e-06, - "loss": 0.7266, - "step": 52834 - }, - { - "epoch": 1.35, - "learning_rate": 1.2045525101488207e-06, - "loss": 0.5879, - "step": 52835 - }, - { - "epoch": 1.35, - "learning_rate": 1.2045254246919778e-06, - "loss": 0.6709, - "step": 52836 - }, - { - "epoch": 1.35, - "learning_rate": 1.204498339078539e-06, - "loss": 0.6201, - "step": 52837 - }, - { - "epoch": 1.35, - "learning_rate": 1.2044712533085255e-06, - "loss": 0.7393, - "step": 52838 - }, - { - "epoch": 1.35, - "learning_rate": 1.2044441673819575e-06, - "loss": 0.6562, - "step": 52839 - }, - { - "epoch": 1.35, - "learning_rate": 1.2044170812988562e-06, - "loss": 0.6758, - "step": 52840 - }, - { - "epoch": 1.35, - "learning_rate": 1.2043899950592418e-06, - "loss": 0.6364, - "step": 52841 - }, - { - "epoch": 1.35, - "learning_rate": 1.2043629086631355e-06, - "loss": 0.585, - "step": 52842 - }, - { - "epoch": 1.35, - "learning_rate": 1.2043358221105581e-06, - "loss": 0.5249, - "step": 52843 - }, - { - "epoch": 1.35, - "learning_rate": 1.2043087354015301e-06, - "loss": 0.5386, - "step": 52844 - }, - { - "epoch": 1.35, - "learning_rate": 1.204281648536072e-06, - "loss": 0.5745, - "step": 52845 - }, - { - "epoch": 1.35, - "learning_rate": 1.2042545615142052e-06, - "loss": 0.6738, - "step": 52846 - }, - { - "epoch": 1.35, - "learning_rate": 1.20422747433595e-06, - "loss": 0.7461, - "step": 52847 - }, - { - "epoch": 1.35, - "learning_rate": 1.2042003870013272e-06, - "loss": 0.5771, - "step": 52848 - }, - { - "epoch": 1.35, - "learning_rate": 1.2041732995103575e-06, - "loss": 0.6191, - "step": 52849 - }, - { - "epoch": 1.35, - "learning_rate": 1.2041462118630616e-06, - "loss": 0.6304, - "step": 52850 - }, - { - "epoch": 1.35, - "learning_rate": 1.2041191240594606e-06, - "loss": 0.7354, - "step": 52851 - }, - { - "epoch": 1.35, - "learning_rate": 1.2040920360995748e-06, - "loss": 0.4292, - "step": 52852 - }, - { - "epoch": 1.35, - "learning_rate": 1.2040649479834252e-06, - "loss": 0.6113, - "step": 52853 - }, - { - "epoch": 1.35, - "learning_rate": 1.2040378597110323e-06, - "loss": 0.7119, - "step": 52854 - }, - { - "epoch": 1.35, - "learning_rate": 1.204010771282417e-06, - "loss": 0.7285, - "step": 52855 - }, - { - "epoch": 1.35, - "learning_rate": 1.2039836826976e-06, - "loss": 0.5723, - "step": 52856 - }, - { - "epoch": 1.35, - "learning_rate": 1.2039565939566024e-06, - "loss": 0.8125, - "step": 52857 - }, - { - "epoch": 1.35, - "learning_rate": 1.2039295050594444e-06, - "loss": 0.4546, - "step": 52858 - }, - { - "epoch": 1.35, - "learning_rate": 1.203902416006147e-06, - "loss": 0.5669, - "step": 52859 - }, - { - "epoch": 1.35, - "learning_rate": 1.2038753267967307e-06, - "loss": 0.6289, - "step": 52860 - }, - { - "epoch": 1.35, - "learning_rate": 1.2038482374312166e-06, - "loss": 0.5566, - "step": 52861 - }, - { - "epoch": 1.35, - "learning_rate": 1.2038211479096253e-06, - "loss": 0.7939, - "step": 52862 - }, - { - "epoch": 1.35, - "learning_rate": 1.2037940582319776e-06, - "loss": 0.4897, - "step": 52863 - }, - { - "epoch": 1.35, - "learning_rate": 1.2037669683982938e-06, - "loss": 0.4961, - "step": 52864 - }, - { - "epoch": 1.35, - "learning_rate": 1.2037398784085954e-06, - "loss": 0.5129, - "step": 52865 - }, - { - "epoch": 1.35, - "learning_rate": 1.2037127882629025e-06, - "loss": 0.5444, - "step": 52866 - }, - { - "epoch": 1.36, - "learning_rate": 1.2036856979612362e-06, - "loss": 0.5889, - "step": 52867 - }, - { - "epoch": 1.36, - "learning_rate": 1.2036586075036173e-06, - "loss": 0.3687, - "step": 52868 - }, - { - "epoch": 1.36, - "learning_rate": 1.2036315168900662e-06, - "loss": 0.8867, - "step": 52869 - }, - { - "epoch": 1.36, - "learning_rate": 1.2036044261206035e-06, - "loss": 0.5645, - "step": 52870 - }, - { - "epoch": 1.36, - "learning_rate": 1.2035773351952507e-06, - "loss": 0.7129, - "step": 52871 - }, - { - "epoch": 1.36, - "learning_rate": 1.2035502441140277e-06, - "loss": 0.6738, - "step": 52872 - }, - { - "epoch": 1.36, - "learning_rate": 1.203523152876956e-06, - "loss": 0.6299, - "step": 52873 - }, - { - "epoch": 1.36, - "learning_rate": 1.2034960614840558e-06, - "loss": 0.6689, - "step": 52874 - }, - { - "epoch": 1.36, - "learning_rate": 1.203468969935348e-06, - "loss": 0.6963, - "step": 52875 - }, - { - "epoch": 1.36, - "learning_rate": 1.2034418782308536e-06, - "loss": 0.5596, - "step": 52876 - }, - { - "epoch": 1.36, - "learning_rate": 1.2034147863705928e-06, - "loss": 0.4956, - "step": 52877 - }, - { - "epoch": 1.36, - "learning_rate": 1.2033876943545869e-06, - "loss": 0.6416, - "step": 52878 - }, - { - "epoch": 1.36, - "learning_rate": 1.2033606021828562e-06, - "loss": 0.6665, - "step": 52879 - }, - { - "epoch": 1.36, - "learning_rate": 1.2033335098554218e-06, - "loss": 0.6328, - "step": 52880 - }, - { - "epoch": 1.36, - "learning_rate": 1.203306417372304e-06, - "loss": 0.6616, - "step": 52881 - }, - { - "epoch": 1.36, - "learning_rate": 1.2032793247335241e-06, - "loss": 0.7168, - "step": 52882 - }, - { - "epoch": 1.36, - "learning_rate": 1.2032522319391025e-06, - "loss": 0.7041, - "step": 52883 - }, - { - "epoch": 1.36, - "learning_rate": 1.2032251389890601e-06, - "loss": 0.8604, - "step": 52884 - }, - { - "epoch": 1.36, - "learning_rate": 1.2031980458834174e-06, - "loss": 0.7305, - "step": 52885 - }, - { - "epoch": 1.36, - "learning_rate": 1.2031709526221953e-06, - "loss": 0.4582, - "step": 52886 - }, - { - "epoch": 1.36, - "learning_rate": 1.2031438592054145e-06, - "loss": 0.6626, - "step": 52887 - }, - { - "epoch": 1.36, - "learning_rate": 1.2031167656330963e-06, - "loss": 0.7041, - "step": 52888 - }, - { - "epoch": 1.36, - "learning_rate": 1.2030896719052604e-06, - "loss": 0.5801, - "step": 52889 - }, - { - "epoch": 1.36, - "learning_rate": 1.2030625780219284e-06, - "loss": 0.6133, - "step": 52890 - }, - { - "epoch": 1.36, - "learning_rate": 1.2030354839831203e-06, - "loss": 0.7432, - "step": 52891 - }, - { - "epoch": 1.36, - "learning_rate": 1.2030083897888575e-06, - "loss": 0.5537, - "step": 52892 - }, - { - "epoch": 1.36, - "learning_rate": 1.2029812954391605e-06, - "loss": 0.6992, - "step": 52893 - }, - { - "epoch": 1.36, - "learning_rate": 1.20295420093405e-06, - "loss": 0.5601, - "step": 52894 - }, - { - "epoch": 1.36, - "learning_rate": 1.2029271062735468e-06, - "loss": 0.4568, - "step": 52895 - }, - { - "epoch": 1.36, - "learning_rate": 1.2029000114576717e-06, - "loss": 0.6006, - "step": 52896 - }, - { - "epoch": 1.36, - "learning_rate": 1.2028729164864455e-06, - "loss": 0.5034, - "step": 52897 - }, - { - "epoch": 1.36, - "learning_rate": 1.2028458213598887e-06, - "loss": 0.5647, - "step": 52898 - }, - { - "epoch": 1.36, - "learning_rate": 1.2028187260780222e-06, - "loss": 0.5508, - "step": 52899 - }, - { - "epoch": 1.36, - "learning_rate": 1.2027916306408667e-06, - "loss": 0.7197, - "step": 52900 - }, - { - "epoch": 1.36, - "learning_rate": 1.202764535048443e-06, - "loss": 0.8926, - "step": 52901 - }, - { - "epoch": 1.36, - "learning_rate": 1.2027374393007716e-06, - "loss": 0.5474, - "step": 52902 - }, - { - "epoch": 1.36, - "learning_rate": 1.2027103433978743e-06, - "loss": 0.7734, - "step": 52903 - }, - { - "epoch": 1.36, - "learning_rate": 1.2026832473397702e-06, - "loss": 0.666, - "step": 52904 - }, - { - "epoch": 1.36, - "learning_rate": 1.202656151126481e-06, - "loss": 0.5503, - "step": 52905 - }, - { - "epoch": 1.36, - "learning_rate": 1.2026290547580274e-06, - "loss": 0.5315, - "step": 52906 - }, - { - "epoch": 1.36, - "learning_rate": 1.20260195823443e-06, - "loss": 0.6904, - "step": 52907 - }, - { - "epoch": 1.36, - "learning_rate": 1.2025748615557096e-06, - "loss": 0.5586, - "step": 52908 - }, - { - "epoch": 1.36, - "learning_rate": 1.2025477647218872e-06, - "loss": 0.6128, - "step": 52909 - }, - { - "epoch": 1.36, - "learning_rate": 1.202520667732983e-06, - "loss": 0.6338, - "step": 52910 - }, - { - "epoch": 1.36, - "learning_rate": 1.2024935705890177e-06, - "loss": 0.7178, - "step": 52911 - }, - { - "epoch": 1.36, - "learning_rate": 1.2024664732900128e-06, - "loss": 0.8662, - "step": 52912 - }, - { - "epoch": 1.36, - "learning_rate": 1.2024393758359888e-06, - "loss": 0.6323, - "step": 52913 - }, - { - "epoch": 1.36, - "learning_rate": 1.202412278226966e-06, - "loss": 0.708, - "step": 52914 - }, - { - "epoch": 1.36, - "learning_rate": 1.2023851804629657e-06, - "loss": 0.5972, - "step": 52915 - }, - { - "epoch": 1.36, - "learning_rate": 1.2023580825440079e-06, - "loss": 0.5542, - "step": 52916 - }, - { - "epoch": 1.36, - "learning_rate": 1.2023309844701142e-06, - "loss": 0.5938, - "step": 52917 - }, - { - "epoch": 1.36, - "learning_rate": 1.2023038862413049e-06, - "loss": 0.6523, - "step": 52918 - }, - { - "epoch": 1.36, - "learning_rate": 1.2022767878576008e-06, - "loss": 0.7227, - "step": 52919 - }, - { - "epoch": 1.36, - "learning_rate": 1.2022496893190225e-06, - "loss": 0.6777, - "step": 52920 - }, - { - "epoch": 1.36, - "learning_rate": 1.202222590625591e-06, - "loss": 0.748, - "step": 52921 - }, - { - "epoch": 1.36, - "learning_rate": 1.2021954917773272e-06, - "loss": 0.5986, - "step": 52922 - }, - { - "epoch": 1.36, - "learning_rate": 1.2021683927742514e-06, - "loss": 0.646, - "step": 52923 - }, - { - "epoch": 1.36, - "learning_rate": 1.2021412936163847e-06, - "loss": 0.7734, - "step": 52924 - }, - { - "epoch": 1.36, - "learning_rate": 1.2021141943037474e-06, - "loss": 0.6234, - "step": 52925 - }, - { - "epoch": 1.36, - "learning_rate": 1.2020870948363608e-06, - "loss": 0.5388, - "step": 52926 - }, - { - "epoch": 1.36, - "learning_rate": 1.2020599952142453e-06, - "loss": 0.6045, - "step": 52927 - }, - { - "epoch": 1.36, - "learning_rate": 1.2020328954374219e-06, - "loss": 0.6836, - "step": 52928 - }, - { - "epoch": 1.36, - "learning_rate": 1.202005795505911e-06, - "loss": 0.8174, - "step": 52929 - }, - { - "epoch": 1.36, - "learning_rate": 1.2019786954197338e-06, - "loss": 0.7456, - "step": 52930 - }, - { - "epoch": 1.36, - "learning_rate": 1.2019515951789105e-06, - "loss": 0.6831, - "step": 52931 - }, - { - "epoch": 1.36, - "learning_rate": 1.2019244947834623e-06, - "loss": 0.7852, - "step": 52932 - }, - { - "epoch": 1.36, - "learning_rate": 1.20189739423341e-06, - "loss": 0.6196, - "step": 52933 - }, - { - "epoch": 1.36, - "learning_rate": 1.2018702935287739e-06, - "loss": 0.707, - "step": 52934 - }, - { - "epoch": 1.36, - "learning_rate": 1.201843192669575e-06, - "loss": 0.7559, - "step": 52935 - }, - { - "epoch": 1.36, - "learning_rate": 1.2018160916558342e-06, - "loss": 0.3564, - "step": 52936 - }, - { - "epoch": 1.36, - "learning_rate": 1.2017889904875718e-06, - "loss": 0.6475, - "step": 52937 - }, - { - "epoch": 1.36, - "learning_rate": 1.2017618891648091e-06, - "loss": 0.6528, - "step": 52938 - }, - { - "epoch": 1.36, - "learning_rate": 1.2017347876875667e-06, - "loss": 0.709, - "step": 52939 - }, - { - "epoch": 1.36, - "learning_rate": 1.2017076860558648e-06, - "loss": 0.7266, - "step": 52940 - }, - { - "epoch": 1.36, - "learning_rate": 1.201680584269725e-06, - "loss": 0.708, - "step": 52941 - }, - { - "epoch": 1.36, - "learning_rate": 1.2016534823291677e-06, - "loss": 0.6621, - "step": 52942 - }, - { - "epoch": 1.36, - "learning_rate": 1.2016263802342135e-06, - "loss": 0.5044, - "step": 52943 - }, - { - "epoch": 1.36, - "learning_rate": 1.201599277984883e-06, - "loss": 0.7344, - "step": 52944 - }, - { - "epoch": 1.36, - "learning_rate": 1.2015721755811976e-06, - "loss": 0.6035, - "step": 52945 - }, - { - "epoch": 1.36, - "learning_rate": 1.2015450730231773e-06, - "loss": 0.6816, - "step": 52946 - }, - { - "epoch": 1.36, - "learning_rate": 1.2015179703108433e-06, - "loss": 0.5898, - "step": 52947 - }, - { - "epoch": 1.36, - "learning_rate": 1.2014908674442163e-06, - "loss": 0.7178, - "step": 52948 - }, - { - "epoch": 1.36, - "learning_rate": 1.2014637644233171e-06, - "loss": 0.7334, - "step": 52949 - }, - { - "epoch": 1.36, - "learning_rate": 1.2014366612481664e-06, - "loss": 0.6309, - "step": 52950 - }, - { - "epoch": 1.36, - "learning_rate": 1.2014095579187848e-06, - "loss": 0.7383, - "step": 52951 - }, - { - "epoch": 1.36, - "learning_rate": 1.201382454435193e-06, - "loss": 0.5447, - "step": 52952 - }, - { - "epoch": 1.36, - "learning_rate": 1.2013553507974124e-06, - "loss": 0.918, - "step": 52953 - }, - { - "epoch": 1.36, - "learning_rate": 1.2013282470054626e-06, - "loss": 0.7344, - "step": 52954 - }, - { - "epoch": 1.36, - "learning_rate": 1.2013011430593656e-06, - "loss": 0.5684, - "step": 52955 - }, - { - "epoch": 1.36, - "learning_rate": 1.2012740389591412e-06, - "loss": 0.8545, - "step": 52956 - }, - { - "epoch": 1.36, - "learning_rate": 1.2012469347048106e-06, - "loss": 0.791, - "step": 52957 - }, - { - "epoch": 1.36, - "learning_rate": 1.2012198302963946e-06, - "loss": 0.585, - "step": 52958 - }, - { - "epoch": 1.36, - "learning_rate": 1.2011927257339138e-06, - "loss": 0.7153, - "step": 52959 - }, - { - "epoch": 1.36, - "learning_rate": 1.201165621017389e-06, - "loss": 0.7002, - "step": 52960 - }, - { - "epoch": 1.36, - "learning_rate": 1.2011385161468408e-06, - "loss": 0.5879, - "step": 52961 - }, - { - "epoch": 1.36, - "learning_rate": 1.20111141112229e-06, - "loss": 0.7363, - "step": 52962 - }, - { - "epoch": 1.36, - "learning_rate": 1.2010843059437577e-06, - "loss": 0.6445, - "step": 52963 - }, - { - "epoch": 1.36, - "learning_rate": 1.2010572006112643e-06, - "loss": 0.6406, - "step": 52964 - }, - { - "epoch": 1.36, - "learning_rate": 1.2010300951248305e-06, - "loss": 0.5591, - "step": 52965 - }, - { - "epoch": 1.36, - "learning_rate": 1.2010029894844774e-06, - "loss": 0.7441, - "step": 52966 - }, - { - "epoch": 1.36, - "learning_rate": 1.2009758836902252e-06, - "loss": 0.7646, - "step": 52967 - }, - { - "epoch": 1.36, - "learning_rate": 1.2009487777420958e-06, - "loss": 0.5776, - "step": 52968 - }, - { - "epoch": 1.36, - "learning_rate": 1.2009216716401085e-06, - "loss": 0.7773, - "step": 52969 - }, - { - "epoch": 1.36, - "learning_rate": 1.2008945653842848e-06, - "loss": 0.5776, - "step": 52970 - }, - { - "epoch": 1.36, - "learning_rate": 1.2008674589746452e-06, - "loss": 0.7227, - "step": 52971 - }, - { - "epoch": 1.36, - "learning_rate": 1.200840352411211e-06, - "loss": 0.8301, - "step": 52972 - }, - { - "epoch": 1.36, - "learning_rate": 1.2008132456940026e-06, - "loss": 0.3735, - "step": 52973 - }, - { - "epoch": 1.36, - "learning_rate": 1.2007861388230404e-06, - "loss": 0.7246, - "step": 52974 - }, - { - "epoch": 1.36, - "learning_rate": 1.2007590317983456e-06, - "loss": 0.751, - "step": 52975 - }, - { - "epoch": 1.36, - "learning_rate": 1.200731924619939e-06, - "loss": 0.6436, - "step": 52976 - }, - { - "epoch": 1.36, - "learning_rate": 1.2007048172878409e-06, - "loss": 0.5481, - "step": 52977 - }, - { - "epoch": 1.36, - "learning_rate": 1.2006777098020728e-06, - "loss": 0.8057, - "step": 52978 - }, - { - "epoch": 1.36, - "learning_rate": 1.2006506021626548e-06, - "loss": 0.8311, - "step": 52979 - }, - { - "epoch": 1.36, - "learning_rate": 1.2006234943696078e-06, - "loss": 0.6108, - "step": 52980 - }, - { - "epoch": 1.36, - "learning_rate": 1.2005963864229526e-06, - "loss": 0.6143, - "step": 52981 - }, - { - "epoch": 1.36, - "learning_rate": 1.20056927832271e-06, - "loss": 0.6978, - "step": 52982 - }, - { - "epoch": 1.36, - "learning_rate": 1.2005421700689007e-06, - "loss": 0.6719, - "step": 52983 - }, - { - "epoch": 1.36, - "learning_rate": 1.2005150616615453e-06, - "loss": 0.5957, - "step": 52984 - }, - { - "epoch": 1.36, - "learning_rate": 1.200487953100665e-06, - "loss": 0.6067, - "step": 52985 - }, - { - "epoch": 1.36, - "learning_rate": 1.20046084438628e-06, - "loss": 0.6211, - "step": 52986 - }, - { - "epoch": 1.36, - "learning_rate": 1.2004337355184118e-06, - "loss": 0.5889, - "step": 52987 - }, - { - "epoch": 1.36, - "learning_rate": 1.2004066264970805e-06, - "loss": 0.7842, - "step": 52988 - }, - { - "epoch": 1.36, - "learning_rate": 1.2003795173223072e-06, - "loss": 0.6182, - "step": 52989 - }, - { - "epoch": 1.36, - "learning_rate": 1.2003524079941124e-06, - "loss": 0.5646, - "step": 52990 - }, - { - "epoch": 1.36, - "learning_rate": 1.2003252985125168e-06, - "loss": 0.7178, - "step": 52991 - }, - { - "epoch": 1.36, - "learning_rate": 1.2002981888775411e-06, - "loss": 0.5605, - "step": 52992 - }, - { - "epoch": 1.36, - "learning_rate": 1.2002710790892072e-06, - "loss": 0.7646, - "step": 52993 - }, - { - "epoch": 1.36, - "learning_rate": 1.2002439691475342e-06, - "loss": 0.6982, - "step": 52994 - }, - { - "epoch": 1.36, - "learning_rate": 1.2002168590525438e-06, - "loss": 0.707, - "step": 52995 - }, - { - "epoch": 1.36, - "learning_rate": 1.2001897488042566e-06, - "loss": 0.7217, - "step": 52996 - }, - { - "epoch": 1.36, - "learning_rate": 1.2001626384026932e-06, - "loss": 0.6333, - "step": 52997 - }, - { - "epoch": 1.36, - "learning_rate": 1.2001355278478747e-06, - "loss": 0.4363, - "step": 52998 - }, - { - "epoch": 1.36, - "learning_rate": 1.2001084171398215e-06, - "loss": 0.7334, - "step": 52999 - }, - { - "epoch": 1.36, - "learning_rate": 1.200081306278554e-06, - "loss": 0.7031, - "step": 53000 - }, - { - "epoch": 1.36, - "learning_rate": 1.2000541952640942e-06, - "loss": 0.5781, - "step": 53001 - }, - { - "epoch": 1.36, - "learning_rate": 1.2000270840964617e-06, - "loss": 0.6768, - "step": 53002 - }, - { - "epoch": 1.36, - "learning_rate": 1.1999999727756777e-06, - "loss": 0.7734, - "step": 53003 - }, - { - "epoch": 1.36, - "learning_rate": 1.1999728613017632e-06, - "loss": 0.7168, - "step": 53004 - }, - { - "epoch": 1.36, - "learning_rate": 1.1999457496747386e-06, - "loss": 0.6699, - "step": 53005 - }, - { - "epoch": 1.36, - "learning_rate": 1.1999186378946242e-06, - "loss": 0.5391, - "step": 53006 - }, - { - "epoch": 1.36, - "learning_rate": 1.199891525961442e-06, - "loss": 0.6187, - "step": 53007 - }, - { - "epoch": 1.36, - "learning_rate": 1.1998644138752117e-06, - "loss": 0.5884, - "step": 53008 - }, - { - "epoch": 1.36, - "learning_rate": 1.1998373016359543e-06, - "loss": 0.6885, - "step": 53009 - }, - { - "epoch": 1.36, - "learning_rate": 1.1998101892436907e-06, - "loss": 0.6602, - "step": 53010 - }, - { - "epoch": 1.36, - "learning_rate": 1.1997830766984415e-06, - "loss": 0.7031, - "step": 53011 - }, - { - "epoch": 1.36, - "learning_rate": 1.1997559640002281e-06, - "loss": 0.626, - "step": 53012 - }, - { - "epoch": 1.36, - "learning_rate": 1.1997288511490705e-06, - "loss": 0.6006, - "step": 53013 - }, - { - "epoch": 1.36, - "learning_rate": 1.1997017381449897e-06, - "loss": 0.7295, - "step": 53014 - }, - { - "epoch": 1.36, - "learning_rate": 1.1996746249880063e-06, - "loss": 0.6965, - "step": 53015 - }, - { - "epoch": 1.36, - "learning_rate": 1.1996475116781414e-06, - "loss": 0.6167, - "step": 53016 - }, - { - "epoch": 1.36, - "learning_rate": 1.1996203982154153e-06, - "loss": 0.5044, - "step": 53017 - }, - { - "epoch": 1.36, - "learning_rate": 1.1995932845998496e-06, - "loss": 0.626, - "step": 53018 - }, - { - "epoch": 1.36, - "learning_rate": 1.1995661708314639e-06, - "loss": 0.4576, - "step": 53019 - }, - { - "epoch": 1.36, - "learning_rate": 1.19953905691028e-06, - "loss": 0.647, - "step": 53020 - }, - { - "epoch": 1.36, - "learning_rate": 1.1995119428363178e-06, - "loss": 0.583, - "step": 53021 - }, - { - "epoch": 1.36, - "learning_rate": 1.199484828609599e-06, - "loss": 0.5718, - "step": 53022 - }, - { - "epoch": 1.36, - "learning_rate": 1.1994577142301433e-06, - "loss": 0.688, - "step": 53023 - }, - { - "epoch": 1.36, - "learning_rate": 1.1994305996979726e-06, - "loss": 0.6885, - "step": 53024 - }, - { - "epoch": 1.36, - "learning_rate": 1.1994034850131065e-06, - "loss": 0.5513, - "step": 53025 - }, - { - "epoch": 1.36, - "learning_rate": 1.1993763701755666e-06, - "loss": 0.5674, - "step": 53026 - }, - { - "epoch": 1.36, - "learning_rate": 1.1993492551853733e-06, - "loss": 0.5171, - "step": 53027 - }, - { - "epoch": 1.36, - "learning_rate": 1.1993221400425473e-06, - "loss": 0.5986, - "step": 53028 - }, - { - "epoch": 1.36, - "learning_rate": 1.1992950247471098e-06, - "loss": 0.5118, - "step": 53029 - }, - { - "epoch": 1.36, - "learning_rate": 1.199267909299081e-06, - "loss": 0.8975, - "step": 53030 - }, - { - "epoch": 1.36, - "learning_rate": 1.1992407936984822e-06, - "loss": 0.7842, - "step": 53031 - }, - { - "epoch": 1.36, - "learning_rate": 1.1992136779453337e-06, - "loss": 0.5962, - "step": 53032 - }, - { - "epoch": 1.36, - "learning_rate": 1.1991865620396567e-06, - "loss": 0.604, - "step": 53033 - }, - { - "epoch": 1.36, - "learning_rate": 1.199159445981471e-06, - "loss": 0.7373, - "step": 53034 - }, - { - "epoch": 1.36, - "learning_rate": 1.1991323297707987e-06, - "loss": 0.6504, - "step": 53035 - }, - { - "epoch": 1.36, - "learning_rate": 1.1991052134076599e-06, - "loss": 0.6196, - "step": 53036 - }, - { - "epoch": 1.36, - "learning_rate": 1.1990780968920754e-06, - "loss": 0.7178, - "step": 53037 - }, - { - "epoch": 1.36, - "learning_rate": 1.1990509802240658e-06, - "loss": 0.5977, - "step": 53038 - }, - { - "epoch": 1.36, - "learning_rate": 1.199023863403652e-06, - "loss": 0.7021, - "step": 53039 - }, - { - "epoch": 1.36, - "learning_rate": 1.1989967464308549e-06, - "loss": 0.7305, - "step": 53040 - }, - { - "epoch": 1.36, - "learning_rate": 1.198969629305695e-06, - "loss": 0.5879, - "step": 53041 - }, - { - "epoch": 1.36, - "learning_rate": 1.1989425120281932e-06, - "loss": 0.9111, - "step": 53042 - }, - { - "epoch": 1.36, - "learning_rate": 1.1989153945983706e-06, - "loss": 0.5662, - "step": 53043 - }, - { - "epoch": 1.36, - "learning_rate": 1.1988882770162472e-06, - "loss": 0.6738, - "step": 53044 - }, - { - "epoch": 1.36, - "learning_rate": 1.1988611592818446e-06, - "loss": 0.6895, - "step": 53045 - }, - { - "epoch": 1.36, - "learning_rate": 1.1988340413951826e-06, - "loss": 0.6133, - "step": 53046 - }, - { - "epoch": 1.36, - "learning_rate": 1.198806923356283e-06, - "loss": 0.3467, - "step": 53047 - }, - { - "epoch": 1.36, - "learning_rate": 1.1987798051651659e-06, - "loss": 0.791, - "step": 53048 - }, - { - "epoch": 1.36, - "learning_rate": 1.1987526868218523e-06, - "loss": 0.7119, - "step": 53049 - }, - { - "epoch": 1.36, - "learning_rate": 1.1987255683263627e-06, - "loss": 0.8555, - "step": 53050 - }, - { - "epoch": 1.36, - "learning_rate": 1.1986984496787182e-06, - "loss": 0.707, - "step": 53051 - }, - { - "epoch": 1.36, - "learning_rate": 1.1986713308789397e-06, - "loss": 0.7656, - "step": 53052 - }, - { - "epoch": 1.36, - "learning_rate": 1.1986442119270473e-06, - "loss": 0.5557, - "step": 53053 - }, - { - "epoch": 1.36, - "learning_rate": 1.1986170928230623e-06, - "loss": 0.6001, - "step": 53054 - }, - { - "epoch": 1.36, - "learning_rate": 1.1985899735670053e-06, - "loss": 0.709, - "step": 53055 - }, - { - "epoch": 1.36, - "learning_rate": 1.1985628541588972e-06, - "loss": 0.6172, - "step": 53056 - }, - { - "epoch": 1.36, - "learning_rate": 1.1985357345987588e-06, - "loss": 0.6111, - "step": 53057 - }, - { - "epoch": 1.36, - "learning_rate": 1.1985086148866103e-06, - "loss": 0.6348, - "step": 53058 - }, - { - "epoch": 1.36, - "learning_rate": 1.198481495022473e-06, - "loss": 0.7979, - "step": 53059 - }, - { - "epoch": 1.36, - "learning_rate": 1.1984543750063678e-06, - "loss": 0.5322, - "step": 53060 - }, - { - "epoch": 1.36, - "learning_rate": 1.1984272548383149e-06, - "loss": 0.5063, - "step": 53061 - }, - { - "epoch": 1.36, - "learning_rate": 1.198400134518336e-06, - "loss": 0.4961, - "step": 53062 - }, - { - "epoch": 1.36, - "learning_rate": 1.1983730140464502e-06, - "loss": 0.7344, - "step": 53063 - }, - { - "epoch": 1.36, - "learning_rate": 1.1983458934226802e-06, - "loss": 0.5815, - "step": 53064 - }, - { - "epoch": 1.36, - "learning_rate": 1.1983187726470454e-06, - "loss": 0.8223, - "step": 53065 - }, - { - "epoch": 1.36, - "learning_rate": 1.1982916517195671e-06, - "loss": 0.5825, - "step": 53066 - }, - { - "epoch": 1.36, - "learning_rate": 1.1982645306402664e-06, - "loss": 0.5166, - "step": 53067 - }, - { - "epoch": 1.36, - "learning_rate": 1.1982374094091632e-06, - "loss": 0.7529, - "step": 53068 - }, - { - "epoch": 1.36, - "learning_rate": 1.1982102880262788e-06, - "loss": 0.6299, - "step": 53069 - }, - { - "epoch": 1.36, - "learning_rate": 1.198183166491634e-06, - "loss": 0.4932, - "step": 53070 - }, - { - "epoch": 1.36, - "learning_rate": 1.1981560448052493e-06, - "loss": 0.7666, - "step": 53071 - }, - { - "epoch": 1.36, - "learning_rate": 1.198128922967146e-06, - "loss": 0.4243, - "step": 53072 - }, - { - "epoch": 1.36, - "learning_rate": 1.198101800977344e-06, - "loss": 0.7305, - "step": 53073 - }, - { - "epoch": 1.36, - "learning_rate": 1.1980746788358649e-06, - "loss": 0.6074, - "step": 53074 - }, - { - "epoch": 1.36, - "learning_rate": 1.198047556542729e-06, - "loss": 0.5547, - "step": 53075 - }, - { - "epoch": 1.36, - "learning_rate": 1.1980204340979573e-06, - "loss": 0.4724, - "step": 53076 - }, - { - "epoch": 1.36, - "learning_rate": 1.1979933115015703e-06, - "loss": 0.812, - "step": 53077 - }, - { - "epoch": 1.36, - "learning_rate": 1.197966188753589e-06, - "loss": 0.8213, - "step": 53078 - }, - { - "epoch": 1.36, - "learning_rate": 1.1979390658540342e-06, - "loss": 0.5547, - "step": 53079 - }, - { - "epoch": 1.36, - "learning_rate": 1.1979119428029264e-06, - "loss": 0.5439, - "step": 53080 - }, - { - "epoch": 1.36, - "learning_rate": 1.1978848196002864e-06, - "loss": 0.7139, - "step": 53081 - }, - { - "epoch": 1.36, - "learning_rate": 1.1978576962461356e-06, - "loss": 0.6924, - "step": 53082 - }, - { - "epoch": 1.36, - "learning_rate": 1.197830572740494e-06, - "loss": 0.7686, - "step": 53083 - }, - { - "epoch": 1.36, - "learning_rate": 1.1978034490833825e-06, - "loss": 0.7031, - "step": 53084 - }, - { - "epoch": 1.36, - "learning_rate": 1.197776325274822e-06, - "loss": 0.5586, - "step": 53085 - }, - { - "epoch": 1.36, - "learning_rate": 1.197749201314833e-06, - "loss": 0.584, - "step": 53086 - }, - { - "epoch": 1.36, - "learning_rate": 1.1977220772034373e-06, - "loss": 0.7935, - "step": 53087 - }, - { - "epoch": 1.36, - "learning_rate": 1.1976949529406541e-06, - "loss": 0.7002, - "step": 53088 - }, - { - "epoch": 1.36, - "learning_rate": 1.1976678285265057e-06, - "loss": 0.4824, - "step": 53089 - }, - { - "epoch": 1.36, - "learning_rate": 1.1976407039610115e-06, - "loss": 0.7656, - "step": 53090 - }, - { - "epoch": 1.36, - "learning_rate": 1.197613579244193e-06, - "loss": 0.75, - "step": 53091 - }, - { - "epoch": 1.36, - "learning_rate": 1.1975864543760712e-06, - "loss": 0.7588, - "step": 53092 - }, - { - "epoch": 1.36, - "learning_rate": 1.1975593293566664e-06, - "loss": 0.5659, - "step": 53093 - }, - { - "epoch": 1.36, - "learning_rate": 1.1975322041859994e-06, - "loss": 0.5076, - "step": 53094 - }, - { - "epoch": 1.36, - "learning_rate": 1.1975050788640913e-06, - "loss": 0.7012, - "step": 53095 - }, - { - "epoch": 1.36, - "learning_rate": 1.1974779533909622e-06, - "loss": 0.5815, - "step": 53096 - }, - { - "epoch": 1.36, - "learning_rate": 1.1974508277666339e-06, - "loss": 0.7451, - "step": 53097 - }, - { - "epoch": 1.36, - "learning_rate": 1.1974237019911262e-06, - "loss": 0.6958, - "step": 53098 - }, - { - "epoch": 1.36, - "learning_rate": 1.19739657606446e-06, - "loss": 0.4722, - "step": 53099 - }, - { - "epoch": 1.36, - "learning_rate": 1.1973694499866566e-06, - "loss": 0.6172, - "step": 53100 - }, - { - "epoch": 1.36, - "learning_rate": 1.1973423237577365e-06, - "loss": 0.5879, - "step": 53101 - }, - { - "epoch": 1.36, - "learning_rate": 1.197315197377721e-06, - "loss": 0.708, - "step": 53102 - }, - { - "epoch": 1.36, - "learning_rate": 1.1972880708466294e-06, - "loss": 0.5034, - "step": 53103 - }, - { - "epoch": 1.36, - "learning_rate": 1.1972609441644838e-06, - "loss": 0.5271, - "step": 53104 - }, - { - "epoch": 1.36, - "learning_rate": 1.1972338173313046e-06, - "loss": 0.5708, - "step": 53105 - }, - { - "epoch": 1.36, - "learning_rate": 1.1972066903471125e-06, - "loss": 0.7139, - "step": 53106 - }, - { - "epoch": 1.36, - "learning_rate": 1.1971795632119283e-06, - "loss": 0.7764, - "step": 53107 - }, - { - "epoch": 1.36, - "learning_rate": 1.197152435925773e-06, - "loss": 0.6274, - "step": 53108 - }, - { - "epoch": 1.36, - "learning_rate": 1.1971253084886667e-06, - "loss": 0.5254, - "step": 53109 - }, - { - "epoch": 1.36, - "learning_rate": 1.1970981809006308e-06, - "loss": 0.4862, - "step": 53110 - }, - { - "epoch": 1.36, - "learning_rate": 1.197071053161686e-06, - "loss": 0.7363, - "step": 53111 - }, - { - "epoch": 1.36, - "learning_rate": 1.1970439252718532e-06, - "loss": 0.7979, - "step": 53112 - }, - { - "epoch": 1.36, - "learning_rate": 1.1970167972311523e-06, - "loss": 0.7295, - "step": 53113 - }, - { - "epoch": 1.36, - "learning_rate": 1.196989669039605e-06, - "loss": 0.6602, - "step": 53114 - }, - { - "epoch": 1.36, - "learning_rate": 1.1969625406972318e-06, - "loss": 0.7617, - "step": 53115 - }, - { - "epoch": 1.36, - "learning_rate": 1.1969354122040533e-06, - "loss": 0.5861, - "step": 53116 - }, - { - "epoch": 1.36, - "learning_rate": 1.1969082835600908e-06, - "loss": 0.7461, - "step": 53117 - }, - { - "epoch": 1.36, - "learning_rate": 1.1968811547653641e-06, - "loss": 0.6689, - "step": 53118 - }, - { - "epoch": 1.36, - "learning_rate": 1.1968540258198952e-06, - "loss": 0.5601, - "step": 53119 - }, - { - "epoch": 1.36, - "learning_rate": 1.1968268967237035e-06, - "loss": 0.7021, - "step": 53120 - }, - { - "epoch": 1.36, - "learning_rate": 1.1967997674768112e-06, - "loss": 0.4207, - "step": 53121 - }, - { - "epoch": 1.36, - "learning_rate": 1.196772638079238e-06, - "loss": 0.6826, - "step": 53122 - }, - { - "epoch": 1.36, - "learning_rate": 1.1967455085310052e-06, - "loss": 0.6274, - "step": 53123 - }, - { - "epoch": 1.36, - "learning_rate": 1.196718378832133e-06, - "loss": 0.6099, - "step": 53124 - }, - { - "epoch": 1.36, - "learning_rate": 1.196691248982643e-06, - "loss": 0.6899, - "step": 53125 - }, - { - "epoch": 1.36, - "learning_rate": 1.1966641189825552e-06, - "loss": 0.666, - "step": 53126 - }, - { - "epoch": 1.36, - "learning_rate": 1.1966369888318912e-06, - "loss": 0.793, - "step": 53127 - }, - { - "epoch": 1.36, - "learning_rate": 1.1966098585306709e-06, - "loss": 0.8486, - "step": 53128 - }, - { - "epoch": 1.36, - "learning_rate": 1.1965827280789159e-06, - "loss": 0.6284, - "step": 53129 - }, - { - "epoch": 1.36, - "learning_rate": 1.196555597476646e-06, - "loss": 0.8975, - "step": 53130 - }, - { - "epoch": 1.36, - "learning_rate": 1.1965284667238829e-06, - "loss": 0.6943, - "step": 53131 - }, - { - "epoch": 1.36, - "learning_rate": 1.196501335820647e-06, - "loss": 0.5811, - "step": 53132 - }, - { - "epoch": 1.36, - "learning_rate": 1.196474204766959e-06, - "loss": 0.6904, - "step": 53133 - }, - { - "epoch": 1.36, - "learning_rate": 1.1964470735628395e-06, - "loss": 0.5835, - "step": 53134 - }, - { - "epoch": 1.36, - "learning_rate": 1.1964199422083096e-06, - "loss": 0.561, - "step": 53135 - }, - { - "epoch": 1.36, - "learning_rate": 1.19639281070339e-06, - "loss": 0.5415, - "step": 53136 - }, - { - "epoch": 1.36, - "learning_rate": 1.1963656790481015e-06, - "loss": 0.667, - "step": 53137 - }, - { - "epoch": 1.36, - "learning_rate": 1.1963385472424651e-06, - "loss": 0.5693, - "step": 53138 - }, - { - "epoch": 1.36, - "learning_rate": 1.196311415286501e-06, - "loss": 0.5659, - "step": 53139 - }, - { - "epoch": 1.36, - "learning_rate": 1.1962842831802301e-06, - "loss": 0.6211, - "step": 53140 - }, - { - "epoch": 1.36, - "learning_rate": 1.1962571509236738e-06, - "loss": 0.7188, - "step": 53141 - }, - { - "epoch": 1.36, - "learning_rate": 1.1962300185168524e-06, - "loss": 0.6904, - "step": 53142 - }, - { - "epoch": 1.36, - "learning_rate": 1.1962028859597864e-06, - "loss": 0.6992, - "step": 53143 - }, - { - "epoch": 1.36, - "learning_rate": 1.196175753252497e-06, - "loss": 0.6631, - "step": 53144 - }, - { - "epoch": 1.36, - "learning_rate": 1.1961486203950045e-06, - "loss": 0.5298, - "step": 53145 - }, - { - "epoch": 1.36, - "learning_rate": 1.1961214873873304e-06, - "loss": 0.6768, - "step": 53146 - }, - { - "epoch": 1.36, - "learning_rate": 1.1960943542294952e-06, - "loss": 0.6377, - "step": 53147 - }, - { - "epoch": 1.36, - "learning_rate": 1.1960672209215195e-06, - "loss": 0.7256, - "step": 53148 - }, - { - "epoch": 1.36, - "learning_rate": 1.196040087463424e-06, - "loss": 0.7188, - "step": 53149 - }, - { - "epoch": 1.36, - "learning_rate": 1.1960129538552296e-06, - "loss": 0.6943, - "step": 53150 - }, - { - "epoch": 1.36, - "learning_rate": 1.195985820096957e-06, - "loss": 0.6665, - "step": 53151 - }, - { - "epoch": 1.36, - "learning_rate": 1.1959586861886276e-06, - "loss": 0.7266, - "step": 53152 - }, - { - "epoch": 1.36, - "learning_rate": 1.1959315521302611e-06, - "loss": 0.7061, - "step": 53153 - }, - { - "epoch": 1.36, - "learning_rate": 1.1959044179218792e-06, - "loss": 0.7598, - "step": 53154 - }, - { - "epoch": 1.36, - "learning_rate": 1.1958772835635017e-06, - "loss": 0.6816, - "step": 53155 - }, - { - "epoch": 1.36, - "learning_rate": 1.1958501490551505e-06, - "loss": 0.5848, - "step": 53156 - }, - { - "epoch": 1.36, - "learning_rate": 1.1958230143968458e-06, - "loss": 0.6973, - "step": 53157 - }, - { - "epoch": 1.36, - "learning_rate": 1.1957958795886085e-06, - "loss": 0.9038, - "step": 53158 - }, - { - "epoch": 1.36, - "learning_rate": 1.1957687446304589e-06, - "loss": 0.5923, - "step": 53159 - }, - { - "epoch": 1.36, - "learning_rate": 1.1957416095224185e-06, - "loss": 0.7295, - "step": 53160 - }, - { - "epoch": 1.36, - "learning_rate": 1.1957144742645075e-06, - "loss": 0.6738, - "step": 53161 - }, - { - "epoch": 1.36, - "learning_rate": 1.1956873388567472e-06, - "loss": 0.6992, - "step": 53162 - }, - { - "epoch": 1.36, - "learning_rate": 1.195660203299158e-06, - "loss": 0.5942, - "step": 53163 - }, - { - "epoch": 1.36, - "learning_rate": 1.1956330675917605e-06, - "loss": 0.5771, - "step": 53164 - }, - { - "epoch": 1.36, - "learning_rate": 1.195605931734576e-06, - "loss": 0.7314, - "step": 53165 - }, - { - "epoch": 1.36, - "learning_rate": 1.1955787957276251e-06, - "loss": 0.7373, - "step": 53166 - }, - { - "epoch": 1.36, - "learning_rate": 1.1955516595709287e-06, - "loss": 0.5996, - "step": 53167 - }, - { - "epoch": 1.36, - "learning_rate": 1.195524523264507e-06, - "loss": 0.6313, - "step": 53168 - }, - { - "epoch": 1.36, - "learning_rate": 1.1954973868083812e-06, - "loss": 0.5063, - "step": 53169 - }, - { - "epoch": 1.36, - "learning_rate": 1.1954702502025723e-06, - "loss": 0.7671, - "step": 53170 - }, - { - "epoch": 1.36, - "learning_rate": 1.1954431134471007e-06, - "loss": 0.5225, - "step": 53171 - }, - { - "epoch": 1.36, - "learning_rate": 1.1954159765419873e-06, - "loss": 0.6885, - "step": 53172 - }, - { - "epoch": 1.36, - "learning_rate": 1.1953888394872528e-06, - "loss": 0.6641, - "step": 53173 - }, - { - "epoch": 1.36, - "learning_rate": 1.1953617022829181e-06, - "loss": 0.3948, - "step": 53174 - }, - { - "epoch": 1.36, - "learning_rate": 1.195334564929004e-06, - "loss": 0.7246, - "step": 53175 - }, - { - "epoch": 1.36, - "learning_rate": 1.1953074274255309e-06, - "loss": 0.4675, - "step": 53176 - }, - { - "epoch": 1.36, - "learning_rate": 1.1952802897725203e-06, - "loss": 0.4858, - "step": 53177 - }, - { - "epoch": 1.36, - "learning_rate": 1.1952531519699923e-06, - "loss": 0.7358, - "step": 53178 - }, - { - "epoch": 1.36, - "learning_rate": 1.195226014017968e-06, - "loss": 0.7563, - "step": 53179 - }, - { - "epoch": 1.36, - "learning_rate": 1.195198875916468e-06, - "loss": 0.6201, - "step": 53180 - }, - { - "epoch": 1.36, - "learning_rate": 1.1951717376655132e-06, - "loss": 0.6494, - "step": 53181 - }, - { - "epoch": 1.36, - "learning_rate": 1.1951445992651248e-06, - "loss": 0.708, - "step": 53182 - }, - { - "epoch": 1.36, - "learning_rate": 1.1951174607153227e-06, - "loss": 0.6602, - "step": 53183 - }, - { - "epoch": 1.36, - "learning_rate": 1.1950903220161284e-06, - "loss": 0.5996, - "step": 53184 - }, - { - "epoch": 1.36, - "learning_rate": 1.1950631831675621e-06, - "loss": 0.5674, - "step": 53185 - }, - { - "epoch": 1.36, - "learning_rate": 1.195036044169645e-06, - "loss": 0.7412, - "step": 53186 - }, - { - "epoch": 1.36, - "learning_rate": 1.1950089050223979e-06, - "loss": 0.6277, - "step": 53187 - }, - { - "epoch": 1.36, - "learning_rate": 1.1949817657258416e-06, - "loss": 0.6377, - "step": 53188 - }, - { - "epoch": 1.36, - "learning_rate": 1.1949546262799964e-06, - "loss": 0.5037, - "step": 53189 - }, - { - "epoch": 1.36, - "learning_rate": 1.1949274866848835e-06, - "loss": 0.6533, - "step": 53190 - }, - { - "epoch": 1.36, - "learning_rate": 1.1949003469405235e-06, - "loss": 0.7773, - "step": 53191 - }, - { - "epoch": 1.36, - "learning_rate": 1.1948732070469376e-06, - "loss": 0.5015, - "step": 53192 - }, - { - "epoch": 1.36, - "learning_rate": 1.1948460670041457e-06, - "loss": 0.6533, - "step": 53193 - }, - { - "epoch": 1.36, - "learning_rate": 1.1948189268121697e-06, - "loss": 0.6089, - "step": 53194 - }, - { - "epoch": 1.36, - "learning_rate": 1.1947917864710296e-06, - "loss": 0.5381, - "step": 53195 - }, - { - "epoch": 1.36, - "learning_rate": 1.1947646459807464e-06, - "loss": 0.7314, - "step": 53196 - }, - { - "epoch": 1.36, - "learning_rate": 1.1947375053413407e-06, - "loss": 0.7192, - "step": 53197 - }, - { - "epoch": 1.36, - "learning_rate": 1.1947103645528335e-06, - "loss": 0.5615, - "step": 53198 - }, - { - "epoch": 1.36, - "learning_rate": 1.1946832236152456e-06, - "loss": 0.6221, - "step": 53199 - }, - { - "epoch": 1.36, - "learning_rate": 1.1946560825285976e-06, - "loss": 0.4744, - "step": 53200 - }, - { - "epoch": 1.36, - "learning_rate": 1.1946289412929106e-06, - "loss": 0.6709, - "step": 53201 - }, - { - "epoch": 1.36, - "learning_rate": 1.1946017999082053e-06, - "loss": 0.5996, - "step": 53202 - }, - { - "epoch": 1.36, - "learning_rate": 1.1945746583745018e-06, - "loss": 0.4644, - "step": 53203 - }, - { - "epoch": 1.36, - "learning_rate": 1.1945475166918217e-06, - "loss": 0.5981, - "step": 53204 - }, - { - "epoch": 1.36, - "learning_rate": 1.1945203748601856e-06, - "loss": 0.7217, - "step": 53205 - }, - { - "epoch": 1.36, - "learning_rate": 1.194493232879614e-06, - "loss": 0.5337, - "step": 53206 - }, - { - "epoch": 1.36, - "learning_rate": 1.1944660907501281e-06, - "loss": 0.9414, - "step": 53207 - }, - { - "epoch": 1.36, - "learning_rate": 1.1944389484717482e-06, - "loss": 0.5117, - "step": 53208 - }, - { - "epoch": 1.36, - "learning_rate": 1.1944118060444957e-06, - "loss": 0.5406, - "step": 53209 - }, - { - "epoch": 1.36, - "learning_rate": 1.1943846634683907e-06, - "loss": 0.6943, - "step": 53210 - }, - { - "epoch": 1.36, - "learning_rate": 1.1943575207434544e-06, - "loss": 0.6826, - "step": 53211 - }, - { - "epoch": 1.36, - "learning_rate": 1.1943303778697075e-06, - "loss": 0.5552, - "step": 53212 - }, - { - "epoch": 1.36, - "learning_rate": 1.1943032348471708e-06, - "loss": 0.6943, - "step": 53213 - }, - { - "epoch": 1.36, - "learning_rate": 1.1942760916758649e-06, - "loss": 0.6699, - "step": 53214 - }, - { - "epoch": 1.36, - "learning_rate": 1.1942489483558108e-06, - "loss": 0.7607, - "step": 53215 - }, - { - "epoch": 1.36, - "learning_rate": 1.1942218048870295e-06, - "loss": 0.7412, - "step": 53216 - }, - { - "epoch": 1.36, - "learning_rate": 1.1941946612695413e-06, - "loss": 0.5664, - "step": 53217 - }, - { - "epoch": 1.36, - "learning_rate": 1.194167517503367e-06, - "loss": 0.6758, - "step": 53218 - }, - { - "epoch": 1.36, - "learning_rate": 1.1941403735885278e-06, - "loss": 0.4351, - "step": 53219 - }, - { - "epoch": 1.36, - "learning_rate": 1.194113229525044e-06, - "loss": 0.4722, - "step": 53220 - }, - { - "epoch": 1.36, - "learning_rate": 1.194086085312937e-06, - "loss": 0.6252, - "step": 53221 - }, - { - "epoch": 1.36, - "learning_rate": 1.1940589409522269e-06, - "loss": 0.6572, - "step": 53222 - }, - { - "epoch": 1.36, - "learning_rate": 1.194031796442935e-06, - "loss": 0.7656, - "step": 53223 - }, - { - "epoch": 1.36, - "learning_rate": 1.1940046517850815e-06, - "loss": 0.5815, - "step": 53224 - }, - { - "epoch": 1.36, - "learning_rate": 1.1939775069786878e-06, - "loss": 0.707, - "step": 53225 - }, - { - "epoch": 1.36, - "learning_rate": 1.1939503620237744e-06, - "loss": 0.6841, - "step": 53226 - }, - { - "epoch": 1.36, - "learning_rate": 1.1939232169203621e-06, - "loss": 0.7773, - "step": 53227 - }, - { - "epoch": 1.36, - "learning_rate": 1.1938960716684718e-06, - "loss": 0.6772, - "step": 53228 - }, - { - "epoch": 1.36, - "learning_rate": 1.193868926268124e-06, - "loss": 0.6543, - "step": 53229 - }, - { - "epoch": 1.36, - "learning_rate": 1.19384178071934e-06, - "loss": 0.6538, - "step": 53230 - }, - { - "epoch": 1.36, - "learning_rate": 1.1938146350221401e-06, - "loss": 0.7305, - "step": 53231 - }, - { - "epoch": 1.36, - "learning_rate": 1.1937874891765453e-06, - "loss": 0.6855, - "step": 53232 - }, - { - "epoch": 1.36, - "learning_rate": 1.1937603431825762e-06, - "loss": 0.5825, - "step": 53233 - }, - { - "epoch": 1.36, - "learning_rate": 1.1937331970402537e-06, - "loss": 0.6211, - "step": 53234 - }, - { - "epoch": 1.36, - "learning_rate": 1.1937060507495986e-06, - "loss": 0.6826, - "step": 53235 - }, - { - "epoch": 1.36, - "learning_rate": 1.193678904310632e-06, - "loss": 0.7959, - "step": 53236 - }, - { - "epoch": 1.36, - "learning_rate": 1.1936517577233743e-06, - "loss": 0.7632, - "step": 53237 - }, - { - "epoch": 1.36, - "learning_rate": 1.193624610987846e-06, - "loss": 0.6826, - "step": 53238 - }, - { - "epoch": 1.36, - "learning_rate": 1.1935974641040684e-06, - "loss": 0.5571, - "step": 53239 - }, - { - "epoch": 1.36, - "learning_rate": 1.1935703170720623e-06, - "loss": 0.4951, - "step": 53240 - }, - { - "epoch": 1.36, - "learning_rate": 1.1935431698918479e-06, - "loss": 0.7461, - "step": 53241 - }, - { - "epoch": 1.36, - "learning_rate": 1.1935160225634471e-06, - "loss": 0.6152, - "step": 53242 - }, - { - "epoch": 1.36, - "learning_rate": 1.1934888750868792e-06, - "loss": 0.6548, - "step": 53243 - }, - { - "epoch": 1.36, - "learning_rate": 1.1934617274621664e-06, - "loss": 0.6904, - "step": 53244 - }, - { - "epoch": 1.36, - "learning_rate": 1.1934345796893284e-06, - "loss": 0.6162, - "step": 53245 - }, - { - "epoch": 1.36, - "learning_rate": 1.1934074317683866e-06, - "loss": 0.5151, - "step": 53246 - }, - { - "epoch": 1.36, - "learning_rate": 1.1933802836993617e-06, - "loss": 0.6084, - "step": 53247 - }, - { - "epoch": 1.36, - "learning_rate": 1.1933531354822743e-06, - "loss": 0.5518, - "step": 53248 - }, - { - "epoch": 1.36, - "learning_rate": 1.1933259871171453e-06, - "loss": 0.7607, - "step": 53249 - }, - { - "epoch": 1.36, - "learning_rate": 1.1932988386039956e-06, - "loss": 0.4438, - "step": 53250 - }, - { - "epoch": 1.36, - "learning_rate": 1.1932716899428455e-06, - "loss": 0.4241, - "step": 53251 - }, - { - "epoch": 1.36, - "learning_rate": 1.1932445411337164e-06, - "loss": 0.5088, - "step": 53252 - }, - { - "epoch": 1.36, - "learning_rate": 1.193217392176629e-06, - "loss": 0.9141, - "step": 53253 - }, - { - "epoch": 1.36, - "learning_rate": 1.1931902430716037e-06, - "loss": 0.6943, - "step": 53254 - }, - { - "epoch": 1.36, - "learning_rate": 1.1931630938186617e-06, - "loss": 0.7109, - "step": 53255 - }, - { - "epoch": 1.36, - "learning_rate": 1.1931359444178234e-06, - "loss": 0.5718, - "step": 53256 - }, - { - "epoch": 1.37, - "learning_rate": 1.19310879486911e-06, - "loss": 0.7998, - "step": 53257 - }, - { - "epoch": 1.37, - "learning_rate": 1.1930816451725417e-06, - "loss": 0.5977, - "step": 53258 - }, - { - "epoch": 1.37, - "learning_rate": 1.1930544953281402e-06, - "loss": 0.7725, - "step": 53259 - }, - { - "epoch": 1.37, - "learning_rate": 1.1930273453359255e-06, - "loss": 0.5359, - "step": 53260 - }, - { - "epoch": 1.37, - "learning_rate": 1.1930001951959185e-06, - "loss": 0.4628, - "step": 53261 - }, - { - "epoch": 1.37, - "learning_rate": 1.1929730449081403e-06, - "loss": 0.4663, - "step": 53262 - }, - { - "epoch": 1.37, - "learning_rate": 1.1929458944726116e-06, - "loss": 0.6816, - "step": 53263 - }, - { - "epoch": 1.37, - "learning_rate": 1.1929187438893528e-06, - "loss": 0.6492, - "step": 53264 - }, - { - "epoch": 1.37, - "learning_rate": 1.1928915931583851e-06, - "loss": 0.6426, - "step": 53265 - }, - { - "epoch": 1.37, - "learning_rate": 1.192864442279729e-06, - "loss": 0.6323, - "step": 53266 - }, - { - "epoch": 1.37, - "learning_rate": 1.192837291253406e-06, - "loss": 0.7749, - "step": 53267 - }, - { - "epoch": 1.37, - "learning_rate": 1.1928101400794362e-06, - "loss": 0.752, - "step": 53268 - }, - { - "epoch": 1.37, - "learning_rate": 1.1927829887578403e-06, - "loss": 0.5405, - "step": 53269 - }, - { - "epoch": 1.37, - "learning_rate": 1.1927558372886392e-06, - "loss": 0.7607, - "step": 53270 - }, - { - "epoch": 1.37, - "learning_rate": 1.192728685671854e-06, - "loss": 0.7227, - "step": 53271 - }, - { - "epoch": 1.37, - "learning_rate": 1.1927015339075056e-06, - "loss": 0.6895, - "step": 53272 - }, - { - "epoch": 1.37, - "learning_rate": 1.192674381995614e-06, - "loss": 0.5159, - "step": 53273 - }, - { - "epoch": 1.37, - "learning_rate": 1.1926472299362009e-06, - "loss": 0.7324, - "step": 53274 - }, - { - "epoch": 1.37, - "learning_rate": 1.1926200777292866e-06, - "loss": 0.5671, - "step": 53275 - }, - { - "epoch": 1.37, - "learning_rate": 1.1925929253748916e-06, - "loss": 0.6626, - "step": 53276 - }, - { - "epoch": 1.37, - "learning_rate": 1.1925657728730374e-06, - "loss": 0.4912, - "step": 53277 - }, - { - "epoch": 1.37, - "learning_rate": 1.1925386202237443e-06, - "loss": 0.5244, - "step": 53278 - }, - { - "epoch": 1.37, - "learning_rate": 1.1925114674270331e-06, - "loss": 0.7729, - "step": 53279 - }, - { - "epoch": 1.37, - "learning_rate": 1.1924843144829251e-06, - "loss": 0.6543, - "step": 53280 - }, - { - "epoch": 1.37, - "learning_rate": 1.1924571613914403e-06, - "loss": 0.6885, - "step": 53281 - }, - { - "epoch": 1.37, - "learning_rate": 1.1924300081526004e-06, - "loss": 0.4902, - "step": 53282 - }, - { - "epoch": 1.37, - "learning_rate": 1.1924028547664253e-06, - "loss": 0.3378, - "step": 53283 - }, - { - "epoch": 1.37, - "learning_rate": 1.1923757012329362e-06, - "loss": 0.7354, - "step": 53284 - }, - { - "epoch": 1.37, - "learning_rate": 1.192348547552154e-06, - "loss": 0.8594, - "step": 53285 - }, - { - "epoch": 1.37, - "learning_rate": 1.1923213937240995e-06, - "loss": 0.5061, - "step": 53286 - }, - { - "epoch": 1.37, - "learning_rate": 1.1922942397487932e-06, - "loss": 0.5928, - "step": 53287 - }, - { - "epoch": 1.37, - "learning_rate": 1.192267085626256e-06, - "loss": 0.6157, - "step": 53288 - }, - { - "epoch": 1.37, - "learning_rate": 1.1922399313565087e-06, - "loss": 0.6411, - "step": 53289 - }, - { - "epoch": 1.37, - "learning_rate": 1.1922127769395723e-06, - "loss": 0.7285, - "step": 53290 - }, - { - "epoch": 1.37, - "learning_rate": 1.192185622375467e-06, - "loss": 0.8135, - "step": 53291 - }, - { - "epoch": 1.37, - "learning_rate": 1.1921584676642144e-06, - "loss": 0.4991, - "step": 53292 - }, - { - "epoch": 1.37, - "learning_rate": 1.1921313128058348e-06, - "loss": 0.7314, - "step": 53293 - }, - { - "epoch": 1.37, - "learning_rate": 1.1921041578003493e-06, - "loss": 0.5481, - "step": 53294 - }, - { - "epoch": 1.37, - "learning_rate": 1.192077002647778e-06, - "loss": 0.6992, - "step": 53295 - }, - { - "epoch": 1.37, - "learning_rate": 1.1920498473481425e-06, - "loss": 0.5115, - "step": 53296 - }, - { - "epoch": 1.37, - "learning_rate": 1.1920226919014633e-06, - "loss": 0.7979, - "step": 53297 - }, - { - "epoch": 1.37, - "learning_rate": 1.1919955363077608e-06, - "loss": 0.5957, - "step": 53298 - }, - { - "epoch": 1.37, - "learning_rate": 1.1919683805670566e-06, - "loss": 0.8184, - "step": 53299 - }, - { - "epoch": 1.37, - "learning_rate": 1.1919412246793706e-06, - "loss": 0.6562, - "step": 53300 - }, - { - "epoch": 1.37, - "learning_rate": 1.1919140686447242e-06, - "loss": 0.6211, - "step": 53301 - }, - { - "epoch": 1.37, - "learning_rate": 1.1918869124631383e-06, - "loss": 0.8662, - "step": 53302 - }, - { - "epoch": 1.37, - "learning_rate": 1.1918597561346332e-06, - "loss": 0.7695, - "step": 53303 - }, - { - "epoch": 1.37, - "learning_rate": 1.1918325996592298e-06, - "loss": 0.791, - "step": 53304 - }, - { - "epoch": 1.37, - "learning_rate": 1.1918054430369492e-06, - "loss": 0.6416, - "step": 53305 - }, - { - "epoch": 1.37, - "learning_rate": 1.1917782862678117e-06, - "loss": 0.5977, - "step": 53306 - }, - { - "epoch": 1.37, - "learning_rate": 1.1917511293518389e-06, - "loss": 0.5016, - "step": 53307 - }, - { - "epoch": 1.37, - "learning_rate": 1.1917239722890507e-06, - "loss": 0.7861, - "step": 53308 - }, - { - "epoch": 1.37, - "learning_rate": 1.1916968150794682e-06, - "loss": 0.7188, - "step": 53309 - }, - { - "epoch": 1.37, - "learning_rate": 1.1916696577231121e-06, - "loss": 0.8291, - "step": 53310 - }, - { - "epoch": 1.37, - "learning_rate": 1.1916425002200038e-06, - "loss": 0.6084, - "step": 53311 - }, - { - "epoch": 1.37, - "learning_rate": 1.1916153425701636e-06, - "loss": 0.7588, - "step": 53312 - }, - { - "epoch": 1.37, - "learning_rate": 1.1915881847736124e-06, - "loss": 0.6875, - "step": 53313 - }, - { - "epoch": 1.37, - "learning_rate": 1.1915610268303706e-06, - "loss": 0.6221, - "step": 53314 - }, - { - "epoch": 1.37, - "learning_rate": 1.1915338687404597e-06, - "loss": 0.5605, - "step": 53315 - }, - { - "epoch": 1.37, - "learning_rate": 1.1915067105038996e-06, - "loss": 0.7109, - "step": 53316 - }, - { - "epoch": 1.37, - "learning_rate": 1.191479552120712e-06, - "loss": 0.5363, - "step": 53317 - }, - { - "epoch": 1.37, - "learning_rate": 1.1914523935909172e-06, - "loss": 0.5724, - "step": 53318 - }, - { - "epoch": 1.37, - "learning_rate": 1.1914252349145362e-06, - "loss": 0.6631, - "step": 53319 - }, - { - "epoch": 1.37, - "learning_rate": 1.1913980760915898e-06, - "loss": 0.665, - "step": 53320 - }, - { - "epoch": 1.37, - "learning_rate": 1.1913709171220985e-06, - "loss": 0.6533, - "step": 53321 - }, - { - "epoch": 1.37, - "learning_rate": 1.1913437580060834e-06, - "loss": 0.5752, - "step": 53322 - }, - { - "epoch": 1.37, - "learning_rate": 1.191316598743565e-06, - "loss": 0.4548, - "step": 53323 - }, - { - "epoch": 1.37, - "learning_rate": 1.1912894393345645e-06, - "loss": 0.4397, - "step": 53324 - }, - { - "epoch": 1.37, - "learning_rate": 1.1912622797791024e-06, - "loss": 0.6812, - "step": 53325 - }, - { - "epoch": 1.37, - "learning_rate": 1.1912351200771995e-06, - "loss": 0.7725, - "step": 53326 - }, - { - "epoch": 1.37, - "learning_rate": 1.1912079602288768e-06, - "loss": 0.6733, - "step": 53327 - }, - { - "epoch": 1.37, - "learning_rate": 1.1911808002341548e-06, - "loss": 0.6826, - "step": 53328 - }, - { - "epoch": 1.37, - "learning_rate": 1.1911536400930545e-06, - "loss": 0.5249, - "step": 53329 - }, - { - "epoch": 1.37, - "learning_rate": 1.1911264798055967e-06, - "loss": 0.6455, - "step": 53330 - }, - { - "epoch": 1.37, - "learning_rate": 1.191099319371802e-06, - "loss": 0.6174, - "step": 53331 - }, - { - "epoch": 1.37, - "learning_rate": 1.1910721587916916e-06, - "loss": 0.6555, - "step": 53332 - }, - { - "epoch": 1.37, - "learning_rate": 1.1910449980652858e-06, - "loss": 0.5996, - "step": 53333 - }, - { - "epoch": 1.37, - "learning_rate": 1.1910178371926059e-06, - "loss": 0.6914, - "step": 53334 - }, - { - "epoch": 1.37, - "learning_rate": 1.1909906761736718e-06, - "loss": 0.4974, - "step": 53335 - }, - { - "epoch": 1.37, - "learning_rate": 1.1909635150085055e-06, - "loss": 0.7676, - "step": 53336 - }, - { - "epoch": 1.37, - "learning_rate": 1.1909363536971271e-06, - "loss": 0.5776, - "step": 53337 - }, - { - "epoch": 1.37, - "learning_rate": 1.1909091922395576e-06, - "loss": 0.7446, - "step": 53338 - }, - { - "epoch": 1.37, - "learning_rate": 1.1908820306358174e-06, - "loss": 0.5693, - "step": 53339 - }, - { - "epoch": 1.37, - "learning_rate": 1.190854868885928e-06, - "loss": 0.6616, - "step": 53340 - }, - { - "epoch": 1.37, - "learning_rate": 1.1908277069899094e-06, - "loss": 0.5298, - "step": 53341 - }, - { - "epoch": 1.37, - "learning_rate": 1.1908005449477832e-06, - "loss": 0.5352, - "step": 53342 - }, - { - "epoch": 1.37, - "learning_rate": 1.1907733827595695e-06, - "loss": 0.7842, - "step": 53343 - }, - { - "epoch": 1.37, - "learning_rate": 1.1907462204252894e-06, - "loss": 0.665, - "step": 53344 - }, - { - "epoch": 1.37, - "learning_rate": 1.1907190579449638e-06, - "loss": 0.6328, - "step": 53345 - }, - { - "epoch": 1.37, - "learning_rate": 1.1906918953186134e-06, - "loss": 0.5237, - "step": 53346 - }, - { - "epoch": 1.37, - "learning_rate": 1.190664732546259e-06, - "loss": 0.5065, - "step": 53347 - }, - { - "epoch": 1.37, - "learning_rate": 1.190637569627921e-06, - "loss": 0.6523, - "step": 53348 - }, - { - "epoch": 1.37, - "learning_rate": 1.1906104065636212e-06, - "loss": 0.6426, - "step": 53349 - }, - { - "epoch": 1.37, - "learning_rate": 1.1905832433533794e-06, - "loss": 0.8516, - "step": 53350 - }, - { - "epoch": 1.37, - "learning_rate": 1.1905560799972173e-06, - "loss": 0.6914, - "step": 53351 - }, - { - "epoch": 1.37, - "learning_rate": 1.1905289164951544e-06, - "loss": 0.4146, - "step": 53352 - }, - { - "epoch": 1.37, - "learning_rate": 1.1905017528472126e-06, - "loss": 0.6782, - "step": 53353 - }, - { - "epoch": 1.37, - "learning_rate": 1.1904745890534123e-06, - "loss": 0.8125, - "step": 53354 - }, - { - "epoch": 1.37, - "learning_rate": 1.1904474251137744e-06, - "loss": 0.6299, - "step": 53355 - }, - { - "epoch": 1.37, - "learning_rate": 1.1904202610283199e-06, - "loss": 0.6602, - "step": 53356 - }, - { - "epoch": 1.37, - "learning_rate": 1.1903930967970692e-06, - "loss": 0.6548, - "step": 53357 - }, - { - "epoch": 1.37, - "learning_rate": 1.190365932420043e-06, - "loss": 0.8623, - "step": 53358 - }, - { - "epoch": 1.37, - "learning_rate": 1.1903387678972628e-06, - "loss": 0.7891, - "step": 53359 - }, - { - "epoch": 1.37, - "learning_rate": 1.1903116032287484e-06, - "loss": 0.6973, - "step": 53360 - }, - { - "epoch": 1.37, - "learning_rate": 1.1902844384145216e-06, - "loss": 0.6188, - "step": 53361 - }, - { - "epoch": 1.37, - "learning_rate": 1.1902572734546028e-06, - "loss": 0.6758, - "step": 53362 - }, - { - "epoch": 1.37, - "learning_rate": 1.1902301083490123e-06, - "loss": 0.6416, - "step": 53363 - }, - { - "epoch": 1.37, - "learning_rate": 1.1902029430977718e-06, - "loss": 0.6631, - "step": 53364 - }, - { - "epoch": 1.37, - "learning_rate": 1.1901757777009015e-06, - "loss": 0.7734, - "step": 53365 - }, - { - "epoch": 1.37, - "learning_rate": 1.1901486121584225e-06, - "loss": 0.688, - "step": 53366 - }, - { - "epoch": 1.37, - "learning_rate": 1.190121446470355e-06, - "loss": 0.6904, - "step": 53367 - }, - { - "epoch": 1.37, - "learning_rate": 1.1900942806367206e-06, - "loss": 0.605, - "step": 53368 - }, - { - "epoch": 1.37, - "learning_rate": 1.1900671146575396e-06, - "loss": 0.6143, - "step": 53369 - }, - { - "epoch": 1.37, - "learning_rate": 1.1900399485328332e-06, - "loss": 0.5825, - "step": 53370 - }, - { - "epoch": 1.37, - "learning_rate": 1.190012782262622e-06, - "loss": 0.5605, - "step": 53371 - }, - { - "epoch": 1.37, - "learning_rate": 1.1899856158469265e-06, - "loss": 0.8369, - "step": 53372 - }, - { - "epoch": 1.37, - "learning_rate": 1.1899584492857677e-06, - "loss": 0.7158, - "step": 53373 - }, - { - "epoch": 1.37, - "learning_rate": 1.1899312825791666e-06, - "loss": 0.6541, - "step": 53374 - }, - { - "epoch": 1.37, - "learning_rate": 1.1899041157271437e-06, - "loss": 0.7188, - "step": 53375 - }, - { - "epoch": 1.37, - "learning_rate": 1.1898769487297202e-06, - "loss": 0.6743, - "step": 53376 - }, - { - "epoch": 1.37, - "learning_rate": 1.1898497815869164e-06, - "loss": 0.6519, - "step": 53377 - }, - { - "epoch": 1.37, - "learning_rate": 1.1898226142987535e-06, - "loss": 0.6426, - "step": 53378 - }, - { - "epoch": 1.37, - "learning_rate": 1.189795446865252e-06, - "loss": 0.7227, - "step": 53379 - }, - { - "epoch": 1.37, - "learning_rate": 1.1897682792864331e-06, - "loss": 0.6211, - "step": 53380 - }, - { - "epoch": 1.37, - "learning_rate": 1.1897411115623172e-06, - "loss": 0.6421, - "step": 53381 - }, - { - "epoch": 1.37, - "learning_rate": 1.1897139436929253e-06, - "loss": 0.7998, - "step": 53382 - }, - { - "epoch": 1.37, - "learning_rate": 1.189686775678278e-06, - "loss": 0.7715, - "step": 53383 - }, - { - "epoch": 1.37, - "learning_rate": 1.1896596075183966e-06, - "loss": 0.6204, - "step": 53384 - }, - { - "epoch": 1.37, - "learning_rate": 1.1896324392133012e-06, - "loss": 0.6125, - "step": 53385 - }, - { - "epoch": 1.37, - "learning_rate": 1.189605270763013e-06, - "loss": 0.4751, - "step": 53386 - }, - { - "epoch": 1.37, - "learning_rate": 1.189578102167553e-06, - "loss": 0.584, - "step": 53387 - }, - { - "epoch": 1.37, - "learning_rate": 1.1895509334269417e-06, - "loss": 0.5186, - "step": 53388 - }, - { - "epoch": 1.37, - "learning_rate": 1.1895237645411999e-06, - "loss": 0.488, - "step": 53389 - }, - { - "epoch": 1.37, - "learning_rate": 1.1894965955103482e-06, - "loss": 0.6299, - "step": 53390 - }, - { - "epoch": 1.37, - "learning_rate": 1.1894694263344082e-06, - "loss": 0.5371, - "step": 53391 - }, - { - "epoch": 1.37, - "learning_rate": 1.1894422570134e-06, - "loss": 0.655, - "step": 53392 - }, - { - "epoch": 1.37, - "learning_rate": 1.1894150875473444e-06, - "loss": 0.6943, - "step": 53393 - }, - { - "epoch": 1.37, - "learning_rate": 1.1893879179362623e-06, - "loss": 0.5054, - "step": 53394 - }, - { - "epoch": 1.37, - "learning_rate": 1.1893607481801748e-06, - "loss": 0.5991, - "step": 53395 - }, - { - "epoch": 1.37, - "learning_rate": 1.1893335782791025e-06, - "loss": 0.729, - "step": 53396 - }, - { - "epoch": 1.37, - "learning_rate": 1.1893064082330661e-06, - "loss": 0.7368, - "step": 53397 - }, - { - "epoch": 1.37, - "learning_rate": 1.1892792380420864e-06, - "loss": 0.5798, - "step": 53398 - }, - { - "epoch": 1.37, - "learning_rate": 1.1892520677061846e-06, - "loss": 0.5894, - "step": 53399 - }, - { - "epoch": 1.37, - "learning_rate": 1.1892248972253808e-06, - "loss": 0.4562, - "step": 53400 - }, - { - "epoch": 1.37, - "learning_rate": 1.1891977265996966e-06, - "loss": 0.4027, - "step": 53401 - }, - { - "epoch": 1.37, - "learning_rate": 1.189170555829152e-06, - "loss": 0.5854, - "step": 53402 - }, - { - "epoch": 1.37, - "learning_rate": 1.1891433849137684e-06, - "loss": 0.5479, - "step": 53403 - }, - { - "epoch": 1.37, - "learning_rate": 1.1891162138535663e-06, - "loss": 0.6367, - "step": 53404 - }, - { - "epoch": 1.37, - "learning_rate": 1.1890890426485668e-06, - "loss": 0.7285, - "step": 53405 - }, - { - "epoch": 1.37, - "learning_rate": 1.1890618712987905e-06, - "loss": 0.6689, - "step": 53406 - }, - { - "epoch": 1.37, - "learning_rate": 1.189034699804258e-06, - "loss": 0.6602, - "step": 53407 - }, - { - "epoch": 1.37, - "learning_rate": 1.1890075281649905e-06, - "loss": 0.4929, - "step": 53408 - }, - { - "epoch": 1.37, - "learning_rate": 1.1889803563810086e-06, - "loss": 0.6406, - "step": 53409 - }, - { - "epoch": 1.37, - "learning_rate": 1.1889531844523331e-06, - "loss": 0.5864, - "step": 53410 - }, - { - "epoch": 1.37, - "learning_rate": 1.1889260123789849e-06, - "loss": 0.7549, - "step": 53411 - }, - { - "epoch": 1.37, - "learning_rate": 1.1888988401609847e-06, - "loss": 0.7065, - "step": 53412 - }, - { - "epoch": 1.37, - "learning_rate": 1.1888716677983533e-06, - "loss": 0.6914, - "step": 53413 - }, - { - "epoch": 1.37, - "learning_rate": 1.1888444952911116e-06, - "loss": 0.7456, - "step": 53414 - }, - { - "epoch": 1.37, - "learning_rate": 1.1888173226392802e-06, - "loss": 0.7197, - "step": 53415 - }, - { - "epoch": 1.37, - "learning_rate": 1.1887901498428805e-06, - "loss": 0.6416, - "step": 53416 - }, - { - "epoch": 1.37, - "learning_rate": 1.1887629769019322e-06, - "loss": 0.728, - "step": 53417 - }, - { - "epoch": 1.37, - "learning_rate": 1.1887358038164573e-06, - "loss": 0.7402, - "step": 53418 - }, - { - "epoch": 1.37, - "learning_rate": 1.1887086305864758e-06, - "loss": 0.5264, - "step": 53419 - }, - { - "epoch": 1.37, - "learning_rate": 1.1886814572120089e-06, - "loss": 0.6926, - "step": 53420 - }, - { - "epoch": 1.37, - "learning_rate": 1.1886542836930773e-06, - "loss": 0.7734, - "step": 53421 - }, - { - "epoch": 1.37, - "learning_rate": 1.1886271100297019e-06, - "loss": 0.6318, - "step": 53422 - }, - { - "epoch": 1.37, - "learning_rate": 1.188599936221903e-06, - "loss": 0.5325, - "step": 53423 - }, - { - "epoch": 1.37, - "learning_rate": 1.188572762269702e-06, - "loss": 0.6172, - "step": 53424 - }, - { - "epoch": 1.37, - "learning_rate": 1.1885455881731197e-06, - "loss": 0.7339, - "step": 53425 - }, - { - "epoch": 1.37, - "learning_rate": 1.1885184139321764e-06, - "loss": 0.7207, - "step": 53426 - }, - { - "epoch": 1.37, - "learning_rate": 1.1884912395468936e-06, - "loss": 0.8271, - "step": 53427 - }, - { - "epoch": 1.37, - "learning_rate": 1.1884640650172915e-06, - "loss": 0.7109, - "step": 53428 - }, - { - "epoch": 1.37, - "learning_rate": 1.188436890343391e-06, - "loss": 0.7119, - "step": 53429 - }, - { - "epoch": 1.37, - "learning_rate": 1.1884097155252133e-06, - "loss": 0.6816, - "step": 53430 - }, - { - "epoch": 1.37, - "learning_rate": 1.188382540562779e-06, - "loss": 0.5928, - "step": 53431 - }, - { - "epoch": 1.37, - "learning_rate": 1.1883553654561085e-06, - "loss": 0.6846, - "step": 53432 - }, - { - "epoch": 1.37, - "learning_rate": 1.188328190205223e-06, - "loss": 0.5356, - "step": 53433 - }, - { - "epoch": 1.37, - "learning_rate": 1.1883010148101434e-06, - "loss": 0.5117, - "step": 53434 - }, - { - "epoch": 1.37, - "learning_rate": 1.1882738392708904e-06, - "loss": 0.6382, - "step": 53435 - }, - { - "epoch": 1.37, - "learning_rate": 1.1882466635874848e-06, - "loss": 0.7344, - "step": 53436 - }, - { - "epoch": 1.37, - "learning_rate": 1.1882194877599473e-06, - "loss": 0.7314, - "step": 53437 - }, - { - "epoch": 1.37, - "learning_rate": 1.188192311788299e-06, - "loss": 0.5762, - "step": 53438 - }, - { - "epoch": 1.37, - "learning_rate": 1.1881651356725602e-06, - "loss": 0.7446, - "step": 53439 - }, - { - "epoch": 1.37, - "learning_rate": 1.1881379594127518e-06, - "loss": 0.5381, - "step": 53440 - }, - { - "epoch": 1.37, - "learning_rate": 1.1881107830088957e-06, - "loss": 0.7051, - "step": 53441 - }, - { - "epoch": 1.37, - "learning_rate": 1.188083606461011e-06, - "loss": 0.6313, - "step": 53442 - }, - { - "epoch": 1.37, - "learning_rate": 1.1880564297691196e-06, - "loss": 0.7939, - "step": 53443 - }, - { - "epoch": 1.37, - "learning_rate": 1.1880292529332422e-06, - "loss": 0.7041, - "step": 53444 - }, - { - "epoch": 1.37, - "learning_rate": 1.188002075953399e-06, - "loss": 0.752, - "step": 53445 - }, - { - "epoch": 1.37, - "learning_rate": 1.1879748988296117e-06, - "loss": 0.4944, - "step": 53446 - }, - { - "epoch": 1.37, - "learning_rate": 1.1879477215619008e-06, - "loss": 0.4282, - "step": 53447 - }, - { - "epoch": 1.37, - "learning_rate": 1.1879205441502862e-06, - "loss": 0.752, - "step": 53448 - }, - { - "epoch": 1.37, - "learning_rate": 1.18789336659479e-06, - "loss": 0.6094, - "step": 53449 - }, - { - "epoch": 1.37, - "learning_rate": 1.1878661888954325e-06, - "loss": 0.6099, - "step": 53450 - }, - { - "epoch": 1.37, - "learning_rate": 1.1878390110522344e-06, - "loss": 0.6335, - "step": 53451 - }, - { - "epoch": 1.37, - "learning_rate": 1.1878118330652168e-06, - "loss": 0.6313, - "step": 53452 - }, - { - "epoch": 1.37, - "learning_rate": 1.1877846549343998e-06, - "loss": 0.603, - "step": 53453 - }, - { - "epoch": 1.37, - "learning_rate": 1.1877574766598052e-06, - "loss": 0.8076, - "step": 53454 - }, - { - "epoch": 1.37, - "learning_rate": 1.1877302982414534e-06, - "loss": 0.6875, - "step": 53455 - }, - { - "epoch": 1.37, - "learning_rate": 1.187703119679365e-06, - "loss": 0.627, - "step": 53456 - }, - { - "epoch": 1.37, - "learning_rate": 1.1876759409735609e-06, - "loss": 0.8369, - "step": 53457 - }, - { - "epoch": 1.37, - "learning_rate": 1.1876487621240619e-06, - "loss": 0.5645, - "step": 53458 - }, - { - "epoch": 1.37, - "learning_rate": 1.187621583130889e-06, - "loss": 0.7598, - "step": 53459 - }, - { - "epoch": 1.37, - "learning_rate": 1.1875944039940628e-06, - "loss": 0.7188, - "step": 53460 - }, - { - "epoch": 1.37, - "learning_rate": 1.187567224713604e-06, - "loss": 0.7622, - "step": 53461 - }, - { - "epoch": 1.37, - "learning_rate": 1.187540045289534e-06, - "loss": 0.6953, - "step": 53462 - }, - { - "epoch": 1.37, - "learning_rate": 1.1875128657218729e-06, - "loss": 0.7764, - "step": 53463 - }, - { - "epoch": 1.37, - "learning_rate": 1.1874856860106421e-06, - "loss": 0.6516, - "step": 53464 - }, - { - "epoch": 1.37, - "learning_rate": 1.187458506155862e-06, - "loss": 0.5728, - "step": 53465 - }, - { - "epoch": 1.37, - "learning_rate": 1.1874313261575536e-06, - "loss": 0.4644, - "step": 53466 - }, - { - "epoch": 1.37, - "learning_rate": 1.1874041460157375e-06, - "loss": 0.6875, - "step": 53467 - }, - { - "epoch": 1.37, - "learning_rate": 1.1873769657304349e-06, - "loss": 0.6592, - "step": 53468 - }, - { - "epoch": 1.37, - "learning_rate": 1.187349785301666e-06, - "loss": 0.7812, - "step": 53469 - }, - { - "epoch": 1.37, - "learning_rate": 1.1873226047294522e-06, - "loss": 0.6357, - "step": 53470 - }, - { - "epoch": 1.37, - "learning_rate": 1.1872954240138142e-06, - "loss": 0.7197, - "step": 53471 - }, - { - "epoch": 1.37, - "learning_rate": 1.1872682431547728e-06, - "loss": 0.4937, - "step": 53472 - }, - { - "epoch": 1.37, - "learning_rate": 1.1872410621523483e-06, - "loss": 0.627, - "step": 53473 - }, - { - "epoch": 1.37, - "learning_rate": 1.187213881006562e-06, - "loss": 0.7051, - "step": 53474 - }, - { - "epoch": 1.37, - "learning_rate": 1.1871866997174348e-06, - "loss": 0.7676, - "step": 53475 - }, - { - "epoch": 1.37, - "learning_rate": 1.1871595182849874e-06, - "loss": 0.7124, - "step": 53476 - }, - { - "epoch": 1.37, - "learning_rate": 1.1871323367092406e-06, - "loss": 0.645, - "step": 53477 - }, - { - "epoch": 1.37, - "learning_rate": 1.1871051549902149e-06, - "loss": 0.6826, - "step": 53478 - }, - { - "epoch": 1.37, - "learning_rate": 1.1870779731279317e-06, - "loss": 0.5151, - "step": 53479 - }, - { - "epoch": 1.37, - "learning_rate": 1.187050791122411e-06, - "loss": 0.6279, - "step": 53480 - }, - { - "epoch": 1.37, - "learning_rate": 1.1870236089736749e-06, - "loss": 0.5801, - "step": 53481 - }, - { - "epoch": 1.37, - "learning_rate": 1.1869964266817427e-06, - "loss": 0.5334, - "step": 53482 - }, - { - "epoch": 1.37, - "learning_rate": 1.1869692442466364e-06, - "loss": 0.6367, - "step": 53483 - }, - { - "epoch": 1.37, - "learning_rate": 1.1869420616683761e-06, - "loss": 0.6152, - "step": 53484 - }, - { - "epoch": 1.37, - "learning_rate": 1.186914878946983e-06, - "loss": 0.677, - "step": 53485 - }, - { - "epoch": 1.37, - "learning_rate": 1.1868876960824776e-06, - "loss": 0.6011, - "step": 53486 - }, - { - "epoch": 1.37, - "learning_rate": 1.186860513074881e-06, - "loss": 0.5103, - "step": 53487 - }, - { - "epoch": 1.37, - "learning_rate": 1.1868333299242138e-06, - "loss": 0.6553, - "step": 53488 - }, - { - "epoch": 1.37, - "learning_rate": 1.186806146630497e-06, - "loss": 0.5991, - "step": 53489 - }, - { - "epoch": 1.37, - "learning_rate": 1.1867789631937512e-06, - "loss": 0.5139, - "step": 53490 - }, - { - "epoch": 1.37, - "learning_rate": 1.1867517796139978e-06, - "loss": 0.6294, - "step": 53491 - }, - { - "epoch": 1.37, - "learning_rate": 1.1867245958912567e-06, - "loss": 0.6938, - "step": 53492 - }, - { - "epoch": 1.37, - "learning_rate": 1.1866974120255492e-06, - "loss": 0.623, - "step": 53493 - }, - { - "epoch": 1.37, - "learning_rate": 1.1866702280168962e-06, - "loss": 0.6621, - "step": 53494 - }, - { - "epoch": 1.37, - "learning_rate": 1.1866430438653182e-06, - "loss": 0.6616, - "step": 53495 - }, - { - "epoch": 1.37, - "learning_rate": 1.1866158595708365e-06, - "loss": 0.6514, - "step": 53496 - }, - { - "epoch": 1.37, - "learning_rate": 1.1865886751334713e-06, - "loss": 0.5767, - "step": 53497 - }, - { - "epoch": 1.37, - "learning_rate": 1.1865614905532439e-06, - "loss": 0.6963, - "step": 53498 - }, - { - "epoch": 1.37, - "learning_rate": 1.186534305830175e-06, - "loss": 0.6604, - "step": 53499 - }, - { - "epoch": 1.37, - "learning_rate": 1.1865071209642852e-06, - "loss": 0.7012, - "step": 53500 - }, - { - "epoch": 1.37, - "learning_rate": 1.1864799359555954e-06, - "loss": 0.4697, - "step": 53501 - }, - { - "epoch": 1.37, - "learning_rate": 1.1864527508041268e-06, - "loss": 0.7607, - "step": 53502 - }, - { - "epoch": 1.37, - "learning_rate": 1.1864255655098995e-06, - "loss": 0.5383, - "step": 53503 - }, - { - "epoch": 1.37, - "learning_rate": 1.186398380072935e-06, - "loss": 0.585, - "step": 53504 - }, - { - "epoch": 1.37, - "learning_rate": 1.1863711944932536e-06, - "loss": 0.7104, - "step": 53505 - }, - { - "epoch": 1.37, - "learning_rate": 1.1863440087708772e-06, - "loss": 0.8164, - "step": 53506 - }, - { - "epoch": 1.37, - "learning_rate": 1.1863168229058249e-06, - "loss": 0.6133, - "step": 53507 - }, - { - "epoch": 1.37, - "learning_rate": 1.1862896368981186e-06, - "loss": 0.6787, - "step": 53508 - }, - { - "epoch": 1.37, - "learning_rate": 1.1862624507477788e-06, - "loss": 0.5513, - "step": 53509 - }, - { - "epoch": 1.37, - "learning_rate": 1.1862352644548264e-06, - "loss": 0.5527, - "step": 53510 - }, - { - "epoch": 1.37, - "learning_rate": 1.1862080780192825e-06, - "loss": 0.6167, - "step": 53511 - }, - { - "epoch": 1.37, - "learning_rate": 1.1861808914411674e-06, - "loss": 0.6709, - "step": 53512 - }, - { - "epoch": 1.37, - "learning_rate": 1.1861537047205018e-06, - "loss": 0.7217, - "step": 53513 - }, - { - "epoch": 1.37, - "learning_rate": 1.1861265178573074e-06, - "loss": 0.7139, - "step": 53514 - }, - { - "epoch": 1.37, - "learning_rate": 1.1860993308516042e-06, - "loss": 0.5151, - "step": 53515 - }, - { - "epoch": 1.37, - "learning_rate": 1.1860721437034137e-06, - "loss": 0.7568, - "step": 53516 - }, - { - "epoch": 1.37, - "learning_rate": 1.186044956412756e-06, - "loss": 0.6299, - "step": 53517 - }, - { - "epoch": 1.37, - "learning_rate": 1.1860177689796525e-06, - "loss": 0.5132, - "step": 53518 - }, - { - "epoch": 1.37, - "learning_rate": 1.1859905814041234e-06, - "loss": 0.5706, - "step": 53519 - }, - { - "epoch": 1.37, - "learning_rate": 1.18596339368619e-06, - "loss": 0.4561, - "step": 53520 - }, - { - "epoch": 1.37, - "learning_rate": 1.185936205825873e-06, - "loss": 0.6709, - "step": 53521 - }, - { - "epoch": 1.37, - "learning_rate": 1.185909017823193e-06, - "loss": 0.6133, - "step": 53522 - }, - { - "epoch": 1.37, - "learning_rate": 1.1858818296781712e-06, - "loss": 0.6265, - "step": 53523 - }, - { - "epoch": 1.37, - "learning_rate": 1.185854641390828e-06, - "loss": 0.5303, - "step": 53524 - }, - { - "epoch": 1.37, - "learning_rate": 1.1858274529611848e-06, - "loss": 0.697, - "step": 53525 - }, - { - "epoch": 1.37, - "learning_rate": 1.1858002643892619e-06, - "loss": 0.6211, - "step": 53526 - }, - { - "epoch": 1.37, - "learning_rate": 1.1857730756750806e-06, - "loss": 0.5532, - "step": 53527 - }, - { - "epoch": 1.37, - "learning_rate": 1.1857458868186609e-06, - "loss": 0.6973, - "step": 53528 - }, - { - "epoch": 1.37, - "learning_rate": 1.1857186978200243e-06, - "loss": 0.6411, - "step": 53529 - }, - { - "epoch": 1.37, - "learning_rate": 1.1856915086791915e-06, - "loss": 0.7578, - "step": 53530 - }, - { - "epoch": 1.37, - "learning_rate": 1.1856643193961833e-06, - "loss": 0.6016, - "step": 53531 - }, - { - "epoch": 1.37, - "learning_rate": 1.1856371299710202e-06, - "loss": 0.5649, - "step": 53532 - }, - { - "epoch": 1.37, - "learning_rate": 1.1856099404037236e-06, - "loss": 0.6816, - "step": 53533 - }, - { - "epoch": 1.37, - "learning_rate": 1.1855827506943138e-06, - "loss": 0.4543, - "step": 53534 - }, - { - "epoch": 1.37, - "learning_rate": 1.1855555608428118e-06, - "loss": 0.7812, - "step": 53535 - }, - { - "epoch": 1.37, - "learning_rate": 1.1855283708492385e-06, - "loss": 0.6729, - "step": 53536 - }, - { - "epoch": 1.37, - "learning_rate": 1.1855011807136148e-06, - "loss": 0.689, - "step": 53537 - }, - { - "epoch": 1.37, - "learning_rate": 1.185473990435961e-06, - "loss": 0.7642, - "step": 53538 - }, - { - "epoch": 1.37, - "learning_rate": 1.1854468000162987e-06, - "loss": 0.5266, - "step": 53539 - }, - { - "epoch": 1.37, - "learning_rate": 1.185419609454648e-06, - "loss": 0.7031, - "step": 53540 - }, - { - "epoch": 1.37, - "learning_rate": 1.1853924187510302e-06, - "loss": 0.7144, - "step": 53541 - }, - { - "epoch": 1.37, - "learning_rate": 1.1853652279054662e-06, - "loss": 0.4802, - "step": 53542 - }, - { - "epoch": 1.37, - "learning_rate": 1.1853380369179762e-06, - "loss": 0.7324, - "step": 53543 - }, - { - "epoch": 1.37, - "learning_rate": 1.1853108457885815e-06, - "loss": 0.4045, - "step": 53544 - }, - { - "epoch": 1.37, - "learning_rate": 1.1852836545173028e-06, - "loss": 0.4648, - "step": 53545 - }, - { - "epoch": 1.37, - "learning_rate": 1.185256463104161e-06, - "loss": 0.5435, - "step": 53546 - }, - { - "epoch": 1.37, - "learning_rate": 1.1852292715491767e-06, - "loss": 0.5502, - "step": 53547 - }, - { - "epoch": 1.37, - "learning_rate": 1.185202079852371e-06, - "loss": 0.6289, - "step": 53548 - }, - { - "epoch": 1.37, - "learning_rate": 1.1851748880137641e-06, - "loss": 0.6826, - "step": 53549 - }, - { - "epoch": 1.37, - "learning_rate": 1.1851476960333779e-06, - "loss": 0.6094, - "step": 53550 - }, - { - "epoch": 1.37, - "learning_rate": 1.1851205039112326e-06, - "loss": 0.5132, - "step": 53551 - }, - { - "epoch": 1.37, - "learning_rate": 1.185093311647349e-06, - "loss": 0.6475, - "step": 53552 - }, - { - "epoch": 1.37, - "learning_rate": 1.1850661192417478e-06, - "loss": 0.6855, - "step": 53553 - }, - { - "epoch": 1.37, - "learning_rate": 1.18503892669445e-06, - "loss": 0.6328, - "step": 53554 - }, - { - "epoch": 1.37, - "learning_rate": 1.1850117340054762e-06, - "loss": 0.3855, - "step": 53555 - }, - { - "epoch": 1.37, - "learning_rate": 1.184984541174848e-06, - "loss": 0.6196, - "step": 53556 - }, - { - "epoch": 1.37, - "learning_rate": 1.1849573482025852e-06, - "loss": 0.5139, - "step": 53557 - }, - { - "epoch": 1.37, - "learning_rate": 1.1849301550887092e-06, - "loss": 0.6216, - "step": 53558 - }, - { - "epoch": 1.37, - "learning_rate": 1.1849029618332404e-06, - "loss": 0.6455, - "step": 53559 - }, - { - "epoch": 1.37, - "learning_rate": 1.1848757684362002e-06, - "loss": 0.7241, - "step": 53560 - }, - { - "epoch": 1.37, - "learning_rate": 1.1848485748976092e-06, - "loss": 0.7178, - "step": 53561 - }, - { - "epoch": 1.37, - "learning_rate": 1.1848213812174878e-06, - "loss": 0.7207, - "step": 53562 - }, - { - "epoch": 1.37, - "learning_rate": 1.1847941873958575e-06, - "loss": 0.6084, - "step": 53563 - }, - { - "epoch": 1.37, - "learning_rate": 1.1847669934327386e-06, - "loss": 0.7441, - "step": 53564 - }, - { - "epoch": 1.37, - "learning_rate": 1.1847397993281521e-06, - "loss": 0.6855, - "step": 53565 - }, - { - "epoch": 1.37, - "learning_rate": 1.184712605082119e-06, - "loss": 0.4775, - "step": 53566 - }, - { - "epoch": 1.37, - "learning_rate": 1.18468541069466e-06, - "loss": 0.7153, - "step": 53567 - }, - { - "epoch": 1.37, - "learning_rate": 1.1846582161657956e-06, - "loss": 0.6699, - "step": 53568 - }, - { - "epoch": 1.37, - "learning_rate": 1.1846310214955471e-06, - "loss": 0.5635, - "step": 53569 - }, - { - "epoch": 1.37, - "learning_rate": 1.1846038266839348e-06, - "loss": 0.5303, - "step": 53570 - }, - { - "epoch": 1.37, - "learning_rate": 1.1845766317309804e-06, - "loss": 0.6641, - "step": 53571 - }, - { - "epoch": 1.37, - "learning_rate": 1.1845494366367037e-06, - "loss": 0.6533, - "step": 53572 - }, - { - "epoch": 1.37, - "learning_rate": 1.1845222414011262e-06, - "loss": 0.5366, - "step": 53573 - }, - { - "epoch": 1.37, - "learning_rate": 1.1844950460242682e-06, - "loss": 0.668, - "step": 53574 - }, - { - "epoch": 1.37, - "learning_rate": 1.1844678505061512e-06, - "loss": 0.6753, - "step": 53575 - }, - { - "epoch": 1.37, - "learning_rate": 1.1844406548467955e-06, - "loss": 0.6758, - "step": 53576 - }, - { - "epoch": 1.37, - "learning_rate": 1.1844134590462222e-06, - "loss": 0.5273, - "step": 53577 - }, - { - "epoch": 1.37, - "learning_rate": 1.1843862631044517e-06, - "loss": 0.6519, - "step": 53578 - }, - { - "epoch": 1.37, - "learning_rate": 1.1843590670215054e-06, - "loss": 0.6802, - "step": 53579 - }, - { - "epoch": 1.37, - "learning_rate": 1.1843318707974036e-06, - "loss": 0.6582, - "step": 53580 - }, - { - "epoch": 1.37, - "learning_rate": 1.184304674432168e-06, - "loss": 0.5564, - "step": 53581 - }, - { - "epoch": 1.37, - "learning_rate": 1.1842774779258178e-06, - "loss": 0.5625, - "step": 53582 - }, - { - "epoch": 1.37, - "learning_rate": 1.1842502812783755e-06, - "loss": 0.6768, - "step": 53583 - }, - { - "epoch": 1.37, - "learning_rate": 1.1842230844898609e-06, - "loss": 0.47, - "step": 53584 - }, - { - "epoch": 1.37, - "learning_rate": 1.1841958875602954e-06, - "loss": 0.5928, - "step": 53585 - }, - { - "epoch": 1.37, - "learning_rate": 1.1841686904896993e-06, - "loss": 0.6514, - "step": 53586 - }, - { - "epoch": 1.37, - "learning_rate": 1.1841414932780937e-06, - "loss": 0.4919, - "step": 53587 - }, - { - "epoch": 1.37, - "learning_rate": 1.1841142959254996e-06, - "loss": 0.7529, - "step": 53588 - }, - { - "epoch": 1.37, - "learning_rate": 1.1840870984319375e-06, - "loss": 0.8643, - "step": 53589 - }, - { - "epoch": 1.37, - "learning_rate": 1.1840599007974286e-06, - "loss": 0.5981, - "step": 53590 - }, - { - "epoch": 1.37, - "learning_rate": 1.1840327030219934e-06, - "loss": 0.6924, - "step": 53591 - }, - { - "epoch": 1.37, - "learning_rate": 1.184005505105653e-06, - "loss": 0.5728, - "step": 53592 - }, - { - "epoch": 1.37, - "learning_rate": 1.1839783070484276e-06, - "loss": 0.6914, - "step": 53593 - }, - { - "epoch": 1.37, - "learning_rate": 1.1839511088503388e-06, - "loss": 0.7246, - "step": 53594 - }, - { - "epoch": 1.37, - "learning_rate": 1.1839239105114069e-06, - "loss": 0.7139, - "step": 53595 - }, - { - "epoch": 1.37, - "learning_rate": 1.1838967120316533e-06, - "loss": 0.6162, - "step": 53596 - }, - { - "epoch": 1.37, - "learning_rate": 1.1838695134110982e-06, - "loss": 0.8418, - "step": 53597 - }, - { - "epoch": 1.37, - "learning_rate": 1.1838423146497628e-06, - "loss": 0.6304, - "step": 53598 - }, - { - "epoch": 1.37, - "learning_rate": 1.1838151157476674e-06, - "loss": 0.7959, - "step": 53599 - }, - { - "epoch": 1.37, - "learning_rate": 1.1837879167048335e-06, - "loss": 0.6562, - "step": 53600 - }, - { - "epoch": 1.37, - "learning_rate": 1.1837607175212818e-06, - "loss": 0.6807, - "step": 53601 - }, - { - "epoch": 1.37, - "learning_rate": 1.1837335181970328e-06, - "loss": 0.6729, - "step": 53602 - }, - { - "epoch": 1.37, - "learning_rate": 1.1837063187321073e-06, - "loss": 0.665, - "step": 53603 - }, - { - "epoch": 1.37, - "learning_rate": 1.1836791191265266e-06, - "loss": 0.6416, - "step": 53604 - }, - { - "epoch": 1.37, - "learning_rate": 1.183651919380311e-06, - "loss": 0.6465, - "step": 53605 - }, - { - "epoch": 1.37, - "learning_rate": 1.1836247194934816e-06, - "loss": 0.4937, - "step": 53606 - }, - { - "epoch": 1.37, - "learning_rate": 1.1835975194660595e-06, - "loss": 0.6113, - "step": 53607 - }, - { - "epoch": 1.37, - "learning_rate": 1.183570319298065e-06, - "loss": 0.6465, - "step": 53608 - }, - { - "epoch": 1.37, - "learning_rate": 1.183543118989519e-06, - "loss": 0.7715, - "step": 53609 - }, - { - "epoch": 1.37, - "learning_rate": 1.183515918540443e-06, - "loss": 0.7471, - "step": 53610 - }, - { - "epoch": 1.37, - "learning_rate": 1.1834887179508568e-06, - "loss": 0.5879, - "step": 53611 - }, - { - "epoch": 1.37, - "learning_rate": 1.1834615172207817e-06, - "loss": 0.7441, - "step": 53612 - }, - { - "epoch": 1.37, - "learning_rate": 1.1834343163502387e-06, - "loss": 0.7412, - "step": 53613 - }, - { - "epoch": 1.37, - "learning_rate": 1.1834071153392484e-06, - "loss": 0.6577, - "step": 53614 - }, - { - "epoch": 1.37, - "learning_rate": 1.183379914187832e-06, - "loss": 0.7754, - "step": 53615 - }, - { - "epoch": 1.37, - "learning_rate": 1.1833527128960098e-06, - "loss": 0.6816, - "step": 53616 - }, - { - "epoch": 1.37, - "learning_rate": 1.183325511463803e-06, - "loss": 0.6816, - "step": 53617 - }, - { - "epoch": 1.37, - "learning_rate": 1.1832983098912318e-06, - "loss": 0.8027, - "step": 53618 - }, - { - "epoch": 1.37, - "learning_rate": 1.1832711081783182e-06, - "loss": 0.6841, - "step": 53619 - }, - { - "epoch": 1.37, - "learning_rate": 1.183243906325082e-06, - "loss": 0.4758, - "step": 53620 - }, - { - "epoch": 1.37, - "learning_rate": 1.1832167043315446e-06, - "loss": 0.3127, - "step": 53621 - }, - { - "epoch": 1.37, - "learning_rate": 1.1831895021977263e-06, - "loss": 0.7861, - "step": 53622 - }, - { - "epoch": 1.37, - "learning_rate": 1.1831622999236484e-06, - "loss": 0.6626, - "step": 53623 - }, - { - "epoch": 1.37, - "learning_rate": 1.1831350975093312e-06, - "loss": 0.5879, - "step": 53624 - }, - { - "epoch": 1.37, - "learning_rate": 1.183107894954796e-06, - "loss": 0.6807, - "step": 53625 - }, - { - "epoch": 1.37, - "learning_rate": 1.1830806922600639e-06, - "loss": 0.467, - "step": 53626 - }, - { - "epoch": 1.37, - "learning_rate": 1.1830534894251552e-06, - "loss": 0.5059, - "step": 53627 - }, - { - "epoch": 1.37, - "learning_rate": 1.1830262864500907e-06, - "loss": 0.6816, - "step": 53628 - }, - { - "epoch": 1.37, - "learning_rate": 1.1829990833348913e-06, - "loss": 0.6116, - "step": 53629 - }, - { - "epoch": 1.37, - "learning_rate": 1.1829718800795781e-06, - "loss": 0.6543, - "step": 53630 - }, - { - "epoch": 1.37, - "learning_rate": 1.1829446766841716e-06, - "loss": 0.6387, - "step": 53631 - }, - { - "epoch": 1.37, - "learning_rate": 1.182917473148693e-06, - "loss": 0.6387, - "step": 53632 - }, - { - "epoch": 1.37, - "learning_rate": 1.1828902694731624e-06, - "loss": 0.5732, - "step": 53633 - }, - { - "epoch": 1.37, - "learning_rate": 1.1828630656576018e-06, - "loss": 0.6748, - "step": 53634 - }, - { - "epoch": 1.37, - "learning_rate": 1.182835861702031e-06, - "loss": 0.73, - "step": 53635 - }, - { - "epoch": 1.37, - "learning_rate": 1.1828086576064712e-06, - "loss": 0.6504, - "step": 53636 - }, - { - "epoch": 1.37, - "learning_rate": 1.1827814533709433e-06, - "loss": 0.6162, - "step": 53637 - }, - { - "epoch": 1.37, - "learning_rate": 1.182754248995468e-06, - "loss": 0.7607, - "step": 53638 - }, - { - "epoch": 1.37, - "learning_rate": 1.182727044480066e-06, - "loss": 0.749, - "step": 53639 - }, - { - "epoch": 1.37, - "learning_rate": 1.1826998398247588e-06, - "loss": 0.6924, - "step": 53640 - }, - { - "epoch": 1.37, - "learning_rate": 1.1826726350295662e-06, - "loss": 0.7207, - "step": 53641 - }, - { - "epoch": 1.37, - "learning_rate": 1.18264543009451e-06, - "loss": 0.5645, - "step": 53642 - }, - { - "epoch": 1.37, - "learning_rate": 1.1826182250196101e-06, - "loss": 0.7363, - "step": 53643 - }, - { - "epoch": 1.37, - "learning_rate": 1.182591019804888e-06, - "loss": 0.7119, - "step": 53644 - }, - { - "epoch": 1.37, - "learning_rate": 1.1825638144503646e-06, - "loss": 0.8232, - "step": 53645 - }, - { - "epoch": 1.37, - "learning_rate": 1.1825366089560604e-06, - "loss": 0.6543, - "step": 53646 - }, - { - "epoch": 1.38, - "learning_rate": 1.1825094033219962e-06, - "loss": 0.5869, - "step": 53647 - }, - { - "epoch": 1.38, - "learning_rate": 1.182482197548193e-06, - "loss": 0.6548, - "step": 53648 - }, - { - "epoch": 1.38, - "learning_rate": 1.1824549916346714e-06, - "loss": 0.6621, - "step": 53649 - }, - { - "epoch": 1.38, - "learning_rate": 1.1824277855814525e-06, - "loss": 0.4805, - "step": 53650 - }, - { - "epoch": 1.38, - "learning_rate": 1.1824005793885573e-06, - "loss": 0.7129, - "step": 53651 - }, - { - "epoch": 1.38, - "learning_rate": 1.182373373056006e-06, - "loss": 0.5029, - "step": 53652 - }, - { - "epoch": 1.38, - "learning_rate": 1.1823461665838199e-06, - "loss": 0.6602, - "step": 53653 - }, - { - "epoch": 1.38, - "learning_rate": 1.1823189599720198e-06, - "loss": 0.6787, - "step": 53654 - }, - { - "epoch": 1.38, - "learning_rate": 1.1822917532206264e-06, - "loss": 0.4357, - "step": 53655 - }, - { - "epoch": 1.38, - "learning_rate": 1.1822645463296606e-06, - "loss": 0.5317, - "step": 53656 - }, - { - "epoch": 1.38, - "learning_rate": 1.1822373392991434e-06, - "loss": 0.5923, - "step": 53657 - }, - { - "epoch": 1.38, - "learning_rate": 1.1822101321290952e-06, - "loss": 0.5654, - "step": 53658 - }, - { - "epoch": 1.38, - "learning_rate": 1.182182924819537e-06, - "loss": 0.563, - "step": 53659 - }, - { - "epoch": 1.38, - "learning_rate": 1.18215571737049e-06, - "loss": 0.6025, - "step": 53660 - }, - { - "epoch": 1.38, - "learning_rate": 1.1821285097819747e-06, - "loss": 0.5225, - "step": 53661 - }, - { - "epoch": 1.38, - "learning_rate": 1.1821013020540118e-06, - "loss": 0.4792, - "step": 53662 - }, - { - "epoch": 1.38, - "learning_rate": 1.1820740941866222e-06, - "loss": 0.5775, - "step": 53663 - }, - { - "epoch": 1.38, - "learning_rate": 1.182046886179827e-06, - "loss": 0.686, - "step": 53664 - }, - { - "epoch": 1.38, - "learning_rate": 1.1820196780336474e-06, - "loss": 0.5542, - "step": 53665 - }, - { - "epoch": 1.38, - "learning_rate": 1.1819924697481029e-06, - "loss": 0.6562, - "step": 53666 - }, - { - "epoch": 1.38, - "learning_rate": 1.1819652613232154e-06, - "loss": 0.7031, - "step": 53667 - }, - { - "epoch": 1.38, - "learning_rate": 1.1819380527590055e-06, - "loss": 0.958, - "step": 53668 - }, - { - "epoch": 1.38, - "learning_rate": 1.1819108440554938e-06, - "loss": 0.4774, - "step": 53669 - }, - { - "epoch": 1.38, - "learning_rate": 1.1818836352127017e-06, - "loss": 0.6836, - "step": 53670 - }, - { - "epoch": 1.38, - "learning_rate": 1.1818564262306496e-06, - "loss": 0.6416, - "step": 53671 - }, - { - "epoch": 1.38, - "learning_rate": 1.1818292171093582e-06, - "loss": 0.6436, - "step": 53672 - }, - { - "epoch": 1.38, - "learning_rate": 1.1818020078488486e-06, - "loss": 0.6211, - "step": 53673 - }, - { - "epoch": 1.38, - "learning_rate": 1.1817747984491415e-06, - "loss": 0.4407, - "step": 53674 - }, - { - "epoch": 1.38, - "learning_rate": 1.181747588910258e-06, - "loss": 0.4749, - "step": 53675 - }, - { - "epoch": 1.38, - "learning_rate": 1.1817203792322185e-06, - "loss": 0.7549, - "step": 53676 - }, - { - "epoch": 1.38, - "learning_rate": 1.1816931694150442e-06, - "loss": 0.6484, - "step": 53677 - }, - { - "epoch": 1.38, - "learning_rate": 1.1816659594587557e-06, - "loss": 0.4785, - "step": 53678 - }, - { - "epoch": 1.38, - "learning_rate": 1.1816387493633739e-06, - "loss": 0.625, - "step": 53679 - }, - { - "epoch": 1.38, - "learning_rate": 1.1816115391289202e-06, - "loss": 0.7461, - "step": 53680 - }, - { - "epoch": 1.38, - "learning_rate": 1.1815843287554142e-06, - "loss": 0.708, - "step": 53681 - }, - { - "epoch": 1.38, - "learning_rate": 1.1815571182428777e-06, - "loss": 0.6875, - "step": 53682 - }, - { - "epoch": 1.38, - "learning_rate": 1.181529907591331e-06, - "loss": 0.6367, - "step": 53683 - }, - { - "epoch": 1.38, - "learning_rate": 1.1815026968007954e-06, - "loss": 0.626, - "step": 53684 - }, - { - "epoch": 1.38, - "learning_rate": 1.181475485871292e-06, - "loss": 0.6113, - "step": 53685 - }, - { - "epoch": 1.38, - "learning_rate": 1.1814482748028405e-06, - "loss": 0.7666, - "step": 53686 - }, - { - "epoch": 1.38, - "learning_rate": 1.1814210635954628e-06, - "loss": 0.6797, - "step": 53687 - }, - { - "epoch": 1.38, - "learning_rate": 1.181393852249179e-06, - "loss": 0.616, - "step": 53688 - }, - { - "epoch": 1.38, - "learning_rate": 1.1813666407640103e-06, - "loss": 0.7324, - "step": 53689 - }, - { - "epoch": 1.38, - "learning_rate": 1.181339429139978e-06, - "loss": 0.8545, - "step": 53690 - }, - { - "epoch": 1.38, - "learning_rate": 1.1813122173771018e-06, - "loss": 0.6904, - "step": 53691 - }, - { - "epoch": 1.38, - "learning_rate": 1.1812850054754035e-06, - "loss": 0.5864, - "step": 53692 - }, - { - "epoch": 1.38, - "learning_rate": 1.1812577934349035e-06, - "loss": 0.6523, - "step": 53693 - }, - { - "epoch": 1.38, - "learning_rate": 1.181230581255623e-06, - "loss": 0.752, - "step": 53694 - }, - { - "epoch": 1.38, - "learning_rate": 1.1812033689375822e-06, - "loss": 0.7441, - "step": 53695 - }, - { - "epoch": 1.38, - "learning_rate": 1.1811761564808023e-06, - "loss": 0.6587, - "step": 53696 - }, - { - "epoch": 1.38, - "learning_rate": 1.1811489438853044e-06, - "loss": 0.5879, - "step": 53697 - }, - { - "epoch": 1.38, - "learning_rate": 1.1811217311511092e-06, - "loss": 0.6621, - "step": 53698 - }, - { - "epoch": 1.38, - "learning_rate": 1.181094518278237e-06, - "loss": 0.7061, - "step": 53699 - }, - { - "epoch": 1.38, - "learning_rate": 1.1810673052667094e-06, - "loss": 0.5662, - "step": 53700 - }, - { - "epoch": 1.38, - "learning_rate": 1.1810400921165468e-06, - "loss": 0.7119, - "step": 53701 - }, - { - "epoch": 1.38, - "learning_rate": 1.18101287882777e-06, - "loss": 0.8184, - "step": 53702 - }, - { - "epoch": 1.38, - "learning_rate": 1.1809856654004003e-06, - "loss": 0.4626, - "step": 53703 - }, - { - "epoch": 1.38, - "learning_rate": 1.1809584518344574e-06, - "loss": 0.6763, - "step": 53704 - }, - { - "epoch": 1.38, - "learning_rate": 1.180931238129964e-06, - "loss": 0.4454, - "step": 53705 - }, - { - "epoch": 1.38, - "learning_rate": 1.1809040242869392e-06, - "loss": 0.7334, - "step": 53706 - }, - { - "epoch": 1.38, - "learning_rate": 1.1808768103054047e-06, - "loss": 0.5903, - "step": 53707 - }, - { - "epoch": 1.38, - "learning_rate": 1.1808495961853811e-06, - "loss": 0.5859, - "step": 53708 - }, - { - "epoch": 1.38, - "learning_rate": 1.1808223819268893e-06, - "loss": 0.6724, - "step": 53709 - }, - { - "epoch": 1.38, - "learning_rate": 1.1807951675299501e-06, - "loss": 0.6191, - "step": 53710 - }, - { - "epoch": 1.38, - "learning_rate": 1.1807679529945844e-06, - "loss": 0.7715, - "step": 53711 - }, - { - "epoch": 1.38, - "learning_rate": 1.180740738320813e-06, - "loss": 0.7266, - "step": 53712 - }, - { - "epoch": 1.38, - "learning_rate": 1.1807135235086566e-06, - "loss": 0.4241, - "step": 53713 - }, - { - "epoch": 1.38, - "learning_rate": 1.1806863085581361e-06, - "loss": 0.707, - "step": 53714 - }, - { - "epoch": 1.38, - "learning_rate": 1.180659093469273e-06, - "loss": 0.4907, - "step": 53715 - }, - { - "epoch": 1.38, - "learning_rate": 1.1806318782420867e-06, - "loss": 0.7266, - "step": 53716 - }, - { - "epoch": 1.38, - "learning_rate": 1.1806046628765996e-06, - "loss": 0.4781, - "step": 53717 - }, - { - "epoch": 1.38, - "learning_rate": 1.180577447372831e-06, - "loss": 0.7842, - "step": 53718 - }, - { - "epoch": 1.38, - "learning_rate": 1.1805502317308035e-06, - "loss": 0.6519, - "step": 53719 - }, - { - "epoch": 1.38, - "learning_rate": 1.1805230159505365e-06, - "loss": 0.603, - "step": 53720 - }, - { - "epoch": 1.38, - "learning_rate": 1.180495800032051e-06, - "loss": 0.5337, - "step": 53721 - }, - { - "epoch": 1.38, - "learning_rate": 1.1804685839753688e-06, - "loss": 0.6455, - "step": 53722 - }, - { - "epoch": 1.38, - "learning_rate": 1.1804413677805097e-06, - "loss": 0.5385, - "step": 53723 - }, - { - "epoch": 1.38, - "learning_rate": 1.180414151447495e-06, - "loss": 0.5439, - "step": 53724 - }, - { - "epoch": 1.38, - "learning_rate": 1.1803869349763456e-06, - "loss": 0.7559, - "step": 53725 - }, - { - "epoch": 1.38, - "learning_rate": 1.1803597183670822e-06, - "loss": 0.6553, - "step": 53726 - }, - { - "epoch": 1.38, - "learning_rate": 1.1803325016197255e-06, - "loss": 0.5923, - "step": 53727 - }, - { - "epoch": 1.38, - "learning_rate": 1.1803052847342967e-06, - "loss": 0.6248, - "step": 53728 - }, - { - "epoch": 1.38, - "learning_rate": 1.1802780677108162e-06, - "loss": 0.5596, - "step": 53729 - }, - { - "epoch": 1.38, - "learning_rate": 1.1802508505493055e-06, - "loss": 0.752, - "step": 53730 - }, - { - "epoch": 1.38, - "learning_rate": 1.1802236332497843e-06, - "loss": 0.6924, - "step": 53731 - }, - { - "epoch": 1.38, - "learning_rate": 1.180196415812275e-06, - "loss": 0.7554, - "step": 53732 - }, - { - "epoch": 1.38, - "learning_rate": 1.180169198236797e-06, - "loss": 0.7197, - "step": 53733 - }, - { - "epoch": 1.38, - "learning_rate": 1.1801419805233719e-06, - "loss": 0.791, - "step": 53734 - }, - { - "epoch": 1.38, - "learning_rate": 1.1801147626720202e-06, - "loss": 0.6201, - "step": 53735 - }, - { - "epoch": 1.38, - "learning_rate": 1.1800875446827633e-06, - "loss": 0.6104, - "step": 53736 - }, - { - "epoch": 1.38, - "learning_rate": 1.1800603265556212e-06, - "loss": 0.6963, - "step": 53737 - }, - { - "epoch": 1.38, - "learning_rate": 1.1800331082906155e-06, - "loss": 0.5679, - "step": 53738 - }, - { - "epoch": 1.38, - "learning_rate": 1.1800058898877666e-06, - "loss": 0.8389, - "step": 53739 - }, - { - "epoch": 1.38, - "learning_rate": 1.1799786713470954e-06, - "loss": 0.5587, - "step": 53740 - }, - { - "epoch": 1.38, - "learning_rate": 1.179951452668623e-06, - "loss": 0.6875, - "step": 53741 - }, - { - "epoch": 1.38, - "learning_rate": 1.1799242338523697e-06, - "loss": 0.3728, - "step": 53742 - }, - { - "epoch": 1.38, - "learning_rate": 1.179897014898357e-06, - "loss": 0.5115, - "step": 53743 - }, - { - "epoch": 1.38, - "learning_rate": 1.1798697958066055e-06, - "loss": 0.5967, - "step": 53744 - }, - { - "epoch": 1.38, - "learning_rate": 1.179842576577136e-06, - "loss": 0.5273, - "step": 53745 - }, - { - "epoch": 1.38, - "learning_rate": 1.179815357209969e-06, - "loss": 0.5099, - "step": 53746 - }, - { - "epoch": 1.38, - "learning_rate": 1.1797881377051259e-06, - "loss": 0.6084, - "step": 53747 - }, - { - "epoch": 1.38, - "learning_rate": 1.179760918062627e-06, - "loss": 0.7256, - "step": 53748 - }, - { - "epoch": 1.38, - "learning_rate": 1.1797336982824937e-06, - "loss": 0.5952, - "step": 53749 - }, - { - "epoch": 1.38, - "learning_rate": 1.1797064783647465e-06, - "loss": 0.6646, - "step": 53750 - }, - { - "epoch": 1.38, - "learning_rate": 1.1796792583094064e-06, - "loss": 0.6699, - "step": 53751 - }, - { - "epoch": 1.38, - "learning_rate": 1.1796520381164941e-06, - "loss": 0.4773, - "step": 53752 - }, - { - "epoch": 1.38, - "learning_rate": 1.1796248177860303e-06, - "loss": 0.75, - "step": 53753 - }, - { - "epoch": 1.38, - "learning_rate": 1.179597597318036e-06, - "loss": 0.5942, - "step": 53754 - }, - { - "epoch": 1.38, - "learning_rate": 1.1795703767125326e-06, - "loss": 0.6128, - "step": 53755 - }, - { - "epoch": 1.38, - "learning_rate": 1.1795431559695402e-06, - "loss": 0.6274, - "step": 53756 - }, - { - "epoch": 1.38, - "learning_rate": 1.1795159350890795e-06, - "loss": 0.6455, - "step": 53757 - }, - { - "epoch": 1.38, - "learning_rate": 1.179488714071172e-06, - "loss": 0.7168, - "step": 53758 - }, - { - "epoch": 1.38, - "learning_rate": 1.1794614929158382e-06, - "loss": 0.6826, - "step": 53759 - }, - { - "epoch": 1.38, - "learning_rate": 1.179434271623099e-06, - "loss": 0.5723, - "step": 53760 - }, - { - "epoch": 1.38, - "learning_rate": 1.1794070501929753e-06, - "loss": 0.5254, - "step": 53761 - }, - { - "epoch": 1.38, - "learning_rate": 1.1793798286254876e-06, - "loss": 0.6904, - "step": 53762 - }, - { - "epoch": 1.38, - "learning_rate": 1.1793526069206574e-06, - "loss": 0.6494, - "step": 53763 - }, - { - "epoch": 1.38, - "learning_rate": 1.1793253850785049e-06, - "loss": 0.6387, - "step": 53764 - }, - { - "epoch": 1.38, - "learning_rate": 1.179298163099051e-06, - "loss": 0.6981, - "step": 53765 - }, - { - "epoch": 1.38, - "learning_rate": 1.1792709409823172e-06, - "loss": 0.7734, - "step": 53766 - }, - { - "epoch": 1.38, - "learning_rate": 1.1792437187283235e-06, - "loss": 0.6152, - "step": 53767 - }, - { - "epoch": 1.38, - "learning_rate": 1.1792164963370914e-06, - "loss": 0.7344, - "step": 53768 - }, - { - "epoch": 1.38, - "learning_rate": 1.179189273808641e-06, - "loss": 0.8438, - "step": 53769 - }, - { - "epoch": 1.38, - "learning_rate": 1.1791620511429946e-06, - "loss": 0.6914, - "step": 53770 - }, - { - "epoch": 1.38, - "learning_rate": 1.1791348283401712e-06, - "loss": 0.5027, - "step": 53771 - }, - { - "epoch": 1.38, - "learning_rate": 1.1791076054001928e-06, - "loss": 0.707, - "step": 53772 - }, - { - "epoch": 1.38, - "learning_rate": 1.1790803823230798e-06, - "loss": 0.7539, - "step": 53773 - }, - { - "epoch": 1.38, - "learning_rate": 1.1790531591088534e-06, - "loss": 0.876, - "step": 53774 - }, - { - "epoch": 1.38, - "learning_rate": 1.1790259357575338e-06, - "loss": 0.6738, - "step": 53775 - }, - { - "epoch": 1.38, - "learning_rate": 1.1789987122691426e-06, - "loss": 0.7061, - "step": 53776 - }, - { - "epoch": 1.38, - "learning_rate": 1.1789714886437003e-06, - "loss": 0.7803, - "step": 53777 - }, - { - "epoch": 1.38, - "learning_rate": 1.1789442648812278e-06, - "loss": 0.7607, - "step": 53778 - }, - { - "epoch": 1.38, - "learning_rate": 1.1789170409817457e-06, - "loss": 0.562, - "step": 53779 - }, - { - "epoch": 1.38, - "learning_rate": 1.1788898169452754e-06, - "loss": 0.6865, - "step": 53780 - }, - { - "epoch": 1.38, - "learning_rate": 1.1788625927718373e-06, - "loss": 0.584, - "step": 53781 - }, - { - "epoch": 1.38, - "learning_rate": 1.1788353684614521e-06, - "loss": 0.5649, - "step": 53782 - }, - { - "epoch": 1.38, - "learning_rate": 1.178808144014141e-06, - "loss": 0.7119, - "step": 53783 - }, - { - "epoch": 1.38, - "learning_rate": 1.1787809194299247e-06, - "loss": 0.6445, - "step": 53784 - }, - { - "epoch": 1.38, - "learning_rate": 1.178753694708824e-06, - "loss": 0.7266, - "step": 53785 - }, - { - "epoch": 1.38, - "learning_rate": 1.1787264698508599e-06, - "loss": 0.6289, - "step": 53786 - }, - { - "epoch": 1.38, - "learning_rate": 1.1786992448560533e-06, - "loss": 0.6855, - "step": 53787 - }, - { - "epoch": 1.38, - "learning_rate": 1.1786720197244248e-06, - "loss": 0.6919, - "step": 53788 - }, - { - "epoch": 1.38, - "learning_rate": 1.1786447944559952e-06, - "loss": 0.4189, - "step": 53789 - }, - { - "epoch": 1.38, - "learning_rate": 1.1786175690507855e-06, - "loss": 0.6184, - "step": 53790 - }, - { - "epoch": 1.38, - "learning_rate": 1.178590343508817e-06, - "loss": 0.5757, - "step": 53791 - }, - { - "epoch": 1.38, - "learning_rate": 1.1785631178301096e-06, - "loss": 0.6434, - "step": 53792 - }, - { - "epoch": 1.38, - "learning_rate": 1.1785358920146848e-06, - "loss": 0.645, - "step": 53793 - }, - { - "epoch": 1.38, - "learning_rate": 1.1785086660625632e-06, - "loss": 0.7207, - "step": 53794 - }, - { - "epoch": 1.38, - "learning_rate": 1.178481439973766e-06, - "loss": 0.5784, - "step": 53795 - }, - { - "epoch": 1.38, - "learning_rate": 1.1784542137483134e-06, - "loss": 0.4985, - "step": 53796 - }, - { - "epoch": 1.38, - "learning_rate": 1.1784269873862267e-06, - "loss": 0.644, - "step": 53797 - }, - { - "epoch": 1.38, - "learning_rate": 1.1783997608875266e-06, - "loss": 0.668, - "step": 53798 - }, - { - "epoch": 1.38, - "learning_rate": 1.1783725342522345e-06, - "loss": 0.5288, - "step": 53799 - }, - { - "epoch": 1.38, - "learning_rate": 1.17834530748037e-06, - "loss": 0.6763, - "step": 53800 - }, - { - "epoch": 1.38, - "learning_rate": 1.1783180805719553e-06, - "loss": 0.8047, - "step": 53801 - }, - { - "epoch": 1.38, - "learning_rate": 1.1782908535270103e-06, - "loss": 0.5503, - "step": 53802 - }, - { - "epoch": 1.38, - "learning_rate": 1.1782636263455566e-06, - "loss": 0.6514, - "step": 53803 - }, - { - "epoch": 1.38, - "learning_rate": 1.1782363990276141e-06, - "loss": 0.5859, - "step": 53804 - }, - { - "epoch": 1.38, - "learning_rate": 1.1782091715732047e-06, - "loss": 0.6689, - "step": 53805 - }, - { - "epoch": 1.38, - "learning_rate": 1.1781819439823484e-06, - "loss": 0.6553, - "step": 53806 - }, - { - "epoch": 1.38, - "learning_rate": 1.1781547162550665e-06, - "loss": 0.5757, - "step": 53807 - }, - { - "epoch": 1.38, - "learning_rate": 1.1781274883913794e-06, - "loss": 0.6226, - "step": 53808 - }, - { - "epoch": 1.38, - "learning_rate": 1.1781002603913086e-06, - "loss": 0.8848, - "step": 53809 - }, - { - "epoch": 1.38, - "learning_rate": 1.1780730322548745e-06, - "loss": 0.5232, - "step": 53810 - }, - { - "epoch": 1.38, - "learning_rate": 1.178045803982098e-06, - "loss": 0.4868, - "step": 53811 - }, - { - "epoch": 1.38, - "learning_rate": 1.1780185755730003e-06, - "loss": 0.668, - "step": 53812 - }, - { - "epoch": 1.38, - "learning_rate": 1.1779913470276017e-06, - "loss": 0.6816, - "step": 53813 - }, - { - "epoch": 1.38, - "learning_rate": 1.1779641183459234e-06, - "loss": 0.7544, - "step": 53814 - }, - { - "epoch": 1.38, - "learning_rate": 1.1779368895279864e-06, - "loss": 0.6709, - "step": 53815 - }, - { - "epoch": 1.38, - "learning_rate": 1.1779096605738113e-06, - "loss": 0.6475, - "step": 53816 - }, - { - "epoch": 1.38, - "learning_rate": 1.1778824314834185e-06, - "loss": 0.8711, - "step": 53817 - }, - { - "epoch": 1.38, - "learning_rate": 1.1778552022568296e-06, - "loss": 0.7744, - "step": 53818 - }, - { - "epoch": 1.38, - "learning_rate": 1.177827972894065e-06, - "loss": 0.7686, - "step": 53819 - }, - { - "epoch": 1.38, - "learning_rate": 1.177800743395146e-06, - "loss": 0.6396, - "step": 53820 - }, - { - "epoch": 1.38, - "learning_rate": 1.1777735137600928e-06, - "loss": 0.7188, - "step": 53821 - }, - { - "epoch": 1.38, - "learning_rate": 1.1777462839889267e-06, - "loss": 0.6914, - "step": 53822 - }, - { - "epoch": 1.38, - "learning_rate": 1.1777190540816684e-06, - "loss": 0.6943, - "step": 53823 - }, - { - "epoch": 1.38, - "learning_rate": 1.177691824038339e-06, - "loss": 0.3308, - "step": 53824 - }, - { - "epoch": 1.38, - "learning_rate": 1.1776645938589591e-06, - "loss": 0.6025, - "step": 53825 - }, - { - "epoch": 1.38, - "learning_rate": 1.1776373635435494e-06, - "loss": 0.6182, - "step": 53826 - }, - { - "epoch": 1.38, - "learning_rate": 1.1776101330921311e-06, - "loss": 0.77, - "step": 53827 - }, - { - "epoch": 1.38, - "learning_rate": 1.1775829025047249e-06, - "loss": 0.709, - "step": 53828 - }, - { - "epoch": 1.38, - "learning_rate": 1.1775556717813512e-06, - "loss": 0.6816, - "step": 53829 - }, - { - "epoch": 1.38, - "learning_rate": 1.1775284409220318e-06, - "loss": 0.646, - "step": 53830 - }, - { - "epoch": 1.38, - "learning_rate": 1.177501209926787e-06, - "loss": 0.5459, - "step": 53831 - }, - { - "epoch": 1.38, - "learning_rate": 1.1774739787956373e-06, - "loss": 0.7847, - "step": 53832 - }, - { - "epoch": 1.38, - "learning_rate": 1.1774467475286043e-06, - "loss": 0.6963, - "step": 53833 - }, - { - "epoch": 1.38, - "learning_rate": 1.1774195161257086e-06, - "loss": 0.6279, - "step": 53834 - }, - { - "epoch": 1.38, - "learning_rate": 1.1773922845869707e-06, - "loss": 0.6318, - "step": 53835 - }, - { - "epoch": 1.38, - "learning_rate": 1.1773650529124114e-06, - "loss": 0.5503, - "step": 53836 - }, - { - "epoch": 1.38, - "learning_rate": 1.1773378211020525e-06, - "loss": 0.7275, - "step": 53837 - }, - { - "epoch": 1.38, - "learning_rate": 1.1773105891559137e-06, - "loss": 0.4917, - "step": 53838 - }, - { - "epoch": 1.38, - "learning_rate": 1.1772833570740163e-06, - "loss": 0.6953, - "step": 53839 - }, - { - "epoch": 1.38, - "learning_rate": 1.1772561248563815e-06, - "loss": 0.5109, - "step": 53840 - }, - { - "epoch": 1.38, - "learning_rate": 1.1772288925030295e-06, - "loss": 0.6367, - "step": 53841 - }, - { - "epoch": 1.38, - "learning_rate": 1.1772016600139818e-06, - "loss": 0.7617, - "step": 53842 - }, - { - "epoch": 1.38, - "learning_rate": 1.1771744273892587e-06, - "loss": 0.7471, - "step": 53843 - }, - { - "epoch": 1.38, - "learning_rate": 1.1771471946288813e-06, - "loss": 0.584, - "step": 53844 - }, - { - "epoch": 1.38, - "learning_rate": 1.177119961732871e-06, - "loss": 0.7207, - "step": 53845 - }, - { - "epoch": 1.38, - "learning_rate": 1.1770927287012474e-06, - "loss": 0.7705, - "step": 53846 - }, - { - "epoch": 1.38, - "learning_rate": 1.1770654955340323e-06, - "loss": 0.7686, - "step": 53847 - }, - { - "epoch": 1.38, - "learning_rate": 1.177038262231246e-06, - "loss": 0.625, - "step": 53848 - }, - { - "epoch": 1.38, - "learning_rate": 1.17701102879291e-06, - "loss": 0.7383, - "step": 53849 - }, - { - "epoch": 1.38, - "learning_rate": 1.1769837952190447e-06, - "loss": 0.5864, - "step": 53850 - }, - { - "epoch": 1.38, - "learning_rate": 1.1769565615096714e-06, - "loss": 0.4856, - "step": 53851 - }, - { - "epoch": 1.38, - "learning_rate": 1.1769293276648098e-06, - "loss": 0.5825, - "step": 53852 - }, - { - "epoch": 1.38, - "learning_rate": 1.176902093684482e-06, - "loss": 0.752, - "step": 53853 - }, - { - "epoch": 1.38, - "learning_rate": 1.1768748595687084e-06, - "loss": 0.7754, - "step": 53854 - }, - { - "epoch": 1.38, - "learning_rate": 1.1768476253175098e-06, - "loss": 0.6389, - "step": 53855 - }, - { - "epoch": 1.38, - "learning_rate": 1.1768203909309074e-06, - "loss": 0.6318, - "step": 53856 - }, - { - "epoch": 1.38, - "learning_rate": 1.1767931564089213e-06, - "loss": 0.5461, - "step": 53857 - }, - { - "epoch": 1.38, - "learning_rate": 1.176765921751573e-06, - "loss": 0.7666, - "step": 53858 - }, - { - "epoch": 1.38, - "learning_rate": 1.1767386869588828e-06, - "loss": 0.6118, - "step": 53859 - }, - { - "epoch": 1.38, - "learning_rate": 1.1767114520308728e-06, - "loss": 0.7158, - "step": 53860 - }, - { - "epoch": 1.38, - "learning_rate": 1.1766842169675624e-06, - "loss": 0.3524, - "step": 53861 - }, - { - "epoch": 1.38, - "learning_rate": 1.1766569817689732e-06, - "loss": 0.5938, - "step": 53862 - }, - { - "epoch": 1.38, - "learning_rate": 1.1766297464351253e-06, - "loss": 0.5107, - "step": 53863 - }, - { - "epoch": 1.38, - "learning_rate": 1.1766025109660407e-06, - "loss": 0.5176, - "step": 53864 - }, - { - "epoch": 1.38, - "learning_rate": 1.1765752753617397e-06, - "loss": 0.6748, - "step": 53865 - }, - { - "epoch": 1.38, - "learning_rate": 1.1765480396222429e-06, - "loss": 0.6924, - "step": 53866 - }, - { - "epoch": 1.38, - "learning_rate": 1.1765208037475714e-06, - "loss": 0.5923, - "step": 53867 - }, - { - "epoch": 1.38, - "learning_rate": 1.1764935677377462e-06, - "loss": 0.6626, - "step": 53868 - }, - { - "epoch": 1.38, - "learning_rate": 1.1764663315927876e-06, - "loss": 0.749, - "step": 53869 - }, - { - "epoch": 1.38, - "learning_rate": 1.1764390953127175e-06, - "loss": 0.5757, - "step": 53870 - }, - { - "epoch": 1.38, - "learning_rate": 1.1764118588975556e-06, - "loss": 0.5278, - "step": 53871 - }, - { - "epoch": 1.38, - "learning_rate": 1.1763846223473235e-06, - "loss": 0.7607, - "step": 53872 - }, - { - "epoch": 1.38, - "learning_rate": 1.1763573856620416e-06, - "loss": 0.8105, - "step": 53873 - }, - { - "epoch": 1.38, - "learning_rate": 1.176330148841731e-06, - "loss": 0.4636, - "step": 53874 - }, - { - "epoch": 1.38, - "learning_rate": 1.1763029118864127e-06, - "loss": 0.5596, - "step": 53875 - }, - { - "epoch": 1.38, - "learning_rate": 1.176275674796107e-06, - "loss": 0.7163, - "step": 53876 - }, - { - "epoch": 1.38, - "learning_rate": 1.1762484375708355e-06, - "loss": 0.5588, - "step": 53877 - }, - { - "epoch": 1.38, - "learning_rate": 1.1762212002106184e-06, - "loss": 0.6807, - "step": 53878 - }, - { - "epoch": 1.38, - "learning_rate": 1.1761939627154768e-06, - "loss": 0.6016, - "step": 53879 - }, - { - "epoch": 1.38, - "learning_rate": 1.176166725085432e-06, - "loss": 0.6885, - "step": 53880 - }, - { - "epoch": 1.38, - "learning_rate": 1.1761394873205042e-06, - "loss": 0.5732, - "step": 53881 - }, - { - "epoch": 1.38, - "learning_rate": 1.1761122494207144e-06, - "loss": 0.5923, - "step": 53882 - }, - { - "epoch": 1.38, - "learning_rate": 1.1760850113860835e-06, - "loss": 0.6577, - "step": 53883 - }, - { - "epoch": 1.38, - "learning_rate": 1.1760577732166324e-06, - "loss": 0.6455, - "step": 53884 - }, - { - "epoch": 1.38, - "learning_rate": 1.1760305349123822e-06, - "loss": 0.71, - "step": 53885 - }, - { - "epoch": 1.38, - "learning_rate": 1.1760032964733535e-06, - "loss": 0.7998, - "step": 53886 - }, - { - "epoch": 1.38, - "learning_rate": 1.175976057899567e-06, - "loss": 0.4808, - "step": 53887 - }, - { - "epoch": 1.38, - "learning_rate": 1.1759488191910436e-06, - "loss": 0.5879, - "step": 53888 - }, - { - "epoch": 1.38, - "learning_rate": 1.1759215803478046e-06, - "loss": 0.5889, - "step": 53889 - }, - { - "epoch": 1.38, - "learning_rate": 1.1758943413698704e-06, - "loss": 0.6372, - "step": 53890 - }, - { - "epoch": 1.38, - "learning_rate": 1.1758671022572623e-06, - "loss": 0.6787, - "step": 53891 - }, - { - "epoch": 1.38, - "learning_rate": 1.1758398630100002e-06, - "loss": 0.7168, - "step": 53892 - }, - { - "epoch": 1.38, - "learning_rate": 1.175812623628106e-06, - "loss": 0.9678, - "step": 53893 - }, - { - "epoch": 1.38, - "learning_rate": 1.1757853841116e-06, - "loss": 0.7148, - "step": 53894 - }, - { - "epoch": 1.38, - "learning_rate": 1.1757581444605037e-06, - "loss": 0.6177, - "step": 53895 - }, - { - "epoch": 1.38, - "learning_rate": 1.1757309046748368e-06, - "loss": 0.6963, - "step": 53896 - }, - { - "epoch": 1.38, - "learning_rate": 1.1757036647546212e-06, - "loss": 0.6431, - "step": 53897 - }, - { - "epoch": 1.38, - "learning_rate": 1.1756764246998771e-06, - "loss": 0.6689, - "step": 53898 - }, - { - "epoch": 1.38, - "learning_rate": 1.1756491845106257e-06, - "loss": 0.567, - "step": 53899 - }, - { - "epoch": 1.38, - "learning_rate": 1.1756219441868883e-06, - "loss": 0.6304, - "step": 53900 - }, - { - "epoch": 1.38, - "learning_rate": 1.1755947037286846e-06, - "loss": 0.5781, - "step": 53901 - }, - { - "epoch": 1.38, - "learning_rate": 1.1755674631360363e-06, - "loss": 0.5332, - "step": 53902 - }, - { - "epoch": 1.38, - "learning_rate": 1.175540222408964e-06, - "loss": 0.4915, - "step": 53903 - }, - { - "epoch": 1.38, - "learning_rate": 1.1755129815474888e-06, - "loss": 0.6396, - "step": 53904 - }, - { - "epoch": 1.38, - "learning_rate": 1.1754857405516316e-06, - "loss": 0.4846, - "step": 53905 - }, - { - "epoch": 1.38, - "learning_rate": 1.175458499421413e-06, - "loss": 0.5564, - "step": 53906 - }, - { - "epoch": 1.38, - "learning_rate": 1.1754312581568535e-06, - "loss": 0.7236, - "step": 53907 - }, - { - "epoch": 1.38, - "learning_rate": 1.1754040167579746e-06, - "loss": 0.6768, - "step": 53908 - }, - { - "epoch": 1.38, - "learning_rate": 1.1753767752247968e-06, - "loss": 0.7915, - "step": 53909 - }, - { - "epoch": 1.38, - "learning_rate": 1.1753495335573413e-06, - "loss": 0.7271, - "step": 53910 - }, - { - "epoch": 1.38, - "learning_rate": 1.1753222917556284e-06, - "loss": 0.6929, - "step": 53911 - }, - { - "epoch": 1.38, - "learning_rate": 1.1752950498196794e-06, - "loss": 0.7412, - "step": 53912 - }, - { - "epoch": 1.38, - "learning_rate": 1.175267807749515e-06, - "loss": 0.6543, - "step": 53913 - }, - { - "epoch": 1.38, - "learning_rate": 1.1752405655451562e-06, - "loss": 0.6279, - "step": 53914 - }, - { - "epoch": 1.38, - "learning_rate": 1.1752133232066237e-06, - "loss": 0.7285, - "step": 53915 - }, - { - "epoch": 1.38, - "learning_rate": 1.1751860807339387e-06, - "loss": 0.5645, - "step": 53916 - }, - { - "epoch": 1.38, - "learning_rate": 1.1751588381271212e-06, - "loss": 0.5728, - "step": 53917 - }, - { - "epoch": 1.38, - "learning_rate": 1.1751315953861932e-06, - "loss": 0.4258, - "step": 53918 - }, - { - "epoch": 1.38, - "learning_rate": 1.1751043525111743e-06, - "loss": 0.751, - "step": 53919 - }, - { - "epoch": 1.38, - "learning_rate": 1.1750771095020867e-06, - "loss": 0.6089, - "step": 53920 - }, - { - "epoch": 1.38, - "learning_rate": 1.1750498663589506e-06, - "loss": 0.7051, - "step": 53921 - }, - { - "epoch": 1.38, - "learning_rate": 1.1750226230817863e-06, - "loss": 0.708, - "step": 53922 - }, - { - "epoch": 1.38, - "learning_rate": 1.1749953796706157e-06, - "loss": 0.4186, - "step": 53923 - }, - { - "epoch": 1.38, - "learning_rate": 1.1749681361254591e-06, - "loss": 0.6211, - "step": 53924 - }, - { - "epoch": 1.38, - "learning_rate": 1.1749408924463375e-06, - "loss": 0.5498, - "step": 53925 - }, - { - "epoch": 1.38, - "learning_rate": 1.1749136486332716e-06, - "loss": 0.4297, - "step": 53926 - }, - { - "epoch": 1.38, - "learning_rate": 1.1748864046862824e-06, - "loss": 0.4937, - "step": 53927 - }, - { - "epoch": 1.38, - "learning_rate": 1.1748591606053904e-06, - "loss": 0.6899, - "step": 53928 - }, - { - "epoch": 1.38, - "learning_rate": 1.1748319163906172e-06, - "loss": 0.8223, - "step": 53929 - }, - { - "epoch": 1.38, - "learning_rate": 1.1748046720419832e-06, - "loss": 0.7051, - "step": 53930 - }, - { - "epoch": 1.38, - "learning_rate": 1.1747774275595092e-06, - "loss": 0.688, - "step": 53931 - }, - { - "epoch": 1.38, - "learning_rate": 1.174750182943216e-06, - "loss": 0.7778, - "step": 53932 - }, - { - "epoch": 1.38, - "learning_rate": 1.174722938193125e-06, - "loss": 0.5784, - "step": 53933 - }, - { - "epoch": 1.38, - "learning_rate": 1.1746956933092565e-06, - "loss": 0.6855, - "step": 53934 - }, - { - "epoch": 1.38, - "learning_rate": 1.1746684482916316e-06, - "loss": 0.8135, - "step": 53935 - }, - { - "epoch": 1.38, - "learning_rate": 1.1746412031402708e-06, - "loss": 0.3057, - "step": 53936 - }, - { - "epoch": 1.38, - "learning_rate": 1.1746139578551954e-06, - "loss": 0.6455, - "step": 53937 - }, - { - "epoch": 1.38, - "learning_rate": 1.1745867124364261e-06, - "loss": 0.6367, - "step": 53938 - }, - { - "epoch": 1.38, - "learning_rate": 1.174559466883984e-06, - "loss": 0.5803, - "step": 53939 - }, - { - "epoch": 1.38, - "learning_rate": 1.1745322211978898e-06, - "loss": 0.814, - "step": 53940 - }, - { - "epoch": 1.38, - "learning_rate": 1.174504975378164e-06, - "loss": 0.6509, - "step": 53941 - }, - { - "epoch": 1.38, - "learning_rate": 1.1744777294248278e-06, - "loss": 0.5732, - "step": 53942 - }, - { - "epoch": 1.38, - "learning_rate": 1.1744504833379024e-06, - "loss": 0.6709, - "step": 53943 - }, - { - "epoch": 1.38, - "learning_rate": 1.174423237117408e-06, - "loss": 0.7441, - "step": 53944 - }, - { - "epoch": 1.38, - "learning_rate": 1.1743959907633656e-06, - "loss": 0.7676, - "step": 53945 - }, - { - "epoch": 1.38, - "learning_rate": 1.1743687442757963e-06, - "loss": 0.6567, - "step": 53946 - }, - { - "epoch": 1.38, - "learning_rate": 1.1743414976547209e-06, - "loss": 0.6504, - "step": 53947 - }, - { - "epoch": 1.38, - "learning_rate": 1.1743142509001603e-06, - "loss": 0.5996, - "step": 53948 - }, - { - "epoch": 1.38, - "learning_rate": 1.1742870040121352e-06, - "loss": 0.7021, - "step": 53949 - }, - { - "epoch": 1.38, - "learning_rate": 1.1742597569906667e-06, - "loss": 0.3569, - "step": 53950 - }, - { - "epoch": 1.38, - "learning_rate": 1.1742325098357752e-06, - "loss": 0.833, - "step": 53951 - }, - { - "epoch": 1.38, - "learning_rate": 1.1742052625474822e-06, - "loss": 0.5952, - "step": 53952 - }, - { - "epoch": 1.38, - "learning_rate": 1.174178015125808e-06, - "loss": 0.6387, - "step": 53953 - }, - { - "epoch": 1.38, - "learning_rate": 1.1741507675707741e-06, - "loss": 0.7188, - "step": 53954 - }, - { - "epoch": 1.38, - "learning_rate": 1.1741235198824006e-06, - "loss": 0.6978, - "step": 53955 - }, - { - "epoch": 1.38, - "learning_rate": 1.1740962720607091e-06, - "loss": 0.5825, - "step": 53956 - }, - { - "epoch": 1.38, - "learning_rate": 1.1740690241057196e-06, - "loss": 0.6787, - "step": 53957 - }, - { - "epoch": 1.38, - "learning_rate": 1.1740417760174538e-06, - "loss": 0.5693, - "step": 53958 - }, - { - "epoch": 1.38, - "learning_rate": 1.174014527795932e-06, - "loss": 0.4382, - "step": 53959 - }, - { - "epoch": 1.38, - "learning_rate": 1.1739872794411757e-06, - "loss": 0.6597, - "step": 53960 - }, - { - "epoch": 1.38, - "learning_rate": 1.1739600309532047e-06, - "loss": 0.6875, - "step": 53961 - }, - { - "epoch": 1.38, - "learning_rate": 1.173932782332041e-06, - "loss": 0.5527, - "step": 53962 - }, - { - "epoch": 1.38, - "learning_rate": 1.1739055335777046e-06, - "loss": 0.7627, - "step": 53963 - }, - { - "epoch": 1.38, - "learning_rate": 1.173878284690217e-06, - "loss": 0.5908, - "step": 53964 - }, - { - "epoch": 1.38, - "learning_rate": 1.1738510356695989e-06, - "loss": 0.667, - "step": 53965 - }, - { - "epoch": 1.38, - "learning_rate": 1.1738237865158706e-06, - "loss": 0.6162, - "step": 53966 - }, - { - "epoch": 1.38, - "learning_rate": 1.1737965372290537e-06, - "loss": 0.5259, - "step": 53967 - }, - { - "epoch": 1.38, - "learning_rate": 1.173769287809169e-06, - "loss": 0.5386, - "step": 53968 - }, - { - "epoch": 1.38, - "learning_rate": 1.173742038256237e-06, - "loss": 0.7363, - "step": 53969 - }, - { - "epoch": 1.38, - "learning_rate": 1.1737147885702782e-06, - "loss": 0.5498, - "step": 53970 - }, - { - "epoch": 1.38, - "learning_rate": 1.1736875387513146e-06, - "loss": 0.627, - "step": 53971 - }, - { - "epoch": 1.38, - "learning_rate": 1.173660288799366e-06, - "loss": 0.5293, - "step": 53972 - }, - { - "epoch": 1.38, - "learning_rate": 1.173633038714454e-06, - "loss": 0.6582, - "step": 53973 - }, - { - "epoch": 1.38, - "learning_rate": 1.1736057884965992e-06, - "loss": 0.5596, - "step": 53974 - }, - { - "epoch": 1.38, - "learning_rate": 1.1735785381458224e-06, - "loss": 0.7402, - "step": 53975 - }, - { - "epoch": 1.38, - "learning_rate": 1.1735512876621444e-06, - "loss": 0.8125, - "step": 53976 - }, - { - "epoch": 1.38, - "learning_rate": 1.1735240370455862e-06, - "loss": 0.625, - "step": 53977 - }, - { - "epoch": 1.38, - "learning_rate": 1.1734967862961685e-06, - "loss": 0.6709, - "step": 53978 - }, - { - "epoch": 1.38, - "learning_rate": 1.1734695354139126e-06, - "loss": 0.7559, - "step": 53979 - }, - { - "epoch": 1.38, - "learning_rate": 1.1734422843988387e-06, - "loss": 0.6123, - "step": 53980 - }, - { - "epoch": 1.38, - "learning_rate": 1.1734150332509683e-06, - "loss": 0.5859, - "step": 53981 - }, - { - "epoch": 1.38, - "learning_rate": 1.1733877819703214e-06, - "loss": 0.6914, - "step": 53982 - }, - { - "epoch": 1.38, - "learning_rate": 1.1733605305569202e-06, - "loss": 0.7471, - "step": 53983 - }, - { - "epoch": 1.38, - "learning_rate": 1.1733332790107846e-06, - "loss": 0.6079, - "step": 53984 - }, - { - "epoch": 1.38, - "learning_rate": 1.1733060273319355e-06, - "loss": 0.7559, - "step": 53985 - }, - { - "epoch": 1.38, - "learning_rate": 1.1732787755203938e-06, - "loss": 0.4907, - "step": 53986 - }, - { - "epoch": 1.38, - "learning_rate": 1.1732515235761811e-06, - "loss": 0.7163, - "step": 53987 - }, - { - "epoch": 1.38, - "learning_rate": 1.173224271499317e-06, - "loss": 0.4446, - "step": 53988 - }, - { - "epoch": 1.38, - "learning_rate": 1.1731970192898235e-06, - "loss": 0.8242, - "step": 53989 - }, - { - "epoch": 1.38, - "learning_rate": 1.1731697669477209e-06, - "loss": 0.5898, - "step": 53990 - }, - { - "epoch": 1.38, - "learning_rate": 1.17314251447303e-06, - "loss": 0.6528, - "step": 53991 - }, - { - "epoch": 1.38, - "learning_rate": 1.173115261865772e-06, - "loss": 0.7832, - "step": 53992 - }, - { - "epoch": 1.38, - "learning_rate": 1.1730880091259674e-06, - "loss": 0.6001, - "step": 53993 - }, - { - "epoch": 1.38, - "learning_rate": 1.1730607562536379e-06, - "loss": 0.6953, - "step": 53994 - }, - { - "epoch": 1.38, - "learning_rate": 1.173033503248803e-06, - "loss": 0.6382, - "step": 53995 - }, - { - "epoch": 1.38, - "learning_rate": 1.1730062501114848e-06, - "loss": 0.7017, - "step": 53996 - }, - { - "epoch": 1.38, - "learning_rate": 1.1729789968417033e-06, - "loss": 0.5112, - "step": 53997 - }, - { - "epoch": 1.38, - "learning_rate": 1.1729517434394799e-06, - "loss": 0.6108, - "step": 53998 - }, - { - "epoch": 1.38, - "learning_rate": 1.1729244899048354e-06, - "loss": 0.6426, - "step": 53999 - }, - { - "epoch": 1.38, - "learning_rate": 1.1728972362377905e-06, - "loss": 0.6748, - "step": 54000 - }, - { - "epoch": 1.38, - "learning_rate": 1.1728699824383658e-06, - "loss": 0.4592, - "step": 54001 - }, - { - "epoch": 1.38, - "learning_rate": 1.1728427285065829e-06, - "loss": 0.873, - "step": 54002 - }, - { - "epoch": 1.38, - "learning_rate": 1.172815474442462e-06, - "loss": 0.8398, - "step": 54003 - }, - { - "epoch": 1.38, - "learning_rate": 1.1727882202460248e-06, - "loss": 0.5227, - "step": 54004 - }, - { - "epoch": 1.38, - "learning_rate": 1.172760965917291e-06, - "loss": 0.7178, - "step": 54005 - }, - { - "epoch": 1.38, - "learning_rate": 1.1727337114562825e-06, - "loss": 0.6094, - "step": 54006 - }, - { - "epoch": 1.38, - "learning_rate": 1.1727064568630193e-06, - "loss": 0.6816, - "step": 54007 - }, - { - "epoch": 1.38, - "learning_rate": 1.1726792021375232e-06, - "loss": 0.5684, - "step": 54008 - }, - { - "epoch": 1.38, - "learning_rate": 1.1726519472798142e-06, - "loss": 0.542, - "step": 54009 - }, - { - "epoch": 1.38, - "learning_rate": 1.1726246922899135e-06, - "loss": 0.6792, - "step": 54010 - }, - { - "epoch": 1.38, - "learning_rate": 1.1725974371678423e-06, - "loss": 0.6367, - "step": 54011 - }, - { - "epoch": 1.38, - "learning_rate": 1.172570181913621e-06, - "loss": 0.6001, - "step": 54012 - }, - { - "epoch": 1.38, - "learning_rate": 1.1725429265272707e-06, - "loss": 0.5757, - "step": 54013 - }, - { - "epoch": 1.38, - "learning_rate": 1.1725156710088123e-06, - "loss": 0.6123, - "step": 54014 - }, - { - "epoch": 1.38, - "learning_rate": 1.1724884153582664e-06, - "loss": 0.7656, - "step": 54015 - }, - { - "epoch": 1.38, - "learning_rate": 1.172461159575654e-06, - "loss": 0.2573, - "step": 54016 - }, - { - "epoch": 1.38, - "learning_rate": 1.1724339036609962e-06, - "loss": 0.6113, - "step": 54017 - }, - { - "epoch": 1.38, - "learning_rate": 1.1724066476143135e-06, - "loss": 0.6001, - "step": 54018 - }, - { - "epoch": 1.38, - "learning_rate": 1.1723793914356274e-06, - "loss": 0.6863, - "step": 54019 - }, - { - "epoch": 1.38, - "learning_rate": 1.1723521351249578e-06, - "loss": 0.5208, - "step": 54020 - }, - { - "epoch": 1.38, - "learning_rate": 1.1723248786823266e-06, - "loss": 0.7402, - "step": 54021 - }, - { - "epoch": 1.38, - "learning_rate": 1.1722976221077536e-06, - "loss": 0.5244, - "step": 54022 - }, - { - "epoch": 1.38, - "learning_rate": 1.1722703654012606e-06, - "loss": 0.6729, - "step": 54023 - }, - { - "epoch": 1.38, - "learning_rate": 1.172243108562868e-06, - "loss": 0.6558, - "step": 54024 - }, - { - "epoch": 1.38, - "learning_rate": 1.1722158515925971e-06, - "loss": 0.5122, - "step": 54025 - }, - { - "epoch": 1.38, - "learning_rate": 1.172188594490468e-06, - "loss": 0.6455, - "step": 54026 - }, - { - "epoch": 1.38, - "learning_rate": 1.172161337256502e-06, - "loss": 0.4795, - "step": 54027 - }, - { - "epoch": 1.38, - "learning_rate": 1.17213407989072e-06, - "loss": 0.7402, - "step": 54028 - }, - { - "epoch": 1.38, - "learning_rate": 1.172106822393143e-06, - "loss": 0.6685, - "step": 54029 - }, - { - "epoch": 1.38, - "learning_rate": 1.172079564763792e-06, - "loss": 0.7842, - "step": 54030 - }, - { - "epoch": 1.38, - "learning_rate": 1.1720523070026873e-06, - "loss": 0.6211, - "step": 54031 - }, - { - "epoch": 1.38, - "learning_rate": 1.1720250491098499e-06, - "loss": 0.6543, - "step": 54032 - }, - { - "epoch": 1.38, - "learning_rate": 1.171997791085301e-06, - "loss": 0.7842, - "step": 54033 - }, - { - "epoch": 1.38, - "learning_rate": 1.1719705329290613e-06, - "loss": 0.4955, - "step": 54034 - }, - { - "epoch": 1.38, - "learning_rate": 1.1719432746411514e-06, - "loss": 0.5674, - "step": 54035 - }, - { - "epoch": 1.38, - "learning_rate": 1.171916016221593e-06, - "loss": 0.6255, - "step": 54036 - }, - { - "epoch": 1.38, - "learning_rate": 1.171888757670406e-06, - "loss": 0.562, - "step": 54037 - }, - { - "epoch": 1.39, - "learning_rate": 1.1718614989876117e-06, - "loss": 0.7617, - "step": 54038 - }, - { - "epoch": 1.39, - "learning_rate": 1.171834240173231e-06, - "loss": 0.7695, - "step": 54039 - }, - { - "epoch": 1.39, - "learning_rate": 1.1718069812272847e-06, - "loss": 0.6963, - "step": 54040 - }, - { - "epoch": 1.39, - "learning_rate": 1.1717797221497938e-06, - "loss": 0.7451, - "step": 54041 - }, - { - "epoch": 1.39, - "learning_rate": 1.171752462940779e-06, - "loss": 0.7432, - "step": 54042 - }, - { - "epoch": 1.39, - "learning_rate": 1.1717252036002611e-06, - "loss": 0.6108, - "step": 54043 - }, - { - "epoch": 1.39, - "learning_rate": 1.1716979441282616e-06, - "loss": 0.6265, - "step": 54044 - }, - { - "epoch": 1.39, - "learning_rate": 1.1716706845248005e-06, - "loss": 0.6462, - "step": 54045 - }, - { - "epoch": 1.39, - "learning_rate": 1.1716434247898992e-06, - "loss": 0.6094, - "step": 54046 - }, - { - "epoch": 1.39, - "learning_rate": 1.1716161649235782e-06, - "loss": 0.6523, - "step": 54047 - }, - { - "epoch": 1.39, - "learning_rate": 1.1715889049258588e-06, - "loss": 0.5645, - "step": 54048 - }, - { - "epoch": 1.39, - "learning_rate": 1.1715616447967615e-06, - "loss": 0.5864, - "step": 54049 - }, - { - "epoch": 1.39, - "learning_rate": 1.1715343845363075e-06, - "loss": 0.7227, - "step": 54050 - }, - { - "epoch": 1.39, - "learning_rate": 1.1715071241445173e-06, - "loss": 0.7051, - "step": 54051 - }, - { - "epoch": 1.39, - "learning_rate": 1.1714798636214122e-06, - "loss": 0.4463, - "step": 54052 - }, - { - "epoch": 1.39, - "learning_rate": 1.1714526029670126e-06, - "loss": 0.8057, - "step": 54053 - }, - { - "epoch": 1.39, - "learning_rate": 1.1714253421813397e-06, - "loss": 0.7393, - "step": 54054 - }, - { - "epoch": 1.39, - "learning_rate": 1.1713980812644147e-06, - "loss": 0.5239, - "step": 54055 - }, - { - "epoch": 1.39, - "learning_rate": 1.1713708202162576e-06, - "loss": 0.7549, - "step": 54056 - }, - { - "epoch": 1.39, - "learning_rate": 1.1713435590368898e-06, - "loss": 0.6221, - "step": 54057 - }, - { - "epoch": 1.39, - "learning_rate": 1.1713162977263323e-06, - "loss": 0.4668, - "step": 54058 - }, - { - "epoch": 1.39, - "learning_rate": 1.1712890362846058e-06, - "loss": 0.7598, - "step": 54059 - }, - { - "epoch": 1.39, - "learning_rate": 1.1712617747117308e-06, - "loss": 0.7793, - "step": 54060 - }, - { - "epoch": 1.39, - "learning_rate": 1.1712345130077288e-06, - "loss": 0.7705, - "step": 54061 - }, - { - "epoch": 1.39, - "learning_rate": 1.1712072511726203e-06, - "loss": 0.7002, - "step": 54062 - }, - { - "epoch": 1.39, - "learning_rate": 1.1711799892064264e-06, - "loss": 0.4927, - "step": 54063 - }, - { - "epoch": 1.39, - "learning_rate": 1.171152727109168e-06, - "loss": 0.5703, - "step": 54064 - }, - { - "epoch": 1.39, - "learning_rate": 1.1711254648808657e-06, - "loss": 0.6128, - "step": 54065 - }, - { - "epoch": 1.39, - "learning_rate": 1.1710982025215404e-06, - "loss": 0.7451, - "step": 54066 - }, - { - "epoch": 1.39, - "learning_rate": 1.171070940031213e-06, - "loss": 0.7036, - "step": 54067 - }, - { - "epoch": 1.39, - "learning_rate": 1.1710436774099047e-06, - "loss": 0.6465, - "step": 54068 - }, - { - "epoch": 1.39, - "learning_rate": 1.1710164146576363e-06, - "loss": 0.749, - "step": 54069 - }, - { - "epoch": 1.39, - "learning_rate": 1.1709891517744278e-06, - "loss": 0.6636, - "step": 54070 - }, - { - "epoch": 1.39, - "learning_rate": 1.1709618887603011e-06, - "loss": 0.8389, - "step": 54071 - }, - { - "epoch": 1.39, - "learning_rate": 1.1709346256152767e-06, - "loss": 0.4331, - "step": 54072 - }, - { - "epoch": 1.39, - "learning_rate": 1.170907362339376e-06, - "loss": 0.5381, - "step": 54073 - }, - { - "epoch": 1.39, - "learning_rate": 1.170880098932619e-06, - "loss": 0.5391, - "step": 54074 - }, - { - "epoch": 1.39, - "learning_rate": 1.170852835395027e-06, - "loss": 0.6802, - "step": 54075 - }, - { - "epoch": 1.39, - "learning_rate": 1.1708255717266206e-06, - "loss": 0.4626, - "step": 54076 - }, - { - "epoch": 1.39, - "learning_rate": 1.1707983079274212e-06, - "loss": 0.7974, - "step": 54077 - }, - { - "epoch": 1.39, - "learning_rate": 1.1707710439974492e-06, - "loss": 0.5278, - "step": 54078 - }, - { - "epoch": 1.39, - "learning_rate": 1.1707437799367259e-06, - "loss": 0.7178, - "step": 54079 - }, - { - "epoch": 1.39, - "learning_rate": 1.1707165157452718e-06, - "loss": 0.6169, - "step": 54080 - }, - { - "epoch": 1.39, - "learning_rate": 1.170689251423108e-06, - "loss": 0.6953, - "step": 54081 - }, - { - "epoch": 1.39, - "learning_rate": 1.170661986970255e-06, - "loss": 0.5938, - "step": 54082 - }, - { - "epoch": 1.39, - "learning_rate": 1.170634722386734e-06, - "loss": 0.6162, - "step": 54083 - }, - { - "epoch": 1.39, - "learning_rate": 1.1706074576725665e-06, - "loss": 0.5684, - "step": 54084 - }, - { - "epoch": 1.39, - "learning_rate": 1.170580192827772e-06, - "loss": 0.647, - "step": 54085 - }, - { - "epoch": 1.39, - "learning_rate": 1.1705529278523725e-06, - "loss": 0.4531, - "step": 54086 - }, - { - "epoch": 1.39, - "learning_rate": 1.1705256627463883e-06, - "loss": 0.8623, - "step": 54087 - }, - { - "epoch": 1.39, - "learning_rate": 1.1704983975098404e-06, - "loss": 0.7061, - "step": 54088 - }, - { - "epoch": 1.39, - "learning_rate": 1.1704711321427498e-06, - "loss": 0.5388, - "step": 54089 - }, - { - "epoch": 1.39, - "learning_rate": 1.1704438666451373e-06, - "loss": 0.6318, - "step": 54090 - }, - { - "epoch": 1.39, - "learning_rate": 1.1704166010170235e-06, - "loss": 0.5752, - "step": 54091 - }, - { - "epoch": 1.39, - "learning_rate": 1.17038933525843e-06, - "loss": 0.6465, - "step": 54092 - }, - { - "epoch": 1.39, - "learning_rate": 1.1703620693693767e-06, - "loss": 0.489, - "step": 54093 - }, - { - "epoch": 1.39, - "learning_rate": 1.1703348033498856e-06, - "loss": 0.7236, - "step": 54094 - }, - { - "epoch": 1.39, - "learning_rate": 1.1703075371999764e-06, - "loss": 0.5575, - "step": 54095 - }, - { - "epoch": 1.39, - "learning_rate": 1.1702802709196712e-06, - "loss": 0.7266, - "step": 54096 - }, - { - "epoch": 1.39, - "learning_rate": 1.1702530045089895e-06, - "loss": 0.8398, - "step": 54097 - }, - { - "epoch": 1.39, - "learning_rate": 1.1702257379679532e-06, - "loss": 0.582, - "step": 54098 - }, - { - "epoch": 1.39, - "learning_rate": 1.1701984712965832e-06, - "loss": 0.7305, - "step": 54099 - }, - { - "epoch": 1.39, - "learning_rate": 1.1701712044948995e-06, - "loss": 0.6064, - "step": 54100 - }, - { - "epoch": 1.39, - "learning_rate": 1.1701439375629238e-06, - "loss": 0.7808, - "step": 54101 - }, - { - "epoch": 1.39, - "learning_rate": 1.1701166705006767e-06, - "loss": 0.7373, - "step": 54102 - }, - { - "epoch": 1.39, - "learning_rate": 1.1700894033081792e-06, - "loss": 0.6074, - "step": 54103 - }, - { - "epoch": 1.39, - "learning_rate": 1.1700621359854519e-06, - "loss": 0.6284, - "step": 54104 - }, - { - "epoch": 1.39, - "learning_rate": 1.170034868532516e-06, - "loss": 0.6953, - "step": 54105 - }, - { - "epoch": 1.39, - "learning_rate": 1.170007600949392e-06, - "loss": 0.7891, - "step": 54106 - }, - { - "epoch": 1.39, - "learning_rate": 1.169980333236101e-06, - "loss": 0.5806, - "step": 54107 - }, - { - "epoch": 1.39, - "learning_rate": 1.1699530653926638e-06, - "loss": 0.6724, - "step": 54108 - }, - { - "epoch": 1.39, - "learning_rate": 1.169925797419102e-06, - "loss": 0.6855, - "step": 54109 - }, - { - "epoch": 1.39, - "learning_rate": 1.1698985293154354e-06, - "loss": 0.6807, - "step": 54110 - }, - { - "epoch": 1.39, - "learning_rate": 1.1698712610816852e-06, - "loss": 0.6807, - "step": 54111 - }, - { - "epoch": 1.39, - "learning_rate": 1.1698439927178722e-06, - "loss": 0.6353, - "step": 54112 - }, - { - "epoch": 1.39, - "learning_rate": 1.169816724224018e-06, - "loss": 0.521, - "step": 54113 - }, - { - "epoch": 1.39, - "learning_rate": 1.1697894556001427e-06, - "loss": 0.6943, - "step": 54114 - }, - { - "epoch": 1.39, - "learning_rate": 1.1697621868462675e-06, - "loss": 0.7261, - "step": 54115 - }, - { - "epoch": 1.39, - "learning_rate": 1.169734917962413e-06, - "loss": 0.6533, - "step": 54116 - }, - { - "epoch": 1.39, - "learning_rate": 1.1697076489486005e-06, - "loss": 0.5078, - "step": 54117 - }, - { - "epoch": 1.39, - "learning_rate": 1.1696803798048502e-06, - "loss": 0.876, - "step": 54118 - }, - { - "epoch": 1.39, - "learning_rate": 1.169653110531184e-06, - "loss": 0.6401, - "step": 54119 - }, - { - "epoch": 1.39, - "learning_rate": 1.169625841127622e-06, - "loss": 0.5454, - "step": 54120 - }, - { - "epoch": 1.39, - "learning_rate": 1.1695985715941853e-06, - "loss": 0.5581, - "step": 54121 - }, - { - "epoch": 1.39, - "learning_rate": 1.1695713019308947e-06, - "loss": 0.8018, - "step": 54122 - }, - { - "epoch": 1.39, - "learning_rate": 1.1695440321377712e-06, - "loss": 0.5439, - "step": 54123 - }, - { - "epoch": 1.39, - "learning_rate": 1.1695167622148357e-06, - "loss": 0.5242, - "step": 54124 - }, - { - "epoch": 1.39, - "learning_rate": 1.1694894921621087e-06, - "loss": 0.7295, - "step": 54125 - }, - { - "epoch": 1.39, - "learning_rate": 1.1694622219796117e-06, - "loss": 0.6426, - "step": 54126 - }, - { - "epoch": 1.39, - "learning_rate": 1.1694349516673652e-06, - "loss": 0.438, - "step": 54127 - }, - { - "epoch": 1.39, - "learning_rate": 1.1694076812253902e-06, - "loss": 0.5947, - "step": 54128 - }, - { - "epoch": 1.39, - "learning_rate": 1.1693804106537075e-06, - "loss": 0.4265, - "step": 54129 - }, - { - "epoch": 1.39, - "learning_rate": 1.169353139952338e-06, - "loss": 0.667, - "step": 54130 - }, - { - "epoch": 1.39, - "learning_rate": 1.1693258691213026e-06, - "loss": 0.7412, - "step": 54131 - }, - { - "epoch": 1.39, - "learning_rate": 1.169298598160622e-06, - "loss": 0.6523, - "step": 54132 - }, - { - "epoch": 1.39, - "learning_rate": 1.1692713270703173e-06, - "loss": 0.7363, - "step": 54133 - }, - { - "epoch": 1.39, - "learning_rate": 1.1692440558504099e-06, - "loss": 0.4717, - "step": 54134 - }, - { - "epoch": 1.39, - "learning_rate": 1.1692167845009193e-06, - "loss": 0.7129, - "step": 54135 - }, - { - "epoch": 1.39, - "learning_rate": 1.1691895130218676e-06, - "loss": 0.6006, - "step": 54136 - }, - { - "epoch": 1.39, - "learning_rate": 1.169162241413275e-06, - "loss": 0.4907, - "step": 54137 - }, - { - "epoch": 1.39, - "learning_rate": 1.1691349696751628e-06, - "loss": 0.6963, - "step": 54138 - }, - { - "epoch": 1.39, - "learning_rate": 1.1691076978075521e-06, - "loss": 0.6455, - "step": 54139 - }, - { - "epoch": 1.39, - "learning_rate": 1.169080425810463e-06, - "loss": 0.6211, - "step": 54140 - }, - { - "epoch": 1.39, - "learning_rate": 1.1690531536839168e-06, - "loss": 0.4861, - "step": 54141 - }, - { - "epoch": 1.39, - "learning_rate": 1.1690258814279345e-06, - "loss": 0.6719, - "step": 54142 - }, - { - "epoch": 1.39, - "learning_rate": 1.1689986090425366e-06, - "loss": 0.7334, - "step": 54143 - }, - { - "epoch": 1.39, - "learning_rate": 1.1689713365277445e-06, - "loss": 0.5059, - "step": 54144 - }, - { - "epoch": 1.39, - "learning_rate": 1.1689440638835788e-06, - "loss": 0.7148, - "step": 54145 - }, - { - "epoch": 1.39, - "learning_rate": 1.16891679111006e-06, - "loss": 0.4995, - "step": 54146 - }, - { - "epoch": 1.39, - "learning_rate": 1.1688895182072101e-06, - "loss": 0.6602, - "step": 54147 - }, - { - "epoch": 1.39, - "learning_rate": 1.1688622451750488e-06, - "loss": 0.5859, - "step": 54148 - }, - { - "epoch": 1.39, - "learning_rate": 1.1688349720135978e-06, - "loss": 0.6978, - "step": 54149 - }, - { - "epoch": 1.39, - "learning_rate": 1.168807698722877e-06, - "loss": 0.6665, - "step": 54150 - }, - { - "epoch": 1.39, - "learning_rate": 1.1687804253029083e-06, - "loss": 0.5537, - "step": 54151 - }, - { - "epoch": 1.39, - "learning_rate": 1.168753151753712e-06, - "loss": 0.5413, - "step": 54152 - }, - { - "epoch": 1.39, - "learning_rate": 1.1687258780753095e-06, - "loss": 0.448, - "step": 54153 - }, - { - "epoch": 1.39, - "learning_rate": 1.1686986042677212e-06, - "loss": 0.5625, - "step": 54154 - }, - { - "epoch": 1.39, - "learning_rate": 1.1686713303309683e-06, - "loss": 0.6807, - "step": 54155 - }, - { - "epoch": 1.39, - "learning_rate": 1.1686440562650712e-06, - "loss": 0.6479, - "step": 54156 - }, - { - "epoch": 1.39, - "learning_rate": 1.1686167820700511e-06, - "loss": 0.4851, - "step": 54157 - }, - { - "epoch": 1.39, - "learning_rate": 1.168589507745929e-06, - "loss": 0.6973, - "step": 54158 - }, - { - "epoch": 1.39, - "learning_rate": 1.1685622332927261e-06, - "loss": 0.6406, - "step": 54159 - }, - { - "epoch": 1.39, - "learning_rate": 1.1685349587104623e-06, - "loss": 0.4972, - "step": 54160 - }, - { - "epoch": 1.39, - "learning_rate": 1.168507683999159e-06, - "loss": 0.6895, - "step": 54161 - }, - { - "epoch": 1.39, - "learning_rate": 1.1684804091588372e-06, - "loss": 0.707, - "step": 54162 - }, - { - "epoch": 1.39, - "learning_rate": 1.1684531341895178e-06, - "loss": 0.7339, - "step": 54163 - }, - { - "epoch": 1.39, - "learning_rate": 1.1684258590912216e-06, - "loss": 0.7861, - "step": 54164 - }, - { - "epoch": 1.39, - "learning_rate": 1.1683985838639693e-06, - "loss": 0.8301, - "step": 54165 - }, - { - "epoch": 1.39, - "learning_rate": 1.1683713085077823e-06, - "loss": 0.5928, - "step": 54166 - }, - { - "epoch": 1.39, - "learning_rate": 1.1683440330226809e-06, - "loss": 0.7627, - "step": 54167 - }, - { - "epoch": 1.39, - "learning_rate": 1.168316757408686e-06, - "loss": 0.542, - "step": 54168 - }, - { - "epoch": 1.39, - "learning_rate": 1.168289481665819e-06, - "loss": 0.7207, - "step": 54169 - }, - { - "epoch": 1.39, - "learning_rate": 1.1682622057941005e-06, - "loss": 0.6577, - "step": 54170 - }, - { - "epoch": 1.39, - "learning_rate": 1.168234929793551e-06, - "loss": 0.6118, - "step": 54171 - }, - { - "epoch": 1.39, - "learning_rate": 1.1682076536641922e-06, - "loss": 0.6094, - "step": 54172 - }, - { - "epoch": 1.39, - "learning_rate": 1.168180377406044e-06, - "loss": 0.6274, - "step": 54173 - }, - { - "epoch": 1.39, - "learning_rate": 1.1681531010191287e-06, - "loss": 0.75, - "step": 54174 - }, - { - "epoch": 1.39, - "learning_rate": 1.1681258245034655e-06, - "loss": 0.7393, - "step": 54175 - }, - { - "epoch": 1.39, - "learning_rate": 1.1680985478590763e-06, - "loss": 0.4712, - "step": 54176 - }, - { - "epoch": 1.39, - "learning_rate": 1.1680712710859818e-06, - "loss": 0.6299, - "step": 54177 - }, - { - "epoch": 1.39, - "learning_rate": 1.1680439941842028e-06, - "loss": 0.4067, - "step": 54178 - }, - { - "epoch": 1.39, - "learning_rate": 1.1680167171537605e-06, - "loss": 0.6465, - "step": 54179 - }, - { - "epoch": 1.39, - "learning_rate": 1.1679894399946754e-06, - "loss": 0.623, - "step": 54180 - }, - { - "epoch": 1.39, - "learning_rate": 1.1679621627069685e-06, - "loss": 0.551, - "step": 54181 - }, - { - "epoch": 1.39, - "learning_rate": 1.1679348852906605e-06, - "loss": 0.6201, - "step": 54182 - }, - { - "epoch": 1.39, - "learning_rate": 1.1679076077457725e-06, - "loss": 0.8164, - "step": 54183 - }, - { - "epoch": 1.39, - "learning_rate": 1.167880330072326e-06, - "loss": 0.4707, - "step": 54184 - }, - { - "epoch": 1.39, - "learning_rate": 1.1678530522703405e-06, - "loss": 0.6047, - "step": 54185 - }, - { - "epoch": 1.39, - "learning_rate": 1.1678257743398378e-06, - "loss": 0.6426, - "step": 54186 - }, - { - "epoch": 1.39, - "learning_rate": 1.1677984962808388e-06, - "loss": 0.6797, - "step": 54187 - }, - { - "epoch": 1.39, - "learning_rate": 1.167771218093364e-06, - "loss": 0.5615, - "step": 54188 - }, - { - "epoch": 1.39, - "learning_rate": 1.1677439397774347e-06, - "loss": 0.8057, - "step": 54189 - }, - { - "epoch": 1.39, - "learning_rate": 1.1677166613330714e-06, - "loss": 0.6353, - "step": 54190 - }, - { - "epoch": 1.39, - "learning_rate": 1.1676893827602952e-06, - "loss": 0.6182, - "step": 54191 - }, - { - "epoch": 1.39, - "learning_rate": 1.1676621040591267e-06, - "loss": 0.7109, - "step": 54192 - }, - { - "epoch": 1.39, - "learning_rate": 1.1676348252295875e-06, - "loss": 0.8506, - "step": 54193 - }, - { - "epoch": 1.39, - "learning_rate": 1.1676075462716978e-06, - "loss": 0.5935, - "step": 54194 - }, - { - "epoch": 1.39, - "learning_rate": 1.167580267185479e-06, - "loss": 0.5745, - "step": 54195 - }, - { - "epoch": 1.39, - "learning_rate": 1.1675529879709514e-06, - "loss": 0.5083, - "step": 54196 - }, - { - "epoch": 1.39, - "learning_rate": 1.1675257086281363e-06, - "loss": 0.6431, - "step": 54197 - }, - { - "epoch": 1.39, - "learning_rate": 1.1674984291570543e-06, - "loss": 0.5903, - "step": 54198 - }, - { - "epoch": 1.39, - "learning_rate": 1.1674711495577268e-06, - "loss": 0.6826, - "step": 54199 - }, - { - "epoch": 1.39, - "learning_rate": 1.1674438698301739e-06, - "loss": 0.5811, - "step": 54200 - }, - { - "epoch": 1.39, - "learning_rate": 1.1674165899744174e-06, - "loss": 0.5977, - "step": 54201 - }, - { - "epoch": 1.39, - "learning_rate": 1.167389309990477e-06, - "loss": 0.7041, - "step": 54202 - }, - { - "epoch": 1.39, - "learning_rate": 1.167362029878375e-06, - "loss": 0.7793, - "step": 54203 - }, - { - "epoch": 1.39, - "learning_rate": 1.1673347496381313e-06, - "loss": 0.7373, - "step": 54204 - }, - { - "epoch": 1.39, - "learning_rate": 1.167307469269767e-06, - "loss": 0.5859, - "step": 54205 - }, - { - "epoch": 1.39, - "learning_rate": 1.1672801887733033e-06, - "loss": 0.7432, - "step": 54206 - }, - { - "epoch": 1.39, - "learning_rate": 1.1672529081487607e-06, - "loss": 0.5303, - "step": 54207 - }, - { - "epoch": 1.39, - "learning_rate": 1.16722562739616e-06, - "loss": 0.6411, - "step": 54208 - }, - { - "epoch": 1.39, - "learning_rate": 1.1671983465155228e-06, - "loss": 0.6816, - "step": 54209 - }, - { - "epoch": 1.39, - "learning_rate": 1.1671710655068694e-06, - "loss": 0.5269, - "step": 54210 - }, - { - "epoch": 1.39, - "learning_rate": 1.1671437843702208e-06, - "loss": 0.3887, - "step": 54211 - }, - { - "epoch": 1.39, - "learning_rate": 1.1671165031055975e-06, - "loss": 0.7773, - "step": 54212 - }, - { - "epoch": 1.39, - "learning_rate": 1.1670892217130213e-06, - "loss": 0.8208, - "step": 54213 - }, - { - "epoch": 1.39, - "learning_rate": 1.1670619401925124e-06, - "loss": 0.8203, - "step": 54214 - }, - { - "epoch": 1.39, - "learning_rate": 1.1670346585440916e-06, - "loss": 0.5161, - "step": 54215 - }, - { - "epoch": 1.39, - "learning_rate": 1.1670073767677804e-06, - "loss": 0.7168, - "step": 54216 - }, - { - "epoch": 1.39, - "learning_rate": 1.1669800948635988e-06, - "loss": 0.8213, - "step": 54217 - }, - { - "epoch": 1.39, - "learning_rate": 1.1669528128315688e-06, - "loss": 0.625, - "step": 54218 - }, - { - "epoch": 1.39, - "learning_rate": 1.1669255306717105e-06, - "loss": 0.6353, - "step": 54219 - }, - { - "epoch": 1.39, - "learning_rate": 1.166898248384045e-06, - "loss": 0.6709, - "step": 54220 - }, - { - "epoch": 1.39, - "learning_rate": 1.1668709659685932e-06, - "loss": 0.6958, - "step": 54221 - }, - { - "epoch": 1.39, - "learning_rate": 1.1668436834253759e-06, - "loss": 0.7256, - "step": 54222 - }, - { - "epoch": 1.39, - "learning_rate": 1.1668164007544143e-06, - "loss": 0.6904, - "step": 54223 - }, - { - "epoch": 1.39, - "learning_rate": 1.1667891179557289e-06, - "loss": 0.5703, - "step": 54224 - }, - { - "epoch": 1.39, - "learning_rate": 1.1667618350293405e-06, - "loss": 0.7314, - "step": 54225 - }, - { - "epoch": 1.39, - "learning_rate": 1.1667345519752704e-06, - "loss": 0.5371, - "step": 54226 - }, - { - "epoch": 1.39, - "learning_rate": 1.1667072687935393e-06, - "loss": 0.7715, - "step": 54227 - }, - { - "epoch": 1.39, - "learning_rate": 1.1666799854841684e-06, - "loss": 0.6465, - "step": 54228 - }, - { - "epoch": 1.39, - "learning_rate": 1.1666527020471782e-06, - "loss": 0.709, - "step": 54229 - }, - { - "epoch": 1.39, - "learning_rate": 1.1666254184825895e-06, - "loss": 0.7832, - "step": 54230 - }, - { - "epoch": 1.39, - "learning_rate": 1.1665981347904232e-06, - "loss": 0.6489, - "step": 54231 - }, - { - "epoch": 1.39, - "learning_rate": 1.1665708509707007e-06, - "loss": 0.627, - "step": 54232 - }, - { - "epoch": 1.39, - "learning_rate": 1.1665435670234426e-06, - "loss": 0.6641, - "step": 54233 - }, - { - "epoch": 1.39, - "learning_rate": 1.1665162829486694e-06, - "loss": 0.6304, - "step": 54234 - }, - { - "epoch": 1.39, - "learning_rate": 1.1664889987464026e-06, - "loss": 0.7148, - "step": 54235 - }, - { - "epoch": 1.39, - "learning_rate": 1.1664617144166627e-06, - "loss": 0.752, - "step": 54236 - }, - { - "epoch": 1.39, - "learning_rate": 1.1664344299594709e-06, - "loss": 0.4512, - "step": 54237 - }, - { - "epoch": 1.39, - "learning_rate": 1.1664071453748478e-06, - "loss": 0.4971, - "step": 54238 - }, - { - "epoch": 1.39, - "learning_rate": 1.1663798606628147e-06, - "loss": 0.5913, - "step": 54239 - }, - { - "epoch": 1.39, - "learning_rate": 1.1663525758233916e-06, - "loss": 0.5085, - "step": 54240 - }, - { - "epoch": 1.39, - "learning_rate": 1.1663252908566004e-06, - "loss": 0.5979, - "step": 54241 - }, - { - "epoch": 1.39, - "learning_rate": 1.1662980057624612e-06, - "loss": 0.5822, - "step": 54242 - }, - { - "epoch": 1.39, - "learning_rate": 1.1662707205409958e-06, - "loss": 0.6953, - "step": 54243 - }, - { - "epoch": 1.39, - "learning_rate": 1.166243435192224e-06, - "loss": 0.6836, - "step": 54244 - }, - { - "epoch": 1.39, - "learning_rate": 1.1662161497161678e-06, - "loss": 0.5139, - "step": 54245 - }, - { - "epoch": 1.39, - "learning_rate": 1.166188864112847e-06, - "loss": 0.4673, - "step": 54246 - }, - { - "epoch": 1.39, - "learning_rate": 1.1661615783822835e-06, - "loss": 0.7129, - "step": 54247 - }, - { - "epoch": 1.39, - "learning_rate": 1.1661342925244974e-06, - "loss": 0.7607, - "step": 54248 - }, - { - "epoch": 1.39, - "learning_rate": 1.1661070065395102e-06, - "loss": 0.5684, - "step": 54249 - }, - { - "epoch": 1.39, - "learning_rate": 1.166079720427342e-06, - "loss": 0.6875, - "step": 54250 - }, - { - "epoch": 1.39, - "learning_rate": 1.1660524341880146e-06, - "loss": 0.8057, - "step": 54251 - }, - { - "epoch": 1.39, - "learning_rate": 1.1660251478215485e-06, - "loss": 0.5336, - "step": 54252 - }, - { - "epoch": 1.39, - "learning_rate": 1.1659978613279645e-06, - "loss": 0.8193, - "step": 54253 - }, - { - "epoch": 1.39, - "learning_rate": 1.1659705747072837e-06, - "loss": 0.6177, - "step": 54254 - }, - { - "epoch": 1.39, - "learning_rate": 1.1659432879595263e-06, - "loss": 0.4197, - "step": 54255 - }, - { - "epoch": 1.39, - "learning_rate": 1.1659160010847144e-06, - "loss": 0.6729, - "step": 54256 - }, - { - "epoch": 1.39, - "learning_rate": 1.165888714082868e-06, - "loss": 0.6135, - "step": 54257 - }, - { - "epoch": 1.39, - "learning_rate": 1.1658614269540083e-06, - "loss": 0.6294, - "step": 54258 - }, - { - "epoch": 1.39, - "learning_rate": 1.1658341396981559e-06, - "loss": 0.7422, - "step": 54259 - }, - { - "epoch": 1.39, - "learning_rate": 1.1658068523153324e-06, - "loss": 0.6035, - "step": 54260 - }, - { - "epoch": 1.39, - "learning_rate": 1.1657795648055577e-06, - "loss": 0.7666, - "step": 54261 - }, - { - "epoch": 1.39, - "learning_rate": 1.1657522771688534e-06, - "loss": 0.7158, - "step": 54262 - }, - { - "epoch": 1.39, - "learning_rate": 1.1657249894052403e-06, - "loss": 0.8389, - "step": 54263 - }, - { - "epoch": 1.39, - "learning_rate": 1.1656977015147393e-06, - "loss": 0.5908, - "step": 54264 - }, - { - "epoch": 1.39, - "learning_rate": 1.165670413497371e-06, - "loss": 0.4788, - "step": 54265 - }, - { - "epoch": 1.39, - "learning_rate": 1.1656431253531564e-06, - "loss": 0.7998, - "step": 54266 - }, - { - "epoch": 1.39, - "learning_rate": 1.1656158370821165e-06, - "loss": 0.5981, - "step": 54267 - }, - { - "epoch": 1.39, - "learning_rate": 1.1655885486842725e-06, - "loss": 0.7031, - "step": 54268 - }, - { - "epoch": 1.39, - "learning_rate": 1.1655612601596445e-06, - "loss": 0.7363, - "step": 54269 - }, - { - "epoch": 1.39, - "learning_rate": 1.165533971508254e-06, - "loss": 0.4259, - "step": 54270 - }, - { - "epoch": 1.39, - "learning_rate": 1.1655066827301219e-06, - "loss": 0.584, - "step": 54271 - }, - { - "epoch": 1.39, - "learning_rate": 1.1654793938252689e-06, - "loss": 0.7031, - "step": 54272 - }, - { - "epoch": 1.39, - "learning_rate": 1.165452104793716e-06, - "loss": 0.7705, - "step": 54273 - }, - { - "epoch": 1.39, - "learning_rate": 1.165424815635484e-06, - "loss": 0.582, - "step": 54274 - }, - { - "epoch": 1.39, - "learning_rate": 1.1653975263505935e-06, - "loss": 0.6855, - "step": 54275 - }, - { - "epoch": 1.39, - "learning_rate": 1.1653702369390662e-06, - "loss": 0.5244, - "step": 54276 - }, - { - "epoch": 1.39, - "learning_rate": 1.165342947400922e-06, - "loss": 0.7334, - "step": 54277 - }, - { - "epoch": 1.39, - "learning_rate": 1.1653156577361826e-06, - "loss": 0.6646, - "step": 54278 - }, - { - "epoch": 1.39, - "learning_rate": 1.1652883679448688e-06, - "loss": 0.5815, - "step": 54279 - }, - { - "epoch": 1.39, - "learning_rate": 1.165261078027001e-06, - "loss": 0.6333, - "step": 54280 - }, - { - "epoch": 1.39, - "learning_rate": 1.1652337879826005e-06, - "loss": 0.6187, - "step": 54281 - }, - { - "epoch": 1.39, - "learning_rate": 1.1652064978116878e-06, - "loss": 0.5874, - "step": 54282 - }, - { - "epoch": 1.39, - "learning_rate": 1.1651792075142847e-06, - "loss": 0.79, - "step": 54283 - }, - { - "epoch": 1.39, - "learning_rate": 1.1651519170904109e-06, - "loss": 0.5264, - "step": 54284 - }, - { - "epoch": 1.39, - "learning_rate": 1.1651246265400882e-06, - "loss": 0.6641, - "step": 54285 - }, - { - "epoch": 1.39, - "learning_rate": 1.1650973358633369e-06, - "loss": 0.6616, - "step": 54286 - }, - { - "epoch": 1.39, - "learning_rate": 1.1650700450601785e-06, - "loss": 0.7021, - "step": 54287 - }, - { - "epoch": 1.39, - "learning_rate": 1.1650427541306336e-06, - "loss": 0.7314, - "step": 54288 - }, - { - "epoch": 1.39, - "learning_rate": 1.1650154630747229e-06, - "loss": 0.4194, - "step": 54289 - }, - { - "epoch": 1.39, - "learning_rate": 1.164988171892467e-06, - "loss": 0.71, - "step": 54290 - }, - { - "epoch": 1.39, - "learning_rate": 1.1649608805838878e-06, - "loss": 0.7578, - "step": 54291 - }, - { - "epoch": 1.39, - "learning_rate": 1.1649335891490052e-06, - "loss": 0.5239, - "step": 54292 - }, - { - "epoch": 1.39, - "learning_rate": 1.1649062975878412e-06, - "loss": 0.4751, - "step": 54293 - }, - { - "epoch": 1.39, - "learning_rate": 1.1648790059004155e-06, - "loss": 0.79, - "step": 54294 - }, - { - "epoch": 1.39, - "learning_rate": 1.1648517140867498e-06, - "loss": 0.8242, - "step": 54295 - }, - { - "epoch": 1.39, - "learning_rate": 1.1648244221468644e-06, - "loss": 0.5959, - "step": 54296 - }, - { - "epoch": 1.39, - "learning_rate": 1.1647971300807807e-06, - "loss": 0.4927, - "step": 54297 - }, - { - "epoch": 1.39, - "learning_rate": 1.1647698378885196e-06, - "loss": 0.5635, - "step": 54298 - }, - { - "epoch": 1.39, - "learning_rate": 1.1647425455701014e-06, - "loss": 0.708, - "step": 54299 - }, - { - "epoch": 1.39, - "learning_rate": 1.1647152531255476e-06, - "loss": 0.5947, - "step": 54300 - }, - { - "epoch": 1.39, - "learning_rate": 1.164687960554879e-06, - "loss": 0.6704, - "step": 54301 - }, - { - "epoch": 1.39, - "learning_rate": 1.1646606678581164e-06, - "loss": 0.7529, - "step": 54302 - }, - { - "epoch": 1.39, - "learning_rate": 1.1646333750352805e-06, - "loss": 0.5659, - "step": 54303 - }, - { - "epoch": 1.39, - "learning_rate": 1.1646060820863928e-06, - "loss": 0.481, - "step": 54304 - }, - { - "epoch": 1.39, - "learning_rate": 1.1645787890114733e-06, - "loss": 0.5164, - "step": 54305 - }, - { - "epoch": 1.39, - "learning_rate": 1.1645514958105436e-06, - "loss": 0.4172, - "step": 54306 - }, - { - "epoch": 1.39, - "learning_rate": 1.1645242024836242e-06, - "loss": 0.6504, - "step": 54307 - }, - { - "epoch": 1.39, - "learning_rate": 1.1644969090307369e-06, - "loss": 0.5659, - "step": 54308 - }, - { - "epoch": 1.39, - "learning_rate": 1.164469615451901e-06, - "loss": 0.6484, - "step": 54309 - }, - { - "epoch": 1.39, - "learning_rate": 1.1644423217471389e-06, - "loss": 0.7041, - "step": 54310 - }, - { - "epoch": 1.39, - "learning_rate": 1.1644150279164704e-06, - "loss": 0.5352, - "step": 54311 - }, - { - "epoch": 1.39, - "learning_rate": 1.1643877339599171e-06, - "loss": 0.5498, - "step": 54312 - }, - { - "epoch": 1.39, - "learning_rate": 1.1643604398774999e-06, - "loss": 0.623, - "step": 54313 - }, - { - "epoch": 1.39, - "learning_rate": 1.1643331456692391e-06, - "loss": 0.6211, - "step": 54314 - }, - { - "epoch": 1.39, - "learning_rate": 1.164305851335156e-06, - "loss": 0.625, - "step": 54315 - }, - { - "epoch": 1.39, - "learning_rate": 1.1642785568752715e-06, - "loss": 0.7339, - "step": 54316 - }, - { - "epoch": 1.39, - "learning_rate": 1.1642512622896063e-06, - "loss": 0.6587, - "step": 54317 - }, - { - "epoch": 1.39, - "learning_rate": 1.164223967578182e-06, - "loss": 0.6709, - "step": 54318 - }, - { - "epoch": 1.39, - "learning_rate": 1.1641966727410185e-06, - "loss": 0.6226, - "step": 54319 - }, - { - "epoch": 1.39, - "learning_rate": 1.1641693777781374e-06, - "loss": 0.7197, - "step": 54320 - }, - { - "epoch": 1.39, - "learning_rate": 1.1641420826895591e-06, - "loss": 0.8027, - "step": 54321 - }, - { - "epoch": 1.39, - "learning_rate": 1.164114787475305e-06, - "loss": 0.75, - "step": 54322 - }, - { - "epoch": 1.39, - "learning_rate": 1.1640874921353958e-06, - "loss": 0.6416, - "step": 54323 - }, - { - "epoch": 1.39, - "learning_rate": 1.164060196669852e-06, - "loss": 0.8311, - "step": 54324 - }, - { - "epoch": 1.39, - "learning_rate": 1.164032901078695e-06, - "loss": 0.7256, - "step": 54325 - }, - { - "epoch": 1.39, - "learning_rate": 1.1640056053619455e-06, - "loss": 0.6934, - "step": 54326 - }, - { - "epoch": 1.39, - "learning_rate": 1.1639783095196246e-06, - "loss": 0.7744, - "step": 54327 - }, - { - "epoch": 1.39, - "learning_rate": 1.1639510135517533e-06, - "loss": 0.5576, - "step": 54328 - }, - { - "epoch": 1.39, - "learning_rate": 1.1639237174583521e-06, - "loss": 0.4854, - "step": 54329 - }, - { - "epoch": 1.39, - "learning_rate": 1.1638964212394418e-06, - "loss": 0.6704, - "step": 54330 - }, - { - "epoch": 1.39, - "learning_rate": 1.1638691248950436e-06, - "loss": 0.5845, - "step": 54331 - }, - { - "epoch": 1.39, - "learning_rate": 1.1638418284251782e-06, - "loss": 0.6182, - "step": 54332 - }, - { - "epoch": 1.39, - "learning_rate": 1.163814531829867e-06, - "loss": 0.4802, - "step": 54333 - }, - { - "epoch": 1.39, - "learning_rate": 1.1637872351091304e-06, - "loss": 0.7266, - "step": 54334 - }, - { - "epoch": 1.39, - "learning_rate": 1.1637599382629895e-06, - "loss": 0.6748, - "step": 54335 - }, - { - "epoch": 1.39, - "learning_rate": 1.163732641291465e-06, - "loss": 0.6816, - "step": 54336 - }, - { - "epoch": 1.39, - "learning_rate": 1.1637053441945782e-06, - "loss": 0.5, - "step": 54337 - }, - { - "epoch": 1.39, - "learning_rate": 1.1636780469723495e-06, - "loss": 0.6357, - "step": 54338 - }, - { - "epoch": 1.39, - "learning_rate": 1.1636507496248002e-06, - "loss": 0.6953, - "step": 54339 - }, - { - "epoch": 1.39, - "learning_rate": 1.1636234521519508e-06, - "loss": 0.6816, - "step": 54340 - }, - { - "epoch": 1.39, - "learning_rate": 1.1635961545538227e-06, - "loss": 0.5708, - "step": 54341 - }, - { - "epoch": 1.39, - "learning_rate": 1.1635688568304363e-06, - "loss": 0.6255, - "step": 54342 - }, - { - "epoch": 1.39, - "learning_rate": 1.163541558981813e-06, - "loss": 0.6416, - "step": 54343 - }, - { - "epoch": 1.39, - "learning_rate": 1.1635142610079732e-06, - "loss": 0.6172, - "step": 54344 - }, - { - "epoch": 1.39, - "learning_rate": 1.1634869629089382e-06, - "loss": 0.7007, - "step": 54345 - }, - { - "epoch": 1.39, - "learning_rate": 1.1634596646847287e-06, - "loss": 0.5889, - "step": 54346 - }, - { - "epoch": 1.39, - "learning_rate": 1.163432366335366e-06, - "loss": 0.5129, - "step": 54347 - }, - { - "epoch": 1.39, - "learning_rate": 1.1634050678608705e-06, - "loss": 0.6592, - "step": 54348 - }, - { - "epoch": 1.39, - "learning_rate": 1.1633777692612627e-06, - "loss": 0.4365, - "step": 54349 - }, - { - "epoch": 1.39, - "learning_rate": 1.1633504705365647e-06, - "loss": 0.5776, - "step": 54350 - }, - { - "epoch": 1.39, - "learning_rate": 1.1633231716867964e-06, - "loss": 0.6357, - "step": 54351 - }, - { - "epoch": 1.39, - "learning_rate": 1.1632958727119793e-06, - "loss": 0.7119, - "step": 54352 - }, - { - "epoch": 1.39, - "learning_rate": 1.163268573612134e-06, - "loss": 0.5693, - "step": 54353 - }, - { - "epoch": 1.39, - "learning_rate": 1.1632412743872812e-06, - "loss": 0.5986, - "step": 54354 - }, - { - "epoch": 1.39, - "learning_rate": 1.1632139750374422e-06, - "loss": 0.7207, - "step": 54355 - }, - { - "epoch": 1.39, - "learning_rate": 1.1631866755626378e-06, - "loss": 0.5784, - "step": 54356 - }, - { - "epoch": 1.39, - "learning_rate": 1.163159375962889e-06, - "loss": 0.5615, - "step": 54357 - }, - { - "epoch": 1.39, - "learning_rate": 1.1631320762382166e-06, - "loss": 0.7246, - "step": 54358 - }, - { - "epoch": 1.39, - "learning_rate": 1.1631047763886413e-06, - "loss": 0.4436, - "step": 54359 - }, - { - "epoch": 1.39, - "learning_rate": 1.1630774764141842e-06, - "loss": 0.7334, - "step": 54360 - }, - { - "epoch": 1.39, - "learning_rate": 1.163050176314866e-06, - "loss": 0.6777, - "step": 54361 - }, - { - "epoch": 1.39, - "learning_rate": 1.163022876090708e-06, - "loss": 0.7256, - "step": 54362 - }, - { - "epoch": 1.39, - "learning_rate": 1.162995575741731e-06, - "loss": 0.5957, - "step": 54363 - }, - { - "epoch": 1.39, - "learning_rate": 1.1629682752679554e-06, - "loss": 0.72, - "step": 54364 - }, - { - "epoch": 1.39, - "learning_rate": 1.1629409746694028e-06, - "loss": 0.7451, - "step": 54365 - }, - { - "epoch": 1.39, - "learning_rate": 1.1629136739460937e-06, - "loss": 0.6592, - "step": 54366 - }, - { - "epoch": 1.39, - "learning_rate": 1.1628863730980489e-06, - "loss": 0.5796, - "step": 54367 - }, - { - "epoch": 1.39, - "learning_rate": 1.1628590721252898e-06, - "loss": 0.731, - "step": 54368 - }, - { - "epoch": 1.39, - "learning_rate": 1.1628317710278367e-06, - "loss": 0.6973, - "step": 54369 - }, - { - "epoch": 1.39, - "learning_rate": 1.162804469805711e-06, - "loss": 0.8115, - "step": 54370 - }, - { - "epoch": 1.39, - "learning_rate": 1.1627771684589333e-06, - "loss": 0.5835, - "step": 54371 - }, - { - "epoch": 1.39, - "learning_rate": 1.1627498669875247e-06, - "loss": 0.6587, - "step": 54372 - }, - { - "epoch": 1.39, - "learning_rate": 1.1627225653915062e-06, - "loss": 0.6641, - "step": 54373 - }, - { - "epoch": 1.39, - "learning_rate": 1.1626952636708981e-06, - "loss": 0.4263, - "step": 54374 - }, - { - "epoch": 1.39, - "learning_rate": 1.162667961825722e-06, - "loss": 0.7207, - "step": 54375 - }, - { - "epoch": 1.39, - "learning_rate": 1.1626406598559983e-06, - "loss": 0.7524, - "step": 54376 - }, - { - "epoch": 1.39, - "learning_rate": 1.1626133577617485e-06, - "loss": 0.6104, - "step": 54377 - }, - { - "epoch": 1.39, - "learning_rate": 1.162586055542993e-06, - "loss": 0.6992, - "step": 54378 - }, - { - "epoch": 1.39, - "learning_rate": 1.1625587531997527e-06, - "loss": 0.6777, - "step": 54379 - }, - { - "epoch": 1.39, - "learning_rate": 1.1625314507320485e-06, - "loss": 0.7295, - "step": 54380 - }, - { - "epoch": 1.39, - "learning_rate": 1.1625041481399016e-06, - "loss": 0.7549, - "step": 54381 - }, - { - "epoch": 1.39, - "learning_rate": 1.1624768454233327e-06, - "loss": 0.5996, - "step": 54382 - }, - { - "epoch": 1.39, - "learning_rate": 1.1624495425823631e-06, - "loss": 0.6289, - "step": 54383 - }, - { - "epoch": 1.39, - "learning_rate": 1.1624222396170129e-06, - "loss": 0.6772, - "step": 54384 - }, - { - "epoch": 1.39, - "learning_rate": 1.1623949365273036e-06, - "loss": 0.5981, - "step": 54385 - }, - { - "epoch": 1.39, - "learning_rate": 1.162367633313256e-06, - "loss": 0.6646, - "step": 54386 - }, - { - "epoch": 1.39, - "learning_rate": 1.1623403299748908e-06, - "loss": 0.5308, - "step": 54387 - }, - { - "epoch": 1.39, - "learning_rate": 1.1623130265122293e-06, - "loss": 0.5757, - "step": 54388 - }, - { - "epoch": 1.39, - "learning_rate": 1.162285722925292e-06, - "loss": 0.5415, - "step": 54389 - }, - { - "epoch": 1.39, - "learning_rate": 1.1622584192141002e-06, - "loss": 0.5547, - "step": 54390 - }, - { - "epoch": 1.39, - "learning_rate": 1.1622311153786745e-06, - "loss": 0.7422, - "step": 54391 - }, - { - "epoch": 1.39, - "learning_rate": 1.1622038114190357e-06, - "loss": 0.4966, - "step": 54392 - }, - { - "epoch": 1.39, - "learning_rate": 1.1621765073352053e-06, - "loss": 0.4707, - "step": 54393 - }, - { - "epoch": 1.39, - "learning_rate": 1.1621492031272035e-06, - "loss": 0.7139, - "step": 54394 - }, - { - "epoch": 1.39, - "learning_rate": 1.1621218987950515e-06, - "loss": 0.583, - "step": 54395 - }, - { - "epoch": 1.39, - "learning_rate": 1.1620945943387703e-06, - "loss": 0.4612, - "step": 54396 - }, - { - "epoch": 1.39, - "learning_rate": 1.1620672897583805e-06, - "loss": 0.6309, - "step": 54397 - }, - { - "epoch": 1.39, - "learning_rate": 1.1620399850539038e-06, - "loss": 0.6831, - "step": 54398 - }, - { - "epoch": 1.39, - "learning_rate": 1.16201268022536e-06, - "loss": 0.6251, - "step": 54399 - }, - { - "epoch": 1.39, - "learning_rate": 1.161985375272771e-06, - "loss": 0.4927, - "step": 54400 - }, - { - "epoch": 1.39, - "learning_rate": 1.1619580701961567e-06, - "loss": 0.7178, - "step": 54401 - }, - { - "epoch": 1.39, - "learning_rate": 1.161930764995539e-06, - "loss": 0.8809, - "step": 54402 - }, - { - "epoch": 1.39, - "learning_rate": 1.1619034596709382e-06, - "loss": 0.6523, - "step": 54403 - }, - { - "epoch": 1.39, - "learning_rate": 1.1618761542223753e-06, - "loss": 0.5854, - "step": 54404 - }, - { - "epoch": 1.39, - "learning_rate": 1.1618488486498712e-06, - "loss": 0.6367, - "step": 54405 - }, - { - "epoch": 1.39, - "learning_rate": 1.1618215429534472e-06, - "loss": 0.583, - "step": 54406 - }, - { - "epoch": 1.39, - "learning_rate": 1.1617942371331235e-06, - "loss": 0.5659, - "step": 54407 - }, - { - "epoch": 1.39, - "learning_rate": 1.1617669311889216e-06, - "loss": 0.7109, - "step": 54408 - }, - { - "epoch": 1.39, - "learning_rate": 1.1617396251208622e-06, - "loss": 0.5024, - "step": 54409 - }, - { - "epoch": 1.39, - "learning_rate": 1.1617123189289663e-06, - "loss": 0.625, - "step": 54410 - }, - { - "epoch": 1.39, - "learning_rate": 1.1616850126132545e-06, - "loss": 0.7344, - "step": 54411 - }, - { - "epoch": 1.39, - "learning_rate": 1.161657706173748e-06, - "loss": 0.5684, - "step": 54412 - }, - { - "epoch": 1.39, - "learning_rate": 1.1616303996104677e-06, - "loss": 0.5674, - "step": 54413 - }, - { - "epoch": 1.39, - "learning_rate": 1.1616030929234345e-06, - "loss": 0.6812, - "step": 54414 - }, - { - "epoch": 1.39, - "learning_rate": 1.161575786112669e-06, - "loss": 0.9375, - "step": 54415 - }, - { - "epoch": 1.39, - "learning_rate": 1.1615484791781924e-06, - "loss": 0.6416, - "step": 54416 - }, - { - "epoch": 1.39, - "learning_rate": 1.1615211721200258e-06, - "loss": 0.5459, - "step": 54417 - }, - { - "epoch": 1.39, - "learning_rate": 1.1614938649381896e-06, - "loss": 0.6885, - "step": 54418 - }, - { - "epoch": 1.39, - "learning_rate": 1.1614665576327052e-06, - "loss": 0.5649, - "step": 54419 - }, - { - "epoch": 1.39, - "learning_rate": 1.161439250203593e-06, - "loss": 0.8291, - "step": 54420 - }, - { - "epoch": 1.39, - "learning_rate": 1.1614119426508744e-06, - "loss": 0.7666, - "step": 54421 - }, - { - "epoch": 1.39, - "learning_rate": 1.16138463497457e-06, - "loss": 0.7617, - "step": 54422 - }, - { - "epoch": 1.39, - "learning_rate": 1.161357327174701e-06, - "loss": 0.6021, - "step": 54423 - }, - { - "epoch": 1.39, - "learning_rate": 1.1613300192512877e-06, - "loss": 0.6055, - "step": 54424 - }, - { - "epoch": 1.39, - "learning_rate": 1.1613027112043518e-06, - "loss": 0.6558, - "step": 54425 - }, - { - "epoch": 1.39, - "learning_rate": 1.1612754030339135e-06, - "loss": 0.751, - "step": 54426 - }, - { - "epoch": 1.39, - "learning_rate": 1.1612480947399944e-06, - "loss": 0.7246, - "step": 54427 - }, - { - "epoch": 1.4, - "learning_rate": 1.1612207863226152e-06, - "loss": 0.5942, - "step": 54428 - }, - { - "epoch": 1.4, - "learning_rate": 1.1611934777817963e-06, - "loss": 0.5, - "step": 54429 - }, - { - "epoch": 1.4, - "learning_rate": 1.1611661691175586e-06, - "loss": 0.655, - "step": 54430 - }, - { - "epoch": 1.4, - "learning_rate": 1.1611388603299241e-06, - "loss": 0.5366, - "step": 54431 - }, - { - "epoch": 1.4, - "learning_rate": 1.1611115514189125e-06, - "loss": 0.6719, - "step": 54432 - }, - { - "epoch": 1.4, - "learning_rate": 1.1610842423845455e-06, - "loss": 0.7451, - "step": 54433 - }, - { - "epoch": 1.4, - "learning_rate": 1.1610569332268436e-06, - "loss": 0.6704, - "step": 54434 - }, - { - "epoch": 1.4, - "learning_rate": 1.1610296239458277e-06, - "loss": 0.6533, - "step": 54435 - }, - { - "epoch": 1.4, - "learning_rate": 1.1610023145415189e-06, - "loss": 0.6582, - "step": 54436 - }, - { - "epoch": 1.4, - "learning_rate": 1.1609750050139382e-06, - "loss": 0.4041, - "step": 54437 - }, - { - "epoch": 1.4, - "learning_rate": 1.1609476953631062e-06, - "loss": 0.7642, - "step": 54438 - }, - { - "epoch": 1.4, - "learning_rate": 1.1609203855890438e-06, - "loss": 0.7637, - "step": 54439 - }, - { - "epoch": 1.4, - "learning_rate": 1.1608930756917722e-06, - "loss": 0.6179, - "step": 54440 - }, - { - "epoch": 1.4, - "learning_rate": 1.1608657656713121e-06, - "loss": 0.6738, - "step": 54441 - }, - { - "epoch": 1.4, - "learning_rate": 1.1608384555276844e-06, - "loss": 0.6318, - "step": 54442 - }, - { - "epoch": 1.4, - "learning_rate": 1.1608111452609103e-06, - "loss": 0.7412, - "step": 54443 - }, - { - "epoch": 1.4, - "learning_rate": 1.1607838348710105e-06, - "loss": 0.6201, - "step": 54444 - }, - { - "epoch": 1.4, - "learning_rate": 1.1607565243580057e-06, - "loss": 0.6367, - "step": 54445 - }, - { - "epoch": 1.4, - "learning_rate": 1.1607292137219174e-06, - "loss": 0.5874, - "step": 54446 - }, - { - "epoch": 1.4, - "learning_rate": 1.1607019029627659e-06, - "loss": 0.564, - "step": 54447 - }, - { - "epoch": 1.4, - "learning_rate": 1.1606745920805724e-06, - "loss": 0.6953, - "step": 54448 - }, - { - "epoch": 1.4, - "learning_rate": 1.1606472810753576e-06, - "loss": 0.625, - "step": 54449 - }, - { - "epoch": 1.4, - "learning_rate": 1.1606199699471426e-06, - "loss": 0.7842, - "step": 54450 - }, - { - "epoch": 1.4, - "learning_rate": 1.1605926586959483e-06, - "loss": 0.7822, - "step": 54451 - }, - { - "epoch": 1.4, - "learning_rate": 1.1605653473217956e-06, - "loss": 0.6406, - "step": 54452 - }, - { - "epoch": 1.4, - "learning_rate": 1.1605380358247055e-06, - "loss": 0.6465, - "step": 54453 - }, - { - "epoch": 1.4, - "learning_rate": 1.1605107242046987e-06, - "loss": 0.5845, - "step": 54454 - }, - { - "epoch": 1.4, - "learning_rate": 1.1604834124617961e-06, - "loss": 0.6504, - "step": 54455 - }, - { - "epoch": 1.4, - "learning_rate": 1.160456100596019e-06, - "loss": 0.5469, - "step": 54456 - }, - { - "epoch": 1.4, - "learning_rate": 1.1604287886073878e-06, - "loss": 0.6621, - "step": 54457 - }, - { - "epoch": 1.4, - "learning_rate": 1.1604014764959238e-06, - "loss": 0.4147, - "step": 54458 - }, - { - "epoch": 1.4, - "learning_rate": 1.1603741642616479e-06, - "loss": 0.5884, - "step": 54459 - }, - { - "epoch": 1.4, - "learning_rate": 1.1603468519045805e-06, - "loss": 0.7559, - "step": 54460 - }, - { - "epoch": 1.4, - "learning_rate": 1.1603195394247432e-06, - "loss": 0.5667, - "step": 54461 - }, - { - "epoch": 1.4, - "learning_rate": 1.1602922268221561e-06, - "loss": 0.5925, - "step": 54462 - }, - { - "epoch": 1.4, - "learning_rate": 1.1602649140968414e-06, - "loss": 0.793, - "step": 54463 - }, - { - "epoch": 1.4, - "learning_rate": 1.160237601248819e-06, - "loss": 0.5239, - "step": 54464 - }, - { - "epoch": 1.4, - "learning_rate": 1.1602102882781097e-06, - "loss": 0.7363, - "step": 54465 - }, - { - "epoch": 1.4, - "learning_rate": 1.1601829751847348e-06, - "loss": 0.666, - "step": 54466 - }, - { - "epoch": 1.4, - "learning_rate": 1.1601556619687155e-06, - "loss": 0.5366, - "step": 54467 - }, - { - "epoch": 1.4, - "learning_rate": 1.160128348630072e-06, - "loss": 0.7007, - "step": 54468 - }, - { - "epoch": 1.4, - "learning_rate": 1.160101035168826e-06, - "loss": 0.5095, - "step": 54469 - }, - { - "epoch": 1.4, - "learning_rate": 1.1600737215849974e-06, - "loss": 0.6533, - "step": 54470 - }, - { - "epoch": 1.4, - "learning_rate": 1.160046407878608e-06, - "loss": 0.7471, - "step": 54471 - }, - { - "epoch": 1.4, - "learning_rate": 1.1600190940496784e-06, - "loss": 0.4827, - "step": 54472 - }, - { - "epoch": 1.4, - "learning_rate": 1.15999178009823e-06, - "loss": 0.6709, - "step": 54473 - }, - { - "epoch": 1.4, - "learning_rate": 1.1599644660242827e-06, - "loss": 0.6914, - "step": 54474 - }, - { - "epoch": 1.4, - "learning_rate": 1.1599371518278583e-06, - "loss": 0.7227, - "step": 54475 - }, - { - "epoch": 1.4, - "learning_rate": 1.159909837508977e-06, - "loss": 0.5742, - "step": 54476 - }, - { - "epoch": 1.4, - "learning_rate": 1.1598825230676603e-06, - "loss": 0.6851, - "step": 54477 - }, - { - "epoch": 1.4, - "learning_rate": 1.159855208503929e-06, - "loss": 0.5938, - "step": 54478 - }, - { - "epoch": 1.4, - "learning_rate": 1.1598278938178037e-06, - "loss": 0.547, - "step": 54479 - }, - { - "epoch": 1.4, - "learning_rate": 1.1598005790093055e-06, - "loss": 0.7256, - "step": 54480 - }, - { - "epoch": 1.4, - "learning_rate": 1.1597732640784555e-06, - "loss": 0.5303, - "step": 54481 - }, - { - "epoch": 1.4, - "learning_rate": 1.1597459490252746e-06, - "loss": 0.6855, - "step": 54482 - }, - { - "epoch": 1.4, - "learning_rate": 1.1597186338497833e-06, - "loss": 0.7754, - "step": 54483 - }, - { - "epoch": 1.4, - "learning_rate": 1.159691318552003e-06, - "loss": 0.5132, - "step": 54484 - }, - { - "epoch": 1.4, - "learning_rate": 1.1596640031319542e-06, - "loss": 0.6338, - "step": 54485 - }, - { - "epoch": 1.4, - "learning_rate": 1.1596366875896583e-06, - "loss": 0.6025, - "step": 54486 - }, - { - "epoch": 1.4, - "learning_rate": 1.1596093719251354e-06, - "loss": 0.8008, - "step": 54487 - }, - { - "epoch": 1.4, - "learning_rate": 1.1595820561384075e-06, - "loss": 0.748, - "step": 54488 - }, - { - "epoch": 1.4, - "learning_rate": 1.1595547402294947e-06, - "loss": 0.7051, - "step": 54489 - }, - { - "epoch": 1.4, - "learning_rate": 1.1595274241984183e-06, - "loss": 0.7793, - "step": 54490 - }, - { - "epoch": 1.4, - "learning_rate": 1.159500108045199e-06, - "loss": 0.5654, - "step": 54491 - }, - { - "epoch": 1.4, - "learning_rate": 1.1594727917698576e-06, - "loss": 0.668, - "step": 54492 - }, - { - "epoch": 1.4, - "learning_rate": 1.1594454753724156e-06, - "loss": 0.6543, - "step": 54493 - }, - { - "epoch": 1.4, - "learning_rate": 1.1594181588528934e-06, - "loss": 0.6641, - "step": 54494 - }, - { - "epoch": 1.4, - "learning_rate": 1.159390842211312e-06, - "loss": 0.5938, - "step": 54495 - }, - { - "epoch": 1.4, - "learning_rate": 1.1593635254476923e-06, - "loss": 0.5151, - "step": 54496 - }, - { - "epoch": 1.4, - "learning_rate": 1.1593362085620552e-06, - "loss": 0.7412, - "step": 54497 - }, - { - "epoch": 1.4, - "learning_rate": 1.159308891554422e-06, - "loss": 0.699, - "step": 54498 - }, - { - "epoch": 1.4, - "learning_rate": 1.1592815744248132e-06, - "loss": 0.6362, - "step": 54499 - }, - { - "epoch": 1.4, - "learning_rate": 1.1592542571732498e-06, - "loss": 0.7002, - "step": 54500 - }, - { - "epoch": 1.4, - "learning_rate": 1.1592269397997525e-06, - "loss": 0.6699, - "step": 54501 - }, - { - "epoch": 1.4, - "learning_rate": 1.1591996223043427e-06, - "loss": 0.6602, - "step": 54502 - }, - { - "epoch": 1.4, - "learning_rate": 1.159172304687041e-06, - "loss": 0.7725, - "step": 54503 - }, - { - "epoch": 1.4, - "learning_rate": 1.1591449869478684e-06, - "loss": 0.5747, - "step": 54504 - }, - { - "epoch": 1.4, - "learning_rate": 1.1591176690868457e-06, - "loss": 0.5411, - "step": 54505 - }, - { - "epoch": 1.4, - "learning_rate": 1.159090351103994e-06, - "loss": 0.5371, - "step": 54506 - }, - { - "epoch": 1.4, - "learning_rate": 1.1590630329993343e-06, - "loss": 0.7031, - "step": 54507 - }, - { - "epoch": 1.4, - "learning_rate": 1.1590357147728873e-06, - "loss": 0.8174, - "step": 54508 - }, - { - "epoch": 1.4, - "learning_rate": 1.159008396424674e-06, - "loss": 0.6157, - "step": 54509 - }, - { - "epoch": 1.4, - "learning_rate": 1.1589810779547149e-06, - "loss": 0.7134, - "step": 54510 - }, - { - "epoch": 1.4, - "learning_rate": 1.1589537593630317e-06, - "loss": 0.6504, - "step": 54511 - }, - { - "epoch": 1.4, - "learning_rate": 1.1589264406496446e-06, - "loss": 0.5708, - "step": 54512 - }, - { - "epoch": 1.4, - "learning_rate": 1.1588991218145752e-06, - "loss": 0.5818, - "step": 54513 - }, - { - "epoch": 1.4, - "learning_rate": 1.1588718028578437e-06, - "loss": 0.7017, - "step": 54514 - }, - { - "epoch": 1.4, - "learning_rate": 1.1588444837794716e-06, - "loss": 0.7218, - "step": 54515 - }, - { - "epoch": 1.4, - "learning_rate": 1.1588171645794794e-06, - "loss": 0.7314, - "step": 54516 - }, - { - "epoch": 1.4, - "learning_rate": 1.1587898452578886e-06, - "loss": 0.5693, - "step": 54517 - }, - { - "epoch": 1.4, - "learning_rate": 1.1587625258147192e-06, - "loss": 0.54, - "step": 54518 - }, - { - "epoch": 1.4, - "learning_rate": 1.158735206249993e-06, - "loss": 0.5806, - "step": 54519 - }, - { - "epoch": 1.4, - "learning_rate": 1.1587078865637301e-06, - "loss": 0.5645, - "step": 54520 - }, - { - "epoch": 1.4, - "learning_rate": 1.1586805667559522e-06, - "loss": 0.7188, - "step": 54521 - }, - { - "epoch": 1.4, - "learning_rate": 1.15865324682668e-06, - "loss": 0.6738, - "step": 54522 - }, - { - "epoch": 1.4, - "learning_rate": 1.1586259267759339e-06, - "loss": 0.6904, - "step": 54523 - }, - { - "epoch": 1.4, - "learning_rate": 1.1585986066037357e-06, - "loss": 0.5469, - "step": 54524 - }, - { - "epoch": 1.4, - "learning_rate": 1.1585712863101054e-06, - "loss": 1.1729, - "step": 54525 - }, - { - "epoch": 1.4, - "learning_rate": 1.1585439658950647e-06, - "loss": 0.5781, - "step": 54526 - }, - { - "epoch": 1.4, - "learning_rate": 1.158516645358634e-06, - "loss": 0.6392, - "step": 54527 - }, - { - "epoch": 1.4, - "learning_rate": 1.1584893247008347e-06, - "loss": 0.54, - "step": 54528 - }, - { - "epoch": 1.4, - "learning_rate": 1.158462003921687e-06, - "loss": 0.7461, - "step": 54529 - }, - { - "epoch": 1.4, - "learning_rate": 1.1584346830212124e-06, - "loss": 0.7354, - "step": 54530 - }, - { - "epoch": 1.4, - "learning_rate": 1.1584073619994314e-06, - "loss": 0.5825, - "step": 54531 - }, - { - "epoch": 1.4, - "learning_rate": 1.1583800408563658e-06, - "loss": 0.5679, - "step": 54532 - }, - { - "epoch": 1.4, - "learning_rate": 1.1583527195920353e-06, - "loss": 0.7012, - "step": 54533 - }, - { - "epoch": 1.4, - "learning_rate": 1.1583253982064615e-06, - "loss": 0.7305, - "step": 54534 - }, - { - "epoch": 1.4, - "learning_rate": 1.1582980766996653e-06, - "loss": 0.791, - "step": 54535 - }, - { - "epoch": 1.4, - "learning_rate": 1.1582707550716678e-06, - "loss": 0.5657, - "step": 54536 - }, - { - "epoch": 1.4, - "learning_rate": 1.1582434333224893e-06, - "loss": 0.5525, - "step": 54537 - }, - { - "epoch": 1.4, - "learning_rate": 1.1582161114521514e-06, - "loss": 0.79, - "step": 54538 - }, - { - "epoch": 1.4, - "learning_rate": 1.1581887894606744e-06, - "loss": 0.668, - "step": 54539 - }, - { - "epoch": 1.4, - "learning_rate": 1.1581614673480796e-06, - "loss": 0.6338, - "step": 54540 - }, - { - "epoch": 1.4, - "learning_rate": 1.1581341451143876e-06, - "loss": 0.6323, - "step": 54541 - }, - { - "epoch": 1.4, - "learning_rate": 1.15810682275962e-06, - "loss": 0.6565, - "step": 54542 - }, - { - "epoch": 1.4, - "learning_rate": 1.158079500283797e-06, - "loss": 0.5239, - "step": 54543 - }, - { - "epoch": 1.4, - "learning_rate": 1.1580521776869402e-06, - "loss": 0.5439, - "step": 54544 - }, - { - "epoch": 1.4, - "learning_rate": 1.1580248549690693e-06, - "loss": 0.6436, - "step": 54545 - }, - { - "epoch": 1.4, - "learning_rate": 1.1579975321302067e-06, - "loss": 0.5444, - "step": 54546 - }, - { - "epoch": 1.4, - "learning_rate": 1.1579702091703726e-06, - "loss": 0.6077, - "step": 54547 - }, - { - "epoch": 1.4, - "learning_rate": 1.1579428860895876e-06, - "loss": 0.7236, - "step": 54548 - }, - { - "epoch": 1.4, - "learning_rate": 1.1579155628878734e-06, - "loss": 0.7227, - "step": 54549 - }, - { - "epoch": 1.4, - "learning_rate": 1.1578882395652503e-06, - "loss": 0.7017, - "step": 54550 - }, - { - "epoch": 1.4, - "learning_rate": 1.1578609161217394e-06, - "loss": 0.5986, - "step": 54551 - }, - { - "epoch": 1.4, - "learning_rate": 1.157833592557362e-06, - "loss": 0.7031, - "step": 54552 - }, - { - "epoch": 1.4, - "learning_rate": 1.1578062688721384e-06, - "loss": 0.7256, - "step": 54553 - }, - { - "epoch": 1.4, - "learning_rate": 1.1577789450660897e-06, - "loss": 0.6353, - "step": 54554 - }, - { - "epoch": 1.4, - "learning_rate": 1.157751621139237e-06, - "loss": 0.6338, - "step": 54555 - }, - { - "epoch": 1.4, - "learning_rate": 1.157724297091601e-06, - "loss": 0.5566, - "step": 54556 - }, - { - "epoch": 1.4, - "learning_rate": 1.1576969729232034e-06, - "loss": 0.6646, - "step": 54557 - }, - { - "epoch": 1.4, - "learning_rate": 1.1576696486340638e-06, - "loss": 0.7197, - "step": 54558 - }, - { - "epoch": 1.4, - "learning_rate": 1.157642324224204e-06, - "loss": 0.5008, - "step": 54559 - }, - { - "epoch": 1.4, - "learning_rate": 1.1576149996936446e-06, - "loss": 0.7607, - "step": 54560 - }, - { - "epoch": 1.4, - "learning_rate": 1.157587675042407e-06, - "loss": 0.6562, - "step": 54561 - }, - { - "epoch": 1.4, - "learning_rate": 1.1575603502705115e-06, - "loss": 0.5532, - "step": 54562 - }, - { - "epoch": 1.4, - "learning_rate": 1.1575330253779793e-06, - "loss": 0.5884, - "step": 54563 - }, - { - "epoch": 1.4, - "learning_rate": 1.1575057003648313e-06, - "loss": 0.9023, - "step": 54564 - }, - { - "epoch": 1.4, - "learning_rate": 1.1574783752310885e-06, - "loss": 0.625, - "step": 54565 - }, - { - "epoch": 1.4, - "learning_rate": 1.1574510499767716e-06, - "loss": 0.8223, - "step": 54566 - }, - { - "epoch": 1.4, - "learning_rate": 1.1574237246019018e-06, - "loss": 0.6006, - "step": 54567 - }, - { - "epoch": 1.4, - "learning_rate": 1.1573963991065e-06, - "loss": 0.6611, - "step": 54568 - }, - { - "epoch": 1.4, - "learning_rate": 1.1573690734905867e-06, - "loss": 0.7988, - "step": 54569 - }, - { - "epoch": 1.4, - "learning_rate": 1.1573417477541834e-06, - "loss": 0.6069, - "step": 54570 - }, - { - "epoch": 1.4, - "learning_rate": 1.1573144218973105e-06, - "loss": 0.5728, - "step": 54571 - }, - { - "epoch": 1.4, - "learning_rate": 1.1572870959199896e-06, - "loss": 0.6357, - "step": 54572 - }, - { - "epoch": 1.4, - "learning_rate": 1.157259769822241e-06, - "loss": 0.7344, - "step": 54573 - }, - { - "epoch": 1.4, - "learning_rate": 1.1572324436040859e-06, - "loss": 0.6367, - "step": 54574 - }, - { - "epoch": 1.4, - "learning_rate": 1.1572051172655448e-06, - "loss": 0.4639, - "step": 54575 - }, - { - "epoch": 1.4, - "learning_rate": 1.1571777908066394e-06, - "loss": 0.438, - "step": 54576 - }, - { - "epoch": 1.4, - "learning_rate": 1.15715046422739e-06, - "loss": 0.7754, - "step": 54577 - }, - { - "epoch": 1.4, - "learning_rate": 1.1571231375278176e-06, - "loss": 0.834, - "step": 54578 - }, - { - "epoch": 1.4, - "learning_rate": 1.1570958107079433e-06, - "loss": 0.5767, - "step": 54579 - }, - { - "epoch": 1.4, - "learning_rate": 1.1570684837677882e-06, - "loss": 0.7617, - "step": 54580 - }, - { - "epoch": 1.4, - "learning_rate": 1.1570411567073726e-06, - "loss": 0.5691, - "step": 54581 - }, - { - "epoch": 1.4, - "learning_rate": 1.1570138295267183e-06, - "loss": 0.5762, - "step": 54582 - }, - { - "epoch": 1.4, - "learning_rate": 1.156986502225845e-06, - "loss": 0.645, - "step": 54583 - }, - { - "epoch": 1.4, - "learning_rate": 1.1569591748047751e-06, - "loss": 0.7432, - "step": 54584 - }, - { - "epoch": 1.4, - "learning_rate": 1.1569318472635284e-06, - "loss": 0.7197, - "step": 54585 - }, - { - "epoch": 1.4, - "learning_rate": 1.1569045196021264e-06, - "loss": 0.8115, - "step": 54586 - }, - { - "epoch": 1.4, - "learning_rate": 1.1568771918205897e-06, - "loss": 0.5576, - "step": 54587 - }, - { - "epoch": 1.4, - "learning_rate": 1.1568498639189393e-06, - "loss": 0.7197, - "step": 54588 - }, - { - "epoch": 1.4, - "learning_rate": 1.1568225358971961e-06, - "loss": 0.7227, - "step": 54589 - }, - { - "epoch": 1.4, - "learning_rate": 1.1567952077553814e-06, - "loss": 0.6621, - "step": 54590 - }, - { - "epoch": 1.4, - "learning_rate": 1.1567678794935154e-06, - "loss": 0.5806, - "step": 54591 - }, - { - "epoch": 1.4, - "learning_rate": 1.1567405511116198e-06, - "loss": 0.6914, - "step": 54592 - }, - { - "epoch": 1.4, - "learning_rate": 1.1567132226097148e-06, - "loss": 0.5903, - "step": 54593 - }, - { - "epoch": 1.4, - "learning_rate": 1.156685893987822e-06, - "loss": 0.6992, - "step": 54594 - }, - { - "epoch": 1.4, - "learning_rate": 1.1566585652459619e-06, - "loss": 0.6875, - "step": 54595 - }, - { - "epoch": 1.4, - "learning_rate": 1.1566312363841556e-06, - "loss": 0.7158, - "step": 54596 - }, - { - "epoch": 1.4, - "learning_rate": 1.156603907402424e-06, - "loss": 0.6768, - "step": 54597 - }, - { - "epoch": 1.4, - "learning_rate": 1.156576578300788e-06, - "loss": 0.7393, - "step": 54598 - }, - { - "epoch": 1.4, - "learning_rate": 1.1565492490792686e-06, - "loss": 0.7979, - "step": 54599 - }, - { - "epoch": 1.4, - "learning_rate": 1.1565219197378862e-06, - "loss": 0.5815, - "step": 54600 - }, - { - "epoch": 1.4, - "learning_rate": 1.1564945902766625e-06, - "loss": 0.6851, - "step": 54601 - }, - { - "epoch": 1.4, - "learning_rate": 1.156467260695618e-06, - "loss": 0.5771, - "step": 54602 - }, - { - "epoch": 1.4, - "learning_rate": 1.156439930994774e-06, - "loss": 0.6592, - "step": 54603 - }, - { - "epoch": 1.4, - "learning_rate": 1.1564126011741505e-06, - "loss": 0.7773, - "step": 54604 - }, - { - "epoch": 1.4, - "learning_rate": 1.1563852712337698e-06, - "loss": 0.5796, - "step": 54605 - }, - { - "epoch": 1.4, - "learning_rate": 1.1563579411736516e-06, - "loss": 0.4402, - "step": 54606 - }, - { - "epoch": 1.4, - "learning_rate": 1.1563306109938177e-06, - "loss": 0.5747, - "step": 54607 - }, - { - "epoch": 1.4, - "learning_rate": 1.1563032806942882e-06, - "loss": 0.6543, - "step": 54608 - }, - { - "epoch": 1.4, - "learning_rate": 1.1562759502750848e-06, - "loss": 0.499, - "step": 54609 - }, - { - "epoch": 1.4, - "learning_rate": 1.1562486197362278e-06, - "loss": 0.6982, - "step": 54610 - }, - { - "epoch": 1.4, - "learning_rate": 1.1562212890777384e-06, - "loss": 0.6021, - "step": 54611 - }, - { - "epoch": 1.4, - "learning_rate": 1.156193958299638e-06, - "loss": 0.6733, - "step": 54612 - }, - { - "epoch": 1.4, - "learning_rate": 1.1561666274019466e-06, - "loss": 0.6528, - "step": 54613 - }, - { - "epoch": 1.4, - "learning_rate": 1.1561392963846858e-06, - "loss": 0.5588, - "step": 54614 - }, - { - "epoch": 1.4, - "learning_rate": 1.156111965247876e-06, - "loss": 0.5718, - "step": 54615 - }, - { - "epoch": 1.4, - "learning_rate": 1.1560846339915392e-06, - "loss": 0.5012, - "step": 54616 - }, - { - "epoch": 1.4, - "learning_rate": 1.156057302615695e-06, - "loss": 0.7051, - "step": 54617 - }, - { - "epoch": 1.4, - "learning_rate": 1.156029971120365e-06, - "loss": 0.6265, - "step": 54618 - }, - { - "epoch": 1.4, - "learning_rate": 1.15600263950557e-06, - "loss": 0.6143, - "step": 54619 - }, - { - "epoch": 1.4, - "learning_rate": 1.155975307771331e-06, - "loss": 0.9043, - "step": 54620 - }, - { - "epoch": 1.4, - "learning_rate": 1.1559479759176686e-06, - "loss": 0.877, - "step": 54621 - }, - { - "epoch": 1.4, - "learning_rate": 1.1559206439446048e-06, - "loss": 0.75, - "step": 54622 - }, - { - "epoch": 1.4, - "learning_rate": 1.155893311852159e-06, - "loss": 0.7178, - "step": 54623 - }, - { - "epoch": 1.4, - "learning_rate": 1.155865979640353e-06, - "loss": 0.7236, - "step": 54624 - }, - { - "epoch": 1.4, - "learning_rate": 1.1558386473092076e-06, - "loss": 0.6377, - "step": 54625 - }, - { - "epoch": 1.4, - "learning_rate": 1.1558113148587438e-06, - "loss": 0.4927, - "step": 54626 - }, - { - "epoch": 1.4, - "learning_rate": 1.1557839822889826e-06, - "loss": 0.6748, - "step": 54627 - }, - { - "epoch": 1.4, - "learning_rate": 1.1557566495999445e-06, - "loss": 0.7021, - "step": 54628 - }, - { - "epoch": 1.4, - "learning_rate": 1.1557293167916506e-06, - "loss": 0.7422, - "step": 54629 - }, - { - "epoch": 1.4, - "learning_rate": 1.1557019838641222e-06, - "loss": 0.7227, - "step": 54630 - }, - { - "epoch": 1.4, - "learning_rate": 1.1556746508173798e-06, - "loss": 0.5632, - "step": 54631 - }, - { - "epoch": 1.4, - "learning_rate": 1.1556473176514446e-06, - "loss": 0.521, - "step": 54632 - }, - { - "epoch": 1.4, - "learning_rate": 1.1556199843663372e-06, - "loss": 0.7148, - "step": 54633 - }, - { - "epoch": 1.4, - "learning_rate": 1.155592650962079e-06, - "loss": 0.6914, - "step": 54634 - }, - { - "epoch": 1.4, - "learning_rate": 1.1555653174386903e-06, - "loss": 0.7637, - "step": 54635 - }, - { - "epoch": 1.4, - "learning_rate": 1.1555379837961928e-06, - "loss": 0.7109, - "step": 54636 - }, - { - "epoch": 1.4, - "learning_rate": 1.1555106500346069e-06, - "loss": 0.5127, - "step": 54637 - }, - { - "epoch": 1.4, - "learning_rate": 1.1554833161539534e-06, - "loss": 0.6914, - "step": 54638 - }, - { - "epoch": 1.4, - "learning_rate": 1.1554559821542538e-06, - "loss": 0.6709, - "step": 54639 - }, - { - "epoch": 1.4, - "learning_rate": 1.1554286480355285e-06, - "loss": 0.6777, - "step": 54640 - }, - { - "epoch": 1.4, - "learning_rate": 1.1554013137977985e-06, - "loss": 0.5352, - "step": 54641 - }, - { - "epoch": 1.4, - "learning_rate": 1.1553739794410851e-06, - "loss": 0.6812, - "step": 54642 - }, - { - "epoch": 1.4, - "learning_rate": 1.155346644965409e-06, - "loss": 0.6426, - "step": 54643 - }, - { - "epoch": 1.4, - "learning_rate": 1.155319310370791e-06, - "loss": 0.6572, - "step": 54644 - }, - { - "epoch": 1.4, - "learning_rate": 1.1552919756572522e-06, - "loss": 0.5776, - "step": 54645 - }, - { - "epoch": 1.4, - "learning_rate": 1.1552646408248134e-06, - "loss": 0.5441, - "step": 54646 - }, - { - "epoch": 1.4, - "learning_rate": 1.1552373058734958e-06, - "loss": 0.5737, - "step": 54647 - }, - { - "epoch": 1.4, - "learning_rate": 1.15520997080332e-06, - "loss": 0.7715, - "step": 54648 - }, - { - "epoch": 1.4, - "learning_rate": 1.155182635614307e-06, - "loss": 0.689, - "step": 54649 - }, - { - "epoch": 1.4, - "learning_rate": 1.1551553003064777e-06, - "loss": 0.6836, - "step": 54650 - }, - { - "epoch": 1.4, - "learning_rate": 1.1551279648798535e-06, - "loss": 0.5947, - "step": 54651 - }, - { - "epoch": 1.4, - "learning_rate": 1.1551006293344548e-06, - "loss": 0.4717, - "step": 54652 - }, - { - "epoch": 1.4, - "learning_rate": 1.1550732936703027e-06, - "loss": 0.4756, - "step": 54653 - }, - { - "epoch": 1.4, - "learning_rate": 1.1550459578874177e-06, - "loss": 0.6338, - "step": 54654 - }, - { - "epoch": 1.4, - "learning_rate": 1.1550186219858215e-06, - "loss": 0.6328, - "step": 54655 - }, - { - "epoch": 1.4, - "learning_rate": 1.1549912859655345e-06, - "loss": 0.5396, - "step": 54656 - }, - { - "epoch": 1.4, - "learning_rate": 1.154963949826578e-06, - "loss": 0.562, - "step": 54657 - }, - { - "epoch": 1.4, - "learning_rate": 1.1549366135689729e-06, - "loss": 0.8027, - "step": 54658 - }, - { - "epoch": 1.4, - "learning_rate": 1.1549092771927394e-06, - "loss": 0.7061, - "step": 54659 - }, - { - "epoch": 1.4, - "learning_rate": 1.1548819406978993e-06, - "loss": 0.833, - "step": 54660 - }, - { - "epoch": 1.4, - "learning_rate": 1.1548546040844733e-06, - "loss": 0.5366, - "step": 54661 - }, - { - "epoch": 1.4, - "learning_rate": 1.1548272673524824e-06, - "loss": 0.8701, - "step": 54662 - }, - { - "epoch": 1.4, - "learning_rate": 1.154799930501947e-06, - "loss": 0.6147, - "step": 54663 - }, - { - "epoch": 1.4, - "learning_rate": 1.1547725935328887e-06, - "loss": 0.709, - "step": 54664 - }, - { - "epoch": 1.4, - "learning_rate": 1.1547452564453278e-06, - "loss": 0.5566, - "step": 54665 - }, - { - "epoch": 1.4, - "learning_rate": 1.1547179192392858e-06, - "loss": 0.6227, - "step": 54666 - }, - { - "epoch": 1.4, - "learning_rate": 1.1546905819147835e-06, - "loss": 0.4922, - "step": 54667 - }, - { - "epoch": 1.4, - "learning_rate": 1.1546632444718416e-06, - "loss": 0.6274, - "step": 54668 - }, - { - "epoch": 1.4, - "learning_rate": 1.1546359069104812e-06, - "loss": 0.7578, - "step": 54669 - }, - { - "epoch": 1.4, - "learning_rate": 1.154608569230723e-06, - "loss": 0.7656, - "step": 54670 - }, - { - "epoch": 1.4, - "learning_rate": 1.1545812314325883e-06, - "loss": 0.6289, - "step": 54671 - }, - { - "epoch": 1.4, - "learning_rate": 1.154553893516098e-06, - "loss": 0.5332, - "step": 54672 - }, - { - "epoch": 1.4, - "learning_rate": 1.1545265554812727e-06, - "loss": 0.7134, - "step": 54673 - }, - { - "epoch": 1.4, - "learning_rate": 1.1544992173281335e-06, - "loss": 0.5081, - "step": 54674 - }, - { - "epoch": 1.4, - "learning_rate": 1.1544718790567013e-06, - "loss": 0.4851, - "step": 54675 - }, - { - "epoch": 1.4, - "learning_rate": 1.1544445406669973e-06, - "loss": 0.7705, - "step": 54676 - }, - { - "epoch": 1.4, - "learning_rate": 1.1544172021590423e-06, - "loss": 0.623, - "step": 54677 - }, - { - "epoch": 1.4, - "learning_rate": 1.1543898635328569e-06, - "loss": 0.4204, - "step": 54678 - }, - { - "epoch": 1.4, - "learning_rate": 1.1543625247884622e-06, - "loss": 0.7178, - "step": 54679 - }, - { - "epoch": 1.4, - "learning_rate": 1.1543351859258796e-06, - "loss": 0.6167, - "step": 54680 - }, - { - "epoch": 1.4, - "learning_rate": 1.1543078469451293e-06, - "loss": 0.5337, - "step": 54681 - }, - { - "epoch": 1.4, - "learning_rate": 1.1542805078462327e-06, - "loss": 0.7119, - "step": 54682 - }, - { - "epoch": 1.4, - "learning_rate": 1.1542531686292106e-06, - "loss": 0.5403, - "step": 54683 - }, - { - "epoch": 1.4, - "learning_rate": 1.1542258292940838e-06, - "loss": 0.7314, - "step": 54684 - }, - { - "epoch": 1.4, - "learning_rate": 1.1541984898408736e-06, - "loss": 0.5241, - "step": 54685 - }, - { - "epoch": 1.4, - "learning_rate": 1.1541711502696005e-06, - "loss": 0.7461, - "step": 54686 - }, - { - "epoch": 1.4, - "learning_rate": 1.1541438105802862e-06, - "loss": 0.5996, - "step": 54687 - }, - { - "epoch": 1.4, - "learning_rate": 1.1541164707729505e-06, - "loss": 0.8984, - "step": 54688 - }, - { - "epoch": 1.4, - "learning_rate": 1.1540891308476151e-06, - "loss": 0.4963, - "step": 54689 - }, - { - "epoch": 1.4, - "learning_rate": 1.1540617908043005e-06, - "loss": 0.4175, - "step": 54690 - }, - { - "epoch": 1.4, - "learning_rate": 1.1540344506430281e-06, - "loss": 0.6484, - "step": 54691 - }, - { - "epoch": 1.4, - "learning_rate": 1.1540071103638187e-06, - "loss": 0.5913, - "step": 54692 - }, - { - "epoch": 1.4, - "learning_rate": 1.153979769966693e-06, - "loss": 0.8516, - "step": 54693 - }, - { - "epoch": 1.4, - "learning_rate": 1.1539524294516719e-06, - "loss": 0.5054, - "step": 54694 - }, - { - "epoch": 1.4, - "learning_rate": 1.1539250888187768e-06, - "loss": 1.1191, - "step": 54695 - }, - { - "epoch": 1.4, - "learning_rate": 1.1538977480680281e-06, - "loss": 0.6538, - "step": 54696 - }, - { - "epoch": 1.4, - "learning_rate": 1.1538704071994472e-06, - "loss": 0.5625, - "step": 54697 - }, - { - "epoch": 1.4, - "learning_rate": 1.1538430662130544e-06, - "loss": 0.875, - "step": 54698 - }, - { - "epoch": 1.4, - "learning_rate": 1.1538157251088715e-06, - "loss": 0.5718, - "step": 54699 - }, - { - "epoch": 1.4, - "learning_rate": 1.1537883838869186e-06, - "loss": 0.8564, - "step": 54700 - }, - { - "epoch": 1.4, - "learning_rate": 1.1537610425472174e-06, - "loss": 0.6113, - "step": 54701 - }, - { - "epoch": 1.4, - "learning_rate": 1.1537337010897883e-06, - "loss": 0.6509, - "step": 54702 - }, - { - "epoch": 1.4, - "learning_rate": 1.153706359514652e-06, - "loss": 0.4712, - "step": 54703 - }, - { - "epoch": 1.4, - "learning_rate": 1.1536790178218304e-06, - "loss": 0.4368, - "step": 54704 - }, - { - "epoch": 1.4, - "learning_rate": 1.1536516760113434e-06, - "loss": 0.709, - "step": 54705 - }, - { - "epoch": 1.4, - "learning_rate": 1.1536243340832125e-06, - "loss": 0.5908, - "step": 54706 - }, - { - "epoch": 1.4, - "learning_rate": 1.1535969920374587e-06, - "loss": 0.668, - "step": 54707 - }, - { - "epoch": 1.4, - "learning_rate": 1.1535696498741026e-06, - "loss": 0.5947, - "step": 54708 - }, - { - "epoch": 1.4, - "learning_rate": 1.1535423075931652e-06, - "loss": 0.7131, - "step": 54709 - }, - { - "epoch": 1.4, - "learning_rate": 1.1535149651946677e-06, - "loss": 0.6079, - "step": 54710 - }, - { - "epoch": 1.4, - "learning_rate": 1.1534876226786306e-06, - "loss": 0.6465, - "step": 54711 - }, - { - "epoch": 1.4, - "learning_rate": 1.1534602800450755e-06, - "loss": 0.5239, - "step": 54712 - }, - { - "epoch": 1.4, - "learning_rate": 1.1534329372940223e-06, - "loss": 0.6885, - "step": 54713 - }, - { - "epoch": 1.4, - "learning_rate": 1.153405594425493e-06, - "loss": 0.6143, - "step": 54714 - }, - { - "epoch": 1.4, - "learning_rate": 1.1533782514395079e-06, - "loss": 0.9043, - "step": 54715 - }, - { - "epoch": 1.4, - "learning_rate": 1.1533509083360881e-06, - "loss": 0.627, - "step": 54716 - }, - { - "epoch": 1.4, - "learning_rate": 1.1533235651152548e-06, - "loss": 0.5859, - "step": 54717 - }, - { - "epoch": 1.4, - "learning_rate": 1.1532962217770288e-06, - "loss": 0.3745, - "step": 54718 - }, - { - "epoch": 1.4, - "learning_rate": 1.1532688783214304e-06, - "loss": 0.8076, - "step": 54719 - }, - { - "epoch": 1.4, - "learning_rate": 1.1532415347484814e-06, - "loss": 0.8926, - "step": 54720 - }, - { - "epoch": 1.4, - "learning_rate": 1.1532141910582023e-06, - "loss": 0.54, - "step": 54721 - }, - { - "epoch": 1.4, - "learning_rate": 1.1531868472506142e-06, - "loss": 0.6606, - "step": 54722 - }, - { - "epoch": 1.4, - "learning_rate": 1.1531595033257381e-06, - "loss": 0.4712, - "step": 54723 - }, - { - "epoch": 1.4, - "learning_rate": 1.1531321592835948e-06, - "loss": 0.491, - "step": 54724 - }, - { - "epoch": 1.4, - "learning_rate": 1.153104815124205e-06, - "loss": 0.603, - "step": 54725 - }, - { - "epoch": 1.4, - "learning_rate": 1.1530774708475901e-06, - "loss": 0.792, - "step": 54726 - }, - { - "epoch": 1.4, - "learning_rate": 1.153050126453771e-06, - "loss": 0.6255, - "step": 54727 - }, - { - "epoch": 1.4, - "learning_rate": 1.1530227819427677e-06, - "loss": 0.4858, - "step": 54728 - }, - { - "epoch": 1.4, - "learning_rate": 1.1529954373146027e-06, - "loss": 0.6299, - "step": 54729 - }, - { - "epoch": 1.4, - "learning_rate": 1.1529680925692956e-06, - "loss": 0.6641, - "step": 54730 - }, - { - "epoch": 1.4, - "learning_rate": 1.1529407477068682e-06, - "loss": 0.5713, - "step": 54731 - }, - { - "epoch": 1.4, - "learning_rate": 1.152913402727341e-06, - "loss": 0.498, - "step": 54732 - }, - { - "epoch": 1.4, - "learning_rate": 1.1528860576307352e-06, - "loss": 0.7744, - "step": 54733 - }, - { - "epoch": 1.4, - "learning_rate": 1.1528587124170711e-06, - "loss": 0.6963, - "step": 54734 - }, - { - "epoch": 1.4, - "learning_rate": 1.1528313670863704e-06, - "loss": 0.792, - "step": 54735 - }, - { - "epoch": 1.4, - "learning_rate": 1.1528040216386536e-06, - "loss": 0.6274, - "step": 54736 - }, - { - "epoch": 1.4, - "learning_rate": 1.1527766760739423e-06, - "loss": 0.5718, - "step": 54737 - }, - { - "epoch": 1.4, - "learning_rate": 1.1527493303922565e-06, - "loss": 0.7393, - "step": 54738 - }, - { - "epoch": 1.4, - "learning_rate": 1.1527219845936177e-06, - "loss": 0.6541, - "step": 54739 - }, - { - "epoch": 1.4, - "learning_rate": 1.1526946386780465e-06, - "loss": 0.7266, - "step": 54740 - }, - { - "epoch": 1.4, - "learning_rate": 1.1526672926455642e-06, - "loss": 0.6982, - "step": 54741 - }, - { - "epoch": 1.4, - "learning_rate": 1.1526399464961915e-06, - "loss": 0.552, - "step": 54742 - }, - { - "epoch": 1.4, - "learning_rate": 1.1526126002299497e-06, - "loss": 0.6587, - "step": 54743 - }, - { - "epoch": 1.4, - "learning_rate": 1.152585253846859e-06, - "loss": 0.645, - "step": 54744 - }, - { - "epoch": 1.4, - "learning_rate": 1.1525579073469412e-06, - "loss": 0.8662, - "step": 54745 - }, - { - "epoch": 1.4, - "learning_rate": 1.1525305607302162e-06, - "loss": 0.6328, - "step": 54746 - }, - { - "epoch": 1.4, - "learning_rate": 1.152503213996706e-06, - "loss": 0.6689, - "step": 54747 - }, - { - "epoch": 1.4, - "learning_rate": 1.1524758671464315e-06, - "loss": 0.5483, - "step": 54748 - }, - { - "epoch": 1.4, - "learning_rate": 1.1524485201794126e-06, - "loss": 0.6538, - "step": 54749 - }, - { - "epoch": 1.4, - "learning_rate": 1.152421173095671e-06, - "loss": 0.7314, - "step": 54750 - }, - { - "epoch": 1.4, - "learning_rate": 1.1523938258952275e-06, - "loss": 0.6709, - "step": 54751 - }, - { - "epoch": 1.4, - "learning_rate": 1.1523664785781035e-06, - "loss": 0.6318, - "step": 54752 - }, - { - "epoch": 1.4, - "learning_rate": 1.1523391311443189e-06, - "loss": 0.6992, - "step": 54753 - }, - { - "epoch": 1.4, - "learning_rate": 1.1523117835938955e-06, - "loss": 0.7236, - "step": 54754 - }, - { - "epoch": 1.4, - "learning_rate": 1.1522844359268539e-06, - "loss": 0.6943, - "step": 54755 - }, - { - "epoch": 1.4, - "learning_rate": 1.1522570881432154e-06, - "loss": 0.5054, - "step": 54756 - }, - { - "epoch": 1.4, - "learning_rate": 1.1522297402430003e-06, - "loss": 0.8594, - "step": 54757 - }, - { - "epoch": 1.4, - "learning_rate": 1.1522023922262304e-06, - "loss": 0.6084, - "step": 54758 - }, - { - "epoch": 1.4, - "learning_rate": 1.1521750440929255e-06, - "loss": 0.6543, - "step": 54759 - }, - { - "epoch": 1.4, - "learning_rate": 1.1521476958431074e-06, - "loss": 0.6553, - "step": 54760 - }, - { - "epoch": 1.4, - "learning_rate": 1.1521203474767967e-06, - "loss": 0.7188, - "step": 54761 - }, - { - "epoch": 1.4, - "learning_rate": 1.1520929989940147e-06, - "loss": 0.6484, - "step": 54762 - }, - { - "epoch": 1.4, - "learning_rate": 1.1520656503947818e-06, - "loss": 0.7227, - "step": 54763 - }, - { - "epoch": 1.4, - "learning_rate": 1.1520383016791195e-06, - "loss": 0.6431, - "step": 54764 - }, - { - "epoch": 1.4, - "learning_rate": 1.152010952847048e-06, - "loss": 0.7061, - "step": 54765 - }, - { - "epoch": 1.4, - "learning_rate": 1.1519836038985894e-06, - "loss": 0.6978, - "step": 54766 - }, - { - "epoch": 1.4, - "learning_rate": 1.1519562548337636e-06, - "loss": 0.6553, - "step": 54767 - }, - { - "epoch": 1.4, - "learning_rate": 1.1519289056525915e-06, - "loss": 0.7324, - "step": 54768 - }, - { - "epoch": 1.4, - "learning_rate": 1.151901556355095e-06, - "loss": 0.5464, - "step": 54769 - }, - { - "epoch": 1.4, - "learning_rate": 1.1518742069412943e-06, - "loss": 0.6343, - "step": 54770 - }, - { - "epoch": 1.4, - "learning_rate": 1.1518468574112103e-06, - "loss": 0.6387, - "step": 54771 - }, - { - "epoch": 1.4, - "learning_rate": 1.1518195077648645e-06, - "loss": 0.6416, - "step": 54772 - }, - { - "epoch": 1.4, - "learning_rate": 1.151792158002277e-06, - "loss": 0.5864, - "step": 54773 - }, - { - "epoch": 1.4, - "learning_rate": 1.1517648081234694e-06, - "loss": 0.708, - "step": 54774 - }, - { - "epoch": 1.4, - "learning_rate": 1.1517374581284628e-06, - "loss": 0.8291, - "step": 54775 - }, - { - "epoch": 1.4, - "learning_rate": 1.1517101080172773e-06, - "loss": 0.7773, - "step": 54776 - }, - { - "epoch": 1.4, - "learning_rate": 1.151682757789935e-06, - "loss": 0.4812, - "step": 54777 - }, - { - "epoch": 1.4, - "learning_rate": 1.1516554074464554e-06, - "loss": 0.5999, - "step": 54778 - }, - { - "epoch": 1.4, - "learning_rate": 1.1516280569868608e-06, - "loss": 0.7153, - "step": 54779 - }, - { - "epoch": 1.4, - "learning_rate": 1.1516007064111715e-06, - "loss": 0.6787, - "step": 54780 - }, - { - "epoch": 1.4, - "learning_rate": 1.1515733557194083e-06, - "loss": 0.5908, - "step": 54781 - }, - { - "epoch": 1.4, - "learning_rate": 1.1515460049115927e-06, - "loss": 0.4066, - "step": 54782 - }, - { - "epoch": 1.4, - "learning_rate": 1.1515186539877451e-06, - "loss": 0.5205, - "step": 54783 - }, - { - "epoch": 1.4, - "learning_rate": 1.1514913029478863e-06, - "loss": 0.7148, - "step": 54784 - }, - { - "epoch": 1.4, - "learning_rate": 1.151463951792038e-06, - "loss": 0.5479, - "step": 54785 - }, - { - "epoch": 1.4, - "learning_rate": 1.1514366005202202e-06, - "loss": 0.7188, - "step": 54786 - }, - { - "epoch": 1.4, - "learning_rate": 1.151409249132455e-06, - "loss": 0.6738, - "step": 54787 - }, - { - "epoch": 1.4, - "learning_rate": 1.1513818976287625e-06, - "loss": 0.7041, - "step": 54788 - }, - { - "epoch": 1.4, - "learning_rate": 1.1513545460091638e-06, - "loss": 0.7871, - "step": 54789 - }, - { - "epoch": 1.4, - "learning_rate": 1.1513271942736798e-06, - "loss": 0.7773, - "step": 54790 - }, - { - "epoch": 1.4, - "learning_rate": 1.1512998424223316e-06, - "loss": 0.5632, - "step": 54791 - }, - { - "epoch": 1.4, - "learning_rate": 1.15127249045514e-06, - "loss": 0.5037, - "step": 54792 - }, - { - "epoch": 1.4, - "learning_rate": 1.151245138372126e-06, - "loss": 0.4626, - "step": 54793 - }, - { - "epoch": 1.4, - "learning_rate": 1.1512177861733108e-06, - "loss": 0.6396, - "step": 54794 - }, - { - "epoch": 1.4, - "learning_rate": 1.1511904338587146e-06, - "loss": 0.5957, - "step": 54795 - }, - { - "epoch": 1.4, - "learning_rate": 1.1511630814283593e-06, - "loss": 0.3574, - "step": 54796 - }, - { - "epoch": 1.4, - "learning_rate": 1.1511357288822652e-06, - "loss": 0.856, - "step": 54797 - }, - { - "epoch": 1.4, - "learning_rate": 1.1511083762204536e-06, - "loss": 0.8135, - "step": 54798 - }, - { - "epoch": 1.4, - "learning_rate": 1.1510810234429448e-06, - "loss": 0.6963, - "step": 54799 - }, - { - "epoch": 1.4, - "learning_rate": 1.1510536705497608e-06, - "loss": 0.5713, - "step": 54800 - }, - { - "epoch": 1.4, - "learning_rate": 1.1510263175409213e-06, - "loss": 0.7441, - "step": 54801 - }, - { - "epoch": 1.4, - "learning_rate": 1.1509989644164485e-06, - "loss": 0.7158, - "step": 54802 - }, - { - "epoch": 1.4, - "learning_rate": 1.1509716111763625e-06, - "loss": 0.5957, - "step": 54803 - }, - { - "epoch": 1.4, - "learning_rate": 1.1509442578206845e-06, - "loss": 0.7393, - "step": 54804 - }, - { - "epoch": 1.4, - "learning_rate": 1.1509169043494354e-06, - "loss": 0.5752, - "step": 54805 - }, - { - "epoch": 1.4, - "learning_rate": 1.1508895507626361e-06, - "loss": 0.6899, - "step": 54806 - }, - { - "epoch": 1.4, - "learning_rate": 1.150862197060308e-06, - "loss": 0.5771, - "step": 54807 - }, - { - "epoch": 1.4, - "learning_rate": 1.150834843242471e-06, - "loss": 0.6572, - "step": 54808 - }, - { - "epoch": 1.4, - "learning_rate": 1.1508074893091471e-06, - "loss": 0.5312, - "step": 54809 - }, - { - "epoch": 1.4, - "learning_rate": 1.1507801352603569e-06, - "loss": 0.7158, - "step": 54810 - }, - { - "epoch": 1.4, - "learning_rate": 1.150752781096121e-06, - "loss": 0.7607, - "step": 54811 - }, - { - "epoch": 1.4, - "learning_rate": 1.1507254268164607e-06, - "loss": 0.6436, - "step": 54812 - }, - { - "epoch": 1.4, - "learning_rate": 1.150698072421397e-06, - "loss": 0.6484, - "step": 54813 - }, - { - "epoch": 1.4, - "learning_rate": 1.1506707179109505e-06, - "loss": 0.6309, - "step": 54814 - }, - { - "epoch": 1.4, - "learning_rate": 1.1506433632851427e-06, - "loss": 0.4707, - "step": 54815 - }, - { - "epoch": 1.4, - "learning_rate": 1.150616008543994e-06, - "loss": 0.71, - "step": 54816 - }, - { - "epoch": 1.4, - "learning_rate": 1.1505886536875255e-06, - "loss": 0.6736, - "step": 54817 - }, - { - "epoch": 1.41, - "learning_rate": 1.1505612987157583e-06, - "loss": 0.6553, - "step": 54818 - }, - { - "epoch": 1.41, - "learning_rate": 1.1505339436287132e-06, - "loss": 0.7617, - "step": 54819 - }, - { - "epoch": 1.41, - "learning_rate": 1.1505065884264112e-06, - "loss": 0.7324, - "step": 54820 - }, - { - "epoch": 1.41, - "learning_rate": 1.1504792331088734e-06, - "loss": 0.7725, - "step": 54821 - }, - { - "epoch": 1.41, - "learning_rate": 1.15045187767612e-06, - "loss": 0.7393, - "step": 54822 - }, - { - "epoch": 1.41, - "learning_rate": 1.1504245221281733e-06, - "loss": 0.832, - "step": 54823 - }, - { - "epoch": 1.41, - "learning_rate": 1.1503971664650528e-06, - "loss": 0.6304, - "step": 54824 - }, - { - "epoch": 1.41, - "learning_rate": 1.1503698106867802e-06, - "loss": 0.6191, - "step": 54825 - }, - { - "epoch": 1.41, - "learning_rate": 1.1503424547933767e-06, - "loss": 0.7842, - "step": 54826 - }, - { - "epoch": 1.41, - "learning_rate": 1.1503150987848626e-06, - "loss": 0.8457, - "step": 54827 - }, - { - "epoch": 1.41, - "learning_rate": 1.1502877426612592e-06, - "loss": 0.6533, - "step": 54828 - }, - { - "epoch": 1.41, - "learning_rate": 1.1502603864225874e-06, - "loss": 0.6318, - "step": 54829 - }, - { - "epoch": 1.41, - "learning_rate": 1.150233030068868e-06, - "loss": 0.8037, - "step": 54830 - }, - { - "epoch": 1.41, - "learning_rate": 1.1502056736001224e-06, - "loss": 0.6875, - "step": 54831 - }, - { - "epoch": 1.41, - "learning_rate": 1.1501783170163713e-06, - "loss": 0.5459, - "step": 54832 - }, - { - "epoch": 1.41, - "learning_rate": 1.1501509603176352e-06, - "loss": 0.521, - "step": 54833 - }, - { - "epoch": 1.41, - "learning_rate": 1.1501236035039354e-06, - "loss": 0.6206, - "step": 54834 - }, - { - "epoch": 1.41, - "learning_rate": 1.150096246575293e-06, - "loss": 0.522, - "step": 54835 - }, - { - "epoch": 1.41, - "learning_rate": 1.150068889531729e-06, - "loss": 0.5581, - "step": 54836 - }, - { - "epoch": 1.41, - "learning_rate": 1.1500415323732638e-06, - "loss": 0.6899, - "step": 54837 - }, - { - "epoch": 1.41, - "learning_rate": 1.1500141750999188e-06, - "loss": 0.7539, - "step": 54838 - }, - { - "epoch": 1.41, - "learning_rate": 1.149986817711715e-06, - "loss": 0.4944, - "step": 54839 - }, - { - "epoch": 1.41, - "learning_rate": 1.149959460208673e-06, - "loss": 0.6777, - "step": 54840 - }, - { - "epoch": 1.41, - "learning_rate": 1.1499321025908141e-06, - "loss": 0.6455, - "step": 54841 - }, - { - "epoch": 1.41, - "learning_rate": 1.1499047448581592e-06, - "loss": 0.5981, - "step": 54842 - }, - { - "epoch": 1.41, - "learning_rate": 1.1498773870107288e-06, - "loss": 0.5989, - "step": 54843 - }, - { - "epoch": 1.41, - "learning_rate": 1.1498500290485442e-06, - "loss": 0.6846, - "step": 54844 - }, - { - "epoch": 1.41, - "learning_rate": 1.1498226709716263e-06, - "loss": 0.917, - "step": 54845 - }, - { - "epoch": 1.41, - "learning_rate": 1.1497953127799966e-06, - "loss": 0.5132, - "step": 54846 - }, - { - "epoch": 1.41, - "learning_rate": 1.149767954473675e-06, - "loss": 0.5503, - "step": 54847 - }, - { - "epoch": 1.41, - "learning_rate": 1.1497405960526832e-06, - "loss": 0.4716, - "step": 54848 - }, - { - "epoch": 1.41, - "learning_rate": 1.1497132375170414e-06, - "loss": 0.73, - "step": 54849 - }, - { - "epoch": 1.41, - "learning_rate": 1.1496858788667716e-06, - "loss": 0.7246, - "step": 54850 - }, - { - "epoch": 1.41, - "learning_rate": 1.1496585201018943e-06, - "loss": 0.6411, - "step": 54851 - }, - { - "epoch": 1.41, - "learning_rate": 1.14963116122243e-06, - "loss": 0.748, - "step": 54852 - }, - { - "epoch": 1.41, - "learning_rate": 1.1496038022284e-06, - "loss": 0.6846, - "step": 54853 - }, - { - "epoch": 1.41, - "learning_rate": 1.1495764431198255e-06, - "loss": 0.604, - "step": 54854 - }, - { - "epoch": 1.41, - "learning_rate": 1.1495490838967267e-06, - "loss": 0.7168, - "step": 54855 - }, - { - "epoch": 1.41, - "learning_rate": 1.1495217245591256e-06, - "loss": 0.5864, - "step": 54856 - }, - { - "epoch": 1.41, - "learning_rate": 1.1494943651070425e-06, - "loss": 0.7725, - "step": 54857 - }, - { - "epoch": 1.41, - "learning_rate": 1.1494670055404983e-06, - "loss": 0.6621, - "step": 54858 - }, - { - "epoch": 1.41, - "learning_rate": 1.1494396458595139e-06, - "loss": 0.6611, - "step": 54859 - }, - { - "epoch": 1.41, - "learning_rate": 1.149412286064111e-06, - "loss": 0.7715, - "step": 54860 - }, - { - "epoch": 1.41, - "learning_rate": 1.1493849261543096e-06, - "loss": 0.5679, - "step": 54861 - }, - { - "epoch": 1.41, - "learning_rate": 1.149357566130131e-06, - "loss": 0.584, - "step": 54862 - }, - { - "epoch": 1.41, - "learning_rate": 1.1493302059915962e-06, - "loss": 0.6846, - "step": 54863 - }, - { - "epoch": 1.41, - "learning_rate": 1.149302845738726e-06, - "loss": 0.6108, - "step": 54864 - }, - { - "epoch": 1.41, - "learning_rate": 1.1492754853715415e-06, - "loss": 0.6133, - "step": 54865 - }, - { - "epoch": 1.41, - "learning_rate": 1.1492481248900641e-06, - "loss": 0.7852, - "step": 54866 - }, - { - "epoch": 1.41, - "learning_rate": 1.149220764294314e-06, - "loss": 0.6104, - "step": 54867 - }, - { - "epoch": 1.41, - "learning_rate": 1.149193403584312e-06, - "loss": 0.6299, - "step": 54868 - }, - { - "epoch": 1.41, - "learning_rate": 1.14916604276008e-06, - "loss": 0.6514, - "step": 54869 - }, - { - "epoch": 1.41, - "learning_rate": 1.1491386818216382e-06, - "loss": 0.6763, - "step": 54870 - }, - { - "epoch": 1.41, - "learning_rate": 1.1491113207690082e-06, - "loss": 0.7441, - "step": 54871 - }, - { - "epoch": 1.41, - "learning_rate": 1.14908395960221e-06, - "loss": 0.4758, - "step": 54872 - }, - { - "epoch": 1.41, - "learning_rate": 1.1490565983212652e-06, - "loss": 0.8379, - "step": 54873 - }, - { - "epoch": 1.41, - "learning_rate": 1.1490292369261944e-06, - "loss": 0.71, - "step": 54874 - }, - { - "epoch": 1.41, - "learning_rate": 1.1490018754170192e-06, - "loss": 0.6445, - "step": 54875 - }, - { - "epoch": 1.41, - "learning_rate": 1.1489745137937598e-06, - "loss": 0.7061, - "step": 54876 - }, - { - "epoch": 1.41, - "learning_rate": 1.1489471520564379e-06, - "loss": 0.5398, - "step": 54877 - }, - { - "epoch": 1.41, - "learning_rate": 1.1489197902050734e-06, - "loss": 0.7637, - "step": 54878 - }, - { - "epoch": 1.41, - "learning_rate": 1.148892428239688e-06, - "loss": 0.6807, - "step": 54879 - }, - { - "epoch": 1.41, - "learning_rate": 1.1488650661603027e-06, - "loss": 0.6621, - "step": 54880 - }, - { - "epoch": 1.41, - "learning_rate": 1.1488377039669383e-06, - "loss": 0.707, - "step": 54881 - }, - { - "epoch": 1.41, - "learning_rate": 1.1488103416596157e-06, - "loss": 0.6611, - "step": 54882 - }, - { - "epoch": 1.41, - "learning_rate": 1.1487829792383556e-06, - "loss": 0.7266, - "step": 54883 - }, - { - "epoch": 1.41, - "learning_rate": 1.1487556167031795e-06, - "loss": 0.7129, - "step": 54884 - }, - { - "epoch": 1.41, - "learning_rate": 1.148728254054108e-06, - "loss": 0.6035, - "step": 54885 - }, - { - "epoch": 1.41, - "learning_rate": 1.1487008912911621e-06, - "loss": 0.6904, - "step": 54886 - }, - { - "epoch": 1.41, - "learning_rate": 1.1486735284143628e-06, - "loss": 0.8057, - "step": 54887 - }, - { - "epoch": 1.41, - "learning_rate": 1.148646165423731e-06, - "loss": 0.8213, - "step": 54888 - }, - { - "epoch": 1.41, - "learning_rate": 1.1486188023192875e-06, - "loss": 0.7207, - "step": 54889 - }, - { - "epoch": 1.41, - "learning_rate": 1.1485914391010536e-06, - "loss": 0.5474, - "step": 54890 - }, - { - "epoch": 1.41, - "learning_rate": 1.1485640757690501e-06, - "loss": 0.5312, - "step": 54891 - }, - { - "epoch": 1.41, - "learning_rate": 1.1485367123232982e-06, - "loss": 0.6387, - "step": 54892 - }, - { - "epoch": 1.41, - "learning_rate": 1.1485093487638178e-06, - "loss": 0.6406, - "step": 54893 - }, - { - "epoch": 1.41, - "learning_rate": 1.1484819850906311e-06, - "loss": 0.6602, - "step": 54894 - }, - { - "epoch": 1.41, - "learning_rate": 1.1484546213037584e-06, - "loss": 0.6416, - "step": 54895 - }, - { - "epoch": 1.41, - "learning_rate": 1.1484272574032213e-06, - "loss": 0.4658, - "step": 54896 - }, - { - "epoch": 1.41, - "learning_rate": 1.1483998933890397e-06, - "loss": 0.6108, - "step": 54897 - }, - { - "epoch": 1.41, - "learning_rate": 1.1483725292612354e-06, - "loss": 0.6514, - "step": 54898 - }, - { - "epoch": 1.41, - "learning_rate": 1.1483451650198287e-06, - "loss": 0.6987, - "step": 54899 - }, - { - "epoch": 1.41, - "learning_rate": 1.1483178006648415e-06, - "loss": 0.5349, - "step": 54900 - }, - { - "epoch": 1.41, - "learning_rate": 1.1482904361962939e-06, - "loss": 0.6396, - "step": 54901 - }, - { - "epoch": 1.41, - "learning_rate": 1.148263071614207e-06, - "loss": 0.6699, - "step": 54902 - }, - { - "epoch": 1.41, - "learning_rate": 1.1482357069186022e-06, - "loss": 0.5143, - "step": 54903 - }, - { - "epoch": 1.41, - "learning_rate": 1.1482083421094996e-06, - "loss": 0.5679, - "step": 54904 - }, - { - "epoch": 1.41, - "learning_rate": 1.1481809771869213e-06, - "loss": 0.6787, - "step": 54905 - }, - { - "epoch": 1.41, - "learning_rate": 1.1481536121508874e-06, - "loss": 0.7627, - "step": 54906 - }, - { - "epoch": 1.41, - "learning_rate": 1.1481262470014193e-06, - "loss": 0.7119, - "step": 54907 - }, - { - "epoch": 1.41, - "learning_rate": 1.1480988817385373e-06, - "loss": 0.5898, - "step": 54908 - }, - { - "epoch": 1.41, - "learning_rate": 1.1480715163622632e-06, - "loss": 0.8926, - "step": 54909 - }, - { - "epoch": 1.41, - "learning_rate": 1.148044150872617e-06, - "loss": 0.6133, - "step": 54910 - }, - { - "epoch": 1.41, - "learning_rate": 1.148016785269621e-06, - "loss": 0.6514, - "step": 54911 - }, - { - "epoch": 1.41, - "learning_rate": 1.1479894195532947e-06, - "loss": 0.6626, - "step": 54912 - }, - { - "epoch": 1.41, - "learning_rate": 1.14796205372366e-06, - "loss": 0.5708, - "step": 54913 - }, - { - "epoch": 1.41, - "learning_rate": 1.1479346877807374e-06, - "loss": 0.4532, - "step": 54914 - }, - { - "epoch": 1.41, - "learning_rate": 1.1479073217245482e-06, - "loss": 0.6211, - "step": 54915 - }, - { - "epoch": 1.41, - "learning_rate": 1.147879955555113e-06, - "loss": 0.3706, - "step": 54916 - }, - { - "epoch": 1.41, - "learning_rate": 1.1478525892724531e-06, - "loss": 0.7305, - "step": 54917 - }, - { - "epoch": 1.41, - "learning_rate": 1.147825222876589e-06, - "loss": 0.75, - "step": 54918 - }, - { - "epoch": 1.41, - "learning_rate": 1.1477978563675423e-06, - "loss": 0.5298, - "step": 54919 - }, - { - "epoch": 1.41, - "learning_rate": 1.1477704897453331e-06, - "loss": 0.5413, - "step": 54920 - }, - { - "epoch": 1.41, - "learning_rate": 1.1477431230099832e-06, - "loss": 0.6914, - "step": 54921 - }, - { - "epoch": 1.41, - "learning_rate": 1.1477157561615131e-06, - "loss": 0.6401, - "step": 54922 - }, - { - "epoch": 1.41, - "learning_rate": 1.1476883891999438e-06, - "loss": 0.5723, - "step": 54923 - }, - { - "epoch": 1.41, - "learning_rate": 1.1476610221252962e-06, - "loss": 0.6338, - "step": 54924 - }, - { - "epoch": 1.41, - "learning_rate": 1.1476336549375915e-06, - "loss": 0.7578, - "step": 54925 - }, - { - "epoch": 1.41, - "learning_rate": 1.1476062876368507e-06, - "loss": 0.6494, - "step": 54926 - }, - { - "epoch": 1.41, - "learning_rate": 1.147578920223094e-06, - "loss": 0.8271, - "step": 54927 - }, - { - "epoch": 1.41, - "learning_rate": 1.1475515526963433e-06, - "loss": 0.7119, - "step": 54928 - }, - { - "epoch": 1.41, - "learning_rate": 1.1475241850566188e-06, - "loss": 0.5513, - "step": 54929 - }, - { - "epoch": 1.41, - "learning_rate": 1.1474968173039423e-06, - "loss": 0.6299, - "step": 54930 - }, - { - "epoch": 1.41, - "learning_rate": 1.147469449438334e-06, - "loss": 0.5833, - "step": 54931 - }, - { - "epoch": 1.41, - "learning_rate": 1.1474420814598153e-06, - "loss": 0.8447, - "step": 54932 - }, - { - "epoch": 1.41, - "learning_rate": 1.1474147133684067e-06, - "loss": 0.5244, - "step": 54933 - }, - { - "epoch": 1.41, - "learning_rate": 1.1473873451641297e-06, - "loss": 0.7441, - "step": 54934 - }, - { - "epoch": 1.41, - "learning_rate": 1.1473599768470049e-06, - "loss": 0.5374, - "step": 54935 - }, - { - "epoch": 1.41, - "learning_rate": 1.1473326084170533e-06, - "loss": 0.7041, - "step": 54936 - }, - { - "epoch": 1.41, - "learning_rate": 1.147305239874296e-06, - "loss": 0.6709, - "step": 54937 - }, - { - "epoch": 1.41, - "learning_rate": 1.1472778712187536e-06, - "loss": 0.8096, - "step": 54938 - }, - { - "epoch": 1.41, - "learning_rate": 1.1472505024504475e-06, - "loss": 0.752, - "step": 54939 - }, - { - "epoch": 1.41, - "learning_rate": 1.1472231335693986e-06, - "loss": 0.791, - "step": 54940 - }, - { - "epoch": 1.41, - "learning_rate": 1.1471957645756274e-06, - "loss": 0.6951, - "step": 54941 - }, - { - "epoch": 1.41, - "learning_rate": 1.1471683954691553e-06, - "loss": 0.7734, - "step": 54942 - }, - { - "epoch": 1.41, - "learning_rate": 1.1471410262500032e-06, - "loss": 0.5239, - "step": 54943 - }, - { - "epoch": 1.41, - "learning_rate": 1.1471136569181917e-06, - "loss": 0.5645, - "step": 54944 - }, - { - "epoch": 1.41, - "learning_rate": 1.1470862874737423e-06, - "loss": 0.7266, - "step": 54945 - }, - { - "epoch": 1.41, - "learning_rate": 1.147058917916676e-06, - "loss": 0.6421, - "step": 54946 - }, - { - "epoch": 1.41, - "learning_rate": 1.1470315482470129e-06, - "loss": 0.7861, - "step": 54947 - }, - { - "epoch": 1.41, - "learning_rate": 1.1470041784647745e-06, - "loss": 0.7051, - "step": 54948 - }, - { - "epoch": 1.41, - "learning_rate": 1.146976808569982e-06, - "loss": 0.541, - "step": 54949 - }, - { - "epoch": 1.41, - "learning_rate": 1.1469494385626562e-06, - "loss": 0.5962, - "step": 54950 - }, - { - "epoch": 1.41, - "learning_rate": 1.146922068442818e-06, - "loss": 0.625, - "step": 54951 - }, - { - "epoch": 1.41, - "learning_rate": 1.1468946982104881e-06, - "loss": 0.5459, - "step": 54952 - }, - { - "epoch": 1.41, - "learning_rate": 1.1468673278656877e-06, - "loss": 0.7637, - "step": 54953 - }, - { - "epoch": 1.41, - "learning_rate": 1.1468399574084378e-06, - "loss": 0.5486, - "step": 54954 - }, - { - "epoch": 1.41, - "learning_rate": 1.1468125868387592e-06, - "loss": 0.6123, - "step": 54955 - }, - { - "epoch": 1.41, - "learning_rate": 1.146785216156673e-06, - "loss": 0.665, - "step": 54956 - }, - { - "epoch": 1.41, - "learning_rate": 1.1467578453622004e-06, - "loss": 0.4861, - "step": 54957 - }, - { - "epoch": 1.41, - "learning_rate": 1.1467304744553617e-06, - "loss": 0.5083, - "step": 54958 - }, - { - "epoch": 1.41, - "learning_rate": 1.1467031034361784e-06, - "loss": 0.6426, - "step": 54959 - }, - { - "epoch": 1.41, - "learning_rate": 1.1466757323046712e-06, - "loss": 0.4635, - "step": 54960 - }, - { - "epoch": 1.41, - "learning_rate": 1.1466483610608612e-06, - "loss": 0.7002, - "step": 54961 - }, - { - "epoch": 1.41, - "learning_rate": 1.146620989704769e-06, - "loss": 0.7139, - "step": 54962 - }, - { - "epoch": 1.41, - "learning_rate": 1.1465936182364165e-06, - "loss": 0.4458, - "step": 54963 - }, - { - "epoch": 1.41, - "learning_rate": 1.1465662466558234e-06, - "loss": 0.7705, - "step": 54964 - }, - { - "epoch": 1.41, - "learning_rate": 1.1465388749630116e-06, - "loss": 0.6299, - "step": 54965 - }, - { - "epoch": 1.41, - "learning_rate": 1.1465115031580018e-06, - "loss": 0.5928, - "step": 54966 - }, - { - "epoch": 1.41, - "learning_rate": 1.1464841312408147e-06, - "loss": 0.6162, - "step": 54967 - }, - { - "epoch": 1.41, - "learning_rate": 1.1464567592114712e-06, - "loss": 0.5659, - "step": 54968 - }, - { - "epoch": 1.41, - "learning_rate": 1.1464293870699928e-06, - "loss": 0.7822, - "step": 54969 - }, - { - "epoch": 1.41, - "learning_rate": 1.1464020148163998e-06, - "loss": 0.3828, - "step": 54970 - }, - { - "epoch": 1.41, - "learning_rate": 1.146374642450714e-06, - "loss": 0.6411, - "step": 54971 - }, - { - "epoch": 1.41, - "learning_rate": 1.1463472699729556e-06, - "loss": 0.6006, - "step": 54972 - }, - { - "epoch": 1.41, - "learning_rate": 1.1463198973831456e-06, - "loss": 0.7285, - "step": 54973 - }, - { - "epoch": 1.41, - "learning_rate": 1.1462925246813056e-06, - "loss": 0.4812, - "step": 54974 - }, - { - "epoch": 1.41, - "learning_rate": 1.146265151867456e-06, - "loss": 0.6982, - "step": 54975 - }, - { - "epoch": 1.41, - "learning_rate": 1.146237778941618e-06, - "loss": 0.7461, - "step": 54976 - }, - { - "epoch": 1.41, - "learning_rate": 1.1462104059038122e-06, - "loss": 0.8926, - "step": 54977 - }, - { - "epoch": 1.41, - "learning_rate": 1.14618303275406e-06, - "loss": 0.5854, - "step": 54978 - }, - { - "epoch": 1.41, - "learning_rate": 1.146155659492382e-06, - "loss": 0.5299, - "step": 54979 - }, - { - "epoch": 1.41, - "learning_rate": 1.1461282861187996e-06, - "loss": 0.5864, - "step": 54980 - }, - { - "epoch": 1.41, - "learning_rate": 1.1461009126333334e-06, - "loss": 0.6211, - "step": 54981 - }, - { - "epoch": 1.41, - "learning_rate": 1.1460735390360046e-06, - "loss": 0.6426, - "step": 54982 - }, - { - "epoch": 1.41, - "learning_rate": 1.1460461653268336e-06, - "loss": 0.6733, - "step": 54983 - }, - { - "epoch": 1.41, - "learning_rate": 1.146018791505842e-06, - "loss": 0.6982, - "step": 54984 - }, - { - "epoch": 1.41, - "learning_rate": 1.1459914175730502e-06, - "loss": 0.6445, - "step": 54985 - }, - { - "epoch": 1.41, - "learning_rate": 1.1459640435284802e-06, - "loss": 0.7568, - "step": 54986 - }, - { - "epoch": 1.41, - "learning_rate": 1.1459366693721518e-06, - "loss": 0.6107, - "step": 54987 - }, - { - "epoch": 1.41, - "learning_rate": 1.1459092951040864e-06, - "loss": 0.4104, - "step": 54988 - }, - { - "epoch": 1.41, - "learning_rate": 1.1458819207243048e-06, - "loss": 0.7207, - "step": 54989 - }, - { - "epoch": 1.41, - "learning_rate": 1.1458545462328284e-06, - "loss": 0.4985, - "step": 54990 - }, - { - "epoch": 1.41, - "learning_rate": 1.1458271716296778e-06, - "loss": 0.6963, - "step": 54991 - }, - { - "epoch": 1.41, - "learning_rate": 1.1457997969148741e-06, - "loss": 0.4436, - "step": 54992 - }, - { - "epoch": 1.41, - "learning_rate": 1.145772422088438e-06, - "loss": 0.834, - "step": 54993 - }, - { - "epoch": 1.41, - "learning_rate": 1.1457450471503906e-06, - "loss": 0.7441, - "step": 54994 - }, - { - "epoch": 1.41, - "learning_rate": 1.1457176721007533e-06, - "loss": 0.668, - "step": 54995 - }, - { - "epoch": 1.41, - "learning_rate": 1.1456902969395466e-06, - "loss": 0.5833, - "step": 54996 - }, - { - "epoch": 1.41, - "learning_rate": 1.1456629216667915e-06, - "loss": 0.6206, - "step": 54997 - }, - { - "epoch": 1.41, - "learning_rate": 1.1456355462825086e-06, - "loss": 0.5967, - "step": 54998 - }, - { - "epoch": 1.41, - "learning_rate": 1.1456081707867198e-06, - "loss": 0.5664, - "step": 54999 - }, - { - "epoch": 1.41, - "learning_rate": 1.1455807951794452e-06, - "loss": 0.4116, - "step": 55000 - }, - { - "epoch": 1.41, - "learning_rate": 1.1455534194607063e-06, - "loss": 0.6611, - "step": 55001 - }, - { - "epoch": 1.41, - "learning_rate": 1.1455260436305237e-06, - "loss": 0.6943, - "step": 55002 - }, - { - "epoch": 1.41, - "learning_rate": 1.1454986676889186e-06, - "loss": 0.5419, - "step": 55003 - }, - { - "epoch": 1.41, - "learning_rate": 1.1454712916359117e-06, - "loss": 0.646, - "step": 55004 - }, - { - "epoch": 1.41, - "learning_rate": 1.1454439154715242e-06, - "loss": 0.668, - "step": 55005 - }, - { - "epoch": 1.41, - "learning_rate": 1.145416539195777e-06, - "loss": 0.6963, - "step": 55006 - }, - { - "epoch": 1.41, - "learning_rate": 1.145389162808691e-06, - "loss": 0.7812, - "step": 55007 - }, - { - "epoch": 1.41, - "learning_rate": 1.1453617863102874e-06, - "loss": 0.6758, - "step": 55008 - }, - { - "epoch": 1.41, - "learning_rate": 1.1453344097005867e-06, - "loss": 0.6904, - "step": 55009 - }, - { - "epoch": 1.41, - "learning_rate": 1.14530703297961e-06, - "loss": 0.7041, - "step": 55010 - }, - { - "epoch": 1.41, - "learning_rate": 1.1452796561473788e-06, - "loss": 0.8125, - "step": 55011 - }, - { - "epoch": 1.41, - "learning_rate": 1.1452522792039135e-06, - "loss": 0.8535, - "step": 55012 - }, - { - "epoch": 1.41, - "learning_rate": 1.1452249021492353e-06, - "loss": 0.6162, - "step": 55013 - }, - { - "epoch": 1.41, - "learning_rate": 1.1451975249833648e-06, - "loss": 0.5413, - "step": 55014 - }, - { - "epoch": 1.41, - "learning_rate": 1.1451701477063233e-06, - "loss": 0.5547, - "step": 55015 - }, - { - "epoch": 1.41, - "learning_rate": 1.145142770318132e-06, - "loss": 0.6069, - "step": 55016 - }, - { - "epoch": 1.41, - "learning_rate": 1.145115392818811e-06, - "loss": 0.519, - "step": 55017 - }, - { - "epoch": 1.41, - "learning_rate": 1.1450880152083825e-06, - "loss": 0.6758, - "step": 55018 - }, - { - "epoch": 1.41, - "learning_rate": 1.1450606374868662e-06, - "loss": 0.5522, - "step": 55019 - }, - { - "epoch": 1.41, - "learning_rate": 1.1450332596542837e-06, - "loss": 0.6055, - "step": 55020 - }, - { - "epoch": 1.41, - "learning_rate": 1.1450058817106563e-06, - "loss": 0.5278, - "step": 55021 - }, - { - "epoch": 1.41, - "learning_rate": 1.1449785036560042e-06, - "loss": 0.6006, - "step": 55022 - }, - { - "epoch": 1.41, - "learning_rate": 1.1449511254903487e-06, - "loss": 0.793, - "step": 55023 - }, - { - "epoch": 1.41, - "learning_rate": 1.144923747213711e-06, - "loss": 0.7251, - "step": 55024 - }, - { - "epoch": 1.41, - "learning_rate": 1.1448963688261117e-06, - "loss": 0.5249, - "step": 55025 - }, - { - "epoch": 1.41, - "learning_rate": 1.1448689903275724e-06, - "loss": 0.6416, - "step": 55026 - }, - { - "epoch": 1.41, - "learning_rate": 1.144841611718113e-06, - "loss": 0.7656, - "step": 55027 - }, - { - "epoch": 1.41, - "learning_rate": 1.144814232997755e-06, - "loss": 0.6997, - "step": 55028 - }, - { - "epoch": 1.41, - "learning_rate": 1.1447868541665195e-06, - "loss": 0.6733, - "step": 55029 - }, - { - "epoch": 1.41, - "learning_rate": 1.1447594752244276e-06, - "loss": 0.8545, - "step": 55030 - }, - { - "epoch": 1.41, - "learning_rate": 1.1447320961714998e-06, - "loss": 0.7266, - "step": 55031 - }, - { - "epoch": 1.41, - "learning_rate": 1.1447047170077576e-06, - "loss": 0.666, - "step": 55032 - }, - { - "epoch": 1.41, - "learning_rate": 1.1446773377332212e-06, - "loss": 0.771, - "step": 55033 - }, - { - "epoch": 1.41, - "learning_rate": 1.1446499583479126e-06, - "loss": 0.7842, - "step": 55034 - }, - { - "epoch": 1.41, - "learning_rate": 1.1446225788518515e-06, - "loss": 0.8262, - "step": 55035 - }, - { - "epoch": 1.41, - "learning_rate": 1.14459519924506e-06, - "loss": 0.6704, - "step": 55036 - }, - { - "epoch": 1.41, - "learning_rate": 1.1445678195275584e-06, - "loss": 0.6548, - "step": 55037 - }, - { - "epoch": 1.41, - "learning_rate": 1.1445404396993678e-06, - "loss": 0.6301, - "step": 55038 - }, - { - "epoch": 1.41, - "learning_rate": 1.1445130597605094e-06, - "loss": 0.614, - "step": 55039 - }, - { - "epoch": 1.41, - "learning_rate": 1.1444856797110044e-06, - "loss": 0.7178, - "step": 55040 - }, - { - "epoch": 1.41, - "learning_rate": 1.144458299550873e-06, - "loss": 0.5215, - "step": 55041 - }, - { - "epoch": 1.41, - "learning_rate": 1.1444309192801363e-06, - "loss": 0.5903, - "step": 55042 - }, - { - "epoch": 1.41, - "learning_rate": 1.1444035388988156e-06, - "loss": 0.6816, - "step": 55043 - }, - { - "epoch": 1.41, - "learning_rate": 1.1443761584069315e-06, - "loss": 0.6553, - "step": 55044 - }, - { - "epoch": 1.41, - "learning_rate": 1.1443487778045056e-06, - "loss": 0.5659, - "step": 55045 - }, - { - "epoch": 1.41, - "learning_rate": 1.1443213970915583e-06, - "loss": 0.7002, - "step": 55046 - }, - { - "epoch": 1.41, - "learning_rate": 1.1442940162681112e-06, - "loss": 0.6387, - "step": 55047 - }, - { - "epoch": 1.41, - "learning_rate": 1.1442666353341841e-06, - "loss": 0.7783, - "step": 55048 - }, - { - "epoch": 1.41, - "learning_rate": 1.1442392542897993e-06, - "loss": 0.6445, - "step": 55049 - }, - { - "epoch": 1.41, - "learning_rate": 1.1442118731349766e-06, - "loss": 0.647, - "step": 55050 - }, - { - "epoch": 1.41, - "learning_rate": 1.1441844918697378e-06, - "loss": 0.752, - "step": 55051 - }, - { - "epoch": 1.41, - "learning_rate": 1.1441571104941034e-06, - "loss": 0.6865, - "step": 55052 - }, - { - "epoch": 1.41, - "learning_rate": 1.1441297290080946e-06, - "loss": 0.667, - "step": 55053 - }, - { - "epoch": 1.41, - "learning_rate": 1.1441023474117325e-06, - "loss": 0.688, - "step": 55054 - }, - { - "epoch": 1.41, - "learning_rate": 1.1440749657050377e-06, - "loss": 0.7246, - "step": 55055 - }, - { - "epoch": 1.41, - "learning_rate": 1.1440475838880311e-06, - "loss": 0.6704, - "step": 55056 - }, - { - "epoch": 1.41, - "learning_rate": 1.1440202019607343e-06, - "loss": 0.7627, - "step": 55057 - }, - { - "epoch": 1.41, - "learning_rate": 1.1439928199231675e-06, - "loss": 0.8533, - "step": 55058 - }, - { - "epoch": 1.41, - "learning_rate": 1.1439654377753522e-06, - "loss": 0.6494, - "step": 55059 - }, - { - "epoch": 1.41, - "learning_rate": 1.1439380555173091e-06, - "loss": 0.6777, - "step": 55060 - }, - { - "epoch": 1.41, - "learning_rate": 1.1439106731490594e-06, - "loss": 0.6284, - "step": 55061 - }, - { - "epoch": 1.41, - "learning_rate": 1.1438832906706236e-06, - "loss": 0.6538, - "step": 55062 - }, - { - "epoch": 1.41, - "learning_rate": 1.1438559080820232e-06, - "loss": 0.6797, - "step": 55063 - }, - { - "epoch": 1.41, - "learning_rate": 1.1438285253832792e-06, - "loss": 0.8135, - "step": 55064 - }, - { - "epoch": 1.41, - "learning_rate": 1.1438011425744119e-06, - "loss": 0.6812, - "step": 55065 - }, - { - "epoch": 1.41, - "learning_rate": 1.143773759655443e-06, - "loss": 0.6567, - "step": 55066 - }, - { - "epoch": 1.41, - "learning_rate": 1.1437463766263928e-06, - "loss": 0.4688, - "step": 55067 - }, - { - "epoch": 1.41, - "learning_rate": 1.143718993487283e-06, - "loss": 0.751, - "step": 55068 - }, - { - "epoch": 1.41, - "learning_rate": 1.1436916102381338e-06, - "loss": 0.6506, - "step": 55069 - }, - { - "epoch": 1.41, - "learning_rate": 1.1436642268789667e-06, - "loss": 0.6992, - "step": 55070 - }, - { - "epoch": 1.41, - "learning_rate": 1.1436368434098025e-06, - "loss": 0.6924, - "step": 55071 - }, - { - "epoch": 1.41, - "learning_rate": 1.1436094598306622e-06, - "loss": 0.5957, - "step": 55072 - }, - { - "epoch": 1.41, - "learning_rate": 1.1435820761415667e-06, - "loss": 0.6758, - "step": 55073 - }, - { - "epoch": 1.41, - "learning_rate": 1.143554692342537e-06, - "loss": 0.8691, - "step": 55074 - }, - { - "epoch": 1.41, - "learning_rate": 1.143527308433594e-06, - "loss": 0.6455, - "step": 55075 - }, - { - "epoch": 1.41, - "learning_rate": 1.143499924414759e-06, - "loss": 0.585, - "step": 55076 - }, - { - "epoch": 1.41, - "learning_rate": 1.1434725402860526e-06, - "loss": 0.5159, - "step": 55077 - }, - { - "epoch": 1.41, - "learning_rate": 1.1434451560474957e-06, - "loss": 0.6802, - "step": 55078 - }, - { - "epoch": 1.41, - "learning_rate": 1.1434177716991094e-06, - "loss": 0.9199, - "step": 55079 - }, - { - "epoch": 1.41, - "learning_rate": 1.143390387240915e-06, - "loss": 0.541, - "step": 55080 - }, - { - "epoch": 1.41, - "learning_rate": 1.1433630026729331e-06, - "loss": 0.6528, - "step": 55081 - }, - { - "epoch": 1.41, - "learning_rate": 1.1433356179951846e-06, - "loss": 0.6758, - "step": 55082 - }, - { - "epoch": 1.41, - "learning_rate": 1.1433082332076906e-06, - "loss": 0.5312, - "step": 55083 - }, - { - "epoch": 1.41, - "learning_rate": 1.1432808483104722e-06, - "loss": 0.6846, - "step": 55084 - }, - { - "epoch": 1.41, - "learning_rate": 1.1432534633035501e-06, - "loss": 0.7266, - "step": 55085 - }, - { - "epoch": 1.41, - "learning_rate": 1.1432260781869455e-06, - "loss": 0.8135, - "step": 55086 - }, - { - "epoch": 1.41, - "learning_rate": 1.1431986929606794e-06, - "loss": 0.5584, - "step": 55087 - }, - { - "epoch": 1.41, - "learning_rate": 1.1431713076247725e-06, - "loss": 0.7217, - "step": 55088 - }, - { - "epoch": 1.41, - "learning_rate": 1.1431439221792461e-06, - "loss": 0.6782, - "step": 55089 - }, - { - "epoch": 1.41, - "learning_rate": 1.1431165366241207e-06, - "loss": 0.6842, - "step": 55090 - }, - { - "epoch": 1.41, - "learning_rate": 1.1430891509594178e-06, - "loss": 0.6865, - "step": 55091 - }, - { - "epoch": 1.41, - "learning_rate": 1.143061765185158e-06, - "loss": 0.624, - "step": 55092 - }, - { - "epoch": 1.41, - "learning_rate": 1.1430343793013625e-06, - "loss": 0.6255, - "step": 55093 - }, - { - "epoch": 1.41, - "learning_rate": 1.1430069933080517e-06, - "loss": 0.8008, - "step": 55094 - }, - { - "epoch": 1.41, - "learning_rate": 1.1429796072052472e-06, - "loss": 0.7666, - "step": 55095 - }, - { - "epoch": 1.41, - "learning_rate": 1.1429522209929704e-06, - "loss": 0.6533, - "step": 55096 - }, - { - "epoch": 1.41, - "learning_rate": 1.1429248346712412e-06, - "loss": 0.584, - "step": 55097 - }, - { - "epoch": 1.41, - "learning_rate": 1.1428974482400809e-06, - "loss": 0.7227, - "step": 55098 - }, - { - "epoch": 1.41, - "learning_rate": 1.1428700616995105e-06, - "loss": 0.627, - "step": 55099 - }, - { - "epoch": 1.41, - "learning_rate": 1.1428426750495512e-06, - "loss": 0.7354, - "step": 55100 - }, - { - "epoch": 1.41, - "learning_rate": 1.1428152882902243e-06, - "loss": 0.585, - "step": 55101 - }, - { - "epoch": 1.41, - "learning_rate": 1.1427879014215498e-06, - "loss": 0.5728, - "step": 55102 - }, - { - "epoch": 1.41, - "learning_rate": 1.1427605144435492e-06, - "loss": 0.645, - "step": 55103 - }, - { - "epoch": 1.41, - "learning_rate": 1.1427331273562435e-06, - "loss": 0.6001, - "step": 55104 - }, - { - "epoch": 1.41, - "learning_rate": 1.1427057401596538e-06, - "loss": 0.665, - "step": 55105 - }, - { - "epoch": 1.41, - "learning_rate": 1.1426783528538007e-06, - "loss": 0.6016, - "step": 55106 - }, - { - "epoch": 1.41, - "learning_rate": 1.142650965438705e-06, - "loss": 0.6001, - "step": 55107 - }, - { - "epoch": 1.41, - "learning_rate": 1.1426235779143887e-06, - "loss": 0.5732, - "step": 55108 - }, - { - "epoch": 1.41, - "learning_rate": 1.1425961902808717e-06, - "loss": 0.4312, - "step": 55109 - }, - { - "epoch": 1.41, - "learning_rate": 1.1425688025381755e-06, - "loss": 0.6711, - "step": 55110 - }, - { - "epoch": 1.41, - "learning_rate": 1.1425414146863209e-06, - "loss": 0.3315, - "step": 55111 - }, - { - "epoch": 1.41, - "learning_rate": 1.1425140267253288e-06, - "loss": 0.3545, - "step": 55112 - }, - { - "epoch": 1.41, - "learning_rate": 1.14248663865522e-06, - "loss": 0.6123, - "step": 55113 - }, - { - "epoch": 1.41, - "learning_rate": 1.142459250476016e-06, - "loss": 0.5322, - "step": 55114 - }, - { - "epoch": 1.41, - "learning_rate": 1.1424318621877379e-06, - "loss": 0.5625, - "step": 55115 - }, - { - "epoch": 1.41, - "learning_rate": 1.1424044737904057e-06, - "loss": 0.6387, - "step": 55116 - }, - { - "epoch": 1.41, - "learning_rate": 1.1423770852840411e-06, - "loss": 0.7324, - "step": 55117 - }, - { - "epoch": 1.41, - "learning_rate": 1.142349696668665e-06, - "loss": 0.6904, - "step": 55118 - }, - { - "epoch": 1.41, - "learning_rate": 1.1423223079442981e-06, - "loss": 0.6562, - "step": 55119 - }, - { - "epoch": 1.41, - "learning_rate": 1.142294919110962e-06, - "loss": 0.7061, - "step": 55120 - }, - { - "epoch": 1.41, - "learning_rate": 1.1422675301686767e-06, - "loss": 0.6611, - "step": 55121 - }, - { - "epoch": 1.41, - "learning_rate": 1.142240141117464e-06, - "loss": 0.6953, - "step": 55122 - }, - { - "epoch": 1.41, - "learning_rate": 1.1422127519573444e-06, - "loss": 0.6519, - "step": 55123 - }, - { - "epoch": 1.41, - "learning_rate": 1.142185362688339e-06, - "loss": 0.6875, - "step": 55124 - }, - { - "epoch": 1.41, - "learning_rate": 1.1421579733104689e-06, - "loss": 0.6543, - "step": 55125 - }, - { - "epoch": 1.41, - "learning_rate": 1.142130583823755e-06, - "loss": 0.6577, - "step": 55126 - }, - { - "epoch": 1.41, - "learning_rate": 1.1421031942282182e-06, - "loss": 0.6519, - "step": 55127 - }, - { - "epoch": 1.41, - "learning_rate": 1.1420758045238794e-06, - "loss": 0.4346, - "step": 55128 - }, - { - "epoch": 1.41, - "learning_rate": 1.1420484147107599e-06, - "loss": 0.7349, - "step": 55129 - }, - { - "epoch": 1.41, - "learning_rate": 1.1420210247888804e-06, - "loss": 0.4702, - "step": 55130 - }, - { - "epoch": 1.41, - "learning_rate": 1.1419936347582622e-06, - "loss": 0.4873, - "step": 55131 - }, - { - "epoch": 1.41, - "learning_rate": 1.1419662446189255e-06, - "loss": 0.644, - "step": 55132 - }, - { - "epoch": 1.41, - "learning_rate": 1.1419388543708922e-06, - "loss": 0.501, - "step": 55133 - }, - { - "epoch": 1.41, - "learning_rate": 1.1419114640141822e-06, - "loss": 0.6572, - "step": 55134 - }, - { - "epoch": 1.41, - "learning_rate": 1.141884073548818e-06, - "loss": 0.6978, - "step": 55135 - }, - { - "epoch": 1.41, - "learning_rate": 1.1418566829748191e-06, - "loss": 0.8799, - "step": 55136 - }, - { - "epoch": 1.41, - "learning_rate": 1.1418292922922073e-06, - "loss": 0.6631, - "step": 55137 - }, - { - "epoch": 1.41, - "learning_rate": 1.1418019015010033e-06, - "loss": 0.7393, - "step": 55138 - }, - { - "epoch": 1.41, - "learning_rate": 1.1417745106012279e-06, - "loss": 0.7939, - "step": 55139 - }, - { - "epoch": 1.41, - "learning_rate": 1.1417471195929025e-06, - "loss": 0.5237, - "step": 55140 - }, - { - "epoch": 1.41, - "learning_rate": 1.1417197284760478e-06, - "loss": 0.7529, - "step": 55141 - }, - { - "epoch": 1.41, - "learning_rate": 1.1416923372506845e-06, - "loss": 0.7246, - "step": 55142 - }, - { - "epoch": 1.41, - "learning_rate": 1.1416649459168344e-06, - "loss": 0.5234, - "step": 55143 - }, - { - "epoch": 1.41, - "learning_rate": 1.1416375544745177e-06, - "loss": 0.6318, - "step": 55144 - }, - { - "epoch": 1.41, - "learning_rate": 1.1416101629237557e-06, - "loss": 0.7676, - "step": 55145 - }, - { - "epoch": 1.41, - "learning_rate": 1.1415827712645693e-06, - "loss": 0.6177, - "step": 55146 - }, - { - "epoch": 1.41, - "learning_rate": 1.1415553794969795e-06, - "loss": 0.606, - "step": 55147 - }, - { - "epoch": 1.41, - "learning_rate": 1.1415279876210073e-06, - "loss": 0.4443, - "step": 55148 - }, - { - "epoch": 1.41, - "learning_rate": 1.1415005956366737e-06, - "loss": 0.4619, - "step": 55149 - }, - { - "epoch": 1.41, - "learning_rate": 1.1414732035439994e-06, - "loss": 0.7393, - "step": 55150 - }, - { - "epoch": 1.41, - "learning_rate": 1.1414458113430054e-06, - "loss": 0.5732, - "step": 55151 - }, - { - "epoch": 1.41, - "learning_rate": 1.1414184190337132e-06, - "loss": 0.6699, - "step": 55152 - }, - { - "epoch": 1.41, - "learning_rate": 1.1413910266161432e-06, - "loss": 0.4863, - "step": 55153 - }, - { - "epoch": 1.41, - "learning_rate": 1.1413636340903168e-06, - "loss": 0.5259, - "step": 55154 - }, - { - "epoch": 1.41, - "learning_rate": 1.1413362414562548e-06, - "loss": 0.7646, - "step": 55155 - }, - { - "epoch": 1.41, - "learning_rate": 1.141308848713978e-06, - "loss": 0.7393, - "step": 55156 - }, - { - "epoch": 1.41, - "learning_rate": 1.1412814558635073e-06, - "loss": 0.6396, - "step": 55157 - }, - { - "epoch": 1.41, - "learning_rate": 1.1412540629048641e-06, - "loss": 0.7207, - "step": 55158 - }, - { - "epoch": 1.41, - "learning_rate": 1.141226669838069e-06, - "loss": 0.7852, - "step": 55159 - }, - { - "epoch": 1.41, - "learning_rate": 1.1411992766631437e-06, - "loss": 0.6772, - "step": 55160 - }, - { - "epoch": 1.41, - "learning_rate": 1.141171883380108e-06, - "loss": 0.5605, - "step": 55161 - }, - { - "epoch": 1.41, - "learning_rate": 1.1411444899889837e-06, - "loss": 0.6304, - "step": 55162 - }, - { - "epoch": 1.41, - "learning_rate": 1.1411170964897917e-06, - "loss": 0.8525, - "step": 55163 - }, - { - "epoch": 1.41, - "learning_rate": 1.1410897028825525e-06, - "loss": 0.7188, - "step": 55164 - }, - { - "epoch": 1.41, - "learning_rate": 1.1410623091672877e-06, - "loss": 0.7236, - "step": 55165 - }, - { - "epoch": 1.41, - "learning_rate": 1.141034915344018e-06, - "loss": 0.7402, - "step": 55166 - }, - { - "epoch": 1.41, - "learning_rate": 1.1410075214127638e-06, - "loss": 0.7026, - "step": 55167 - }, - { - "epoch": 1.41, - "learning_rate": 1.140980127373547e-06, - "loss": 0.6016, - "step": 55168 - }, - { - "epoch": 1.41, - "learning_rate": 1.1409527332263881e-06, - "loss": 0.4503, - "step": 55169 - }, - { - "epoch": 1.41, - "learning_rate": 1.1409253389713085e-06, - "loss": 0.353, - "step": 55170 - }, - { - "epoch": 1.41, - "learning_rate": 1.1408979446083286e-06, - "loss": 0.6431, - "step": 55171 - }, - { - "epoch": 1.41, - "learning_rate": 1.1408705501374695e-06, - "loss": 0.7959, - "step": 55172 - }, - { - "epoch": 1.41, - "learning_rate": 1.1408431555587526e-06, - "loss": 0.75, - "step": 55173 - }, - { - "epoch": 1.41, - "learning_rate": 1.1408157608721982e-06, - "loss": 0.5132, - "step": 55174 - }, - { - "epoch": 1.41, - "learning_rate": 1.1407883660778284e-06, - "loss": 0.5132, - "step": 55175 - }, - { - "epoch": 1.41, - "learning_rate": 1.1407609711756627e-06, - "loss": 0.6201, - "step": 55176 - }, - { - "epoch": 1.41, - "learning_rate": 1.140733576165723e-06, - "loss": 0.4622, - "step": 55177 - }, - { - "epoch": 1.41, - "learning_rate": 1.1407061810480298e-06, - "loss": 0.7026, - "step": 55178 - }, - { - "epoch": 1.41, - "learning_rate": 1.140678785822605e-06, - "loss": 0.6196, - "step": 55179 - }, - { - "epoch": 1.41, - "learning_rate": 1.1406513904894684e-06, - "loss": 0.7939, - "step": 55180 - }, - { - "epoch": 1.41, - "learning_rate": 1.1406239950486415e-06, - "loss": 0.5317, - "step": 55181 - }, - { - "epoch": 1.41, - "learning_rate": 1.1405965995001454e-06, - "loss": 0.7246, - "step": 55182 - }, - { - "epoch": 1.41, - "learning_rate": 1.1405692038440011e-06, - "loss": 0.6484, - "step": 55183 - }, - { - "epoch": 1.41, - "learning_rate": 1.1405418080802292e-06, - "loss": 0.564, - "step": 55184 - }, - { - "epoch": 1.41, - "learning_rate": 1.1405144122088511e-06, - "loss": 0.5211, - "step": 55185 - }, - { - "epoch": 1.41, - "learning_rate": 1.1404870162298873e-06, - "loss": 0.71, - "step": 55186 - }, - { - "epoch": 1.41, - "learning_rate": 1.1404596201433595e-06, - "loss": 0.6987, - "step": 55187 - }, - { - "epoch": 1.41, - "learning_rate": 1.1404322239492876e-06, - "loss": 0.834, - "step": 55188 - }, - { - "epoch": 1.41, - "learning_rate": 1.1404048276476937e-06, - "loss": 0.7031, - "step": 55189 - }, - { - "epoch": 1.41, - "learning_rate": 1.140377431238598e-06, - "loss": 0.5894, - "step": 55190 - }, - { - "epoch": 1.41, - "learning_rate": 1.1403500347220218e-06, - "loss": 0.5405, - "step": 55191 - }, - { - "epoch": 1.41, - "learning_rate": 1.1403226380979863e-06, - "loss": 0.6689, - "step": 55192 - }, - { - "epoch": 1.41, - "learning_rate": 1.140295241366512e-06, - "loss": 0.7695, - "step": 55193 - }, - { - "epoch": 1.41, - "learning_rate": 1.14026784452762e-06, - "loss": 0.6313, - "step": 55194 - }, - { - "epoch": 1.41, - "learning_rate": 1.1402404475813314e-06, - "loss": 0.4775, - "step": 55195 - }, - { - "epoch": 1.41, - "learning_rate": 1.1402130505276672e-06, - "loss": 0.7246, - "step": 55196 - }, - { - "epoch": 1.41, - "learning_rate": 1.1401856533666482e-06, - "loss": 0.4802, - "step": 55197 - }, - { - "epoch": 1.41, - "learning_rate": 1.1401582560982957e-06, - "loss": 0.7144, - "step": 55198 - }, - { - "epoch": 1.41, - "learning_rate": 1.14013085872263e-06, - "loss": 0.8066, - "step": 55199 - }, - { - "epoch": 1.41, - "learning_rate": 1.1401034612396733e-06, - "loss": 0.6943, - "step": 55200 - }, - { - "epoch": 1.41, - "learning_rate": 1.1400760636494453e-06, - "loss": 0.6055, - "step": 55201 - }, - { - "epoch": 1.41, - "learning_rate": 1.1400486659519678e-06, - "loss": 0.5898, - "step": 55202 - }, - { - "epoch": 1.41, - "learning_rate": 1.140021268147261e-06, - "loss": 0.7676, - "step": 55203 - }, - { - "epoch": 1.41, - "learning_rate": 1.139993870235347e-06, - "loss": 0.6431, - "step": 55204 - }, - { - "epoch": 1.41, - "learning_rate": 1.1399664722162456e-06, - "loss": 0.4868, - "step": 55205 - }, - { - "epoch": 1.41, - "learning_rate": 1.1399390740899786e-06, - "loss": 0.7119, - "step": 55206 - }, - { - "epoch": 1.41, - "learning_rate": 1.1399116758565665e-06, - "loss": 0.6016, - "step": 55207 - }, - { - "epoch": 1.42, - "learning_rate": 1.1398842775160306e-06, - "loss": 0.689, - "step": 55208 - }, - { - "epoch": 1.42, - "learning_rate": 1.1398568790683916e-06, - "loss": 0.5813, - "step": 55209 - }, - { - "epoch": 1.42, - "learning_rate": 1.139829480513671e-06, - "loss": 0.7871, - "step": 55210 - }, - { - "epoch": 1.42, - "learning_rate": 1.1398020818518889e-06, - "loss": 0.7266, - "step": 55211 - }, - { - "epoch": 1.42, - "learning_rate": 1.139774683083067e-06, - "loss": 0.5682, - "step": 55212 - }, - { - "epoch": 1.42, - "learning_rate": 1.139747284207226e-06, - "loss": 0.7166, - "step": 55213 - }, - { - "epoch": 1.42, - "learning_rate": 1.139719885224387e-06, - "loss": 0.6177, - "step": 55214 - }, - { - "epoch": 1.42, - "learning_rate": 1.139692486134571e-06, - "loss": 0.8633, - "step": 55215 - }, - { - "epoch": 1.42, - "learning_rate": 1.1396650869377985e-06, - "loss": 0.5269, - "step": 55216 - }, - { - "epoch": 1.42, - "learning_rate": 1.1396376876340913e-06, - "loss": 0.6396, - "step": 55217 - }, - { - "epoch": 1.42, - "learning_rate": 1.1396102882234694e-06, - "loss": 0.6626, - "step": 55218 - }, - { - "epoch": 1.42, - "learning_rate": 1.1395828887059548e-06, - "loss": 0.6953, - "step": 55219 - }, - { - "epoch": 1.42, - "learning_rate": 1.1395554890815679e-06, - "loss": 0.7402, - "step": 55220 - }, - { - "epoch": 1.42, - "learning_rate": 1.1395280893503299e-06, - "loss": 0.571, - "step": 55221 - }, - { - "epoch": 1.42, - "learning_rate": 1.1395006895122615e-06, - "loss": 0.6914, - "step": 55222 - }, - { - "epoch": 1.42, - "learning_rate": 1.1394732895673838e-06, - "loss": 0.6328, - "step": 55223 - }, - { - "epoch": 1.42, - "learning_rate": 1.1394458895157177e-06, - "loss": 0.5762, - "step": 55224 - }, - { - "epoch": 1.42, - "learning_rate": 1.139418489357285e-06, - "loss": 0.8047, - "step": 55225 - }, - { - "epoch": 1.42, - "learning_rate": 1.1393910890921051e-06, - "loss": 0.6382, - "step": 55226 - }, - { - "epoch": 1.42, - "learning_rate": 1.1393636887202002e-06, - "loss": 0.6953, - "step": 55227 - }, - { - "epoch": 1.42, - "learning_rate": 1.139336288241591e-06, - "loss": 0.7129, - "step": 55228 - }, - { - "epoch": 1.42, - "learning_rate": 1.1393088876562983e-06, - "loss": 0.6855, - "step": 55229 - }, - { - "epoch": 1.42, - "learning_rate": 1.1392814869643432e-06, - "loss": 0.584, - "step": 55230 - }, - { - "epoch": 1.42, - "learning_rate": 1.1392540861657467e-06, - "loss": 0.7412, - "step": 55231 - }, - { - "epoch": 1.42, - "learning_rate": 1.1392266852605297e-06, - "loss": 0.6205, - "step": 55232 - }, - { - "epoch": 1.42, - "learning_rate": 1.1391992842487132e-06, - "loss": 0.7139, - "step": 55233 - }, - { - "epoch": 1.42, - "learning_rate": 1.1391718831303184e-06, - "loss": 0.5625, - "step": 55234 - }, - { - "epoch": 1.42, - "learning_rate": 1.139144481905366e-06, - "loss": 0.5859, - "step": 55235 - }, - { - "epoch": 1.42, - "learning_rate": 1.139117080573877e-06, - "loss": 0.6582, - "step": 55236 - }, - { - "epoch": 1.42, - "learning_rate": 1.1390896791358723e-06, - "loss": 0.6045, - "step": 55237 - }, - { - "epoch": 1.42, - "learning_rate": 1.1390622775913735e-06, - "loss": 0.6128, - "step": 55238 - }, - { - "epoch": 1.42, - "learning_rate": 1.1390348759404008e-06, - "loss": 0.7471, - "step": 55239 - }, - { - "epoch": 1.42, - "learning_rate": 1.1390074741829757e-06, - "loss": 0.5439, - "step": 55240 - }, - { - "epoch": 1.42, - "learning_rate": 1.1389800723191185e-06, - "loss": 0.7358, - "step": 55241 - }, - { - "epoch": 1.42, - "learning_rate": 1.138952670348851e-06, - "loss": 0.6182, - "step": 55242 - }, - { - "epoch": 1.42, - "learning_rate": 1.1389252682721934e-06, - "loss": 0.7568, - "step": 55243 - }, - { - "epoch": 1.42, - "learning_rate": 1.1388978660891677e-06, - "loss": 0.6357, - "step": 55244 - }, - { - "epoch": 1.42, - "learning_rate": 1.138870463799794e-06, - "loss": 0.7822, - "step": 55245 - }, - { - "epoch": 1.42, - "learning_rate": 1.1388430614040938e-06, - "loss": 0.7773, - "step": 55246 - }, - { - "epoch": 1.42, - "learning_rate": 1.1388156589020876e-06, - "loss": 0.6494, - "step": 55247 - }, - { - "epoch": 1.42, - "learning_rate": 1.1387882562937967e-06, - "loss": 0.6855, - "step": 55248 - }, - { - "epoch": 1.42, - "learning_rate": 1.138760853579242e-06, - "loss": 0.8262, - "step": 55249 - }, - { - "epoch": 1.42, - "learning_rate": 1.1387334507584447e-06, - "loss": 0.7266, - "step": 55250 - }, - { - "epoch": 1.42, - "learning_rate": 1.1387060478314251e-06, - "loss": 0.6382, - "step": 55251 - }, - { - "epoch": 1.42, - "learning_rate": 1.1386786447982053e-06, - "loss": 0.5728, - "step": 55252 - }, - { - "epoch": 1.42, - "learning_rate": 1.138651241658805e-06, - "loss": 0.665, - "step": 55253 - }, - { - "epoch": 1.42, - "learning_rate": 1.1386238384132463e-06, - "loss": 0.625, - "step": 55254 - }, - { - "epoch": 1.42, - "learning_rate": 1.1385964350615495e-06, - "loss": 0.6616, - "step": 55255 - }, - { - "epoch": 1.42, - "learning_rate": 1.138569031603736e-06, - "loss": 0.5361, - "step": 55256 - }, - { - "epoch": 1.42, - "learning_rate": 1.1385416280398262e-06, - "loss": 0.7227, - "step": 55257 - }, - { - "epoch": 1.42, - "learning_rate": 1.1385142243698416e-06, - "loss": 0.8789, - "step": 55258 - }, - { - "epoch": 1.42, - "learning_rate": 1.138486820593803e-06, - "loss": 0.6377, - "step": 55259 - }, - { - "epoch": 1.42, - "learning_rate": 1.1384594167117314e-06, - "loss": 0.5669, - "step": 55260 - }, - { - "epoch": 1.42, - "learning_rate": 1.138432012723648e-06, - "loss": 0.5771, - "step": 55261 - }, - { - "epoch": 1.42, - "learning_rate": 1.138404608629573e-06, - "loss": 0.9062, - "step": 55262 - }, - { - "epoch": 1.42, - "learning_rate": 1.1383772044295286e-06, - "loss": 0.6543, - "step": 55263 - }, - { - "epoch": 1.42, - "learning_rate": 1.1383498001235347e-06, - "loss": 0.6782, - "step": 55264 - }, - { - "epoch": 1.42, - "learning_rate": 1.1383223957116133e-06, - "loss": 0.6567, - "step": 55265 - }, - { - "epoch": 1.42, - "learning_rate": 1.1382949911937843e-06, - "loss": 0.6543, - "step": 55266 - }, - { - "epoch": 1.42, - "learning_rate": 1.1382675865700692e-06, - "loss": 0.6201, - "step": 55267 - }, - { - "epoch": 1.42, - "learning_rate": 1.138240181840489e-06, - "loss": 0.7275, - "step": 55268 - }, - { - "epoch": 1.42, - "learning_rate": 1.1382127770050649e-06, - "loss": 0.6802, - "step": 55269 - }, - { - "epoch": 1.42, - "learning_rate": 1.1381853720638174e-06, - "loss": 0.7334, - "step": 55270 - }, - { - "epoch": 1.42, - "learning_rate": 1.1381579670167677e-06, - "loss": 0.627, - "step": 55271 - }, - { - "epoch": 1.42, - "learning_rate": 1.138130561863937e-06, - "loss": 0.4626, - "step": 55272 - }, - { - "epoch": 1.42, - "learning_rate": 1.1381031566053458e-06, - "loss": 0.6143, - "step": 55273 - }, - { - "epoch": 1.42, - "learning_rate": 1.1380757512410156e-06, - "loss": 0.5205, - "step": 55274 - }, - { - "epoch": 1.42, - "learning_rate": 1.1380483457709674e-06, - "loss": 0.5388, - "step": 55275 - }, - { - "epoch": 1.42, - "learning_rate": 1.1380209401952213e-06, - "loss": 0.5803, - "step": 55276 - }, - { - "epoch": 1.42, - "learning_rate": 1.1379935345137992e-06, - "loss": 0.4988, - "step": 55277 - }, - { - "epoch": 1.42, - "learning_rate": 1.1379661287267218e-06, - "loss": 0.6257, - "step": 55278 - }, - { - "epoch": 1.42, - "learning_rate": 1.13793872283401e-06, - "loss": 0.6816, - "step": 55279 - }, - { - "epoch": 1.42, - "learning_rate": 1.1379113168356852e-06, - "loss": 0.679, - "step": 55280 - }, - { - "epoch": 1.42, - "learning_rate": 1.1378839107317675e-06, - "loss": 0.6499, - "step": 55281 - }, - { - "epoch": 1.42, - "learning_rate": 1.1378565045222787e-06, - "loss": 0.6162, - "step": 55282 - }, - { - "epoch": 1.42, - "learning_rate": 1.1378290982072396e-06, - "loss": 0.6787, - "step": 55283 - }, - { - "epoch": 1.42, - "learning_rate": 1.1378016917866709e-06, - "loss": 0.6172, - "step": 55284 - }, - { - "epoch": 1.42, - "learning_rate": 1.137774285260594e-06, - "loss": 0.542, - "step": 55285 - }, - { - "epoch": 1.42, - "learning_rate": 1.1377468786290297e-06, - "loss": 0.709, - "step": 55286 - }, - { - "epoch": 1.42, - "learning_rate": 1.1377194718919985e-06, - "loss": 0.7012, - "step": 55287 - }, - { - "epoch": 1.42, - "learning_rate": 1.1376920650495222e-06, - "loss": 0.4895, - "step": 55288 - }, - { - "epoch": 1.42, - "learning_rate": 1.1376646581016213e-06, - "loss": 0.7246, - "step": 55289 - }, - { - "epoch": 1.42, - "learning_rate": 1.1376372510483171e-06, - "loss": 0.9531, - "step": 55290 - }, - { - "epoch": 1.42, - "learning_rate": 1.1376098438896302e-06, - "loss": 0.5972, - "step": 55291 - }, - { - "epoch": 1.42, - "learning_rate": 1.137582436625582e-06, - "loss": 0.7861, - "step": 55292 - }, - { - "epoch": 1.42, - "learning_rate": 1.1375550292561929e-06, - "loss": 0.6738, - "step": 55293 - }, - { - "epoch": 1.42, - "learning_rate": 1.1375276217814845e-06, - "loss": 0.6406, - "step": 55294 - }, - { - "epoch": 1.42, - "learning_rate": 1.1375002142014776e-06, - "loss": 0.6023, - "step": 55295 - }, - { - "epoch": 1.42, - "learning_rate": 1.1374728065161928e-06, - "loss": 0.5544, - "step": 55296 - }, - { - "epoch": 1.42, - "learning_rate": 1.1374453987256517e-06, - "loss": 0.6602, - "step": 55297 - }, - { - "epoch": 1.42, - "learning_rate": 1.1374179908298748e-06, - "loss": 0.6836, - "step": 55298 - }, - { - "epoch": 1.42, - "learning_rate": 1.137390582828883e-06, - "loss": 0.6943, - "step": 55299 - }, - { - "epoch": 1.42, - "learning_rate": 1.1373631747226982e-06, - "loss": 0.6064, - "step": 55300 - }, - { - "epoch": 1.42, - "learning_rate": 1.13733576651134e-06, - "loss": 0.6836, - "step": 55301 - }, - { - "epoch": 1.42, - "learning_rate": 1.1373083581948306e-06, - "loss": 0.5132, - "step": 55302 - }, - { - "epoch": 1.42, - "learning_rate": 1.1372809497731902e-06, - "loss": 0.5343, - "step": 55303 - }, - { - "epoch": 1.42, - "learning_rate": 1.1372535412464407e-06, - "loss": 0.6934, - "step": 55304 - }, - { - "epoch": 1.42, - "learning_rate": 1.137226132614602e-06, - "loss": 0.4474, - "step": 55305 - }, - { - "epoch": 1.42, - "learning_rate": 1.1371987238776953e-06, - "loss": 0.7012, - "step": 55306 - }, - { - "epoch": 1.42, - "learning_rate": 1.1371713150357422e-06, - "loss": 0.7744, - "step": 55307 - }, - { - "epoch": 1.42, - "learning_rate": 1.1371439060887632e-06, - "loss": 0.7529, - "step": 55308 - }, - { - "epoch": 1.42, - "learning_rate": 1.1371164970367798e-06, - "loss": 0.5142, - "step": 55309 - }, - { - "epoch": 1.42, - "learning_rate": 1.1370890878798123e-06, - "loss": 0.7705, - "step": 55310 - }, - { - "epoch": 1.42, - "learning_rate": 1.137061678617882e-06, - "loss": 0.6836, - "step": 55311 - }, - { - "epoch": 1.42, - "learning_rate": 1.1370342692510097e-06, - "loss": 0.6338, - "step": 55312 - }, - { - "epoch": 1.42, - "learning_rate": 1.1370068597792168e-06, - "loss": 0.7213, - "step": 55313 - }, - { - "epoch": 1.42, - "learning_rate": 1.1369794502025237e-06, - "loss": 0.6445, - "step": 55314 - }, - { - "epoch": 1.42, - "learning_rate": 1.1369520405209525e-06, - "loss": 0.6069, - "step": 55315 - }, - { - "epoch": 1.42, - "learning_rate": 1.1369246307345227e-06, - "loss": 0.6846, - "step": 55316 - }, - { - "epoch": 1.42, - "learning_rate": 1.1368972208432564e-06, - "loss": 0.793, - "step": 55317 - }, - { - "epoch": 1.42, - "learning_rate": 1.1368698108471738e-06, - "loss": 0.8145, - "step": 55318 - }, - { - "epoch": 1.42, - "learning_rate": 1.1368424007462967e-06, - "loss": 0.5603, - "step": 55319 - }, - { - "epoch": 1.42, - "learning_rate": 1.1368149905406455e-06, - "loss": 0.6924, - "step": 55320 - }, - { - "epoch": 1.42, - "learning_rate": 1.1367875802302413e-06, - "loss": 0.5765, - "step": 55321 - }, - { - "epoch": 1.42, - "learning_rate": 1.136760169815105e-06, - "loss": 0.6454, - "step": 55322 - }, - { - "epoch": 1.42, - "learning_rate": 1.136732759295258e-06, - "loss": 0.5938, - "step": 55323 - }, - { - "epoch": 1.42, - "learning_rate": 1.1367053486707207e-06, - "loss": 0.6621, - "step": 55324 - }, - { - "epoch": 1.42, - "learning_rate": 1.1366779379415148e-06, - "loss": 0.6895, - "step": 55325 - }, - { - "epoch": 1.42, - "learning_rate": 1.1366505271076607e-06, - "loss": 0.5234, - "step": 55326 - }, - { - "epoch": 1.42, - "learning_rate": 1.1366231161691794e-06, - "loss": 0.6174, - "step": 55327 - }, - { - "epoch": 1.42, - "learning_rate": 1.1365957051260923e-06, - "loss": 0.6277, - "step": 55328 - }, - { - "epoch": 1.42, - "learning_rate": 1.1365682939784202e-06, - "loss": 0.7539, - "step": 55329 - }, - { - "epoch": 1.42, - "learning_rate": 1.136540882726184e-06, - "loss": 0.5649, - "step": 55330 - }, - { - "epoch": 1.42, - "learning_rate": 1.1365134713694045e-06, - "loss": 0.4976, - "step": 55331 - }, - { - "epoch": 1.42, - "learning_rate": 1.136486059908103e-06, - "loss": 0.751, - "step": 55332 - }, - { - "epoch": 1.42, - "learning_rate": 1.1364586483423004e-06, - "loss": 0.7266, - "step": 55333 - }, - { - "epoch": 1.42, - "learning_rate": 1.136431236672018e-06, - "loss": 0.6499, - "step": 55334 - }, - { - "epoch": 1.42, - "learning_rate": 1.1364038248972761e-06, - "loss": 0.6113, - "step": 55335 - }, - { - "epoch": 1.42, - "learning_rate": 1.1363764130180961e-06, - "loss": 0.624, - "step": 55336 - }, - { - "epoch": 1.42, - "learning_rate": 1.1363490010344992e-06, - "loss": 0.6011, - "step": 55337 - }, - { - "epoch": 1.42, - "learning_rate": 1.136321588946506e-06, - "loss": 0.6167, - "step": 55338 - }, - { - "epoch": 1.42, - "learning_rate": 1.1362941767541374e-06, - "loss": 0.6973, - "step": 55339 - }, - { - "epoch": 1.42, - "learning_rate": 1.1362667644574151e-06, - "loss": 0.4526, - "step": 55340 - }, - { - "epoch": 1.42, - "learning_rate": 1.136239352056359e-06, - "loss": 0.7129, - "step": 55341 - }, - { - "epoch": 1.42, - "learning_rate": 1.1362119395509914e-06, - "loss": 0.5728, - "step": 55342 - }, - { - "epoch": 1.42, - "learning_rate": 1.1361845269413319e-06, - "loss": 0.6484, - "step": 55343 - }, - { - "epoch": 1.42, - "learning_rate": 1.1361571142274024e-06, - "loss": 0.6924, - "step": 55344 - }, - { - "epoch": 1.42, - "learning_rate": 1.136129701409224e-06, - "loss": 0.6534, - "step": 55345 - }, - { - "epoch": 1.42, - "learning_rate": 1.136102288486817e-06, - "loss": 0.6206, - "step": 55346 - }, - { - "epoch": 1.42, - "learning_rate": 1.1360748754602028e-06, - "loss": 0.6963, - "step": 55347 - }, - { - "epoch": 1.42, - "learning_rate": 1.1360474623294022e-06, - "loss": 0.7607, - "step": 55348 - }, - { - "epoch": 1.42, - "learning_rate": 1.1360200490944363e-06, - "loss": 0.6638, - "step": 55349 - }, - { - "epoch": 1.42, - "learning_rate": 1.1359926357553265e-06, - "loss": 0.6865, - "step": 55350 - }, - { - "epoch": 1.42, - "learning_rate": 1.135965222312093e-06, - "loss": 0.7266, - "step": 55351 - }, - { - "epoch": 1.42, - "learning_rate": 1.1359378087647574e-06, - "loss": 0.7373, - "step": 55352 - }, - { - "epoch": 1.42, - "learning_rate": 1.1359103951133401e-06, - "loss": 0.6514, - "step": 55353 - }, - { - "epoch": 1.42, - "learning_rate": 1.1358829813578627e-06, - "loss": 0.7046, - "step": 55354 - }, - { - "epoch": 1.42, - "learning_rate": 1.1358555674983464e-06, - "loss": 0.6055, - "step": 55355 - }, - { - "epoch": 1.42, - "learning_rate": 1.135828153534811e-06, - "loss": 0.7119, - "step": 55356 - }, - { - "epoch": 1.42, - "learning_rate": 1.1358007394672789e-06, - "loss": 0.5156, - "step": 55357 - }, - { - "epoch": 1.42, - "learning_rate": 1.1357733252957698e-06, - "loss": 0.8184, - "step": 55358 - }, - { - "epoch": 1.42, - "learning_rate": 1.135745911020306e-06, - "loss": 0.7393, - "step": 55359 - }, - { - "epoch": 1.42, - "learning_rate": 1.1357184966409072e-06, - "loss": 0.6353, - "step": 55360 - }, - { - "epoch": 1.42, - "learning_rate": 1.1356910821575952e-06, - "loss": 0.605, - "step": 55361 - }, - { - "epoch": 1.42, - "learning_rate": 1.1356636675703905e-06, - "loss": 0.6528, - "step": 55362 - }, - { - "epoch": 1.42, - "learning_rate": 1.1356362528793148e-06, - "loss": 0.5413, - "step": 55363 - }, - { - "epoch": 1.42, - "learning_rate": 1.1356088380843885e-06, - "loss": 0.7041, - "step": 55364 - }, - { - "epoch": 1.42, - "learning_rate": 1.1355814231856328e-06, - "loss": 0.645, - "step": 55365 - }, - { - "epoch": 1.42, - "learning_rate": 1.1355540081830686e-06, - "loss": 0.5488, - "step": 55366 - }, - { - "epoch": 1.42, - "learning_rate": 1.1355265930767168e-06, - "loss": 0.7324, - "step": 55367 - }, - { - "epoch": 1.42, - "learning_rate": 1.1354991778665986e-06, - "loss": 0.6382, - "step": 55368 - }, - { - "epoch": 1.42, - "learning_rate": 1.135471762552735e-06, - "loss": 0.6719, - "step": 55369 - }, - { - "epoch": 1.42, - "learning_rate": 1.1354443471351469e-06, - "loss": 0.6855, - "step": 55370 - }, - { - "epoch": 1.42, - "learning_rate": 1.1354169316138548e-06, - "loss": 0.5791, - "step": 55371 - }, - { - "epoch": 1.42, - "learning_rate": 1.1353895159888808e-06, - "loss": 0.6826, - "step": 55372 - }, - { - "epoch": 1.42, - "learning_rate": 1.135362100260245e-06, - "loss": 0.4307, - "step": 55373 - }, - { - "epoch": 1.42, - "learning_rate": 1.1353346844279687e-06, - "loss": 0.6719, - "step": 55374 - }, - { - "epoch": 1.42, - "learning_rate": 1.135307268492073e-06, - "loss": 0.4353, - "step": 55375 - }, - { - "epoch": 1.42, - "learning_rate": 1.135279852452579e-06, - "loss": 0.6572, - "step": 55376 - }, - { - "epoch": 1.42, - "learning_rate": 1.1352524363095067e-06, - "loss": 0.749, - "step": 55377 - }, - { - "epoch": 1.42, - "learning_rate": 1.135225020062878e-06, - "loss": 0.5444, - "step": 55378 - }, - { - "epoch": 1.42, - "learning_rate": 1.135197603712714e-06, - "loss": 0.6133, - "step": 55379 - }, - { - "epoch": 1.42, - "learning_rate": 1.1351701872590355e-06, - "loss": 0.6554, - "step": 55380 - }, - { - "epoch": 1.42, - "learning_rate": 1.1351427707018632e-06, - "loss": 0.7881, - "step": 55381 - }, - { - "epoch": 1.42, - "learning_rate": 1.1351153540412185e-06, - "loss": 0.6553, - "step": 55382 - }, - { - "epoch": 1.42, - "learning_rate": 1.1350879372771218e-06, - "loss": 0.8213, - "step": 55383 - }, - { - "epoch": 1.42, - "learning_rate": 1.1350605204095947e-06, - "loss": 0.7217, - "step": 55384 - }, - { - "epoch": 1.42, - "learning_rate": 1.135033103438658e-06, - "loss": 0.6, - "step": 55385 - }, - { - "epoch": 1.42, - "learning_rate": 1.1350056863643326e-06, - "loss": 0.4761, - "step": 55386 - }, - { - "epoch": 1.42, - "learning_rate": 1.1349782691866397e-06, - "loss": 0.5151, - "step": 55387 - }, - { - "epoch": 1.42, - "learning_rate": 1.1349508519055998e-06, - "loss": 0.4888, - "step": 55388 - }, - { - "epoch": 1.42, - "learning_rate": 1.1349234345212347e-06, - "loss": 0.5691, - "step": 55389 - }, - { - "epoch": 1.42, - "learning_rate": 1.134896017033565e-06, - "loss": 0.583, - "step": 55390 - }, - { - "epoch": 1.42, - "learning_rate": 1.134868599442611e-06, - "loss": 0.6685, - "step": 55391 - }, - { - "epoch": 1.42, - "learning_rate": 1.1348411817483948e-06, - "loss": 0.7275, - "step": 55392 - }, - { - "epoch": 1.42, - "learning_rate": 1.1348137639509365e-06, - "loss": 0.6162, - "step": 55393 - }, - { - "epoch": 1.42, - "learning_rate": 1.1347863460502578e-06, - "loss": 0.6602, - "step": 55394 - }, - { - "epoch": 1.42, - "learning_rate": 1.1347589280463795e-06, - "loss": 0.7559, - "step": 55395 - }, - { - "epoch": 1.42, - "learning_rate": 1.134731509939322e-06, - "loss": 0.7432, - "step": 55396 - }, - { - "epoch": 1.42, - "learning_rate": 1.1347040917291071e-06, - "loss": 0.7686, - "step": 55397 - }, - { - "epoch": 1.42, - "learning_rate": 1.1346766734157554e-06, - "loss": 0.8584, - "step": 55398 - }, - { - "epoch": 1.42, - "learning_rate": 1.134649254999288e-06, - "loss": 0.5938, - "step": 55399 - }, - { - "epoch": 1.42, - "learning_rate": 1.134621836479726e-06, - "loss": 0.7471, - "step": 55400 - }, - { - "epoch": 1.42, - "learning_rate": 1.1345944178570903e-06, - "loss": 0.7412, - "step": 55401 - }, - { - "epoch": 1.42, - "learning_rate": 1.1345669991314014e-06, - "loss": 0.6406, - "step": 55402 - }, - { - "epoch": 1.42, - "learning_rate": 1.1345395803026812e-06, - "loss": 0.7139, - "step": 55403 - }, - { - "epoch": 1.42, - "learning_rate": 1.13451216137095e-06, - "loss": 0.7783, - "step": 55404 - }, - { - "epoch": 1.42, - "learning_rate": 1.1344847423362291e-06, - "loss": 0.6582, - "step": 55405 - }, - { - "epoch": 1.42, - "learning_rate": 1.1344573231985392e-06, - "loss": 0.6128, - "step": 55406 - }, - { - "epoch": 1.42, - "learning_rate": 1.134429903957902e-06, - "loss": 0.5232, - "step": 55407 - }, - { - "epoch": 1.42, - "learning_rate": 1.1344024846143373e-06, - "loss": 0.6626, - "step": 55408 - }, - { - "epoch": 1.42, - "learning_rate": 1.1343750651678677e-06, - "loss": 0.5762, - "step": 55409 - }, - { - "epoch": 1.42, - "learning_rate": 1.1343476456185126e-06, - "loss": 0.6738, - "step": 55410 - }, - { - "epoch": 1.42, - "learning_rate": 1.1343202259662938e-06, - "loss": 0.6768, - "step": 55411 - }, - { - "epoch": 1.42, - "learning_rate": 1.1342928062112323e-06, - "loss": 0.6201, - "step": 55412 - }, - { - "epoch": 1.42, - "learning_rate": 1.134265386353349e-06, - "loss": 0.5245, - "step": 55413 - }, - { - "epoch": 1.42, - "learning_rate": 1.134237966392665e-06, - "loss": 0.6108, - "step": 55414 - }, - { - "epoch": 1.42, - "learning_rate": 1.1342105463292006e-06, - "loss": 0.8262, - "step": 55415 - }, - { - "epoch": 1.42, - "learning_rate": 1.1341831261629777e-06, - "loss": 0.6082, - "step": 55416 - }, - { - "epoch": 1.42, - "learning_rate": 1.134155705894017e-06, - "loss": 0.6636, - "step": 55417 - }, - { - "epoch": 1.42, - "learning_rate": 1.1341282855223393e-06, - "loss": 0.6631, - "step": 55418 - }, - { - "epoch": 1.42, - "learning_rate": 1.134100865047966e-06, - "loss": 0.603, - "step": 55419 - }, - { - "epoch": 1.42, - "learning_rate": 1.1340734444709176e-06, - "loss": 0.6199, - "step": 55420 - }, - { - "epoch": 1.42, - "learning_rate": 1.1340460237912154e-06, - "loss": 0.6294, - "step": 55421 - }, - { - "epoch": 1.42, - "learning_rate": 1.1340186030088804e-06, - "loss": 0.6255, - "step": 55422 - }, - { - "epoch": 1.42, - "learning_rate": 1.1339911821239333e-06, - "loss": 0.626, - "step": 55423 - }, - { - "epoch": 1.42, - "learning_rate": 1.1339637611363956e-06, - "loss": 0.6782, - "step": 55424 - }, - { - "epoch": 1.42, - "learning_rate": 1.1339363400462878e-06, - "loss": 0.7979, - "step": 55425 - }, - { - "epoch": 1.42, - "learning_rate": 1.1339089188536313e-06, - "loss": 0.7334, - "step": 55426 - }, - { - "epoch": 1.42, - "learning_rate": 1.1338814975584465e-06, - "loss": 0.7236, - "step": 55427 - }, - { - "epoch": 1.42, - "learning_rate": 1.1338540761607553e-06, - "loss": 0.7686, - "step": 55428 - }, - { - "epoch": 1.42, - "learning_rate": 1.1338266546605779e-06, - "loss": 0.6807, - "step": 55429 - }, - { - "epoch": 1.42, - "learning_rate": 1.1337992330579357e-06, - "loss": 0.626, - "step": 55430 - }, - { - "epoch": 1.42, - "learning_rate": 1.1337718113528493e-06, - "loss": 0.835, - "step": 55431 - }, - { - "epoch": 1.42, - "learning_rate": 1.1337443895453404e-06, - "loss": 0.583, - "step": 55432 - }, - { - "epoch": 1.42, - "learning_rate": 1.1337169676354292e-06, - "loss": 0.7695, - "step": 55433 - }, - { - "epoch": 1.42, - "learning_rate": 1.1336895456231373e-06, - "loss": 0.4667, - "step": 55434 - }, - { - "epoch": 1.42, - "learning_rate": 1.1336621235084855e-06, - "loss": 0.5947, - "step": 55435 - }, - { - "epoch": 1.42, - "learning_rate": 1.1336347012914946e-06, - "loss": 0.7656, - "step": 55436 - }, - { - "epoch": 1.42, - "learning_rate": 1.1336072789721858e-06, - "loss": 0.5679, - "step": 55437 - }, - { - "epoch": 1.42, - "learning_rate": 1.1335798565505801e-06, - "loss": 0.7158, - "step": 55438 - }, - { - "epoch": 1.42, - "learning_rate": 1.1335524340266983e-06, - "loss": 0.6865, - "step": 55439 - }, - { - "epoch": 1.42, - "learning_rate": 1.1335250114005617e-06, - "loss": 0.6406, - "step": 55440 - }, - { - "epoch": 1.42, - "learning_rate": 1.1334975886721911e-06, - "loss": 0.8467, - "step": 55441 - }, - { - "epoch": 1.42, - "learning_rate": 1.1334701658416072e-06, - "loss": 0.6772, - "step": 55442 - }, - { - "epoch": 1.42, - "learning_rate": 1.133442742908832e-06, - "loss": 0.9326, - "step": 55443 - }, - { - "epoch": 1.42, - "learning_rate": 1.1334153198738854e-06, - "loss": 0.385, - "step": 55444 - }, - { - "epoch": 1.42, - "learning_rate": 1.133387896736789e-06, - "loss": 0.3667, - "step": 55445 - }, - { - "epoch": 1.42, - "learning_rate": 1.1333604734975634e-06, - "loss": 0.8838, - "step": 55446 - }, - { - "epoch": 1.42, - "learning_rate": 1.13333305015623e-06, - "loss": 0.6807, - "step": 55447 - }, - { - "epoch": 1.42, - "learning_rate": 1.1333056267128094e-06, - "loss": 0.8477, - "step": 55448 - }, - { - "epoch": 1.42, - "learning_rate": 1.1332782031673231e-06, - "loss": 0.6514, - "step": 55449 - }, - { - "epoch": 1.42, - "learning_rate": 1.1332507795197916e-06, - "loss": 0.6035, - "step": 55450 - }, - { - "epoch": 1.42, - "learning_rate": 1.1332233557702362e-06, - "loss": 0.7549, - "step": 55451 - }, - { - "epoch": 1.42, - "learning_rate": 1.1331959319186777e-06, - "loss": 0.5557, - "step": 55452 - }, - { - "epoch": 1.42, - "learning_rate": 1.1331685079651373e-06, - "loss": 0.6885, - "step": 55453 - }, - { - "epoch": 1.42, - "learning_rate": 1.1331410839096357e-06, - "loss": 0.6582, - "step": 55454 - }, - { - "epoch": 1.42, - "learning_rate": 1.1331136597521946e-06, - "loss": 0.5869, - "step": 55455 - }, - { - "epoch": 1.42, - "learning_rate": 1.133086235492834e-06, - "loss": 0.5449, - "step": 55456 - }, - { - "epoch": 1.42, - "learning_rate": 1.1330588111315755e-06, - "loss": 0.5659, - "step": 55457 - }, - { - "epoch": 1.42, - "learning_rate": 1.13303138666844e-06, - "loss": 0.4731, - "step": 55458 - }, - { - "epoch": 1.42, - "learning_rate": 1.1330039621034485e-06, - "loss": 0.7811, - "step": 55459 - }, - { - "epoch": 1.42, - "learning_rate": 1.132976537436622e-06, - "loss": 0.5986, - "step": 55460 - }, - { - "epoch": 1.42, - "learning_rate": 1.1329491126679815e-06, - "loss": 0.6079, - "step": 55461 - }, - { - "epoch": 1.42, - "learning_rate": 1.132921687797548e-06, - "loss": 0.6816, - "step": 55462 - }, - { - "epoch": 1.42, - "learning_rate": 1.1328942628253425e-06, - "loss": 0.5293, - "step": 55463 - }, - { - "epoch": 1.42, - "learning_rate": 1.1328668377513858e-06, - "loss": 0.6665, - "step": 55464 - }, - { - "epoch": 1.42, - "learning_rate": 1.1328394125756993e-06, - "loss": 0.5503, - "step": 55465 - }, - { - "epoch": 1.42, - "learning_rate": 1.1328119872983036e-06, - "loss": 0.6855, - "step": 55466 - }, - { - "epoch": 1.42, - "learning_rate": 1.1327845619192198e-06, - "loss": 0.7471, - "step": 55467 - }, - { - "epoch": 1.42, - "learning_rate": 1.132757136438469e-06, - "loss": 0.7119, - "step": 55468 - }, - { - "epoch": 1.42, - "learning_rate": 1.1327297108560724e-06, - "loss": 0.583, - "step": 55469 - }, - { - "epoch": 1.42, - "learning_rate": 1.1327022851720507e-06, - "loss": 0.5781, - "step": 55470 - }, - { - "epoch": 1.42, - "learning_rate": 1.1326748593864248e-06, - "loss": 0.5244, - "step": 55471 - }, - { - "epoch": 1.42, - "learning_rate": 1.132647433499216e-06, - "loss": 0.6758, - "step": 55472 - }, - { - "epoch": 1.42, - "learning_rate": 1.132620007510445e-06, - "loss": 0.6094, - "step": 55473 - }, - { - "epoch": 1.42, - "learning_rate": 1.132592581420133e-06, - "loss": 0.6748, - "step": 55474 - }, - { - "epoch": 1.42, - "learning_rate": 1.132565155228301e-06, - "loss": 0.6909, - "step": 55475 - }, - { - "epoch": 1.42, - "learning_rate": 1.13253772893497e-06, - "loss": 0.8008, - "step": 55476 - }, - { - "epoch": 1.42, - "learning_rate": 1.1325103025401608e-06, - "loss": 0.7095, - "step": 55477 - }, - { - "epoch": 1.42, - "learning_rate": 1.1324828760438946e-06, - "loss": 0.7373, - "step": 55478 - }, - { - "epoch": 1.42, - "learning_rate": 1.1324554494461926e-06, - "loss": 0.6265, - "step": 55479 - }, - { - "epoch": 1.42, - "learning_rate": 1.1324280227470754e-06, - "loss": 0.7236, - "step": 55480 - }, - { - "epoch": 1.42, - "learning_rate": 1.132400595946564e-06, - "loss": 0.6885, - "step": 55481 - }, - { - "epoch": 1.42, - "learning_rate": 1.1323731690446799e-06, - "loss": 0.6533, - "step": 55482 - }, - { - "epoch": 1.42, - "learning_rate": 1.1323457420414433e-06, - "loss": 0.6763, - "step": 55483 - }, - { - "epoch": 1.42, - "learning_rate": 1.132318314936876e-06, - "loss": 0.6992, - "step": 55484 - }, - { - "epoch": 1.42, - "learning_rate": 1.1322908877309988e-06, - "loss": 0.7744, - "step": 55485 - }, - { - "epoch": 1.42, - "learning_rate": 1.132263460423832e-06, - "loss": 0.708, - "step": 55486 - }, - { - "epoch": 1.42, - "learning_rate": 1.1322360330153975e-06, - "loss": 0.8301, - "step": 55487 - }, - { - "epoch": 1.42, - "learning_rate": 1.1322086055057156e-06, - "loss": 0.7275, - "step": 55488 - }, - { - "epoch": 1.42, - "learning_rate": 1.1321811778948083e-06, - "loss": 0.7109, - "step": 55489 - }, - { - "epoch": 1.42, - "learning_rate": 1.1321537501826954e-06, - "loss": 0.707, - "step": 55490 - }, - { - "epoch": 1.42, - "learning_rate": 1.1321263223693986e-06, - "loss": 0.6851, - "step": 55491 - }, - { - "epoch": 1.42, - "learning_rate": 1.1320988944549388e-06, - "loss": 0.7051, - "step": 55492 - }, - { - "epoch": 1.42, - "learning_rate": 1.132071466439337e-06, - "loss": 0.5786, - "step": 55493 - }, - { - "epoch": 1.42, - "learning_rate": 1.132044038322614e-06, - "loss": 0.5562, - "step": 55494 - }, - { - "epoch": 1.42, - "learning_rate": 1.1320166101047911e-06, - "loss": 0.6895, - "step": 55495 - }, - { - "epoch": 1.42, - "learning_rate": 1.1319891817858892e-06, - "loss": 0.5784, - "step": 55496 - }, - { - "epoch": 1.42, - "learning_rate": 1.1319617533659292e-06, - "loss": 0.7363, - "step": 55497 - }, - { - "epoch": 1.42, - "learning_rate": 1.1319343248449318e-06, - "loss": 0.6807, - "step": 55498 - }, - { - "epoch": 1.42, - "learning_rate": 1.131906896222919e-06, - "loss": 0.6013, - "step": 55499 - }, - { - "epoch": 1.42, - "learning_rate": 1.1318794674999107e-06, - "loss": 0.5708, - "step": 55500 - }, - { - "epoch": 1.42, - "learning_rate": 1.1318520386759285e-06, - "loss": 0.7246, - "step": 55501 - }, - { - "epoch": 1.42, - "learning_rate": 1.131824609750993e-06, - "loss": 0.604, - "step": 55502 - }, - { - "epoch": 1.42, - "learning_rate": 1.131797180725126e-06, - "loss": 0.54, - "step": 55503 - }, - { - "epoch": 1.42, - "learning_rate": 1.1317697515983474e-06, - "loss": 0.6206, - "step": 55504 - }, - { - "epoch": 1.42, - "learning_rate": 1.131742322370679e-06, - "loss": 0.5947, - "step": 55505 - }, - { - "epoch": 1.42, - "learning_rate": 1.1317148930421416e-06, - "loss": 0.6885, - "step": 55506 - }, - { - "epoch": 1.42, - "learning_rate": 1.131687463612756e-06, - "loss": 0.7178, - "step": 55507 - }, - { - "epoch": 1.42, - "learning_rate": 1.1316600340825435e-06, - "loss": 0.7979, - "step": 55508 - }, - { - "epoch": 1.42, - "learning_rate": 1.1316326044515249e-06, - "loss": 0.531, - "step": 55509 - }, - { - "epoch": 1.42, - "learning_rate": 1.1316051747197216e-06, - "loss": 0.605, - "step": 55510 - }, - { - "epoch": 1.42, - "learning_rate": 1.1315777448871538e-06, - "loss": 0.6924, - "step": 55511 - }, - { - "epoch": 1.42, - "learning_rate": 1.1315503149538432e-06, - "loss": 0.7139, - "step": 55512 - }, - { - "epoch": 1.42, - "learning_rate": 1.1315228849198103e-06, - "loss": 0.4918, - "step": 55513 - }, - { - "epoch": 1.42, - "learning_rate": 1.1314954547850768e-06, - "loss": 0.4121, - "step": 55514 - }, - { - "epoch": 1.42, - "learning_rate": 1.1314680245496631e-06, - "loss": 0.6289, - "step": 55515 - }, - { - "epoch": 1.42, - "learning_rate": 1.1314405942135903e-06, - "loss": 0.6621, - "step": 55516 - }, - { - "epoch": 1.42, - "learning_rate": 1.1314131637768794e-06, - "loss": 0.791, - "step": 55517 - }, - { - "epoch": 1.42, - "learning_rate": 1.1313857332395518e-06, - "loss": 0.6836, - "step": 55518 - }, - { - "epoch": 1.42, - "learning_rate": 1.131358302601628e-06, - "loss": 0.439, - "step": 55519 - }, - { - "epoch": 1.42, - "learning_rate": 1.1313308718631293e-06, - "loss": 0.7236, - "step": 55520 - }, - { - "epoch": 1.42, - "learning_rate": 1.1313034410240762e-06, - "loss": 0.7275, - "step": 55521 - }, - { - "epoch": 1.42, - "learning_rate": 1.1312760100844906e-06, - "loss": 0.5898, - "step": 55522 - }, - { - "epoch": 1.42, - "learning_rate": 1.1312485790443926e-06, - "loss": 0.7588, - "step": 55523 - }, - { - "epoch": 1.42, - "learning_rate": 1.1312211479038039e-06, - "loss": 0.7549, - "step": 55524 - }, - { - "epoch": 1.42, - "learning_rate": 1.131193716662745e-06, - "loss": 0.3342, - "step": 55525 - }, - { - "epoch": 1.42, - "learning_rate": 1.1311662853212373e-06, - "loss": 0.7344, - "step": 55526 - }, - { - "epoch": 1.42, - "learning_rate": 1.1311388538793014e-06, - "loss": 0.6787, - "step": 55527 - }, - { - "epoch": 1.42, - "learning_rate": 1.1311114223369586e-06, - "loss": 0.5896, - "step": 55528 - }, - { - "epoch": 1.42, - "learning_rate": 1.13108399069423e-06, - "loss": 0.6611, - "step": 55529 - }, - { - "epoch": 1.42, - "learning_rate": 1.131056558951136e-06, - "loss": 0.5566, - "step": 55530 - }, - { - "epoch": 1.42, - "learning_rate": 1.131029127107698e-06, - "loss": 0.6826, - "step": 55531 - }, - { - "epoch": 1.42, - "learning_rate": 1.1310016951639375e-06, - "loss": 0.5249, - "step": 55532 - }, - { - "epoch": 1.42, - "learning_rate": 1.1309742631198746e-06, - "loss": 0.5437, - "step": 55533 - }, - { - "epoch": 1.42, - "learning_rate": 1.130946830975531e-06, - "loss": 0.4716, - "step": 55534 - }, - { - "epoch": 1.42, - "learning_rate": 1.1309193987309275e-06, - "loss": 0.5601, - "step": 55535 - }, - { - "epoch": 1.42, - "learning_rate": 1.1308919663860847e-06, - "loss": 0.709, - "step": 55536 - }, - { - "epoch": 1.42, - "learning_rate": 1.1308645339410244e-06, - "loss": 0.6582, - "step": 55537 - }, - { - "epoch": 1.42, - "learning_rate": 1.1308371013957665e-06, - "loss": 0.5955, - "step": 55538 - }, - { - "epoch": 1.42, - "learning_rate": 1.1308096687503335e-06, - "loss": 0.6992, - "step": 55539 - }, - { - "epoch": 1.42, - "learning_rate": 1.1307822360047448e-06, - "loss": 0.5205, - "step": 55540 - }, - { - "epoch": 1.42, - "learning_rate": 1.1307548031590225e-06, - "loss": 0.7715, - "step": 55541 - }, - { - "epoch": 1.42, - "learning_rate": 1.130727370213187e-06, - "loss": 0.7568, - "step": 55542 - }, - { - "epoch": 1.42, - "learning_rate": 1.13069993716726e-06, - "loss": 0.5444, - "step": 55543 - }, - { - "epoch": 1.42, - "learning_rate": 1.1306725040212616e-06, - "loss": 0.8564, - "step": 55544 - }, - { - "epoch": 1.42, - "learning_rate": 1.1306450707752135e-06, - "loss": 0.7266, - "step": 55545 - }, - { - "epoch": 1.42, - "learning_rate": 1.1306176374291365e-06, - "loss": 0.4856, - "step": 55546 - }, - { - "epoch": 1.42, - "learning_rate": 1.1305902039830516e-06, - "loss": 0.709, - "step": 55547 - }, - { - "epoch": 1.42, - "learning_rate": 1.1305627704369795e-06, - "loss": 0.6885, - "step": 55548 - }, - { - "epoch": 1.42, - "learning_rate": 1.1305353367909419e-06, - "loss": 0.5811, - "step": 55549 - }, - { - "epoch": 1.42, - "learning_rate": 1.1305079030449594e-06, - "loss": 0.5513, - "step": 55550 - }, - { - "epoch": 1.42, - "learning_rate": 1.1304804691990523e-06, - "loss": 0.6777, - "step": 55551 - }, - { - "epoch": 1.42, - "learning_rate": 1.1304530352532432e-06, - "loss": 0.8369, - "step": 55552 - }, - { - "epoch": 1.42, - "learning_rate": 1.1304256012075517e-06, - "loss": 0.6982, - "step": 55553 - }, - { - "epoch": 1.42, - "learning_rate": 1.1303981670619995e-06, - "loss": 0.6714, - "step": 55554 - }, - { - "epoch": 1.42, - "learning_rate": 1.1303707328166072e-06, - "loss": 0.6201, - "step": 55555 - }, - { - "epoch": 1.42, - "learning_rate": 1.1303432984713962e-06, - "loss": 0.5425, - "step": 55556 - }, - { - "epoch": 1.42, - "learning_rate": 1.1303158640263871e-06, - "loss": 0.5679, - "step": 55557 - }, - { - "epoch": 1.42, - "learning_rate": 1.1302884294816016e-06, - "loss": 0.5952, - "step": 55558 - }, - { - "epoch": 1.42, - "learning_rate": 1.1302609948370602e-06, - "loss": 0.728, - "step": 55559 - }, - { - "epoch": 1.42, - "learning_rate": 1.1302335600927838e-06, - "loss": 0.5269, - "step": 55560 - }, - { - "epoch": 1.42, - "learning_rate": 1.1302061252487934e-06, - "loss": 0.7275, - "step": 55561 - }, - { - "epoch": 1.42, - "learning_rate": 1.1301786903051104e-06, - "loss": 0.5591, - "step": 55562 - }, - { - "epoch": 1.42, - "learning_rate": 1.1301512552617549e-06, - "loss": 0.4902, - "step": 55563 - }, - { - "epoch": 1.42, - "learning_rate": 1.1301238201187496e-06, - "loss": 0.6553, - "step": 55564 - }, - { - "epoch": 1.42, - "learning_rate": 1.1300963848761135e-06, - "loss": 0.5068, - "step": 55565 - }, - { - "epoch": 1.42, - "learning_rate": 1.1300689495338693e-06, - "loss": 0.4978, - "step": 55566 - }, - { - "epoch": 1.42, - "learning_rate": 1.1300415140920367e-06, - "loss": 0.5459, - "step": 55567 - }, - { - "epoch": 1.42, - "learning_rate": 1.1300140785506377e-06, - "loss": 0.5332, - "step": 55568 - }, - { - "epoch": 1.42, - "learning_rate": 1.1299866429096929e-06, - "loss": 0.6348, - "step": 55569 - }, - { - "epoch": 1.42, - "learning_rate": 1.1299592071692231e-06, - "loss": 0.6841, - "step": 55570 - }, - { - "epoch": 1.42, - "learning_rate": 1.1299317713292497e-06, - "loss": 0.5483, - "step": 55571 - }, - { - "epoch": 1.42, - "learning_rate": 1.1299043353897935e-06, - "loss": 0.6338, - "step": 55572 - }, - { - "epoch": 1.42, - "learning_rate": 1.1298768993508753e-06, - "loss": 0.6621, - "step": 55573 - }, - { - "epoch": 1.42, - "learning_rate": 1.1298494632125167e-06, - "loss": 0.5867, - "step": 55574 - }, - { - "epoch": 1.42, - "learning_rate": 1.129822026974738e-06, - "loss": 0.7178, - "step": 55575 - }, - { - "epoch": 1.42, - "learning_rate": 1.1297945906375605e-06, - "loss": 0.7178, - "step": 55576 - }, - { - "epoch": 1.42, - "learning_rate": 1.1297671542010056e-06, - "loss": 0.6167, - "step": 55577 - }, - { - "epoch": 1.42, - "learning_rate": 1.1297397176650936e-06, - "loss": 0.6924, - "step": 55578 - }, - { - "epoch": 1.42, - "learning_rate": 1.1297122810298464e-06, - "loss": 0.7275, - "step": 55579 - }, - { - "epoch": 1.42, - "learning_rate": 1.129684844295284e-06, - "loss": 0.4966, - "step": 55580 - }, - { - "epoch": 1.42, - "learning_rate": 1.1296574074614281e-06, - "loss": 0.752, - "step": 55581 - }, - { - "epoch": 1.42, - "learning_rate": 1.129629970528299e-06, - "loss": 0.7207, - "step": 55582 - }, - { - "epoch": 1.42, - "learning_rate": 1.1296025334959187e-06, - "loss": 0.6768, - "step": 55583 - }, - { - "epoch": 1.42, - "learning_rate": 1.1295750963643076e-06, - "loss": 0.6357, - "step": 55584 - }, - { - "epoch": 1.42, - "learning_rate": 1.129547659133487e-06, - "loss": 0.5234, - "step": 55585 - }, - { - "epoch": 1.42, - "learning_rate": 1.1295202218034772e-06, - "loss": 0.7412, - "step": 55586 - }, - { - "epoch": 1.42, - "learning_rate": 1.1294927843743e-06, - "loss": 0.4834, - "step": 55587 - }, - { - "epoch": 1.42, - "learning_rate": 1.129465346845976e-06, - "loss": 0.7637, - "step": 55588 - }, - { - "epoch": 1.42, - "learning_rate": 1.1294379092185268e-06, - "loss": 0.6592, - "step": 55589 - }, - { - "epoch": 1.42, - "learning_rate": 1.1294104714919725e-06, - "loss": 0.5864, - "step": 55590 - }, - { - "epoch": 1.42, - "learning_rate": 1.1293830336663349e-06, - "loss": 0.7715, - "step": 55591 - }, - { - "epoch": 1.42, - "learning_rate": 1.1293555957416342e-06, - "loss": 0.7207, - "step": 55592 - }, - { - "epoch": 1.42, - "learning_rate": 1.129328157717892e-06, - "loss": 0.7104, - "step": 55593 - }, - { - "epoch": 1.42, - "learning_rate": 1.1293007195951295e-06, - "loss": 0.5537, - "step": 55594 - }, - { - "epoch": 1.42, - "learning_rate": 1.129273281373367e-06, - "loss": 0.5415, - "step": 55595 - }, - { - "epoch": 1.42, - "learning_rate": 1.1292458430526262e-06, - "loss": 0.4839, - "step": 55596 - }, - { - "epoch": 1.42, - "learning_rate": 1.1292184046329273e-06, - "loss": 0.7002, - "step": 55597 - }, - { - "epoch": 1.43, - "learning_rate": 1.1291909661142925e-06, - "loss": 0.6289, - "step": 55598 - }, - { - "epoch": 1.43, - "learning_rate": 1.1291635274967417e-06, - "loss": 0.6504, - "step": 55599 - }, - { - "epoch": 1.43, - "learning_rate": 1.1291360887802964e-06, - "loss": 0.5933, - "step": 55600 - }, - { - "epoch": 1.43, - "learning_rate": 1.1291086499649775e-06, - "loss": 0.6865, - "step": 55601 - }, - { - "epoch": 1.43, - "learning_rate": 1.1290812110508061e-06, - "loss": 0.6714, - "step": 55602 - }, - { - "epoch": 1.43, - "learning_rate": 1.129053772037803e-06, - "loss": 0.6309, - "step": 55603 - }, - { - "epoch": 1.43, - "learning_rate": 1.1290263329259899e-06, - "loss": 0.5342, - "step": 55604 - }, - { - "epoch": 1.43, - "learning_rate": 1.1289988937153867e-06, - "loss": 0.5181, - "step": 55605 - }, - { - "epoch": 1.43, - "learning_rate": 1.1289714544060152e-06, - "loss": 0.6277, - "step": 55606 - }, - { - "epoch": 1.43, - "learning_rate": 1.128944014997896e-06, - "loss": 0.6924, - "step": 55607 - }, - { - "epoch": 1.43, - "learning_rate": 1.1289165754910506e-06, - "loss": 0.6445, - "step": 55608 - }, - { - "epoch": 1.43, - "learning_rate": 1.1288891358854994e-06, - "loss": 0.4623, - "step": 55609 - }, - { - "epoch": 1.43, - "learning_rate": 1.128861696181264e-06, - "loss": 0.6191, - "step": 55610 - }, - { - "epoch": 1.43, - "learning_rate": 1.1288342563783648e-06, - "loss": 0.6538, - "step": 55611 - }, - { - "epoch": 1.43, - "learning_rate": 1.1288068164768235e-06, - "loss": 0.5762, - "step": 55612 - }, - { - "epoch": 1.43, - "learning_rate": 1.1287793764766602e-06, - "loss": 0.6313, - "step": 55613 - }, - { - "epoch": 1.43, - "learning_rate": 1.128751936377897e-06, - "loss": 0.667, - "step": 55614 - }, - { - "epoch": 1.43, - "learning_rate": 1.1287244961805542e-06, - "loss": 0.6743, - "step": 55615 - }, - { - "epoch": 1.43, - "learning_rate": 1.1286970558846532e-06, - "loss": 0.4663, - "step": 55616 - }, - { - "epoch": 1.43, - "learning_rate": 1.1286696154902143e-06, - "loss": 0.5977, - "step": 55617 - }, - { - "epoch": 1.43, - "learning_rate": 1.1286421749972593e-06, - "loss": 0.606, - "step": 55618 - }, - { - "epoch": 1.43, - "learning_rate": 1.1286147344058088e-06, - "loss": 0.7065, - "step": 55619 - }, - { - "epoch": 1.43, - "learning_rate": 1.1285872937158837e-06, - "loss": 0.7949, - "step": 55620 - }, - { - "epoch": 1.43, - "learning_rate": 1.1285598529275055e-06, - "loss": 0.5986, - "step": 55621 - }, - { - "epoch": 1.43, - "learning_rate": 1.1285324120406948e-06, - "loss": 0.6953, - "step": 55622 - }, - { - "epoch": 1.43, - "learning_rate": 1.1285049710554728e-06, - "loss": 0.7607, - "step": 55623 - }, - { - "epoch": 1.43, - "learning_rate": 1.1284775299718608e-06, - "loss": 0.7168, - "step": 55624 - }, - { - "epoch": 1.43, - "learning_rate": 1.128450088789879e-06, - "loss": 0.7471, - "step": 55625 - }, - { - "epoch": 1.43, - "learning_rate": 1.128422647509549e-06, - "loss": 0.5615, - "step": 55626 - }, - { - "epoch": 1.43, - "learning_rate": 1.1283952061308916e-06, - "loss": 0.4561, - "step": 55627 - }, - { - "epoch": 1.43, - "learning_rate": 1.128367764653928e-06, - "loss": 0.488, - "step": 55628 - }, - { - "epoch": 1.43, - "learning_rate": 1.1283403230786795e-06, - "loss": 0.667, - "step": 55629 - }, - { - "epoch": 1.43, - "learning_rate": 1.1283128814051658e-06, - "loss": 0.5903, - "step": 55630 - }, - { - "epoch": 1.43, - "learning_rate": 1.1282854396334096e-06, - "loss": 0.5796, - "step": 55631 - }, - { - "epoch": 1.43, - "learning_rate": 1.1282579977634309e-06, - "loss": 0.7227, - "step": 55632 - }, - { - "epoch": 1.43, - "learning_rate": 1.128230555795251e-06, - "loss": 0.666, - "step": 55633 - }, - { - "epoch": 1.43, - "learning_rate": 1.1282031137288907e-06, - "loss": 0.5571, - "step": 55634 - }, - { - "epoch": 1.43, - "learning_rate": 1.1281756715643713e-06, - "loss": 0.6904, - "step": 55635 - }, - { - "epoch": 1.43, - "learning_rate": 1.1281482293017135e-06, - "loss": 0.5771, - "step": 55636 - }, - { - "epoch": 1.43, - "learning_rate": 1.1281207869409387e-06, - "loss": 0.4575, - "step": 55637 - }, - { - "epoch": 1.43, - "learning_rate": 1.1280933444820675e-06, - "loss": 0.6855, - "step": 55638 - }, - { - "epoch": 1.43, - "learning_rate": 1.1280659019251213e-06, - "loss": 0.5747, - "step": 55639 - }, - { - "epoch": 1.43, - "learning_rate": 1.1280384592701208e-06, - "loss": 0.5615, - "step": 55640 - }, - { - "epoch": 1.43, - "learning_rate": 1.1280110165170873e-06, - "loss": 0.748, - "step": 55641 - }, - { - "epoch": 1.43, - "learning_rate": 1.1279835736660416e-06, - "loss": 0.5134, - "step": 55642 - }, - { - "epoch": 1.43, - "learning_rate": 1.1279561307170046e-06, - "loss": 0.6494, - "step": 55643 - }, - { - "epoch": 1.43, - "learning_rate": 1.1279286876699978e-06, - "loss": 0.6816, - "step": 55644 - }, - { - "epoch": 1.43, - "learning_rate": 1.1279012445250415e-06, - "loss": 0.5527, - "step": 55645 - }, - { - "epoch": 1.43, - "learning_rate": 1.1278738012821574e-06, - "loss": 0.6597, - "step": 55646 - }, - { - "epoch": 1.43, - "learning_rate": 1.1278463579413659e-06, - "loss": 0.8828, - "step": 55647 - }, - { - "epoch": 1.43, - "learning_rate": 1.1278189145026887e-06, - "loss": 0.4614, - "step": 55648 - }, - { - "epoch": 1.43, - "learning_rate": 1.1277914709661463e-06, - "loss": 0.7227, - "step": 55649 - }, - { - "epoch": 1.43, - "learning_rate": 1.1277640273317598e-06, - "loss": 0.613, - "step": 55650 - }, - { - "epoch": 1.43, - "learning_rate": 1.1277365835995503e-06, - "loss": 0.6338, - "step": 55651 - }, - { - "epoch": 1.43, - "learning_rate": 1.1277091397695386e-06, - "loss": 0.8506, - "step": 55652 - }, - { - "epoch": 1.43, - "learning_rate": 1.127681695841746e-06, - "loss": 0.6729, - "step": 55653 - }, - { - "epoch": 1.43, - "learning_rate": 1.1276542518161937e-06, - "loss": 0.5112, - "step": 55654 - }, - { - "epoch": 1.43, - "learning_rate": 1.127626807692902e-06, - "loss": 0.4298, - "step": 55655 - }, - { - "epoch": 1.43, - "learning_rate": 1.1275993634718926e-06, - "loss": 0.5593, - "step": 55656 - }, - { - "epoch": 1.43, - "learning_rate": 1.1275719191531858e-06, - "loss": 0.6335, - "step": 55657 - }, - { - "epoch": 1.43, - "learning_rate": 1.1275444747368034e-06, - "loss": 0.791, - "step": 55658 - }, - { - "epoch": 1.43, - "learning_rate": 1.1275170302227662e-06, - "loss": 0.6401, - "step": 55659 - }, - { - "epoch": 1.43, - "learning_rate": 1.1274895856110947e-06, - "loss": 0.79, - "step": 55660 - }, - { - "epoch": 1.43, - "learning_rate": 1.1274621409018105e-06, - "loss": 0.6294, - "step": 55661 - }, - { - "epoch": 1.43, - "learning_rate": 1.1274346960949343e-06, - "loss": 0.5293, - "step": 55662 - }, - { - "epoch": 1.43, - "learning_rate": 1.127407251190487e-06, - "loss": 0.7114, - "step": 55663 - }, - { - "epoch": 1.43, - "learning_rate": 1.1273798061884903e-06, - "loss": 0.5195, - "step": 55664 - }, - { - "epoch": 1.43, - "learning_rate": 1.1273523610889646e-06, - "loss": 0.605, - "step": 55665 - }, - { - "epoch": 1.43, - "learning_rate": 1.1273249158919306e-06, - "loss": 0.7529, - "step": 55666 - }, - { - "epoch": 1.43, - "learning_rate": 1.1272974705974103e-06, - "loss": 0.6172, - "step": 55667 - }, - { - "epoch": 1.43, - "learning_rate": 1.127270025205424e-06, - "loss": 0.6436, - "step": 55668 - }, - { - "epoch": 1.43, - "learning_rate": 1.1272425797159933e-06, - "loss": 0.6064, - "step": 55669 - }, - { - "epoch": 1.43, - "learning_rate": 1.127215134129138e-06, - "loss": 0.4329, - "step": 55670 - }, - { - "epoch": 1.43, - "learning_rate": 1.1271876884448806e-06, - "loss": 0.7432, - "step": 55671 - }, - { - "epoch": 1.43, - "learning_rate": 1.127160242663241e-06, - "loss": 0.5687, - "step": 55672 - }, - { - "epoch": 1.43, - "learning_rate": 1.1271327967842408e-06, - "loss": 0.6021, - "step": 55673 - }, - { - "epoch": 1.43, - "learning_rate": 1.1271053508079012e-06, - "loss": 0.6069, - "step": 55674 - }, - { - "epoch": 1.43, - "learning_rate": 1.1270779047342425e-06, - "loss": 0.7842, - "step": 55675 - }, - { - "epoch": 1.43, - "learning_rate": 1.127050458563286e-06, - "loss": 0.627, - "step": 55676 - }, - { - "epoch": 1.43, - "learning_rate": 1.1270230122950531e-06, - "loss": 0.7417, - "step": 55677 - }, - { - "epoch": 1.43, - "learning_rate": 1.1269955659295643e-06, - "loss": 0.5859, - "step": 55678 - }, - { - "epoch": 1.43, - "learning_rate": 1.126968119466841e-06, - "loss": 0.5269, - "step": 55679 - }, - { - "epoch": 1.43, - "learning_rate": 1.1269406729069039e-06, - "loss": 0.7227, - "step": 55680 - }, - { - "epoch": 1.43, - "learning_rate": 1.1269132262497742e-06, - "loss": 0.4767, - "step": 55681 - }, - { - "epoch": 1.43, - "learning_rate": 1.126885779495473e-06, - "loss": 0.52, - "step": 55682 - }, - { - "epoch": 1.43, - "learning_rate": 1.1268583326440212e-06, - "loss": 0.5405, - "step": 55683 - }, - { - "epoch": 1.43, - "learning_rate": 1.1268308856954395e-06, - "loss": 0.7793, - "step": 55684 - }, - { - "epoch": 1.43, - "learning_rate": 1.1268034386497496e-06, - "loss": 0.6523, - "step": 55685 - }, - { - "epoch": 1.43, - "learning_rate": 1.1267759915069719e-06, - "loss": 0.5664, - "step": 55686 - }, - { - "epoch": 1.43, - "learning_rate": 1.1267485442671276e-06, - "loss": 0.8311, - "step": 55687 - }, - { - "epoch": 1.43, - "learning_rate": 1.1267210969302379e-06, - "loss": 0.6016, - "step": 55688 - }, - { - "epoch": 1.43, - "learning_rate": 1.1266936494963237e-06, - "loss": 0.6855, - "step": 55689 - }, - { - "epoch": 1.43, - "learning_rate": 1.126666201965406e-06, - "loss": 0.7007, - "step": 55690 - }, - { - "epoch": 1.43, - "learning_rate": 1.1266387543375057e-06, - "loss": 0.7549, - "step": 55691 - }, - { - "epoch": 1.43, - "learning_rate": 1.1266113066126442e-06, - "loss": 0.7109, - "step": 55692 - }, - { - "epoch": 1.43, - "learning_rate": 1.1265838587908419e-06, - "loss": 0.519, - "step": 55693 - }, - { - "epoch": 1.43, - "learning_rate": 1.1265564108721206e-06, - "loss": 0.6636, - "step": 55694 - }, - { - "epoch": 1.43, - "learning_rate": 1.1265289628565004e-06, - "loss": 0.6592, - "step": 55695 - }, - { - "epoch": 1.43, - "learning_rate": 1.1265015147440032e-06, - "loss": 0.6855, - "step": 55696 - }, - { - "epoch": 1.43, - "learning_rate": 1.1264740665346492e-06, - "loss": 0.614, - "step": 55697 - }, - { - "epoch": 1.43, - "learning_rate": 1.1264466182284603e-06, - "loss": 0.5137, - "step": 55698 - }, - { - "epoch": 1.43, - "learning_rate": 1.1264191698254566e-06, - "loss": 0.6108, - "step": 55699 - }, - { - "epoch": 1.43, - "learning_rate": 1.1263917213256597e-06, - "loss": 0.5527, - "step": 55700 - }, - { - "epoch": 1.43, - "learning_rate": 1.1263642727290905e-06, - "loss": 0.7373, - "step": 55701 - }, - { - "epoch": 1.43, - "learning_rate": 1.12633682403577e-06, - "loss": 0.626, - "step": 55702 - }, - { - "epoch": 1.43, - "learning_rate": 1.1263093752457191e-06, - "loss": 0.5898, - "step": 55703 - }, - { - "epoch": 1.43, - "learning_rate": 1.126281926358959e-06, - "loss": 0.6201, - "step": 55704 - }, - { - "epoch": 1.43, - "learning_rate": 1.1262544773755107e-06, - "loss": 0.6797, - "step": 55705 - }, - { - "epoch": 1.43, - "learning_rate": 1.126227028295395e-06, - "loss": 0.6113, - "step": 55706 - }, - { - "epoch": 1.43, - "learning_rate": 1.126199579118633e-06, - "loss": 0.5559, - "step": 55707 - }, - { - "epoch": 1.43, - "learning_rate": 1.126172129845246e-06, - "loss": 0.5425, - "step": 55708 - }, - { - "epoch": 1.43, - "learning_rate": 1.1261446804752547e-06, - "loss": 0.5476, - "step": 55709 - }, - { - "epoch": 1.43, - "learning_rate": 1.1261172310086804e-06, - "loss": 0.7998, - "step": 55710 - }, - { - "epoch": 1.43, - "learning_rate": 1.1260897814455438e-06, - "loss": 0.7881, - "step": 55711 - }, - { - "epoch": 1.43, - "learning_rate": 1.1260623317858659e-06, - "loss": 0.4966, - "step": 55712 - }, - { - "epoch": 1.43, - "learning_rate": 1.1260348820296682e-06, - "loss": 0.7734, - "step": 55713 - }, - { - "epoch": 1.43, - "learning_rate": 1.126007432176971e-06, - "loss": 0.7334, - "step": 55714 - }, - { - "epoch": 1.43, - "learning_rate": 1.125979982227796e-06, - "loss": 0.71, - "step": 55715 - }, - { - "epoch": 1.43, - "learning_rate": 1.1259525321821636e-06, - "loss": 0.6572, - "step": 55716 - }, - { - "epoch": 1.43, - "learning_rate": 1.1259250820400956e-06, - "loss": 0.5112, - "step": 55717 - }, - { - "epoch": 1.43, - "learning_rate": 1.1258976318016124e-06, - "loss": 0.7773, - "step": 55718 - }, - { - "epoch": 1.43, - "learning_rate": 1.125870181466735e-06, - "loss": 0.8203, - "step": 55719 - }, - { - "epoch": 1.43, - "learning_rate": 1.1258427310354845e-06, - "loss": 0.7812, - "step": 55720 - }, - { - "epoch": 1.43, - "learning_rate": 1.1258152805078825e-06, - "loss": 0.7363, - "step": 55721 - }, - { - "epoch": 1.43, - "learning_rate": 1.1257878298839489e-06, - "loss": 0.646, - "step": 55722 - }, - { - "epoch": 1.43, - "learning_rate": 1.125760379163706e-06, - "loss": 0.5737, - "step": 55723 - }, - { - "epoch": 1.43, - "learning_rate": 1.1257329283471737e-06, - "loss": 0.6758, - "step": 55724 - }, - { - "epoch": 1.43, - "learning_rate": 1.1257054774343735e-06, - "loss": 0.5664, - "step": 55725 - }, - { - "epoch": 1.43, - "learning_rate": 1.1256780264253266e-06, - "loss": 0.5938, - "step": 55726 - }, - { - "epoch": 1.43, - "learning_rate": 1.1256505753200536e-06, - "loss": 0.5664, - "step": 55727 - }, - { - "epoch": 1.43, - "learning_rate": 1.1256231241185758e-06, - "loss": 0.6055, - "step": 55728 - }, - { - "epoch": 1.43, - "learning_rate": 1.125595672820914e-06, - "loss": 0.8506, - "step": 55729 - }, - { - "epoch": 1.43, - "learning_rate": 1.1255682214270896e-06, - "loss": 0.6538, - "step": 55730 - }, - { - "epoch": 1.43, - "learning_rate": 1.1255407699371234e-06, - "loss": 0.5957, - "step": 55731 - }, - { - "epoch": 1.43, - "learning_rate": 1.1255133183510364e-06, - "loss": 0.6147, - "step": 55732 - }, - { - "epoch": 1.43, - "learning_rate": 1.1254858666688497e-06, - "loss": 0.71, - "step": 55733 - }, - { - "epoch": 1.43, - "learning_rate": 1.1254584148905842e-06, - "loss": 0.4722, - "step": 55734 - }, - { - "epoch": 1.43, - "learning_rate": 1.1254309630162605e-06, - "loss": 0.8311, - "step": 55735 - }, - { - "epoch": 1.43, - "learning_rate": 1.1254035110459005e-06, - "loss": 0.6719, - "step": 55736 - }, - { - "epoch": 1.43, - "learning_rate": 1.1253760589795246e-06, - "loss": 0.4453, - "step": 55737 - }, - { - "epoch": 1.43, - "learning_rate": 1.1253486068171545e-06, - "loss": 0.8535, - "step": 55738 - }, - { - "epoch": 1.43, - "learning_rate": 1.1253211545588102e-06, - "loss": 0.5166, - "step": 55739 - }, - { - "epoch": 1.43, - "learning_rate": 1.1252937022045134e-06, - "loss": 0.6553, - "step": 55740 - }, - { - "epoch": 1.43, - "learning_rate": 1.125266249754285e-06, - "loss": 0.5466, - "step": 55741 - }, - { - "epoch": 1.43, - "learning_rate": 1.1252387972081461e-06, - "loss": 0.6631, - "step": 55742 - }, - { - "epoch": 1.43, - "learning_rate": 1.1252113445661175e-06, - "loss": 0.7754, - "step": 55743 - }, - { - "epoch": 1.43, - "learning_rate": 1.1251838918282205e-06, - "loss": 0.6016, - "step": 55744 - }, - { - "epoch": 1.43, - "learning_rate": 1.1251564389944758e-06, - "loss": 0.7344, - "step": 55745 - }, - { - "epoch": 1.43, - "learning_rate": 1.1251289860649045e-06, - "loss": 0.5347, - "step": 55746 - }, - { - "epoch": 1.43, - "learning_rate": 1.1251015330395276e-06, - "loss": 0.6062, - "step": 55747 - }, - { - "epoch": 1.43, - "learning_rate": 1.1250740799183664e-06, - "loss": 0.481, - "step": 55748 - }, - { - "epoch": 1.43, - "learning_rate": 1.1250466267014417e-06, - "loss": 0.6719, - "step": 55749 - }, - { - "epoch": 1.43, - "learning_rate": 1.1250191733887746e-06, - "loss": 0.6709, - "step": 55750 - }, - { - "epoch": 1.43, - "learning_rate": 1.124991719980386e-06, - "loss": 0.6187, - "step": 55751 - }, - { - "epoch": 1.43, - "learning_rate": 1.124964266476297e-06, - "loss": 0.564, - "step": 55752 - }, - { - "epoch": 1.43, - "learning_rate": 1.124936812876529e-06, - "loss": 0.8242, - "step": 55753 - }, - { - "epoch": 1.43, - "learning_rate": 1.1249093591811018e-06, - "loss": 0.5298, - "step": 55754 - }, - { - "epoch": 1.43, - "learning_rate": 1.1248819053900378e-06, - "loss": 0.6157, - "step": 55755 - }, - { - "epoch": 1.43, - "learning_rate": 1.1248544515033572e-06, - "loss": 0.6392, - "step": 55756 - }, - { - "epoch": 1.43, - "learning_rate": 1.1248269975210815e-06, - "loss": 0.6597, - "step": 55757 - }, - { - "epoch": 1.43, - "learning_rate": 1.1247995434432315e-06, - "loss": 0.7383, - "step": 55758 - }, - { - "epoch": 1.43, - "learning_rate": 1.1247720892698282e-06, - "loss": 0.7021, - "step": 55759 - }, - { - "epoch": 1.43, - "learning_rate": 1.1247446350008926e-06, - "loss": 0.6768, - "step": 55760 - }, - { - "epoch": 1.43, - "learning_rate": 1.124717180636446e-06, - "loss": 0.6196, - "step": 55761 - }, - { - "epoch": 1.43, - "learning_rate": 1.1246897261765088e-06, - "loss": 0.748, - "step": 55762 - }, - { - "epoch": 1.43, - "learning_rate": 1.1246622716211026e-06, - "loss": 0.7559, - "step": 55763 - }, - { - "epoch": 1.43, - "learning_rate": 1.1246348169702482e-06, - "loss": 0.5234, - "step": 55764 - }, - { - "epoch": 1.43, - "learning_rate": 1.124607362223967e-06, - "loss": 0.5455, - "step": 55765 - }, - { - "epoch": 1.43, - "learning_rate": 1.124579907382279e-06, - "loss": 0.752, - "step": 55766 - }, - { - "epoch": 1.43, - "learning_rate": 1.1245524524452063e-06, - "loss": 0.6309, - "step": 55767 - }, - { - "epoch": 1.43, - "learning_rate": 1.1245249974127695e-06, - "loss": 0.5298, - "step": 55768 - }, - { - "epoch": 1.43, - "learning_rate": 1.1244975422849897e-06, - "loss": 0.6138, - "step": 55769 - }, - { - "epoch": 1.43, - "learning_rate": 1.1244700870618874e-06, - "loss": 0.6289, - "step": 55770 - }, - { - "epoch": 1.43, - "learning_rate": 1.1244426317434848e-06, - "loss": 0.6689, - "step": 55771 - }, - { - "epoch": 1.43, - "learning_rate": 1.1244151763298016e-06, - "loss": 0.5908, - "step": 55772 - }, - { - "epoch": 1.43, - "learning_rate": 1.1243877208208595e-06, - "loss": 0.8096, - "step": 55773 - }, - { - "epoch": 1.43, - "learning_rate": 1.1243602652166799e-06, - "loss": 0.6143, - "step": 55774 - }, - { - "epoch": 1.43, - "learning_rate": 1.124332809517283e-06, - "loss": 0.6689, - "step": 55775 - }, - { - "epoch": 1.43, - "learning_rate": 1.12430535372269e-06, - "loss": 0.5566, - "step": 55776 - }, - { - "epoch": 1.43, - "learning_rate": 1.1242778978329224e-06, - "loss": 0.6777, - "step": 55777 - }, - { - "epoch": 1.43, - "learning_rate": 1.124250441848001e-06, - "loss": 0.8096, - "step": 55778 - }, - { - "epoch": 1.43, - "learning_rate": 1.1242229857679466e-06, - "loss": 0.7007, - "step": 55779 - }, - { - "epoch": 1.43, - "learning_rate": 1.1241955295927805e-06, - "loss": 0.5464, - "step": 55780 - }, - { - "epoch": 1.43, - "learning_rate": 1.1241680733225231e-06, - "loss": 0.5771, - "step": 55781 - }, - { - "epoch": 1.43, - "learning_rate": 1.1241406169571965e-06, - "loss": 0.3837, - "step": 55782 - }, - { - "epoch": 1.43, - "learning_rate": 1.124113160496821e-06, - "loss": 0.5505, - "step": 55783 - }, - { - "epoch": 1.43, - "learning_rate": 1.1240857039414177e-06, - "loss": 0.8262, - "step": 55784 - }, - { - "epoch": 1.43, - "learning_rate": 1.1240582472910077e-06, - "loss": 0.5759, - "step": 55785 - }, - { - "epoch": 1.43, - "learning_rate": 1.1240307905456119e-06, - "loss": 0.6191, - "step": 55786 - }, - { - "epoch": 1.43, - "learning_rate": 1.1240033337052516e-06, - "loss": 0.5869, - "step": 55787 - }, - { - "epoch": 1.43, - "learning_rate": 1.1239758767699476e-06, - "loss": 0.8682, - "step": 55788 - }, - { - "epoch": 1.43, - "learning_rate": 1.1239484197397208e-06, - "loss": 0.6641, - "step": 55789 - }, - { - "epoch": 1.43, - "learning_rate": 1.1239209626145927e-06, - "loss": 0.7266, - "step": 55790 - }, - { - "epoch": 1.43, - "learning_rate": 1.1238935053945837e-06, - "loss": 0.6787, - "step": 55791 - }, - { - "epoch": 1.43, - "learning_rate": 1.1238660480797154e-06, - "loss": 0.7549, - "step": 55792 - }, - { - "epoch": 1.43, - "learning_rate": 1.1238385906700085e-06, - "loss": 0.7031, - "step": 55793 - }, - { - "epoch": 1.43, - "learning_rate": 1.1238111331654838e-06, - "loss": 0.646, - "step": 55794 - }, - { - "epoch": 1.43, - "learning_rate": 1.1237836755661629e-06, - "loss": 0.8057, - "step": 55795 - }, - { - "epoch": 1.43, - "learning_rate": 1.1237562178720666e-06, - "loss": 0.6172, - "step": 55796 - }, - { - "epoch": 1.43, - "learning_rate": 1.1237287600832156e-06, - "loss": 0.603, - "step": 55797 - }, - { - "epoch": 1.43, - "learning_rate": 1.1237013021996313e-06, - "loss": 0.6611, - "step": 55798 - }, - { - "epoch": 1.43, - "learning_rate": 1.1236738442213347e-06, - "loss": 0.6592, - "step": 55799 - }, - { - "epoch": 1.43, - "learning_rate": 1.1236463861483464e-06, - "loss": 0.7129, - "step": 55800 - }, - { - "epoch": 1.43, - "learning_rate": 1.123618927980688e-06, - "loss": 0.6025, - "step": 55801 - }, - { - "epoch": 1.43, - "learning_rate": 1.12359146971838e-06, - "loss": 0.7119, - "step": 55802 - }, - { - "epoch": 1.43, - "learning_rate": 1.1235640113614443e-06, - "loss": 0.6875, - "step": 55803 - }, - { - "epoch": 1.43, - "learning_rate": 1.123536552909901e-06, - "loss": 0.7344, - "step": 55804 - }, - { - "epoch": 1.43, - "learning_rate": 1.1235090943637713e-06, - "loss": 0.7119, - "step": 55805 - }, - { - "epoch": 1.43, - "learning_rate": 1.1234816357230763e-06, - "loss": 0.748, - "step": 55806 - }, - { - "epoch": 1.43, - "learning_rate": 1.1234541769878375e-06, - "loss": 0.6553, - "step": 55807 - }, - { - "epoch": 1.43, - "learning_rate": 1.1234267181580752e-06, - "loss": 0.6543, - "step": 55808 - }, - { - "epoch": 1.43, - "learning_rate": 1.1233992592338108e-06, - "loss": 0.6953, - "step": 55809 - }, - { - "epoch": 1.43, - "learning_rate": 1.1233718002150652e-06, - "loss": 0.5737, - "step": 55810 - }, - { - "epoch": 1.43, - "learning_rate": 1.1233443411018597e-06, - "loss": 0.5786, - "step": 55811 - }, - { - "epoch": 1.43, - "learning_rate": 1.1233168818942146e-06, - "loss": 0.5649, - "step": 55812 - }, - { - "epoch": 1.43, - "learning_rate": 1.1232894225921523e-06, - "loss": 0.6553, - "step": 55813 - }, - { - "epoch": 1.43, - "learning_rate": 1.1232619631956922e-06, - "loss": 0.6777, - "step": 55814 - }, - { - "epoch": 1.43, - "learning_rate": 1.1232345037048566e-06, - "loss": 0.5396, - "step": 55815 - }, - { - "epoch": 1.43, - "learning_rate": 1.1232070441196655e-06, - "loss": 0.6348, - "step": 55816 - }, - { - "epoch": 1.43, - "learning_rate": 1.1231795844401405e-06, - "loss": 0.8955, - "step": 55817 - }, - { - "epoch": 1.43, - "learning_rate": 1.1231521246663029e-06, - "loss": 0.709, - "step": 55818 - }, - { - "epoch": 1.43, - "learning_rate": 1.1231246647981731e-06, - "loss": 0.5864, - "step": 55819 - }, - { - "epoch": 1.43, - "learning_rate": 1.1230972048357728e-06, - "loss": 0.6875, - "step": 55820 - }, - { - "epoch": 1.43, - "learning_rate": 1.123069744779122e-06, - "loss": 0.627, - "step": 55821 - }, - { - "epoch": 1.43, - "learning_rate": 1.1230422846282428e-06, - "loss": 0.6328, - "step": 55822 - }, - { - "epoch": 1.43, - "learning_rate": 1.1230148243831559e-06, - "loss": 0.6528, - "step": 55823 - }, - { - "epoch": 1.43, - "learning_rate": 1.1229873640438818e-06, - "loss": 0.6777, - "step": 55824 - }, - { - "epoch": 1.43, - "learning_rate": 1.122959903610442e-06, - "loss": 0.5488, - "step": 55825 - }, - { - "epoch": 1.43, - "learning_rate": 1.1229324430828577e-06, - "loss": 0.8604, - "step": 55826 - }, - { - "epoch": 1.43, - "learning_rate": 1.1229049824611495e-06, - "loss": 0.6421, - "step": 55827 - }, - { - "epoch": 1.43, - "learning_rate": 1.1228775217453388e-06, - "loss": 0.5972, - "step": 55828 - }, - { - "epoch": 1.43, - "learning_rate": 1.1228500609354462e-06, - "loss": 0.5122, - "step": 55829 - }, - { - "epoch": 1.43, - "learning_rate": 1.122822600031493e-06, - "loss": 0.6602, - "step": 55830 - }, - { - "epoch": 1.43, - "learning_rate": 1.1227951390335003e-06, - "loss": 0.7559, - "step": 55831 - }, - { - "epoch": 1.43, - "learning_rate": 1.122767677941489e-06, - "loss": 0.7344, - "step": 55832 - }, - { - "epoch": 1.43, - "learning_rate": 1.12274021675548e-06, - "loss": 0.6812, - "step": 55833 - }, - { - "epoch": 1.43, - "learning_rate": 1.1227127554754947e-06, - "loss": 0.79, - "step": 55834 - }, - { - "epoch": 1.43, - "learning_rate": 1.1226852941015534e-06, - "loss": 0.5752, - "step": 55835 - }, - { - "epoch": 1.43, - "learning_rate": 1.1226578326336783e-06, - "loss": 0.6062, - "step": 55836 - }, - { - "epoch": 1.43, - "learning_rate": 1.1226303710718892e-06, - "loss": 0.5791, - "step": 55837 - }, - { - "epoch": 1.43, - "learning_rate": 1.1226029094162078e-06, - "loss": 0.4514, - "step": 55838 - }, - { - "epoch": 1.43, - "learning_rate": 1.1225754476666552e-06, - "loss": 0.5801, - "step": 55839 - }, - { - "epoch": 1.43, - "learning_rate": 1.1225479858232518e-06, - "loss": 0.71, - "step": 55840 - }, - { - "epoch": 1.43, - "learning_rate": 1.1225205238860194e-06, - "loss": 0.7031, - "step": 55841 - }, - { - "epoch": 1.43, - "learning_rate": 1.1224930618549785e-06, - "loss": 0.6143, - "step": 55842 - }, - { - "epoch": 1.43, - "learning_rate": 1.1224655997301503e-06, - "loss": 0.7803, - "step": 55843 - }, - { - "epoch": 1.43, - "learning_rate": 1.1224381375115558e-06, - "loss": 0.75, - "step": 55844 - }, - { - "epoch": 1.43, - "learning_rate": 1.1224106751992161e-06, - "loss": 1.0029, - "step": 55845 - }, - { - "epoch": 1.43, - "learning_rate": 1.122383212793152e-06, - "loss": 0.4937, - "step": 55846 - }, - { - "epoch": 1.43, - "learning_rate": 1.1223557502933851e-06, - "loss": 0.6362, - "step": 55847 - }, - { - "epoch": 1.43, - "learning_rate": 1.1223282876999358e-06, - "loss": 0.6323, - "step": 55848 - }, - { - "epoch": 1.43, - "learning_rate": 1.1223008250128257e-06, - "loss": 0.79, - "step": 55849 - }, - { - "epoch": 1.43, - "learning_rate": 1.1222733622320747e-06, - "loss": 0.7783, - "step": 55850 - }, - { - "epoch": 1.43, - "learning_rate": 1.1222458993577054e-06, - "loss": 0.6426, - "step": 55851 - }, - { - "epoch": 1.43, - "learning_rate": 1.1222184363897374e-06, - "loss": 0.751, - "step": 55852 - }, - { - "epoch": 1.43, - "learning_rate": 1.1221909733281929e-06, - "loss": 0.6167, - "step": 55853 - }, - { - "epoch": 1.43, - "learning_rate": 1.1221635101730923e-06, - "loss": 0.6133, - "step": 55854 - }, - { - "epoch": 1.43, - "learning_rate": 1.1221360469244565e-06, - "loss": 0.3987, - "step": 55855 - }, - { - "epoch": 1.43, - "learning_rate": 1.1221085835823065e-06, - "loss": 0.7695, - "step": 55856 - }, - { - "epoch": 1.43, - "learning_rate": 1.1220811201466641e-06, - "loss": 0.709, - "step": 55857 - }, - { - "epoch": 1.43, - "learning_rate": 1.1220536566175495e-06, - "loss": 0.583, - "step": 55858 - }, - { - "epoch": 1.43, - "learning_rate": 1.1220261929949844e-06, - "loss": 0.7227, - "step": 55859 - }, - { - "epoch": 1.43, - "learning_rate": 1.1219987292789889e-06, - "loss": 0.5146, - "step": 55860 - }, - { - "epoch": 1.43, - "learning_rate": 1.121971265469585e-06, - "loss": 0.4863, - "step": 55861 - }, - { - "epoch": 1.43, - "learning_rate": 1.1219438015667931e-06, - "loss": 0.4697, - "step": 55862 - }, - { - "epoch": 1.43, - "learning_rate": 1.1219163375706343e-06, - "loss": 0.5918, - "step": 55863 - }, - { - "epoch": 1.43, - "learning_rate": 1.1218888734811302e-06, - "loss": 0.8486, - "step": 55864 - }, - { - "epoch": 1.43, - "learning_rate": 1.121861409298301e-06, - "loss": 0.6533, - "step": 55865 - }, - { - "epoch": 1.43, - "learning_rate": 1.1218339450221683e-06, - "loss": 0.6582, - "step": 55866 - }, - { - "epoch": 1.43, - "learning_rate": 1.1218064806527528e-06, - "loss": 0.7451, - "step": 55867 - }, - { - "epoch": 1.43, - "learning_rate": 1.121779016190076e-06, - "loss": 0.5742, - "step": 55868 - }, - { - "epoch": 1.43, - "learning_rate": 1.1217515516341584e-06, - "loss": 0.665, - "step": 55869 - }, - { - "epoch": 1.43, - "learning_rate": 1.1217240869850213e-06, - "loss": 0.6226, - "step": 55870 - }, - { - "epoch": 1.43, - "learning_rate": 1.1216966222426853e-06, - "loss": 0.7725, - "step": 55871 - }, - { - "epoch": 1.43, - "learning_rate": 1.1216691574071724e-06, - "loss": 0.7432, - "step": 55872 - }, - { - "epoch": 1.43, - "learning_rate": 1.121641692478503e-06, - "loss": 0.5178, - "step": 55873 - }, - { - "epoch": 1.43, - "learning_rate": 1.1216142274566977e-06, - "loss": 0.5618, - "step": 55874 - }, - { - "epoch": 1.43, - "learning_rate": 1.121586762341778e-06, - "loss": 0.7803, - "step": 55875 - }, - { - "epoch": 1.43, - "learning_rate": 1.1215592971337652e-06, - "loss": 0.5386, - "step": 55876 - }, - { - "epoch": 1.43, - "learning_rate": 1.1215318318326797e-06, - "loss": 0.4722, - "step": 55877 - }, - { - "epoch": 1.43, - "learning_rate": 1.1215043664385432e-06, - "loss": 0.6021, - "step": 55878 - }, - { - "epoch": 1.43, - "learning_rate": 1.1214769009513762e-06, - "loss": 0.624, - "step": 55879 - }, - { - "epoch": 1.43, - "learning_rate": 1.1214494353712002e-06, - "loss": 0.7051, - "step": 55880 - }, - { - "epoch": 1.43, - "learning_rate": 1.1214219696980353e-06, - "loss": 0.7705, - "step": 55881 - }, - { - "epoch": 1.43, - "learning_rate": 1.121394503931904e-06, - "loss": 0.5771, - "step": 55882 - }, - { - "epoch": 1.43, - "learning_rate": 1.121367038072826e-06, - "loss": 0.6504, - "step": 55883 - }, - { - "epoch": 1.43, - "learning_rate": 1.1213395721208228e-06, - "loss": 0.8398, - "step": 55884 - }, - { - "epoch": 1.43, - "learning_rate": 1.1213121060759156e-06, - "loss": 0.592, - "step": 55885 - }, - { - "epoch": 1.43, - "learning_rate": 1.1212846399381255e-06, - "loss": 0.6914, - "step": 55886 - }, - { - "epoch": 1.43, - "learning_rate": 1.121257173707473e-06, - "loss": 0.7422, - "step": 55887 - }, - { - "epoch": 1.43, - "learning_rate": 1.1212297073839798e-06, - "loss": 0.791, - "step": 55888 - }, - { - "epoch": 1.43, - "learning_rate": 1.1212022409676666e-06, - "loss": 0.353, - "step": 55889 - }, - { - "epoch": 1.43, - "learning_rate": 1.1211747744585537e-06, - "loss": 0.7949, - "step": 55890 - }, - { - "epoch": 1.43, - "learning_rate": 1.1211473078566636e-06, - "loss": 0.6279, - "step": 55891 - }, - { - "epoch": 1.43, - "learning_rate": 1.1211198411620163e-06, - "loss": 0.5073, - "step": 55892 - }, - { - "epoch": 1.43, - "learning_rate": 1.1210923743746334e-06, - "loss": 0.5906, - "step": 55893 - }, - { - "epoch": 1.43, - "learning_rate": 1.1210649074945351e-06, - "loss": 0.7432, - "step": 55894 - }, - { - "epoch": 1.43, - "learning_rate": 1.1210374405217433e-06, - "loss": 0.6758, - "step": 55895 - }, - { - "epoch": 1.43, - "learning_rate": 1.1210099734562787e-06, - "loss": 0.4965, - "step": 55896 - }, - { - "epoch": 1.43, - "learning_rate": 1.1209825062981622e-06, - "loss": 0.793, - "step": 55897 - }, - { - "epoch": 1.43, - "learning_rate": 1.1209550390474152e-06, - "loss": 0.7637, - "step": 55898 - }, - { - "epoch": 1.43, - "learning_rate": 1.1209275717040583e-06, - "loss": 0.627, - "step": 55899 - }, - { - "epoch": 1.43, - "learning_rate": 1.1209001042681125e-06, - "loss": 0.6084, - "step": 55900 - }, - { - "epoch": 1.43, - "learning_rate": 1.1208726367395995e-06, - "loss": 0.6816, - "step": 55901 - }, - { - "epoch": 1.43, - "learning_rate": 1.1208451691185395e-06, - "loss": 0.8516, - "step": 55902 - }, - { - "epoch": 1.43, - "learning_rate": 1.1208177014049542e-06, - "loss": 0.7285, - "step": 55903 - }, - { - "epoch": 1.43, - "learning_rate": 1.1207902335988643e-06, - "loss": 0.6045, - "step": 55904 - }, - { - "epoch": 1.43, - "learning_rate": 1.120762765700291e-06, - "loss": 0.4946, - "step": 55905 - }, - { - "epoch": 1.43, - "learning_rate": 1.1207352977092547e-06, - "loss": 0.5864, - "step": 55906 - }, - { - "epoch": 1.43, - "learning_rate": 1.1207078296257772e-06, - "loss": 0.4766, - "step": 55907 - }, - { - "epoch": 1.43, - "learning_rate": 1.1206803614498795e-06, - "loss": 0.6572, - "step": 55908 - }, - { - "epoch": 1.43, - "learning_rate": 1.1206528931815819e-06, - "loss": 0.5911, - "step": 55909 - }, - { - "epoch": 1.43, - "learning_rate": 1.1206254248209064e-06, - "loss": 0.6631, - "step": 55910 - }, - { - "epoch": 1.43, - "learning_rate": 1.1205979563678733e-06, - "loss": 0.6348, - "step": 55911 - }, - { - "epoch": 1.43, - "learning_rate": 1.120570487822504e-06, - "loss": 0.7256, - "step": 55912 - }, - { - "epoch": 1.43, - "learning_rate": 1.1205430191848196e-06, - "loss": 0.6826, - "step": 55913 - }, - { - "epoch": 1.43, - "learning_rate": 1.1205155504548408e-06, - "loss": 0.6865, - "step": 55914 - }, - { - "epoch": 1.43, - "learning_rate": 1.1204880816325885e-06, - "loss": 0.6992, - "step": 55915 - }, - { - "epoch": 1.43, - "learning_rate": 1.1204606127180842e-06, - "loss": 0.6836, - "step": 55916 - }, - { - "epoch": 1.43, - "learning_rate": 1.1204331437113488e-06, - "loss": 0.6758, - "step": 55917 - }, - { - "epoch": 1.43, - "learning_rate": 1.1204056746124035e-06, - "loss": 0.7471, - "step": 55918 - }, - { - "epoch": 1.43, - "learning_rate": 1.1203782054212688e-06, - "loss": 0.7915, - "step": 55919 - }, - { - "epoch": 1.43, - "learning_rate": 1.1203507361379661e-06, - "loss": 0.6472, - "step": 55920 - }, - { - "epoch": 1.43, - "learning_rate": 1.1203232667625162e-06, - "loss": 0.6279, - "step": 55921 - }, - { - "epoch": 1.43, - "learning_rate": 1.1202957972949407e-06, - "loss": 0.8564, - "step": 55922 - }, - { - "epoch": 1.43, - "learning_rate": 1.12026832773526e-06, - "loss": 0.8359, - "step": 55923 - }, - { - "epoch": 1.43, - "learning_rate": 1.1202408580834957e-06, - "loss": 0.834, - "step": 55924 - }, - { - "epoch": 1.43, - "learning_rate": 1.120213388339668e-06, - "loss": 0.7402, - "step": 55925 - }, - { - "epoch": 1.43, - "learning_rate": 1.1201859185037987e-06, - "loss": 0.5566, - "step": 55926 - }, - { - "epoch": 1.43, - "learning_rate": 1.1201584485759084e-06, - "loss": 0.8027, - "step": 55927 - }, - { - "epoch": 1.43, - "learning_rate": 1.1201309785560185e-06, - "loss": 0.6768, - "step": 55928 - }, - { - "epoch": 1.43, - "learning_rate": 1.1201035084441497e-06, - "loss": 0.4767, - "step": 55929 - }, - { - "epoch": 1.43, - "learning_rate": 1.1200760382403231e-06, - "loss": 0.749, - "step": 55930 - }, - { - "epoch": 1.43, - "learning_rate": 1.12004856794456e-06, - "loss": 0.6357, - "step": 55931 - }, - { - "epoch": 1.43, - "learning_rate": 1.1200210975568814e-06, - "loss": 0.9248, - "step": 55932 - }, - { - "epoch": 1.43, - "learning_rate": 1.1199936270773078e-06, - "loss": 0.8086, - "step": 55933 - }, - { - "epoch": 1.43, - "learning_rate": 1.1199661565058607e-06, - "loss": 0.7554, - "step": 55934 - }, - { - "epoch": 1.43, - "learning_rate": 1.119938685842561e-06, - "loss": 0.5239, - "step": 55935 - }, - { - "epoch": 1.43, - "learning_rate": 1.1199112150874297e-06, - "loss": 0.6943, - "step": 55936 - }, - { - "epoch": 1.43, - "learning_rate": 1.119883744240488e-06, - "loss": 0.6885, - "step": 55937 - }, - { - "epoch": 1.43, - "learning_rate": 1.1198562733017571e-06, - "loss": 0.5996, - "step": 55938 - }, - { - "epoch": 1.43, - "learning_rate": 1.1198288022712574e-06, - "loss": 0.7207, - "step": 55939 - }, - { - "epoch": 1.43, - "learning_rate": 1.1198013311490104e-06, - "loss": 0.6812, - "step": 55940 - }, - { - "epoch": 1.43, - "learning_rate": 1.1197738599350371e-06, - "loss": 0.8584, - "step": 55941 - }, - { - "epoch": 1.43, - "learning_rate": 1.1197463886293582e-06, - "loss": 0.8711, - "step": 55942 - }, - { - "epoch": 1.43, - "learning_rate": 1.1197189172319955e-06, - "loss": 0.438, - "step": 55943 - }, - { - "epoch": 1.43, - "learning_rate": 1.119691445742969e-06, - "loss": 0.6465, - "step": 55944 - }, - { - "epoch": 1.43, - "learning_rate": 1.1196639741623006e-06, - "loss": 0.6738, - "step": 55945 - }, - { - "epoch": 1.43, - "learning_rate": 1.1196365024900108e-06, - "loss": 0.6641, - "step": 55946 - }, - { - "epoch": 1.43, - "learning_rate": 1.119609030726121e-06, - "loss": 0.6016, - "step": 55947 - }, - { - "epoch": 1.43, - "learning_rate": 1.119581558870652e-06, - "loss": 0.7158, - "step": 55948 - }, - { - "epoch": 1.43, - "learning_rate": 1.1195540869236248e-06, - "loss": 0.6426, - "step": 55949 - }, - { - "epoch": 1.43, - "learning_rate": 1.1195266148850605e-06, - "loss": 0.7217, - "step": 55950 - }, - { - "epoch": 1.43, - "learning_rate": 1.1194991427549805e-06, - "loss": 0.645, - "step": 55951 - }, - { - "epoch": 1.43, - "learning_rate": 1.119471670533405e-06, - "loss": 0.604, - "step": 55952 - }, - { - "epoch": 1.43, - "learning_rate": 1.1194441982203559e-06, - "loss": 0.5798, - "step": 55953 - }, - { - "epoch": 1.43, - "learning_rate": 1.1194167258158537e-06, - "loss": 0.5151, - "step": 55954 - }, - { - "epoch": 1.43, - "learning_rate": 1.1193892533199196e-06, - "loss": 0.6943, - "step": 55955 - }, - { - "epoch": 1.43, - "learning_rate": 1.1193617807325747e-06, - "loss": 0.4072, - "step": 55956 - }, - { - "epoch": 1.43, - "learning_rate": 1.11933430805384e-06, - "loss": 0.7451, - "step": 55957 - }, - { - "epoch": 1.43, - "learning_rate": 1.119306835283737e-06, - "loss": 0.6631, - "step": 55958 - }, - { - "epoch": 1.43, - "learning_rate": 1.1192793624222854e-06, - "loss": 0.665, - "step": 55959 - }, - { - "epoch": 1.43, - "learning_rate": 1.1192518894695075e-06, - "loss": 0.6826, - "step": 55960 - }, - { - "epoch": 1.43, - "learning_rate": 1.1192244164254236e-06, - "loss": 0.7256, - "step": 55961 - }, - { - "epoch": 1.43, - "learning_rate": 1.1191969432900555e-06, - "loss": 0.6953, - "step": 55962 - }, - { - "epoch": 1.43, - "learning_rate": 1.1191694700634235e-06, - "loss": 0.6899, - "step": 55963 - }, - { - "epoch": 1.43, - "learning_rate": 1.1191419967455492e-06, - "loss": 0.8076, - "step": 55964 - }, - { - "epoch": 1.43, - "learning_rate": 1.119114523336453e-06, - "loss": 0.6953, - "step": 55965 - }, - { - "epoch": 1.43, - "learning_rate": 1.1190870498361563e-06, - "loss": 0.5691, - "step": 55966 - }, - { - "epoch": 1.43, - "learning_rate": 1.1190595762446802e-06, - "loss": 0.6973, - "step": 55967 - }, - { - "epoch": 1.43, - "learning_rate": 1.119032102562046e-06, - "loss": 0.4985, - "step": 55968 - }, - { - "epoch": 1.43, - "learning_rate": 1.119004628788274e-06, - "loss": 0.6406, - "step": 55969 - }, - { - "epoch": 1.43, - "learning_rate": 1.1189771549233857e-06, - "loss": 0.6328, - "step": 55970 - }, - { - "epoch": 1.43, - "learning_rate": 1.118949680967402e-06, - "loss": 0.4556, - "step": 55971 - }, - { - "epoch": 1.43, - "learning_rate": 1.1189222069203442e-06, - "loss": 0.7354, - "step": 55972 - }, - { - "epoch": 1.43, - "learning_rate": 1.118894732782233e-06, - "loss": 0.5737, - "step": 55973 - }, - { - "epoch": 1.43, - "learning_rate": 1.1188672585530895e-06, - "loss": 0.6411, - "step": 55974 - }, - { - "epoch": 1.43, - "learning_rate": 1.118839784232935e-06, - "loss": 0.6104, - "step": 55975 - }, - { - "epoch": 1.43, - "learning_rate": 1.1188123098217902e-06, - "loss": 0.7007, - "step": 55976 - }, - { - "epoch": 1.43, - "learning_rate": 1.118784835319676e-06, - "loss": 0.6104, - "step": 55977 - }, - { - "epoch": 1.43, - "learning_rate": 1.1187573607266144e-06, - "loss": 0.6562, - "step": 55978 - }, - { - "epoch": 1.43, - "learning_rate": 1.1187298860426252e-06, - "loss": 0.4512, - "step": 55979 - }, - { - "epoch": 1.43, - "learning_rate": 1.1187024112677301e-06, - "loss": 0.7246, - "step": 55980 - }, - { - "epoch": 1.43, - "learning_rate": 1.11867493640195e-06, - "loss": 0.7168, - "step": 55981 - }, - { - "epoch": 1.43, - "learning_rate": 1.118647461445306e-06, - "loss": 0.4673, - "step": 55982 - }, - { - "epoch": 1.43, - "learning_rate": 1.1186199863978194e-06, - "loss": 0.6411, - "step": 55983 - }, - { - "epoch": 1.43, - "learning_rate": 1.1185925112595106e-06, - "loss": 0.6396, - "step": 55984 - }, - { - "epoch": 1.43, - "learning_rate": 1.118565036030401e-06, - "loss": 0.522, - "step": 55985 - }, - { - "epoch": 1.43, - "learning_rate": 1.1185375607105114e-06, - "loss": 0.791, - "step": 55986 - }, - { - "epoch": 1.43, - "learning_rate": 1.1185100852998634e-06, - "loss": 0.5977, - "step": 55987 - }, - { - "epoch": 1.44, - "learning_rate": 1.1184826097984777e-06, - "loss": 0.709, - "step": 55988 - }, - { - "epoch": 1.44, - "learning_rate": 1.1184551342063752e-06, - "loss": 0.5334, - "step": 55989 - }, - { - "epoch": 1.44, - "learning_rate": 1.1184276585235768e-06, - "loss": 0.6128, - "step": 55990 - }, - { - "epoch": 1.44, - "learning_rate": 1.1184001827501042e-06, - "loss": 0.6284, - "step": 55991 - }, - { - "epoch": 1.44, - "learning_rate": 1.1183727068859777e-06, - "loss": 0.6272, - "step": 55992 - }, - { - "epoch": 1.44, - "learning_rate": 1.1183452309312186e-06, - "loss": 0.5781, - "step": 55993 - }, - { - "epoch": 1.44, - "learning_rate": 1.1183177548858484e-06, - "loss": 0.7861, - "step": 55994 - }, - { - "epoch": 1.44, - "learning_rate": 1.1182902787498876e-06, - "loss": 0.6426, - "step": 55995 - }, - { - "epoch": 1.44, - "learning_rate": 1.1182628025233572e-06, - "loss": 0.6426, - "step": 55996 - }, - { - "epoch": 1.44, - "learning_rate": 1.1182353262062785e-06, - "loss": 0.6748, - "step": 55997 - }, - { - "epoch": 1.44, - "learning_rate": 1.1182078497986724e-06, - "loss": 0.5938, - "step": 55998 - }, - { - "epoch": 1.44, - "learning_rate": 1.11818037330056e-06, - "loss": 0.7334, - "step": 55999 - }, - { - "epoch": 1.44, - "learning_rate": 1.1181528967119625e-06, - "loss": 0.4976, - "step": 56000 - }, - { - "epoch": 1.44, - "learning_rate": 1.1181254200329005e-06, - "loss": 0.5425, - "step": 56001 - }, - { - "epoch": 1.44, - "learning_rate": 1.1180979432633955e-06, - "loss": 0.4893, - "step": 56002 - }, - { - "epoch": 1.44, - "learning_rate": 1.1180704664034682e-06, - "loss": 0.6411, - "step": 56003 - }, - { - "epoch": 1.44, - "learning_rate": 1.1180429894531399e-06, - "loss": 0.4149, - "step": 56004 - }, - { - "epoch": 1.44, - "learning_rate": 1.1180155124124312e-06, - "loss": 0.5498, - "step": 56005 - }, - { - "epoch": 1.44, - "learning_rate": 1.1179880352813638e-06, - "loss": 0.7744, - "step": 56006 - }, - { - "epoch": 1.44, - "learning_rate": 1.1179605580599583e-06, - "loss": 0.5923, - "step": 56007 - }, - { - "epoch": 1.44, - "learning_rate": 1.117933080748236e-06, - "loss": 0.7021, - "step": 56008 - }, - { - "epoch": 1.44, - "learning_rate": 1.1179056033462173e-06, - "loss": 0.6997, - "step": 56009 - }, - { - "epoch": 1.44, - "learning_rate": 1.117878125853924e-06, - "loss": 0.7939, - "step": 56010 - }, - { - "epoch": 1.44, - "learning_rate": 1.1178506482713767e-06, - "loss": 0.5752, - "step": 56011 - }, - { - "epoch": 1.44, - "learning_rate": 1.117823170598597e-06, - "loss": 0.5635, - "step": 56012 - }, - { - "epoch": 1.44, - "learning_rate": 1.117795692835605e-06, - "loss": 0.5347, - "step": 56013 - }, - { - "epoch": 1.44, - "learning_rate": 1.1177682149824223e-06, - "loss": 0.6738, - "step": 56014 - }, - { - "epoch": 1.44, - "learning_rate": 1.1177407370390702e-06, - "loss": 0.5967, - "step": 56015 - }, - { - "epoch": 1.44, - "learning_rate": 1.117713259005569e-06, - "loss": 0.6946, - "step": 56016 - }, - { - "epoch": 1.44, - "learning_rate": 1.1176857808819406e-06, - "loss": 0.7422, - "step": 56017 - }, - { - "epoch": 1.44, - "learning_rate": 1.1176583026682053e-06, - "loss": 0.5417, - "step": 56018 - }, - { - "epoch": 1.44, - "learning_rate": 1.1176308243643848e-06, - "loss": 0.6157, - "step": 56019 - }, - { - "epoch": 1.44, - "learning_rate": 1.1176033459704995e-06, - "loss": 0.417, - "step": 56020 - }, - { - "epoch": 1.44, - "learning_rate": 1.1175758674865708e-06, - "loss": 0.455, - "step": 56021 - }, - { - "epoch": 1.44, - "learning_rate": 1.1175483889126196e-06, - "loss": 0.6812, - "step": 56022 - }, - { - "epoch": 1.44, - "learning_rate": 1.1175209102486674e-06, - "loss": 0.7627, - "step": 56023 - }, - { - "epoch": 1.44, - "learning_rate": 1.1174934314947343e-06, - "loss": 0.5425, - "step": 56024 - }, - { - "epoch": 1.44, - "learning_rate": 1.1174659526508422e-06, - "loss": 0.6216, - "step": 56025 - }, - { - "epoch": 1.44, - "learning_rate": 1.1174384737170115e-06, - "loss": 0.5267, - "step": 56026 - }, - { - "epoch": 1.44, - "learning_rate": 1.117410994693264e-06, - "loss": 0.647, - "step": 56027 - }, - { - "epoch": 1.44, - "learning_rate": 1.1173835155796199e-06, - "loss": 0.7607, - "step": 56028 - }, - { - "epoch": 1.44, - "learning_rate": 1.117356036376101e-06, - "loss": 0.6738, - "step": 56029 - }, - { - "epoch": 1.44, - "learning_rate": 1.1173285570827276e-06, - "loss": 0.4844, - "step": 56030 - }, - { - "epoch": 1.44, - "learning_rate": 1.1173010776995214e-06, - "loss": 0.6758, - "step": 56031 - }, - { - "epoch": 1.44, - "learning_rate": 1.1172735982265032e-06, - "loss": 0.7168, - "step": 56032 - }, - { - "epoch": 1.44, - "learning_rate": 1.1172461186636938e-06, - "loss": 0.5859, - "step": 56033 - }, - { - "epoch": 1.44, - "learning_rate": 1.1172186390111144e-06, - "loss": 0.6494, - "step": 56034 - }, - { - "epoch": 1.44, - "learning_rate": 1.117191159268786e-06, - "loss": 0.667, - "step": 56035 - }, - { - "epoch": 1.44, - "learning_rate": 1.1171636794367301e-06, - "loss": 0.4904, - "step": 56036 - }, - { - "epoch": 1.44, - "learning_rate": 1.117136199514967e-06, - "loss": 0.7852, - "step": 56037 - }, - { - "epoch": 1.44, - "learning_rate": 1.1171087195035186e-06, - "loss": 0.749, - "step": 56038 - }, - { - "epoch": 1.44, - "learning_rate": 1.1170812394024051e-06, - "loss": 0.5969, - "step": 56039 - }, - { - "epoch": 1.44, - "learning_rate": 1.1170537592116478e-06, - "loss": 0.4333, - "step": 56040 - }, - { - "epoch": 1.44, - "learning_rate": 1.117026278931268e-06, - "loss": 0.7275, - "step": 56041 - }, - { - "epoch": 1.44, - "learning_rate": 1.1169987985612863e-06, - "loss": 0.5454, - "step": 56042 - }, - { - "epoch": 1.44, - "learning_rate": 1.1169713181017242e-06, - "loss": 0.6826, - "step": 56043 - }, - { - "epoch": 1.44, - "learning_rate": 1.1169438375526025e-06, - "loss": 0.5879, - "step": 56044 - }, - { - "epoch": 1.44, - "learning_rate": 1.116916356913942e-06, - "loss": 0.6096, - "step": 56045 - }, - { - "epoch": 1.44, - "learning_rate": 1.1168888761857644e-06, - "loss": 0.793, - "step": 56046 - }, - { - "epoch": 1.44, - "learning_rate": 1.1168613953680903e-06, - "loss": 0.7324, - "step": 56047 - }, - { - "epoch": 1.44, - "learning_rate": 1.116833914460941e-06, - "loss": 0.7734, - "step": 56048 - }, - { - "epoch": 1.44, - "learning_rate": 1.116806433464337e-06, - "loss": 0.5811, - "step": 56049 - }, - { - "epoch": 1.44, - "learning_rate": 1.1167789523782999e-06, - "loss": 0.6543, - "step": 56050 - }, - { - "epoch": 1.44, - "learning_rate": 1.11675147120285e-06, - "loss": 0.6514, - "step": 56051 - }, - { - "epoch": 1.44, - "learning_rate": 1.1167239899380097e-06, - "loss": 0.6069, - "step": 56052 - }, - { - "epoch": 1.44, - "learning_rate": 1.1166965085837987e-06, - "loss": 0.9902, - "step": 56053 - }, - { - "epoch": 1.44, - "learning_rate": 1.1166690271402386e-06, - "loss": 0.5962, - "step": 56054 - }, - { - "epoch": 1.44, - "learning_rate": 1.1166415456073504e-06, - "loss": 0.488, - "step": 56055 - }, - { - "epoch": 1.44, - "learning_rate": 1.1166140639851551e-06, - "loss": 0.5186, - "step": 56056 - }, - { - "epoch": 1.44, - "learning_rate": 1.1165865822736739e-06, - "loss": 0.7314, - "step": 56057 - }, - { - "epoch": 1.44, - "learning_rate": 1.1165591004729278e-06, - "loss": 0.5776, - "step": 56058 - }, - { - "epoch": 1.44, - "learning_rate": 1.1165316185829373e-06, - "loss": 0.5889, - "step": 56059 - }, - { - "epoch": 1.44, - "learning_rate": 1.1165041366037244e-06, - "loss": 0.5526, - "step": 56060 - }, - { - "epoch": 1.44, - "learning_rate": 1.1164766545353094e-06, - "loss": 0.8545, - "step": 56061 - }, - { - "epoch": 1.44, - "learning_rate": 1.1164491723777137e-06, - "loss": 0.7227, - "step": 56062 - }, - { - "epoch": 1.44, - "learning_rate": 1.1164216901309582e-06, - "loss": 0.6294, - "step": 56063 - }, - { - "epoch": 1.44, - "learning_rate": 1.116394207795064e-06, - "loss": 0.5259, - "step": 56064 - }, - { - "epoch": 1.44, - "learning_rate": 1.1163667253700519e-06, - "loss": 0.5293, - "step": 56065 - }, - { - "epoch": 1.44, - "learning_rate": 1.1163392428559432e-06, - "loss": 0.5957, - "step": 56066 - }, - { - "epoch": 1.44, - "learning_rate": 1.1163117602527592e-06, - "loss": 0.6104, - "step": 56067 - }, - { - "epoch": 1.44, - "learning_rate": 1.11628427756052e-06, - "loss": 0.6846, - "step": 56068 - }, - { - "epoch": 1.44, - "learning_rate": 1.116256794779248e-06, - "loss": 0.6113, - "step": 56069 - }, - { - "epoch": 1.44, - "learning_rate": 1.116229311908963e-06, - "loss": 0.5088, - "step": 56070 - }, - { - "epoch": 1.44, - "learning_rate": 1.1162018289496868e-06, - "loss": 0.7163, - "step": 56071 - }, - { - "epoch": 1.44, - "learning_rate": 1.1161743459014404e-06, - "loss": 0.7725, - "step": 56072 - }, - { - "epoch": 1.44, - "learning_rate": 1.1161468627642443e-06, - "loss": 0.5996, - "step": 56073 - }, - { - "epoch": 1.44, - "learning_rate": 1.11611937953812e-06, - "loss": 0.5226, - "step": 56074 - }, - { - "epoch": 1.44, - "learning_rate": 1.1160918962230884e-06, - "loss": 0.4551, - "step": 56075 - }, - { - "epoch": 1.44, - "learning_rate": 1.1160644128191703e-06, - "loss": 0.5898, - "step": 56076 - }, - { - "epoch": 1.44, - "learning_rate": 1.1160369293263876e-06, - "loss": 0.7627, - "step": 56077 - }, - { - "epoch": 1.44, - "learning_rate": 1.1160094457447603e-06, - "loss": 0.7373, - "step": 56078 - }, - { - "epoch": 1.44, - "learning_rate": 1.1159819620743102e-06, - "loss": 0.7515, - "step": 56079 - }, - { - "epoch": 1.44, - "learning_rate": 1.1159544783150577e-06, - "loss": 0.6685, - "step": 56080 - }, - { - "epoch": 1.44, - "learning_rate": 1.1159269944670246e-06, - "loss": 0.6045, - "step": 56081 - }, - { - "epoch": 1.44, - "learning_rate": 1.1158995105302313e-06, - "loss": 0.5063, - "step": 56082 - }, - { - "epoch": 1.44, - "learning_rate": 1.115872026504699e-06, - "loss": 0.7148, - "step": 56083 - }, - { - "epoch": 1.44, - "learning_rate": 1.115844542390449e-06, - "loss": 0.5073, - "step": 56084 - }, - { - "epoch": 1.44, - "learning_rate": 1.1158170581875022e-06, - "loss": 0.6045, - "step": 56085 - }, - { - "epoch": 1.44, - "learning_rate": 1.1157895738958794e-06, - "loss": 0.7607, - "step": 56086 - }, - { - "epoch": 1.44, - "learning_rate": 1.1157620895156019e-06, - "loss": 0.6196, - "step": 56087 - }, - { - "epoch": 1.44, - "learning_rate": 1.1157346050466906e-06, - "loss": 0.6348, - "step": 56088 - }, - { - "epoch": 1.44, - "learning_rate": 1.1157071204891668e-06, - "loss": 0.5947, - "step": 56089 - }, - { - "epoch": 1.44, - "learning_rate": 1.1156796358430514e-06, - "loss": 0.7456, - "step": 56090 - }, - { - "epoch": 1.44, - "learning_rate": 1.115652151108365e-06, - "loss": 0.7026, - "step": 56091 - }, - { - "epoch": 1.44, - "learning_rate": 1.1156246662851298e-06, - "loss": 0.4658, - "step": 56092 - }, - { - "epoch": 1.44, - "learning_rate": 1.1155971813733658e-06, - "loss": 0.7168, - "step": 56093 - }, - { - "epoch": 1.44, - "learning_rate": 1.1155696963730942e-06, - "loss": 0.6035, - "step": 56094 - }, - { - "epoch": 1.44, - "learning_rate": 1.1155422112843363e-06, - "loss": 0.7227, - "step": 56095 - }, - { - "epoch": 1.44, - "learning_rate": 1.115514726107113e-06, - "loss": 0.5825, - "step": 56096 - }, - { - "epoch": 1.44, - "learning_rate": 1.1154872408414455e-06, - "loss": 0.6699, - "step": 56097 - }, - { - "epoch": 1.44, - "learning_rate": 1.1154597554873548e-06, - "loss": 0.6895, - "step": 56098 - }, - { - "epoch": 1.44, - "learning_rate": 1.1154322700448615e-06, - "loss": 0.6533, - "step": 56099 - }, - { - "epoch": 1.44, - "learning_rate": 1.1154047845139874e-06, - "loss": 0.7549, - "step": 56100 - }, - { - "epoch": 1.44, - "learning_rate": 1.1153772988947528e-06, - "loss": 0.5684, - "step": 56101 - }, - { - "epoch": 1.44, - "learning_rate": 1.1153498131871796e-06, - "loss": 0.6665, - "step": 56102 - }, - { - "epoch": 1.44, - "learning_rate": 1.1153223273912876e-06, - "loss": 0.6592, - "step": 56103 - }, - { - "epoch": 1.44, - "learning_rate": 1.1152948415070993e-06, - "loss": 0.71, - "step": 56104 - }, - { - "epoch": 1.44, - "learning_rate": 1.1152673555346347e-06, - "loss": 0.7021, - "step": 56105 - }, - { - "epoch": 1.44, - "learning_rate": 1.1152398694739154e-06, - "loss": 0.4054, - "step": 56106 - }, - { - "epoch": 1.44, - "learning_rate": 1.1152123833249623e-06, - "loss": 0.4995, - "step": 56107 - }, - { - "epoch": 1.44, - "learning_rate": 1.115184897087796e-06, - "loss": 0.7715, - "step": 56108 - }, - { - "epoch": 1.44, - "learning_rate": 1.115157410762438e-06, - "loss": 0.3291, - "step": 56109 - }, - { - "epoch": 1.44, - "learning_rate": 1.1151299243489094e-06, - "loss": 0.7812, - "step": 56110 - }, - { - "epoch": 1.44, - "learning_rate": 1.1151024378472311e-06, - "loss": 0.5278, - "step": 56111 - }, - { - "epoch": 1.44, - "learning_rate": 1.1150749512574243e-06, - "loss": 0.5847, - "step": 56112 - }, - { - "epoch": 1.44, - "learning_rate": 1.1150474645795096e-06, - "loss": 0.6235, - "step": 56113 - }, - { - "epoch": 1.44, - "learning_rate": 1.1150199778135085e-06, - "loss": 0.7744, - "step": 56114 - }, - { - "epoch": 1.44, - "learning_rate": 1.1149924909594418e-06, - "loss": 0.6006, - "step": 56115 - }, - { - "epoch": 1.44, - "learning_rate": 1.1149650040173305e-06, - "loss": 0.5485, - "step": 56116 - }, - { - "epoch": 1.44, - "learning_rate": 1.1149375169871964e-06, - "loss": 0.689, - "step": 56117 - }, - { - "epoch": 1.44, - "learning_rate": 1.1149100298690594e-06, - "loss": 0.6013, - "step": 56118 - }, - { - "epoch": 1.44, - "learning_rate": 1.1148825426629415e-06, - "loss": 0.5591, - "step": 56119 - }, - { - "epoch": 1.44, - "learning_rate": 1.1148550553688628e-06, - "loss": 0.7812, - "step": 56120 - }, - { - "epoch": 1.44, - "learning_rate": 1.114827567986845e-06, - "loss": 0.6475, - "step": 56121 - }, - { - "epoch": 1.44, - "learning_rate": 1.114800080516909e-06, - "loss": 0.4561, - "step": 56122 - }, - { - "epoch": 1.44, - "learning_rate": 1.1147725929590763e-06, - "loss": 0.6025, - "step": 56123 - }, - { - "epoch": 1.44, - "learning_rate": 1.114745105313367e-06, - "loss": 0.5347, - "step": 56124 - }, - { - "epoch": 1.44, - "learning_rate": 1.1147176175798027e-06, - "loss": 0.5701, - "step": 56125 - }, - { - "epoch": 1.44, - "learning_rate": 1.1146901297584045e-06, - "loss": 0.5947, - "step": 56126 - }, - { - "epoch": 1.44, - "learning_rate": 1.1146626418491933e-06, - "loss": 0.6953, - "step": 56127 - }, - { - "epoch": 1.44, - "learning_rate": 1.1146351538521903e-06, - "loss": 0.5425, - "step": 56128 - }, - { - "epoch": 1.44, - "learning_rate": 1.1146076657674166e-06, - "loss": 0.7544, - "step": 56129 - }, - { - "epoch": 1.44, - "learning_rate": 1.1145801775948927e-06, - "loss": 0.6777, - "step": 56130 - }, - { - "epoch": 1.44, - "learning_rate": 1.1145526893346402e-06, - "loss": 0.7354, - "step": 56131 - }, - { - "epoch": 1.44, - "learning_rate": 1.11452520098668e-06, - "loss": 0.6182, - "step": 56132 - }, - { - "epoch": 1.44, - "learning_rate": 1.1144977125510329e-06, - "loss": 0.6196, - "step": 56133 - }, - { - "epoch": 1.44, - "learning_rate": 1.1144702240277205e-06, - "loss": 0.645, - "step": 56134 - }, - { - "epoch": 1.44, - "learning_rate": 1.114442735416763e-06, - "loss": 0.8311, - "step": 56135 - }, - { - "epoch": 1.44, - "learning_rate": 1.1144152467181824e-06, - "loss": 0.7324, - "step": 56136 - }, - { - "epoch": 1.44, - "learning_rate": 1.1143877579319993e-06, - "loss": 0.5928, - "step": 56137 - }, - { - "epoch": 1.44, - "learning_rate": 1.1143602690582348e-06, - "loss": 0.8369, - "step": 56138 - }, - { - "epoch": 1.44, - "learning_rate": 1.1143327800969096e-06, - "loss": 0.6377, - "step": 56139 - }, - { - "epoch": 1.44, - "learning_rate": 1.1143052910480453e-06, - "loss": 0.6016, - "step": 56140 - }, - { - "epoch": 1.44, - "learning_rate": 1.1142778019116623e-06, - "loss": 0.6846, - "step": 56141 - }, - { - "epoch": 1.44, - "learning_rate": 1.1142503126877827e-06, - "loss": 0.5918, - "step": 56142 - }, - { - "epoch": 1.44, - "learning_rate": 1.1142228233764263e-06, - "loss": 0.6714, - "step": 56143 - }, - { - "epoch": 1.44, - "learning_rate": 1.1141953339776151e-06, - "loss": 0.5918, - "step": 56144 - }, - { - "epoch": 1.44, - "learning_rate": 1.1141678444913696e-06, - "loss": 0.6426, - "step": 56145 - }, - { - "epoch": 1.44, - "learning_rate": 1.114140354917711e-06, - "loss": 0.7427, - "step": 56146 - }, - { - "epoch": 1.44, - "learning_rate": 1.1141128652566608e-06, - "loss": 0.6875, - "step": 56147 - }, - { - "epoch": 1.44, - "learning_rate": 1.1140853755082393e-06, - "loss": 0.5864, - "step": 56148 - }, - { - "epoch": 1.44, - "learning_rate": 1.1140578856724676e-06, - "loss": 0.6306, - "step": 56149 - }, - { - "epoch": 1.44, - "learning_rate": 1.1140303957493676e-06, - "loss": 0.4751, - "step": 56150 - }, - { - "epoch": 1.44, - "learning_rate": 1.114002905738959e-06, - "loss": 0.6072, - "step": 56151 - }, - { - "epoch": 1.44, - "learning_rate": 1.1139754156412642e-06, - "loss": 0.7783, - "step": 56152 - }, - { - "epoch": 1.44, - "learning_rate": 1.1139479254563036e-06, - "loss": 0.5911, - "step": 56153 - }, - { - "epoch": 1.44, - "learning_rate": 1.1139204351840983e-06, - "loss": 0.7124, - "step": 56154 - }, - { - "epoch": 1.44, - "learning_rate": 1.1138929448246692e-06, - "loss": 0.5645, - "step": 56155 - }, - { - "epoch": 1.44, - "learning_rate": 1.1138654543780375e-06, - "loss": 0.7168, - "step": 56156 - }, - { - "epoch": 1.44, - "learning_rate": 1.1138379638442248e-06, - "loss": 0.8301, - "step": 56157 - }, - { - "epoch": 1.44, - "learning_rate": 1.113810473223251e-06, - "loss": 0.6812, - "step": 56158 - }, - { - "epoch": 1.44, - "learning_rate": 1.1137829825151378e-06, - "loss": 0.626, - "step": 56159 - }, - { - "epoch": 1.44, - "learning_rate": 1.1137554917199063e-06, - "loss": 0.7812, - "step": 56160 - }, - { - "epoch": 1.44, - "learning_rate": 1.1137280008375775e-06, - "loss": 0.7217, - "step": 56161 - }, - { - "epoch": 1.44, - "learning_rate": 1.1137005098681726e-06, - "loss": 0.5591, - "step": 56162 - }, - { - "epoch": 1.44, - "learning_rate": 1.1136730188117123e-06, - "loss": 0.6294, - "step": 56163 - }, - { - "epoch": 1.44, - "learning_rate": 1.1136455276682174e-06, - "loss": 0.5186, - "step": 56164 - }, - { - "epoch": 1.44, - "learning_rate": 1.11361803643771e-06, - "loss": 0.5942, - "step": 56165 - }, - { - "epoch": 1.44, - "learning_rate": 1.11359054512021e-06, - "loss": 0.8398, - "step": 56166 - }, - { - "epoch": 1.44, - "learning_rate": 1.1135630537157392e-06, - "loss": 0.5264, - "step": 56167 - }, - { - "epoch": 1.44, - "learning_rate": 1.1135355622243183e-06, - "loss": 0.8037, - "step": 56168 - }, - { - "epoch": 1.44, - "learning_rate": 1.1135080706459686e-06, - "loss": 0.7002, - "step": 56169 - }, - { - "epoch": 1.44, - "learning_rate": 1.1134805789807107e-06, - "loss": 0.5952, - "step": 56170 - }, - { - "epoch": 1.44, - "learning_rate": 1.1134530872285661e-06, - "loss": 0.7715, - "step": 56171 - }, - { - "epoch": 1.44, - "learning_rate": 1.1134255953895557e-06, - "loss": 0.6807, - "step": 56172 - }, - { - "epoch": 1.44, - "learning_rate": 1.1133981034637004e-06, - "loss": 0.5659, - "step": 56173 - }, - { - "epoch": 1.44, - "learning_rate": 1.1133706114510216e-06, - "loss": 0.5739, - "step": 56174 - }, - { - "epoch": 1.44, - "learning_rate": 1.1133431193515399e-06, - "loss": 0.6187, - "step": 56175 - }, - { - "epoch": 1.44, - "learning_rate": 1.1133156271652767e-06, - "loss": 0.625, - "step": 56176 - }, - { - "epoch": 1.44, - "learning_rate": 1.113288134892253e-06, - "loss": 0.4863, - "step": 56177 - }, - { - "epoch": 1.44, - "learning_rate": 1.1132606425324898e-06, - "loss": 0.625, - "step": 56178 - }, - { - "epoch": 1.44, - "learning_rate": 1.113233150086008e-06, - "loss": 0.6797, - "step": 56179 - }, - { - "epoch": 1.44, - "learning_rate": 1.1132056575528288e-06, - "loss": 0.6064, - "step": 56180 - }, - { - "epoch": 1.44, - "learning_rate": 1.113178164932973e-06, - "loss": 0.6558, - "step": 56181 - }, - { - "epoch": 1.44, - "learning_rate": 1.1131506722264625e-06, - "loss": 0.5703, - "step": 56182 - }, - { - "epoch": 1.44, - "learning_rate": 1.1131231794333174e-06, - "loss": 0.5815, - "step": 56183 - }, - { - "epoch": 1.44, - "learning_rate": 1.1130956865535591e-06, - "loss": 0.6104, - "step": 56184 - }, - { - "epoch": 1.44, - "learning_rate": 1.1130681935872085e-06, - "loss": 0.7725, - "step": 56185 - }, - { - "epoch": 1.44, - "learning_rate": 1.1130407005342868e-06, - "loss": 0.7295, - "step": 56186 - }, - { - "epoch": 1.44, - "learning_rate": 1.1130132073948153e-06, - "loss": 0.6636, - "step": 56187 - }, - { - "epoch": 1.44, - "learning_rate": 1.1129857141688145e-06, - "loss": 0.7168, - "step": 56188 - }, - { - "epoch": 1.44, - "learning_rate": 1.1129582208563057e-06, - "loss": 0.6992, - "step": 56189 - }, - { - "epoch": 1.44, - "learning_rate": 1.1129307274573103e-06, - "loss": 0.584, - "step": 56190 - }, - { - "epoch": 1.44, - "learning_rate": 1.1129032339718487e-06, - "loss": 0.667, - "step": 56191 - }, - { - "epoch": 1.44, - "learning_rate": 1.1128757403999428e-06, - "loss": 0.7139, - "step": 56192 - }, - { - "epoch": 1.44, - "learning_rate": 1.1128482467416128e-06, - "loss": 0.7275, - "step": 56193 - }, - { - "epoch": 1.44, - "learning_rate": 1.1128207529968801e-06, - "loss": 0.7568, - "step": 56194 - }, - { - "epoch": 1.44, - "learning_rate": 1.1127932591657654e-06, - "loss": 0.9424, - "step": 56195 - }, - { - "epoch": 1.44, - "learning_rate": 1.1127657652482905e-06, - "loss": 0.6626, - "step": 56196 - }, - { - "epoch": 1.44, - "learning_rate": 1.112738271244476e-06, - "loss": 0.5125, - "step": 56197 - }, - { - "epoch": 1.44, - "learning_rate": 1.1127107771543427e-06, - "loss": 0.6304, - "step": 56198 - }, - { - "epoch": 1.44, - "learning_rate": 1.1126832829779123e-06, - "loss": 0.55, - "step": 56199 - }, - { - "epoch": 1.44, - "learning_rate": 1.1126557887152053e-06, - "loss": 0.5474, - "step": 56200 - }, - { - "epoch": 1.44, - "learning_rate": 1.1126282943662432e-06, - "loss": 0.7305, - "step": 56201 - }, - { - "epoch": 1.44, - "learning_rate": 1.1126007999310465e-06, - "loss": 0.5562, - "step": 56202 - }, - { - "epoch": 1.44, - "learning_rate": 1.1125733054096368e-06, - "loss": 0.4964, - "step": 56203 - }, - { - "epoch": 1.44, - "learning_rate": 1.1125458108020344e-06, - "loss": 0.5952, - "step": 56204 - }, - { - "epoch": 1.44, - "learning_rate": 1.1125183161082613e-06, - "loss": 0.7676, - "step": 56205 - }, - { - "epoch": 1.44, - "learning_rate": 1.1124908213283377e-06, - "loss": 0.4214, - "step": 56206 - }, - { - "epoch": 1.44, - "learning_rate": 1.112463326462286e-06, - "loss": 0.6299, - "step": 56207 - }, - { - "epoch": 1.44, - "learning_rate": 1.1124358315101252e-06, - "loss": 0.6885, - "step": 56208 - }, - { - "epoch": 1.44, - "learning_rate": 1.112408336471878e-06, - "loss": 0.6553, - "step": 56209 - }, - { - "epoch": 1.44, - "learning_rate": 1.1123808413475645e-06, - "loss": 0.7197, - "step": 56210 - }, - { - "epoch": 1.44, - "learning_rate": 1.1123533461372065e-06, - "loss": 0.6167, - "step": 56211 - }, - { - "epoch": 1.44, - "learning_rate": 1.112325850840825e-06, - "loss": 0.7695, - "step": 56212 - }, - { - "epoch": 1.44, - "learning_rate": 1.1122983554584405e-06, - "loss": 0.6416, - "step": 56213 - }, - { - "epoch": 1.44, - "learning_rate": 1.112270859990074e-06, - "loss": 0.751, - "step": 56214 - }, - { - "epoch": 1.44, - "learning_rate": 1.112243364435747e-06, - "loss": 0.7578, - "step": 56215 - }, - { - "epoch": 1.44, - "learning_rate": 1.1122158687954803e-06, - "loss": 0.6855, - "step": 56216 - }, - { - "epoch": 1.44, - "learning_rate": 1.1121883730692955e-06, - "loss": 0.6284, - "step": 56217 - }, - { - "epoch": 1.44, - "learning_rate": 1.1121608772572132e-06, - "loss": 0.7568, - "step": 56218 - }, - { - "epoch": 1.44, - "learning_rate": 1.1121333813592542e-06, - "loss": 0.6021, - "step": 56219 - }, - { - "epoch": 1.44, - "learning_rate": 1.1121058853754397e-06, - "loss": 0.4985, - "step": 56220 - }, - { - "epoch": 1.44, - "learning_rate": 1.1120783893057911e-06, - "loss": 0.6072, - "step": 56221 - }, - { - "epoch": 1.44, - "learning_rate": 1.1120508931503295e-06, - "loss": 0.6846, - "step": 56222 - }, - { - "epoch": 1.44, - "learning_rate": 1.112023396909075e-06, - "loss": 0.7461, - "step": 56223 - }, - { - "epoch": 1.44, - "learning_rate": 1.11199590058205e-06, - "loss": 0.6367, - "step": 56224 - }, - { - "epoch": 1.44, - "learning_rate": 1.1119684041692745e-06, - "loss": 0.605, - "step": 56225 - }, - { - "epoch": 1.44, - "learning_rate": 1.11194090767077e-06, - "loss": 0.55, - "step": 56226 - }, - { - "epoch": 1.44, - "learning_rate": 1.1119134110865576e-06, - "loss": 0.4449, - "step": 56227 - }, - { - "epoch": 1.44, - "learning_rate": 1.1118859144166583e-06, - "loss": 0.6157, - "step": 56228 - }, - { - "epoch": 1.44, - "learning_rate": 1.111858417661093e-06, - "loss": 0.7402, - "step": 56229 - }, - { - "epoch": 1.44, - "learning_rate": 1.1118309208198828e-06, - "loss": 0.8242, - "step": 56230 - }, - { - "epoch": 1.44, - "learning_rate": 1.1118034238930488e-06, - "loss": 0.7559, - "step": 56231 - }, - { - "epoch": 1.44, - "learning_rate": 1.1117759268806123e-06, - "loss": 0.6514, - "step": 56232 - }, - { - "epoch": 1.44, - "learning_rate": 1.111748429782594e-06, - "loss": 0.7012, - "step": 56233 - }, - { - "epoch": 1.44, - "learning_rate": 1.111720932599015e-06, - "loss": 0.5139, - "step": 56234 - }, - { - "epoch": 1.44, - "learning_rate": 1.1116934353298961e-06, - "loss": 0.708, - "step": 56235 - }, - { - "epoch": 1.44, - "learning_rate": 1.111665937975259e-06, - "loss": 0.5293, - "step": 56236 - }, - { - "epoch": 1.44, - "learning_rate": 1.1116384405351247e-06, - "loss": 0.7295, - "step": 56237 - }, - { - "epoch": 1.44, - "learning_rate": 1.1116109430095137e-06, - "loss": 0.7212, - "step": 56238 - }, - { - "epoch": 1.44, - "learning_rate": 1.1115834453984471e-06, - "loss": 0.8047, - "step": 56239 - }, - { - "epoch": 1.44, - "learning_rate": 1.1115559477019464e-06, - "loss": 0.5708, - "step": 56240 - }, - { - "epoch": 1.44, - "learning_rate": 1.1115284499200324e-06, - "loss": 0.6548, - "step": 56241 - }, - { - "epoch": 1.44, - "learning_rate": 1.1115009520527262e-06, - "loss": 0.7363, - "step": 56242 - }, - { - "epoch": 1.44, - "learning_rate": 1.1114734541000491e-06, - "loss": 0.5742, - "step": 56243 - }, - { - "epoch": 1.44, - "learning_rate": 1.1114459560620216e-06, - "loss": 0.4998, - "step": 56244 - }, - { - "epoch": 1.44, - "learning_rate": 1.1114184579386652e-06, - "loss": 0.7236, - "step": 56245 - }, - { - "epoch": 1.44, - "learning_rate": 1.1113909597300007e-06, - "loss": 0.5808, - "step": 56246 - }, - { - "epoch": 1.44, - "learning_rate": 1.1113634614360496e-06, - "loss": 0.6262, - "step": 56247 - }, - { - "epoch": 1.44, - "learning_rate": 1.1113359630568323e-06, - "loss": 0.6899, - "step": 56248 - }, - { - "epoch": 1.44, - "learning_rate": 1.11130846459237e-06, - "loss": 0.6479, - "step": 56249 - }, - { - "epoch": 1.44, - "learning_rate": 1.1112809660426842e-06, - "loss": 0.522, - "step": 56250 - }, - { - "epoch": 1.44, - "learning_rate": 1.1112534674077957e-06, - "loss": 0.7188, - "step": 56251 - }, - { - "epoch": 1.44, - "learning_rate": 1.1112259686877255e-06, - "loss": 0.6997, - "step": 56252 - }, - { - "epoch": 1.44, - "learning_rate": 1.1111984698824947e-06, - "loss": 0.6248, - "step": 56253 - }, - { - "epoch": 1.44, - "learning_rate": 1.1111709709921242e-06, - "loss": 0.8174, - "step": 56254 - }, - { - "epoch": 1.44, - "learning_rate": 1.1111434720166353e-06, - "loss": 0.646, - "step": 56255 - }, - { - "epoch": 1.44, - "learning_rate": 1.1111159729560488e-06, - "loss": 0.7075, - "step": 56256 - }, - { - "epoch": 1.44, - "learning_rate": 1.1110884738103863e-06, - "loss": 0.6392, - "step": 56257 - }, - { - "epoch": 1.44, - "learning_rate": 1.1110609745796682e-06, - "loss": 0.7383, - "step": 56258 - }, - { - "epoch": 1.44, - "learning_rate": 1.1110334752639158e-06, - "loss": 0.5527, - "step": 56259 - }, - { - "epoch": 1.44, - "learning_rate": 1.11100597586315e-06, - "loss": 0.7061, - "step": 56260 - }, - { - "epoch": 1.44, - "learning_rate": 1.1109784763773924e-06, - "loss": 0.7324, - "step": 56261 - }, - { - "epoch": 1.44, - "learning_rate": 1.1109509768066636e-06, - "loss": 0.8184, - "step": 56262 - }, - { - "epoch": 1.44, - "learning_rate": 1.1109234771509846e-06, - "loss": 0.6719, - "step": 56263 - }, - { - "epoch": 1.44, - "learning_rate": 1.1108959774103768e-06, - "loss": 0.623, - "step": 56264 - }, - { - "epoch": 1.44, - "learning_rate": 1.110868477584861e-06, - "loss": 0.7734, - "step": 56265 - }, - { - "epoch": 1.44, - "learning_rate": 1.110840977674458e-06, - "loss": 0.623, - "step": 56266 - }, - { - "epoch": 1.44, - "learning_rate": 1.1108134776791892e-06, - "loss": 0.7168, - "step": 56267 - }, - { - "epoch": 1.44, - "learning_rate": 1.110785977599076e-06, - "loss": 0.4246, - "step": 56268 - }, - { - "epoch": 1.44, - "learning_rate": 1.1107584774341388e-06, - "loss": 0.6787, - "step": 56269 - }, - { - "epoch": 1.44, - "learning_rate": 1.110730977184399e-06, - "loss": 0.5225, - "step": 56270 - }, - { - "epoch": 1.44, - "learning_rate": 1.1107034768498774e-06, - "loss": 0.7051, - "step": 56271 - }, - { - "epoch": 1.44, - "learning_rate": 1.1106759764305957e-06, - "loss": 0.5703, - "step": 56272 - }, - { - "epoch": 1.44, - "learning_rate": 1.110648475926574e-06, - "loss": 0.5923, - "step": 56273 - }, - { - "epoch": 1.44, - "learning_rate": 1.1106209753378342e-06, - "loss": 0.6182, - "step": 56274 - }, - { - "epoch": 1.44, - "learning_rate": 1.1105934746643968e-06, - "loss": 0.6816, - "step": 56275 - }, - { - "epoch": 1.44, - "learning_rate": 1.1105659739062832e-06, - "loss": 0.4753, - "step": 56276 - }, - { - "epoch": 1.44, - "learning_rate": 1.110538473063514e-06, - "loss": 0.6772, - "step": 56277 - }, - { - "epoch": 1.44, - "learning_rate": 1.110510972136111e-06, - "loss": 0.75, - "step": 56278 - }, - { - "epoch": 1.44, - "learning_rate": 1.1104834711240944e-06, - "loss": 0.4956, - "step": 56279 - }, - { - "epoch": 1.44, - "learning_rate": 1.1104559700274862e-06, - "loss": 0.5151, - "step": 56280 - }, - { - "epoch": 1.44, - "learning_rate": 1.1104284688463063e-06, - "loss": 0.6826, - "step": 56281 - }, - { - "epoch": 1.44, - "learning_rate": 1.1104009675805771e-06, - "loss": 0.7178, - "step": 56282 - }, - { - "epoch": 1.44, - "learning_rate": 1.1103734662303185e-06, - "loss": 0.7144, - "step": 56283 - }, - { - "epoch": 1.44, - "learning_rate": 1.1103459647955525e-06, - "loss": 0.6943, - "step": 56284 - }, - { - "epoch": 1.44, - "learning_rate": 1.110318463276299e-06, - "loss": 0.5605, - "step": 56285 - }, - { - "epoch": 1.44, - "learning_rate": 1.1102909616725803e-06, - "loss": 0.6787, - "step": 56286 - }, - { - "epoch": 1.44, - "learning_rate": 1.1102634599844165e-06, - "loss": 0.6406, - "step": 56287 - }, - { - "epoch": 1.44, - "learning_rate": 1.110235958211829e-06, - "loss": 0.52, - "step": 56288 - }, - { - "epoch": 1.44, - "learning_rate": 1.110208456354839e-06, - "loss": 0.5923, - "step": 56289 - }, - { - "epoch": 1.44, - "learning_rate": 1.1101809544134674e-06, - "loss": 0.6514, - "step": 56290 - }, - { - "epoch": 1.44, - "learning_rate": 1.1101534523877356e-06, - "loss": 0.6924, - "step": 56291 - }, - { - "epoch": 1.44, - "learning_rate": 1.110125950277664e-06, - "loss": 0.5315, - "step": 56292 - }, - { - "epoch": 1.44, - "learning_rate": 1.1100984480832744e-06, - "loss": 0.7354, - "step": 56293 - }, - { - "epoch": 1.44, - "learning_rate": 1.1100709458045872e-06, - "loss": 0.5557, - "step": 56294 - }, - { - "epoch": 1.44, - "learning_rate": 1.110043443441624e-06, - "loss": 0.4961, - "step": 56295 - }, - { - "epoch": 1.44, - "learning_rate": 1.1100159409944052e-06, - "loss": 0.8467, - "step": 56296 - }, - { - "epoch": 1.44, - "learning_rate": 1.1099884384629526e-06, - "loss": 0.7793, - "step": 56297 - }, - { - "epoch": 1.44, - "learning_rate": 1.1099609358472869e-06, - "loss": 0.5791, - "step": 56298 - }, - { - "epoch": 1.44, - "learning_rate": 1.1099334331474288e-06, - "loss": 0.623, - "step": 56299 - }, - { - "epoch": 1.44, - "learning_rate": 1.1099059303633999e-06, - "loss": 0.7744, - "step": 56300 - }, - { - "epoch": 1.44, - "learning_rate": 1.1098784274952216e-06, - "loss": 0.7256, - "step": 56301 - }, - { - "epoch": 1.44, - "learning_rate": 1.1098509245429138e-06, - "loss": 0.6189, - "step": 56302 - }, - { - "epoch": 1.44, - "learning_rate": 1.1098234215064983e-06, - "loss": 0.5659, - "step": 56303 - }, - { - "epoch": 1.44, - "learning_rate": 1.109795918385996e-06, - "loss": 0.6904, - "step": 56304 - }, - { - "epoch": 1.44, - "learning_rate": 1.1097684151814281e-06, - "loss": 0.6465, - "step": 56305 - }, - { - "epoch": 1.44, - "learning_rate": 1.1097409118928157e-06, - "loss": 0.4412, - "step": 56306 - }, - { - "epoch": 1.44, - "learning_rate": 1.1097134085201795e-06, - "loss": 0.7998, - "step": 56307 - }, - { - "epoch": 1.44, - "learning_rate": 1.1096859050635412e-06, - "loss": 0.7002, - "step": 56308 - }, - { - "epoch": 1.44, - "learning_rate": 1.1096584015229214e-06, - "loss": 0.542, - "step": 56309 - }, - { - "epoch": 1.44, - "learning_rate": 1.1096308978983406e-06, - "loss": 0.6914, - "step": 56310 - }, - { - "epoch": 1.44, - "learning_rate": 1.109603394189821e-06, - "loss": 0.7559, - "step": 56311 - }, - { - "epoch": 1.44, - "learning_rate": 1.109575890397383e-06, - "loss": 0.6787, - "step": 56312 - }, - { - "epoch": 1.44, - "learning_rate": 1.1095483865210478e-06, - "loss": 0.75, - "step": 56313 - }, - { - "epoch": 1.44, - "learning_rate": 1.1095208825608365e-06, - "loss": 0.7959, - "step": 56314 - }, - { - "epoch": 1.44, - "learning_rate": 1.1094933785167698e-06, - "loss": 0.8008, - "step": 56315 - }, - { - "epoch": 1.44, - "learning_rate": 1.1094658743888694e-06, - "loss": 0.749, - "step": 56316 - }, - { - "epoch": 1.44, - "learning_rate": 1.1094383701771556e-06, - "loss": 0.5176, - "step": 56317 - }, - { - "epoch": 1.44, - "learning_rate": 1.1094108658816504e-06, - "loss": 0.5708, - "step": 56318 - }, - { - "epoch": 1.44, - "learning_rate": 1.109383361502374e-06, - "loss": 0.6504, - "step": 56319 - }, - { - "epoch": 1.44, - "learning_rate": 1.1093558570393478e-06, - "loss": 0.6553, - "step": 56320 - }, - { - "epoch": 1.44, - "learning_rate": 1.109328352492593e-06, - "loss": 0.6279, - "step": 56321 - }, - { - "epoch": 1.44, - "learning_rate": 1.1093008478621304e-06, - "loss": 0.7393, - "step": 56322 - }, - { - "epoch": 1.44, - "learning_rate": 1.109273343147981e-06, - "loss": 0.5605, - "step": 56323 - }, - { - "epoch": 1.44, - "learning_rate": 1.1092458383501663e-06, - "loss": 0.541, - "step": 56324 - }, - { - "epoch": 1.44, - "learning_rate": 1.1092183334687068e-06, - "loss": 0.623, - "step": 56325 - }, - { - "epoch": 1.44, - "learning_rate": 1.1091908285036243e-06, - "loss": 0.5776, - "step": 56326 - }, - { - "epoch": 1.44, - "learning_rate": 1.1091633234549392e-06, - "loss": 0.5137, - "step": 56327 - }, - { - "epoch": 1.44, - "learning_rate": 1.1091358183226728e-06, - "loss": 0.6768, - "step": 56328 - }, - { - "epoch": 1.44, - "learning_rate": 1.1091083131068457e-06, - "loss": 0.6855, - "step": 56329 - }, - { - "epoch": 1.44, - "learning_rate": 1.1090808078074797e-06, - "loss": 0.5562, - "step": 56330 - }, - { - "epoch": 1.44, - "learning_rate": 1.109053302424596e-06, - "loss": 0.5269, - "step": 56331 - }, - { - "epoch": 1.44, - "learning_rate": 1.1090257969582144e-06, - "loss": 0.5513, - "step": 56332 - }, - { - "epoch": 1.44, - "learning_rate": 1.108998291408357e-06, - "loss": 0.6992, - "step": 56333 - }, - { - "epoch": 1.44, - "learning_rate": 1.1089707857750448e-06, - "loss": 0.6943, - "step": 56334 - }, - { - "epoch": 1.44, - "learning_rate": 1.1089432800582985e-06, - "loss": 0.4468, - "step": 56335 - }, - { - "epoch": 1.44, - "learning_rate": 1.1089157742581396e-06, - "loss": 0.8467, - "step": 56336 - }, - { - "epoch": 1.44, - "learning_rate": 1.1088882683745888e-06, - "loss": 0.4954, - "step": 56337 - }, - { - "epoch": 1.44, - "learning_rate": 1.108860762407667e-06, - "loss": 0.5854, - "step": 56338 - }, - { - "epoch": 1.44, - "learning_rate": 1.1088332563573958e-06, - "loss": 0.7012, - "step": 56339 - }, - { - "epoch": 1.44, - "learning_rate": 1.1088057502237958e-06, - "loss": 0.6221, - "step": 56340 - }, - { - "epoch": 1.44, - "learning_rate": 1.1087782440068886e-06, - "loss": 0.5713, - "step": 56341 - }, - { - "epoch": 1.44, - "learning_rate": 1.1087507377066944e-06, - "loss": 0.6562, - "step": 56342 - }, - { - "epoch": 1.44, - "learning_rate": 1.1087232313232351e-06, - "loss": 0.6064, - "step": 56343 - }, - { - "epoch": 1.44, - "learning_rate": 1.1086957248565312e-06, - "loss": 0.7764, - "step": 56344 - }, - { - "epoch": 1.44, - "learning_rate": 1.1086682183066043e-06, - "loss": 0.4702, - "step": 56345 - }, - { - "epoch": 1.44, - "learning_rate": 1.108640711673475e-06, - "loss": 0.543, - "step": 56346 - }, - { - "epoch": 1.44, - "learning_rate": 1.1086132049571645e-06, - "loss": 0.6382, - "step": 56347 - }, - { - "epoch": 1.44, - "learning_rate": 1.1085856981576935e-06, - "loss": 0.8457, - "step": 56348 - }, - { - "epoch": 1.44, - "learning_rate": 1.1085581912750838e-06, - "loss": 0.7754, - "step": 56349 - }, - { - "epoch": 1.44, - "learning_rate": 1.1085306843093561e-06, - "loss": 0.6768, - "step": 56350 - }, - { - "epoch": 1.44, - "learning_rate": 1.1085031772605313e-06, - "loss": 0.7783, - "step": 56351 - }, - { - "epoch": 1.44, - "learning_rate": 1.108475670128631e-06, - "loss": 0.5879, - "step": 56352 - }, - { - "epoch": 1.44, - "learning_rate": 1.1084481629136752e-06, - "loss": 0.5151, - "step": 56353 - }, - { - "epoch": 1.44, - "learning_rate": 1.1084206556156861e-06, - "loss": 0.5261, - "step": 56354 - }, - { - "epoch": 1.44, - "learning_rate": 1.1083931482346842e-06, - "loss": 0.3376, - "step": 56355 - }, - { - "epoch": 1.44, - "learning_rate": 1.1083656407706906e-06, - "loss": 0.5752, - "step": 56356 - }, - { - "epoch": 1.44, - "learning_rate": 1.1083381332237262e-06, - "loss": 0.6621, - "step": 56357 - }, - { - "epoch": 1.44, - "learning_rate": 1.1083106255938126e-06, - "loss": 0.6328, - "step": 56358 - }, - { - "epoch": 1.44, - "learning_rate": 1.1082831178809705e-06, - "loss": 0.6274, - "step": 56359 - }, - { - "epoch": 1.44, - "learning_rate": 1.108255610085221e-06, - "loss": 0.7412, - "step": 56360 - }, - { - "epoch": 1.44, - "learning_rate": 1.1082281022065849e-06, - "loss": 0.6602, - "step": 56361 - }, - { - "epoch": 1.44, - "learning_rate": 1.1082005942450838e-06, - "loss": 0.5127, - "step": 56362 - }, - { - "epoch": 1.44, - "learning_rate": 1.1081730862007384e-06, - "loss": 0.5073, - "step": 56363 - }, - { - "epoch": 1.44, - "learning_rate": 1.1081455780735699e-06, - "loss": 0.5725, - "step": 56364 - }, - { - "epoch": 1.44, - "learning_rate": 1.108118069863599e-06, - "loss": 0.6663, - "step": 56365 - }, - { - "epoch": 1.44, - "learning_rate": 1.1080905615708475e-06, - "loss": 0.876, - "step": 56366 - }, - { - "epoch": 1.44, - "learning_rate": 1.1080630531953357e-06, - "loss": 0.7949, - "step": 56367 - }, - { - "epoch": 1.44, - "learning_rate": 1.1080355447370853e-06, - "loss": 0.6421, - "step": 56368 - }, - { - "epoch": 1.44, - "learning_rate": 1.1080080361961167e-06, - "loss": 0.5767, - "step": 56369 - }, - { - "epoch": 1.44, - "learning_rate": 1.1079805275724513e-06, - "loss": 0.6582, - "step": 56370 - }, - { - "epoch": 1.44, - "learning_rate": 1.1079530188661105e-06, - "loss": 0.4937, - "step": 56371 - }, - { - "epoch": 1.44, - "learning_rate": 1.107925510077115e-06, - "loss": 0.5122, - "step": 56372 - }, - { - "epoch": 1.44, - "learning_rate": 1.1078980012054858e-06, - "loss": 0.6206, - "step": 56373 - }, - { - "epoch": 1.44, - "learning_rate": 1.1078704922512439e-06, - "loss": 0.6416, - "step": 56374 - }, - { - "epoch": 1.44, - "learning_rate": 1.1078429832144105e-06, - "loss": 0.6274, - "step": 56375 - }, - { - "epoch": 1.44, - "learning_rate": 1.107815474095007e-06, - "loss": 0.396, - "step": 56376 - }, - { - "epoch": 1.44, - "learning_rate": 1.1077879648930541e-06, - "loss": 0.55, - "step": 56377 - }, - { - "epoch": 1.44, - "learning_rate": 1.1077604556085727e-06, - "loss": 0.7539, - "step": 56378 - }, - { - "epoch": 1.45, - "learning_rate": 1.1077329462415843e-06, - "loss": 0.6768, - "step": 56379 - }, - { - "epoch": 1.45, - "learning_rate": 1.1077054367921094e-06, - "loss": 0.6792, - "step": 56380 - }, - { - "epoch": 1.45, - "learning_rate": 1.1076779272601698e-06, - "loss": 0.4214, - "step": 56381 - }, - { - "epoch": 1.45, - "learning_rate": 1.107650417645786e-06, - "loss": 0.4958, - "step": 56382 - }, - { - "epoch": 1.45, - "learning_rate": 1.1076229079489793e-06, - "loss": 0.5068, - "step": 56383 - }, - { - "epoch": 1.45, - "learning_rate": 1.1075953981697704e-06, - "loss": 0.8047, - "step": 56384 - }, - { - "epoch": 1.45, - "learning_rate": 1.1075678883081808e-06, - "loss": 0.5239, - "step": 56385 - }, - { - "epoch": 1.45, - "learning_rate": 1.1075403783642317e-06, - "loss": 0.6343, - "step": 56386 - }, - { - "epoch": 1.45, - "learning_rate": 1.1075128683379436e-06, - "loss": 0.5698, - "step": 56387 - }, - { - "epoch": 1.45, - "learning_rate": 1.1074853582293378e-06, - "loss": 0.7754, - "step": 56388 - }, - { - "epoch": 1.45, - "learning_rate": 1.1074578480384356e-06, - "loss": 0.6689, - "step": 56389 - }, - { - "epoch": 1.45, - "learning_rate": 1.1074303377652576e-06, - "loss": 0.6948, - "step": 56390 - }, - { - "epoch": 1.45, - "learning_rate": 1.1074028274098254e-06, - "loss": 0.5737, - "step": 56391 - }, - { - "epoch": 1.45, - "learning_rate": 1.1073753169721596e-06, - "loss": 0.7168, - "step": 56392 - }, - { - "epoch": 1.45, - "learning_rate": 1.1073478064522817e-06, - "loss": 0.439, - "step": 56393 - }, - { - "epoch": 1.45, - "learning_rate": 1.107320295850212e-06, - "loss": 0.7207, - "step": 56394 - }, - { - "epoch": 1.45, - "learning_rate": 1.1072927851659727e-06, - "loss": 0.7285, - "step": 56395 - }, - { - "epoch": 1.45, - "learning_rate": 1.107265274399584e-06, - "loss": 0.4409, - "step": 56396 - }, - { - "epoch": 1.45, - "learning_rate": 1.107237763551067e-06, - "loss": 0.5796, - "step": 56397 - }, - { - "epoch": 1.45, - "learning_rate": 1.1072102526204433e-06, - "loss": 0.5122, - "step": 56398 - }, - { - "epoch": 1.45, - "learning_rate": 1.1071827416077334e-06, - "loss": 0.6602, - "step": 56399 - }, - { - "epoch": 1.45, - "learning_rate": 1.1071552305129587e-06, - "loss": 0.5249, - "step": 56400 - }, - { - "epoch": 1.45, - "learning_rate": 1.1071277193361404e-06, - "loss": 0.5356, - "step": 56401 - }, - { - "epoch": 1.45, - "learning_rate": 1.107100208077299e-06, - "loss": 0.668, - "step": 56402 - }, - { - "epoch": 1.45, - "learning_rate": 1.1070726967364558e-06, - "loss": 0.7998, - "step": 56403 - }, - { - "epoch": 1.45, - "learning_rate": 1.1070451853136324e-06, - "loss": 0.6387, - "step": 56404 - }, - { - "epoch": 1.45, - "learning_rate": 1.1070176738088491e-06, - "loss": 0.4573, - "step": 56405 - }, - { - "epoch": 1.45, - "learning_rate": 1.1069901622221277e-06, - "loss": 0.6602, - "step": 56406 - }, - { - "epoch": 1.45, - "learning_rate": 1.1069626505534884e-06, - "loss": 0.6387, - "step": 56407 - }, - { - "epoch": 1.45, - "learning_rate": 1.1069351388029529e-06, - "loss": 0.707, - "step": 56408 - }, - { - "epoch": 1.45, - "learning_rate": 1.1069076269705416e-06, - "loss": 0.6396, - "step": 56409 - }, - { - "epoch": 1.45, - "learning_rate": 1.1068801150562768e-06, - "loss": 0.6543, - "step": 56410 - }, - { - "epoch": 1.45, - "learning_rate": 1.1068526030601786e-06, - "loss": 0.6377, - "step": 56411 - }, - { - "epoch": 1.45, - "learning_rate": 1.106825090982268e-06, - "loss": 0.5571, - "step": 56412 - }, - { - "epoch": 1.45, - "learning_rate": 1.1067975788225664e-06, - "loss": 0.708, - "step": 56413 - }, - { - "epoch": 1.45, - "learning_rate": 1.106770066581095e-06, - "loss": 0.6528, - "step": 56414 - }, - { - "epoch": 1.45, - "learning_rate": 1.1067425542578747e-06, - "loss": 0.5525, - "step": 56415 - }, - { - "epoch": 1.45, - "learning_rate": 1.1067150418529263e-06, - "loss": 0.7188, - "step": 56416 - }, - { - "epoch": 1.45, - "learning_rate": 1.1066875293662711e-06, - "loss": 0.646, - "step": 56417 - }, - { - "epoch": 1.45, - "learning_rate": 1.1066600167979306e-06, - "loss": 0.5967, - "step": 56418 - }, - { - "epoch": 1.45, - "learning_rate": 1.1066325041479247e-06, - "loss": 0.5171, - "step": 56419 - }, - { - "epoch": 1.45, - "learning_rate": 1.1066049914162757e-06, - "loss": 0.7012, - "step": 56420 - }, - { - "epoch": 1.45, - "learning_rate": 1.1065774786030042e-06, - "loss": 0.6699, - "step": 56421 - }, - { - "epoch": 1.45, - "learning_rate": 1.106549965708131e-06, - "loss": 0.7427, - "step": 56422 - }, - { - "epoch": 1.45, - "learning_rate": 1.1065224527316775e-06, - "loss": 0.665, - "step": 56423 - }, - { - "epoch": 1.45, - "learning_rate": 1.1064949396736644e-06, - "loss": 0.7812, - "step": 56424 - }, - { - "epoch": 1.45, - "learning_rate": 1.1064674265341135e-06, - "loss": 0.791, - "step": 56425 - }, - { - "epoch": 1.45, - "learning_rate": 1.1064399133130451e-06, - "loss": 0.6885, - "step": 56426 - }, - { - "epoch": 1.45, - "learning_rate": 1.1064124000104805e-06, - "loss": 0.6421, - "step": 56427 - }, - { - "epoch": 1.45, - "learning_rate": 1.106384886626441e-06, - "loss": 0.6074, - "step": 56428 - }, - { - "epoch": 1.45, - "learning_rate": 1.1063573731609474e-06, - "loss": 0.6631, - "step": 56429 - }, - { - "epoch": 1.45, - "learning_rate": 1.1063298596140206e-06, - "loss": 0.7188, - "step": 56430 - }, - { - "epoch": 1.45, - "learning_rate": 1.1063023459856825e-06, - "loss": 0.6631, - "step": 56431 - }, - { - "epoch": 1.45, - "learning_rate": 1.1062748322759532e-06, - "loss": 0.6045, - "step": 56432 - }, - { - "epoch": 1.45, - "learning_rate": 1.1062473184848542e-06, - "loss": 0.6421, - "step": 56433 - }, - { - "epoch": 1.45, - "learning_rate": 1.1062198046124062e-06, - "loss": 0.5811, - "step": 56434 - }, - { - "epoch": 1.45, - "learning_rate": 1.106192290658631e-06, - "loss": 0.6694, - "step": 56435 - }, - { - "epoch": 1.45, - "learning_rate": 1.1061647766235492e-06, - "loss": 0.6523, - "step": 56436 - }, - { - "epoch": 1.45, - "learning_rate": 1.106137262507182e-06, - "loss": 0.6421, - "step": 56437 - }, - { - "epoch": 1.45, - "learning_rate": 1.10610974830955e-06, - "loss": 0.665, - "step": 56438 - }, - { - "epoch": 1.45, - "learning_rate": 1.106082234030675e-06, - "loss": 0.6768, - "step": 56439 - }, - { - "epoch": 1.45, - "learning_rate": 1.1060547196705774e-06, - "loss": 0.6299, - "step": 56440 - }, - { - "epoch": 1.45, - "learning_rate": 1.1060272052292789e-06, - "loss": 0.54, - "step": 56441 - }, - { - "epoch": 1.45, - "learning_rate": 1.1059996907068e-06, - "loss": 0.667, - "step": 56442 - }, - { - "epoch": 1.45, - "learning_rate": 1.1059721761031622e-06, - "loss": 0.4976, - "step": 56443 - }, - { - "epoch": 1.45, - "learning_rate": 1.1059446614183862e-06, - "loss": 0.4941, - "step": 56444 - }, - { - "epoch": 1.45, - "learning_rate": 1.1059171466524934e-06, - "loss": 0.627, - "step": 56445 - }, - { - "epoch": 1.45, - "learning_rate": 1.1058896318055047e-06, - "loss": 0.7412, - "step": 56446 - }, - { - "epoch": 1.45, - "learning_rate": 1.105862116877441e-06, - "loss": 0.7568, - "step": 56447 - }, - { - "epoch": 1.45, - "learning_rate": 1.1058346018683239e-06, - "loss": 0.4224, - "step": 56448 - }, - { - "epoch": 1.45, - "learning_rate": 1.1058070867781736e-06, - "loss": 0.5396, - "step": 56449 - }, - { - "epoch": 1.45, - "learning_rate": 1.105779571607012e-06, - "loss": 0.6636, - "step": 56450 - }, - { - "epoch": 1.45, - "learning_rate": 1.10575205635486e-06, - "loss": 0.5659, - "step": 56451 - }, - { - "epoch": 1.45, - "learning_rate": 1.105724541021738e-06, - "loss": 0.7783, - "step": 56452 - }, - { - "epoch": 1.45, - "learning_rate": 1.1056970256076682e-06, - "loss": 0.6167, - "step": 56453 - }, - { - "epoch": 1.45, - "learning_rate": 1.1056695101126704e-06, - "loss": 0.6367, - "step": 56454 - }, - { - "epoch": 1.45, - "learning_rate": 1.1056419945367668e-06, - "loss": 0.6982, - "step": 56455 - }, - { - "epoch": 1.45, - "learning_rate": 1.105614478879978e-06, - "loss": 0.3494, - "step": 56456 - }, - { - "epoch": 1.45, - "learning_rate": 1.1055869631423247e-06, - "loss": 0.7383, - "step": 56457 - }, - { - "epoch": 1.45, - "learning_rate": 1.1055594473238285e-06, - "loss": 0.7461, - "step": 56458 - }, - { - "epoch": 1.45, - "learning_rate": 1.1055319314245104e-06, - "loss": 0.6602, - "step": 56459 - }, - { - "epoch": 1.45, - "learning_rate": 1.105504415444391e-06, - "loss": 0.79, - "step": 56460 - }, - { - "epoch": 1.45, - "learning_rate": 1.1054768993834923e-06, - "loss": 0.6338, - "step": 56461 - }, - { - "epoch": 1.45, - "learning_rate": 1.1054493832418344e-06, - "loss": 0.624, - "step": 56462 - }, - { - "epoch": 1.45, - "learning_rate": 1.1054218670194386e-06, - "loss": 0.6167, - "step": 56463 - }, - { - "epoch": 1.45, - "learning_rate": 1.1053943507163265e-06, - "loss": 0.7227, - "step": 56464 - }, - { - "epoch": 1.45, - "learning_rate": 1.1053668343325185e-06, - "loss": 0.6294, - "step": 56465 - }, - { - "epoch": 1.45, - "learning_rate": 1.1053393178680362e-06, - "loss": 0.6362, - "step": 56466 - }, - { - "epoch": 1.45, - "learning_rate": 1.1053118013229004e-06, - "loss": 0.7896, - "step": 56467 - }, - { - "epoch": 1.45, - "learning_rate": 1.105284284697132e-06, - "loss": 0.614, - "step": 56468 - }, - { - "epoch": 1.45, - "learning_rate": 1.1052567679907522e-06, - "loss": 0.4172, - "step": 56469 - }, - { - "epoch": 1.45, - "learning_rate": 1.105229251203782e-06, - "loss": 0.4801, - "step": 56470 - }, - { - "epoch": 1.45, - "learning_rate": 1.1052017343362435e-06, - "loss": 0.543, - "step": 56471 - }, - { - "epoch": 1.45, - "learning_rate": 1.1051742173881562e-06, - "loss": 0.8379, - "step": 56472 - }, - { - "epoch": 1.45, - "learning_rate": 1.1051467003595418e-06, - "loss": 0.7559, - "step": 56473 - }, - { - "epoch": 1.45, - "learning_rate": 1.1051191832504215e-06, - "loss": 0.5366, - "step": 56474 - }, - { - "epoch": 1.45, - "learning_rate": 1.1050916660608162e-06, - "loss": 0.708, - "step": 56475 - }, - { - "epoch": 1.45, - "learning_rate": 1.1050641487907474e-06, - "loss": 0.6836, - "step": 56476 - }, - { - "epoch": 1.45, - "learning_rate": 1.1050366314402354e-06, - "loss": 0.7637, - "step": 56477 - }, - { - "epoch": 1.45, - "learning_rate": 1.105009114009302e-06, - "loss": 0.6006, - "step": 56478 - }, - { - "epoch": 1.45, - "learning_rate": 1.1049815964979677e-06, - "loss": 0.668, - "step": 56479 - }, - { - "epoch": 1.45, - "learning_rate": 1.1049540789062538e-06, - "loss": 0.4856, - "step": 56480 - }, - { - "epoch": 1.45, - "learning_rate": 1.1049265612341816e-06, - "loss": 0.665, - "step": 56481 - }, - { - "epoch": 1.45, - "learning_rate": 1.1048990434817718e-06, - "loss": 0.5898, - "step": 56482 - }, - { - "epoch": 1.45, - "learning_rate": 1.1048715256490457e-06, - "loss": 0.5728, - "step": 56483 - }, - { - "epoch": 1.45, - "learning_rate": 1.104844007736024e-06, - "loss": 0.645, - "step": 56484 - }, - { - "epoch": 1.45, - "learning_rate": 1.1048164897427287e-06, - "loss": 0.6846, - "step": 56485 - }, - { - "epoch": 1.45, - "learning_rate": 1.1047889716691799e-06, - "loss": 0.6699, - "step": 56486 - }, - { - "epoch": 1.45, - "learning_rate": 1.1047614535153986e-06, - "loss": 0.7446, - "step": 56487 - }, - { - "epoch": 1.45, - "learning_rate": 1.1047339352814067e-06, - "loss": 0.645, - "step": 56488 - }, - { - "epoch": 1.45, - "learning_rate": 1.1047064169672246e-06, - "loss": 0.8428, - "step": 56489 - }, - { - "epoch": 1.45, - "learning_rate": 1.1046788985728739e-06, - "loss": 0.6172, - "step": 56490 - }, - { - "epoch": 1.45, - "learning_rate": 1.1046513800983755e-06, - "loss": 0.5469, - "step": 56491 - }, - { - "epoch": 1.45, - "learning_rate": 1.10462386154375e-06, - "loss": 0.6511, - "step": 56492 - }, - { - "epoch": 1.45, - "learning_rate": 1.1045963429090189e-06, - "loss": 0.8008, - "step": 56493 - }, - { - "epoch": 1.45, - "learning_rate": 1.1045688241942032e-06, - "loss": 0.667, - "step": 56494 - }, - { - "epoch": 1.45, - "learning_rate": 1.1045413053993237e-06, - "loss": 0.6187, - "step": 56495 - }, - { - "epoch": 1.45, - "learning_rate": 1.1045137865244025e-06, - "loss": 0.7109, - "step": 56496 - }, - { - "epoch": 1.45, - "learning_rate": 1.1044862675694592e-06, - "loss": 0.6216, - "step": 56497 - }, - { - "epoch": 1.45, - "learning_rate": 1.1044587485345157e-06, - "loss": 0.6528, - "step": 56498 - }, - { - "epoch": 1.45, - "learning_rate": 1.104431229419593e-06, - "loss": 0.5991, - "step": 56499 - }, - { - "epoch": 1.45, - "learning_rate": 1.1044037102247124e-06, - "loss": 0.7646, - "step": 56500 - }, - { - "epoch": 1.45, - "learning_rate": 1.1043761909498943e-06, - "loss": 0.6465, - "step": 56501 - }, - { - "epoch": 1.45, - "learning_rate": 1.1043486715951605e-06, - "loss": 0.5569, - "step": 56502 - }, - { - "epoch": 1.45, - "learning_rate": 1.1043211521605314e-06, - "loss": 0.6479, - "step": 56503 - }, - { - "epoch": 1.45, - "learning_rate": 1.1042936326460284e-06, - "loss": 0.7061, - "step": 56504 - }, - { - "epoch": 1.45, - "learning_rate": 1.1042661130516724e-06, - "loss": 0.626, - "step": 56505 - }, - { - "epoch": 1.45, - "learning_rate": 1.104238593377485e-06, - "loss": 0.5887, - "step": 56506 - }, - { - "epoch": 1.45, - "learning_rate": 1.104211073623487e-06, - "loss": 0.665, - "step": 56507 - }, - { - "epoch": 1.45, - "learning_rate": 1.104183553789699e-06, - "loss": 0.5913, - "step": 56508 - }, - { - "epoch": 1.45, - "learning_rate": 1.1041560338761425e-06, - "loss": 0.603, - "step": 56509 - }, - { - "epoch": 1.45, - "learning_rate": 1.1041285138828387e-06, - "loss": 0.6504, - "step": 56510 - }, - { - "epoch": 1.45, - "learning_rate": 1.1041009938098084e-06, - "loss": 0.7207, - "step": 56511 - }, - { - "epoch": 1.45, - "learning_rate": 1.1040734736570726e-06, - "loss": 0.5156, - "step": 56512 - }, - { - "epoch": 1.45, - "learning_rate": 1.1040459534246526e-06, - "loss": 0.7041, - "step": 56513 - }, - { - "epoch": 1.45, - "learning_rate": 1.1040184331125694e-06, - "loss": 0.7168, - "step": 56514 - }, - { - "epoch": 1.45, - "learning_rate": 1.1039909127208443e-06, - "loss": 0.6016, - "step": 56515 - }, - { - "epoch": 1.45, - "learning_rate": 1.103963392249498e-06, - "loss": 0.7021, - "step": 56516 - }, - { - "epoch": 1.45, - "learning_rate": 1.1039358716985518e-06, - "loss": 0.5471, - "step": 56517 - }, - { - "epoch": 1.45, - "learning_rate": 1.1039083510680263e-06, - "loss": 0.6567, - "step": 56518 - }, - { - "epoch": 1.45, - "learning_rate": 1.1038808303579435e-06, - "loss": 0.7568, - "step": 56519 - }, - { - "epoch": 1.45, - "learning_rate": 1.1038533095683234e-06, - "loss": 0.8018, - "step": 56520 - }, - { - "epoch": 1.45, - "learning_rate": 1.103825788699188e-06, - "loss": 0.4438, - "step": 56521 - }, - { - "epoch": 1.45, - "learning_rate": 1.1037982677505577e-06, - "loss": 0.6138, - "step": 56522 - }, - { - "epoch": 1.45, - "learning_rate": 1.103770746722454e-06, - "loss": 0.6147, - "step": 56523 - }, - { - "epoch": 1.45, - "learning_rate": 1.1037432256148978e-06, - "loss": 0.604, - "step": 56524 - }, - { - "epoch": 1.45, - "learning_rate": 1.10371570442791e-06, - "loss": 0.7559, - "step": 56525 - }, - { - "epoch": 1.45, - "learning_rate": 1.1036881831615122e-06, - "loss": 0.6504, - "step": 56526 - }, - { - "epoch": 1.45, - "learning_rate": 1.103660661815725e-06, - "loss": 0.6074, - "step": 56527 - }, - { - "epoch": 1.45, - "learning_rate": 1.1036331403905693e-06, - "loss": 0.7148, - "step": 56528 - }, - { - "epoch": 1.45, - "learning_rate": 1.1036056188860667e-06, - "loss": 0.6362, - "step": 56529 - }, - { - "epoch": 1.45, - "learning_rate": 1.1035780973022378e-06, - "loss": 0.6865, - "step": 56530 - }, - { - "epoch": 1.45, - "learning_rate": 1.1035505756391044e-06, - "loss": 0.5837, - "step": 56531 - }, - { - "epoch": 1.45, - "learning_rate": 1.1035230538966868e-06, - "loss": 0.7344, - "step": 56532 - }, - { - "epoch": 1.45, - "learning_rate": 1.1034955320750062e-06, - "loss": 0.71, - "step": 56533 - }, - { - "epoch": 1.45, - "learning_rate": 1.103468010174084e-06, - "loss": 0.4575, - "step": 56534 - }, - { - "epoch": 1.45, - "learning_rate": 1.1034404881939413e-06, - "loss": 0.5784, - "step": 56535 - }, - { - "epoch": 1.45, - "learning_rate": 1.103412966134599e-06, - "loss": 0.6333, - "step": 56536 - }, - { - "epoch": 1.45, - "learning_rate": 1.1033854439960776e-06, - "loss": 0.832, - "step": 56537 - }, - { - "epoch": 1.45, - "learning_rate": 1.1033579217783992e-06, - "loss": 0.5659, - "step": 56538 - }, - { - "epoch": 1.45, - "learning_rate": 1.1033303994815841e-06, - "loss": 0.7041, - "step": 56539 - }, - { - "epoch": 1.45, - "learning_rate": 1.1033028771056539e-06, - "loss": 0.6006, - "step": 56540 - }, - { - "epoch": 1.45, - "learning_rate": 1.1032753546506296e-06, - "loss": 0.5479, - "step": 56541 - }, - { - "epoch": 1.45, - "learning_rate": 1.1032478321165318e-06, - "loss": 0.7539, - "step": 56542 - }, - { - "epoch": 1.45, - "learning_rate": 1.103220309503382e-06, - "loss": 0.6562, - "step": 56543 - }, - { - "epoch": 1.45, - "learning_rate": 1.103192786811201e-06, - "loss": 0.6602, - "step": 56544 - }, - { - "epoch": 1.45, - "learning_rate": 1.1031652640400099e-06, - "loss": 0.4248, - "step": 56545 - }, - { - "epoch": 1.45, - "learning_rate": 1.1031377411898303e-06, - "loss": 0.6362, - "step": 56546 - }, - { - "epoch": 1.45, - "learning_rate": 1.1031102182606825e-06, - "loss": 0.7539, - "step": 56547 - }, - { - "epoch": 1.45, - "learning_rate": 1.1030826952525885e-06, - "loss": 0.8184, - "step": 56548 - }, - { - "epoch": 1.45, - "learning_rate": 1.1030551721655684e-06, - "loss": 0.6245, - "step": 56549 - }, - { - "epoch": 1.45, - "learning_rate": 1.1030276489996437e-06, - "loss": 0.6348, - "step": 56550 - }, - { - "epoch": 1.45, - "learning_rate": 1.1030001257548355e-06, - "loss": 0.5728, - "step": 56551 - }, - { - "epoch": 1.45, - "learning_rate": 1.102972602431165e-06, - "loss": 0.6831, - "step": 56552 - }, - { - "epoch": 1.45, - "learning_rate": 1.1029450790286528e-06, - "loss": 0.6719, - "step": 56553 - }, - { - "epoch": 1.45, - "learning_rate": 1.1029175555473204e-06, - "loss": 0.6768, - "step": 56554 - }, - { - "epoch": 1.45, - "learning_rate": 1.1028900319871887e-06, - "loss": 0.7285, - "step": 56555 - }, - { - "epoch": 1.45, - "learning_rate": 1.1028625083482792e-06, - "loss": 0.6777, - "step": 56556 - }, - { - "epoch": 1.45, - "learning_rate": 1.1028349846306123e-06, - "loss": 0.6387, - "step": 56557 - }, - { - "epoch": 1.45, - "learning_rate": 1.1028074608342093e-06, - "loss": 0.6328, - "step": 56558 - }, - { - "epoch": 1.45, - "learning_rate": 1.1027799369590915e-06, - "loss": 0.5278, - "step": 56559 - }, - { - "epoch": 1.45, - "learning_rate": 1.1027524130052799e-06, - "loss": 0.5601, - "step": 56560 - }, - { - "epoch": 1.45, - "learning_rate": 1.1027248889727956e-06, - "loss": 0.6846, - "step": 56561 - }, - { - "epoch": 1.45, - "learning_rate": 1.1026973648616593e-06, - "loss": 0.6277, - "step": 56562 - }, - { - "epoch": 1.45, - "learning_rate": 1.1026698406718927e-06, - "loss": 0.4536, - "step": 56563 - }, - { - "epoch": 1.45, - "learning_rate": 1.102642316403516e-06, - "loss": 0.5352, - "step": 56564 - }, - { - "epoch": 1.45, - "learning_rate": 1.1026147920565512e-06, - "loss": 0.8076, - "step": 56565 - }, - { - "epoch": 1.45, - "learning_rate": 1.102587267631019e-06, - "loss": 0.5332, - "step": 56566 - }, - { - "epoch": 1.45, - "learning_rate": 1.1025597431269402e-06, - "loss": 0.6172, - "step": 56567 - }, - { - "epoch": 1.45, - "learning_rate": 1.1025322185443362e-06, - "loss": 0.5342, - "step": 56568 - }, - { - "epoch": 1.45, - "learning_rate": 1.1025046938832282e-06, - "loss": 0.6729, - "step": 56569 - }, - { - "epoch": 1.45, - "learning_rate": 1.1024771691436366e-06, - "loss": 0.6685, - "step": 56570 - }, - { - "epoch": 1.45, - "learning_rate": 1.1024496443255835e-06, - "loss": 0.6455, - "step": 56571 - }, - { - "epoch": 1.45, - "learning_rate": 1.102422119429089e-06, - "loss": 0.458, - "step": 56572 - }, - { - "epoch": 1.45, - "learning_rate": 1.1023945944541747e-06, - "loss": 0.4507, - "step": 56573 - }, - { - "epoch": 1.45, - "learning_rate": 1.1023670694008616e-06, - "loss": 0.5264, - "step": 56574 - }, - { - "epoch": 1.45, - "learning_rate": 1.1023395442691707e-06, - "loss": 0.6709, - "step": 56575 - }, - { - "epoch": 1.45, - "learning_rate": 1.1023120190591232e-06, - "loss": 0.7988, - "step": 56576 - }, - { - "epoch": 1.45, - "learning_rate": 1.10228449377074e-06, - "loss": 0.6143, - "step": 56577 - }, - { - "epoch": 1.45, - "learning_rate": 1.1022569684040423e-06, - "loss": 0.6001, - "step": 56578 - }, - { - "epoch": 1.45, - "learning_rate": 1.102229442959051e-06, - "loss": 0.6233, - "step": 56579 - }, - { - "epoch": 1.45, - "learning_rate": 1.1022019174357877e-06, - "loss": 0.6689, - "step": 56580 - }, - { - "epoch": 1.45, - "learning_rate": 1.102174391834273e-06, - "loss": 0.3196, - "step": 56581 - }, - { - "epoch": 1.45, - "learning_rate": 1.102146866154528e-06, - "loss": 0.6592, - "step": 56582 - }, - { - "epoch": 1.45, - "learning_rate": 1.1021193403965737e-06, - "loss": 0.6851, - "step": 56583 - }, - { - "epoch": 1.45, - "learning_rate": 1.1020918145604313e-06, - "loss": 0.5137, - "step": 56584 - }, - { - "epoch": 1.45, - "learning_rate": 1.102064288646122e-06, - "loss": 0.6709, - "step": 56585 - }, - { - "epoch": 1.45, - "learning_rate": 1.102036762653667e-06, - "loss": 0.7402, - "step": 56586 - }, - { - "epoch": 1.45, - "learning_rate": 1.1020092365830867e-06, - "loss": 0.5933, - "step": 56587 - }, - { - "epoch": 1.45, - "learning_rate": 1.1019817104344027e-06, - "loss": 0.5391, - "step": 56588 - }, - { - "epoch": 1.45, - "learning_rate": 1.1019541842076362e-06, - "loss": 0.6177, - "step": 56589 - }, - { - "epoch": 1.45, - "learning_rate": 1.1019266579028082e-06, - "loss": 0.6763, - "step": 56590 - }, - { - "epoch": 1.45, - "learning_rate": 1.1018991315199392e-06, - "loss": 0.6611, - "step": 56591 - }, - { - "epoch": 1.45, - "learning_rate": 1.1018716050590511e-06, - "loss": 0.6963, - "step": 56592 - }, - { - "epoch": 1.45, - "learning_rate": 1.1018440785201642e-06, - "loss": 0.6162, - "step": 56593 - }, - { - "epoch": 1.45, - "learning_rate": 1.1018165519033003e-06, - "loss": 0.7451, - "step": 56594 - }, - { - "epoch": 1.45, - "learning_rate": 1.10178902520848e-06, - "loss": 0.6963, - "step": 56595 - }, - { - "epoch": 1.45, - "learning_rate": 1.1017614984357246e-06, - "loss": 0.483, - "step": 56596 - }, - { - "epoch": 1.45, - "learning_rate": 1.101733971585055e-06, - "loss": 0.6191, - "step": 56597 - }, - { - "epoch": 1.45, - "learning_rate": 1.1017064446564925e-06, - "loss": 0.6934, - "step": 56598 - }, - { - "epoch": 1.45, - "learning_rate": 1.101678917650058e-06, - "loss": 0.6914, - "step": 56599 - }, - { - "epoch": 1.45, - "learning_rate": 1.1016513905657727e-06, - "loss": 0.5852, - "step": 56600 - }, - { - "epoch": 1.45, - "learning_rate": 1.1016238634036576e-06, - "loss": 0.7051, - "step": 56601 - }, - { - "epoch": 1.45, - "learning_rate": 1.1015963361637334e-06, - "loss": 0.5098, - "step": 56602 - }, - { - "epoch": 1.45, - "learning_rate": 1.1015688088460221e-06, - "loss": 0.4705, - "step": 56603 - }, - { - "epoch": 1.45, - "learning_rate": 1.101541281450544e-06, - "loss": 0.4229, - "step": 56604 - }, - { - "epoch": 1.45, - "learning_rate": 1.1015137539773208e-06, - "loss": 0.666, - "step": 56605 - }, - { - "epoch": 1.45, - "learning_rate": 1.1014862264263724e-06, - "loss": 0.6196, - "step": 56606 - }, - { - "epoch": 1.45, - "learning_rate": 1.1014586987977213e-06, - "loss": 0.7593, - "step": 56607 - }, - { - "epoch": 1.45, - "learning_rate": 1.1014311710913875e-06, - "loss": 0.6187, - "step": 56608 - }, - { - "epoch": 1.45, - "learning_rate": 1.1014036433073928e-06, - "loss": 0.5039, - "step": 56609 - }, - { - "epoch": 1.45, - "learning_rate": 1.1013761154457579e-06, - "loss": 0.7217, - "step": 56610 - }, - { - "epoch": 1.45, - "learning_rate": 1.101348587506504e-06, - "loss": 0.748, - "step": 56611 - }, - { - "epoch": 1.45, - "learning_rate": 1.101321059489652e-06, - "loss": 0.6333, - "step": 56612 - }, - { - "epoch": 1.45, - "learning_rate": 1.1012935313952233e-06, - "loss": 0.6177, - "step": 56613 - }, - { - "epoch": 1.45, - "learning_rate": 1.1012660032232389e-06, - "loss": 0.7764, - "step": 56614 - }, - { - "epoch": 1.45, - "learning_rate": 1.1012384749737198e-06, - "loss": 0.561, - "step": 56615 - }, - { - "epoch": 1.45, - "learning_rate": 1.1012109466466868e-06, - "loss": 0.7354, - "step": 56616 - }, - { - "epoch": 1.45, - "learning_rate": 1.1011834182421613e-06, - "loss": 0.7598, - "step": 56617 - }, - { - "epoch": 1.45, - "learning_rate": 1.1011558897601643e-06, - "loss": 0.8389, - "step": 56618 - }, - { - "epoch": 1.45, - "learning_rate": 1.101128361200717e-06, - "loss": 0.8037, - "step": 56619 - }, - { - "epoch": 1.45, - "learning_rate": 1.1011008325638402e-06, - "loss": 0.5759, - "step": 56620 - }, - { - "epoch": 1.45, - "learning_rate": 1.1010733038495552e-06, - "loss": 0.6973, - "step": 56621 - }, - { - "epoch": 1.45, - "learning_rate": 1.101045775057883e-06, - "loss": 0.6167, - "step": 56622 - }, - { - "epoch": 1.45, - "learning_rate": 1.1010182461888446e-06, - "loss": 0.6406, - "step": 56623 - }, - { - "epoch": 1.45, - "learning_rate": 1.1009907172424615e-06, - "loss": 0.4915, - "step": 56624 - }, - { - "epoch": 1.45, - "learning_rate": 1.1009631882187543e-06, - "loss": 0.5762, - "step": 56625 - }, - { - "epoch": 1.45, - "learning_rate": 1.1009356591177441e-06, - "loss": 0.708, - "step": 56626 - }, - { - "epoch": 1.45, - "learning_rate": 1.1009081299394524e-06, - "loss": 0.4434, - "step": 56627 - }, - { - "epoch": 1.45, - "learning_rate": 1.1008806006838995e-06, - "loss": 0.6699, - "step": 56628 - }, - { - "epoch": 1.45, - "learning_rate": 1.1008530713511073e-06, - "loss": 0.5122, - "step": 56629 - }, - { - "epoch": 1.45, - "learning_rate": 1.1008255419410967e-06, - "loss": 0.6191, - "step": 56630 - }, - { - "epoch": 1.45, - "learning_rate": 1.1007980124538882e-06, - "loss": 0.5195, - "step": 56631 - }, - { - "epoch": 1.45, - "learning_rate": 1.1007704828895038e-06, - "loss": 0.6558, - "step": 56632 - }, - { - "epoch": 1.45, - "learning_rate": 1.1007429532479636e-06, - "loss": 0.4116, - "step": 56633 - }, - { - "epoch": 1.45, - "learning_rate": 1.1007154235292893e-06, - "loss": 0.5103, - "step": 56634 - }, - { - "epoch": 1.45, - "learning_rate": 1.100687893733502e-06, - "loss": 0.7344, - "step": 56635 - }, - { - "epoch": 1.45, - "learning_rate": 1.1006603638606225e-06, - "loss": 0.7012, - "step": 56636 - }, - { - "epoch": 1.45, - "learning_rate": 1.1006328339106719e-06, - "loss": 0.6414, - "step": 56637 - }, - { - "epoch": 1.45, - "learning_rate": 1.1006053038836713e-06, - "loss": 0.5527, - "step": 56638 - }, - { - "epoch": 1.45, - "learning_rate": 1.100577773779642e-06, - "loss": 0.7227, - "step": 56639 - }, - { - "epoch": 1.45, - "learning_rate": 1.1005502435986049e-06, - "loss": 0.4365, - "step": 56640 - }, - { - "epoch": 1.45, - "learning_rate": 1.1005227133405812e-06, - "loss": 0.6777, - "step": 56641 - }, - { - "epoch": 1.45, - "learning_rate": 1.1004951830055918e-06, - "loss": 0.6782, - "step": 56642 - }, - { - "epoch": 1.45, - "learning_rate": 1.1004676525936575e-06, - "loss": 0.2974, - "step": 56643 - }, - { - "epoch": 1.45, - "learning_rate": 1.1004401221048004e-06, - "loss": 0.5361, - "step": 56644 - }, - { - "epoch": 1.45, - "learning_rate": 1.1004125915390405e-06, - "loss": 0.5715, - "step": 56645 - }, - { - "epoch": 1.45, - "learning_rate": 1.1003850608963994e-06, - "loss": 0.752, - "step": 56646 - }, - { - "epoch": 1.45, - "learning_rate": 1.1003575301768981e-06, - "loss": 0.7012, - "step": 56647 - }, - { - "epoch": 1.45, - "learning_rate": 1.1003299993805575e-06, - "loss": 0.6572, - "step": 56648 - }, - { - "epoch": 1.45, - "learning_rate": 1.100302468507399e-06, - "loss": 0.5986, - "step": 56649 - }, - { - "epoch": 1.45, - "learning_rate": 1.1002749375574433e-06, - "loss": 0.707, - "step": 56650 - }, - { - "epoch": 1.45, - "learning_rate": 1.1002474065307122e-06, - "loss": 0.5713, - "step": 56651 - }, - { - "epoch": 1.45, - "learning_rate": 1.1002198754272257e-06, - "loss": 0.595, - "step": 56652 - }, - { - "epoch": 1.45, - "learning_rate": 1.1001923442470059e-06, - "loss": 0.6543, - "step": 56653 - }, - { - "epoch": 1.45, - "learning_rate": 1.100164812990073e-06, - "loss": 0.54, - "step": 56654 - }, - { - "epoch": 1.45, - "learning_rate": 1.100137281656449e-06, - "loss": 0.6484, - "step": 56655 - }, - { - "epoch": 1.45, - "learning_rate": 1.100109750246154e-06, - "loss": 0.5527, - "step": 56656 - }, - { - "epoch": 1.45, - "learning_rate": 1.1000822187592098e-06, - "loss": 0.7207, - "step": 56657 - }, - { - "epoch": 1.45, - "learning_rate": 1.1000546871956372e-06, - "loss": 0.7158, - "step": 56658 - }, - { - "epoch": 1.45, - "learning_rate": 1.1000271555554573e-06, - "loss": 0.7422, - "step": 56659 - }, - { - "epoch": 1.45, - "learning_rate": 1.0999996238386912e-06, - "loss": 0.6997, - "step": 56660 - }, - { - "epoch": 1.45, - "learning_rate": 1.0999720920453601e-06, - "loss": 0.6924, - "step": 56661 - }, - { - "epoch": 1.45, - "learning_rate": 1.0999445601754848e-06, - "loss": 0.5986, - "step": 56662 - }, - { - "epoch": 1.45, - "learning_rate": 1.0999170282290868e-06, - "loss": 0.6523, - "step": 56663 - }, - { - "epoch": 1.45, - "learning_rate": 1.0998894962061867e-06, - "loss": 0.6035, - "step": 56664 - }, - { - "epoch": 1.45, - "learning_rate": 1.099861964106806e-06, - "loss": 0.4531, - "step": 56665 - }, - { - "epoch": 1.45, - "learning_rate": 1.0998344319309653e-06, - "loss": 0.5991, - "step": 56666 - }, - { - "epoch": 1.45, - "learning_rate": 1.099806899678686e-06, - "loss": 0.6914, - "step": 56667 - }, - { - "epoch": 1.45, - "learning_rate": 1.0997793673499894e-06, - "loss": 0.3951, - "step": 56668 - }, - { - "epoch": 1.45, - "learning_rate": 1.099751834944896e-06, - "loss": 0.6123, - "step": 56669 - }, - { - "epoch": 1.45, - "learning_rate": 1.0997243024634277e-06, - "loss": 0.5977, - "step": 56670 - }, - { - "epoch": 1.45, - "learning_rate": 1.0996967699056045e-06, - "loss": 0.6592, - "step": 56671 - }, - { - "epoch": 1.45, - "learning_rate": 1.0996692372714486e-06, - "loss": 0.6436, - "step": 56672 - }, - { - "epoch": 1.45, - "learning_rate": 1.09964170456098e-06, - "loss": 0.7129, - "step": 56673 - }, - { - "epoch": 1.45, - "learning_rate": 1.0996141717742208e-06, - "loss": 0.7407, - "step": 56674 - }, - { - "epoch": 1.45, - "learning_rate": 1.0995866389111917e-06, - "loss": 0.6309, - "step": 56675 - }, - { - "epoch": 1.45, - "learning_rate": 1.0995591059719134e-06, - "loss": 0.5547, - "step": 56676 - }, - { - "epoch": 1.45, - "learning_rate": 1.0995315729564071e-06, - "loss": 0.6196, - "step": 56677 - }, - { - "epoch": 1.45, - "learning_rate": 1.0995040398646944e-06, - "loss": 0.7012, - "step": 56678 - }, - { - "epoch": 1.45, - "learning_rate": 1.0994765066967957e-06, - "loss": 0.6104, - "step": 56679 - }, - { - "epoch": 1.45, - "learning_rate": 1.0994489734527329e-06, - "loss": 0.5745, - "step": 56680 - }, - { - "epoch": 1.45, - "learning_rate": 1.0994214401325262e-06, - "loss": 0.5231, - "step": 56681 - }, - { - "epoch": 1.45, - "learning_rate": 1.0993939067361973e-06, - "loss": 0.5986, - "step": 56682 - }, - { - "epoch": 1.45, - "learning_rate": 1.0993663732637666e-06, - "loss": 0.5654, - "step": 56683 - }, - { - "epoch": 1.45, - "learning_rate": 1.0993388397152562e-06, - "loss": 0.6284, - "step": 56684 - }, - { - "epoch": 1.45, - "learning_rate": 1.0993113060906865e-06, - "loss": 0.7295, - "step": 56685 - }, - { - "epoch": 1.45, - "learning_rate": 1.0992837723900784e-06, - "loss": 0.6416, - "step": 56686 - }, - { - "epoch": 1.45, - "learning_rate": 1.0992562386134533e-06, - "loss": 0.8086, - "step": 56687 - }, - { - "epoch": 1.45, - "learning_rate": 1.0992287047608327e-06, - "loss": 0.6133, - "step": 56688 - }, - { - "epoch": 1.45, - "learning_rate": 1.0992011708322366e-06, - "loss": 0.8076, - "step": 56689 - }, - { - "epoch": 1.45, - "learning_rate": 1.0991736368276874e-06, - "loss": 0.6313, - "step": 56690 - }, - { - "epoch": 1.45, - "learning_rate": 1.0991461027472052e-06, - "loss": 0.6992, - "step": 56691 - }, - { - "epoch": 1.45, - "learning_rate": 1.099118568590811e-06, - "loss": 0.6836, - "step": 56692 - }, - { - "epoch": 1.45, - "learning_rate": 1.0990910343585269e-06, - "loss": 0.6104, - "step": 56693 - }, - { - "epoch": 1.45, - "learning_rate": 1.099063500050373e-06, - "loss": 0.6245, - "step": 56694 - }, - { - "epoch": 1.45, - "learning_rate": 1.099035965666371e-06, - "loss": 0.6108, - "step": 56695 - }, - { - "epoch": 1.45, - "learning_rate": 1.0990084312065415e-06, - "loss": 0.5784, - "step": 56696 - }, - { - "epoch": 1.45, - "learning_rate": 1.098980896670906e-06, - "loss": 0.6504, - "step": 56697 - }, - { - "epoch": 1.45, - "learning_rate": 1.098953362059485e-06, - "loss": 0.6094, - "step": 56698 - }, - { - "epoch": 1.45, - "learning_rate": 1.0989258273723004e-06, - "loss": 0.5684, - "step": 56699 - }, - { - "epoch": 1.45, - "learning_rate": 1.0988982926093726e-06, - "loss": 0.7168, - "step": 56700 - }, - { - "epoch": 1.45, - "learning_rate": 1.098870757770723e-06, - "loss": 0.5254, - "step": 56701 - }, - { - "epoch": 1.45, - "learning_rate": 1.0988432228563724e-06, - "loss": 0.7627, - "step": 56702 - }, - { - "epoch": 1.45, - "learning_rate": 1.0988156878663423e-06, - "loss": 0.5981, - "step": 56703 - }, - { - "epoch": 1.45, - "learning_rate": 1.0987881528006534e-06, - "loss": 0.6602, - "step": 56704 - }, - { - "epoch": 1.45, - "learning_rate": 1.0987606176593274e-06, - "loss": 0.7236, - "step": 56705 - }, - { - "epoch": 1.45, - "learning_rate": 1.0987330824423847e-06, - "loss": 0.8428, - "step": 56706 - }, - { - "epoch": 1.45, - "learning_rate": 1.0987055471498463e-06, - "loss": 0.4424, - "step": 56707 - }, - { - "epoch": 1.45, - "learning_rate": 1.0986780117817338e-06, - "loss": 0.8184, - "step": 56708 - }, - { - "epoch": 1.45, - "learning_rate": 1.098650476338068e-06, - "loss": 0.6484, - "step": 56709 - }, - { - "epoch": 1.45, - "learning_rate": 1.0986229408188705e-06, - "loss": 0.4733, - "step": 56710 - }, - { - "epoch": 1.45, - "learning_rate": 1.0985954052241615e-06, - "loss": 0.6626, - "step": 56711 - }, - { - "epoch": 1.45, - "learning_rate": 1.0985678695539627e-06, - "loss": 0.6514, - "step": 56712 - }, - { - "epoch": 1.45, - "learning_rate": 1.0985403338082948e-06, - "loss": 0.7246, - "step": 56713 - }, - { - "epoch": 1.45, - "learning_rate": 1.0985127979871793e-06, - "loss": 0.5447, - "step": 56714 - }, - { - "epoch": 1.45, - "learning_rate": 1.0984852620906372e-06, - "loss": 0.5869, - "step": 56715 - }, - { - "epoch": 1.45, - "learning_rate": 1.0984577261186893e-06, - "loss": 0.7363, - "step": 56716 - }, - { - "epoch": 1.45, - "learning_rate": 1.0984301900713568e-06, - "loss": 0.4236, - "step": 56717 - }, - { - "epoch": 1.45, - "learning_rate": 1.0984026539486612e-06, - "loss": 0.7334, - "step": 56718 - }, - { - "epoch": 1.45, - "learning_rate": 1.0983751177506224e-06, - "loss": 0.7065, - "step": 56719 - }, - { - "epoch": 1.45, - "learning_rate": 1.098347581477263e-06, - "loss": 0.6074, - "step": 56720 - }, - { - "epoch": 1.45, - "learning_rate": 1.0983200451286032e-06, - "loss": 0.605, - "step": 56721 - }, - { - "epoch": 1.45, - "learning_rate": 1.0982925087046644e-06, - "loss": 0.5889, - "step": 56722 - }, - { - "epoch": 1.45, - "learning_rate": 1.0982649722054672e-06, - "loss": 0.7549, - "step": 56723 - }, - { - "epoch": 1.45, - "learning_rate": 1.0982374356310333e-06, - "loss": 0.7979, - "step": 56724 - }, - { - "epoch": 1.45, - "learning_rate": 1.0982098989813834e-06, - "loss": 0.6592, - "step": 56725 - }, - { - "epoch": 1.45, - "learning_rate": 1.0981823622565389e-06, - "loss": 0.6992, - "step": 56726 - }, - { - "epoch": 1.45, - "learning_rate": 1.0981548254565205e-06, - "loss": 0.8091, - "step": 56727 - }, - { - "epoch": 1.45, - "learning_rate": 1.0981272885813494e-06, - "loss": 0.5894, - "step": 56728 - }, - { - "epoch": 1.45, - "learning_rate": 1.0980997516310467e-06, - "loss": 0.7158, - "step": 56729 - }, - { - "epoch": 1.45, - "learning_rate": 1.0980722146056338e-06, - "loss": 0.7471, - "step": 56730 - }, - { - "epoch": 1.45, - "learning_rate": 1.0980446775051314e-06, - "loss": 0.5647, - "step": 56731 - }, - { - "epoch": 1.45, - "learning_rate": 1.0980171403295609e-06, - "loss": 0.6719, - "step": 56732 - }, - { - "epoch": 1.45, - "learning_rate": 1.0979896030789426e-06, - "loss": 0.5535, - "step": 56733 - }, - { - "epoch": 1.45, - "learning_rate": 1.0979620657532986e-06, - "loss": 0.5576, - "step": 56734 - }, - { - "epoch": 1.45, - "learning_rate": 1.0979345283526495e-06, - "loss": 0.5015, - "step": 56735 - }, - { - "epoch": 1.45, - "learning_rate": 1.0979069908770163e-06, - "loss": 0.6304, - "step": 56736 - }, - { - "epoch": 1.45, - "learning_rate": 1.0978794533264205e-06, - "loss": 0.6019, - "step": 56737 - }, - { - "epoch": 1.45, - "learning_rate": 1.0978519157008826e-06, - "loss": 0.4805, - "step": 56738 - }, - { - "epoch": 1.45, - "learning_rate": 1.097824378000424e-06, - "loss": 0.6025, - "step": 56739 - }, - { - "epoch": 1.45, - "learning_rate": 1.0977968402250658e-06, - "loss": 0.7637, - "step": 56740 - }, - { - "epoch": 1.45, - "learning_rate": 1.0977693023748294e-06, - "loss": 0.8003, - "step": 56741 - }, - { - "epoch": 1.45, - "learning_rate": 1.097741764449735e-06, - "loss": 0.8115, - "step": 56742 - }, - { - "epoch": 1.45, - "learning_rate": 1.0977142264498048e-06, - "loss": 0.7285, - "step": 56743 - }, - { - "epoch": 1.45, - "learning_rate": 1.0976866883750589e-06, - "loss": 0.749, - "step": 56744 - }, - { - "epoch": 1.45, - "learning_rate": 1.097659150225519e-06, - "loss": 0.8984, - "step": 56745 - }, - { - "epoch": 1.45, - "learning_rate": 1.097631612001206e-06, - "loss": 0.5142, - "step": 56746 - }, - { - "epoch": 1.45, - "learning_rate": 1.097604073702141e-06, - "loss": 0.6216, - "step": 56747 - }, - { - "epoch": 1.45, - "learning_rate": 1.0975765353283447e-06, - "loss": 0.5035, - "step": 56748 - }, - { - "epoch": 1.45, - "learning_rate": 1.0975489968798387e-06, - "loss": 0.6621, - "step": 56749 - }, - { - "epoch": 1.45, - "learning_rate": 1.0975214583566438e-06, - "loss": 0.5767, - "step": 56750 - }, - { - "epoch": 1.45, - "learning_rate": 1.0974939197587816e-06, - "loss": 0.6211, - "step": 56751 - }, - { - "epoch": 1.45, - "learning_rate": 1.0974663810862724e-06, - "loss": 0.6016, - "step": 56752 - }, - { - "epoch": 1.45, - "learning_rate": 1.097438842339138e-06, - "loss": 0.5576, - "step": 56753 - }, - { - "epoch": 1.45, - "learning_rate": 1.0974113035173987e-06, - "loss": 0.5081, - "step": 56754 - }, - { - "epoch": 1.45, - "learning_rate": 1.0973837646210764e-06, - "loss": 0.4861, - "step": 56755 - }, - { - "epoch": 1.45, - "learning_rate": 1.0973562256501918e-06, - "loss": 0.6514, - "step": 56756 - }, - { - "epoch": 1.45, - "learning_rate": 1.0973286866047658e-06, - "loss": 0.5967, - "step": 56757 - }, - { - "epoch": 1.45, - "learning_rate": 1.09730114748482e-06, - "loss": 0.5308, - "step": 56758 - }, - { - "epoch": 1.45, - "learning_rate": 1.0972736082903748e-06, - "loss": 0.6289, - "step": 56759 - }, - { - "epoch": 1.45, - "learning_rate": 1.0972460690214522e-06, - "loss": 0.751, - "step": 56760 - }, - { - "epoch": 1.45, - "learning_rate": 1.0972185296780724e-06, - "loss": 0.665, - "step": 56761 - }, - { - "epoch": 1.45, - "learning_rate": 1.097190990260257e-06, - "loss": 0.7583, - "step": 56762 - }, - { - "epoch": 1.45, - "learning_rate": 1.0971634507680268e-06, - "loss": 0.6885, - "step": 56763 - }, - { - "epoch": 1.45, - "learning_rate": 1.0971359112014028e-06, - "loss": 0.5957, - "step": 56764 - }, - { - "epoch": 1.45, - "learning_rate": 1.0971083715604068e-06, - "loss": 0.6855, - "step": 56765 - }, - { - "epoch": 1.45, - "learning_rate": 1.0970808318450592e-06, - "loss": 0.9736, - "step": 56766 - }, - { - "epoch": 1.45, - "learning_rate": 1.0970532920553812e-06, - "loss": 0.6663, - "step": 56767 - }, - { - "epoch": 1.45, - "learning_rate": 1.097025752191394e-06, - "loss": 0.7373, - "step": 56768 - }, - { - "epoch": 1.46, - "learning_rate": 1.0969982122531186e-06, - "loss": 0.7295, - "step": 56769 - }, - { - "epoch": 1.46, - "learning_rate": 1.0969706722405762e-06, - "loss": 0.6836, - "step": 56770 - }, - { - "epoch": 1.46, - "learning_rate": 1.0969431321537877e-06, - "loss": 0.7231, - "step": 56771 - }, - { - "epoch": 1.46, - "learning_rate": 1.0969155919927744e-06, - "loss": 0.5112, - "step": 56772 - }, - { - "epoch": 1.46, - "learning_rate": 1.0968880517575573e-06, - "loss": 0.6279, - "step": 56773 - }, - { - "epoch": 1.46, - "learning_rate": 1.0968605114481573e-06, - "loss": 0.6284, - "step": 56774 - }, - { - "epoch": 1.46, - "learning_rate": 1.0968329710645959e-06, - "loss": 0.5999, - "step": 56775 - }, - { - "epoch": 1.46, - "learning_rate": 1.0968054306068936e-06, - "loss": 0.6533, - "step": 56776 - }, - { - "epoch": 1.46, - "learning_rate": 1.0967778900750722e-06, - "loss": 0.665, - "step": 56777 - }, - { - "epoch": 1.46, - "learning_rate": 1.0967503494691523e-06, - "loss": 0.7852, - "step": 56778 - }, - { - "epoch": 1.46, - "learning_rate": 1.096722808789155e-06, - "loss": 0.543, - "step": 56779 - }, - { - "epoch": 1.46, - "learning_rate": 1.0966952680351017e-06, - "loss": 0.583, - "step": 56780 - }, - { - "epoch": 1.46, - "learning_rate": 1.096667727207013e-06, - "loss": 0.7451, - "step": 56781 - }, - { - "epoch": 1.46, - "learning_rate": 1.0966401863049104e-06, - "loss": 0.6592, - "step": 56782 - }, - { - "epoch": 1.46, - "learning_rate": 1.0966126453288148e-06, - "loss": 0.4889, - "step": 56783 - }, - { - "epoch": 1.46, - "learning_rate": 1.0965851042787475e-06, - "loss": 0.5464, - "step": 56784 - }, - { - "epoch": 1.46, - "learning_rate": 1.0965575631547298e-06, - "loss": 0.6841, - "step": 56785 - }, - { - "epoch": 1.46, - "learning_rate": 1.0965300219567817e-06, - "loss": 0.4351, - "step": 56786 - }, - { - "epoch": 1.46, - "learning_rate": 1.0965024806849251e-06, - "loss": 0.644, - "step": 56787 - }, - { - "epoch": 1.46, - "learning_rate": 1.0964749393391813e-06, - "loss": 0.7676, - "step": 56788 - }, - { - "epoch": 1.46, - "learning_rate": 1.0964473979195708e-06, - "loss": 0.6128, - "step": 56789 - }, - { - "epoch": 1.46, - "learning_rate": 1.0964198564261152e-06, - "loss": 0.6831, - "step": 56790 - }, - { - "epoch": 1.46, - "learning_rate": 1.0963923148588351e-06, - "loss": 0.6558, - "step": 56791 - }, - { - "epoch": 1.46, - "learning_rate": 1.096364773217752e-06, - "loss": 0.626, - "step": 56792 - }, - { - "epoch": 1.46, - "learning_rate": 1.096337231502887e-06, - "loss": 0.7285, - "step": 56793 - }, - { - "epoch": 1.46, - "learning_rate": 1.0963096897142606e-06, - "loss": 0.6313, - "step": 56794 - }, - { - "epoch": 1.46, - "learning_rate": 1.0962821478518946e-06, - "loss": 0.511, - "step": 56795 - }, - { - "epoch": 1.46, - "learning_rate": 1.0962546059158097e-06, - "loss": 0.7656, - "step": 56796 - }, - { - "epoch": 1.46, - "learning_rate": 1.096227063906027e-06, - "loss": 0.6699, - "step": 56797 - }, - { - "epoch": 1.46, - "learning_rate": 1.0961995218225677e-06, - "loss": 0.6885, - "step": 56798 - }, - { - "epoch": 1.46, - "learning_rate": 1.0961719796654529e-06, - "loss": 0.5815, - "step": 56799 - }, - { - "epoch": 1.46, - "learning_rate": 1.0961444374347038e-06, - "loss": 0.626, - "step": 56800 - }, - { - "epoch": 1.46, - "learning_rate": 1.096116895130341e-06, - "loss": 0.5811, - "step": 56801 - }, - { - "epoch": 1.46, - "learning_rate": 1.096089352752386e-06, - "loss": 0.4661, - "step": 56802 - }, - { - "epoch": 1.46, - "learning_rate": 1.0960618103008599e-06, - "loss": 0.707, - "step": 56803 - }, - { - "epoch": 1.46, - "learning_rate": 1.0960342677757836e-06, - "loss": 0.6045, - "step": 56804 - }, - { - "epoch": 1.46, - "learning_rate": 1.0960067251771782e-06, - "loss": 0.8018, - "step": 56805 - }, - { - "epoch": 1.46, - "learning_rate": 1.0959791825050653e-06, - "loss": 0.5312, - "step": 56806 - }, - { - "epoch": 1.46, - "learning_rate": 1.095951639759465e-06, - "loss": 0.5903, - "step": 56807 - }, - { - "epoch": 1.46, - "learning_rate": 1.0959240969403994e-06, - "loss": 0.5641, - "step": 56808 - }, - { - "epoch": 1.46, - "learning_rate": 1.0958965540478887e-06, - "loss": 0.6401, - "step": 56809 - }, - { - "epoch": 1.46, - "learning_rate": 1.0958690110819548e-06, - "loss": 0.6313, - "step": 56810 - }, - { - "epoch": 1.46, - "learning_rate": 1.0958414680426183e-06, - "loss": 0.709, - "step": 56811 - }, - { - "epoch": 1.46, - "learning_rate": 1.0958139249299004e-06, - "loss": 0.5229, - "step": 56812 - }, - { - "epoch": 1.46, - "learning_rate": 1.0957863817438218e-06, - "loss": 0.6099, - "step": 56813 - }, - { - "epoch": 1.46, - "learning_rate": 1.0957588384844043e-06, - "loss": 0.7412, - "step": 56814 - }, - { - "epoch": 1.46, - "learning_rate": 1.095731295151669e-06, - "loss": 0.4451, - "step": 56815 - }, - { - "epoch": 1.46, - "learning_rate": 1.0957037517456362e-06, - "loss": 0.7109, - "step": 56816 - }, - { - "epoch": 1.46, - "learning_rate": 1.0956762082663273e-06, - "loss": 0.4841, - "step": 56817 - }, - { - "epoch": 1.46, - "learning_rate": 1.095648664713764e-06, - "loss": 0.6768, - "step": 56818 - }, - { - "epoch": 1.46, - "learning_rate": 1.0956211210879665e-06, - "loss": 0.5889, - "step": 56819 - }, - { - "epoch": 1.46, - "learning_rate": 1.0955935773889565e-06, - "loss": 0.7236, - "step": 56820 - }, - { - "epoch": 1.46, - "learning_rate": 1.0955660336167548e-06, - "loss": 0.6562, - "step": 56821 - }, - { - "epoch": 1.46, - "learning_rate": 1.0955384897713826e-06, - "loss": 0.7305, - "step": 56822 - }, - { - "epoch": 1.46, - "learning_rate": 1.095510945852861e-06, - "loss": 0.4229, - "step": 56823 - }, - { - "epoch": 1.46, - "learning_rate": 1.0954834018612112e-06, - "loss": 0.5901, - "step": 56824 - }, - { - "epoch": 1.46, - "learning_rate": 1.095455857796454e-06, - "loss": 0.708, - "step": 56825 - }, - { - "epoch": 1.46, - "learning_rate": 1.0954283136586107e-06, - "loss": 0.6211, - "step": 56826 - }, - { - "epoch": 1.46, - "learning_rate": 1.0954007694477023e-06, - "loss": 0.5664, - "step": 56827 - }, - { - "epoch": 1.46, - "learning_rate": 1.0953732251637498e-06, - "loss": 0.5469, - "step": 56828 - }, - { - "epoch": 1.46, - "learning_rate": 1.0953456808067748e-06, - "loss": 0.6465, - "step": 56829 - }, - { - "epoch": 1.46, - "learning_rate": 1.0953181363767976e-06, - "loss": 0.6187, - "step": 56830 - }, - { - "epoch": 1.46, - "learning_rate": 1.09529059187384e-06, - "loss": 0.6455, - "step": 56831 - }, - { - "epoch": 1.46, - "learning_rate": 1.0952630472979223e-06, - "loss": 0.7529, - "step": 56832 - }, - { - "epoch": 1.46, - "learning_rate": 1.0952355026490665e-06, - "loss": 0.6929, - "step": 56833 - }, - { - "epoch": 1.46, - "learning_rate": 1.0952079579272928e-06, - "loss": 0.6699, - "step": 56834 - }, - { - "epoch": 1.46, - "learning_rate": 1.0951804131326234e-06, - "loss": 0.48, - "step": 56835 - }, - { - "epoch": 1.46, - "learning_rate": 1.0951528682650784e-06, - "loss": 0.6992, - "step": 56836 - }, - { - "epoch": 1.46, - "learning_rate": 1.0951253233246791e-06, - "loss": 0.7231, - "step": 56837 - }, - { - "epoch": 1.46, - "learning_rate": 1.0950977783114467e-06, - "loss": 0.5801, - "step": 56838 - }, - { - "epoch": 1.46, - "learning_rate": 1.0950702332254025e-06, - "loss": 0.5168, - "step": 56839 - }, - { - "epoch": 1.46, - "learning_rate": 1.0950426880665672e-06, - "loss": 0.6104, - "step": 56840 - }, - { - "epoch": 1.46, - "learning_rate": 1.0950151428349625e-06, - "loss": 0.667, - "step": 56841 - }, - { - "epoch": 1.46, - "learning_rate": 1.0949875975306087e-06, - "loss": 0.4958, - "step": 56842 - }, - { - "epoch": 1.46, - "learning_rate": 1.0949600521535273e-06, - "loss": 0.3528, - "step": 56843 - }, - { - "epoch": 1.46, - "learning_rate": 1.0949325067037392e-06, - "loss": 0.6294, - "step": 56844 - }, - { - "epoch": 1.46, - "learning_rate": 1.0949049611812659e-06, - "loss": 0.6289, - "step": 56845 - }, - { - "epoch": 1.46, - "learning_rate": 1.0948774155861282e-06, - "loss": 0.4341, - "step": 56846 - }, - { - "epoch": 1.46, - "learning_rate": 1.0948498699183472e-06, - "loss": 0.6816, - "step": 56847 - }, - { - "epoch": 1.46, - "learning_rate": 1.094822324177944e-06, - "loss": 0.9326, - "step": 56848 - }, - { - "epoch": 1.46, - "learning_rate": 1.0947947783649397e-06, - "loss": 0.6523, - "step": 56849 - }, - { - "epoch": 1.46, - "learning_rate": 1.0947672324793554e-06, - "loss": 0.6465, - "step": 56850 - }, - { - "epoch": 1.46, - "learning_rate": 1.0947396865212125e-06, - "loss": 0.7236, - "step": 56851 - }, - { - "epoch": 1.46, - "learning_rate": 1.0947121404905313e-06, - "loss": 0.6719, - "step": 56852 - }, - { - "epoch": 1.46, - "learning_rate": 1.0946845943873334e-06, - "loss": 0.6396, - "step": 56853 - }, - { - "epoch": 1.46, - "learning_rate": 1.0946570482116402e-06, - "loss": 0.6831, - "step": 56854 - }, - { - "epoch": 1.46, - "learning_rate": 1.0946295019634723e-06, - "loss": 0.6821, - "step": 56855 - }, - { - "epoch": 1.46, - "learning_rate": 1.0946019556428509e-06, - "loss": 0.7197, - "step": 56856 - }, - { - "epoch": 1.46, - "learning_rate": 1.094574409249797e-06, - "loss": 0.6436, - "step": 56857 - }, - { - "epoch": 1.46, - "learning_rate": 1.0945468627843322e-06, - "loss": 0.8809, - "step": 56858 - }, - { - "epoch": 1.46, - "learning_rate": 1.0945193162464767e-06, - "loss": 0.5054, - "step": 56859 - }, - { - "epoch": 1.46, - "learning_rate": 1.0944917696362528e-06, - "loss": 0.6616, - "step": 56860 - }, - { - "epoch": 1.46, - "learning_rate": 1.0944642229536802e-06, - "loss": 0.4873, - "step": 56861 - }, - { - "epoch": 1.46, - "learning_rate": 1.0944366761987812e-06, - "loss": 0.7012, - "step": 56862 - }, - { - "epoch": 1.46, - "learning_rate": 1.0944091293715758e-06, - "loss": 0.6079, - "step": 56863 - }, - { - "epoch": 1.46, - "learning_rate": 1.0943815824720861e-06, - "loss": 0.6855, - "step": 56864 - }, - { - "epoch": 1.46, - "learning_rate": 1.094354035500333e-06, - "loss": 0.6758, - "step": 56865 - }, - { - "epoch": 1.46, - "learning_rate": 1.0943264884563367e-06, - "loss": 0.4119, - "step": 56866 - }, - { - "epoch": 1.46, - "learning_rate": 1.0942989413401194e-06, - "loss": 0.5295, - "step": 56867 - }, - { - "epoch": 1.46, - "learning_rate": 1.0942713941517017e-06, - "loss": 0.6846, - "step": 56868 - }, - { - "epoch": 1.46, - "learning_rate": 1.0942438468911043e-06, - "loss": 0.6387, - "step": 56869 - }, - { - "epoch": 1.46, - "learning_rate": 1.0942162995583493e-06, - "loss": 0.5229, - "step": 56870 - }, - { - "epoch": 1.46, - "learning_rate": 1.0941887521534569e-06, - "loss": 0.7119, - "step": 56871 - }, - { - "epoch": 1.46, - "learning_rate": 1.0941612046764485e-06, - "loss": 0.6504, - "step": 56872 - }, - { - "epoch": 1.46, - "learning_rate": 1.0941336571273453e-06, - "loss": 0.3577, - "step": 56873 - }, - { - "epoch": 1.46, - "learning_rate": 1.0941061095061681e-06, - "loss": 0.5127, - "step": 56874 - }, - { - "epoch": 1.46, - "learning_rate": 1.0940785618129387e-06, - "loss": 0.7275, - "step": 56875 - }, - { - "epoch": 1.46, - "learning_rate": 1.0940510140476772e-06, - "loss": 0.6113, - "step": 56876 - }, - { - "epoch": 1.46, - "learning_rate": 1.0940234662104053e-06, - "loss": 0.624, - "step": 56877 - }, - { - "epoch": 1.46, - "learning_rate": 1.0939959183011438e-06, - "loss": 0.4521, - "step": 56878 - }, - { - "epoch": 1.46, - "learning_rate": 1.093968370319914e-06, - "loss": 0.5913, - "step": 56879 - }, - { - "epoch": 1.46, - "learning_rate": 1.0939408222667373e-06, - "loss": 0.5835, - "step": 56880 - }, - { - "epoch": 1.46, - "learning_rate": 1.0939132741416342e-06, - "loss": 0.6245, - "step": 56881 - }, - { - "epoch": 1.46, - "learning_rate": 1.0938857259446258e-06, - "loss": 0.4857, - "step": 56882 - }, - { - "epoch": 1.46, - "learning_rate": 1.0938581776757337e-06, - "loss": 0.5073, - "step": 56883 - }, - { - "epoch": 1.46, - "learning_rate": 1.0938306293349785e-06, - "loss": 0.5234, - "step": 56884 - }, - { - "epoch": 1.46, - "learning_rate": 1.0938030809223818e-06, - "loss": 0.7324, - "step": 56885 - }, - { - "epoch": 1.46, - "learning_rate": 1.093775532437964e-06, - "loss": 0.752, - "step": 56886 - }, - { - "epoch": 1.46, - "learning_rate": 1.093747983881747e-06, - "loss": 0.6111, - "step": 56887 - }, - { - "epoch": 1.46, - "learning_rate": 1.093720435253751e-06, - "loss": 0.6846, - "step": 56888 - }, - { - "epoch": 1.46, - "learning_rate": 1.093692886553998e-06, - "loss": 0.5632, - "step": 56889 - }, - { - "epoch": 1.46, - "learning_rate": 1.0936653377825085e-06, - "loss": 0.7227, - "step": 56890 - }, - { - "epoch": 1.46, - "learning_rate": 1.0936377889393035e-06, - "loss": 0.6533, - "step": 56891 - }, - { - "epoch": 1.46, - "learning_rate": 1.0936102400244048e-06, - "loss": 0.5403, - "step": 56892 - }, - { - "epoch": 1.46, - "learning_rate": 1.0935826910378325e-06, - "loss": 0.5364, - "step": 56893 - }, - { - "epoch": 1.46, - "learning_rate": 1.0935551419796089e-06, - "loss": 0.7041, - "step": 56894 - }, - { - "epoch": 1.46, - "learning_rate": 1.093527592849754e-06, - "loss": 0.4595, - "step": 56895 - }, - { - "epoch": 1.46, - "learning_rate": 1.0935000436482894e-06, - "loss": 0.5249, - "step": 56896 - }, - { - "epoch": 1.46, - "learning_rate": 1.0934724943752362e-06, - "loss": 0.6069, - "step": 56897 - }, - { - "epoch": 1.46, - "learning_rate": 1.0934449450306154e-06, - "loss": 0.4019, - "step": 56898 - }, - { - "epoch": 1.46, - "learning_rate": 1.0934173956144482e-06, - "loss": 0.7041, - "step": 56899 - }, - { - "epoch": 1.46, - "learning_rate": 1.0933898461267555e-06, - "loss": 0.5117, - "step": 56900 - }, - { - "epoch": 1.46, - "learning_rate": 1.0933622965675582e-06, - "loss": 0.7222, - "step": 56901 - }, - { - "epoch": 1.46, - "learning_rate": 1.0933347469368782e-06, - "loss": 0.7471, - "step": 56902 - }, - { - "epoch": 1.46, - "learning_rate": 1.0933071972347354e-06, - "loss": 0.7368, - "step": 56903 - }, - { - "epoch": 1.46, - "learning_rate": 1.0932796474611522e-06, - "loss": 0.6733, - "step": 56904 - }, - { - "epoch": 1.46, - "learning_rate": 1.0932520976161489e-06, - "loss": 0.502, - "step": 56905 - }, - { - "epoch": 1.46, - "learning_rate": 1.0932245476997468e-06, - "loss": 0.6807, - "step": 56906 - }, - { - "epoch": 1.46, - "learning_rate": 1.0931969977119665e-06, - "loss": 0.5605, - "step": 56907 - }, - { - "epoch": 1.46, - "learning_rate": 1.09316944765283e-06, - "loss": 0.6445, - "step": 56908 - }, - { - "epoch": 1.46, - "learning_rate": 1.093141897522358e-06, - "loss": 0.7324, - "step": 56909 - }, - { - "epoch": 1.46, - "learning_rate": 1.0931143473205713e-06, - "loss": 0.5645, - "step": 56910 - }, - { - "epoch": 1.46, - "learning_rate": 1.0930867970474913e-06, - "loss": 0.8154, - "step": 56911 - }, - { - "epoch": 1.46, - "learning_rate": 1.0930592467031387e-06, - "loss": 0.6323, - "step": 56912 - }, - { - "epoch": 1.46, - "learning_rate": 1.0930316962875354e-06, - "loss": 0.5229, - "step": 56913 - }, - { - "epoch": 1.46, - "learning_rate": 1.093004145800702e-06, - "loss": 0.5498, - "step": 56914 - }, - { - "epoch": 1.46, - "learning_rate": 1.0929765952426596e-06, - "loss": 0.3368, - "step": 56915 - }, - { - "epoch": 1.46, - "learning_rate": 1.0929490446134289e-06, - "loss": 0.6172, - "step": 56916 - }, - { - "epoch": 1.46, - "learning_rate": 1.0929214939130315e-06, - "loss": 0.7734, - "step": 56917 - }, - { - "epoch": 1.46, - "learning_rate": 1.0928939431414885e-06, - "loss": 0.6707, - "step": 56918 - }, - { - "epoch": 1.46, - "learning_rate": 1.092866392298821e-06, - "loss": 0.6577, - "step": 56919 - }, - { - "epoch": 1.46, - "learning_rate": 1.0928388413850499e-06, - "loss": 0.6611, - "step": 56920 - }, - { - "epoch": 1.46, - "learning_rate": 1.0928112904001962e-06, - "loss": 0.5918, - "step": 56921 - }, - { - "epoch": 1.46, - "learning_rate": 1.0927837393442811e-06, - "loss": 0.7812, - "step": 56922 - }, - { - "epoch": 1.46, - "learning_rate": 1.0927561882173262e-06, - "loss": 0.7461, - "step": 56923 - }, - { - "epoch": 1.46, - "learning_rate": 1.0927286370193521e-06, - "loss": 0.7314, - "step": 56924 - }, - { - "epoch": 1.46, - "learning_rate": 1.0927010857503797e-06, - "loss": 0.6174, - "step": 56925 - }, - { - "epoch": 1.46, - "learning_rate": 1.09267353441043e-06, - "loss": 0.6221, - "step": 56926 - }, - { - "epoch": 1.46, - "learning_rate": 1.0926459829995252e-06, - "loss": 0.8174, - "step": 56927 - }, - { - "epoch": 1.46, - "learning_rate": 1.092618431517685e-06, - "loss": 0.7607, - "step": 56928 - }, - { - "epoch": 1.46, - "learning_rate": 1.0925908799649314e-06, - "loss": 0.6069, - "step": 56929 - }, - { - "epoch": 1.46, - "learning_rate": 1.0925633283412851e-06, - "loss": 0.6968, - "step": 56930 - }, - { - "epoch": 1.46, - "learning_rate": 1.0925357766467676e-06, - "loss": 0.7554, - "step": 56931 - }, - { - "epoch": 1.46, - "learning_rate": 1.0925082248813995e-06, - "loss": 0.8115, - "step": 56932 - }, - { - "epoch": 1.46, - "learning_rate": 1.0924806730452021e-06, - "loss": 0.5391, - "step": 56933 - }, - { - "epoch": 1.46, - "learning_rate": 1.0924531211381966e-06, - "loss": 0.6924, - "step": 56934 - }, - { - "epoch": 1.46, - "learning_rate": 1.092425569160404e-06, - "loss": 0.667, - "step": 56935 - }, - { - "epoch": 1.46, - "learning_rate": 1.0923980171118452e-06, - "loss": 0.6748, - "step": 56936 - }, - { - "epoch": 1.46, - "learning_rate": 1.0923704649925415e-06, - "loss": 0.707, - "step": 56937 - }, - { - "epoch": 1.46, - "learning_rate": 1.092342912802514e-06, - "loss": 0.8252, - "step": 56938 - }, - { - "epoch": 1.46, - "learning_rate": 1.092315360541784e-06, - "loss": 0.6963, - "step": 56939 - }, - { - "epoch": 1.46, - "learning_rate": 1.0922878082103724e-06, - "loss": 0.5947, - "step": 56940 - }, - { - "epoch": 1.46, - "learning_rate": 1.0922602558082999e-06, - "loss": 0.6792, - "step": 56941 - }, - { - "epoch": 1.46, - "learning_rate": 1.0922327033355884e-06, - "loss": 0.5603, - "step": 56942 - }, - { - "epoch": 1.46, - "learning_rate": 1.092205150792258e-06, - "loss": 0.5981, - "step": 56943 - }, - { - "epoch": 1.46, - "learning_rate": 1.092177598178331e-06, - "loss": 0.708, - "step": 56944 - }, - { - "epoch": 1.46, - "learning_rate": 1.0921500454938272e-06, - "loss": 0.4836, - "step": 56945 - }, - { - "epoch": 1.46, - "learning_rate": 1.092122492738769e-06, - "loss": 0.6846, - "step": 56946 - }, - { - "epoch": 1.46, - "learning_rate": 1.0920949399131763e-06, - "loss": 0.4636, - "step": 56947 - }, - { - "epoch": 1.46, - "learning_rate": 1.092067387017071e-06, - "loss": 0.5264, - "step": 56948 - }, - { - "epoch": 1.46, - "learning_rate": 1.092039834050474e-06, - "loss": 0.457, - "step": 56949 - }, - { - "epoch": 1.46, - "learning_rate": 1.0920122810134063e-06, - "loss": 0.4454, - "step": 56950 - }, - { - "epoch": 1.46, - "learning_rate": 1.0919847279058887e-06, - "loss": 0.8047, - "step": 56951 - }, - { - "epoch": 1.46, - "learning_rate": 1.091957174727943e-06, - "loss": 0.4622, - "step": 56952 - }, - { - "epoch": 1.46, - "learning_rate": 1.0919296214795897e-06, - "loss": 0.7002, - "step": 56953 - }, - { - "epoch": 1.46, - "learning_rate": 1.0919020681608505e-06, - "loss": 0.3604, - "step": 56954 - }, - { - "epoch": 1.46, - "learning_rate": 1.0918745147717457e-06, - "loss": 0.625, - "step": 56955 - }, - { - "epoch": 1.46, - "learning_rate": 1.0918469613122967e-06, - "loss": 0.6426, - "step": 56956 - }, - { - "epoch": 1.46, - "learning_rate": 1.091819407782525e-06, - "loss": 0.5688, - "step": 56957 - }, - { - "epoch": 1.46, - "learning_rate": 1.0917918541824515e-06, - "loss": 0.6504, - "step": 56958 - }, - { - "epoch": 1.46, - "learning_rate": 1.091764300512097e-06, - "loss": 0.7129, - "step": 56959 - }, - { - "epoch": 1.46, - "learning_rate": 1.0917367467714829e-06, - "loss": 0.5048, - "step": 56960 - }, - { - "epoch": 1.46, - "learning_rate": 1.0917091929606302e-06, - "loss": 0.8037, - "step": 56961 - }, - { - "epoch": 1.46, - "learning_rate": 1.0916816390795597e-06, - "loss": 0.7236, - "step": 56962 - }, - { - "epoch": 1.46, - "learning_rate": 1.091654085128293e-06, - "loss": 0.6133, - "step": 56963 - }, - { - "epoch": 1.46, - "learning_rate": 1.0916265311068511e-06, - "loss": 0.7153, - "step": 56964 - }, - { - "epoch": 1.46, - "learning_rate": 1.091598977015255e-06, - "loss": 0.7295, - "step": 56965 - }, - { - "epoch": 1.46, - "learning_rate": 1.0915714228535254e-06, - "loss": 0.6172, - "step": 56966 - }, - { - "epoch": 1.46, - "learning_rate": 1.091543868621684e-06, - "loss": 0.709, - "step": 56967 - }, - { - "epoch": 1.46, - "learning_rate": 1.0915163143197517e-06, - "loss": 0.5054, - "step": 56968 - }, - { - "epoch": 1.46, - "learning_rate": 1.0914887599477499e-06, - "loss": 0.7432, - "step": 56969 - }, - { - "epoch": 1.46, - "learning_rate": 1.0914612055056986e-06, - "loss": 0.7021, - "step": 56970 - }, - { - "epoch": 1.46, - "learning_rate": 1.0914336509936202e-06, - "loss": 0.5845, - "step": 56971 - }, - { - "epoch": 1.46, - "learning_rate": 1.0914060964115351e-06, - "loss": 0.6296, - "step": 56972 - }, - { - "epoch": 1.46, - "learning_rate": 1.0913785417594646e-06, - "loss": 0.7295, - "step": 56973 - }, - { - "epoch": 1.46, - "learning_rate": 1.0913509870374298e-06, - "loss": 0.6191, - "step": 56974 - }, - { - "epoch": 1.46, - "learning_rate": 1.0913234322454516e-06, - "loss": 0.623, - "step": 56975 - }, - { - "epoch": 1.46, - "learning_rate": 1.0912958773835511e-06, - "loss": 0.6963, - "step": 56976 - }, - { - "epoch": 1.46, - "learning_rate": 1.09126832245175e-06, - "loss": 0.7812, - "step": 56977 - }, - { - "epoch": 1.46, - "learning_rate": 1.0912407674500686e-06, - "loss": 0.561, - "step": 56978 - }, - { - "epoch": 1.46, - "learning_rate": 1.0912132123785285e-06, - "loss": 0.7383, - "step": 56979 - }, - { - "epoch": 1.46, - "learning_rate": 1.0911856572371508e-06, - "loss": 0.594, - "step": 56980 - }, - { - "epoch": 1.46, - "learning_rate": 1.091158102025956e-06, - "loss": 0.6836, - "step": 56981 - }, - { - "epoch": 1.46, - "learning_rate": 1.0911305467449658e-06, - "loss": 0.4771, - "step": 56982 - }, - { - "epoch": 1.46, - "learning_rate": 1.091102991394201e-06, - "loss": 0.8076, - "step": 56983 - }, - { - "epoch": 1.46, - "learning_rate": 1.0910754359736836e-06, - "loss": 0.5361, - "step": 56984 - }, - { - "epoch": 1.46, - "learning_rate": 1.091047880483433e-06, - "loss": 0.6069, - "step": 56985 - }, - { - "epoch": 1.46, - "learning_rate": 1.0910203249234718e-06, - "loss": 0.5374, - "step": 56986 - }, - { - "epoch": 1.46, - "learning_rate": 1.0909927692938202e-06, - "loss": 0.7256, - "step": 56987 - }, - { - "epoch": 1.46, - "learning_rate": 1.0909652135944995e-06, - "loss": 0.7207, - "step": 56988 - }, - { - "epoch": 1.46, - "learning_rate": 1.0909376578255314e-06, - "loss": 0.564, - "step": 56989 - }, - { - "epoch": 1.46, - "learning_rate": 1.0909101019869362e-06, - "loss": 0.6875, - "step": 56990 - }, - { - "epoch": 1.46, - "learning_rate": 1.0908825460787351e-06, - "loss": 0.6221, - "step": 56991 - }, - { - "epoch": 1.46, - "learning_rate": 1.0908549901009498e-06, - "loss": 0.6572, - "step": 56992 - }, - { - "epoch": 1.46, - "learning_rate": 1.0908274340536009e-06, - "loss": 0.6824, - "step": 56993 - }, - { - "epoch": 1.46, - "learning_rate": 1.0907998779367099e-06, - "loss": 0.8145, - "step": 56994 - }, - { - "epoch": 1.46, - "learning_rate": 1.0907723217502972e-06, - "loss": 0.6777, - "step": 56995 - }, - { - "epoch": 1.46, - "learning_rate": 1.0907447654943844e-06, - "loss": 0.6191, - "step": 56996 - }, - { - "epoch": 1.46, - "learning_rate": 1.0907172091689924e-06, - "loss": 0.5586, - "step": 56997 - }, - { - "epoch": 1.46, - "learning_rate": 1.0906896527741425e-06, - "loss": 0.5991, - "step": 56998 - }, - { - "epoch": 1.46, - "learning_rate": 1.0906620963098558e-06, - "loss": 0.6821, - "step": 56999 - }, - { - "epoch": 1.46, - "learning_rate": 1.0906345397761533e-06, - "loss": 0.5967, - "step": 57000 - }, - { - "epoch": 1.46, - "learning_rate": 1.090606983173056e-06, - "loss": 0.6709, - "step": 57001 - }, - { - "epoch": 1.46, - "learning_rate": 1.090579426500585e-06, - "loss": 0.6846, - "step": 57002 - }, - { - "epoch": 1.46, - "learning_rate": 1.0905518697587617e-06, - "loss": 0.4976, - "step": 57003 - }, - { - "epoch": 1.46, - "learning_rate": 1.090524312947607e-06, - "loss": 0.5015, - "step": 57004 - }, - { - "epoch": 1.46, - "learning_rate": 1.0904967560671418e-06, - "loss": 0.6787, - "step": 57005 - }, - { - "epoch": 1.46, - "learning_rate": 1.0904691991173875e-06, - "loss": 0.562, - "step": 57006 - }, - { - "epoch": 1.46, - "learning_rate": 1.0904416420983651e-06, - "loss": 0.6582, - "step": 57007 - }, - { - "epoch": 1.46, - "learning_rate": 1.0904140850100955e-06, - "loss": 0.7168, - "step": 57008 - }, - { - "epoch": 1.46, - "learning_rate": 1.0903865278526006e-06, - "loss": 0.5601, - "step": 57009 - }, - { - "epoch": 1.46, - "learning_rate": 1.0903589706259002e-06, - "loss": 0.6064, - "step": 57010 - }, - { - "epoch": 1.46, - "learning_rate": 1.0903314133300166e-06, - "loss": 0.7266, - "step": 57011 - }, - { - "epoch": 1.46, - "learning_rate": 1.09030385596497e-06, - "loss": 0.6543, - "step": 57012 - }, - { - "epoch": 1.46, - "learning_rate": 1.0902762985307821e-06, - "loss": 0.7285, - "step": 57013 - }, - { - "epoch": 1.46, - "learning_rate": 1.090248741027474e-06, - "loss": 0.5049, - "step": 57014 - }, - { - "epoch": 1.46, - "learning_rate": 1.0902211834550664e-06, - "loss": 0.9189, - "step": 57015 - }, - { - "epoch": 1.46, - "learning_rate": 1.0901936258135802e-06, - "loss": 0.5674, - "step": 57016 - }, - { - "epoch": 1.46, - "learning_rate": 1.0901660681030374e-06, - "loss": 0.7041, - "step": 57017 - }, - { - "epoch": 1.46, - "learning_rate": 1.0901385103234583e-06, - "loss": 0.6172, - "step": 57018 - }, - { - "epoch": 1.46, - "learning_rate": 1.0901109524748643e-06, - "loss": 0.6982, - "step": 57019 - }, - { - "epoch": 1.46, - "learning_rate": 1.0900833945572768e-06, - "loss": 0.8213, - "step": 57020 - }, - { - "epoch": 1.46, - "learning_rate": 1.0900558365707162e-06, - "loss": 0.4783, - "step": 57021 - }, - { - "epoch": 1.46, - "learning_rate": 1.090028278515204e-06, - "loss": 0.7314, - "step": 57022 - }, - { - "epoch": 1.46, - "learning_rate": 1.0900007203907615e-06, - "loss": 0.6084, - "step": 57023 - }, - { - "epoch": 1.46, - "learning_rate": 1.0899731621974097e-06, - "loss": 0.6372, - "step": 57024 - }, - { - "epoch": 1.46, - "learning_rate": 1.0899456039351691e-06, - "loss": 0.7573, - "step": 57025 - }, - { - "epoch": 1.46, - "learning_rate": 1.0899180456040618e-06, - "loss": 0.8203, - "step": 57026 - }, - { - "epoch": 1.46, - "learning_rate": 1.0898904872041079e-06, - "loss": 0.5903, - "step": 57027 - }, - { - "epoch": 1.46, - "learning_rate": 1.0898629287353293e-06, - "loss": 0.7822, - "step": 57028 - }, - { - "epoch": 1.46, - "learning_rate": 1.089835370197747e-06, - "loss": 0.562, - "step": 57029 - }, - { - "epoch": 1.46, - "learning_rate": 1.0898078115913817e-06, - "loss": 0.6079, - "step": 57030 - }, - { - "epoch": 1.46, - "learning_rate": 1.0897802529162545e-06, - "loss": 0.5884, - "step": 57031 - }, - { - "epoch": 1.46, - "learning_rate": 1.089752694172387e-06, - "loss": 0.7256, - "step": 57032 - }, - { - "epoch": 1.46, - "learning_rate": 1.0897251353597996e-06, - "loss": 0.7373, - "step": 57033 - }, - { - "epoch": 1.46, - "learning_rate": 1.0896975764785141e-06, - "loss": 0.7559, - "step": 57034 - }, - { - "epoch": 1.46, - "learning_rate": 1.0896700175285512e-06, - "loss": 0.647, - "step": 57035 - }, - { - "epoch": 1.46, - "learning_rate": 1.0896424585099322e-06, - "loss": 0.5938, - "step": 57036 - }, - { - "epoch": 1.46, - "learning_rate": 1.0896148994226778e-06, - "loss": 0.4333, - "step": 57037 - }, - { - "epoch": 1.46, - "learning_rate": 1.0895873402668096e-06, - "loss": 0.6992, - "step": 57038 - }, - { - "epoch": 1.46, - "learning_rate": 1.0895597810423485e-06, - "loss": 0.8135, - "step": 57039 - }, - { - "epoch": 1.46, - "learning_rate": 1.0895322217493156e-06, - "loss": 0.5771, - "step": 57040 - }, - { - "epoch": 1.46, - "learning_rate": 1.0895046623877317e-06, - "loss": 0.7051, - "step": 57041 - }, - { - "epoch": 1.46, - "learning_rate": 1.0894771029576187e-06, - "loss": 0.8242, - "step": 57042 - }, - { - "epoch": 1.46, - "learning_rate": 1.0894495434589967e-06, - "loss": 0.6875, - "step": 57043 - }, - { - "epoch": 1.46, - "learning_rate": 1.0894219838918877e-06, - "loss": 0.6313, - "step": 57044 - }, - { - "epoch": 1.46, - "learning_rate": 1.0893944242563122e-06, - "loss": 0.6499, - "step": 57045 - }, - { - "epoch": 1.46, - "learning_rate": 1.0893668645522913e-06, - "loss": 0.8184, - "step": 57046 - }, - { - "epoch": 1.46, - "learning_rate": 1.0893393047798467e-06, - "loss": 0.5708, - "step": 57047 - }, - { - "epoch": 1.46, - "learning_rate": 1.089311744938999e-06, - "loss": 0.7363, - "step": 57048 - }, - { - "epoch": 1.46, - "learning_rate": 1.0892841850297694e-06, - "loss": 0.7666, - "step": 57049 - }, - { - "epoch": 1.46, - "learning_rate": 1.089256625052179e-06, - "loss": 0.6929, - "step": 57050 - }, - { - "epoch": 1.46, - "learning_rate": 1.0892290650062487e-06, - "loss": 0.6414, - "step": 57051 - }, - { - "epoch": 1.46, - "learning_rate": 1.0892015048919999e-06, - "loss": 0.7476, - "step": 57052 - }, - { - "epoch": 1.46, - "learning_rate": 1.0891739447094536e-06, - "loss": 0.6069, - "step": 57053 - }, - { - "epoch": 1.46, - "learning_rate": 1.089146384458631e-06, - "loss": 0.7324, - "step": 57054 - }, - { - "epoch": 1.46, - "learning_rate": 1.0891188241395533e-06, - "loss": 0.8867, - "step": 57055 - }, - { - "epoch": 1.46, - "learning_rate": 1.0890912637522411e-06, - "loss": 0.6904, - "step": 57056 - }, - { - "epoch": 1.46, - "learning_rate": 1.089063703296716e-06, - "loss": 0.6963, - "step": 57057 - }, - { - "epoch": 1.46, - "learning_rate": 1.0890361427729986e-06, - "loss": 0.7461, - "step": 57058 - }, - { - "epoch": 1.46, - "learning_rate": 1.0890085821811108e-06, - "loss": 0.5735, - "step": 57059 - }, - { - "epoch": 1.46, - "learning_rate": 1.0889810215210728e-06, - "loss": 0.5161, - "step": 57060 - }, - { - "epoch": 1.46, - "learning_rate": 1.0889534607929065e-06, - "loss": 0.6777, - "step": 57061 - }, - { - "epoch": 1.46, - "learning_rate": 1.0889258999966322e-06, - "loss": 0.7139, - "step": 57062 - }, - { - "epoch": 1.46, - "learning_rate": 1.0888983391322717e-06, - "loss": 0.5424, - "step": 57063 - }, - { - "epoch": 1.46, - "learning_rate": 1.088870778199846e-06, - "loss": 0.8076, - "step": 57064 - }, - { - "epoch": 1.46, - "learning_rate": 1.0888432171993757e-06, - "loss": 0.7344, - "step": 57065 - }, - { - "epoch": 1.46, - "learning_rate": 1.0888156561308824e-06, - "loss": 0.6396, - "step": 57066 - }, - { - "epoch": 1.46, - "learning_rate": 1.088788094994387e-06, - "loss": 0.7021, - "step": 57067 - }, - { - "epoch": 1.46, - "learning_rate": 1.0887605337899105e-06, - "loss": 0.7246, - "step": 57068 - }, - { - "epoch": 1.46, - "learning_rate": 1.0887329725174743e-06, - "loss": 0.7168, - "step": 57069 - }, - { - "epoch": 1.46, - "learning_rate": 1.0887054111770994e-06, - "loss": 0.623, - "step": 57070 - }, - { - "epoch": 1.46, - "learning_rate": 1.0886778497688066e-06, - "loss": 0.8057, - "step": 57071 - }, - { - "epoch": 1.46, - "learning_rate": 1.0886502882926174e-06, - "loss": 0.709, - "step": 57072 - }, - { - "epoch": 1.46, - "learning_rate": 1.0886227267485526e-06, - "loss": 0.6982, - "step": 57073 - }, - { - "epoch": 1.46, - "learning_rate": 1.0885951651366338e-06, - "loss": 0.6279, - "step": 57074 - }, - { - "epoch": 1.46, - "learning_rate": 1.0885676034568817e-06, - "loss": 0.6353, - "step": 57075 - }, - { - "epoch": 1.46, - "learning_rate": 1.0885400417093174e-06, - "loss": 0.6514, - "step": 57076 - }, - { - "epoch": 1.46, - "learning_rate": 1.0885124798939618e-06, - "loss": 0.5371, - "step": 57077 - }, - { - "epoch": 1.46, - "learning_rate": 1.0884849180108365e-06, - "loss": 0.6543, - "step": 57078 - }, - { - "epoch": 1.46, - "learning_rate": 1.0884573560599625e-06, - "loss": 0.5718, - "step": 57079 - }, - { - "epoch": 1.46, - "learning_rate": 1.0884297940413605e-06, - "loss": 0.6602, - "step": 57080 - }, - { - "epoch": 1.46, - "learning_rate": 1.0884022319550516e-06, - "loss": 0.5908, - "step": 57081 - }, - { - "epoch": 1.46, - "learning_rate": 1.0883746698010576e-06, - "loss": 0.7803, - "step": 57082 - }, - { - "epoch": 1.46, - "learning_rate": 1.088347107579399e-06, - "loss": 0.8027, - "step": 57083 - }, - { - "epoch": 1.46, - "learning_rate": 1.0883195452900974e-06, - "loss": 0.4956, - "step": 57084 - }, - { - "epoch": 1.46, - "learning_rate": 1.0882919829331734e-06, - "loss": 0.7793, - "step": 57085 - }, - { - "epoch": 1.46, - "learning_rate": 1.0882644205086485e-06, - "loss": 0.6973, - "step": 57086 - }, - { - "epoch": 1.46, - "learning_rate": 1.088236858016543e-06, - "loss": 0.6899, - "step": 57087 - }, - { - "epoch": 1.46, - "learning_rate": 1.0882092954568792e-06, - "loss": 0.5956, - "step": 57088 - }, - { - "epoch": 1.46, - "learning_rate": 1.0881817328296775e-06, - "loss": 0.4443, - "step": 57089 - }, - { - "epoch": 1.46, - "learning_rate": 1.0881541701349586e-06, - "loss": 0.667, - "step": 57090 - }, - { - "epoch": 1.46, - "learning_rate": 1.0881266073727443e-06, - "loss": 0.5605, - "step": 57091 - }, - { - "epoch": 1.46, - "learning_rate": 1.0880990445430558e-06, - "loss": 0.6826, - "step": 57092 - }, - { - "epoch": 1.46, - "learning_rate": 1.0880714816459139e-06, - "loss": 0.5101, - "step": 57093 - }, - { - "epoch": 1.46, - "learning_rate": 1.0880439186813394e-06, - "loss": 0.5197, - "step": 57094 - }, - { - "epoch": 1.46, - "learning_rate": 1.088016355649354e-06, - "loss": 0.8662, - "step": 57095 - }, - { - "epoch": 1.46, - "learning_rate": 1.0879887925499785e-06, - "loss": 0.6616, - "step": 57096 - }, - { - "epoch": 1.46, - "learning_rate": 1.0879612293832338e-06, - "loss": 0.623, - "step": 57097 - }, - { - "epoch": 1.46, - "learning_rate": 1.0879336661491415e-06, - "loss": 0.8652, - "step": 57098 - }, - { - "epoch": 1.46, - "learning_rate": 1.0879061028477225e-06, - "loss": 0.6577, - "step": 57099 - }, - { - "epoch": 1.46, - "learning_rate": 1.0878785394789975e-06, - "loss": 0.7979, - "step": 57100 - }, - { - "epoch": 1.46, - "learning_rate": 1.0878509760429882e-06, - "loss": 0.9111, - "step": 57101 - }, - { - "epoch": 1.46, - "learning_rate": 1.0878234125397152e-06, - "loss": 0.625, - "step": 57102 - }, - { - "epoch": 1.46, - "learning_rate": 1.0877958489692e-06, - "loss": 0.6484, - "step": 57103 - }, - { - "epoch": 1.46, - "learning_rate": 1.0877682853314637e-06, - "loss": 0.7197, - "step": 57104 - }, - { - "epoch": 1.46, - "learning_rate": 1.0877407216265274e-06, - "loss": 0.6572, - "step": 57105 - }, - { - "epoch": 1.46, - "learning_rate": 1.0877131578544114e-06, - "loss": 0.8301, - "step": 57106 - }, - { - "epoch": 1.46, - "learning_rate": 1.087685594015138e-06, - "loss": 0.8311, - "step": 57107 - }, - { - "epoch": 1.46, - "learning_rate": 1.0876580301087275e-06, - "loss": 0.6606, - "step": 57108 - }, - { - "epoch": 1.46, - "learning_rate": 1.0876304661352014e-06, - "loss": 0.5508, - "step": 57109 - }, - { - "epoch": 1.46, - "learning_rate": 1.0876029020945809e-06, - "loss": 0.6025, - "step": 57110 - }, - { - "epoch": 1.46, - "learning_rate": 1.0875753379868865e-06, - "loss": 0.626, - "step": 57111 - }, - { - "epoch": 1.46, - "learning_rate": 1.08754777381214e-06, - "loss": 0.8164, - "step": 57112 - }, - { - "epoch": 1.46, - "learning_rate": 1.087520209570362e-06, - "loss": 0.6826, - "step": 57113 - }, - { - "epoch": 1.46, - "learning_rate": 1.087492645261574e-06, - "loss": 0.6451, - "step": 57114 - }, - { - "epoch": 1.46, - "learning_rate": 1.0874650808857965e-06, - "loss": 0.4966, - "step": 57115 - }, - { - "epoch": 1.46, - "learning_rate": 1.0874375164430513e-06, - "loss": 0.563, - "step": 57116 - }, - { - "epoch": 1.46, - "learning_rate": 1.0874099519333593e-06, - "loss": 0.6572, - "step": 57117 - }, - { - "epoch": 1.46, - "learning_rate": 1.0873823873567414e-06, - "loss": 0.5884, - "step": 57118 - }, - { - "epoch": 1.46, - "learning_rate": 1.0873548227132189e-06, - "loss": 0.6216, - "step": 57119 - }, - { - "epoch": 1.46, - "learning_rate": 1.0873272580028127e-06, - "loss": 0.4543, - "step": 57120 - }, - { - "epoch": 1.46, - "learning_rate": 1.0872996932255441e-06, - "loss": 0.582, - "step": 57121 - }, - { - "epoch": 1.46, - "learning_rate": 1.087272128381434e-06, - "loss": 0.7236, - "step": 57122 - }, - { - "epoch": 1.46, - "learning_rate": 1.0872445634705038e-06, - "loss": 0.7168, - "step": 57123 - }, - { - "epoch": 1.46, - "learning_rate": 1.0872169984927745e-06, - "loss": 0.5996, - "step": 57124 - }, - { - "epoch": 1.46, - "learning_rate": 1.0871894334482672e-06, - "loss": 0.604, - "step": 57125 - }, - { - "epoch": 1.46, - "learning_rate": 1.0871618683370028e-06, - "loss": 0.7461, - "step": 57126 - }, - { - "epoch": 1.46, - "learning_rate": 1.0871343031590027e-06, - "loss": 0.7627, - "step": 57127 - }, - { - "epoch": 1.46, - "learning_rate": 1.0871067379142877e-06, - "loss": 0.6958, - "step": 57128 - }, - { - "epoch": 1.46, - "learning_rate": 1.0870791726028793e-06, - "loss": 0.7256, - "step": 57129 - }, - { - "epoch": 1.46, - "learning_rate": 1.0870516072247981e-06, - "loss": 0.647, - "step": 57130 - }, - { - "epoch": 1.46, - "learning_rate": 1.0870240417800657e-06, - "loss": 0.7656, - "step": 57131 - }, - { - "epoch": 1.46, - "learning_rate": 1.0869964762687028e-06, - "loss": 0.6387, - "step": 57132 - }, - { - "epoch": 1.46, - "learning_rate": 1.0869689106907306e-06, - "loss": 0.7773, - "step": 57133 - }, - { - "epoch": 1.46, - "learning_rate": 1.0869413450461706e-06, - "loss": 0.7158, - "step": 57134 - }, - { - "epoch": 1.46, - "learning_rate": 1.0869137793350435e-06, - "loss": 0.75, - "step": 57135 - }, - { - "epoch": 1.46, - "learning_rate": 1.0868862135573707e-06, - "loss": 0.6709, - "step": 57136 - }, - { - "epoch": 1.46, - "learning_rate": 1.0868586477131729e-06, - "loss": 0.564, - "step": 57137 - }, - { - "epoch": 1.46, - "learning_rate": 1.0868310818024715e-06, - "loss": 0.6201, - "step": 57138 - }, - { - "epoch": 1.46, - "learning_rate": 1.0868035158252878e-06, - "loss": 0.708, - "step": 57139 - }, - { - "epoch": 1.46, - "learning_rate": 1.086775949781642e-06, - "loss": 0.6973, - "step": 57140 - }, - { - "epoch": 1.46, - "learning_rate": 1.0867483836715563e-06, - "loss": 0.5906, - "step": 57141 - }, - { - "epoch": 1.46, - "learning_rate": 1.0867208174950513e-06, - "loss": 0.6904, - "step": 57142 - }, - { - "epoch": 1.46, - "learning_rate": 1.086693251252148e-06, - "loss": 0.707, - "step": 57143 - }, - { - "epoch": 1.46, - "learning_rate": 1.0866656849428679e-06, - "loss": 0.5498, - "step": 57144 - }, - { - "epoch": 1.46, - "learning_rate": 1.0866381185672318e-06, - "loss": 0.6084, - "step": 57145 - }, - { - "epoch": 1.46, - "learning_rate": 1.0866105521252606e-06, - "loss": 0.5007, - "step": 57146 - }, - { - "epoch": 1.46, - "learning_rate": 1.0865829856169762e-06, - "loss": 0.6982, - "step": 57147 - }, - { - "epoch": 1.46, - "learning_rate": 1.0865554190423987e-06, - "loss": 0.6494, - "step": 57148 - }, - { - "epoch": 1.46, - "learning_rate": 1.0865278524015503e-06, - "loss": 0.6785, - "step": 57149 - }, - { - "epoch": 1.46, - "learning_rate": 1.0865002856944507e-06, - "loss": 0.5522, - "step": 57150 - }, - { - "epoch": 1.46, - "learning_rate": 1.0864727189211225e-06, - "loss": 0.7036, - "step": 57151 - }, - { - "epoch": 1.46, - "learning_rate": 1.0864451520815856e-06, - "loss": 0.6321, - "step": 57152 - }, - { - "epoch": 1.46, - "learning_rate": 1.0864175851758619e-06, - "loss": 0.4064, - "step": 57153 - }, - { - "epoch": 1.46, - "learning_rate": 1.0863900182039722e-06, - "loss": 0.6963, - "step": 57154 - }, - { - "epoch": 1.46, - "learning_rate": 1.0863624511659375e-06, - "loss": 0.5669, - "step": 57155 - }, - { - "epoch": 1.46, - "learning_rate": 1.0863348840617792e-06, - "loss": 0.6963, - "step": 57156 - }, - { - "epoch": 1.46, - "learning_rate": 1.0863073168915182e-06, - "loss": 0.7305, - "step": 57157 - }, - { - "epoch": 1.46, - "learning_rate": 1.0862797496551757e-06, - "loss": 0.603, - "step": 57158 - }, - { - "epoch": 1.47, - "learning_rate": 1.0862521823527725e-06, - "loss": 0.6309, - "step": 57159 - }, - { - "epoch": 1.47, - "learning_rate": 1.0862246149843304e-06, - "loss": 0.5933, - "step": 57160 - }, - { - "epoch": 1.47, - "learning_rate": 1.0861970475498697e-06, - "loss": 0.6431, - "step": 57161 - }, - { - "epoch": 1.47, - "learning_rate": 1.0861694800494122e-06, - "loss": 0.499, - "step": 57162 - }, - { - "epoch": 1.47, - "learning_rate": 1.0861419124829783e-06, - "loss": 0.6924, - "step": 57163 - }, - { - "epoch": 1.47, - "learning_rate": 1.08611434485059e-06, - "loss": 0.5635, - "step": 57164 - }, - { - "epoch": 1.47, - "learning_rate": 1.0860867771522676e-06, - "loss": 0.6211, - "step": 57165 - }, - { - "epoch": 1.47, - "learning_rate": 1.0860592093880326e-06, - "loss": 0.6582, - "step": 57166 - }, - { - "epoch": 1.47, - "learning_rate": 1.0860316415579058e-06, - "loss": 0.6729, - "step": 57167 - }, - { - "epoch": 1.47, - "learning_rate": 1.0860040736619087e-06, - "loss": 0.6543, - "step": 57168 - }, - { - "epoch": 1.47, - "learning_rate": 1.0859765057000624e-06, - "loss": 0.6777, - "step": 57169 - }, - { - "epoch": 1.47, - "learning_rate": 1.085948937672388e-06, - "loss": 0.5201, - "step": 57170 - }, - { - "epoch": 1.47, - "learning_rate": 1.0859213695789057e-06, - "loss": 0.6343, - "step": 57171 - }, - { - "epoch": 1.47, - "learning_rate": 1.085893801419638e-06, - "loss": 0.5688, - "step": 57172 - }, - { - "epoch": 1.47, - "learning_rate": 1.0858662331946048e-06, - "loss": 0.4475, - "step": 57173 - }, - { - "epoch": 1.47, - "learning_rate": 1.0858386649038285e-06, - "loss": 0.6392, - "step": 57174 - }, - { - "epoch": 1.47, - "learning_rate": 1.085811096547329e-06, - "loss": 0.8359, - "step": 57175 - }, - { - "epoch": 1.47, - "learning_rate": 1.0857835281251282e-06, - "loss": 0.7324, - "step": 57176 - }, - { - "epoch": 1.47, - "learning_rate": 1.0857559596372465e-06, - "loss": 0.585, - "step": 57177 - }, - { - "epoch": 1.47, - "learning_rate": 1.0857283910837057e-06, - "loss": 0.708, - "step": 57178 - }, - { - "epoch": 1.47, - "learning_rate": 1.0857008224645265e-06, - "loss": 0.7529, - "step": 57179 - }, - { - "epoch": 1.47, - "learning_rate": 1.08567325377973e-06, - "loss": 0.6895, - "step": 57180 - }, - { - "epoch": 1.47, - "learning_rate": 1.0856456850293377e-06, - "loss": 0.5962, - "step": 57181 - }, - { - "epoch": 1.47, - "learning_rate": 1.0856181162133702e-06, - "loss": 0.7324, - "step": 57182 - }, - { - "epoch": 1.47, - "learning_rate": 1.0855905473318492e-06, - "loss": 0.5724, - "step": 57183 - }, - { - "epoch": 1.47, - "learning_rate": 1.085562978384795e-06, - "loss": 0.6934, - "step": 57184 - }, - { - "epoch": 1.47, - "learning_rate": 1.0855354093722295e-06, - "loss": 0.7617, - "step": 57185 - }, - { - "epoch": 1.47, - "learning_rate": 1.0855078402941731e-06, - "loss": 0.8369, - "step": 57186 - }, - { - "epoch": 1.47, - "learning_rate": 1.0854802711506477e-06, - "loss": 0.7334, - "step": 57187 - }, - { - "epoch": 1.47, - "learning_rate": 1.0854527019416737e-06, - "loss": 0.6973, - "step": 57188 - }, - { - "epoch": 1.47, - "learning_rate": 1.0854251326672728e-06, - "loss": 0.6658, - "step": 57189 - }, - { - "epoch": 1.47, - "learning_rate": 1.0853975633274654e-06, - "loss": 0.4663, - "step": 57190 - }, - { - "epoch": 1.47, - "learning_rate": 1.0853699939222733e-06, - "loss": 0.7109, - "step": 57191 - }, - { - "epoch": 1.47, - "learning_rate": 1.0853424244517171e-06, - "loss": 0.6113, - "step": 57192 - }, - { - "epoch": 1.47, - "learning_rate": 1.0853148549158185e-06, - "loss": 0.625, - "step": 57193 - }, - { - "epoch": 1.47, - "learning_rate": 1.0852872853145977e-06, - "loss": 0.7559, - "step": 57194 - }, - { - "epoch": 1.47, - "learning_rate": 1.0852597156480769e-06, - "loss": 0.6777, - "step": 57195 - }, - { - "epoch": 1.47, - "learning_rate": 1.0852321459162762e-06, - "loss": 0.749, - "step": 57196 - }, - { - "epoch": 1.47, - "learning_rate": 1.0852045761192174e-06, - "loss": 0.5835, - "step": 57197 - }, - { - "epoch": 1.47, - "learning_rate": 1.0851770062569214e-06, - "loss": 0.5341, - "step": 57198 - }, - { - "epoch": 1.47, - "learning_rate": 1.0851494363294092e-06, - "loss": 0.6172, - "step": 57199 - }, - { - "epoch": 1.47, - "learning_rate": 1.085121866336702e-06, - "loss": 0.5371, - "step": 57200 - }, - { - "epoch": 1.47, - "learning_rate": 1.085094296278821e-06, - "loss": 0.491, - "step": 57201 - }, - { - "epoch": 1.47, - "learning_rate": 1.0850667261557871e-06, - "loss": 0.6943, - "step": 57202 - }, - { - "epoch": 1.47, - "learning_rate": 1.0850391559676215e-06, - "loss": 0.707, - "step": 57203 - }, - { - "epoch": 1.47, - "learning_rate": 1.0850115857143456e-06, - "loss": 0.52, - "step": 57204 - }, - { - "epoch": 1.47, - "learning_rate": 1.0849840153959798e-06, - "loss": 0.7012, - "step": 57205 - }, - { - "epoch": 1.47, - "learning_rate": 1.084956445012546e-06, - "loss": 0.6221, - "step": 57206 - }, - { - "epoch": 1.47, - "learning_rate": 1.0849288745640646e-06, - "loss": 0.6445, - "step": 57207 - }, - { - "epoch": 1.47, - "learning_rate": 1.0849013040505575e-06, - "loss": 0.7715, - "step": 57208 - }, - { - "epoch": 1.47, - "learning_rate": 1.084873733472045e-06, - "loss": 0.6992, - "step": 57209 - }, - { - "epoch": 1.47, - "learning_rate": 1.0848461628285487e-06, - "loss": 0.6636, - "step": 57210 - }, - { - "epoch": 1.47, - "learning_rate": 1.0848185921200897e-06, - "loss": 0.6465, - "step": 57211 - }, - { - "epoch": 1.47, - "learning_rate": 1.0847910213466888e-06, - "loss": 0.7002, - "step": 57212 - }, - { - "epoch": 1.47, - "learning_rate": 1.0847634505083675e-06, - "loss": 0.6191, - "step": 57213 - }, - { - "epoch": 1.47, - "learning_rate": 1.0847358796051468e-06, - "loss": 0.5308, - "step": 57214 - }, - { - "epoch": 1.47, - "learning_rate": 1.0847083086370476e-06, - "loss": 0.7705, - "step": 57215 - }, - { - "epoch": 1.47, - "learning_rate": 1.0846807376040913e-06, - "loss": 0.6514, - "step": 57216 - }, - { - "epoch": 1.47, - "learning_rate": 1.0846531665062986e-06, - "loss": 0.7236, - "step": 57217 - }, - { - "epoch": 1.47, - "learning_rate": 1.0846255953436912e-06, - "loss": 0.623, - "step": 57218 - }, - { - "epoch": 1.47, - "learning_rate": 1.0845980241162896e-06, - "loss": 0.665, - "step": 57219 - }, - { - "epoch": 1.47, - "learning_rate": 1.0845704528241151e-06, - "loss": 0.5986, - "step": 57220 - }, - { - "epoch": 1.47, - "learning_rate": 1.0845428814671888e-06, - "loss": 0.665, - "step": 57221 - }, - { - "epoch": 1.47, - "learning_rate": 1.0845153100455323e-06, - "loss": 0.5535, - "step": 57222 - }, - { - "epoch": 1.47, - "learning_rate": 1.0844877385591662e-06, - "loss": 0.6309, - "step": 57223 - }, - { - "epoch": 1.47, - "learning_rate": 1.0844601670081116e-06, - "loss": 0.6685, - "step": 57224 - }, - { - "epoch": 1.47, - "learning_rate": 1.0844325953923898e-06, - "loss": 0.6475, - "step": 57225 - }, - { - "epoch": 1.47, - "learning_rate": 1.0844050237120217e-06, - "loss": 0.48, - "step": 57226 - }, - { - "epoch": 1.47, - "learning_rate": 1.0843774519670287e-06, - "loss": 0.7256, - "step": 57227 - }, - { - "epoch": 1.47, - "learning_rate": 1.0843498801574317e-06, - "loss": 0.7402, - "step": 57228 - }, - { - "epoch": 1.47, - "learning_rate": 1.0843223082832522e-06, - "loss": 0.7061, - "step": 57229 - }, - { - "epoch": 1.47, - "learning_rate": 1.0842947363445104e-06, - "loss": 0.6812, - "step": 57230 - }, - { - "epoch": 1.47, - "learning_rate": 1.0842671643412285e-06, - "loss": 0.6157, - "step": 57231 - }, - { - "epoch": 1.47, - "learning_rate": 1.0842395922734269e-06, - "loss": 0.6113, - "step": 57232 - }, - { - "epoch": 1.47, - "learning_rate": 1.084212020141127e-06, - "loss": 0.5544, - "step": 57233 - }, - { - "epoch": 1.47, - "learning_rate": 1.0841844479443498e-06, - "loss": 0.688, - "step": 57234 - }, - { - "epoch": 1.47, - "learning_rate": 1.0841568756831163e-06, - "loss": 0.6035, - "step": 57235 - }, - { - "epoch": 1.47, - "learning_rate": 1.084129303357448e-06, - "loss": 0.6948, - "step": 57236 - }, - { - "epoch": 1.47, - "learning_rate": 1.0841017309673655e-06, - "loss": 0.7529, - "step": 57237 - }, - { - "epoch": 1.47, - "learning_rate": 1.0840741585128903e-06, - "loss": 0.4619, - "step": 57238 - }, - { - "epoch": 1.47, - "learning_rate": 1.0840465859940436e-06, - "loss": 0.6816, - "step": 57239 - }, - { - "epoch": 1.47, - "learning_rate": 1.0840190134108459e-06, - "loss": 0.5615, - "step": 57240 - }, - { - "epoch": 1.47, - "learning_rate": 1.0839914407633188e-06, - "loss": 0.6299, - "step": 57241 - }, - { - "epoch": 1.47, - "learning_rate": 1.0839638680514832e-06, - "loss": 0.6162, - "step": 57242 - }, - { - "epoch": 1.47, - "learning_rate": 1.0839362952753608e-06, - "loss": 0.6494, - "step": 57243 - }, - { - "epoch": 1.47, - "learning_rate": 1.083908722434972e-06, - "loss": 0.6982, - "step": 57244 - }, - { - "epoch": 1.47, - "learning_rate": 1.083881149530338e-06, - "loss": 0.8506, - "step": 57245 - }, - { - "epoch": 1.47, - "learning_rate": 1.08385357656148e-06, - "loss": 0.6787, - "step": 57246 - }, - { - "epoch": 1.47, - "learning_rate": 1.0838260035284195e-06, - "loss": 0.7222, - "step": 57247 - }, - { - "epoch": 1.47, - "learning_rate": 1.0837984304311772e-06, - "loss": 0.6567, - "step": 57248 - }, - { - "epoch": 1.47, - "learning_rate": 1.0837708572697742e-06, - "loss": 0.7427, - "step": 57249 - }, - { - "epoch": 1.47, - "learning_rate": 1.0837432840442316e-06, - "loss": 0.5601, - "step": 57250 - }, - { - "epoch": 1.47, - "learning_rate": 1.0837157107545707e-06, - "loss": 0.6924, - "step": 57251 - }, - { - "epoch": 1.47, - "learning_rate": 1.0836881374008128e-06, - "loss": 0.5874, - "step": 57252 - }, - { - "epoch": 1.47, - "learning_rate": 1.0836605639829784e-06, - "loss": 0.662, - "step": 57253 - }, - { - "epoch": 1.47, - "learning_rate": 1.083632990501089e-06, - "loss": 0.7637, - "step": 57254 - }, - { - "epoch": 1.47, - "learning_rate": 1.0836054169551656e-06, - "loss": 0.7285, - "step": 57255 - }, - { - "epoch": 1.47, - "learning_rate": 1.0835778433452295e-06, - "loss": 0.5786, - "step": 57256 - }, - { - "epoch": 1.47, - "learning_rate": 1.0835502696713018e-06, - "loss": 0.6631, - "step": 57257 - }, - { - "epoch": 1.47, - "learning_rate": 1.0835226959334036e-06, - "loss": 0.5586, - "step": 57258 - }, - { - "epoch": 1.47, - "learning_rate": 1.0834951221315556e-06, - "loss": 0.7148, - "step": 57259 - }, - { - "epoch": 1.47, - "learning_rate": 1.0834675482657794e-06, - "loss": 0.6885, - "step": 57260 - }, - { - "epoch": 1.47, - "learning_rate": 1.0834399743360955e-06, - "loss": 0.5076, - "step": 57261 - }, - { - "epoch": 1.47, - "learning_rate": 1.083412400342526e-06, - "loss": 0.6748, - "step": 57262 - }, - { - "epoch": 1.47, - "learning_rate": 1.0833848262850913e-06, - "loss": 0.7812, - "step": 57263 - }, - { - "epoch": 1.47, - "learning_rate": 1.0833572521638128e-06, - "loss": 0.7432, - "step": 57264 - }, - { - "epoch": 1.47, - "learning_rate": 1.083329677978711e-06, - "loss": 0.5398, - "step": 57265 - }, - { - "epoch": 1.47, - "learning_rate": 1.083302103729808e-06, - "loss": 0.5869, - "step": 57266 - }, - { - "epoch": 1.47, - "learning_rate": 1.0832745294171242e-06, - "loss": 0.6533, - "step": 57267 - }, - { - "epoch": 1.47, - "learning_rate": 1.083246955040681e-06, - "loss": 0.6416, - "step": 57268 - }, - { - "epoch": 1.47, - "learning_rate": 1.0832193806004994e-06, - "loss": 0.6289, - "step": 57269 - }, - { - "epoch": 1.47, - "learning_rate": 1.0831918060966003e-06, - "loss": 0.7002, - "step": 57270 - }, - { - "epoch": 1.47, - "learning_rate": 1.0831642315290055e-06, - "loss": 0.7881, - "step": 57271 - }, - { - "epoch": 1.47, - "learning_rate": 1.0831366568977353e-06, - "loss": 0.5811, - "step": 57272 - }, - { - "epoch": 1.47, - "learning_rate": 1.0831090822028116e-06, - "loss": 0.6821, - "step": 57273 - }, - { - "epoch": 1.47, - "learning_rate": 1.0830815074442548e-06, - "loss": 0.6846, - "step": 57274 - }, - { - "epoch": 1.47, - "learning_rate": 1.0830539326220864e-06, - "loss": 0.6733, - "step": 57275 - }, - { - "epoch": 1.47, - "learning_rate": 1.0830263577363273e-06, - "loss": 0.5613, - "step": 57276 - }, - { - "epoch": 1.47, - "learning_rate": 1.082998782786999e-06, - "loss": 0.5942, - "step": 57277 - }, - { - "epoch": 1.47, - "learning_rate": 1.082971207774122e-06, - "loss": 0.5935, - "step": 57278 - }, - { - "epoch": 1.47, - "learning_rate": 1.082943632697718e-06, - "loss": 0.6104, - "step": 57279 - }, - { - "epoch": 1.47, - "learning_rate": 1.0829160575578078e-06, - "loss": 0.6064, - "step": 57280 - }, - { - "epoch": 1.47, - "learning_rate": 1.0828884823544125e-06, - "loss": 0.6577, - "step": 57281 - }, - { - "epoch": 1.47, - "learning_rate": 1.0828609070875531e-06, - "loss": 0.7344, - "step": 57282 - }, - { - "epoch": 1.47, - "learning_rate": 1.0828333317572518e-06, - "loss": 0.6631, - "step": 57283 - }, - { - "epoch": 1.47, - "learning_rate": 1.082805756363528e-06, - "loss": 0.5762, - "step": 57284 - }, - { - "epoch": 1.47, - "learning_rate": 1.082778180906404e-06, - "loss": 0.7178, - "step": 57285 - }, - { - "epoch": 1.47, - "learning_rate": 1.0827506053859e-06, - "loss": 0.6904, - "step": 57286 - }, - { - "epoch": 1.47, - "learning_rate": 1.0827230298020384e-06, - "loss": 0.6338, - "step": 57287 - }, - { - "epoch": 1.47, - "learning_rate": 1.0826954541548392e-06, - "loss": 0.7202, - "step": 57288 - }, - { - "epoch": 1.47, - "learning_rate": 1.082667878444324e-06, - "loss": 0.4659, - "step": 57289 - }, - { - "epoch": 1.47, - "learning_rate": 1.0826403026705137e-06, - "loss": 0.6216, - "step": 57290 - }, - { - "epoch": 1.47, - "learning_rate": 1.0826127268334298e-06, - "loss": 0.7305, - "step": 57291 - }, - { - "epoch": 1.47, - "learning_rate": 1.0825851509330927e-06, - "loss": 0.7119, - "step": 57292 - }, - { - "epoch": 1.47, - "learning_rate": 1.0825575749695241e-06, - "loss": 0.4788, - "step": 57293 - }, - { - "epoch": 1.47, - "learning_rate": 1.0825299989427451e-06, - "loss": 0.5712, - "step": 57294 - }, - { - "epoch": 1.47, - "learning_rate": 1.0825024228527766e-06, - "loss": 0.709, - "step": 57295 - }, - { - "epoch": 1.47, - "learning_rate": 1.08247484669964e-06, - "loss": 0.6934, - "step": 57296 - }, - { - "epoch": 1.47, - "learning_rate": 1.082447270483356e-06, - "loss": 0.5928, - "step": 57297 - }, - { - "epoch": 1.47, - "learning_rate": 1.082419694203946e-06, - "loss": 0.7354, - "step": 57298 - }, - { - "epoch": 1.47, - "learning_rate": 1.0823921178614307e-06, - "loss": 0.5464, - "step": 57299 - }, - { - "epoch": 1.47, - "learning_rate": 1.0823645414558319e-06, - "loss": 0.5312, - "step": 57300 - }, - { - "epoch": 1.47, - "learning_rate": 1.0823369649871701e-06, - "loss": 0.6025, - "step": 57301 - }, - { - "epoch": 1.47, - "learning_rate": 1.0823093884554667e-06, - "loss": 0.7441, - "step": 57302 - }, - { - "epoch": 1.47, - "learning_rate": 1.082281811860743e-06, - "loss": 0.5332, - "step": 57303 - }, - { - "epoch": 1.47, - "learning_rate": 1.08225423520302e-06, - "loss": 0.457, - "step": 57304 - }, - { - "epoch": 1.47, - "learning_rate": 1.0822266584823183e-06, - "loss": 0.4556, - "step": 57305 - }, - { - "epoch": 1.47, - "learning_rate": 1.0821990816986596e-06, - "loss": 0.7041, - "step": 57306 - }, - { - "epoch": 1.47, - "learning_rate": 1.082171504852065e-06, - "loss": 0.7383, - "step": 57307 - }, - { - "epoch": 1.47, - "learning_rate": 1.0821439279425556e-06, - "loss": 0.5154, - "step": 57308 - }, - { - "epoch": 1.47, - "learning_rate": 1.082116350970152e-06, - "loss": 0.6221, - "step": 57309 - }, - { - "epoch": 1.47, - "learning_rate": 1.0820887739348758e-06, - "loss": 0.7158, - "step": 57310 - }, - { - "epoch": 1.47, - "learning_rate": 1.0820611968367479e-06, - "loss": 0.7129, - "step": 57311 - }, - { - "epoch": 1.47, - "learning_rate": 1.0820336196757898e-06, - "loss": 0.5879, - "step": 57312 - }, - { - "epoch": 1.47, - "learning_rate": 1.0820060424520222e-06, - "loss": 0.4717, - "step": 57313 - }, - { - "epoch": 1.47, - "learning_rate": 1.081978465165466e-06, - "loss": 0.7178, - "step": 57314 - }, - { - "epoch": 1.47, - "learning_rate": 1.081950887816143e-06, - "loss": 0.7861, - "step": 57315 - }, - { - "epoch": 1.47, - "learning_rate": 1.0819233104040737e-06, - "loss": 0.7422, - "step": 57316 - }, - { - "epoch": 1.47, - "learning_rate": 1.08189573292928e-06, - "loss": 0.5625, - "step": 57317 - }, - { - "epoch": 1.47, - "learning_rate": 1.0818681553917821e-06, - "loss": 0.7725, - "step": 57318 - }, - { - "epoch": 1.47, - "learning_rate": 1.0818405777916017e-06, - "loss": 0.7578, - "step": 57319 - }, - { - "epoch": 1.47, - "learning_rate": 1.0818130001287595e-06, - "loss": 0.5549, - "step": 57320 - }, - { - "epoch": 1.47, - "learning_rate": 1.0817854224032773e-06, - "loss": 0.6279, - "step": 57321 - }, - { - "epoch": 1.47, - "learning_rate": 1.0817578446151752e-06, - "loss": 0.6987, - "step": 57322 - }, - { - "epoch": 1.47, - "learning_rate": 1.0817302667644754e-06, - "loss": 0.7842, - "step": 57323 - }, - { - "epoch": 1.47, - "learning_rate": 1.0817026888511982e-06, - "loss": 0.7236, - "step": 57324 - }, - { - "epoch": 1.47, - "learning_rate": 1.081675110875365e-06, - "loss": 0.6602, - "step": 57325 - }, - { - "epoch": 1.47, - "learning_rate": 1.0816475328369969e-06, - "loss": 0.7061, - "step": 57326 - }, - { - "epoch": 1.47, - "learning_rate": 1.0816199547361152e-06, - "loss": 0.6406, - "step": 57327 - }, - { - "epoch": 1.47, - "learning_rate": 1.0815923765727408e-06, - "loss": 0.6064, - "step": 57328 - }, - { - "epoch": 1.47, - "learning_rate": 1.0815647983468949e-06, - "loss": 0.6125, - "step": 57329 - }, - { - "epoch": 1.47, - "learning_rate": 1.0815372200585984e-06, - "loss": 0.6816, - "step": 57330 - }, - { - "epoch": 1.47, - "learning_rate": 1.081509641707873e-06, - "loss": 0.7256, - "step": 57331 - }, - { - "epoch": 1.47, - "learning_rate": 1.0814820632947389e-06, - "loss": 0.4702, - "step": 57332 - }, - { - "epoch": 1.47, - "learning_rate": 1.0814544848192179e-06, - "loss": 0.5996, - "step": 57333 - }, - { - "epoch": 1.47, - "learning_rate": 1.081426906281331e-06, - "loss": 0.6211, - "step": 57334 - }, - { - "epoch": 1.47, - "learning_rate": 1.0813993276810993e-06, - "loss": 0.6924, - "step": 57335 - }, - { - "epoch": 1.47, - "learning_rate": 1.081371749018544e-06, - "loss": 0.7109, - "step": 57336 - }, - { - "epoch": 1.47, - "learning_rate": 1.0813441702936859e-06, - "loss": 0.7344, - "step": 57337 - }, - { - "epoch": 1.47, - "learning_rate": 1.0813165915065465e-06, - "loss": 0.7539, - "step": 57338 - }, - { - "epoch": 1.47, - "learning_rate": 1.0812890126571462e-06, - "loss": 0.3594, - "step": 57339 - }, - { - "epoch": 1.47, - "learning_rate": 1.0812614337455073e-06, - "loss": 0.4241, - "step": 57340 - }, - { - "epoch": 1.47, - "learning_rate": 1.0812338547716497e-06, - "loss": 0.5972, - "step": 57341 - }, - { - "epoch": 1.47, - "learning_rate": 1.0812062757355955e-06, - "loss": 0.4285, - "step": 57342 - }, - { - "epoch": 1.47, - "learning_rate": 1.0811786966373653e-06, - "loss": 0.5061, - "step": 57343 - }, - { - "epoch": 1.47, - "learning_rate": 1.0811511174769803e-06, - "loss": 0.5491, - "step": 57344 - }, - { - "epoch": 1.47, - "learning_rate": 1.0811235382544614e-06, - "loss": 0.6504, - "step": 57345 - }, - { - "epoch": 1.47, - "learning_rate": 1.0810959589698303e-06, - "loss": 0.6123, - "step": 57346 - }, - { - "epoch": 1.47, - "learning_rate": 1.0810683796231072e-06, - "loss": 0.624, - "step": 57347 - }, - { - "epoch": 1.47, - "learning_rate": 1.0810408002143145e-06, - "loss": 0.6973, - "step": 57348 - }, - { - "epoch": 1.47, - "learning_rate": 1.0810132207434722e-06, - "loss": 0.7344, - "step": 57349 - }, - { - "epoch": 1.47, - "learning_rate": 1.0809856412106018e-06, - "loss": 0.4521, - "step": 57350 - }, - { - "epoch": 1.47, - "learning_rate": 1.0809580616157243e-06, - "loss": 0.6748, - "step": 57351 - }, - { - "epoch": 1.47, - "learning_rate": 1.0809304819588612e-06, - "loss": 0.5186, - "step": 57352 - }, - { - "epoch": 1.47, - "learning_rate": 1.080902902240033e-06, - "loss": 0.6519, - "step": 57353 - }, - { - "epoch": 1.47, - "learning_rate": 1.0808753224592616e-06, - "loss": 0.8145, - "step": 57354 - }, - { - "epoch": 1.47, - "learning_rate": 1.0808477426165674e-06, - "loss": 0.6279, - "step": 57355 - }, - { - "epoch": 1.47, - "learning_rate": 1.080820162711972e-06, - "loss": 0.7354, - "step": 57356 - }, - { - "epoch": 1.47, - "learning_rate": 1.080792582745496e-06, - "loss": 0.3844, - "step": 57357 - }, - { - "epoch": 1.47, - "learning_rate": 1.0807650027171612e-06, - "loss": 0.7168, - "step": 57358 - }, - { - "epoch": 1.47, - "learning_rate": 1.080737422626988e-06, - "loss": 0.6943, - "step": 57359 - }, - { - "epoch": 1.47, - "learning_rate": 1.080709842474998e-06, - "loss": 0.5991, - "step": 57360 - }, - { - "epoch": 1.47, - "learning_rate": 1.0806822622612124e-06, - "loss": 0.5752, - "step": 57361 - }, - { - "epoch": 1.47, - "learning_rate": 1.0806546819856517e-06, - "loss": 0.6328, - "step": 57362 - }, - { - "epoch": 1.47, - "learning_rate": 1.0806271016483379e-06, - "loss": 0.6411, - "step": 57363 - }, - { - "epoch": 1.47, - "learning_rate": 1.0805995212492913e-06, - "loss": 0.7256, - "step": 57364 - }, - { - "epoch": 1.47, - "learning_rate": 1.0805719407885334e-06, - "loss": 0.5715, - "step": 57365 - }, - { - "epoch": 1.47, - "learning_rate": 1.080544360266085e-06, - "loss": 0.6152, - "step": 57366 - }, - { - "epoch": 1.47, - "learning_rate": 1.080516779681968e-06, - "loss": 0.7021, - "step": 57367 - }, - { - "epoch": 1.47, - "learning_rate": 1.0804891990362028e-06, - "loss": 0.4789, - "step": 57368 - }, - { - "epoch": 1.47, - "learning_rate": 1.080461618328811e-06, - "loss": 0.5278, - "step": 57369 - }, - { - "epoch": 1.47, - "learning_rate": 1.080434037559813e-06, - "loss": 0.5635, - "step": 57370 - }, - { - "epoch": 1.47, - "learning_rate": 1.0804064567292305e-06, - "loss": 0.4868, - "step": 57371 - }, - { - "epoch": 1.47, - "learning_rate": 1.0803788758370843e-06, - "loss": 0.666, - "step": 57372 - }, - { - "epoch": 1.47, - "learning_rate": 1.080351294883396e-06, - "loss": 0.6631, - "step": 57373 - }, - { - "epoch": 1.47, - "learning_rate": 1.0803237138681865e-06, - "loss": 0.7109, - "step": 57374 - }, - { - "epoch": 1.47, - "learning_rate": 1.0802961327914765e-06, - "loss": 0.625, - "step": 57375 - }, - { - "epoch": 1.47, - "learning_rate": 1.0802685516532875e-06, - "loss": 0.4843, - "step": 57376 - }, - { - "epoch": 1.47, - "learning_rate": 1.0802409704536406e-06, - "loss": 0.7275, - "step": 57377 - }, - { - "epoch": 1.47, - "learning_rate": 1.0802133891925569e-06, - "loss": 0.7656, - "step": 57378 - }, - { - "epoch": 1.47, - "learning_rate": 1.0801858078700573e-06, - "loss": 0.8008, - "step": 57379 - }, - { - "epoch": 1.47, - "learning_rate": 1.0801582264861636e-06, - "loss": 0.7812, - "step": 57380 - }, - { - "epoch": 1.47, - "learning_rate": 1.080130645040896e-06, - "loss": 0.5483, - "step": 57381 - }, - { - "epoch": 1.47, - "learning_rate": 1.080103063534276e-06, - "loss": 0.5073, - "step": 57382 - }, - { - "epoch": 1.47, - "learning_rate": 1.0800754819663252e-06, - "loss": 0.6646, - "step": 57383 - }, - { - "epoch": 1.47, - "learning_rate": 1.080047900337064e-06, - "loss": 0.6709, - "step": 57384 - }, - { - "epoch": 1.47, - "learning_rate": 1.0800203186465138e-06, - "loss": 0.605, - "step": 57385 - }, - { - "epoch": 1.47, - "learning_rate": 1.0799927368946956e-06, - "loss": 0.5767, - "step": 57386 - }, - { - "epoch": 1.47, - "learning_rate": 1.0799651550816308e-06, - "loss": 0.5322, - "step": 57387 - }, - { - "epoch": 1.47, - "learning_rate": 1.0799375732073406e-06, - "loss": 0.6577, - "step": 57388 - }, - { - "epoch": 1.47, - "learning_rate": 1.0799099912718456e-06, - "loss": 0.6807, - "step": 57389 - }, - { - "epoch": 1.47, - "learning_rate": 1.0798824092751672e-06, - "loss": 0.542, - "step": 57390 - }, - { - "epoch": 1.47, - "learning_rate": 1.0798548272173264e-06, - "loss": 0.7412, - "step": 57391 - }, - { - "epoch": 1.47, - "learning_rate": 1.0798272450983448e-06, - "loss": 0.748, - "step": 57392 - }, - { - "epoch": 1.47, - "learning_rate": 1.0797996629182429e-06, - "loss": 0.6289, - "step": 57393 - }, - { - "epoch": 1.47, - "learning_rate": 1.079772080677042e-06, - "loss": 0.6836, - "step": 57394 - }, - { - "epoch": 1.47, - "learning_rate": 1.0797444983747634e-06, - "loss": 0.5425, - "step": 57395 - }, - { - "epoch": 1.47, - "learning_rate": 1.0797169160114281e-06, - "loss": 0.6494, - "step": 57396 - }, - { - "epoch": 1.47, - "learning_rate": 1.0796893335870571e-06, - "loss": 0.7422, - "step": 57397 - }, - { - "epoch": 1.47, - "learning_rate": 1.079661751101672e-06, - "loss": 0.6846, - "step": 57398 - }, - { - "epoch": 1.47, - "learning_rate": 1.0796341685552933e-06, - "loss": 0.6057, - "step": 57399 - }, - { - "epoch": 1.47, - "learning_rate": 1.0796065859479424e-06, - "loss": 0.5972, - "step": 57400 - }, - { - "epoch": 1.47, - "learning_rate": 1.07957900327964e-06, - "loss": 0.665, - "step": 57401 - }, - { - "epoch": 1.47, - "learning_rate": 1.0795514205504081e-06, - "loss": 0.8848, - "step": 57402 - }, - { - "epoch": 1.47, - "learning_rate": 1.0795238377602673e-06, - "loss": 0.748, - "step": 57403 - }, - { - "epoch": 1.47, - "learning_rate": 1.0794962549092386e-06, - "loss": 0.6743, - "step": 57404 - }, - { - "epoch": 1.47, - "learning_rate": 1.0794686719973434e-06, - "loss": 0.687, - "step": 57405 - }, - { - "epoch": 1.47, - "learning_rate": 1.0794410890246026e-06, - "loss": 0.6611, - "step": 57406 - }, - { - "epoch": 1.47, - "learning_rate": 1.0794135059910374e-06, - "loss": 0.4016, - "step": 57407 - }, - { - "epoch": 1.47, - "learning_rate": 1.079385922896669e-06, - "loss": 0.707, - "step": 57408 - }, - { - "epoch": 1.47, - "learning_rate": 1.0793583397415186e-06, - "loss": 0.7705, - "step": 57409 - }, - { - "epoch": 1.47, - "learning_rate": 1.079330756525607e-06, - "loss": 0.5522, - "step": 57410 - }, - { - "epoch": 1.47, - "learning_rate": 1.0793031732489554e-06, - "loss": 0.6904, - "step": 57411 - }, - { - "epoch": 1.47, - "learning_rate": 1.0792755899115852e-06, - "loss": 0.6836, - "step": 57412 - }, - { - "epoch": 1.47, - "learning_rate": 1.0792480065135174e-06, - "loss": 0.6191, - "step": 57413 - }, - { - "epoch": 1.47, - "learning_rate": 1.0792204230547728e-06, - "loss": 0.6411, - "step": 57414 - }, - { - "epoch": 1.47, - "learning_rate": 1.0791928395353728e-06, - "loss": 0.5955, - "step": 57415 - }, - { - "epoch": 1.47, - "learning_rate": 1.0791652559553384e-06, - "loss": 0.5413, - "step": 57416 - }, - { - "epoch": 1.47, - "learning_rate": 1.079137672314691e-06, - "loss": 0.6958, - "step": 57417 - }, - { - "epoch": 1.47, - "learning_rate": 1.0791100886134515e-06, - "loss": 0.7109, - "step": 57418 - }, - { - "epoch": 1.47, - "learning_rate": 1.079082504851641e-06, - "loss": 0.5621, - "step": 57419 - }, - { - "epoch": 1.47, - "learning_rate": 1.0790549210292805e-06, - "loss": 0.6274, - "step": 57420 - }, - { - "epoch": 1.47, - "learning_rate": 1.0790273371463916e-06, - "loss": 0.6147, - "step": 57421 - }, - { - "epoch": 1.47, - "learning_rate": 1.0789997532029946e-06, - "loss": 0.7441, - "step": 57422 - }, - { - "epoch": 1.47, - "learning_rate": 1.0789721691991115e-06, - "loss": 0.6089, - "step": 57423 - }, - { - "epoch": 1.47, - "learning_rate": 1.0789445851347632e-06, - "loss": 0.7715, - "step": 57424 - }, - { - "epoch": 1.47, - "learning_rate": 1.0789170010099703e-06, - "loss": 0.6357, - "step": 57425 - }, - { - "epoch": 1.47, - "learning_rate": 1.0788894168247546e-06, - "loss": 0.5488, - "step": 57426 - }, - { - "epoch": 1.47, - "learning_rate": 1.0788618325791367e-06, - "loss": 0.7612, - "step": 57427 - }, - { - "epoch": 1.47, - "learning_rate": 1.0788342482731381e-06, - "loss": 0.5828, - "step": 57428 - }, - { - "epoch": 1.47, - "learning_rate": 1.0788066639067793e-06, - "loss": 0.6021, - "step": 57429 - }, - { - "epoch": 1.47, - "learning_rate": 1.0787790794800824e-06, - "loss": 0.6221, - "step": 57430 - }, - { - "epoch": 1.47, - "learning_rate": 1.0787514949930675e-06, - "loss": 0.7549, - "step": 57431 - }, - { - "epoch": 1.47, - "learning_rate": 1.0787239104457567e-06, - "loss": 0.5454, - "step": 57432 - }, - { - "epoch": 1.47, - "learning_rate": 1.0786963258381703e-06, - "loss": 0.637, - "step": 57433 - }, - { - "epoch": 1.47, - "learning_rate": 1.07866874117033e-06, - "loss": 0.4211, - "step": 57434 - }, - { - "epoch": 1.47, - "learning_rate": 1.0786411564422562e-06, - "loss": 0.6138, - "step": 57435 - }, - { - "epoch": 1.47, - "learning_rate": 1.0786135716539708e-06, - "loss": 0.7485, - "step": 57436 - }, - { - "epoch": 1.47, - "learning_rate": 1.0785859868054946e-06, - "loss": 0.7305, - "step": 57437 - }, - { - "epoch": 1.47, - "learning_rate": 1.0785584018968488e-06, - "loss": 0.623, - "step": 57438 - }, - { - "epoch": 1.47, - "learning_rate": 1.0785308169280543e-06, - "loss": 0.752, - "step": 57439 - }, - { - "epoch": 1.47, - "learning_rate": 1.0785032318991326e-06, - "loss": 0.6616, - "step": 57440 - }, - { - "epoch": 1.47, - "learning_rate": 1.0784756468101039e-06, - "loss": 0.3821, - "step": 57441 - }, - { - "epoch": 1.47, - "learning_rate": 1.0784480616609907e-06, - "loss": 0.7549, - "step": 57442 - }, - { - "epoch": 1.47, - "learning_rate": 1.0784204764518132e-06, - "loss": 0.6309, - "step": 57443 - }, - { - "epoch": 1.47, - "learning_rate": 1.078392891182593e-06, - "loss": 0.4417, - "step": 57444 - }, - { - "epoch": 1.47, - "learning_rate": 1.0783653058533505e-06, - "loss": 0.668, - "step": 57445 - }, - { - "epoch": 1.47, - "learning_rate": 1.0783377204641075e-06, - "loss": 0.5693, - "step": 57446 - }, - { - "epoch": 1.47, - "learning_rate": 1.0783101350148848e-06, - "loss": 0.7427, - "step": 57447 - }, - { - "epoch": 1.47, - "learning_rate": 1.0782825495057037e-06, - "loss": 0.4513, - "step": 57448 - }, - { - "epoch": 1.47, - "learning_rate": 1.0782549639365854e-06, - "loss": 0.7236, - "step": 57449 - }, - { - "epoch": 1.47, - "learning_rate": 1.0782273783075508e-06, - "loss": 0.6045, - "step": 57450 - }, - { - "epoch": 1.47, - "learning_rate": 1.078199792618621e-06, - "loss": 0.708, - "step": 57451 - }, - { - "epoch": 1.47, - "learning_rate": 1.0781722068698172e-06, - "loss": 0.4653, - "step": 57452 - }, - { - "epoch": 1.47, - "learning_rate": 1.078144621061161e-06, - "loss": 0.5991, - "step": 57453 - }, - { - "epoch": 1.47, - "learning_rate": 1.0781170351926724e-06, - "loss": 0.7666, - "step": 57454 - }, - { - "epoch": 1.47, - "learning_rate": 1.0780894492643734e-06, - "loss": 0.6621, - "step": 57455 - }, - { - "epoch": 1.47, - "learning_rate": 1.078061863276285e-06, - "loss": 0.8193, - "step": 57456 - }, - { - "epoch": 1.47, - "learning_rate": 1.0780342772284283e-06, - "loss": 0.6113, - "step": 57457 - }, - { - "epoch": 1.47, - "learning_rate": 1.0780066911208243e-06, - "loss": 0.7432, - "step": 57458 - }, - { - "epoch": 1.47, - "learning_rate": 1.077979104953494e-06, - "loss": 0.7002, - "step": 57459 - }, - { - "epoch": 1.47, - "learning_rate": 1.0779515187264586e-06, - "loss": 0.7881, - "step": 57460 - }, - { - "epoch": 1.47, - "learning_rate": 1.0779239324397396e-06, - "loss": 0.5537, - "step": 57461 - }, - { - "epoch": 1.47, - "learning_rate": 1.0778963460933576e-06, - "loss": 0.6348, - "step": 57462 - }, - { - "epoch": 1.47, - "learning_rate": 1.0778687596873344e-06, - "loss": 0.5161, - "step": 57463 - }, - { - "epoch": 1.47, - "learning_rate": 1.0778411732216902e-06, - "loss": 0.5378, - "step": 57464 - }, - { - "epoch": 1.47, - "learning_rate": 1.0778135866964466e-06, - "loss": 0.4395, - "step": 57465 - }, - { - "epoch": 1.47, - "learning_rate": 1.0777860001116249e-06, - "loss": 0.7495, - "step": 57466 - }, - { - "epoch": 1.47, - "learning_rate": 1.077758413467246e-06, - "loss": 0.439, - "step": 57467 - }, - { - "epoch": 1.47, - "learning_rate": 1.077730826763331e-06, - "loss": 0.6045, - "step": 57468 - }, - { - "epoch": 1.47, - "learning_rate": 1.0777032399999009e-06, - "loss": 0.5093, - "step": 57469 - }, - { - "epoch": 1.47, - "learning_rate": 1.0776756531769773e-06, - "loss": 0.5771, - "step": 57470 - }, - { - "epoch": 1.47, - "learning_rate": 1.077648066294581e-06, - "loss": 0.5264, - "step": 57471 - }, - { - "epoch": 1.47, - "learning_rate": 1.077620479352733e-06, - "loss": 0.7148, - "step": 57472 - }, - { - "epoch": 1.47, - "learning_rate": 1.0775928923514546e-06, - "loss": 0.5596, - "step": 57473 - }, - { - "epoch": 1.47, - "learning_rate": 1.077565305290767e-06, - "loss": 0.5957, - "step": 57474 - }, - { - "epoch": 1.47, - "learning_rate": 1.077537718170691e-06, - "loss": 0.7949, - "step": 57475 - }, - { - "epoch": 1.47, - "learning_rate": 1.0775101309912483e-06, - "loss": 0.5317, - "step": 57476 - }, - { - "epoch": 1.47, - "learning_rate": 1.0774825437524593e-06, - "loss": 0.6562, - "step": 57477 - }, - { - "epoch": 1.47, - "learning_rate": 1.0774549564543459e-06, - "loss": 0.5879, - "step": 57478 - }, - { - "epoch": 1.47, - "learning_rate": 1.0774273690969282e-06, - "loss": 0.6091, - "step": 57479 - }, - { - "epoch": 1.47, - "learning_rate": 1.0773997816802282e-06, - "loss": 0.5933, - "step": 57480 - }, - { - "epoch": 1.47, - "learning_rate": 1.0773721942042668e-06, - "loss": 0.7383, - "step": 57481 - }, - { - "epoch": 1.47, - "learning_rate": 1.0773446066690653e-06, - "loss": 0.7285, - "step": 57482 - }, - { - "epoch": 1.47, - "learning_rate": 1.0773170190746444e-06, - "loss": 0.6265, - "step": 57483 - }, - { - "epoch": 1.47, - "learning_rate": 1.0772894314210253e-06, - "loss": 0.4624, - "step": 57484 - }, - { - "epoch": 1.47, - "learning_rate": 1.077261843708229e-06, - "loss": 0.6392, - "step": 57485 - }, - { - "epoch": 1.47, - "learning_rate": 1.0772342559362773e-06, - "loss": 0.5742, - "step": 57486 - }, - { - "epoch": 1.47, - "learning_rate": 1.0772066681051908e-06, - "loss": 0.667, - "step": 57487 - }, - { - "epoch": 1.47, - "learning_rate": 1.0771790802149905e-06, - "loss": 0.5693, - "step": 57488 - }, - { - "epoch": 1.47, - "learning_rate": 1.077151492265698e-06, - "loss": 0.5913, - "step": 57489 - }, - { - "epoch": 1.47, - "learning_rate": 1.077123904257334e-06, - "loss": 0.7227, - "step": 57490 - }, - { - "epoch": 1.47, - "learning_rate": 1.0770963161899196e-06, - "loss": 0.7969, - "step": 57491 - }, - { - "epoch": 1.47, - "learning_rate": 1.0770687280634765e-06, - "loss": 0.5381, - "step": 57492 - }, - { - "epoch": 1.47, - "learning_rate": 1.0770411398780253e-06, - "loss": 0.52, - "step": 57493 - }, - { - "epoch": 1.47, - "learning_rate": 1.077013551633587e-06, - "loss": 0.708, - "step": 57494 - }, - { - "epoch": 1.47, - "learning_rate": 1.0769859633301832e-06, - "loss": 0.6514, - "step": 57495 - }, - { - "epoch": 1.47, - "learning_rate": 1.0769583749678345e-06, - "loss": 0.7148, - "step": 57496 - }, - { - "epoch": 1.47, - "learning_rate": 1.0769307865465627e-06, - "loss": 0.6514, - "step": 57497 - }, - { - "epoch": 1.47, - "learning_rate": 1.0769031980663883e-06, - "loss": 0.7666, - "step": 57498 - }, - { - "epoch": 1.47, - "learning_rate": 1.0768756095273328e-06, - "loss": 0.7578, - "step": 57499 - }, - { - "epoch": 1.47, - "learning_rate": 1.0768480209294168e-06, - "loss": 0.7236, - "step": 57500 - }, - { - "epoch": 1.47, - "learning_rate": 1.0768204322726622e-06, - "loss": 0.6729, - "step": 57501 - }, - { - "epoch": 1.47, - "learning_rate": 1.0767928435570897e-06, - "loss": 0.645, - "step": 57502 - }, - { - "epoch": 1.47, - "learning_rate": 1.0767652547827205e-06, - "loss": 0.6494, - "step": 57503 - }, - { - "epoch": 1.47, - "learning_rate": 1.0767376659495753e-06, - "loss": 0.541, - "step": 57504 - }, - { - "epoch": 1.47, - "learning_rate": 1.076710077057676e-06, - "loss": 0.5427, - "step": 57505 - }, - { - "epoch": 1.47, - "learning_rate": 1.076682488107043e-06, - "loss": 0.5806, - "step": 57506 - }, - { - "epoch": 1.47, - "learning_rate": 1.076654899097698e-06, - "loss": 0.666, - "step": 57507 - }, - { - "epoch": 1.47, - "learning_rate": 1.0766273100296616e-06, - "loss": 0.6001, - "step": 57508 - }, - { - "epoch": 1.47, - "learning_rate": 1.0765997209029556e-06, - "loss": 0.8369, - "step": 57509 - }, - { - "epoch": 1.47, - "learning_rate": 1.0765721317176002e-06, - "loss": 0.7246, - "step": 57510 - }, - { - "epoch": 1.47, - "learning_rate": 1.0765445424736174e-06, - "loss": 0.4216, - "step": 57511 - }, - { - "epoch": 1.47, - "learning_rate": 1.076516953171028e-06, - "loss": 0.4208, - "step": 57512 - }, - { - "epoch": 1.47, - "learning_rate": 1.076489363809853e-06, - "loss": 0.8428, - "step": 57513 - }, - { - "epoch": 1.47, - "learning_rate": 1.0764617743901133e-06, - "loss": 0.5283, - "step": 57514 - }, - { - "epoch": 1.47, - "learning_rate": 1.0764341849118306e-06, - "loss": 0.5918, - "step": 57515 - }, - { - "epoch": 1.47, - "learning_rate": 1.0764065953750258e-06, - "loss": 0.7471, - "step": 57516 - }, - { - "epoch": 1.47, - "learning_rate": 1.0763790057797202e-06, - "loss": 0.5713, - "step": 57517 - }, - { - "epoch": 1.47, - "learning_rate": 1.0763514161259345e-06, - "loss": 0.6689, - "step": 57518 - }, - { - "epoch": 1.47, - "learning_rate": 1.0763238264136898e-06, - "loss": 0.7061, - "step": 57519 - }, - { - "epoch": 1.47, - "learning_rate": 1.0762962366430078e-06, - "loss": 0.7178, - "step": 57520 - }, - { - "epoch": 1.47, - "learning_rate": 1.0762686468139088e-06, - "loss": 0.6318, - "step": 57521 - }, - { - "epoch": 1.47, - "learning_rate": 1.076241056926415e-06, - "loss": 0.7773, - "step": 57522 - }, - { - "epoch": 1.47, - "learning_rate": 1.0762134669805466e-06, - "loss": 0.6641, - "step": 57523 - }, - { - "epoch": 1.47, - "learning_rate": 1.0761858769763253e-06, - "loss": 0.7148, - "step": 57524 - }, - { - "epoch": 1.47, - "learning_rate": 1.0761582869137716e-06, - "loss": 0.5684, - "step": 57525 - }, - { - "epoch": 1.47, - "learning_rate": 1.0761306967929075e-06, - "loss": 0.7363, - "step": 57526 - }, - { - "epoch": 1.47, - "learning_rate": 1.076103106613753e-06, - "loss": 0.6421, - "step": 57527 - }, - { - "epoch": 1.47, - "learning_rate": 1.0760755163763305e-06, - "loss": 0.6914, - "step": 57528 - }, - { - "epoch": 1.47, - "learning_rate": 1.07604792608066e-06, - "loss": 0.6575, - "step": 57529 - }, - { - "epoch": 1.47, - "learning_rate": 1.0760203357267633e-06, - "loss": 0.5669, - "step": 57530 - }, - { - "epoch": 1.47, - "learning_rate": 1.075992745314661e-06, - "loss": 0.6152, - "step": 57531 - }, - { - "epoch": 1.47, - "learning_rate": 1.075965154844375e-06, - "loss": 0.6328, - "step": 57532 - }, - { - "epoch": 1.47, - "learning_rate": 1.0759375643159258e-06, - "loss": 0.7412, - "step": 57533 - }, - { - "epoch": 1.47, - "learning_rate": 1.0759099737293348e-06, - "loss": 0.748, - "step": 57534 - }, - { - "epoch": 1.47, - "learning_rate": 1.0758823830846227e-06, - "loss": 0.7019, - "step": 57535 - }, - { - "epoch": 1.47, - "learning_rate": 1.0758547923818114e-06, - "loss": 0.6172, - "step": 57536 - }, - { - "epoch": 1.47, - "learning_rate": 1.0758272016209213e-06, - "loss": 0.71, - "step": 57537 - }, - { - "epoch": 1.47, - "learning_rate": 1.0757996108019735e-06, - "loss": 0.5566, - "step": 57538 - }, - { - "epoch": 1.47, - "learning_rate": 1.07577201992499e-06, - "loss": 0.6934, - "step": 57539 - }, - { - "epoch": 1.47, - "learning_rate": 1.0757444289899909e-06, - "loss": 0.6396, - "step": 57540 - }, - { - "epoch": 1.47, - "learning_rate": 1.0757168379969981e-06, - "loss": 0.7061, - "step": 57541 - }, - { - "epoch": 1.47, - "learning_rate": 1.0756892469460323e-06, - "loss": 0.7041, - "step": 57542 - }, - { - "epoch": 1.47, - "learning_rate": 1.0756616558371147e-06, - "loss": 0.6714, - "step": 57543 - }, - { - "epoch": 1.47, - "learning_rate": 1.0756340646702663e-06, - "loss": 0.6001, - "step": 57544 - }, - { - "epoch": 1.47, - "learning_rate": 1.0756064734455086e-06, - "loss": 0.5388, - "step": 57545 - }, - { - "epoch": 1.47, - "learning_rate": 1.0755788821628624e-06, - "loss": 0.4956, - "step": 57546 - }, - { - "epoch": 1.47, - "learning_rate": 1.0755512908223492e-06, - "loss": 0.6069, - "step": 57547 - }, - { - "epoch": 1.47, - "learning_rate": 1.0755236994239896e-06, - "loss": 0.6123, - "step": 57548 - }, - { - "epoch": 1.48, - "learning_rate": 1.0754961079678049e-06, - "loss": 0.709, - "step": 57549 - }, - { - "epoch": 1.48, - "learning_rate": 1.0754685164538162e-06, - "loss": 0.4456, - "step": 57550 - }, - { - "epoch": 1.48, - "learning_rate": 1.0754409248820452e-06, - "loss": 0.6987, - "step": 57551 - }, - { - "epoch": 1.48, - "learning_rate": 1.0754133332525123e-06, - "loss": 0.6934, - "step": 57552 - }, - { - "epoch": 1.48, - "learning_rate": 1.0753857415652388e-06, - "loss": 0.624, - "step": 57553 - }, - { - "epoch": 1.48, - "learning_rate": 1.0753581498202458e-06, - "loss": 0.8232, - "step": 57554 - }, - { - "epoch": 1.48, - "learning_rate": 1.0753305580175548e-06, - "loss": 0.6289, - "step": 57555 - }, - { - "epoch": 1.48, - "learning_rate": 1.075302966157186e-06, - "loss": 0.6152, - "step": 57556 - }, - { - "epoch": 1.48, - "learning_rate": 1.075275374239162e-06, - "loss": 0.7627, - "step": 57557 - }, - { - "epoch": 1.48, - "learning_rate": 1.0752477822635028e-06, - "loss": 0.7017, - "step": 57558 - }, - { - "epoch": 1.48, - "learning_rate": 1.0752201902302298e-06, - "loss": 0.7354, - "step": 57559 - }, - { - "epoch": 1.48, - "learning_rate": 1.0751925981393644e-06, - "loss": 0.542, - "step": 57560 - }, - { - "epoch": 1.48, - "learning_rate": 1.0751650059909272e-06, - "loss": 0.6641, - "step": 57561 - }, - { - "epoch": 1.48, - "learning_rate": 1.0751374137849399e-06, - "loss": 0.6875, - "step": 57562 - }, - { - "epoch": 1.48, - "learning_rate": 1.075109821521423e-06, - "loss": 0.5796, - "step": 57563 - }, - { - "epoch": 1.48, - "learning_rate": 1.075082229200398e-06, - "loss": 0.5439, - "step": 57564 - }, - { - "epoch": 1.48, - "learning_rate": 1.075054636821886e-06, - "loss": 0.6113, - "step": 57565 - }, - { - "epoch": 1.48, - "learning_rate": 1.0750270443859084e-06, - "loss": 0.8682, - "step": 57566 - }, - { - "epoch": 1.48, - "learning_rate": 1.074999451892486e-06, - "loss": 0.6855, - "step": 57567 - }, - { - "epoch": 1.48, - "learning_rate": 1.0749718593416397e-06, - "loss": 0.6592, - "step": 57568 - }, - { - "epoch": 1.48, - "learning_rate": 1.074944266733391e-06, - "loss": 0.6172, - "step": 57569 - }, - { - "epoch": 1.48, - "learning_rate": 1.074916674067761e-06, - "loss": 0.5035, - "step": 57570 - }, - { - "epoch": 1.48, - "learning_rate": 1.0748890813447703e-06, - "loss": 0.6865, - "step": 57571 - }, - { - "epoch": 1.48, - "learning_rate": 1.0748614885644413e-06, - "loss": 0.4342, - "step": 57572 - }, - { - "epoch": 1.48, - "learning_rate": 1.0748338957267938e-06, - "loss": 0.6548, - "step": 57573 - }, - { - "epoch": 1.48, - "learning_rate": 1.0748063028318495e-06, - "loss": 0.7354, - "step": 57574 - }, - { - "epoch": 1.48, - "learning_rate": 1.0747787098796293e-06, - "loss": 0.7109, - "step": 57575 - }, - { - "epoch": 1.48, - "learning_rate": 1.0747511168701546e-06, - "loss": 0.5962, - "step": 57576 - }, - { - "epoch": 1.48, - "learning_rate": 1.0747235238034467e-06, - "loss": 0.6016, - "step": 57577 - }, - { - "epoch": 1.48, - "learning_rate": 1.0746959306795257e-06, - "loss": 0.6245, - "step": 57578 - }, - { - "epoch": 1.48, - "learning_rate": 1.0746683374984142e-06, - "loss": 0.6147, - "step": 57579 - }, - { - "epoch": 1.48, - "learning_rate": 1.0746407442601323e-06, - "loss": 0.5513, - "step": 57580 - }, - { - "epoch": 1.48, - "learning_rate": 1.0746131509647014e-06, - "loss": 0.6548, - "step": 57581 - }, - { - "epoch": 1.48, - "learning_rate": 1.0745855576121425e-06, - "loss": 0.4275, - "step": 57582 - }, - { - "epoch": 1.48, - "learning_rate": 1.0745579642024773e-06, - "loss": 0.749, - "step": 57583 - }, - { - "epoch": 1.48, - "learning_rate": 1.0745303707357261e-06, - "loss": 0.6416, - "step": 57584 - }, - { - "epoch": 1.48, - "learning_rate": 1.0745027772119106e-06, - "loss": 0.7217, - "step": 57585 - }, - { - "epoch": 1.48, - "learning_rate": 1.0744751836310515e-06, - "loss": 0.7188, - "step": 57586 - }, - { - "epoch": 1.48, - "learning_rate": 1.0744475899931707e-06, - "loss": 0.6372, - "step": 57587 - }, - { - "epoch": 1.48, - "learning_rate": 1.0744199962982883e-06, - "loss": 0.7158, - "step": 57588 - }, - { - "epoch": 1.48, - "learning_rate": 1.0743924025464263e-06, - "loss": 0.6455, - "step": 57589 - }, - { - "epoch": 1.48, - "learning_rate": 1.0743648087376048e-06, - "loss": 0.7139, - "step": 57590 - }, - { - "epoch": 1.48, - "learning_rate": 1.0743372148718463e-06, - "loss": 0.4658, - "step": 57591 - }, - { - "epoch": 1.48, - "learning_rate": 1.0743096209491711e-06, - "loss": 0.5859, - "step": 57592 - }, - { - "epoch": 1.48, - "learning_rate": 1.0742820269696001e-06, - "loss": 0.6797, - "step": 57593 - }, - { - "epoch": 1.48, - "learning_rate": 1.0742544329331551e-06, - "loss": 0.5222, - "step": 57594 - }, - { - "epoch": 1.48, - "learning_rate": 1.0742268388398569e-06, - "loss": 0.7041, - "step": 57595 - }, - { - "epoch": 1.48, - "learning_rate": 1.074199244689726e-06, - "loss": 0.7373, - "step": 57596 - }, - { - "epoch": 1.48, - "learning_rate": 1.0741716504827852e-06, - "loss": 0.5562, - "step": 57597 - }, - { - "epoch": 1.48, - "learning_rate": 1.074144056219054e-06, - "loss": 0.6265, - "step": 57598 - }, - { - "epoch": 1.48, - "learning_rate": 1.074116461898554e-06, - "loss": 0.7217, - "step": 57599 - }, - { - "epoch": 1.48, - "learning_rate": 1.0740888675213064e-06, - "loss": 0.6709, - "step": 57600 - }, - { - "epoch": 1.48, - "learning_rate": 1.0740612730873327e-06, - "loss": 0.7412, - "step": 57601 - }, - { - "epoch": 1.48, - "learning_rate": 1.0740336785966536e-06, - "loss": 0.5303, - "step": 57602 - }, - { - "epoch": 1.48, - "learning_rate": 1.07400608404929e-06, - "loss": 0.709, - "step": 57603 - }, - { - "epoch": 1.48, - "learning_rate": 1.0739784894452634e-06, - "loss": 0.7842, - "step": 57604 - }, - { - "epoch": 1.48, - "learning_rate": 1.073950894784595e-06, - "loss": 0.5151, - "step": 57605 - }, - { - "epoch": 1.48, - "learning_rate": 1.0739233000673061e-06, - "loss": 0.5928, - "step": 57606 - }, - { - "epoch": 1.48, - "learning_rate": 1.0738957052934173e-06, - "loss": 0.4004, - "step": 57607 - }, - { - "epoch": 1.48, - "learning_rate": 1.0738681104629498e-06, - "loss": 0.4071, - "step": 57608 - }, - { - "epoch": 1.48, - "learning_rate": 1.073840515575925e-06, - "loss": 0.4524, - "step": 57609 - }, - { - "epoch": 1.48, - "learning_rate": 1.073812920632364e-06, - "loss": 0.6362, - "step": 57610 - }, - { - "epoch": 1.48, - "learning_rate": 1.0737853256322875e-06, - "loss": 0.6162, - "step": 57611 - }, - { - "epoch": 1.48, - "learning_rate": 1.0737577305757175e-06, - "loss": 0.6875, - "step": 57612 - }, - { - "epoch": 1.48, - "learning_rate": 1.0737301354626743e-06, - "loss": 0.6274, - "step": 57613 - }, - { - "epoch": 1.48, - "learning_rate": 1.0737025402931794e-06, - "loss": 0.6426, - "step": 57614 - }, - { - "epoch": 1.48, - "learning_rate": 1.0736749450672536e-06, - "loss": 0.6304, - "step": 57615 - }, - { - "epoch": 1.48, - "learning_rate": 1.0736473497849186e-06, - "loss": 0.7607, - "step": 57616 - }, - { - "epoch": 1.48, - "learning_rate": 1.0736197544461952e-06, - "loss": 0.6172, - "step": 57617 - }, - { - "epoch": 1.48, - "learning_rate": 1.0735921590511043e-06, - "loss": 0.5383, - "step": 57618 - }, - { - "epoch": 1.48, - "learning_rate": 1.0735645635996674e-06, - "loss": 0.7939, - "step": 57619 - }, - { - "epoch": 1.48, - "learning_rate": 1.0735369680919054e-06, - "loss": 0.7393, - "step": 57620 - }, - { - "epoch": 1.48, - "learning_rate": 1.0735093725278397e-06, - "loss": 0.6338, - "step": 57621 - }, - { - "epoch": 1.48, - "learning_rate": 1.0734817769074913e-06, - "loss": 0.5708, - "step": 57622 - }, - { - "epoch": 1.48, - "learning_rate": 1.073454181230881e-06, - "loss": 0.4712, - "step": 57623 - }, - { - "epoch": 1.48, - "learning_rate": 1.0734265854980308e-06, - "loss": 0.7744, - "step": 57624 - }, - { - "epoch": 1.48, - "learning_rate": 1.0733989897089604e-06, - "loss": 0.8018, - "step": 57625 - }, - { - "epoch": 1.48, - "learning_rate": 1.0733713938636925e-06, - "loss": 0.6006, - "step": 57626 - }, - { - "epoch": 1.48, - "learning_rate": 1.0733437979622471e-06, - "loss": 0.7012, - "step": 57627 - }, - { - "epoch": 1.48, - "learning_rate": 1.0733162020046456e-06, - "loss": 0.6592, - "step": 57628 - }, - { - "epoch": 1.48, - "learning_rate": 1.0732886059909093e-06, - "loss": 0.6543, - "step": 57629 - }, - { - "epoch": 1.48, - "learning_rate": 1.0732610099210595e-06, - "loss": 0.6328, - "step": 57630 - }, - { - "epoch": 1.48, - "learning_rate": 1.0732334137951172e-06, - "loss": 0.5303, - "step": 57631 - }, - { - "epoch": 1.48, - "learning_rate": 1.0732058176131034e-06, - "loss": 0.6514, - "step": 57632 - }, - { - "epoch": 1.48, - "learning_rate": 1.0731782213750391e-06, - "loss": 0.6875, - "step": 57633 - }, - { - "epoch": 1.48, - "learning_rate": 1.0731506250809457e-06, - "loss": 0.7031, - "step": 57634 - }, - { - "epoch": 1.48, - "learning_rate": 1.0731230287308442e-06, - "loss": 0.6592, - "step": 57635 - }, - { - "epoch": 1.48, - "learning_rate": 1.0730954323247557e-06, - "loss": 0.7031, - "step": 57636 - }, - { - "epoch": 1.48, - "learning_rate": 1.0730678358627016e-06, - "loss": 0.9004, - "step": 57637 - }, - { - "epoch": 1.48, - "learning_rate": 1.0730402393447025e-06, - "loss": 0.6836, - "step": 57638 - }, - { - "epoch": 1.48, - "learning_rate": 1.0730126427707801e-06, - "loss": 0.6948, - "step": 57639 - }, - { - "epoch": 1.48, - "learning_rate": 1.072985046140955e-06, - "loss": 0.7383, - "step": 57640 - }, - { - "epoch": 1.48, - "learning_rate": 1.072957449455249e-06, - "loss": 0.6719, - "step": 57641 - }, - { - "epoch": 1.48, - "learning_rate": 1.0729298527136824e-06, - "loss": 0.6211, - "step": 57642 - }, - { - "epoch": 1.48, - "learning_rate": 1.0729022559162772e-06, - "loss": 0.5249, - "step": 57643 - }, - { - "epoch": 1.48, - "learning_rate": 1.0728746590630538e-06, - "loss": 0.6162, - "step": 57644 - }, - { - "epoch": 1.48, - "learning_rate": 1.0728470621540337e-06, - "loss": 0.7588, - "step": 57645 - }, - { - "epoch": 1.48, - "learning_rate": 1.0728194651892379e-06, - "loss": 0.5952, - "step": 57646 - }, - { - "epoch": 1.48, - "learning_rate": 1.0727918681686877e-06, - "loss": 0.574, - "step": 57647 - }, - { - "epoch": 1.48, - "learning_rate": 1.0727642710924043e-06, - "loss": 0.4351, - "step": 57648 - }, - { - "epoch": 1.48, - "learning_rate": 1.0727366739604082e-06, - "loss": 0.6011, - "step": 57649 - }, - { - "epoch": 1.48, - "learning_rate": 1.072709076772721e-06, - "loss": 0.8701, - "step": 57650 - }, - { - "epoch": 1.48, - "learning_rate": 1.0726814795293642e-06, - "loss": 0.5469, - "step": 57651 - }, - { - "epoch": 1.48, - "learning_rate": 1.0726538822303586e-06, - "loss": 0.6387, - "step": 57652 - }, - { - "epoch": 1.48, - "learning_rate": 1.0726262848757249e-06, - "loss": 0.6982, - "step": 57653 - }, - { - "epoch": 1.48, - "learning_rate": 1.0725986874654847e-06, - "loss": 0.7354, - "step": 57654 - }, - { - "epoch": 1.48, - "learning_rate": 1.0725710899996587e-06, - "loss": 0.3763, - "step": 57655 - }, - { - "epoch": 1.48, - "learning_rate": 1.0725434924782688e-06, - "loss": 0.7686, - "step": 57656 - }, - { - "epoch": 1.48, - "learning_rate": 1.0725158949013355e-06, - "loss": 0.5005, - "step": 57657 - }, - { - "epoch": 1.48, - "learning_rate": 1.0724882972688801e-06, - "loss": 0.6685, - "step": 57658 - }, - { - "epoch": 1.48, - "learning_rate": 1.0724606995809237e-06, - "loss": 0.6523, - "step": 57659 - }, - { - "epoch": 1.48, - "learning_rate": 1.0724331018374877e-06, - "loss": 0.5781, - "step": 57660 - }, - { - "epoch": 1.48, - "learning_rate": 1.0724055040385929e-06, - "loss": 0.7646, - "step": 57661 - }, - { - "epoch": 1.48, - "learning_rate": 1.0723779061842606e-06, - "loss": 0.6475, - "step": 57662 - }, - { - "epoch": 1.48, - "learning_rate": 1.0723503082745118e-06, - "loss": 0.6279, - "step": 57663 - }, - { - "epoch": 1.48, - "learning_rate": 1.0723227103093677e-06, - "loss": 0.6641, - "step": 57664 - }, - { - "epoch": 1.48, - "learning_rate": 1.0722951122888492e-06, - "loss": 0.7744, - "step": 57665 - }, - { - "epoch": 1.48, - "learning_rate": 1.072267514212978e-06, - "loss": 0.7158, - "step": 57666 - }, - { - "epoch": 1.48, - "learning_rate": 1.0722399160817747e-06, - "loss": 0.7529, - "step": 57667 - }, - { - "epoch": 1.48, - "learning_rate": 1.0722123178952604e-06, - "loss": 0.5962, - "step": 57668 - }, - { - "epoch": 1.48, - "learning_rate": 1.072184719653457e-06, - "loss": 0.5615, - "step": 57669 - }, - { - "epoch": 1.48, - "learning_rate": 1.0721571213563847e-06, - "loss": 0.5195, - "step": 57670 - }, - { - "epoch": 1.48, - "learning_rate": 1.072129523004065e-06, - "loss": 0.748, - "step": 57671 - }, - { - "epoch": 1.48, - "learning_rate": 1.0721019245965192e-06, - "loss": 0.7725, - "step": 57672 - }, - { - "epoch": 1.48, - "learning_rate": 1.0720743261337684e-06, - "loss": 0.5869, - "step": 57673 - }, - { - "epoch": 1.48, - "learning_rate": 1.0720467276158332e-06, - "loss": 0.6504, - "step": 57674 - }, - { - "epoch": 1.48, - "learning_rate": 1.0720191290427355e-06, - "loss": 0.7266, - "step": 57675 - }, - { - "epoch": 1.48, - "learning_rate": 1.0719915304144958e-06, - "loss": 0.6348, - "step": 57676 - }, - { - "epoch": 1.48, - "learning_rate": 1.0719639317311357e-06, - "loss": 0.6416, - "step": 57677 - }, - { - "epoch": 1.48, - "learning_rate": 1.0719363329926757e-06, - "loss": 0.6548, - "step": 57678 - }, - { - "epoch": 1.48, - "learning_rate": 1.071908734199138e-06, - "loss": 0.8008, - "step": 57679 - }, - { - "epoch": 1.48, - "learning_rate": 1.0718811353505426e-06, - "loss": 0.8145, - "step": 57680 - }, - { - "epoch": 1.48, - "learning_rate": 1.0718535364469114e-06, - "loss": 0.5562, - "step": 57681 - }, - { - "epoch": 1.48, - "learning_rate": 1.0718259374882652e-06, - "loss": 0.688, - "step": 57682 - }, - { - "epoch": 1.48, - "learning_rate": 1.0717983384746251e-06, - "loss": 0.6289, - "step": 57683 - }, - { - "epoch": 1.48, - "learning_rate": 1.0717707394060122e-06, - "loss": 0.5811, - "step": 57684 - }, - { - "epoch": 1.48, - "learning_rate": 1.0717431402824478e-06, - "loss": 0.584, - "step": 57685 - }, - { - "epoch": 1.48, - "learning_rate": 1.0717155411039532e-06, - "loss": 0.5508, - "step": 57686 - }, - { - "epoch": 1.48, - "learning_rate": 1.0716879418705494e-06, - "loss": 0.4966, - "step": 57687 - }, - { - "epoch": 1.48, - "learning_rate": 1.071660342582257e-06, - "loss": 0.7383, - "step": 57688 - }, - { - "epoch": 1.48, - "learning_rate": 1.0716327432390978e-06, - "loss": 0.6055, - "step": 57689 - }, - { - "epoch": 1.48, - "learning_rate": 1.0716051438410927e-06, - "loss": 0.5752, - "step": 57690 - }, - { - "epoch": 1.48, - "learning_rate": 1.0715775443882629e-06, - "loss": 0.6982, - "step": 57691 - }, - { - "epoch": 1.48, - "learning_rate": 1.0715499448806294e-06, - "loss": 0.5444, - "step": 57692 - }, - { - "epoch": 1.48, - "learning_rate": 1.0715223453182132e-06, - "loss": 0.5908, - "step": 57693 - }, - { - "epoch": 1.48, - "learning_rate": 1.071494745701036e-06, - "loss": 0.4692, - "step": 57694 - }, - { - "epoch": 1.48, - "learning_rate": 1.0714671460291183e-06, - "loss": 0.6665, - "step": 57695 - }, - { - "epoch": 1.48, - "learning_rate": 1.0714395463024815e-06, - "loss": 0.5205, - "step": 57696 - }, - { - "epoch": 1.48, - "learning_rate": 1.071411946521147e-06, - "loss": 0.6123, - "step": 57697 - }, - { - "epoch": 1.48, - "learning_rate": 1.0713843466851353e-06, - "loss": 0.7256, - "step": 57698 - }, - { - "epoch": 1.48, - "learning_rate": 1.071356746794468e-06, - "loss": 0.6421, - "step": 57699 - }, - { - "epoch": 1.48, - "learning_rate": 1.071329146849166e-06, - "loss": 0.5376, - "step": 57700 - }, - { - "epoch": 1.48, - "learning_rate": 1.0713015468492508e-06, - "loss": 0.6836, - "step": 57701 - }, - { - "epoch": 1.48, - "learning_rate": 1.0712739467947434e-06, - "loss": 0.8467, - "step": 57702 - }, - { - "epoch": 1.48, - "learning_rate": 1.0712463466856645e-06, - "loss": 0.6001, - "step": 57703 - }, - { - "epoch": 1.48, - "learning_rate": 1.0712187465220358e-06, - "loss": 0.7051, - "step": 57704 - }, - { - "epoch": 1.48, - "learning_rate": 1.0711911463038778e-06, - "loss": 0.5762, - "step": 57705 - }, - { - "epoch": 1.48, - "learning_rate": 1.0711635460312122e-06, - "loss": 0.5273, - "step": 57706 - }, - { - "epoch": 1.48, - "learning_rate": 1.07113594570406e-06, - "loss": 0.6279, - "step": 57707 - }, - { - "epoch": 1.48, - "learning_rate": 1.0711083453224425e-06, - "loss": 0.7197, - "step": 57708 - }, - { - "epoch": 1.48, - "learning_rate": 1.0710807448863804e-06, - "loss": 0.7861, - "step": 57709 - }, - { - "epoch": 1.48, - "learning_rate": 1.071053144395895e-06, - "loss": 0.5137, - "step": 57710 - }, - { - "epoch": 1.48, - "learning_rate": 1.0710255438510072e-06, - "loss": 0.5232, - "step": 57711 - }, - { - "epoch": 1.48, - "learning_rate": 1.0709979432517389e-06, - "loss": 0.5996, - "step": 57712 - }, - { - "epoch": 1.48, - "learning_rate": 1.0709703425981105e-06, - "loss": 0.6211, - "step": 57713 - }, - { - "epoch": 1.48, - "learning_rate": 1.0709427418901435e-06, - "loss": 0.6267, - "step": 57714 - }, - { - "epoch": 1.48, - "learning_rate": 1.0709151411278587e-06, - "loss": 0.7773, - "step": 57715 - }, - { - "epoch": 1.48, - "learning_rate": 1.0708875403112775e-06, - "loss": 0.6982, - "step": 57716 - }, - { - "epoch": 1.48, - "learning_rate": 1.0708599394404212e-06, - "loss": 0.6685, - "step": 57717 - }, - { - "epoch": 1.48, - "learning_rate": 1.0708323385153105e-06, - "loss": 0.7012, - "step": 57718 - }, - { - "epoch": 1.48, - "learning_rate": 1.0708047375359668e-06, - "loss": 0.5679, - "step": 57719 - }, - { - "epoch": 1.48, - "learning_rate": 1.0707771365024109e-06, - "loss": 0.5083, - "step": 57720 - }, - { - "epoch": 1.48, - "learning_rate": 1.0707495354146645e-06, - "loss": 0.543, - "step": 57721 - }, - { - "epoch": 1.48, - "learning_rate": 1.0707219342727485e-06, - "loss": 0.71, - "step": 57722 - }, - { - "epoch": 1.48, - "learning_rate": 1.0706943330766839e-06, - "loss": 0.7549, - "step": 57723 - }, - { - "epoch": 1.48, - "learning_rate": 1.0706667318264916e-06, - "loss": 0.7539, - "step": 57724 - }, - { - "epoch": 1.48, - "learning_rate": 1.0706391305221933e-06, - "loss": 0.3938, - "step": 57725 - }, - { - "epoch": 1.48, - "learning_rate": 1.0706115291638098e-06, - "loss": 0.752, - "step": 57726 - }, - { - "epoch": 1.48, - "learning_rate": 1.0705839277513627e-06, - "loss": 0.5554, - "step": 57727 - }, - { - "epoch": 1.48, - "learning_rate": 1.070556326284872e-06, - "loss": 0.8242, - "step": 57728 - }, - { - "epoch": 1.48, - "learning_rate": 1.0705287247643602e-06, - "loss": 0.6772, - "step": 57729 - }, - { - "epoch": 1.48, - "learning_rate": 1.0705011231898473e-06, - "loss": 0.5645, - "step": 57730 - }, - { - "epoch": 1.48, - "learning_rate": 1.0704735215613551e-06, - "loss": 0.5688, - "step": 57731 - }, - { - "epoch": 1.48, - "learning_rate": 1.0704459198789049e-06, - "loss": 0.5879, - "step": 57732 - }, - { - "epoch": 1.48, - "learning_rate": 1.0704183181425172e-06, - "loss": 0.707, - "step": 57733 - }, - { - "epoch": 1.48, - "learning_rate": 1.0703907163522132e-06, - "loss": 0.7266, - "step": 57734 - }, - { - "epoch": 1.48, - "learning_rate": 1.0703631145080148e-06, - "loss": 0.6387, - "step": 57735 - }, - { - "epoch": 1.48, - "learning_rate": 1.070335512609942e-06, - "loss": 0.4852, - "step": 57736 - }, - { - "epoch": 1.48, - "learning_rate": 1.0703079106580172e-06, - "loss": 0.6504, - "step": 57737 - }, - { - "epoch": 1.48, - "learning_rate": 1.0702803086522603e-06, - "loss": 0.7539, - "step": 57738 - }, - { - "epoch": 1.48, - "learning_rate": 1.0702527065926932e-06, - "loss": 0.7793, - "step": 57739 - }, - { - "epoch": 1.48, - "learning_rate": 1.070225104479337e-06, - "loss": 0.4559, - "step": 57740 - }, - { - "epoch": 1.48, - "learning_rate": 1.070197502312212e-06, - "loss": 0.709, - "step": 57741 - }, - { - "epoch": 1.48, - "learning_rate": 1.0701699000913409e-06, - "loss": 0.511, - "step": 57742 - }, - { - "epoch": 1.48, - "learning_rate": 1.0701422978167434e-06, - "loss": 0.686, - "step": 57743 - }, - { - "epoch": 1.48, - "learning_rate": 1.0701146954884415e-06, - "loss": 0.7305, - "step": 57744 - }, - { - "epoch": 1.48, - "learning_rate": 1.0700870931064555e-06, - "loss": 0.5894, - "step": 57745 - }, - { - "epoch": 1.48, - "learning_rate": 1.0700594906708077e-06, - "loss": 0.7168, - "step": 57746 - }, - { - "epoch": 1.48, - "learning_rate": 1.0700318881815183e-06, - "loss": 0.7441, - "step": 57747 - }, - { - "epoch": 1.48, - "learning_rate": 1.0700042856386085e-06, - "loss": 0.708, - "step": 57748 - }, - { - "epoch": 1.48, - "learning_rate": 1.0699766830420998e-06, - "loss": 0.7402, - "step": 57749 - }, - { - "epoch": 1.48, - "learning_rate": 1.069949080392013e-06, - "loss": 0.5923, - "step": 57750 - }, - { - "epoch": 1.48, - "learning_rate": 1.0699214776883693e-06, - "loss": 0.6396, - "step": 57751 - }, - { - "epoch": 1.48, - "learning_rate": 1.0698938749311905e-06, - "loss": 0.7412, - "step": 57752 - }, - { - "epoch": 1.48, - "learning_rate": 1.0698662721204967e-06, - "loss": 0.6172, - "step": 57753 - }, - { - "epoch": 1.48, - "learning_rate": 1.06983866925631e-06, - "loss": 0.5315, - "step": 57754 - }, - { - "epoch": 1.48, - "learning_rate": 1.0698110663386504e-06, - "loss": 0.665, - "step": 57755 - }, - { - "epoch": 1.48, - "learning_rate": 1.06978346336754e-06, - "loss": 0.7314, - "step": 57756 - }, - { - "epoch": 1.48, - "learning_rate": 1.0697558603429997e-06, - "loss": 0.6426, - "step": 57757 - }, - { - "epoch": 1.48, - "learning_rate": 1.0697282572650504e-06, - "loss": 0.6357, - "step": 57758 - }, - { - "epoch": 1.48, - "learning_rate": 1.0697006541337134e-06, - "loss": 0.7236, - "step": 57759 - }, - { - "epoch": 1.48, - "learning_rate": 1.06967305094901e-06, - "loss": 0.4971, - "step": 57760 - }, - { - "epoch": 1.48, - "learning_rate": 1.0696454477109606e-06, - "loss": 0.8311, - "step": 57761 - }, - { - "epoch": 1.48, - "learning_rate": 1.0696178444195873e-06, - "loss": 0.5381, - "step": 57762 - }, - { - "epoch": 1.48, - "learning_rate": 1.069590241074911e-06, - "loss": 0.7129, - "step": 57763 - }, - { - "epoch": 1.48, - "learning_rate": 1.0695626376769521e-06, - "loss": 0.5903, - "step": 57764 - }, - { - "epoch": 1.48, - "learning_rate": 1.0695350342257327e-06, - "loss": 0.5967, - "step": 57765 - }, - { - "epoch": 1.48, - "learning_rate": 1.0695074307212735e-06, - "loss": 0.8252, - "step": 57766 - }, - { - "epoch": 1.48, - "learning_rate": 1.0694798271635958e-06, - "loss": 0.6006, - "step": 57767 - }, - { - "epoch": 1.48, - "learning_rate": 1.0694522235527204e-06, - "loss": 0.6001, - "step": 57768 - }, - { - "epoch": 1.48, - "learning_rate": 1.0694246198886686e-06, - "loss": 0.7705, - "step": 57769 - }, - { - "epoch": 1.48, - "learning_rate": 1.0693970161714613e-06, - "loss": 0.7627, - "step": 57770 - }, - { - "epoch": 1.48, - "learning_rate": 1.0693694124011206e-06, - "loss": 0.7915, - "step": 57771 - }, - { - "epoch": 1.48, - "learning_rate": 1.0693418085776662e-06, - "loss": 0.6982, - "step": 57772 - }, - { - "epoch": 1.48, - "learning_rate": 1.0693142047011202e-06, - "loss": 0.4844, - "step": 57773 - }, - { - "epoch": 1.48, - "learning_rate": 1.0692866007715036e-06, - "loss": 0.5938, - "step": 57774 - }, - { - "epoch": 1.48, - "learning_rate": 1.0692589967888375e-06, - "loss": 0.7422, - "step": 57775 - }, - { - "epoch": 1.48, - "learning_rate": 1.069231392753143e-06, - "loss": 0.7627, - "step": 57776 - }, - { - "epoch": 1.48, - "learning_rate": 1.069203788664441e-06, - "loss": 0.575, - "step": 57777 - }, - { - "epoch": 1.48, - "learning_rate": 1.069176184522753e-06, - "loss": 0.7695, - "step": 57778 - }, - { - "epoch": 1.48, - "learning_rate": 1.0691485803280998e-06, - "loss": 0.7798, - "step": 57779 - }, - { - "epoch": 1.48, - "learning_rate": 1.0691209760805026e-06, - "loss": 0.4749, - "step": 57780 - }, - { - "epoch": 1.48, - "learning_rate": 1.0690933717799831e-06, - "loss": 0.5996, - "step": 57781 - }, - { - "epoch": 1.48, - "learning_rate": 1.0690657674265616e-06, - "loss": 0.6853, - "step": 57782 - }, - { - "epoch": 1.48, - "learning_rate": 1.0690381630202597e-06, - "loss": 0.5874, - "step": 57783 - }, - { - "epoch": 1.48, - "learning_rate": 1.0690105585610986e-06, - "loss": 0.6465, - "step": 57784 - }, - { - "epoch": 1.48, - "learning_rate": 1.0689829540490992e-06, - "loss": 0.6982, - "step": 57785 - }, - { - "epoch": 1.48, - "learning_rate": 1.0689553494842828e-06, - "loss": 0.5459, - "step": 57786 - }, - { - "epoch": 1.48, - "learning_rate": 1.0689277448666702e-06, - "loss": 0.6641, - "step": 57787 - }, - { - "epoch": 1.48, - "learning_rate": 1.068900140196283e-06, - "loss": 0.5303, - "step": 57788 - }, - { - "epoch": 1.48, - "learning_rate": 1.068872535473142e-06, - "loss": 0.5319, - "step": 57789 - }, - { - "epoch": 1.48, - "learning_rate": 1.0688449306972686e-06, - "loss": 0.7275, - "step": 57790 - }, - { - "epoch": 1.48, - "learning_rate": 1.0688173258686838e-06, - "loss": 0.6709, - "step": 57791 - }, - { - "epoch": 1.48, - "learning_rate": 1.068789720987409e-06, - "loss": 0.6377, - "step": 57792 - }, - { - "epoch": 1.48, - "learning_rate": 1.0687621160534646e-06, - "loss": 0.752, - "step": 57793 - }, - { - "epoch": 1.48, - "learning_rate": 1.0687345110668724e-06, - "loss": 0.6997, - "step": 57794 - }, - { - "epoch": 1.48, - "learning_rate": 1.0687069060276532e-06, - "loss": 0.7432, - "step": 57795 - }, - { - "epoch": 1.48, - "learning_rate": 1.0686793009358288e-06, - "loss": 0.6816, - "step": 57796 - }, - { - "epoch": 1.48, - "learning_rate": 1.0686516957914191e-06, - "loss": 0.71, - "step": 57797 - }, - { - "epoch": 1.48, - "learning_rate": 1.0686240905944466e-06, - "loss": 0.8066, - "step": 57798 - }, - { - "epoch": 1.48, - "learning_rate": 1.0685964853449312e-06, - "loss": 0.7559, - "step": 57799 - }, - { - "epoch": 1.48, - "learning_rate": 1.0685688800428948e-06, - "loss": 0.646, - "step": 57800 - }, - { - "epoch": 1.48, - "learning_rate": 1.0685412746883587e-06, - "loss": 0.4226, - "step": 57801 - }, - { - "epoch": 1.48, - "learning_rate": 1.0685136692813434e-06, - "loss": 0.4697, - "step": 57802 - }, - { - "epoch": 1.48, - "learning_rate": 1.0684860638218705e-06, - "loss": 0.7578, - "step": 57803 - }, - { - "epoch": 1.48, - "learning_rate": 1.0684584583099608e-06, - "loss": 0.7949, - "step": 57804 - }, - { - "epoch": 1.48, - "learning_rate": 1.0684308527456356e-06, - "loss": 0.7217, - "step": 57805 - }, - { - "epoch": 1.48, - "learning_rate": 1.0684032471289161e-06, - "loss": 0.667, - "step": 57806 - }, - { - "epoch": 1.48, - "learning_rate": 1.0683756414598235e-06, - "loss": 0.6992, - "step": 57807 - }, - { - "epoch": 1.48, - "learning_rate": 1.0683480357383786e-06, - "loss": 0.6123, - "step": 57808 - }, - { - "epoch": 1.48, - "learning_rate": 1.068320429964603e-06, - "loss": 0.6592, - "step": 57809 - }, - { - "epoch": 1.48, - "learning_rate": 1.0682928241385172e-06, - "loss": 0.6675, - "step": 57810 - }, - { - "epoch": 1.48, - "learning_rate": 1.0682652182601433e-06, - "loss": 0.5908, - "step": 57811 - }, - { - "epoch": 1.48, - "learning_rate": 1.0682376123295014e-06, - "loss": 0.6855, - "step": 57812 - }, - { - "epoch": 1.48, - "learning_rate": 1.0682100063466134e-06, - "loss": 0.6309, - "step": 57813 - }, - { - "epoch": 1.48, - "learning_rate": 1.0681824003114996e-06, - "loss": 0.6826, - "step": 57814 - }, - { - "epoch": 1.48, - "learning_rate": 1.0681547942241822e-06, - "loss": 0.5664, - "step": 57815 - }, - { - "epoch": 1.48, - "learning_rate": 1.0681271880846818e-06, - "loss": 0.7285, - "step": 57816 - }, - { - "epoch": 1.48, - "learning_rate": 1.0680995818930195e-06, - "loss": 0.624, - "step": 57817 - }, - { - "epoch": 1.48, - "learning_rate": 1.068071975649216e-06, - "loss": 0.6387, - "step": 57818 - }, - { - "epoch": 1.48, - "learning_rate": 1.0680443693532935e-06, - "loss": 0.6094, - "step": 57819 - }, - { - "epoch": 1.48, - "learning_rate": 1.068016763005272e-06, - "loss": 0.6807, - "step": 57820 - }, - { - "epoch": 1.48, - "learning_rate": 1.0679891566051737e-06, - "loss": 0.5024, - "step": 57821 - }, - { - "epoch": 1.48, - "learning_rate": 1.0679615501530193e-06, - "loss": 0.531, - "step": 57822 - }, - { - "epoch": 1.48, - "learning_rate": 1.0679339436488297e-06, - "loss": 0.6826, - "step": 57823 - }, - { - "epoch": 1.48, - "learning_rate": 1.067906337092626e-06, - "loss": 0.8779, - "step": 57824 - }, - { - "epoch": 1.48, - "learning_rate": 1.0678787304844297e-06, - "loss": 0.5688, - "step": 57825 - }, - { - "epoch": 1.48, - "learning_rate": 1.0678511238242618e-06, - "loss": 0.6914, - "step": 57826 - }, - { - "epoch": 1.48, - "learning_rate": 1.0678235171121432e-06, - "loss": 0.6001, - "step": 57827 - }, - { - "epoch": 1.48, - "learning_rate": 1.0677959103480956e-06, - "loss": 0.6536, - "step": 57828 - }, - { - "epoch": 1.48, - "learning_rate": 1.0677683035321394e-06, - "loss": 0.4469, - "step": 57829 - }, - { - "epoch": 1.48, - "learning_rate": 1.0677406966642964e-06, - "loss": 0.5908, - "step": 57830 - }, - { - "epoch": 1.48, - "learning_rate": 1.0677130897445874e-06, - "loss": 0.5073, - "step": 57831 - }, - { - "epoch": 1.48, - "learning_rate": 1.0676854827730336e-06, - "loss": 0.511, - "step": 57832 - }, - { - "epoch": 1.48, - "learning_rate": 1.067657875749656e-06, - "loss": 0.6104, - "step": 57833 - }, - { - "epoch": 1.48, - "learning_rate": 1.0676302686744763e-06, - "loss": 0.6738, - "step": 57834 - }, - { - "epoch": 1.48, - "learning_rate": 1.0676026615475147e-06, - "loss": 0.5466, - "step": 57835 - }, - { - "epoch": 1.48, - "learning_rate": 1.0675750543687934e-06, - "loss": 0.6282, - "step": 57836 - }, - { - "epoch": 1.48, - "learning_rate": 1.0675474471383326e-06, - "loss": 0.7285, - "step": 57837 - }, - { - "epoch": 1.48, - "learning_rate": 1.0675198398561538e-06, - "loss": 0.7598, - "step": 57838 - }, - { - "epoch": 1.48, - "learning_rate": 1.0674922325222781e-06, - "loss": 0.48, - "step": 57839 - }, - { - "epoch": 1.48, - "learning_rate": 1.067464625136727e-06, - "loss": 0.6875, - "step": 57840 - }, - { - "epoch": 1.48, - "learning_rate": 1.0674370176995214e-06, - "loss": 0.5786, - "step": 57841 - }, - { - "epoch": 1.48, - "learning_rate": 1.067409410210682e-06, - "loss": 0.4648, - "step": 57842 - }, - { - "epoch": 1.48, - "learning_rate": 1.0673818026702303e-06, - "loss": 0.5413, - "step": 57843 - }, - { - "epoch": 1.48, - "learning_rate": 1.0673541950781876e-06, - "loss": 0.5347, - "step": 57844 - }, - { - "epoch": 1.48, - "learning_rate": 1.0673265874345748e-06, - "loss": 0.7529, - "step": 57845 - }, - { - "epoch": 1.48, - "learning_rate": 1.0672989797394133e-06, - "loss": 0.6333, - "step": 57846 - }, - { - "epoch": 1.48, - "learning_rate": 1.0672713719927243e-06, - "loss": 0.7607, - "step": 57847 - }, - { - "epoch": 1.48, - "learning_rate": 1.0672437641945282e-06, - "loss": 0.5957, - "step": 57848 - }, - { - "epoch": 1.48, - "learning_rate": 1.0672161563448469e-06, - "loss": 0.7539, - "step": 57849 - }, - { - "epoch": 1.48, - "learning_rate": 1.0671885484437014e-06, - "loss": 0.7422, - "step": 57850 - }, - { - "epoch": 1.48, - "learning_rate": 1.0671609404911126e-06, - "loss": 0.5068, - "step": 57851 - }, - { - "epoch": 1.48, - "learning_rate": 1.0671333324871017e-06, - "loss": 0.7212, - "step": 57852 - }, - { - "epoch": 1.48, - "learning_rate": 1.0671057244316898e-06, - "loss": 0.4622, - "step": 57853 - }, - { - "epoch": 1.48, - "learning_rate": 1.0670781163248983e-06, - "loss": 0.542, - "step": 57854 - }, - { - "epoch": 1.48, - "learning_rate": 1.067050508166748e-06, - "loss": 0.5679, - "step": 57855 - }, - { - "epoch": 1.48, - "learning_rate": 1.0670228999572606e-06, - "loss": 0.5894, - "step": 57856 - }, - { - "epoch": 1.48, - "learning_rate": 1.0669952916964566e-06, - "loss": 0.5796, - "step": 57857 - }, - { - "epoch": 1.48, - "learning_rate": 1.066967683384357e-06, - "loss": 0.7158, - "step": 57858 - }, - { - "epoch": 1.48, - "learning_rate": 1.0669400750209839e-06, - "loss": 0.6436, - "step": 57859 - }, - { - "epoch": 1.48, - "learning_rate": 1.0669124666063577e-06, - "loss": 0.7109, - "step": 57860 - }, - { - "epoch": 1.48, - "learning_rate": 1.0668848581404997e-06, - "loss": 0.6377, - "step": 57861 - }, - { - "epoch": 1.48, - "learning_rate": 1.066857249623431e-06, - "loss": 0.7188, - "step": 57862 - }, - { - "epoch": 1.48, - "learning_rate": 1.0668296410551727e-06, - "loss": 0.5879, - "step": 57863 - }, - { - "epoch": 1.48, - "learning_rate": 1.0668020324357458e-06, - "loss": 0.6475, - "step": 57864 - }, - { - "epoch": 1.48, - "learning_rate": 1.066774423765172e-06, - "loss": 0.4983, - "step": 57865 - }, - { - "epoch": 1.48, - "learning_rate": 1.0667468150434723e-06, - "loss": 0.6143, - "step": 57866 - }, - { - "epoch": 1.48, - "learning_rate": 1.0667192062706674e-06, - "loss": 0.7334, - "step": 57867 - }, - { - "epoch": 1.48, - "learning_rate": 1.0666915974467785e-06, - "loss": 0.6265, - "step": 57868 - }, - { - "epoch": 1.48, - "learning_rate": 1.0666639885718272e-06, - "loss": 0.6904, - "step": 57869 - }, - { - "epoch": 1.48, - "learning_rate": 1.066636379645834e-06, - "loss": 0.6982, - "step": 57870 - }, - { - "epoch": 1.48, - "learning_rate": 1.0666087706688205e-06, - "loss": 0.6335, - "step": 57871 - }, - { - "epoch": 1.48, - "learning_rate": 1.066581161640808e-06, - "loss": 0.5435, - "step": 57872 - }, - { - "epoch": 1.48, - "learning_rate": 1.066553552561817e-06, - "loss": 0.6396, - "step": 57873 - }, - { - "epoch": 1.48, - "learning_rate": 1.0665259434318691e-06, - "loss": 0.5439, - "step": 57874 - }, - { - "epoch": 1.48, - "learning_rate": 1.0664983342509854e-06, - "loss": 0.6338, - "step": 57875 - }, - { - "epoch": 1.48, - "learning_rate": 1.0664707250191873e-06, - "loss": 0.6548, - "step": 57876 - }, - { - "epoch": 1.48, - "learning_rate": 1.0664431157364952e-06, - "loss": 0.61, - "step": 57877 - }, - { - "epoch": 1.48, - "learning_rate": 1.0664155064029308e-06, - "loss": 0.748, - "step": 57878 - }, - { - "epoch": 1.48, - "learning_rate": 1.066387897018515e-06, - "loss": 0.8008, - "step": 57879 - }, - { - "epoch": 1.48, - "learning_rate": 1.0663602875832691e-06, - "loss": 0.7412, - "step": 57880 - }, - { - "epoch": 1.48, - "learning_rate": 1.0663326780972144e-06, - "loss": 0.4973, - "step": 57881 - }, - { - "epoch": 1.48, - "learning_rate": 1.0663050685603716e-06, - "loss": 0.6167, - "step": 57882 - }, - { - "epoch": 1.48, - "learning_rate": 1.0662774589727619e-06, - "loss": 0.6484, - "step": 57883 - }, - { - "epoch": 1.48, - "learning_rate": 1.066249849334407e-06, - "loss": 0.5474, - "step": 57884 - }, - { - "epoch": 1.48, - "learning_rate": 1.0662222396453272e-06, - "loss": 0.8496, - "step": 57885 - }, - { - "epoch": 1.48, - "learning_rate": 1.0661946299055447e-06, - "loss": 0.584, - "step": 57886 - }, - { - "epoch": 1.48, - "learning_rate": 1.0661670201150794e-06, - "loss": 0.5291, - "step": 57887 - }, - { - "epoch": 1.48, - "learning_rate": 1.0661394102739534e-06, - "loss": 0.8438, - "step": 57888 - }, - { - "epoch": 1.48, - "learning_rate": 1.0661118003821873e-06, - "loss": 0.7764, - "step": 57889 - }, - { - "epoch": 1.48, - "learning_rate": 1.0660841904398023e-06, - "loss": 0.541, - "step": 57890 - }, - { - "epoch": 1.48, - "learning_rate": 1.06605658044682e-06, - "loss": 0.6465, - "step": 57891 - }, - { - "epoch": 1.48, - "learning_rate": 1.066028970403261e-06, - "loss": 0.6758, - "step": 57892 - }, - { - "epoch": 1.48, - "learning_rate": 1.0660013603091468e-06, - "loss": 1.0078, - "step": 57893 - }, - { - "epoch": 1.48, - "learning_rate": 1.0659737501644984e-06, - "loss": 0.6123, - "step": 57894 - }, - { - "epoch": 1.48, - "learning_rate": 1.0659461399693369e-06, - "loss": 0.6284, - "step": 57895 - }, - { - "epoch": 1.48, - "learning_rate": 1.0659185297236832e-06, - "loss": 0.4224, - "step": 57896 - }, - { - "epoch": 1.48, - "learning_rate": 1.0658909194275592e-06, - "loss": 0.5137, - "step": 57897 - }, - { - "epoch": 1.48, - "learning_rate": 1.065863309080985e-06, - "loss": 0.8096, - "step": 57898 - }, - { - "epoch": 1.48, - "learning_rate": 1.0658356986839826e-06, - "loss": 0.748, - "step": 57899 - }, - { - "epoch": 1.48, - "learning_rate": 1.0658080882365728e-06, - "loss": 0.5376, - "step": 57900 - }, - { - "epoch": 1.48, - "learning_rate": 1.065780477738777e-06, - "loss": 0.5518, - "step": 57901 - }, - { - "epoch": 1.48, - "learning_rate": 1.065752867190616e-06, - "loss": 0.5166, - "step": 57902 - }, - { - "epoch": 1.48, - "learning_rate": 1.065725256592111e-06, - "loss": 0.6089, - "step": 57903 - }, - { - "epoch": 1.48, - "learning_rate": 1.0656976459432828e-06, - "loss": 0.7178, - "step": 57904 - }, - { - "epoch": 1.48, - "learning_rate": 1.0656700352441535e-06, - "loss": 0.3619, - "step": 57905 - }, - { - "epoch": 1.48, - "learning_rate": 1.0656424244947434e-06, - "loss": 0.7046, - "step": 57906 - }, - { - "epoch": 1.48, - "learning_rate": 1.0656148136950742e-06, - "loss": 0.5942, - "step": 57907 - }, - { - "epoch": 1.48, - "learning_rate": 1.0655872028451665e-06, - "loss": 0.7178, - "step": 57908 - }, - { - "epoch": 1.48, - "learning_rate": 1.0655595919450417e-06, - "loss": 0.6953, - "step": 57909 - }, - { - "epoch": 1.48, - "learning_rate": 1.0655319809947207e-06, - "loss": 0.604, - "step": 57910 - }, - { - "epoch": 1.48, - "learning_rate": 1.0655043699942251e-06, - "loss": 0.5732, - "step": 57911 - }, - { - "epoch": 1.48, - "learning_rate": 1.065476758943576e-06, - "loss": 0.4907, - "step": 57912 - }, - { - "epoch": 1.48, - "learning_rate": 1.0654491478427945e-06, - "loss": 0.5684, - "step": 57913 - }, - { - "epoch": 1.48, - "learning_rate": 1.065421536691901e-06, - "loss": 0.7305, - "step": 57914 - }, - { - "epoch": 1.48, - "learning_rate": 1.0653939254909177e-06, - "loss": 0.5587, - "step": 57915 - }, - { - "epoch": 1.48, - "learning_rate": 1.0653663142398653e-06, - "loss": 0.6016, - "step": 57916 - }, - { - "epoch": 1.48, - "learning_rate": 1.0653387029387643e-06, - "loss": 0.5518, - "step": 57917 - }, - { - "epoch": 1.48, - "learning_rate": 1.065311091587637e-06, - "loss": 0.6948, - "step": 57918 - }, - { - "epoch": 1.48, - "learning_rate": 1.0652834801865037e-06, - "loss": 0.5488, - "step": 57919 - }, - { - "epoch": 1.48, - "learning_rate": 1.0652558687353864e-06, - "loss": 0.585, - "step": 57920 - }, - { - "epoch": 1.48, - "learning_rate": 1.0652282572343053e-06, - "loss": 0.5889, - "step": 57921 - }, - { - "epoch": 1.48, - "learning_rate": 1.065200645683282e-06, - "loss": 0.7051, - "step": 57922 - }, - { - "epoch": 1.48, - "learning_rate": 1.0651730340823373e-06, - "loss": 0.8379, - "step": 57923 - }, - { - "epoch": 1.48, - "learning_rate": 1.065145422431493e-06, - "loss": 0.6086, - "step": 57924 - }, - { - "epoch": 1.48, - "learning_rate": 1.0651178107307694e-06, - "loss": 0.6738, - "step": 57925 - }, - { - "epoch": 1.48, - "learning_rate": 1.0650901989801888e-06, - "loss": 0.5543, - "step": 57926 - }, - { - "epoch": 1.48, - "learning_rate": 1.065062587179771e-06, - "loss": 0.5913, - "step": 57927 - }, - { - "epoch": 1.48, - "learning_rate": 1.065034975329538e-06, - "loss": 0.6079, - "step": 57928 - }, - { - "epoch": 1.48, - "learning_rate": 1.0650073634295104e-06, - "loss": 0.6035, - "step": 57929 - }, - { - "epoch": 1.48, - "learning_rate": 1.06497975147971e-06, - "loss": 0.5464, - "step": 57930 - }, - { - "epoch": 1.48, - "learning_rate": 1.0649521394801575e-06, - "loss": 0.5308, - "step": 57931 - }, - { - "epoch": 1.48, - "learning_rate": 1.0649245274308743e-06, - "loss": 0.6353, - "step": 57932 - }, - { - "epoch": 1.48, - "learning_rate": 1.064896915331881e-06, - "loss": 0.6689, - "step": 57933 - }, - { - "epoch": 1.48, - "learning_rate": 1.0648693031831993e-06, - "loss": 0.5012, - "step": 57934 - }, - { - "epoch": 1.48, - "learning_rate": 1.06484169098485e-06, - "loss": 0.752, - "step": 57935 - }, - { - "epoch": 1.48, - "learning_rate": 1.064814078736855e-06, - "loss": 0.5503, - "step": 57936 - }, - { - "epoch": 1.48, - "learning_rate": 1.0647864664392342e-06, - "loss": 0.5479, - "step": 57937 - }, - { - "epoch": 1.48, - "learning_rate": 1.0647588540920096e-06, - "loss": 0.7021, - "step": 57938 - }, - { - "epoch": 1.49, - "learning_rate": 1.0647312416952022e-06, - "loss": 0.5664, - "step": 57939 - }, - { - "epoch": 1.49, - "learning_rate": 1.064703629248833e-06, - "loss": 0.5638, - "step": 57940 - }, - { - "epoch": 1.49, - "learning_rate": 1.0646760167529233e-06, - "loss": 0.6143, - "step": 57941 - }, - { - "epoch": 1.49, - "learning_rate": 1.0646484042074938e-06, - "loss": 0.7051, - "step": 57942 - }, - { - "epoch": 1.49, - "learning_rate": 1.0646207916125665e-06, - "loss": 0.7676, - "step": 57943 - }, - { - "epoch": 1.49, - "learning_rate": 1.0645931789681614e-06, - "loss": 0.7466, - "step": 57944 - }, - { - "epoch": 1.49, - "learning_rate": 1.0645655662743008e-06, - "loss": 0.5552, - "step": 57945 - }, - { - "epoch": 1.49, - "learning_rate": 1.0645379535310052e-06, - "loss": 0.4966, - "step": 57946 - }, - { - "epoch": 1.49, - "learning_rate": 1.064510340738296e-06, - "loss": 0.835, - "step": 57947 - }, - { - "epoch": 1.49, - "learning_rate": 1.064482727896194e-06, - "loss": 0.751, - "step": 57948 - }, - { - "epoch": 1.49, - "learning_rate": 1.0644551150047204e-06, - "loss": 0.729, - "step": 57949 - }, - { - "epoch": 1.49, - "learning_rate": 1.0644275020638965e-06, - "loss": 0.5242, - "step": 57950 - }, - { - "epoch": 1.49, - "learning_rate": 1.0643998890737438e-06, - "loss": 0.6104, - "step": 57951 - }, - { - "epoch": 1.49, - "learning_rate": 1.0643722760342825e-06, - "loss": 0.7114, - "step": 57952 - }, - { - "epoch": 1.49, - "learning_rate": 1.0643446629455348e-06, - "loss": 0.8223, - "step": 57953 - }, - { - "epoch": 1.49, - "learning_rate": 1.0643170498075212e-06, - "loss": 0.6978, - "step": 57954 - }, - { - "epoch": 1.49, - "learning_rate": 1.0642894366202629e-06, - "loss": 0.645, - "step": 57955 - }, - { - "epoch": 1.49, - "learning_rate": 1.0642618233837813e-06, - "loss": 0.6719, - "step": 57956 - }, - { - "epoch": 1.49, - "learning_rate": 1.0642342100980973e-06, - "loss": 0.6763, - "step": 57957 - }, - { - "epoch": 1.49, - "learning_rate": 1.064206596763232e-06, - "loss": 0.6074, - "step": 57958 - }, - { - "epoch": 1.49, - "learning_rate": 1.0641789833792067e-06, - "loss": 0.5012, - "step": 57959 - }, - { - "epoch": 1.49, - "learning_rate": 1.0641513699460424e-06, - "loss": 0.6904, - "step": 57960 - }, - { - "epoch": 1.49, - "learning_rate": 1.0641237564637606e-06, - "loss": 0.6113, - "step": 57961 - }, - { - "epoch": 1.49, - "learning_rate": 1.0640961429323822e-06, - "loss": 0.6494, - "step": 57962 - }, - { - "epoch": 1.49, - "learning_rate": 1.0640685293519282e-06, - "loss": 0.5293, - "step": 57963 - }, - { - "epoch": 1.49, - "learning_rate": 1.06404091572242e-06, - "loss": 0.4924, - "step": 57964 - }, - { - "epoch": 1.49, - "learning_rate": 1.0640133020438785e-06, - "loss": 0.8525, - "step": 57965 - }, - { - "epoch": 1.49, - "learning_rate": 1.063985688316325e-06, - "loss": 0.6523, - "step": 57966 - }, - { - "epoch": 1.49, - "learning_rate": 1.0639580745397805e-06, - "loss": 0.6162, - "step": 57967 - }, - { - "epoch": 1.49, - "learning_rate": 1.0639304607142663e-06, - "loss": 0.5034, - "step": 57968 - }, - { - "epoch": 1.49, - "learning_rate": 1.0639028468398036e-06, - "loss": 0.6406, - "step": 57969 - }, - { - "epoch": 1.49, - "learning_rate": 1.063875232916413e-06, - "loss": 0.6025, - "step": 57970 - }, - { - "epoch": 1.49, - "learning_rate": 1.0638476189441167e-06, - "loss": 0.573, - "step": 57971 - }, - { - "epoch": 1.49, - "learning_rate": 1.0638200049229352e-06, - "loss": 0.7002, - "step": 57972 - }, - { - "epoch": 1.49, - "learning_rate": 1.063792390852889e-06, - "loss": 0.6113, - "step": 57973 - }, - { - "epoch": 1.49, - "learning_rate": 1.0637647767340004e-06, - "loss": 0.6777, - "step": 57974 - }, - { - "epoch": 1.49, - "learning_rate": 1.0637371625662896e-06, - "loss": 0.6362, - "step": 57975 - }, - { - "epoch": 1.49, - "learning_rate": 1.0637095483497789e-06, - "loss": 0.5562, - "step": 57976 - }, - { - "epoch": 1.49, - "learning_rate": 1.0636819340844883e-06, - "loss": 0.7637, - "step": 57977 - }, - { - "epoch": 1.49, - "learning_rate": 1.0636543197704392e-06, - "loss": 0.5486, - "step": 57978 - }, - { - "epoch": 1.49, - "learning_rate": 1.063626705407653e-06, - "loss": 0.5166, - "step": 57979 - }, - { - "epoch": 1.49, - "learning_rate": 1.063599090996151e-06, - "loss": 0.7344, - "step": 57980 - }, - { - "epoch": 1.49, - "learning_rate": 1.0635714765359541e-06, - "loss": 0.5337, - "step": 57981 - }, - { - "epoch": 1.49, - "learning_rate": 1.0635438620270832e-06, - "loss": 0.709, - "step": 57982 - }, - { - "epoch": 1.49, - "learning_rate": 1.0635162474695597e-06, - "loss": 0.7598, - "step": 57983 - }, - { - "epoch": 1.49, - "learning_rate": 1.0634886328634047e-06, - "loss": 0.5859, - "step": 57984 - }, - { - "epoch": 1.49, - "learning_rate": 1.0634610182086396e-06, - "loss": 0.6021, - "step": 57985 - }, - { - "epoch": 1.49, - "learning_rate": 1.0634334035052854e-06, - "loss": 0.6504, - "step": 57986 - }, - { - "epoch": 1.49, - "learning_rate": 1.0634057887533633e-06, - "loss": 0.8164, - "step": 57987 - }, - { - "epoch": 1.49, - "learning_rate": 1.0633781739528936e-06, - "loss": 0.6797, - "step": 57988 - }, - { - "epoch": 1.49, - "learning_rate": 1.0633505591038987e-06, - "loss": 0.5479, - "step": 57989 - }, - { - "epoch": 1.49, - "learning_rate": 1.0633229442063987e-06, - "loss": 0.7988, - "step": 57990 - }, - { - "epoch": 1.49, - "learning_rate": 1.0632953292604158e-06, - "loss": 0.6162, - "step": 57991 - }, - { - "epoch": 1.49, - "learning_rate": 1.0632677142659703e-06, - "loss": 0.6582, - "step": 57992 - }, - { - "epoch": 1.49, - "learning_rate": 1.0632400992230836e-06, - "loss": 0.7334, - "step": 57993 - }, - { - "epoch": 1.49, - "learning_rate": 1.063212484131777e-06, - "loss": 0.6387, - "step": 57994 - }, - { - "epoch": 1.49, - "learning_rate": 1.0631848689920715e-06, - "loss": 0.5518, - "step": 57995 - }, - { - "epoch": 1.49, - "learning_rate": 1.063157253803988e-06, - "loss": 0.7031, - "step": 57996 - }, - { - "epoch": 1.49, - "learning_rate": 1.0631296385675483e-06, - "loss": 0.6182, - "step": 57997 - }, - { - "epoch": 1.49, - "learning_rate": 1.0631020232827727e-06, - "loss": 0.6445, - "step": 57998 - }, - { - "epoch": 1.49, - "learning_rate": 1.0630744079496832e-06, - "loss": 0.4954, - "step": 57999 - }, - { - "epoch": 1.49, - "learning_rate": 1.0630467925683e-06, - "loss": 0.5391, - "step": 58000 - }, - { - "epoch": 1.49, - "learning_rate": 1.0630191771386451e-06, - "loss": 0.606, - "step": 58001 - }, - { - "epoch": 1.49, - "learning_rate": 1.0629915616607395e-06, - "loss": 0.7881, - "step": 58002 - }, - { - "epoch": 1.49, - "learning_rate": 1.062963946134604e-06, - "loss": 0.7715, - "step": 58003 - }, - { - "epoch": 1.49, - "learning_rate": 1.0629363305602597e-06, - "loss": 0.8105, - "step": 58004 - }, - { - "epoch": 1.49, - "learning_rate": 1.0629087149377282e-06, - "loss": 0.4823, - "step": 58005 - }, - { - "epoch": 1.49, - "learning_rate": 1.0628810992670303e-06, - "loss": 0.5054, - "step": 58006 - }, - { - "epoch": 1.49, - "learning_rate": 1.062853483548187e-06, - "loss": 0.8369, - "step": 58007 - }, - { - "epoch": 1.49, - "learning_rate": 1.0628258677812201e-06, - "loss": 0.729, - "step": 58008 - }, - { - "epoch": 1.49, - "learning_rate": 1.06279825196615e-06, - "loss": 0.6846, - "step": 58009 - }, - { - "epoch": 1.49, - "learning_rate": 1.0627706361029984e-06, - "loss": 0.7188, - "step": 58010 - }, - { - "epoch": 1.49, - "learning_rate": 1.0627430201917863e-06, - "loss": 0.7715, - "step": 58011 - }, - { - "epoch": 1.49, - "learning_rate": 1.0627154042325345e-06, - "loss": 0.7002, - "step": 58012 - }, - { - "epoch": 1.49, - "learning_rate": 1.0626877882252644e-06, - "loss": 0.6963, - "step": 58013 - }, - { - "epoch": 1.49, - "learning_rate": 1.0626601721699971e-06, - "loss": 0.6611, - "step": 58014 - }, - { - "epoch": 1.49, - "learning_rate": 1.0626325560667538e-06, - "loss": 0.7324, - "step": 58015 - }, - { - "epoch": 1.49, - "learning_rate": 1.0626049399155558e-06, - "loss": 0.458, - "step": 58016 - }, - { - "epoch": 1.49, - "learning_rate": 1.0625773237164239e-06, - "loss": 0.6924, - "step": 58017 - }, - { - "epoch": 1.49, - "learning_rate": 1.0625497074693797e-06, - "loss": 0.6543, - "step": 58018 - }, - { - "epoch": 1.49, - "learning_rate": 1.0625220911744437e-06, - "loss": 0.5732, - "step": 58019 - }, - { - "epoch": 1.49, - "learning_rate": 1.0624944748316378e-06, - "loss": 0.8242, - "step": 58020 - }, - { - "epoch": 1.49, - "learning_rate": 1.0624668584409826e-06, - "loss": 0.3826, - "step": 58021 - }, - { - "epoch": 1.49, - "learning_rate": 1.0624392420024992e-06, - "loss": 0.7939, - "step": 58022 - }, - { - "epoch": 1.49, - "learning_rate": 1.062411625516209e-06, - "loss": 0.5111, - "step": 58023 - }, - { - "epoch": 1.49, - "learning_rate": 1.0623840089821334e-06, - "loss": 0.7451, - "step": 58024 - }, - { - "epoch": 1.49, - "learning_rate": 1.0623563924002927e-06, - "loss": 0.5903, - "step": 58025 - }, - { - "epoch": 1.49, - "learning_rate": 1.0623287757707092e-06, - "loss": 0.7812, - "step": 58026 - }, - { - "epoch": 1.49, - "learning_rate": 1.062301159093403e-06, - "loss": 0.5969, - "step": 58027 - }, - { - "epoch": 1.49, - "learning_rate": 1.0622735423683957e-06, - "loss": 0.6748, - "step": 58028 - }, - { - "epoch": 1.49, - "learning_rate": 1.0622459255957085e-06, - "loss": 0.5039, - "step": 58029 - }, - { - "epoch": 1.49, - "learning_rate": 1.0622183087753624e-06, - "loss": 0.8594, - "step": 58030 - }, - { - "epoch": 1.49, - "learning_rate": 1.062190691907379e-06, - "loss": 0.4807, - "step": 58031 - }, - { - "epoch": 1.49, - "learning_rate": 1.0621630749917782e-06, - "loss": 0.5413, - "step": 58032 - }, - { - "epoch": 1.49, - "learning_rate": 1.0621354580285825e-06, - "loss": 0.4648, - "step": 58033 - }, - { - "epoch": 1.49, - "learning_rate": 1.0621078410178126e-06, - "loss": 0.6323, - "step": 58034 - }, - { - "epoch": 1.49, - "learning_rate": 1.0620802239594894e-06, - "loss": 0.6582, - "step": 58035 - }, - { - "epoch": 1.49, - "learning_rate": 1.0620526068536347e-06, - "loss": 0.6611, - "step": 58036 - }, - { - "epoch": 1.49, - "learning_rate": 1.0620249897002687e-06, - "loss": 0.6982, - "step": 58037 - }, - { - "epoch": 1.49, - "learning_rate": 1.061997372499413e-06, - "loss": 0.6023, - "step": 58038 - }, - { - "epoch": 1.49, - "learning_rate": 1.061969755251089e-06, - "loss": 0.4709, - "step": 58039 - }, - { - "epoch": 1.49, - "learning_rate": 1.0619421379553172e-06, - "loss": 0.261, - "step": 58040 - }, - { - "epoch": 1.49, - "learning_rate": 1.06191452061212e-06, - "loss": 0.6553, - "step": 58041 - }, - { - "epoch": 1.49, - "learning_rate": 1.0618869032215167e-06, - "loss": 0.6396, - "step": 58042 - }, - { - "epoch": 1.49, - "learning_rate": 1.06185928578353e-06, - "loss": 0.7051, - "step": 58043 - }, - { - "epoch": 1.49, - "learning_rate": 1.0618316682981802e-06, - "loss": 0.8613, - "step": 58044 - }, - { - "epoch": 1.49, - "learning_rate": 1.061804050765489e-06, - "loss": 0.6372, - "step": 58045 - }, - { - "epoch": 1.49, - "learning_rate": 1.0617764331854772e-06, - "loss": 0.4725, - "step": 58046 - }, - { - "epoch": 1.49, - "learning_rate": 1.0617488155581662e-06, - "loss": 0.5691, - "step": 58047 - }, - { - "epoch": 1.49, - "learning_rate": 1.0617211978835768e-06, - "loss": 0.6519, - "step": 58048 - }, - { - "epoch": 1.49, - "learning_rate": 1.06169358016173e-06, - "loss": 0.5732, - "step": 58049 - }, - { - "epoch": 1.49, - "learning_rate": 1.0616659623926475e-06, - "loss": 0.6538, - "step": 58050 - }, - { - "epoch": 1.49, - "learning_rate": 1.0616383445763505e-06, - "loss": 0.5447, - "step": 58051 - }, - { - "epoch": 1.49, - "learning_rate": 1.0616107267128598e-06, - "loss": 0.6748, - "step": 58052 - }, - { - "epoch": 1.49, - "learning_rate": 1.0615831088021962e-06, - "loss": 0.6279, - "step": 58053 - }, - { - "epoch": 1.49, - "learning_rate": 1.0615554908443816e-06, - "loss": 0.5972, - "step": 58054 - }, - { - "epoch": 1.49, - "learning_rate": 1.0615278728394363e-06, - "loss": 0.6611, - "step": 58055 - }, - { - "epoch": 1.49, - "learning_rate": 1.0615002547873828e-06, - "loss": 0.5981, - "step": 58056 - }, - { - "epoch": 1.49, - "learning_rate": 1.0614726366882407e-06, - "loss": 0.554, - "step": 58057 - }, - { - "epoch": 1.49, - "learning_rate": 1.061445018542032e-06, - "loss": 0.7559, - "step": 58058 - }, - { - "epoch": 1.49, - "learning_rate": 1.0614174003487774e-06, - "loss": 0.7988, - "step": 58059 - }, - { - "epoch": 1.49, - "learning_rate": 1.0613897821084989e-06, - "loss": 0.5579, - "step": 58060 - }, - { - "epoch": 1.49, - "learning_rate": 1.0613621638212166e-06, - "loss": 0.5349, - "step": 58061 - }, - { - "epoch": 1.49, - "learning_rate": 1.0613345454869524e-06, - "loss": 0.6074, - "step": 58062 - }, - { - "epoch": 1.49, - "learning_rate": 1.061306927105727e-06, - "loss": 0.5996, - "step": 58063 - }, - { - "epoch": 1.49, - "learning_rate": 1.0612793086775618e-06, - "loss": 0.6104, - "step": 58064 - }, - { - "epoch": 1.49, - "learning_rate": 1.061251690202478e-06, - "loss": 0.4724, - "step": 58065 - }, - { - "epoch": 1.49, - "learning_rate": 1.0612240716804964e-06, - "loss": 0.542, - "step": 58066 - }, - { - "epoch": 1.49, - "learning_rate": 1.0611964531116381e-06, - "loss": 0.7646, - "step": 58067 - }, - { - "epoch": 1.49, - "learning_rate": 1.0611688344959248e-06, - "loss": 0.606, - "step": 58068 - }, - { - "epoch": 1.49, - "learning_rate": 1.0611412158333773e-06, - "loss": 0.5383, - "step": 58069 - }, - { - "epoch": 1.49, - "learning_rate": 1.0611135971240168e-06, - "loss": 0.5752, - "step": 58070 - }, - { - "epoch": 1.49, - "learning_rate": 1.0610859783678643e-06, - "loss": 0.6816, - "step": 58071 - }, - { - "epoch": 1.49, - "learning_rate": 1.0610583595649413e-06, - "loss": 0.7812, - "step": 58072 - }, - { - "epoch": 1.49, - "learning_rate": 1.0610307407152683e-06, - "loss": 0.543, - "step": 58073 - }, - { - "epoch": 1.49, - "learning_rate": 1.061003121818867e-06, - "loss": 0.6846, - "step": 58074 - }, - { - "epoch": 1.49, - "learning_rate": 1.060975502875759e-06, - "loss": 0.6362, - "step": 58075 - }, - { - "epoch": 1.49, - "learning_rate": 1.0609478838859643e-06, - "loss": 0.7822, - "step": 58076 - }, - { - "epoch": 1.49, - "learning_rate": 1.060920264849505e-06, - "loss": 0.6807, - "step": 58077 - }, - { - "epoch": 1.49, - "learning_rate": 1.0608926457664011e-06, - "loss": 0.7314, - "step": 58078 - }, - { - "epoch": 1.49, - "learning_rate": 1.0608650266366751e-06, - "loss": 0.5508, - "step": 58079 - }, - { - "epoch": 1.49, - "learning_rate": 1.0608374074603475e-06, - "loss": 0.7168, - "step": 58080 - }, - { - "epoch": 1.49, - "learning_rate": 1.0608097882374396e-06, - "loss": 0.7041, - "step": 58081 - }, - { - "epoch": 1.49, - "learning_rate": 1.060782168967972e-06, - "loss": 0.6704, - "step": 58082 - }, - { - "epoch": 1.49, - "learning_rate": 1.0607545496519668e-06, - "loss": 0.7393, - "step": 58083 - }, - { - "epoch": 1.49, - "learning_rate": 1.0607269302894442e-06, - "loss": 0.689, - "step": 58084 - }, - { - "epoch": 1.49, - "learning_rate": 1.060699310880426e-06, - "loss": 0.6885, - "step": 58085 - }, - { - "epoch": 1.49, - "learning_rate": 1.0606716914249331e-06, - "loss": 0.7305, - "step": 58086 - }, - { - "epoch": 1.49, - "learning_rate": 1.0606440719229868e-06, - "loss": 0.5732, - "step": 58087 - }, - { - "epoch": 1.49, - "learning_rate": 1.0606164523746078e-06, - "loss": 0.7119, - "step": 58088 - }, - { - "epoch": 1.49, - "learning_rate": 1.060588832779818e-06, - "loss": 0.7148, - "step": 58089 - }, - { - "epoch": 1.49, - "learning_rate": 1.060561213138638e-06, - "loss": 0.5051, - "step": 58090 - }, - { - "epoch": 1.49, - "learning_rate": 1.0605335934510887e-06, - "loss": 0.6494, - "step": 58091 - }, - { - "epoch": 1.49, - "learning_rate": 1.0605059737171917e-06, - "loss": 0.502, - "step": 58092 - }, - { - "epoch": 1.49, - "learning_rate": 1.0604783539369683e-06, - "loss": 0.709, - "step": 58093 - }, - { - "epoch": 1.49, - "learning_rate": 1.0604507341104392e-06, - "loss": 0.8369, - "step": 58094 - }, - { - "epoch": 1.49, - "learning_rate": 1.060423114237626e-06, - "loss": 0.7002, - "step": 58095 - }, - { - "epoch": 1.49, - "learning_rate": 1.0603954943185496e-06, - "loss": 0.6172, - "step": 58096 - }, - { - "epoch": 1.49, - "learning_rate": 1.060367874353231e-06, - "loss": 0.6211, - "step": 58097 - }, - { - "epoch": 1.49, - "learning_rate": 1.0603402543416916e-06, - "loss": 0.5898, - "step": 58098 - }, - { - "epoch": 1.49, - "learning_rate": 1.060312634283952e-06, - "loss": 0.6846, - "step": 58099 - }, - { - "epoch": 1.49, - "learning_rate": 1.0602850141800344e-06, - "loss": 0.6548, - "step": 58100 - }, - { - "epoch": 1.49, - "learning_rate": 1.060257394029959e-06, - "loss": 0.521, - "step": 58101 - }, - { - "epoch": 1.49, - "learning_rate": 1.0602297738337474e-06, - "loss": 0.5654, - "step": 58102 - }, - { - "epoch": 1.49, - "learning_rate": 1.0602021535914205e-06, - "loss": 0.6455, - "step": 58103 - }, - { - "epoch": 1.49, - "learning_rate": 1.0601745333029996e-06, - "loss": 0.457, - "step": 58104 - }, - { - "epoch": 1.49, - "learning_rate": 1.060146912968506e-06, - "loss": 0.6436, - "step": 58105 - }, - { - "epoch": 1.49, - "learning_rate": 1.0601192925879606e-06, - "loss": 0.6709, - "step": 58106 - }, - { - "epoch": 1.49, - "learning_rate": 1.0600916721613846e-06, - "loss": 0.6943, - "step": 58107 - }, - { - "epoch": 1.49, - "learning_rate": 1.0600640516887993e-06, - "loss": 0.5928, - "step": 58108 - }, - { - "epoch": 1.49, - "learning_rate": 1.0600364311702254e-06, - "loss": 0.6221, - "step": 58109 - }, - { - "epoch": 1.49, - "learning_rate": 1.0600088106056849e-06, - "loss": 0.748, - "step": 58110 - }, - { - "epoch": 1.49, - "learning_rate": 1.0599811899951977e-06, - "loss": 0.5771, - "step": 58111 - }, - { - "epoch": 1.49, - "learning_rate": 1.0599535693387861e-06, - "loss": 0.6387, - "step": 58112 - }, - { - "epoch": 1.49, - "learning_rate": 1.0599259486364706e-06, - "loss": 0.7598, - "step": 58113 - }, - { - "epoch": 1.49, - "learning_rate": 1.0598983278882728e-06, - "loss": 0.6128, - "step": 58114 - }, - { - "epoch": 1.49, - "learning_rate": 1.0598707070942137e-06, - "loss": 0.6221, - "step": 58115 - }, - { - "epoch": 1.49, - "learning_rate": 1.059843086254314e-06, - "loss": 0.5803, - "step": 58116 - }, - { - "epoch": 1.49, - "learning_rate": 1.0598154653685954e-06, - "loss": 0.6798, - "step": 58117 - }, - { - "epoch": 1.49, - "learning_rate": 1.0597878444370787e-06, - "loss": 0.6919, - "step": 58118 - }, - { - "epoch": 1.49, - "learning_rate": 1.0597602234597854e-06, - "loss": 0.5869, - "step": 58119 - }, - { - "epoch": 1.49, - "learning_rate": 1.0597326024367364e-06, - "loss": 0.7627, - "step": 58120 - }, - { - "epoch": 1.49, - "learning_rate": 1.0597049813679528e-06, - "loss": 0.7441, - "step": 58121 - }, - { - "epoch": 1.49, - "learning_rate": 1.0596773602534556e-06, - "loss": 0.5972, - "step": 58122 - }, - { - "epoch": 1.49, - "learning_rate": 1.0596497390932667e-06, - "loss": 0.7783, - "step": 58123 - }, - { - "epoch": 1.49, - "learning_rate": 1.0596221178874062e-06, - "loss": 0.5428, - "step": 58124 - }, - { - "epoch": 1.49, - "learning_rate": 1.0595944966358966e-06, - "loss": 0.8584, - "step": 58125 - }, - { - "epoch": 1.49, - "learning_rate": 1.0595668753387575e-06, - "loss": 0.6978, - "step": 58126 - }, - { - "epoch": 1.49, - "learning_rate": 1.059539253996011e-06, - "loss": 0.6934, - "step": 58127 - }, - { - "epoch": 1.49, - "learning_rate": 1.0595116326076778e-06, - "loss": 0.7344, - "step": 58128 - }, - { - "epoch": 1.49, - "learning_rate": 1.0594840111737797e-06, - "loss": 0.709, - "step": 58129 - }, - { - "epoch": 1.49, - "learning_rate": 1.0594563896943373e-06, - "loss": 0.8003, - "step": 58130 - }, - { - "epoch": 1.49, - "learning_rate": 1.0594287681693718e-06, - "loss": 0.6631, - "step": 58131 - }, - { - "epoch": 1.49, - "learning_rate": 1.0594011465989043e-06, - "loss": 0.5277, - "step": 58132 - }, - { - "epoch": 1.49, - "learning_rate": 1.0593735249829564e-06, - "loss": 0.5554, - "step": 58133 - }, - { - "epoch": 1.49, - "learning_rate": 1.0593459033215487e-06, - "loss": 0.6953, - "step": 58134 - }, - { - "epoch": 1.49, - "learning_rate": 1.0593182816147025e-06, - "loss": 0.584, - "step": 58135 - }, - { - "epoch": 1.49, - "learning_rate": 1.059290659862439e-06, - "loss": 0.749, - "step": 58136 - }, - { - "epoch": 1.49, - "learning_rate": 1.0592630380647797e-06, - "loss": 0.5386, - "step": 58137 - }, - { - "epoch": 1.49, - "learning_rate": 1.059235416221745e-06, - "loss": 0.5209, - "step": 58138 - }, - { - "epoch": 1.49, - "learning_rate": 1.0592077943333569e-06, - "loss": 0.563, - "step": 58139 - }, - { - "epoch": 1.49, - "learning_rate": 1.059180172399636e-06, - "loss": 0.7725, - "step": 58140 - }, - { - "epoch": 1.49, - "learning_rate": 1.0591525504206033e-06, - "loss": 0.7773, - "step": 58141 - }, - { - "epoch": 1.49, - "learning_rate": 1.0591249283962805e-06, - "loss": 0.6562, - "step": 58142 - }, - { - "epoch": 1.49, - "learning_rate": 1.0590973063266882e-06, - "loss": 0.6162, - "step": 58143 - }, - { - "epoch": 1.49, - "learning_rate": 1.059069684211848e-06, - "loss": 0.708, - "step": 58144 - }, - { - "epoch": 1.49, - "learning_rate": 1.0590420620517809e-06, - "loss": 0.6655, - "step": 58145 - }, - { - "epoch": 1.49, - "learning_rate": 1.059014439846508e-06, - "loss": 0.7754, - "step": 58146 - }, - { - "epoch": 1.49, - "learning_rate": 1.0589868175960502e-06, - "loss": 0.6069, - "step": 58147 - }, - { - "epoch": 1.49, - "learning_rate": 1.058959195300429e-06, - "loss": 0.6992, - "step": 58148 - }, - { - "epoch": 1.49, - "learning_rate": 1.0589315729596654e-06, - "loss": 0.6294, - "step": 58149 - }, - { - "epoch": 1.49, - "learning_rate": 1.0589039505737808e-06, - "loss": 0.609, - "step": 58150 - }, - { - "epoch": 1.49, - "learning_rate": 1.0588763281427962e-06, - "loss": 0.5664, - "step": 58151 - }, - { - "epoch": 1.49, - "learning_rate": 1.0588487056667326e-06, - "loss": 0.7832, - "step": 58152 - }, - { - "epoch": 1.49, - "learning_rate": 1.058821083145611e-06, - "loss": 0.7549, - "step": 58153 - }, - { - "epoch": 1.49, - "learning_rate": 1.0587934605794533e-06, - "loss": 0.6377, - "step": 58154 - }, - { - "epoch": 1.49, - "learning_rate": 1.0587658379682798e-06, - "loss": 0.8076, - "step": 58155 - }, - { - "epoch": 1.49, - "learning_rate": 1.0587382153121123e-06, - "loss": 0.446, - "step": 58156 - }, - { - "epoch": 1.49, - "learning_rate": 1.0587105926109712e-06, - "loss": 0.7617, - "step": 58157 - }, - { - "epoch": 1.49, - "learning_rate": 1.0586829698648785e-06, - "loss": 0.5039, - "step": 58158 - }, - { - "epoch": 1.49, - "learning_rate": 1.0586553470738545e-06, - "loss": 0.6016, - "step": 58159 - }, - { - "epoch": 1.49, - "learning_rate": 1.058627724237921e-06, - "loss": 0.7119, - "step": 58160 - }, - { - "epoch": 1.49, - "learning_rate": 1.0586001013570993e-06, - "loss": 0.6748, - "step": 58161 - }, - { - "epoch": 1.49, - "learning_rate": 1.0585724784314098e-06, - "loss": 0.625, - "step": 58162 - }, - { - "epoch": 1.49, - "learning_rate": 1.0585448554608743e-06, - "loss": 0.5459, - "step": 58163 - }, - { - "epoch": 1.49, - "learning_rate": 1.0585172324455134e-06, - "loss": 0.791, - "step": 58164 - }, - { - "epoch": 1.49, - "learning_rate": 1.058489609385349e-06, - "loss": 0.5205, - "step": 58165 - }, - { - "epoch": 1.49, - "learning_rate": 1.0584619862804014e-06, - "loss": 0.7998, - "step": 58166 - }, - { - "epoch": 1.49, - "learning_rate": 1.0584343631306922e-06, - "loss": 0.6865, - "step": 58167 - }, - { - "epoch": 1.49, - "learning_rate": 1.0584067399362423e-06, - "loss": 0.6543, - "step": 58168 - }, - { - "epoch": 1.49, - "learning_rate": 1.0583791166970735e-06, - "loss": 0.771, - "step": 58169 - }, - { - "epoch": 1.49, - "learning_rate": 1.0583514934132062e-06, - "loss": 0.7197, - "step": 58170 - }, - { - "epoch": 1.49, - "learning_rate": 1.058323870084662e-06, - "loss": 0.647, - "step": 58171 - }, - { - "epoch": 1.49, - "learning_rate": 1.0582962467114618e-06, - "loss": 0.5942, - "step": 58172 - }, - { - "epoch": 1.49, - "learning_rate": 1.0582686232936268e-06, - "loss": 0.6523, - "step": 58173 - }, - { - "epoch": 1.49, - "learning_rate": 1.0582409998311782e-06, - "loss": 0.5836, - "step": 58174 - }, - { - "epoch": 1.49, - "learning_rate": 1.0582133763241376e-06, - "loss": 0.4434, - "step": 58175 - }, - { - "epoch": 1.49, - "learning_rate": 1.058185752772525e-06, - "loss": 0.5903, - "step": 58176 - }, - { - "epoch": 1.49, - "learning_rate": 1.0581581291763628e-06, - "loss": 0.5986, - "step": 58177 - }, - { - "epoch": 1.49, - "learning_rate": 1.0581305055356711e-06, - "loss": 0.5933, - "step": 58178 - }, - { - "epoch": 1.49, - "learning_rate": 1.058102881850472e-06, - "loss": 0.6445, - "step": 58179 - }, - { - "epoch": 1.49, - "learning_rate": 1.058075258120786e-06, - "loss": 0.7559, - "step": 58180 - }, - { - "epoch": 1.49, - "learning_rate": 1.0580476343466343e-06, - "loss": 0.7251, - "step": 58181 - }, - { - "epoch": 1.49, - "learning_rate": 1.0580200105280383e-06, - "loss": 0.6865, - "step": 58182 - }, - { - "epoch": 1.49, - "learning_rate": 1.057992386665019e-06, - "loss": 0.623, - "step": 58183 - }, - { - "epoch": 1.49, - "learning_rate": 1.0579647627575979e-06, - "loss": 0.7988, - "step": 58184 - }, - { - "epoch": 1.49, - "learning_rate": 1.0579371388057957e-06, - "loss": 0.5908, - "step": 58185 - }, - { - "epoch": 1.49, - "learning_rate": 1.0579095148096335e-06, - "loss": 0.7129, - "step": 58186 - }, - { - "epoch": 1.49, - "learning_rate": 1.0578818907691326e-06, - "loss": 0.7676, - "step": 58187 - }, - { - "epoch": 1.49, - "learning_rate": 1.0578542666843145e-06, - "loss": 0.5232, - "step": 58188 - }, - { - "epoch": 1.49, - "learning_rate": 1.0578266425551995e-06, - "loss": 0.6567, - "step": 58189 - }, - { - "epoch": 1.49, - "learning_rate": 1.0577990183818102e-06, - "loss": 0.5382, - "step": 58190 - }, - { - "epoch": 1.49, - "learning_rate": 1.0577713941641663e-06, - "loss": 0.584, - "step": 58191 - }, - { - "epoch": 1.49, - "learning_rate": 1.0577437699022895e-06, - "loss": 0.75, - "step": 58192 - }, - { - "epoch": 1.49, - "learning_rate": 1.057716145596201e-06, - "loss": 0.5786, - "step": 58193 - }, - { - "epoch": 1.49, - "learning_rate": 1.0576885212459219e-06, - "loss": 0.5837, - "step": 58194 - }, - { - "epoch": 1.49, - "learning_rate": 1.0576608968514734e-06, - "loss": 0.4268, - "step": 58195 - }, - { - "epoch": 1.49, - "learning_rate": 1.0576332724128767e-06, - "loss": 0.6758, - "step": 58196 - }, - { - "epoch": 1.49, - "learning_rate": 1.0576056479301526e-06, - "loss": 0.6074, - "step": 58197 - }, - { - "epoch": 1.49, - "learning_rate": 1.0575780234033224e-06, - "loss": 0.6953, - "step": 58198 - }, - { - "epoch": 1.49, - "learning_rate": 1.0575503988324076e-06, - "loss": 0.7119, - "step": 58199 - }, - { - "epoch": 1.49, - "learning_rate": 1.0575227742174294e-06, - "loss": 0.6367, - "step": 58200 - }, - { - "epoch": 1.49, - "learning_rate": 1.057495149558408e-06, - "loss": 0.7334, - "step": 58201 - }, - { - "epoch": 1.49, - "learning_rate": 1.0574675248553658e-06, - "loss": 0.485, - "step": 58202 - }, - { - "epoch": 1.49, - "learning_rate": 1.057439900108323e-06, - "loss": 0.4888, - "step": 58203 - }, - { - "epoch": 1.49, - "learning_rate": 1.057412275317301e-06, - "loss": 0.4397, - "step": 58204 - }, - { - "epoch": 1.49, - "learning_rate": 1.0573846504823216e-06, - "loss": 0.7412, - "step": 58205 - }, - { - "epoch": 1.49, - "learning_rate": 1.0573570256034048e-06, - "loss": 0.5068, - "step": 58206 - }, - { - "epoch": 1.49, - "learning_rate": 1.057329400680573e-06, - "loss": 0.709, - "step": 58207 - }, - { - "epoch": 1.49, - "learning_rate": 1.0573017757138461e-06, - "loss": 0.5859, - "step": 58208 - }, - { - "epoch": 1.49, - "learning_rate": 1.0572741507032462e-06, - "loss": 0.7588, - "step": 58209 - }, - { - "epoch": 1.49, - "learning_rate": 1.057246525648794e-06, - "loss": 0.707, - "step": 58210 - }, - { - "epoch": 1.49, - "learning_rate": 1.0572189005505108e-06, - "loss": 0.4924, - "step": 58211 - }, - { - "epoch": 1.49, - "learning_rate": 1.0571912754084175e-06, - "loss": 0.6816, - "step": 58212 - }, - { - "epoch": 1.49, - "learning_rate": 1.0571636502225358e-06, - "loss": 0.6299, - "step": 58213 - }, - { - "epoch": 1.49, - "learning_rate": 1.0571360249928865e-06, - "loss": 0.4675, - "step": 58214 - }, - { - "epoch": 1.49, - "learning_rate": 1.057108399719491e-06, - "loss": 0.6685, - "step": 58215 - }, - { - "epoch": 1.49, - "learning_rate": 1.0570807744023696e-06, - "loss": 0.5898, - "step": 58216 - }, - { - "epoch": 1.49, - "learning_rate": 1.0570531490415444e-06, - "loss": 0.4187, - "step": 58217 - }, - { - "epoch": 1.49, - "learning_rate": 1.0570255236370363e-06, - "loss": 0.71, - "step": 58218 - }, - { - "epoch": 1.49, - "learning_rate": 1.0569978981888663e-06, - "loss": 0.562, - "step": 58219 - }, - { - "epoch": 1.49, - "learning_rate": 1.0569702726970555e-06, - "loss": 0.6953, - "step": 58220 - }, - { - "epoch": 1.49, - "learning_rate": 1.0569426471616253e-06, - "loss": 0.7031, - "step": 58221 - }, - { - "epoch": 1.49, - "learning_rate": 1.0569150215825968e-06, - "loss": 0.7074, - "step": 58222 - }, - { - "epoch": 1.49, - "learning_rate": 1.056887395959991e-06, - "loss": 0.6631, - "step": 58223 - }, - { - "epoch": 1.49, - "learning_rate": 1.0568597702938291e-06, - "loss": 0.6904, - "step": 58224 - }, - { - "epoch": 1.49, - "learning_rate": 1.0568321445841325e-06, - "loss": 0.5918, - "step": 58225 - }, - { - "epoch": 1.49, - "learning_rate": 1.056804518830922e-06, - "loss": 0.6826, - "step": 58226 - }, - { - "epoch": 1.49, - "learning_rate": 1.056776893034219e-06, - "loss": 0.4463, - "step": 58227 - }, - { - "epoch": 1.49, - "learning_rate": 1.056749267194044e-06, - "loss": 0.7339, - "step": 58228 - }, - { - "epoch": 1.49, - "learning_rate": 1.0567216413104194e-06, - "loss": 0.6143, - "step": 58229 - }, - { - "epoch": 1.49, - "learning_rate": 1.0566940153833654e-06, - "loss": 0.5266, - "step": 58230 - }, - { - "epoch": 1.49, - "learning_rate": 1.0566663894129033e-06, - "loss": 0.645, - "step": 58231 - }, - { - "epoch": 1.49, - "learning_rate": 1.0566387633990545e-06, - "loss": 0.7129, - "step": 58232 - }, - { - "epoch": 1.49, - "learning_rate": 1.0566111373418399e-06, - "loss": 0.7285, - "step": 58233 - }, - { - "epoch": 1.49, - "learning_rate": 1.0565835112412807e-06, - "loss": 0.5386, - "step": 58234 - }, - { - "epoch": 1.49, - "learning_rate": 1.0565558850973983e-06, - "loss": 0.708, - "step": 58235 - }, - { - "epoch": 1.49, - "learning_rate": 1.0565282589102135e-06, - "loss": 0.9082, - "step": 58236 - }, - { - "epoch": 1.49, - "learning_rate": 1.0565006326797477e-06, - "loss": 0.5706, - "step": 58237 - }, - { - "epoch": 1.49, - "learning_rate": 1.056473006406022e-06, - "loss": 0.6719, - "step": 58238 - }, - { - "epoch": 1.49, - "learning_rate": 1.056445380089057e-06, - "loss": 0.6797, - "step": 58239 - }, - { - "epoch": 1.49, - "learning_rate": 1.0564177537288751e-06, - "loss": 0.6616, - "step": 58240 - }, - { - "epoch": 1.49, - "learning_rate": 1.0563901273254966e-06, - "loss": 0.7139, - "step": 58241 - }, - { - "epoch": 1.49, - "learning_rate": 1.0563625008789425e-06, - "loss": 0.8149, - "step": 58242 - }, - { - "epoch": 1.49, - "learning_rate": 1.0563348743892341e-06, - "loss": 0.7969, - "step": 58243 - }, - { - "epoch": 1.49, - "learning_rate": 1.056307247856393e-06, - "loss": 0.6279, - "step": 58244 - }, - { - "epoch": 1.49, - "learning_rate": 1.0562796212804401e-06, - "loss": 0.7754, - "step": 58245 - }, - { - "epoch": 1.49, - "learning_rate": 1.0562519946613964e-06, - "loss": 0.6475, - "step": 58246 - }, - { - "epoch": 1.49, - "learning_rate": 1.0562243679992828e-06, - "loss": 0.624, - "step": 58247 - }, - { - "epoch": 1.49, - "learning_rate": 1.056196741294121e-06, - "loss": 0.7363, - "step": 58248 - }, - { - "epoch": 1.49, - "learning_rate": 1.056169114545932e-06, - "loss": 0.9355, - "step": 58249 - }, - { - "epoch": 1.49, - "learning_rate": 1.0561414877547368e-06, - "loss": 0.4019, - "step": 58250 - }, - { - "epoch": 1.49, - "learning_rate": 1.056113860920557e-06, - "loss": 0.792, - "step": 58251 - }, - { - "epoch": 1.49, - "learning_rate": 1.0560862340434127e-06, - "loss": 0.7158, - "step": 58252 - }, - { - "epoch": 1.49, - "learning_rate": 1.0560586071233263e-06, - "loss": 0.7578, - "step": 58253 - }, - { - "epoch": 1.49, - "learning_rate": 1.0560309801603182e-06, - "loss": 0.645, - "step": 58254 - }, - { - "epoch": 1.49, - "learning_rate": 1.0560033531544102e-06, - "loss": 0.7188, - "step": 58255 - }, - { - "epoch": 1.49, - "learning_rate": 1.0559757261056224e-06, - "loss": 0.6533, - "step": 58256 - }, - { - "epoch": 1.49, - "learning_rate": 1.055948099013977e-06, - "loss": 0.6089, - "step": 58257 - }, - { - "epoch": 1.49, - "learning_rate": 1.0559204718794942e-06, - "loss": 0.6748, - "step": 58258 - }, - { - "epoch": 1.49, - "learning_rate": 1.055892844702196e-06, - "loss": 0.749, - "step": 58259 - }, - { - "epoch": 1.49, - "learning_rate": 1.0558652174821033e-06, - "loss": 0.7656, - "step": 58260 - }, - { - "epoch": 1.49, - "learning_rate": 1.055837590219237e-06, - "loss": 0.5234, - "step": 58261 - }, - { - "epoch": 1.49, - "learning_rate": 1.0558099629136183e-06, - "loss": 0.6016, - "step": 58262 - }, - { - "epoch": 1.49, - "learning_rate": 1.0557823355652686e-06, - "loss": 0.6201, - "step": 58263 - }, - { - "epoch": 1.49, - "learning_rate": 1.0557547081742088e-06, - "loss": 0.6597, - "step": 58264 - }, - { - "epoch": 1.49, - "learning_rate": 1.0557270807404608e-06, - "loss": 0.5327, - "step": 58265 - }, - { - "epoch": 1.49, - "learning_rate": 1.0556994532640447e-06, - "loss": 0.5654, - "step": 58266 - }, - { - "epoch": 1.49, - "learning_rate": 1.0556718257449819e-06, - "loss": 0.4829, - "step": 58267 - }, - { - "epoch": 1.49, - "learning_rate": 1.055644198183294e-06, - "loss": 0.6851, - "step": 58268 - }, - { - "epoch": 1.49, - "learning_rate": 1.055616570579002e-06, - "loss": 0.8701, - "step": 58269 - }, - { - "epoch": 1.49, - "learning_rate": 1.0555889429321267e-06, - "loss": 0.5017, - "step": 58270 - }, - { - "epoch": 1.49, - "learning_rate": 1.0555613152426894e-06, - "loss": 0.479, - "step": 58271 - }, - { - "epoch": 1.49, - "learning_rate": 1.0555336875107115e-06, - "loss": 0.8398, - "step": 58272 - }, - { - "epoch": 1.49, - "learning_rate": 1.0555060597362143e-06, - "loss": 0.6182, - "step": 58273 - }, - { - "epoch": 1.49, - "learning_rate": 1.0554784319192183e-06, - "loss": 0.8008, - "step": 58274 - }, - { - "epoch": 1.49, - "learning_rate": 1.055450804059745e-06, - "loss": 0.6279, - "step": 58275 - }, - { - "epoch": 1.49, - "learning_rate": 1.0554231761578159e-06, - "loss": 0.4871, - "step": 58276 - }, - { - "epoch": 1.49, - "learning_rate": 1.0553955482134513e-06, - "loss": 0.7476, - "step": 58277 - }, - { - "epoch": 1.49, - "learning_rate": 1.0553679202266734e-06, - "loss": 0.7451, - "step": 58278 - }, - { - "epoch": 1.49, - "learning_rate": 1.0553402921975024e-06, - "loss": 0.665, - "step": 58279 - }, - { - "epoch": 1.49, - "learning_rate": 1.0553126641259604e-06, - "loss": 0.6069, - "step": 58280 - }, - { - "epoch": 1.49, - "learning_rate": 1.0552850360120675e-06, - "loss": 0.6782, - "step": 58281 - }, - { - "epoch": 1.49, - "learning_rate": 1.0552574078558457e-06, - "loss": 0.3735, - "step": 58282 - }, - { - "epoch": 1.49, - "learning_rate": 1.0552297796573158e-06, - "loss": 0.709, - "step": 58283 - }, - { - "epoch": 1.49, - "learning_rate": 1.055202151416499e-06, - "loss": 0.6494, - "step": 58284 - }, - { - "epoch": 1.49, - "learning_rate": 1.0551745231334165e-06, - "loss": 0.5156, - "step": 58285 - }, - { - "epoch": 1.49, - "learning_rate": 1.0551468948080893e-06, - "loss": 0.5635, - "step": 58286 - }, - { - "epoch": 1.49, - "learning_rate": 1.0551192664405385e-06, - "loss": 0.6831, - "step": 58287 - }, - { - "epoch": 1.49, - "learning_rate": 1.0550916380307856e-06, - "loss": 0.5298, - "step": 58288 - }, - { - "epoch": 1.49, - "learning_rate": 1.0550640095788516e-06, - "loss": 0.7158, - "step": 58289 - }, - { - "epoch": 1.49, - "learning_rate": 1.0550363810847577e-06, - "loss": 0.7559, - "step": 58290 - }, - { - "epoch": 1.49, - "learning_rate": 1.055008752548525e-06, - "loss": 0.665, - "step": 58291 - }, - { - "epoch": 1.49, - "learning_rate": 1.0549811239701745e-06, - "loss": 0.6416, - "step": 58292 - }, - { - "epoch": 1.49, - "learning_rate": 1.0549534953497272e-06, - "loss": 0.6016, - "step": 58293 - }, - { - "epoch": 1.49, - "learning_rate": 1.0549258666872049e-06, - "loss": 0.7432, - "step": 58294 - }, - { - "epoch": 1.49, - "learning_rate": 1.0548982379826284e-06, - "loss": 0.5854, - "step": 58295 - }, - { - "epoch": 1.49, - "learning_rate": 1.0548706092360184e-06, - "loss": 0.5308, - "step": 58296 - }, - { - "epoch": 1.49, - "learning_rate": 1.054842980447397e-06, - "loss": 0.4374, - "step": 58297 - }, - { - "epoch": 1.49, - "learning_rate": 1.0548153516167846e-06, - "loss": 0.5562, - "step": 58298 - }, - { - "epoch": 1.49, - "learning_rate": 1.0547877227442027e-06, - "loss": 0.4853, - "step": 58299 - }, - { - "epoch": 1.49, - "learning_rate": 1.0547600938296724e-06, - "loss": 0.8037, - "step": 58300 - }, - { - "epoch": 1.49, - "learning_rate": 1.054732464873215e-06, - "loss": 0.6055, - "step": 58301 - }, - { - "epoch": 1.49, - "learning_rate": 1.0547048358748509e-06, - "loss": 0.6455, - "step": 58302 - }, - { - "epoch": 1.49, - "learning_rate": 1.0546772068346025e-06, - "loss": 0.479, - "step": 58303 - }, - { - "epoch": 1.49, - "learning_rate": 1.0546495777524894e-06, - "loss": 0.5101, - "step": 58304 - }, - { - "epoch": 1.49, - "learning_rate": 1.0546219486285347e-06, - "loss": 0.749, - "step": 58305 - }, - { - "epoch": 1.49, - "learning_rate": 1.0545943194627579e-06, - "loss": 0.6709, - "step": 58306 - }, - { - "epoch": 1.49, - "learning_rate": 1.0545666902551806e-06, - "loss": 0.6973, - "step": 58307 - }, - { - "epoch": 1.49, - "learning_rate": 1.0545390610058241e-06, - "loss": 0.6108, - "step": 58308 - }, - { - "epoch": 1.49, - "learning_rate": 1.05451143171471e-06, - "loss": 0.6055, - "step": 58309 - }, - { - "epoch": 1.49, - "learning_rate": 1.0544838023818587e-06, - "loss": 0.6406, - "step": 58310 - }, - { - "epoch": 1.49, - "learning_rate": 1.0544561730072919e-06, - "loss": 0.7979, - "step": 58311 - }, - { - "epoch": 1.49, - "learning_rate": 1.05442854359103e-06, - "loss": 0.5227, - "step": 58312 - }, - { - "epoch": 1.49, - "learning_rate": 1.054400914133095e-06, - "loss": 0.531, - "step": 58313 - }, - { - "epoch": 1.49, - "learning_rate": 1.0543732846335077e-06, - "loss": 0.7109, - "step": 58314 - }, - { - "epoch": 1.49, - "learning_rate": 1.0543456550922892e-06, - "loss": 0.6606, - "step": 58315 - }, - { - "epoch": 1.49, - "learning_rate": 1.0543180255094607e-06, - "loss": 0.6846, - "step": 58316 - }, - { - "epoch": 1.49, - "learning_rate": 1.0542903958850438e-06, - "loss": 0.4963, - "step": 58317 - }, - { - "epoch": 1.49, - "learning_rate": 1.0542627662190589e-06, - "loss": 0.7451, - "step": 58318 - }, - { - "epoch": 1.49, - "learning_rate": 1.0542351365115274e-06, - "loss": 0.6392, - "step": 58319 - }, - { - "epoch": 1.49, - "learning_rate": 1.0542075067624708e-06, - "loss": 0.5283, - "step": 58320 - }, - { - "epoch": 1.49, - "learning_rate": 1.0541798769719096e-06, - "loss": 0.4907, - "step": 58321 - }, - { - "epoch": 1.49, - "learning_rate": 1.0541522471398658e-06, - "loss": 0.6709, - "step": 58322 - }, - { - "epoch": 1.49, - "learning_rate": 1.0541246172663597e-06, - "loss": 0.6426, - "step": 58323 - }, - { - "epoch": 1.49, - "learning_rate": 1.0540969873514134e-06, - "loss": 0.5371, - "step": 58324 - }, - { - "epoch": 1.49, - "learning_rate": 1.0540693573950472e-06, - "loss": 0.6685, - "step": 58325 - }, - { - "epoch": 1.49, - "learning_rate": 1.0540417273972826e-06, - "loss": 0.6201, - "step": 58326 - }, - { - "epoch": 1.49, - "learning_rate": 1.0540140973581406e-06, - "loss": 0.5547, - "step": 58327 - }, - { - "epoch": 1.49, - "learning_rate": 1.053986467277643e-06, - "loss": 0.7168, - "step": 58328 - }, - { - "epoch": 1.5, - "learning_rate": 1.0539588371558097e-06, - "loss": 0.606, - "step": 58329 - }, - { - "epoch": 1.5, - "learning_rate": 1.0539312069926634e-06, - "loss": 0.3275, - "step": 58330 - }, - { - "epoch": 1.5, - "learning_rate": 1.053903576788224e-06, - "loss": 0.8062, - "step": 58331 - }, - { - "epoch": 1.5, - "learning_rate": 1.0538759465425131e-06, - "loss": 0.5244, - "step": 58332 - }, - { - "epoch": 1.5, - "learning_rate": 1.0538483162555516e-06, - "loss": 0.7559, - "step": 58333 - }, - { - "epoch": 1.5, - "learning_rate": 1.0538206859273615e-06, - "loss": 0.4357, - "step": 58334 - }, - { - "epoch": 1.5, - "learning_rate": 1.0537930555579631e-06, - "loss": 0.5488, - "step": 58335 - }, - { - "epoch": 1.5, - "learning_rate": 1.053765425147378e-06, - "loss": 0.6025, - "step": 58336 - }, - { - "epoch": 1.5, - "learning_rate": 1.0537377946956267e-06, - "loss": 0.5386, - "step": 58337 - }, - { - "epoch": 1.5, - "learning_rate": 1.0537101642027312e-06, - "loss": 0.7031, - "step": 58338 - }, - { - "epoch": 1.5, - "learning_rate": 1.0536825336687122e-06, - "loss": 0.5957, - "step": 58339 - }, - { - "epoch": 1.5, - "learning_rate": 1.053654903093591e-06, - "loss": 0.53, - "step": 58340 - }, - { - "epoch": 1.5, - "learning_rate": 1.0536272724773888e-06, - "loss": 0.6128, - "step": 58341 - }, - { - "epoch": 1.5, - "learning_rate": 1.0535996418201266e-06, - "loss": 0.7031, - "step": 58342 - }, - { - "epoch": 1.5, - "learning_rate": 1.0535720111218255e-06, - "loss": 0.6494, - "step": 58343 - }, - { - "epoch": 1.5, - "learning_rate": 1.0535443803825067e-06, - "loss": 0.6904, - "step": 58344 - }, - { - "epoch": 1.5, - "learning_rate": 1.0535167496021922e-06, - "loss": 0.6084, - "step": 58345 - }, - { - "epoch": 1.5, - "learning_rate": 1.0534891187809016e-06, - "loss": 0.8672, - "step": 58346 - }, - { - "epoch": 1.5, - "learning_rate": 1.0534614879186569e-06, - "loss": 0.6631, - "step": 58347 - }, - { - "epoch": 1.5, - "learning_rate": 1.0534338570154794e-06, - "loss": 0.6406, - "step": 58348 - }, - { - "epoch": 1.5, - "learning_rate": 1.0534062260713901e-06, - "loss": 0.5269, - "step": 58349 - }, - { - "epoch": 1.5, - "learning_rate": 1.05337859508641e-06, - "loss": 0.502, - "step": 58350 - }, - { - "epoch": 1.5, - "learning_rate": 1.0533509640605605e-06, - "loss": 0.668, - "step": 58351 - }, - { - "epoch": 1.5, - "learning_rate": 1.0533233329938622e-06, - "loss": 0.8418, - "step": 58352 - }, - { - "epoch": 1.5, - "learning_rate": 1.053295701886337e-06, - "loss": 0.5957, - "step": 58353 - }, - { - "epoch": 1.5, - "learning_rate": 1.0532680707380058e-06, - "loss": 0.7471, - "step": 58354 - }, - { - "epoch": 1.5, - "learning_rate": 1.0532404395488896e-06, - "loss": 0.7188, - "step": 58355 - }, - { - "epoch": 1.5, - "learning_rate": 1.0532128083190096e-06, - "loss": 0.6108, - "step": 58356 - }, - { - "epoch": 1.5, - "learning_rate": 1.053185177048387e-06, - "loss": 0.5371, - "step": 58357 - }, - { - "epoch": 1.5, - "learning_rate": 1.053157545737043e-06, - "loss": 0.6167, - "step": 58358 - }, - { - "epoch": 1.5, - "learning_rate": 1.0531299143849985e-06, - "loss": 0.7061, - "step": 58359 - }, - { - "epoch": 1.5, - "learning_rate": 1.0531022829922753e-06, - "loss": 0.5898, - "step": 58360 - }, - { - "epoch": 1.5, - "learning_rate": 1.0530746515588937e-06, - "loss": 0.7451, - "step": 58361 - }, - { - "epoch": 1.5, - "learning_rate": 1.0530470200848755e-06, - "loss": 0.7266, - "step": 58362 - }, - { - "epoch": 1.5, - "learning_rate": 1.0530193885702416e-06, - "loss": 0.6211, - "step": 58363 - }, - { - "epoch": 1.5, - "learning_rate": 1.0529917570150132e-06, - "loss": 0.6328, - "step": 58364 - }, - { - "epoch": 1.5, - "learning_rate": 1.0529641254192113e-06, - "loss": 0.71, - "step": 58365 - }, - { - "epoch": 1.5, - "learning_rate": 1.0529364937828575e-06, - "loss": 0.5649, - "step": 58366 - }, - { - "epoch": 1.5, - "learning_rate": 1.0529088621059724e-06, - "loss": 0.7007, - "step": 58367 - }, - { - "epoch": 1.5, - "learning_rate": 1.0528812303885776e-06, - "loss": 0.6582, - "step": 58368 - }, - { - "epoch": 1.5, - "learning_rate": 1.052853598630694e-06, - "loss": 0.5229, - "step": 58369 - }, - { - "epoch": 1.5, - "learning_rate": 1.052825966832343e-06, - "loss": 0.5342, - "step": 58370 - }, - { - "epoch": 1.5, - "learning_rate": 1.0527983349935453e-06, - "loss": 0.5176, - "step": 58371 - }, - { - "epoch": 1.5, - "learning_rate": 1.0527707031143224e-06, - "loss": 0.6494, - "step": 58372 - }, - { - "epoch": 1.5, - "learning_rate": 1.0527430711946954e-06, - "loss": 0.7686, - "step": 58373 - }, - { - "epoch": 1.5, - "learning_rate": 1.0527154392346858e-06, - "loss": 0.79, - "step": 58374 - }, - { - "epoch": 1.5, - "learning_rate": 1.052687807234314e-06, - "loss": 0.5869, - "step": 58375 - }, - { - "epoch": 1.5, - "learning_rate": 1.0526601751936018e-06, - "loss": 0.6963, - "step": 58376 - }, - { - "epoch": 1.5, - "learning_rate": 1.0526325431125697e-06, - "loss": 0.6631, - "step": 58377 - }, - { - "epoch": 1.5, - "learning_rate": 1.0526049109912396e-06, - "loss": 0.6562, - "step": 58378 - }, - { - "epoch": 1.5, - "learning_rate": 1.0525772788296326e-06, - "loss": 0.5176, - "step": 58379 - }, - { - "epoch": 1.5, - "learning_rate": 1.0525496466277693e-06, - "loss": 0.6836, - "step": 58380 - }, - { - "epoch": 1.5, - "learning_rate": 1.052522014385671e-06, - "loss": 0.6465, - "step": 58381 - }, - { - "epoch": 1.5, - "learning_rate": 1.0524943821033592e-06, - "loss": 0.3567, - "step": 58382 - }, - { - "epoch": 1.5, - "learning_rate": 1.0524667497808548e-06, - "loss": 0.7266, - "step": 58383 - }, - { - "epoch": 1.5, - "learning_rate": 1.052439117418179e-06, - "loss": 0.7344, - "step": 58384 - }, - { - "epoch": 1.5, - "learning_rate": 1.0524114850153532e-06, - "loss": 0.6719, - "step": 58385 - }, - { - "epoch": 1.5, - "learning_rate": 1.0523838525723981e-06, - "loss": 0.5991, - "step": 58386 - }, - { - "epoch": 1.5, - "learning_rate": 1.0523562200893352e-06, - "loss": 0.6299, - "step": 58387 - }, - { - "epoch": 1.5, - "learning_rate": 1.0523285875661853e-06, - "loss": 0.5327, - "step": 58388 - }, - { - "epoch": 1.5, - "learning_rate": 1.0523009550029704e-06, - "loss": 0.6558, - "step": 58389 - }, - { - "epoch": 1.5, - "learning_rate": 1.0522733223997105e-06, - "loss": 0.6025, - "step": 58390 - }, - { - "epoch": 1.5, - "learning_rate": 1.0522456897564276e-06, - "loss": 0.7576, - "step": 58391 - }, - { - "epoch": 1.5, - "learning_rate": 1.0522180570731424e-06, - "loss": 0.6602, - "step": 58392 - }, - { - "epoch": 1.5, - "learning_rate": 1.0521904243498765e-06, - "loss": 0.7266, - "step": 58393 - }, - { - "epoch": 1.5, - "learning_rate": 1.0521627915866507e-06, - "loss": 0.4976, - "step": 58394 - }, - { - "epoch": 1.5, - "learning_rate": 1.0521351587834861e-06, - "loss": 0.5437, - "step": 58395 - }, - { - "epoch": 1.5, - "learning_rate": 1.052107525940404e-06, - "loss": 0.6641, - "step": 58396 - }, - { - "epoch": 1.5, - "learning_rate": 1.0520798930574257e-06, - "loss": 0.7031, - "step": 58397 - }, - { - "epoch": 1.5, - "learning_rate": 1.052052260134572e-06, - "loss": 0.542, - "step": 58398 - }, - { - "epoch": 1.5, - "learning_rate": 1.0520246271718646e-06, - "loss": 0.6348, - "step": 58399 - }, - { - "epoch": 1.5, - "learning_rate": 1.0519969941693242e-06, - "loss": 0.6953, - "step": 58400 - }, - { - "epoch": 1.5, - "learning_rate": 1.0519693611269721e-06, - "loss": 0.5923, - "step": 58401 - }, - { - "epoch": 1.5, - "learning_rate": 1.0519417280448292e-06, - "loss": 0.7402, - "step": 58402 - }, - { - "epoch": 1.5, - "learning_rate": 1.0519140949229173e-06, - "loss": 0.6699, - "step": 58403 - }, - { - "epoch": 1.5, - "learning_rate": 1.051886461761257e-06, - "loss": 0.7725, - "step": 58404 - }, - { - "epoch": 1.5, - "learning_rate": 1.0518588285598695e-06, - "loss": 0.5859, - "step": 58405 - }, - { - "epoch": 1.5, - "learning_rate": 1.0518311953187762e-06, - "loss": 0.6069, - "step": 58406 - }, - { - "epoch": 1.5, - "learning_rate": 1.0518035620379981e-06, - "loss": 0.6616, - "step": 58407 - }, - { - "epoch": 1.5, - "learning_rate": 1.0517759287175565e-06, - "loss": 0.4846, - "step": 58408 - }, - { - "epoch": 1.5, - "learning_rate": 1.0517482953574722e-06, - "loss": 0.4429, - "step": 58409 - }, - { - "epoch": 1.5, - "learning_rate": 1.051720661957767e-06, - "loss": 0.7173, - "step": 58410 - }, - { - "epoch": 1.5, - "learning_rate": 1.0516930285184614e-06, - "loss": 0.5498, - "step": 58411 - }, - { - "epoch": 1.5, - "learning_rate": 1.051665395039577e-06, - "loss": 0.5005, - "step": 58412 - }, - { - "epoch": 1.5, - "learning_rate": 1.0516377615211346e-06, - "loss": 0.7881, - "step": 58413 - }, - { - "epoch": 1.5, - "learning_rate": 1.0516101279631557e-06, - "loss": 0.5669, - "step": 58414 - }, - { - "epoch": 1.5, - "learning_rate": 1.051582494365661e-06, - "loss": 0.8184, - "step": 58415 - }, - { - "epoch": 1.5, - "learning_rate": 1.0515548607286723e-06, - "loss": 0.481, - "step": 58416 - }, - { - "epoch": 1.5, - "learning_rate": 1.0515272270522103e-06, - "loss": 0.6465, - "step": 58417 - }, - { - "epoch": 1.5, - "learning_rate": 1.0514995933362961e-06, - "loss": 0.5596, - "step": 58418 - }, - { - "epoch": 1.5, - "learning_rate": 1.0514719595809514e-06, - "loss": 0.4922, - "step": 58419 - }, - { - "epoch": 1.5, - "learning_rate": 1.0514443257861967e-06, - "loss": 0.5581, - "step": 58420 - }, - { - "epoch": 1.5, - "learning_rate": 1.0514166919520533e-06, - "loss": 0.6582, - "step": 58421 - }, - { - "epoch": 1.5, - "learning_rate": 1.051389058078543e-06, - "loss": 0.6973, - "step": 58422 - }, - { - "epoch": 1.5, - "learning_rate": 1.0513614241656858e-06, - "loss": 0.7744, - "step": 58423 - }, - { - "epoch": 1.5, - "learning_rate": 1.051333790213504e-06, - "loss": 0.7041, - "step": 58424 - }, - { - "epoch": 1.5, - "learning_rate": 1.0513061562220182e-06, - "loss": 0.5425, - "step": 58425 - }, - { - "epoch": 1.5, - "learning_rate": 1.0512785221912497e-06, - "loss": 0.7051, - "step": 58426 - }, - { - "epoch": 1.5, - "learning_rate": 1.0512508881212195e-06, - "loss": 0.625, - "step": 58427 - }, - { - "epoch": 1.5, - "learning_rate": 1.0512232540119487e-06, - "loss": 0.5669, - "step": 58428 - }, - { - "epoch": 1.5, - "learning_rate": 1.051195619863459e-06, - "loss": 0.8115, - "step": 58429 - }, - { - "epoch": 1.5, - "learning_rate": 1.0511679856757707e-06, - "loss": 0.709, - "step": 58430 - }, - { - "epoch": 1.5, - "learning_rate": 1.0511403514489056e-06, - "loss": 0.7324, - "step": 58431 - }, - { - "epoch": 1.5, - "learning_rate": 1.0511127171828846e-06, - "loss": 0.752, - "step": 58432 - }, - { - "epoch": 1.5, - "learning_rate": 1.051085082877729e-06, - "loss": 0.5711, - "step": 58433 - }, - { - "epoch": 1.5, - "learning_rate": 1.0510574485334603e-06, - "loss": 0.4685, - "step": 58434 - }, - { - "epoch": 1.5, - "learning_rate": 1.051029814150099e-06, - "loss": 0.5928, - "step": 58435 - }, - { - "epoch": 1.5, - "learning_rate": 1.0510021797276662e-06, - "loss": 0.4385, - "step": 58436 - }, - { - "epoch": 1.5, - "learning_rate": 1.0509745452661838e-06, - "loss": 0.5908, - "step": 58437 - }, - { - "epoch": 1.5, - "learning_rate": 1.0509469107656721e-06, - "loss": 0.7393, - "step": 58438 - }, - { - "epoch": 1.5, - "learning_rate": 1.0509192762261534e-06, - "loss": 0.7256, - "step": 58439 - }, - { - "epoch": 1.5, - "learning_rate": 1.0508916416476474e-06, - "loss": 0.563, - "step": 58440 - }, - { - "epoch": 1.5, - "learning_rate": 1.0508640070301763e-06, - "loss": 0.5493, - "step": 58441 - }, - { - "epoch": 1.5, - "learning_rate": 1.050836372373761e-06, - "loss": 0.7881, - "step": 58442 - }, - { - "epoch": 1.5, - "learning_rate": 1.0508087376784228e-06, - "loss": 0.5332, - "step": 58443 - }, - { - "epoch": 1.5, - "learning_rate": 1.0507811029441823e-06, - "loss": 0.5649, - "step": 58444 - }, - { - "epoch": 1.5, - "learning_rate": 1.0507534681710614e-06, - "loss": 0.7373, - "step": 58445 - }, - { - "epoch": 1.5, - "learning_rate": 1.0507258333590807e-06, - "loss": 0.6641, - "step": 58446 - }, - { - "epoch": 1.5, - "learning_rate": 1.0506981985082617e-06, - "loss": 0.668, - "step": 58447 - }, - { - "epoch": 1.5, - "learning_rate": 1.0506705636186252e-06, - "loss": 0.8242, - "step": 58448 - }, - { - "epoch": 1.5, - "learning_rate": 1.0506429286901928e-06, - "loss": 0.7422, - "step": 58449 - }, - { - "epoch": 1.5, - "learning_rate": 1.0506152937229852e-06, - "loss": 0.4829, - "step": 58450 - }, - { - "epoch": 1.5, - "learning_rate": 1.0505876587170238e-06, - "loss": 0.6865, - "step": 58451 - }, - { - "epoch": 1.5, - "learning_rate": 1.0505600236723302e-06, - "loss": 0.4529, - "step": 58452 - }, - { - "epoch": 1.5, - "learning_rate": 1.0505323885889248e-06, - "loss": 0.6343, - "step": 58453 - }, - { - "epoch": 1.5, - "learning_rate": 1.0505047534668292e-06, - "loss": 0.6841, - "step": 58454 - }, - { - "epoch": 1.5, - "learning_rate": 1.050477118306064e-06, - "loss": 0.6855, - "step": 58455 - }, - { - "epoch": 1.5, - "learning_rate": 1.0504494831066514e-06, - "loss": 0.7075, - "step": 58456 - }, - { - "epoch": 1.5, - "learning_rate": 1.0504218478686116e-06, - "loss": 0.4905, - "step": 58457 - }, - { - "epoch": 1.5, - "learning_rate": 1.050394212591966e-06, - "loss": 0.7246, - "step": 58458 - }, - { - "epoch": 1.5, - "learning_rate": 1.0503665772767362e-06, - "loss": 0.7607, - "step": 58459 - }, - { - "epoch": 1.5, - "learning_rate": 1.050338941922943e-06, - "loss": 0.6377, - "step": 58460 - }, - { - "epoch": 1.5, - "learning_rate": 1.0503113065306073e-06, - "loss": 0.7266, - "step": 58461 - }, - { - "epoch": 1.5, - "learning_rate": 1.0502836710997507e-06, - "loss": 0.6348, - "step": 58462 - }, - { - "epoch": 1.5, - "learning_rate": 1.0502560356303939e-06, - "loss": 0.7598, - "step": 58463 - }, - { - "epoch": 1.5, - "learning_rate": 1.0502284001225591e-06, - "loss": 0.6421, - "step": 58464 - }, - { - "epoch": 1.5, - "learning_rate": 1.0502007645762663e-06, - "loss": 0.5757, - "step": 58465 - }, - { - "epoch": 1.5, - "learning_rate": 1.050173128991537e-06, - "loss": 0.752, - "step": 58466 - }, - { - "epoch": 1.5, - "learning_rate": 1.0501454933683925e-06, - "loss": 0.7529, - "step": 58467 - }, - { - "epoch": 1.5, - "learning_rate": 1.0501178577068539e-06, - "loss": 0.6558, - "step": 58468 - }, - { - "epoch": 1.5, - "learning_rate": 1.0500902220069425e-06, - "loss": 0.5107, - "step": 58469 - }, - { - "epoch": 1.5, - "learning_rate": 1.0500625862686792e-06, - "loss": 0.7188, - "step": 58470 - }, - { - "epoch": 1.5, - "learning_rate": 1.0500349504920851e-06, - "loss": 0.563, - "step": 58471 - }, - { - "epoch": 1.5, - "learning_rate": 1.050007314677182e-06, - "loss": 0.6797, - "step": 58472 - }, - { - "epoch": 1.5, - "learning_rate": 1.0499796788239901e-06, - "loss": 0.665, - "step": 58473 - }, - { - "epoch": 1.5, - "learning_rate": 1.0499520429325312e-06, - "loss": 0.5664, - "step": 58474 - }, - { - "epoch": 1.5, - "learning_rate": 1.0499244070028266e-06, - "loss": 0.7046, - "step": 58475 - }, - { - "epoch": 1.5, - "learning_rate": 1.0498967710348966e-06, - "loss": 0.7495, - "step": 58476 - }, - { - "epoch": 1.5, - "learning_rate": 1.0498691350287636e-06, - "loss": 0.7468, - "step": 58477 - }, - { - "epoch": 1.5, - "learning_rate": 1.0498414989844476e-06, - "loss": 0.5112, - "step": 58478 - }, - { - "epoch": 1.5, - "learning_rate": 1.0498138629019709e-06, - "loss": 0.6641, - "step": 58479 - }, - { - "epoch": 1.5, - "learning_rate": 1.0497862267813533e-06, - "loss": 0.748, - "step": 58480 - }, - { - "epoch": 1.5, - "learning_rate": 1.0497585906226169e-06, - "loss": 0.5366, - "step": 58481 - }, - { - "epoch": 1.5, - "learning_rate": 1.0497309544257826e-06, - "loss": 0.4563, - "step": 58482 - }, - { - "epoch": 1.5, - "learning_rate": 1.049703318190872e-06, - "loss": 0.6519, - "step": 58483 - }, - { - "epoch": 1.5, - "learning_rate": 1.0496756819179053e-06, - "loss": 0.7637, - "step": 58484 - }, - { - "epoch": 1.5, - "learning_rate": 1.0496480456069046e-06, - "loss": 0.6484, - "step": 58485 - }, - { - "epoch": 1.5, - "learning_rate": 1.0496204092578905e-06, - "loss": 0.6177, - "step": 58486 - }, - { - "epoch": 1.5, - "learning_rate": 1.0495927728708845e-06, - "loss": 0.6758, - "step": 58487 - }, - { - "epoch": 1.5, - "learning_rate": 1.049565136445907e-06, - "loss": 0.4912, - "step": 58488 - }, - { - "epoch": 1.5, - "learning_rate": 1.0495374999829807e-06, - "loss": 0.5452, - "step": 58489 - }, - { - "epoch": 1.5, - "learning_rate": 1.0495098634821252e-06, - "loss": 0.5887, - "step": 58490 - }, - { - "epoch": 1.5, - "learning_rate": 1.0494822269433624e-06, - "loss": 0.5928, - "step": 58491 - }, - { - "epoch": 1.5, - "learning_rate": 1.049454590366713e-06, - "loss": 0.7236, - "step": 58492 - }, - { - "epoch": 1.5, - "learning_rate": 1.049426953752199e-06, - "loss": 0.6738, - "step": 58493 - }, - { - "epoch": 1.5, - "learning_rate": 1.049399317099841e-06, - "loss": 0.4467, - "step": 58494 - }, - { - "epoch": 1.5, - "learning_rate": 1.04937168040966e-06, - "loss": 0.5649, - "step": 58495 - }, - { - "epoch": 1.5, - "learning_rate": 1.0493440436816773e-06, - "loss": 0.4194, - "step": 58496 - }, - { - "epoch": 1.5, - "learning_rate": 1.0493164069159144e-06, - "loss": 0.6748, - "step": 58497 - }, - { - "epoch": 1.5, - "learning_rate": 1.049288770112392e-06, - "loss": 0.5095, - "step": 58498 - }, - { - "epoch": 1.5, - "learning_rate": 1.0492611332711319e-06, - "loss": 0.748, - "step": 58499 - }, - { - "epoch": 1.5, - "learning_rate": 1.0492334963921542e-06, - "loss": 0.7246, - "step": 58500 - }, - { - "epoch": 1.5, - "learning_rate": 1.049205859475481e-06, - "loss": 0.6831, - "step": 58501 - }, - { - "epoch": 1.5, - "learning_rate": 1.0491782225211332e-06, - "loss": 0.5317, - "step": 58502 - }, - { - "epoch": 1.5, - "learning_rate": 1.0491505855291316e-06, - "loss": 0.7314, - "step": 58503 - }, - { - "epoch": 1.5, - "learning_rate": 1.0491229484994981e-06, - "loss": 0.6484, - "step": 58504 - }, - { - "epoch": 1.5, - "learning_rate": 1.0490953114322529e-06, - "loss": 0.7314, - "step": 58505 - }, - { - "epoch": 1.5, - "learning_rate": 1.0490676743274181e-06, - "loss": 0.8418, - "step": 58506 - }, - { - "epoch": 1.5, - "learning_rate": 1.0490400371850141e-06, - "loss": 0.666, - "step": 58507 - }, - { - "epoch": 1.5, - "learning_rate": 1.0490124000050626e-06, - "loss": 0.452, - "step": 58508 - }, - { - "epoch": 1.5, - "learning_rate": 1.0489847627875846e-06, - "loss": 0.6348, - "step": 58509 - }, - { - "epoch": 1.5, - "learning_rate": 1.0489571255326012e-06, - "loss": 0.6235, - "step": 58510 - }, - { - "epoch": 1.5, - "learning_rate": 1.0489294882401335e-06, - "loss": 0.5095, - "step": 58511 - }, - { - "epoch": 1.5, - "learning_rate": 1.0489018509102027e-06, - "loss": 0.6445, - "step": 58512 - }, - { - "epoch": 1.5, - "learning_rate": 1.04887421354283e-06, - "loss": 0.5103, - "step": 58513 - }, - { - "epoch": 1.5, - "learning_rate": 1.0488465761380367e-06, - "loss": 0.6973, - "step": 58514 - }, - { - "epoch": 1.5, - "learning_rate": 1.0488189386958436e-06, - "loss": 0.708, - "step": 58515 - }, - { - "epoch": 1.5, - "learning_rate": 1.0487913012162726e-06, - "loss": 0.6338, - "step": 58516 - }, - { - "epoch": 1.5, - "learning_rate": 1.0487636636993437e-06, - "loss": 0.6152, - "step": 58517 - }, - { - "epoch": 1.5, - "learning_rate": 1.048736026145079e-06, - "loss": 0.4949, - "step": 58518 - }, - { - "epoch": 1.5, - "learning_rate": 1.0487083885534996e-06, - "loss": 0.4866, - "step": 58519 - }, - { - "epoch": 1.5, - "learning_rate": 1.0486807509246259e-06, - "loss": 0.5415, - "step": 58520 - }, - { - "epoch": 1.5, - "learning_rate": 1.04865311325848e-06, - "loss": 0.6895, - "step": 58521 - }, - { - "epoch": 1.5, - "learning_rate": 1.0486254755550823e-06, - "loss": 0.5312, - "step": 58522 - }, - { - "epoch": 1.5, - "learning_rate": 1.0485978378144547e-06, - "loss": 0.7021, - "step": 58523 - }, - { - "epoch": 1.5, - "learning_rate": 1.0485702000366178e-06, - "loss": 0.5151, - "step": 58524 - }, - { - "epoch": 1.5, - "learning_rate": 1.048542562221593e-06, - "loss": 0.5029, - "step": 58525 - }, - { - "epoch": 1.5, - "learning_rate": 1.0485149243694012e-06, - "loss": 0.5942, - "step": 58526 - }, - { - "epoch": 1.5, - "learning_rate": 1.0484872864800638e-06, - "loss": 0.5752, - "step": 58527 - }, - { - "epoch": 1.5, - "learning_rate": 1.0484596485536018e-06, - "loss": 0.5535, - "step": 58528 - }, - { - "epoch": 1.5, - "learning_rate": 1.048432010590037e-06, - "loss": 0.6758, - "step": 58529 - }, - { - "epoch": 1.5, - "learning_rate": 1.0484043725893896e-06, - "loss": 0.6392, - "step": 58530 - }, - { - "epoch": 1.5, - "learning_rate": 1.0483767345516813e-06, - "loss": 0.7549, - "step": 58531 - }, - { - "epoch": 1.5, - "learning_rate": 1.0483490964769331e-06, - "loss": 0.6555, - "step": 58532 - }, - { - "epoch": 1.5, - "learning_rate": 1.0483214583651662e-06, - "loss": 0.6724, - "step": 58533 - }, - { - "epoch": 1.5, - "learning_rate": 1.0482938202164021e-06, - "loss": 0.5034, - "step": 58534 - }, - { - "epoch": 1.5, - "learning_rate": 1.0482661820306612e-06, - "loss": 0.6235, - "step": 58535 - }, - { - "epoch": 1.5, - "learning_rate": 1.0482385438079654e-06, - "loss": 0.6943, - "step": 58536 - }, - { - "epoch": 1.5, - "learning_rate": 1.0482109055483355e-06, - "loss": 0.6572, - "step": 58537 - }, - { - "epoch": 1.5, - "learning_rate": 1.0481832672517926e-06, - "loss": 0.5591, - "step": 58538 - }, - { - "epoch": 1.5, - "learning_rate": 1.048155628918358e-06, - "loss": 0.6704, - "step": 58539 - }, - { - "epoch": 1.5, - "learning_rate": 1.0481279905480528e-06, - "loss": 0.6299, - "step": 58540 - }, - { - "epoch": 1.5, - "learning_rate": 1.0481003521408984e-06, - "loss": 0.6289, - "step": 58541 - }, - { - "epoch": 1.5, - "learning_rate": 1.0480727136969156e-06, - "loss": 0.4922, - "step": 58542 - }, - { - "epoch": 1.5, - "learning_rate": 1.048045075216126e-06, - "loss": 0.5938, - "step": 58543 - }, - { - "epoch": 1.5, - "learning_rate": 1.0480174366985503e-06, - "loss": 0.5967, - "step": 58544 - }, - { - "epoch": 1.5, - "learning_rate": 1.04798979814421e-06, - "loss": 0.6548, - "step": 58545 - }, - { - "epoch": 1.5, - "learning_rate": 1.047962159553126e-06, - "loss": 0.5098, - "step": 58546 - }, - { - "epoch": 1.5, - "learning_rate": 1.0479345209253194e-06, - "loss": 0.7256, - "step": 58547 - }, - { - "epoch": 1.5, - "learning_rate": 1.047906882260812e-06, - "loss": 0.6855, - "step": 58548 - }, - { - "epoch": 1.5, - "learning_rate": 1.0478792435596242e-06, - "loss": 0.6299, - "step": 58549 - }, - { - "epoch": 1.5, - "learning_rate": 1.0478516048217775e-06, - "loss": 0.7217, - "step": 58550 - }, - { - "epoch": 1.5, - "learning_rate": 1.0478239660472929e-06, - "loss": 0.6904, - "step": 58551 - }, - { - "epoch": 1.5, - "learning_rate": 1.0477963272361918e-06, - "loss": 0.5503, - "step": 58552 - }, - { - "epoch": 1.5, - "learning_rate": 1.0477686883884951e-06, - "loss": 0.6113, - "step": 58553 - }, - { - "epoch": 1.5, - "learning_rate": 1.0477410495042246e-06, - "loss": 0.5396, - "step": 58554 - }, - { - "epoch": 1.5, - "learning_rate": 1.0477134105834004e-06, - "loss": 0.6748, - "step": 58555 - }, - { - "epoch": 1.5, - "learning_rate": 1.0476857716260447e-06, - "loss": 0.6758, - "step": 58556 - }, - { - "epoch": 1.5, - "learning_rate": 1.0476581326321779e-06, - "loss": 0.605, - "step": 58557 - }, - { - "epoch": 1.5, - "learning_rate": 1.0476304936018215e-06, - "loss": 0.6587, - "step": 58558 - }, - { - "epoch": 1.5, - "learning_rate": 1.047602854534997e-06, - "loss": 0.6025, - "step": 58559 - }, - { - "epoch": 1.5, - "learning_rate": 1.0475752154317248e-06, - "loss": 0.5339, - "step": 58560 - }, - { - "epoch": 1.5, - "learning_rate": 1.0475475762920262e-06, - "loss": 0.6143, - "step": 58561 - }, - { - "epoch": 1.5, - "learning_rate": 1.047519937115923e-06, - "loss": 0.8467, - "step": 58562 - }, - { - "epoch": 1.5, - "learning_rate": 1.0474922979034356e-06, - "loss": 0.6562, - "step": 58563 - }, - { - "epoch": 1.5, - "learning_rate": 1.0474646586545858e-06, - "loss": 0.4539, - "step": 58564 - }, - { - "epoch": 1.5, - "learning_rate": 1.0474370193693947e-06, - "loss": 0.625, - "step": 58565 - }, - { - "epoch": 1.5, - "learning_rate": 1.0474093800478828e-06, - "loss": 0.4083, - "step": 58566 - }, - { - "epoch": 1.5, - "learning_rate": 1.0473817406900722e-06, - "loss": 0.6465, - "step": 58567 - }, - { - "epoch": 1.5, - "learning_rate": 1.0473541012959831e-06, - "loss": 0.6035, - "step": 58568 - }, - { - "epoch": 1.5, - "learning_rate": 1.0473264618656377e-06, - "loss": 0.8369, - "step": 58569 - }, - { - "epoch": 1.5, - "learning_rate": 1.0472988223990562e-06, - "loss": 0.7686, - "step": 58570 - }, - { - "epoch": 1.5, - "learning_rate": 1.0472711828962604e-06, - "loss": 0.7598, - "step": 58571 - }, - { - "epoch": 1.5, - "learning_rate": 1.0472435433572709e-06, - "loss": 0.7588, - "step": 58572 - }, - { - "epoch": 1.5, - "learning_rate": 1.0472159037821092e-06, - "loss": 0.5759, - "step": 58573 - }, - { - "epoch": 1.5, - "learning_rate": 1.0471882641707969e-06, - "loss": 0.5776, - "step": 58574 - }, - { - "epoch": 1.5, - "learning_rate": 1.0471606245233546e-06, - "loss": 0.5869, - "step": 58575 - }, - { - "epoch": 1.5, - "learning_rate": 1.0471329848398032e-06, - "loss": 0.5088, - "step": 58576 - }, - { - "epoch": 1.5, - "learning_rate": 1.0471053451201647e-06, - "loss": 0.6152, - "step": 58577 - }, - { - "epoch": 1.5, - "learning_rate": 1.0470777053644592e-06, - "loss": 0.7422, - "step": 58578 - }, - { - "epoch": 1.5, - "learning_rate": 1.0470500655727092e-06, - "loss": 0.6768, - "step": 58579 - }, - { - "epoch": 1.5, - "learning_rate": 1.0470224257449346e-06, - "loss": 0.6431, - "step": 58580 - }, - { - "epoch": 1.5, - "learning_rate": 1.0469947858811575e-06, - "loss": 0.4226, - "step": 58581 - }, - { - "epoch": 1.5, - "learning_rate": 1.046967145981398e-06, - "loss": 0.6553, - "step": 58582 - }, - { - "epoch": 1.5, - "learning_rate": 1.0469395060456784e-06, - "loss": 0.5879, - "step": 58583 - }, - { - "epoch": 1.5, - "learning_rate": 1.0469118660740194e-06, - "loss": 0.5923, - "step": 58584 - }, - { - "epoch": 1.5, - "learning_rate": 1.046884226066442e-06, - "loss": 0.6768, - "step": 58585 - }, - { - "epoch": 1.5, - "learning_rate": 1.0468565860229675e-06, - "loss": 0.6377, - "step": 58586 - }, - { - "epoch": 1.5, - "learning_rate": 1.046828945943617e-06, - "loss": 0.6074, - "step": 58587 - }, - { - "epoch": 1.5, - "learning_rate": 1.046801305828412e-06, - "loss": 0.5229, - "step": 58588 - }, - { - "epoch": 1.5, - "learning_rate": 1.046773665677373e-06, - "loss": 0.6621, - "step": 58589 - }, - { - "epoch": 1.5, - "learning_rate": 1.0467460254905221e-06, - "loss": 0.7012, - "step": 58590 - }, - { - "epoch": 1.5, - "learning_rate": 1.0467183852678794e-06, - "loss": 0.6479, - "step": 58591 - }, - { - "epoch": 1.5, - "learning_rate": 1.046690745009467e-06, - "loss": 0.7725, - "step": 58592 - }, - { - "epoch": 1.5, - "learning_rate": 1.0466631047153052e-06, - "loss": 0.4902, - "step": 58593 - }, - { - "epoch": 1.5, - "learning_rate": 1.046635464385416e-06, - "loss": 0.6245, - "step": 58594 - }, - { - "epoch": 1.5, - "learning_rate": 1.04660782401982e-06, - "loss": 0.6846, - "step": 58595 - }, - { - "epoch": 1.5, - "learning_rate": 1.0465801836185387e-06, - "loss": 0.7529, - "step": 58596 - }, - { - "epoch": 1.5, - "learning_rate": 1.0465525431815926e-06, - "loss": 0.6401, - "step": 58597 - }, - { - "epoch": 1.5, - "learning_rate": 1.0465249027090038e-06, - "loss": 0.5767, - "step": 58598 - }, - { - "epoch": 1.5, - "learning_rate": 1.046497262200793e-06, - "loss": 0.4673, - "step": 58599 - }, - { - "epoch": 1.5, - "learning_rate": 1.0464696216569813e-06, - "loss": 0.752, - "step": 58600 - }, - { - "epoch": 1.5, - "learning_rate": 1.0464419810775899e-06, - "loss": 0.6152, - "step": 58601 - }, - { - "epoch": 1.5, - "learning_rate": 1.04641434046264e-06, - "loss": 0.605, - "step": 58602 - }, - { - "epoch": 1.5, - "learning_rate": 1.0463866998121527e-06, - "loss": 0.5776, - "step": 58603 - }, - { - "epoch": 1.5, - "learning_rate": 1.0463590591261496e-06, - "loss": 0.5586, - "step": 58604 - }, - { - "epoch": 1.5, - "learning_rate": 1.0463314184046512e-06, - "loss": 0.4041, - "step": 58605 - }, - { - "epoch": 1.5, - "learning_rate": 1.0463037776476792e-06, - "loss": 0.7783, - "step": 58606 - }, - { - "epoch": 1.5, - "learning_rate": 1.0462761368552541e-06, - "loss": 0.6953, - "step": 58607 - }, - { - "epoch": 1.5, - "learning_rate": 1.046248496027398e-06, - "loss": 0.7861, - "step": 58608 - }, - { - "epoch": 1.5, - "learning_rate": 1.0462208551641313e-06, - "loss": 0.6387, - "step": 58609 - }, - { - "epoch": 1.5, - "learning_rate": 1.0461932142654751e-06, - "loss": 0.6382, - "step": 58610 - }, - { - "epoch": 1.5, - "learning_rate": 1.0461655733314514e-06, - "loss": 0.5511, - "step": 58611 - }, - { - "epoch": 1.5, - "learning_rate": 1.0461379323620805e-06, - "loss": 0.4585, - "step": 58612 - }, - { - "epoch": 1.5, - "learning_rate": 1.0461102913573841e-06, - "loss": 0.5942, - "step": 58613 - }, - { - "epoch": 1.5, - "learning_rate": 1.0460826503173832e-06, - "loss": 0.6455, - "step": 58614 - }, - { - "epoch": 1.5, - "learning_rate": 1.046055009242099e-06, - "loss": 0.4969, - "step": 58615 - }, - { - "epoch": 1.5, - "learning_rate": 1.046027368131552e-06, - "loss": 0.7148, - "step": 58616 - }, - { - "epoch": 1.5, - "learning_rate": 1.0459997269857645e-06, - "loss": 0.7793, - "step": 58617 - }, - { - "epoch": 1.5, - "learning_rate": 1.045972085804757e-06, - "loss": 0.7383, - "step": 58618 - }, - { - "epoch": 1.5, - "learning_rate": 1.0459444445885512e-06, - "loss": 0.8477, - "step": 58619 - }, - { - "epoch": 1.5, - "learning_rate": 1.0459168033371673e-06, - "loss": 0.6484, - "step": 58620 - }, - { - "epoch": 1.5, - "learning_rate": 1.0458891620506272e-06, - "loss": 0.542, - "step": 58621 - }, - { - "epoch": 1.5, - "learning_rate": 1.0458615207289519e-06, - "loss": 0.6753, - "step": 58622 - }, - { - "epoch": 1.5, - "learning_rate": 1.0458338793721623e-06, - "loss": 0.5867, - "step": 58623 - }, - { - "epoch": 1.5, - "learning_rate": 1.0458062379802802e-06, - "loss": 0.6304, - "step": 58624 - }, - { - "epoch": 1.5, - "learning_rate": 1.0457785965533263e-06, - "loss": 0.6479, - "step": 58625 - }, - { - "epoch": 1.5, - "learning_rate": 1.0457509550913215e-06, - "loss": 0.6113, - "step": 58626 - }, - { - "epoch": 1.5, - "learning_rate": 1.0457233135942876e-06, - "loss": 0.4907, - "step": 58627 - }, - { - "epoch": 1.5, - "learning_rate": 1.0456956720622452e-06, - "loss": 0.6377, - "step": 58628 - }, - { - "epoch": 1.5, - "learning_rate": 1.045668030495216e-06, - "loss": 0.644, - "step": 58629 - }, - { - "epoch": 1.5, - "learning_rate": 1.0456403888932208e-06, - "loss": 0.6152, - "step": 58630 - }, - { - "epoch": 1.5, - "learning_rate": 1.0456127472562808e-06, - "loss": 0.5205, - "step": 58631 - }, - { - "epoch": 1.5, - "learning_rate": 1.0455851055844174e-06, - "loss": 0.6992, - "step": 58632 - }, - { - "epoch": 1.5, - "learning_rate": 1.0455574638776514e-06, - "loss": 0.7256, - "step": 58633 - }, - { - "epoch": 1.5, - "learning_rate": 1.0455298221360042e-06, - "loss": 0.8281, - "step": 58634 - }, - { - "epoch": 1.5, - "learning_rate": 1.0455021803594967e-06, - "loss": 0.6875, - "step": 58635 - }, - { - "epoch": 1.5, - "learning_rate": 1.0454745385481508e-06, - "loss": 0.6885, - "step": 58636 - }, - { - "epoch": 1.5, - "learning_rate": 1.0454468967019864e-06, - "loss": 0.5, - "step": 58637 - }, - { - "epoch": 1.5, - "learning_rate": 1.0454192548210258e-06, - "loss": 0.6284, - "step": 58638 - }, - { - "epoch": 1.5, - "learning_rate": 1.04539161290529e-06, - "loss": 0.5679, - "step": 58639 - }, - { - "epoch": 1.5, - "learning_rate": 1.0453639709547996e-06, - "loss": 0.748, - "step": 58640 - }, - { - "epoch": 1.5, - "learning_rate": 1.0453363289695762e-06, - "loss": 0.6392, - "step": 58641 - }, - { - "epoch": 1.5, - "learning_rate": 1.0453086869496408e-06, - "loss": 0.6943, - "step": 58642 - }, - { - "epoch": 1.5, - "learning_rate": 1.0452810448950146e-06, - "loss": 0.5957, - "step": 58643 - }, - { - "epoch": 1.5, - "learning_rate": 1.0452534028057193e-06, - "loss": 0.7393, - "step": 58644 - }, - { - "epoch": 1.5, - "learning_rate": 1.045225760681775e-06, - "loss": 0.4663, - "step": 58645 - }, - { - "epoch": 1.5, - "learning_rate": 1.0451981185232035e-06, - "loss": 0.6797, - "step": 58646 - }, - { - "epoch": 1.5, - "learning_rate": 1.0451704763300256e-06, - "loss": 0.7051, - "step": 58647 - }, - { - "epoch": 1.5, - "learning_rate": 1.0451428341022633e-06, - "loss": 0.8662, - "step": 58648 - }, - { - "epoch": 1.5, - "learning_rate": 1.0451151918399368e-06, - "loss": 0.7617, - "step": 58649 - }, - { - "epoch": 1.5, - "learning_rate": 1.045087549543068e-06, - "loss": 0.6284, - "step": 58650 - }, - { - "epoch": 1.5, - "learning_rate": 1.0450599072116774e-06, - "loss": 0.8438, - "step": 58651 - }, - { - "epoch": 1.5, - "learning_rate": 1.0450322648457868e-06, - "loss": 0.4927, - "step": 58652 - }, - { - "epoch": 1.5, - "learning_rate": 1.0450046224454167e-06, - "loss": 0.7959, - "step": 58653 - }, - { - "epoch": 1.5, - "learning_rate": 1.044976980010589e-06, - "loss": 0.5374, - "step": 58654 - }, - { - "epoch": 1.5, - "learning_rate": 1.0449493375413242e-06, - "loss": 0.4966, - "step": 58655 - }, - { - "epoch": 1.5, - "learning_rate": 1.0449216950376438e-06, - "loss": 0.6406, - "step": 58656 - }, - { - "epoch": 1.5, - "learning_rate": 1.0448940524995692e-06, - "loss": 0.6553, - "step": 58657 - }, - { - "epoch": 1.5, - "learning_rate": 1.0448664099271211e-06, - "loss": 0.6963, - "step": 58658 - }, - { - "epoch": 1.5, - "learning_rate": 1.044838767320321e-06, - "loss": 0.7666, - "step": 58659 - }, - { - "epoch": 1.5, - "learning_rate": 1.0448111246791898e-06, - "loss": 0.7393, - "step": 58660 - }, - { - "epoch": 1.5, - "learning_rate": 1.0447834820037487e-06, - "loss": 0.7441, - "step": 58661 - }, - { - "epoch": 1.5, - "learning_rate": 1.044755839294019e-06, - "loss": 0.7148, - "step": 58662 - }, - { - "epoch": 1.5, - "learning_rate": 1.044728196550022e-06, - "loss": 0.5586, - "step": 58663 - }, - { - "epoch": 1.5, - "learning_rate": 1.0447005537717784e-06, - "loss": 0.8389, - "step": 58664 - }, - { - "epoch": 1.5, - "learning_rate": 1.0446729109593098e-06, - "loss": 0.6426, - "step": 58665 - }, - { - "epoch": 1.5, - "learning_rate": 1.044645268112637e-06, - "loss": 0.5996, - "step": 58666 - }, - { - "epoch": 1.5, - "learning_rate": 1.0446176252317815e-06, - "loss": 0.5227, - "step": 58667 - }, - { - "epoch": 1.5, - "learning_rate": 1.0445899823167645e-06, - "loss": 0.575, - "step": 58668 - }, - { - "epoch": 1.5, - "learning_rate": 1.044562339367607e-06, - "loss": 0.5474, - "step": 58669 - }, - { - "epoch": 1.5, - "learning_rate": 1.0445346963843297e-06, - "loss": 0.7422, - "step": 58670 - }, - { - "epoch": 1.5, - "learning_rate": 1.044507053366955e-06, - "loss": 0.6772, - "step": 58671 - }, - { - "epoch": 1.5, - "learning_rate": 1.0444794103155026e-06, - "loss": 0.5298, - "step": 58672 - }, - { - "epoch": 1.5, - "learning_rate": 1.0444517672299946e-06, - "loss": 0.625, - "step": 58673 - }, - { - "epoch": 1.5, - "learning_rate": 1.0444241241104522e-06, - "loss": 0.5879, - "step": 58674 - }, - { - "epoch": 1.5, - "learning_rate": 1.0443964809568957e-06, - "loss": 0.3336, - "step": 58675 - }, - { - "epoch": 1.5, - "learning_rate": 1.0443688377693472e-06, - "loss": 0.4768, - "step": 58676 - }, - { - "epoch": 1.5, - "learning_rate": 1.0443411945478273e-06, - "loss": 0.4497, - "step": 58677 - }, - { - "epoch": 1.5, - "learning_rate": 1.044313551292358e-06, - "loss": 0.6851, - "step": 58678 - }, - { - "epoch": 1.5, - "learning_rate": 1.0442859080029593e-06, - "loss": 0.5322, - "step": 58679 - }, - { - "epoch": 1.5, - "learning_rate": 1.0442582646796532e-06, - "loss": 0.6367, - "step": 58680 - }, - { - "epoch": 1.5, - "learning_rate": 1.0442306213224603e-06, - "loss": 0.7881, - "step": 58681 - }, - { - "epoch": 1.5, - "learning_rate": 1.044202977931402e-06, - "loss": 0.7305, - "step": 58682 - }, - { - "epoch": 1.5, - "learning_rate": 1.0441753345064999e-06, - "loss": 0.8281, - "step": 58683 - }, - { - "epoch": 1.5, - "learning_rate": 1.0441476910477748e-06, - "loss": 0.5469, - "step": 58684 - }, - { - "epoch": 1.5, - "learning_rate": 1.0441200475552473e-06, - "loss": 0.7891, - "step": 58685 - }, - { - "epoch": 1.5, - "learning_rate": 1.0440924040289396e-06, - "loss": 0.5791, - "step": 58686 - }, - { - "epoch": 1.5, - "learning_rate": 1.044064760468872e-06, - "loss": 0.6631, - "step": 58687 - }, - { - "epoch": 1.5, - "learning_rate": 1.0440371168750666e-06, - "loss": 0.6055, - "step": 58688 - }, - { - "epoch": 1.5, - "learning_rate": 1.0440094732475435e-06, - "loss": 0.5894, - "step": 58689 - }, - { - "epoch": 1.5, - "learning_rate": 1.0439818295863246e-06, - "loss": 0.7217, - "step": 58690 - }, - { - "epoch": 1.5, - "learning_rate": 1.0439541858914306e-06, - "loss": 0.5195, - "step": 58691 - }, - { - "epoch": 1.5, - "learning_rate": 1.0439265421628832e-06, - "loss": 0.582, - "step": 58692 - }, - { - "epoch": 1.5, - "learning_rate": 1.043898898400703e-06, - "loss": 0.6084, - "step": 58693 - }, - { - "epoch": 1.5, - "learning_rate": 1.0438712546049115e-06, - "loss": 0.5107, - "step": 58694 - }, - { - "epoch": 1.5, - "learning_rate": 1.04384361077553e-06, - "loss": 0.6006, - "step": 58695 - }, - { - "epoch": 1.5, - "learning_rate": 1.0438159669125795e-06, - "loss": 0.5933, - "step": 58696 - }, - { - "epoch": 1.5, - "learning_rate": 1.0437883230160807e-06, - "loss": 0.6284, - "step": 58697 - }, - { - "epoch": 1.5, - "learning_rate": 1.0437606790860554e-06, - "loss": 0.6001, - "step": 58698 - }, - { - "epoch": 1.5, - "learning_rate": 1.0437330351225247e-06, - "loss": 0.6201, - "step": 58699 - }, - { - "epoch": 1.5, - "learning_rate": 1.0437053911255093e-06, - "loss": 0.6279, - "step": 58700 - }, - { - "epoch": 1.5, - "learning_rate": 1.043677747095031e-06, - "loss": 0.6069, - "step": 58701 - }, - { - "epoch": 1.5, - "learning_rate": 1.0436501030311105e-06, - "loss": 0.6455, - "step": 58702 - }, - { - "epoch": 1.5, - "learning_rate": 1.0436224589337695e-06, - "loss": 0.5942, - "step": 58703 - }, - { - "epoch": 1.5, - "learning_rate": 1.0435948148030282e-06, - "loss": 0.6689, - "step": 58704 - }, - { - "epoch": 1.5, - "learning_rate": 1.0435671706389089e-06, - "loss": 0.5508, - "step": 58705 - }, - { - "epoch": 1.5, - "learning_rate": 1.0435395264414317e-06, - "loss": 0.6914, - "step": 58706 - }, - { - "epoch": 1.5, - "learning_rate": 1.0435118822106185e-06, - "loss": 0.7178, - "step": 58707 - }, - { - "epoch": 1.5, - "learning_rate": 1.0434842379464906e-06, - "loss": 0.5938, - "step": 58708 - }, - { - "epoch": 1.5, - "learning_rate": 1.0434565936490685e-06, - "loss": 0.6025, - "step": 58709 - }, - { - "epoch": 1.5, - "learning_rate": 1.0434289493183738e-06, - "loss": 0.7324, - "step": 58710 - }, - { - "epoch": 1.5, - "learning_rate": 1.0434013049544273e-06, - "loss": 0.5627, - "step": 58711 - }, - { - "epoch": 1.5, - "learning_rate": 1.0433736605572505e-06, - "loss": 0.7178, - "step": 58712 - }, - { - "epoch": 1.5, - "learning_rate": 1.0433460161268649e-06, - "loss": 0.6475, - "step": 58713 - }, - { - "epoch": 1.5, - "learning_rate": 1.0433183716632908e-06, - "loss": 0.6699, - "step": 58714 - }, - { - "epoch": 1.5, - "learning_rate": 1.04329072716655e-06, - "loss": 0.7461, - "step": 58715 - }, - { - "epoch": 1.5, - "learning_rate": 1.0432630826366632e-06, - "loss": 0.6836, - "step": 58716 - }, - { - "epoch": 1.5, - "learning_rate": 1.043235438073652e-06, - "loss": 0.7227, - "step": 58717 - }, - { - "epoch": 1.5, - "learning_rate": 1.0432077934775377e-06, - "loss": 0.6362, - "step": 58718 - }, - { - "epoch": 1.5, - "learning_rate": 1.0431801488483408e-06, - "loss": 0.689, - "step": 58719 - }, - { - "epoch": 1.51, - "learning_rate": 1.0431525041860829e-06, - "loss": 0.6157, - "step": 58720 - }, - { - "epoch": 1.51, - "learning_rate": 1.0431248594907852e-06, - "loss": 0.792, - "step": 58721 - }, - { - "epoch": 1.51, - "learning_rate": 1.0430972147624686e-06, - "loss": 0.6973, - "step": 58722 - }, - { - "epoch": 1.51, - "learning_rate": 1.0430695700011547e-06, - "loss": 0.6572, - "step": 58723 - }, - { - "epoch": 1.51, - "learning_rate": 1.0430419252068644e-06, - "loss": 0.7617, - "step": 58724 - }, - { - "epoch": 1.51, - "learning_rate": 1.0430142803796187e-06, - "loss": 0.5459, - "step": 58725 - }, - { - "epoch": 1.51, - "learning_rate": 1.0429866355194393e-06, - "loss": 0.7461, - "step": 58726 - }, - { - "epoch": 1.51, - "learning_rate": 1.0429589906263465e-06, - "loss": 0.6611, - "step": 58727 - }, - { - "epoch": 1.51, - "learning_rate": 1.0429313457003625e-06, - "loss": 0.6047, - "step": 58728 - }, - { - "epoch": 1.51, - "learning_rate": 1.0429037007415075e-06, - "loss": 0.4412, - "step": 58729 - }, - { - "epoch": 1.51, - "learning_rate": 1.0428760557498034e-06, - "loss": 0.6816, - "step": 58730 - }, - { - "epoch": 1.51, - "learning_rate": 1.042848410725271e-06, - "loss": 0.667, - "step": 58731 - }, - { - "epoch": 1.51, - "learning_rate": 1.0428207656679313e-06, - "loss": 0.7041, - "step": 58732 - }, - { - "epoch": 1.51, - "learning_rate": 1.042793120577806e-06, - "loss": 0.6924, - "step": 58733 - }, - { - "epoch": 1.51, - "learning_rate": 1.042765475454916e-06, - "loss": 0.8447, - "step": 58734 - }, - { - "epoch": 1.51, - "learning_rate": 1.0427378302992821e-06, - "loss": 0.6641, - "step": 58735 - }, - { - "epoch": 1.51, - "learning_rate": 1.0427101851109261e-06, - "loss": 0.6748, - "step": 58736 - }, - { - "epoch": 1.51, - "learning_rate": 1.0426825398898687e-06, - "loss": 0.5391, - "step": 58737 - }, - { - "epoch": 1.51, - "learning_rate": 1.0426548946361315e-06, - "loss": 0.5601, - "step": 58738 - }, - { - "epoch": 1.51, - "learning_rate": 1.0426272493497353e-06, - "loss": 0.5444, - "step": 58739 - }, - { - "epoch": 1.51, - "learning_rate": 1.0425996040307012e-06, - "loss": 0.5571, - "step": 58740 - }, - { - "epoch": 1.51, - "learning_rate": 1.0425719586790508e-06, - "loss": 0.623, - "step": 58741 - }, - { - "epoch": 1.51, - "learning_rate": 1.0425443132948048e-06, - "loss": 0.6758, - "step": 58742 - }, - { - "epoch": 1.51, - "learning_rate": 1.0425166678779848e-06, - "loss": 0.6143, - "step": 58743 - }, - { - "epoch": 1.51, - "learning_rate": 1.0424890224286115e-06, - "loss": 0.5557, - "step": 58744 - }, - { - "epoch": 1.51, - "learning_rate": 1.0424613769467065e-06, - "loss": 0.6963, - "step": 58745 - }, - { - "epoch": 1.51, - "learning_rate": 1.0424337314322907e-06, - "loss": 0.6445, - "step": 58746 - }, - { - "epoch": 1.51, - "learning_rate": 1.0424060858853852e-06, - "loss": 0.7212, - "step": 58747 - }, - { - "epoch": 1.51, - "learning_rate": 1.0423784403060117e-06, - "loss": 0.6001, - "step": 58748 - }, - { - "epoch": 1.51, - "learning_rate": 1.0423507946941907e-06, - "loss": 0.4915, - "step": 58749 - }, - { - "epoch": 1.51, - "learning_rate": 1.0423231490499436e-06, - "loss": 0.6125, - "step": 58750 - }, - { - "epoch": 1.51, - "learning_rate": 1.0422955033732917e-06, - "loss": 0.6719, - "step": 58751 - }, - { - "epoch": 1.51, - "learning_rate": 1.0422678576642559e-06, - "loss": 0.5439, - "step": 58752 - }, - { - "epoch": 1.51, - "learning_rate": 1.0422402119228579e-06, - "loss": 0.8643, - "step": 58753 - }, - { - "epoch": 1.51, - "learning_rate": 1.042212566149118e-06, - "loss": 0.5845, - "step": 58754 - }, - { - "epoch": 1.51, - "learning_rate": 1.0421849203430584e-06, - "loss": 0.4346, - "step": 58755 - }, - { - "epoch": 1.51, - "learning_rate": 1.0421572745046995e-06, - "loss": 0.8096, - "step": 58756 - }, - { - "epoch": 1.51, - "learning_rate": 1.0421296286340629e-06, - "loss": 0.7412, - "step": 58757 - }, - { - "epoch": 1.51, - "learning_rate": 1.0421019827311694e-06, - "loss": 0.6187, - "step": 58758 - }, - { - "epoch": 1.51, - "learning_rate": 1.0420743367960403e-06, - "loss": 0.5757, - "step": 58759 - }, - { - "epoch": 1.51, - "learning_rate": 1.042046690828697e-06, - "loss": 0.6357, - "step": 58760 - }, - { - "epoch": 1.51, - "learning_rate": 1.0420190448291603e-06, - "loss": 0.7432, - "step": 58761 - }, - { - "epoch": 1.51, - "learning_rate": 1.0419913987974515e-06, - "loss": 0.5493, - "step": 58762 - }, - { - "epoch": 1.51, - "learning_rate": 1.041963752733592e-06, - "loss": 0.6699, - "step": 58763 - }, - { - "epoch": 1.51, - "learning_rate": 1.0419361066376026e-06, - "loss": 0.6797, - "step": 58764 - }, - { - "epoch": 1.51, - "learning_rate": 1.0419084605095048e-06, - "loss": 0.7002, - "step": 58765 - }, - { - "epoch": 1.51, - "learning_rate": 1.0418808143493196e-06, - "loss": 0.6548, - "step": 58766 - }, - { - "epoch": 1.51, - "learning_rate": 1.0418531681570682e-06, - "loss": 0.5938, - "step": 58767 - }, - { - "epoch": 1.51, - "learning_rate": 1.0418255219327718e-06, - "loss": 0.5659, - "step": 58768 - }, - { - "epoch": 1.51, - "learning_rate": 1.0417978756764515e-06, - "loss": 0.6006, - "step": 58769 - }, - { - "epoch": 1.51, - "learning_rate": 1.0417702293881285e-06, - "loss": 0.5493, - "step": 58770 - }, - { - "epoch": 1.51, - "learning_rate": 1.0417425830678237e-06, - "loss": 0.7393, - "step": 58771 - }, - { - "epoch": 1.51, - "learning_rate": 1.041714936715559e-06, - "loss": 0.4741, - "step": 58772 - }, - { - "epoch": 1.51, - "learning_rate": 1.0416872903313548e-06, - "loss": 0.5869, - "step": 58773 - }, - { - "epoch": 1.51, - "learning_rate": 1.0416596439152326e-06, - "loss": 0.7373, - "step": 58774 - }, - { - "epoch": 1.51, - "learning_rate": 1.0416319974672132e-06, - "loss": 0.6943, - "step": 58775 - }, - { - "epoch": 1.51, - "learning_rate": 1.0416043509873186e-06, - "loss": 0.6816, - "step": 58776 - }, - { - "epoch": 1.51, - "learning_rate": 1.041576704475569e-06, - "loss": 0.7051, - "step": 58777 - }, - { - "epoch": 1.51, - "learning_rate": 1.0415490579319866e-06, - "loss": 0.5557, - "step": 58778 - }, - { - "epoch": 1.51, - "learning_rate": 1.0415214113565915e-06, - "loss": 0.447, - "step": 58779 - }, - { - "epoch": 1.51, - "learning_rate": 1.0414937647494058e-06, - "loss": 0.4597, - "step": 58780 - }, - { - "epoch": 1.51, - "learning_rate": 1.0414661181104497e-06, - "loss": 0.6978, - "step": 58781 - }, - { - "epoch": 1.51, - "learning_rate": 1.0414384714397452e-06, - "loss": 0.7979, - "step": 58782 - }, - { - "epoch": 1.51, - "learning_rate": 1.0414108247373131e-06, - "loss": 0.7686, - "step": 58783 - }, - { - "epoch": 1.51, - "learning_rate": 1.0413831780031747e-06, - "loss": 0.6675, - "step": 58784 - }, - { - "epoch": 1.51, - "learning_rate": 1.0413555312373512e-06, - "loss": 0.4761, - "step": 58785 - }, - { - "epoch": 1.51, - "learning_rate": 1.0413278844398636e-06, - "loss": 0.6924, - "step": 58786 - }, - { - "epoch": 1.51, - "learning_rate": 1.041300237610733e-06, - "loss": 0.5234, - "step": 58787 - }, - { - "epoch": 1.51, - "learning_rate": 1.041272590749981e-06, - "loss": 0.7031, - "step": 58788 - }, - { - "epoch": 1.51, - "learning_rate": 1.0412449438576282e-06, - "loss": 0.6709, - "step": 58789 - }, - { - "epoch": 1.51, - "learning_rate": 1.0412172969336958e-06, - "loss": 0.6411, - "step": 58790 - }, - { - "epoch": 1.51, - "learning_rate": 1.0411896499782059e-06, - "loss": 0.7988, - "step": 58791 - }, - { - "epoch": 1.51, - "learning_rate": 1.0411620029911784e-06, - "loss": 0.6035, - "step": 58792 - }, - { - "epoch": 1.51, - "learning_rate": 1.0411343559726355e-06, - "loss": 0.5701, - "step": 58793 - }, - { - "epoch": 1.51, - "learning_rate": 1.0411067089225975e-06, - "loss": 0.4143, - "step": 58794 - }, - { - "epoch": 1.51, - "learning_rate": 1.0410790618410864e-06, - "loss": 0.4883, - "step": 58795 - }, - { - "epoch": 1.51, - "learning_rate": 1.0410514147281225e-06, - "loss": 0.5679, - "step": 58796 - }, - { - "epoch": 1.51, - "learning_rate": 1.0410237675837277e-06, - "loss": 0.625, - "step": 58797 - }, - { - "epoch": 1.51, - "learning_rate": 1.0409961204079228e-06, - "loss": 0.5234, - "step": 58798 - }, - { - "epoch": 1.51, - "learning_rate": 1.0409684732007292e-06, - "loss": 0.5459, - "step": 58799 - }, - { - "epoch": 1.51, - "learning_rate": 1.0409408259621674e-06, - "loss": 0.8066, - "step": 58800 - }, - { - "epoch": 1.51, - "learning_rate": 1.0409131786922597e-06, - "loss": 0.7163, - "step": 58801 - }, - { - "epoch": 1.51, - "learning_rate": 1.0408855313910264e-06, - "loss": 0.6812, - "step": 58802 - }, - { - "epoch": 1.51, - "learning_rate": 1.040857884058489e-06, - "loss": 0.7236, - "step": 58803 - }, - { - "epoch": 1.51, - "learning_rate": 1.0408302366946687e-06, - "loss": 0.5183, - "step": 58804 - }, - { - "epoch": 1.51, - "learning_rate": 1.0408025892995865e-06, - "loss": 0.7773, - "step": 58805 - }, - { - "epoch": 1.51, - "learning_rate": 1.0407749418732633e-06, - "loss": 0.6299, - "step": 58806 - }, - { - "epoch": 1.51, - "learning_rate": 1.0407472944157209e-06, - "loss": 0.6924, - "step": 58807 - }, - { - "epoch": 1.51, - "learning_rate": 1.0407196469269803e-06, - "loss": 0.3357, - "step": 58808 - }, - { - "epoch": 1.51, - "learning_rate": 1.0406919994070622e-06, - "loss": 0.6499, - "step": 58809 - }, - { - "epoch": 1.51, - "learning_rate": 1.0406643518559884e-06, - "loss": 0.647, - "step": 58810 - }, - { - "epoch": 1.51, - "learning_rate": 1.0406367042737797e-06, - "loss": 0.5857, - "step": 58811 - }, - { - "epoch": 1.51, - "learning_rate": 1.040609056660457e-06, - "loss": 0.6133, - "step": 58812 - }, - { - "epoch": 1.51, - "learning_rate": 1.0405814090160422e-06, - "loss": 0.502, - "step": 58813 - }, - { - "epoch": 1.51, - "learning_rate": 1.040553761340556e-06, - "loss": 0.6597, - "step": 58814 - }, - { - "epoch": 1.51, - "learning_rate": 1.0405261136340198e-06, - "loss": 0.8496, - "step": 58815 - }, - { - "epoch": 1.51, - "learning_rate": 1.0404984658964544e-06, - "loss": 0.7432, - "step": 58816 - }, - { - "epoch": 1.51, - "learning_rate": 1.0404708181278813e-06, - "loss": 0.4575, - "step": 58817 - }, - { - "epoch": 1.51, - "learning_rate": 1.0404431703283215e-06, - "loss": 0.8276, - "step": 58818 - }, - { - "epoch": 1.51, - "learning_rate": 1.0404155224977962e-06, - "loss": 0.6177, - "step": 58819 - }, - { - "epoch": 1.51, - "learning_rate": 1.0403878746363268e-06, - "loss": 0.5623, - "step": 58820 - }, - { - "epoch": 1.51, - "learning_rate": 1.040360226743934e-06, - "loss": 0.709, - "step": 58821 - }, - { - "epoch": 1.51, - "learning_rate": 1.0403325788206394e-06, - "loss": 0.7061, - "step": 58822 - }, - { - "epoch": 1.51, - "learning_rate": 1.040304930866464e-06, - "loss": 0.792, - "step": 58823 - }, - { - "epoch": 1.51, - "learning_rate": 1.0402772828814288e-06, - "loss": 0.5425, - "step": 58824 - }, - { - "epoch": 1.51, - "learning_rate": 1.040249634865555e-06, - "loss": 0.395, - "step": 58825 - }, - { - "epoch": 1.51, - "learning_rate": 1.0402219868188644e-06, - "loss": 0.6372, - "step": 58826 - }, - { - "epoch": 1.51, - "learning_rate": 1.0401943387413772e-06, - "loss": 0.6089, - "step": 58827 - }, - { - "epoch": 1.51, - "learning_rate": 1.0401666906331153e-06, - "loss": 0.6021, - "step": 58828 - }, - { - "epoch": 1.51, - "learning_rate": 1.0401390424940997e-06, - "loss": 0.6641, - "step": 58829 - }, - { - "epoch": 1.51, - "learning_rate": 1.0401113943243512e-06, - "loss": 0.7764, - "step": 58830 - }, - { - "epoch": 1.51, - "learning_rate": 1.0400837461238914e-06, - "loss": 0.6777, - "step": 58831 - }, - { - "epoch": 1.51, - "learning_rate": 1.0400560978927413e-06, - "loss": 0.7568, - "step": 58832 - }, - { - "epoch": 1.51, - "learning_rate": 1.0400284496309222e-06, - "loss": 0.6602, - "step": 58833 - }, - { - "epoch": 1.51, - "learning_rate": 1.040000801338455e-06, - "loss": 0.5764, - "step": 58834 - }, - { - "epoch": 1.51, - "learning_rate": 1.039973153015361e-06, - "loss": 0.5654, - "step": 58835 - }, - { - "epoch": 1.51, - "learning_rate": 1.0399455046616614e-06, - "loss": 0.7085, - "step": 58836 - }, - { - "epoch": 1.51, - "learning_rate": 1.0399178562773776e-06, - "loss": 0.6724, - "step": 58837 - }, - { - "epoch": 1.51, - "learning_rate": 1.0398902078625304e-06, - "loss": 0.6396, - "step": 58838 - }, - { - "epoch": 1.51, - "learning_rate": 1.039862559417141e-06, - "loss": 0.6582, - "step": 58839 - }, - { - "epoch": 1.51, - "learning_rate": 1.0398349109412308e-06, - "loss": 0.5049, - "step": 58840 - }, - { - "epoch": 1.51, - "learning_rate": 1.0398072624348206e-06, - "loss": 0.6309, - "step": 58841 - }, - { - "epoch": 1.51, - "learning_rate": 1.039779613897932e-06, - "loss": 0.5654, - "step": 58842 - }, - { - "epoch": 1.51, - "learning_rate": 1.0397519653305863e-06, - "loss": 0.7061, - "step": 58843 - }, - { - "epoch": 1.51, - "learning_rate": 1.0397243167328039e-06, - "loss": 0.6509, - "step": 58844 - }, - { - "epoch": 1.51, - "learning_rate": 1.0396966681046064e-06, - "loss": 0.5732, - "step": 58845 - }, - { - "epoch": 1.51, - "learning_rate": 1.039669019446015e-06, - "loss": 0.7031, - "step": 58846 - }, - { - "epoch": 1.51, - "learning_rate": 1.039641370757051e-06, - "loss": 0.6846, - "step": 58847 - }, - { - "epoch": 1.51, - "learning_rate": 1.0396137220377357e-06, - "loss": 0.7227, - "step": 58848 - }, - { - "epoch": 1.51, - "learning_rate": 1.0395860732880896e-06, - "loss": 0.5596, - "step": 58849 - }, - { - "epoch": 1.51, - "learning_rate": 1.0395584245081344e-06, - "loss": 0.6084, - "step": 58850 - }, - { - "epoch": 1.51, - "learning_rate": 1.039530775697891e-06, - "loss": 0.6816, - "step": 58851 - }, - { - "epoch": 1.51, - "learning_rate": 1.0395031268573808e-06, - "loss": 0.7471, - "step": 58852 - }, - { - "epoch": 1.51, - "learning_rate": 1.0394754779866249e-06, - "loss": 0.7725, - "step": 58853 - }, - { - "epoch": 1.51, - "learning_rate": 1.0394478290856445e-06, - "loss": 0.7041, - "step": 58854 - }, - { - "epoch": 1.51, - "learning_rate": 1.0394201801544604e-06, - "loss": 0.6309, - "step": 58855 - }, - { - "epoch": 1.51, - "learning_rate": 1.0393925311930944e-06, - "loss": 0.6042, - "step": 58856 - }, - { - "epoch": 1.51, - "learning_rate": 1.039364882201567e-06, - "loss": 0.6333, - "step": 58857 - }, - { - "epoch": 1.51, - "learning_rate": 1.0393372331799005e-06, - "loss": 0.5581, - "step": 58858 - }, - { - "epoch": 1.51, - "learning_rate": 1.0393095841281146e-06, - "loss": 0.6211, - "step": 58859 - }, - { - "epoch": 1.51, - "learning_rate": 1.0392819350462312e-06, - "loss": 0.7061, - "step": 58860 - }, - { - "epoch": 1.51, - "learning_rate": 1.0392542859342714e-06, - "loss": 0.6533, - "step": 58861 - }, - { - "epoch": 1.51, - "learning_rate": 1.0392266367922566e-06, - "loss": 0.7119, - "step": 58862 - }, - { - "epoch": 1.51, - "learning_rate": 1.0391989876202079e-06, - "loss": 0.4331, - "step": 58863 - }, - { - "epoch": 1.51, - "learning_rate": 1.0391713384181462e-06, - "loss": 0.7754, - "step": 58864 - }, - { - "epoch": 1.51, - "learning_rate": 1.0391436891860926e-06, - "loss": 0.543, - "step": 58865 - }, - { - "epoch": 1.51, - "learning_rate": 1.0391160399240689e-06, - "loss": 0.6025, - "step": 58866 - }, - { - "epoch": 1.51, - "learning_rate": 1.0390883906320953e-06, - "loss": 0.5815, - "step": 58867 - }, - { - "epoch": 1.51, - "learning_rate": 1.0390607413101942e-06, - "loss": 0.8203, - "step": 58868 - }, - { - "epoch": 1.51, - "learning_rate": 1.0390330919583854e-06, - "loss": 0.7666, - "step": 58869 - }, - { - "epoch": 1.51, - "learning_rate": 1.0390054425766911e-06, - "loss": 0.4297, - "step": 58870 - }, - { - "epoch": 1.51, - "learning_rate": 1.038977793165132e-06, - "loss": 0.4929, - "step": 58871 - }, - { - "epoch": 1.51, - "learning_rate": 1.0389501437237295e-06, - "loss": 0.7275, - "step": 58872 - }, - { - "epoch": 1.51, - "learning_rate": 1.0389224942525047e-06, - "loss": 0.4639, - "step": 58873 - }, - { - "epoch": 1.51, - "learning_rate": 1.0388948447514786e-06, - "loss": 0.7549, - "step": 58874 - }, - { - "epoch": 1.51, - "learning_rate": 1.0388671952206724e-06, - "loss": 0.6816, - "step": 58875 - }, - { - "epoch": 1.51, - "learning_rate": 1.0388395456601077e-06, - "loss": 0.522, - "step": 58876 - }, - { - "epoch": 1.51, - "learning_rate": 1.0388118960698051e-06, - "loss": 0.5254, - "step": 58877 - }, - { - "epoch": 1.51, - "learning_rate": 1.0387842464497863e-06, - "loss": 0.8662, - "step": 58878 - }, - { - "epoch": 1.51, - "learning_rate": 1.038756596800072e-06, - "loss": 0.6333, - "step": 58879 - }, - { - "epoch": 1.51, - "learning_rate": 1.0387289471206835e-06, - "loss": 0.6631, - "step": 58880 - }, - { - "epoch": 1.51, - "learning_rate": 1.038701297411642e-06, - "loss": 0.5488, - "step": 58881 - }, - { - "epoch": 1.51, - "learning_rate": 1.0386736476729686e-06, - "loss": 0.8271, - "step": 58882 - }, - { - "epoch": 1.51, - "learning_rate": 1.0386459979046852e-06, - "loss": 0.6689, - "step": 58883 - }, - { - "epoch": 1.51, - "learning_rate": 1.0386183481068117e-06, - "loss": 0.5718, - "step": 58884 - }, - { - "epoch": 1.51, - "learning_rate": 1.03859069827937e-06, - "loss": 0.5977, - "step": 58885 - }, - { - "epoch": 1.51, - "learning_rate": 1.0385630484223811e-06, - "loss": 0.7012, - "step": 58886 - }, - { - "epoch": 1.51, - "learning_rate": 1.0385353985358665e-06, - "loss": 0.7812, - "step": 58887 - }, - { - "epoch": 1.51, - "learning_rate": 1.0385077486198473e-06, - "loss": 0.6055, - "step": 58888 - }, - { - "epoch": 1.51, - "learning_rate": 1.038480098674344e-06, - "loss": 0.4277, - "step": 58889 - }, - { - "epoch": 1.51, - "learning_rate": 1.0384524486993783e-06, - "loss": 0.6099, - "step": 58890 - }, - { - "epoch": 1.51, - "learning_rate": 1.0384247986949717e-06, - "loss": 0.6855, - "step": 58891 - }, - { - "epoch": 1.51, - "learning_rate": 1.0383971486611447e-06, - "loss": 0.6582, - "step": 58892 - }, - { - "epoch": 1.51, - "learning_rate": 1.0383694985979193e-06, - "loss": 0.5459, - "step": 58893 - }, - { - "epoch": 1.51, - "learning_rate": 1.0383418485053156e-06, - "loss": 0.8086, - "step": 58894 - }, - { - "epoch": 1.51, - "learning_rate": 1.0383141983833552e-06, - "loss": 0.7764, - "step": 58895 - }, - { - "epoch": 1.51, - "learning_rate": 1.0382865482320595e-06, - "loss": 0.6494, - "step": 58896 - }, - { - "epoch": 1.51, - "learning_rate": 1.0382588980514497e-06, - "loss": 0.6357, - "step": 58897 - }, - { - "epoch": 1.51, - "learning_rate": 1.038231247841547e-06, - "loss": 0.8164, - "step": 58898 - }, - { - "epoch": 1.51, - "learning_rate": 1.038203597602372e-06, - "loss": 0.5947, - "step": 58899 - }, - { - "epoch": 1.51, - "learning_rate": 1.0381759473339465e-06, - "loss": 0.5845, - "step": 58900 - }, - { - "epoch": 1.51, - "learning_rate": 1.0381482970362912e-06, - "loss": 0.7598, - "step": 58901 - }, - { - "epoch": 1.51, - "learning_rate": 1.0381206467094276e-06, - "loss": 0.5449, - "step": 58902 - }, - { - "epoch": 1.51, - "learning_rate": 1.038092996353377e-06, - "loss": 0.583, - "step": 58903 - }, - { - "epoch": 1.51, - "learning_rate": 1.0380653459681602e-06, - "loss": 0.6172, - "step": 58904 - }, - { - "epoch": 1.51, - "learning_rate": 1.0380376955537983e-06, - "loss": 0.5488, - "step": 58905 - }, - { - "epoch": 1.51, - "learning_rate": 1.0380100451103129e-06, - "loss": 0.7598, - "step": 58906 - }, - { - "epoch": 1.51, - "learning_rate": 1.037982394637725e-06, - "loss": 0.6421, - "step": 58907 - }, - { - "epoch": 1.51, - "learning_rate": 1.037954744136056e-06, - "loss": 0.623, - "step": 58908 - }, - { - "epoch": 1.51, - "learning_rate": 1.0379270936053261e-06, - "loss": 0.6562, - "step": 58909 - }, - { - "epoch": 1.51, - "learning_rate": 1.0378994430455577e-06, - "loss": 0.7339, - "step": 58910 - }, - { - "epoch": 1.51, - "learning_rate": 1.037871792456771e-06, - "loss": 0.6367, - "step": 58911 - }, - { - "epoch": 1.51, - "learning_rate": 1.0378441418389878e-06, - "loss": 0.4038, - "step": 58912 - }, - { - "epoch": 1.51, - "learning_rate": 1.0378164911922293e-06, - "loss": 0.7139, - "step": 58913 - }, - { - "epoch": 1.51, - "learning_rate": 1.0377888405165165e-06, - "loss": 0.6494, - "step": 58914 - }, - { - "epoch": 1.51, - "learning_rate": 1.03776118981187e-06, - "loss": 0.7012, - "step": 58915 - }, - { - "epoch": 1.51, - "learning_rate": 1.037733539078312e-06, - "loss": 0.5566, - "step": 58916 - }, - { - "epoch": 1.51, - "learning_rate": 1.0377058883158628e-06, - "loss": 0.7109, - "step": 58917 - }, - { - "epoch": 1.51, - "learning_rate": 1.0376782375245444e-06, - "loss": 0.6665, - "step": 58918 - }, - { - "epoch": 1.51, - "learning_rate": 1.0376505867043773e-06, - "loss": 0.5713, - "step": 58919 - }, - { - "epoch": 1.51, - "learning_rate": 1.0376229358553825e-06, - "loss": 0.6099, - "step": 58920 - }, - { - "epoch": 1.51, - "learning_rate": 1.037595284977582e-06, - "loss": 0.626, - "step": 58921 - }, - { - "epoch": 1.51, - "learning_rate": 1.0375676340709963e-06, - "loss": 0.748, - "step": 58922 - }, - { - "epoch": 1.51, - "learning_rate": 1.0375399831356471e-06, - "loss": 0.5571, - "step": 58923 - }, - { - "epoch": 1.51, - "learning_rate": 1.0375123321715547e-06, - "loss": 0.3448, - "step": 58924 - }, - { - "epoch": 1.51, - "learning_rate": 1.0374846811787411e-06, - "loss": 0.6455, - "step": 58925 - }, - { - "epoch": 1.51, - "learning_rate": 1.037457030157227e-06, - "loss": 0.6484, - "step": 58926 - }, - { - "epoch": 1.51, - "learning_rate": 1.0374293791070342e-06, - "loss": 0.4635, - "step": 58927 - }, - { - "epoch": 1.51, - "learning_rate": 1.0374017280281835e-06, - "loss": 0.4885, - "step": 58928 - }, - { - "epoch": 1.51, - "learning_rate": 1.0373740769206958e-06, - "loss": 0.6797, - "step": 58929 - }, - { - "epoch": 1.51, - "learning_rate": 1.0373464257845926e-06, - "loss": 0.7393, - "step": 58930 - }, - { - "epoch": 1.51, - "learning_rate": 1.0373187746198948e-06, - "loss": 0.5806, - "step": 58931 - }, - { - "epoch": 1.51, - "learning_rate": 1.0372911234266235e-06, - "loss": 0.5996, - "step": 58932 - }, - { - "epoch": 1.51, - "learning_rate": 1.0372634722048008e-06, - "loss": 0.6694, - "step": 58933 - }, - { - "epoch": 1.51, - "learning_rate": 1.0372358209544466e-06, - "loss": 0.593, - "step": 58934 - }, - { - "epoch": 1.51, - "learning_rate": 1.0372081696755828e-06, - "loss": 0.8135, - "step": 58935 - }, - { - "epoch": 1.51, - "learning_rate": 1.0371805183682303e-06, - "loss": 0.5583, - "step": 58936 - }, - { - "epoch": 1.51, - "learning_rate": 1.0371528670324105e-06, - "loss": 0.4648, - "step": 58937 - }, - { - "epoch": 1.51, - "learning_rate": 1.0371252156681445e-06, - "loss": 0.7119, - "step": 58938 - }, - { - "epoch": 1.51, - "learning_rate": 1.0370975642754535e-06, - "loss": 0.625, - "step": 58939 - }, - { - "epoch": 1.51, - "learning_rate": 1.0370699128543582e-06, - "loss": 0.6592, - "step": 58940 - }, - { - "epoch": 1.51, - "learning_rate": 1.0370422614048806e-06, - "loss": 0.7065, - "step": 58941 - }, - { - "epoch": 1.51, - "learning_rate": 1.037014609927041e-06, - "loss": 0.791, - "step": 58942 - }, - { - "epoch": 1.51, - "learning_rate": 1.0369869584208616e-06, - "loss": 0.7324, - "step": 58943 - }, - { - "epoch": 1.51, - "learning_rate": 1.0369593068863628e-06, - "loss": 0.6138, - "step": 58944 - }, - { - "epoch": 1.51, - "learning_rate": 1.0369316553235657e-06, - "loss": 0.6787, - "step": 58945 - }, - { - "epoch": 1.51, - "learning_rate": 1.0369040037324918e-06, - "loss": 0.7256, - "step": 58946 - }, - { - "epoch": 1.51, - "learning_rate": 1.0368763521131623e-06, - "loss": 0.6348, - "step": 58947 - }, - { - "epoch": 1.51, - "learning_rate": 1.0368487004655984e-06, - "loss": 0.5908, - "step": 58948 - }, - { - "epoch": 1.51, - "learning_rate": 1.0368210487898208e-06, - "loss": 0.5139, - "step": 58949 - }, - { - "epoch": 1.51, - "learning_rate": 1.0367933970858513e-06, - "loss": 0.8223, - "step": 58950 - }, - { - "epoch": 1.51, - "learning_rate": 1.0367657453537107e-06, - "loss": 0.749, - "step": 58951 - }, - { - "epoch": 1.51, - "learning_rate": 1.0367380935934205e-06, - "loss": 0.5327, - "step": 58952 - }, - { - "epoch": 1.51, - "learning_rate": 1.0367104418050013e-06, - "loss": 0.7568, - "step": 58953 - }, - { - "epoch": 1.51, - "learning_rate": 1.0366827899884746e-06, - "loss": 0.7197, - "step": 58954 - }, - { - "epoch": 1.51, - "learning_rate": 1.0366551381438618e-06, - "loss": 0.6611, - "step": 58955 - }, - { - "epoch": 1.51, - "learning_rate": 1.0366274862711837e-06, - "loss": 0.5527, - "step": 58956 - }, - { - "epoch": 1.51, - "learning_rate": 1.0365998343704617e-06, - "loss": 0.6875, - "step": 58957 - }, - { - "epoch": 1.51, - "learning_rate": 1.036572182441717e-06, - "loss": 0.5715, - "step": 58958 - }, - { - "epoch": 1.51, - "learning_rate": 1.0365445304849703e-06, - "loss": 0.8408, - "step": 58959 - }, - { - "epoch": 1.51, - "learning_rate": 1.0365168785002432e-06, - "loss": 0.7324, - "step": 58960 - }, - { - "epoch": 1.51, - "learning_rate": 1.0364892264875569e-06, - "loss": 0.7148, - "step": 58961 - }, - { - "epoch": 1.51, - "learning_rate": 1.0364615744469326e-06, - "loss": 0.4624, - "step": 58962 - }, - { - "epoch": 1.51, - "learning_rate": 1.0364339223783914e-06, - "loss": 0.5288, - "step": 58963 - }, - { - "epoch": 1.51, - "learning_rate": 1.036406270281954e-06, - "loss": 0.7148, - "step": 58964 - }, - { - "epoch": 1.51, - "learning_rate": 1.0363786181576424e-06, - "loss": 0.6592, - "step": 58965 - }, - { - "epoch": 1.51, - "learning_rate": 1.0363509660054773e-06, - "loss": 0.4767, - "step": 58966 - }, - { - "epoch": 1.51, - "learning_rate": 1.0363233138254799e-06, - "loss": 0.48, - "step": 58967 - }, - { - "epoch": 1.51, - "learning_rate": 1.0362956616176712e-06, - "loss": 0.6265, - "step": 58968 - }, - { - "epoch": 1.51, - "learning_rate": 1.0362680093820729e-06, - "loss": 0.6831, - "step": 58969 - }, - { - "epoch": 1.51, - "learning_rate": 1.0362403571187054e-06, - "loss": 0.4761, - "step": 58970 - }, - { - "epoch": 1.51, - "learning_rate": 1.0362127048275908e-06, - "loss": 0.5173, - "step": 58971 - }, - { - "epoch": 1.51, - "learning_rate": 1.0361850525087497e-06, - "loss": 0.6069, - "step": 58972 - }, - { - "epoch": 1.51, - "learning_rate": 1.0361574001622034e-06, - "loss": 0.6763, - "step": 58973 - }, - { - "epoch": 1.51, - "learning_rate": 1.0361297477879727e-06, - "loss": 0.6943, - "step": 58974 - }, - { - "epoch": 1.51, - "learning_rate": 1.0361020953860795e-06, - "loss": 0.6704, - "step": 58975 - }, - { - "epoch": 1.51, - "learning_rate": 1.0360744429565443e-06, - "loss": 0.7205, - "step": 58976 - }, - { - "epoch": 1.51, - "learning_rate": 1.036046790499389e-06, - "loss": 0.553, - "step": 58977 - }, - { - "epoch": 1.51, - "learning_rate": 1.0360191380146338e-06, - "loss": 0.5498, - "step": 58978 - }, - { - "epoch": 1.51, - "learning_rate": 1.0359914855023007e-06, - "loss": 0.667, - "step": 58979 - }, - { - "epoch": 1.51, - "learning_rate": 1.0359638329624103e-06, - "loss": 0.6484, - "step": 58980 - }, - { - "epoch": 1.51, - "learning_rate": 1.0359361803949844e-06, - "loss": 0.7568, - "step": 58981 - }, - { - "epoch": 1.51, - "learning_rate": 1.0359085278000436e-06, - "loss": 0.6709, - "step": 58982 - }, - { - "epoch": 1.51, - "learning_rate": 1.0358808751776096e-06, - "loss": 0.5903, - "step": 58983 - }, - { - "epoch": 1.51, - "learning_rate": 1.0358532225277028e-06, - "loss": 0.6172, - "step": 58984 - }, - { - "epoch": 1.51, - "learning_rate": 1.0358255698503453e-06, - "loss": 0.6982, - "step": 58985 - }, - { - "epoch": 1.51, - "learning_rate": 1.0357979171455574e-06, - "loss": 0.7168, - "step": 58986 - }, - { - "epoch": 1.51, - "learning_rate": 1.0357702644133608e-06, - "loss": 0.4629, - "step": 58987 - }, - { - "epoch": 1.51, - "learning_rate": 1.0357426116537766e-06, - "loss": 0.6826, - "step": 58988 - }, - { - "epoch": 1.51, - "learning_rate": 1.035714958866826e-06, - "loss": 0.9453, - "step": 58989 - }, - { - "epoch": 1.51, - "learning_rate": 1.03568730605253e-06, - "loss": 0.5552, - "step": 58990 - }, - { - "epoch": 1.51, - "learning_rate": 1.0356596532109099e-06, - "loss": 0.6846, - "step": 58991 - }, - { - "epoch": 1.51, - "learning_rate": 1.035632000341987e-06, - "loss": 0.6904, - "step": 58992 - }, - { - "epoch": 1.51, - "learning_rate": 1.035604347445782e-06, - "loss": 0.6387, - "step": 58993 - }, - { - "epoch": 1.51, - "learning_rate": 1.0355766945223166e-06, - "loss": 0.6504, - "step": 58994 - }, - { - "epoch": 1.51, - "learning_rate": 1.0355490415716115e-06, - "loss": 0.6816, - "step": 58995 - }, - { - "epoch": 1.51, - "learning_rate": 1.0355213885936885e-06, - "loss": 0.7139, - "step": 58996 - }, - { - "epoch": 1.51, - "learning_rate": 1.0354937355885682e-06, - "loss": 0.7217, - "step": 58997 - }, - { - "epoch": 1.51, - "learning_rate": 1.0354660825562722e-06, - "loss": 0.5776, - "step": 58998 - }, - { - "epoch": 1.51, - "learning_rate": 1.0354384294968213e-06, - "loss": 0.8604, - "step": 58999 - }, - { - "epoch": 1.51, - "learning_rate": 1.0354107764102367e-06, - "loss": 0.5859, - "step": 59000 - }, - { - "epoch": 1.51, - "learning_rate": 1.0353831232965398e-06, - "loss": 0.6768, - "step": 59001 - }, - { - "epoch": 1.51, - "learning_rate": 1.035355470155752e-06, - "loss": 0.7119, - "step": 59002 - }, - { - "epoch": 1.51, - "learning_rate": 1.0353278169878934e-06, - "loss": 0.6465, - "step": 59003 - }, - { - "epoch": 1.51, - "learning_rate": 1.0353001637929867e-06, - "loss": 0.666, - "step": 59004 - }, - { - "epoch": 1.51, - "learning_rate": 1.0352725105710515e-06, - "loss": 0.7305, - "step": 59005 - }, - { - "epoch": 1.51, - "learning_rate": 1.0352448573221102e-06, - "loss": 0.5483, - "step": 59006 - }, - { - "epoch": 1.51, - "learning_rate": 1.0352172040461838e-06, - "loss": 0.4958, - "step": 59007 - }, - { - "epoch": 1.51, - "learning_rate": 1.0351895507432926e-06, - "loss": 0.8193, - "step": 59008 - }, - { - "epoch": 1.51, - "learning_rate": 1.0351618974134588e-06, - "loss": 0.5845, - "step": 59009 - }, - { - "epoch": 1.51, - "learning_rate": 1.0351342440567031e-06, - "loss": 0.6748, - "step": 59010 - }, - { - "epoch": 1.51, - "learning_rate": 1.0351065906730465e-06, - "loss": 0.6719, - "step": 59011 - }, - { - "epoch": 1.51, - "learning_rate": 1.0350789372625105e-06, - "loss": 0.6572, - "step": 59012 - }, - { - "epoch": 1.51, - "learning_rate": 1.0350512838251164e-06, - "loss": 0.6953, - "step": 59013 - }, - { - "epoch": 1.51, - "learning_rate": 1.035023630360885e-06, - "loss": 0.6226, - "step": 59014 - }, - { - "epoch": 1.51, - "learning_rate": 1.0349959768698375e-06, - "loss": 0.832, - "step": 59015 - }, - { - "epoch": 1.51, - "learning_rate": 1.0349683233519951e-06, - "loss": 0.6104, - "step": 59016 - }, - { - "epoch": 1.51, - "learning_rate": 1.0349406698073798e-06, - "loss": 0.6606, - "step": 59017 - }, - { - "epoch": 1.51, - "learning_rate": 1.0349130162360111e-06, - "loss": 0.7087, - "step": 59018 - }, - { - "epoch": 1.51, - "learning_rate": 1.0348853626379116e-06, - "loss": 0.6641, - "step": 59019 - }, - { - "epoch": 1.51, - "learning_rate": 1.034857709013102e-06, - "loss": 0.6577, - "step": 59020 - }, - { - "epoch": 1.51, - "learning_rate": 1.0348300553616031e-06, - "loss": 0.6836, - "step": 59021 - }, - { - "epoch": 1.51, - "learning_rate": 1.034802401683437e-06, - "loss": 0.4834, - "step": 59022 - }, - { - "epoch": 1.51, - "learning_rate": 1.034774747978624e-06, - "loss": 0.5962, - "step": 59023 - }, - { - "epoch": 1.51, - "learning_rate": 1.0347470942471851e-06, - "loss": 0.4722, - "step": 59024 - }, - { - "epoch": 1.51, - "learning_rate": 1.0347194404891427e-06, - "loss": 0.5493, - "step": 59025 - }, - { - "epoch": 1.51, - "learning_rate": 1.0346917867045166e-06, - "loss": 0.7251, - "step": 59026 - }, - { - "epoch": 1.51, - "learning_rate": 1.034664132893329e-06, - "loss": 0.6167, - "step": 59027 - }, - { - "epoch": 1.51, - "learning_rate": 1.0346364790556008e-06, - "loss": 0.3945, - "step": 59028 - }, - { - "epoch": 1.51, - "learning_rate": 1.0346088251913527e-06, - "loss": 0.5795, - "step": 59029 - }, - { - "epoch": 1.51, - "learning_rate": 1.0345811713006063e-06, - "loss": 0.7617, - "step": 59030 - }, - { - "epoch": 1.51, - "learning_rate": 1.0345535173833828e-06, - "loss": 0.5449, - "step": 59031 - }, - { - "epoch": 1.51, - "learning_rate": 1.0345258634397032e-06, - "loss": 0.5752, - "step": 59032 - }, - { - "epoch": 1.51, - "learning_rate": 1.0344982094695885e-06, - "loss": 0.3206, - "step": 59033 - }, - { - "epoch": 1.51, - "learning_rate": 1.0344705554730603e-06, - "loss": 0.499, - "step": 59034 - }, - { - "epoch": 1.51, - "learning_rate": 1.0344429014501394e-06, - "loss": 0.6287, - "step": 59035 - }, - { - "epoch": 1.51, - "learning_rate": 1.0344152474008477e-06, - "loss": 0.5454, - "step": 59036 - }, - { - "epoch": 1.51, - "learning_rate": 1.0343875933252054e-06, - "loss": 0.4938, - "step": 59037 - }, - { - "epoch": 1.51, - "learning_rate": 1.0343599392232343e-06, - "loss": 0.7471, - "step": 59038 - }, - { - "epoch": 1.51, - "learning_rate": 1.034332285094955e-06, - "loss": 0.7607, - "step": 59039 - }, - { - "epoch": 1.51, - "learning_rate": 1.0343046309403894e-06, - "loss": 0.4756, - "step": 59040 - }, - { - "epoch": 1.51, - "learning_rate": 1.034276976759558e-06, - "loss": 0.751, - "step": 59041 - }, - { - "epoch": 1.51, - "learning_rate": 1.034249322552483e-06, - "loss": 0.486, - "step": 59042 - }, - { - "epoch": 1.51, - "learning_rate": 1.034221668319184e-06, - "loss": 0.3964, - "step": 59043 - }, - { - "epoch": 1.51, - "learning_rate": 1.0341940140596837e-06, - "loss": 0.5742, - "step": 59044 - }, - { - "epoch": 1.51, - "learning_rate": 1.034166359774002e-06, - "loss": 0.75, - "step": 59045 - }, - { - "epoch": 1.51, - "learning_rate": 1.0341387054621612e-06, - "loss": 0.6084, - "step": 59046 - }, - { - "epoch": 1.51, - "learning_rate": 1.034111051124182e-06, - "loss": 0.4961, - "step": 59047 - }, - { - "epoch": 1.51, - "learning_rate": 1.0340833967600853e-06, - "loss": 0.4958, - "step": 59048 - }, - { - "epoch": 1.51, - "learning_rate": 1.0340557423698922e-06, - "loss": 0.8477, - "step": 59049 - }, - { - "epoch": 1.51, - "learning_rate": 1.0340280879536247e-06, - "loss": 0.5347, - "step": 59050 - }, - { - "epoch": 1.51, - "learning_rate": 1.0340004335113031e-06, - "loss": 0.5879, - "step": 59051 - }, - { - "epoch": 1.51, - "learning_rate": 1.0339727790429492e-06, - "loss": 0.6079, - "step": 59052 - }, - { - "epoch": 1.51, - "learning_rate": 1.033945124548584e-06, - "loss": 0.7197, - "step": 59053 - }, - { - "epoch": 1.51, - "learning_rate": 1.0339174700282282e-06, - "loss": 0.6157, - "step": 59054 - }, - { - "epoch": 1.51, - "learning_rate": 1.0338898154819035e-06, - "loss": 0.5447, - "step": 59055 - }, - { - "epoch": 1.51, - "learning_rate": 1.0338621609096311e-06, - "loss": 0.5352, - "step": 59056 - }, - { - "epoch": 1.51, - "learning_rate": 1.033834506311432e-06, - "loss": 0.8145, - "step": 59057 - }, - { - "epoch": 1.51, - "learning_rate": 1.0338068516873271e-06, - "loss": 0.7109, - "step": 59058 - }, - { - "epoch": 1.51, - "learning_rate": 1.033779197037338e-06, - "loss": 0.7092, - "step": 59059 - }, - { - "epoch": 1.51, - "learning_rate": 1.0337515423614856e-06, - "loss": 0.3816, - "step": 59060 - }, - { - "epoch": 1.51, - "learning_rate": 1.0337238876597913e-06, - "loss": 0.6191, - "step": 59061 - }, - { - "epoch": 1.51, - "learning_rate": 1.0336962329322763e-06, - "loss": 0.6055, - "step": 59062 - }, - { - "epoch": 1.51, - "learning_rate": 1.0336685781789616e-06, - "loss": 0.7471, - "step": 59063 - }, - { - "epoch": 1.51, - "learning_rate": 1.0336409233998682e-06, - "loss": 0.7939, - "step": 59064 - }, - { - "epoch": 1.51, - "learning_rate": 1.0336132685950178e-06, - "loss": 0.7227, - "step": 59065 - }, - { - "epoch": 1.51, - "learning_rate": 1.033585613764431e-06, - "loss": 0.7178, - "step": 59066 - }, - { - "epoch": 1.51, - "learning_rate": 1.0335579589081295e-06, - "loss": 0.6523, - "step": 59067 - }, - { - "epoch": 1.51, - "learning_rate": 1.033530304026134e-06, - "loss": 0.6553, - "step": 59068 - }, - { - "epoch": 1.51, - "learning_rate": 1.033502649118466e-06, - "loss": 0.5977, - "step": 59069 - }, - { - "epoch": 1.51, - "learning_rate": 1.0334749941851464e-06, - "loss": 0.5127, - "step": 59070 - }, - { - "epoch": 1.51, - "learning_rate": 1.0334473392261966e-06, - "loss": 0.5151, - "step": 59071 - }, - { - "epoch": 1.51, - "learning_rate": 1.033419684241638e-06, - "loss": 0.5703, - "step": 59072 - }, - { - "epoch": 1.51, - "learning_rate": 1.033392029231491e-06, - "loss": 0.6982, - "step": 59073 - }, - { - "epoch": 1.51, - "learning_rate": 1.0333643741957776e-06, - "loss": 0.5781, - "step": 59074 - }, - { - "epoch": 1.51, - "learning_rate": 1.0333367191345186e-06, - "loss": 0.7764, - "step": 59075 - }, - { - "epoch": 1.51, - "learning_rate": 1.033309064047735e-06, - "loss": 0.5571, - "step": 59076 - }, - { - "epoch": 1.51, - "learning_rate": 1.0332814089354482e-06, - "loss": 0.4095, - "step": 59077 - }, - { - "epoch": 1.51, - "learning_rate": 1.0332537537976797e-06, - "loss": 0.5781, - "step": 59078 - }, - { - "epoch": 1.51, - "learning_rate": 1.0332260986344498e-06, - "loss": 0.5693, - "step": 59079 - }, - { - "epoch": 1.51, - "learning_rate": 1.0331984434457808e-06, - "loss": 0.7681, - "step": 59080 - }, - { - "epoch": 1.51, - "learning_rate": 1.0331707882316928e-06, - "loss": 0.6602, - "step": 59081 - }, - { - "epoch": 1.51, - "learning_rate": 1.0331431329922077e-06, - "loss": 0.5859, - "step": 59082 - }, - { - "epoch": 1.51, - "learning_rate": 1.0331154777273464e-06, - "loss": 0.7012, - "step": 59083 - }, - { - "epoch": 1.51, - "learning_rate": 1.0330878224371302e-06, - "loss": 0.5232, - "step": 59084 - }, - { - "epoch": 1.51, - "learning_rate": 1.0330601671215797e-06, - "loss": 0.6426, - "step": 59085 - }, - { - "epoch": 1.51, - "learning_rate": 1.033032511780717e-06, - "loss": 0.564, - "step": 59086 - }, - { - "epoch": 1.51, - "learning_rate": 1.0330048564145628e-06, - "loss": 0.7148, - "step": 59087 - }, - { - "epoch": 1.51, - "learning_rate": 1.0329772010231383e-06, - "loss": 0.6733, - "step": 59088 - }, - { - "epoch": 1.51, - "learning_rate": 1.0329495456064645e-06, - "loss": 0.4561, - "step": 59089 - }, - { - "epoch": 1.51, - "learning_rate": 1.032921890164563e-06, - "loss": 0.665, - "step": 59090 - }, - { - "epoch": 1.51, - "learning_rate": 1.0328942346974543e-06, - "loss": 0.5615, - "step": 59091 - }, - { - "epoch": 1.51, - "learning_rate": 1.0328665792051606e-06, - "loss": 0.6008, - "step": 59092 - }, - { - "epoch": 1.51, - "learning_rate": 1.032838923687702e-06, - "loss": 0.5967, - "step": 59093 - }, - { - "epoch": 1.51, - "learning_rate": 1.0328112681451002e-06, - "loss": 0.7822, - "step": 59094 - }, - { - "epoch": 1.51, - "learning_rate": 1.0327836125773763e-06, - "loss": 0.7148, - "step": 59095 - }, - { - "epoch": 1.51, - "learning_rate": 1.0327559569845517e-06, - "loss": 0.5708, - "step": 59096 - }, - { - "epoch": 1.51, - "learning_rate": 1.0327283013666473e-06, - "loss": 0.4622, - "step": 59097 - }, - { - "epoch": 1.51, - "learning_rate": 1.0327006457236842e-06, - "loss": 0.6123, - "step": 59098 - }, - { - "epoch": 1.51, - "learning_rate": 1.0326729900556839e-06, - "loss": 0.5303, - "step": 59099 - }, - { - "epoch": 1.51, - "learning_rate": 1.032645334362667e-06, - "loss": 0.5542, - "step": 59100 - }, - { - "epoch": 1.51, - "learning_rate": 1.0326176786446556e-06, - "loss": 0.7432, - "step": 59101 - }, - { - "epoch": 1.51, - "learning_rate": 1.0325900229016703e-06, - "loss": 0.6323, - "step": 59102 - }, - { - "epoch": 1.51, - "learning_rate": 1.0325623671337321e-06, - "loss": 0.6211, - "step": 59103 - }, - { - "epoch": 1.51, - "learning_rate": 1.0325347113408622e-06, - "loss": 0.6621, - "step": 59104 - }, - { - "epoch": 1.51, - "learning_rate": 1.0325070555230824e-06, - "loss": 0.5962, - "step": 59105 - }, - { - "epoch": 1.51, - "learning_rate": 1.032479399680413e-06, - "loss": 0.397, - "step": 59106 - }, - { - "epoch": 1.51, - "learning_rate": 1.0324517438128764e-06, - "loss": 0.5908, - "step": 59107 - }, - { - "epoch": 1.51, - "learning_rate": 1.0324240879204922e-06, - "loss": 0.6797, - "step": 59108 - }, - { - "epoch": 1.51, - "learning_rate": 1.0323964320032827e-06, - "loss": 0.4375, - "step": 59109 - }, - { - "epoch": 1.52, - "learning_rate": 1.0323687760612685e-06, - "loss": 0.5958, - "step": 59110 - }, - { - "epoch": 1.52, - "learning_rate": 1.0323411200944712e-06, - "loss": 0.7178, - "step": 59111 - }, - { - "epoch": 1.52, - "learning_rate": 1.032313464102912e-06, - "loss": 0.8262, - "step": 59112 - }, - { - "epoch": 1.52, - "learning_rate": 1.0322858080866117e-06, - "loss": 0.665, - "step": 59113 - }, - { - "epoch": 1.52, - "learning_rate": 1.0322581520455912e-06, - "loss": 0.5854, - "step": 59114 - }, - { - "epoch": 1.52, - "learning_rate": 1.0322304959798727e-06, - "loss": 0.6611, - "step": 59115 - }, - { - "epoch": 1.52, - "learning_rate": 1.0322028398894764e-06, - "loss": 0.6816, - "step": 59116 - }, - { - "epoch": 1.52, - "learning_rate": 1.0321751837744241e-06, - "loss": 0.6904, - "step": 59117 - }, - { - "epoch": 1.52, - "learning_rate": 1.0321475276347368e-06, - "loss": 0.6699, - "step": 59118 - }, - { - "epoch": 1.52, - "learning_rate": 1.0321198714704355e-06, - "loss": 0.8008, - "step": 59119 - }, - { - "epoch": 1.52, - "learning_rate": 1.0320922152815415e-06, - "loss": 0.6626, - "step": 59120 - }, - { - "epoch": 1.52, - "learning_rate": 1.0320645590680762e-06, - "loss": 0.5957, - "step": 59121 - }, - { - "epoch": 1.52, - "learning_rate": 1.0320369028300602e-06, - "loss": 0.6807, - "step": 59122 - }, - { - "epoch": 1.52, - "learning_rate": 1.032009246567515e-06, - "loss": 0.5454, - "step": 59123 - }, - { - "epoch": 1.52, - "learning_rate": 1.031981590280462e-06, - "loss": 0.7246, - "step": 59124 - }, - { - "epoch": 1.52, - "learning_rate": 1.0319539339689222e-06, - "loss": 0.7979, - "step": 59125 - }, - { - "epoch": 1.52, - "learning_rate": 1.0319262776329165e-06, - "loss": 0.7246, - "step": 59126 - }, - { - "epoch": 1.52, - "learning_rate": 1.0318986212724666e-06, - "loss": 0.5698, - "step": 59127 - }, - { - "epoch": 1.52, - "learning_rate": 1.0318709648875933e-06, - "loss": 0.4902, - "step": 59128 - }, - { - "epoch": 1.52, - "learning_rate": 1.0318433084783176e-06, - "loss": 0.6577, - "step": 59129 - }, - { - "epoch": 1.52, - "learning_rate": 1.0318156520446613e-06, - "loss": 0.7197, - "step": 59130 - }, - { - "epoch": 1.52, - "learning_rate": 1.0317879955866448e-06, - "loss": 0.541, - "step": 59131 - }, - { - "epoch": 1.52, - "learning_rate": 1.0317603391042901e-06, - "loss": 0.6821, - "step": 59132 - }, - { - "epoch": 1.52, - "learning_rate": 1.0317326825976177e-06, - "loss": 0.5918, - "step": 59133 - }, - { - "epoch": 1.52, - "learning_rate": 1.0317050260666492e-06, - "loss": 0.647, - "step": 59134 - }, - { - "epoch": 1.52, - "learning_rate": 1.0316773695114056e-06, - "loss": 0.626, - "step": 59135 - }, - { - "epoch": 1.52, - "learning_rate": 1.031649712931908e-06, - "loss": 0.5717, - "step": 59136 - }, - { - "epoch": 1.52, - "learning_rate": 1.0316220563281782e-06, - "loss": 0.8037, - "step": 59137 - }, - { - "epoch": 1.52, - "learning_rate": 1.0315943997002363e-06, - "loss": 0.5596, - "step": 59138 - }, - { - "epoch": 1.52, - "learning_rate": 1.031566743048104e-06, - "loss": 0.7393, - "step": 59139 - }, - { - "epoch": 1.52, - "learning_rate": 1.0315390863718027e-06, - "loss": 0.6042, - "step": 59140 - }, - { - "epoch": 1.52, - "learning_rate": 1.0315114296713533e-06, - "loss": 0.5396, - "step": 59141 - }, - { - "epoch": 1.52, - "learning_rate": 1.031483772946777e-06, - "loss": 0.6133, - "step": 59142 - }, - { - "epoch": 1.52, - "learning_rate": 1.031456116198095e-06, - "loss": 0.7832, - "step": 59143 - }, - { - "epoch": 1.52, - "learning_rate": 1.0314284594253285e-06, - "loss": 0.584, - "step": 59144 - }, - { - "epoch": 1.52, - "learning_rate": 1.0314008026284988e-06, - "loss": 0.5825, - "step": 59145 - }, - { - "epoch": 1.52, - "learning_rate": 1.031373145807627e-06, - "loss": 0.7012, - "step": 59146 - }, - { - "epoch": 1.52, - "learning_rate": 1.0313454889627343e-06, - "loss": 0.6699, - "step": 59147 - }, - { - "epoch": 1.52, - "learning_rate": 1.0313178320938414e-06, - "loss": 0.7822, - "step": 59148 - }, - { - "epoch": 1.52, - "learning_rate": 1.03129017520097e-06, - "loss": 0.6641, - "step": 59149 - }, - { - "epoch": 1.52, - "learning_rate": 1.0312625182841412e-06, - "loss": 0.5669, - "step": 59150 - }, - { - "epoch": 1.52, - "learning_rate": 1.031234861343376e-06, - "loss": 0.6372, - "step": 59151 - }, - { - "epoch": 1.52, - "learning_rate": 1.0312072043786962e-06, - "loss": 0.647, - "step": 59152 - }, - { - "epoch": 1.52, - "learning_rate": 1.0311795473901222e-06, - "loss": 0.7285, - "step": 59153 - }, - { - "epoch": 1.52, - "learning_rate": 1.0311518903776752e-06, - "loss": 0.6738, - "step": 59154 - }, - { - "epoch": 1.52, - "learning_rate": 1.031124233341377e-06, - "loss": 0.7423, - "step": 59155 - }, - { - "epoch": 1.52, - "learning_rate": 1.031096576281248e-06, - "loss": 0.488, - "step": 59156 - }, - { - "epoch": 1.52, - "learning_rate": 1.0310689191973104e-06, - "loss": 0.6472, - "step": 59157 - }, - { - "epoch": 1.52, - "learning_rate": 1.031041262089584e-06, - "loss": 0.5801, - "step": 59158 - }, - { - "epoch": 1.52, - "learning_rate": 1.0310136049580912e-06, - "loss": 0.8027, - "step": 59159 - }, - { - "epoch": 1.52, - "learning_rate": 1.0309859478028527e-06, - "loss": 0.6714, - "step": 59160 - }, - { - "epoch": 1.52, - "learning_rate": 1.0309582906238896e-06, - "loss": 0.5713, - "step": 59161 - }, - { - "epoch": 1.52, - "learning_rate": 1.0309306334212231e-06, - "loss": 0.7559, - "step": 59162 - }, - { - "epoch": 1.52, - "learning_rate": 1.0309029761948745e-06, - "loss": 0.7021, - "step": 59163 - }, - { - "epoch": 1.52, - "learning_rate": 1.0308753189448648e-06, - "loss": 0.6689, - "step": 59164 - }, - { - "epoch": 1.52, - "learning_rate": 1.0308476616712155e-06, - "loss": 0.413, - "step": 59165 - }, - { - "epoch": 1.52, - "learning_rate": 1.0308200043739476e-06, - "loss": 0.562, - "step": 59166 - }, - { - "epoch": 1.52, - "learning_rate": 1.0307923470530819e-06, - "loss": 0.6602, - "step": 59167 - }, - { - "epoch": 1.52, - "learning_rate": 1.0307646897086401e-06, - "loss": 0.582, - "step": 59168 - }, - { - "epoch": 1.52, - "learning_rate": 1.0307370323406432e-06, - "loss": 0.6758, - "step": 59169 - }, - { - "epoch": 1.52, - "learning_rate": 1.0307093749491125e-06, - "loss": 0.6299, - "step": 59170 - }, - { - "epoch": 1.52, - "learning_rate": 1.0306817175340687e-06, - "loss": 0.6709, - "step": 59171 - }, - { - "epoch": 1.52, - "learning_rate": 1.0306540600955338e-06, - "loss": 0.6948, - "step": 59172 - }, - { - "epoch": 1.52, - "learning_rate": 1.0306264026335281e-06, - "loss": 0.6172, - "step": 59173 - }, - { - "epoch": 1.52, - "learning_rate": 1.0305987451480736e-06, - "loss": 0.8633, - "step": 59174 - }, - { - "epoch": 1.52, - "learning_rate": 1.0305710876391905e-06, - "loss": 0.6201, - "step": 59175 - }, - { - "epoch": 1.52, - "learning_rate": 1.0305434301069008e-06, - "loss": 0.6465, - "step": 59176 - }, - { - "epoch": 1.52, - "learning_rate": 1.0305157725512255e-06, - "loss": 0.6709, - "step": 59177 - }, - { - "epoch": 1.52, - "learning_rate": 1.0304881149721857e-06, - "loss": 0.564, - "step": 59178 - }, - { - "epoch": 1.52, - "learning_rate": 1.0304604573698022e-06, - "loss": 0.7559, - "step": 59179 - }, - { - "epoch": 1.52, - "learning_rate": 1.0304327997440966e-06, - "loss": 0.5786, - "step": 59180 - }, - { - "epoch": 1.52, - "learning_rate": 1.0304051420950902e-06, - "loss": 0.8828, - "step": 59181 - }, - { - "epoch": 1.52, - "learning_rate": 1.030377484422804e-06, - "loss": 0.6101, - "step": 59182 - }, - { - "epoch": 1.52, - "learning_rate": 1.030349826727259e-06, - "loss": 0.457, - "step": 59183 - }, - { - "epoch": 1.52, - "learning_rate": 1.0303221690084766e-06, - "loss": 0.4658, - "step": 59184 - }, - { - "epoch": 1.52, - "learning_rate": 1.030294511266478e-06, - "loss": 0.4958, - "step": 59185 - }, - { - "epoch": 1.52, - "learning_rate": 1.030266853501284e-06, - "loss": 0.7144, - "step": 59186 - }, - { - "epoch": 1.52, - "learning_rate": 1.0302391957129166e-06, - "loss": 0.7148, - "step": 59187 - }, - { - "epoch": 1.52, - "learning_rate": 1.0302115379013959e-06, - "loss": 0.6216, - "step": 59188 - }, - { - "epoch": 1.52, - "learning_rate": 1.030183880066744e-06, - "loss": 0.7158, - "step": 59189 - }, - { - "epoch": 1.52, - "learning_rate": 1.0301562222089811e-06, - "loss": 0.604, - "step": 59190 - }, - { - "epoch": 1.52, - "learning_rate": 1.0301285643281297e-06, - "loss": 0.6213, - "step": 59191 - }, - { - "epoch": 1.52, - "learning_rate": 1.03010090642421e-06, - "loss": 0.6602, - "step": 59192 - }, - { - "epoch": 1.52, - "learning_rate": 1.0300732484972433e-06, - "loss": 0.6265, - "step": 59193 - }, - { - "epoch": 1.52, - "learning_rate": 1.030045590547251e-06, - "loss": 0.5864, - "step": 59194 - }, - { - "epoch": 1.52, - "learning_rate": 1.030017932574254e-06, - "loss": 0.645, - "step": 59195 - }, - { - "epoch": 1.52, - "learning_rate": 1.0299902745782736e-06, - "loss": 0.6553, - "step": 59196 - }, - { - "epoch": 1.52, - "learning_rate": 1.0299626165593316e-06, - "loss": 0.626, - "step": 59197 - }, - { - "epoch": 1.52, - "learning_rate": 1.029934958517448e-06, - "loss": 0.6113, - "step": 59198 - }, - { - "epoch": 1.52, - "learning_rate": 1.0299073004526448e-06, - "loss": 0.7109, - "step": 59199 - }, - { - "epoch": 1.52, - "learning_rate": 1.0298796423649428e-06, - "loss": 0.6523, - "step": 59200 - }, - { - "epoch": 1.52, - "learning_rate": 1.0298519842543635e-06, - "loss": 0.5427, - "step": 59201 - }, - { - "epoch": 1.52, - "learning_rate": 1.029824326120928e-06, - "loss": 0.7451, - "step": 59202 - }, - { - "epoch": 1.52, - "learning_rate": 1.0297966679646572e-06, - "loss": 0.6885, - "step": 59203 - }, - { - "epoch": 1.52, - "learning_rate": 1.0297690097855724e-06, - "loss": 0.6216, - "step": 59204 - }, - { - "epoch": 1.52, - "learning_rate": 1.029741351583695e-06, - "loss": 0.814, - "step": 59205 - }, - { - "epoch": 1.52, - "learning_rate": 1.0297136933590457e-06, - "loss": 0.5938, - "step": 59206 - }, - { - "epoch": 1.52, - "learning_rate": 1.0296860351116465e-06, - "loss": 0.6626, - "step": 59207 - }, - { - "epoch": 1.52, - "learning_rate": 1.029658376841518e-06, - "loss": 0.7246, - "step": 59208 - }, - { - "epoch": 1.52, - "learning_rate": 1.0296307185486812e-06, - "loss": 0.5972, - "step": 59209 - }, - { - "epoch": 1.52, - "learning_rate": 1.0296030602331574e-06, - "loss": 0.417, - "step": 59210 - }, - { - "epoch": 1.52, - "learning_rate": 1.0295754018949683e-06, - "loss": 0.5449, - "step": 59211 - }, - { - "epoch": 1.52, - "learning_rate": 1.0295477435341344e-06, - "loss": 0.6182, - "step": 59212 - }, - { - "epoch": 1.52, - "learning_rate": 1.0295200851506772e-06, - "loss": 0.637, - "step": 59213 - }, - { - "epoch": 1.52, - "learning_rate": 1.0294924267446179e-06, - "loss": 0.6792, - "step": 59214 - }, - { - "epoch": 1.52, - "learning_rate": 1.0294647683159773e-06, - "loss": 0.7383, - "step": 59215 - }, - { - "epoch": 1.52, - "learning_rate": 1.029437109864777e-06, - "loss": 0.4993, - "step": 59216 - }, - { - "epoch": 1.52, - "learning_rate": 1.0294094513910386e-06, - "loss": 0.7949, - "step": 59217 - }, - { - "epoch": 1.52, - "learning_rate": 1.0293817928947824e-06, - "loss": 0.7422, - "step": 59218 - }, - { - "epoch": 1.52, - "learning_rate": 1.0293541343760294e-06, - "loss": 0.6094, - "step": 59219 - }, - { - "epoch": 1.52, - "learning_rate": 1.0293264758348018e-06, - "loss": 0.5923, - "step": 59220 - }, - { - "epoch": 1.52, - "learning_rate": 1.02929881727112e-06, - "loss": 0.7129, - "step": 59221 - }, - { - "epoch": 1.52, - "learning_rate": 1.029271158685006e-06, - "loss": 0.7036, - "step": 59222 - }, - { - "epoch": 1.52, - "learning_rate": 1.0292435000764802e-06, - "loss": 0.5996, - "step": 59223 - }, - { - "epoch": 1.52, - "learning_rate": 1.029215841445564e-06, - "loss": 0.5718, - "step": 59224 - }, - { - "epoch": 1.52, - "learning_rate": 1.029188182792278e-06, - "loss": 0.583, - "step": 59225 - }, - { - "epoch": 1.52, - "learning_rate": 1.0291605241166443e-06, - "loss": 0.7754, - "step": 59226 - }, - { - "epoch": 1.52, - "learning_rate": 1.0291328654186839e-06, - "loss": 0.5935, - "step": 59227 - }, - { - "epoch": 1.52, - "learning_rate": 1.029105206698418e-06, - "loss": 0.5693, - "step": 59228 - }, - { - "epoch": 1.52, - "learning_rate": 1.0290775479558671e-06, - "loss": 0.6377, - "step": 59229 - }, - { - "epoch": 1.52, - "learning_rate": 1.029049889191053e-06, - "loss": 0.7368, - "step": 59230 - }, - { - "epoch": 1.52, - "learning_rate": 1.0290222304039966e-06, - "loss": 0.666, - "step": 59231 - }, - { - "epoch": 1.52, - "learning_rate": 1.0289945715947195e-06, - "loss": 0.6465, - "step": 59232 - }, - { - "epoch": 1.52, - "learning_rate": 1.0289669127632426e-06, - "loss": 0.7539, - "step": 59233 - }, - { - "epoch": 1.52, - "learning_rate": 1.0289392539095867e-06, - "loss": 0.4158, - "step": 59234 - }, - { - "epoch": 1.52, - "learning_rate": 1.0289115950337736e-06, - "loss": 0.5889, - "step": 59235 - }, - { - "epoch": 1.52, - "learning_rate": 1.028883936135824e-06, - "loss": 0.666, - "step": 59236 - }, - { - "epoch": 1.52, - "learning_rate": 1.0288562772157602e-06, - "loss": 0.7783, - "step": 59237 - }, - { - "epoch": 1.52, - "learning_rate": 1.0288286182736014e-06, - "loss": 0.7754, - "step": 59238 - }, - { - "epoch": 1.52, - "learning_rate": 1.0288009593093703e-06, - "loss": 0.5869, - "step": 59239 - }, - { - "epoch": 1.52, - "learning_rate": 1.0287733003230873e-06, - "loss": 0.5938, - "step": 59240 - }, - { - "epoch": 1.52, - "learning_rate": 1.0287456413147745e-06, - "loss": 0.3835, - "step": 59241 - }, - { - "epoch": 1.52, - "learning_rate": 1.0287179822844523e-06, - "loss": 0.4558, - "step": 59242 - }, - { - "epoch": 1.52, - "learning_rate": 1.0286903232321418e-06, - "loss": 0.5454, - "step": 59243 - }, - { - "epoch": 1.52, - "learning_rate": 1.0286626641578644e-06, - "loss": 0.686, - "step": 59244 - }, - { - "epoch": 1.52, - "learning_rate": 1.0286350050616418e-06, - "loss": 0.6519, - "step": 59245 - }, - { - "epoch": 1.52, - "learning_rate": 1.0286073459434944e-06, - "loss": 0.7227, - "step": 59246 - }, - { - "epoch": 1.52, - "learning_rate": 1.0285796868034436e-06, - "loss": 0.7783, - "step": 59247 - }, - { - "epoch": 1.52, - "learning_rate": 1.0285520276415105e-06, - "loss": 0.4767, - "step": 59248 - }, - { - "epoch": 1.52, - "learning_rate": 1.0285243684577168e-06, - "loss": 0.5996, - "step": 59249 - }, - { - "epoch": 1.52, - "learning_rate": 1.028496709252083e-06, - "loss": 0.6621, - "step": 59250 - }, - { - "epoch": 1.52, - "learning_rate": 1.0284690500246306e-06, - "loss": 0.6318, - "step": 59251 - }, - { - "epoch": 1.52, - "learning_rate": 1.0284413907753811e-06, - "loss": 0.7056, - "step": 59252 - }, - { - "epoch": 1.52, - "learning_rate": 1.0284137315043549e-06, - "loss": 0.7275, - "step": 59253 - }, - { - "epoch": 1.52, - "learning_rate": 1.0283860722115739e-06, - "loss": 0.7529, - "step": 59254 - }, - { - "epoch": 1.52, - "learning_rate": 1.0283584128970588e-06, - "loss": 0.4888, - "step": 59255 - }, - { - "epoch": 1.52, - "learning_rate": 1.0283307535608311e-06, - "loss": 0.5466, - "step": 59256 - }, - { - "epoch": 1.52, - "learning_rate": 1.0283030942029118e-06, - "loss": 0.6221, - "step": 59257 - }, - { - "epoch": 1.52, - "learning_rate": 1.028275434823322e-06, - "loss": 0.5347, - "step": 59258 - }, - { - "epoch": 1.52, - "learning_rate": 1.028247775422083e-06, - "loss": 0.793, - "step": 59259 - }, - { - "epoch": 1.52, - "learning_rate": 1.0282201159992164e-06, - "loss": 0.7051, - "step": 59260 - }, - { - "epoch": 1.52, - "learning_rate": 1.0281924565547425e-06, - "loss": 0.5767, - "step": 59261 - }, - { - "epoch": 1.52, - "learning_rate": 1.0281647970886833e-06, - "loss": 0.7695, - "step": 59262 - }, - { - "epoch": 1.52, - "learning_rate": 1.0281371376010593e-06, - "loss": 0.667, - "step": 59263 - }, - { - "epoch": 1.52, - "learning_rate": 1.0281094780918919e-06, - "loss": 0.6973, - "step": 59264 - }, - { - "epoch": 1.52, - "learning_rate": 1.0280818185612026e-06, - "loss": 0.5764, - "step": 59265 - }, - { - "epoch": 1.52, - "learning_rate": 1.0280541590090126e-06, - "loss": 0.665, - "step": 59266 - }, - { - "epoch": 1.52, - "learning_rate": 1.0280264994353424e-06, - "loss": 0.4692, - "step": 59267 - }, - { - "epoch": 1.52, - "learning_rate": 1.0279988398402138e-06, - "loss": 0.5913, - "step": 59268 - }, - { - "epoch": 1.52, - "learning_rate": 1.0279711802236474e-06, - "loss": 0.7266, - "step": 59269 - }, - { - "epoch": 1.52, - "learning_rate": 1.0279435205856653e-06, - "loss": 0.6729, - "step": 59270 - }, - { - "epoch": 1.52, - "learning_rate": 1.027915860926288e-06, - "loss": 0.4204, - "step": 59271 - }, - { - "epoch": 1.52, - "learning_rate": 1.0278882012455364e-06, - "loss": 0.5271, - "step": 59272 - }, - { - "epoch": 1.52, - "learning_rate": 1.0278605415434325e-06, - "loss": 0.7573, - "step": 59273 - }, - { - "epoch": 1.52, - "learning_rate": 1.0278328818199968e-06, - "loss": 0.8223, - "step": 59274 - }, - { - "epoch": 1.52, - "learning_rate": 1.0278052220752509e-06, - "loss": 0.5952, - "step": 59275 - }, - { - "epoch": 1.52, - "learning_rate": 1.0277775623092158e-06, - "loss": 0.6309, - "step": 59276 - }, - { - "epoch": 1.52, - "learning_rate": 1.0277499025219128e-06, - "loss": 0.7183, - "step": 59277 - }, - { - "epoch": 1.52, - "learning_rate": 1.0277222427133628e-06, - "loss": 0.511, - "step": 59278 - }, - { - "epoch": 1.52, - "learning_rate": 1.0276945828835872e-06, - "loss": 0.5767, - "step": 59279 - }, - { - "epoch": 1.52, - "learning_rate": 1.0276669230326068e-06, - "loss": 0.6123, - "step": 59280 - }, - { - "epoch": 1.52, - "learning_rate": 1.027639263160444e-06, - "loss": 0.6201, - "step": 59281 - }, - { - "epoch": 1.52, - "learning_rate": 1.0276116032671184e-06, - "loss": 0.5798, - "step": 59282 - }, - { - "epoch": 1.52, - "learning_rate": 1.027583943352652e-06, - "loss": 0.6592, - "step": 59283 - }, - { - "epoch": 1.52, - "learning_rate": 1.0275562834170657e-06, - "loss": 0.5923, - "step": 59284 - }, - { - "epoch": 1.52, - "learning_rate": 1.0275286234603811e-06, - "loss": 0.834, - "step": 59285 - }, - { - "epoch": 1.52, - "learning_rate": 1.0275009634826192e-06, - "loss": 0.6387, - "step": 59286 - }, - { - "epoch": 1.52, - "learning_rate": 1.0274733034838008e-06, - "loss": 0.5908, - "step": 59287 - }, - { - "epoch": 1.52, - "learning_rate": 1.027445643463947e-06, - "loss": 0.585, - "step": 59288 - }, - { - "epoch": 1.52, - "learning_rate": 1.02741798342308e-06, - "loss": 0.6289, - "step": 59289 - }, - { - "epoch": 1.52, - "learning_rate": 1.02739032336122e-06, - "loss": 0.751, - "step": 59290 - }, - { - "epoch": 1.52, - "learning_rate": 1.0273626632783887e-06, - "loss": 0.6172, - "step": 59291 - }, - { - "epoch": 1.52, - "learning_rate": 1.0273350031746069e-06, - "loss": 0.481, - "step": 59292 - }, - { - "epoch": 1.52, - "learning_rate": 1.027307343049896e-06, - "loss": 0.5986, - "step": 59293 - }, - { - "epoch": 1.52, - "learning_rate": 1.027279682904277e-06, - "loss": 0.6855, - "step": 59294 - }, - { - "epoch": 1.52, - "learning_rate": 1.0272520227377713e-06, - "loss": 0.5591, - "step": 59295 - }, - { - "epoch": 1.52, - "learning_rate": 1.0272243625504e-06, - "loss": 0.7227, - "step": 59296 - }, - { - "epoch": 1.52, - "learning_rate": 1.027196702342184e-06, - "loss": 0.5593, - "step": 59297 - }, - { - "epoch": 1.52, - "learning_rate": 1.027169042113145e-06, - "loss": 0.75, - "step": 59298 - }, - { - "epoch": 1.52, - "learning_rate": 1.027141381863304e-06, - "loss": 0.7227, - "step": 59299 - }, - { - "epoch": 1.52, - "learning_rate": 1.0271137215926816e-06, - "loss": 0.6226, - "step": 59300 - }, - { - "epoch": 1.52, - "learning_rate": 1.0270860613013002e-06, - "loss": 0.9805, - "step": 59301 - }, - { - "epoch": 1.52, - "learning_rate": 1.0270584009891799e-06, - "loss": 0.6553, - "step": 59302 - }, - { - "epoch": 1.52, - "learning_rate": 1.0270307406563419e-06, - "loss": 0.6689, - "step": 59303 - }, - { - "epoch": 1.52, - "learning_rate": 1.0270030803028082e-06, - "loss": 0.832, - "step": 59304 - }, - { - "epoch": 1.52, - "learning_rate": 1.0269754199285992e-06, - "loss": 0.5835, - "step": 59305 - }, - { - "epoch": 1.52, - "learning_rate": 1.0269477595337366e-06, - "loss": 0.6743, - "step": 59306 - }, - { - "epoch": 1.52, - "learning_rate": 1.026920099118241e-06, - "loss": 0.5605, - "step": 59307 - }, - { - "epoch": 1.52, - "learning_rate": 1.0268924386821342e-06, - "loss": 0.6118, - "step": 59308 - }, - { - "epoch": 1.52, - "learning_rate": 1.026864778225437e-06, - "loss": 0.7412, - "step": 59309 - }, - { - "epoch": 1.52, - "learning_rate": 1.0268371177481708e-06, - "loss": 0.7598, - "step": 59310 - }, - { - "epoch": 1.52, - "learning_rate": 1.0268094572503564e-06, - "loss": 0.4661, - "step": 59311 - }, - { - "epoch": 1.52, - "learning_rate": 1.0267817967320155e-06, - "loss": 0.6177, - "step": 59312 - }, - { - "epoch": 1.52, - "learning_rate": 1.0267541361931685e-06, - "loss": 0.6265, - "step": 59313 - }, - { - "epoch": 1.52, - "learning_rate": 1.0267264756338376e-06, - "loss": 0.6982, - "step": 59314 - }, - { - "epoch": 1.52, - "learning_rate": 1.0266988150540431e-06, - "loss": 0.5737, - "step": 59315 - }, - { - "epoch": 1.52, - "learning_rate": 1.0266711544538075e-06, - "loss": 0.6953, - "step": 59316 - }, - { - "epoch": 1.52, - "learning_rate": 1.0266434938331498e-06, - "loss": 0.7725, - "step": 59317 - }, - { - "epoch": 1.52, - "learning_rate": 1.026615833192093e-06, - "loss": 0.4285, - "step": 59318 - }, - { - "epoch": 1.52, - "learning_rate": 1.0265881725306576e-06, - "loss": 0.7383, - "step": 59319 - }, - { - "epoch": 1.52, - "learning_rate": 1.026560511848865e-06, - "loss": 0.5381, - "step": 59320 - }, - { - "epoch": 1.52, - "learning_rate": 1.0265328511467358e-06, - "loss": 0.582, - "step": 59321 - }, - { - "epoch": 1.52, - "learning_rate": 1.0265051904242917e-06, - "loss": 0.5229, - "step": 59322 - }, - { - "epoch": 1.52, - "learning_rate": 1.0264775296815542e-06, - "loss": 0.667, - "step": 59323 - }, - { - "epoch": 1.52, - "learning_rate": 1.0264498689185436e-06, - "loss": 0.6099, - "step": 59324 - }, - { - "epoch": 1.52, - "learning_rate": 1.026422208135282e-06, - "loss": 0.5491, - "step": 59325 - }, - { - "epoch": 1.52, - "learning_rate": 1.02639454733179e-06, - "loss": 0.5532, - "step": 59326 - }, - { - "epoch": 1.52, - "learning_rate": 1.026366886508089e-06, - "loss": 0.5376, - "step": 59327 - }, - { - "epoch": 1.52, - "learning_rate": 1.0263392256641997e-06, - "loss": 0.7539, - "step": 59328 - }, - { - "epoch": 1.52, - "learning_rate": 1.0263115648001442e-06, - "loss": 0.6948, - "step": 59329 - }, - { - "epoch": 1.52, - "learning_rate": 1.0262839039159426e-06, - "loss": 0.4434, - "step": 59330 - }, - { - "epoch": 1.52, - "learning_rate": 1.026256243011617e-06, - "loss": 0.4946, - "step": 59331 - }, - { - "epoch": 1.52, - "learning_rate": 1.026228582087188e-06, - "loss": 0.54, - "step": 59332 - }, - { - "epoch": 1.52, - "learning_rate": 1.0262009211426773e-06, - "loss": 0.6797, - "step": 59333 - }, - { - "epoch": 1.52, - "learning_rate": 1.0261732601781052e-06, - "loss": 0.6362, - "step": 59334 - }, - { - "epoch": 1.52, - "learning_rate": 1.0261455991934938e-06, - "loss": 0.6089, - "step": 59335 - }, - { - "epoch": 1.52, - "learning_rate": 1.026117938188864e-06, - "loss": 0.6411, - "step": 59336 - }, - { - "epoch": 1.52, - "learning_rate": 1.0260902771642367e-06, - "loss": 0.7017, - "step": 59337 - }, - { - "epoch": 1.52, - "learning_rate": 1.0260626161196334e-06, - "loss": 0.7676, - "step": 59338 - }, - { - "epoch": 1.52, - "learning_rate": 1.026034955055075e-06, - "loss": 0.6572, - "step": 59339 - }, - { - "epoch": 1.52, - "learning_rate": 1.0260072939705827e-06, - "loss": 0.8301, - "step": 59340 - }, - { - "epoch": 1.52, - "learning_rate": 1.0259796328661782e-06, - "loss": 0.6343, - "step": 59341 - }, - { - "epoch": 1.52, - "learning_rate": 1.0259519717418822e-06, - "loss": 0.7197, - "step": 59342 - }, - { - "epoch": 1.52, - "learning_rate": 1.0259243105977159e-06, - "loss": 0.5833, - "step": 59343 - }, - { - "epoch": 1.52, - "learning_rate": 1.0258966494337004e-06, - "loss": 0.9023, - "step": 59344 - }, - { - "epoch": 1.52, - "learning_rate": 1.0258689882498573e-06, - "loss": 0.4688, - "step": 59345 - }, - { - "epoch": 1.52, - "learning_rate": 1.0258413270462074e-06, - "loss": 0.6382, - "step": 59346 - }, - { - "epoch": 1.52, - "learning_rate": 1.025813665822772e-06, - "loss": 0.3816, - "step": 59347 - }, - { - "epoch": 1.52, - "learning_rate": 1.0257860045795722e-06, - "loss": 0.7686, - "step": 59348 - }, - { - "epoch": 1.52, - "learning_rate": 1.025758343316629e-06, - "loss": 0.71, - "step": 59349 - }, - { - "epoch": 1.52, - "learning_rate": 1.0257306820339642e-06, - "loss": 0.7285, - "step": 59350 - }, - { - "epoch": 1.52, - "learning_rate": 1.0257030207315986e-06, - "loss": 0.6035, - "step": 59351 - }, - { - "epoch": 1.52, - "learning_rate": 1.0256753594095532e-06, - "loss": 0.5229, - "step": 59352 - }, - { - "epoch": 1.52, - "learning_rate": 1.0256476980678492e-06, - "loss": 0.5835, - "step": 59353 - }, - { - "epoch": 1.52, - "learning_rate": 1.0256200367065085e-06, - "loss": 0.52, - "step": 59354 - }, - { - "epoch": 1.52, - "learning_rate": 1.0255923753255511e-06, - "loss": 0.7139, - "step": 59355 - }, - { - "epoch": 1.52, - "learning_rate": 1.0255647139249993e-06, - "loss": 0.8535, - "step": 59356 - }, - { - "epoch": 1.52, - "learning_rate": 1.0255370525048735e-06, - "loss": 0.5415, - "step": 59357 - }, - { - "epoch": 1.52, - "learning_rate": 1.0255093910651953e-06, - "loss": 0.7051, - "step": 59358 - }, - { - "epoch": 1.52, - "learning_rate": 1.0254817296059854e-06, - "loss": 0.707, - "step": 59359 - }, - { - "epoch": 1.52, - "learning_rate": 1.0254540681272656e-06, - "loss": 0.7012, - "step": 59360 - }, - { - "epoch": 1.52, - "learning_rate": 1.0254264066290567e-06, - "loss": 0.73, - "step": 59361 - }, - { - "epoch": 1.52, - "learning_rate": 1.0253987451113801e-06, - "loss": 0.7383, - "step": 59362 - }, - { - "epoch": 1.52, - "learning_rate": 1.0253710835742566e-06, - "loss": 0.585, - "step": 59363 - }, - { - "epoch": 1.52, - "learning_rate": 1.025343422017708e-06, - "loss": 0.834, - "step": 59364 - }, - { - "epoch": 1.52, - "learning_rate": 1.0253157604417545e-06, - "loss": 0.6111, - "step": 59365 - }, - { - "epoch": 1.52, - "learning_rate": 1.0252880988464186e-06, - "loss": 0.5825, - "step": 59366 - }, - { - "epoch": 1.52, - "learning_rate": 1.0252604372317204e-06, - "loss": 0.6387, - "step": 59367 - }, - { - "epoch": 1.52, - "learning_rate": 1.0252327755976812e-06, - "loss": 0.835, - "step": 59368 - }, - { - "epoch": 1.52, - "learning_rate": 1.0252051139443227e-06, - "loss": 0.7148, - "step": 59369 - }, - { - "epoch": 1.52, - "learning_rate": 1.0251774522716658e-06, - "loss": 0.6157, - "step": 59370 - }, - { - "epoch": 1.52, - "learning_rate": 1.025149790579732e-06, - "loss": 0.7061, - "step": 59371 - }, - { - "epoch": 1.52, - "learning_rate": 1.0251221288685416e-06, - "loss": 0.5215, - "step": 59372 - }, - { - "epoch": 1.52, - "learning_rate": 1.0250944671381169e-06, - "loss": 0.6875, - "step": 59373 - }, - { - "epoch": 1.52, - "learning_rate": 1.0250668053884778e-06, - "loss": 0.5693, - "step": 59374 - }, - { - "epoch": 1.52, - "learning_rate": 1.0250391436196469e-06, - "loss": 0.6626, - "step": 59375 - }, - { - "epoch": 1.52, - "learning_rate": 1.0250114818316442e-06, - "loss": 0.4661, - "step": 59376 - }, - { - "epoch": 1.52, - "learning_rate": 1.0249838200244918e-06, - "loss": 0.7178, - "step": 59377 - }, - { - "epoch": 1.52, - "learning_rate": 1.02495615819821e-06, - "loss": 0.8125, - "step": 59378 - }, - { - "epoch": 1.52, - "learning_rate": 1.0249284963528207e-06, - "loss": 0.4993, - "step": 59379 - }, - { - "epoch": 1.52, - "learning_rate": 1.0249008344883445e-06, - "loss": 0.5596, - "step": 59380 - }, - { - "epoch": 1.52, - "learning_rate": 1.0248731726048033e-06, - "loss": 0.7139, - "step": 59381 - }, - { - "epoch": 1.52, - "learning_rate": 1.0248455107022177e-06, - "loss": 0.6807, - "step": 59382 - }, - { - "epoch": 1.52, - "learning_rate": 1.024817848780609e-06, - "loss": 0.7354, - "step": 59383 - }, - { - "epoch": 1.52, - "learning_rate": 1.0247901868399982e-06, - "loss": 0.4683, - "step": 59384 - }, - { - "epoch": 1.52, - "learning_rate": 1.0247625248804068e-06, - "loss": 0.7432, - "step": 59385 - }, - { - "epoch": 1.52, - "learning_rate": 1.024734862901856e-06, - "loss": 0.5918, - "step": 59386 - }, - { - "epoch": 1.52, - "learning_rate": 1.0247072009043667e-06, - "loss": 0.6445, - "step": 59387 - }, - { - "epoch": 1.52, - "learning_rate": 1.0246795388879603e-06, - "loss": 0.5732, - "step": 59388 - }, - { - "epoch": 1.52, - "learning_rate": 1.0246518768526581e-06, - "loss": 0.6709, - "step": 59389 - }, - { - "epoch": 1.52, - "learning_rate": 1.0246242147984807e-06, - "loss": 0.6758, - "step": 59390 - }, - { - "epoch": 1.52, - "learning_rate": 1.0245965527254501e-06, - "loss": 0.8398, - "step": 59391 - }, - { - "epoch": 1.52, - "learning_rate": 1.024568890633587e-06, - "loss": 0.5322, - "step": 59392 - }, - { - "epoch": 1.52, - "learning_rate": 1.0245412285229123e-06, - "loss": 0.7119, - "step": 59393 - }, - { - "epoch": 1.52, - "learning_rate": 1.0245135663934476e-06, - "loss": 0.6294, - "step": 59394 - }, - { - "epoch": 1.52, - "learning_rate": 1.0244859042452141e-06, - "loss": 0.6313, - "step": 59395 - }, - { - "epoch": 1.52, - "learning_rate": 1.024458242078233e-06, - "loss": 0.7529, - "step": 59396 - }, - { - "epoch": 1.52, - "learning_rate": 1.024430579892525e-06, - "loss": 0.561, - "step": 59397 - }, - { - "epoch": 1.52, - "learning_rate": 1.024402917688112e-06, - "loss": 0.875, - "step": 59398 - }, - { - "epoch": 1.52, - "learning_rate": 1.0243752554650145e-06, - "loss": 0.6416, - "step": 59399 - }, - { - "epoch": 1.52, - "learning_rate": 1.0243475932232542e-06, - "loss": 0.623, - "step": 59400 - }, - { - "epoch": 1.52, - "learning_rate": 1.0243199309628522e-06, - "loss": 0.5015, - "step": 59401 - }, - { - "epoch": 1.52, - "learning_rate": 1.0242922686838294e-06, - "loss": 0.5576, - "step": 59402 - }, - { - "epoch": 1.52, - "learning_rate": 1.0242646063862068e-06, - "loss": 0.6274, - "step": 59403 - }, - { - "epoch": 1.52, - "learning_rate": 1.0242369440700063e-06, - "loss": 0.3384, - "step": 59404 - }, - { - "epoch": 1.52, - "learning_rate": 1.0242092817352483e-06, - "loss": 0.6777, - "step": 59405 - }, - { - "epoch": 1.52, - "learning_rate": 1.024181619381955e-06, - "loss": 0.4412, - "step": 59406 - }, - { - "epoch": 1.52, - "learning_rate": 1.0241539570101462e-06, - "loss": 0.7373, - "step": 59407 - }, - { - "epoch": 1.52, - "learning_rate": 1.0241262946198443e-06, - "loss": 0.7402, - "step": 59408 - }, - { - "epoch": 1.52, - "learning_rate": 1.0240986322110698e-06, - "loss": 0.5752, - "step": 59409 - }, - { - "epoch": 1.52, - "learning_rate": 1.0240709697838444e-06, - "loss": 0.5327, - "step": 59410 - }, - { - "epoch": 1.52, - "learning_rate": 1.0240433073381888e-06, - "loss": 0.6152, - "step": 59411 - }, - { - "epoch": 1.52, - "learning_rate": 1.024015644874124e-06, - "loss": 0.5579, - "step": 59412 - }, - { - "epoch": 1.52, - "learning_rate": 1.023987982391672e-06, - "loss": 0.6108, - "step": 59413 - }, - { - "epoch": 1.52, - "learning_rate": 1.0239603198908534e-06, - "loss": 0.6255, - "step": 59414 - }, - { - "epoch": 1.52, - "learning_rate": 1.0239326573716893e-06, - "loss": 0.5479, - "step": 59415 - }, - { - "epoch": 1.52, - "learning_rate": 1.0239049948342014e-06, - "loss": 0.71, - "step": 59416 - }, - { - "epoch": 1.52, - "learning_rate": 1.0238773322784102e-06, - "loss": 0.6792, - "step": 59417 - }, - { - "epoch": 1.52, - "learning_rate": 1.0238496697043372e-06, - "loss": 0.6221, - "step": 59418 - }, - { - "epoch": 1.52, - "learning_rate": 1.0238220071120037e-06, - "loss": 0.8418, - "step": 59419 - }, - { - "epoch": 1.52, - "learning_rate": 1.0237943445014307e-06, - "loss": 0.6157, - "step": 59420 - }, - { - "epoch": 1.52, - "learning_rate": 1.02376668187264e-06, - "loss": 0.6895, - "step": 59421 - }, - { - "epoch": 1.52, - "learning_rate": 1.0237390192256517e-06, - "loss": 0.707, - "step": 59422 - }, - { - "epoch": 1.52, - "learning_rate": 1.0237113565604878e-06, - "loss": 0.5166, - "step": 59423 - }, - { - "epoch": 1.52, - "learning_rate": 1.023683693877169e-06, - "loss": 0.6572, - "step": 59424 - }, - { - "epoch": 1.52, - "learning_rate": 1.0236560311757167e-06, - "loss": 0.7603, - "step": 59425 - }, - { - "epoch": 1.52, - "learning_rate": 1.0236283684561523e-06, - "loss": 0.6895, - "step": 59426 - }, - { - "epoch": 1.52, - "learning_rate": 1.0236007057184965e-06, - "loss": 0.7002, - "step": 59427 - }, - { - "epoch": 1.52, - "learning_rate": 1.0235730429627708e-06, - "loss": 0.5215, - "step": 59428 - }, - { - "epoch": 1.52, - "learning_rate": 1.0235453801889964e-06, - "loss": 0.7095, - "step": 59429 - }, - { - "epoch": 1.52, - "learning_rate": 1.023517717397194e-06, - "loss": 0.6626, - "step": 59430 - }, - { - "epoch": 1.52, - "learning_rate": 1.0234900545873855e-06, - "loss": 0.6875, - "step": 59431 - }, - { - "epoch": 1.52, - "learning_rate": 1.0234623917595917e-06, - "loss": 0.5957, - "step": 59432 - }, - { - "epoch": 1.52, - "learning_rate": 1.0234347289138338e-06, - "loss": 0.5942, - "step": 59433 - }, - { - "epoch": 1.52, - "learning_rate": 1.0234070660501332e-06, - "loss": 0.6841, - "step": 59434 - }, - { - "epoch": 1.52, - "learning_rate": 1.0233794031685106e-06, - "loss": 0.7617, - "step": 59435 - }, - { - "epoch": 1.52, - "learning_rate": 1.0233517402689877e-06, - "loss": 0.6479, - "step": 59436 - }, - { - "epoch": 1.52, - "learning_rate": 1.0233240773515852e-06, - "loss": 0.4231, - "step": 59437 - }, - { - "epoch": 1.52, - "learning_rate": 1.0232964144163247e-06, - "loss": 0.7207, - "step": 59438 - }, - { - "epoch": 1.52, - "learning_rate": 1.023268751463227e-06, - "loss": 0.4351, - "step": 59439 - }, - { - "epoch": 1.52, - "learning_rate": 1.0232410884923137e-06, - "loss": 0.7026, - "step": 59440 - }, - { - "epoch": 1.52, - "learning_rate": 1.0232134255036059e-06, - "loss": 0.5266, - "step": 59441 - }, - { - "epoch": 1.52, - "learning_rate": 1.0231857624971245e-06, - "loss": 0.7246, - "step": 59442 - }, - { - "epoch": 1.52, - "learning_rate": 1.0231580994728906e-06, - "loss": 0.6514, - "step": 59443 - }, - { - "epoch": 1.52, - "learning_rate": 1.023130436430926e-06, - "loss": 0.8066, - "step": 59444 - }, - { - "epoch": 1.52, - "learning_rate": 1.023102773371251e-06, - "loss": 0.6831, - "step": 59445 - }, - { - "epoch": 1.52, - "learning_rate": 1.0230751102938877e-06, - "loss": 0.6309, - "step": 59446 - }, - { - "epoch": 1.52, - "learning_rate": 1.0230474471988567e-06, - "loss": 0.7168, - "step": 59447 - }, - { - "epoch": 1.52, - "learning_rate": 1.0230197840861794e-06, - "loss": 0.7559, - "step": 59448 - }, - { - "epoch": 1.52, - "learning_rate": 1.0229921209558767e-06, - "loss": 0.7012, - "step": 59449 - }, - { - "epoch": 1.52, - "learning_rate": 1.0229644578079702e-06, - "loss": 0.6675, - "step": 59450 - }, - { - "epoch": 1.52, - "learning_rate": 1.0229367946424807e-06, - "loss": 0.6572, - "step": 59451 - }, - { - "epoch": 1.52, - "learning_rate": 1.0229091314594298e-06, - "loss": 0.583, - "step": 59452 - }, - { - "epoch": 1.52, - "learning_rate": 1.0228814682588383e-06, - "loss": 0.5084, - "step": 59453 - }, - { - "epoch": 1.52, - "learning_rate": 1.0228538050407275e-06, - "loss": 0.624, - "step": 59454 - }, - { - "epoch": 1.52, - "learning_rate": 1.0228261418051182e-06, - "loss": 0.3838, - "step": 59455 - }, - { - "epoch": 1.52, - "learning_rate": 1.0227984785520325e-06, - "loss": 0.644, - "step": 59456 - }, - { - "epoch": 1.52, - "learning_rate": 1.0227708152814912e-06, - "loss": 0.5852, - "step": 59457 - }, - { - "epoch": 1.52, - "learning_rate": 1.0227431519935147e-06, - "loss": 0.7354, - "step": 59458 - }, - { - "epoch": 1.52, - "learning_rate": 1.0227154886881254e-06, - "loss": 0.6318, - "step": 59459 - }, - { - "epoch": 1.52, - "learning_rate": 1.0226878253653435e-06, - "loss": 0.5728, - "step": 59460 - }, - { - "epoch": 1.52, - "learning_rate": 1.0226601620251908e-06, - "loss": 0.5874, - "step": 59461 - }, - { - "epoch": 1.52, - "learning_rate": 1.0226324986676882e-06, - "loss": 0.5571, - "step": 59462 - }, - { - "epoch": 1.52, - "learning_rate": 1.022604835292857e-06, - "loss": 0.6743, - "step": 59463 - }, - { - "epoch": 1.52, - "learning_rate": 1.0225771719007182e-06, - "loss": 0.6904, - "step": 59464 - }, - { - "epoch": 1.52, - "learning_rate": 1.0225495084912933e-06, - "loss": 0.7109, - "step": 59465 - }, - { - "epoch": 1.52, - "learning_rate": 1.0225218450646029e-06, - "loss": 0.792, - "step": 59466 - }, - { - "epoch": 1.52, - "learning_rate": 1.022494181620669e-06, - "loss": 0.5693, - "step": 59467 - }, - { - "epoch": 1.52, - "learning_rate": 1.0224665181595118e-06, - "loss": 0.6084, - "step": 59468 - }, - { - "epoch": 1.52, - "learning_rate": 1.0224388546811535e-06, - "loss": 0.8203, - "step": 59469 - }, - { - "epoch": 1.52, - "learning_rate": 1.0224111911856143e-06, - "loss": 0.6143, - "step": 59470 - }, - { - "epoch": 1.52, - "learning_rate": 1.0223835276729167e-06, - "loss": 0.6846, - "step": 59471 - }, - { - "epoch": 1.52, - "learning_rate": 1.0223558641430803e-06, - "loss": 0.5864, - "step": 59472 - }, - { - "epoch": 1.52, - "learning_rate": 1.0223282005961276e-06, - "loss": 0.4028, - "step": 59473 - }, - { - "epoch": 1.52, - "learning_rate": 1.0223005370320787e-06, - "loss": 0.4946, - "step": 59474 - }, - { - "epoch": 1.52, - "learning_rate": 1.0222728734509556e-06, - "loss": 0.6558, - "step": 59475 - }, - { - "epoch": 1.52, - "learning_rate": 1.0222452098527791e-06, - "loss": 0.4904, - "step": 59476 - }, - { - "epoch": 1.52, - "learning_rate": 1.0222175462375703e-06, - "loss": 0.6416, - "step": 59477 - }, - { - "epoch": 1.52, - "learning_rate": 1.022189882605351e-06, - "loss": 0.7314, - "step": 59478 - }, - { - "epoch": 1.52, - "learning_rate": 1.0221622189561417e-06, - "loss": 0.6631, - "step": 59479 - }, - { - "epoch": 1.52, - "learning_rate": 1.0221345552899635e-06, - "loss": 0.8174, - "step": 59480 - }, - { - "epoch": 1.52, - "learning_rate": 1.0221068916068386e-06, - "loss": 0.4692, - "step": 59481 - }, - { - "epoch": 1.52, - "learning_rate": 1.022079227906787e-06, - "loss": 0.7334, - "step": 59482 - }, - { - "epoch": 1.52, - "learning_rate": 1.0220515641898302e-06, - "loss": 0.6162, - "step": 59483 - }, - { - "epoch": 1.52, - "learning_rate": 1.0220239004559896e-06, - "loss": 0.5435, - "step": 59484 - }, - { - "epoch": 1.52, - "learning_rate": 1.0219962367052862e-06, - "loss": 0.4768, - "step": 59485 - }, - { - "epoch": 1.52, - "learning_rate": 1.0219685729377422e-06, - "loss": 0.6367, - "step": 59486 - }, - { - "epoch": 1.52, - "learning_rate": 1.0219409091533769e-06, - "loss": 0.6924, - "step": 59487 - }, - { - "epoch": 1.52, - "learning_rate": 1.0219132453522128e-06, - "loss": 0.6646, - "step": 59488 - }, - { - "epoch": 1.52, - "learning_rate": 1.0218855815342707e-06, - "loss": 0.6934, - "step": 59489 - }, - { - "epoch": 1.52, - "learning_rate": 1.0218579176995715e-06, - "loss": 0.5806, - "step": 59490 - }, - { - "epoch": 1.52, - "learning_rate": 1.0218302538481373e-06, - "loss": 0.3357, - "step": 59491 - }, - { - "epoch": 1.52, - "learning_rate": 1.0218025899799884e-06, - "loss": 0.7119, - "step": 59492 - }, - { - "epoch": 1.52, - "learning_rate": 1.021774926095146e-06, - "loss": 0.5449, - "step": 59493 - }, - { - "epoch": 1.52, - "learning_rate": 1.021747262193632e-06, - "loss": 0.627, - "step": 59494 - }, - { - "epoch": 1.52, - "learning_rate": 1.0217195982754668e-06, - "loss": 0.6816, - "step": 59495 - }, - { - "epoch": 1.52, - "learning_rate": 1.021691934340672e-06, - "loss": 0.8057, - "step": 59496 - }, - { - "epoch": 1.52, - "learning_rate": 1.021664270389269e-06, - "loss": 0.5205, - "step": 59497 - }, - { - "epoch": 1.52, - "learning_rate": 1.0216366064212783e-06, - "loss": 0.6904, - "step": 59498 - }, - { - "epoch": 1.52, - "learning_rate": 1.0216089424367214e-06, - "loss": 0.751, - "step": 59499 - }, - { - "epoch": 1.53, - "learning_rate": 1.0215812784356195e-06, - "loss": 0.7119, - "step": 59500 - }, - { - "epoch": 1.53, - "learning_rate": 1.0215536144179942e-06, - "loss": 0.7061, - "step": 59501 - }, - { - "epoch": 1.53, - "learning_rate": 1.0215259503838658e-06, - "loss": 0.6826, - "step": 59502 - }, - { - "epoch": 1.53, - "learning_rate": 1.0214982863332562e-06, - "loss": 0.5996, - "step": 59503 - }, - { - "epoch": 1.53, - "learning_rate": 1.0214706222661863e-06, - "loss": 0.6587, - "step": 59504 - }, - { - "epoch": 1.53, - "learning_rate": 1.0214429581826773e-06, - "loss": 0.6758, - "step": 59505 - }, - { - "epoch": 1.53, - "learning_rate": 1.0214152940827505e-06, - "loss": 0.7812, - "step": 59506 - }, - { - "epoch": 1.53, - "learning_rate": 1.0213876299664273e-06, - "loss": 0.4482, - "step": 59507 - }, - { - "epoch": 1.53, - "learning_rate": 1.021359965833728e-06, - "loss": 0.5518, - "step": 59508 - }, - { - "epoch": 1.53, - "learning_rate": 1.0213323016846746e-06, - "loss": 0.4028, - "step": 59509 - }, - { - "epoch": 1.53, - "learning_rate": 1.021304637519288e-06, - "loss": 0.5471, - "step": 59510 - }, - { - "epoch": 1.53, - "learning_rate": 1.0212769733375897e-06, - "loss": 0.6533, - "step": 59511 - }, - { - "epoch": 1.53, - "learning_rate": 1.0212493091396002e-06, - "loss": 0.665, - "step": 59512 - }, - { - "epoch": 1.53, - "learning_rate": 1.0212216449253412e-06, - "loss": 0.6279, - "step": 59513 - }, - { - "epoch": 1.53, - "learning_rate": 1.0211939806948337e-06, - "loss": 0.502, - "step": 59514 - }, - { - "epoch": 1.53, - "learning_rate": 1.0211663164480993e-06, - "loss": 0.5435, - "step": 59515 - }, - { - "epoch": 1.53, - "learning_rate": 1.0211386521851585e-06, - "loss": 0.584, - "step": 59516 - }, - { - "epoch": 1.53, - "learning_rate": 1.021110987906033e-06, - "loss": 0.5996, - "step": 59517 - }, - { - "epoch": 1.53, - "learning_rate": 1.0210833236107434e-06, - "loss": 0.6211, - "step": 59518 - }, - { - "epoch": 1.53, - "learning_rate": 1.0210556592993118e-06, - "loss": 0.5725, - "step": 59519 - }, - { - "epoch": 1.53, - "learning_rate": 1.0210279949717585e-06, - "loss": 0.6899, - "step": 59520 - }, - { - "epoch": 1.53, - "learning_rate": 1.0210003306281052e-06, - "loss": 0.605, - "step": 59521 - }, - { - "epoch": 1.53, - "learning_rate": 1.0209726662683729e-06, - "loss": 0.7393, - "step": 59522 - }, - { - "epoch": 1.53, - "learning_rate": 1.0209450018925825e-06, - "loss": 0.6216, - "step": 59523 - }, - { - "epoch": 1.53, - "learning_rate": 1.0209173375007559e-06, - "loss": 0.6426, - "step": 59524 - }, - { - "epoch": 1.53, - "learning_rate": 1.0208896730929135e-06, - "loss": 0.5181, - "step": 59525 - }, - { - "epoch": 1.53, - "learning_rate": 1.0208620086690771e-06, - "loss": 0.6104, - "step": 59526 - }, - { - "epoch": 1.53, - "learning_rate": 1.0208343442292676e-06, - "loss": 0.7578, - "step": 59527 - }, - { - "epoch": 1.53, - "learning_rate": 1.020806679773506e-06, - "loss": 0.6069, - "step": 59528 - }, - { - "epoch": 1.53, - "learning_rate": 1.0207790153018135e-06, - "loss": 0.7246, - "step": 59529 - }, - { - "epoch": 1.53, - "learning_rate": 1.020751350814212e-06, - "loss": 0.4556, - "step": 59530 - }, - { - "epoch": 1.53, - "learning_rate": 1.020723686310722e-06, - "loss": 0.7207, - "step": 59531 - }, - { - "epoch": 1.53, - "learning_rate": 1.0206960217913648e-06, - "loss": 0.6396, - "step": 59532 - }, - { - "epoch": 1.53, - "learning_rate": 1.0206683572561613e-06, - "loss": 0.8232, - "step": 59533 - }, - { - "epoch": 1.53, - "learning_rate": 1.0206406927051334e-06, - "loss": 0.6265, - "step": 59534 - }, - { - "epoch": 1.53, - "learning_rate": 1.0206130281383017e-06, - "loss": 0.4194, - "step": 59535 - }, - { - "epoch": 1.53, - "learning_rate": 1.0205853635556877e-06, - "loss": 0.6382, - "step": 59536 - }, - { - "epoch": 1.53, - "learning_rate": 1.020557698957312e-06, - "loss": 0.5742, - "step": 59537 - }, - { - "epoch": 1.53, - "learning_rate": 1.0205300343431967e-06, - "loss": 0.7305, - "step": 59538 - }, - { - "epoch": 1.53, - "learning_rate": 1.020502369713362e-06, - "loss": 0.8447, - "step": 59539 - }, - { - "epoch": 1.53, - "learning_rate": 1.0204747050678302e-06, - "loss": 0.5732, - "step": 59540 - }, - { - "epoch": 1.53, - "learning_rate": 1.0204470404066215e-06, - "loss": 0.2485, - "step": 59541 - }, - { - "epoch": 1.53, - "learning_rate": 1.0204193757297575e-06, - "loss": 0.7246, - "step": 59542 - }, - { - "epoch": 1.53, - "learning_rate": 1.0203917110372594e-06, - "loss": 0.4927, - "step": 59543 - }, - { - "epoch": 1.53, - "learning_rate": 1.0203640463291481e-06, - "loss": 0.584, - "step": 59544 - }, - { - "epoch": 1.53, - "learning_rate": 1.0203363816054451e-06, - "loss": 0.6465, - "step": 59545 - }, - { - "epoch": 1.53, - "learning_rate": 1.0203087168661713e-06, - "loss": 0.5508, - "step": 59546 - }, - { - "epoch": 1.53, - "learning_rate": 1.0202810521113483e-06, - "loss": 0.7427, - "step": 59547 - }, - { - "epoch": 1.53, - "learning_rate": 1.0202533873409968e-06, - "loss": 0.5903, - "step": 59548 - }, - { - "epoch": 1.53, - "learning_rate": 1.0202257225551385e-06, - "loss": 0.6836, - "step": 59549 - }, - { - "epoch": 1.53, - "learning_rate": 1.0201980577537941e-06, - "loss": 0.7988, - "step": 59550 - }, - { - "epoch": 1.53, - "learning_rate": 1.020170392936985e-06, - "loss": 0.6416, - "step": 59551 - }, - { - "epoch": 1.53, - "learning_rate": 1.0201427281047324e-06, - "loss": 0.6216, - "step": 59552 - }, - { - "epoch": 1.53, - "learning_rate": 1.0201150632570574e-06, - "loss": 0.6187, - "step": 59553 - }, - { - "epoch": 1.53, - "learning_rate": 1.0200873983939813e-06, - "loss": 0.7246, - "step": 59554 - }, - { - "epoch": 1.53, - "learning_rate": 1.0200597335155251e-06, - "loss": 0.6973, - "step": 59555 - }, - { - "epoch": 1.53, - "learning_rate": 1.0200320686217102e-06, - "loss": 0.5332, - "step": 59556 - }, - { - "epoch": 1.53, - "learning_rate": 1.0200044037125577e-06, - "loss": 0.6069, - "step": 59557 - }, - { - "epoch": 1.53, - "learning_rate": 1.0199767387880884e-06, - "loss": 0.7842, - "step": 59558 - }, - { - "epoch": 1.53, - "learning_rate": 1.0199490738483242e-06, - "loss": 0.7617, - "step": 59559 - }, - { - "epoch": 1.53, - "learning_rate": 1.019921408893286e-06, - "loss": 0.6196, - "step": 59560 - }, - { - "epoch": 1.53, - "learning_rate": 1.0198937439229947e-06, - "loss": 0.3867, - "step": 59561 - }, - { - "epoch": 1.53, - "learning_rate": 1.0198660789374712e-06, - "loss": 0.6204, - "step": 59562 - }, - { - "epoch": 1.53, - "learning_rate": 1.019838413936738e-06, - "loss": 0.6826, - "step": 59563 - }, - { - "epoch": 1.53, - "learning_rate": 1.0198107489208148e-06, - "loss": 0.7256, - "step": 59564 - }, - { - "epoch": 1.53, - "learning_rate": 1.0197830838897237e-06, - "loss": 0.8037, - "step": 59565 - }, - { - "epoch": 1.53, - "learning_rate": 1.0197554188434856e-06, - "loss": 0.7007, - "step": 59566 - }, - { - "epoch": 1.53, - "learning_rate": 1.0197277537821216e-06, - "loss": 0.5283, - "step": 59567 - }, - { - "epoch": 1.53, - "learning_rate": 1.019700088705653e-06, - "loss": 0.791, - "step": 59568 - }, - { - "epoch": 1.53, - "learning_rate": 1.0196724236141008e-06, - "loss": 0.832, - "step": 59569 - }, - { - "epoch": 1.53, - "learning_rate": 1.0196447585074868e-06, - "loss": 0.8604, - "step": 59570 - }, - { - "epoch": 1.53, - "learning_rate": 1.0196170933858311e-06, - "loss": 0.75, - "step": 59571 - }, - { - "epoch": 1.53, - "learning_rate": 1.0195894282491561e-06, - "loss": 0.873, - "step": 59572 - }, - { - "epoch": 1.53, - "learning_rate": 1.0195617630974819e-06, - "loss": 0.7256, - "step": 59573 - }, - { - "epoch": 1.53, - "learning_rate": 1.0195340979308304e-06, - "loss": 0.5046, - "step": 59574 - }, - { - "epoch": 1.53, - "learning_rate": 1.0195064327492226e-06, - "loss": 0.6826, - "step": 59575 - }, - { - "epoch": 1.53, - "learning_rate": 1.0194787675526796e-06, - "loss": 0.4978, - "step": 59576 - }, - { - "epoch": 1.53, - "learning_rate": 1.0194511023412222e-06, - "loss": 0.6875, - "step": 59577 - }, - { - "epoch": 1.53, - "learning_rate": 1.0194234371148724e-06, - "loss": 0.5635, - "step": 59578 - }, - { - "epoch": 1.53, - "learning_rate": 1.0193957718736507e-06, - "loss": 0.7119, - "step": 59579 - }, - { - "epoch": 1.53, - "learning_rate": 1.019368106617579e-06, - "loss": 0.7246, - "step": 59580 - }, - { - "epoch": 1.53, - "learning_rate": 1.0193404413466774e-06, - "loss": 0.6084, - "step": 59581 - }, - { - "epoch": 1.53, - "learning_rate": 1.0193127760609683e-06, - "loss": 0.6738, - "step": 59582 - }, - { - "epoch": 1.53, - "learning_rate": 1.0192851107604718e-06, - "loss": 0.4426, - "step": 59583 - }, - { - "epoch": 1.53, - "learning_rate": 1.01925744544521e-06, - "loss": 0.3772, - "step": 59584 - }, - { - "epoch": 1.53, - "learning_rate": 1.0192297801152036e-06, - "loss": 0.6477, - "step": 59585 - }, - { - "epoch": 1.53, - "learning_rate": 1.0192021147704734e-06, - "loss": 0.4814, - "step": 59586 - }, - { - "epoch": 1.53, - "learning_rate": 1.0191744494110415e-06, - "loss": 0.469, - "step": 59587 - }, - { - "epoch": 1.53, - "learning_rate": 1.0191467840369285e-06, - "loss": 0.7178, - "step": 59588 - }, - { - "epoch": 1.53, - "learning_rate": 1.0191191186481556e-06, - "loss": 0.4893, - "step": 59589 - }, - { - "epoch": 1.53, - "learning_rate": 1.0190914532447442e-06, - "loss": 0.6135, - "step": 59590 - }, - { - "epoch": 1.53, - "learning_rate": 1.0190637878267151e-06, - "loss": 0.7891, - "step": 59591 - }, - { - "epoch": 1.53, - "learning_rate": 1.01903612239409e-06, - "loss": 0.6846, - "step": 59592 - }, - { - "epoch": 1.53, - "learning_rate": 1.0190084569468897e-06, - "loss": 0.665, - "step": 59593 - }, - { - "epoch": 1.53, - "learning_rate": 1.0189807914851354e-06, - "loss": 0.6333, - "step": 59594 - }, - { - "epoch": 1.53, - "learning_rate": 1.0189531260088489e-06, - "loss": 0.5837, - "step": 59595 - }, - { - "epoch": 1.53, - "learning_rate": 1.0189254605180501e-06, - "loss": 0.5918, - "step": 59596 - }, - { - "epoch": 1.53, - "learning_rate": 1.0188977950127614e-06, - "loss": 0.6289, - "step": 59597 - }, - { - "epoch": 1.53, - "learning_rate": 1.0188701294930033e-06, - "loss": 0.6973, - "step": 59598 - }, - { - "epoch": 1.53, - "learning_rate": 1.0188424639587973e-06, - "loss": 0.748, - "step": 59599 - }, - { - "epoch": 1.53, - "learning_rate": 1.0188147984101647e-06, - "loss": 0.71, - "step": 59600 - }, - { - "epoch": 1.53, - "learning_rate": 1.0187871328471265e-06, - "loss": 0.5713, - "step": 59601 - }, - { - "epoch": 1.53, - "learning_rate": 1.0187594672697033e-06, - "loss": 0.6904, - "step": 59602 - }, - { - "epoch": 1.53, - "learning_rate": 1.0187318016779175e-06, - "loss": 0.7158, - "step": 59603 - }, - { - "epoch": 1.53, - "learning_rate": 1.0187041360717889e-06, - "loss": 0.7744, - "step": 59604 - }, - { - "epoch": 1.53, - "learning_rate": 1.01867647045134e-06, - "loss": 0.7803, - "step": 59605 - }, - { - "epoch": 1.53, - "learning_rate": 1.0186488048165913e-06, - "loss": 0.7891, - "step": 59606 - }, - { - "epoch": 1.53, - "learning_rate": 1.018621139167564e-06, - "loss": 0.626, - "step": 59607 - }, - { - "epoch": 1.53, - "learning_rate": 1.0185934735042792e-06, - "loss": 0.7314, - "step": 59608 - }, - { - "epoch": 1.53, - "learning_rate": 1.0185658078267584e-06, - "loss": 0.8184, - "step": 59609 - }, - { - "epoch": 1.53, - "learning_rate": 1.0185381421350227e-06, - "loss": 0.6768, - "step": 59610 - }, - { - "epoch": 1.53, - "learning_rate": 1.0185104764290929e-06, - "loss": 0.668, - "step": 59611 - }, - { - "epoch": 1.53, - "learning_rate": 1.0184828107089907e-06, - "loss": 0.8281, - "step": 59612 - }, - { - "epoch": 1.53, - "learning_rate": 1.018455144974737e-06, - "loss": 0.7988, - "step": 59613 - }, - { - "epoch": 1.53, - "learning_rate": 1.018427479226353e-06, - "loss": 0.6074, - "step": 59614 - }, - { - "epoch": 1.53, - "learning_rate": 1.0183998134638601e-06, - "loss": 0.6897, - "step": 59615 - }, - { - "epoch": 1.53, - "learning_rate": 1.018372147687279e-06, - "loss": 0.6982, - "step": 59616 - }, - { - "epoch": 1.53, - "learning_rate": 1.0183444818966313e-06, - "loss": 0.6006, - "step": 59617 - }, - { - "epoch": 1.53, - "learning_rate": 1.0183168160919385e-06, - "loss": 0.574, - "step": 59618 - }, - { - "epoch": 1.53, - "learning_rate": 1.0182891502732207e-06, - "loss": 0.7051, - "step": 59619 - }, - { - "epoch": 1.53, - "learning_rate": 1.0182614844405004e-06, - "loss": 0.8018, - "step": 59620 - }, - { - "epoch": 1.53, - "learning_rate": 1.0182338185937975e-06, - "loss": 0.7773, - "step": 59621 - }, - { - "epoch": 1.53, - "learning_rate": 1.0182061527331343e-06, - "loss": 0.5901, - "step": 59622 - }, - { - "epoch": 1.53, - "learning_rate": 1.018178486858531e-06, - "loss": 0.2466, - "step": 59623 - }, - { - "epoch": 1.53, - "learning_rate": 1.0181508209700096e-06, - "loss": 0.4519, - "step": 59624 - }, - { - "epoch": 1.53, - "learning_rate": 1.0181231550675908e-06, - "loss": 0.5034, - "step": 59625 - }, - { - "epoch": 1.53, - "learning_rate": 1.0180954891512963e-06, - "loss": 0.7529, - "step": 59626 - }, - { - "epoch": 1.53, - "learning_rate": 1.0180678232211464e-06, - "loss": 0.5933, - "step": 59627 - }, - { - "epoch": 1.53, - "learning_rate": 1.018040157277163e-06, - "loss": 0.6064, - "step": 59628 - }, - { - "epoch": 1.53, - "learning_rate": 1.0180124913193671e-06, - "loss": 0.6836, - "step": 59629 - }, - { - "epoch": 1.53, - "learning_rate": 1.0179848253477798e-06, - "loss": 0.6172, - "step": 59630 - }, - { - "epoch": 1.53, - "learning_rate": 1.0179571593624225e-06, - "loss": 0.4814, - "step": 59631 - }, - { - "epoch": 1.53, - "learning_rate": 1.0179294933633163e-06, - "loss": 0.5737, - "step": 59632 - }, - { - "epoch": 1.53, - "learning_rate": 1.017901827350482e-06, - "loss": 0.5583, - "step": 59633 - }, - { - "epoch": 1.53, - "learning_rate": 1.0178741613239412e-06, - "loss": 0.5767, - "step": 59634 - }, - { - "epoch": 1.53, - "learning_rate": 1.0178464952837152e-06, - "loss": 0.5791, - "step": 59635 - }, - { - "epoch": 1.53, - "learning_rate": 1.0178188292298246e-06, - "loss": 0.5913, - "step": 59636 - }, - { - "epoch": 1.53, - "learning_rate": 1.0177911631622913e-06, - "loss": 0.568, - "step": 59637 - }, - { - "epoch": 1.53, - "learning_rate": 1.0177634970811357e-06, - "loss": 0.7061, - "step": 59638 - }, - { - "epoch": 1.53, - "learning_rate": 1.0177358309863798e-06, - "loss": 0.6616, - "step": 59639 - }, - { - "epoch": 1.53, - "learning_rate": 1.0177081648780443e-06, - "loss": 0.6987, - "step": 59640 - }, - { - "epoch": 1.53, - "learning_rate": 1.0176804987561505e-06, - "loss": 0.6089, - "step": 59641 - }, - { - "epoch": 1.53, - "learning_rate": 1.0176528326207193e-06, - "loss": 0.6577, - "step": 59642 - }, - { - "epoch": 1.53, - "learning_rate": 1.0176251664717724e-06, - "loss": 0.6943, - "step": 59643 - }, - { - "epoch": 1.53, - "learning_rate": 1.0175975003093305e-06, - "loss": 0.5161, - "step": 59644 - }, - { - "epoch": 1.53, - "learning_rate": 1.0175698341334154e-06, - "loss": 0.5854, - "step": 59645 - }, - { - "epoch": 1.53, - "learning_rate": 1.0175421679440474e-06, - "loss": 0.7207, - "step": 59646 - }, - { - "epoch": 1.53, - "learning_rate": 1.0175145017412485e-06, - "loss": 0.6895, - "step": 59647 - }, - { - "epoch": 1.53, - "learning_rate": 1.0174868355250393e-06, - "loss": 0.667, - "step": 59648 - }, - { - "epoch": 1.53, - "learning_rate": 1.0174591692954415e-06, - "loss": 0.5386, - "step": 59649 - }, - { - "epoch": 1.53, - "learning_rate": 1.017431503052476e-06, - "loss": 0.8076, - "step": 59650 - }, - { - "epoch": 1.53, - "learning_rate": 1.0174038367961639e-06, - "loss": 0.6631, - "step": 59651 - }, - { - "epoch": 1.53, - "learning_rate": 1.0173761705265262e-06, - "loss": 0.6372, - "step": 59652 - }, - { - "epoch": 1.53, - "learning_rate": 1.0173485042435848e-06, - "loss": 0.7939, - "step": 59653 - }, - { - "epoch": 1.53, - "learning_rate": 1.01732083794736e-06, - "loss": 0.7422, - "step": 59654 - }, - { - "epoch": 1.53, - "learning_rate": 1.017293171637874e-06, - "loss": 0.5459, - "step": 59655 - }, - { - "epoch": 1.53, - "learning_rate": 1.0172655053151472e-06, - "loss": 0.5664, - "step": 59656 - }, - { - "epoch": 1.53, - "learning_rate": 1.0172378389792006e-06, - "loss": 0.6099, - "step": 59657 - }, - { - "epoch": 1.53, - "learning_rate": 1.0172101726300564e-06, - "loss": 0.6689, - "step": 59658 - }, - { - "epoch": 1.53, - "learning_rate": 1.0171825062677347e-06, - "loss": 0.6982, - "step": 59659 - }, - { - "epoch": 1.53, - "learning_rate": 1.0171548398922577e-06, - "loss": 0.5051, - "step": 59660 - }, - { - "epoch": 1.53, - "learning_rate": 1.0171271735036453e-06, - "loss": 0.8027, - "step": 59661 - }, - { - "epoch": 1.53, - "learning_rate": 1.0170995071019199e-06, - "loss": 0.5928, - "step": 59662 - }, - { - "epoch": 1.53, - "learning_rate": 1.017071840687102e-06, - "loss": 0.6025, - "step": 59663 - }, - { - "epoch": 1.53, - "learning_rate": 1.0170441742592132e-06, - "loss": 0.5801, - "step": 59664 - }, - { - "epoch": 1.53, - "learning_rate": 1.0170165078182743e-06, - "loss": 0.5859, - "step": 59665 - }, - { - "epoch": 1.53, - "learning_rate": 1.0169888413643066e-06, - "loss": 0.7354, - "step": 59666 - }, - { - "epoch": 1.53, - "learning_rate": 1.0169611748973312e-06, - "loss": 0.6982, - "step": 59667 - }, - { - "epoch": 1.53, - "learning_rate": 1.0169335084173695e-06, - "loss": 0.5535, - "step": 59668 - }, - { - "epoch": 1.53, - "learning_rate": 1.0169058419244425e-06, - "loss": 0.6245, - "step": 59669 - }, - { - "epoch": 1.53, - "learning_rate": 1.016878175418572e-06, - "loss": 0.7188, - "step": 59670 - }, - { - "epoch": 1.53, - "learning_rate": 1.016850508899778e-06, - "loss": 0.6426, - "step": 59671 - }, - { - "epoch": 1.53, - "learning_rate": 1.0168228423680828e-06, - "loss": 0.7007, - "step": 59672 - }, - { - "epoch": 1.53, - "learning_rate": 1.0167951758235067e-06, - "loss": 0.6851, - "step": 59673 - }, - { - "epoch": 1.53, - "learning_rate": 1.0167675092660716e-06, - "loss": 0.5918, - "step": 59674 - }, - { - "epoch": 1.53, - "learning_rate": 1.0167398426957984e-06, - "loss": 0.6758, - "step": 59675 - }, - { - "epoch": 1.53, - "learning_rate": 1.0167121761127082e-06, - "loss": 0.7256, - "step": 59676 - }, - { - "epoch": 1.53, - "learning_rate": 1.0166845095168224e-06, - "loss": 0.7734, - "step": 59677 - }, - { - "epoch": 1.53, - "learning_rate": 1.016656842908162e-06, - "loss": 0.582, - "step": 59678 - }, - { - "epoch": 1.53, - "learning_rate": 1.0166291762867479e-06, - "loss": 0.7295, - "step": 59679 - }, - { - "epoch": 1.53, - "learning_rate": 1.016601509652602e-06, - "loss": 0.6436, - "step": 59680 - }, - { - "epoch": 1.53, - "learning_rate": 1.0165738430057448e-06, - "loss": 0.5828, - "step": 59681 - }, - { - "epoch": 1.53, - "learning_rate": 1.0165461763461978e-06, - "loss": 0.7002, - "step": 59682 - }, - { - "epoch": 1.53, - "learning_rate": 1.0165185096739823e-06, - "loss": 0.6626, - "step": 59683 - }, - { - "epoch": 1.53, - "learning_rate": 1.0164908429891193e-06, - "loss": 0.6611, - "step": 59684 - }, - { - "epoch": 1.53, - "learning_rate": 1.0164631762916302e-06, - "loss": 0.5142, - "step": 59685 - }, - { - "epoch": 1.53, - "learning_rate": 1.0164355095815356e-06, - "loss": 0.6558, - "step": 59686 - }, - { - "epoch": 1.53, - "learning_rate": 1.0164078428588573e-06, - "loss": 0.5786, - "step": 59687 - }, - { - "epoch": 1.53, - "learning_rate": 1.0163801761236162e-06, - "loss": 0.8125, - "step": 59688 - }, - { - "epoch": 1.53, - "learning_rate": 1.0163525093758335e-06, - "loss": 0.4976, - "step": 59689 - }, - { - "epoch": 1.53, - "learning_rate": 1.0163248426155308e-06, - "loss": 0.6621, - "step": 59690 - }, - { - "epoch": 1.53, - "learning_rate": 1.0162971758427287e-06, - "loss": 0.6069, - "step": 59691 - }, - { - "epoch": 1.53, - "learning_rate": 1.0162695090574485e-06, - "loss": 0.6006, - "step": 59692 - }, - { - "epoch": 1.53, - "learning_rate": 1.0162418422597116e-06, - "loss": 0.5327, - "step": 59693 - }, - { - "epoch": 1.53, - "learning_rate": 1.0162141754495388e-06, - "loss": 0.5908, - "step": 59694 - }, - { - "epoch": 1.53, - "learning_rate": 1.016186508626952e-06, - "loss": 0.7129, - "step": 59695 - }, - { - "epoch": 1.53, - "learning_rate": 1.0161588417919718e-06, - "loss": 0.7119, - "step": 59696 - }, - { - "epoch": 1.53, - "learning_rate": 1.0161311749446193e-06, - "loss": 0.5703, - "step": 59697 - }, - { - "epoch": 1.53, - "learning_rate": 1.016103508084916e-06, - "loss": 0.7002, - "step": 59698 - }, - { - "epoch": 1.53, - "learning_rate": 1.0160758412128831e-06, - "loss": 0.5029, - "step": 59699 - }, - { - "epoch": 1.53, - "learning_rate": 1.0160481743285416e-06, - "loss": 0.5327, - "step": 59700 - }, - { - "epoch": 1.53, - "learning_rate": 1.0160205074319125e-06, - "loss": 0.6978, - "step": 59701 - }, - { - "epoch": 1.53, - "learning_rate": 1.0159928405230176e-06, - "loss": 0.5752, - "step": 59702 - }, - { - "epoch": 1.53, - "learning_rate": 1.0159651736018775e-06, - "loss": 0.9062, - "step": 59703 - }, - { - "epoch": 1.53, - "learning_rate": 1.0159375066685135e-06, - "loss": 0.7871, - "step": 59704 - }, - { - "epoch": 1.53, - "learning_rate": 1.0159098397229474e-06, - "loss": 0.6123, - "step": 59705 - }, - { - "epoch": 1.53, - "learning_rate": 1.0158821727651996e-06, - "loss": 0.6631, - "step": 59706 - }, - { - "epoch": 1.53, - "learning_rate": 1.0158545057952912e-06, - "loss": 0.583, - "step": 59707 - }, - { - "epoch": 1.53, - "learning_rate": 1.015826838813244e-06, - "loss": 0.7139, - "step": 59708 - }, - { - "epoch": 1.53, - "learning_rate": 1.0157991718190789e-06, - "loss": 0.6738, - "step": 59709 - }, - { - "epoch": 1.53, - "learning_rate": 1.0157715048128175e-06, - "loss": 0.3671, - "step": 59710 - }, - { - "epoch": 1.53, - "learning_rate": 1.01574383779448e-06, - "loss": 0.5496, - "step": 59711 - }, - { - "epoch": 1.53, - "learning_rate": 1.0157161707640884e-06, - "loss": 0.5559, - "step": 59712 - }, - { - "epoch": 1.53, - "learning_rate": 1.0156885037216636e-06, - "loss": 0.6553, - "step": 59713 - }, - { - "epoch": 1.53, - "learning_rate": 1.015660836667227e-06, - "loss": 0.8184, - "step": 59714 - }, - { - "epoch": 1.53, - "learning_rate": 1.0156331696007994e-06, - "loss": 0.6992, - "step": 59715 - }, - { - "epoch": 1.53, - "learning_rate": 1.0156055025224024e-06, - "loss": 0.7246, - "step": 59716 - }, - { - "epoch": 1.53, - "learning_rate": 1.0155778354320567e-06, - "loss": 0.6328, - "step": 59717 - }, - { - "epoch": 1.53, - "learning_rate": 1.015550168329784e-06, - "loss": 0.6309, - "step": 59718 - }, - { - "epoch": 1.53, - "learning_rate": 1.015522501215605e-06, - "loss": 0.7539, - "step": 59719 - }, - { - "epoch": 1.53, - "learning_rate": 1.0154948340895415e-06, - "loss": 0.7178, - "step": 59720 - }, - { - "epoch": 1.53, - "learning_rate": 1.0154671669516142e-06, - "loss": 0.7031, - "step": 59721 - }, - { - "epoch": 1.53, - "learning_rate": 1.0154394998018445e-06, - "loss": 0.6943, - "step": 59722 - }, - { - "epoch": 1.53, - "learning_rate": 1.0154118326402531e-06, - "loss": 0.3767, - "step": 59723 - }, - { - "epoch": 1.53, - "learning_rate": 1.0153841654668618e-06, - "loss": 0.6299, - "step": 59724 - }, - { - "epoch": 1.53, - "learning_rate": 1.0153564982816918e-06, - "loss": 0.6982, - "step": 59725 - }, - { - "epoch": 1.53, - "learning_rate": 1.0153288310847636e-06, - "loss": 0.7754, - "step": 59726 - }, - { - "epoch": 1.53, - "learning_rate": 1.015301163876099e-06, - "loss": 0.9277, - "step": 59727 - }, - { - "epoch": 1.53, - "learning_rate": 1.0152734966557187e-06, - "loss": 0.6104, - "step": 59728 - }, - { - "epoch": 1.53, - "learning_rate": 1.0152458294236447e-06, - "loss": 0.6729, - "step": 59729 - }, - { - "epoch": 1.53, - "learning_rate": 1.0152181621798976e-06, - "loss": 0.4128, - "step": 59730 - }, - { - "epoch": 1.53, - "learning_rate": 1.0151904949244984e-06, - "loss": 0.7397, - "step": 59731 - }, - { - "epoch": 1.53, - "learning_rate": 1.0151628276574686e-06, - "loss": 0.7109, - "step": 59732 - }, - { - "epoch": 1.53, - "learning_rate": 1.0151351603788294e-06, - "loss": 0.8369, - "step": 59733 - }, - { - "epoch": 1.53, - "learning_rate": 1.015107493088602e-06, - "loss": 0.6445, - "step": 59734 - }, - { - "epoch": 1.53, - "learning_rate": 1.0150798257868074e-06, - "loss": 0.5894, - "step": 59735 - }, - { - "epoch": 1.53, - "learning_rate": 1.0150521584734668e-06, - "loss": 0.6914, - "step": 59736 - }, - { - "epoch": 1.53, - "learning_rate": 1.0150244911486014e-06, - "loss": 0.6133, - "step": 59737 - }, - { - "epoch": 1.53, - "learning_rate": 1.0149968238122326e-06, - "loss": 0.562, - "step": 59738 - }, - { - "epoch": 1.53, - "learning_rate": 1.0149691564643813e-06, - "loss": 0.5601, - "step": 59739 - }, - { - "epoch": 1.53, - "learning_rate": 1.014941489105069e-06, - "loss": 0.7881, - "step": 59740 - }, - { - "epoch": 1.53, - "learning_rate": 1.0149138217343164e-06, - "loss": 0.6475, - "step": 59741 - }, - { - "epoch": 1.53, - "learning_rate": 1.0148861543521452e-06, - "loss": 0.5596, - "step": 59742 - }, - { - "epoch": 1.53, - "learning_rate": 1.0148584869585764e-06, - "loss": 0.8262, - "step": 59743 - }, - { - "epoch": 1.53, - "learning_rate": 1.0148308195536308e-06, - "loss": 0.6982, - "step": 59744 - }, - { - "epoch": 1.53, - "learning_rate": 1.01480315213733e-06, - "loss": 0.6211, - "step": 59745 - }, - { - "epoch": 1.53, - "learning_rate": 1.0147754847096955e-06, - "loss": 0.7422, - "step": 59746 - }, - { - "epoch": 1.53, - "learning_rate": 1.0147478172707474e-06, - "loss": 0.5957, - "step": 59747 - }, - { - "epoch": 1.53, - "learning_rate": 1.0147201498205083e-06, - "loss": 0.542, - "step": 59748 - }, - { - "epoch": 1.53, - "learning_rate": 1.0146924823589982e-06, - "loss": 0.8447, - "step": 59749 - }, - { - "epoch": 1.53, - "learning_rate": 1.0146648148862392e-06, - "loss": 0.561, - "step": 59750 - }, - { - "epoch": 1.53, - "learning_rate": 1.0146371474022517e-06, - "loss": 0.5747, - "step": 59751 - }, - { - "epoch": 1.53, - "learning_rate": 1.0146094799070573e-06, - "loss": 0.5459, - "step": 59752 - }, - { - "epoch": 1.53, - "learning_rate": 1.014581812400677e-06, - "loss": 0.7822, - "step": 59753 - }, - { - "epoch": 1.53, - "learning_rate": 1.014554144883132e-06, - "loss": 0.4893, - "step": 59754 - }, - { - "epoch": 1.53, - "learning_rate": 1.0145264773544437e-06, - "loss": 0.7236, - "step": 59755 - }, - { - "epoch": 1.53, - "learning_rate": 1.0144988098146333e-06, - "loss": 0.6313, - "step": 59756 - }, - { - "epoch": 1.53, - "learning_rate": 1.0144711422637213e-06, - "loss": 0.7207, - "step": 59757 - }, - { - "epoch": 1.53, - "learning_rate": 1.0144434747017299e-06, - "loss": 0.6455, - "step": 59758 - }, - { - "epoch": 1.53, - "learning_rate": 1.0144158071286794e-06, - "loss": 0.7314, - "step": 59759 - }, - { - "epoch": 1.53, - "learning_rate": 1.014388139544592e-06, - "loss": 0.7783, - "step": 59760 - }, - { - "epoch": 1.53, - "learning_rate": 1.0143604719494878e-06, - "loss": 0.4931, - "step": 59761 - }, - { - "epoch": 1.53, - "learning_rate": 1.0143328043433886e-06, - "loss": 0.7004, - "step": 59762 - }, - { - "epoch": 1.53, - "learning_rate": 1.014305136726315e-06, - "loss": 0.623, - "step": 59763 - }, - { - "epoch": 1.53, - "learning_rate": 1.0142774690982894e-06, - "loss": 0.79, - "step": 59764 - }, - { - "epoch": 1.53, - "learning_rate": 1.0142498014593317e-06, - "loss": 0.5896, - "step": 59765 - }, - { - "epoch": 1.53, - "learning_rate": 1.0142221338094637e-06, - "loss": 0.6836, - "step": 59766 - }, - { - "epoch": 1.53, - "learning_rate": 1.0141944661487064e-06, - "loss": 0.7207, - "step": 59767 - }, - { - "epoch": 1.53, - "learning_rate": 1.0141667984770812e-06, - "loss": 0.605, - "step": 59768 - }, - { - "epoch": 1.53, - "learning_rate": 1.0141391307946088e-06, - "loss": 0.7715, - "step": 59769 - }, - { - "epoch": 1.53, - "learning_rate": 1.014111463101311e-06, - "loss": 0.5693, - "step": 59770 - }, - { - "epoch": 1.53, - "learning_rate": 1.0140837953972088e-06, - "loss": 0.6846, - "step": 59771 - }, - { - "epoch": 1.53, - "learning_rate": 1.0140561276823229e-06, - "loss": 0.6929, - "step": 59772 - }, - { - "epoch": 1.53, - "learning_rate": 1.0140284599566752e-06, - "loss": 0.6206, - "step": 59773 - }, - { - "epoch": 1.53, - "learning_rate": 1.0140007922202862e-06, - "loss": 0.5635, - "step": 59774 - }, - { - "epoch": 1.53, - "learning_rate": 1.0139731244731779e-06, - "loss": 0.5752, - "step": 59775 - }, - { - "epoch": 1.53, - "learning_rate": 1.0139454567153707e-06, - "loss": 0.7634, - "step": 59776 - }, - { - "epoch": 1.53, - "learning_rate": 1.0139177889468864e-06, - "loss": 0.7559, - "step": 59777 - }, - { - "epoch": 1.53, - "learning_rate": 1.0138901211677456e-06, - "loss": 0.8848, - "step": 59778 - }, - { - "epoch": 1.53, - "learning_rate": 1.0138624533779698e-06, - "loss": 0.7979, - "step": 59779 - }, - { - "epoch": 1.53, - "learning_rate": 1.0138347855775801e-06, - "loss": 0.7012, - "step": 59780 - }, - { - "epoch": 1.53, - "learning_rate": 1.013807117766598e-06, - "loss": 0.8018, - "step": 59781 - }, - { - "epoch": 1.53, - "learning_rate": 1.0137794499450442e-06, - "loss": 0.6499, - "step": 59782 - }, - { - "epoch": 1.53, - "learning_rate": 1.0137517821129403e-06, - "loss": 0.626, - "step": 59783 - }, - { - "epoch": 1.53, - "learning_rate": 1.013724114270307e-06, - "loss": 0.5959, - "step": 59784 - }, - { - "epoch": 1.53, - "learning_rate": 1.0136964464171662e-06, - "loss": 0.7441, - "step": 59785 - }, - { - "epoch": 1.53, - "learning_rate": 1.0136687785535385e-06, - "loss": 0.6196, - "step": 59786 - }, - { - "epoch": 1.53, - "learning_rate": 1.0136411106794451e-06, - "loss": 0.6689, - "step": 59787 - }, - { - "epoch": 1.53, - "learning_rate": 1.0136134427949071e-06, - "loss": 0.6826, - "step": 59788 - }, - { - "epoch": 1.53, - "learning_rate": 1.0135857748999467e-06, - "loss": 0.7354, - "step": 59789 - }, - { - "epoch": 1.53, - "learning_rate": 1.0135581069945837e-06, - "loss": 0.46, - "step": 59790 - }, - { - "epoch": 1.53, - "learning_rate": 1.0135304390788398e-06, - "loss": 0.7354, - "step": 59791 - }, - { - "epoch": 1.53, - "learning_rate": 1.0135027711527367e-06, - "loss": 0.5822, - "step": 59792 - }, - { - "epoch": 1.53, - "learning_rate": 1.0134751032162946e-06, - "loss": 0.6748, - "step": 59793 - }, - { - "epoch": 1.53, - "learning_rate": 1.0134474352695358e-06, - "loss": 0.5498, - "step": 59794 - }, - { - "epoch": 1.53, - "learning_rate": 1.0134197673124805e-06, - "loss": 0.4709, - "step": 59795 - }, - { - "epoch": 1.53, - "learning_rate": 1.0133920993451506e-06, - "loss": 0.5996, - "step": 59796 - }, - { - "epoch": 1.53, - "learning_rate": 1.0133644313675667e-06, - "loss": 0.7041, - "step": 59797 - }, - { - "epoch": 1.53, - "learning_rate": 1.0133367633797504e-06, - "loss": 0.6528, - "step": 59798 - }, - { - "epoch": 1.53, - "learning_rate": 1.0133090953817228e-06, - "loss": 0.6738, - "step": 59799 - }, - { - "epoch": 1.53, - "learning_rate": 1.013281427373505e-06, - "loss": 0.5791, - "step": 59800 - }, - { - "epoch": 1.53, - "learning_rate": 1.0132537593551183e-06, - "loss": 0.6064, - "step": 59801 - }, - { - "epoch": 1.53, - "learning_rate": 1.0132260913265837e-06, - "loss": 0.7129, - "step": 59802 - }, - { - "epoch": 1.53, - "learning_rate": 1.0131984232879226e-06, - "loss": 0.6121, - "step": 59803 - }, - { - "epoch": 1.53, - "learning_rate": 1.013170755239156e-06, - "loss": 0.4087, - "step": 59804 - }, - { - "epoch": 1.53, - "learning_rate": 1.0131430871803052e-06, - "loss": 0.4971, - "step": 59805 - }, - { - "epoch": 1.53, - "learning_rate": 1.0131154191113914e-06, - "loss": 0.6846, - "step": 59806 - }, - { - "epoch": 1.53, - "learning_rate": 1.0130877510324355e-06, - "loss": 0.7686, - "step": 59807 - }, - { - "epoch": 1.53, - "learning_rate": 1.013060082943459e-06, - "loss": 0.6592, - "step": 59808 - }, - { - "epoch": 1.53, - "learning_rate": 1.0130324148444829e-06, - "loss": 0.5713, - "step": 59809 - }, - { - "epoch": 1.53, - "learning_rate": 1.0130047467355286e-06, - "loss": 0.7764, - "step": 59810 - }, - { - "epoch": 1.53, - "learning_rate": 1.0129770786166173e-06, - "loss": 0.542, - "step": 59811 - }, - { - "epoch": 1.53, - "learning_rate": 1.01294941048777e-06, - "loss": 0.5562, - "step": 59812 - }, - { - "epoch": 1.53, - "learning_rate": 1.0129217423490078e-06, - "loss": 0.4797, - "step": 59813 - }, - { - "epoch": 1.53, - "learning_rate": 1.012894074200352e-06, - "loss": 0.8652, - "step": 59814 - }, - { - "epoch": 1.53, - "learning_rate": 1.012866406041824e-06, - "loss": 0.6631, - "step": 59815 - }, - { - "epoch": 1.53, - "learning_rate": 1.0128387378734444e-06, - "loss": 0.7598, - "step": 59816 - }, - { - "epoch": 1.53, - "learning_rate": 1.0128110696952352e-06, - "loss": 0.585, - "step": 59817 - }, - { - "epoch": 1.53, - "learning_rate": 1.0127834015072168e-06, - "loss": 0.5522, - "step": 59818 - }, - { - "epoch": 1.53, - "learning_rate": 1.012755733309411e-06, - "loss": 0.4041, - "step": 59819 - }, - { - "epoch": 1.53, - "learning_rate": 1.0127280651018387e-06, - "loss": 0.5005, - "step": 59820 - }, - { - "epoch": 1.53, - "learning_rate": 1.0127003968845212e-06, - "loss": 0.5854, - "step": 59821 - }, - { - "epoch": 1.53, - "learning_rate": 1.0126727286574793e-06, - "loss": 0.6631, - "step": 59822 - }, - { - "epoch": 1.53, - "learning_rate": 1.0126450604207346e-06, - "loss": 0.7656, - "step": 59823 - }, - { - "epoch": 1.53, - "learning_rate": 1.012617392174308e-06, - "loss": 0.4229, - "step": 59824 - }, - { - "epoch": 1.53, - "learning_rate": 1.0125897239182213e-06, - "loss": 0.6963, - "step": 59825 - }, - { - "epoch": 1.53, - "learning_rate": 1.0125620556524948e-06, - "loss": 0.8701, - "step": 59826 - }, - { - "epoch": 1.53, - "learning_rate": 1.01253438737715e-06, - "loss": 0.4637, - "step": 59827 - }, - { - "epoch": 1.53, - "learning_rate": 1.0125067190922086e-06, - "loss": 0.7129, - "step": 59828 - }, - { - "epoch": 1.53, - "learning_rate": 1.0124790507976912e-06, - "loss": 0.8867, - "step": 59829 - }, - { - "epoch": 1.53, - "learning_rate": 1.0124513824936193e-06, - "loss": 0.5278, - "step": 59830 - }, - { - "epoch": 1.53, - "learning_rate": 1.0124237141800139e-06, - "loss": 0.7588, - "step": 59831 - }, - { - "epoch": 1.53, - "learning_rate": 1.012396045856896e-06, - "loss": 0.5566, - "step": 59832 - }, - { - "epoch": 1.53, - "learning_rate": 1.0123683775242873e-06, - "loss": 0.6914, - "step": 59833 - }, - { - "epoch": 1.53, - "learning_rate": 1.0123407091822084e-06, - "loss": 0.6187, - "step": 59834 - }, - { - "epoch": 1.53, - "learning_rate": 1.012313040830681e-06, - "loss": 0.71, - "step": 59835 - }, - { - "epoch": 1.53, - "learning_rate": 1.0122853724697263e-06, - "loss": 0.5798, - "step": 59836 - }, - { - "epoch": 1.53, - "learning_rate": 1.0122577040993647e-06, - "loss": 0.4875, - "step": 59837 - }, - { - "epoch": 1.53, - "learning_rate": 1.0122300357196183e-06, - "loss": 0.8237, - "step": 59838 - }, - { - "epoch": 1.53, - "learning_rate": 1.012202367330508e-06, - "loss": 0.707, - "step": 59839 - }, - { - "epoch": 1.53, - "learning_rate": 1.0121746989320547e-06, - "loss": 0.6797, - "step": 59840 - }, - { - "epoch": 1.53, - "learning_rate": 1.0121470305242799e-06, - "loss": 0.5013, - "step": 59841 - }, - { - "epoch": 1.53, - "learning_rate": 1.0121193621072047e-06, - "loss": 0.574, - "step": 59842 - }, - { - "epoch": 1.53, - "learning_rate": 1.0120916936808498e-06, - "loss": 0.8086, - "step": 59843 - }, - { - "epoch": 1.53, - "learning_rate": 1.0120640252452377e-06, - "loss": 0.7354, - "step": 59844 - }, - { - "epoch": 1.53, - "learning_rate": 1.0120363568003883e-06, - "loss": 0.5576, - "step": 59845 - }, - { - "epoch": 1.53, - "learning_rate": 1.012008688346323e-06, - "loss": 0.5605, - "step": 59846 - }, - { - "epoch": 1.53, - "learning_rate": 1.0119810198830635e-06, - "loss": 0.7563, - "step": 59847 - }, - { - "epoch": 1.53, - "learning_rate": 1.0119533514106304e-06, - "loss": 0.6318, - "step": 59848 - }, - { - "epoch": 1.53, - "learning_rate": 1.0119256829290454e-06, - "loss": 0.5859, - "step": 59849 - }, - { - "epoch": 1.53, - "learning_rate": 1.0118980144383296e-06, - "loss": 0.6094, - "step": 59850 - }, - { - "epoch": 1.53, - "learning_rate": 1.0118703459385037e-06, - "loss": 0.6797, - "step": 59851 - }, - { - "epoch": 1.53, - "learning_rate": 1.0118426774295894e-06, - "loss": 0.5565, - "step": 59852 - }, - { - "epoch": 1.53, - "learning_rate": 1.0118150089116076e-06, - "loss": 0.5762, - "step": 59853 - }, - { - "epoch": 1.53, - "learning_rate": 1.0117873403845797e-06, - "loss": 0.6685, - "step": 59854 - }, - { - "epoch": 1.53, - "learning_rate": 1.0117596718485268e-06, - "loss": 0.71, - "step": 59855 - }, - { - "epoch": 1.53, - "learning_rate": 1.0117320033034698e-06, - "loss": 0.793, - "step": 59856 - }, - { - "epoch": 1.53, - "learning_rate": 1.0117043347494304e-06, - "loss": 0.6787, - "step": 59857 - }, - { - "epoch": 1.53, - "learning_rate": 1.0116766661864295e-06, - "loss": 0.7119, - "step": 59858 - }, - { - "epoch": 1.53, - "learning_rate": 1.0116489976144885e-06, - "loss": 0.5421, - "step": 59859 - }, - { - "epoch": 1.53, - "learning_rate": 1.011621329033628e-06, - "loss": 0.7754, - "step": 59860 - }, - { - "epoch": 1.53, - "learning_rate": 1.0115936604438697e-06, - "loss": 0.627, - "step": 59861 - }, - { - "epoch": 1.53, - "learning_rate": 1.0115659918452347e-06, - "loss": 0.6797, - "step": 59862 - }, - { - "epoch": 1.53, - "learning_rate": 1.0115383232377441e-06, - "loss": 0.6924, - "step": 59863 - }, - { - "epoch": 1.53, - "learning_rate": 1.0115106546214194e-06, - "loss": 0.7217, - "step": 59864 - }, - { - "epoch": 1.53, - "learning_rate": 1.0114829859962814e-06, - "loss": 0.4402, - "step": 59865 - }, - { - "epoch": 1.53, - "learning_rate": 1.0114553173623512e-06, - "loss": 0.5667, - "step": 59866 - }, - { - "epoch": 1.53, - "learning_rate": 1.0114276487196505e-06, - "loss": 0.3584, - "step": 59867 - }, - { - "epoch": 1.53, - "learning_rate": 1.0113999800681998e-06, - "loss": 0.554, - "step": 59868 - }, - { - "epoch": 1.53, - "learning_rate": 1.011372311408021e-06, - "loss": 0.7383, - "step": 59869 - }, - { - "epoch": 1.53, - "learning_rate": 1.0113446427391348e-06, - "loss": 0.8745, - "step": 59870 - }, - { - "epoch": 1.53, - "learning_rate": 1.0113169740615625e-06, - "loss": 0.5791, - "step": 59871 - }, - { - "epoch": 1.53, - "learning_rate": 1.0112893053753254e-06, - "loss": 0.748, - "step": 59872 - }, - { - "epoch": 1.53, - "learning_rate": 1.0112616366804446e-06, - "loss": 0.6719, - "step": 59873 - }, - { - "epoch": 1.53, - "learning_rate": 1.0112339679769414e-06, - "loss": 0.8779, - "step": 59874 - }, - { - "epoch": 1.53, - "learning_rate": 1.0112062992648365e-06, - "loss": 0.6069, - "step": 59875 - }, - { - "epoch": 1.53, - "learning_rate": 1.0111786305441517e-06, - "loss": 0.5693, - "step": 59876 - }, - { - "epoch": 1.53, - "learning_rate": 1.0111509618149078e-06, - "loss": 0.7559, - "step": 59877 - }, - { - "epoch": 1.53, - "learning_rate": 1.011123293077126e-06, - "loss": 0.6758, - "step": 59878 - }, - { - "epoch": 1.53, - "learning_rate": 1.011095624330828e-06, - "loss": 0.5947, - "step": 59879 - }, - { - "epoch": 1.53, - "learning_rate": 1.0110679555760343e-06, - "loss": 0.5295, - "step": 59880 - }, - { - "epoch": 1.53, - "learning_rate": 1.0110402868127666e-06, - "loss": 0.6553, - "step": 59881 - }, - { - "epoch": 1.53, - "learning_rate": 1.0110126180410457e-06, - "loss": 0.6274, - "step": 59882 - }, - { - "epoch": 1.53, - "learning_rate": 1.0109849492608928e-06, - "loss": 0.7808, - "step": 59883 - }, - { - "epoch": 1.53, - "learning_rate": 1.0109572804723297e-06, - "loss": 0.5605, - "step": 59884 - }, - { - "epoch": 1.53, - "learning_rate": 1.0109296116753767e-06, - "loss": 0.7705, - "step": 59885 - }, - { - "epoch": 1.53, - "learning_rate": 1.0109019428700555e-06, - "loss": 0.5918, - "step": 59886 - }, - { - "epoch": 1.53, - "learning_rate": 1.0108742740563872e-06, - "loss": 0.498, - "step": 59887 - }, - { - "epoch": 1.53, - "learning_rate": 1.0108466052343932e-06, - "loss": 0.6582, - "step": 59888 - }, - { - "epoch": 1.53, - "learning_rate": 1.0108189364040942e-06, - "loss": 0.7773, - "step": 59889 - }, - { - "epoch": 1.54, - "learning_rate": 1.0107912675655117e-06, - "loss": 0.7637, - "step": 59890 - }, - { - "epoch": 1.54, - "learning_rate": 1.0107635987186666e-06, - "loss": 0.6602, - "step": 59891 - }, - { - "epoch": 1.54, - "learning_rate": 1.0107359298635807e-06, - "loss": 0.6445, - "step": 59892 - }, - { - "epoch": 1.54, - "learning_rate": 1.0107082610002744e-06, - "loss": 0.7793, - "step": 59893 - }, - { - "epoch": 1.54, - "learning_rate": 1.0106805921287698e-06, - "loss": 0.5635, - "step": 59894 - }, - { - "epoch": 1.54, - "learning_rate": 1.0106529232490871e-06, - "loss": 0.7744, - "step": 59895 - }, - { - "epoch": 1.54, - "learning_rate": 1.0106252543612482e-06, - "loss": 0.6045, - "step": 59896 - }, - { - "epoch": 1.54, - "learning_rate": 1.0105975854652736e-06, - "loss": 0.6572, - "step": 59897 - }, - { - "epoch": 1.54, - "learning_rate": 1.0105699165611854e-06, - "loss": 0.6309, - "step": 59898 - }, - { - "epoch": 1.54, - "learning_rate": 1.0105422476490042e-06, - "loss": 0.8232, - "step": 59899 - }, - { - "epoch": 1.54, - "learning_rate": 1.010514578728751e-06, - "loss": 0.7803, - "step": 59900 - }, - { - "epoch": 1.54, - "learning_rate": 1.0104869098004476e-06, - "loss": 0.9287, - "step": 59901 - }, - { - "epoch": 1.54, - "learning_rate": 1.010459240864115e-06, - "loss": 0.6147, - "step": 59902 - }, - { - "epoch": 1.54, - "learning_rate": 1.0104315719197736e-06, - "loss": 0.668, - "step": 59903 - }, - { - "epoch": 1.54, - "learning_rate": 1.0104039029674455e-06, - "loss": 0.6719, - "step": 59904 - }, - { - "epoch": 1.54, - "learning_rate": 1.010376234007152e-06, - "loss": 0.5923, - "step": 59905 - }, - { - "epoch": 1.54, - "learning_rate": 1.0103485650389135e-06, - "loss": 0.6104, - "step": 59906 - }, - { - "epoch": 1.54, - "learning_rate": 1.0103208960627517e-06, - "loss": 0.4648, - "step": 59907 - }, - { - "epoch": 1.54, - "learning_rate": 1.0102932270786874e-06, - "loss": 0.5532, - "step": 59908 - }, - { - "epoch": 1.54, - "learning_rate": 1.0102655580867428e-06, - "loss": 0.792, - "step": 59909 - }, - { - "epoch": 1.54, - "learning_rate": 1.0102378890869375e-06, - "loss": 0.6943, - "step": 59910 - }, - { - "epoch": 1.54, - "learning_rate": 1.0102102200792938e-06, - "loss": 0.7305, - "step": 59911 - }, - { - "epoch": 1.54, - "learning_rate": 1.0101825510638326e-06, - "loss": 0.3728, - "step": 59912 - }, - { - "epoch": 1.54, - "learning_rate": 1.0101548820405753e-06, - "loss": 0.4618, - "step": 59913 - }, - { - "epoch": 1.54, - "learning_rate": 1.0101272130095429e-06, - "loss": 0.7852, - "step": 59914 - }, - { - "epoch": 1.54, - "learning_rate": 1.0100995439707565e-06, - "loss": 0.6309, - "step": 59915 - }, - { - "epoch": 1.54, - "learning_rate": 1.010071874924237e-06, - "loss": 0.5938, - "step": 59916 - }, - { - "epoch": 1.54, - "learning_rate": 1.0100442058700062e-06, - "loss": 0.6631, - "step": 59917 - }, - { - "epoch": 1.54, - "learning_rate": 1.0100165368080848e-06, - "loss": 0.502, - "step": 59918 - }, - { - "epoch": 1.54, - "learning_rate": 1.0099888677384944e-06, - "loss": 0.8232, - "step": 59919 - }, - { - "epoch": 1.54, - "learning_rate": 1.0099611986612559e-06, - "loss": 0.6885, - "step": 59920 - }, - { - "epoch": 1.54, - "learning_rate": 1.009933529576391e-06, - "loss": 0.4452, - "step": 59921 - }, - { - "epoch": 1.54, - "learning_rate": 1.0099058604839196e-06, - "loss": 0.5957, - "step": 59922 - }, - { - "epoch": 1.54, - "learning_rate": 1.0098781913838646e-06, - "loss": 0.7383, - "step": 59923 - }, - { - "epoch": 1.54, - "learning_rate": 1.009850522276246e-06, - "loss": 0.3878, - "step": 59924 - }, - { - "epoch": 1.54, - "learning_rate": 1.0098228531610848e-06, - "loss": 0.7441, - "step": 59925 - }, - { - "epoch": 1.54, - "learning_rate": 1.0097951840384034e-06, - "loss": 0.5552, - "step": 59926 - }, - { - "epoch": 1.54, - "learning_rate": 1.009767514908222e-06, - "loss": 0.79, - "step": 59927 - }, - { - "epoch": 1.54, - "learning_rate": 1.009739845770562e-06, - "loss": 0.7598, - "step": 59928 - }, - { - "epoch": 1.54, - "learning_rate": 1.0097121766254449e-06, - "loss": 0.6198, - "step": 59929 - }, - { - "epoch": 1.54, - "learning_rate": 1.0096845074728912e-06, - "loss": 0.7686, - "step": 59930 - }, - { - "epoch": 1.54, - "learning_rate": 1.0096568383129227e-06, - "loss": 0.6787, - "step": 59931 - }, - { - "epoch": 1.54, - "learning_rate": 1.0096291691455606e-06, - "loss": 0.5408, - "step": 59932 - }, - { - "epoch": 1.54, - "learning_rate": 1.0096014999708256e-06, - "loss": 0.6348, - "step": 59933 - }, - { - "epoch": 1.54, - "learning_rate": 1.0095738307887397e-06, - "loss": 0.6758, - "step": 59934 - }, - { - "epoch": 1.54, - "learning_rate": 1.0095461615993231e-06, - "loss": 0.6484, - "step": 59935 - }, - { - "epoch": 1.54, - "learning_rate": 1.0095184924025975e-06, - "loss": 0.7979, - "step": 59936 - }, - { - "epoch": 1.54, - "learning_rate": 1.009490823198584e-06, - "loss": 0.5439, - "step": 59937 - }, - { - "epoch": 1.54, - "learning_rate": 1.009463153987304e-06, - "loss": 0.5127, - "step": 59938 - }, - { - "epoch": 1.54, - "learning_rate": 1.0094354847687783e-06, - "loss": 0.5957, - "step": 59939 - }, - { - "epoch": 1.54, - "learning_rate": 1.0094078155430285e-06, - "loss": 0.6279, - "step": 59940 - }, - { - "epoch": 1.54, - "learning_rate": 1.0093801463100753e-06, - "loss": 0.751, - "step": 59941 - }, - { - "epoch": 1.54, - "learning_rate": 1.0093524770699403e-06, - "loss": 0.6191, - "step": 59942 - }, - { - "epoch": 1.54, - "learning_rate": 1.0093248078226444e-06, - "loss": 0.6719, - "step": 59943 - }, - { - "epoch": 1.54, - "learning_rate": 1.009297138568209e-06, - "loss": 0.6973, - "step": 59944 - }, - { - "epoch": 1.54, - "learning_rate": 1.0092694693066555e-06, - "loss": 0.6719, - "step": 59945 - }, - { - "epoch": 1.54, - "learning_rate": 1.0092418000380043e-06, - "loss": 0.5933, - "step": 59946 - }, - { - "epoch": 1.54, - "learning_rate": 1.0092141307622774e-06, - "loss": 0.7427, - "step": 59947 - }, - { - "epoch": 1.54, - "learning_rate": 1.0091864614794955e-06, - "loss": 0.7363, - "step": 59948 - }, - { - "epoch": 1.54, - "learning_rate": 1.0091587921896804e-06, - "loss": 0.6807, - "step": 59949 - }, - { - "epoch": 1.54, - "learning_rate": 1.0091311228928522e-06, - "loss": 0.6475, - "step": 59950 - }, - { - "epoch": 1.54, - "learning_rate": 1.009103453589033e-06, - "loss": 0.6187, - "step": 59951 - }, - { - "epoch": 1.54, - "learning_rate": 1.0090757842782436e-06, - "loss": 0.5903, - "step": 59952 - }, - { - "epoch": 1.54, - "learning_rate": 1.0090481149605055e-06, - "loss": 0.4103, - "step": 59953 - }, - { - "epoch": 1.54, - "learning_rate": 1.0090204456358396e-06, - "loss": 0.5996, - "step": 59954 - }, - { - "epoch": 1.54, - "learning_rate": 1.0089927763042672e-06, - "loss": 0.7881, - "step": 59955 - }, - { - "epoch": 1.54, - "learning_rate": 1.0089651069658093e-06, - "loss": 0.748, - "step": 59956 - }, - { - "epoch": 1.54, - "learning_rate": 1.0089374376204872e-06, - "loss": 0.5623, - "step": 59957 - }, - { - "epoch": 1.54, - "learning_rate": 1.008909768268322e-06, - "loss": 0.6899, - "step": 59958 - }, - { - "epoch": 1.54, - "learning_rate": 1.0088820989093357e-06, - "loss": 0.8389, - "step": 59959 - }, - { - "epoch": 1.54, - "learning_rate": 1.008854429543548e-06, - "loss": 0.5933, - "step": 59960 - }, - { - "epoch": 1.54, - "learning_rate": 1.0088267601709813e-06, - "loss": 0.6293, - "step": 59961 - }, - { - "epoch": 1.54, - "learning_rate": 1.008799090791656e-06, - "loss": 0.7607, - "step": 59962 - }, - { - "epoch": 1.54, - "learning_rate": 1.008771421405594e-06, - "loss": 0.5068, - "step": 59963 - }, - { - "epoch": 1.54, - "learning_rate": 1.008743752012816e-06, - "loss": 0.6787, - "step": 59964 - }, - { - "epoch": 1.54, - "learning_rate": 1.0087160826133434e-06, - "loss": 0.5649, - "step": 59965 - }, - { - "epoch": 1.54, - "learning_rate": 1.0086884132071972e-06, - "loss": 0.6338, - "step": 59966 - }, - { - "epoch": 1.54, - "learning_rate": 1.0086607437943985e-06, - "loss": 0.7261, - "step": 59967 - }, - { - "epoch": 1.54, - "learning_rate": 1.0086330743749687e-06, - "loss": 0.5742, - "step": 59968 - }, - { - "epoch": 1.54, - "learning_rate": 1.0086054049489292e-06, - "loss": 0.6279, - "step": 59969 - }, - { - "epoch": 1.54, - "learning_rate": 1.008577735516301e-06, - "loss": 0.5205, - "step": 59970 - }, - { - "epoch": 1.54, - "learning_rate": 1.0085500660771049e-06, - "loss": 0.5962, - "step": 59971 - }, - { - "epoch": 1.54, - "learning_rate": 1.0085223966313626e-06, - "loss": 0.7822, - "step": 59972 - }, - { - "epoch": 1.54, - "learning_rate": 1.008494727179095e-06, - "loss": 0.8594, - "step": 59973 - }, - { - "epoch": 1.54, - "learning_rate": 1.0084670577203236e-06, - "loss": 0.7695, - "step": 59974 - }, - { - "epoch": 1.54, - "learning_rate": 1.008439388255069e-06, - "loss": 0.6782, - "step": 59975 - }, - { - "epoch": 1.54, - "learning_rate": 1.008411718783353e-06, - "loss": 0.5991, - "step": 59976 - }, - { - "epoch": 1.54, - "learning_rate": 1.0083840493051964e-06, - "loss": 0.6533, - "step": 59977 - }, - { - "epoch": 1.54, - "learning_rate": 1.0083563798206206e-06, - "loss": 0.6826, - "step": 59978 - }, - { - "epoch": 1.54, - "learning_rate": 1.0083287103296467e-06, - "loss": 0.7334, - "step": 59979 - }, - { - "epoch": 1.54, - "learning_rate": 1.008301040832296e-06, - "loss": 0.6279, - "step": 59980 - }, - { - "epoch": 1.54, - "learning_rate": 1.0082733713285893e-06, - "loss": 0.6904, - "step": 59981 - }, - { - "epoch": 1.54, - "learning_rate": 1.0082457018185483e-06, - "loss": 0.5288, - "step": 59982 - }, - { - "epoch": 1.54, - "learning_rate": 1.0082180323021937e-06, - "loss": 0.5874, - "step": 59983 - }, - { - "epoch": 1.54, - "learning_rate": 1.0081903627795474e-06, - "loss": 0.6235, - "step": 59984 - }, - { - "epoch": 1.54, - "learning_rate": 1.0081626932506297e-06, - "loss": 0.5815, - "step": 59985 - }, - { - "epoch": 1.54, - "learning_rate": 1.0081350237154625e-06, - "loss": 0.7266, - "step": 59986 - }, - { - "epoch": 1.54, - "learning_rate": 1.0081073541740663e-06, - "loss": 0.5562, - "step": 59987 - }, - { - "epoch": 1.54, - "learning_rate": 1.008079684626463e-06, - "loss": 0.6802, - "step": 59988 - }, - { - "epoch": 1.54, - "learning_rate": 1.0080520150726731e-06, - "loss": 0.6147, - "step": 59989 - }, - { - "epoch": 1.54, - "learning_rate": 1.0080243455127184e-06, - "loss": 0.6729, - "step": 59990 - }, - { - "epoch": 1.54, - "learning_rate": 1.00799667594662e-06, - "loss": 0.625, - "step": 59991 - }, - { - "epoch": 1.54, - "learning_rate": 1.0079690063743984e-06, - "loss": 0.5186, - "step": 59992 - }, - { - "epoch": 1.54, - "learning_rate": 1.0079413367960756e-06, - "loss": 0.5469, - "step": 59993 - }, - { - "epoch": 1.54, - "learning_rate": 1.0079136672116725e-06, - "loss": 0.5332, - "step": 59994 - }, - { - "epoch": 1.54, - "learning_rate": 1.0078859976212106e-06, - "loss": 0.6523, - "step": 59995 - }, - { - "epoch": 1.54, - "learning_rate": 1.0078583280247102e-06, - "loss": 0.5415, - "step": 59996 - }, - { - "epoch": 1.54, - "learning_rate": 1.0078306584221934e-06, - "loss": 0.4824, - "step": 59997 - }, - { - "epoch": 1.54, - "learning_rate": 1.0078029888136808e-06, - "loss": 0.7109, - "step": 59998 - }, - { - "epoch": 1.54, - "learning_rate": 1.007775319199194e-06, - "loss": 0.6172, - "step": 59999 - }, - { - "epoch": 1.54, - "learning_rate": 1.0077476495787537e-06, - "loss": 0.7861, - "step": 60000 - }, - { - "epoch": 1.54, - "learning_rate": 1.0077199799523817e-06, - "loss": 0.6147, - "step": 60001 - }, - { - "epoch": 1.54, - "learning_rate": 1.0076923103200988e-06, - "loss": 0.6504, - "step": 60002 - }, - { - "epoch": 1.54, - "learning_rate": 1.007664640681926e-06, - "loss": 0.6758, - "step": 60003 - }, - { - "epoch": 1.54, - "learning_rate": 1.007636971037885e-06, - "loss": 0.646, - "step": 60004 - }, - { - "epoch": 1.54, - "learning_rate": 1.0076093013879966e-06, - "loss": 0.5085, - "step": 60005 - }, - { - "epoch": 1.54, - "learning_rate": 1.0075816317322823e-06, - "loss": 0.6406, - "step": 60006 - }, - { - "epoch": 1.54, - "learning_rate": 1.007553962070763e-06, - "loss": 0.5791, - "step": 60007 - }, - { - "epoch": 1.54, - "learning_rate": 1.0075262924034598e-06, - "loss": 0.5474, - "step": 60008 - }, - { - "epoch": 1.54, - "learning_rate": 1.0074986227303941e-06, - "loss": 0.5283, - "step": 60009 - }, - { - "epoch": 1.54, - "learning_rate": 1.0074709530515873e-06, - "loss": 0.5752, - "step": 60010 - }, - { - "epoch": 1.54, - "learning_rate": 1.0074432833670603e-06, - "loss": 0.7285, - "step": 60011 - }, - { - "epoch": 1.54, - "learning_rate": 1.0074156136768338e-06, - "loss": 0.6914, - "step": 60012 - }, - { - "epoch": 1.54, - "learning_rate": 1.00738794398093e-06, - "loss": 0.7441, - "step": 60013 - }, - { - "epoch": 1.54, - "learning_rate": 1.0073602742793697e-06, - "loss": 0.6746, - "step": 60014 - }, - { - "epoch": 1.54, - "learning_rate": 1.0073326045721735e-06, - "loss": 0.5845, - "step": 60015 - }, - { - "epoch": 1.54, - "learning_rate": 1.0073049348593634e-06, - "loss": 0.5962, - "step": 60016 - }, - { - "epoch": 1.54, - "learning_rate": 1.0072772651409601e-06, - "loss": 0.6367, - "step": 60017 - }, - { - "epoch": 1.54, - "learning_rate": 1.007249595416985e-06, - "loss": 0.4041, - "step": 60018 - }, - { - "epoch": 1.54, - "learning_rate": 1.0072219256874594e-06, - "loss": 0.6875, - "step": 60019 - }, - { - "epoch": 1.54, - "learning_rate": 1.0071942559524044e-06, - "loss": 0.5161, - "step": 60020 - }, - { - "epoch": 1.54, - "learning_rate": 1.0071665862118406e-06, - "loss": 0.7578, - "step": 60021 - }, - { - "epoch": 1.54, - "learning_rate": 1.0071389164657898e-06, - "loss": 0.6685, - "step": 60022 - }, - { - "epoch": 1.54, - "learning_rate": 1.007111246714273e-06, - "loss": 0.7705, - "step": 60023 - }, - { - "epoch": 1.54, - "learning_rate": 1.0070835769573118e-06, - "loss": 0.5806, - "step": 60024 - }, - { - "epoch": 1.54, - "learning_rate": 1.0070559071949267e-06, - "loss": 0.5693, - "step": 60025 - }, - { - "epoch": 1.54, - "learning_rate": 1.0070282374271395e-06, - "loss": 0.6201, - "step": 60026 - }, - { - "epoch": 1.54, - "learning_rate": 1.0070005676539707e-06, - "loss": 0.8076, - "step": 60027 - }, - { - "epoch": 1.54, - "learning_rate": 1.0069728978754423e-06, - "loss": 0.5425, - "step": 60028 - }, - { - "epoch": 1.54, - "learning_rate": 1.006945228091575e-06, - "loss": 0.7354, - "step": 60029 - }, - { - "epoch": 1.54, - "learning_rate": 1.0069175583023901e-06, - "loss": 0.6104, - "step": 60030 - }, - { - "epoch": 1.54, - "learning_rate": 1.0068898885079085e-06, - "loss": 0.5293, - "step": 60031 - }, - { - "epoch": 1.54, - "learning_rate": 1.0068622187081517e-06, - "loss": 0.5615, - "step": 60032 - }, - { - "epoch": 1.54, - "learning_rate": 1.0068345489031406e-06, - "loss": 0.5, - "step": 60033 - }, - { - "epoch": 1.54, - "learning_rate": 1.006806879092897e-06, - "loss": 0.5669, - "step": 60034 - }, - { - "epoch": 1.54, - "learning_rate": 1.0067792092774417e-06, - "loss": 0.6621, - "step": 60035 - }, - { - "epoch": 1.54, - "learning_rate": 1.0067515394567957e-06, - "loss": 0.6626, - "step": 60036 - }, - { - "epoch": 1.54, - "learning_rate": 1.0067238696309804e-06, - "loss": 0.7451, - "step": 60037 - }, - { - "epoch": 1.54, - "learning_rate": 1.006696199800017e-06, - "loss": 0.6069, - "step": 60038 - }, - { - "epoch": 1.54, - "learning_rate": 1.0066685299639264e-06, - "loss": 0.4805, - "step": 60039 - }, - { - "epoch": 1.54, - "learning_rate": 1.00664086012273e-06, - "loss": 0.7539, - "step": 60040 - }, - { - "epoch": 1.54, - "learning_rate": 1.0066131902764491e-06, - "loss": 0.7568, - "step": 60041 - }, - { - "epoch": 1.54, - "learning_rate": 1.0065855204251049e-06, - "loss": 0.5173, - "step": 60042 - }, - { - "epoch": 1.54, - "learning_rate": 1.0065578505687185e-06, - "loss": 0.6086, - "step": 60043 - }, - { - "epoch": 1.54, - "learning_rate": 1.006530180707311e-06, - "loss": 0.473, - "step": 60044 - }, - { - "epoch": 1.54, - "learning_rate": 1.0065025108409038e-06, - "loss": 0.6768, - "step": 60045 - }, - { - "epoch": 1.54, - "learning_rate": 1.0064748409695173e-06, - "loss": 0.605, - "step": 60046 - }, - { - "epoch": 1.54, - "learning_rate": 1.006447171093174e-06, - "loss": 0.627, - "step": 60047 - }, - { - "epoch": 1.54, - "learning_rate": 1.0064195012118939e-06, - "loss": 0.4822, - "step": 60048 - }, - { - "epoch": 1.54, - "learning_rate": 1.0063918313256991e-06, - "loss": 0.4761, - "step": 60049 - }, - { - "epoch": 1.54, - "learning_rate": 1.0063641614346102e-06, - "loss": 0.6006, - "step": 60050 - }, - { - "epoch": 1.54, - "learning_rate": 1.0063364915386485e-06, - "loss": 0.6597, - "step": 60051 - }, - { - "epoch": 1.54, - "learning_rate": 1.0063088216378352e-06, - "loss": 0.7993, - "step": 60052 - }, - { - "epoch": 1.54, - "learning_rate": 1.0062811517321917e-06, - "loss": 0.4128, - "step": 60053 - }, - { - "epoch": 1.54, - "learning_rate": 1.006253481821739e-06, - "loss": 0.5306, - "step": 60054 - }, - { - "epoch": 1.54, - "learning_rate": 1.0062258119064984e-06, - "loss": 0.6035, - "step": 60055 - }, - { - "epoch": 1.54, - "learning_rate": 1.0061981419864905e-06, - "loss": 0.6465, - "step": 60056 - }, - { - "epoch": 1.54, - "learning_rate": 1.0061704720617375e-06, - "loss": 0.6089, - "step": 60057 - }, - { - "epoch": 1.54, - "learning_rate": 1.0061428021322596e-06, - "loss": 0.6396, - "step": 60058 - }, - { - "epoch": 1.54, - "learning_rate": 1.0061151321980787e-06, - "loss": 0.6079, - "step": 60059 - }, - { - "epoch": 1.54, - "learning_rate": 1.0060874622592156e-06, - "loss": 0.6519, - "step": 60060 - }, - { - "epoch": 1.54, - "learning_rate": 1.0060597923156918e-06, - "loss": 0.7021, - "step": 60061 - }, - { - "epoch": 1.54, - "learning_rate": 1.006032122367528e-06, - "loss": 0.6455, - "step": 60062 - }, - { - "epoch": 1.54, - "learning_rate": 1.0060044524147457e-06, - "loss": 0.7363, - "step": 60063 - }, - { - "epoch": 1.54, - "learning_rate": 1.0059767824573667e-06, - "loss": 0.5117, - "step": 60064 - }, - { - "epoch": 1.54, - "learning_rate": 1.005949112495411e-06, - "loss": 0.4927, - "step": 60065 - }, - { - "epoch": 1.54, - "learning_rate": 1.0059214425289003e-06, - "loss": 0.7402, - "step": 60066 - }, - { - "epoch": 1.54, - "learning_rate": 1.0058937725578557e-06, - "loss": 0.7021, - "step": 60067 - }, - { - "epoch": 1.54, - "learning_rate": 1.005866102582299e-06, - "loss": 0.5708, - "step": 60068 - }, - { - "epoch": 1.54, - "learning_rate": 1.0058384326022506e-06, - "loss": 0.7539, - "step": 60069 - }, - { - "epoch": 1.54, - "learning_rate": 1.0058107626177323e-06, - "loss": 0.6787, - "step": 60070 - }, - { - "epoch": 1.54, - "learning_rate": 1.0057830926287645e-06, - "loss": 0.5649, - "step": 60071 - }, - { - "epoch": 1.54, - "learning_rate": 1.005755422635369e-06, - "loss": 0.6182, - "step": 60072 - }, - { - "epoch": 1.54, - "learning_rate": 1.0057277526375668e-06, - "loss": 0.6313, - "step": 60073 - }, - { - "epoch": 1.54, - "learning_rate": 1.0057000826353796e-06, - "loss": 0.6309, - "step": 60074 - }, - { - "epoch": 1.54, - "learning_rate": 1.0056724126288276e-06, - "loss": 0.5007, - "step": 60075 - }, - { - "epoch": 1.54, - "learning_rate": 1.0056447426179326e-06, - "loss": 0.7012, - "step": 60076 - }, - { - "epoch": 1.54, - "learning_rate": 1.0056170726027157e-06, - "loss": 0.6748, - "step": 60077 - }, - { - "epoch": 1.54, - "learning_rate": 1.005589402583198e-06, - "loss": 0.7627, - "step": 60078 - }, - { - "epoch": 1.54, - "learning_rate": 1.0055617325594007e-06, - "loss": 0.5957, - "step": 60079 - }, - { - "epoch": 1.54, - "learning_rate": 1.005534062531345e-06, - "loss": 0.7061, - "step": 60080 - }, - { - "epoch": 1.54, - "learning_rate": 1.0055063924990526e-06, - "loss": 0.5654, - "step": 60081 - }, - { - "epoch": 1.54, - "learning_rate": 1.0054787224625436e-06, - "loss": 0.5459, - "step": 60082 - }, - { - "epoch": 1.54, - "learning_rate": 1.0054510524218402e-06, - "loss": 0.7686, - "step": 60083 - }, - { - "epoch": 1.54, - "learning_rate": 1.0054233823769632e-06, - "loss": 0.6733, - "step": 60084 - }, - { - "epoch": 1.54, - "learning_rate": 1.0053957123279337e-06, - "loss": 0.7705, - "step": 60085 - }, - { - "epoch": 1.54, - "learning_rate": 1.0053680422747727e-06, - "loss": 0.6714, - "step": 60086 - }, - { - "epoch": 1.54, - "learning_rate": 1.0053403722175018e-06, - "loss": 0.4596, - "step": 60087 - }, - { - "epoch": 1.54, - "learning_rate": 1.005312702156142e-06, - "loss": 0.8486, - "step": 60088 - }, - { - "epoch": 1.54, - "learning_rate": 1.0052850320907147e-06, - "loss": 0.5015, - "step": 60089 - }, - { - "epoch": 1.54, - "learning_rate": 1.0052573620212405e-06, - "loss": 0.481, - "step": 60090 - }, - { - "epoch": 1.54, - "learning_rate": 1.0052296919477415e-06, - "loss": 0.5908, - "step": 60091 - }, - { - "epoch": 1.54, - "learning_rate": 1.005202021870238e-06, - "loss": 0.5354, - "step": 60092 - }, - { - "epoch": 1.54, - "learning_rate": 1.0051743517887517e-06, - "loss": 0.6914, - "step": 60093 - }, - { - "epoch": 1.54, - "learning_rate": 1.0051466817033035e-06, - "loss": 0.6006, - "step": 60094 - }, - { - "epoch": 1.54, - "learning_rate": 1.0051190116139148e-06, - "loss": 0.6738, - "step": 60095 - }, - { - "epoch": 1.54, - "learning_rate": 1.0050913415206065e-06, - "loss": 0.6233, - "step": 60096 - }, - { - "epoch": 1.54, - "learning_rate": 1.0050636714234004e-06, - "loss": 0.6709, - "step": 60097 - }, - { - "epoch": 1.54, - "learning_rate": 1.005036001322317e-06, - "loss": 0.5103, - "step": 60098 - }, - { - "epoch": 1.54, - "learning_rate": 1.0050083312173778e-06, - "loss": 0.6895, - "step": 60099 - }, - { - "epoch": 1.54, - "learning_rate": 1.004980661108604e-06, - "loss": 0.7451, - "step": 60100 - }, - { - "epoch": 1.54, - "learning_rate": 1.0049529909960168e-06, - "loss": 0.6064, - "step": 60101 - }, - { - "epoch": 1.54, - "learning_rate": 1.0049253208796372e-06, - "loss": 0.8926, - "step": 60102 - }, - { - "epoch": 1.54, - "learning_rate": 1.0048976507594866e-06, - "loss": 0.6123, - "step": 60103 - }, - { - "epoch": 1.54, - "learning_rate": 1.004869980635586e-06, - "loss": 0.6499, - "step": 60104 - }, - { - "epoch": 1.54, - "learning_rate": 1.0048423105079566e-06, - "loss": 0.6709, - "step": 60105 - }, - { - "epoch": 1.54, - "learning_rate": 1.00481464037662e-06, - "loss": 0.5034, - "step": 60106 - }, - { - "epoch": 1.54, - "learning_rate": 1.0047869702415967e-06, - "loss": 0.665, - "step": 60107 - }, - { - "epoch": 1.54, - "learning_rate": 1.0047593001029084e-06, - "loss": 0.6699, - "step": 60108 - }, - { - "epoch": 1.54, - "learning_rate": 1.0047316299605762e-06, - "loss": 0.7256, - "step": 60109 - }, - { - "epoch": 1.54, - "learning_rate": 1.0047039598146212e-06, - "loss": 0.7793, - "step": 60110 - }, - { - "epoch": 1.54, - "learning_rate": 1.0046762896650642e-06, - "loss": 0.79, - "step": 60111 - }, - { - "epoch": 1.54, - "learning_rate": 1.0046486195119272e-06, - "loss": 0.5295, - "step": 60112 - }, - { - "epoch": 1.54, - "learning_rate": 1.004620949355231e-06, - "loss": 0.6631, - "step": 60113 - }, - { - "epoch": 1.54, - "learning_rate": 1.0045932791949967e-06, - "loss": 0.6162, - "step": 60114 - }, - { - "epoch": 1.54, - "learning_rate": 1.0045656090312453e-06, - "loss": 0.6543, - "step": 60115 - }, - { - "epoch": 1.54, - "learning_rate": 1.0045379388639984e-06, - "loss": 0.7676, - "step": 60116 - }, - { - "epoch": 1.54, - "learning_rate": 1.0045102686932768e-06, - "loss": 0.4463, - "step": 60117 - }, - { - "epoch": 1.54, - "learning_rate": 1.004482598519102e-06, - "loss": 0.7959, - "step": 60118 - }, - { - "epoch": 1.54, - "learning_rate": 1.0044549283414954e-06, - "loss": 0.5361, - "step": 60119 - }, - { - "epoch": 1.54, - "learning_rate": 1.0044272581604779e-06, - "loss": 0.7056, - "step": 60120 - }, - { - "epoch": 1.54, - "learning_rate": 1.0043995879760701e-06, - "loss": 0.4377, - "step": 60121 - }, - { - "epoch": 1.54, - "learning_rate": 1.004371917788294e-06, - "loss": 0.5593, - "step": 60122 - }, - { - "epoch": 1.54, - "learning_rate": 1.0043442475971705e-06, - "loss": 0.7285, - "step": 60123 - }, - { - "epoch": 1.54, - "learning_rate": 1.0043165774027207e-06, - "loss": 0.5244, - "step": 60124 - }, - { - "epoch": 1.54, - "learning_rate": 1.0042889072049663e-06, - "loss": 0.5249, - "step": 60125 - }, - { - "epoch": 1.54, - "learning_rate": 1.0042612370039276e-06, - "loss": 0.5913, - "step": 60126 - }, - { - "epoch": 1.54, - "learning_rate": 1.0042335667996265e-06, - "loss": 0.5762, - "step": 60127 - }, - { - "epoch": 1.54, - "learning_rate": 1.0042058965920841e-06, - "loss": 0.5957, - "step": 60128 - }, - { - "epoch": 1.54, - "learning_rate": 1.0041782263813212e-06, - "loss": 0.7148, - "step": 60129 - }, - { - "epoch": 1.54, - "learning_rate": 1.0041505561673592e-06, - "loss": 0.6528, - "step": 60130 - }, - { - "epoch": 1.54, - "learning_rate": 1.0041228859502195e-06, - "loss": 0.5476, - "step": 60131 - }, - { - "epoch": 1.54, - "learning_rate": 1.0040952157299228e-06, - "loss": 0.6299, - "step": 60132 - }, - { - "epoch": 1.54, - "learning_rate": 1.0040675455064911e-06, - "loss": 0.5935, - "step": 60133 - }, - { - "epoch": 1.54, - "learning_rate": 1.0040398752799446e-06, - "loss": 0.5527, - "step": 60134 - }, - { - "epoch": 1.54, - "learning_rate": 1.0040122050503052e-06, - "loss": 0.5742, - "step": 60135 - }, - { - "epoch": 1.54, - "learning_rate": 1.0039845348175935e-06, - "loss": 0.4805, - "step": 60136 - }, - { - "epoch": 1.54, - "learning_rate": 1.0039568645818314e-06, - "loss": 0.52, - "step": 60137 - }, - { - "epoch": 1.54, - "learning_rate": 1.0039291943430397e-06, - "loss": 0.71, - "step": 60138 - }, - { - "epoch": 1.54, - "learning_rate": 1.0039015241012396e-06, - "loss": 0.5337, - "step": 60139 - }, - { - "epoch": 1.54, - "learning_rate": 1.003873853856452e-06, - "loss": 0.7881, - "step": 60140 - }, - { - "epoch": 1.54, - "learning_rate": 1.0038461836086984e-06, - "loss": 0.7461, - "step": 60141 - }, - { - "epoch": 1.54, - "learning_rate": 1.0038185133580001e-06, - "loss": 0.6104, - "step": 60142 - }, - { - "epoch": 1.54, - "learning_rate": 1.0037908431043781e-06, - "loss": 0.6396, - "step": 60143 - }, - { - "epoch": 1.54, - "learning_rate": 1.0037631728478538e-06, - "loss": 0.5122, - "step": 60144 - }, - { - "epoch": 1.54, - "learning_rate": 1.0037355025884482e-06, - "loss": 0.7124, - "step": 60145 - }, - { - "epoch": 1.54, - "learning_rate": 1.003707832326182e-06, - "loss": 0.5923, - "step": 60146 - }, - { - "epoch": 1.54, - "learning_rate": 1.0036801620610775e-06, - "loss": 0.6245, - "step": 60147 - }, - { - "epoch": 1.54, - "learning_rate": 1.003652491793155e-06, - "loss": 0.6582, - "step": 60148 - }, - { - "epoch": 1.54, - "learning_rate": 1.003624821522436e-06, - "loss": 0.707, - "step": 60149 - }, - { - "epoch": 1.54, - "learning_rate": 1.0035971512489414e-06, - "loss": 0.6826, - "step": 60150 - }, - { - "epoch": 1.54, - "learning_rate": 1.0035694809726927e-06, - "loss": 0.5928, - "step": 60151 - }, - { - "epoch": 1.54, - "learning_rate": 1.0035418106937111e-06, - "loss": 0.6904, - "step": 60152 - }, - { - "epoch": 1.54, - "learning_rate": 1.003514140412018e-06, - "loss": 0.6016, - "step": 60153 - }, - { - "epoch": 1.54, - "learning_rate": 1.003486470127634e-06, - "loss": 0.707, - "step": 60154 - }, - { - "epoch": 1.54, - "learning_rate": 1.0034587998405806e-06, - "loss": 0.7017, - "step": 60155 - }, - { - "epoch": 1.54, - "learning_rate": 1.003431129550879e-06, - "loss": 0.4719, - "step": 60156 - }, - { - "epoch": 1.54, - "learning_rate": 1.00340345925855e-06, - "loss": 0.6016, - "step": 60157 - }, - { - "epoch": 1.54, - "learning_rate": 1.0033757889636159e-06, - "loss": 0.6406, - "step": 60158 - }, - { - "epoch": 1.54, - "learning_rate": 1.0033481186660964e-06, - "loss": 0.5723, - "step": 60159 - }, - { - "epoch": 1.54, - "learning_rate": 1.0033204483660138e-06, - "loss": 0.7852, - "step": 60160 - }, - { - "epoch": 1.54, - "learning_rate": 1.0032927780633884e-06, - "loss": 0.7988, - "step": 60161 - }, - { - "epoch": 1.54, - "learning_rate": 1.0032651077582424e-06, - "loss": 0.5034, - "step": 60162 - }, - { - "epoch": 1.54, - "learning_rate": 1.0032374374505963e-06, - "loss": 0.5688, - "step": 60163 - }, - { - "epoch": 1.54, - "learning_rate": 1.0032097671404713e-06, - "loss": 0.5439, - "step": 60164 - }, - { - "epoch": 1.54, - "learning_rate": 1.0031820968278888e-06, - "loss": 0.6143, - "step": 60165 - }, - { - "epoch": 1.54, - "learning_rate": 1.00315442651287e-06, - "loss": 0.668, - "step": 60166 - }, - { - "epoch": 1.54, - "learning_rate": 1.0031267561954357e-06, - "loss": 0.7832, - "step": 60167 - }, - { - "epoch": 1.54, - "learning_rate": 1.003099085875608e-06, - "loss": 0.7334, - "step": 60168 - }, - { - "epoch": 1.54, - "learning_rate": 1.003071415553407e-06, - "loss": 0.8301, - "step": 60169 - }, - { - "epoch": 1.54, - "learning_rate": 1.0030437452288543e-06, - "loss": 0.6785, - "step": 60170 - }, - { - "epoch": 1.54, - "learning_rate": 1.0030160749019713e-06, - "loss": 0.5601, - "step": 60171 - }, - { - "epoch": 1.54, - "learning_rate": 1.002988404572779e-06, - "loss": 0.5518, - "step": 60172 - }, - { - "epoch": 1.54, - "learning_rate": 1.002960734241299e-06, - "loss": 0.6606, - "step": 60173 - }, - { - "epoch": 1.54, - "learning_rate": 1.0029330639075515e-06, - "loss": 0.7402, - "step": 60174 - }, - { - "epoch": 1.54, - "learning_rate": 1.0029053935715585e-06, - "loss": 0.6836, - "step": 60175 - }, - { - "epoch": 1.54, - "learning_rate": 1.002877723233341e-06, - "loss": 0.4028, - "step": 60176 - }, - { - "epoch": 1.54, - "learning_rate": 1.0028500528929201e-06, - "loss": 0.8057, - "step": 60177 - }, - { - "epoch": 1.54, - "learning_rate": 1.0028223825503173e-06, - "loss": 0.8066, - "step": 60178 - }, - { - "epoch": 1.54, - "learning_rate": 1.0027947122055533e-06, - "loss": 0.6768, - "step": 60179 - }, - { - "epoch": 1.54, - "learning_rate": 1.0027670418586493e-06, - "loss": 0.6699, - "step": 60180 - }, - { - "epoch": 1.54, - "learning_rate": 1.0027393715096273e-06, - "loss": 0.707, - "step": 60181 - }, - { - "epoch": 1.54, - "learning_rate": 1.0027117011585073e-06, - "loss": 0.625, - "step": 60182 - }, - { - "epoch": 1.54, - "learning_rate": 1.0026840308053115e-06, - "loss": 0.5796, - "step": 60183 - }, - { - "epoch": 1.54, - "learning_rate": 1.0026563604500604e-06, - "loss": 0.6001, - "step": 60184 - }, - { - "epoch": 1.54, - "learning_rate": 1.0026286900927756e-06, - "loss": 0.5295, - "step": 60185 - }, - { - "epoch": 1.54, - "learning_rate": 1.002601019733478e-06, - "loss": 0.688, - "step": 60186 - }, - { - "epoch": 1.54, - "learning_rate": 1.0025733493721892e-06, - "loss": 0.6338, - "step": 60187 - }, - { - "epoch": 1.54, - "learning_rate": 1.0025456790089298e-06, - "loss": 0.8564, - "step": 60188 - }, - { - "epoch": 1.54, - "learning_rate": 1.0025180086437214e-06, - "loss": 0.5303, - "step": 60189 - }, - { - "epoch": 1.54, - "learning_rate": 1.002490338276585e-06, - "loss": 0.5442, - "step": 60190 - }, - { - "epoch": 1.54, - "learning_rate": 1.002462667907542e-06, - "loss": 0.5757, - "step": 60191 - }, - { - "epoch": 1.54, - "learning_rate": 1.002434997536613e-06, - "loss": 0.6729, - "step": 60192 - }, - { - "epoch": 1.54, - "learning_rate": 1.0024073271638203e-06, - "loss": 0.5165, - "step": 60193 - }, - { - "epoch": 1.54, - "learning_rate": 1.0023796567891842e-06, - "loss": 0.5688, - "step": 60194 - }, - { - "epoch": 1.54, - "learning_rate": 1.002351986412726e-06, - "loss": 0.6377, - "step": 60195 - }, - { - "epoch": 1.54, - "learning_rate": 1.002324316034467e-06, - "loss": 0.6899, - "step": 60196 - }, - { - "epoch": 1.54, - "learning_rate": 1.0022966456544282e-06, - "loss": 0.7656, - "step": 60197 - }, - { - "epoch": 1.54, - "learning_rate": 1.0022689752726315e-06, - "loss": 0.6777, - "step": 60198 - }, - { - "epoch": 1.54, - "learning_rate": 1.002241304889097e-06, - "loss": 0.5797, - "step": 60199 - }, - { - "epoch": 1.54, - "learning_rate": 1.0022136345038468e-06, - "loss": 0.5132, - "step": 60200 - }, - { - "epoch": 1.54, - "learning_rate": 1.0021859641169012e-06, - "loss": 0.5386, - "step": 60201 - }, - { - "epoch": 1.54, - "learning_rate": 1.0021582937282824e-06, - "loss": 0.6709, - "step": 60202 - }, - { - "epoch": 1.54, - "learning_rate": 1.0021306233380112e-06, - "loss": 0.5337, - "step": 60203 - }, - { - "epoch": 1.54, - "learning_rate": 1.0021029529461085e-06, - "loss": 0.51, - "step": 60204 - }, - { - "epoch": 1.54, - "learning_rate": 1.0020752825525956e-06, - "loss": 0.748, - "step": 60205 - }, - { - "epoch": 1.54, - "learning_rate": 1.0020476121574937e-06, - "loss": 0.5137, - "step": 60206 - }, - { - "epoch": 1.54, - "learning_rate": 1.002019941760824e-06, - "loss": 0.6523, - "step": 60207 - }, - { - "epoch": 1.54, - "learning_rate": 1.0019922713626082e-06, - "loss": 0.6201, - "step": 60208 - }, - { - "epoch": 1.54, - "learning_rate": 1.0019646009628664e-06, - "loss": 0.7549, - "step": 60209 - }, - { - "epoch": 1.54, - "learning_rate": 1.0019369305616208e-06, - "loss": 0.5972, - "step": 60210 - }, - { - "epoch": 1.54, - "learning_rate": 1.0019092601588918e-06, - "loss": 0.6206, - "step": 60211 - }, - { - "epoch": 1.54, - "learning_rate": 1.0018815897547012e-06, - "loss": 0.6193, - "step": 60212 - }, - { - "epoch": 1.54, - "learning_rate": 1.00185391934907e-06, - "loss": 0.6025, - "step": 60213 - }, - { - "epoch": 1.54, - "learning_rate": 1.001826248942019e-06, - "loss": 0.7393, - "step": 60214 - }, - { - "epoch": 1.54, - "learning_rate": 1.0017985785335702e-06, - "loss": 0.6816, - "step": 60215 - }, - { - "epoch": 1.54, - "learning_rate": 1.001770908123744e-06, - "loss": 0.7607, - "step": 60216 - }, - { - "epoch": 1.54, - "learning_rate": 1.0017432377125621e-06, - "loss": 0.5811, - "step": 60217 - }, - { - "epoch": 1.54, - "learning_rate": 1.0017155673000454e-06, - "loss": 0.5757, - "step": 60218 - }, - { - "epoch": 1.54, - "learning_rate": 1.0016878968862152e-06, - "loss": 0.5703, - "step": 60219 - }, - { - "epoch": 1.54, - "learning_rate": 1.0016602264710924e-06, - "loss": 0.604, - "step": 60220 - }, - { - "epoch": 1.54, - "learning_rate": 1.001632556054699e-06, - "loss": 0.459, - "step": 60221 - }, - { - "epoch": 1.54, - "learning_rate": 1.0016048856370549e-06, - "loss": 0.7949, - "step": 60222 - }, - { - "epoch": 1.54, - "learning_rate": 1.0015772152181827e-06, - "loss": 0.8184, - "step": 60223 - }, - { - "epoch": 1.54, - "learning_rate": 1.0015495447981026e-06, - "loss": 0.5781, - "step": 60224 - }, - { - "epoch": 1.54, - "learning_rate": 1.001521874376836e-06, - "loss": 0.7134, - "step": 60225 - }, - { - "epoch": 1.54, - "learning_rate": 1.0014942039544042e-06, - "loss": 0.6992, - "step": 60226 - }, - { - "epoch": 1.54, - "learning_rate": 1.0014665335308285e-06, - "loss": 0.873, - "step": 60227 - }, - { - "epoch": 1.54, - "learning_rate": 1.00143886310613e-06, - "loss": 0.8086, - "step": 60228 - }, - { - "epoch": 1.54, - "learning_rate": 1.0014111926803297e-06, - "loss": 0.6494, - "step": 60229 - }, - { - "epoch": 1.54, - "learning_rate": 1.0013835222534488e-06, - "loss": 0.7881, - "step": 60230 - }, - { - "epoch": 1.54, - "learning_rate": 1.0013558518255087e-06, - "loss": 0.7275, - "step": 60231 - }, - { - "epoch": 1.54, - "learning_rate": 1.0013281813965303e-06, - "loss": 0.6042, - "step": 60232 - }, - { - "epoch": 1.54, - "learning_rate": 1.0013005109665353e-06, - "loss": 0.6392, - "step": 60233 - }, - { - "epoch": 1.54, - "learning_rate": 1.0012728405355444e-06, - "loss": 0.6592, - "step": 60234 - }, - { - "epoch": 1.54, - "learning_rate": 1.0012451701035792e-06, - "loss": 0.6455, - "step": 60235 - }, - { - "epoch": 1.54, - "learning_rate": 1.0012174996706602e-06, - "loss": 0.6794, - "step": 60236 - }, - { - "epoch": 1.54, - "learning_rate": 1.0011898292368093e-06, - "loss": 0.7324, - "step": 60237 - }, - { - "epoch": 1.54, - "learning_rate": 1.0011621588020474e-06, - "loss": 0.4565, - "step": 60238 - }, - { - "epoch": 1.54, - "learning_rate": 1.0011344883663953e-06, - "loss": 0.5864, - "step": 60239 - }, - { - "epoch": 1.54, - "learning_rate": 1.001106817929875e-06, - "loss": 0.5425, - "step": 60240 - }, - { - "epoch": 1.54, - "learning_rate": 1.001079147492507e-06, - "loss": 0.7979, - "step": 60241 - }, - { - "epoch": 1.54, - "learning_rate": 1.001051477054313e-06, - "loss": 0.7158, - "step": 60242 - }, - { - "epoch": 1.54, - "learning_rate": 1.0010238066153137e-06, - "loss": 0.9268, - "step": 60243 - }, - { - "epoch": 1.54, - "learning_rate": 1.0009961361755308e-06, - "loss": 0.7725, - "step": 60244 - }, - { - "epoch": 1.54, - "learning_rate": 1.0009684657349848e-06, - "loss": 0.627, - "step": 60245 - }, - { - "epoch": 1.54, - "learning_rate": 1.0009407952936978e-06, - "loss": 0.5664, - "step": 60246 - }, - { - "epoch": 1.54, - "learning_rate": 1.00091312485169e-06, - "loss": 0.6504, - "step": 60247 - }, - { - "epoch": 1.54, - "learning_rate": 1.0008854544089835e-06, - "loss": 0.5271, - "step": 60248 - }, - { - "epoch": 1.54, - "learning_rate": 1.0008577839655988e-06, - "loss": 0.6689, - "step": 60249 - }, - { - "epoch": 1.54, - "learning_rate": 1.0008301135215572e-06, - "loss": 0.5752, - "step": 60250 - }, - { - "epoch": 1.54, - "learning_rate": 1.00080244307688e-06, - "loss": 0.7422, - "step": 60251 - }, - { - "epoch": 1.54, - "learning_rate": 1.0007747726315886e-06, - "loss": 0.5908, - "step": 60252 - }, - { - "epoch": 1.54, - "learning_rate": 1.0007471021857041e-06, - "loss": 0.6245, - "step": 60253 - }, - { - "epoch": 1.54, - "learning_rate": 1.0007194317392475e-06, - "loss": 0.5303, - "step": 60254 - }, - { - "epoch": 1.54, - "learning_rate": 1.0006917612922398e-06, - "loss": 0.4619, - "step": 60255 - }, - { - "epoch": 1.54, - "learning_rate": 1.0006640908447027e-06, - "loss": 0.4778, - "step": 60256 - }, - { - "epoch": 1.54, - "learning_rate": 1.000636420396657e-06, - "loss": 0.6582, - "step": 60257 - }, - { - "epoch": 1.54, - "learning_rate": 1.0006087499481243e-06, - "loss": 0.7783, - "step": 60258 - }, - { - "epoch": 1.54, - "learning_rate": 1.0005810794991255e-06, - "loss": 0.5913, - "step": 60259 - }, - { - "epoch": 1.54, - "learning_rate": 1.0005534090496815e-06, - "loss": 0.7363, - "step": 60260 - }, - { - "epoch": 1.54, - "learning_rate": 1.0005257385998139e-06, - "loss": 0.626, - "step": 60261 - }, - { - "epoch": 1.54, - "learning_rate": 1.0004980681495436e-06, - "loss": 0.5239, - "step": 60262 - }, - { - "epoch": 1.54, - "learning_rate": 1.0004703976988925e-06, - "loss": 0.4545, - "step": 60263 - }, - { - "epoch": 1.54, - "learning_rate": 1.0004427272478807e-06, - "loss": 0.7773, - "step": 60264 - }, - { - "epoch": 1.54, - "learning_rate": 1.0004150567965298e-06, - "loss": 0.7275, - "step": 60265 - }, - { - "epoch": 1.54, - "learning_rate": 1.0003873863448616e-06, - "loss": 0.9746, - "step": 60266 - }, - { - "epoch": 1.54, - "learning_rate": 1.0003597158928965e-06, - "loss": 0.5538, - "step": 60267 - }, - { - "epoch": 1.54, - "learning_rate": 1.000332045440656e-06, - "loss": 0.6333, - "step": 60268 - }, - { - "epoch": 1.54, - "learning_rate": 1.0003043749881615e-06, - "loss": 0.5977, - "step": 60269 - }, - { - "epoch": 1.54, - "learning_rate": 1.0002767045354336e-06, - "loss": 0.4883, - "step": 60270 - }, - { - "epoch": 1.54, - "learning_rate": 1.0002490340824942e-06, - "loss": 0.5415, - "step": 60271 - }, - { - "epoch": 1.54, - "learning_rate": 1.0002213636293638e-06, - "loss": 0.6055, - "step": 60272 - }, - { - "epoch": 1.54, - "learning_rate": 1.0001936931760643e-06, - "loss": 0.8164, - "step": 60273 - }, - { - "epoch": 1.54, - "learning_rate": 1.000166022722616e-06, - "loss": 0.7295, - "step": 60274 - }, - { - "epoch": 1.54, - "learning_rate": 1.0001383522690411e-06, - "loss": 0.575, - "step": 60275 - }, - { - "epoch": 1.54, - "learning_rate": 1.00011068181536e-06, - "loss": 0.749, - "step": 60276 - }, - { - "epoch": 1.54, - "learning_rate": 1.0000830113615942e-06, - "loss": 0.4927, - "step": 60277 - }, - { - "epoch": 1.54, - "learning_rate": 1.0000553409077647e-06, - "loss": 0.5247, - "step": 60278 - }, - { - "epoch": 1.54, - "learning_rate": 1.0000276704538927e-06, - "loss": 0.7324, - "step": 60279 - }, - { - "epoch": 1.55, - "learning_rate": 1e-06, - "loss": 0.7705, - "step": 60280 - }, - { - "epoch": 1.55, - "learning_rate": 9.999723295461072e-07, - "loss": 0.7637, - "step": 60281 - }, - { - "epoch": 1.55, - "learning_rate": 9.999446590922352e-07, - "loss": 0.7344, - "step": 60282 - }, - { - "epoch": 1.55, - "learning_rate": 9.99916988638406e-07, - "loss": 0.7314, - "step": 60283 - }, - { - "epoch": 1.55, - "learning_rate": 9.9988931818464e-07, - "loss": 0.4971, - "step": 60284 - }, - { - "epoch": 1.55, - "learning_rate": 9.998616477309592e-07, - "loss": 0.668, - "step": 60285 - }, - { - "epoch": 1.55, - "learning_rate": 9.99833977277384e-07, - "loss": 0.6865, - "step": 60286 - }, - { - "epoch": 1.55, - "learning_rate": 9.998063068239358e-07, - "loss": 0.5713, - "step": 60287 - }, - { - "epoch": 1.55, - "learning_rate": 9.997786363706362e-07, - "loss": 0.5596, - "step": 60288 - }, - { - "epoch": 1.55, - "learning_rate": 9.99750965917506e-07, - "loss": 0.6802, - "step": 60289 - }, - { - "epoch": 1.55, - "learning_rate": 9.997232954645663e-07, - "loss": 0.6846, - "step": 60290 - }, - { - "epoch": 1.55, - "learning_rate": 9.996956250118384e-07, - "loss": 0.7295, - "step": 60291 - }, - { - "epoch": 1.55, - "learning_rate": 9.996679545593439e-07, - "loss": 0.6768, - "step": 60292 - }, - { - "epoch": 1.55, - "learning_rate": 9.996402841071032e-07, - "loss": 0.5918, - "step": 60293 - }, - { - "epoch": 1.55, - "learning_rate": 9.996126136551383e-07, - "loss": 0.8623, - "step": 60294 - }, - { - "epoch": 1.55, - "learning_rate": 9.995849432034703e-07, - "loss": 0.7861, - "step": 60295 - }, - { - "epoch": 1.55, - "learning_rate": 9.995572727521195e-07, - "loss": 0.6943, - "step": 60296 - }, - { - "epoch": 1.55, - "learning_rate": 9.995296023011079e-07, - "loss": 0.4783, - "step": 60297 - }, - { - "epoch": 1.55, - "learning_rate": 9.995019318504565e-07, - "loss": 0.5502, - "step": 60298 - }, - { - "epoch": 1.55, - "learning_rate": 9.994742614001863e-07, - "loss": 0.6118, - "step": 60299 - }, - { - "epoch": 1.55, - "learning_rate": 9.994465909503186e-07, - "loss": 0.7256, - "step": 60300 - }, - { - "epoch": 1.55, - "learning_rate": 9.994189205008747e-07, - "loss": 0.6523, - "step": 60301 - }, - { - "epoch": 1.55, - "learning_rate": 9.993912500518758e-07, - "loss": 0.7832, - "step": 60302 - }, - { - "epoch": 1.55, - "learning_rate": 9.993635796033427e-07, - "loss": 0.5573, - "step": 60303 - }, - { - "epoch": 1.55, - "learning_rate": 9.993359091552972e-07, - "loss": 0.4624, - "step": 60304 - }, - { - "epoch": 1.55, - "learning_rate": 9.993082387077603e-07, - "loss": 0.7188, - "step": 60305 - }, - { - "epoch": 1.55, - "learning_rate": 9.992805682607527e-07, - "loss": 0.7246, - "step": 60306 - }, - { - "epoch": 1.55, - "learning_rate": 9.992528978142962e-07, - "loss": 0.6367, - "step": 60307 - }, - { - "epoch": 1.55, - "learning_rate": 9.992252273684113e-07, - "loss": 0.6646, - "step": 60308 - }, - { - "epoch": 1.55, - "learning_rate": 9.9919755692312e-07, - "loss": 0.7266, - "step": 60309 - }, - { - "epoch": 1.55, - "learning_rate": 9.991698864784429e-07, - "loss": 0.5603, - "step": 60310 - }, - { - "epoch": 1.55, - "learning_rate": 9.991422160344013e-07, - "loss": 0.5034, - "step": 60311 - }, - { - "epoch": 1.55, - "learning_rate": 9.991145455910164e-07, - "loss": 0.563, - "step": 60312 - }, - { - "epoch": 1.55, - "learning_rate": 9.9908687514831e-07, - "loss": 0.749, - "step": 60313 - }, - { - "epoch": 1.55, - "learning_rate": 9.990592047063022e-07, - "loss": 0.8057, - "step": 60314 - }, - { - "epoch": 1.55, - "learning_rate": 9.990315342650154e-07, - "loss": 0.6445, - "step": 60315 - }, - { - "epoch": 1.55, - "learning_rate": 9.990038638244695e-07, - "loss": 0.5535, - "step": 60316 - }, - { - "epoch": 1.55, - "learning_rate": 9.989761933846864e-07, - "loss": 0.8467, - "step": 60317 - }, - { - "epoch": 1.55, - "learning_rate": 9.98948522945687e-07, - "loss": 0.6509, - "step": 60318 - }, - { - "epoch": 1.55, - "learning_rate": 9.98920852507493e-07, - "loss": 0.5624, - "step": 60319 - }, - { - "epoch": 1.55, - "learning_rate": 9.988931820701251e-07, - "loss": 0.6631, - "step": 60320 - }, - { - "epoch": 1.55, - "learning_rate": 9.988655116336046e-07, - "loss": 0.5481, - "step": 60321 - }, - { - "epoch": 1.55, - "learning_rate": 9.988378411979527e-07, - "loss": 0.5747, - "step": 60322 - }, - { - "epoch": 1.55, - "learning_rate": 9.988101707631908e-07, - "loss": 0.7188, - "step": 60323 - }, - { - "epoch": 1.55, - "learning_rate": 9.987825003293397e-07, - "loss": 0.7695, - "step": 60324 - }, - { - "epoch": 1.55, - "learning_rate": 9.987548298964211e-07, - "loss": 0.7036, - "step": 60325 - }, - { - "epoch": 1.55, - "learning_rate": 9.98727159464456e-07, - "loss": 0.6816, - "step": 60326 - }, - { - "epoch": 1.55, - "learning_rate": 9.986994890334648e-07, - "loss": 0.6533, - "step": 60327 - }, - { - "epoch": 1.55, - "learning_rate": 9.986718186034698e-07, - "loss": 0.7344, - "step": 60328 - }, - { - "epoch": 1.55, - "learning_rate": 9.986441481744912e-07, - "loss": 0.4391, - "step": 60329 - }, - { - "epoch": 1.55, - "learning_rate": 9.986164777465513e-07, - "loss": 0.5654, - "step": 60330 - }, - { - "epoch": 1.55, - "learning_rate": 9.985888073196702e-07, - "loss": 0.8242, - "step": 60331 - }, - { - "epoch": 1.55, - "learning_rate": 9.985611368938702e-07, - "loss": 0.577, - "step": 60332 - }, - { - "epoch": 1.55, - "learning_rate": 9.985334664691712e-07, - "loss": 0.5747, - "step": 60333 - }, - { - "epoch": 1.55, - "learning_rate": 9.985057960455957e-07, - "loss": 0.7734, - "step": 60334 - }, - { - "epoch": 1.55, - "learning_rate": 9.98478125623164e-07, - "loss": 0.7012, - "step": 60335 - }, - { - "epoch": 1.55, - "learning_rate": 9.984504552018977e-07, - "loss": 0.6101, - "step": 60336 - }, - { - "epoch": 1.55, - "learning_rate": 9.984227847818174e-07, - "loss": 0.7617, - "step": 60337 - }, - { - "epoch": 1.55, - "learning_rate": 9.98395114362945e-07, - "loss": 0.4521, - "step": 60338 - }, - { - "epoch": 1.55, - "learning_rate": 9.98367443945301e-07, - "loss": 0.7695, - "step": 60339 - }, - { - "epoch": 1.55, - "learning_rate": 9.983397735289075e-07, - "loss": 0.6626, - "step": 60340 - }, - { - "epoch": 1.55, - "learning_rate": 9.983121031137847e-07, - "loss": 0.585, - "step": 60341 - }, - { - "epoch": 1.55, - "learning_rate": 9.982844326999545e-07, - "loss": 0.6816, - "step": 60342 - }, - { - "epoch": 1.55, - "learning_rate": 9.982567622874378e-07, - "loss": 0.8237, - "step": 60343 - }, - { - "epoch": 1.55, - "learning_rate": 9.982290918762558e-07, - "loss": 0.7266, - "step": 60344 - }, - { - "epoch": 1.55, - "learning_rate": 9.982014214664301e-07, - "loss": 0.8037, - "step": 60345 - }, - { - "epoch": 1.55, - "learning_rate": 9.981737510579809e-07, - "loss": 0.707, - "step": 60346 - }, - { - "epoch": 1.55, - "learning_rate": 9.9814608065093e-07, - "loss": 0.6455, - "step": 60347 - }, - { - "epoch": 1.55, - "learning_rate": 9.98118410245299e-07, - "loss": 0.7744, - "step": 60348 - }, - { - "epoch": 1.55, - "learning_rate": 9.980907398411082e-07, - "loss": 0.7402, - "step": 60349 - }, - { - "epoch": 1.55, - "learning_rate": 9.980630694383794e-07, - "loss": 0.5732, - "step": 60350 - }, - { - "epoch": 1.55, - "learning_rate": 9.980353990371337e-07, - "loss": 0.8701, - "step": 60351 - }, - { - "epoch": 1.55, - "learning_rate": 9.98007728637392e-07, - "loss": 0.6528, - "step": 60352 - }, - { - "epoch": 1.55, - "learning_rate": 9.97980058239176e-07, - "loss": 0.6377, - "step": 60353 - }, - { - "epoch": 1.55, - "learning_rate": 9.979523878425064e-07, - "loss": 0.7041, - "step": 60354 - }, - { - "epoch": 1.55, - "learning_rate": 9.97924717447405e-07, - "loss": 0.6797, - "step": 60355 - }, - { - "epoch": 1.55, - "learning_rate": 9.978970470538918e-07, - "loss": 0.6431, - "step": 60356 - }, - { - "epoch": 1.55, - "learning_rate": 9.978693766619892e-07, - "loss": 0.5562, - "step": 60357 - }, - { - "epoch": 1.55, - "learning_rate": 9.978417062717175e-07, - "loss": 0.7607, - "step": 60358 - }, - { - "epoch": 1.55, - "learning_rate": 9.978140358830987e-07, - "loss": 0.6108, - "step": 60359 - }, - { - "epoch": 1.55, - "learning_rate": 9.977863654961533e-07, - "loss": 0.6836, - "step": 60360 - }, - { - "epoch": 1.55, - "learning_rate": 9.97758695110903e-07, - "loss": 0.6821, - "step": 60361 - }, - { - "epoch": 1.55, - "learning_rate": 9.977310247273687e-07, - "loss": 0.6553, - "step": 60362 - }, - { - "epoch": 1.55, - "learning_rate": 9.977033543455715e-07, - "loss": 0.7334, - "step": 60363 - }, - { - "epoch": 1.55, - "learning_rate": 9.976756839655328e-07, - "loss": 0.5081, - "step": 60364 - }, - { - "epoch": 1.55, - "learning_rate": 9.976480135872742e-07, - "loss": 0.5137, - "step": 60365 - }, - { - "epoch": 1.55, - "learning_rate": 9.976203432108161e-07, - "loss": 0.707, - "step": 60366 - }, - { - "epoch": 1.55, - "learning_rate": 9.975926728361798e-07, - "loss": 0.7207, - "step": 60367 - }, - { - "epoch": 1.55, - "learning_rate": 9.975650024633868e-07, - "loss": 0.5654, - "step": 60368 - }, - { - "epoch": 1.55, - "learning_rate": 9.97537332092458e-07, - "loss": 0.6362, - "step": 60369 - }, - { - "epoch": 1.55, - "learning_rate": 9.97509661723415e-07, - "loss": 0.4802, - "step": 60370 - }, - { - "epoch": 1.55, - "learning_rate": 9.974819913562788e-07, - "loss": 0.583, - "step": 60371 - }, - { - "epoch": 1.55, - "learning_rate": 9.974543209910701e-07, - "loss": 0.6748, - "step": 60372 - }, - { - "epoch": 1.55, - "learning_rate": 9.97426650627811e-07, - "loss": 0.7305, - "step": 60373 - }, - { - "epoch": 1.55, - "learning_rate": 9.973989802665218e-07, - "loss": 0.6777, - "step": 60374 - }, - { - "epoch": 1.55, - "learning_rate": 9.973713099072246e-07, - "loss": 0.5249, - "step": 60375 - }, - { - "epoch": 1.55, - "learning_rate": 9.9734363954994e-07, - "loss": 0.5957, - "step": 60376 - }, - { - "epoch": 1.55, - "learning_rate": 9.973159691946886e-07, - "loss": 0.791, - "step": 60377 - }, - { - "epoch": 1.55, - "learning_rate": 9.972882988414928e-07, - "loss": 0.6313, - "step": 60378 - }, - { - "epoch": 1.55, - "learning_rate": 9.972606284903729e-07, - "loss": 0.7393, - "step": 60379 - }, - { - "epoch": 1.55, - "learning_rate": 9.972329581413506e-07, - "loss": 0.6211, - "step": 60380 - }, - { - "epoch": 1.55, - "learning_rate": 9.972052877944468e-07, - "loss": 0.708, - "step": 60381 - }, - { - "epoch": 1.55, - "learning_rate": 9.971776174496828e-07, - "loss": 0.7686, - "step": 60382 - }, - { - "epoch": 1.55, - "learning_rate": 9.971499471070798e-07, - "loss": 0.6772, - "step": 60383 - }, - { - "epoch": 1.55, - "learning_rate": 9.97122276766659e-07, - "loss": 0.5923, - "step": 60384 - }, - { - "epoch": 1.55, - "learning_rate": 9.970946064284416e-07, - "loss": 0.8496, - "step": 60385 - }, - { - "epoch": 1.55, - "learning_rate": 9.970669360924486e-07, - "loss": 0.5586, - "step": 60386 - }, - { - "epoch": 1.55, - "learning_rate": 9.970392657587014e-07, - "loss": 0.5947, - "step": 60387 - }, - { - "epoch": 1.55, - "learning_rate": 9.970115954272212e-07, - "loss": 0.6265, - "step": 60388 - }, - { - "epoch": 1.55, - "learning_rate": 9.969839250980288e-07, - "loss": 0.749, - "step": 60389 - }, - { - "epoch": 1.55, - "learning_rate": 9.969562547711459e-07, - "loss": 0.5977, - "step": 60390 - }, - { - "epoch": 1.55, - "learning_rate": 9.969285844465931e-07, - "loss": 0.7051, - "step": 60391 - }, - { - "epoch": 1.55, - "learning_rate": 9.969009141243922e-07, - "loss": 0.7051, - "step": 60392 - }, - { - "epoch": 1.55, - "learning_rate": 9.968732438045642e-07, - "loss": 0.6692, - "step": 60393 - }, - { - "epoch": 1.55, - "learning_rate": 9.9684557348713e-07, - "loss": 0.2661, - "step": 60394 - }, - { - "epoch": 1.55, - "learning_rate": 9.968179031721116e-07, - "loss": 0.6196, - "step": 60395 - }, - { - "epoch": 1.55, - "learning_rate": 9.967902328595289e-07, - "loss": 0.5874, - "step": 60396 - }, - { - "epoch": 1.55, - "learning_rate": 9.967625625494038e-07, - "loss": 0.6836, - "step": 60397 - }, - { - "epoch": 1.55, - "learning_rate": 9.967348922417577e-07, - "loss": 0.6621, - "step": 60398 - }, - { - "epoch": 1.55, - "learning_rate": 9.967072219366115e-07, - "loss": 0.5674, - "step": 60399 - }, - { - "epoch": 1.55, - "learning_rate": 9.966795516339863e-07, - "loss": 0.5516, - "step": 60400 - }, - { - "epoch": 1.55, - "learning_rate": 9.966518813339037e-07, - "loss": 0.6528, - "step": 60401 - }, - { - "epoch": 1.55, - "learning_rate": 9.966242110363843e-07, - "loss": 0.5772, - "step": 60402 - }, - { - "epoch": 1.55, - "learning_rate": 9.965965407414497e-07, - "loss": 0.6558, - "step": 60403 - }, - { - "epoch": 1.55, - "learning_rate": 9.965688704491209e-07, - "loss": 0.5571, - "step": 60404 - }, - { - "epoch": 1.55, - "learning_rate": 9.965412001594197e-07, - "loss": 0.6665, - "step": 60405 - }, - { - "epoch": 1.55, - "learning_rate": 9.965135298723662e-07, - "loss": 0.7598, - "step": 60406 - }, - { - "epoch": 1.55, - "learning_rate": 9.964858595879823e-07, - "loss": 0.6738, - "step": 60407 - }, - { - "epoch": 1.55, - "learning_rate": 9.964581893062888e-07, - "loss": 0.5864, - "step": 60408 - }, - { - "epoch": 1.55, - "learning_rate": 9.964305190273072e-07, - "loss": 0.613, - "step": 60409 - }, - { - "epoch": 1.55, - "learning_rate": 9.964028487510585e-07, - "loss": 0.6123, - "step": 60410 - }, - { - "epoch": 1.55, - "learning_rate": 9.963751784775642e-07, - "loss": 0.6865, - "step": 60411 - }, - { - "epoch": 1.55, - "learning_rate": 9.96347508206845e-07, - "loss": 0.5181, - "step": 60412 - }, - { - "epoch": 1.55, - "learning_rate": 9.963198379389226e-07, - "loss": 0.5457, - "step": 60413 - }, - { - "epoch": 1.55, - "learning_rate": 9.962921676738178e-07, - "loss": 0.5444, - "step": 60414 - }, - { - "epoch": 1.55, - "learning_rate": 9.96264497411552e-07, - "loss": 0.7949, - "step": 60415 - }, - { - "epoch": 1.55, - "learning_rate": 9.962368271521466e-07, - "loss": 0.7764, - "step": 60416 - }, - { - "epoch": 1.55, - "learning_rate": 9.96209156895622e-07, - "loss": 0.5508, - "step": 60417 - }, - { - "epoch": 1.55, - "learning_rate": 9.96181486642e-07, - "loss": 0.457, - "step": 60418 - }, - { - "epoch": 1.55, - "learning_rate": 9.961538163913015e-07, - "loss": 0.5962, - "step": 60419 - }, - { - "epoch": 1.55, - "learning_rate": 9.96126146143548e-07, - "loss": 0.8086, - "step": 60420 - }, - { - "epoch": 1.55, - "learning_rate": 9.960984758987606e-07, - "loss": 0.6675, - "step": 60421 - }, - { - "epoch": 1.55, - "learning_rate": 9.960708056569604e-07, - "loss": 0.7178, - "step": 60422 - }, - { - "epoch": 1.55, - "learning_rate": 9.960431354181685e-07, - "loss": 0.5913, - "step": 60423 - }, - { - "epoch": 1.55, - "learning_rate": 9.960154651824062e-07, - "loss": 0.6714, - "step": 60424 - }, - { - "epoch": 1.55, - "learning_rate": 9.95987794949695e-07, - "loss": 0.4756, - "step": 60425 - }, - { - "epoch": 1.55, - "learning_rate": 9.959601247200556e-07, - "loss": 0.6289, - "step": 60426 - }, - { - "epoch": 1.55, - "learning_rate": 9.959324544935092e-07, - "loss": 0.5896, - "step": 60427 - }, - { - "epoch": 1.55, - "learning_rate": 9.959047842700772e-07, - "loss": 0.5957, - "step": 60428 - }, - { - "epoch": 1.55, - "learning_rate": 9.958771140497806e-07, - "loss": 0.7588, - "step": 60429 - }, - { - "epoch": 1.55, - "learning_rate": 9.958494438326408e-07, - "loss": 0.542, - "step": 60430 - }, - { - "epoch": 1.55, - "learning_rate": 9.958217736186787e-07, - "loss": 0.7695, - "step": 60431 - }, - { - "epoch": 1.55, - "learning_rate": 9.95794103407916e-07, - "loss": 0.7061, - "step": 60432 - }, - { - "epoch": 1.55, - "learning_rate": 9.957664332003734e-07, - "loss": 0.6426, - "step": 60433 - }, - { - "epoch": 1.55, - "learning_rate": 9.957387629960723e-07, - "loss": 0.6865, - "step": 60434 - }, - { - "epoch": 1.55, - "learning_rate": 9.95711092795034e-07, - "loss": 0.6455, - "step": 60435 - }, - { - "epoch": 1.55, - "learning_rate": 9.956834225972792e-07, - "loss": 0.5928, - "step": 60436 - }, - { - "epoch": 1.55, - "learning_rate": 9.956557524028297e-07, - "loss": 0.4871, - "step": 60437 - }, - { - "epoch": 1.55, - "learning_rate": 9.95628082211706e-07, - "loss": 0.6592, - "step": 60438 - }, - { - "epoch": 1.55, - "learning_rate": 9.9560041202393e-07, - "loss": 0.6533, - "step": 60439 - }, - { - "epoch": 1.55, - "learning_rate": 9.955727418395223e-07, - "loss": 0.5703, - "step": 60440 - }, - { - "epoch": 1.55, - "learning_rate": 9.955450716585048e-07, - "loss": 0.6157, - "step": 60441 - }, - { - "epoch": 1.55, - "learning_rate": 9.955174014808976e-07, - "loss": 0.7144, - "step": 60442 - }, - { - "epoch": 1.55, - "learning_rate": 9.95489731306723e-07, - "loss": 0.5686, - "step": 60443 - }, - { - "epoch": 1.55, - "learning_rate": 9.954620611360017e-07, - "loss": 0.707, - "step": 60444 - }, - { - "epoch": 1.55, - "learning_rate": 9.95434390968755e-07, - "loss": 0.624, - "step": 60445 - }, - { - "epoch": 1.55, - "learning_rate": 9.954067208050034e-07, - "loss": 0.6235, - "step": 60446 - }, - { - "epoch": 1.55, - "learning_rate": 9.953790506447692e-07, - "loss": 0.7422, - "step": 60447 - }, - { - "epoch": 1.55, - "learning_rate": 9.953513804880727e-07, - "loss": 0.665, - "step": 60448 - }, - { - "epoch": 1.55, - "learning_rate": 9.953237103349357e-07, - "loss": 0.5537, - "step": 60449 - }, - { - "epoch": 1.55, - "learning_rate": 9.952960401853787e-07, - "loss": 0.7295, - "step": 60450 - }, - { - "epoch": 1.55, - "learning_rate": 9.95268370039424e-07, - "loss": 0.5166, - "step": 60451 - }, - { - "epoch": 1.55, - "learning_rate": 9.952406998970913e-07, - "loss": 0.6851, - "step": 60452 - }, - { - "epoch": 1.55, - "learning_rate": 9.952130297584032e-07, - "loss": 0.5947, - "step": 60453 - }, - { - "epoch": 1.55, - "learning_rate": 9.9518535962338e-07, - "loss": 0.564, - "step": 60454 - }, - { - "epoch": 1.55, - "learning_rate": 9.951576894920433e-07, - "loss": 0.7627, - "step": 60455 - }, - { - "epoch": 1.55, - "learning_rate": 9.95130019364414e-07, - "loss": 0.5652, - "step": 60456 - }, - { - "epoch": 1.55, - "learning_rate": 9.951023492405135e-07, - "loss": 0.625, - "step": 60457 - }, - { - "epoch": 1.55, - "learning_rate": 9.95074679120363e-07, - "loss": 0.7637, - "step": 60458 - }, - { - "epoch": 1.55, - "learning_rate": 9.950470090039831e-07, - "loss": 0.6499, - "step": 60459 - }, - { - "epoch": 1.55, - "learning_rate": 9.95019338891396e-07, - "loss": 0.6465, - "step": 60460 - }, - { - "epoch": 1.55, - "learning_rate": 9.949916687826223e-07, - "loss": 0.71, - "step": 60461 - }, - { - "epoch": 1.55, - "learning_rate": 9.94963998677683e-07, - "loss": 0.4968, - "step": 60462 - }, - { - "epoch": 1.55, - "learning_rate": 9.949363285765997e-07, - "loss": 0.4373, - "step": 60463 - }, - { - "epoch": 1.55, - "learning_rate": 9.949086584793932e-07, - "loss": 0.8281, - "step": 60464 - }, - { - "epoch": 1.55, - "learning_rate": 9.948809883860853e-07, - "loss": 0.7627, - "step": 60465 - }, - { - "epoch": 1.55, - "learning_rate": 9.948533182966966e-07, - "loss": 0.7373, - "step": 60466 - }, - { - "epoch": 1.55, - "learning_rate": 9.948256482112484e-07, - "loss": 0.6328, - "step": 60467 - }, - { - "epoch": 1.55, - "learning_rate": 9.947979781297621e-07, - "loss": 0.75, - "step": 60468 - }, - { - "epoch": 1.55, - "learning_rate": 9.947703080522586e-07, - "loss": 0.6865, - "step": 60469 - }, - { - "epoch": 1.55, - "learning_rate": 9.947426379787594e-07, - "loss": 0.8193, - "step": 60470 - }, - { - "epoch": 1.55, - "learning_rate": 9.947149679092852e-07, - "loss": 0.6113, - "step": 60471 - }, - { - "epoch": 1.55, - "learning_rate": 9.946872978438578e-07, - "loss": 0.7549, - "step": 60472 - }, - { - "epoch": 1.55, - "learning_rate": 9.94659627782498e-07, - "loss": 0.8779, - "step": 60473 - }, - { - "epoch": 1.55, - "learning_rate": 9.94631957725227e-07, - "loss": 0.7422, - "step": 60474 - }, - { - "epoch": 1.55, - "learning_rate": 9.946042876720666e-07, - "loss": 0.6152, - "step": 60475 - }, - { - "epoch": 1.55, - "learning_rate": 9.94576617623037e-07, - "loss": 0.7129, - "step": 60476 - }, - { - "epoch": 1.55, - "learning_rate": 9.945489475781599e-07, - "loss": 0.6533, - "step": 60477 - }, - { - "epoch": 1.55, - "learning_rate": 9.945212775374563e-07, - "loss": 0.6885, - "step": 60478 - }, - { - "epoch": 1.55, - "learning_rate": 9.944936075009475e-07, - "loss": 0.6963, - "step": 60479 - }, - { - "epoch": 1.55, - "learning_rate": 9.944659374686548e-07, - "loss": 0.7026, - "step": 60480 - }, - { - "epoch": 1.55, - "learning_rate": 9.944382674405992e-07, - "loss": 0.594, - "step": 60481 - }, - { - "epoch": 1.55, - "learning_rate": 9.94410597416802e-07, - "loss": 0.7402, - "step": 60482 - }, - { - "epoch": 1.55, - "learning_rate": 9.943829273972843e-07, - "loss": 0.6196, - "step": 60483 - }, - { - "epoch": 1.55, - "learning_rate": 9.943552573820673e-07, - "loss": 0.6318, - "step": 60484 - }, - { - "epoch": 1.55, - "learning_rate": 9.943275873711728e-07, - "loss": 0.7109, - "step": 60485 - }, - { - "epoch": 1.55, - "learning_rate": 9.942999173646208e-07, - "loss": 0.6011, - "step": 60486 - }, - { - "epoch": 1.55, - "learning_rate": 9.942722473624333e-07, - "loss": 0.8623, - "step": 60487 - }, - { - "epoch": 1.55, - "learning_rate": 9.94244577364631e-07, - "loss": 0.665, - "step": 60488 - }, - { - "epoch": 1.55, - "learning_rate": 9.942169073712355e-07, - "loss": 0.7461, - "step": 60489 - }, - { - "epoch": 1.55, - "learning_rate": 9.941892373822678e-07, - "loss": 0.6675, - "step": 60490 - }, - { - "epoch": 1.55, - "learning_rate": 9.941615673977493e-07, - "loss": 0.5985, - "step": 60491 - }, - { - "epoch": 1.55, - "learning_rate": 9.941338974177007e-07, - "loss": 0.6045, - "step": 60492 - }, - { - "epoch": 1.55, - "learning_rate": 9.94106227442144e-07, - "loss": 0.5308, - "step": 60493 - }, - { - "epoch": 1.55, - "learning_rate": 9.940785574710994e-07, - "loss": 0.8789, - "step": 60494 - }, - { - "epoch": 1.55, - "learning_rate": 9.940508875045891e-07, - "loss": 0.6953, - "step": 60495 - }, - { - "epoch": 1.55, - "learning_rate": 9.940232175426336e-07, - "loss": 0.6416, - "step": 60496 - }, - { - "epoch": 1.55, - "learning_rate": 9.939955475852542e-07, - "loss": 0.7256, - "step": 60497 - }, - { - "epoch": 1.55, - "learning_rate": 9.939678776324719e-07, - "loss": 0.6294, - "step": 60498 - }, - { - "epoch": 1.55, - "learning_rate": 9.939402076843084e-07, - "loss": 0.6426, - "step": 60499 - }, - { - "epoch": 1.55, - "learning_rate": 9.939125377407843e-07, - "loss": 0.6499, - "step": 60500 - }, - { - "epoch": 1.55, - "learning_rate": 9.938848678019214e-07, - "loss": 0.6782, - "step": 60501 - }, - { - "epoch": 1.55, - "learning_rate": 9.938571978677403e-07, - "loss": 0.7051, - "step": 60502 - }, - { - "epoch": 1.55, - "learning_rate": 9.938295279382626e-07, - "loss": 0.8506, - "step": 60503 - }, - { - "epoch": 1.55, - "learning_rate": 9.938018580135092e-07, - "loss": 0.7344, - "step": 60504 - }, - { - "epoch": 1.55, - "learning_rate": 9.93774188093502e-07, - "loss": 0.5771, - "step": 60505 - }, - { - "epoch": 1.55, - "learning_rate": 9.937465181782613e-07, - "loss": 0.5654, - "step": 60506 - }, - { - "epoch": 1.55, - "learning_rate": 9.937188482678082e-07, - "loss": 0.7588, - "step": 60507 - }, - { - "epoch": 1.55, - "learning_rate": 9.936911783621647e-07, - "loss": 0.6196, - "step": 60508 - }, - { - "epoch": 1.55, - "learning_rate": 9.936635084613514e-07, - "loss": 0.7002, - "step": 60509 - }, - { - "epoch": 1.55, - "learning_rate": 9.9363583856539e-07, - "loss": 0.5679, - "step": 60510 - }, - { - "epoch": 1.55, - "learning_rate": 9.936081686743008e-07, - "loss": 0.5186, - "step": 60511 - }, - { - "epoch": 1.55, - "learning_rate": 9.935804987881058e-07, - "loss": 0.7295, - "step": 60512 - }, - { - "epoch": 1.55, - "learning_rate": 9.93552828906826e-07, - "loss": 0.6396, - "step": 60513 - }, - { - "epoch": 1.55, - "learning_rate": 9.935251590304824e-07, - "loss": 0.6719, - "step": 60514 - }, - { - "epoch": 1.55, - "learning_rate": 9.934974891590965e-07, - "loss": 0.543, - "step": 60515 - }, - { - "epoch": 1.55, - "learning_rate": 9.934698192926893e-07, - "loss": 0.7559, - "step": 60516 - }, - { - "epoch": 1.55, - "learning_rate": 9.934421494312816e-07, - "loss": 0.707, - "step": 60517 - }, - { - "epoch": 1.55, - "learning_rate": 9.93414479574895e-07, - "loss": 0.5161, - "step": 60518 - }, - { - "epoch": 1.55, - "learning_rate": 9.933868097235508e-07, - "loss": 0.4829, - "step": 60519 - }, - { - "epoch": 1.55, - "learning_rate": 9.9335913987727e-07, - "loss": 0.4512, - "step": 60520 - }, - { - "epoch": 1.55, - "learning_rate": 9.933314700360735e-07, - "loss": 0.584, - "step": 60521 - }, - { - "epoch": 1.55, - "learning_rate": 9.93303800199983e-07, - "loss": 0.5981, - "step": 60522 - }, - { - "epoch": 1.55, - "learning_rate": 9.932761303690195e-07, - "loss": 0.7036, - "step": 60523 - }, - { - "epoch": 1.55, - "learning_rate": 9.932484605432042e-07, - "loss": 0.7188, - "step": 60524 - }, - { - "epoch": 1.55, - "learning_rate": 9.932207907225586e-07, - "loss": 0.5693, - "step": 60525 - }, - { - "epoch": 1.55, - "learning_rate": 9.93193120907103e-07, - "loss": 0.2461, - "step": 60526 - }, - { - "epoch": 1.55, - "learning_rate": 9.931654510968593e-07, - "loss": 0.7266, - "step": 60527 - }, - { - "epoch": 1.55, - "learning_rate": 9.931377812918484e-07, - "loss": 0.6611, - "step": 60528 - }, - { - "epoch": 1.55, - "learning_rate": 9.931101114920916e-07, - "loss": 0.6899, - "step": 60529 - }, - { - "epoch": 1.55, - "learning_rate": 9.9308244169761e-07, - "loss": 0.6895, - "step": 60530 - }, - { - "epoch": 1.55, - "learning_rate": 9.93054771908425e-07, - "loss": 0.7344, - "step": 60531 - }, - { - "epoch": 1.55, - "learning_rate": 9.930271021245574e-07, - "loss": 0.6841, - "step": 60532 - }, - { - "epoch": 1.55, - "learning_rate": 9.92999432346029e-07, - "loss": 0.752, - "step": 60533 - }, - { - "epoch": 1.55, - "learning_rate": 9.929717625728606e-07, - "loss": 0.6299, - "step": 60534 - }, - { - "epoch": 1.55, - "learning_rate": 9.929440928050734e-07, - "loss": 0.6357, - "step": 60535 - }, - { - "epoch": 1.55, - "learning_rate": 9.929164230426884e-07, - "loss": 0.6592, - "step": 60536 - }, - { - "epoch": 1.55, - "learning_rate": 9.928887532857269e-07, - "loss": 0.5347, - "step": 60537 - }, - { - "epoch": 1.55, - "learning_rate": 9.928610835342101e-07, - "loss": 0.7705, - "step": 60538 - }, - { - "epoch": 1.55, - "learning_rate": 9.928334137881595e-07, - "loss": 0.748, - "step": 60539 - }, - { - "epoch": 1.55, - "learning_rate": 9.92805744047596e-07, - "loss": 0.5693, - "step": 60540 - }, - { - "epoch": 1.55, - "learning_rate": 9.927780743125407e-07, - "loss": 0.4807, - "step": 60541 - }, - { - "epoch": 1.55, - "learning_rate": 9.927504045830148e-07, - "loss": 0.5027, - "step": 60542 - }, - { - "epoch": 1.55, - "learning_rate": 9.927227348590398e-07, - "loss": 0.6377, - "step": 60543 - }, - { - "epoch": 1.55, - "learning_rate": 9.926950651406363e-07, - "loss": 0.7129, - "step": 60544 - }, - { - "epoch": 1.55, - "learning_rate": 9.926673954278264e-07, - "loss": 0.7529, - "step": 60545 - }, - { - "epoch": 1.55, - "learning_rate": 9.926397257206307e-07, - "loss": 0.6045, - "step": 60546 - }, - { - "epoch": 1.55, - "learning_rate": 9.9261205601907e-07, - "loss": 0.6016, - "step": 60547 - }, - { - "epoch": 1.55, - "learning_rate": 9.92584386323166e-07, - "loss": 0.7617, - "step": 60548 - }, - { - "epoch": 1.55, - "learning_rate": 9.925567166329398e-07, - "loss": 0.6133, - "step": 60549 - }, - { - "epoch": 1.55, - "learning_rate": 9.925290469484128e-07, - "loss": 0.5754, - "step": 60550 - }, - { - "epoch": 1.55, - "learning_rate": 9.92501377269606e-07, - "loss": 0.6406, - "step": 60551 - }, - { - "epoch": 1.55, - "learning_rate": 9.924737075965402e-07, - "loss": 0.6665, - "step": 60552 - }, - { - "epoch": 1.55, - "learning_rate": 9.924460379292371e-07, - "loss": 0.7891, - "step": 60553 - }, - { - "epoch": 1.55, - "learning_rate": 9.924183682677176e-07, - "loss": 0.79, - "step": 60554 - }, - { - "epoch": 1.55, - "learning_rate": 9.923906986120035e-07, - "loss": 0.5815, - "step": 60555 - }, - { - "epoch": 1.55, - "learning_rate": 9.923630289621152e-07, - "loss": 0.6855, - "step": 60556 - }, - { - "epoch": 1.55, - "learning_rate": 9.92335359318074e-07, - "loss": 0.6416, - "step": 60557 - }, - { - "epoch": 1.55, - "learning_rate": 9.923076896799013e-07, - "loss": 0.8984, - "step": 60558 - }, - { - "epoch": 1.55, - "learning_rate": 9.922800200476185e-07, - "loss": 0.8232, - "step": 60559 - }, - { - "epoch": 1.55, - "learning_rate": 9.922523504212462e-07, - "loss": 0.7285, - "step": 60560 - }, - { - "epoch": 1.55, - "learning_rate": 9.92224680800806e-07, - "loss": 0.5928, - "step": 60561 - }, - { - "epoch": 1.55, - "learning_rate": 9.921970111863192e-07, - "loss": 0.5542, - "step": 60562 - }, - { - "epoch": 1.55, - "learning_rate": 9.921693415778066e-07, - "loss": 0.5701, - "step": 60563 - }, - { - "epoch": 1.55, - "learning_rate": 9.921416719752897e-07, - "loss": 0.6665, - "step": 60564 - }, - { - "epoch": 1.55, - "learning_rate": 9.921140023787897e-07, - "loss": 0.708, - "step": 60565 - }, - { - "epoch": 1.55, - "learning_rate": 9.920863327883274e-07, - "loss": 0.6016, - "step": 60566 - }, - { - "epoch": 1.55, - "learning_rate": 9.920586632039243e-07, - "loss": 0.7227, - "step": 60567 - }, - { - "epoch": 1.55, - "learning_rate": 9.920309936256017e-07, - "loss": 0.5791, - "step": 60568 - }, - { - "epoch": 1.55, - "learning_rate": 9.920033240533802e-07, - "loss": 0.5645, - "step": 60569 - }, - { - "epoch": 1.55, - "learning_rate": 9.919756544872815e-07, - "loss": 1.0068, - "step": 60570 - }, - { - "epoch": 1.55, - "learning_rate": 9.919479849273268e-07, - "loss": 0.4917, - "step": 60571 - }, - { - "epoch": 1.55, - "learning_rate": 9.919203153735372e-07, - "loss": 0.7275, - "step": 60572 - }, - { - "epoch": 1.55, - "learning_rate": 9.918926458259337e-07, - "loss": 0.7656, - "step": 60573 - }, - { - "epoch": 1.55, - "learning_rate": 9.918649762845376e-07, - "loss": 0.6328, - "step": 60574 - }, - { - "epoch": 1.55, - "learning_rate": 9.918373067493705e-07, - "loss": 0.6147, - "step": 60575 - }, - { - "epoch": 1.55, - "learning_rate": 9.91809637220453e-07, - "loss": 0.6895, - "step": 60576 - }, - { - "epoch": 1.55, - "learning_rate": 9.917819676978064e-07, - "loss": 0.709, - "step": 60577 - }, - { - "epoch": 1.55, - "learning_rate": 9.917542981814518e-07, - "loss": 0.5693, - "step": 60578 - }, - { - "epoch": 1.55, - "learning_rate": 9.917266286714106e-07, - "loss": 0.8076, - "step": 60579 - }, - { - "epoch": 1.55, - "learning_rate": 9.91698959167704e-07, - "loss": 0.6758, - "step": 60580 - }, - { - "epoch": 1.55, - "learning_rate": 9.916712896703532e-07, - "loss": 0.5542, - "step": 60581 - }, - { - "epoch": 1.55, - "learning_rate": 9.916436201793791e-07, - "loss": 0.6694, - "step": 60582 - }, - { - "epoch": 1.55, - "learning_rate": 9.916159506948033e-07, - "loss": 0.6465, - "step": 60583 - }, - { - "epoch": 1.55, - "learning_rate": 9.915882812166472e-07, - "loss": 0.8535, - "step": 60584 - }, - { - "epoch": 1.55, - "learning_rate": 9.91560611744931e-07, - "loss": 0.6675, - "step": 60585 - }, - { - "epoch": 1.55, - "learning_rate": 9.915329422796767e-07, - "loss": 0.6006, - "step": 60586 - }, - { - "epoch": 1.55, - "learning_rate": 9.915052728209052e-07, - "loss": 0.7812, - "step": 60587 - }, - { - "epoch": 1.55, - "learning_rate": 9.914776033686375e-07, - "loss": 0.73, - "step": 60588 - }, - { - "epoch": 1.55, - "learning_rate": 9.914499339228953e-07, - "loss": 0.5088, - "step": 60589 - }, - { - "epoch": 1.55, - "learning_rate": 9.914222644836992e-07, - "loss": 0.6931, - "step": 60590 - }, - { - "epoch": 1.55, - "learning_rate": 9.913945950510707e-07, - "loss": 0.6152, - "step": 60591 - }, - { - "epoch": 1.55, - "learning_rate": 9.91366925625031e-07, - "loss": 0.5117, - "step": 60592 - }, - { - "epoch": 1.55, - "learning_rate": 9.913392562056014e-07, - "loss": 0.5791, - "step": 60593 - }, - { - "epoch": 1.55, - "learning_rate": 9.913115867928032e-07, - "loss": 0.5659, - "step": 60594 - }, - { - "epoch": 1.55, - "learning_rate": 9.91283917386657e-07, - "loss": 0.5684, - "step": 60595 - }, - { - "epoch": 1.55, - "learning_rate": 9.912562479871842e-07, - "loss": 0.5933, - "step": 60596 - }, - { - "epoch": 1.55, - "learning_rate": 9.91228578594406e-07, - "loss": 0.7979, - "step": 60597 - }, - { - "epoch": 1.55, - "learning_rate": 9.91200909208344e-07, - "loss": 0.7637, - "step": 60598 - }, - { - "epoch": 1.55, - "learning_rate": 9.911732398290188e-07, - "loss": 0.7344, - "step": 60599 - }, - { - "epoch": 1.55, - "learning_rate": 9.91145570456452e-07, - "loss": 0.6338, - "step": 60600 - }, - { - "epoch": 1.55, - "learning_rate": 9.911179010906645e-07, - "loss": 0.637, - "step": 60601 - }, - { - "epoch": 1.55, - "learning_rate": 9.910902317316778e-07, - "loss": 0.582, - "step": 60602 - }, - { - "epoch": 1.55, - "learning_rate": 9.910625623795125e-07, - "loss": 0.6821, - "step": 60603 - }, - { - "epoch": 1.55, - "learning_rate": 9.91034893034191e-07, - "loss": 0.6802, - "step": 60604 - }, - { - "epoch": 1.55, - "learning_rate": 9.910072236957331e-07, - "loss": 0.4978, - "step": 60605 - }, - { - "epoch": 1.55, - "learning_rate": 9.909795543641607e-07, - "loss": 0.6211, - "step": 60606 - }, - { - "epoch": 1.55, - "learning_rate": 9.909518850394946e-07, - "loss": 0.5867, - "step": 60607 - }, - { - "epoch": 1.55, - "learning_rate": 9.909242157217565e-07, - "loss": 0.5938, - "step": 60608 - }, - { - "epoch": 1.55, - "learning_rate": 9.90896546410967e-07, - "loss": 0.5732, - "step": 60609 - }, - { - "epoch": 1.55, - "learning_rate": 9.908688771071477e-07, - "loss": 0.5112, - "step": 60610 - }, - { - "epoch": 1.55, - "learning_rate": 9.908412078103198e-07, - "loss": 0.6118, - "step": 60611 - }, - { - "epoch": 1.55, - "learning_rate": 9.908135385205044e-07, - "loss": 0.6572, - "step": 60612 - }, - { - "epoch": 1.55, - "learning_rate": 9.907858692377225e-07, - "loss": 0.5695, - "step": 60613 - }, - { - "epoch": 1.55, - "learning_rate": 9.907581999619956e-07, - "loss": 0.6655, - "step": 60614 - }, - { - "epoch": 1.55, - "learning_rate": 9.907305306933448e-07, - "loss": 0.7793, - "step": 60615 - }, - { - "epoch": 1.55, - "learning_rate": 9.90702861431791e-07, - "loss": 0.5444, - "step": 60616 - }, - { - "epoch": 1.55, - "learning_rate": 9.906751921773557e-07, - "loss": 0.6816, - "step": 60617 - }, - { - "epoch": 1.55, - "learning_rate": 9.906475229300597e-07, - "loss": 0.7031, - "step": 60618 - }, - { - "epoch": 1.55, - "learning_rate": 9.906198536899249e-07, - "loss": 0.6333, - "step": 60619 - }, - { - "epoch": 1.55, - "learning_rate": 9.905921844569716e-07, - "loss": 0.5903, - "step": 60620 - }, - { - "epoch": 1.55, - "learning_rate": 9.905645152312218e-07, - "loss": 0.6431, - "step": 60621 - }, - { - "epoch": 1.55, - "learning_rate": 9.905368460126959e-07, - "loss": 0.488, - "step": 60622 - }, - { - "epoch": 1.55, - "learning_rate": 9.90509176801416e-07, - "loss": 0.6406, - "step": 60623 - }, - { - "epoch": 1.55, - "learning_rate": 9.904815075974028e-07, - "loss": 0.7051, - "step": 60624 - }, - { - "epoch": 1.55, - "learning_rate": 9.904538384006772e-07, - "loss": 0.5442, - "step": 60625 - }, - { - "epoch": 1.55, - "learning_rate": 9.904261692112606e-07, - "loss": 0.6787, - "step": 60626 - }, - { - "epoch": 1.55, - "learning_rate": 9.903985000291743e-07, - "loss": 0.6787, - "step": 60627 - }, - { - "epoch": 1.55, - "learning_rate": 9.903708308544393e-07, - "loss": 0.8682, - "step": 60628 - }, - { - "epoch": 1.55, - "learning_rate": 9.903431616870772e-07, - "loss": 0.7822, - "step": 60629 - }, - { - "epoch": 1.55, - "learning_rate": 9.903154925271088e-07, - "loss": 0.71, - "step": 60630 - }, - { - "epoch": 1.55, - "learning_rate": 9.902878233745553e-07, - "loss": 0.4467, - "step": 60631 - }, - { - "epoch": 1.55, - "learning_rate": 9.902601542294379e-07, - "loss": 0.4531, - "step": 60632 - }, - { - "epoch": 1.55, - "learning_rate": 9.90232485091778e-07, - "loss": 0.7158, - "step": 60633 - }, - { - "epoch": 1.55, - "learning_rate": 9.90204815961597e-07, - "loss": 0.7373, - "step": 60634 - }, - { - "epoch": 1.55, - "learning_rate": 9.901771468389152e-07, - "loss": 0.605, - "step": 60635 - }, - { - "epoch": 1.55, - "learning_rate": 9.901494777237544e-07, - "loss": 0.6533, - "step": 60636 - }, - { - "epoch": 1.55, - "learning_rate": 9.901218086161355e-07, - "loss": 0.9014, - "step": 60637 - }, - { - "epoch": 1.55, - "learning_rate": 9.900941395160803e-07, - "loss": 0.7305, - "step": 60638 - }, - { - "epoch": 1.55, - "learning_rate": 9.900664704236092e-07, - "loss": 0.583, - "step": 60639 - }, - { - "epoch": 1.55, - "learning_rate": 9.90038801338744e-07, - "loss": 0.6069, - "step": 60640 - }, - { - "epoch": 1.55, - "learning_rate": 9.900111322615055e-07, - "loss": 0.5979, - "step": 60641 - }, - { - "epoch": 1.55, - "learning_rate": 9.89983463191915e-07, - "loss": 0.5586, - "step": 60642 - }, - { - "epoch": 1.55, - "learning_rate": 9.89955794129994e-07, - "loss": 0.6514, - "step": 60643 - }, - { - "epoch": 1.55, - "learning_rate": 9.899281250757634e-07, - "loss": 0.6704, - "step": 60644 - }, - { - "epoch": 1.55, - "learning_rate": 9.899004560292438e-07, - "loss": 0.7222, - "step": 60645 - }, - { - "epoch": 1.55, - "learning_rate": 9.898727869904574e-07, - "loss": 0.4342, - "step": 60646 - }, - { - "epoch": 1.55, - "learning_rate": 9.898451179594248e-07, - "loss": 0.5474, - "step": 60647 - }, - { - "epoch": 1.55, - "learning_rate": 9.898174489361673e-07, - "loss": 0.6172, - "step": 60648 - }, - { - "epoch": 1.55, - "learning_rate": 9.89789779920706e-07, - "loss": 0.5228, - "step": 60649 - }, - { - "epoch": 1.55, - "learning_rate": 9.897621109130626e-07, - "loss": 0.7666, - "step": 60650 - }, - { - "epoch": 1.55, - "learning_rate": 9.897344419132573e-07, - "loss": 0.4736, - "step": 60651 - }, - { - "epoch": 1.55, - "learning_rate": 9.897067729213123e-07, - "loss": 0.6953, - "step": 60652 - }, - { - "epoch": 1.55, - "learning_rate": 9.896791039372482e-07, - "loss": 0.6416, - "step": 60653 - }, - { - "epoch": 1.55, - "learning_rate": 9.896514349610866e-07, - "loss": 0.7266, - "step": 60654 - }, - { - "epoch": 1.55, - "learning_rate": 9.896237659928483e-07, - "loss": 0.6826, - "step": 60655 - }, - { - "epoch": 1.55, - "learning_rate": 9.895960970325544e-07, - "loss": 0.5879, - "step": 60656 - }, - { - "epoch": 1.55, - "learning_rate": 9.895684280802264e-07, - "loss": 0.5605, - "step": 60657 - }, - { - "epoch": 1.55, - "learning_rate": 9.895407591358852e-07, - "loss": 0.6375, - "step": 60658 - }, - { - "epoch": 1.55, - "learning_rate": 9.895130901995526e-07, - "loss": 0.6621, - "step": 60659 - }, - { - "epoch": 1.55, - "learning_rate": 9.89485421271249e-07, - "loss": 0.7173, - "step": 60660 - }, - { - "epoch": 1.55, - "learning_rate": 9.89457752350996e-07, - "loss": 0.665, - "step": 60661 - }, - { - "epoch": 1.55, - "learning_rate": 9.894300834388147e-07, - "loss": 0.5425, - "step": 60662 - }, - { - "epoch": 1.55, - "learning_rate": 9.894024145347263e-07, - "loss": 0.6475, - "step": 60663 - }, - { - "epoch": 1.55, - "learning_rate": 9.893747456387522e-07, - "loss": 0.5139, - "step": 60664 - }, - { - "epoch": 1.55, - "learning_rate": 9.893470767509132e-07, - "loss": 0.5759, - "step": 60665 - }, - { - "epoch": 1.55, - "learning_rate": 9.893194078712305e-07, - "loss": 0.5042, - "step": 60666 - }, - { - "epoch": 1.55, - "learning_rate": 9.892917389997256e-07, - "loss": 0.749, - "step": 60667 - }, - { - "epoch": 1.55, - "learning_rate": 9.892640701364194e-07, - "loss": 0.6646, - "step": 60668 - }, - { - "epoch": 1.55, - "learning_rate": 9.892364012813333e-07, - "loss": 0.7021, - "step": 60669 - }, - { - "epoch": 1.56, - "learning_rate": 9.892087324344884e-07, - "loss": 0.604, - "step": 60670 - }, - { - "epoch": 1.56, - "learning_rate": 9.89181063595906e-07, - "loss": 0.7666, - "step": 60671 - }, - { - "epoch": 1.56, - "learning_rate": 9.891533947656067e-07, - "loss": 0.6675, - "step": 60672 - }, - { - "epoch": 1.56, - "learning_rate": 9.891257259436127e-07, - "loss": 0.748, - "step": 60673 - }, - { - "epoch": 1.56, - "learning_rate": 9.890980571299446e-07, - "loss": 0.7588, - "step": 60674 - }, - { - "epoch": 1.56, - "learning_rate": 9.890703883246234e-07, - "loss": 0.7588, - "step": 60675 - }, - { - "epoch": 1.56, - "learning_rate": 9.890427195276704e-07, - "loss": 0.6797, - "step": 60676 - }, - { - "epoch": 1.56, - "learning_rate": 9.890150507391071e-07, - "loss": 0.7549, - "step": 60677 - }, - { - "epoch": 1.56, - "learning_rate": 9.889873819589544e-07, - "loss": 0.5635, - "step": 60678 - }, - { - "epoch": 1.56, - "learning_rate": 9.889597131872335e-07, - "loss": 0.5991, - "step": 60679 - }, - { - "epoch": 1.56, - "learning_rate": 9.889320444239656e-07, - "loss": 0.6689, - "step": 60680 - }, - { - "epoch": 1.56, - "learning_rate": 9.88904375669172e-07, - "loss": 0.6748, - "step": 60681 - }, - { - "epoch": 1.56, - "learning_rate": 9.888767069228737e-07, - "loss": 0.5649, - "step": 60682 - }, - { - "epoch": 1.56, - "learning_rate": 9.888490381850923e-07, - "loss": 0.748, - "step": 60683 - }, - { - "epoch": 1.56, - "learning_rate": 9.888213694558486e-07, - "loss": 0.5127, - "step": 60684 - }, - { - "epoch": 1.56, - "learning_rate": 9.887937007351636e-07, - "loss": 0.6675, - "step": 60685 - }, - { - "epoch": 1.56, - "learning_rate": 9.887660320230592e-07, - "loss": 0.5952, - "step": 60686 - }, - { - "epoch": 1.56, - "learning_rate": 9.887383633195556e-07, - "loss": 0.5259, - "step": 60687 - }, - { - "epoch": 1.56, - "learning_rate": 9.887106946246747e-07, - "loss": 0.6699, - "step": 60688 - }, - { - "epoch": 1.56, - "learning_rate": 9.886830259384374e-07, - "loss": 0.4629, - "step": 60689 - }, - { - "epoch": 1.56, - "learning_rate": 9.886553572608653e-07, - "loss": 0.6309, - "step": 60690 - }, - { - "epoch": 1.56, - "learning_rate": 9.88627688591979e-07, - "loss": 0.7676, - "step": 60691 - }, - { - "epoch": 1.56, - "learning_rate": 9.886000199318e-07, - "loss": 0.7646, - "step": 60692 - }, - { - "epoch": 1.56, - "learning_rate": 9.885723512803494e-07, - "loss": 0.7842, - "step": 60693 - }, - { - "epoch": 1.56, - "learning_rate": 9.885446826376492e-07, - "loss": 0.6826, - "step": 60694 - }, - { - "epoch": 1.56, - "learning_rate": 9.88517014003719e-07, - "loss": 0.5723, - "step": 60695 - }, - { - "epoch": 1.56, - "learning_rate": 9.884893453785809e-07, - "loss": 0.6177, - "step": 60696 - }, - { - "epoch": 1.56, - "learning_rate": 9.884616767622558e-07, - "loss": 0.563, - "step": 60697 - }, - { - "epoch": 1.56, - "learning_rate": 9.884340081547655e-07, - "loss": 0.6418, - "step": 60698 - }, - { - "epoch": 1.56, - "learning_rate": 9.884063395561302e-07, - "loss": 0.5928, - "step": 60699 - }, - { - "epoch": 1.56, - "learning_rate": 9.883786709663721e-07, - "loss": 0.6182, - "step": 60700 - }, - { - "epoch": 1.56, - "learning_rate": 9.883510023855117e-07, - "loss": 0.5571, - "step": 60701 - }, - { - "epoch": 1.56, - "learning_rate": 9.883233338135705e-07, - "loss": 0.5728, - "step": 60702 - }, - { - "epoch": 1.56, - "learning_rate": 9.882956652505695e-07, - "loss": 0.3381, - "step": 60703 - }, - { - "epoch": 1.56, - "learning_rate": 9.882679966965303e-07, - "loss": 0.6675, - "step": 60704 - }, - { - "epoch": 1.56, - "learning_rate": 9.882403281514735e-07, - "loss": 0.6191, - "step": 60705 - }, - { - "epoch": 1.56, - "learning_rate": 9.882126596154202e-07, - "loss": 0.7852, - "step": 60706 - }, - { - "epoch": 1.56, - "learning_rate": 9.881849910883925e-07, - "loss": 0.47, - "step": 60707 - }, - { - "epoch": 1.56, - "learning_rate": 9.881573225704105e-07, - "loss": 0.5353, - "step": 60708 - }, - { - "epoch": 1.56, - "learning_rate": 9.881296540614964e-07, - "loss": 0.5688, - "step": 60709 - }, - { - "epoch": 1.56, - "learning_rate": 9.881019855616705e-07, - "loss": 0.6406, - "step": 60710 - }, - { - "epoch": 1.56, - "learning_rate": 9.880743170709545e-07, - "loss": 0.6504, - "step": 60711 - }, - { - "epoch": 1.56, - "learning_rate": 9.880466485893693e-07, - "loss": 0.6973, - "step": 60712 - }, - { - "epoch": 1.56, - "learning_rate": 9.880189801169364e-07, - "loss": 0.6289, - "step": 60713 - }, - { - "epoch": 1.56, - "learning_rate": 9.879913116536772e-07, - "loss": 0.6094, - "step": 60714 - }, - { - "epoch": 1.56, - "learning_rate": 9.87963643199612e-07, - "loss": 0.8193, - "step": 60715 - }, - { - "epoch": 1.56, - "learning_rate": 9.879359747547626e-07, - "loss": 0.644, - "step": 60716 - }, - { - "epoch": 1.56, - "learning_rate": 9.879083063191501e-07, - "loss": 0.4155, - "step": 60717 - }, - { - "epoch": 1.56, - "learning_rate": 9.878806378927954e-07, - "loss": 0.5391, - "step": 60718 - }, - { - "epoch": 1.56, - "learning_rate": 9.878529694757202e-07, - "loss": 0.4857, - "step": 60719 - }, - { - "epoch": 1.56, - "learning_rate": 9.878253010679453e-07, - "loss": 0.7021, - "step": 60720 - }, - { - "epoch": 1.56, - "learning_rate": 9.87797632669492e-07, - "loss": 0.583, - "step": 60721 - }, - { - "epoch": 1.56, - "learning_rate": 9.877699642803814e-07, - "loss": 0.53, - "step": 60722 - }, - { - "epoch": 1.56, - "learning_rate": 9.87742295900635e-07, - "loss": 0.6841, - "step": 60723 - }, - { - "epoch": 1.56, - "learning_rate": 9.87714627530274e-07, - "loss": 0.6748, - "step": 60724 - }, - { - "epoch": 1.56, - "learning_rate": 9.87686959169319e-07, - "loss": 0.7324, - "step": 60725 - }, - { - "epoch": 1.56, - "learning_rate": 9.876592908177917e-07, - "loss": 0.6982, - "step": 60726 - }, - { - "epoch": 1.56, - "learning_rate": 9.876316224757128e-07, - "loss": 0.6797, - "step": 60727 - }, - { - "epoch": 1.56, - "learning_rate": 9.876039541431041e-07, - "loss": 0.6694, - "step": 60728 - }, - { - "epoch": 1.56, - "learning_rate": 9.875762858199863e-07, - "loss": 0.5552, - "step": 60729 - }, - { - "epoch": 1.56, - "learning_rate": 9.875486175063808e-07, - "loss": 0.6475, - "step": 60730 - }, - { - "epoch": 1.56, - "learning_rate": 9.875209492023087e-07, - "loss": 0.6997, - "step": 60731 - }, - { - "epoch": 1.56, - "learning_rate": 9.874932809077913e-07, - "loss": 0.458, - "step": 60732 - }, - { - "epoch": 1.56, - "learning_rate": 9.874656126228499e-07, - "loss": 0.6084, - "step": 60733 - }, - { - "epoch": 1.56, - "learning_rate": 9.874379443475055e-07, - "loss": 0.5913, - "step": 60734 - }, - { - "epoch": 1.56, - "learning_rate": 9.87410276081779e-07, - "loss": 0.6626, - "step": 60735 - }, - { - "epoch": 1.56, - "learning_rate": 9.873826078256921e-07, - "loss": 0.606, - "step": 60736 - }, - { - "epoch": 1.56, - "learning_rate": 9.873549395792655e-07, - "loss": 0.6388, - "step": 60737 - }, - { - "epoch": 1.56, - "learning_rate": 9.873272713425208e-07, - "loss": 0.6406, - "step": 60738 - }, - { - "epoch": 1.56, - "learning_rate": 9.87299603115479e-07, - "loss": 0.7197, - "step": 60739 - }, - { - "epoch": 1.56, - "learning_rate": 9.872719348981614e-07, - "loss": 0.5583, - "step": 60740 - }, - { - "epoch": 1.56, - "learning_rate": 9.872442666905888e-07, - "loss": 0.6348, - "step": 60741 - }, - { - "epoch": 1.56, - "learning_rate": 9.872165984927831e-07, - "loss": 0.6738, - "step": 60742 - }, - { - "epoch": 1.56, - "learning_rate": 9.871889303047647e-07, - "loss": 0.6094, - "step": 60743 - }, - { - "epoch": 1.56, - "learning_rate": 9.871612621265555e-07, - "loss": 0.7002, - "step": 60744 - }, - { - "epoch": 1.56, - "learning_rate": 9.871335939581762e-07, - "loss": 0.624, - "step": 60745 - }, - { - "epoch": 1.56, - "learning_rate": 9.87105925799648e-07, - "loss": 0.6882, - "step": 60746 - }, - { - "epoch": 1.56, - "learning_rate": 9.870782576509923e-07, - "loss": 0.5571, - "step": 60747 - }, - { - "epoch": 1.56, - "learning_rate": 9.8705058951223e-07, - "loss": 0.7202, - "step": 60748 - }, - { - "epoch": 1.56, - "learning_rate": 9.870229213833826e-07, - "loss": 0.7295, - "step": 60749 - }, - { - "epoch": 1.56, - "learning_rate": 9.869952532644715e-07, - "loss": 0.5601, - "step": 60750 - }, - { - "epoch": 1.56, - "learning_rate": 9.86967585155517e-07, - "loss": 0.5586, - "step": 60751 - }, - { - "epoch": 1.56, - "learning_rate": 9.86939917056541e-07, - "loss": 0.6172, - "step": 60752 - }, - { - "epoch": 1.56, - "learning_rate": 9.869122489675645e-07, - "loss": 0.5552, - "step": 60753 - }, - { - "epoch": 1.56, - "learning_rate": 9.86884580888609e-07, - "loss": 0.7637, - "step": 60754 - }, - { - "epoch": 1.56, - "learning_rate": 9.868569128196952e-07, - "loss": 0.6436, - "step": 60755 - }, - { - "epoch": 1.56, - "learning_rate": 9.868292447608442e-07, - "loss": 0.6025, - "step": 60756 - }, - { - "epoch": 1.56, - "learning_rate": 9.868015767120775e-07, - "loss": 0.5936, - "step": 60757 - }, - { - "epoch": 1.56, - "learning_rate": 9.867739086734162e-07, - "loss": 0.7051, - "step": 60758 - }, - { - "epoch": 1.56, - "learning_rate": 9.867462406448818e-07, - "loss": 0.561, - "step": 60759 - }, - { - "epoch": 1.56, - "learning_rate": 9.867185726264948e-07, - "loss": 0.6196, - "step": 60760 - }, - { - "epoch": 1.56, - "learning_rate": 9.866909046182771e-07, - "loss": 0.7471, - "step": 60761 - }, - { - "epoch": 1.56, - "learning_rate": 9.866632366202493e-07, - "loss": 0.7998, - "step": 60762 - }, - { - "epoch": 1.56, - "learning_rate": 9.866355686324332e-07, - "loss": 0.7339, - "step": 60763 - }, - { - "epoch": 1.56, - "learning_rate": 9.866079006548497e-07, - "loss": 0.7197, - "step": 60764 - }, - { - "epoch": 1.56, - "learning_rate": 9.865802326875194e-07, - "loss": 0.8125, - "step": 60765 - }, - { - "epoch": 1.56, - "learning_rate": 9.865525647304644e-07, - "loss": 0.709, - "step": 60766 - }, - { - "epoch": 1.56, - "learning_rate": 9.865248967837055e-07, - "loss": 0.5068, - "step": 60767 - }, - { - "epoch": 1.56, - "learning_rate": 9.864972288472634e-07, - "loss": 0.5835, - "step": 60768 - }, - { - "epoch": 1.56, - "learning_rate": 9.8646956092116e-07, - "loss": 0.3438, - "step": 60769 - }, - { - "epoch": 1.56, - "learning_rate": 9.864418930054164e-07, - "loss": 0.793, - "step": 60770 - }, - { - "epoch": 1.56, - "learning_rate": 9.864142251000535e-07, - "loss": 0.7266, - "step": 60771 - }, - { - "epoch": 1.56, - "learning_rate": 9.863865572050925e-07, - "loss": 0.7617, - "step": 60772 - }, - { - "epoch": 1.56, - "learning_rate": 9.863588893205548e-07, - "loss": 0.585, - "step": 60773 - }, - { - "epoch": 1.56, - "learning_rate": 9.863312214464618e-07, - "loss": 0.7959, - "step": 60774 - }, - { - "epoch": 1.56, - "learning_rate": 9.86303553582834e-07, - "loss": 0.665, - "step": 60775 - }, - { - "epoch": 1.56, - "learning_rate": 9.86275885729693e-07, - "loss": 0.7383, - "step": 60776 - }, - { - "epoch": 1.56, - "learning_rate": 9.862482178870598e-07, - "loss": 0.6436, - "step": 60777 - }, - { - "epoch": 1.56, - "learning_rate": 9.862205500549557e-07, - "loss": 0.6738, - "step": 60778 - }, - { - "epoch": 1.56, - "learning_rate": 9.861928822334018e-07, - "loss": 0.6846, - "step": 60779 - }, - { - "epoch": 1.56, - "learning_rate": 9.861652144224198e-07, - "loss": 0.4863, - "step": 60780 - }, - { - "epoch": 1.56, - "learning_rate": 9.861375466220299e-07, - "loss": 0.7559, - "step": 60781 - }, - { - "epoch": 1.56, - "learning_rate": 9.861098788322544e-07, - "loss": 0.6362, - "step": 60782 - }, - { - "epoch": 1.56, - "learning_rate": 9.860822110531135e-07, - "loss": 0.48, - "step": 60783 - }, - { - "epoch": 1.56, - "learning_rate": 9.860545432846295e-07, - "loss": 0.6499, - "step": 60784 - }, - { - "epoch": 1.56, - "learning_rate": 9.860268755268222e-07, - "loss": 0.5376, - "step": 60785 - }, - { - "epoch": 1.56, - "learning_rate": 9.859992077797139e-07, - "loss": 0.6455, - "step": 60786 - }, - { - "epoch": 1.56, - "learning_rate": 9.85971540043325e-07, - "loss": 0.6973, - "step": 60787 - }, - { - "epoch": 1.56, - "learning_rate": 9.859438723176772e-07, - "loss": 0.6606, - "step": 60788 - }, - { - "epoch": 1.56, - "learning_rate": 9.859162046027913e-07, - "loss": 0.6411, - "step": 60789 - }, - { - "epoch": 1.56, - "learning_rate": 9.85888536898689e-07, - "loss": 0.8457, - "step": 60790 - }, - { - "epoch": 1.56, - "learning_rate": 9.85860869205391e-07, - "loss": 0.7627, - "step": 60791 - }, - { - "epoch": 1.56, - "learning_rate": 9.85833201522919e-07, - "loss": 0.5786, - "step": 60792 - }, - { - "epoch": 1.56, - "learning_rate": 9.858055338512935e-07, - "loss": 0.6172, - "step": 60793 - }, - { - "epoch": 1.56, - "learning_rate": 9.857778661905366e-07, - "loss": 0.6255, - "step": 60794 - }, - { - "epoch": 1.56, - "learning_rate": 9.857501985406685e-07, - "loss": 0.6504, - "step": 60795 - }, - { - "epoch": 1.56, - "learning_rate": 9.857225309017108e-07, - "loss": 0.6826, - "step": 60796 - }, - { - "epoch": 1.56, - "learning_rate": 9.856948632736849e-07, - "loss": 0.6787, - "step": 60797 - }, - { - "epoch": 1.56, - "learning_rate": 9.856671956566113e-07, - "loss": 0.625, - "step": 60798 - }, - { - "epoch": 1.56, - "learning_rate": 9.856395280505121e-07, - "loss": 0.7061, - "step": 60799 - }, - { - "epoch": 1.56, - "learning_rate": 9.85611860455408e-07, - "loss": 0.7451, - "step": 60800 - }, - { - "epoch": 1.56, - "learning_rate": 9.855841928713203e-07, - "loss": 0.5212, - "step": 60801 - }, - { - "epoch": 1.56, - "learning_rate": 9.8555652529827e-07, - "loss": 0.6992, - "step": 60802 - }, - { - "epoch": 1.56, - "learning_rate": 9.855288577362784e-07, - "loss": 0.6685, - "step": 60803 - }, - { - "epoch": 1.56, - "learning_rate": 9.85501190185367e-07, - "loss": 0.708, - "step": 60804 - }, - { - "epoch": 1.56, - "learning_rate": 9.854735226455564e-07, - "loss": 0.6108, - "step": 60805 - }, - { - "epoch": 1.56, - "learning_rate": 9.85445855116868e-07, - "loss": 0.7012, - "step": 60806 - }, - { - "epoch": 1.56, - "learning_rate": 9.854181875993232e-07, - "loss": 0.6895, - "step": 60807 - }, - { - "epoch": 1.56, - "learning_rate": 9.853905200929429e-07, - "loss": 0.8359, - "step": 60808 - }, - { - "epoch": 1.56, - "learning_rate": 9.853628525977485e-07, - "loss": 0.5256, - "step": 60809 - }, - { - "epoch": 1.56, - "learning_rate": 9.853351851137607e-07, - "loss": 0.7397, - "step": 60810 - }, - { - "epoch": 1.56, - "learning_rate": 9.853075176410017e-07, - "loss": 0.7256, - "step": 60811 - }, - { - "epoch": 1.56, - "learning_rate": 9.852798501794917e-07, - "loss": 0.5217, - "step": 60812 - }, - { - "epoch": 1.56, - "learning_rate": 9.85252182729252e-07, - "loss": 0.6836, - "step": 60813 - }, - { - "epoch": 1.56, - "learning_rate": 9.852245152903049e-07, - "loss": 0.6479, - "step": 60814 - }, - { - "epoch": 1.56, - "learning_rate": 9.851968478626698e-07, - "loss": 0.6162, - "step": 60815 - }, - { - "epoch": 1.56, - "learning_rate": 9.851691804463693e-07, - "loss": 0.6235, - "step": 60816 - }, - { - "epoch": 1.56, - "learning_rate": 9.851415130414238e-07, - "loss": 0.8105, - "step": 60817 - }, - { - "epoch": 1.56, - "learning_rate": 9.851138456478549e-07, - "loss": 0.7793, - "step": 60818 - }, - { - "epoch": 1.56, - "learning_rate": 9.850861782656835e-07, - "loss": 0.8496, - "step": 60819 - }, - { - "epoch": 1.56, - "learning_rate": 9.850585108949311e-07, - "loss": 0.7529, - "step": 60820 - }, - { - "epoch": 1.56, - "learning_rate": 9.850308435356186e-07, - "loss": 0.6758, - "step": 60821 - }, - { - "epoch": 1.56, - "learning_rate": 9.850031761877673e-07, - "loss": 0.7451, - "step": 60822 - }, - { - "epoch": 1.56, - "learning_rate": 9.849755088513985e-07, - "loss": 0.5602, - "step": 60823 - }, - { - "epoch": 1.56, - "learning_rate": 9.849478415265334e-07, - "loss": 0.4722, - "step": 60824 - }, - { - "epoch": 1.56, - "learning_rate": 9.849201742131927e-07, - "loss": 0.7061, - "step": 60825 - }, - { - "epoch": 1.56, - "learning_rate": 9.848925069113981e-07, - "loss": 0.8359, - "step": 60826 - }, - { - "epoch": 1.56, - "learning_rate": 9.848648396211705e-07, - "loss": 0.5546, - "step": 60827 - }, - { - "epoch": 1.56, - "learning_rate": 9.848371723425315e-07, - "loss": 0.5664, - "step": 60828 - }, - { - "epoch": 1.56, - "learning_rate": 9.848095050755015e-07, - "loss": 0.6211, - "step": 60829 - }, - { - "epoch": 1.56, - "learning_rate": 9.847818378201025e-07, - "loss": 0.563, - "step": 60830 - }, - { - "epoch": 1.56, - "learning_rate": 9.847541705763552e-07, - "loss": 0.6475, - "step": 60831 - }, - { - "epoch": 1.56, - "learning_rate": 9.84726503344281e-07, - "loss": 0.7334, - "step": 60832 - }, - { - "epoch": 1.56, - "learning_rate": 9.846988361239009e-07, - "loss": 0.5088, - "step": 60833 - }, - { - "epoch": 1.56, - "learning_rate": 9.846711689152366e-07, - "loss": 0.6567, - "step": 60834 - }, - { - "epoch": 1.56, - "learning_rate": 9.846435017183085e-07, - "loss": 0.668, - "step": 60835 - }, - { - "epoch": 1.56, - "learning_rate": 9.846158345331381e-07, - "loss": 0.5813, - "step": 60836 - }, - { - "epoch": 1.56, - "learning_rate": 9.84588167359747e-07, - "loss": 0.7031, - "step": 60837 - }, - { - "epoch": 1.56, - "learning_rate": 9.845605001981557e-07, - "loss": 0.5449, - "step": 60838 - }, - { - "epoch": 1.56, - "learning_rate": 9.84532833048386e-07, - "loss": 0.6978, - "step": 60839 - }, - { - "epoch": 1.56, - "learning_rate": 9.845051659104584e-07, - "loss": 0.6602, - "step": 60840 - }, - { - "epoch": 1.56, - "learning_rate": 9.844774987843946e-07, - "loss": 0.6191, - "step": 60841 - }, - { - "epoch": 1.56, - "learning_rate": 9.84449831670216e-07, - "loss": 0.6973, - "step": 60842 - }, - { - "epoch": 1.56, - "learning_rate": 9.84422164567943e-07, - "loss": 0.4824, - "step": 60843 - }, - { - "epoch": 1.56, - "learning_rate": 9.84394497477598e-07, - "loss": 0.5425, - "step": 60844 - }, - { - "epoch": 1.56, - "learning_rate": 9.843668303992007e-07, - "loss": 0.7871, - "step": 60845 - }, - { - "epoch": 1.56, - "learning_rate": 9.843391633327731e-07, - "loss": 0.5996, - "step": 60846 - }, - { - "epoch": 1.56, - "learning_rate": 9.843114962783363e-07, - "loss": 0.7021, - "step": 60847 - }, - { - "epoch": 1.56, - "learning_rate": 9.842838292359115e-07, - "loss": 0.6104, - "step": 60848 - }, - { - "epoch": 1.56, - "learning_rate": 9.842561622055199e-07, - "loss": 0.6758, - "step": 60849 - }, - { - "epoch": 1.56, - "learning_rate": 9.842284951871826e-07, - "loss": 0.5513, - "step": 60850 - }, - { - "epoch": 1.56, - "learning_rate": 9.842008281809208e-07, - "loss": 0.5596, - "step": 60851 - }, - { - "epoch": 1.56, - "learning_rate": 9.841731611867557e-07, - "loss": 0.4653, - "step": 60852 - }, - { - "epoch": 1.56, - "learning_rate": 9.841454942047087e-07, - "loss": 0.6558, - "step": 60853 - }, - { - "epoch": 1.56, - "learning_rate": 9.841178272348007e-07, - "loss": 0.6738, - "step": 60854 - }, - { - "epoch": 1.56, - "learning_rate": 9.840901602770527e-07, - "loss": 0.6777, - "step": 60855 - }, - { - "epoch": 1.56, - "learning_rate": 9.840624933314864e-07, - "loss": 0.7256, - "step": 60856 - }, - { - "epoch": 1.56, - "learning_rate": 9.840348263981226e-07, - "loss": 0.6201, - "step": 60857 - }, - { - "epoch": 1.56, - "learning_rate": 9.840071594769825e-07, - "loss": 0.6753, - "step": 60858 - }, - { - "epoch": 1.56, - "learning_rate": 9.839794925680874e-07, - "loss": 0.7007, - "step": 60859 - }, - { - "epoch": 1.56, - "learning_rate": 9.839518256714583e-07, - "loss": 0.5044, - "step": 60860 - }, - { - "epoch": 1.56, - "learning_rate": 9.83924158787117e-07, - "loss": 0.8047, - "step": 60861 - }, - { - "epoch": 1.56, - "learning_rate": 9.838964919150839e-07, - "loss": 0.583, - "step": 60862 - }, - { - "epoch": 1.56, - "learning_rate": 9.838688250553806e-07, - "loss": 0.6885, - "step": 60863 - }, - { - "epoch": 1.56, - "learning_rate": 9.838411582080286e-07, - "loss": 0.6973, - "step": 60864 - }, - { - "epoch": 1.56, - "learning_rate": 9.83813491373048e-07, - "loss": 0.6914, - "step": 60865 - }, - { - "epoch": 1.56, - "learning_rate": 9.837858245504611e-07, - "loss": 0.6553, - "step": 60866 - }, - { - "epoch": 1.56, - "learning_rate": 9.837581577402885e-07, - "loss": 0.7246, - "step": 60867 - }, - { - "epoch": 1.56, - "learning_rate": 9.837304909425516e-07, - "loss": 0.6143, - "step": 60868 - }, - { - "epoch": 1.56, - "learning_rate": 9.837028241572712e-07, - "loss": 0.6182, - "step": 60869 - }, - { - "epoch": 1.56, - "learning_rate": 9.83675157384469e-07, - "loss": 0.5664, - "step": 60870 - }, - { - "epoch": 1.56, - "learning_rate": 9.83647490624166e-07, - "loss": 0.4873, - "step": 60871 - }, - { - "epoch": 1.56, - "learning_rate": 9.836198238763835e-07, - "loss": 0.5488, - "step": 60872 - }, - { - "epoch": 1.56, - "learning_rate": 9.835921571411428e-07, - "loss": 0.7588, - "step": 60873 - }, - { - "epoch": 1.56, - "learning_rate": 9.835644904184645e-07, - "loss": 0.7666, - "step": 60874 - }, - { - "epoch": 1.56, - "learning_rate": 9.8353682370837e-07, - "loss": 0.5935, - "step": 60875 - }, - { - "epoch": 1.56, - "learning_rate": 9.835091570108808e-07, - "loss": 0.6777, - "step": 60876 - }, - { - "epoch": 1.56, - "learning_rate": 9.834814903260177e-07, - "loss": 0.6758, - "step": 60877 - }, - { - "epoch": 1.56, - "learning_rate": 9.834538236538022e-07, - "loss": 0.6621, - "step": 60878 - }, - { - "epoch": 1.56, - "learning_rate": 9.83426156994255e-07, - "loss": 0.6001, - "step": 60879 - }, - { - "epoch": 1.56, - "learning_rate": 9.83398490347398e-07, - "loss": 0.7686, - "step": 60880 - }, - { - "epoch": 1.56, - "learning_rate": 9.833708237132518e-07, - "loss": 0.5254, - "step": 60881 - }, - { - "epoch": 1.56, - "learning_rate": 9.833431570918382e-07, - "loss": 0.6748, - "step": 60882 - }, - { - "epoch": 1.56, - "learning_rate": 9.83315490483178e-07, - "loss": 0.5039, - "step": 60883 - }, - { - "epoch": 1.56, - "learning_rate": 9.832878238872917e-07, - "loss": 0.5809, - "step": 60884 - }, - { - "epoch": 1.56, - "learning_rate": 9.832601573042017e-07, - "loss": 0.7783, - "step": 60885 - }, - { - "epoch": 1.56, - "learning_rate": 9.832324907339283e-07, - "loss": 0.4893, - "step": 60886 - }, - { - "epoch": 1.56, - "learning_rate": 9.832048241764932e-07, - "loss": 0.6372, - "step": 60887 - }, - { - "epoch": 1.56, - "learning_rate": 9.831771576319173e-07, - "loss": 0.665, - "step": 60888 - }, - { - "epoch": 1.56, - "learning_rate": 9.83149491100222e-07, - "loss": 0.6758, - "step": 60889 - }, - { - "epoch": 1.56, - "learning_rate": 9.83121824581428e-07, - "loss": 0.6777, - "step": 60890 - }, - { - "epoch": 1.56, - "learning_rate": 9.830941580755572e-07, - "loss": 0.7393, - "step": 60891 - }, - { - "epoch": 1.56, - "learning_rate": 9.830664915826302e-07, - "loss": 0.6082, - "step": 60892 - }, - { - "epoch": 1.56, - "learning_rate": 9.830388251026691e-07, - "loss": 0.6504, - "step": 60893 - }, - { - "epoch": 1.56, - "learning_rate": 9.830111586356938e-07, - "loss": 0.8008, - "step": 60894 - }, - { - "epoch": 1.56, - "learning_rate": 9.829834921817263e-07, - "loss": 0.6108, - "step": 60895 - }, - { - "epoch": 1.56, - "learning_rate": 9.82955825740787e-07, - "loss": 0.6143, - "step": 60896 - }, - { - "epoch": 1.56, - "learning_rate": 9.829281593128981e-07, - "loss": 0.6064, - "step": 60897 - }, - { - "epoch": 1.56, - "learning_rate": 9.829004928980803e-07, - "loss": 0.6073, - "step": 60898 - }, - { - "epoch": 1.56, - "learning_rate": 9.828728264963546e-07, - "loss": 0.6914, - "step": 60899 - }, - { - "epoch": 1.56, - "learning_rate": 9.828451601077424e-07, - "loss": 0.707, - "step": 60900 - }, - { - "epoch": 1.56, - "learning_rate": 9.828174937322652e-07, - "loss": 0.6021, - "step": 60901 - }, - { - "epoch": 1.56, - "learning_rate": 9.827898273699435e-07, - "loss": 0.6313, - "step": 60902 - }, - { - "epoch": 1.56, - "learning_rate": 9.827621610207993e-07, - "loss": 0.7539, - "step": 60903 - }, - { - "epoch": 1.56, - "learning_rate": 9.82734494684853e-07, - "loss": 0.6353, - "step": 60904 - }, - { - "epoch": 1.56, - "learning_rate": 9.82706828362126e-07, - "loss": 0.6714, - "step": 60905 - }, - { - "epoch": 1.56, - "learning_rate": 9.826791620526399e-07, - "loss": 0.6538, - "step": 60906 - }, - { - "epoch": 1.56, - "learning_rate": 9.82651495756415e-07, - "loss": 0.5698, - "step": 60907 - }, - { - "epoch": 1.56, - "learning_rate": 9.826238294734737e-07, - "loss": 0.5266, - "step": 60908 - }, - { - "epoch": 1.56, - "learning_rate": 9.82596163203836e-07, - "loss": 0.5205, - "step": 60909 - }, - { - "epoch": 1.56, - "learning_rate": 9.82568496947524e-07, - "loss": 0.6328, - "step": 60910 - }, - { - "epoch": 1.56, - "learning_rate": 9.825408307045582e-07, - "loss": 0.6758, - "step": 60911 - }, - { - "epoch": 1.56, - "learning_rate": 9.825131644749604e-07, - "loss": 0.7178, - "step": 60912 - }, - { - "epoch": 1.56, - "learning_rate": 9.824854982587517e-07, - "loss": 0.5781, - "step": 60913 - }, - { - "epoch": 1.56, - "learning_rate": 9.824578320559527e-07, - "loss": 0.751, - "step": 60914 - }, - { - "epoch": 1.56, - "learning_rate": 9.82430165866585e-07, - "loss": 0.646, - "step": 60915 - }, - { - "epoch": 1.56, - "learning_rate": 9.824024996906696e-07, - "loss": 0.7461, - "step": 60916 - }, - { - "epoch": 1.56, - "learning_rate": 9.823748335282275e-07, - "loss": 0.5369, - "step": 60917 - }, - { - "epoch": 1.56, - "learning_rate": 9.823471673792806e-07, - "loss": 0.5518, - "step": 60918 - }, - { - "epoch": 1.56, - "learning_rate": 9.823195012438496e-07, - "loss": 0.499, - "step": 60919 - }, - { - "epoch": 1.56, - "learning_rate": 9.822918351219558e-07, - "loss": 0.6523, - "step": 60920 - }, - { - "epoch": 1.56, - "learning_rate": 9.822641690136201e-07, - "loss": 0.5681, - "step": 60921 - }, - { - "epoch": 1.56, - "learning_rate": 9.82236502918864e-07, - "loss": 0.7588, - "step": 60922 - }, - { - "epoch": 1.56, - "learning_rate": 9.82208836837709e-07, - "loss": 0.6572, - "step": 60923 - }, - { - "epoch": 1.56, - "learning_rate": 9.821811707701753e-07, - "loss": 0.509, - "step": 60924 - }, - { - "epoch": 1.56, - "learning_rate": 9.82153504716285e-07, - "loss": 0.7373, - "step": 60925 - }, - { - "epoch": 1.56, - "learning_rate": 9.821258386760587e-07, - "loss": 0.5264, - "step": 60926 - }, - { - "epoch": 1.56, - "learning_rate": 9.82098172649518e-07, - "loss": 0.4202, - "step": 60927 - }, - { - "epoch": 1.56, - "learning_rate": 9.820705066366838e-07, - "loss": 0.5679, - "step": 60928 - }, - { - "epoch": 1.56, - "learning_rate": 9.820428406375774e-07, - "loss": 0.667, - "step": 60929 - }, - { - "epoch": 1.56, - "learning_rate": 9.8201517465222e-07, - "loss": 0.6709, - "step": 60930 - }, - { - "epoch": 1.56, - "learning_rate": 9.819875086806328e-07, - "loss": 0.562, - "step": 60931 - }, - { - "epoch": 1.56, - "learning_rate": 9.819598427228368e-07, - "loss": 0.6655, - "step": 60932 - }, - { - "epoch": 1.56, - "learning_rate": 9.81932176778854e-07, - "loss": 0.7803, - "step": 60933 - }, - { - "epoch": 1.56, - "learning_rate": 9.81904510848704e-07, - "loss": 0.668, - "step": 60934 - }, - { - "epoch": 1.56, - "learning_rate": 9.818768449324094e-07, - "loss": 0.5349, - "step": 60935 - }, - { - "epoch": 1.56, - "learning_rate": 9.818491790299905e-07, - "loss": 0.585, - "step": 60936 - }, - { - "epoch": 1.56, - "learning_rate": 9.81821513141469e-07, - "loss": 0.6289, - "step": 60937 - }, - { - "epoch": 1.56, - "learning_rate": 9.817938472668659e-07, - "loss": 0.4854, - "step": 60938 - }, - { - "epoch": 1.56, - "learning_rate": 9.817661814062026e-07, - "loss": 0.6514, - "step": 60939 - }, - { - "epoch": 1.56, - "learning_rate": 9.817385155594997e-07, - "loss": 0.5459, - "step": 60940 - }, - { - "epoch": 1.56, - "learning_rate": 9.817108497267792e-07, - "loss": 0.4534, - "step": 60941 - }, - { - "epoch": 1.56, - "learning_rate": 9.816831839080614e-07, - "loss": 0.5558, - "step": 60942 - }, - { - "epoch": 1.56, - "learning_rate": 9.816555181033686e-07, - "loss": 0.6206, - "step": 60943 - }, - { - "epoch": 1.56, - "learning_rate": 9.81627852312721e-07, - "loss": 0.5386, - "step": 60944 - }, - { - "epoch": 1.56, - "learning_rate": 9.8160018653614e-07, - "loss": 0.4768, - "step": 60945 - }, - { - "epoch": 1.56, - "learning_rate": 9.81572520773647e-07, - "loss": 0.6357, - "step": 60946 - }, - { - "epoch": 1.56, - "learning_rate": 9.815448550252632e-07, - "loss": 0.6245, - "step": 60947 - }, - { - "epoch": 1.56, - "learning_rate": 9.815171892910094e-07, - "loss": 0.6973, - "step": 60948 - }, - { - "epoch": 1.56, - "learning_rate": 9.814895235709072e-07, - "loss": 0.5933, - "step": 60949 - }, - { - "epoch": 1.56, - "learning_rate": 9.814618578649774e-07, - "loss": 0.6523, - "step": 60950 - }, - { - "epoch": 1.56, - "learning_rate": 9.814341921732417e-07, - "loss": 0.6982, - "step": 60951 - }, - { - "epoch": 1.56, - "learning_rate": 9.814065264957207e-07, - "loss": 0.6826, - "step": 60952 - }, - { - "epoch": 1.56, - "learning_rate": 9.813788608324363e-07, - "loss": 0.7104, - "step": 60953 - }, - { - "epoch": 1.56, - "learning_rate": 9.813511951834088e-07, - "loss": 0.5635, - "step": 60954 - }, - { - "epoch": 1.56, - "learning_rate": 9.8132352954866e-07, - "loss": 0.6567, - "step": 60955 - }, - { - "epoch": 1.56, - "learning_rate": 9.81295863928211e-07, - "loss": 0.6738, - "step": 60956 - }, - { - "epoch": 1.56, - "learning_rate": 9.812681983220827e-07, - "loss": 0.4839, - "step": 60957 - }, - { - "epoch": 1.56, - "learning_rate": 9.812405327302967e-07, - "loss": 0.709, - "step": 60958 - }, - { - "epoch": 1.56, - "learning_rate": 9.812128671528736e-07, - "loss": 0.7783, - "step": 60959 - }, - { - "epoch": 1.56, - "learning_rate": 9.811852015898352e-07, - "loss": 0.519, - "step": 60960 - }, - { - "epoch": 1.56, - "learning_rate": 9.811575360412024e-07, - "loss": 0.8018, - "step": 60961 - }, - { - "epoch": 1.56, - "learning_rate": 9.811298705069964e-07, - "loss": 0.7393, - "step": 60962 - }, - { - "epoch": 1.56, - "learning_rate": 9.811022049872389e-07, - "loss": 0.5239, - "step": 60963 - }, - { - "epoch": 1.56, - "learning_rate": 9.8107453948195e-07, - "loss": 0.7334, - "step": 60964 - }, - { - "epoch": 1.56, - "learning_rate": 9.810468739911515e-07, - "loss": 0.4501, - "step": 60965 - }, - { - "epoch": 1.56, - "learning_rate": 9.810192085148645e-07, - "loss": 0.6562, - "step": 60966 - }, - { - "epoch": 1.56, - "learning_rate": 9.809915430531102e-07, - "loss": 0.6348, - "step": 60967 - }, - { - "epoch": 1.56, - "learning_rate": 9.809638776059101e-07, - "loss": 0.6357, - "step": 60968 - }, - { - "epoch": 1.56, - "learning_rate": 9.809362121732848e-07, - "loss": 0.3662, - "step": 60969 - }, - { - "epoch": 1.56, - "learning_rate": 9.80908546755256e-07, - "loss": 0.6577, - "step": 60970 - }, - { - "epoch": 1.56, - "learning_rate": 9.808808813518441e-07, - "loss": 0.4836, - "step": 60971 - }, - { - "epoch": 1.56, - "learning_rate": 9.808532159630714e-07, - "loss": 0.5376, - "step": 60972 - }, - { - "epoch": 1.56, - "learning_rate": 9.808255505889587e-07, - "loss": 0.6257, - "step": 60973 - }, - { - "epoch": 1.56, - "learning_rate": 9.807978852295265e-07, - "loss": 0.6123, - "step": 60974 - }, - { - "epoch": 1.56, - "learning_rate": 9.807702198847967e-07, - "loss": 0.4752, - "step": 60975 - }, - { - "epoch": 1.56, - "learning_rate": 9.8074255455479e-07, - "loss": 0.5537, - "step": 60976 - }, - { - "epoch": 1.56, - "learning_rate": 9.80714889239528e-07, - "loss": 0.623, - "step": 60977 - }, - { - "epoch": 1.56, - "learning_rate": 9.806872239390316e-07, - "loss": 0.5981, - "step": 60978 - }, - { - "epoch": 1.56, - "learning_rate": 9.806595586533225e-07, - "loss": 0.572, - "step": 60979 - }, - { - "epoch": 1.56, - "learning_rate": 9.80631893382421e-07, - "loss": 0.6846, - "step": 60980 - }, - { - "epoch": 1.56, - "learning_rate": 9.80604228126349e-07, - "loss": 0.5056, - "step": 60981 - }, - { - "epoch": 1.56, - "learning_rate": 9.805765628851273e-07, - "loss": 0.6396, - "step": 60982 - }, - { - "epoch": 1.56, - "learning_rate": 9.80548897658778e-07, - "loss": 0.376, - "step": 60983 - }, - { - "epoch": 1.56, - "learning_rate": 9.805212324473208e-07, - "loss": 0.5879, - "step": 60984 - }, - { - "epoch": 1.56, - "learning_rate": 9.804935672507777e-07, - "loss": 0.5342, - "step": 60985 - }, - { - "epoch": 1.56, - "learning_rate": 9.804659020691695e-07, - "loss": 0.6406, - "step": 60986 - }, - { - "epoch": 1.56, - "learning_rate": 9.804382369025182e-07, - "loss": 0.6035, - "step": 60987 - }, - { - "epoch": 1.56, - "learning_rate": 9.80410571750844e-07, - "loss": 0.6343, - "step": 60988 - }, - { - "epoch": 1.56, - "learning_rate": 9.803829066141688e-07, - "loss": 0.5669, - "step": 60989 - }, - { - "epoch": 1.56, - "learning_rate": 9.803552414925132e-07, - "loss": 0.666, - "step": 60990 - }, - { - "epoch": 1.56, - "learning_rate": 9.80327576385899e-07, - "loss": 0.5042, - "step": 60991 - }, - { - "epoch": 1.56, - "learning_rate": 9.802999112943467e-07, - "loss": 0.624, - "step": 60992 - }, - { - "epoch": 1.56, - "learning_rate": 9.802722462178785e-07, - "loss": 0.6748, - "step": 60993 - }, - { - "epoch": 1.56, - "learning_rate": 9.802445811565147e-07, - "loss": 0.675, - "step": 60994 - }, - { - "epoch": 1.56, - "learning_rate": 9.802169161102764e-07, - "loss": 0.6743, - "step": 60995 - }, - { - "epoch": 1.56, - "learning_rate": 9.801892510791853e-07, - "loss": 0.7734, - "step": 60996 - }, - { - "epoch": 1.56, - "learning_rate": 9.80161586063262e-07, - "loss": 0.7871, - "step": 60997 - }, - { - "epoch": 1.56, - "learning_rate": 9.801339210625287e-07, - "loss": 0.7598, - "step": 60998 - }, - { - "epoch": 1.56, - "learning_rate": 9.801062560770054e-07, - "loss": 0.668, - "step": 60999 - }, - { - "epoch": 1.56, - "learning_rate": 9.800785911067142e-07, - "loss": 0.6389, - "step": 61000 - }, - { - "epoch": 1.56, - "learning_rate": 9.800509261516757e-07, - "loss": 0.7178, - "step": 61001 - }, - { - "epoch": 1.56, - "learning_rate": 9.800232612119113e-07, - "loss": 0.4868, - "step": 61002 - }, - { - "epoch": 1.56, - "learning_rate": 9.799955962874426e-07, - "loss": 0.5591, - "step": 61003 - }, - { - "epoch": 1.56, - "learning_rate": 9.7996793137829e-07, - "loss": 0.4751, - "step": 61004 - }, - { - "epoch": 1.56, - "learning_rate": 9.79940266484475e-07, - "loss": 0.4846, - "step": 61005 - }, - { - "epoch": 1.56, - "learning_rate": 9.799126016060188e-07, - "loss": 0.5884, - "step": 61006 - }, - { - "epoch": 1.56, - "learning_rate": 9.798849367429427e-07, - "loss": 0.6509, - "step": 61007 - }, - { - "epoch": 1.56, - "learning_rate": 9.798572718952677e-07, - "loss": 0.6855, - "step": 61008 - }, - { - "epoch": 1.56, - "learning_rate": 9.798296070630149e-07, - "loss": 0.7063, - "step": 61009 - }, - { - "epoch": 1.56, - "learning_rate": 9.798019422462058e-07, - "loss": 0.6851, - "step": 61010 - }, - { - "epoch": 1.56, - "learning_rate": 9.797742774448614e-07, - "loss": 0.7529, - "step": 61011 - }, - { - "epoch": 1.56, - "learning_rate": 9.797466126590029e-07, - "loss": 0.4448, - "step": 61012 - }, - { - "epoch": 1.56, - "learning_rate": 9.79718947888652e-07, - "loss": 0.5659, - "step": 61013 - }, - { - "epoch": 1.56, - "learning_rate": 9.796912831338286e-07, - "loss": 0.6465, - "step": 61014 - }, - { - "epoch": 1.56, - "learning_rate": 9.796636183945552e-07, - "loss": 0.5288, - "step": 61015 - }, - { - "epoch": 1.56, - "learning_rate": 9.79635953670852e-07, - "loss": 0.5364, - "step": 61016 - }, - { - "epoch": 1.56, - "learning_rate": 9.79608288962741e-07, - "loss": 0.7461, - "step": 61017 - }, - { - "epoch": 1.56, - "learning_rate": 9.795806242702424e-07, - "loss": 0.7017, - "step": 61018 - }, - { - "epoch": 1.56, - "learning_rate": 9.795529595933786e-07, - "loss": 0.5864, - "step": 61019 - }, - { - "epoch": 1.56, - "learning_rate": 9.795252949321699e-07, - "loss": 0.5273, - "step": 61020 - }, - { - "epoch": 1.56, - "learning_rate": 9.794976302866376e-07, - "loss": 0.625, - "step": 61021 - }, - { - "epoch": 1.56, - "learning_rate": 9.794699656568032e-07, - "loss": 0.7383, - "step": 61022 - }, - { - "epoch": 1.56, - "learning_rate": 9.79442301042688e-07, - "loss": 0.708, - "step": 61023 - }, - { - "epoch": 1.56, - "learning_rate": 9.794146364443124e-07, - "loss": 0.7085, - "step": 61024 - }, - { - "epoch": 1.56, - "learning_rate": 9.793869718616984e-07, - "loss": 0.7451, - "step": 61025 - }, - { - "epoch": 1.56, - "learning_rate": 9.793593072948665e-07, - "loss": 0.6572, - "step": 61026 - }, - { - "epoch": 1.56, - "learning_rate": 9.793316427438386e-07, - "loss": 0.6572, - "step": 61027 - }, - { - "epoch": 1.56, - "learning_rate": 9.793039782086351e-07, - "loss": 0.4731, - "step": 61028 - }, - { - "epoch": 1.56, - "learning_rate": 9.792763136892782e-07, - "loss": 0.5835, - "step": 61029 - }, - { - "epoch": 1.56, - "learning_rate": 9.792486491857878e-07, - "loss": 0.7178, - "step": 61030 - }, - { - "epoch": 1.56, - "learning_rate": 9.792209846981861e-07, - "loss": 0.6665, - "step": 61031 - }, - { - "epoch": 1.56, - "learning_rate": 9.791933202264939e-07, - "loss": 0.5322, - "step": 61032 - }, - { - "epoch": 1.56, - "learning_rate": 9.791656557707326e-07, - "loss": 0.7832, - "step": 61033 - }, - { - "epoch": 1.56, - "learning_rate": 9.791379913309232e-07, - "loss": 0.6182, - "step": 61034 - }, - { - "epoch": 1.56, - "learning_rate": 9.791103269070864e-07, - "loss": 0.7373, - "step": 61035 - }, - { - "epoch": 1.56, - "learning_rate": 9.790826624992443e-07, - "loss": 0.7178, - "step": 61036 - }, - { - "epoch": 1.56, - "learning_rate": 9.790549981074176e-07, - "loss": 0.7422, - "step": 61037 - }, - { - "epoch": 1.56, - "learning_rate": 9.790273337316273e-07, - "loss": 0.5347, - "step": 61038 - }, - { - "epoch": 1.56, - "learning_rate": 9.78999669371895e-07, - "loss": 0.9043, - "step": 61039 - }, - { - "epoch": 1.56, - "learning_rate": 9.789720050282414e-07, - "loss": 0.6631, - "step": 61040 - }, - { - "epoch": 1.56, - "learning_rate": 9.789443407006883e-07, - "loss": 0.7734, - "step": 61041 - }, - { - "epoch": 1.56, - "learning_rate": 9.789166763892563e-07, - "loss": 0.7373, - "step": 61042 - }, - { - "epoch": 1.56, - "learning_rate": 9.788890120939673e-07, - "loss": 0.5139, - "step": 61043 - }, - { - "epoch": 1.56, - "learning_rate": 9.788613478148416e-07, - "loss": 0.709, - "step": 61044 - }, - { - "epoch": 1.56, - "learning_rate": 9.788336835519008e-07, - "loss": 0.7236, - "step": 61045 - }, - { - "epoch": 1.56, - "learning_rate": 9.788060193051663e-07, - "loss": 0.4851, - "step": 61046 - }, - { - "epoch": 1.56, - "learning_rate": 9.787783550746587e-07, - "loss": 0.6436, - "step": 61047 - }, - { - "epoch": 1.56, - "learning_rate": 9.787506908603999e-07, - "loss": 0.5546, - "step": 61048 - }, - { - "epoch": 1.56, - "learning_rate": 9.787230266624104e-07, - "loss": 0.6592, - "step": 61049 - }, - { - "epoch": 1.56, - "learning_rate": 9.78695362480712e-07, - "loss": 0.5291, - "step": 61050 - }, - { - "epoch": 1.56, - "learning_rate": 9.786676983153251e-07, - "loss": 0.3342, - "step": 61051 - }, - { - "epoch": 1.56, - "learning_rate": 9.78640034166272e-07, - "loss": 0.6543, - "step": 61052 - }, - { - "epoch": 1.56, - "learning_rate": 9.78612370033573e-07, - "loss": 0.667, - "step": 61053 - }, - { - "epoch": 1.56, - "learning_rate": 9.785847059172496e-07, - "loss": 0.752, - "step": 61054 - }, - { - "epoch": 1.56, - "learning_rate": 9.785570418173226e-07, - "loss": 0.6006, - "step": 61055 - }, - { - "epoch": 1.56, - "learning_rate": 9.785293777338138e-07, - "loss": 0.6289, - "step": 61056 - }, - { - "epoch": 1.56, - "learning_rate": 9.785017136667439e-07, - "loss": 0.6416, - "step": 61057 - }, - { - "epoch": 1.56, - "learning_rate": 9.784740496161343e-07, - "loss": 0.6387, - "step": 61058 - }, - { - "epoch": 1.56, - "learning_rate": 9.78446385582006e-07, - "loss": 0.6836, - "step": 61059 - }, - { - "epoch": 1.56, - "learning_rate": 9.784187215643804e-07, - "loss": 0.6641, - "step": 61060 - }, - { - "epoch": 1.57, - "learning_rate": 9.783910575632785e-07, - "loss": 0.5264, - "step": 61061 - }, - { - "epoch": 1.57, - "learning_rate": 9.783633935787218e-07, - "loss": 0.5344, - "step": 61062 - }, - { - "epoch": 1.57, - "learning_rate": 9.783357296107314e-07, - "loss": 0.6777, - "step": 61063 - }, - { - "epoch": 1.57, - "learning_rate": 9.78308065659328e-07, - "loss": 0.8232, - "step": 61064 - }, - { - "epoch": 1.57, - "learning_rate": 9.782804017245333e-07, - "loss": 0.6436, - "step": 61065 - }, - { - "epoch": 1.57, - "learning_rate": 9.782527378063682e-07, - "loss": 0.6348, - "step": 61066 - }, - { - "epoch": 1.57, - "learning_rate": 9.78225073904854e-07, - "loss": 0.6187, - "step": 61067 - }, - { - "epoch": 1.57, - "learning_rate": 9.781974100200115e-07, - "loss": 0.6494, - "step": 61068 - }, - { - "epoch": 1.57, - "learning_rate": 9.781697461518628e-07, - "loss": 0.5181, - "step": 61069 - }, - { - "epoch": 1.57, - "learning_rate": 9.78142082300428e-07, - "loss": 0.6221, - "step": 61070 - }, - { - "epoch": 1.57, - "learning_rate": 9.781144184657292e-07, - "loss": 0.5933, - "step": 61071 - }, - { - "epoch": 1.57, - "learning_rate": 9.78086754647787e-07, - "loss": 0.8154, - "step": 61072 - }, - { - "epoch": 1.57, - "learning_rate": 9.780590908466235e-07, - "loss": 0.6748, - "step": 61073 - }, - { - "epoch": 1.57, - "learning_rate": 9.780314270622584e-07, - "loss": 0.7158, - "step": 61074 - }, - { - "epoch": 1.57, - "learning_rate": 9.780037632947137e-07, - "loss": 0.5032, - "step": 61075 - }, - { - "epoch": 1.57, - "learning_rate": 9.779760995440103e-07, - "loss": 0.7285, - "step": 61076 - }, - { - "epoch": 1.57, - "learning_rate": 9.7794843581017e-07, - "loss": 0.5964, - "step": 61077 - }, - { - "epoch": 1.57, - "learning_rate": 9.779207720932132e-07, - "loss": 0.5481, - "step": 61078 - }, - { - "epoch": 1.57, - "learning_rate": 9.778931083931615e-07, - "loss": 0.6431, - "step": 61079 - }, - { - "epoch": 1.57, - "learning_rate": 9.778654447100362e-07, - "loss": 0.5439, - "step": 61080 - }, - { - "epoch": 1.57, - "learning_rate": 9.778377810438582e-07, - "loss": 0.5151, - "step": 61081 - }, - { - "epoch": 1.57, - "learning_rate": 9.77810117394649e-07, - "loss": 0.5405, - "step": 61082 - }, - { - "epoch": 1.57, - "learning_rate": 9.777824537624296e-07, - "loss": 0.7686, - "step": 61083 - }, - { - "epoch": 1.57, - "learning_rate": 9.77754790147221e-07, - "loss": 0.6885, - "step": 61084 - }, - { - "epoch": 1.57, - "learning_rate": 9.777271265490443e-07, - "loss": 0.6611, - "step": 61085 - }, - { - "epoch": 1.57, - "learning_rate": 9.776994629679214e-07, - "loss": 0.498, - "step": 61086 - }, - { - "epoch": 1.57, - "learning_rate": 9.776717994038726e-07, - "loss": 0.4708, - "step": 61087 - }, - { - "epoch": 1.57, - "learning_rate": 9.776441358569196e-07, - "loss": 0.5017, - "step": 61088 - }, - { - "epoch": 1.57, - "learning_rate": 9.776164723270833e-07, - "loss": 0.582, - "step": 61089 - }, - { - "epoch": 1.57, - "learning_rate": 9.775888088143854e-07, - "loss": 0.5513, - "step": 61090 - }, - { - "epoch": 1.57, - "learning_rate": 9.775611453188464e-07, - "loss": 0.5508, - "step": 61091 - }, - { - "epoch": 1.57, - "learning_rate": 9.775334818404879e-07, - "loss": 0.7207, - "step": 61092 - }, - { - "epoch": 1.57, - "learning_rate": 9.775058183793313e-07, - "loss": 0.7578, - "step": 61093 - }, - { - "epoch": 1.57, - "learning_rate": 9.774781549353972e-07, - "loss": 0.6309, - "step": 61094 - }, - { - "epoch": 1.57, - "learning_rate": 9.774504915087069e-07, - "loss": 0.7803, - "step": 61095 - }, - { - "epoch": 1.57, - "learning_rate": 9.77422828099282e-07, - "loss": 0.5283, - "step": 61096 - }, - { - "epoch": 1.57, - "learning_rate": 9.77395164707143e-07, - "loss": 0.5811, - "step": 61097 - }, - { - "epoch": 1.57, - "learning_rate": 9.773675013323119e-07, - "loss": 0.8672, - "step": 61098 - }, - { - "epoch": 1.57, - "learning_rate": 9.77339837974809e-07, - "loss": 0.6992, - "step": 61099 - }, - { - "epoch": 1.57, - "learning_rate": 9.773121746346564e-07, - "loss": 0.7041, - "step": 61100 - }, - { - "epoch": 1.57, - "learning_rate": 9.772845113118745e-07, - "loss": 0.5869, - "step": 61101 - }, - { - "epoch": 1.57, - "learning_rate": 9.77256848006485e-07, - "loss": 0.7275, - "step": 61102 - }, - { - "epoch": 1.57, - "learning_rate": 9.772291847185092e-07, - "loss": 0.7285, - "step": 61103 - }, - { - "epoch": 1.57, - "learning_rate": 9.772015214479674e-07, - "loss": 0.6445, - "step": 61104 - }, - { - "epoch": 1.57, - "learning_rate": 9.771738581948817e-07, - "loss": 0.595, - "step": 61105 - }, - { - "epoch": 1.57, - "learning_rate": 9.771461949592726e-07, - "loss": 0.4692, - "step": 61106 - }, - { - "epoch": 1.57, - "learning_rate": 9.771185317411618e-07, - "loss": 0.7607, - "step": 61107 - }, - { - "epoch": 1.57, - "learning_rate": 9.770908685405701e-07, - "loss": 0.6152, - "step": 61108 - }, - { - "epoch": 1.57, - "learning_rate": 9.770632053575192e-07, - "loss": 0.543, - "step": 61109 - }, - { - "epoch": 1.57, - "learning_rate": 9.770355421920299e-07, - "loss": 0.4549, - "step": 61110 - }, - { - "epoch": 1.57, - "learning_rate": 9.770078790441232e-07, - "loss": 0.6572, - "step": 61111 - }, - { - "epoch": 1.57, - "learning_rate": 9.769802159138207e-07, - "loss": 0.6265, - "step": 61112 - }, - { - "epoch": 1.57, - "learning_rate": 9.769525528011436e-07, - "loss": 0.7202, - "step": 61113 - }, - { - "epoch": 1.57, - "learning_rate": 9.769248897061124e-07, - "loss": 0.687, - "step": 61114 - }, - { - "epoch": 1.57, - "learning_rate": 9.76897226628749e-07, - "loss": 0.7354, - "step": 61115 - }, - { - "epoch": 1.57, - "learning_rate": 9.768695635690742e-07, - "loss": 0.5244, - "step": 61116 - }, - { - "epoch": 1.57, - "learning_rate": 9.768419005271095e-07, - "loss": 0.6982, - "step": 61117 - }, - { - "epoch": 1.57, - "learning_rate": 9.768142375028756e-07, - "loss": 0.6953, - "step": 61118 - }, - { - "epoch": 1.57, - "learning_rate": 9.767865744963942e-07, - "loss": 0.6489, - "step": 61119 - }, - { - "epoch": 1.57, - "learning_rate": 9.767589115076862e-07, - "loss": 0.5972, - "step": 61120 - }, - { - "epoch": 1.57, - "learning_rate": 9.767312485367728e-07, - "loss": 0.5928, - "step": 61121 - }, - { - "epoch": 1.57, - "learning_rate": 9.767035855836752e-07, - "loss": 0.5491, - "step": 61122 - }, - { - "epoch": 1.57, - "learning_rate": 9.766759226484147e-07, - "loss": 0.729, - "step": 61123 - }, - { - "epoch": 1.57, - "learning_rate": 9.766482597310124e-07, - "loss": 0.4917, - "step": 61124 - }, - { - "epoch": 1.57, - "learning_rate": 9.766205968314893e-07, - "loss": 0.5488, - "step": 61125 - }, - { - "epoch": 1.57, - "learning_rate": 9.76592933949867e-07, - "loss": 0.6235, - "step": 61126 - }, - { - "epoch": 1.57, - "learning_rate": 9.765652710861663e-07, - "loss": 0.625, - "step": 61127 - }, - { - "epoch": 1.57, - "learning_rate": 9.765376082404082e-07, - "loss": 0.5513, - "step": 61128 - }, - { - "epoch": 1.57, - "learning_rate": 9.765099454126144e-07, - "loss": 0.5452, - "step": 61129 - }, - { - "epoch": 1.57, - "learning_rate": 9.764822826028058e-07, - "loss": 0.6479, - "step": 61130 - }, - { - "epoch": 1.57, - "learning_rate": 9.764546198110037e-07, - "loss": 0.5557, - "step": 61131 - }, - { - "epoch": 1.57, - "learning_rate": 9.764269570372292e-07, - "loss": 0.7354, - "step": 61132 - }, - { - "epoch": 1.57, - "learning_rate": 9.763992942815036e-07, - "loss": 0.5225, - "step": 61133 - }, - { - "epoch": 1.57, - "learning_rate": 9.76371631543848e-07, - "loss": 0.6885, - "step": 61134 - }, - { - "epoch": 1.57, - "learning_rate": 9.763439688242832e-07, - "loss": 0.5327, - "step": 61135 - }, - { - "epoch": 1.57, - "learning_rate": 9.763163061228311e-07, - "loss": 0.6816, - "step": 61136 - }, - { - "epoch": 1.57, - "learning_rate": 9.762886434395121e-07, - "loss": 0.5806, - "step": 61137 - }, - { - "epoch": 1.57, - "learning_rate": 9.762609807743482e-07, - "loss": 0.7373, - "step": 61138 - }, - { - "epoch": 1.57, - "learning_rate": 9.762333181273599e-07, - "loss": 0.6548, - "step": 61139 - }, - { - "epoch": 1.57, - "learning_rate": 9.762056554985688e-07, - "loss": 0.6309, - "step": 61140 - }, - { - "epoch": 1.57, - "learning_rate": 9.76177992887996e-07, - "loss": 0.563, - "step": 61141 - }, - { - "epoch": 1.57, - "learning_rate": 9.761503302956625e-07, - "loss": 0.5972, - "step": 61142 - }, - { - "epoch": 1.57, - "learning_rate": 9.7612266772159e-07, - "loss": 0.5762, - "step": 61143 - }, - { - "epoch": 1.57, - "learning_rate": 9.76095005165799e-07, - "loss": 0.6587, - "step": 61144 - }, - { - "epoch": 1.57, - "learning_rate": 9.760673426283108e-07, - "loss": 0.4727, - "step": 61145 - }, - { - "epoch": 1.57, - "learning_rate": 9.760396801091468e-07, - "loss": 0.8438, - "step": 61146 - }, - { - "epoch": 1.57, - "learning_rate": 9.76012017608328e-07, - "loss": 0.6328, - "step": 61147 - }, - { - "epoch": 1.57, - "learning_rate": 9.759843551258758e-07, - "loss": 0.478, - "step": 61148 - }, - { - "epoch": 1.57, - "learning_rate": 9.759566926618113e-07, - "loss": 0.624, - "step": 61149 - }, - { - "epoch": 1.57, - "learning_rate": 9.759290302161557e-07, - "loss": 0.6934, - "step": 61150 - }, - { - "epoch": 1.57, - "learning_rate": 9.7590136778893e-07, - "loss": 0.7373, - "step": 61151 - }, - { - "epoch": 1.57, - "learning_rate": 9.758737053801556e-07, - "loss": 0.5991, - "step": 61152 - }, - { - "epoch": 1.57, - "learning_rate": 9.75846042989854e-07, - "loss": 0.6699, - "step": 61153 - }, - { - "epoch": 1.57, - "learning_rate": 9.758183806180454e-07, - "loss": 0.6343, - "step": 61154 - }, - { - "epoch": 1.57, - "learning_rate": 9.757907182647516e-07, - "loss": 0.6455, - "step": 61155 - }, - { - "epoch": 1.57, - "learning_rate": 9.757630559299936e-07, - "loss": 0.7007, - "step": 61156 - }, - { - "epoch": 1.57, - "learning_rate": 9.75735393613793e-07, - "loss": 0.6865, - "step": 61157 - }, - { - "epoch": 1.57, - "learning_rate": 9.757077313161707e-07, - "loss": 0.6003, - "step": 61158 - }, - { - "epoch": 1.57, - "learning_rate": 9.75680069037148e-07, - "loss": 0.6299, - "step": 61159 - }, - { - "epoch": 1.57, - "learning_rate": 9.756524067767457e-07, - "loss": 0.6992, - "step": 61160 - }, - { - "epoch": 1.57, - "learning_rate": 9.756247445349854e-07, - "loss": 0.6143, - "step": 61161 - }, - { - "epoch": 1.57, - "learning_rate": 9.755970823118877e-07, - "loss": 0.6025, - "step": 61162 - }, - { - "epoch": 1.57, - "learning_rate": 9.755694201074752e-07, - "loss": 0.5796, - "step": 61163 - }, - { - "epoch": 1.57, - "learning_rate": 9.755417579217673e-07, - "loss": 0.6943, - "step": 61164 - }, - { - "epoch": 1.57, - "learning_rate": 9.75514095754786e-07, - "loss": 0.8027, - "step": 61165 - }, - { - "epoch": 1.57, - "learning_rate": 9.754864336065523e-07, - "loss": 0.707, - "step": 61166 - }, - { - "epoch": 1.57, - "learning_rate": 9.754587714770878e-07, - "loss": 0.5803, - "step": 61167 - }, - { - "epoch": 1.57, - "learning_rate": 9.754311093664132e-07, - "loss": 0.5264, - "step": 61168 - }, - { - "epoch": 1.57, - "learning_rate": 9.7540344727455e-07, - "loss": 0.6128, - "step": 61169 - }, - { - "epoch": 1.57, - "learning_rate": 9.75375785201519e-07, - "loss": 0.4795, - "step": 61170 - }, - { - "epoch": 1.57, - "learning_rate": 9.75348123147342e-07, - "loss": 0.6289, - "step": 61171 - }, - { - "epoch": 1.57, - "learning_rate": 9.7532046111204e-07, - "loss": 0.7197, - "step": 61172 - }, - { - "epoch": 1.57, - "learning_rate": 9.752927990956332e-07, - "loss": 0.6367, - "step": 61173 - }, - { - "epoch": 1.57, - "learning_rate": 9.75265137098144e-07, - "loss": 0.6484, - "step": 61174 - }, - { - "epoch": 1.57, - "learning_rate": 9.75237475119593e-07, - "loss": 0.481, - "step": 61175 - }, - { - "epoch": 1.57, - "learning_rate": 9.75209813160002e-07, - "loss": 0.9219, - "step": 61176 - }, - { - "epoch": 1.57, - "learning_rate": 9.751821512193912e-07, - "loss": 0.6172, - "step": 61177 - }, - { - "epoch": 1.57, - "learning_rate": 9.751544892977825e-07, - "loss": 0.7021, - "step": 61178 - }, - { - "epoch": 1.57, - "learning_rate": 9.751268273951968e-07, - "loss": 0.499, - "step": 61179 - }, - { - "epoch": 1.57, - "learning_rate": 9.750991655116554e-07, - "loss": 0.6621, - "step": 61180 - }, - { - "epoch": 1.57, - "learning_rate": 9.750715036471792e-07, - "loss": 0.7007, - "step": 61181 - }, - { - "epoch": 1.57, - "learning_rate": 9.750438418017903e-07, - "loss": 0.7246, - "step": 61182 - }, - { - "epoch": 1.57, - "learning_rate": 9.750161799755085e-07, - "loss": 0.3639, - "step": 61183 - }, - { - "epoch": 1.57, - "learning_rate": 9.749885181683559e-07, - "loss": 0.6255, - "step": 61184 - }, - { - "epoch": 1.57, - "learning_rate": 9.749608563803532e-07, - "loss": 0.6025, - "step": 61185 - }, - { - "epoch": 1.57, - "learning_rate": 9.749331946115221e-07, - "loss": 0.8447, - "step": 61186 - }, - { - "epoch": 1.57, - "learning_rate": 9.749055328618835e-07, - "loss": 0.6929, - "step": 61187 - }, - { - "epoch": 1.57, - "learning_rate": 9.748778711314583e-07, - "loss": 0.4937, - "step": 61188 - }, - { - "epoch": 1.57, - "learning_rate": 9.74850209420268e-07, - "loss": 0.6328, - "step": 61189 - }, - { - "epoch": 1.57, - "learning_rate": 9.748225477283341e-07, - "loss": 0.5112, - "step": 61190 - }, - { - "epoch": 1.57, - "learning_rate": 9.74794886055677e-07, - "loss": 0.5508, - "step": 61191 - }, - { - "epoch": 1.57, - "learning_rate": 9.747672244023187e-07, - "loss": 0.6028, - "step": 61192 - }, - { - "epoch": 1.57, - "learning_rate": 9.7473956276828e-07, - "loss": 0.7549, - "step": 61193 - }, - { - "epoch": 1.57, - "learning_rate": 9.747119011535815e-07, - "loss": 0.7725, - "step": 61194 - }, - { - "epoch": 1.57, - "learning_rate": 9.746842395582454e-07, - "loss": 0.7485, - "step": 61195 - }, - { - "epoch": 1.57, - "learning_rate": 9.746565779822921e-07, - "loss": 0.5923, - "step": 61196 - }, - { - "epoch": 1.57, - "learning_rate": 9.746289164257433e-07, - "loss": 0.5752, - "step": 61197 - }, - { - "epoch": 1.57, - "learning_rate": 9.746012548886198e-07, - "loss": 0.8032, - "step": 61198 - }, - { - "epoch": 1.57, - "learning_rate": 9.745735933709432e-07, - "loss": 0.7559, - "step": 61199 - }, - { - "epoch": 1.57, - "learning_rate": 9.745459318727345e-07, - "loss": 0.6602, - "step": 61200 - }, - { - "epoch": 1.57, - "learning_rate": 9.745182703940145e-07, - "loss": 0.6562, - "step": 61201 - }, - { - "epoch": 1.57, - "learning_rate": 9.74490608934805e-07, - "loss": 0.7461, - "step": 61202 - }, - { - "epoch": 1.57, - "learning_rate": 9.744629474951269e-07, - "loss": 0.6406, - "step": 61203 - }, - { - "epoch": 1.57, - "learning_rate": 9.74435286075001e-07, - "loss": 0.7373, - "step": 61204 - }, - { - "epoch": 1.57, - "learning_rate": 9.74407624674449e-07, - "loss": 0.6152, - "step": 61205 - }, - { - "epoch": 1.57, - "learning_rate": 9.743799632934916e-07, - "loss": 0.6846, - "step": 61206 - }, - { - "epoch": 1.57, - "learning_rate": 9.743523019321507e-07, - "loss": 0.5527, - "step": 61207 - }, - { - "epoch": 1.57, - "learning_rate": 9.743246405904467e-07, - "loss": 0.531, - "step": 61208 - }, - { - "epoch": 1.57, - "learning_rate": 9.742969792684015e-07, - "loss": 0.6958, - "step": 61209 - }, - { - "epoch": 1.57, - "learning_rate": 9.742693179660357e-07, - "loss": 0.6729, - "step": 61210 - }, - { - "epoch": 1.57, - "learning_rate": 9.742416566833708e-07, - "loss": 0.5466, - "step": 61211 - }, - { - "epoch": 1.57, - "learning_rate": 9.742139954204282e-07, - "loss": 0.4937, - "step": 61212 - }, - { - "epoch": 1.57, - "learning_rate": 9.741863341772282e-07, - "loss": 0.7285, - "step": 61213 - }, - { - "epoch": 1.57, - "learning_rate": 9.74158672953793e-07, - "loss": 0.7842, - "step": 61214 - }, - { - "epoch": 1.57, - "learning_rate": 9.741310117501428e-07, - "loss": 0.7002, - "step": 61215 - }, - { - "epoch": 1.57, - "learning_rate": 9.741033505662995e-07, - "loss": 0.8623, - "step": 61216 - }, - { - "epoch": 1.57, - "learning_rate": 9.740756894022842e-07, - "loss": 0.7393, - "step": 61217 - }, - { - "epoch": 1.57, - "learning_rate": 9.74048028258118e-07, - "loss": 0.748, - "step": 61218 - }, - { - "epoch": 1.57, - "learning_rate": 9.740203671338219e-07, - "loss": 0.5308, - "step": 61219 - }, - { - "epoch": 1.57, - "learning_rate": 9.73992706029417e-07, - "loss": 0.751, - "step": 61220 - }, - { - "epoch": 1.57, - "learning_rate": 9.739650449449251e-07, - "loss": 0.7197, - "step": 61221 - }, - { - "epoch": 1.57, - "learning_rate": 9.73937383880367e-07, - "loss": 0.6367, - "step": 61222 - }, - { - "epoch": 1.57, - "learning_rate": 9.739097228357634e-07, - "loss": 0.7871, - "step": 61223 - }, - { - "epoch": 1.57, - "learning_rate": 9.738820618111363e-07, - "loss": 0.5142, - "step": 61224 - }, - { - "epoch": 1.57, - "learning_rate": 9.73854400806506e-07, - "loss": 0.4839, - "step": 61225 - }, - { - "epoch": 1.57, - "learning_rate": 9.738267398218947e-07, - "loss": 0.7192, - "step": 61226 - }, - { - "epoch": 1.57, - "learning_rate": 9.737990788573229e-07, - "loss": 0.7119, - "step": 61227 - }, - { - "epoch": 1.57, - "learning_rate": 9.737714179128121e-07, - "loss": 0.6826, - "step": 61228 - }, - { - "epoch": 1.57, - "learning_rate": 9.73743756988383e-07, - "loss": 0.6504, - "step": 61229 - }, - { - "epoch": 1.57, - "learning_rate": 9.737160960840573e-07, - "loss": 0.6621, - "step": 61230 - }, - { - "epoch": 1.57, - "learning_rate": 9.736884351998557e-07, - "loss": 0.4495, - "step": 61231 - }, - { - "epoch": 1.57, - "learning_rate": 9.736607743358004e-07, - "loss": 0.6963, - "step": 61232 - }, - { - "epoch": 1.57, - "learning_rate": 9.736331134919112e-07, - "loss": 0.6284, - "step": 61233 - }, - { - "epoch": 1.57, - "learning_rate": 9.7360545266821e-07, - "loss": 0.8301, - "step": 61234 - }, - { - "epoch": 1.57, - "learning_rate": 9.73577791864718e-07, - "loss": 0.6338, - "step": 61235 - }, - { - "epoch": 1.57, - "learning_rate": 9.735501310814563e-07, - "loss": 0.5437, - "step": 61236 - }, - { - "epoch": 1.57, - "learning_rate": 9.73522470318446e-07, - "loss": 0.7275, - "step": 61237 - }, - { - "epoch": 1.57, - "learning_rate": 9.734948095757082e-07, - "loss": 0.6233, - "step": 61238 - }, - { - "epoch": 1.57, - "learning_rate": 9.73467148853264e-07, - "loss": 0.5801, - "step": 61239 - }, - { - "epoch": 1.57, - "learning_rate": 9.734394881511352e-07, - "loss": 0.7861, - "step": 61240 - }, - { - "epoch": 1.57, - "learning_rate": 9.734118274693423e-07, - "loss": 0.5747, - "step": 61241 - }, - { - "epoch": 1.57, - "learning_rate": 9.73384166807907e-07, - "loss": 0.835, - "step": 61242 - }, - { - "epoch": 1.57, - "learning_rate": 9.733565061668503e-07, - "loss": 0.7695, - "step": 61243 - }, - { - "epoch": 1.57, - "learning_rate": 9.73328845546193e-07, - "loss": 0.5195, - "step": 61244 - }, - { - "epoch": 1.57, - "learning_rate": 9.733011849459568e-07, - "loss": 0.667, - "step": 61245 - }, - { - "epoch": 1.57, - "learning_rate": 9.732735243661623e-07, - "loss": 0.5278, - "step": 61246 - }, - { - "epoch": 1.57, - "learning_rate": 9.732458638068314e-07, - "loss": 0.7461, - "step": 61247 - }, - { - "epoch": 1.57, - "learning_rate": 9.732182032679846e-07, - "loss": 0.5159, - "step": 61248 - }, - { - "epoch": 1.57, - "learning_rate": 9.731905427496437e-07, - "loss": 0.5, - "step": 61249 - }, - { - "epoch": 1.57, - "learning_rate": 9.731628822518291e-07, - "loss": 0.6387, - "step": 61250 - }, - { - "epoch": 1.57, - "learning_rate": 9.73135221774563e-07, - "loss": 0.7695, - "step": 61251 - }, - { - "epoch": 1.57, - "learning_rate": 9.73107561317866e-07, - "loss": 0.6426, - "step": 61252 - }, - { - "epoch": 1.57, - "learning_rate": 9.730799008817592e-07, - "loss": 0.3396, - "step": 61253 - }, - { - "epoch": 1.57, - "learning_rate": 9.730522404662637e-07, - "loss": 0.6338, - "step": 61254 - }, - { - "epoch": 1.57, - "learning_rate": 9.73024580071401e-07, - "loss": 0.6045, - "step": 61255 - }, - { - "epoch": 1.57, - "learning_rate": 9.72996919697192e-07, - "loss": 0.7871, - "step": 61256 - }, - { - "epoch": 1.57, - "learning_rate": 9.72969259343658e-07, - "loss": 0.4629, - "step": 61257 - }, - { - "epoch": 1.57, - "learning_rate": 9.729415990108203e-07, - "loss": 0.6562, - "step": 61258 - }, - { - "epoch": 1.57, - "learning_rate": 9.729139386986999e-07, - "loss": 0.5967, - "step": 61259 - }, - { - "epoch": 1.57, - "learning_rate": 9.72886278407318e-07, - "loss": 0.6279, - "step": 61260 - }, - { - "epoch": 1.57, - "learning_rate": 9.72858618136696e-07, - "loss": 0.8145, - "step": 61261 - }, - { - "epoch": 1.57, - "learning_rate": 9.728309578868551e-07, - "loss": 0.6533, - "step": 61262 - }, - { - "epoch": 1.57, - "learning_rate": 9.72803297657816e-07, - "loss": 0.7471, - "step": 61263 - }, - { - "epoch": 1.57, - "learning_rate": 9.727756374496003e-07, - "loss": 0.5056, - "step": 61264 - }, - { - "epoch": 1.57, - "learning_rate": 9.727479772622288e-07, - "loss": 0.5708, - "step": 61265 - }, - { - "epoch": 1.57, - "learning_rate": 9.727203170957231e-07, - "loss": 0.6851, - "step": 61266 - }, - { - "epoch": 1.57, - "learning_rate": 9.72692656950104e-07, - "loss": 0.5996, - "step": 61267 - }, - { - "epoch": 1.57, - "learning_rate": 9.726649968253933e-07, - "loss": 0.5793, - "step": 61268 - }, - { - "epoch": 1.57, - "learning_rate": 9.726373367216112e-07, - "loss": 0.7139, - "step": 61269 - }, - { - "epoch": 1.57, - "learning_rate": 9.7260967663878e-07, - "loss": 0.668, - "step": 61270 - }, - { - "epoch": 1.57, - "learning_rate": 9.725820165769196e-07, - "loss": 0.6963, - "step": 61271 - }, - { - "epoch": 1.57, - "learning_rate": 9.72554356536053e-07, - "loss": 0.4697, - "step": 61272 - }, - { - "epoch": 1.57, - "learning_rate": 9.725266965161995e-07, - "loss": 0.6597, - "step": 61273 - }, - { - "epoch": 1.57, - "learning_rate": 9.724990365173812e-07, - "loss": 0.6875, - "step": 61274 - }, - { - "epoch": 1.57, - "learning_rate": 9.72471376539619e-07, - "loss": 0.5327, - "step": 61275 - }, - { - "epoch": 1.57, - "learning_rate": 9.724437165829344e-07, - "loss": 0.7529, - "step": 61276 - }, - { - "epoch": 1.57, - "learning_rate": 9.724160566473481e-07, - "loss": 0.5229, - "step": 61277 - }, - { - "epoch": 1.57, - "learning_rate": 9.723883967328818e-07, - "loss": 0.7334, - "step": 61278 - }, - { - "epoch": 1.57, - "learning_rate": 9.72360736839556e-07, - "loss": 0.5879, - "step": 61279 - }, - { - "epoch": 1.57, - "learning_rate": 9.723330769673928e-07, - "loss": 0.6602, - "step": 61280 - }, - { - "epoch": 1.57, - "learning_rate": 9.723054171164127e-07, - "loss": 0.5977, - "step": 61281 - }, - { - "epoch": 1.57, - "learning_rate": 9.722777572866373e-07, - "loss": 0.7861, - "step": 61282 - }, - { - "epoch": 1.57, - "learning_rate": 9.722500974780875e-07, - "loss": 0.6875, - "step": 61283 - }, - { - "epoch": 1.57, - "learning_rate": 9.722224376907843e-07, - "loss": 0.3678, - "step": 61284 - }, - { - "epoch": 1.57, - "learning_rate": 9.721947779247493e-07, - "loss": 0.6919, - "step": 61285 - }, - { - "epoch": 1.57, - "learning_rate": 9.721671181800031e-07, - "loss": 0.7148, - "step": 61286 - }, - { - "epoch": 1.57, - "learning_rate": 9.721394584565677e-07, - "loss": 0.5737, - "step": 61287 - }, - { - "epoch": 1.57, - "learning_rate": 9.721117987544635e-07, - "loss": 0.7188, - "step": 61288 - }, - { - "epoch": 1.57, - "learning_rate": 9.720841390737121e-07, - "loss": 0.5781, - "step": 61289 - }, - { - "epoch": 1.57, - "learning_rate": 9.720564794143348e-07, - "loss": 0.6826, - "step": 61290 - }, - { - "epoch": 1.57, - "learning_rate": 9.720288197763523e-07, - "loss": 0.5381, - "step": 61291 - }, - { - "epoch": 1.57, - "learning_rate": 9.720011601597866e-07, - "loss": 0.7666, - "step": 61292 - }, - { - "epoch": 1.57, - "learning_rate": 9.71973500564658e-07, - "loss": 0.7207, - "step": 61293 - }, - { - "epoch": 1.57, - "learning_rate": 9.719458409909877e-07, - "loss": 0.6191, - "step": 61294 - }, - { - "epoch": 1.57, - "learning_rate": 9.719181814387975e-07, - "loss": 0.6934, - "step": 61295 - }, - { - "epoch": 1.57, - "learning_rate": 9.71890521908108e-07, - "loss": 0.4392, - "step": 61296 - }, - { - "epoch": 1.57, - "learning_rate": 9.718628623989408e-07, - "loss": 0.7109, - "step": 61297 - }, - { - "epoch": 1.57, - "learning_rate": 9.718352029113168e-07, - "loss": 0.48, - "step": 61298 - }, - { - "epoch": 1.57, - "learning_rate": 9.718075434452574e-07, - "loss": 0.5203, - "step": 61299 - }, - { - "epoch": 1.57, - "learning_rate": 9.717798840007835e-07, - "loss": 0.8047, - "step": 61300 - }, - { - "epoch": 1.57, - "learning_rate": 9.717522245779167e-07, - "loss": 0.5278, - "step": 61301 - }, - { - "epoch": 1.57, - "learning_rate": 9.717245651766782e-07, - "loss": 0.6538, - "step": 61302 - }, - { - "epoch": 1.57, - "learning_rate": 9.716969057970883e-07, - "loss": 0.6343, - "step": 61303 - }, - { - "epoch": 1.57, - "learning_rate": 9.71669246439169e-07, - "loss": 0.5679, - "step": 61304 - }, - { - "epoch": 1.57, - "learning_rate": 9.71641587102941e-07, - "loss": 0.4775, - "step": 61305 - }, - { - "epoch": 1.57, - "learning_rate": 9.716139277884263e-07, - "loss": 0.7761, - "step": 61306 - }, - { - "epoch": 1.57, - "learning_rate": 9.715862684956452e-07, - "loss": 0.5243, - "step": 61307 - }, - { - "epoch": 1.57, - "learning_rate": 9.71558609224619e-07, - "loss": 0.8184, - "step": 61308 - }, - { - "epoch": 1.57, - "learning_rate": 9.715309499753695e-07, - "loss": 0.4261, - "step": 61309 - }, - { - "epoch": 1.57, - "learning_rate": 9.71503290747917e-07, - "loss": 0.5771, - "step": 61310 - }, - { - "epoch": 1.57, - "learning_rate": 9.714756315422834e-07, - "loss": 0.5815, - "step": 61311 - }, - { - "epoch": 1.57, - "learning_rate": 9.714479723584898e-07, - "loss": 0.7476, - "step": 61312 - }, - { - "epoch": 1.57, - "learning_rate": 9.714203131965568e-07, - "loss": 0.6558, - "step": 61313 - }, - { - "epoch": 1.57, - "learning_rate": 9.71392654056506e-07, - "loss": 0.6445, - "step": 61314 - }, - { - "epoch": 1.57, - "learning_rate": 9.713649949383583e-07, - "loss": 0.5718, - "step": 61315 - }, - { - "epoch": 1.57, - "learning_rate": 9.713373358421355e-07, - "loss": 0.6431, - "step": 61316 - }, - { - "epoch": 1.57, - "learning_rate": 9.71309676767858e-07, - "loss": 0.6919, - "step": 61317 - }, - { - "epoch": 1.57, - "learning_rate": 9.712820177155478e-07, - "loss": 0.5109, - "step": 61318 - }, - { - "epoch": 1.57, - "learning_rate": 9.712543586852252e-07, - "loss": 0.3787, - "step": 61319 - }, - { - "epoch": 1.57, - "learning_rate": 9.712266996769122e-07, - "loss": 0.668, - "step": 61320 - }, - { - "epoch": 1.57, - "learning_rate": 9.711990406906294e-07, - "loss": 0.4607, - "step": 61321 - }, - { - "epoch": 1.57, - "learning_rate": 9.711713817263985e-07, - "loss": 0.6758, - "step": 61322 - }, - { - "epoch": 1.57, - "learning_rate": 9.711437227842404e-07, - "loss": 0.9092, - "step": 61323 - }, - { - "epoch": 1.57, - "learning_rate": 9.711160638641759e-07, - "loss": 0.5404, - "step": 61324 - }, - { - "epoch": 1.57, - "learning_rate": 9.710884049662263e-07, - "loss": 0.5874, - "step": 61325 - }, - { - "epoch": 1.57, - "learning_rate": 9.710607460904132e-07, - "loss": 0.4418, - "step": 61326 - }, - { - "epoch": 1.57, - "learning_rate": 9.710330872367575e-07, - "loss": 0.6337, - "step": 61327 - }, - { - "epoch": 1.57, - "learning_rate": 9.710054284052806e-07, - "loss": 0.7334, - "step": 61328 - }, - { - "epoch": 1.57, - "learning_rate": 9.709777695960031e-07, - "loss": 0.8887, - "step": 61329 - }, - { - "epoch": 1.57, - "learning_rate": 9.70950110808947e-07, - "loss": 0.626, - "step": 61330 - }, - { - "epoch": 1.57, - "learning_rate": 9.709224520441328e-07, - "loss": 0.6738, - "step": 61331 - }, - { - "epoch": 1.57, - "learning_rate": 9.708947933015824e-07, - "loss": 0.6128, - "step": 61332 - }, - { - "epoch": 1.57, - "learning_rate": 9.708671345813163e-07, - "loss": 0.7705, - "step": 61333 - }, - { - "epoch": 1.57, - "learning_rate": 9.708394758833557e-07, - "loss": 0.5479, - "step": 61334 - }, - { - "epoch": 1.57, - "learning_rate": 9.70811817207722e-07, - "loss": 0.6245, - "step": 61335 - }, - { - "epoch": 1.57, - "learning_rate": 9.707841585544362e-07, - "loss": 0.6533, - "step": 61336 - }, - { - "epoch": 1.57, - "learning_rate": 9.7075649992352e-07, - "loss": 0.4175, - "step": 61337 - }, - { - "epoch": 1.57, - "learning_rate": 9.70728841314994e-07, - "loss": 0.7471, - "step": 61338 - }, - { - "epoch": 1.57, - "learning_rate": 9.707011827288796e-07, - "loss": 0.5356, - "step": 61339 - }, - { - "epoch": 1.57, - "learning_rate": 9.706735241651979e-07, - "loss": 0.5884, - "step": 61340 - }, - { - "epoch": 1.57, - "learning_rate": 9.706458656239701e-07, - "loss": 0.4736, - "step": 61341 - }, - { - "epoch": 1.57, - "learning_rate": 9.70618207105218e-07, - "loss": 0.6338, - "step": 61342 - }, - { - "epoch": 1.57, - "learning_rate": 9.70590548608962e-07, - "loss": 0.7061, - "step": 61343 - }, - { - "epoch": 1.57, - "learning_rate": 9.705628901352228e-07, - "loss": 0.7148, - "step": 61344 - }, - { - "epoch": 1.57, - "learning_rate": 9.705352316840228e-07, - "loss": 0.5459, - "step": 61345 - }, - { - "epoch": 1.57, - "learning_rate": 9.705075732553822e-07, - "loss": 0.687, - "step": 61346 - }, - { - "epoch": 1.57, - "learning_rate": 9.70479914849323e-07, - "loss": 0.7656, - "step": 61347 - }, - { - "epoch": 1.57, - "learning_rate": 9.704522564658657e-07, - "loss": 0.532, - "step": 61348 - }, - { - "epoch": 1.57, - "learning_rate": 9.704245981050318e-07, - "loss": 0.6973, - "step": 61349 - }, - { - "epoch": 1.57, - "learning_rate": 9.703969397668423e-07, - "loss": 0.7783, - "step": 61350 - }, - { - "epoch": 1.57, - "learning_rate": 9.703692814513188e-07, - "loss": 0.8232, - "step": 61351 - }, - { - "epoch": 1.57, - "learning_rate": 9.703416231584824e-07, - "loss": 0.6631, - "step": 61352 - }, - { - "epoch": 1.57, - "learning_rate": 9.703139648883536e-07, - "loss": 0.6689, - "step": 61353 - }, - { - "epoch": 1.57, - "learning_rate": 9.702863066409542e-07, - "loss": 0.6094, - "step": 61354 - }, - { - "epoch": 1.57, - "learning_rate": 9.70258648416305e-07, - "loss": 0.5381, - "step": 61355 - }, - { - "epoch": 1.57, - "learning_rate": 9.702309902144277e-07, - "loss": 0.626, - "step": 61356 - }, - { - "epoch": 1.57, - "learning_rate": 9.702033320353427e-07, - "loss": 0.6299, - "step": 61357 - }, - { - "epoch": 1.57, - "learning_rate": 9.70175673879072e-07, - "loss": 0.7236, - "step": 61358 - }, - { - "epoch": 1.57, - "learning_rate": 9.701480157456364e-07, - "loss": 0.7324, - "step": 61359 - }, - { - "epoch": 1.57, - "learning_rate": 9.701203576350571e-07, - "loss": 0.5066, - "step": 61360 - }, - { - "epoch": 1.57, - "learning_rate": 9.700926995473551e-07, - "loss": 0.5635, - "step": 61361 - }, - { - "epoch": 1.57, - "learning_rate": 9.700650414825523e-07, - "loss": 0.5811, - "step": 61362 - }, - { - "epoch": 1.57, - "learning_rate": 9.700373834406687e-07, - "loss": 0.6113, - "step": 61363 - }, - { - "epoch": 1.57, - "learning_rate": 9.700097254217265e-07, - "loss": 0.7056, - "step": 61364 - }, - { - "epoch": 1.57, - "learning_rate": 9.699820674257462e-07, - "loss": 0.6553, - "step": 61365 - }, - { - "epoch": 1.57, - "learning_rate": 9.699544094527492e-07, - "loss": 0.7065, - "step": 61366 - }, - { - "epoch": 1.57, - "learning_rate": 9.699267515027568e-07, - "loss": 0.6191, - "step": 61367 - }, - { - "epoch": 1.57, - "learning_rate": 9.698990935757901e-07, - "loss": 0.6338, - "step": 61368 - }, - { - "epoch": 1.57, - "learning_rate": 9.698714356718702e-07, - "loss": 0.7632, - "step": 61369 - }, - { - "epoch": 1.57, - "learning_rate": 9.698437777910185e-07, - "loss": 0.3727, - "step": 61370 - }, - { - "epoch": 1.57, - "learning_rate": 9.698161199332558e-07, - "loss": 0.4746, - "step": 61371 - }, - { - "epoch": 1.57, - "learning_rate": 9.69788462098604e-07, - "loss": 0.7109, - "step": 61372 - }, - { - "epoch": 1.57, - "learning_rate": 9.697608042870837e-07, - "loss": 0.5916, - "step": 61373 - }, - { - "epoch": 1.57, - "learning_rate": 9.697331464987158e-07, - "loss": 0.623, - "step": 61374 - }, - { - "epoch": 1.57, - "learning_rate": 9.69705488733522e-07, - "loss": 0.6772, - "step": 61375 - }, - { - "epoch": 1.57, - "learning_rate": 9.696778309915233e-07, - "loss": 0.4282, - "step": 61376 - }, - { - "epoch": 1.57, - "learning_rate": 9.69650173272741e-07, - "loss": 0.6616, - "step": 61377 - }, - { - "epoch": 1.57, - "learning_rate": 9.696225155771958e-07, - "loss": 0.7104, - "step": 61378 - }, - { - "epoch": 1.57, - "learning_rate": 9.695948579049097e-07, - "loss": 0.5989, - "step": 61379 - }, - { - "epoch": 1.57, - "learning_rate": 9.695672002559033e-07, - "loss": 0.707, - "step": 61380 - }, - { - "epoch": 1.57, - "learning_rate": 9.695395426301977e-07, - "loss": 0.6816, - "step": 61381 - }, - { - "epoch": 1.57, - "learning_rate": 9.695118850278147e-07, - "loss": 0.7188, - "step": 61382 - }, - { - "epoch": 1.57, - "learning_rate": 9.694842274487748e-07, - "loss": 0.645, - "step": 61383 - }, - { - "epoch": 1.57, - "learning_rate": 9.694565698930991e-07, - "loss": 0.6968, - "step": 61384 - }, - { - "epoch": 1.57, - "learning_rate": 9.694289123608096e-07, - "loss": 0.6338, - "step": 61385 - }, - { - "epoch": 1.57, - "learning_rate": 9.694012548519266e-07, - "loss": 0.4893, - "step": 61386 - }, - { - "epoch": 1.57, - "learning_rate": 9.693735973664718e-07, - "loss": 0.6978, - "step": 61387 - }, - { - "epoch": 1.57, - "learning_rate": 9.69345939904466e-07, - "loss": 0.5757, - "step": 61388 - }, - { - "epoch": 1.57, - "learning_rate": 9.69318282465931e-07, - "loss": 0.6553, - "step": 61389 - }, - { - "epoch": 1.57, - "learning_rate": 9.692906250508874e-07, - "loss": 0.6753, - "step": 61390 - }, - { - "epoch": 1.57, - "learning_rate": 9.692629676593565e-07, - "loss": 0.7529, - "step": 61391 - }, - { - "epoch": 1.57, - "learning_rate": 9.6923531029136e-07, - "loss": 0.689, - "step": 61392 - }, - { - "epoch": 1.57, - "learning_rate": 9.69207652946918e-07, - "loss": 0.6729, - "step": 61393 - }, - { - "epoch": 1.57, - "learning_rate": 9.691799956260528e-07, - "loss": 0.666, - "step": 61394 - }, - { - "epoch": 1.57, - "learning_rate": 9.691523383287844e-07, - "loss": 0.4927, - "step": 61395 - }, - { - "epoch": 1.57, - "learning_rate": 9.69124681055135e-07, - "loss": 0.6689, - "step": 61396 - }, - { - "epoch": 1.57, - "learning_rate": 9.690970238051256e-07, - "loss": 0.5488, - "step": 61397 - }, - { - "epoch": 1.57, - "learning_rate": 9.690693665787768e-07, - "loss": 0.5833, - "step": 61398 - }, - { - "epoch": 1.57, - "learning_rate": 9.690417093761105e-07, - "loss": 0.5627, - "step": 61399 - }, - { - "epoch": 1.57, - "learning_rate": 9.690140521971472e-07, - "loss": 0.6191, - "step": 61400 - }, - { - "epoch": 1.57, - "learning_rate": 9.689863950419087e-07, - "loss": 0.6641, - "step": 61401 - }, - { - "epoch": 1.57, - "learning_rate": 9.68958737910416e-07, - "loss": 0.7344, - "step": 61402 - }, - { - "epoch": 1.57, - "learning_rate": 9.6893108080269e-07, - "loss": 0.5315, - "step": 61403 - }, - { - "epoch": 1.57, - "learning_rate": 9.68903423718752e-07, - "loss": 0.7529, - "step": 61404 - }, - { - "epoch": 1.57, - "learning_rate": 9.68875766658623e-07, - "loss": 0.5244, - "step": 61405 - }, - { - "epoch": 1.57, - "learning_rate": 9.68848109622325e-07, - "loss": 0.6318, - "step": 61406 - }, - { - "epoch": 1.57, - "learning_rate": 9.68820452609878e-07, - "loss": 0.8496, - "step": 61407 - }, - { - "epoch": 1.57, - "learning_rate": 9.68792795621304e-07, - "loss": 0.6558, - "step": 61408 - }, - { - "epoch": 1.57, - "learning_rate": 9.687651386566237e-07, - "loss": 0.5947, - "step": 61409 - }, - { - "epoch": 1.57, - "learning_rate": 9.687374817158587e-07, - "loss": 0.4824, - "step": 61410 - }, - { - "epoch": 1.57, - "learning_rate": 9.687098247990297e-07, - "loss": 0.7266, - "step": 61411 - }, - { - "epoch": 1.57, - "learning_rate": 9.686821679061587e-07, - "loss": 0.5688, - "step": 61412 - }, - { - "epoch": 1.57, - "learning_rate": 9.68654511037266e-07, - "loss": 0.7139, - "step": 61413 - }, - { - "epoch": 1.57, - "learning_rate": 9.686268541923732e-07, - "loss": 0.7393, - "step": 61414 - }, - { - "epoch": 1.57, - "learning_rate": 9.685991973715011e-07, - "loss": 0.4573, - "step": 61415 - }, - { - "epoch": 1.57, - "learning_rate": 9.685715405746714e-07, - "loss": 0.8174, - "step": 61416 - }, - { - "epoch": 1.57, - "learning_rate": 9.68543883801905e-07, - "loss": 0.5273, - "step": 61417 - }, - { - "epoch": 1.57, - "learning_rate": 9.685162270532231e-07, - "loss": 0.5737, - "step": 61418 - }, - { - "epoch": 1.57, - "learning_rate": 9.684885703286466e-07, - "loss": 0.8008, - "step": 61419 - }, - { - "epoch": 1.57, - "learning_rate": 9.684609136281974e-07, - "loss": 0.7734, - "step": 61420 - }, - { - "epoch": 1.57, - "learning_rate": 9.684332569518959e-07, - "loss": 0.5747, - "step": 61421 - }, - { - "epoch": 1.57, - "learning_rate": 9.68405600299764e-07, - "loss": 0.7275, - "step": 61422 - }, - { - "epoch": 1.57, - "learning_rate": 9.683779436718223e-07, - "loss": 0.6953, - "step": 61423 - }, - { - "epoch": 1.57, - "learning_rate": 9.683502870680918e-07, - "loss": 0.6111, - "step": 61424 - }, - { - "epoch": 1.57, - "learning_rate": 9.683226304885945e-07, - "loss": 0.5342, - "step": 61425 - }, - { - "epoch": 1.57, - "learning_rate": 9.682949739333507e-07, - "loss": 0.6631, - "step": 61426 - }, - { - "epoch": 1.57, - "learning_rate": 9.682673174023822e-07, - "loss": 0.4697, - "step": 61427 - }, - { - "epoch": 1.57, - "learning_rate": 9.682396608957098e-07, - "loss": 0.5684, - "step": 61428 - }, - { - "epoch": 1.57, - "learning_rate": 9.68212004413355e-07, - "loss": 0.6826, - "step": 61429 - }, - { - "epoch": 1.57, - "learning_rate": 9.681843479553386e-07, - "loss": 0.3916, - "step": 61430 - }, - { - "epoch": 1.57, - "learning_rate": 9.681566915216823e-07, - "loss": 0.8154, - "step": 61431 - }, - { - "epoch": 1.57, - "learning_rate": 9.68129035112407e-07, - "loss": 0.6865, - "step": 61432 - }, - { - "epoch": 1.57, - "learning_rate": 9.681013787275338e-07, - "loss": 0.543, - "step": 61433 - }, - { - "epoch": 1.57, - "learning_rate": 9.680737223670836e-07, - "loss": 0.6641, - "step": 61434 - }, - { - "epoch": 1.57, - "learning_rate": 9.680460660310782e-07, - "loss": 0.6367, - "step": 61435 - }, - { - "epoch": 1.57, - "learning_rate": 9.68018409719538e-07, - "loss": 0.8086, - "step": 61436 - }, - { - "epoch": 1.57, - "learning_rate": 9.67990753432485e-07, - "loss": 0.5693, - "step": 61437 - }, - { - "epoch": 1.57, - "learning_rate": 9.679630971699397e-07, - "loss": 0.6348, - "step": 61438 - }, - { - "epoch": 1.57, - "learning_rate": 9.67935440931924e-07, - "loss": 0.7715, - "step": 61439 - }, - { - "epoch": 1.57, - "learning_rate": 9.679077847184582e-07, - "loss": 0.728, - "step": 61440 - }, - { - "epoch": 1.57, - "learning_rate": 9.678801285295644e-07, - "loss": 0.5024, - "step": 61441 - }, - { - "epoch": 1.57, - "learning_rate": 9.678524723652633e-07, - "loss": 0.8652, - "step": 61442 - }, - { - "epoch": 1.57, - "learning_rate": 9.67824816225576e-07, - "loss": 0.5698, - "step": 61443 - }, - { - "epoch": 1.57, - "learning_rate": 9.677971601105236e-07, - "loss": 0.6313, - "step": 61444 - }, - { - "epoch": 1.57, - "learning_rate": 9.677695040201272e-07, - "loss": 0.6001, - "step": 61445 - }, - { - "epoch": 1.57, - "learning_rate": 9.677418479544087e-07, - "loss": 0.688, - "step": 61446 - }, - { - "epoch": 1.57, - "learning_rate": 9.677141919133884e-07, - "loss": 0.6963, - "step": 61447 - }, - { - "epoch": 1.57, - "learning_rate": 9.676865358970882e-07, - "loss": 0.7524, - "step": 61448 - }, - { - "epoch": 1.57, - "learning_rate": 9.676588799055285e-07, - "loss": 0.6592, - "step": 61449 - }, - { - "epoch": 1.57, - "learning_rate": 9.676312239387314e-07, - "loss": 0.5669, - "step": 61450 - }, - { - "epoch": 1.58, - "learning_rate": 9.676035679967172e-07, - "loss": 0.626, - "step": 61451 - }, - { - "epoch": 1.58, - "learning_rate": 9.675759120795082e-07, - "loss": 0.532, - "step": 61452 - }, - { - "epoch": 1.58, - "learning_rate": 9.67548256187124e-07, - "loss": 0.5752, - "step": 61453 - }, - { - "epoch": 1.58, - "learning_rate": 9.675206003195868e-07, - "loss": 0.6494, - "step": 61454 - }, - { - "epoch": 1.58, - "learning_rate": 9.674929444769177e-07, - "loss": 0.6631, - "step": 61455 - }, - { - "epoch": 1.58, - "learning_rate": 9.674652886591377e-07, - "loss": 0.3945, - "step": 61456 - }, - { - "epoch": 1.58, - "learning_rate": 9.67437632866268e-07, - "loss": 0.6235, - "step": 61457 - }, - { - "epoch": 1.58, - "learning_rate": 9.674099770983299e-07, - "loss": 0.6758, - "step": 61458 - }, - { - "epoch": 1.58, - "learning_rate": 9.67382321355344e-07, - "loss": 0.6416, - "step": 61459 - }, - { - "epoch": 1.58, - "learning_rate": 9.673546656373326e-07, - "loss": 0.5869, - "step": 61460 - }, - { - "epoch": 1.58, - "learning_rate": 9.67327009944316e-07, - "loss": 0.606, - "step": 61461 - }, - { - "epoch": 1.58, - "learning_rate": 9.672993542763157e-07, - "loss": 0.7891, - "step": 61462 - }, - { - "epoch": 1.58, - "learning_rate": 9.672716986333529e-07, - "loss": 0.5386, - "step": 61463 - }, - { - "epoch": 1.58, - "learning_rate": 9.672440430154484e-07, - "loss": 0.6724, - "step": 61464 - }, - { - "epoch": 1.58, - "learning_rate": 9.672163874226238e-07, - "loss": 0.752, - "step": 61465 - }, - { - "epoch": 1.58, - "learning_rate": 9.671887318548997e-07, - "loss": 0.7051, - "step": 61466 - }, - { - "epoch": 1.58, - "learning_rate": 9.67161076312298e-07, - "loss": 0.6143, - "step": 61467 - }, - { - "epoch": 1.58, - "learning_rate": 9.671334207948395e-07, - "loss": 0.7905, - "step": 61468 - }, - { - "epoch": 1.58, - "learning_rate": 9.671057653025454e-07, - "loss": 0.5875, - "step": 61469 - }, - { - "epoch": 1.58, - "learning_rate": 9.670781098354372e-07, - "loss": 0.6733, - "step": 61470 - }, - { - "epoch": 1.58, - "learning_rate": 9.670504543935358e-07, - "loss": 0.5986, - "step": 61471 - }, - { - "epoch": 1.58, - "learning_rate": 9.670227989768618e-07, - "loss": 0.5327, - "step": 61472 - }, - { - "epoch": 1.58, - "learning_rate": 9.669951435854375e-07, - "loss": 0.6768, - "step": 61473 - }, - { - "epoch": 1.58, - "learning_rate": 9.669674882192829e-07, - "loss": 0.5241, - "step": 61474 - }, - { - "epoch": 1.58, - "learning_rate": 9.669398328784203e-07, - "loss": 0.6724, - "step": 61475 - }, - { - "epoch": 1.58, - "learning_rate": 9.6691217756287e-07, - "loss": 0.6289, - "step": 61476 - }, - { - "epoch": 1.58, - "learning_rate": 9.668845222726535e-07, - "loss": 0.7441, - "step": 61477 - }, - { - "epoch": 1.58, - "learning_rate": 9.668568670077922e-07, - "loss": 0.4766, - "step": 61478 - }, - { - "epoch": 1.58, - "learning_rate": 9.668292117683071e-07, - "loss": 0.8262, - "step": 61479 - }, - { - "epoch": 1.58, - "learning_rate": 9.66801556554219e-07, - "loss": 0.3895, - "step": 61480 - }, - { - "epoch": 1.58, - "learning_rate": 9.6677390136555e-07, - "loss": 0.748, - "step": 61481 - }, - { - "epoch": 1.58, - "learning_rate": 9.667462462023206e-07, - "loss": 0.606, - "step": 61482 - }, - { - "epoch": 1.58, - "learning_rate": 9.667185910645517e-07, - "loss": 0.5337, - "step": 61483 - }, - { - "epoch": 1.58, - "learning_rate": 9.666909359522652e-07, - "loss": 0.6504, - "step": 61484 - }, - { - "epoch": 1.58, - "learning_rate": 9.666632808654815e-07, - "loss": 0.6855, - "step": 61485 - }, - { - "epoch": 1.58, - "learning_rate": 9.666356258042226e-07, - "loss": 0.8535, - "step": 61486 - }, - { - "epoch": 1.58, - "learning_rate": 9.66607970768509e-07, - "loss": 0.4211, - "step": 61487 - }, - { - "epoch": 1.58, - "learning_rate": 9.665803157583622e-07, - "loss": 0.668, - "step": 61488 - }, - { - "epoch": 1.58, - "learning_rate": 9.665526607738033e-07, - "loss": 0.5232, - "step": 61489 - }, - { - "epoch": 1.58, - "learning_rate": 9.665250058148535e-07, - "loss": 0.5203, - "step": 61490 - }, - { - "epoch": 1.58, - "learning_rate": 9.664973508815342e-07, - "loss": 0.6318, - "step": 61491 - }, - { - "epoch": 1.58, - "learning_rate": 9.664696959738662e-07, - "loss": 0.6006, - "step": 61492 - }, - { - "epoch": 1.58, - "learning_rate": 9.664420410918706e-07, - "loss": 0.7705, - "step": 61493 - }, - { - "epoch": 1.58, - "learning_rate": 9.664143862355692e-07, - "loss": 0.623, - "step": 61494 - }, - { - "epoch": 1.58, - "learning_rate": 9.663867314049823e-07, - "loss": 0.519, - "step": 61495 - }, - { - "epoch": 1.58, - "learning_rate": 9.663590766001317e-07, - "loss": 0.6226, - "step": 61496 - }, - { - "epoch": 1.58, - "learning_rate": 9.663314218210383e-07, - "loss": 0.5669, - "step": 61497 - }, - { - "epoch": 1.58, - "learning_rate": 9.663037670677236e-07, - "loss": 0.7393, - "step": 61498 - }, - { - "epoch": 1.58, - "learning_rate": 9.662761123402084e-07, - "loss": 0.6797, - "step": 61499 - }, - { - "epoch": 1.58, - "learning_rate": 9.66248457638514e-07, - "loss": 0.792, - "step": 61500 - }, - { - "epoch": 1.58, - "learning_rate": 9.66220802962662e-07, - "loss": 0.5913, - "step": 61501 - }, - { - "epoch": 1.58, - "learning_rate": 9.66193148312673e-07, - "loss": 0.6099, - "step": 61502 - }, - { - "epoch": 1.58, - "learning_rate": 9.661654936885682e-07, - "loss": 0.6172, - "step": 61503 - }, - { - "epoch": 1.58, - "learning_rate": 9.66137839090369e-07, - "loss": 0.666, - "step": 61504 - }, - { - "epoch": 1.58, - "learning_rate": 9.661101845180964e-07, - "loss": 0.6431, - "step": 61505 - }, - { - "epoch": 1.58, - "learning_rate": 9.660825299717719e-07, - "loss": 0.7227, - "step": 61506 - }, - { - "epoch": 1.58, - "learning_rate": 9.66054875451416e-07, - "loss": 0.5049, - "step": 61507 - }, - { - "epoch": 1.58, - "learning_rate": 9.660272209570509e-07, - "loss": 0.6392, - "step": 61508 - }, - { - "epoch": 1.58, - "learning_rate": 9.659995664886966e-07, - "loss": 0.7334, - "step": 61509 - }, - { - "epoch": 1.58, - "learning_rate": 9.659719120463754e-07, - "loss": 0.6226, - "step": 61510 - }, - { - "epoch": 1.58, - "learning_rate": 9.659442576301079e-07, - "loss": 0.4514, - "step": 61511 - }, - { - "epoch": 1.58, - "learning_rate": 9.65916603239915e-07, - "loss": 0.3894, - "step": 61512 - }, - { - "epoch": 1.58, - "learning_rate": 9.658889488758184e-07, - "loss": 0.5908, - "step": 61513 - }, - { - "epoch": 1.58, - "learning_rate": 9.658612945378387e-07, - "loss": 0.583, - "step": 61514 - }, - { - "epoch": 1.58, - "learning_rate": 9.65833640225998e-07, - "loss": 0.5947, - "step": 61515 - }, - { - "epoch": 1.58, - "learning_rate": 9.658059859403164e-07, - "loss": 0.72, - "step": 61516 - }, - { - "epoch": 1.58, - "learning_rate": 9.657783316808159e-07, - "loss": 0.6455, - "step": 61517 - }, - { - "epoch": 1.58, - "learning_rate": 9.657506774475172e-07, - "loss": 0.6572, - "step": 61518 - }, - { - "epoch": 1.58, - "learning_rate": 9.657230232404418e-07, - "loss": 0.71, - "step": 61519 - }, - { - "epoch": 1.58, - "learning_rate": 9.656953690596103e-07, - "loss": 0.7461, - "step": 61520 - }, - { - "epoch": 1.58, - "learning_rate": 9.656677149050449e-07, - "loss": 0.7432, - "step": 61521 - }, - { - "epoch": 1.58, - "learning_rate": 9.65640060776766e-07, - "loss": 0.751, - "step": 61522 - }, - { - "epoch": 1.58, - "learning_rate": 9.656124066747947e-07, - "loss": 0.8052, - "step": 61523 - }, - { - "epoch": 1.58, - "learning_rate": 9.655847525991524e-07, - "loss": 0.6025, - "step": 61524 - }, - { - "epoch": 1.58, - "learning_rate": 9.655570985498605e-07, - "loss": 0.6826, - "step": 61525 - }, - { - "epoch": 1.58, - "learning_rate": 9.655294445269396e-07, - "loss": 0.8037, - "step": 61526 - }, - { - "epoch": 1.58, - "learning_rate": 9.655017905304114e-07, - "loss": 0.7534, - "step": 61527 - }, - { - "epoch": 1.58, - "learning_rate": 9.65474136560297e-07, - "loss": 0.5708, - "step": 61528 - }, - { - "epoch": 1.58, - "learning_rate": 9.654464826166173e-07, - "loss": 0.6426, - "step": 61529 - }, - { - "epoch": 1.58, - "learning_rate": 9.654188286993936e-07, - "loss": 0.5266, - "step": 61530 - }, - { - "epoch": 1.58, - "learning_rate": 9.653911748086476e-07, - "loss": 0.7598, - "step": 61531 - }, - { - "epoch": 1.58, - "learning_rate": 9.653635209443995e-07, - "loss": 0.4529, - "step": 61532 - }, - { - "epoch": 1.58, - "learning_rate": 9.65335867106671e-07, - "loss": 0.584, - "step": 61533 - }, - { - "epoch": 1.58, - "learning_rate": 9.653082132954833e-07, - "loss": 0.5776, - "step": 61534 - }, - { - "epoch": 1.58, - "learning_rate": 9.652805595108574e-07, - "loss": 0.5928, - "step": 61535 - }, - { - "epoch": 1.58, - "learning_rate": 9.652529057528148e-07, - "loss": 0.6641, - "step": 61536 - }, - { - "epoch": 1.58, - "learning_rate": 9.652252520213762e-07, - "loss": 0.6611, - "step": 61537 - }, - { - "epoch": 1.58, - "learning_rate": 9.651975983165632e-07, - "loss": 0.667, - "step": 61538 - }, - { - "epoch": 1.58, - "learning_rate": 9.651699446383966e-07, - "loss": 0.5239, - "step": 61539 - }, - { - "epoch": 1.58, - "learning_rate": 9.65142290986898e-07, - "loss": 0.5981, - "step": 61540 - }, - { - "epoch": 1.58, - "learning_rate": 9.651146373620885e-07, - "loss": 0.5908, - "step": 61541 - }, - { - "epoch": 1.58, - "learning_rate": 9.65086983763989e-07, - "loss": 0.6006, - "step": 61542 - }, - { - "epoch": 1.58, - "learning_rate": 9.650593301926205e-07, - "loss": 0.7246, - "step": 61543 - }, - { - "epoch": 1.58, - "learning_rate": 9.650316766480048e-07, - "loss": 0.5771, - "step": 61544 - }, - { - "epoch": 1.58, - "learning_rate": 9.650040231301624e-07, - "loss": 0.7637, - "step": 61545 - }, - { - "epoch": 1.58, - "learning_rate": 9.649763696391152e-07, - "loss": 0.6987, - "step": 61546 - }, - { - "epoch": 1.58, - "learning_rate": 9.649487161748835e-07, - "loss": 0.5962, - "step": 61547 - }, - { - "epoch": 1.58, - "learning_rate": 9.649210627374894e-07, - "loss": 0.7358, - "step": 61548 - }, - { - "epoch": 1.58, - "learning_rate": 9.648934093269532e-07, - "loss": 0.7666, - "step": 61549 - }, - { - "epoch": 1.58, - "learning_rate": 9.648657559432968e-07, - "loss": 0.6001, - "step": 61550 - }, - { - "epoch": 1.58, - "learning_rate": 9.648381025865415e-07, - "loss": 0.6558, - "step": 61551 - }, - { - "epoch": 1.58, - "learning_rate": 9.648104492567075e-07, - "loss": 0.4612, - "step": 61552 - }, - { - "epoch": 1.58, - "learning_rate": 9.647827959538167e-07, - "loss": 0.5488, - "step": 61553 - }, - { - "epoch": 1.58, - "learning_rate": 9.647551426778898e-07, - "loss": 0.499, - "step": 61554 - }, - { - "epoch": 1.58, - "learning_rate": 9.647274894289484e-07, - "loss": 0.6182, - "step": 61555 - }, - { - "epoch": 1.58, - "learning_rate": 9.646998362070135e-07, - "loss": 0.4961, - "step": 61556 - }, - { - "epoch": 1.58, - "learning_rate": 9.646721830121065e-07, - "loss": 0.6816, - "step": 61557 - }, - { - "epoch": 1.58, - "learning_rate": 9.646445298442482e-07, - "loss": 0.8066, - "step": 61558 - }, - { - "epoch": 1.58, - "learning_rate": 9.6461687670346e-07, - "loss": 0.4504, - "step": 61559 - }, - { - "epoch": 1.58, - "learning_rate": 9.645892235897632e-07, - "loss": 0.6934, - "step": 61560 - }, - { - "epoch": 1.58, - "learning_rate": 9.64561570503179e-07, - "loss": 0.6758, - "step": 61561 - }, - { - "epoch": 1.58, - "learning_rate": 9.64533917443728e-07, - "loss": 0.6602, - "step": 61562 - }, - { - "epoch": 1.58, - "learning_rate": 9.64506264411432e-07, - "loss": 0.7773, - "step": 61563 - }, - { - "epoch": 1.58, - "learning_rate": 9.644786114063114e-07, - "loss": 0.7202, - "step": 61564 - }, - { - "epoch": 1.58, - "learning_rate": 9.644509584283884e-07, - "loss": 0.7129, - "step": 61565 - }, - { - "epoch": 1.58, - "learning_rate": 9.644233054776834e-07, - "loss": 0.6699, - "step": 61566 - }, - { - "epoch": 1.58, - "learning_rate": 9.64395652554218e-07, - "loss": 0.4277, - "step": 61567 - }, - { - "epoch": 1.58, - "learning_rate": 9.64367999658013e-07, - "loss": 0.6021, - "step": 61568 - }, - { - "epoch": 1.58, - "learning_rate": 9.6434034678909e-07, - "loss": 0.4104, - "step": 61569 - }, - { - "epoch": 1.58, - "learning_rate": 9.643126939474699e-07, - "loss": 0.7109, - "step": 61570 - }, - { - "epoch": 1.58, - "learning_rate": 9.642850411331742e-07, - "loss": 0.6235, - "step": 61571 - }, - { - "epoch": 1.58, - "learning_rate": 9.642573883462235e-07, - "loss": 0.7227, - "step": 61572 - }, - { - "epoch": 1.58, - "learning_rate": 9.642297355866391e-07, - "loss": 0.7471, - "step": 61573 - }, - { - "epoch": 1.58, - "learning_rate": 9.642020828544427e-07, - "loss": 0.6836, - "step": 61574 - }, - { - "epoch": 1.58, - "learning_rate": 9.641744301496549e-07, - "loss": 0.6895, - "step": 61575 - }, - { - "epoch": 1.58, - "learning_rate": 9.64146777472297e-07, - "loss": 0.5042, - "step": 61576 - }, - { - "epoch": 1.58, - "learning_rate": 9.641191248223904e-07, - "loss": 0.4296, - "step": 61577 - }, - { - "epoch": 1.58, - "learning_rate": 9.640914721999563e-07, - "loss": 0.5493, - "step": 61578 - }, - { - "epoch": 1.58, - "learning_rate": 9.640638196050157e-07, - "loss": 0.4976, - "step": 61579 - }, - { - "epoch": 1.58, - "learning_rate": 9.640361670375894e-07, - "loss": 0.6367, - "step": 61580 - }, - { - "epoch": 1.58, - "learning_rate": 9.640085144976996e-07, - "loss": 0.5991, - "step": 61581 - }, - { - "epoch": 1.58, - "learning_rate": 9.639808619853665e-07, - "loss": 0.4822, - "step": 61582 - }, - { - "epoch": 1.58, - "learning_rate": 9.639532095006113e-07, - "loss": 0.6357, - "step": 61583 - }, - { - "epoch": 1.58, - "learning_rate": 9.639255570434558e-07, - "loss": 0.7324, - "step": 61584 - }, - { - "epoch": 1.58, - "learning_rate": 9.638979046139206e-07, - "loss": 0.7715, - "step": 61585 - }, - { - "epoch": 1.58, - "learning_rate": 9.638702522120273e-07, - "loss": 0.7334, - "step": 61586 - }, - { - "epoch": 1.58, - "learning_rate": 9.638425998377967e-07, - "loss": 0.668, - "step": 61587 - }, - { - "epoch": 1.58, - "learning_rate": 9.638149474912504e-07, - "loss": 0.4666, - "step": 61588 - }, - { - "epoch": 1.58, - "learning_rate": 9.63787295172409e-07, - "loss": 0.4268, - "step": 61589 - }, - { - "epoch": 1.58, - "learning_rate": 9.637596428812943e-07, - "loss": 0.5122, - "step": 61590 - }, - { - "epoch": 1.58, - "learning_rate": 9.637319906179275e-07, - "loss": 0.7166, - "step": 61591 - }, - { - "epoch": 1.58, - "learning_rate": 9.63704338382329e-07, - "loss": 0.5332, - "step": 61592 - }, - { - "epoch": 1.58, - "learning_rate": 9.636766861745205e-07, - "loss": 0.7178, - "step": 61593 - }, - { - "epoch": 1.58, - "learning_rate": 9.636490339945228e-07, - "loss": 0.6064, - "step": 61594 - }, - { - "epoch": 1.58, - "learning_rate": 9.636213818423577e-07, - "loss": 0.7207, - "step": 61595 - }, - { - "epoch": 1.58, - "learning_rate": 9.635937297180461e-07, - "loss": 0.791, - "step": 61596 - }, - { - "epoch": 1.58, - "learning_rate": 9.635660776216087e-07, - "loss": 0.7354, - "step": 61597 - }, - { - "epoch": 1.58, - "learning_rate": 9.635384255530675e-07, - "loss": 0.585, - "step": 61598 - }, - { - "epoch": 1.58, - "learning_rate": 9.63510773512443e-07, - "loss": 0.4575, - "step": 61599 - }, - { - "epoch": 1.58, - "learning_rate": 9.634831214997567e-07, - "loss": 0.5488, - "step": 61600 - }, - { - "epoch": 1.58, - "learning_rate": 9.6345546951503e-07, - "loss": 0.5718, - "step": 61601 - }, - { - "epoch": 1.58, - "learning_rate": 9.634278175582834e-07, - "loss": 0.7061, - "step": 61602 - }, - { - "epoch": 1.58, - "learning_rate": 9.634001656295386e-07, - "loss": 0.6543, - "step": 61603 - }, - { - "epoch": 1.58, - "learning_rate": 9.633725137288165e-07, - "loss": 0.6357, - "step": 61604 - }, - { - "epoch": 1.58, - "learning_rate": 9.633448618561383e-07, - "loss": 0.3599, - "step": 61605 - }, - { - "epoch": 1.58, - "learning_rate": 9.633172100115253e-07, - "loss": 0.6982, - "step": 61606 - }, - { - "epoch": 1.58, - "learning_rate": 9.632895581949988e-07, - "loss": 0.6558, - "step": 61607 - }, - { - "epoch": 1.58, - "learning_rate": 9.632619064065795e-07, - "loss": 0.5283, - "step": 61608 - }, - { - "epoch": 1.58, - "learning_rate": 9.632342546462892e-07, - "loss": 0.583, - "step": 61609 - }, - { - "epoch": 1.58, - "learning_rate": 9.632066029141484e-07, - "loss": 0.626, - "step": 61610 - }, - { - "epoch": 1.58, - "learning_rate": 9.63178951210179e-07, - "loss": 0.7715, - "step": 61611 - }, - { - "epoch": 1.58, - "learning_rate": 9.631512995344018e-07, - "loss": 0.6133, - "step": 61612 - }, - { - "epoch": 1.58, - "learning_rate": 9.631236478868378e-07, - "loss": 0.603, - "step": 61613 - }, - { - "epoch": 1.58, - "learning_rate": 9.63095996267508e-07, - "loss": 0.624, - "step": 61614 - }, - { - "epoch": 1.58, - "learning_rate": 9.630683446764345e-07, - "loss": 0.5068, - "step": 61615 - }, - { - "epoch": 1.58, - "learning_rate": 9.630406931136374e-07, - "loss": 0.748, - "step": 61616 - }, - { - "epoch": 1.58, - "learning_rate": 9.630130415791386e-07, - "loss": 0.7637, - "step": 61617 - }, - { - "epoch": 1.58, - "learning_rate": 9.629853900729586e-07, - "loss": 0.5967, - "step": 61618 - }, - { - "epoch": 1.58, - "learning_rate": 9.629577385951194e-07, - "loss": 0.6772, - "step": 61619 - }, - { - "epoch": 1.58, - "learning_rate": 9.629300871456415e-07, - "loss": 0.7686, - "step": 61620 - }, - { - "epoch": 1.58, - "learning_rate": 9.629024357245469e-07, - "loss": 0.708, - "step": 61621 - }, - { - "epoch": 1.58, - "learning_rate": 9.628747843318558e-07, - "loss": 0.5854, - "step": 61622 - }, - { - "epoch": 1.58, - "learning_rate": 9.628471329675897e-07, - "loss": 0.6411, - "step": 61623 - }, - { - "epoch": 1.58, - "learning_rate": 9.628194816317699e-07, - "loss": 0.7197, - "step": 61624 - }, - { - "epoch": 1.58, - "learning_rate": 9.627918303244171e-07, - "loss": 0.6763, - "step": 61625 - }, - { - "epoch": 1.58, - "learning_rate": 9.627641790455535e-07, - "loss": 0.449, - "step": 61626 - }, - { - "epoch": 1.58, - "learning_rate": 9.627365277951994e-07, - "loss": 0.666, - "step": 61627 - }, - { - "epoch": 1.58, - "learning_rate": 9.627088765733762e-07, - "loss": 0.6499, - "step": 61628 - }, - { - "epoch": 1.58, - "learning_rate": 9.62681225380105e-07, - "loss": 0.625, - "step": 61629 - }, - { - "epoch": 1.58, - "learning_rate": 9.626535742154073e-07, - "loss": 0.7422, - "step": 61630 - }, - { - "epoch": 1.58, - "learning_rate": 9.626259230793043e-07, - "loss": 0.6523, - "step": 61631 - }, - { - "epoch": 1.58, - "learning_rate": 9.625982719718167e-07, - "loss": 0.7988, - "step": 61632 - }, - { - "epoch": 1.58, - "learning_rate": 9.625706208929657e-07, - "loss": 0.668, - "step": 61633 - }, - { - "epoch": 1.58, - "learning_rate": 9.625429698427728e-07, - "loss": 0.7236, - "step": 61634 - }, - { - "epoch": 1.58, - "learning_rate": 9.625153188212588e-07, - "loss": 0.8213, - "step": 61635 - }, - { - "epoch": 1.58, - "learning_rate": 9.624876678284452e-07, - "loss": 0.6543, - "step": 61636 - }, - { - "epoch": 1.58, - "learning_rate": 9.62460016864353e-07, - "loss": 0.6577, - "step": 61637 - }, - { - "epoch": 1.58, - "learning_rate": 9.624323659290036e-07, - "loss": 0.4976, - "step": 61638 - }, - { - "epoch": 1.58, - "learning_rate": 9.62404715022418e-07, - "loss": 0.6416, - "step": 61639 - }, - { - "epoch": 1.58, - "learning_rate": 9.623770641446172e-07, - "loss": 0.493, - "step": 61640 - }, - { - "epoch": 1.58, - "learning_rate": 9.62349413295623e-07, - "loss": 0.5718, - "step": 61641 - }, - { - "epoch": 1.58, - "learning_rate": 9.623217624754557e-07, - "loss": 0.5129, - "step": 61642 - }, - { - "epoch": 1.58, - "learning_rate": 9.622941116841373e-07, - "loss": 0.6313, - "step": 61643 - }, - { - "epoch": 1.58, - "learning_rate": 9.62266460921688e-07, - "loss": 0.6543, - "step": 61644 - }, - { - "epoch": 1.58, - "learning_rate": 9.622388101881299e-07, - "loss": 0.6338, - "step": 61645 - }, - { - "epoch": 1.58, - "learning_rate": 9.622111594834837e-07, - "loss": 0.4424, - "step": 61646 - }, - { - "epoch": 1.58, - "learning_rate": 9.621835088077706e-07, - "loss": 0.7803, - "step": 61647 - }, - { - "epoch": 1.58, - "learning_rate": 9.62155858161012e-07, - "loss": 0.6421, - "step": 61648 - }, - { - "epoch": 1.58, - "learning_rate": 9.621282075432287e-07, - "loss": 0.5938, - "step": 61649 - }, - { - "epoch": 1.58, - "learning_rate": 9.621005569544424e-07, - "loss": 0.5356, - "step": 61650 - }, - { - "epoch": 1.58, - "learning_rate": 9.620729063946742e-07, - "loss": 0.6865, - "step": 61651 - }, - { - "epoch": 1.58, - "learning_rate": 9.620452558639444e-07, - "loss": 0.7227, - "step": 61652 - }, - { - "epoch": 1.58, - "learning_rate": 9.620176053622752e-07, - "loss": 0.6963, - "step": 61653 - }, - { - "epoch": 1.58, - "learning_rate": 9.61989954889687e-07, - "loss": 0.626, - "step": 61654 - }, - { - "epoch": 1.58, - "learning_rate": 9.619623044462018e-07, - "loss": 0.552, - "step": 61655 - }, - { - "epoch": 1.58, - "learning_rate": 9.619346540318397e-07, - "loss": 0.6086, - "step": 61656 - }, - { - "epoch": 1.58, - "learning_rate": 9.619070036466232e-07, - "loss": 0.6138, - "step": 61657 - }, - { - "epoch": 1.58, - "learning_rate": 9.618793532905723e-07, - "loss": 0.6689, - "step": 61658 - }, - { - "epoch": 1.58, - "learning_rate": 9.618517029637088e-07, - "loss": 0.3191, - "step": 61659 - }, - { - "epoch": 1.58, - "learning_rate": 9.618240526660534e-07, - "loss": 0.708, - "step": 61660 - }, - { - "epoch": 1.58, - "learning_rate": 9.61796402397628e-07, - "loss": 0.5283, - "step": 61661 - }, - { - "epoch": 1.58, - "learning_rate": 9.617687521584534e-07, - "loss": 0.7788, - "step": 61662 - }, - { - "epoch": 1.58, - "learning_rate": 9.617411019485502e-07, - "loss": 0.5762, - "step": 61663 - }, - { - "epoch": 1.58, - "learning_rate": 9.617134517679404e-07, - "loss": 0.5405, - "step": 61664 - }, - { - "epoch": 1.58, - "learning_rate": 9.616858016166447e-07, - "loss": 0.6821, - "step": 61665 - }, - { - "epoch": 1.58, - "learning_rate": 9.616581514946846e-07, - "loss": 0.7852, - "step": 61666 - }, - { - "epoch": 1.58, - "learning_rate": 9.616305014020809e-07, - "loss": 0.7432, - "step": 61667 - }, - { - "epoch": 1.58, - "learning_rate": 9.61602851338855e-07, - "loss": 0.5564, - "step": 61668 - }, - { - "epoch": 1.58, - "learning_rate": 9.615752013050284e-07, - "loss": 0.5366, - "step": 61669 - }, - { - "epoch": 1.58, - "learning_rate": 9.615475513006214e-07, - "loss": 0.5908, - "step": 61670 - }, - { - "epoch": 1.58, - "learning_rate": 9.615199013256561e-07, - "loss": 0.5171, - "step": 61671 - }, - { - "epoch": 1.58, - "learning_rate": 9.61492251380153e-07, - "loss": 0.6504, - "step": 61672 - }, - { - "epoch": 1.58, - "learning_rate": 9.614646014641334e-07, - "loss": 0.5913, - "step": 61673 - }, - { - "epoch": 1.58, - "learning_rate": 9.614369515776188e-07, - "loss": 0.5981, - "step": 61674 - }, - { - "epoch": 1.58, - "learning_rate": 9.6140930172063e-07, - "loss": 0.7939, - "step": 61675 - }, - { - "epoch": 1.58, - "learning_rate": 9.613816518931885e-07, - "loss": 0.5391, - "step": 61676 - }, - { - "epoch": 1.58, - "learning_rate": 9.61354002095315e-07, - "loss": 0.5908, - "step": 61677 - }, - { - "epoch": 1.58, - "learning_rate": 9.613263523270313e-07, - "loss": 0.7393, - "step": 61678 - }, - { - "epoch": 1.58, - "learning_rate": 9.612987025883577e-07, - "loss": 0.6558, - "step": 61679 - }, - { - "epoch": 1.58, - "learning_rate": 9.612710528793164e-07, - "loss": 0.5732, - "step": 61680 - }, - { - "epoch": 1.58, - "learning_rate": 9.612434031999282e-07, - "loss": 0.4714, - "step": 61681 - }, - { - "epoch": 1.58, - "learning_rate": 9.612157535502138e-07, - "loss": 0.6475, - "step": 61682 - }, - { - "epoch": 1.58, - "learning_rate": 9.611881039301948e-07, - "loss": 0.6528, - "step": 61683 - }, - { - "epoch": 1.58, - "learning_rate": 9.611604543398922e-07, - "loss": 0.6367, - "step": 61684 - }, - { - "epoch": 1.58, - "learning_rate": 9.611328047793275e-07, - "loss": 0.6543, - "step": 61685 - }, - { - "epoch": 1.58, - "learning_rate": 9.611051552485215e-07, - "loss": 0.7236, - "step": 61686 - }, - { - "epoch": 1.58, - "learning_rate": 9.610775057474954e-07, - "loss": 0.6006, - "step": 61687 - }, - { - "epoch": 1.58, - "learning_rate": 9.610498562762706e-07, - "loss": 0.7607, - "step": 61688 - }, - { - "epoch": 1.58, - "learning_rate": 9.61022206834868e-07, - "loss": 0.5713, - "step": 61689 - }, - { - "epoch": 1.58, - "learning_rate": 9.60994557423309e-07, - "loss": 0.7646, - "step": 61690 - }, - { - "epoch": 1.58, - "learning_rate": 9.609669080416147e-07, - "loss": 0.6387, - "step": 61691 - }, - { - "epoch": 1.58, - "learning_rate": 9.609392586898061e-07, - "loss": 0.3875, - "step": 61692 - }, - { - "epoch": 1.58, - "learning_rate": 9.609116093679048e-07, - "loss": 0.6592, - "step": 61693 - }, - { - "epoch": 1.58, - "learning_rate": 9.608839600759312e-07, - "loss": 0.5747, - "step": 61694 - }, - { - "epoch": 1.58, - "learning_rate": 9.608563108139073e-07, - "loss": 0.6855, - "step": 61695 - }, - { - "epoch": 1.58, - "learning_rate": 9.60828661581854e-07, - "loss": 0.4943, - "step": 61696 - }, - { - "epoch": 1.58, - "learning_rate": 9.608010123797923e-07, - "loss": 0.5142, - "step": 61697 - }, - { - "epoch": 1.58, - "learning_rate": 9.60773363207743e-07, - "loss": 0.6509, - "step": 61698 - }, - { - "epoch": 1.58, - "learning_rate": 9.607457140657283e-07, - "loss": 0.7314, - "step": 61699 - }, - { - "epoch": 1.58, - "learning_rate": 9.607180649537685e-07, - "loss": 0.8223, - "step": 61700 - }, - { - "epoch": 1.58, - "learning_rate": 9.606904158718856e-07, - "loss": 0.6401, - "step": 61701 - }, - { - "epoch": 1.58, - "learning_rate": 9.606627668200998e-07, - "loss": 0.6157, - "step": 61702 - }, - { - "epoch": 1.58, - "learning_rate": 9.60635117798433e-07, - "loss": 0.5398, - "step": 61703 - }, - { - "epoch": 1.58, - "learning_rate": 9.606074688069058e-07, - "loss": 0.4568, - "step": 61704 - }, - { - "epoch": 1.58, - "learning_rate": 9.605798198455395e-07, - "loss": 0.7295, - "step": 61705 - }, - { - "epoch": 1.58, - "learning_rate": 9.605521709143556e-07, - "loss": 0.6626, - "step": 61706 - }, - { - "epoch": 1.58, - "learning_rate": 9.605245220133753e-07, - "loss": 0.6523, - "step": 61707 - }, - { - "epoch": 1.58, - "learning_rate": 9.604968731426191e-07, - "loss": 0.625, - "step": 61708 - }, - { - "epoch": 1.58, - "learning_rate": 9.60469224302109e-07, - "loss": 0.6641, - "step": 61709 - }, - { - "epoch": 1.58, - "learning_rate": 9.604415754918656e-07, - "loss": 0.699, - "step": 61710 - }, - { - "epoch": 1.58, - "learning_rate": 9.604139267119105e-07, - "loss": 0.6641, - "step": 61711 - }, - { - "epoch": 1.58, - "learning_rate": 9.603862779622646e-07, - "loss": 0.6709, - "step": 61712 - }, - { - "epoch": 1.58, - "learning_rate": 9.603586292429489e-07, - "loss": 0.5723, - "step": 61713 - }, - { - "epoch": 1.58, - "learning_rate": 9.60330980553985e-07, - "loss": 0.5786, - "step": 61714 - }, - { - "epoch": 1.58, - "learning_rate": 9.603033318953935e-07, - "loss": 0.5415, - "step": 61715 - }, - { - "epoch": 1.58, - "learning_rate": 9.602756832671963e-07, - "loss": 0.5161, - "step": 61716 - }, - { - "epoch": 1.58, - "learning_rate": 9.602480346694136e-07, - "loss": 0.7588, - "step": 61717 - }, - { - "epoch": 1.58, - "learning_rate": 9.602203861020679e-07, - "loss": 0.616, - "step": 61718 - }, - { - "epoch": 1.58, - "learning_rate": 9.60192737565179e-07, - "loss": 0.6826, - "step": 61719 - }, - { - "epoch": 1.58, - "learning_rate": 9.60165089058769e-07, - "loss": 0.4333, - "step": 61720 - }, - { - "epoch": 1.58, - "learning_rate": 9.601374405828593e-07, - "loss": 0.7559, - "step": 61721 - }, - { - "epoch": 1.58, - "learning_rate": 9.6010979213747e-07, - "loss": 0.6172, - "step": 61722 - }, - { - "epoch": 1.58, - "learning_rate": 9.600821437226225e-07, - "loss": 0.6594, - "step": 61723 - }, - { - "epoch": 1.58, - "learning_rate": 9.600544953383385e-07, - "loss": 0.4338, - "step": 61724 - }, - { - "epoch": 1.58, - "learning_rate": 9.60026846984639e-07, - "loss": 0.7109, - "step": 61725 - }, - { - "epoch": 1.58, - "learning_rate": 9.599991986615452e-07, - "loss": 0.5352, - "step": 61726 - }, - { - "epoch": 1.58, - "learning_rate": 9.59971550369078e-07, - "loss": 0.6411, - "step": 61727 - }, - { - "epoch": 1.58, - "learning_rate": 9.599439021072586e-07, - "loss": 0.7729, - "step": 61728 - }, - { - "epoch": 1.58, - "learning_rate": 9.599162538761085e-07, - "loss": 0.4937, - "step": 61729 - }, - { - "epoch": 1.58, - "learning_rate": 9.598886056756487e-07, - "loss": 0.7261, - "step": 61730 - }, - { - "epoch": 1.58, - "learning_rate": 9.598609575059006e-07, - "loss": 0.407, - "step": 61731 - }, - { - "epoch": 1.58, - "learning_rate": 9.598333093668846e-07, - "loss": 0.5642, - "step": 61732 - }, - { - "epoch": 1.58, - "learning_rate": 9.598056612586229e-07, - "loss": 0.6699, - "step": 61733 - }, - { - "epoch": 1.58, - "learning_rate": 9.597780131811357e-07, - "loss": 0.5316, - "step": 61734 - }, - { - "epoch": 1.58, - "learning_rate": 9.597503651344448e-07, - "loss": 0.6543, - "step": 61735 - }, - { - "epoch": 1.58, - "learning_rate": 9.59722717118571e-07, - "loss": 0.6758, - "step": 61736 - }, - { - "epoch": 1.58, - "learning_rate": 9.596950691335361e-07, - "loss": 0.6465, - "step": 61737 - }, - { - "epoch": 1.58, - "learning_rate": 9.596674211793605e-07, - "loss": 0.7178, - "step": 61738 - }, - { - "epoch": 1.58, - "learning_rate": 9.59639773256066e-07, - "loss": 0.4648, - "step": 61739 - }, - { - "epoch": 1.58, - "learning_rate": 9.596121253636729e-07, - "loss": 0.6577, - "step": 61740 - }, - { - "epoch": 1.58, - "learning_rate": 9.59584477502204e-07, - "loss": 0.6787, - "step": 61741 - }, - { - "epoch": 1.58, - "learning_rate": 9.595568296716786e-07, - "loss": 0.5386, - "step": 61742 - }, - { - "epoch": 1.58, - "learning_rate": 9.595291818721188e-07, - "loss": 0.7666, - "step": 61743 - }, - { - "epoch": 1.58, - "learning_rate": 9.595015341035455e-07, - "loss": 0.5469, - "step": 61744 - }, - { - "epoch": 1.58, - "learning_rate": 9.594738863659803e-07, - "loss": 0.4487, - "step": 61745 - }, - { - "epoch": 1.58, - "learning_rate": 9.594462386594438e-07, - "loss": 0.5015, - "step": 61746 - }, - { - "epoch": 1.58, - "learning_rate": 9.594185909839577e-07, - "loss": 0.7354, - "step": 61747 - }, - { - "epoch": 1.58, - "learning_rate": 9.593909433395426e-07, - "loss": 0.5073, - "step": 61748 - }, - { - "epoch": 1.58, - "learning_rate": 9.593632957262202e-07, - "loss": 0.6333, - "step": 61749 - }, - { - "epoch": 1.58, - "learning_rate": 9.593356481440115e-07, - "loss": 0.6377, - "step": 61750 - }, - { - "epoch": 1.58, - "learning_rate": 9.593080005929378e-07, - "loss": 0.551, - "step": 61751 - }, - { - "epoch": 1.58, - "learning_rate": 9.5928035307302e-07, - "loss": 0.7295, - "step": 61752 - }, - { - "epoch": 1.58, - "learning_rate": 9.59252705584279e-07, - "loss": 0.7734, - "step": 61753 - }, - { - "epoch": 1.58, - "learning_rate": 9.592250581267368e-07, - "loss": 0.5841, - "step": 61754 - }, - { - "epoch": 1.58, - "learning_rate": 9.591974107004136e-07, - "loss": 0.8115, - "step": 61755 - }, - { - "epoch": 1.58, - "learning_rate": 9.591697633053314e-07, - "loss": 0.6025, - "step": 61756 - }, - { - "epoch": 1.58, - "learning_rate": 9.591421159415108e-07, - "loss": 0.6475, - "step": 61757 - }, - { - "epoch": 1.58, - "learning_rate": 9.591144686089735e-07, - "loss": 0.6084, - "step": 61758 - }, - { - "epoch": 1.58, - "learning_rate": 9.590868213077404e-07, - "loss": 0.8398, - "step": 61759 - }, - { - "epoch": 1.58, - "learning_rate": 9.590591740378327e-07, - "loss": 0.7686, - "step": 61760 - }, - { - "epoch": 1.58, - "learning_rate": 9.590315267992712e-07, - "loss": 0.7637, - "step": 61761 - }, - { - "epoch": 1.58, - "learning_rate": 9.590038795920776e-07, - "loss": 0.5205, - "step": 61762 - }, - { - "epoch": 1.58, - "learning_rate": 9.589762324162725e-07, - "loss": 0.6836, - "step": 61763 - }, - { - "epoch": 1.58, - "learning_rate": 9.589485852718777e-07, - "loss": 0.5947, - "step": 61764 - }, - { - "epoch": 1.58, - "learning_rate": 9.58920938158914e-07, - "loss": 0.6777, - "step": 61765 - }, - { - "epoch": 1.58, - "learning_rate": 9.588932910774027e-07, - "loss": 0.6719, - "step": 61766 - }, - { - "epoch": 1.58, - "learning_rate": 9.588656440273646e-07, - "loss": 0.6113, - "step": 61767 - }, - { - "epoch": 1.58, - "learning_rate": 9.588379970088215e-07, - "loss": 0.5601, - "step": 61768 - }, - { - "epoch": 1.58, - "learning_rate": 9.58810350021794e-07, - "loss": 0.5659, - "step": 61769 - }, - { - "epoch": 1.58, - "learning_rate": 9.587827030663041e-07, - "loss": 0.6865, - "step": 61770 - }, - { - "epoch": 1.58, - "learning_rate": 9.587550561423721e-07, - "loss": 0.7402, - "step": 61771 - }, - { - "epoch": 1.58, - "learning_rate": 9.587274092500192e-07, - "loss": 0.603, - "step": 61772 - }, - { - "epoch": 1.58, - "learning_rate": 9.586997623892671e-07, - "loss": 0.7227, - "step": 61773 - }, - { - "epoch": 1.58, - "learning_rate": 9.586721155601363e-07, - "loss": 0.6846, - "step": 61774 - }, - { - "epoch": 1.58, - "learning_rate": 9.586444687626487e-07, - "loss": 0.5178, - "step": 61775 - }, - { - "epoch": 1.58, - "learning_rate": 9.586168219968254e-07, - "loss": 0.5518, - "step": 61776 - }, - { - "epoch": 1.58, - "learning_rate": 9.585891752626868e-07, - "loss": 0.7695, - "step": 61777 - }, - { - "epoch": 1.58, - "learning_rate": 9.585615285602547e-07, - "loss": 0.4602, - "step": 61778 - }, - { - "epoch": 1.58, - "learning_rate": 9.585338818895502e-07, - "loss": 0.6343, - "step": 61779 - }, - { - "epoch": 1.58, - "learning_rate": 9.585062352505946e-07, - "loss": 0.624, - "step": 61780 - }, - { - "epoch": 1.58, - "learning_rate": 9.584785886434086e-07, - "loss": 0.6294, - "step": 61781 - }, - { - "epoch": 1.58, - "learning_rate": 9.584509420680135e-07, - "loss": 0.6719, - "step": 61782 - }, - { - "epoch": 1.58, - "learning_rate": 9.58423295524431e-07, - "loss": 0.7002, - "step": 61783 - }, - { - "epoch": 1.58, - "learning_rate": 9.583956490126814e-07, - "loss": 0.5298, - "step": 61784 - }, - { - "epoch": 1.58, - "learning_rate": 9.583680025327867e-07, - "loss": 0.7588, - "step": 61785 - }, - { - "epoch": 1.58, - "learning_rate": 9.583403560847675e-07, - "loss": 0.4594, - "step": 61786 - }, - { - "epoch": 1.58, - "learning_rate": 9.583127096686453e-07, - "loss": 0.5571, - "step": 61787 - }, - { - "epoch": 1.58, - "learning_rate": 9.58285063284441e-07, - "loss": 0.6982, - "step": 61788 - }, - { - "epoch": 1.58, - "learning_rate": 9.582574169321762e-07, - "loss": 0.5469, - "step": 61789 - }, - { - "epoch": 1.58, - "learning_rate": 9.582297706118718e-07, - "loss": 0.6074, - "step": 61790 - }, - { - "epoch": 1.58, - "learning_rate": 9.582021243235487e-07, - "loss": 0.6289, - "step": 61791 - }, - { - "epoch": 1.58, - "learning_rate": 9.581744780672283e-07, - "loss": 0.7227, - "step": 61792 - }, - { - "epoch": 1.58, - "learning_rate": 9.58146831842932e-07, - "loss": 0.6914, - "step": 61793 - }, - { - "epoch": 1.58, - "learning_rate": 9.581191856506803e-07, - "loss": 0.7246, - "step": 61794 - }, - { - "epoch": 1.58, - "learning_rate": 9.580915394904953e-07, - "loss": 0.7705, - "step": 61795 - }, - { - "epoch": 1.58, - "learning_rate": 9.580638933623973e-07, - "loss": 0.5115, - "step": 61796 - }, - { - "epoch": 1.58, - "learning_rate": 9.58036247266408e-07, - "loss": 0.5595, - "step": 61797 - }, - { - "epoch": 1.58, - "learning_rate": 9.580086012025484e-07, - "loss": 0.6753, - "step": 61798 - }, - { - "epoch": 1.58, - "learning_rate": 9.579809551708398e-07, - "loss": 0.6929, - "step": 61799 - }, - { - "epoch": 1.58, - "learning_rate": 9.579533091713034e-07, - "loss": 0.5366, - "step": 61800 - }, - { - "epoch": 1.58, - "learning_rate": 9.579256632039598e-07, - "loss": 0.7832, - "step": 61801 - }, - { - "epoch": 1.58, - "learning_rate": 9.57898017268831e-07, - "loss": 0.5342, - "step": 61802 - }, - { - "epoch": 1.58, - "learning_rate": 9.578703713659372e-07, - "loss": 0.6895, - "step": 61803 - }, - { - "epoch": 1.58, - "learning_rate": 9.578427254953007e-07, - "loss": 0.751, - "step": 61804 - }, - { - "epoch": 1.58, - "learning_rate": 9.578150796569417e-07, - "loss": 0.8105, - "step": 61805 - }, - { - "epoch": 1.58, - "learning_rate": 9.577874338508819e-07, - "loss": 0.7588, - "step": 61806 - }, - { - "epoch": 1.58, - "learning_rate": 9.57759788077142e-07, - "loss": 0.7549, - "step": 61807 - }, - { - "epoch": 1.58, - "learning_rate": 9.57732142335744e-07, - "loss": 0.6409, - "step": 61808 - }, - { - "epoch": 1.58, - "learning_rate": 9.577044966267082e-07, - "loss": 0.877, - "step": 61809 - }, - { - "epoch": 1.58, - "learning_rate": 9.576768509500568e-07, - "loss": 0.7119, - "step": 61810 - }, - { - "epoch": 1.58, - "learning_rate": 9.576492053058096e-07, - "loss": 0.6133, - "step": 61811 - }, - { - "epoch": 1.58, - "learning_rate": 9.576215596939888e-07, - "loss": 0.5669, - "step": 61812 - }, - { - "epoch": 1.58, - "learning_rate": 9.575939141146147e-07, - "loss": 0.7559, - "step": 61813 - }, - { - "epoch": 1.58, - "learning_rate": 9.575662685677094e-07, - "loss": 0.7998, - "step": 61814 - }, - { - "epoch": 1.58, - "learning_rate": 9.575386230532936e-07, - "loss": 0.791, - "step": 61815 - }, - { - "epoch": 1.58, - "learning_rate": 9.575109775713886e-07, - "loss": 0.5601, - "step": 61816 - }, - { - "epoch": 1.58, - "learning_rate": 9.574833321220151e-07, - "loss": 0.6387, - "step": 61817 - }, - { - "epoch": 1.58, - "learning_rate": 9.57455686705195e-07, - "loss": 0.4011, - "step": 61818 - }, - { - "epoch": 1.58, - "learning_rate": 9.57428041320949e-07, - "loss": 0.5176, - "step": 61819 - }, - { - "epoch": 1.58, - "learning_rate": 9.57400395969299e-07, - "loss": 0.6084, - "step": 61820 - }, - { - "epoch": 1.58, - "learning_rate": 9.573727506502648e-07, - "loss": 0.4901, - "step": 61821 - }, - { - "epoch": 1.58, - "learning_rate": 9.573451053638686e-07, - "loss": 0.6396, - "step": 61822 - }, - { - "epoch": 1.58, - "learning_rate": 9.573174601101312e-07, - "loss": 0.4089, - "step": 61823 - }, - { - "epoch": 1.58, - "learning_rate": 9.57289814889074e-07, - "loss": 0.6084, - "step": 61824 - }, - { - "epoch": 1.58, - "learning_rate": 9.572621697007178e-07, - "loss": 0.6411, - "step": 61825 - }, - { - "epoch": 1.58, - "learning_rate": 9.572345245450841e-07, - "loss": 0.7266, - "step": 61826 - }, - { - "epoch": 1.58, - "learning_rate": 9.57206879422194e-07, - "loss": 0.6025, - "step": 61827 - }, - { - "epoch": 1.58, - "learning_rate": 9.571792343320684e-07, - "loss": 0.7378, - "step": 61828 - }, - { - "epoch": 1.58, - "learning_rate": 9.57151589274729e-07, - "loss": 0.6797, - "step": 61829 - }, - { - "epoch": 1.58, - "learning_rate": 9.57123944250197e-07, - "loss": 0.5596, - "step": 61830 - }, - { - "epoch": 1.58, - "learning_rate": 9.570962992584928e-07, - "loss": 0.6904, - "step": 61831 - }, - { - "epoch": 1.58, - "learning_rate": 9.570686542996378e-07, - "loss": 0.5645, - "step": 61832 - }, - { - "epoch": 1.58, - "learning_rate": 9.570410093736537e-07, - "loss": 0.572, - "step": 61833 - }, - { - "epoch": 1.58, - "learning_rate": 9.570133644805609e-07, - "loss": 0.5603, - "step": 61834 - }, - { - "epoch": 1.58, - "learning_rate": 9.569857196203814e-07, - "loss": 0.5615, - "step": 61835 - }, - { - "epoch": 1.58, - "learning_rate": 9.569580747931357e-07, - "loss": 0.7715, - "step": 61836 - }, - { - "epoch": 1.58, - "learning_rate": 9.569304299988452e-07, - "loss": 0.5496, - "step": 61837 - }, - { - "epoch": 1.58, - "learning_rate": 9.56902785237531e-07, - "loss": 0.5205, - "step": 61838 - }, - { - "epoch": 1.58, - "learning_rate": 9.568751405092147e-07, - "loss": 0.6841, - "step": 61839 - }, - { - "epoch": 1.58, - "learning_rate": 9.568474958139173e-07, - "loss": 0.793, - "step": 61840 - }, - { - "epoch": 1.59, - "learning_rate": 9.568198511516593e-07, - "loss": 0.606, - "step": 61841 - }, - { - "epoch": 1.59, - "learning_rate": 9.567922065224628e-07, - "loss": 0.6963, - "step": 61842 - }, - { - "epoch": 1.59, - "learning_rate": 9.56764561926348e-07, - "loss": 0.6299, - "step": 61843 - }, - { - "epoch": 1.59, - "learning_rate": 9.56736917363337e-07, - "loss": 0.7305, - "step": 61844 - }, - { - "epoch": 1.59, - "learning_rate": 9.567092728334502e-07, - "loss": 0.665, - "step": 61845 - }, - { - "epoch": 1.59, - "learning_rate": 9.566816283367093e-07, - "loss": 0.5249, - "step": 61846 - }, - { - "epoch": 1.59, - "learning_rate": 9.566539838731352e-07, - "loss": 0.4888, - "step": 61847 - }, - { - "epoch": 1.59, - "learning_rate": 9.566263394427494e-07, - "loss": 0.5615, - "step": 61848 - }, - { - "epoch": 1.59, - "learning_rate": 9.565986950455726e-07, - "loss": 0.5494, - "step": 61849 - }, - { - "epoch": 1.59, - "learning_rate": 9.565710506816268e-07, - "loss": 0.4373, - "step": 61850 - }, - { - "epoch": 1.59, - "learning_rate": 9.565434063509317e-07, - "loss": 0.8018, - "step": 61851 - }, - { - "epoch": 1.59, - "learning_rate": 9.565157620535097e-07, - "loss": 0.3726, - "step": 61852 - }, - { - "epoch": 1.59, - "learning_rate": 9.564881177893814e-07, - "loss": 0.5945, - "step": 61853 - }, - { - "epoch": 1.59, - "learning_rate": 9.564604735585682e-07, - "loss": 0.6575, - "step": 61854 - }, - { - "epoch": 1.59, - "learning_rate": 9.564328293610912e-07, - "loss": 0.6228, - "step": 61855 - }, - { - "epoch": 1.59, - "learning_rate": 9.564051851969717e-07, - "loss": 0.6484, - "step": 61856 - }, - { - "epoch": 1.59, - "learning_rate": 9.563775410662304e-07, - "loss": 0.79, - "step": 61857 - }, - { - "epoch": 1.59, - "learning_rate": 9.563498969688894e-07, - "loss": 0.6689, - "step": 61858 - }, - { - "epoch": 1.59, - "learning_rate": 9.563222529049686e-07, - "loss": 0.6902, - "step": 61859 - }, - { - "epoch": 1.59, - "learning_rate": 9.562946088744906e-07, - "loss": 0.6621, - "step": 61860 - }, - { - "epoch": 1.59, - "learning_rate": 9.562669648774754e-07, - "loss": 0.6572, - "step": 61861 - }, - { - "epoch": 1.59, - "learning_rate": 9.562393209139445e-07, - "loss": 0.8711, - "step": 61862 - }, - { - "epoch": 1.59, - "learning_rate": 9.562116769839195e-07, - "loss": 0.6069, - "step": 61863 - }, - { - "epoch": 1.59, - "learning_rate": 9.561840330874206e-07, - "loss": 0.6543, - "step": 61864 - }, - { - "epoch": 1.59, - "learning_rate": 9.5615638922447e-07, - "loss": 0.7744, - "step": 61865 - }, - { - "epoch": 1.59, - "learning_rate": 9.561287453950884e-07, - "loss": 0.533, - "step": 61866 - }, - { - "epoch": 1.59, - "learning_rate": 9.56101101599297e-07, - "loss": 0.6519, - "step": 61867 - }, - { - "epoch": 1.59, - "learning_rate": 9.56073457837117e-07, - "loss": 0.5522, - "step": 61868 - }, - { - "epoch": 1.59, - "learning_rate": 9.560458141085693e-07, - "loss": 0.6201, - "step": 61869 - }, - { - "epoch": 1.59, - "learning_rate": 9.560181704136755e-07, - "loss": 0.6836, - "step": 61870 - }, - { - "epoch": 1.59, - "learning_rate": 9.559905267524568e-07, - "loss": 0.6719, - "step": 61871 - }, - { - "epoch": 1.59, - "learning_rate": 9.559628831249337e-07, - "loss": 0.6816, - "step": 61872 - }, - { - "epoch": 1.59, - "learning_rate": 9.55935239531128e-07, - "loss": 0.5591, - "step": 61873 - }, - { - "epoch": 1.59, - "learning_rate": 9.559075959710603e-07, - "loss": 0.4646, - "step": 61874 - }, - { - "epoch": 1.59, - "learning_rate": 9.558799524447526e-07, - "loss": 0.6104, - "step": 61875 - }, - { - "epoch": 1.59, - "learning_rate": 9.558523089522254e-07, - "loss": 0.668, - "step": 61876 - }, - { - "epoch": 1.59, - "learning_rate": 9.558246654935e-07, - "loss": 0.6963, - "step": 61877 - }, - { - "epoch": 1.59, - "learning_rate": 9.557970220685976e-07, - "loss": 0.7432, - "step": 61878 - }, - { - "epoch": 1.59, - "learning_rate": 9.557693786775397e-07, - "loss": 0.541, - "step": 61879 - }, - { - "epoch": 1.59, - "learning_rate": 9.557417353203471e-07, - "loss": 0.6079, - "step": 61880 - }, - { - "epoch": 1.59, - "learning_rate": 9.557140919970408e-07, - "loss": 0.4531, - "step": 61881 - }, - { - "epoch": 1.59, - "learning_rate": 9.556864487076422e-07, - "loss": 0.6499, - "step": 61882 - }, - { - "epoch": 1.59, - "learning_rate": 9.556588054521726e-07, - "loss": 0.5444, - "step": 61883 - }, - { - "epoch": 1.59, - "learning_rate": 9.556311622306528e-07, - "loss": 0.6714, - "step": 61884 - }, - { - "epoch": 1.59, - "learning_rate": 9.556035190431044e-07, - "loss": 0.5049, - "step": 61885 - }, - { - "epoch": 1.59, - "learning_rate": 9.555758758895481e-07, - "loss": 0.7695, - "step": 61886 - }, - { - "epoch": 1.59, - "learning_rate": 9.555482327700053e-07, - "loss": 0.4585, - "step": 61887 - }, - { - "epoch": 1.59, - "learning_rate": 9.555205896844973e-07, - "loss": 0.748, - "step": 61888 - }, - { - "epoch": 1.59, - "learning_rate": 9.554929466330454e-07, - "loss": 0.7432, - "step": 61889 - }, - { - "epoch": 1.59, - "learning_rate": 9.554653036156704e-07, - "loss": 0.6494, - "step": 61890 - }, - { - "epoch": 1.59, - "learning_rate": 9.554376606323933e-07, - "loss": 0.4958, - "step": 61891 - }, - { - "epoch": 1.59, - "learning_rate": 9.554100176832356e-07, - "loss": 0.6357, - "step": 61892 - }, - { - "epoch": 1.59, - "learning_rate": 9.553823747682184e-07, - "loss": 0.7529, - "step": 61893 - }, - { - "epoch": 1.59, - "learning_rate": 9.55354731887363e-07, - "loss": 0.7178, - "step": 61894 - }, - { - "epoch": 1.59, - "learning_rate": 9.553270890406903e-07, - "loss": 0.4391, - "step": 61895 - }, - { - "epoch": 1.59, - "learning_rate": 9.552994462282217e-07, - "loss": 0.7012, - "step": 61896 - }, - { - "epoch": 1.59, - "learning_rate": 9.55271803449978e-07, - "loss": 0.5161, - "step": 61897 - }, - { - "epoch": 1.59, - "learning_rate": 9.552441607059809e-07, - "loss": 0.6562, - "step": 61898 - }, - { - "epoch": 1.59, - "learning_rate": 9.55216517996251e-07, - "loss": 0.6904, - "step": 61899 - }, - { - "epoch": 1.59, - "learning_rate": 9.551888753208105e-07, - "loss": 0.5854, - "step": 61900 - }, - { - "epoch": 1.59, - "learning_rate": 9.55161232679679e-07, - "loss": 0.6338, - "step": 61901 - }, - { - "epoch": 1.59, - "learning_rate": 9.55133590072879e-07, - "loss": 0.5752, - "step": 61902 - }, - { - "epoch": 1.59, - "learning_rate": 9.55105947500431e-07, - "loss": 0.583, - "step": 61903 - }, - { - "epoch": 1.59, - "learning_rate": 9.55078304962356e-07, - "loss": 0.6204, - "step": 61904 - }, - { - "epoch": 1.59, - "learning_rate": 9.550506624586757e-07, - "loss": 0.7412, - "step": 61905 - }, - { - "epoch": 1.59, - "learning_rate": 9.55023019989411e-07, - "loss": 0.6504, - "step": 61906 - }, - { - "epoch": 1.59, - "learning_rate": 9.549953775545832e-07, - "loss": 0.7695, - "step": 61907 - }, - { - "epoch": 1.59, - "learning_rate": 9.549677351542133e-07, - "loss": 0.5449, - "step": 61908 - }, - { - "epoch": 1.59, - "learning_rate": 9.549400927883225e-07, - "loss": 0.4722, - "step": 61909 - }, - { - "epoch": 1.59, - "learning_rate": 9.549124504569321e-07, - "loss": 0.5757, - "step": 61910 - }, - { - "epoch": 1.59, - "learning_rate": 9.548848081600633e-07, - "loss": 0.7598, - "step": 61911 - }, - { - "epoch": 1.59, - "learning_rate": 9.548571658977369e-07, - "loss": 0.5757, - "step": 61912 - }, - { - "epoch": 1.59, - "learning_rate": 9.548295236699745e-07, - "loss": 0.6338, - "step": 61913 - }, - { - "epoch": 1.59, - "learning_rate": 9.548018814767966e-07, - "loss": 0.4045, - "step": 61914 - }, - { - "epoch": 1.59, - "learning_rate": 9.547742393182252e-07, - "loss": 0.5967, - "step": 61915 - }, - { - "epoch": 1.59, - "learning_rate": 9.547465971942809e-07, - "loss": 0.7109, - "step": 61916 - }, - { - "epoch": 1.59, - "learning_rate": 9.547189551049853e-07, - "loss": 0.7559, - "step": 61917 - }, - { - "epoch": 1.59, - "learning_rate": 9.54691313050359e-07, - "loss": 0.5425, - "step": 61918 - }, - { - "epoch": 1.59, - "learning_rate": 9.546636710304237e-07, - "loss": 0.6348, - "step": 61919 - }, - { - "epoch": 1.59, - "learning_rate": 9.546360290452005e-07, - "loss": 0.667, - "step": 61920 - }, - { - "epoch": 1.59, - "learning_rate": 9.546083870947103e-07, - "loss": 0.5874, - "step": 61921 - }, - { - "epoch": 1.59, - "learning_rate": 9.545807451789741e-07, - "loss": 0.6689, - "step": 61922 - }, - { - "epoch": 1.59, - "learning_rate": 9.545531032980135e-07, - "loss": 0.6738, - "step": 61923 - }, - { - "epoch": 1.59, - "learning_rate": 9.545254614518494e-07, - "loss": 0.6274, - "step": 61924 - }, - { - "epoch": 1.59, - "learning_rate": 9.544978196405032e-07, - "loss": 0.5903, - "step": 61925 - }, - { - "epoch": 1.59, - "learning_rate": 9.544701778639957e-07, - "loss": 0.772, - "step": 61926 - }, - { - "epoch": 1.59, - "learning_rate": 9.544425361223487e-07, - "loss": 0.5024, - "step": 61927 - }, - { - "epoch": 1.59, - "learning_rate": 9.544148944155825e-07, - "loss": 0.6436, - "step": 61928 - }, - { - "epoch": 1.59, - "learning_rate": 9.54387252743719e-07, - "loss": 0.4553, - "step": 61929 - }, - { - "epoch": 1.59, - "learning_rate": 9.543596111067794e-07, - "loss": 0.751, - "step": 61930 - }, - { - "epoch": 1.59, - "learning_rate": 9.54331969504784e-07, - "loss": 0.6943, - "step": 61931 - }, - { - "epoch": 1.59, - "learning_rate": 9.543043279377549e-07, - "loss": 0.6914, - "step": 61932 - }, - { - "epoch": 1.59, - "learning_rate": 9.542766864057125e-07, - "loss": 0.8125, - "step": 61933 - }, - { - "epoch": 1.59, - "learning_rate": 9.542490449086785e-07, - "loss": 0.5635, - "step": 61934 - }, - { - "epoch": 1.59, - "learning_rate": 9.542214034466739e-07, - "loss": 0.8135, - "step": 61935 - }, - { - "epoch": 1.59, - "learning_rate": 9.541937620197197e-07, - "loss": 0.6279, - "step": 61936 - }, - { - "epoch": 1.59, - "learning_rate": 9.541661206278374e-07, - "loss": 0.6494, - "step": 61937 - }, - { - "epoch": 1.59, - "learning_rate": 9.54138479271048e-07, - "loss": 0.707, - "step": 61938 - }, - { - "epoch": 1.59, - "learning_rate": 9.541108379493727e-07, - "loss": 0.6792, - "step": 61939 - }, - { - "epoch": 1.59, - "learning_rate": 9.54083196662833e-07, - "loss": 0.5474, - "step": 61940 - }, - { - "epoch": 1.59, - "learning_rate": 9.540555554114491e-07, - "loss": 0.5957, - "step": 61941 - }, - { - "epoch": 1.59, - "learning_rate": 9.54027914195243e-07, - "loss": 0.5557, - "step": 61942 - }, - { - "epoch": 1.59, - "learning_rate": 9.540002730142354e-07, - "loss": 0.6719, - "step": 61943 - }, - { - "epoch": 1.59, - "learning_rate": 9.539726318684479e-07, - "loss": 0.5684, - "step": 61944 - }, - { - "epoch": 1.59, - "learning_rate": 9.539449907579012e-07, - "loss": 0.5581, - "step": 61945 - }, - { - "epoch": 1.59, - "learning_rate": 9.539173496826169e-07, - "loss": 0.4077, - "step": 61946 - }, - { - "epoch": 1.59, - "learning_rate": 9.538897086426158e-07, - "loss": 0.6055, - "step": 61947 - }, - { - "epoch": 1.59, - "learning_rate": 9.538620676379194e-07, - "loss": 0.7637, - "step": 61948 - }, - { - "epoch": 1.59, - "learning_rate": 9.538344266685483e-07, - "loss": 0.7617, - "step": 61949 - }, - { - "epoch": 1.59, - "learning_rate": 9.538067857345248e-07, - "loss": 0.5361, - "step": 61950 - }, - { - "epoch": 1.59, - "learning_rate": 9.537791448358689e-07, - "loss": 0.7031, - "step": 61951 - }, - { - "epoch": 1.59, - "learning_rate": 9.537515039726022e-07, - "loss": 0.6865, - "step": 61952 - }, - { - "epoch": 1.59, - "learning_rate": 9.537238631447458e-07, - "loss": 0.8125, - "step": 61953 - }, - { - "epoch": 1.59, - "learning_rate": 9.536962223523207e-07, - "loss": 0.5786, - "step": 61954 - }, - { - "epoch": 1.59, - "learning_rate": 9.536685815953488e-07, - "loss": 0.7129, - "step": 61955 - }, - { - "epoch": 1.59, - "learning_rate": 9.536409408738505e-07, - "loss": 0.6855, - "step": 61956 - }, - { - "epoch": 1.59, - "learning_rate": 9.536133001878471e-07, - "loss": 0.7051, - "step": 61957 - }, - { - "epoch": 1.59, - "learning_rate": 9.5358565953736e-07, - "loss": 0.7417, - "step": 61958 - }, - { - "epoch": 1.59, - "learning_rate": 9.535580189224099e-07, - "loss": 0.439, - "step": 61959 - }, - { - "epoch": 1.59, - "learning_rate": 9.535303783430188e-07, - "loss": 0.522, - "step": 61960 - }, - { - "epoch": 1.59, - "learning_rate": 9.535027377992072e-07, - "loss": 0.636, - "step": 61961 - }, - { - "epoch": 1.59, - "learning_rate": 9.534750972909962e-07, - "loss": 0.6343, - "step": 61962 - }, - { - "epoch": 1.59, - "learning_rate": 9.534474568184073e-07, - "loss": 0.5181, - "step": 61963 - }, - { - "epoch": 1.59, - "learning_rate": 9.534198163814614e-07, - "loss": 0.4386, - "step": 61964 - }, - { - "epoch": 1.59, - "learning_rate": 9.533921759801801e-07, - "loss": 0.7871, - "step": 61965 - }, - { - "epoch": 1.59, - "learning_rate": 9.53364535614584e-07, - "loss": 0.6021, - "step": 61966 - }, - { - "epoch": 1.59, - "learning_rate": 9.533368952846946e-07, - "loss": 0.7139, - "step": 61967 - }, - { - "epoch": 1.59, - "learning_rate": 9.53309254990533e-07, - "loss": 0.8203, - "step": 61968 - }, - { - "epoch": 1.59, - "learning_rate": 9.532816147321203e-07, - "loss": 0.7188, - "step": 61969 - }, - { - "epoch": 1.59, - "learning_rate": 9.532539745094782e-07, - "loss": 0.5815, - "step": 61970 - }, - { - "epoch": 1.59, - "learning_rate": 9.532263343226268e-07, - "loss": 0.7373, - "step": 61971 - }, - { - "epoch": 1.59, - "learning_rate": 9.531986941715882e-07, - "loss": 0.5698, - "step": 61972 - }, - { - "epoch": 1.59, - "learning_rate": 9.53171054056383e-07, - "loss": 0.6641, - "step": 61973 - }, - { - "epoch": 1.59, - "learning_rate": 9.531434139770325e-07, - "loss": 0.6514, - "step": 61974 - }, - { - "epoch": 1.59, - "learning_rate": 9.531157739335582e-07, - "loss": 0.6436, - "step": 61975 - }, - { - "epoch": 1.59, - "learning_rate": 9.530881339259806e-07, - "loss": 0.7969, - "step": 61976 - }, - { - "epoch": 1.59, - "learning_rate": 9.530604939543215e-07, - "loss": 0.7363, - "step": 61977 - }, - { - "epoch": 1.59, - "learning_rate": 9.530328540186018e-07, - "loss": 0.605, - "step": 61978 - }, - { - "epoch": 1.59, - "learning_rate": 9.530052141188427e-07, - "loss": 0.6494, - "step": 61979 - }, - { - "epoch": 1.59, - "learning_rate": 9.529775742550656e-07, - "loss": 0.7627, - "step": 61980 - }, - { - "epoch": 1.59, - "learning_rate": 9.529499344272911e-07, - "loss": 0.5078, - "step": 61981 - }, - { - "epoch": 1.59, - "learning_rate": 9.529222946355408e-07, - "loss": 0.4312, - "step": 61982 - }, - { - "epoch": 1.59, - "learning_rate": 9.528946548798356e-07, - "loss": 0.6235, - "step": 61983 - }, - { - "epoch": 1.59, - "learning_rate": 9.528670151601968e-07, - "loss": 0.8359, - "step": 61984 - }, - { - "epoch": 1.59, - "learning_rate": 9.528393754766455e-07, - "loss": 0.7617, - "step": 61985 - }, - { - "epoch": 1.59, - "learning_rate": 9.528117358292031e-07, - "loss": 0.4795, - "step": 61986 - }, - { - "epoch": 1.59, - "learning_rate": 9.527840962178904e-07, - "loss": 0.6157, - "step": 61987 - }, - { - "epoch": 1.59, - "learning_rate": 9.527564566427289e-07, - "loss": 0.5508, - "step": 61988 - }, - { - "epoch": 1.59, - "learning_rate": 9.527288171037395e-07, - "loss": 0.6047, - "step": 61989 - }, - { - "epoch": 1.59, - "learning_rate": 9.527011776009441e-07, - "loss": 0.752, - "step": 61990 - }, - { - "epoch": 1.59, - "learning_rate": 9.526735381343624e-07, - "loss": 0.5918, - "step": 61991 - }, - { - "epoch": 1.59, - "learning_rate": 9.526458987040169e-07, - "loss": 0.6865, - "step": 61992 - }, - { - "epoch": 1.59, - "learning_rate": 9.526182593099279e-07, - "loss": 0.6367, - "step": 61993 - }, - { - "epoch": 1.59, - "learning_rate": 9.525906199521171e-07, - "loss": 0.667, - "step": 61994 - }, - { - "epoch": 1.59, - "learning_rate": 9.525629806306053e-07, - "loss": 0.6484, - "step": 61995 - }, - { - "epoch": 1.59, - "learning_rate": 9.525353413454141e-07, - "loss": 0.5154, - "step": 61996 - }, - { - "epoch": 1.59, - "learning_rate": 9.525077020965641e-07, - "loss": 0.5786, - "step": 61997 - }, - { - "epoch": 1.59, - "learning_rate": 9.52480062884077e-07, - "loss": 0.4736, - "step": 61998 - }, - { - "epoch": 1.59, - "learning_rate": 9.524524237079736e-07, - "loss": 0.624, - "step": 61999 - }, - { - "epoch": 1.59, - "learning_rate": 9.524247845682756e-07, - "loss": 0.604, - "step": 62000 - }, - { - "epoch": 1.59, - "learning_rate": 9.523971454650035e-07, - "loss": 0.7588, - "step": 62001 - }, - { - "epoch": 1.59, - "learning_rate": 9.523695063981784e-07, - "loss": 0.6621, - "step": 62002 - }, - { - "epoch": 1.59, - "learning_rate": 9.523418673678222e-07, - "loss": 0.3718, - "step": 62003 - }, - { - "epoch": 1.59, - "learning_rate": 9.523142283739553e-07, - "loss": 0.4351, - "step": 62004 - }, - { - "epoch": 1.59, - "learning_rate": 9.522865894165994e-07, - "loss": 0.5708, - "step": 62005 - }, - { - "epoch": 1.59, - "learning_rate": 9.522589504957754e-07, - "loss": 0.626, - "step": 62006 - }, - { - "epoch": 1.59, - "learning_rate": 9.522313116115046e-07, - "loss": 0.6748, - "step": 62007 - }, - { - "epoch": 1.59, - "learning_rate": 9.52203672763808e-07, - "loss": 0.5635, - "step": 62008 - }, - { - "epoch": 1.59, - "learning_rate": 9.521760339527069e-07, - "loss": 0.5776, - "step": 62009 - }, - { - "epoch": 1.59, - "learning_rate": 9.521483951782228e-07, - "loss": 0.5581, - "step": 62010 - }, - { - "epoch": 1.59, - "learning_rate": 9.521207564403761e-07, - "loss": 0.7393, - "step": 62011 - }, - { - "epoch": 1.59, - "learning_rate": 9.520931177391883e-07, - "loss": 0.5786, - "step": 62012 - }, - { - "epoch": 1.59, - "learning_rate": 9.520654790746806e-07, - "loss": 0.8105, - "step": 62013 - }, - { - "epoch": 1.59, - "learning_rate": 9.52037840446874e-07, - "loss": 0.6504, - "step": 62014 - }, - { - "epoch": 1.59, - "learning_rate": 9.520102018557902e-07, - "loss": 0.5103, - "step": 62015 - }, - { - "epoch": 1.59, - "learning_rate": 9.519825633014495e-07, - "loss": 0.7295, - "step": 62016 - }, - { - "epoch": 1.59, - "learning_rate": 9.51954924783874e-07, - "loss": 0.7275, - "step": 62017 - }, - { - "epoch": 1.59, - "learning_rate": 9.519272863030841e-07, - "loss": 0.7217, - "step": 62018 - }, - { - "epoch": 1.59, - "learning_rate": 9.518996478591015e-07, - "loss": 0.4031, - "step": 62019 - }, - { - "epoch": 1.59, - "learning_rate": 9.518720094519472e-07, - "loss": 0.4856, - "step": 62020 - }, - { - "epoch": 1.59, - "learning_rate": 9.518443710816421e-07, - "loss": 0.5181, - "step": 62021 - }, - { - "epoch": 1.59, - "learning_rate": 9.518167327482077e-07, - "loss": 0.7529, - "step": 62022 - }, - { - "epoch": 1.59, - "learning_rate": 9.517890944516646e-07, - "loss": 0.6865, - "step": 62023 - }, - { - "epoch": 1.59, - "learning_rate": 9.517614561920347e-07, - "loss": 0.752, - "step": 62024 - }, - { - "epoch": 1.59, - "learning_rate": 9.517338179693387e-07, - "loss": 0.7417, - "step": 62025 - }, - { - "epoch": 1.59, - "learning_rate": 9.51706179783598e-07, - "loss": 0.6826, - "step": 62026 - }, - { - "epoch": 1.59, - "learning_rate": 9.516785416348335e-07, - "loss": 0.6216, - "step": 62027 - }, - { - "epoch": 1.59, - "learning_rate": 9.516509035230668e-07, - "loss": 0.6602, - "step": 62028 - }, - { - "epoch": 1.59, - "learning_rate": 9.516232654483187e-07, - "loss": 0.5713, - "step": 62029 - }, - { - "epoch": 1.59, - "learning_rate": 9.515956274106107e-07, - "loss": 0.7285, - "step": 62030 - }, - { - "epoch": 1.59, - "learning_rate": 9.515679894099633e-07, - "loss": 0.5693, - "step": 62031 - }, - { - "epoch": 1.59, - "learning_rate": 9.515403514463982e-07, - "loss": 0.5225, - "step": 62032 - }, - { - "epoch": 1.59, - "learning_rate": 9.515127135199362e-07, - "loss": 0.7168, - "step": 62033 - }, - { - "epoch": 1.59, - "learning_rate": 9.51485075630599e-07, - "loss": 0.5249, - "step": 62034 - }, - { - "epoch": 1.59, - "learning_rate": 9.514574377784072e-07, - "loss": 0.4597, - "step": 62035 - }, - { - "epoch": 1.59, - "learning_rate": 9.514297999633822e-07, - "loss": 0.665, - "step": 62036 - }, - { - "epoch": 1.59, - "learning_rate": 9.514021621855452e-07, - "loss": 0.4883, - "step": 62037 - }, - { - "epoch": 1.59, - "learning_rate": 9.513745244449175e-07, - "loss": 0.6348, - "step": 62038 - }, - { - "epoch": 1.59, - "learning_rate": 9.513468867415199e-07, - "loss": 0.6064, - "step": 62039 - }, - { - "epoch": 1.59, - "learning_rate": 9.513192490753741e-07, - "loss": 0.4253, - "step": 62040 - }, - { - "epoch": 1.59, - "learning_rate": 9.512916114465009e-07, - "loss": 0.7183, - "step": 62041 - }, - { - "epoch": 1.59, - "learning_rate": 9.51263973854921e-07, - "loss": 0.5698, - "step": 62042 - }, - { - "epoch": 1.59, - "learning_rate": 9.512363363006563e-07, - "loss": 0.6777, - "step": 62043 - }, - { - "epoch": 1.59, - "learning_rate": 9.512086987837276e-07, - "loss": 0.7793, - "step": 62044 - }, - { - "epoch": 1.59, - "learning_rate": 9.511810613041562e-07, - "loss": 0.7285, - "step": 62045 - }, - { - "epoch": 1.59, - "learning_rate": 9.511534238619634e-07, - "loss": 0.6299, - "step": 62046 - }, - { - "epoch": 1.59, - "learning_rate": 9.511257864571699e-07, - "loss": 0.7017, - "step": 62047 - }, - { - "epoch": 1.59, - "learning_rate": 9.510981490897973e-07, - "loss": 0.6729, - "step": 62048 - }, - { - "epoch": 1.59, - "learning_rate": 9.510705117598664e-07, - "loss": 0.644, - "step": 62049 - }, - { - "epoch": 1.59, - "learning_rate": 9.510428744673991e-07, - "loss": 0.4419, - "step": 62050 - }, - { - "epoch": 1.59, - "learning_rate": 9.510152372124156e-07, - "loss": 0.5234, - "step": 62051 - }, - { - "epoch": 1.59, - "learning_rate": 9.509875999949374e-07, - "loss": 0.4214, - "step": 62052 - }, - { - "epoch": 1.59, - "learning_rate": 9.509599628149859e-07, - "loss": 0.7002, - "step": 62053 - }, - { - "epoch": 1.59, - "learning_rate": 9.50932325672582e-07, - "loss": 0.7891, - "step": 62054 - }, - { - "epoch": 1.59, - "learning_rate": 9.509046885677471e-07, - "loss": 0.6855, - "step": 62055 - }, - { - "epoch": 1.59, - "learning_rate": 9.508770515005019e-07, - "loss": 0.5908, - "step": 62056 - }, - { - "epoch": 1.59, - "learning_rate": 9.508494144708683e-07, - "loss": 0.6172, - "step": 62057 - }, - { - "epoch": 1.59, - "learning_rate": 9.508217774788667e-07, - "loss": 0.8174, - "step": 62058 - }, - { - "epoch": 1.59, - "learning_rate": 9.50794140524519e-07, - "loss": 0.6216, - "step": 62059 - }, - { - "epoch": 1.59, - "learning_rate": 9.507665036078458e-07, - "loss": 0.7432, - "step": 62060 - }, - { - "epoch": 1.59, - "learning_rate": 9.507388667288683e-07, - "loss": 0.6499, - "step": 62061 - }, - { - "epoch": 1.59, - "learning_rate": 9.507112298876079e-07, - "loss": 0.657, - "step": 62062 - }, - { - "epoch": 1.59, - "learning_rate": 9.506835930840856e-07, - "loss": 0.6641, - "step": 62063 - }, - { - "epoch": 1.59, - "learning_rate": 9.506559563183226e-07, - "loss": 0.7412, - "step": 62064 - }, - { - "epoch": 1.59, - "learning_rate": 9.506283195903401e-07, - "loss": 0.6216, - "step": 62065 - }, - { - "epoch": 1.59, - "learning_rate": 9.506006829001591e-07, - "loss": 0.7539, - "step": 62066 - }, - { - "epoch": 1.59, - "learning_rate": 9.50573046247801e-07, - "loss": 0.7598, - "step": 62067 - }, - { - "epoch": 1.59, - "learning_rate": 9.505454096332866e-07, - "loss": 0.4873, - "step": 62068 - }, - { - "epoch": 1.59, - "learning_rate": 9.505177730566378e-07, - "loss": 0.5879, - "step": 62069 - }, - { - "epoch": 1.59, - "learning_rate": 9.504901365178751e-07, - "loss": 0.7422, - "step": 62070 - }, - { - "epoch": 1.59, - "learning_rate": 9.504625000170195e-07, - "loss": 0.6348, - "step": 62071 - }, - { - "epoch": 1.59, - "learning_rate": 9.504348635540928e-07, - "loss": 0.7539, - "step": 62072 - }, - { - "epoch": 1.59, - "learning_rate": 9.504072271291157e-07, - "loss": 0.4907, - "step": 62073 - }, - { - "epoch": 1.59, - "learning_rate": 9.503795907421096e-07, - "loss": 0.6641, - "step": 62074 - }, - { - "epoch": 1.59, - "learning_rate": 9.503519543930953e-07, - "loss": 0.5186, - "step": 62075 - }, - { - "epoch": 1.59, - "learning_rate": 9.503243180820946e-07, - "loss": 0.876, - "step": 62076 - }, - { - "epoch": 1.59, - "learning_rate": 9.502966818091281e-07, - "loss": 0.5786, - "step": 62077 - }, - { - "epoch": 1.59, - "learning_rate": 9.502690455742172e-07, - "loss": 0.5942, - "step": 62078 - }, - { - "epoch": 1.59, - "learning_rate": 9.502414093773832e-07, - "loss": 0.5503, - "step": 62079 - }, - { - "epoch": 1.59, - "learning_rate": 9.502137732186467e-07, - "loss": 0.4368, - "step": 62080 - }, - { - "epoch": 1.59, - "learning_rate": 9.501861370980295e-07, - "loss": 0.6499, - "step": 62081 - }, - { - "epoch": 1.59, - "learning_rate": 9.501585010155524e-07, - "loss": 0.5222, - "step": 62082 - }, - { - "epoch": 1.59, - "learning_rate": 9.501308649712365e-07, - "loss": 0.5591, - "step": 62083 - }, - { - "epoch": 1.59, - "learning_rate": 9.501032289651033e-07, - "loss": 0.5967, - "step": 62084 - }, - { - "epoch": 1.59, - "learning_rate": 9.500755929971734e-07, - "loss": 0.8379, - "step": 62085 - }, - { - "epoch": 1.59, - "learning_rate": 9.500479570674687e-07, - "loss": 0.7114, - "step": 62086 - }, - { - "epoch": 1.59, - "learning_rate": 9.500203211760099e-07, - "loss": 0.7212, - "step": 62087 - }, - { - "epoch": 1.59, - "learning_rate": 9.499926853228182e-07, - "loss": 0.6475, - "step": 62088 - }, - { - "epoch": 1.59, - "learning_rate": 9.499650495079151e-07, - "loss": 0.6152, - "step": 62089 - }, - { - "epoch": 1.59, - "learning_rate": 9.499374137313209e-07, - "loss": 0.7656, - "step": 62090 - }, - { - "epoch": 1.59, - "learning_rate": 9.499097779930578e-07, - "loss": 0.604, - "step": 62091 - }, - { - "epoch": 1.59, - "learning_rate": 9.498821422931462e-07, - "loss": 0.5112, - "step": 62092 - }, - { - "epoch": 1.59, - "learning_rate": 9.498545066316076e-07, - "loss": 0.5586, - "step": 62093 - }, - { - "epoch": 1.59, - "learning_rate": 9.498268710084631e-07, - "loss": 0.4924, - "step": 62094 - }, - { - "epoch": 1.59, - "learning_rate": 9.497992354237338e-07, - "loss": 0.5645, - "step": 62095 - }, - { - "epoch": 1.59, - "learning_rate": 9.497715998774409e-07, - "loss": 0.6113, - "step": 62096 - }, - { - "epoch": 1.59, - "learning_rate": 9.497439643696057e-07, - "loss": 0.6035, - "step": 62097 - }, - { - "epoch": 1.59, - "learning_rate": 9.497163289002491e-07, - "loss": 0.7219, - "step": 62098 - }, - { - "epoch": 1.59, - "learning_rate": 9.49688693469393e-07, - "loss": 0.7056, - "step": 62099 - }, - { - "epoch": 1.59, - "learning_rate": 9.496610580770573e-07, - "loss": 0.8398, - "step": 62100 - }, - { - "epoch": 1.59, - "learning_rate": 9.496334227232641e-07, - "loss": 0.4678, - "step": 62101 - }, - { - "epoch": 1.59, - "learning_rate": 9.496057874080339e-07, - "loss": 0.6689, - "step": 62102 - }, - { - "epoch": 1.59, - "learning_rate": 9.495781521313886e-07, - "loss": 0.7041, - "step": 62103 - }, - { - "epoch": 1.59, - "learning_rate": 9.495505168933487e-07, - "loss": 0.5391, - "step": 62104 - }, - { - "epoch": 1.59, - "learning_rate": 9.495228816939359e-07, - "loss": 0.6069, - "step": 62105 - }, - { - "epoch": 1.59, - "learning_rate": 9.494952465331708e-07, - "loss": 0.6572, - "step": 62106 - }, - { - "epoch": 1.59, - "learning_rate": 9.494676114110753e-07, - "loss": 0.6106, - "step": 62107 - }, - { - "epoch": 1.59, - "learning_rate": 9.494399763276697e-07, - "loss": 0.5853, - "step": 62108 - }, - { - "epoch": 1.59, - "learning_rate": 9.494123412829761e-07, - "loss": 0.5288, - "step": 62109 - }, - { - "epoch": 1.59, - "learning_rate": 9.493847062770148e-07, - "loss": 0.7861, - "step": 62110 - }, - { - "epoch": 1.59, - "learning_rate": 9.493570713098073e-07, - "loss": 0.5864, - "step": 62111 - }, - { - "epoch": 1.59, - "learning_rate": 9.493294363813749e-07, - "loss": 0.6741, - "step": 62112 - }, - { - "epoch": 1.59, - "learning_rate": 9.493018014917383e-07, - "loss": 0.5498, - "step": 62113 - }, - { - "epoch": 1.59, - "learning_rate": 9.492741666409193e-07, - "loss": 0.376, - "step": 62114 - }, - { - "epoch": 1.59, - "learning_rate": 9.492465318289386e-07, - "loss": 0.7656, - "step": 62115 - }, - { - "epoch": 1.59, - "learning_rate": 9.492188970558175e-07, - "loss": 0.666, - "step": 62116 - }, - { - "epoch": 1.59, - "learning_rate": 9.491912623215771e-07, - "loss": 0.6953, - "step": 62117 - }, - { - "epoch": 1.59, - "learning_rate": 9.491636276262388e-07, - "loss": 0.7178, - "step": 62118 - }, - { - "epoch": 1.59, - "learning_rate": 9.491359929698237e-07, - "loss": 0.4448, - "step": 62119 - }, - { - "epoch": 1.59, - "learning_rate": 9.491083583523527e-07, - "loss": 0.7173, - "step": 62120 - }, - { - "epoch": 1.59, - "learning_rate": 9.49080723773847e-07, - "loss": 0.6177, - "step": 62121 - }, - { - "epoch": 1.59, - "learning_rate": 9.490530892343278e-07, - "loss": 0.6191, - "step": 62122 - }, - { - "epoch": 1.59, - "learning_rate": 9.490254547338162e-07, - "loss": 0.425, - "step": 62123 - }, - { - "epoch": 1.59, - "learning_rate": 9.489978202723338e-07, - "loss": 0.5879, - "step": 62124 - }, - { - "epoch": 1.59, - "learning_rate": 9.489701858499011e-07, - "loss": 0.6875, - "step": 62125 - }, - { - "epoch": 1.59, - "learning_rate": 9.489425514665398e-07, - "loss": 0.707, - "step": 62126 - }, - { - "epoch": 1.59, - "learning_rate": 9.489149171222705e-07, - "loss": 0.4863, - "step": 62127 - }, - { - "epoch": 1.59, - "learning_rate": 9.488872828171152e-07, - "loss": 0.7061, - "step": 62128 - }, - { - "epoch": 1.59, - "learning_rate": 9.488596485510945e-07, - "loss": 0.6055, - "step": 62129 - }, - { - "epoch": 1.59, - "learning_rate": 9.488320143242293e-07, - "loss": 0.3149, - "step": 62130 - }, - { - "epoch": 1.59, - "learning_rate": 9.488043801365413e-07, - "loss": 0.6509, - "step": 62131 - }, - { - "epoch": 1.59, - "learning_rate": 9.487767459880513e-07, - "loss": 0.6338, - "step": 62132 - }, - { - "epoch": 1.59, - "learning_rate": 9.487491118787807e-07, - "loss": 0.7109, - "step": 62133 - }, - { - "epoch": 1.59, - "learning_rate": 9.487214778087503e-07, - "loss": 0.5107, - "step": 62134 - }, - { - "epoch": 1.59, - "learning_rate": 9.486938437779818e-07, - "loss": 0.6108, - "step": 62135 - }, - { - "epoch": 1.59, - "learning_rate": 9.486662097864961e-07, - "loss": 0.6392, - "step": 62136 - }, - { - "epoch": 1.59, - "learning_rate": 9.48638575834314e-07, - "loss": 0.6436, - "step": 62137 - }, - { - "epoch": 1.59, - "learning_rate": 9.486109419214572e-07, - "loss": 0.5251, - "step": 62138 - }, - { - "epoch": 1.59, - "learning_rate": 9.485833080479469e-07, - "loss": 0.4761, - "step": 62139 - }, - { - "epoch": 1.59, - "learning_rate": 9.485556742138036e-07, - "loss": 0.6616, - "step": 62140 - }, - { - "epoch": 1.59, - "learning_rate": 9.48528040419049e-07, - "loss": 0.6074, - "step": 62141 - }, - { - "epoch": 1.59, - "learning_rate": 9.485004066637039e-07, - "loss": 0.6045, - "step": 62142 - }, - { - "epoch": 1.59, - "learning_rate": 9.4847277294779e-07, - "loss": 0.6763, - "step": 62143 - }, - { - "epoch": 1.59, - "learning_rate": 9.484451392713278e-07, - "loss": 0.5664, - "step": 62144 - }, - { - "epoch": 1.59, - "learning_rate": 9.48417505634339e-07, - "loss": 0.5552, - "step": 62145 - }, - { - "epoch": 1.59, - "learning_rate": 9.483898720368442e-07, - "loss": 0.7441, - "step": 62146 - }, - { - "epoch": 1.59, - "learning_rate": 9.483622384788654e-07, - "loss": 0.7002, - "step": 62147 - }, - { - "epoch": 1.59, - "learning_rate": 9.483346049604229e-07, - "loss": 0.6262, - "step": 62148 - }, - { - "epoch": 1.59, - "learning_rate": 9.483069714815387e-07, - "loss": 0.5972, - "step": 62149 - }, - { - "epoch": 1.59, - "learning_rate": 9.482793380422332e-07, - "loss": 0.7285, - "step": 62150 - }, - { - "epoch": 1.59, - "learning_rate": 9.482517046425276e-07, - "loss": 0.5947, - "step": 62151 - }, - { - "epoch": 1.59, - "learning_rate": 9.482240712824435e-07, - "loss": 0.6187, - "step": 62152 - }, - { - "epoch": 1.59, - "learning_rate": 9.48196437962002e-07, - "loss": 0.6123, - "step": 62153 - }, - { - "epoch": 1.59, - "learning_rate": 9.481688046812237e-07, - "loss": 0.5947, - "step": 62154 - }, - { - "epoch": 1.59, - "learning_rate": 9.481411714401305e-07, - "loss": 0.6333, - "step": 62155 - }, - { - "epoch": 1.59, - "learning_rate": 9.48113538238743e-07, - "loss": 0.7129, - "step": 62156 - }, - { - "epoch": 1.59, - "learning_rate": 9.480859050770827e-07, - "loss": 0.6699, - "step": 62157 - }, - { - "epoch": 1.59, - "learning_rate": 9.480582719551705e-07, - "loss": 0.8203, - "step": 62158 - }, - { - "epoch": 1.59, - "learning_rate": 9.480306388730281e-07, - "loss": 0.4741, - "step": 62159 - }, - { - "epoch": 1.59, - "learning_rate": 9.480030058306761e-07, - "loss": 0.6353, - "step": 62160 - }, - { - "epoch": 1.59, - "learning_rate": 9.479753728281355e-07, - "loss": 0.5079, - "step": 62161 - }, - { - "epoch": 1.59, - "learning_rate": 9.47947739865428e-07, - "loss": 0.6914, - "step": 62162 - }, - { - "epoch": 1.59, - "learning_rate": 9.479201069425743e-07, - "loss": 0.5161, - "step": 62163 - }, - { - "epoch": 1.59, - "learning_rate": 9.47892474059596e-07, - "loss": 0.6543, - "step": 62164 - }, - { - "epoch": 1.59, - "learning_rate": 9.478648412165139e-07, - "loss": 0.7803, - "step": 62165 - }, - { - "epoch": 1.59, - "learning_rate": 9.478372084133495e-07, - "loss": 0.6807, - "step": 62166 - }, - { - "epoch": 1.59, - "learning_rate": 9.478095756501235e-07, - "loss": 0.7363, - "step": 62167 - }, - { - "epoch": 1.59, - "learning_rate": 9.477819429268574e-07, - "loss": 0.7637, - "step": 62168 - }, - { - "epoch": 1.59, - "learning_rate": 9.477543102435726e-07, - "loss": 0.5029, - "step": 62169 - }, - { - "epoch": 1.59, - "learning_rate": 9.477266776002894e-07, - "loss": 0.6733, - "step": 62170 - }, - { - "epoch": 1.59, - "learning_rate": 9.476990449970297e-07, - "loss": 0.7148, - "step": 62171 - }, - { - "epoch": 1.59, - "learning_rate": 9.476714124338147e-07, - "loss": 0.708, - "step": 62172 - }, - { - "epoch": 1.59, - "learning_rate": 9.476437799106648e-07, - "loss": 0.6548, - "step": 62173 - }, - { - "epoch": 1.59, - "learning_rate": 9.47616147427602e-07, - "loss": 0.79, - "step": 62174 - }, - { - "epoch": 1.59, - "learning_rate": 9.475885149846469e-07, - "loss": 0.5215, - "step": 62175 - }, - { - "epoch": 1.59, - "learning_rate": 9.47560882581821e-07, - "loss": 0.6704, - "step": 62176 - }, - { - "epoch": 1.59, - "learning_rate": 9.47533250219145e-07, - "loss": 0.5735, - "step": 62177 - }, - { - "epoch": 1.59, - "learning_rate": 9.475056178966408e-07, - "loss": 0.5908, - "step": 62178 - }, - { - "epoch": 1.59, - "learning_rate": 9.474779856143292e-07, - "loss": 0.5645, - "step": 62179 - }, - { - "epoch": 1.59, - "learning_rate": 9.47450353372231e-07, - "loss": 0.6006, - "step": 62180 - }, - { - "epoch": 1.59, - "learning_rate": 9.474227211703678e-07, - "loss": 0.6216, - "step": 62181 - }, - { - "epoch": 1.59, - "learning_rate": 9.473950890087604e-07, - "loss": 0.5889, - "step": 62182 - }, - { - "epoch": 1.59, - "learning_rate": 9.473674568874304e-07, - "loss": 0.6094, - "step": 62183 - }, - { - "epoch": 1.59, - "learning_rate": 9.473398248063984e-07, - "loss": 0.6523, - "step": 62184 - }, - { - "epoch": 1.59, - "learning_rate": 9.473121927656862e-07, - "loss": 0.6118, - "step": 62185 - }, - { - "epoch": 1.59, - "learning_rate": 9.472845607653144e-07, - "loss": 0.5469, - "step": 62186 - }, - { - "epoch": 1.59, - "learning_rate": 9.472569288053045e-07, - "loss": 0.5233, - "step": 62187 - }, - { - "epoch": 1.59, - "learning_rate": 9.472292968856774e-07, - "loss": 0.6924, - "step": 62188 - }, - { - "epoch": 1.59, - "learning_rate": 9.47201665006455e-07, - "loss": 0.7363, - "step": 62189 - }, - { - "epoch": 1.59, - "learning_rate": 9.471740331676573e-07, - "loss": 0.6577, - "step": 62190 - }, - { - "epoch": 1.59, - "learning_rate": 9.471464013693062e-07, - "loss": 0.6621, - "step": 62191 - }, - { - "epoch": 1.59, - "learning_rate": 9.471187696114225e-07, - "loss": 0.5979, - "step": 62192 - }, - { - "epoch": 1.59, - "learning_rate": 9.470911378940276e-07, - "loss": 0.6504, - "step": 62193 - }, - { - "epoch": 1.59, - "learning_rate": 9.470635062171425e-07, - "loss": 0.7129, - "step": 62194 - }, - { - "epoch": 1.59, - "learning_rate": 9.470358745807886e-07, - "loss": 0.6553, - "step": 62195 - }, - { - "epoch": 1.59, - "learning_rate": 9.470082429849867e-07, - "loss": 0.7246, - "step": 62196 - }, - { - "epoch": 1.59, - "learning_rate": 9.469806114297583e-07, - "loss": 0.516, - "step": 62197 - }, - { - "epoch": 1.59, - "learning_rate": 9.469529799151243e-07, - "loss": 0.5913, - "step": 62198 - }, - { - "epoch": 1.59, - "learning_rate": 9.469253484411064e-07, - "loss": 0.6587, - "step": 62199 - }, - { - "epoch": 1.59, - "learning_rate": 9.46897717007725e-07, - "loss": 0.7559, - "step": 62200 - }, - { - "epoch": 1.59, - "learning_rate": 9.468700856150014e-07, - "loss": 0.5911, - "step": 62201 - }, - { - "epoch": 1.59, - "learning_rate": 9.468424542629572e-07, - "loss": 0.519, - "step": 62202 - }, - { - "epoch": 1.59, - "learning_rate": 9.46814822951613e-07, - "loss": 0.6729, - "step": 62203 - }, - { - "epoch": 1.59, - "learning_rate": 9.467871916809906e-07, - "loss": 0.6777, - "step": 62204 - }, - { - "epoch": 1.59, - "learning_rate": 9.467595604511104e-07, - "loss": 0.6719, - "step": 62205 - }, - { - "epoch": 1.59, - "learning_rate": 9.467319292619941e-07, - "loss": 0.7734, - "step": 62206 - }, - { - "epoch": 1.59, - "learning_rate": 9.467042981136627e-07, - "loss": 0.6387, - "step": 62207 - }, - { - "epoch": 1.59, - "learning_rate": 9.466766670061375e-07, - "loss": 0.6836, - "step": 62208 - }, - { - "epoch": 1.59, - "learning_rate": 9.466490359394399e-07, - "loss": 0.6221, - "step": 62209 - }, - { - "epoch": 1.59, - "learning_rate": 9.466214049135904e-07, - "loss": 0.8076, - "step": 62210 - }, - { - "epoch": 1.59, - "learning_rate": 9.465937739286101e-07, - "loss": 0.6211, - "step": 62211 - }, - { - "epoch": 1.59, - "learning_rate": 9.465661429845207e-07, - "loss": 0.4642, - "step": 62212 - }, - { - "epoch": 1.59, - "learning_rate": 9.465385120813429e-07, - "loss": 0.6885, - "step": 62213 - }, - { - "epoch": 1.59, - "learning_rate": 9.465108812190985e-07, - "loss": 0.6548, - "step": 62214 - }, - { - "epoch": 1.59, - "learning_rate": 9.464832503978079e-07, - "loss": 0.3291, - "step": 62215 - }, - { - "epoch": 1.59, - "learning_rate": 9.464556196174929e-07, - "loss": 0.5129, - "step": 62216 - }, - { - "epoch": 1.59, - "learning_rate": 9.464279888781741e-07, - "loss": 0.5498, - "step": 62217 - }, - { - "epoch": 1.59, - "learning_rate": 9.464003581798731e-07, - "loss": 0.751, - "step": 62218 - }, - { - "epoch": 1.59, - "learning_rate": 9.463727275226113e-07, - "loss": 0.6016, - "step": 62219 - }, - { - "epoch": 1.59, - "learning_rate": 9.463450969064088e-07, - "loss": 0.6738, - "step": 62220 - }, - { - "epoch": 1.59, - "learning_rate": 9.463174663312878e-07, - "loss": 0.7598, - "step": 62221 - }, - { - "epoch": 1.59, - "learning_rate": 9.462898357972687e-07, - "loss": 0.6841, - "step": 62222 - }, - { - "epoch": 1.59, - "learning_rate": 9.462622053043733e-07, - "loss": 0.5264, - "step": 62223 - }, - { - "epoch": 1.59, - "learning_rate": 9.462345748526222e-07, - "loss": 0.5146, - "step": 62224 - }, - { - "epoch": 1.59, - "learning_rate": 9.46206944442037e-07, - "loss": 0.4814, - "step": 62225 - }, - { - "epoch": 1.59, - "learning_rate": 9.461793140726387e-07, - "loss": 0.7461, - "step": 62226 - }, - { - "epoch": 1.59, - "learning_rate": 9.46151683744448e-07, - "loss": 0.6582, - "step": 62227 - }, - { - "epoch": 1.59, - "learning_rate": 9.46124053457487e-07, - "loss": 0.7559, - "step": 62228 - }, - { - "epoch": 1.59, - "learning_rate": 9.460964232117764e-07, - "loss": 0.5396, - "step": 62229 - }, - { - "epoch": 1.59, - "learning_rate": 9.460687930073369e-07, - "loss": 0.44, - "step": 62230 - }, - { - "epoch": 1.6, - "learning_rate": 9.460411628441904e-07, - "loss": 0.5938, - "step": 62231 - }, - { - "epoch": 1.6, - "learning_rate": 9.460135327223573e-07, - "loss": 0.7402, - "step": 62232 - }, - { - "epoch": 1.6, - "learning_rate": 9.459859026418593e-07, - "loss": 0.4114, - "step": 62233 - }, - { - "epoch": 1.6, - "learning_rate": 9.459582726027174e-07, - "loss": 0.6602, - "step": 62234 - }, - { - "epoch": 1.6, - "learning_rate": 9.459306426049528e-07, - "loss": 0.7427, - "step": 62235 - }, - { - "epoch": 1.6, - "learning_rate": 9.459030126485865e-07, - "loss": 0.6016, - "step": 62236 - }, - { - "epoch": 1.6, - "learning_rate": 9.4587538273364e-07, - "loss": 0.6504, - "step": 62237 - }, - { - "epoch": 1.6, - "learning_rate": 9.458477528601339e-07, - "loss": 0.7285, - "step": 62238 - }, - { - "epoch": 1.6, - "learning_rate": 9.458201230280903e-07, - "loss": 0.5547, - "step": 62239 - }, - { - "epoch": 1.6, - "learning_rate": 9.457924932375295e-07, - "loss": 0.4927, - "step": 62240 - }, - { - "epoch": 1.6, - "learning_rate": 9.457648634884726e-07, - "loss": 0.7529, - "step": 62241 - }, - { - "epoch": 1.6, - "learning_rate": 9.457372337809413e-07, - "loss": 0.5869, - "step": 62242 - }, - { - "epoch": 1.6, - "learning_rate": 9.457096041149562e-07, - "loss": 0.5132, - "step": 62243 - }, - { - "epoch": 1.6, - "learning_rate": 9.456819744905391e-07, - "loss": 0.8008, - "step": 62244 - }, - { - "epoch": 1.6, - "learning_rate": 9.456543449077108e-07, - "loss": 0.7197, - "step": 62245 - }, - { - "epoch": 1.6, - "learning_rate": 9.456267153664922e-07, - "loss": 0.668, - "step": 62246 - }, - { - "epoch": 1.6, - "learning_rate": 9.455990858669049e-07, - "loss": 0.6802, - "step": 62247 - }, - { - "epoch": 1.6, - "learning_rate": 9.455714564089697e-07, - "loss": 0.7568, - "step": 62248 - }, - { - "epoch": 1.6, - "learning_rate": 9.455438269927085e-07, - "loss": 0.5898, - "step": 62249 - }, - { - "epoch": 1.6, - "learning_rate": 9.455161976181415e-07, - "loss": 0.582, - "step": 62250 - }, - { - "epoch": 1.6, - "learning_rate": 9.454885682852901e-07, - "loss": 0.7129, - "step": 62251 - }, - { - "epoch": 1.6, - "learning_rate": 9.454609389941758e-07, - "loss": 0.5752, - "step": 62252 - }, - { - "epoch": 1.6, - "learning_rate": 9.454333097448194e-07, - "loss": 0.7539, - "step": 62253 - }, - { - "epoch": 1.6, - "learning_rate": 9.454056805372423e-07, - "loss": 0.7549, - "step": 62254 - }, - { - "epoch": 1.6, - "learning_rate": 9.453780513714654e-07, - "loss": 0.494, - "step": 62255 - }, - { - "epoch": 1.6, - "learning_rate": 9.453504222475103e-07, - "loss": 0.5854, - "step": 62256 - }, - { - "epoch": 1.6, - "learning_rate": 9.453227931653975e-07, - "loss": 0.5444, - "step": 62257 - }, - { - "epoch": 1.6, - "learning_rate": 9.452951641251489e-07, - "loss": 0.6299, - "step": 62258 - }, - { - "epoch": 1.6, - "learning_rate": 9.452675351267853e-07, - "loss": 0.667, - "step": 62259 - }, - { - "epoch": 1.6, - "learning_rate": 9.452399061703275e-07, - "loss": 0.8516, - "step": 62260 - }, - { - "epoch": 1.6, - "learning_rate": 9.452122772557973e-07, - "loss": 0.9287, - "step": 62261 - }, - { - "epoch": 1.6, - "learning_rate": 9.451846483832155e-07, - "loss": 0.564, - "step": 62262 - }, - { - "epoch": 1.6, - "learning_rate": 9.451570195526029e-07, - "loss": 0.5381, - "step": 62263 - }, - { - "epoch": 1.6, - "learning_rate": 9.451293907639814e-07, - "loss": 0.5542, - "step": 62264 - }, - { - "epoch": 1.6, - "learning_rate": 9.451017620173717e-07, - "loss": 0.5717, - "step": 62265 - }, - { - "epoch": 1.6, - "learning_rate": 9.450741333127951e-07, - "loss": 0.6484, - "step": 62266 - }, - { - "epoch": 1.6, - "learning_rate": 9.450465046502726e-07, - "loss": 0.4825, - "step": 62267 - }, - { - "epoch": 1.6, - "learning_rate": 9.450188760298256e-07, - "loss": 0.6038, - "step": 62268 - }, - { - "epoch": 1.6, - "learning_rate": 9.449912474514754e-07, - "loss": 0.3607, - "step": 62269 - }, - { - "epoch": 1.6, - "learning_rate": 9.449636189152425e-07, - "loss": 0.5649, - "step": 62270 - }, - { - "epoch": 1.6, - "learning_rate": 9.449359904211484e-07, - "loss": 0.6152, - "step": 62271 - }, - { - "epoch": 1.6, - "learning_rate": 9.449083619692143e-07, - "loss": 0.6211, - "step": 62272 - }, - { - "epoch": 1.6, - "learning_rate": 9.448807335594614e-07, - "loss": 0.7266, - "step": 62273 - }, - { - "epoch": 1.6, - "learning_rate": 9.448531051919106e-07, - "loss": 0.5273, - "step": 62274 - }, - { - "epoch": 1.6, - "learning_rate": 9.448254768665836e-07, - "loss": 0.7275, - "step": 62275 - }, - { - "epoch": 1.6, - "learning_rate": 9.447978485835008e-07, - "loss": 0.7976, - "step": 62276 - }, - { - "epoch": 1.6, - "learning_rate": 9.44770220342684e-07, - "loss": 0.8037, - "step": 62277 - }, - { - "epoch": 1.6, - "learning_rate": 9.44742592144154e-07, - "loss": 0.5215, - "step": 62278 - }, - { - "epoch": 1.6, - "learning_rate": 9.447149639879326e-07, - "loss": 0.7197, - "step": 62279 - }, - { - "epoch": 1.6, - "learning_rate": 9.446873358740398e-07, - "loss": 0.4393, - "step": 62280 - }, - { - "epoch": 1.6, - "learning_rate": 9.446597078024976e-07, - "loss": 0.4438, - "step": 62281 - }, - { - "epoch": 1.6, - "learning_rate": 9.446320797733267e-07, - "loss": 0.5527, - "step": 62282 - }, - { - "epoch": 1.6, - "learning_rate": 9.446044517865487e-07, - "loss": 0.6274, - "step": 62283 - }, - { - "epoch": 1.6, - "learning_rate": 9.445768238421841e-07, - "loss": 0.8359, - "step": 62284 - }, - { - "epoch": 1.6, - "learning_rate": 9.445491959402549e-07, - "loss": 0.7295, - "step": 62285 - }, - { - "epoch": 1.6, - "learning_rate": 9.445215680807817e-07, - "loss": 0.7061, - "step": 62286 - }, - { - "epoch": 1.6, - "learning_rate": 9.444939402637858e-07, - "loss": 0.7432, - "step": 62287 - }, - { - "epoch": 1.6, - "learning_rate": 9.444663124892882e-07, - "loss": 0.6855, - "step": 62288 - }, - { - "epoch": 1.6, - "learning_rate": 9.444386847573107e-07, - "loss": 0.457, - "step": 62289 - }, - { - "epoch": 1.6, - "learning_rate": 9.444110570678736e-07, - "loss": 0.6562, - "step": 62290 - }, - { - "epoch": 1.6, - "learning_rate": 9.443834294209983e-07, - "loss": 0.6138, - "step": 62291 - }, - { - "epoch": 1.6, - "learning_rate": 9.443558018167062e-07, - "loss": 0.6313, - "step": 62292 - }, - { - "epoch": 1.6, - "learning_rate": 9.443281742550179e-07, - "loss": 0.4912, - "step": 62293 - }, - { - "epoch": 1.6, - "learning_rate": 9.443005467359555e-07, - "loss": 0.4243, - "step": 62294 - }, - { - "epoch": 1.6, - "learning_rate": 9.442729192595392e-07, - "loss": 0.5923, - "step": 62295 - }, - { - "epoch": 1.6, - "learning_rate": 9.442452918257908e-07, - "loss": 0.4585, - "step": 62296 - }, - { - "epoch": 1.6, - "learning_rate": 9.442176644347311e-07, - "loss": 0.7324, - "step": 62297 - }, - { - "epoch": 1.6, - "learning_rate": 9.441900370863815e-07, - "loss": 0.6387, - "step": 62298 - }, - { - "epoch": 1.6, - "learning_rate": 9.441624097807632e-07, - "loss": 0.6152, - "step": 62299 - }, - { - "epoch": 1.6, - "learning_rate": 9.441347825178972e-07, - "loss": 0.8389, - "step": 62300 - }, - { - "epoch": 1.6, - "learning_rate": 9.441071552978042e-07, - "loss": 0.6826, - "step": 62301 - }, - { - "epoch": 1.6, - "learning_rate": 9.44079528120506e-07, - "loss": 0.687, - "step": 62302 - }, - { - "epoch": 1.6, - "learning_rate": 9.440519009860233e-07, - "loss": 0.6333, - "step": 62303 - }, - { - "epoch": 1.6, - "learning_rate": 9.440242738943778e-07, - "loss": 0.5781, - "step": 62304 - }, - { - "epoch": 1.6, - "learning_rate": 9.4399664684559e-07, - "loss": 0.666, - "step": 62305 - }, - { - "epoch": 1.6, - "learning_rate": 9.439690198396817e-07, - "loss": 0.5825, - "step": 62306 - }, - { - "epoch": 1.6, - "learning_rate": 9.439413928766735e-07, - "loss": 0.666, - "step": 62307 - }, - { - "epoch": 1.6, - "learning_rate": 9.43913765956587e-07, - "loss": 0.6118, - "step": 62308 - }, - { - "epoch": 1.6, - "learning_rate": 9.438861390794434e-07, - "loss": 0.5776, - "step": 62309 - }, - { - "epoch": 1.6, - "learning_rate": 9.438585122452631e-07, - "loss": 0.6328, - "step": 62310 - }, - { - "epoch": 1.6, - "learning_rate": 9.438308854540681e-07, - "loss": 0.4883, - "step": 62311 - }, - { - "epoch": 1.6, - "learning_rate": 9.43803258705879e-07, - "loss": 0.5649, - "step": 62312 - }, - { - "epoch": 1.6, - "learning_rate": 9.437756320007172e-07, - "loss": 0.6807, - "step": 62313 - }, - { - "epoch": 1.6, - "learning_rate": 9.437480053386038e-07, - "loss": 0.4487, - "step": 62314 - }, - { - "epoch": 1.6, - "learning_rate": 9.4372037871956e-07, - "loss": 0.5539, - "step": 62315 - }, - { - "epoch": 1.6, - "learning_rate": 9.43692752143607e-07, - "loss": 0.5591, - "step": 62316 - }, - { - "epoch": 1.6, - "learning_rate": 9.436651256107656e-07, - "loss": 0.7109, - "step": 62317 - }, - { - "epoch": 1.6, - "learning_rate": 9.436374991210575e-07, - "loss": 0.5071, - "step": 62318 - }, - { - "epoch": 1.6, - "learning_rate": 9.436098726745039e-07, - "loss": 0.4346, - "step": 62319 - }, - { - "epoch": 1.6, - "learning_rate": 9.43582246271125e-07, - "loss": 0.6816, - "step": 62320 - }, - { - "epoch": 1.6, - "learning_rate": 9.435546199109428e-07, - "loss": 0.686, - "step": 62321 - }, - { - "epoch": 1.6, - "learning_rate": 9.435269935939782e-07, - "loss": 0.5586, - "step": 62322 - }, - { - "epoch": 1.6, - "learning_rate": 9.434993673202524e-07, - "loss": 0.5476, - "step": 62323 - }, - { - "epoch": 1.6, - "learning_rate": 9.434717410897865e-07, - "loss": 0.5679, - "step": 62324 - }, - { - "epoch": 1.6, - "learning_rate": 9.434441149026018e-07, - "loss": 0.6875, - "step": 62325 - }, - { - "epoch": 1.6, - "learning_rate": 9.434164887587191e-07, - "loss": 0.7256, - "step": 62326 - }, - { - "epoch": 1.6, - "learning_rate": 9.4338886265816e-07, - "loss": 0.6401, - "step": 62327 - }, - { - "epoch": 1.6, - "learning_rate": 9.433612366009453e-07, - "loss": 0.5649, - "step": 62328 - }, - { - "epoch": 1.6, - "learning_rate": 9.433336105870968e-07, - "loss": 0.6753, - "step": 62329 - }, - { - "epoch": 1.6, - "learning_rate": 9.433059846166348e-07, - "loss": 0.613, - "step": 62330 - }, - { - "epoch": 1.6, - "learning_rate": 9.432783586895806e-07, - "loss": 0.6064, - "step": 62331 - }, - { - "epoch": 1.6, - "learning_rate": 9.432507328059558e-07, - "loss": 0.5549, - "step": 62332 - }, - { - "epoch": 1.6, - "learning_rate": 9.432231069657811e-07, - "loss": 0.7334, - "step": 62333 - }, - { - "epoch": 1.6, - "learning_rate": 9.431954811690781e-07, - "loss": 0.5986, - "step": 62334 - }, - { - "epoch": 1.6, - "learning_rate": 9.431678554158677e-07, - "loss": 0.6904, - "step": 62335 - }, - { - "epoch": 1.6, - "learning_rate": 9.431402297061707e-07, - "loss": 0.5833, - "step": 62336 - }, - { - "epoch": 1.6, - "learning_rate": 9.43112604040009e-07, - "loss": 0.5358, - "step": 62337 - }, - { - "epoch": 1.6, - "learning_rate": 9.430849784174031e-07, - "loss": 0.4495, - "step": 62338 - }, - { - "epoch": 1.6, - "learning_rate": 9.430573528383747e-07, - "loss": 0.7246, - "step": 62339 - }, - { - "epoch": 1.6, - "learning_rate": 9.430297273029446e-07, - "loss": 0.7539, - "step": 62340 - }, - { - "epoch": 1.6, - "learning_rate": 9.430021018111338e-07, - "loss": 0.6914, - "step": 62341 - }, - { - "epoch": 1.6, - "learning_rate": 9.429744763629639e-07, - "loss": 0.6294, - "step": 62342 - }, - { - "epoch": 1.6, - "learning_rate": 9.429468509584556e-07, - "loss": 0.6187, - "step": 62343 - }, - { - "epoch": 1.6, - "learning_rate": 9.429192255976304e-07, - "loss": 0.6436, - "step": 62344 - }, - { - "epoch": 1.6, - "learning_rate": 9.428916002805092e-07, - "loss": 0.6167, - "step": 62345 - }, - { - "epoch": 1.6, - "learning_rate": 9.428639750071135e-07, - "loss": 0.478, - "step": 62346 - }, - { - "epoch": 1.6, - "learning_rate": 9.428363497774639e-07, - "loss": 0.7715, - "step": 62347 - }, - { - "epoch": 1.6, - "learning_rate": 9.428087245915822e-07, - "loss": 0.4993, - "step": 62348 - }, - { - "epoch": 1.6, - "learning_rate": 9.427810994494894e-07, - "loss": 0.6816, - "step": 62349 - }, - { - "epoch": 1.6, - "learning_rate": 9.427534743512061e-07, - "loss": 0.7061, - "step": 62350 - }, - { - "epoch": 1.6, - "learning_rate": 9.42725849296754e-07, - "loss": 0.6714, - "step": 62351 - }, - { - "epoch": 1.6, - "learning_rate": 9.426982242861541e-07, - "loss": 0.6143, - "step": 62352 - }, - { - "epoch": 1.6, - "learning_rate": 9.426705993194273e-07, - "loss": 0.6787, - "step": 62353 - }, - { - "epoch": 1.6, - "learning_rate": 9.426429743965952e-07, - "loss": 0.6621, - "step": 62354 - }, - { - "epoch": 1.6, - "learning_rate": 9.426153495176786e-07, - "loss": 0.3123, - "step": 62355 - }, - { - "epoch": 1.6, - "learning_rate": 9.425877246826988e-07, - "loss": 0.605, - "step": 62356 - }, - { - "epoch": 1.6, - "learning_rate": 9.42560099891677e-07, - "loss": 0.6187, - "step": 62357 - }, - { - "epoch": 1.6, - "learning_rate": 9.425324751446345e-07, - "loss": 0.8174, - "step": 62358 - }, - { - "epoch": 1.6, - "learning_rate": 9.425048504415922e-07, - "loss": 0.6304, - "step": 62359 - }, - { - "epoch": 1.6, - "learning_rate": 9.424772257825709e-07, - "loss": 0.4212, - "step": 62360 - }, - { - "epoch": 1.6, - "learning_rate": 9.424496011675925e-07, - "loss": 0.6738, - "step": 62361 - }, - { - "epoch": 1.6, - "learning_rate": 9.424219765966774e-07, - "loss": 0.6631, - "step": 62362 - }, - { - "epoch": 1.6, - "learning_rate": 9.423943520698476e-07, - "loss": 0.4971, - "step": 62363 - }, - { - "epoch": 1.6, - "learning_rate": 9.423667275871234e-07, - "loss": 0.4692, - "step": 62364 - }, - { - "epoch": 1.6, - "learning_rate": 9.423391031485267e-07, - "loss": 0.6416, - "step": 62365 - }, - { - "epoch": 1.6, - "learning_rate": 9.423114787540781e-07, - "loss": 0.6026, - "step": 62366 - }, - { - "epoch": 1.6, - "learning_rate": 9.42283854403799e-07, - "loss": 0.7383, - "step": 62367 - }, - { - "epoch": 1.6, - "learning_rate": 9.422562300977108e-07, - "loss": 0.6016, - "step": 62368 - }, - { - "epoch": 1.6, - "learning_rate": 9.422286058358341e-07, - "loss": 0.6807, - "step": 62369 - }, - { - "epoch": 1.6, - "learning_rate": 9.422009816181901e-07, - "loss": 0.5537, - "step": 62370 - }, - { - "epoch": 1.6, - "learning_rate": 9.421733574448003e-07, - "loss": 0.6035, - "step": 62371 - }, - { - "epoch": 1.6, - "learning_rate": 9.421457333156856e-07, - "loss": 0.3418, - "step": 62372 - }, - { - "epoch": 1.6, - "learning_rate": 9.421181092308674e-07, - "loss": 0.4365, - "step": 62373 - }, - { - "epoch": 1.6, - "learning_rate": 9.420904851903665e-07, - "loss": 0.5728, - "step": 62374 - }, - { - "epoch": 1.6, - "learning_rate": 9.420628611942045e-07, - "loss": 0.6885, - "step": 62375 - }, - { - "epoch": 1.6, - "learning_rate": 9.420352372424021e-07, - "loss": 0.5122, - "step": 62376 - }, - { - "epoch": 1.6, - "learning_rate": 9.420076133349808e-07, - "loss": 0.4312, - "step": 62377 - }, - { - "epoch": 1.6, - "learning_rate": 9.419799894719619e-07, - "loss": 0.6689, - "step": 62378 - }, - { - "epoch": 1.6, - "learning_rate": 9.419523656533658e-07, - "loss": 0.5518, - "step": 62379 - }, - { - "epoch": 1.6, - "learning_rate": 9.419247418792143e-07, - "loss": 0.6021, - "step": 62380 - }, - { - "epoch": 1.6, - "learning_rate": 9.418971181495281e-07, - "loss": 0.4268, - "step": 62381 - }, - { - "epoch": 1.6, - "learning_rate": 9.418694944643289e-07, - "loss": 0.71, - "step": 62382 - }, - { - "epoch": 1.6, - "learning_rate": 9.418418708236373e-07, - "loss": 0.6699, - "step": 62383 - }, - { - "epoch": 1.6, - "learning_rate": 9.418142472274749e-07, - "loss": 0.6133, - "step": 62384 - }, - { - "epoch": 1.6, - "learning_rate": 9.417866236758625e-07, - "loss": 0.7559, - "step": 62385 - }, - { - "epoch": 1.6, - "learning_rate": 9.417590001688215e-07, - "loss": 0.6699, - "step": 62386 - }, - { - "epoch": 1.6, - "learning_rate": 9.417313767063728e-07, - "loss": 0.6064, - "step": 62387 - }, - { - "epoch": 1.6, - "learning_rate": 9.417037532885385e-07, - "loss": 0.4929, - "step": 62388 - }, - { - "epoch": 1.6, - "learning_rate": 9.41676129915338e-07, - "loss": 0.6895, - "step": 62389 - }, - { - "epoch": 1.6, - "learning_rate": 9.416485065867939e-07, - "loss": 0.6719, - "step": 62390 - }, - { - "epoch": 1.6, - "learning_rate": 9.416208833029266e-07, - "loss": 0.4021, - "step": 62391 - }, - { - "epoch": 1.6, - "learning_rate": 9.415932600637576e-07, - "loss": 0.5247, - "step": 62392 - }, - { - "epoch": 1.6, - "learning_rate": 9.415656368693078e-07, - "loss": 0.7705, - "step": 62393 - }, - { - "epoch": 1.6, - "learning_rate": 9.415380137195987e-07, - "loss": 0.5725, - "step": 62394 - }, - { - "epoch": 1.6, - "learning_rate": 9.41510390614651e-07, - "loss": 0.644, - "step": 62395 - }, - { - "epoch": 1.6, - "learning_rate": 9.414827675544865e-07, - "loss": 0.5498, - "step": 62396 - }, - { - "epoch": 1.6, - "learning_rate": 9.414551445391256e-07, - "loss": 0.7432, - "step": 62397 - }, - { - "epoch": 1.6, - "learning_rate": 9.414275215685903e-07, - "loss": 0.749, - "step": 62398 - }, - { - "epoch": 1.6, - "learning_rate": 9.413998986429009e-07, - "loss": 0.6328, - "step": 62399 - }, - { - "epoch": 1.6, - "learning_rate": 9.413722757620789e-07, - "loss": 0.6904, - "step": 62400 - }, - { - "epoch": 1.6, - "learning_rate": 9.413446529261455e-07, - "loss": 0.6855, - "step": 62401 - }, - { - "epoch": 1.6, - "learning_rate": 9.413170301351217e-07, - "loss": 0.5386, - "step": 62402 - }, - { - "epoch": 1.6, - "learning_rate": 9.412894073890289e-07, - "loss": 0.6606, - "step": 62403 - }, - { - "epoch": 1.6, - "learning_rate": 9.412617846878879e-07, - "loss": 0.6729, - "step": 62404 - }, - { - "epoch": 1.6, - "learning_rate": 9.412341620317201e-07, - "loss": 0.7998, - "step": 62405 - }, - { - "epoch": 1.6, - "learning_rate": 9.412065394205467e-07, - "loss": 0.7598, - "step": 62406 - }, - { - "epoch": 1.6, - "learning_rate": 9.411789168543887e-07, - "loss": 0.5032, - "step": 62407 - }, - { - "epoch": 1.6, - "learning_rate": 9.411512943332677e-07, - "loss": 0.6104, - "step": 62408 - }, - { - "epoch": 1.6, - "learning_rate": 9.411236718572041e-07, - "loss": 0.7578, - "step": 62409 - }, - { - "epoch": 1.6, - "learning_rate": 9.410960494262192e-07, - "loss": 0.5389, - "step": 62410 - }, - { - "epoch": 1.6, - "learning_rate": 9.410684270403347e-07, - "loss": 0.7188, - "step": 62411 - }, - { - "epoch": 1.6, - "learning_rate": 9.41040804699571e-07, - "loss": 0.7129, - "step": 62412 - }, - { - "epoch": 1.6, - "learning_rate": 9.4101318240395e-07, - "loss": 0.6357, - "step": 62413 - }, - { - "epoch": 1.6, - "learning_rate": 9.409855601534922e-07, - "loss": 0.666, - "step": 62414 - }, - { - "epoch": 1.6, - "learning_rate": 9.409579379482192e-07, - "loss": 0.584, - "step": 62415 - }, - { - "epoch": 1.6, - "learning_rate": 9.409303157881519e-07, - "loss": 0.791, - "step": 62416 - }, - { - "epoch": 1.6, - "learning_rate": 9.409026936733117e-07, - "loss": 0.6216, - "step": 62417 - }, - { - "epoch": 1.6, - "learning_rate": 9.408750716037198e-07, - "loss": 0.4746, - "step": 62418 - }, - { - "epoch": 1.6, - "learning_rate": 9.408474495793968e-07, - "loss": 0.7046, - "step": 62419 - }, - { - "epoch": 1.6, - "learning_rate": 9.408198276003642e-07, - "loss": 0.7314, - "step": 62420 - }, - { - "epoch": 1.6, - "learning_rate": 9.40792205666643e-07, - "loss": 0.562, - "step": 62421 - }, - { - "epoch": 1.6, - "learning_rate": 9.407645837782548e-07, - "loss": 0.627, - "step": 62422 - }, - { - "epoch": 1.6, - "learning_rate": 9.407369619352203e-07, - "loss": 0.6211, - "step": 62423 - }, - { - "epoch": 1.6, - "learning_rate": 9.407093401375607e-07, - "loss": 0.8408, - "step": 62424 - }, - { - "epoch": 1.6, - "learning_rate": 9.406817183852975e-07, - "loss": 0.6602, - "step": 62425 - }, - { - "epoch": 1.6, - "learning_rate": 9.406540966784512e-07, - "loss": 0.6953, - "step": 62426 - }, - { - "epoch": 1.6, - "learning_rate": 9.406264750170436e-07, - "loss": 0.5596, - "step": 62427 - }, - { - "epoch": 1.6, - "learning_rate": 9.405988534010958e-07, - "loss": 0.6699, - "step": 62428 - }, - { - "epoch": 1.6, - "learning_rate": 9.405712318306283e-07, - "loss": 0.6392, - "step": 62429 - }, - { - "epoch": 1.6, - "learning_rate": 9.40543610305663e-07, - "loss": 0.6182, - "step": 62430 - }, - { - "epoch": 1.6, - "learning_rate": 9.405159888262203e-07, - "loss": 0.6357, - "step": 62431 - }, - { - "epoch": 1.6, - "learning_rate": 9.40488367392322e-07, - "loss": 0.6846, - "step": 62432 - }, - { - "epoch": 1.6, - "learning_rate": 9.404607460039889e-07, - "loss": 0.5879, - "step": 62433 - }, - { - "epoch": 1.6, - "learning_rate": 9.404331246612425e-07, - "loss": 0.582, - "step": 62434 - }, - { - "epoch": 1.6, - "learning_rate": 9.404055033641036e-07, - "loss": 0.3972, - "step": 62435 - }, - { - "epoch": 1.6, - "learning_rate": 9.403778821125935e-07, - "loss": 0.6475, - "step": 62436 - }, - { - "epoch": 1.6, - "learning_rate": 9.403502609067331e-07, - "loss": 0.4285, - "step": 62437 - }, - { - "epoch": 1.6, - "learning_rate": 9.403226397465442e-07, - "loss": 0.5962, - "step": 62438 - }, - { - "epoch": 1.6, - "learning_rate": 9.402950186320474e-07, - "loss": 0.4026, - "step": 62439 - }, - { - "epoch": 1.6, - "learning_rate": 9.402673975632637e-07, - "loss": 0.7041, - "step": 62440 - }, - { - "epoch": 1.6, - "learning_rate": 9.402397765402147e-07, - "loss": 0.5796, - "step": 62441 - }, - { - "epoch": 1.6, - "learning_rate": 9.402121555629214e-07, - "loss": 0.6147, - "step": 62442 - }, - { - "epoch": 1.6, - "learning_rate": 9.401845346314046e-07, - "loss": 0.6128, - "step": 62443 - }, - { - "epoch": 1.6, - "learning_rate": 9.401569137456861e-07, - "loss": 0.7412, - "step": 62444 - }, - { - "epoch": 1.6, - "learning_rate": 9.401292929057864e-07, - "loss": 0.6597, - "step": 62445 - }, - { - "epoch": 1.6, - "learning_rate": 9.401016721117271e-07, - "loss": 0.5869, - "step": 62446 - }, - { - "epoch": 1.6, - "learning_rate": 9.40074051363529e-07, - "loss": 0.6069, - "step": 62447 - }, - { - "epoch": 1.6, - "learning_rate": 9.40046430661214e-07, - "loss": 0.708, - "step": 62448 - }, - { - "epoch": 1.6, - "learning_rate": 9.400188100048024e-07, - "loss": 0.3684, - "step": 62449 - }, - { - "epoch": 1.6, - "learning_rate": 9.399911893943154e-07, - "loss": 0.5663, - "step": 62450 - }, - { - "epoch": 1.6, - "learning_rate": 9.399635688297746e-07, - "loss": 0.5349, - "step": 62451 - }, - { - "epoch": 1.6, - "learning_rate": 9.399359483112008e-07, - "loss": 0.4644, - "step": 62452 - }, - { - "epoch": 1.6, - "learning_rate": 9.399083278386154e-07, - "loss": 0.7056, - "step": 62453 - }, - { - "epoch": 1.6, - "learning_rate": 9.398807074120393e-07, - "loss": 0.3629, - "step": 62454 - }, - { - "epoch": 1.6, - "learning_rate": 9.398530870314939e-07, - "loss": 0.6465, - "step": 62455 - }, - { - "epoch": 1.6, - "learning_rate": 9.39825466697e-07, - "loss": 0.7393, - "step": 62456 - }, - { - "epoch": 1.6, - "learning_rate": 9.397978464085793e-07, - "loss": 0.605, - "step": 62457 - }, - { - "epoch": 1.6, - "learning_rate": 9.397702261662527e-07, - "loss": 0.5293, - "step": 62458 - }, - { - "epoch": 1.6, - "learning_rate": 9.397426059700412e-07, - "loss": 0.4128, - "step": 62459 - }, - { - "epoch": 1.6, - "learning_rate": 9.397149858199658e-07, - "loss": 0.5996, - "step": 62460 - }, - { - "epoch": 1.6, - "learning_rate": 9.39687365716048e-07, - "loss": 0.6099, - "step": 62461 - }, - { - "epoch": 1.6, - "learning_rate": 9.396597456583087e-07, - "loss": 0.7441, - "step": 62462 - }, - { - "epoch": 1.6, - "learning_rate": 9.396321256467692e-07, - "loss": 0.5566, - "step": 62463 - }, - { - "epoch": 1.6, - "learning_rate": 9.396045056814504e-07, - "loss": 0.5537, - "step": 62464 - }, - { - "epoch": 1.6, - "learning_rate": 9.39576885762374e-07, - "loss": 0.4681, - "step": 62465 - }, - { - "epoch": 1.6, - "learning_rate": 9.395492658895605e-07, - "loss": 0.5273, - "step": 62466 - }, - { - "epoch": 1.6, - "learning_rate": 9.395216460630317e-07, - "loss": 0.7822, - "step": 62467 - }, - { - "epoch": 1.6, - "learning_rate": 9.394940262828084e-07, - "loss": 0.7217, - "step": 62468 - }, - { - "epoch": 1.6, - "learning_rate": 9.394664065489114e-07, - "loss": 0.6436, - "step": 62469 - }, - { - "epoch": 1.6, - "learning_rate": 9.394387868613625e-07, - "loss": 0.5035, - "step": 62470 - }, - { - "epoch": 1.6, - "learning_rate": 9.394111672201822e-07, - "loss": 0.8418, - "step": 62471 - }, - { - "epoch": 1.6, - "learning_rate": 9.393835476253922e-07, - "loss": 0.6084, - "step": 62472 - }, - { - "epoch": 1.6, - "learning_rate": 9.393559280770133e-07, - "loss": 0.5776, - "step": 62473 - }, - { - "epoch": 1.6, - "learning_rate": 9.393283085750669e-07, - "loss": 0.709, - "step": 62474 - }, - { - "epoch": 1.6, - "learning_rate": 9.393006891195739e-07, - "loss": 0.7578, - "step": 62475 - }, - { - "epoch": 1.6, - "learning_rate": 9.392730697105558e-07, - "loss": 0.5972, - "step": 62476 - }, - { - "epoch": 1.6, - "learning_rate": 9.392454503480332e-07, - "loss": 0.7529, - "step": 62477 - }, - { - "epoch": 1.6, - "learning_rate": 9.392178310320283e-07, - "loss": 0.7344, - "step": 62478 - }, - { - "epoch": 1.6, - "learning_rate": 9.391902117625608e-07, - "loss": 0.4397, - "step": 62479 - }, - { - "epoch": 1.6, - "learning_rate": 9.391625925396527e-07, - "loss": 0.5405, - "step": 62480 - }, - { - "epoch": 1.6, - "learning_rate": 9.391349733633249e-07, - "loss": 0.7588, - "step": 62481 - }, - { - "epoch": 1.6, - "learning_rate": 9.391073542335989e-07, - "loss": 0.6133, - "step": 62482 - }, - { - "epoch": 1.6, - "learning_rate": 9.390797351504953e-07, - "loss": 0.4644, - "step": 62483 - }, - { - "epoch": 1.6, - "learning_rate": 9.390521161140358e-07, - "loss": 0.5037, - "step": 62484 - }, - { - "epoch": 1.6, - "learning_rate": 9.390244971242411e-07, - "loss": 0.6484, - "step": 62485 - }, - { - "epoch": 1.6, - "learning_rate": 9.389968781811327e-07, - "loss": 0.5459, - "step": 62486 - }, - { - "epoch": 1.6, - "learning_rate": 9.389692592847314e-07, - "loss": 0.6768, - "step": 62487 - }, - { - "epoch": 1.6, - "learning_rate": 9.38941640435059e-07, - "loss": 0.6689, - "step": 62488 - }, - { - "epoch": 1.6, - "learning_rate": 9.389140216321359e-07, - "loss": 0.6777, - "step": 62489 - }, - { - "epoch": 1.6, - "learning_rate": 9.388864028759833e-07, - "loss": 0.6616, - "step": 62490 - }, - { - "epoch": 1.6, - "learning_rate": 9.388587841666228e-07, - "loss": 0.4568, - "step": 62491 - }, - { - "epoch": 1.6, - "learning_rate": 9.388311655040751e-07, - "loss": 0.5425, - "step": 62492 - }, - { - "epoch": 1.6, - "learning_rate": 9.388035468883619e-07, - "loss": 0.7109, - "step": 62493 - }, - { - "epoch": 1.6, - "learning_rate": 9.387759283195036e-07, - "loss": 0.5532, - "step": 62494 - }, - { - "epoch": 1.6, - "learning_rate": 9.387483097975221e-07, - "loss": 0.6431, - "step": 62495 - }, - { - "epoch": 1.6, - "learning_rate": 9.387206913224379e-07, - "loss": 0.5234, - "step": 62496 - }, - { - "epoch": 1.6, - "learning_rate": 9.386930728942728e-07, - "loss": 0.5605, - "step": 62497 - }, - { - "epoch": 1.6, - "learning_rate": 9.386654545130477e-07, - "loss": 0.646, - "step": 62498 - }, - { - "epoch": 1.6, - "learning_rate": 9.386378361787835e-07, - "loss": 0.5356, - "step": 62499 - }, - { - "epoch": 1.6, - "learning_rate": 9.386102178915012e-07, - "loss": 0.6792, - "step": 62500 - }, - { - "epoch": 1.6, - "learning_rate": 9.385825996512224e-07, - "loss": 0.6943, - "step": 62501 - }, - { - "epoch": 1.6, - "learning_rate": 9.38554981457968e-07, - "loss": 0.5645, - "step": 62502 - }, - { - "epoch": 1.6, - "learning_rate": 9.385273633117594e-07, - "loss": 0.6304, - "step": 62503 - }, - { - "epoch": 1.6, - "learning_rate": 9.384997452126174e-07, - "loss": 0.6113, - "step": 62504 - }, - { - "epoch": 1.6, - "learning_rate": 9.384721271605634e-07, - "loss": 0.6309, - "step": 62505 - }, - { - "epoch": 1.6, - "learning_rate": 9.384445091556184e-07, - "loss": 0.5864, - "step": 62506 - }, - { - "epoch": 1.6, - "learning_rate": 9.384168911978036e-07, - "loss": 0.676, - "step": 62507 - }, - { - "epoch": 1.6, - "learning_rate": 9.383892732871406e-07, - "loss": 0.4158, - "step": 62508 - }, - { - "epoch": 1.6, - "learning_rate": 9.383616554236496e-07, - "loss": 0.7144, - "step": 62509 - }, - { - "epoch": 1.6, - "learning_rate": 9.383340376073524e-07, - "loss": 0.5322, - "step": 62510 - }, - { - "epoch": 1.6, - "learning_rate": 9.383064198382697e-07, - "loss": 0.6182, - "step": 62511 - }, - { - "epoch": 1.6, - "learning_rate": 9.382788021164234e-07, - "loss": 0.5981, - "step": 62512 - }, - { - "epoch": 1.6, - "learning_rate": 9.382511844418338e-07, - "loss": 0.5715, - "step": 62513 - }, - { - "epoch": 1.6, - "learning_rate": 9.382235668145227e-07, - "loss": 0.7935, - "step": 62514 - }, - { - "epoch": 1.6, - "learning_rate": 9.381959492345109e-07, - "loss": 0.6465, - "step": 62515 - }, - { - "epoch": 1.6, - "learning_rate": 9.381683317018195e-07, - "loss": 0.6553, - "step": 62516 - }, - { - "epoch": 1.6, - "learning_rate": 9.381407142164699e-07, - "loss": 0.6301, - "step": 62517 - }, - { - "epoch": 1.6, - "learning_rate": 9.381130967784833e-07, - "loss": 0.6284, - "step": 62518 - }, - { - "epoch": 1.6, - "learning_rate": 9.380854793878804e-07, - "loss": 0.5215, - "step": 62519 - }, - { - "epoch": 1.6, - "learning_rate": 9.380578620446828e-07, - "loss": 0.4424, - "step": 62520 - }, - { - "epoch": 1.6, - "learning_rate": 9.380302447489111e-07, - "loss": 0.6348, - "step": 62521 - }, - { - "epoch": 1.6, - "learning_rate": 9.38002627500587e-07, - "loss": 0.606, - "step": 62522 - }, - { - "epoch": 1.6, - "learning_rate": 9.379750102997312e-07, - "loss": 0.6421, - "step": 62523 - }, - { - "epoch": 1.6, - "learning_rate": 9.379473931463655e-07, - "loss": 0.53, - "step": 62524 - }, - { - "epoch": 1.6, - "learning_rate": 9.379197760405102e-07, - "loss": 0.6221, - "step": 62525 - }, - { - "epoch": 1.6, - "learning_rate": 9.378921589821872e-07, - "loss": 0.4111, - "step": 62526 - }, - { - "epoch": 1.6, - "learning_rate": 9.37864541971417e-07, - "loss": 0.6475, - "step": 62527 - }, - { - "epoch": 1.6, - "learning_rate": 9.378369250082217e-07, - "loss": 0.7695, - "step": 62528 - }, - { - "epoch": 1.6, - "learning_rate": 9.378093080926215e-07, - "loss": 0.5835, - "step": 62529 - }, - { - "epoch": 1.6, - "learning_rate": 9.377816912246376e-07, - "loss": 0.6328, - "step": 62530 - }, - { - "epoch": 1.6, - "learning_rate": 9.377540744042916e-07, - "loss": 0.5903, - "step": 62531 - }, - { - "epoch": 1.6, - "learning_rate": 9.377264576316044e-07, - "loss": 0.8008, - "step": 62532 - }, - { - "epoch": 1.6, - "learning_rate": 9.37698840906597e-07, - "loss": 0.6807, - "step": 62533 - }, - { - "epoch": 1.6, - "learning_rate": 9.37671224229291e-07, - "loss": 0.4851, - "step": 62534 - }, - { - "epoch": 1.6, - "learning_rate": 9.376436075997071e-07, - "loss": 0.5444, - "step": 62535 - }, - { - "epoch": 1.6, - "learning_rate": 9.376159910178667e-07, - "loss": 0.5239, - "step": 62536 - }, - { - "epoch": 1.6, - "learning_rate": 9.375883744837907e-07, - "loss": 0.5977, - "step": 62537 - }, - { - "epoch": 1.6, - "learning_rate": 9.375607579975009e-07, - "loss": 0.623, - "step": 62538 - }, - { - "epoch": 1.6, - "learning_rate": 9.375331415590178e-07, - "loss": 0.4878, - "step": 62539 - }, - { - "epoch": 1.6, - "learning_rate": 9.375055251683624e-07, - "loss": 0.5181, - "step": 62540 - }, - { - "epoch": 1.6, - "learning_rate": 9.374779088255564e-07, - "loss": 0.6689, - "step": 62541 - }, - { - "epoch": 1.6, - "learning_rate": 9.374502925306203e-07, - "loss": 0.5703, - "step": 62542 - }, - { - "epoch": 1.6, - "learning_rate": 9.374226762835759e-07, - "loss": 0.47, - "step": 62543 - }, - { - "epoch": 1.6, - "learning_rate": 9.37395060084444e-07, - "loss": 0.7549, - "step": 62544 - }, - { - "epoch": 1.6, - "learning_rate": 9.37367443933246e-07, - "loss": 0.6943, - "step": 62545 - }, - { - "epoch": 1.6, - "learning_rate": 9.373398278300027e-07, - "loss": 0.7412, - "step": 62546 - }, - { - "epoch": 1.6, - "learning_rate": 9.373122117747356e-07, - "loss": 0.6158, - "step": 62547 - }, - { - "epoch": 1.6, - "learning_rate": 9.372845957674658e-07, - "loss": 0.4146, - "step": 62548 - }, - { - "epoch": 1.6, - "learning_rate": 9.372569798082142e-07, - "loss": 0.6045, - "step": 62549 - }, - { - "epoch": 1.6, - "learning_rate": 9.372293638970016e-07, - "loss": 0.5801, - "step": 62550 - }, - { - "epoch": 1.6, - "learning_rate": 9.3720174803385e-07, - "loss": 0.7646, - "step": 62551 - }, - { - "epoch": 1.6, - "learning_rate": 9.371741322187799e-07, - "loss": 0.541, - "step": 62552 - }, - { - "epoch": 1.6, - "learning_rate": 9.371465164518128e-07, - "loss": 0.5508, - "step": 62553 - }, - { - "epoch": 1.6, - "learning_rate": 9.371189007329696e-07, - "loss": 0.7441, - "step": 62554 - }, - { - "epoch": 1.6, - "learning_rate": 9.370912850622719e-07, - "loss": 0.8262, - "step": 62555 - }, - { - "epoch": 1.6, - "learning_rate": 9.370636694397401e-07, - "loss": 0.5229, - "step": 62556 - }, - { - "epoch": 1.6, - "learning_rate": 9.370360538653961e-07, - "loss": 0.6157, - "step": 62557 - }, - { - "epoch": 1.6, - "learning_rate": 9.370084383392608e-07, - "loss": 0.6113, - "step": 62558 - }, - { - "epoch": 1.6, - "learning_rate": 9.369808228613548e-07, - "loss": 0.5513, - "step": 62559 - }, - { - "epoch": 1.6, - "learning_rate": 9.369532074316999e-07, - "loss": 0.4302, - "step": 62560 - }, - { - "epoch": 1.6, - "learning_rate": 9.36925592050317e-07, - "loss": 0.6509, - "step": 62561 - }, - { - "epoch": 1.6, - "learning_rate": 9.368979767172272e-07, - "loss": 0.8359, - "step": 62562 - }, - { - "epoch": 1.6, - "learning_rate": 9.368703614324518e-07, - "loss": 0.752, - "step": 62563 - }, - { - "epoch": 1.6, - "learning_rate": 9.368427461960119e-07, - "loss": 0.4971, - "step": 62564 - }, - { - "epoch": 1.6, - "learning_rate": 9.368151310079285e-07, - "loss": 0.791, - "step": 62565 - }, - { - "epoch": 1.6, - "learning_rate": 9.36787515868223e-07, - "loss": 0.6934, - "step": 62566 - }, - { - "epoch": 1.6, - "learning_rate": 9.367599007769161e-07, - "loss": 0.6992, - "step": 62567 - }, - { - "epoch": 1.6, - "learning_rate": 9.367322857340299e-07, - "loss": 0.8164, - "step": 62568 - }, - { - "epoch": 1.6, - "learning_rate": 9.367046707395843e-07, - "loss": 0.5947, - "step": 62569 - }, - { - "epoch": 1.6, - "learning_rate": 9.366770557936012e-07, - "loss": 0.6045, - "step": 62570 - }, - { - "epoch": 1.6, - "learning_rate": 9.366494408961014e-07, - "loss": 0.6265, - "step": 62571 - }, - { - "epoch": 1.6, - "learning_rate": 9.366218260471064e-07, - "loss": 0.7871, - "step": 62572 - }, - { - "epoch": 1.6, - "learning_rate": 9.36594211246637e-07, - "loss": 0.749, - "step": 62573 - }, - { - "epoch": 1.6, - "learning_rate": 9.365665964947146e-07, - "loss": 0.5723, - "step": 62574 - }, - { - "epoch": 1.6, - "learning_rate": 9.3653898179136e-07, - "loss": 0.5381, - "step": 62575 - }, - { - "epoch": 1.6, - "learning_rate": 9.36511367136595e-07, - "loss": 0.6265, - "step": 62576 - }, - { - "epoch": 1.6, - "learning_rate": 9.3648375253044e-07, - "loss": 0.6387, - "step": 62577 - }, - { - "epoch": 1.6, - "learning_rate": 9.364561379729167e-07, - "loss": 0.7891, - "step": 62578 - }, - { - "epoch": 1.6, - "learning_rate": 9.364285234640461e-07, - "loss": 0.6294, - "step": 62579 - }, - { - "epoch": 1.6, - "learning_rate": 9.36400909003849e-07, - "loss": 0.5088, - "step": 62580 - }, - { - "epoch": 1.6, - "learning_rate": 9.363732945923469e-07, - "loss": 0.5864, - "step": 62581 - }, - { - "epoch": 1.6, - "learning_rate": 9.363456802295606e-07, - "loss": 0.5786, - "step": 62582 - }, - { - "epoch": 1.6, - "learning_rate": 9.363180659155119e-07, - "loss": 0.6416, - "step": 62583 - }, - { - "epoch": 1.6, - "learning_rate": 9.362904516502212e-07, - "loss": 0.564, - "step": 62584 - }, - { - "epoch": 1.6, - "learning_rate": 9.3626283743371e-07, - "loss": 0.7695, - "step": 62585 - }, - { - "epoch": 1.6, - "learning_rate": 9.362352232659995e-07, - "loss": 0.5354, - "step": 62586 - }, - { - "epoch": 1.6, - "learning_rate": 9.362076091471109e-07, - "loss": 0.6841, - "step": 62587 - }, - { - "epoch": 1.6, - "learning_rate": 9.361799950770653e-07, - "loss": 0.5435, - "step": 62588 - }, - { - "epoch": 1.6, - "learning_rate": 9.361523810558836e-07, - "loss": 0.7139, - "step": 62589 - }, - { - "epoch": 1.6, - "learning_rate": 9.361247670835868e-07, - "loss": 0.5889, - "step": 62590 - }, - { - "epoch": 1.6, - "learning_rate": 9.360971531601967e-07, - "loss": 0.6133, - "step": 62591 - }, - { - "epoch": 1.6, - "learning_rate": 9.360695392857336e-07, - "loss": 0.3765, - "step": 62592 - }, - { - "epoch": 1.6, - "learning_rate": 9.360419254602195e-07, - "loss": 0.6992, - "step": 62593 - }, - { - "epoch": 1.6, - "learning_rate": 9.36014311683675e-07, - "loss": 0.5952, - "step": 62594 - }, - { - "epoch": 1.6, - "learning_rate": 9.359866979561215e-07, - "loss": 0.6895, - "step": 62595 - }, - { - "epoch": 1.6, - "learning_rate": 9.359590842775798e-07, - "loss": 0.6899, - "step": 62596 - }, - { - "epoch": 1.6, - "learning_rate": 9.359314706480716e-07, - "loss": 0.708, - "step": 62597 - }, - { - "epoch": 1.6, - "learning_rate": 9.35903857067618e-07, - "loss": 0.4442, - "step": 62598 - }, - { - "epoch": 1.6, - "learning_rate": 9.358762435362393e-07, - "loss": 0.6421, - "step": 62599 - }, - { - "epoch": 1.6, - "learning_rate": 9.358486300539575e-07, - "loss": 0.4393, - "step": 62600 - }, - { - "epoch": 1.6, - "learning_rate": 9.358210166207932e-07, - "loss": 0.7256, - "step": 62601 - }, - { - "epoch": 1.6, - "learning_rate": 9.35793403236768e-07, - "loss": 0.6309, - "step": 62602 - }, - { - "epoch": 1.6, - "learning_rate": 9.357657899019027e-07, - "loss": 0.7549, - "step": 62603 - }, - { - "epoch": 1.6, - "learning_rate": 9.357381766162187e-07, - "loss": 0.6938, - "step": 62604 - }, - { - "epoch": 1.6, - "learning_rate": 9.357105633797371e-07, - "loss": 0.6895, - "step": 62605 - }, - { - "epoch": 1.6, - "learning_rate": 9.356829501924788e-07, - "loss": 0.521, - "step": 62606 - }, - { - "epoch": 1.6, - "learning_rate": 9.356553370544653e-07, - "loss": 0.7261, - "step": 62607 - }, - { - "epoch": 1.6, - "learning_rate": 9.356277239657176e-07, - "loss": 0.7461, - "step": 62608 - }, - { - "epoch": 1.6, - "learning_rate": 9.356001109262564e-07, - "loss": 0.4991, - "step": 62609 - }, - { - "epoch": 1.6, - "learning_rate": 9.355724979361036e-07, - "loss": 0.6528, - "step": 62610 - }, - { - "epoch": 1.6, - "learning_rate": 9.355448849952797e-07, - "loss": 0.6743, - "step": 62611 - }, - { - "epoch": 1.6, - "learning_rate": 9.355172721038063e-07, - "loss": 0.3672, - "step": 62612 - }, - { - "epoch": 1.6, - "learning_rate": 9.354896592617041e-07, - "loss": 0.7217, - "step": 62613 - }, - { - "epoch": 1.6, - "learning_rate": 9.354620464689949e-07, - "loss": 0.6743, - "step": 62614 - }, - { - "epoch": 1.6, - "learning_rate": 9.35434433725699e-07, - "loss": 0.8545, - "step": 62615 - }, - { - "epoch": 1.6, - "learning_rate": 9.354068210318383e-07, - "loss": 0.6543, - "step": 62616 - }, - { - "epoch": 1.6, - "learning_rate": 9.353792083874334e-07, - "loss": 0.4402, - "step": 62617 - }, - { - "epoch": 1.6, - "learning_rate": 9.353515957925061e-07, - "loss": 0.6963, - "step": 62618 - }, - { - "epoch": 1.6, - "learning_rate": 9.35323983247077e-07, - "loss": 0.5459, - "step": 62619 - }, - { - "epoch": 1.6, - "learning_rate": 9.35296370751167e-07, - "loss": 0.666, - "step": 62620 - }, - { - "epoch": 1.61, - "learning_rate": 9.352687583047978e-07, - "loss": 0.8037, - "step": 62621 - }, - { - "epoch": 1.61, - "learning_rate": 9.352411459079904e-07, - "loss": 0.6914, - "step": 62622 - }, - { - "epoch": 1.61, - "learning_rate": 9.352135335607657e-07, - "loss": 0.48, - "step": 62623 - }, - { - "epoch": 1.61, - "learning_rate": 9.351859212631452e-07, - "loss": 0.6001, - "step": 62624 - }, - { - "epoch": 1.61, - "learning_rate": 9.351583090151496e-07, - "loss": 0.6316, - "step": 62625 - }, - { - "epoch": 1.61, - "learning_rate": 9.351306968168006e-07, - "loss": 0.6533, - "step": 62626 - }, - { - "epoch": 1.61, - "learning_rate": 9.351030846681187e-07, - "loss": 0.5764, - "step": 62627 - }, - { - "epoch": 1.61, - "learning_rate": 9.350754725691259e-07, - "loss": 0.7617, - "step": 62628 - }, - { - "epoch": 1.61, - "learning_rate": 9.350478605198427e-07, - "loss": 0.749, - "step": 62629 - }, - { - "epoch": 1.61, - "learning_rate": 9.3502024852029e-07, - "loss": 0.7041, - "step": 62630 - }, - { - "epoch": 1.61, - "learning_rate": 9.349926365704895e-07, - "loss": 0.6895, - "step": 62631 - }, - { - "epoch": 1.61, - "learning_rate": 9.349650246704622e-07, - "loss": 0.5076, - "step": 62632 - }, - { - "epoch": 1.61, - "learning_rate": 9.349374128202291e-07, - "loss": 0.6187, - "step": 62633 - }, - { - "epoch": 1.61, - "learning_rate": 9.349098010198113e-07, - "loss": 0.647, - "step": 62634 - }, - { - "epoch": 1.61, - "learning_rate": 9.348821892692304e-07, - "loss": 0.4836, - "step": 62635 - }, - { - "epoch": 1.61, - "learning_rate": 9.348545775685068e-07, - "loss": 0.6357, - "step": 62636 - }, - { - "epoch": 1.61, - "learning_rate": 9.348269659176624e-07, - "loss": 0.5806, - "step": 62637 - }, - { - "epoch": 1.61, - "learning_rate": 9.347993543167182e-07, - "loss": 0.4961, - "step": 62638 - }, - { - "epoch": 1.61, - "learning_rate": 9.347717427656949e-07, - "loss": 0.5923, - "step": 62639 - }, - { - "epoch": 1.61, - "learning_rate": 9.347441312646137e-07, - "loss": 0.4724, - "step": 62640 - }, - { - "epoch": 1.61, - "learning_rate": 9.347165198134961e-07, - "loss": 0.7021, - "step": 62641 - }, - { - "epoch": 1.61, - "learning_rate": 9.346889084123629e-07, - "loss": 0.5493, - "step": 62642 - }, - { - "epoch": 1.61, - "learning_rate": 9.346612970612355e-07, - "loss": 0.6558, - "step": 62643 - }, - { - "epoch": 1.61, - "learning_rate": 9.346336857601349e-07, - "loss": 0.6484, - "step": 62644 - }, - { - "epoch": 1.61, - "learning_rate": 9.346060745090824e-07, - "loss": 0.5571, - "step": 62645 - }, - { - "epoch": 1.61, - "learning_rate": 9.345784633080987e-07, - "loss": 0.6675, - "step": 62646 - }, - { - "epoch": 1.61, - "learning_rate": 9.345508521572059e-07, - "loss": 0.4613, - "step": 62647 - }, - { - "epoch": 1.61, - "learning_rate": 9.345232410564241e-07, - "loss": 0.7056, - "step": 62648 - }, - { - "epoch": 1.61, - "learning_rate": 9.344956300057747e-07, - "loss": 0.4182, - "step": 62649 - }, - { - "epoch": 1.61, - "learning_rate": 9.344680190052793e-07, - "loss": 0.5493, - "step": 62650 - }, - { - "epoch": 1.61, - "learning_rate": 9.344404080549584e-07, - "loss": 0.6792, - "step": 62651 - }, - { - "epoch": 1.61, - "learning_rate": 9.344127971548336e-07, - "loss": 0.7104, - "step": 62652 - }, - { - "epoch": 1.61, - "learning_rate": 9.343851863049259e-07, - "loss": 0.519, - "step": 62653 - }, - { - "epoch": 1.61, - "learning_rate": 9.343575755052565e-07, - "loss": 0.4983, - "step": 62654 - }, - { - "epoch": 1.61, - "learning_rate": 9.343299647558463e-07, - "loss": 0.7021, - "step": 62655 - }, - { - "epoch": 1.61, - "learning_rate": 9.343023540567169e-07, - "loss": 0.6777, - "step": 62656 - }, - { - "epoch": 1.61, - "learning_rate": 9.342747434078894e-07, - "loss": 0.6206, - "step": 62657 - }, - { - "epoch": 1.61, - "learning_rate": 9.342471328093844e-07, - "loss": 0.6729, - "step": 62658 - }, - { - "epoch": 1.61, - "learning_rate": 9.342195222612231e-07, - "loss": 0.7607, - "step": 62659 - }, - { - "epoch": 1.61, - "learning_rate": 9.341919117634272e-07, - "loss": 0.7656, - "step": 62660 - }, - { - "epoch": 1.61, - "learning_rate": 9.341643013160173e-07, - "loss": 0.7715, - "step": 62661 - }, - { - "epoch": 1.61, - "learning_rate": 9.34136690919015e-07, - "loss": 0.6606, - "step": 62662 - }, - { - "epoch": 1.61, - "learning_rate": 9.341090805724408e-07, - "loss": 0.5261, - "step": 62663 - }, - { - "epoch": 1.61, - "learning_rate": 9.340814702763166e-07, - "loss": 0.3267, - "step": 62664 - }, - { - "epoch": 1.61, - "learning_rate": 9.340538600306631e-07, - "loss": 0.5103, - "step": 62665 - }, - { - "epoch": 1.61, - "learning_rate": 9.340262498355016e-07, - "loss": 0.6133, - "step": 62666 - }, - { - "epoch": 1.61, - "learning_rate": 9.339986396908534e-07, - "loss": 0.5127, - "step": 62667 - }, - { - "epoch": 1.61, - "learning_rate": 9.33971029596739e-07, - "loss": 0.6108, - "step": 62668 - }, - { - "epoch": 1.61, - "learning_rate": 9.339434195531802e-07, - "loss": 0.5061, - "step": 62669 - }, - { - "epoch": 1.61, - "learning_rate": 9.339158095601977e-07, - "loss": 0.624, - "step": 62670 - }, - { - "epoch": 1.61, - "learning_rate": 9.33888199617813e-07, - "loss": 0.624, - "step": 62671 - }, - { - "epoch": 1.61, - "learning_rate": 9.338605897260467e-07, - "loss": 0.7139, - "step": 62672 - }, - { - "epoch": 1.61, - "learning_rate": 9.338329798849207e-07, - "loss": 0.6592, - "step": 62673 - }, - { - "epoch": 1.61, - "learning_rate": 9.338053700944554e-07, - "loss": 0.707, - "step": 62674 - }, - { - "epoch": 1.61, - "learning_rate": 9.337777603546726e-07, - "loss": 0.6606, - "step": 62675 - }, - { - "epoch": 1.61, - "learning_rate": 9.337501506655928e-07, - "loss": 0.6621, - "step": 62676 - }, - { - "epoch": 1.61, - "learning_rate": 9.337225410272382e-07, - "loss": 0.623, - "step": 62677 - }, - { - "epoch": 1.61, - "learning_rate": 9.336949314396286e-07, - "loss": 0.5532, - "step": 62678 - }, - { - "epoch": 1.61, - "learning_rate": 9.336673219027858e-07, - "loss": 0.5476, - "step": 62679 - }, - { - "epoch": 1.61, - "learning_rate": 9.336397124167309e-07, - "loss": 0.4976, - "step": 62680 - }, - { - "epoch": 1.61, - "learning_rate": 9.33612102981485e-07, - "loss": 0.7046, - "step": 62681 - }, - { - "epoch": 1.61, - "learning_rate": 9.335844935970691e-07, - "loss": 0.7236, - "step": 62682 - }, - { - "epoch": 1.61, - "learning_rate": 9.335568842635049e-07, - "loss": 0.6846, - "step": 62683 - }, - { - "epoch": 1.61, - "learning_rate": 9.335292749808127e-07, - "loss": 0.8428, - "step": 62684 - }, - { - "epoch": 1.61, - "learning_rate": 9.335016657490144e-07, - "loss": 0.6055, - "step": 62685 - }, - { - "epoch": 1.61, - "learning_rate": 9.334740565681306e-07, - "loss": 0.6953, - "step": 62686 - }, - { - "epoch": 1.61, - "learning_rate": 9.33446447438183e-07, - "loss": 0.4355, - "step": 62687 - }, - { - "epoch": 1.61, - "learning_rate": 9.334188383591923e-07, - "loss": 0.561, - "step": 62688 - }, - { - "epoch": 1.61, - "learning_rate": 9.333912293311794e-07, - "loss": 0.6611, - "step": 62689 - }, - { - "epoch": 1.61, - "learning_rate": 9.333636203541662e-07, - "loss": 0.6826, - "step": 62690 - }, - { - "epoch": 1.61, - "learning_rate": 9.333360114281729e-07, - "loss": 0.6401, - "step": 62691 - }, - { - "epoch": 1.61, - "learning_rate": 9.333084025532216e-07, - "loss": 0.6318, - "step": 62692 - }, - { - "epoch": 1.61, - "learning_rate": 9.332807937293327e-07, - "loss": 0.4622, - "step": 62693 - }, - { - "epoch": 1.61, - "learning_rate": 9.332531849565279e-07, - "loss": 0.5474, - "step": 62694 - }, - { - "epoch": 1.61, - "learning_rate": 9.332255762348279e-07, - "loss": 0.7715, - "step": 62695 - }, - { - "epoch": 1.61, - "learning_rate": 9.331979675642538e-07, - "loss": 0.4868, - "step": 62696 - }, - { - "epoch": 1.61, - "learning_rate": 9.331703589448275e-07, - "loss": 0.6294, - "step": 62697 - }, - { - "epoch": 1.61, - "learning_rate": 9.331427503765694e-07, - "loss": 0.5947, - "step": 62698 - }, - { - "epoch": 1.61, - "learning_rate": 9.331151418595005e-07, - "loss": 0.7324, - "step": 62699 - }, - { - "epoch": 1.61, - "learning_rate": 9.330875333936426e-07, - "loss": 0.7217, - "step": 62700 - }, - { - "epoch": 1.61, - "learning_rate": 9.33059924979016e-07, - "loss": 0.6509, - "step": 62701 - }, - { - "epoch": 1.61, - "learning_rate": 9.330323166156428e-07, - "loss": 0.7227, - "step": 62702 - }, - { - "epoch": 1.61, - "learning_rate": 9.330047083035435e-07, - "loss": 0.6133, - "step": 62703 - }, - { - "epoch": 1.61, - "learning_rate": 9.329771000427395e-07, - "loss": 0.6133, - "step": 62704 - }, - { - "epoch": 1.61, - "learning_rate": 9.329494918332517e-07, - "loss": 0.6953, - "step": 62705 - }, - { - "epoch": 1.61, - "learning_rate": 9.329218836751016e-07, - "loss": 0.5986, - "step": 62706 - }, - { - "epoch": 1.61, - "learning_rate": 9.328942755683104e-07, - "loss": 0.5952, - "step": 62707 - }, - { - "epoch": 1.61, - "learning_rate": 9.328666675128985e-07, - "loss": 0.686, - "step": 62708 - }, - { - "epoch": 1.61, - "learning_rate": 9.328390595088877e-07, - "loss": 0.6445, - "step": 62709 - }, - { - "epoch": 1.61, - "learning_rate": 9.328114515562985e-07, - "loss": 0.5703, - "step": 62710 - }, - { - "epoch": 1.61, - "learning_rate": 9.32783843655153e-07, - "loss": 0.5803, - "step": 62711 - }, - { - "epoch": 1.61, - "learning_rate": 9.327562358054718e-07, - "loss": 0.5894, - "step": 62712 - }, - { - "epoch": 1.61, - "learning_rate": 9.327286280072757e-07, - "loss": 0.4177, - "step": 62713 - }, - { - "epoch": 1.61, - "learning_rate": 9.327010202605865e-07, - "loss": 0.6885, - "step": 62714 - }, - { - "epoch": 1.61, - "learning_rate": 9.326734125654249e-07, - "loss": 0.8569, - "step": 62715 - }, - { - "epoch": 1.61, - "learning_rate": 9.326458049218122e-07, - "loss": 0.814, - "step": 62716 - }, - { - "epoch": 1.61, - "learning_rate": 9.326181973297699e-07, - "loss": 0.7646, - "step": 62717 - }, - { - "epoch": 1.61, - "learning_rate": 9.325905897893182e-07, - "loss": 0.4868, - "step": 62718 - }, - { - "epoch": 1.61, - "learning_rate": 9.325629823004791e-07, - "loss": 0.6797, - "step": 62719 - }, - { - "epoch": 1.61, - "learning_rate": 9.325353748632731e-07, - "loss": 0.6084, - "step": 62720 - }, - { - "epoch": 1.61, - "learning_rate": 9.325077674777219e-07, - "loss": 0.6533, - "step": 62721 - }, - { - "epoch": 1.61, - "learning_rate": 9.324801601438462e-07, - "loss": 0.6963, - "step": 62722 - }, - { - "epoch": 1.61, - "learning_rate": 9.324525528616676e-07, - "loss": 0.5962, - "step": 62723 - }, - { - "epoch": 1.61, - "learning_rate": 9.324249456312066e-07, - "loss": 0.6626, - "step": 62724 - }, - { - "epoch": 1.61, - "learning_rate": 9.323973384524851e-07, - "loss": 0.542, - "step": 62725 - }, - { - "epoch": 1.61, - "learning_rate": 9.323697313255236e-07, - "loss": 0.5181, - "step": 62726 - }, - { - "epoch": 1.61, - "learning_rate": 9.32342124250344e-07, - "loss": 0.4622, - "step": 62727 - }, - { - "epoch": 1.61, - "learning_rate": 9.323145172269665e-07, - "loss": 0.6348, - "step": 62728 - }, - { - "epoch": 1.61, - "learning_rate": 9.322869102554128e-07, - "loss": 0.6245, - "step": 62729 - }, - { - "epoch": 1.61, - "learning_rate": 9.322593033357036e-07, - "loss": 0.6611, - "step": 62730 - }, - { - "epoch": 1.61, - "learning_rate": 9.322316964678607e-07, - "loss": 0.6553, - "step": 62731 - }, - { - "epoch": 1.61, - "learning_rate": 9.322040896519046e-07, - "loss": 0.5811, - "step": 62732 - }, - { - "epoch": 1.61, - "learning_rate": 9.321764828878567e-07, - "loss": 0.6284, - "step": 62733 - }, - { - "epoch": 1.61, - "learning_rate": 9.321488761757383e-07, - "loss": 0.627, - "step": 62734 - }, - { - "epoch": 1.61, - "learning_rate": 9.321212695155703e-07, - "loss": 0.7861, - "step": 62735 - }, - { - "epoch": 1.61, - "learning_rate": 9.320936629073739e-07, - "loss": 0.5027, - "step": 62736 - }, - { - "epoch": 1.61, - "learning_rate": 9.320660563511706e-07, - "loss": 0.7061, - "step": 62737 - }, - { - "epoch": 1.61, - "learning_rate": 9.32038449846981e-07, - "loss": 0.7041, - "step": 62738 - }, - { - "epoch": 1.61, - "learning_rate": 9.320108433948263e-07, - "loss": 0.5557, - "step": 62739 - }, - { - "epoch": 1.61, - "learning_rate": 9.319832369947279e-07, - "loss": 0.7275, - "step": 62740 - }, - { - "epoch": 1.61, - "learning_rate": 9.319556306467066e-07, - "loss": 0.5786, - "step": 62741 - }, - { - "epoch": 1.61, - "learning_rate": 9.319280243507839e-07, - "loss": 0.7295, - "step": 62742 - }, - { - "epoch": 1.61, - "learning_rate": 9.319004181069806e-07, - "loss": 0.668, - "step": 62743 - }, - { - "epoch": 1.61, - "learning_rate": 9.318728119153183e-07, - "loss": 0.6895, - "step": 62744 - }, - { - "epoch": 1.61, - "learning_rate": 9.318452057758176e-07, - "loss": 0.6226, - "step": 62745 - }, - { - "epoch": 1.61, - "learning_rate": 9.318175996885002e-07, - "loss": 0.791, - "step": 62746 - }, - { - "epoch": 1.61, - "learning_rate": 9.31789993653387e-07, - "loss": 0.5972, - "step": 62747 - }, - { - "epoch": 1.61, - "learning_rate": 9.317623876704988e-07, - "loss": 0.6533, - "step": 62748 - }, - { - "epoch": 1.61, - "learning_rate": 9.31734781739857e-07, - "loss": 0.6074, - "step": 62749 - }, - { - "epoch": 1.61, - "learning_rate": 9.317071758614828e-07, - "loss": 0.8213, - "step": 62750 - }, - { - "epoch": 1.61, - "learning_rate": 9.316795700353971e-07, - "loss": 0.4839, - "step": 62751 - }, - { - "epoch": 1.61, - "learning_rate": 9.316519642616214e-07, - "loss": 0.7002, - "step": 62752 - }, - { - "epoch": 1.61, - "learning_rate": 9.316243585401765e-07, - "loss": 0.7627, - "step": 62753 - }, - { - "epoch": 1.61, - "learning_rate": 9.315967528710839e-07, - "loss": 0.7822, - "step": 62754 - }, - { - "epoch": 1.61, - "learning_rate": 9.315691472543642e-07, - "loss": 0.5444, - "step": 62755 - }, - { - "epoch": 1.61, - "learning_rate": 9.315415416900392e-07, - "loss": 0.5405, - "step": 62756 - }, - { - "epoch": 1.61, - "learning_rate": 9.315139361781299e-07, - "loss": 0.6357, - "step": 62757 - }, - { - "epoch": 1.61, - "learning_rate": 9.314863307186567e-07, - "loss": 0.5566, - "step": 62758 - }, - { - "epoch": 1.61, - "learning_rate": 9.314587253116415e-07, - "loss": 0.6279, - "step": 62759 - }, - { - "epoch": 1.61, - "learning_rate": 9.31431119957105e-07, - "loss": 0.5298, - "step": 62760 - }, - { - "epoch": 1.61, - "learning_rate": 9.314035146550688e-07, - "loss": 0.6621, - "step": 62761 - }, - { - "epoch": 1.61, - "learning_rate": 9.313759094055535e-07, - "loss": 0.6465, - "step": 62762 - }, - { - "epoch": 1.61, - "learning_rate": 9.313483042085808e-07, - "loss": 0.6582, - "step": 62763 - }, - { - "epoch": 1.61, - "learning_rate": 9.313206990641713e-07, - "loss": 0.425, - "step": 62764 - }, - { - "epoch": 1.61, - "learning_rate": 9.312930939723465e-07, - "loss": 0.6097, - "step": 62765 - }, - { - "epoch": 1.61, - "learning_rate": 9.312654889331274e-07, - "loss": 0.5688, - "step": 62766 - }, - { - "epoch": 1.61, - "learning_rate": 9.312378839465357e-07, - "loss": 0.4829, - "step": 62767 - }, - { - "epoch": 1.61, - "learning_rate": 9.312102790125913e-07, - "loss": 0.8828, - "step": 62768 - }, - { - "epoch": 1.61, - "learning_rate": 9.311826741313164e-07, - "loss": 0.5918, - "step": 62769 - }, - { - "epoch": 1.61, - "learning_rate": 9.311550693027313e-07, - "loss": 0.7158, - "step": 62770 - }, - { - "epoch": 1.61, - "learning_rate": 9.311274645268579e-07, - "loss": 0.5869, - "step": 62771 - }, - { - "epoch": 1.61, - "learning_rate": 9.310998598037169e-07, - "loss": 0.6724, - "step": 62772 - }, - { - "epoch": 1.61, - "learning_rate": 9.310722551333298e-07, - "loss": 0.5237, - "step": 62773 - }, - { - "epoch": 1.61, - "learning_rate": 9.310446505157172e-07, - "loss": 0.6641, - "step": 62774 - }, - { - "epoch": 1.61, - "learning_rate": 9.310170459509008e-07, - "loss": 0.5486, - "step": 62775 - }, - { - "epoch": 1.61, - "learning_rate": 9.309894414389012e-07, - "loss": 0.7314, - "step": 62776 - }, - { - "epoch": 1.61, - "learning_rate": 9.309618369797403e-07, - "loss": 0.7148, - "step": 62777 - }, - { - "epoch": 1.61, - "learning_rate": 9.309342325734385e-07, - "loss": 0.5, - "step": 62778 - }, - { - "epoch": 1.61, - "learning_rate": 9.309066282200171e-07, - "loss": 0.5605, - "step": 62779 - }, - { - "epoch": 1.61, - "learning_rate": 9.308790239194973e-07, - "loss": 0.5811, - "step": 62780 - }, - { - "epoch": 1.61, - "learning_rate": 9.308514196719002e-07, - "loss": 0.625, - "step": 62781 - }, - { - "epoch": 1.61, - "learning_rate": 9.308238154772472e-07, - "loss": 0.7158, - "step": 62782 - }, - { - "epoch": 1.61, - "learning_rate": 9.30796211335559e-07, - "loss": 0.6465, - "step": 62783 - }, - { - "epoch": 1.61, - "learning_rate": 9.307686072468572e-07, - "loss": 0.5649, - "step": 62784 - }, - { - "epoch": 1.61, - "learning_rate": 9.307410032111626e-07, - "loss": 0.5021, - "step": 62785 - }, - { - "epoch": 1.61, - "learning_rate": 9.307133992284962e-07, - "loss": 0.5332, - "step": 62786 - }, - { - "epoch": 1.61, - "learning_rate": 9.306857952988798e-07, - "loss": 0.5291, - "step": 62787 - }, - { - "epoch": 1.61, - "learning_rate": 9.306581914223339e-07, - "loss": 0.7285, - "step": 62788 - }, - { - "epoch": 1.61, - "learning_rate": 9.306305875988796e-07, - "loss": 0.7666, - "step": 62789 - }, - { - "epoch": 1.61, - "learning_rate": 9.306029838285387e-07, - "loss": 0.5466, - "step": 62790 - }, - { - "epoch": 1.61, - "learning_rate": 9.305753801113316e-07, - "loss": 0.6294, - "step": 62791 - }, - { - "epoch": 1.61, - "learning_rate": 9.305477764472798e-07, - "loss": 0.7861, - "step": 62792 - }, - { - "epoch": 1.61, - "learning_rate": 9.305201728364042e-07, - "loss": 0.5547, - "step": 62793 - }, - { - "epoch": 1.61, - "learning_rate": 9.304925692787264e-07, - "loss": 0.4888, - "step": 62794 - }, - { - "epoch": 1.61, - "learning_rate": 9.304649657742669e-07, - "loss": 0.7021, - "step": 62795 - }, - { - "epoch": 1.61, - "learning_rate": 9.304373623230476e-07, - "loss": 0.5435, - "step": 62796 - }, - { - "epoch": 1.61, - "learning_rate": 9.304097589250892e-07, - "loss": 0.7344, - "step": 62797 - }, - { - "epoch": 1.61, - "learning_rate": 9.303821555804126e-07, - "loss": 0.8164, - "step": 62798 - }, - { - "epoch": 1.61, - "learning_rate": 9.303545522890393e-07, - "loss": 0.3901, - "step": 62799 - }, - { - "epoch": 1.61, - "learning_rate": 9.303269490509902e-07, - "loss": 0.6064, - "step": 62800 - }, - { - "epoch": 1.61, - "learning_rate": 9.302993458662867e-07, - "loss": 0.3881, - "step": 62801 - }, - { - "epoch": 1.61, - "learning_rate": 9.302717427349498e-07, - "loss": 0.5884, - "step": 62802 - }, - { - "epoch": 1.61, - "learning_rate": 9.302441396570003e-07, - "loss": 0.6885, - "step": 62803 - }, - { - "epoch": 1.61, - "learning_rate": 9.3021653663246e-07, - "loss": 0.7324, - "step": 62804 - }, - { - "epoch": 1.61, - "learning_rate": 9.301889336613494e-07, - "loss": 0.665, - "step": 62805 - }, - { - "epoch": 1.61, - "learning_rate": 9.301613307436902e-07, - "loss": 0.8252, - "step": 62806 - }, - { - "epoch": 1.61, - "learning_rate": 9.301337278795034e-07, - "loss": 0.5444, - "step": 62807 - }, - { - "epoch": 1.61, - "learning_rate": 9.301061250688095e-07, - "loss": 0.6904, - "step": 62808 - }, - { - "epoch": 1.61, - "learning_rate": 9.300785223116305e-07, - "loss": 0.6807, - "step": 62809 - }, - { - "epoch": 1.61, - "learning_rate": 9.30050919607987e-07, - "loss": 0.6445, - "step": 62810 - }, - { - "epoch": 1.61, - "learning_rate": 9.300233169579003e-07, - "loss": 0.5439, - "step": 62811 - }, - { - "epoch": 1.61, - "learning_rate": 9.299957143613915e-07, - "loss": 0.7393, - "step": 62812 - }, - { - "epoch": 1.61, - "learning_rate": 9.299681118184819e-07, - "loss": 0.3955, - "step": 62813 - }, - { - "epoch": 1.61, - "learning_rate": 9.299405093291922e-07, - "loss": 0.6914, - "step": 62814 - }, - { - "epoch": 1.61, - "learning_rate": 9.299129068935442e-07, - "loss": 0.6841, - "step": 62815 - }, - { - "epoch": 1.61, - "learning_rate": 9.298853045115584e-07, - "loss": 0.6318, - "step": 62816 - }, - { - "epoch": 1.61, - "learning_rate": 9.298577021832565e-07, - "loss": 0.7598, - "step": 62817 - }, - { - "epoch": 1.61, - "learning_rate": 9.298300999086593e-07, - "loss": 0.7402, - "step": 62818 - }, - { - "epoch": 1.61, - "learning_rate": 9.298024976877878e-07, - "loss": 0.6787, - "step": 62819 - }, - { - "epoch": 1.61, - "learning_rate": 9.297748955206633e-07, - "loss": 0.6504, - "step": 62820 - }, - { - "epoch": 1.61, - "learning_rate": 9.297472934073069e-07, - "loss": 0.5303, - "step": 62821 - }, - { - "epoch": 1.61, - "learning_rate": 9.297196913477397e-07, - "loss": 0.6973, - "step": 62822 - }, - { - "epoch": 1.61, - "learning_rate": 9.296920893419831e-07, - "loss": 0.6787, - "step": 62823 - }, - { - "epoch": 1.61, - "learning_rate": 9.296644873900577e-07, - "loss": 0.5786, - "step": 62824 - }, - { - "epoch": 1.61, - "learning_rate": 9.296368854919854e-07, - "loss": 0.6553, - "step": 62825 - }, - { - "epoch": 1.61, - "learning_rate": 9.296092836477865e-07, - "loss": 0.5815, - "step": 62826 - }, - { - "epoch": 1.61, - "learning_rate": 9.295816818574831e-07, - "loss": 0.606, - "step": 62827 - }, - { - "epoch": 1.61, - "learning_rate": 9.295540801210955e-07, - "loss": 0.6377, - "step": 62828 - }, - { - "epoch": 1.61, - "learning_rate": 9.295264784386449e-07, - "loss": 0.6152, - "step": 62829 - }, - { - "epoch": 1.61, - "learning_rate": 9.294988768101528e-07, - "loss": 0.7744, - "step": 62830 - }, - { - "epoch": 1.61, - "learning_rate": 9.2947127523564e-07, - "loss": 0.5483, - "step": 62831 - }, - { - "epoch": 1.61, - "learning_rate": 9.294436737151279e-07, - "loss": 0.6763, - "step": 62832 - }, - { - "epoch": 1.61, - "learning_rate": 9.294160722486375e-07, - "loss": 0.7373, - "step": 62833 - }, - { - "epoch": 1.61, - "learning_rate": 9.293884708361901e-07, - "loss": 0.615, - "step": 62834 - }, - { - "epoch": 1.61, - "learning_rate": 9.293608694778065e-07, - "loss": 0.7974, - "step": 62835 - }, - { - "epoch": 1.61, - "learning_rate": 9.293332681735083e-07, - "loss": 0.604, - "step": 62836 - }, - { - "epoch": 1.61, - "learning_rate": 9.293056669233164e-07, - "loss": 0.6279, - "step": 62837 - }, - { - "epoch": 1.61, - "learning_rate": 9.292780657272518e-07, - "loss": 0.6533, - "step": 62838 - }, - { - "epoch": 1.61, - "learning_rate": 9.292504645853355e-07, - "loss": 0.6855, - "step": 62839 - }, - { - "epoch": 1.61, - "learning_rate": 9.292228634975891e-07, - "loss": 0.5459, - "step": 62840 - }, - { - "epoch": 1.61, - "learning_rate": 9.291952624640333e-07, - "loss": 0.4248, - "step": 62841 - }, - { - "epoch": 1.61, - "learning_rate": 9.291676614846897e-07, - "loss": 0.5444, - "step": 62842 - }, - { - "epoch": 1.61, - "learning_rate": 9.291400605595788e-07, - "loss": 0.6719, - "step": 62843 - }, - { - "epoch": 1.61, - "learning_rate": 9.291124596887224e-07, - "loss": 0.6963, - "step": 62844 - }, - { - "epoch": 1.61, - "learning_rate": 9.290848588721412e-07, - "loss": 0.6562, - "step": 62845 - }, - { - "epoch": 1.61, - "learning_rate": 9.290572581098565e-07, - "loss": 0.5859, - "step": 62846 - }, - { - "epoch": 1.61, - "learning_rate": 9.290296574018896e-07, - "loss": 0.6064, - "step": 62847 - }, - { - "epoch": 1.61, - "learning_rate": 9.290020567482611e-07, - "loss": 0.5522, - "step": 62848 - }, - { - "epoch": 1.61, - "learning_rate": 9.289744561489927e-07, - "loss": 0.6885, - "step": 62849 - }, - { - "epoch": 1.61, - "learning_rate": 9.289468556041051e-07, - "loss": 0.5974, - "step": 62850 - }, - { - "epoch": 1.61, - "learning_rate": 9.289192551136198e-07, - "loss": 0.8018, - "step": 62851 - }, - { - "epoch": 1.61, - "learning_rate": 9.288916546775576e-07, - "loss": 0.5747, - "step": 62852 - }, - { - "epoch": 1.61, - "learning_rate": 9.288640542959398e-07, - "loss": 0.7441, - "step": 62853 - }, - { - "epoch": 1.61, - "learning_rate": 9.288364539687875e-07, - "loss": 0.5137, - "step": 62854 - }, - { - "epoch": 1.61, - "learning_rate": 9.288088536961221e-07, - "loss": 0.8545, - "step": 62855 - }, - { - "epoch": 1.61, - "learning_rate": 9.287812534779642e-07, - "loss": 0.575, - "step": 62856 - }, - { - "epoch": 1.61, - "learning_rate": 9.287536533143357e-07, - "loss": 0.3889, - "step": 62857 - }, - { - "epoch": 1.61, - "learning_rate": 9.287260532052569e-07, - "loss": 0.6279, - "step": 62858 - }, - { - "epoch": 1.61, - "learning_rate": 9.286984531507493e-07, - "loss": 0.5254, - "step": 62859 - }, - { - "epoch": 1.61, - "learning_rate": 9.286708531508338e-07, - "loss": 0.7559, - "step": 62860 - }, - { - "epoch": 1.61, - "learning_rate": 9.286432532055321e-07, - "loss": 0.3954, - "step": 62861 - }, - { - "epoch": 1.61, - "learning_rate": 9.286156533148647e-07, - "loss": 0.7529, - "step": 62862 - }, - { - "epoch": 1.61, - "learning_rate": 9.285880534788532e-07, - "loss": 0.7227, - "step": 62863 - }, - { - "epoch": 1.61, - "learning_rate": 9.285604536975183e-07, - "loss": 0.7168, - "step": 62864 - }, - { - "epoch": 1.61, - "learning_rate": 9.285328539708817e-07, - "loss": 0.7109, - "step": 62865 - }, - { - "epoch": 1.61, - "learning_rate": 9.285052542989639e-07, - "loss": 0.6973, - "step": 62866 - }, - { - "epoch": 1.61, - "learning_rate": 9.284776546817867e-07, - "loss": 0.6299, - "step": 62867 - }, - { - "epoch": 1.61, - "learning_rate": 9.284500551193708e-07, - "loss": 0.5991, - "step": 62868 - }, - { - "epoch": 1.61, - "learning_rate": 9.284224556117372e-07, - "loss": 0.7197, - "step": 62869 - }, - { - "epoch": 1.61, - "learning_rate": 9.283948561589074e-07, - "loss": 0.7119, - "step": 62870 - }, - { - "epoch": 1.61, - "learning_rate": 9.283672567609021e-07, - "loss": 0.6221, - "step": 62871 - }, - { - "epoch": 1.61, - "learning_rate": 9.283396574177429e-07, - "loss": 0.4966, - "step": 62872 - }, - { - "epoch": 1.61, - "learning_rate": 9.283120581294505e-07, - "loss": 0.7617, - "step": 62873 - }, - { - "epoch": 1.61, - "learning_rate": 9.282844588960466e-07, - "loss": 0.6304, - "step": 62874 - }, - { - "epoch": 1.61, - "learning_rate": 9.28256859717552e-07, - "loss": 0.6621, - "step": 62875 - }, - { - "epoch": 1.61, - "learning_rate": 9.282292605939876e-07, - "loss": 0.7656, - "step": 62876 - }, - { - "epoch": 1.61, - "learning_rate": 9.28201661525375e-07, - "loss": 0.6113, - "step": 62877 - }, - { - "epoch": 1.61, - "learning_rate": 9.281740625117351e-07, - "loss": 0.4568, - "step": 62878 - }, - { - "epoch": 1.61, - "learning_rate": 9.281464635530886e-07, - "loss": 0.7588, - "step": 62879 - }, - { - "epoch": 1.61, - "learning_rate": 9.281188646494574e-07, - "loss": 0.521, - "step": 62880 - }, - { - "epoch": 1.61, - "learning_rate": 9.280912658008621e-07, - "loss": 0.6758, - "step": 62881 - }, - { - "epoch": 1.61, - "learning_rate": 9.280636670073241e-07, - "loss": 0.6353, - "step": 62882 - }, - { - "epoch": 1.61, - "learning_rate": 9.280360682688643e-07, - "loss": 0.7617, - "step": 62883 - }, - { - "epoch": 1.61, - "learning_rate": 9.280084695855042e-07, - "loss": 0.573, - "step": 62884 - }, - { - "epoch": 1.61, - "learning_rate": 9.279808709572644e-07, - "loss": 0.6782, - "step": 62885 - }, - { - "epoch": 1.61, - "learning_rate": 9.279532723841667e-07, - "loss": 0.6132, - "step": 62886 - }, - { - "epoch": 1.61, - "learning_rate": 9.27925673866232e-07, - "loss": 0.8027, - "step": 62887 - }, - { - "epoch": 1.61, - "learning_rate": 9.278980754034807e-07, - "loss": 0.4673, - "step": 62888 - }, - { - "epoch": 1.61, - "learning_rate": 9.27870476995935e-07, - "loss": 0.6514, - "step": 62889 - }, - { - "epoch": 1.61, - "learning_rate": 9.278428786436152e-07, - "loss": 0.5732, - "step": 62890 - }, - { - "epoch": 1.61, - "learning_rate": 9.278152803465431e-07, - "loss": 0.6963, - "step": 62891 - }, - { - "epoch": 1.61, - "learning_rate": 9.277876821047395e-07, - "loss": 0.7188, - "step": 62892 - }, - { - "epoch": 1.61, - "learning_rate": 9.277600839182252e-07, - "loss": 0.4927, - "step": 62893 - }, - { - "epoch": 1.61, - "learning_rate": 9.277324857870222e-07, - "loss": 0.7822, - "step": 62894 - }, - { - "epoch": 1.61, - "learning_rate": 9.277048877111506e-07, - "loss": 0.626, - "step": 62895 - }, - { - "epoch": 1.61, - "learning_rate": 9.276772896906325e-07, - "loss": 0.5361, - "step": 62896 - }, - { - "epoch": 1.61, - "learning_rate": 9.276496917254886e-07, - "loss": 0.8057, - "step": 62897 - }, - { - "epoch": 1.61, - "learning_rate": 9.276220938157395e-07, - "loss": 0.6309, - "step": 62898 - }, - { - "epoch": 1.61, - "learning_rate": 9.275944959614072e-07, - "loss": 0.2593, - "step": 62899 - }, - { - "epoch": 1.61, - "learning_rate": 9.275668981625122e-07, - "loss": 0.5708, - "step": 62900 - }, - { - "epoch": 1.61, - "learning_rate": 9.275393004190763e-07, - "loss": 0.6748, - "step": 62901 - }, - { - "epoch": 1.61, - "learning_rate": 9.275117027311198e-07, - "loss": 0.5981, - "step": 62902 - }, - { - "epoch": 1.61, - "learning_rate": 9.274841050986645e-07, - "loss": 0.6196, - "step": 62903 - }, - { - "epoch": 1.61, - "learning_rate": 9.274565075217311e-07, - "loss": 0.7085, - "step": 62904 - }, - { - "epoch": 1.61, - "learning_rate": 9.274289100003411e-07, - "loss": 0.8379, - "step": 62905 - }, - { - "epoch": 1.61, - "learning_rate": 9.274013125345153e-07, - "loss": 0.5479, - "step": 62906 - }, - { - "epoch": 1.61, - "learning_rate": 9.273737151242754e-07, - "loss": 0.5952, - "step": 62907 - }, - { - "epoch": 1.61, - "learning_rate": 9.273461177696418e-07, - "loss": 0.6133, - "step": 62908 - }, - { - "epoch": 1.61, - "learning_rate": 9.27318520470636e-07, - "loss": 0.5339, - "step": 62909 - }, - { - "epoch": 1.61, - "learning_rate": 9.272909232272787e-07, - "loss": 0.5056, - "step": 62910 - }, - { - "epoch": 1.61, - "learning_rate": 9.272633260395919e-07, - "loss": 0.8418, - "step": 62911 - }, - { - "epoch": 1.61, - "learning_rate": 9.272357289075958e-07, - "loss": 0.6807, - "step": 62912 - }, - { - "epoch": 1.61, - "learning_rate": 9.272081318313123e-07, - "loss": 0.624, - "step": 62913 - }, - { - "epoch": 1.61, - "learning_rate": 9.271805348107618e-07, - "loss": 0.686, - "step": 62914 - }, - { - "epoch": 1.61, - "learning_rate": 9.271529378459662e-07, - "loss": 0.7163, - "step": 62915 - }, - { - "epoch": 1.61, - "learning_rate": 9.271253409369459e-07, - "loss": 0.6626, - "step": 62916 - }, - { - "epoch": 1.61, - "learning_rate": 9.27097744083723e-07, - "loss": 0.5771, - "step": 62917 - }, - { - "epoch": 1.61, - "learning_rate": 9.270701472863176e-07, - "loss": 0.7139, - "step": 62918 - }, - { - "epoch": 1.61, - "learning_rate": 9.270425505447511e-07, - "loss": 0.6719, - "step": 62919 - }, - { - "epoch": 1.61, - "learning_rate": 9.270149538590449e-07, - "loss": 0.6992, - "step": 62920 - }, - { - "epoch": 1.61, - "learning_rate": 9.2698735722922e-07, - "loss": 0.6465, - "step": 62921 - }, - { - "epoch": 1.61, - "learning_rate": 9.269597606552974e-07, - "loss": 0.5657, - "step": 62922 - }, - { - "epoch": 1.61, - "learning_rate": 9.269321641372985e-07, - "loss": 0.7202, - "step": 62923 - }, - { - "epoch": 1.61, - "learning_rate": 9.269045676752443e-07, - "loss": 0.5654, - "step": 62924 - }, - { - "epoch": 1.61, - "learning_rate": 9.268769712691557e-07, - "loss": 0.7783, - "step": 62925 - }, - { - "epoch": 1.61, - "learning_rate": 9.268493749190543e-07, - "loss": 0.7412, - "step": 62926 - }, - { - "epoch": 1.61, - "learning_rate": 9.268217786249611e-07, - "loss": 0.6416, - "step": 62927 - }, - { - "epoch": 1.61, - "learning_rate": 9.267941823868969e-07, - "loss": 0.5996, - "step": 62928 - }, - { - "epoch": 1.61, - "learning_rate": 9.267665862048829e-07, - "loss": 0.7783, - "step": 62929 - }, - { - "epoch": 1.61, - "learning_rate": 9.267389900789405e-07, - "loss": 0.6748, - "step": 62930 - }, - { - "epoch": 1.61, - "learning_rate": 9.267113940090905e-07, - "loss": 0.7588, - "step": 62931 - }, - { - "epoch": 1.61, - "learning_rate": 9.266837979953545e-07, - "loss": 0.6836, - "step": 62932 - }, - { - "epoch": 1.61, - "learning_rate": 9.26656202037753e-07, - "loss": 0.5437, - "step": 62933 - }, - { - "epoch": 1.61, - "learning_rate": 9.266286061363078e-07, - "loss": 0.5068, - "step": 62934 - }, - { - "epoch": 1.61, - "learning_rate": 9.266010102910394e-07, - "loss": 0.4402, - "step": 62935 - }, - { - "epoch": 1.61, - "learning_rate": 9.265734145019695e-07, - "loss": 0.5616, - "step": 62936 - }, - { - "epoch": 1.61, - "learning_rate": 9.265458187691191e-07, - "loss": 0.5713, - "step": 62937 - }, - { - "epoch": 1.61, - "learning_rate": 9.265182230925088e-07, - "loss": 0.7217, - "step": 62938 - }, - { - "epoch": 1.61, - "learning_rate": 9.264906274721603e-07, - "loss": 0.8945, - "step": 62939 - }, - { - "epoch": 1.61, - "learning_rate": 9.264630319080945e-07, - "loss": 0.6807, - "step": 62940 - }, - { - "epoch": 1.61, - "learning_rate": 9.264354364003326e-07, - "loss": 0.668, - "step": 62941 - }, - { - "epoch": 1.61, - "learning_rate": 9.264078409488955e-07, - "loss": 0.5361, - "step": 62942 - }, - { - "epoch": 1.61, - "learning_rate": 9.263802455538049e-07, - "loss": 0.7012, - "step": 62943 - }, - { - "epoch": 1.61, - "learning_rate": 9.263526502150813e-07, - "loss": 0.7764, - "step": 62944 - }, - { - "epoch": 1.61, - "learning_rate": 9.263250549327462e-07, - "loss": 0.5166, - "step": 62945 - }, - { - "epoch": 1.61, - "learning_rate": 9.26297459706821e-07, - "loss": 0.6367, - "step": 62946 - }, - { - "epoch": 1.61, - "learning_rate": 9.26269864537326e-07, - "loss": 0.6367, - "step": 62947 - }, - { - "epoch": 1.61, - "learning_rate": 9.262422694242827e-07, - "loss": 0.7236, - "step": 62948 - }, - { - "epoch": 1.61, - "learning_rate": 9.262146743677125e-07, - "loss": 0.75, - "step": 62949 - }, - { - "epoch": 1.61, - "learning_rate": 9.261870793676361e-07, - "loss": 0.6094, - "step": 62950 - }, - { - "epoch": 1.61, - "learning_rate": 9.261594844240751e-07, - "loss": 0.835, - "step": 62951 - }, - { - "epoch": 1.61, - "learning_rate": 9.261318895370501e-07, - "loss": 0.6719, - "step": 62952 - }, - { - "epoch": 1.61, - "learning_rate": 9.261042947065828e-07, - "loss": 0.4995, - "step": 62953 - }, - { - "epoch": 1.61, - "learning_rate": 9.260766999326939e-07, - "loss": 0.7158, - "step": 62954 - }, - { - "epoch": 1.61, - "learning_rate": 9.260491052154048e-07, - "loss": 0.6289, - "step": 62955 - }, - { - "epoch": 1.61, - "learning_rate": 9.260215105547367e-07, - "loss": 0.4543, - "step": 62956 - }, - { - "epoch": 1.61, - "learning_rate": 9.259939159507101e-07, - "loss": 0.359, - "step": 62957 - }, - { - "epoch": 1.61, - "learning_rate": 9.259663214033468e-07, - "loss": 0.5796, - "step": 62958 - }, - { - "epoch": 1.61, - "learning_rate": 9.259387269126675e-07, - "loss": 0.4028, - "step": 62959 - }, - { - "epoch": 1.61, - "learning_rate": 9.259111324786937e-07, - "loss": 0.6938, - "step": 62960 - }, - { - "epoch": 1.61, - "learning_rate": 9.258835381014461e-07, - "loss": 0.6904, - "step": 62961 - }, - { - "epoch": 1.61, - "learning_rate": 9.258559437809462e-07, - "loss": 0.6646, - "step": 62962 - }, - { - "epoch": 1.61, - "learning_rate": 9.258283495172149e-07, - "loss": 0.7744, - "step": 62963 - }, - { - "epoch": 1.61, - "learning_rate": 9.258007553102735e-07, - "loss": 0.668, - "step": 62964 - }, - { - "epoch": 1.61, - "learning_rate": 9.257731611601433e-07, - "loss": 0.6172, - "step": 62965 - }, - { - "epoch": 1.61, - "learning_rate": 9.257455670668453e-07, - "loss": 0.6572, - "step": 62966 - }, - { - "epoch": 1.61, - "learning_rate": 9.257179730303999e-07, - "loss": 0.748, - "step": 62967 - }, - { - "epoch": 1.61, - "learning_rate": 9.256903790508292e-07, - "loss": 0.79, - "step": 62968 - }, - { - "epoch": 1.61, - "learning_rate": 9.256627851281537e-07, - "loss": 0.635, - "step": 62969 - }, - { - "epoch": 1.61, - "learning_rate": 9.256351912623951e-07, - "loss": 0.6279, - "step": 62970 - }, - { - "epoch": 1.61, - "learning_rate": 9.256075974535739e-07, - "loss": 0.7051, - "step": 62971 - }, - { - "epoch": 1.61, - "learning_rate": 9.255800037017117e-07, - "loss": 0.4048, - "step": 62972 - }, - { - "epoch": 1.61, - "learning_rate": 9.255524100068293e-07, - "loss": 0.7134, - "step": 62973 - }, - { - "epoch": 1.61, - "learning_rate": 9.255248163689483e-07, - "loss": 0.7559, - "step": 62974 - }, - { - "epoch": 1.61, - "learning_rate": 9.254972227880893e-07, - "loss": 0.6155, - "step": 62975 - }, - { - "epoch": 1.61, - "learning_rate": 9.25469629264274e-07, - "loss": 0.6934, - "step": 62976 - }, - { - "epoch": 1.61, - "learning_rate": 9.25442035797523e-07, - "loss": 0.5825, - "step": 62977 - }, - { - "epoch": 1.61, - "learning_rate": 9.254144423878574e-07, - "loss": 0.5576, - "step": 62978 - }, - { - "epoch": 1.61, - "learning_rate": 9.253868490352987e-07, - "loss": 0.6973, - "step": 62979 - }, - { - "epoch": 1.61, - "learning_rate": 9.253592557398677e-07, - "loss": 0.7832, - "step": 62980 - }, - { - "epoch": 1.61, - "learning_rate": 9.25331662501586e-07, - "loss": 0.481, - "step": 62981 - }, - { - "epoch": 1.61, - "learning_rate": 9.253040693204741e-07, - "loss": 0.6987, - "step": 62982 - }, - { - "epoch": 1.61, - "learning_rate": 9.252764761965534e-07, - "loss": 0.8145, - "step": 62983 - }, - { - "epoch": 1.61, - "learning_rate": 9.252488831298454e-07, - "loss": 0.5916, - "step": 62984 - }, - { - "epoch": 1.61, - "learning_rate": 9.252212901203706e-07, - "loss": 0.6489, - "step": 62985 - }, - { - "epoch": 1.61, - "learning_rate": 9.251936971681508e-07, - "loss": 0.584, - "step": 62986 - }, - { - "epoch": 1.61, - "learning_rate": 9.251661042732065e-07, - "loss": 0.6641, - "step": 62987 - }, - { - "epoch": 1.61, - "learning_rate": 9.251385114355589e-07, - "loss": 0.564, - "step": 62988 - }, - { - "epoch": 1.61, - "learning_rate": 9.251109186552295e-07, - "loss": 0.6934, - "step": 62989 - }, - { - "epoch": 1.61, - "learning_rate": 9.250833259322391e-07, - "loss": 0.9033, - "step": 62990 - }, - { - "epoch": 1.61, - "learning_rate": 9.250557332666091e-07, - "loss": 0.6904, - "step": 62991 - }, - { - "epoch": 1.61, - "learning_rate": 9.250281406583602e-07, - "loss": 0.6416, - "step": 62992 - }, - { - "epoch": 1.61, - "learning_rate": 9.250005481075141e-07, - "loss": 0.7646, - "step": 62993 - }, - { - "epoch": 1.61, - "learning_rate": 9.249729556140915e-07, - "loss": 0.7515, - "step": 62994 - }, - { - "epoch": 1.61, - "learning_rate": 9.249453631781138e-07, - "loss": 0.6416, - "step": 62995 - }, - { - "epoch": 1.61, - "learning_rate": 9.249177707996021e-07, - "loss": 0.6499, - "step": 62996 - }, - { - "epoch": 1.61, - "learning_rate": 9.248901784785771e-07, - "loss": 0.5967, - "step": 62997 - }, - { - "epoch": 1.61, - "learning_rate": 9.248625862150604e-07, - "loss": 0.7407, - "step": 62998 - }, - { - "epoch": 1.61, - "learning_rate": 9.248349940090727e-07, - "loss": 0.6904, - "step": 62999 - }, - { - "epoch": 1.61, - "learning_rate": 9.248074018606356e-07, - "loss": 0.7148, - "step": 63000 - }, - { - "epoch": 1.61, - "learning_rate": 9.247798097697702e-07, - "loss": 0.606, - "step": 63001 - }, - { - "epoch": 1.61, - "learning_rate": 9.247522177364971e-07, - "loss": 0.6689, - "step": 63002 - }, - { - "epoch": 1.61, - "learning_rate": 9.24724625760838e-07, - "loss": 0.6719, - "step": 63003 - }, - { - "epoch": 1.61, - "learning_rate": 9.246970338428135e-07, - "loss": 0.6641, - "step": 63004 - }, - { - "epoch": 1.61, - "learning_rate": 9.246694419824454e-07, - "loss": 0.666, - "step": 63005 - }, - { - "epoch": 1.61, - "learning_rate": 9.246418501797545e-07, - "loss": 0.5254, - "step": 63006 - }, - { - "epoch": 1.61, - "learning_rate": 9.246142584347615e-07, - "loss": 0.583, - "step": 63007 - }, - { - "epoch": 1.61, - "learning_rate": 9.245866667474881e-07, - "loss": 0.5634, - "step": 63008 - }, - { - "epoch": 1.61, - "learning_rate": 9.24559075117955e-07, - "loss": 0.6753, - "step": 63009 - }, - { - "epoch": 1.61, - "learning_rate": 9.245314835461839e-07, - "loss": 0.6978, - "step": 63010 - }, - { - "epoch": 1.62, - "learning_rate": 9.245038920321951e-07, - "loss": 0.7334, - "step": 63011 - }, - { - "epoch": 1.62, - "learning_rate": 9.244763005760106e-07, - "loss": 0.6738, - "step": 63012 - }, - { - "epoch": 1.62, - "learning_rate": 9.244487091776508e-07, - "loss": 0.7285, - "step": 63013 - }, - { - "epoch": 1.62, - "learning_rate": 9.244211178371375e-07, - "loss": 0.6084, - "step": 63014 - }, - { - "epoch": 1.62, - "learning_rate": 9.243935265544911e-07, - "loss": 0.7275, - "step": 63015 - }, - { - "epoch": 1.62, - "learning_rate": 9.243659353297336e-07, - "loss": 0.6318, - "step": 63016 - }, - { - "epoch": 1.62, - "learning_rate": 9.243383441628854e-07, - "loss": 0.7236, - "step": 63017 - }, - { - "epoch": 1.62, - "learning_rate": 9.24310753053968e-07, - "loss": 0.6582, - "step": 63018 - }, - { - "epoch": 1.62, - "learning_rate": 9.24283162003002e-07, - "loss": 0.7441, - "step": 63019 - }, - { - "epoch": 1.62, - "learning_rate": 9.24255571010009e-07, - "loss": 0.5457, - "step": 63020 - }, - { - "epoch": 1.62, - "learning_rate": 9.242279800750101e-07, - "loss": 0.79, - "step": 63021 - }, - { - "epoch": 1.62, - "learning_rate": 9.242003891980264e-07, - "loss": 0.7207, - "step": 63022 - }, - { - "epoch": 1.62, - "learning_rate": 9.241727983790788e-07, - "loss": 0.5303, - "step": 63023 - }, - { - "epoch": 1.62, - "learning_rate": 9.241452076181888e-07, - "loss": 0.5952, - "step": 63024 - }, - { - "epoch": 1.62, - "learning_rate": 9.241176169153772e-07, - "loss": 0.6094, - "step": 63025 - }, - { - "epoch": 1.62, - "learning_rate": 9.240900262706655e-07, - "loss": 0.6138, - "step": 63026 - }, - { - "epoch": 1.62, - "learning_rate": 9.240624356840745e-07, - "loss": 0.6631, - "step": 63027 - }, - { - "epoch": 1.62, - "learning_rate": 9.240348451556251e-07, - "loss": 0.7373, - "step": 63028 - }, - { - "epoch": 1.62, - "learning_rate": 9.24007254685339e-07, - "loss": 0.6211, - "step": 63029 - }, - { - "epoch": 1.62, - "learning_rate": 9.239796642732368e-07, - "loss": 0.7432, - "step": 63030 - }, - { - "epoch": 1.62, - "learning_rate": 9.239520739193402e-07, - "loss": 0.8301, - "step": 63031 - }, - { - "epoch": 1.62, - "learning_rate": 9.239244836236697e-07, - "loss": 0.8047, - "step": 63032 - }, - { - "epoch": 1.62, - "learning_rate": 9.238968933862468e-07, - "loss": 0.6309, - "step": 63033 - }, - { - "epoch": 1.62, - "learning_rate": 9.238693032070926e-07, - "loss": 0.6626, - "step": 63034 - }, - { - "epoch": 1.62, - "learning_rate": 9.238417130862282e-07, - "loss": 0.5801, - "step": 63035 - }, - { - "epoch": 1.62, - "learning_rate": 9.23814123023675e-07, - "loss": 0.5128, - "step": 63036 - }, - { - "epoch": 1.62, - "learning_rate": 9.237865330194536e-07, - "loss": 0.6538, - "step": 63037 - }, - { - "epoch": 1.62, - "learning_rate": 9.237589430735851e-07, - "loss": 0.6294, - "step": 63038 - }, - { - "epoch": 1.62, - "learning_rate": 9.237313531860911e-07, - "loss": 0.5007, - "step": 63039 - }, - { - "epoch": 1.62, - "learning_rate": 9.237037633569923e-07, - "loss": 0.5439, - "step": 63040 - }, - { - "epoch": 1.62, - "learning_rate": 9.236761735863102e-07, - "loss": 0.5742, - "step": 63041 - }, - { - "epoch": 1.62, - "learning_rate": 9.236485838740656e-07, - "loss": 0.7871, - "step": 63042 - }, - { - "epoch": 1.62, - "learning_rate": 9.2362099422028e-07, - "loss": 0.5112, - "step": 63043 - }, - { - "epoch": 1.62, - "learning_rate": 9.235934046249739e-07, - "loss": 0.3789, - "step": 63044 - }, - { - "epoch": 1.62, - "learning_rate": 9.235658150881692e-07, - "loss": 0.4921, - "step": 63045 - }, - { - "epoch": 1.62, - "learning_rate": 9.235382256098867e-07, - "loss": 0.5559, - "step": 63046 - }, - { - "epoch": 1.62, - "learning_rate": 9.235106361901472e-07, - "loss": 0.5046, - "step": 63047 - }, - { - "epoch": 1.62, - "learning_rate": 9.234830468289722e-07, - "loss": 0.7236, - "step": 63048 - }, - { - "epoch": 1.62, - "learning_rate": 9.234554575263825e-07, - "loss": 0.6548, - "step": 63049 - }, - { - "epoch": 1.62, - "learning_rate": 9.234278682823997e-07, - "loss": 0.5308, - "step": 63050 - }, - { - "epoch": 1.62, - "learning_rate": 9.234002790970444e-07, - "loss": 0.5898, - "step": 63051 - }, - { - "epoch": 1.62, - "learning_rate": 9.233726899703382e-07, - "loss": 0.6582, - "step": 63052 - }, - { - "epoch": 1.62, - "learning_rate": 9.233451009023019e-07, - "loss": 0.8799, - "step": 63053 - }, - { - "epoch": 1.62, - "learning_rate": 9.23317511892957e-07, - "loss": 0.6084, - "step": 63054 - }, - { - "epoch": 1.62, - "learning_rate": 9.232899229423241e-07, - "loss": 0.6768, - "step": 63055 - }, - { - "epoch": 1.62, - "learning_rate": 9.23262334050425e-07, - "loss": 0.7334, - "step": 63056 - }, - { - "epoch": 1.62, - "learning_rate": 9.232347452172799e-07, - "loss": 0.7393, - "step": 63057 - }, - { - "epoch": 1.62, - "learning_rate": 9.232071564429106e-07, - "loss": 0.6758, - "step": 63058 - }, - { - "epoch": 1.62, - "learning_rate": 9.231795677273379e-07, - "loss": 0.5254, - "step": 63059 - }, - { - "epoch": 1.62, - "learning_rate": 9.231519790705831e-07, - "loss": 0.6738, - "step": 63060 - }, - { - "epoch": 1.62, - "learning_rate": 9.231243904726673e-07, - "loss": 0.7305, - "step": 63061 - }, - { - "epoch": 1.62, - "learning_rate": 9.230968019336118e-07, - "loss": 0.7109, - "step": 63062 - }, - { - "epoch": 1.62, - "learning_rate": 9.230692134534372e-07, - "loss": 0.3699, - "step": 63063 - }, - { - "epoch": 1.62, - "learning_rate": 9.230416250321653e-07, - "loss": 0.5045, - "step": 63064 - }, - { - "epoch": 1.62, - "learning_rate": 9.230140366698167e-07, - "loss": 0.4692, - "step": 63065 - }, - { - "epoch": 1.62, - "learning_rate": 9.229864483664132e-07, - "loss": 0.4692, - "step": 63066 - }, - { - "epoch": 1.62, - "learning_rate": 9.22958860121975e-07, - "loss": 0.6001, - "step": 63067 - }, - { - "epoch": 1.62, - "learning_rate": 9.229312719365235e-07, - "loss": 0.7363, - "step": 63068 - }, - { - "epoch": 1.62, - "learning_rate": 9.229036838100803e-07, - "loss": 0.479, - "step": 63069 - }, - { - "epoch": 1.62, - "learning_rate": 9.22876095742666e-07, - "loss": 0.7617, - "step": 63070 - }, - { - "epoch": 1.62, - "learning_rate": 9.22848507734302e-07, - "loss": 0.6401, - "step": 63071 - }, - { - "epoch": 1.62, - "learning_rate": 9.228209197850095e-07, - "loss": 0.7627, - "step": 63072 - }, - { - "epoch": 1.62, - "learning_rate": 9.227933318948092e-07, - "loss": 0.6807, - "step": 63073 - }, - { - "epoch": 1.62, - "learning_rate": 9.227657440637226e-07, - "loss": 0.6597, - "step": 63074 - }, - { - "epoch": 1.62, - "learning_rate": 9.227381562917707e-07, - "loss": 0.6689, - "step": 63075 - }, - { - "epoch": 1.62, - "learning_rate": 9.22710568578975e-07, - "loss": 0.6309, - "step": 63076 - }, - { - "epoch": 1.62, - "learning_rate": 9.22682980925356e-07, - "loss": 0.8418, - "step": 63077 - }, - { - "epoch": 1.62, - "learning_rate": 9.226553933309349e-07, - "loss": 0.5718, - "step": 63078 - }, - { - "epoch": 1.62, - "learning_rate": 9.226278057957333e-07, - "loss": 0.6865, - "step": 63079 - }, - { - "epoch": 1.62, - "learning_rate": 9.226002183197717e-07, - "loss": 0.437, - "step": 63080 - }, - { - "epoch": 1.62, - "learning_rate": 9.225726309030718e-07, - "loss": 0.6191, - "step": 63081 - }, - { - "epoch": 1.62, - "learning_rate": 9.225450435456543e-07, - "loss": 0.7705, - "step": 63082 - }, - { - "epoch": 1.62, - "learning_rate": 9.225174562475406e-07, - "loss": 0.4085, - "step": 63083 - }, - { - "epoch": 1.62, - "learning_rate": 9.224898690087516e-07, - "loss": 0.6333, - "step": 63084 - }, - { - "epoch": 1.62, - "learning_rate": 9.224622818293087e-07, - "loss": 0.6455, - "step": 63085 - }, - { - "epoch": 1.62, - "learning_rate": 9.224346947092332e-07, - "loss": 0.6572, - "step": 63086 - }, - { - "epoch": 1.62, - "learning_rate": 9.224071076485454e-07, - "loss": 0.6108, - "step": 63087 - }, - { - "epoch": 1.62, - "learning_rate": 9.223795206472671e-07, - "loss": 0.7158, - "step": 63088 - }, - { - "epoch": 1.62, - "learning_rate": 9.223519337054191e-07, - "loss": 0.4478, - "step": 63089 - }, - { - "epoch": 1.62, - "learning_rate": 9.223243468230227e-07, - "loss": 0.4315, - "step": 63090 - }, - { - "epoch": 1.62, - "learning_rate": 9.22296760000099e-07, - "loss": 0.6646, - "step": 63091 - }, - { - "epoch": 1.62, - "learning_rate": 9.222691732366691e-07, - "loss": 0.5991, - "step": 63092 - }, - { - "epoch": 1.62, - "learning_rate": 9.222415865327542e-07, - "loss": 0.6348, - "step": 63093 - }, - { - "epoch": 1.62, - "learning_rate": 9.222139998883751e-07, - "loss": 0.5974, - "step": 63094 - }, - { - "epoch": 1.62, - "learning_rate": 9.221864133035534e-07, - "loss": 0.5981, - "step": 63095 - }, - { - "epoch": 1.62, - "learning_rate": 9.221588267783102e-07, - "loss": 0.6865, - "step": 63096 - }, - { - "epoch": 1.62, - "learning_rate": 9.22131240312666e-07, - "loss": 0.6123, - "step": 63097 - }, - { - "epoch": 1.62, - "learning_rate": 9.221036539066425e-07, - "loss": 0.7188, - "step": 63098 - }, - { - "epoch": 1.62, - "learning_rate": 9.220760675602603e-07, - "loss": 0.6738, - "step": 63099 - }, - { - "epoch": 1.62, - "learning_rate": 9.220484812735414e-07, - "loss": 0.5415, - "step": 63100 - }, - { - "epoch": 1.62, - "learning_rate": 9.220208950465059e-07, - "loss": 0.6875, - "step": 63101 - }, - { - "epoch": 1.62, - "learning_rate": 9.219933088791758e-07, - "loss": 0.5979, - "step": 63102 - }, - { - "epoch": 1.62, - "learning_rate": 9.219657227715716e-07, - "loss": 0.5676, - "step": 63103 - }, - { - "epoch": 1.62, - "learning_rate": 9.219381367237148e-07, - "loss": 0.6543, - "step": 63104 - }, - { - "epoch": 1.62, - "learning_rate": 9.219105507356262e-07, - "loss": 0.5234, - "step": 63105 - }, - { - "epoch": 1.62, - "learning_rate": 9.218829648073275e-07, - "loss": 0.3706, - "step": 63106 - }, - { - "epoch": 1.62, - "learning_rate": 9.218553789388394e-07, - "loss": 0.71, - "step": 63107 - }, - { - "epoch": 1.62, - "learning_rate": 9.218277931301827e-07, - "loss": 0.3783, - "step": 63108 - }, - { - "epoch": 1.62, - "learning_rate": 9.218002073813789e-07, - "loss": 0.5596, - "step": 63109 - }, - { - "epoch": 1.62, - "learning_rate": 9.217726216924493e-07, - "loss": 0.6514, - "step": 63110 - }, - { - "epoch": 1.62, - "learning_rate": 9.217450360634145e-07, - "loss": 0.6455, - "step": 63111 - }, - { - "epoch": 1.62, - "learning_rate": 9.217174504942961e-07, - "loss": 0.6115, - "step": 63112 - }, - { - "epoch": 1.62, - "learning_rate": 9.216898649851151e-07, - "loss": 0.7754, - "step": 63113 - }, - { - "epoch": 1.62, - "learning_rate": 9.216622795358925e-07, - "loss": 0.6655, - "step": 63114 - }, - { - "epoch": 1.62, - "learning_rate": 9.216346941466493e-07, - "loss": 0.606, - "step": 63115 - }, - { - "epoch": 1.62, - "learning_rate": 9.216071088174073e-07, - "loss": 0.5518, - "step": 63116 - }, - { - "epoch": 1.62, - "learning_rate": 9.215795235481871e-07, - "loss": 0.6084, - "step": 63117 - }, - { - "epoch": 1.62, - "learning_rate": 9.215519383390093e-07, - "loss": 0.6787, - "step": 63118 - }, - { - "epoch": 1.62, - "learning_rate": 9.215243531898959e-07, - "loss": 0.7266, - "step": 63119 - }, - { - "epoch": 1.62, - "learning_rate": 9.214967681008677e-07, - "loss": 0.7832, - "step": 63120 - }, - { - "epoch": 1.62, - "learning_rate": 9.214691830719457e-07, - "loss": 0.8086, - "step": 63121 - }, - { - "epoch": 1.62, - "learning_rate": 9.214415981031511e-07, - "loss": 0.4722, - "step": 63122 - }, - { - "epoch": 1.62, - "learning_rate": 9.214140131945053e-07, - "loss": 0.6797, - "step": 63123 - }, - { - "epoch": 1.62, - "learning_rate": 9.213864283460288e-07, - "loss": 0.7646, - "step": 63124 - }, - { - "epoch": 1.62, - "learning_rate": 9.213588435577435e-07, - "loss": 0.5674, - "step": 63125 - }, - { - "epoch": 1.62, - "learning_rate": 9.213312588296703e-07, - "loss": 0.8311, - "step": 63126 - }, - { - "epoch": 1.62, - "learning_rate": 9.213036741618298e-07, - "loss": 1.0, - "step": 63127 - }, - { - "epoch": 1.62, - "learning_rate": 9.212760895542434e-07, - "loss": 0.6826, - "step": 63128 - }, - { - "epoch": 1.62, - "learning_rate": 9.212485050069324e-07, - "loss": 0.4392, - "step": 63129 - }, - { - "epoch": 1.62, - "learning_rate": 9.212209205199177e-07, - "loss": 0.6387, - "step": 63130 - }, - { - "epoch": 1.62, - "learning_rate": 9.211933360932206e-07, - "loss": 0.5635, - "step": 63131 - }, - { - "epoch": 1.62, - "learning_rate": 9.21165751726862e-07, - "loss": 0.5898, - "step": 63132 - }, - { - "epoch": 1.62, - "learning_rate": 9.211381674208633e-07, - "loss": 0.6699, - "step": 63133 - }, - { - "epoch": 1.62, - "learning_rate": 9.211105831752453e-07, - "loss": 0.3584, - "step": 63134 - }, - { - "epoch": 1.62, - "learning_rate": 9.210829989900295e-07, - "loss": 0.6211, - "step": 63135 - }, - { - "epoch": 1.62, - "learning_rate": 9.21055414865237e-07, - "loss": 0.585, - "step": 63136 - }, - { - "epoch": 1.62, - "learning_rate": 9.210278308008883e-07, - "loss": 0.6548, - "step": 63137 - }, - { - "epoch": 1.62, - "learning_rate": 9.210002467970053e-07, - "loss": 0.7471, - "step": 63138 - }, - { - "epoch": 1.62, - "learning_rate": 9.209726628536086e-07, - "loss": 0.6396, - "step": 63139 - }, - { - "epoch": 1.62, - "learning_rate": 9.209450789707195e-07, - "loss": 0.6279, - "step": 63140 - }, - { - "epoch": 1.62, - "learning_rate": 9.209174951483591e-07, - "loss": 0.7402, - "step": 63141 - }, - { - "epoch": 1.62, - "learning_rate": 9.208899113865485e-07, - "loss": 0.5732, - "step": 63142 - }, - { - "epoch": 1.62, - "learning_rate": 9.208623276853088e-07, - "loss": 0.6865, - "step": 63143 - }, - { - "epoch": 1.62, - "learning_rate": 9.208347440446615e-07, - "loss": 0.6482, - "step": 63144 - }, - { - "epoch": 1.62, - "learning_rate": 9.208071604646273e-07, - "loss": 0.7695, - "step": 63145 - }, - { - "epoch": 1.62, - "learning_rate": 9.207795769452275e-07, - "loss": 0.5576, - "step": 63146 - }, - { - "epoch": 1.62, - "learning_rate": 9.20751993486483e-07, - "loss": 0.79, - "step": 63147 - }, - { - "epoch": 1.62, - "learning_rate": 9.20724410088415e-07, - "loss": 0.571, - "step": 63148 - }, - { - "epoch": 1.62, - "learning_rate": 9.206968267510446e-07, - "loss": 0.6431, - "step": 63149 - }, - { - "epoch": 1.62, - "learning_rate": 9.206692434743931e-07, - "loss": 0.728, - "step": 63150 - }, - { - "epoch": 1.62, - "learning_rate": 9.206416602584814e-07, - "loss": 0.7646, - "step": 63151 - }, - { - "epoch": 1.62, - "learning_rate": 9.206140771033309e-07, - "loss": 0.6768, - "step": 63152 - }, - { - "epoch": 1.62, - "learning_rate": 9.205864940089623e-07, - "loss": 0.6479, - "step": 63153 - }, - { - "epoch": 1.62, - "learning_rate": 9.205589109753972e-07, - "loss": 0.7578, - "step": 63154 - }, - { - "epoch": 1.62, - "learning_rate": 9.205313280026563e-07, - "loss": 0.6465, - "step": 63155 - }, - { - "epoch": 1.62, - "learning_rate": 9.205037450907613e-07, - "loss": 0.6592, - "step": 63156 - }, - { - "epoch": 1.62, - "learning_rate": 9.204761622397328e-07, - "loss": 0.5596, - "step": 63157 - }, - { - "epoch": 1.62, - "learning_rate": 9.204485794495919e-07, - "loss": 0.6475, - "step": 63158 - }, - { - "epoch": 1.62, - "learning_rate": 9.204209967203599e-07, - "loss": 0.6914, - "step": 63159 - }, - { - "epoch": 1.62, - "learning_rate": 9.203934140520577e-07, - "loss": 0.8281, - "step": 63160 - }, - { - "epoch": 1.62, - "learning_rate": 9.20365831444707e-07, - "loss": 0.4509, - "step": 63161 - }, - { - "epoch": 1.62, - "learning_rate": 9.20338248898328e-07, - "loss": 0.6211, - "step": 63162 - }, - { - "epoch": 1.62, - "learning_rate": 9.203106664129428e-07, - "loss": 0.6787, - "step": 63163 - }, - { - "epoch": 1.62, - "learning_rate": 9.202830839885719e-07, - "loss": 0.7021, - "step": 63164 - }, - { - "epoch": 1.62, - "learning_rate": 9.202555016252365e-07, - "loss": 0.5879, - "step": 63165 - }, - { - "epoch": 1.62, - "learning_rate": 9.20227919322958e-07, - "loss": 0.7456, - "step": 63166 - }, - { - "epoch": 1.62, - "learning_rate": 9.202003370817574e-07, - "loss": 0.543, - "step": 63167 - }, - { - "epoch": 1.62, - "learning_rate": 9.201727549016554e-07, - "loss": 0.5957, - "step": 63168 - }, - { - "epoch": 1.62, - "learning_rate": 9.201451727826735e-07, - "loss": 0.5046, - "step": 63169 - }, - { - "epoch": 1.62, - "learning_rate": 9.201175907248327e-07, - "loss": 0.6199, - "step": 63170 - }, - { - "epoch": 1.62, - "learning_rate": 9.200900087281545e-07, - "loss": 0.5623, - "step": 63171 - }, - { - "epoch": 1.62, - "learning_rate": 9.200624267926593e-07, - "loss": 0.5432, - "step": 63172 - }, - { - "epoch": 1.62, - "learning_rate": 9.200348449183691e-07, - "loss": 0.7344, - "step": 63173 - }, - { - "epoch": 1.62, - "learning_rate": 9.20007263105304e-07, - "loss": 0.6689, - "step": 63174 - }, - { - "epoch": 1.62, - "learning_rate": 9.19979681353486e-07, - "loss": 0.752, - "step": 63175 - }, - { - "epoch": 1.62, - "learning_rate": 9.199520996629362e-07, - "loss": 0.624, - "step": 63176 - }, - { - "epoch": 1.62, - "learning_rate": 9.199245180336748e-07, - "loss": 0.5308, - "step": 63177 - }, - { - "epoch": 1.62, - "learning_rate": 9.198969364657239e-07, - "loss": 0.7139, - "step": 63178 - }, - { - "epoch": 1.62, - "learning_rate": 9.198693549591039e-07, - "loss": 0.6016, - "step": 63179 - }, - { - "epoch": 1.62, - "learning_rate": 9.198417735138365e-07, - "loss": 0.6274, - "step": 63180 - }, - { - "epoch": 1.62, - "learning_rate": 9.198141921299426e-07, - "loss": 0.6953, - "step": 63181 - }, - { - "epoch": 1.62, - "learning_rate": 9.19786610807443e-07, - "loss": 0.4951, - "step": 63182 - }, - { - "epoch": 1.62, - "learning_rate": 9.197590295463594e-07, - "loss": 0.6475, - "step": 63183 - }, - { - "epoch": 1.62, - "learning_rate": 9.197314483467124e-07, - "loss": 0.7158, - "step": 63184 - }, - { - "epoch": 1.62, - "learning_rate": 9.197038672085235e-07, - "loss": 0.918, - "step": 63185 - }, - { - "epoch": 1.62, - "learning_rate": 9.196762861318139e-07, - "loss": 0.6885, - "step": 63186 - }, - { - "epoch": 1.62, - "learning_rate": 9.196487051166041e-07, - "loss": 0.4902, - "step": 63187 - }, - { - "epoch": 1.62, - "learning_rate": 9.196211241629157e-07, - "loss": 0.7686, - "step": 63188 - }, - { - "epoch": 1.62, - "learning_rate": 9.195935432707696e-07, - "loss": 0.6002, - "step": 63189 - }, - { - "epoch": 1.62, - "learning_rate": 9.195659624401872e-07, - "loss": 0.6611, - "step": 63190 - }, - { - "epoch": 1.62, - "learning_rate": 9.195383816711892e-07, - "loss": 0.5886, - "step": 63191 - }, - { - "epoch": 1.62, - "learning_rate": 9.195108009637971e-07, - "loss": 0.6904, - "step": 63192 - }, - { - "epoch": 1.62, - "learning_rate": 9.194832203180317e-07, - "loss": 0.7285, - "step": 63193 - }, - { - "epoch": 1.62, - "learning_rate": 9.194556397339146e-07, - "loss": 0.6758, - "step": 63194 - }, - { - "epoch": 1.62, - "learning_rate": 9.194280592114664e-07, - "loss": 0.7139, - "step": 63195 - }, - { - "epoch": 1.62, - "learning_rate": 9.194004787507088e-07, - "loss": 0.5449, - "step": 63196 - }, - { - "epoch": 1.62, - "learning_rate": 9.193728983516623e-07, - "loss": 0.6963, - "step": 63197 - }, - { - "epoch": 1.62, - "learning_rate": 9.193453180143483e-07, - "loss": 0.646, - "step": 63198 - }, - { - "epoch": 1.62, - "learning_rate": 9.193177377387877e-07, - "loss": 0.6787, - "step": 63199 - }, - { - "epoch": 1.62, - "learning_rate": 9.19290157525002e-07, - "loss": 0.7256, - "step": 63200 - }, - { - "epoch": 1.62, - "learning_rate": 9.192625773730119e-07, - "loss": 0.6396, - "step": 63201 - }, - { - "epoch": 1.62, - "learning_rate": 9.192349972828389e-07, - "loss": 0.5254, - "step": 63202 - }, - { - "epoch": 1.62, - "learning_rate": 9.192074172545039e-07, - "loss": 0.6787, - "step": 63203 - }, - { - "epoch": 1.62, - "learning_rate": 9.191798372880281e-07, - "loss": 0.6934, - "step": 63204 - }, - { - "epoch": 1.62, - "learning_rate": 9.191522573834324e-07, - "loss": 0.6377, - "step": 63205 - }, - { - "epoch": 1.62, - "learning_rate": 9.191246775407386e-07, - "loss": 0.7139, - "step": 63206 - }, - { - "epoch": 1.62, - "learning_rate": 9.19097097759967e-07, - "loss": 0.5137, - "step": 63207 - }, - { - "epoch": 1.62, - "learning_rate": 9.19069518041139e-07, - "loss": 0.7227, - "step": 63208 - }, - { - "epoch": 1.62, - "learning_rate": 9.190419383842758e-07, - "loss": 0.5347, - "step": 63209 - }, - { - "epoch": 1.62, - "learning_rate": 9.190143587893983e-07, - "loss": 0.5488, - "step": 63210 - }, - { - "epoch": 1.62, - "learning_rate": 9.189867792565279e-07, - "loss": 0.6201, - "step": 63211 - }, - { - "epoch": 1.62, - "learning_rate": 9.189591997856854e-07, - "loss": 0.564, - "step": 63212 - }, - { - "epoch": 1.62, - "learning_rate": 9.189316203768924e-07, - "loss": 0.6343, - "step": 63213 - }, - { - "epoch": 1.62, - "learning_rate": 9.189040410301696e-07, - "loss": 0.6045, - "step": 63214 - }, - { - "epoch": 1.62, - "learning_rate": 9.188764617455383e-07, - "loss": 0.4961, - "step": 63215 - }, - { - "epoch": 1.62, - "learning_rate": 9.188488825230199e-07, - "loss": 0.8291, - "step": 63216 - }, - { - "epoch": 1.62, - "learning_rate": 9.18821303362635e-07, - "loss": 0.5664, - "step": 63217 - }, - { - "epoch": 1.62, - "learning_rate": 9.187937242644045e-07, - "loss": 0.6812, - "step": 63218 - }, - { - "epoch": 1.62, - "learning_rate": 9.187661452283502e-07, - "loss": 0.4111, - "step": 63219 - }, - { - "epoch": 1.62, - "learning_rate": 9.187385662544928e-07, - "loss": 0.5933, - "step": 63220 - }, - { - "epoch": 1.62, - "learning_rate": 9.187109873428537e-07, - "loss": 0.6055, - "step": 63221 - }, - { - "epoch": 1.62, - "learning_rate": 9.186834084934536e-07, - "loss": 0.6504, - "step": 63222 - }, - { - "epoch": 1.62, - "learning_rate": 9.186558297063142e-07, - "loss": 0.6436, - "step": 63223 - }, - { - "epoch": 1.62, - "learning_rate": 9.186282509814559e-07, - "loss": 0.7246, - "step": 63224 - }, - { - "epoch": 1.62, - "learning_rate": 9.186006723189006e-07, - "loss": 0.4796, - "step": 63225 - }, - { - "epoch": 1.62, - "learning_rate": 9.185730937186691e-07, - "loss": 0.5303, - "step": 63226 - }, - { - "epoch": 1.62, - "learning_rate": 9.18545515180782e-07, - "loss": 0.6116, - "step": 63227 - }, - { - "epoch": 1.62, - "learning_rate": 9.185179367052613e-07, - "loss": 0.5449, - "step": 63228 - }, - { - "epoch": 1.62, - "learning_rate": 9.184903582921272e-07, - "loss": 0.6802, - "step": 63229 - }, - { - "epoch": 1.62, - "learning_rate": 9.184627799414017e-07, - "loss": 0.6465, - "step": 63230 - }, - { - "epoch": 1.62, - "learning_rate": 9.18435201653105e-07, - "loss": 0.5786, - "step": 63231 - }, - { - "epoch": 1.62, - "learning_rate": 9.184076234272592e-07, - "loss": 0.7676, - "step": 63232 - }, - { - "epoch": 1.62, - "learning_rate": 9.183800452638845e-07, - "loss": 0.6865, - "step": 63233 - }, - { - "epoch": 1.62, - "learning_rate": 9.183524671630029e-07, - "loss": 0.6016, - "step": 63234 - }, - { - "epoch": 1.62, - "learning_rate": 9.183248891246349e-07, - "loss": 0.4863, - "step": 63235 - }, - { - "epoch": 1.62, - "learning_rate": 9.182973111488021e-07, - "loss": 0.6689, - "step": 63236 - }, - { - "epoch": 1.62, - "learning_rate": 9.182697332355248e-07, - "loss": 0.589, - "step": 63237 - }, - { - "epoch": 1.62, - "learning_rate": 9.182421553848248e-07, - "loss": 0.3691, - "step": 63238 - }, - { - "epoch": 1.62, - "learning_rate": 9.182145775967228e-07, - "loss": 0.7217, - "step": 63239 - }, - { - "epoch": 1.62, - "learning_rate": 9.181869998712404e-07, - "loss": 0.6416, - "step": 63240 - }, - { - "epoch": 1.62, - "learning_rate": 9.181594222083983e-07, - "loss": 0.8184, - "step": 63241 - }, - { - "epoch": 1.62, - "learning_rate": 9.181318446082178e-07, - "loss": 0.6069, - "step": 63242 - }, - { - "epoch": 1.62, - "learning_rate": 9.1810426707072e-07, - "loss": 0.6758, - "step": 63243 - }, - { - "epoch": 1.62, - "learning_rate": 9.18076689595926e-07, - "loss": 0.4662, - "step": 63244 - }, - { - "epoch": 1.62, - "learning_rate": 9.180491121838572e-07, - "loss": 0.6992, - "step": 63245 - }, - { - "epoch": 1.62, - "learning_rate": 9.18021534834534e-07, - "loss": 0.709, - "step": 63246 - }, - { - "epoch": 1.62, - "learning_rate": 9.179939575479782e-07, - "loss": 0.8076, - "step": 63247 - }, - { - "epoch": 1.62, - "learning_rate": 9.179663803242104e-07, - "loss": 0.6108, - "step": 63248 - }, - { - "epoch": 1.62, - "learning_rate": 9.179388031632522e-07, - "loss": 0.6357, - "step": 63249 - }, - { - "epoch": 1.62, - "learning_rate": 9.179112260651242e-07, - "loss": 0.6255, - "step": 63250 - }, - { - "epoch": 1.62, - "learning_rate": 9.178836490298481e-07, - "loss": 0.6475, - "step": 63251 - }, - { - "epoch": 1.62, - "learning_rate": 9.178560720574444e-07, - "loss": 0.6255, - "step": 63252 - }, - { - "epoch": 1.62, - "learning_rate": 9.178284951479349e-07, - "loss": 0.6006, - "step": 63253 - }, - { - "epoch": 1.62, - "learning_rate": 9.178009183013402e-07, - "loss": 0.5796, - "step": 63254 - }, - { - "epoch": 1.62, - "learning_rate": 9.17773341517682e-07, - "loss": 0.6914, - "step": 63255 - }, - { - "epoch": 1.62, - "learning_rate": 9.177457647969803e-07, - "loss": 0.6191, - "step": 63256 - }, - { - "epoch": 1.62, - "learning_rate": 9.177181881392571e-07, - "loss": 0.7212, - "step": 63257 - }, - { - "epoch": 1.62, - "learning_rate": 9.176906115445332e-07, - "loss": 0.5073, - "step": 63258 - }, - { - "epoch": 1.62, - "learning_rate": 9.1766303501283e-07, - "loss": 0.5996, - "step": 63259 - }, - { - "epoch": 1.62, - "learning_rate": 9.176354585441682e-07, - "loss": 0.7373, - "step": 63260 - }, - { - "epoch": 1.62, - "learning_rate": 9.176078821385693e-07, - "loss": 0.6943, - "step": 63261 - }, - { - "epoch": 1.62, - "learning_rate": 9.175803057960541e-07, - "loss": 0.6538, - "step": 63262 - }, - { - "epoch": 1.62, - "learning_rate": 9.175527295166441e-07, - "loss": 0.7617, - "step": 63263 - }, - { - "epoch": 1.62, - "learning_rate": 9.1752515330036e-07, - "loss": 0.5801, - "step": 63264 - }, - { - "epoch": 1.62, - "learning_rate": 9.174975771472234e-07, - "loss": 0.7422, - "step": 63265 - }, - { - "epoch": 1.62, - "learning_rate": 9.17470001057255e-07, - "loss": 0.5435, - "step": 63266 - }, - { - "epoch": 1.62, - "learning_rate": 9.174424250304758e-07, - "loss": 0.6016, - "step": 63267 - }, - { - "epoch": 1.62, - "learning_rate": 9.174148490669073e-07, - "loss": 0.6396, - "step": 63268 - }, - { - "epoch": 1.62, - "learning_rate": 9.173872731665703e-07, - "loss": 0.7471, - "step": 63269 - }, - { - "epoch": 1.62, - "learning_rate": 9.173596973294863e-07, - "loss": 0.4133, - "step": 63270 - }, - { - "epoch": 1.62, - "learning_rate": 9.173321215556761e-07, - "loss": 0.7256, - "step": 63271 - }, - { - "epoch": 1.62, - "learning_rate": 9.173045458451608e-07, - "loss": 0.6655, - "step": 63272 - }, - { - "epoch": 1.62, - "learning_rate": 9.172769701979616e-07, - "loss": 0.6836, - "step": 63273 - }, - { - "epoch": 1.62, - "learning_rate": 9.172493946140995e-07, - "loss": 0.7295, - "step": 63274 - }, - { - "epoch": 1.62, - "learning_rate": 9.172218190935963e-07, - "loss": 0.5166, - "step": 63275 - }, - { - "epoch": 1.62, - "learning_rate": 9.171942436364723e-07, - "loss": 0.4756, - "step": 63276 - }, - { - "epoch": 1.62, - "learning_rate": 9.171666682427486e-07, - "loss": 0.6255, - "step": 63277 - }, - { - "epoch": 1.62, - "learning_rate": 9.171390929124468e-07, - "loss": 0.7314, - "step": 63278 - }, - { - "epoch": 1.62, - "learning_rate": 9.171115176455875e-07, - "loss": 0.6108, - "step": 63279 - }, - { - "epoch": 1.62, - "learning_rate": 9.170839424421923e-07, - "loss": 0.6099, - "step": 63280 - }, - { - "epoch": 1.62, - "learning_rate": 9.17056367302282e-07, - "loss": 0.522, - "step": 63281 - }, - { - "epoch": 1.62, - "learning_rate": 9.170287922258781e-07, - "loss": 0.5967, - "step": 63282 - }, - { - "epoch": 1.62, - "learning_rate": 9.170012172130011e-07, - "loss": 0.7871, - "step": 63283 - }, - { - "epoch": 1.62, - "learning_rate": 9.169736422636725e-07, - "loss": 0.6313, - "step": 63284 - }, - { - "epoch": 1.62, - "learning_rate": 9.169460673779139e-07, - "loss": 0.5791, - "step": 63285 - }, - { - "epoch": 1.62, - "learning_rate": 9.169184925557453e-07, - "loss": 0.5885, - "step": 63286 - }, - { - "epoch": 1.62, - "learning_rate": 9.168909177971886e-07, - "loss": 0.5977, - "step": 63287 - }, - { - "epoch": 1.62, - "learning_rate": 9.168633431022648e-07, - "loss": 0.5537, - "step": 63288 - }, - { - "epoch": 1.62, - "learning_rate": 9.168357684709946e-07, - "loss": 0.7217, - "step": 63289 - }, - { - "epoch": 1.62, - "learning_rate": 9.168081939033996e-07, - "loss": 0.6191, - "step": 63290 - }, - { - "epoch": 1.62, - "learning_rate": 9.167806193995006e-07, - "loss": 0.5798, - "step": 63291 - }, - { - "epoch": 1.62, - "learning_rate": 9.16753044959319e-07, - "loss": 0.834, - "step": 63292 - }, - { - "epoch": 1.62, - "learning_rate": 9.167254705828758e-07, - "loss": 0.6582, - "step": 63293 - }, - { - "epoch": 1.62, - "learning_rate": 9.16697896270192e-07, - "loss": 0.7666, - "step": 63294 - }, - { - "epoch": 1.62, - "learning_rate": 9.166703220212892e-07, - "loss": 0.6328, - "step": 63295 - }, - { - "epoch": 1.62, - "learning_rate": 9.166427478361875e-07, - "loss": 0.554, - "step": 63296 - }, - { - "epoch": 1.62, - "learning_rate": 9.16615173714909e-07, - "loss": 0.5942, - "step": 63297 - }, - { - "epoch": 1.62, - "learning_rate": 9.16587599657474e-07, - "loss": 0.7236, - "step": 63298 - }, - { - "epoch": 1.62, - "learning_rate": 9.165600256639044e-07, - "loss": 0.6475, - "step": 63299 - }, - { - "epoch": 1.62, - "learning_rate": 9.165324517342208e-07, - "loss": 0.6621, - "step": 63300 - }, - { - "epoch": 1.62, - "learning_rate": 9.165048778684445e-07, - "loss": 0.5791, - "step": 63301 - }, - { - "epoch": 1.62, - "learning_rate": 9.164773040665966e-07, - "loss": 0.644, - "step": 63302 - }, - { - "epoch": 1.62, - "learning_rate": 9.164497303286981e-07, - "loss": 0.6943, - "step": 63303 - }, - { - "epoch": 1.62, - "learning_rate": 9.164221566547702e-07, - "loss": 0.7227, - "step": 63304 - }, - { - "epoch": 1.62, - "learning_rate": 9.163945830448346e-07, - "loss": 0.5947, - "step": 63305 - }, - { - "epoch": 1.62, - "learning_rate": 9.163670094989112e-07, - "loss": 0.6543, - "step": 63306 - }, - { - "epoch": 1.62, - "learning_rate": 9.163394360170219e-07, - "loss": 0.6113, - "step": 63307 - }, - { - "epoch": 1.62, - "learning_rate": 9.163118625991875e-07, - "loss": 0.5557, - "step": 63308 - }, - { - "epoch": 1.62, - "learning_rate": 9.162842892454295e-07, - "loss": 0.6301, - "step": 63309 - }, - { - "epoch": 1.62, - "learning_rate": 9.162567159557684e-07, - "loss": 0.7549, - "step": 63310 - }, - { - "epoch": 1.62, - "learning_rate": 9.16229142730226e-07, - "loss": 0.6934, - "step": 63311 - }, - { - "epoch": 1.62, - "learning_rate": 9.162015695688228e-07, - "loss": 0.5815, - "step": 63312 - }, - { - "epoch": 1.62, - "learning_rate": 9.161739964715805e-07, - "loss": 0.6284, - "step": 63313 - }, - { - "epoch": 1.62, - "learning_rate": 9.161464234385197e-07, - "loss": 0.7266, - "step": 63314 - }, - { - "epoch": 1.62, - "learning_rate": 9.161188504696622e-07, - "loss": 0.7256, - "step": 63315 - }, - { - "epoch": 1.62, - "learning_rate": 9.160912775650284e-07, - "loss": 0.6108, - "step": 63316 - }, - { - "epoch": 1.62, - "learning_rate": 9.160637047246394e-07, - "loss": 0.6592, - "step": 63317 - }, - { - "epoch": 1.62, - "learning_rate": 9.160361319485167e-07, - "loss": 0.6641, - "step": 63318 - }, - { - "epoch": 1.62, - "learning_rate": 9.160085592366811e-07, - "loss": 0.728, - "step": 63319 - }, - { - "epoch": 1.62, - "learning_rate": 9.159809865891542e-07, - "loss": 0.5393, - "step": 63320 - }, - { - "epoch": 1.62, - "learning_rate": 9.159534140059565e-07, - "loss": 0.5809, - "step": 63321 - }, - { - "epoch": 1.62, - "learning_rate": 9.159258414871096e-07, - "loss": 0.5581, - "step": 63322 - }, - { - "epoch": 1.62, - "learning_rate": 9.158982690326343e-07, - "loss": 0.5393, - "step": 63323 - }, - { - "epoch": 1.62, - "learning_rate": 9.15870696642552e-07, - "loss": 0.6143, - "step": 63324 - }, - { - "epoch": 1.62, - "learning_rate": 9.158431243168838e-07, - "loss": 0.6279, - "step": 63325 - }, - { - "epoch": 1.62, - "learning_rate": 9.158155520556506e-07, - "loss": 0.709, - "step": 63326 - }, - { - "epoch": 1.62, - "learning_rate": 9.157879798588731e-07, - "loss": 0.5687, - "step": 63327 - }, - { - "epoch": 1.62, - "learning_rate": 9.157604077265733e-07, - "loss": 0.71, - "step": 63328 - }, - { - "epoch": 1.62, - "learning_rate": 9.157328356587715e-07, - "loss": 0.423, - "step": 63329 - }, - { - "epoch": 1.62, - "learning_rate": 9.157052636554895e-07, - "loss": 0.6772, - "step": 63330 - }, - { - "epoch": 1.62, - "learning_rate": 9.156776917167479e-07, - "loss": 0.7695, - "step": 63331 - }, - { - "epoch": 1.62, - "learning_rate": 9.156501198425681e-07, - "loss": 0.5206, - "step": 63332 - }, - { - "epoch": 1.62, - "learning_rate": 9.156225480329711e-07, - "loss": 0.7744, - "step": 63333 - }, - { - "epoch": 1.62, - "learning_rate": 9.155949762879781e-07, - "loss": 0.749, - "step": 63334 - }, - { - "epoch": 1.62, - "learning_rate": 9.155674046076105e-07, - "loss": 0.6992, - "step": 63335 - }, - { - "epoch": 1.62, - "learning_rate": 9.155398329918885e-07, - "loss": 0.5908, - "step": 63336 - }, - { - "epoch": 1.62, - "learning_rate": 9.15512261440834e-07, - "loss": 0.6553, - "step": 63337 - }, - { - "epoch": 1.62, - "learning_rate": 9.154846899544678e-07, - "loss": 0.583, - "step": 63338 - }, - { - "epoch": 1.62, - "learning_rate": 9.154571185328112e-07, - "loss": 0.7939, - "step": 63339 - }, - { - "epoch": 1.62, - "learning_rate": 9.154295471758849e-07, - "loss": 0.7061, - "step": 63340 - }, - { - "epoch": 1.62, - "learning_rate": 9.154019758837106e-07, - "loss": 0.6084, - "step": 63341 - }, - { - "epoch": 1.62, - "learning_rate": 9.153744046563089e-07, - "loss": 0.5168, - "step": 63342 - }, - { - "epoch": 1.62, - "learning_rate": 9.153468334937013e-07, - "loss": 0.6758, - "step": 63343 - }, - { - "epoch": 1.62, - "learning_rate": 9.153192623959089e-07, - "loss": 0.5801, - "step": 63344 - }, - { - "epoch": 1.62, - "learning_rate": 9.152916913629527e-07, - "loss": 0.5552, - "step": 63345 - }, - { - "epoch": 1.62, - "learning_rate": 9.152641203948533e-07, - "loss": 0.6553, - "step": 63346 - }, - { - "epoch": 1.62, - "learning_rate": 9.152365494916325e-07, - "loss": 0.5718, - "step": 63347 - }, - { - "epoch": 1.62, - "learning_rate": 9.15208978653311e-07, - "loss": 0.6799, - "step": 63348 - }, - { - "epoch": 1.62, - "learning_rate": 9.151814078799104e-07, - "loss": 0.6089, - "step": 63349 - }, - { - "epoch": 1.62, - "learning_rate": 9.151538371714512e-07, - "loss": 0.7148, - "step": 63350 - }, - { - "epoch": 1.62, - "learning_rate": 9.15126266527955e-07, - "loss": 0.8633, - "step": 63351 - }, - { - "epoch": 1.62, - "learning_rate": 9.150986959494426e-07, - "loss": 0.6602, - "step": 63352 - }, - { - "epoch": 1.62, - "learning_rate": 9.150711254359353e-07, - "loss": 0.5615, - "step": 63353 - }, - { - "epoch": 1.62, - "learning_rate": 9.150435549874539e-07, - "loss": 0.6001, - "step": 63354 - }, - { - "epoch": 1.62, - "learning_rate": 9.150159846040203e-07, - "loss": 0.6475, - "step": 63355 - }, - { - "epoch": 1.62, - "learning_rate": 9.149884142856548e-07, - "loss": 0.5898, - "step": 63356 - }, - { - "epoch": 1.62, - "learning_rate": 9.149608440323785e-07, - "loss": 0.6797, - "step": 63357 - }, - { - "epoch": 1.62, - "learning_rate": 9.149332738442131e-07, - "loss": 0.7402, - "step": 63358 - }, - { - "epoch": 1.62, - "learning_rate": 9.149057037211791e-07, - "loss": 0.413, - "step": 63359 - }, - { - "epoch": 1.62, - "learning_rate": 9.148781336632981e-07, - "loss": 0.6895, - "step": 63360 - }, - { - "epoch": 1.62, - "learning_rate": 9.148505636705908e-07, - "loss": 0.5342, - "step": 63361 - }, - { - "epoch": 1.62, - "learning_rate": 9.148229937430786e-07, - "loss": 0.7588, - "step": 63362 - }, - { - "epoch": 1.62, - "learning_rate": 9.147954238807826e-07, - "loss": 0.7168, - "step": 63363 - }, - { - "epoch": 1.62, - "learning_rate": 9.147678540837236e-07, - "loss": 0.7412, - "step": 63364 - }, - { - "epoch": 1.62, - "learning_rate": 9.147402843519234e-07, - "loss": 0.7393, - "step": 63365 - }, - { - "epoch": 1.62, - "learning_rate": 9.147127146854023e-07, - "loss": 0.3306, - "step": 63366 - }, - { - "epoch": 1.62, - "learning_rate": 9.146851450841817e-07, - "loss": 0.7275, - "step": 63367 - }, - { - "epoch": 1.62, - "learning_rate": 9.14657575548283e-07, - "loss": 0.6641, - "step": 63368 - }, - { - "epoch": 1.62, - "learning_rate": 9.146300060777268e-07, - "loss": 0.7217, - "step": 63369 - }, - { - "epoch": 1.62, - "learning_rate": 9.146024366725347e-07, - "loss": 0.7959, - "step": 63370 - }, - { - "epoch": 1.62, - "learning_rate": 9.145748673327272e-07, - "loss": 0.5571, - "step": 63371 - }, - { - "epoch": 1.62, - "learning_rate": 9.145472980583263e-07, - "loss": 0.5235, - "step": 63372 - }, - { - "epoch": 1.62, - "learning_rate": 9.145197288493522e-07, - "loss": 0.7368, - "step": 63373 - }, - { - "epoch": 1.62, - "learning_rate": 9.144921597058268e-07, - "loss": 0.7461, - "step": 63374 - }, - { - "epoch": 1.62, - "learning_rate": 9.144645906277708e-07, - "loss": 0.6338, - "step": 63375 - }, - { - "epoch": 1.62, - "learning_rate": 9.144370216152051e-07, - "loss": 0.7842, - "step": 63376 - }, - { - "epoch": 1.62, - "learning_rate": 9.144094526681512e-07, - "loss": 0.7246, - "step": 63377 - }, - { - "epoch": 1.62, - "learning_rate": 9.1438188378663e-07, - "loss": 0.5549, - "step": 63378 - }, - { - "epoch": 1.62, - "learning_rate": 9.143543149706624e-07, - "loss": 0.5574, - "step": 63379 - }, - { - "epoch": 1.62, - "learning_rate": 9.143267462202701e-07, - "loss": 0.7144, - "step": 63380 - }, - { - "epoch": 1.62, - "learning_rate": 9.142991775354734e-07, - "loss": 0.5879, - "step": 63381 - }, - { - "epoch": 1.62, - "learning_rate": 9.142716089162944e-07, - "loss": 0.7256, - "step": 63382 - }, - { - "epoch": 1.62, - "learning_rate": 9.142440403627534e-07, - "loss": 0.6108, - "step": 63383 - }, - { - "epoch": 1.62, - "learning_rate": 9.14216471874872e-07, - "loss": 0.5352, - "step": 63384 - }, - { - "epoch": 1.62, - "learning_rate": 9.141889034526712e-07, - "loss": 0.708, - "step": 63385 - }, - { - "epoch": 1.62, - "learning_rate": 9.141613350961717e-07, - "loss": 0.6172, - "step": 63386 - }, - { - "epoch": 1.62, - "learning_rate": 9.141337668053951e-07, - "loss": 0.6978, - "step": 63387 - }, - { - "epoch": 1.62, - "learning_rate": 9.141061985803621e-07, - "loss": 0.5046, - "step": 63388 - }, - { - "epoch": 1.62, - "learning_rate": 9.140786304210942e-07, - "loss": 0.426, - "step": 63389 - }, - { - "epoch": 1.62, - "learning_rate": 9.140510623276123e-07, - "loss": 0.4487, - "step": 63390 - }, - { - "epoch": 1.62, - "learning_rate": 9.140234942999376e-07, - "loss": 0.6538, - "step": 63391 - }, - { - "epoch": 1.62, - "learning_rate": 9.13995926338091e-07, - "loss": 0.7676, - "step": 63392 - }, - { - "epoch": 1.62, - "learning_rate": 9.13968358442094e-07, - "loss": 0.6274, - "step": 63393 - }, - { - "epoch": 1.62, - "learning_rate": 9.139407906119671e-07, - "loss": 0.562, - "step": 63394 - }, - { - "epoch": 1.62, - "learning_rate": 9.139132228477326e-07, - "loss": 0.6348, - "step": 63395 - }, - { - "epoch": 1.62, - "learning_rate": 9.138856551494102e-07, - "loss": 0.5869, - "step": 63396 - }, - { - "epoch": 1.62, - "learning_rate": 9.138580875170217e-07, - "loss": 0.6157, - "step": 63397 - }, - { - "epoch": 1.62, - "learning_rate": 9.138305199505879e-07, - "loss": 0.6172, - "step": 63398 - }, - { - "epoch": 1.62, - "learning_rate": 9.138029524501303e-07, - "loss": 0.5864, - "step": 63399 - }, - { - "epoch": 1.62, - "learning_rate": 9.137753850156697e-07, - "loss": 0.5913, - "step": 63400 - }, - { - "epoch": 1.62, - "learning_rate": 9.137478176472275e-07, - "loss": 0.5623, - "step": 63401 - }, - { - "epoch": 1.63, - "learning_rate": 9.137202503448243e-07, - "loss": 0.4895, - "step": 63402 - }, - { - "epoch": 1.63, - "learning_rate": 9.136926831084818e-07, - "loss": 0.498, - "step": 63403 - }, - { - "epoch": 1.63, - "learning_rate": 9.136651159382206e-07, - "loss": 0.6411, - "step": 63404 - }, - { - "epoch": 1.63, - "learning_rate": 9.136375488340625e-07, - "loss": 0.5068, - "step": 63405 - }, - { - "epoch": 1.63, - "learning_rate": 9.13609981796028e-07, - "loss": 0.4407, - "step": 63406 - }, - { - "epoch": 1.63, - "learning_rate": 9.135824148241382e-07, - "loss": 0.6038, - "step": 63407 - }, - { - "epoch": 1.63, - "learning_rate": 9.135548479184146e-07, - "loss": 0.6064, - "step": 63408 - }, - { - "epoch": 1.63, - "learning_rate": 9.135272810788777e-07, - "loss": 0.5159, - "step": 63409 - }, - { - "epoch": 1.63, - "learning_rate": 9.134997143055492e-07, - "loss": 0.6187, - "step": 63410 - }, - { - "epoch": 1.63, - "learning_rate": 9.134721475984499e-07, - "loss": 0.4857, - "step": 63411 - }, - { - "epoch": 1.63, - "learning_rate": 9.134445809576011e-07, - "loss": 0.6465, - "step": 63412 - }, - { - "epoch": 1.63, - "learning_rate": 9.134170143830236e-07, - "loss": 0.5845, - "step": 63413 - }, - { - "epoch": 1.63, - "learning_rate": 9.13389447874739e-07, - "loss": 0.6582, - "step": 63414 - }, - { - "epoch": 1.63, - "learning_rate": 9.133618814327684e-07, - "loss": 0.5811, - "step": 63415 - }, - { - "epoch": 1.63, - "learning_rate": 9.133343150571323e-07, - "loss": 0.5197, - "step": 63416 - }, - { - "epoch": 1.63, - "learning_rate": 9.13306748747852e-07, - "loss": 0.6528, - "step": 63417 - }, - { - "epoch": 1.63, - "learning_rate": 9.132791825049488e-07, - "loss": 0.7705, - "step": 63418 - }, - { - "epoch": 1.63, - "learning_rate": 9.132516163284436e-07, - "loss": 0.6245, - "step": 63419 - }, - { - "epoch": 1.63, - "learning_rate": 9.132240502183579e-07, - "loss": 0.5698, - "step": 63420 - }, - { - "epoch": 1.63, - "learning_rate": 9.131964841747124e-07, - "loss": 0.6431, - "step": 63421 - }, - { - "epoch": 1.63, - "learning_rate": 9.131689181975284e-07, - "loss": 0.4824, - "step": 63422 - }, - { - "epoch": 1.63, - "learning_rate": 9.131413522868269e-07, - "loss": 0.7334, - "step": 63423 - }, - { - "epoch": 1.63, - "learning_rate": 9.131137864426293e-07, - "loss": 0.5278, - "step": 63424 - }, - { - "epoch": 1.63, - "learning_rate": 9.130862206649565e-07, - "loss": 0.708, - "step": 63425 - }, - { - "epoch": 1.63, - "learning_rate": 9.130586549538292e-07, - "loss": 0.4844, - "step": 63426 - }, - { - "epoch": 1.63, - "learning_rate": 9.130310893092693e-07, - "loss": 0.7041, - "step": 63427 - }, - { - "epoch": 1.63, - "learning_rate": 9.130035237312972e-07, - "loss": 0.5552, - "step": 63428 - }, - { - "epoch": 1.63, - "learning_rate": 9.129759582199344e-07, - "loss": 0.7129, - "step": 63429 - }, - { - "epoch": 1.63, - "learning_rate": 9.129483927752019e-07, - "loss": 0.6304, - "step": 63430 - }, - { - "epoch": 1.63, - "learning_rate": 9.129208273971208e-07, - "loss": 0.603, - "step": 63431 - }, - { - "epoch": 1.63, - "learning_rate": 9.128932620857122e-07, - "loss": 0.583, - "step": 63432 - }, - { - "epoch": 1.63, - "learning_rate": 9.128656968409974e-07, - "loss": 0.7402, - "step": 63433 - }, - { - "epoch": 1.63, - "learning_rate": 9.128381316629972e-07, - "loss": 0.6885, - "step": 63434 - }, - { - "epoch": 1.63, - "learning_rate": 9.128105665517332e-07, - "loss": 0.6973, - "step": 63435 - }, - { - "epoch": 1.63, - "learning_rate": 9.127830015072255e-07, - "loss": 0.6851, - "step": 63436 - }, - { - "epoch": 1.63, - "learning_rate": 9.127554365294963e-07, - "loss": 0.7471, - "step": 63437 - }, - { - "epoch": 1.63, - "learning_rate": 9.127278716185659e-07, - "loss": 0.7139, - "step": 63438 - }, - { - "epoch": 1.63, - "learning_rate": 9.12700306774456e-07, - "loss": 0.666, - "step": 63439 - }, - { - "epoch": 1.63, - "learning_rate": 9.126727419971873e-07, - "loss": 0.5776, - "step": 63440 - }, - { - "epoch": 1.63, - "learning_rate": 9.126451772867811e-07, - "loss": 0.8916, - "step": 63441 - }, - { - "epoch": 1.63, - "learning_rate": 9.126176126432584e-07, - "loss": 0.5806, - "step": 63442 - }, - { - "epoch": 1.63, - "learning_rate": 9.125900480666406e-07, - "loss": 0.749, - "step": 63443 - }, - { - "epoch": 1.63, - "learning_rate": 9.125624835569483e-07, - "loss": 0.5957, - "step": 63444 - }, - { - "epoch": 1.63, - "learning_rate": 9.125349191142034e-07, - "loss": 0.6963, - "step": 63445 - }, - { - "epoch": 1.63, - "learning_rate": 9.125073547384263e-07, - "loss": 0.469, - "step": 63446 - }, - { - "epoch": 1.63, - "learning_rate": 9.12479790429638e-07, - "loss": 0.5454, - "step": 63447 - }, - { - "epoch": 1.63, - "learning_rate": 9.124522261878601e-07, - "loss": 0.627, - "step": 63448 - }, - { - "epoch": 1.63, - "learning_rate": 9.124246620131133e-07, - "loss": 0.4619, - "step": 63449 - }, - { - "epoch": 1.63, - "learning_rate": 9.123970979054192e-07, - "loss": 0.5345, - "step": 63450 - }, - { - "epoch": 1.63, - "learning_rate": 9.123695338647986e-07, - "loss": 0.6499, - "step": 63451 - }, - { - "epoch": 1.63, - "learning_rate": 9.123419698912723e-07, - "loss": 0.666, - "step": 63452 - }, - { - "epoch": 1.63, - "learning_rate": 9.12314405984862e-07, - "loss": 0.5283, - "step": 63453 - }, - { - "epoch": 1.63, - "learning_rate": 9.122868421455883e-07, - "loss": 0.6519, - "step": 63454 - }, - { - "epoch": 1.63, - "learning_rate": 9.12259278373473e-07, - "loss": 0.6743, - "step": 63455 - }, - { - "epoch": 1.63, - "learning_rate": 9.122317146685365e-07, - "loss": 0.6973, - "step": 63456 - }, - { - "epoch": 1.63, - "learning_rate": 9.122041510308e-07, - "loss": 0.5337, - "step": 63457 - }, - { - "epoch": 1.63, - "learning_rate": 9.121765874602848e-07, - "loss": 0.4929, - "step": 63458 - }, - { - "epoch": 1.63, - "learning_rate": 9.121490239570118e-07, - "loss": 0.6621, - "step": 63459 - }, - { - "epoch": 1.63, - "learning_rate": 9.121214605210025e-07, - "loss": 0.5649, - "step": 63460 - }, - { - "epoch": 1.63, - "learning_rate": 9.120938971522775e-07, - "loss": 0.585, - "step": 63461 - }, - { - "epoch": 1.63, - "learning_rate": 9.120663338508584e-07, - "loss": 0.6768, - "step": 63462 - }, - { - "epoch": 1.63, - "learning_rate": 9.120387706167658e-07, - "loss": 0.5425, - "step": 63463 - }, - { - "epoch": 1.63, - "learning_rate": 9.120112074500213e-07, - "loss": 0.5596, - "step": 63464 - }, - { - "epoch": 1.63, - "learning_rate": 9.119836443506461e-07, - "loss": 0.5022, - "step": 63465 - }, - { - "epoch": 1.63, - "learning_rate": 9.119560813186605e-07, - "loss": 0.4922, - "step": 63466 - }, - { - "epoch": 1.63, - "learning_rate": 9.119285183540863e-07, - "loss": 0.626, - "step": 63467 - }, - { - "epoch": 1.63, - "learning_rate": 9.119009554569444e-07, - "loss": 0.5327, - "step": 63468 - }, - { - "epoch": 1.63, - "learning_rate": 9.118733926272555e-07, - "loss": 0.5015, - "step": 63469 - }, - { - "epoch": 1.63, - "learning_rate": 9.118458298650414e-07, - "loss": 0.8525, - "step": 63470 - }, - { - "epoch": 1.63, - "learning_rate": 9.118182671703227e-07, - "loss": 0.5869, - "step": 63471 - }, - { - "epoch": 1.63, - "learning_rate": 9.11790704543121e-07, - "loss": 0.6387, - "step": 63472 - }, - { - "epoch": 1.63, - "learning_rate": 9.117631419834568e-07, - "loss": 0.7471, - "step": 63473 - }, - { - "epoch": 1.63, - "learning_rate": 9.117355794913517e-07, - "loss": 0.5596, - "step": 63474 - }, - { - "epoch": 1.63, - "learning_rate": 9.117080170668268e-07, - "loss": 0.6191, - "step": 63475 - }, - { - "epoch": 1.63, - "learning_rate": 9.116804547099026e-07, - "loss": 0.668, - "step": 63476 - }, - { - "epoch": 1.63, - "learning_rate": 9.11652892420601e-07, - "loss": 0.5161, - "step": 63477 - }, - { - "epoch": 1.63, - "learning_rate": 9.116253301989423e-07, - "loss": 0.6816, - "step": 63478 - }, - { - "epoch": 1.63, - "learning_rate": 9.115977680449483e-07, - "loss": 0.6895, - "step": 63479 - }, - { - "epoch": 1.63, - "learning_rate": 9.115702059586396e-07, - "loss": 0.7754, - "step": 63480 - }, - { - "epoch": 1.63, - "learning_rate": 9.115426439400378e-07, - "loss": 0.5796, - "step": 63481 - }, - { - "epoch": 1.63, - "learning_rate": 9.115150819891634e-07, - "loss": 0.6152, - "step": 63482 - }, - { - "epoch": 1.63, - "learning_rate": 9.114875201060382e-07, - "loss": 0.499, - "step": 63483 - }, - { - "epoch": 1.63, - "learning_rate": 9.114599582906825e-07, - "loss": 0.6973, - "step": 63484 - }, - { - "epoch": 1.63, - "learning_rate": 9.114323965431186e-07, - "loss": 0.6577, - "step": 63485 - }, - { - "epoch": 1.63, - "learning_rate": 9.114048348633663e-07, - "loss": 0.7007, - "step": 63486 - }, - { - "epoch": 1.63, - "learning_rate": 9.113772732514475e-07, - "loss": 0.5317, - "step": 63487 - }, - { - "epoch": 1.63, - "learning_rate": 9.113497117073826e-07, - "loss": 0.4019, - "step": 63488 - }, - { - "epoch": 1.63, - "learning_rate": 9.113221502311935e-07, - "loss": 0.5679, - "step": 63489 - }, - { - "epoch": 1.63, - "learning_rate": 9.112945888229007e-07, - "loss": 0.5903, - "step": 63490 - }, - { - "epoch": 1.63, - "learning_rate": 9.112670274825258e-07, - "loss": 0.5242, - "step": 63491 - }, - { - "epoch": 1.63, - "learning_rate": 9.112394662100893e-07, - "loss": 0.6162, - "step": 63492 - }, - { - "epoch": 1.63, - "learning_rate": 9.11211905005613e-07, - "loss": 0.5225, - "step": 63493 - }, - { - "epoch": 1.63, - "learning_rate": 9.111843438691174e-07, - "loss": 0.6787, - "step": 63494 - }, - { - "epoch": 1.63, - "learning_rate": 9.111567828006244e-07, - "loss": 0.6489, - "step": 63495 - }, - { - "epoch": 1.63, - "learning_rate": 9.111292218001543e-07, - "loss": 0.582, - "step": 63496 - }, - { - "epoch": 1.63, - "learning_rate": 9.111016608677282e-07, - "loss": 0.7744, - "step": 63497 - }, - { - "epoch": 1.63, - "learning_rate": 9.110741000033678e-07, - "loss": 0.4829, - "step": 63498 - }, - { - "epoch": 1.63, - "learning_rate": 9.110465392070935e-07, - "loss": 0.645, - "step": 63499 - }, - { - "epoch": 1.63, - "learning_rate": 9.110189784789272e-07, - "loss": 0.5054, - "step": 63500 - }, - { - "epoch": 1.63, - "learning_rate": 9.109914178188892e-07, - "loss": 0.6665, - "step": 63501 - }, - { - "epoch": 1.63, - "learning_rate": 9.109638572270012e-07, - "loss": 0.6611, - "step": 63502 - }, - { - "epoch": 1.63, - "learning_rate": 9.109362967032838e-07, - "loss": 0.6284, - "step": 63503 - }, - { - "epoch": 1.63, - "learning_rate": 9.109087362477588e-07, - "loss": 0.8359, - "step": 63504 - }, - { - "epoch": 1.63, - "learning_rate": 9.10881175860447e-07, - "loss": 0.5688, - "step": 63505 - }, - { - "epoch": 1.63, - "learning_rate": 9.108536155413691e-07, - "loss": 0.6245, - "step": 63506 - }, - { - "epoch": 1.63, - "learning_rate": 9.108260552905464e-07, - "loss": 0.625, - "step": 63507 - }, - { - "epoch": 1.63, - "learning_rate": 9.107984951080003e-07, - "loss": 0.6011, - "step": 63508 - }, - { - "epoch": 1.63, - "learning_rate": 9.107709349937514e-07, - "loss": 0.666, - "step": 63509 - }, - { - "epoch": 1.63, - "learning_rate": 9.107433749478213e-07, - "loss": 0.6655, - "step": 63510 - }, - { - "epoch": 1.63, - "learning_rate": 9.107158149702306e-07, - "loss": 0.7676, - "step": 63511 - }, - { - "epoch": 1.63, - "learning_rate": 9.10688255061001e-07, - "loss": 0.5791, - "step": 63512 - }, - { - "epoch": 1.63, - "learning_rate": 9.106606952201531e-07, - "loss": 0.5762, - "step": 63513 - }, - { - "epoch": 1.63, - "learning_rate": 9.106331354477084e-07, - "loss": 0.647, - "step": 63514 - }, - { - "epoch": 1.63, - "learning_rate": 9.106055757436881e-07, - "loss": 0.6494, - "step": 63515 - }, - { - "epoch": 1.63, - "learning_rate": 9.105780161081124e-07, - "loss": 0.6133, - "step": 63516 - }, - { - "epoch": 1.63, - "learning_rate": 9.105504565410034e-07, - "loss": 0.5435, - "step": 63517 - }, - { - "epoch": 1.63, - "learning_rate": 9.105228970423813e-07, - "loss": 0.6338, - "step": 63518 - }, - { - "epoch": 1.63, - "learning_rate": 9.104953376122683e-07, - "loss": 0.6365, - "step": 63519 - }, - { - "epoch": 1.63, - "learning_rate": 9.104677782506844e-07, - "loss": 0.6338, - "step": 63520 - }, - { - "epoch": 1.63, - "learning_rate": 9.104402189576515e-07, - "loss": 0.6016, - "step": 63521 - }, - { - "epoch": 1.63, - "learning_rate": 9.104126597331902e-07, - "loss": 0.6768, - "step": 63522 - }, - { - "epoch": 1.63, - "learning_rate": 9.103851005773221e-07, - "loss": 0.4993, - "step": 63523 - }, - { - "epoch": 1.63, - "learning_rate": 9.103575414900679e-07, - "loss": 0.5659, - "step": 63524 - }, - { - "epoch": 1.63, - "learning_rate": 9.103299824714491e-07, - "loss": 0.5432, - "step": 63525 - }, - { - "epoch": 1.63, - "learning_rate": 9.10302423521486e-07, - "loss": 0.5483, - "step": 63526 - }, - { - "epoch": 1.63, - "learning_rate": 9.102748646402005e-07, - "loss": 0.6475, - "step": 63527 - }, - { - "epoch": 1.63, - "learning_rate": 9.102473058276132e-07, - "loss": 0.708, - "step": 63528 - }, - { - "epoch": 1.63, - "learning_rate": 9.102197470837456e-07, - "loss": 0.6333, - "step": 63529 - }, - { - "epoch": 1.63, - "learning_rate": 9.101921884086184e-07, - "loss": 0.6333, - "step": 63530 - }, - { - "epoch": 1.63, - "learning_rate": 9.101646298022531e-07, - "loss": 0.6187, - "step": 63531 - }, - { - "epoch": 1.63, - "learning_rate": 9.101370712646704e-07, - "loss": 0.7349, - "step": 63532 - }, - { - "epoch": 1.63, - "learning_rate": 9.101095127958918e-07, - "loss": 0.7441, - "step": 63533 - }, - { - "epoch": 1.63, - "learning_rate": 9.100819543959385e-07, - "loss": 0.6191, - "step": 63534 - }, - { - "epoch": 1.63, - "learning_rate": 9.100543960648308e-07, - "loss": 0.5898, - "step": 63535 - }, - { - "epoch": 1.63, - "learning_rate": 9.100268378025906e-07, - "loss": 0.6885, - "step": 63536 - }, - { - "epoch": 1.63, - "learning_rate": 9.099992796092385e-07, - "loss": 0.5376, - "step": 63537 - }, - { - "epoch": 1.63, - "learning_rate": 9.099717214847959e-07, - "loss": 0.666, - "step": 63538 - }, - { - "epoch": 1.63, - "learning_rate": 9.099441634292837e-07, - "loss": 0.6641, - "step": 63539 - }, - { - "epoch": 1.63, - "learning_rate": 9.099166054427234e-07, - "loss": 0.5845, - "step": 63540 - }, - { - "epoch": 1.63, - "learning_rate": 9.098890475251357e-07, - "loss": 1.0518, - "step": 63541 - }, - { - "epoch": 1.63, - "learning_rate": 9.098614896765417e-07, - "loss": 0.7686, - "step": 63542 - }, - { - "epoch": 1.63, - "learning_rate": 9.098339318969628e-07, - "loss": 0.6851, - "step": 63543 - }, - { - "epoch": 1.63, - "learning_rate": 9.0980637418642e-07, - "loss": 0.668, - "step": 63544 - }, - { - "epoch": 1.63, - "learning_rate": 9.097788165449341e-07, - "loss": 0.7637, - "step": 63545 - }, - { - "epoch": 1.63, - "learning_rate": 9.097512589725265e-07, - "loss": 0.5757, - "step": 63546 - }, - { - "epoch": 1.63, - "learning_rate": 9.09723701469218e-07, - "loss": 0.6763, - "step": 63547 - }, - { - "epoch": 1.63, - "learning_rate": 9.0969614403503e-07, - "loss": 0.4348, - "step": 63548 - }, - { - "epoch": 1.63, - "learning_rate": 9.096685866699835e-07, - "loss": 0.6001, - "step": 63549 - }, - { - "epoch": 1.63, - "learning_rate": 9.096410293740997e-07, - "loss": 0.5483, - "step": 63550 - }, - { - "epoch": 1.63, - "learning_rate": 9.096134721473995e-07, - "loss": 0.4819, - "step": 63551 - }, - { - "epoch": 1.63, - "learning_rate": 9.095859149899042e-07, - "loss": 0.5515, - "step": 63552 - }, - { - "epoch": 1.63, - "learning_rate": 9.095583579016347e-07, - "loss": 0.6152, - "step": 63553 - }, - { - "epoch": 1.63, - "learning_rate": 9.095308008826126e-07, - "loss": 0.646, - "step": 63554 - }, - { - "epoch": 1.63, - "learning_rate": 9.095032439328584e-07, - "loss": 0.7393, - "step": 63555 - }, - { - "epoch": 1.63, - "learning_rate": 9.09475687052393e-07, - "loss": 0.5239, - "step": 63556 - }, - { - "epoch": 1.63, - "learning_rate": 9.094481302412385e-07, - "loss": 0.6943, - "step": 63557 - }, - { - "epoch": 1.63, - "learning_rate": 9.094205734994152e-07, - "loss": 0.6709, - "step": 63558 - }, - { - "epoch": 1.63, - "learning_rate": 9.093930168269442e-07, - "loss": 0.564, - "step": 63559 - }, - { - "epoch": 1.63, - "learning_rate": 9.093654602238469e-07, - "loss": 0.6104, - "step": 63560 - }, - { - "epoch": 1.63, - "learning_rate": 9.093379036901442e-07, - "loss": 0.6323, - "step": 63561 - }, - { - "epoch": 1.63, - "learning_rate": 9.093103472258574e-07, - "loss": 0.5659, - "step": 63562 - }, - { - "epoch": 1.63, - "learning_rate": 9.092827908310075e-07, - "loss": 0.623, - "step": 63563 - }, - { - "epoch": 1.63, - "learning_rate": 9.092552345056159e-07, - "loss": 0.8389, - "step": 63564 - }, - { - "epoch": 1.63, - "learning_rate": 9.092276782497031e-07, - "loss": 0.53, - "step": 63565 - }, - { - "epoch": 1.63, - "learning_rate": 9.092001220632904e-07, - "loss": 0.5442, - "step": 63566 - }, - { - "epoch": 1.63, - "learning_rate": 9.091725659463991e-07, - "loss": 0.6387, - "step": 63567 - }, - { - "epoch": 1.63, - "learning_rate": 9.091450098990501e-07, - "loss": 0.5161, - "step": 63568 - }, - { - "epoch": 1.63, - "learning_rate": 9.091174539212647e-07, - "loss": 0.6509, - "step": 63569 - }, - { - "epoch": 1.63, - "learning_rate": 9.090898980130638e-07, - "loss": 0.5659, - "step": 63570 - }, - { - "epoch": 1.63, - "learning_rate": 9.090623421744688e-07, - "loss": 0.542, - "step": 63571 - }, - { - "epoch": 1.63, - "learning_rate": 9.090347864055002e-07, - "loss": 0.5771, - "step": 63572 - }, - { - "epoch": 1.63, - "learning_rate": 9.090072307061798e-07, - "loss": 0.5469, - "step": 63573 - }, - { - "epoch": 1.63, - "learning_rate": 9.089796750765285e-07, - "loss": 0.7383, - "step": 63574 - }, - { - "epoch": 1.63, - "learning_rate": 9.089521195165671e-07, - "loss": 0.5996, - "step": 63575 - }, - { - "epoch": 1.63, - "learning_rate": 9.089245640263168e-07, - "loss": 0.6279, - "step": 63576 - }, - { - "epoch": 1.63, - "learning_rate": 9.088970086057989e-07, - "loss": 0.4722, - "step": 63577 - }, - { - "epoch": 1.63, - "learning_rate": 9.08869453255034e-07, - "loss": 0.5889, - "step": 63578 - }, - { - "epoch": 1.63, - "learning_rate": 9.088418979740441e-07, - "loss": 0.5247, - "step": 63579 - }, - { - "epoch": 1.63, - "learning_rate": 9.088143427628493e-07, - "loss": 0.7061, - "step": 63580 - }, - { - "epoch": 1.63, - "learning_rate": 9.087867876214715e-07, - "loss": 0.7515, - "step": 63581 - }, - { - "epoch": 1.63, - "learning_rate": 9.087592325499312e-07, - "loss": 0.6924, - "step": 63582 - }, - { - "epoch": 1.63, - "learning_rate": 9.0873167754825e-07, - "loss": 0.6953, - "step": 63583 - }, - { - "epoch": 1.63, - "learning_rate": 9.087041226164489e-07, - "loss": 0.7979, - "step": 63584 - }, - { - "epoch": 1.63, - "learning_rate": 9.086765677545485e-07, - "loss": 0.6543, - "step": 63585 - }, - { - "epoch": 1.63, - "learning_rate": 9.086490129625705e-07, - "loss": 0.5566, - "step": 63586 - }, - { - "epoch": 1.63, - "learning_rate": 9.086214582405355e-07, - "loss": 0.7373, - "step": 63587 - }, - { - "epoch": 1.63, - "learning_rate": 9.08593903588465e-07, - "loss": 0.5405, - "step": 63588 - }, - { - "epoch": 1.63, - "learning_rate": 9.085663490063797e-07, - "loss": 0.7754, - "step": 63589 - }, - { - "epoch": 1.63, - "learning_rate": 9.085387944943013e-07, - "loss": 0.5991, - "step": 63590 - }, - { - "epoch": 1.63, - "learning_rate": 9.085112400522504e-07, - "loss": 0.7441, - "step": 63591 - }, - { - "epoch": 1.63, - "learning_rate": 9.084836856802482e-07, - "loss": 0.6396, - "step": 63592 - }, - { - "epoch": 1.63, - "learning_rate": 9.084561313783157e-07, - "loss": 0.4316, - "step": 63593 - }, - { - "epoch": 1.63, - "learning_rate": 9.084285771464748e-07, - "loss": 0.5278, - "step": 63594 - }, - { - "epoch": 1.63, - "learning_rate": 9.084010229847453e-07, - "loss": 0.6699, - "step": 63595 - }, - { - "epoch": 1.63, - "learning_rate": 9.083734688931492e-07, - "loss": 0.8525, - "step": 63596 - }, - { - "epoch": 1.63, - "learning_rate": 9.08345914871707e-07, - "loss": 0.6313, - "step": 63597 - }, - { - "epoch": 1.63, - "learning_rate": 9.083183609204404e-07, - "loss": 0.6494, - "step": 63598 - }, - { - "epoch": 1.63, - "learning_rate": 9.082908070393699e-07, - "loss": 0.7109, - "step": 63599 - }, - { - "epoch": 1.63, - "learning_rate": 9.082632532285173e-07, - "loss": 0.6421, - "step": 63600 - }, - { - "epoch": 1.63, - "learning_rate": 9.082356994879029e-07, - "loss": 0.4519, - "step": 63601 - }, - { - "epoch": 1.63, - "learning_rate": 9.082081458175485e-07, - "loss": 0.5977, - "step": 63602 - }, - { - "epoch": 1.63, - "learning_rate": 9.081805922174747e-07, - "loss": 0.4744, - "step": 63603 - }, - { - "epoch": 1.63, - "learning_rate": 9.081530386877032e-07, - "loss": 0.6533, - "step": 63604 - }, - { - "epoch": 1.63, - "learning_rate": 9.081254852282546e-07, - "loss": 0.4424, - "step": 63605 - }, - { - "epoch": 1.63, - "learning_rate": 9.080979318391498e-07, - "loss": 0.627, - "step": 63606 - }, - { - "epoch": 1.63, - "learning_rate": 9.080703785204103e-07, - "loss": 0.7627, - "step": 63607 - }, - { - "epoch": 1.63, - "learning_rate": 9.08042825272057e-07, - "loss": 0.6174, - "step": 63608 - }, - { - "epoch": 1.63, - "learning_rate": 9.080152720941112e-07, - "loss": 0.6729, - "step": 63609 - }, - { - "epoch": 1.63, - "learning_rate": 9.079877189865937e-07, - "loss": 0.5878, - "step": 63610 - }, - { - "epoch": 1.63, - "learning_rate": 9.079601659495261e-07, - "loss": 0.6836, - "step": 63611 - }, - { - "epoch": 1.63, - "learning_rate": 9.079326129829287e-07, - "loss": 0.7471, - "step": 63612 - }, - { - "epoch": 1.63, - "learning_rate": 9.079050600868236e-07, - "loss": 0.666, - "step": 63613 - }, - { - "epoch": 1.63, - "learning_rate": 9.078775072612314e-07, - "loss": 0.6309, - "step": 63614 - }, - { - "epoch": 1.63, - "learning_rate": 9.078499545061729e-07, - "loss": 0.7744, - "step": 63615 - }, - { - "epoch": 1.63, - "learning_rate": 9.078224018216692e-07, - "loss": 0.6479, - "step": 63616 - }, - { - "epoch": 1.63, - "learning_rate": 9.077948492077421e-07, - "loss": 0.6914, - "step": 63617 - }, - { - "epoch": 1.63, - "learning_rate": 9.077672966644119e-07, - "loss": 0.6172, - "step": 63618 - }, - { - "epoch": 1.63, - "learning_rate": 9.077397441917002e-07, - "loss": 0.8525, - "step": 63619 - }, - { - "epoch": 1.63, - "learning_rate": 9.077121917896278e-07, - "loss": 0.5234, - "step": 63620 - }, - { - "epoch": 1.63, - "learning_rate": 9.07684639458216e-07, - "loss": 0.5488, - "step": 63621 - }, - { - "epoch": 1.63, - "learning_rate": 9.076570871974858e-07, - "loss": 0.7246, - "step": 63622 - }, - { - "epoch": 1.63, - "learning_rate": 9.076295350074584e-07, - "loss": 0.5869, - "step": 63623 - }, - { - "epoch": 1.63, - "learning_rate": 9.076019828881551e-07, - "loss": 0.6324, - "step": 63624 - }, - { - "epoch": 1.63, - "learning_rate": 9.075744308395963e-07, - "loss": 0.6357, - "step": 63625 - }, - { - "epoch": 1.63, - "learning_rate": 9.075468788618037e-07, - "loss": 0.4751, - "step": 63626 - }, - { - "epoch": 1.63, - "learning_rate": 9.075193269547979e-07, - "loss": 0.6133, - "step": 63627 - }, - { - "epoch": 1.63, - "learning_rate": 9.074917751186006e-07, - "loss": 0.6846, - "step": 63628 - }, - { - "epoch": 1.63, - "learning_rate": 9.074642233532323e-07, - "loss": 0.7275, - "step": 63629 - }, - { - "epoch": 1.63, - "learning_rate": 9.074366716587148e-07, - "loss": 0.7622, - "step": 63630 - }, - { - "epoch": 1.63, - "learning_rate": 9.074091200350687e-07, - "loss": 0.7393, - "step": 63631 - }, - { - "epoch": 1.63, - "learning_rate": 9.073815684823149e-07, - "loss": 0.5361, - "step": 63632 - }, - { - "epoch": 1.63, - "learning_rate": 9.07354017000475e-07, - "loss": 0.6558, - "step": 63633 - }, - { - "epoch": 1.63, - "learning_rate": 9.0732646558957e-07, - "loss": 0.709, - "step": 63634 - }, - { - "epoch": 1.63, - "learning_rate": 9.072989142496206e-07, - "loss": 0.6543, - "step": 63635 - }, - { - "epoch": 1.63, - "learning_rate": 9.072713629806483e-07, - "loss": 0.6729, - "step": 63636 - }, - { - "epoch": 1.63, - "learning_rate": 9.072438117826739e-07, - "loss": 0.6504, - "step": 63637 - }, - { - "epoch": 1.63, - "learning_rate": 9.072162606557188e-07, - "loss": 0.426, - "step": 63638 - }, - { - "epoch": 1.63, - "learning_rate": 9.071887095998037e-07, - "loss": 0.6426, - "step": 63639 - }, - { - "epoch": 1.63, - "learning_rate": 9.071611586149503e-07, - "loss": 0.4778, - "step": 63640 - }, - { - "epoch": 1.63, - "learning_rate": 9.071336077011789e-07, - "loss": 0.6567, - "step": 63641 - }, - { - "epoch": 1.63, - "learning_rate": 9.071060568585114e-07, - "loss": 0.7056, - "step": 63642 - }, - { - "epoch": 1.63, - "learning_rate": 9.070785060869682e-07, - "loss": 0.7744, - "step": 63643 - }, - { - "epoch": 1.63, - "learning_rate": 9.070509553865713e-07, - "loss": 0.5459, - "step": 63644 - }, - { - "epoch": 1.63, - "learning_rate": 9.070234047573409e-07, - "loss": 0.7285, - "step": 63645 - }, - { - "epoch": 1.63, - "learning_rate": 9.069958541992981e-07, - "loss": 0.5336, - "step": 63646 - }, - { - "epoch": 1.63, - "learning_rate": 9.069683037124646e-07, - "loss": 0.79, - "step": 63647 - }, - { - "epoch": 1.63, - "learning_rate": 9.069407532968612e-07, - "loss": 0.7871, - "step": 63648 - }, - { - "epoch": 1.63, - "learning_rate": 9.069132029525088e-07, - "loss": 0.521, - "step": 63649 - }, - { - "epoch": 1.63, - "learning_rate": 9.068856526794288e-07, - "loss": 0.6611, - "step": 63650 - }, - { - "epoch": 1.63, - "learning_rate": 9.068581024776421e-07, - "loss": 0.7817, - "step": 63651 - }, - { - "epoch": 1.63, - "learning_rate": 9.0683055234717e-07, - "loss": 0.7637, - "step": 63652 - }, - { - "epoch": 1.63, - "learning_rate": 9.068030022880332e-07, - "loss": 0.4767, - "step": 63653 - }, - { - "epoch": 1.63, - "learning_rate": 9.067754523002535e-07, - "loss": 0.6196, - "step": 63654 - }, - { - "epoch": 1.63, - "learning_rate": 9.067479023838514e-07, - "loss": 0.7783, - "step": 63655 - }, - { - "epoch": 1.63, - "learning_rate": 9.067203525388478e-07, - "loss": 0.4922, - "step": 63656 - }, - { - "epoch": 1.63, - "learning_rate": 9.066928027652645e-07, - "loss": 0.4611, - "step": 63657 - }, - { - "epoch": 1.63, - "learning_rate": 9.06665253063122e-07, - "loss": 0.6729, - "step": 63658 - }, - { - "epoch": 1.63, - "learning_rate": 9.066377034324418e-07, - "loss": 0.5918, - "step": 63659 - }, - { - "epoch": 1.63, - "learning_rate": 9.066101538732446e-07, - "loss": 0.8525, - "step": 63660 - }, - { - "epoch": 1.63, - "learning_rate": 9.065826043855519e-07, - "loss": 0.6592, - "step": 63661 - }, - { - "epoch": 1.63, - "learning_rate": 9.065550549693845e-07, - "loss": 0.707, - "step": 63662 - }, - { - "epoch": 1.63, - "learning_rate": 9.065275056247636e-07, - "loss": 0.5781, - "step": 63663 - }, - { - "epoch": 1.63, - "learning_rate": 9.064999563517107e-07, - "loss": 0.7285, - "step": 63664 - }, - { - "epoch": 1.63, - "learning_rate": 9.06472407150246e-07, - "loss": 0.5989, - "step": 63665 - }, - { - "epoch": 1.63, - "learning_rate": 9.064448580203913e-07, - "loss": 0.5488, - "step": 63666 - }, - { - "epoch": 1.63, - "learning_rate": 9.064173089621674e-07, - "loss": 0.6709, - "step": 63667 - }, - { - "epoch": 1.63, - "learning_rate": 9.063897599755953e-07, - "loss": 0.6504, - "step": 63668 - }, - { - "epoch": 1.63, - "learning_rate": 9.063622110606965e-07, - "loss": 0.626, - "step": 63669 - }, - { - "epoch": 1.63, - "learning_rate": 9.063346622174917e-07, - "loss": 0.6089, - "step": 63670 - }, - { - "epoch": 1.63, - "learning_rate": 9.063071134460022e-07, - "loss": 0.6943, - "step": 63671 - }, - { - "epoch": 1.63, - "learning_rate": 9.062795647462489e-07, - "loss": 0.6631, - "step": 63672 - }, - { - "epoch": 1.63, - "learning_rate": 9.062520161182532e-07, - "loss": 0.5422, - "step": 63673 - }, - { - "epoch": 1.63, - "learning_rate": 9.062244675620362e-07, - "loss": 0.7529, - "step": 63674 - }, - { - "epoch": 1.63, - "learning_rate": 9.061969190776185e-07, - "loss": 0.7178, - "step": 63675 - }, - { - "epoch": 1.63, - "learning_rate": 9.061693706650216e-07, - "loss": 0.6064, - "step": 63676 - }, - { - "epoch": 1.63, - "learning_rate": 9.061418223242664e-07, - "loss": 0.7715, - "step": 63677 - }, - { - "epoch": 1.63, - "learning_rate": 9.061142740553742e-07, - "loss": 0.6367, - "step": 63678 - }, - { - "epoch": 1.63, - "learning_rate": 9.060867258583658e-07, - "loss": 0.6367, - "step": 63679 - }, - { - "epoch": 1.63, - "learning_rate": 9.060591777332628e-07, - "loss": 0.6221, - "step": 63680 - }, - { - "epoch": 1.63, - "learning_rate": 9.060316296800858e-07, - "loss": 0.8096, - "step": 63681 - }, - { - "epoch": 1.63, - "learning_rate": 9.06004081698856e-07, - "loss": 0.5537, - "step": 63682 - }, - { - "epoch": 1.63, - "learning_rate": 9.059765337895945e-07, - "loss": 0.7656, - "step": 63683 - }, - { - "epoch": 1.63, - "learning_rate": 9.059489859523231e-07, - "loss": 0.8555, - "step": 63684 - }, - { - "epoch": 1.63, - "learning_rate": 9.059214381870615e-07, - "loss": 0.5864, - "step": 63685 - }, - { - "epoch": 1.63, - "learning_rate": 9.058938904938319e-07, - "loss": 0.6187, - "step": 63686 - }, - { - "epoch": 1.63, - "learning_rate": 9.058663428726547e-07, - "loss": 0.5947, - "step": 63687 - }, - { - "epoch": 1.63, - "learning_rate": 9.058387953235515e-07, - "loss": 0.623, - "step": 63688 - }, - { - "epoch": 1.63, - "learning_rate": 9.05811247846543e-07, - "loss": 0.6436, - "step": 63689 - }, - { - "epoch": 1.63, - "learning_rate": 9.057837004416507e-07, - "loss": 0.6826, - "step": 63690 - }, - { - "epoch": 1.63, - "learning_rate": 9.057561531088955e-07, - "loss": 0.5107, - "step": 63691 - }, - { - "epoch": 1.63, - "learning_rate": 9.057286058482985e-07, - "loss": 0.6487, - "step": 63692 - }, - { - "epoch": 1.63, - "learning_rate": 9.057010586598805e-07, - "loss": 0.666, - "step": 63693 - }, - { - "epoch": 1.63, - "learning_rate": 9.056735115436633e-07, - "loss": 0.5491, - "step": 63694 - }, - { - "epoch": 1.63, - "learning_rate": 9.056459644996674e-07, - "loss": 0.6885, - "step": 63695 - }, - { - "epoch": 1.63, - "learning_rate": 9.056184175279139e-07, - "loss": 0.5332, - "step": 63696 - }, - { - "epoch": 1.63, - "learning_rate": 9.055908706284242e-07, - "loss": 0.7437, - "step": 63697 - }, - { - "epoch": 1.63, - "learning_rate": 9.055633238012191e-07, - "loss": 0.5122, - "step": 63698 - }, - { - "epoch": 1.63, - "learning_rate": 9.055357770463198e-07, - "loss": 0.6489, - "step": 63699 - }, - { - "epoch": 1.63, - "learning_rate": 9.055082303637473e-07, - "loss": 0.7812, - "step": 63700 - }, - { - "epoch": 1.63, - "learning_rate": 9.054806837535231e-07, - "loss": 0.6279, - "step": 63701 - }, - { - "epoch": 1.63, - "learning_rate": 9.054531372156677e-07, - "loss": 0.4487, - "step": 63702 - }, - { - "epoch": 1.63, - "learning_rate": 9.054255907502027e-07, - "loss": 0.5356, - "step": 63703 - }, - { - "epoch": 1.63, - "learning_rate": 9.053980443571493e-07, - "loss": 0.6543, - "step": 63704 - }, - { - "epoch": 1.63, - "learning_rate": 9.053704980365279e-07, - "loss": 0.6494, - "step": 63705 - }, - { - "epoch": 1.63, - "learning_rate": 9.053429517883598e-07, - "loss": 0.5447, - "step": 63706 - }, - { - "epoch": 1.63, - "learning_rate": 9.053154056126666e-07, - "loss": 0.7441, - "step": 63707 - }, - { - "epoch": 1.63, - "learning_rate": 9.052878595094687e-07, - "loss": 0.7861, - "step": 63708 - }, - { - "epoch": 1.63, - "learning_rate": 9.052603134787878e-07, - "loss": 0.6216, - "step": 63709 - }, - { - "epoch": 1.63, - "learning_rate": 9.052327675206444e-07, - "loss": 0.7031, - "step": 63710 - }, - { - "epoch": 1.63, - "learning_rate": 9.052052216350602e-07, - "loss": 0.4858, - "step": 63711 - }, - { - "epoch": 1.63, - "learning_rate": 9.051776758220557e-07, - "loss": 0.748, - "step": 63712 - }, - { - "epoch": 1.63, - "learning_rate": 9.051501300816527e-07, - "loss": 0.4192, - "step": 63713 - }, - { - "epoch": 1.63, - "learning_rate": 9.051225844138719e-07, - "loss": 0.478, - "step": 63714 - }, - { - "epoch": 1.63, - "learning_rate": 9.05095038818734e-07, - "loss": 0.8457, - "step": 63715 - }, - { - "epoch": 1.63, - "learning_rate": 9.050674932962607e-07, - "loss": 0.5327, - "step": 63716 - }, - { - "epoch": 1.63, - "learning_rate": 9.050399478464727e-07, - "loss": 0.666, - "step": 63717 - }, - { - "epoch": 1.63, - "learning_rate": 9.050124024693915e-07, - "loss": 0.7812, - "step": 63718 - }, - { - "epoch": 1.63, - "learning_rate": 9.049848571650376e-07, - "loss": 0.6943, - "step": 63719 - }, - { - "epoch": 1.63, - "learning_rate": 9.049573119334326e-07, - "loss": 0.7031, - "step": 63720 - }, - { - "epoch": 1.63, - "learning_rate": 9.049297667745975e-07, - "loss": 0.5212, - "step": 63721 - }, - { - "epoch": 1.63, - "learning_rate": 9.049022216885531e-07, - "loss": 0.6328, - "step": 63722 - }, - { - "epoch": 1.63, - "learning_rate": 9.048746766753209e-07, - "loss": 0.5703, - "step": 63723 - }, - { - "epoch": 1.63, - "learning_rate": 9.04847131734922e-07, - "loss": 0.5627, - "step": 63724 - }, - { - "epoch": 1.63, - "learning_rate": 9.048195868673768e-07, - "loss": 0.4658, - "step": 63725 - }, - { - "epoch": 1.63, - "learning_rate": 9.047920420727071e-07, - "loss": 0.666, - "step": 63726 - }, - { - "epoch": 1.63, - "learning_rate": 9.047644973509337e-07, - "loss": 0.3472, - "step": 63727 - }, - { - "epoch": 1.63, - "learning_rate": 9.047369527020778e-07, - "loss": 0.7822, - "step": 63728 - }, - { - "epoch": 1.63, - "learning_rate": 9.047094081261602e-07, - "loss": 0.7363, - "step": 63729 - }, - { - "epoch": 1.63, - "learning_rate": 9.046818636232024e-07, - "loss": 0.6377, - "step": 63730 - }, - { - "epoch": 1.63, - "learning_rate": 9.046543191932252e-07, - "loss": 0.6167, - "step": 63731 - }, - { - "epoch": 1.63, - "learning_rate": 9.0462677483625e-07, - "loss": 0.6602, - "step": 63732 - }, - { - "epoch": 1.63, - "learning_rate": 9.045992305522975e-07, - "loss": 0.6201, - "step": 63733 - }, - { - "epoch": 1.63, - "learning_rate": 9.045716863413894e-07, - "loss": 0.6274, - "step": 63734 - }, - { - "epoch": 1.63, - "learning_rate": 9.045441422035462e-07, - "loss": 0.5591, - "step": 63735 - }, - { - "epoch": 1.63, - "learning_rate": 9.045165981387887e-07, - "loss": 0.6309, - "step": 63736 - }, - { - "epoch": 1.63, - "learning_rate": 9.044890541471389e-07, - "loss": 0.6904, - "step": 63737 - }, - { - "epoch": 1.63, - "learning_rate": 9.044615102286175e-07, - "loss": 0.6738, - "step": 63738 - }, - { - "epoch": 1.63, - "learning_rate": 9.044339663832452e-07, - "loss": 0.8018, - "step": 63739 - }, - { - "epoch": 1.63, - "learning_rate": 9.044064226110436e-07, - "loss": 0.6079, - "step": 63740 - }, - { - "epoch": 1.63, - "learning_rate": 9.043788789120334e-07, - "loss": 0.5459, - "step": 63741 - }, - { - "epoch": 1.63, - "learning_rate": 9.043513352862362e-07, - "loss": 0.6704, - "step": 63742 - }, - { - "epoch": 1.63, - "learning_rate": 9.043237917336725e-07, - "loss": 0.5972, - "step": 63743 - }, - { - "epoch": 1.63, - "learning_rate": 9.042962482543641e-07, - "loss": 0.5538, - "step": 63744 - }, - { - "epoch": 1.63, - "learning_rate": 9.042687048483315e-07, - "loss": 0.6719, - "step": 63745 - }, - { - "epoch": 1.63, - "learning_rate": 9.042411615155957e-07, - "loss": 0.667, - "step": 63746 - }, - { - "epoch": 1.63, - "learning_rate": 9.042136182561782e-07, - "loss": 0.6011, - "step": 63747 - }, - { - "epoch": 1.63, - "learning_rate": 9.041860750700998e-07, - "loss": 0.446, - "step": 63748 - }, - { - "epoch": 1.63, - "learning_rate": 9.04158531957382e-07, - "loss": 0.5063, - "step": 63749 - }, - { - "epoch": 1.63, - "learning_rate": 9.041309889180451e-07, - "loss": 0.8076, - "step": 63750 - }, - { - "epoch": 1.63, - "learning_rate": 9.041034459521111e-07, - "loss": 0.5957, - "step": 63751 - }, - { - "epoch": 1.63, - "learning_rate": 9.040759030596006e-07, - "loss": 0.6237, - "step": 63752 - }, - { - "epoch": 1.63, - "learning_rate": 9.040483602405347e-07, - "loss": 0.7173, - "step": 63753 - }, - { - "epoch": 1.63, - "learning_rate": 9.04020817494935e-07, - "loss": 0.5112, - "step": 63754 - }, - { - "epoch": 1.63, - "learning_rate": 9.039932748228216e-07, - "loss": 0.6797, - "step": 63755 - }, - { - "epoch": 1.63, - "learning_rate": 9.039657322242164e-07, - "loss": 0.5942, - "step": 63756 - }, - { - "epoch": 1.63, - "learning_rate": 9.039381896991402e-07, - "loss": 0.6914, - "step": 63757 - }, - { - "epoch": 1.63, - "learning_rate": 9.03910647247614e-07, - "loss": 0.6084, - "step": 63758 - }, - { - "epoch": 1.63, - "learning_rate": 9.038831048696592e-07, - "loss": 0.667, - "step": 63759 - }, - { - "epoch": 1.63, - "learning_rate": 9.038555625652962e-07, - "loss": 0.427, - "step": 63760 - }, - { - "epoch": 1.63, - "learning_rate": 9.038280203345471e-07, - "loss": 0.5708, - "step": 63761 - }, - { - "epoch": 1.63, - "learning_rate": 9.038004781774321e-07, - "loss": 0.728, - "step": 63762 - }, - { - "epoch": 1.63, - "learning_rate": 9.037729360939729e-07, - "loss": 0.7344, - "step": 63763 - }, - { - "epoch": 1.63, - "learning_rate": 9.037453940841906e-07, - "loss": 0.5962, - "step": 63764 - }, - { - "epoch": 1.63, - "learning_rate": 9.037178521481055e-07, - "loss": 0.7949, - "step": 63765 - }, - { - "epoch": 1.63, - "learning_rate": 9.036903102857395e-07, - "loss": 0.6768, - "step": 63766 - }, - { - "epoch": 1.63, - "learning_rate": 9.036627684971132e-07, - "loss": 0.5679, - "step": 63767 - }, - { - "epoch": 1.63, - "learning_rate": 9.036352267822481e-07, - "loss": 0.5454, - "step": 63768 - }, - { - "epoch": 1.63, - "learning_rate": 9.036076851411647e-07, - "loss": 0.5884, - "step": 63769 - }, - { - "epoch": 1.63, - "learning_rate": 9.035801435738848e-07, - "loss": 0.6582, - "step": 63770 - }, - { - "epoch": 1.63, - "learning_rate": 9.03552602080429e-07, - "loss": 0.6436, - "step": 63771 - }, - { - "epoch": 1.63, - "learning_rate": 9.035250606608186e-07, - "loss": 0.5815, - "step": 63772 - }, - { - "epoch": 1.63, - "learning_rate": 9.034975193150746e-07, - "loss": 0.4535, - "step": 63773 - }, - { - "epoch": 1.63, - "learning_rate": 9.034699780432186e-07, - "loss": 0.7441, - "step": 63774 - }, - { - "epoch": 1.63, - "learning_rate": 9.034424368452707e-07, - "loss": 0.5923, - "step": 63775 - }, - { - "epoch": 1.63, - "learning_rate": 9.034148957212526e-07, - "loss": 0.7266, - "step": 63776 - }, - { - "epoch": 1.63, - "learning_rate": 9.03387354671185e-07, - "loss": 0.5205, - "step": 63777 - }, - { - "epoch": 1.63, - "learning_rate": 9.033598136950897e-07, - "loss": 0.71, - "step": 63778 - }, - { - "epoch": 1.63, - "learning_rate": 9.033322727929868e-07, - "loss": 0.7617, - "step": 63779 - }, - { - "epoch": 1.63, - "learning_rate": 9.033047319648984e-07, - "loss": 0.5615, - "step": 63780 - }, - { - "epoch": 1.63, - "learning_rate": 9.032771912108448e-07, - "loss": 0.623, - "step": 63781 - }, - { - "epoch": 1.63, - "learning_rate": 9.032496505308477e-07, - "loss": 0.6431, - "step": 63782 - }, - { - "epoch": 1.63, - "learning_rate": 9.032221099249276e-07, - "loss": 0.4873, - "step": 63783 - }, - { - "epoch": 1.63, - "learning_rate": 9.031945693931064e-07, - "loss": 0.6226, - "step": 63784 - }, - { - "epoch": 1.63, - "learning_rate": 9.031670289354044e-07, - "loss": 0.6641, - "step": 63785 - }, - { - "epoch": 1.63, - "learning_rate": 9.031394885518428e-07, - "loss": 0.7158, - "step": 63786 - }, - { - "epoch": 1.63, - "learning_rate": 9.03111948242443e-07, - "loss": 0.5234, - "step": 63787 - }, - { - "epoch": 1.63, - "learning_rate": 9.030844080072257e-07, - "loss": 0.6006, - "step": 63788 - }, - { - "epoch": 1.63, - "learning_rate": 9.030568678462124e-07, - "loss": 0.563, - "step": 63789 - }, - { - "epoch": 1.63, - "learning_rate": 9.030293277594237e-07, - "loss": 0.7695, - "step": 63790 - }, - { - "epoch": 1.63, - "learning_rate": 9.030017877468814e-07, - "loss": 0.6914, - "step": 63791 - }, - { - "epoch": 1.64, - "learning_rate": 9.029742478086059e-07, - "loss": 0.6816, - "step": 63792 - }, - { - "epoch": 1.64, - "learning_rate": 9.029467079446186e-07, - "loss": 0.6172, - "step": 63793 - }, - { - "epoch": 1.64, - "learning_rate": 9.02919168154941e-07, - "loss": 0.707, - "step": 63794 - }, - { - "epoch": 1.64, - "learning_rate": 9.028916284395935e-07, - "loss": 0.7188, - "step": 63795 - }, - { - "epoch": 1.64, - "learning_rate": 9.02864088798597e-07, - "loss": 0.7998, - "step": 63796 - }, - { - "epoch": 1.64, - "learning_rate": 9.028365492319734e-07, - "loss": 0.5599, - "step": 63797 - }, - { - "epoch": 1.64, - "learning_rate": 9.02809009739743e-07, - "loss": 0.45, - "step": 63798 - }, - { - "epoch": 1.64, - "learning_rate": 9.027814703219277e-07, - "loss": 0.7871, - "step": 63799 - }, - { - "epoch": 1.64, - "learning_rate": 9.027539309785478e-07, - "loss": 0.7646, - "step": 63800 - }, - { - "epoch": 1.64, - "learning_rate": 9.027263917096249e-07, - "loss": 0.5845, - "step": 63801 - }, - { - "epoch": 1.64, - "learning_rate": 9.026988525151799e-07, - "loss": 0.7861, - "step": 63802 - }, - { - "epoch": 1.64, - "learning_rate": 9.026713133952339e-07, - "loss": 0.7705, - "step": 63803 - }, - { - "epoch": 1.64, - "learning_rate": 9.026437743498084e-07, - "loss": 0.6523, - "step": 63804 - }, - { - "epoch": 1.64, - "learning_rate": 9.026162353789236e-07, - "loss": 0.6035, - "step": 63805 - }, - { - "epoch": 1.64, - "learning_rate": 9.025886964826014e-07, - "loss": 0.5809, - "step": 63806 - }, - { - "epoch": 1.64, - "learning_rate": 9.025611576608622e-07, - "loss": 0.5859, - "step": 63807 - }, - { - "epoch": 1.64, - "learning_rate": 9.025336189137277e-07, - "loss": 0.8203, - "step": 63808 - }, - { - "epoch": 1.64, - "learning_rate": 9.025060802412184e-07, - "loss": 0.7422, - "step": 63809 - }, - { - "epoch": 1.64, - "learning_rate": 9.024785416433562e-07, - "loss": 0.5503, - "step": 63810 - }, - { - "epoch": 1.64, - "learning_rate": 9.024510031201614e-07, - "loss": 0.6787, - "step": 63811 - }, - { - "epoch": 1.64, - "learning_rate": 9.024234646716553e-07, - "loss": 0.5605, - "step": 63812 - }, - { - "epoch": 1.64, - "learning_rate": 9.023959262978593e-07, - "loss": 0.5737, - "step": 63813 - }, - { - "epoch": 1.64, - "learning_rate": 9.023683879987945e-07, - "loss": 0.7773, - "step": 63814 - }, - { - "epoch": 1.64, - "learning_rate": 9.023408497744813e-07, - "loss": 0.644, - "step": 63815 - }, - { - "epoch": 1.64, - "learning_rate": 9.023133116249413e-07, - "loss": 0.8066, - "step": 63816 - }, - { - "epoch": 1.64, - "learning_rate": 9.022857735501953e-07, - "loss": 0.7021, - "step": 63817 - }, - { - "epoch": 1.64, - "learning_rate": 9.022582355502649e-07, - "loss": 0.6091, - "step": 63818 - }, - { - "epoch": 1.64, - "learning_rate": 9.022306976251705e-07, - "loss": 0.6855, - "step": 63819 - }, - { - "epoch": 1.64, - "learning_rate": 9.02203159774934e-07, - "loss": 0.6265, - "step": 63820 - }, - { - "epoch": 1.64, - "learning_rate": 9.021756219995757e-07, - "loss": 0.6504, - "step": 63821 - }, - { - "epoch": 1.64, - "learning_rate": 9.021480842991174e-07, - "loss": 0.7217, - "step": 63822 - }, - { - "epoch": 1.64, - "learning_rate": 9.021205466735794e-07, - "loss": 0.6279, - "step": 63823 - }, - { - "epoch": 1.64, - "learning_rate": 9.020930091229837e-07, - "loss": 0.6611, - "step": 63824 - }, - { - "epoch": 1.64, - "learning_rate": 9.020654716473507e-07, - "loss": 0.6069, - "step": 63825 - }, - { - "epoch": 1.64, - "learning_rate": 9.020379342467014e-07, - "loss": 0.7598, - "step": 63826 - }, - { - "epoch": 1.64, - "learning_rate": 9.020103969210574e-07, - "loss": 0.5703, - "step": 63827 - }, - { - "epoch": 1.64, - "learning_rate": 9.019828596704393e-07, - "loss": 0.6221, - "step": 63828 - }, - { - "epoch": 1.64, - "learning_rate": 9.019553224948687e-07, - "loss": 0.7285, - "step": 63829 - }, - { - "epoch": 1.64, - "learning_rate": 9.019277853943664e-07, - "loss": 0.7627, - "step": 63830 - }, - { - "epoch": 1.64, - "learning_rate": 9.019002483689531e-07, - "loss": 0.6641, - "step": 63831 - }, - { - "epoch": 1.64, - "learning_rate": 9.018727114186506e-07, - "loss": 0.7617, - "step": 63832 - }, - { - "epoch": 1.64, - "learning_rate": 9.018451745434799e-07, - "loss": 0.6797, - "step": 63833 - }, - { - "epoch": 1.64, - "learning_rate": 9.018176377434613e-07, - "loss": 0.6226, - "step": 63834 - }, - { - "epoch": 1.64, - "learning_rate": 9.017901010186167e-07, - "loss": 0.5962, - "step": 63835 - }, - { - "epoch": 1.64, - "learning_rate": 9.017625643689667e-07, - "loss": 0.5962, - "step": 63836 - }, - { - "epoch": 1.64, - "learning_rate": 9.017350277945328e-07, - "loss": 0.6489, - "step": 63837 - }, - { - "epoch": 1.64, - "learning_rate": 9.017074912953357e-07, - "loss": 0.6943, - "step": 63838 - }, - { - "epoch": 1.64, - "learning_rate": 9.016799548713968e-07, - "loss": 0.6113, - "step": 63839 - }, - { - "epoch": 1.64, - "learning_rate": 9.016524185227368e-07, - "loss": 0.7598, - "step": 63840 - }, - { - "epoch": 1.64, - "learning_rate": 9.016248822493773e-07, - "loss": 0.665, - "step": 63841 - }, - { - "epoch": 1.64, - "learning_rate": 9.015973460513389e-07, - "loss": 0.6284, - "step": 63842 - }, - { - "epoch": 1.64, - "learning_rate": 9.015698099286432e-07, - "loss": 0.7939, - "step": 63843 - }, - { - "epoch": 1.64, - "learning_rate": 9.015422738813109e-07, - "loss": 0.6455, - "step": 63844 - }, - { - "epoch": 1.64, - "learning_rate": 9.015147379093629e-07, - "loss": 0.6797, - "step": 63845 - }, - { - "epoch": 1.64, - "learning_rate": 9.014872020128207e-07, - "loss": 0.637, - "step": 63846 - }, - { - "epoch": 1.64, - "learning_rate": 9.014596661917052e-07, - "loss": 0.5396, - "step": 63847 - }, - { - "epoch": 1.64, - "learning_rate": 9.014321304460374e-07, - "loss": 0.6484, - "step": 63848 - }, - { - "epoch": 1.64, - "learning_rate": 9.014045947758387e-07, - "loss": 0.6035, - "step": 63849 - }, - { - "epoch": 1.64, - "learning_rate": 9.013770591811296e-07, - "loss": 0.5537, - "step": 63850 - }, - { - "epoch": 1.64, - "learning_rate": 9.013495236619318e-07, - "loss": 0.6665, - "step": 63851 - }, - { - "epoch": 1.64, - "learning_rate": 9.01321988218266e-07, - "loss": 0.665, - "step": 63852 - }, - { - "epoch": 1.64, - "learning_rate": 9.012944528501538e-07, - "loss": 0.6162, - "step": 63853 - }, - { - "epoch": 1.64, - "learning_rate": 9.012669175576158e-07, - "loss": 0.9404, - "step": 63854 - }, - { - "epoch": 1.64, - "learning_rate": 9.012393823406728e-07, - "loss": 0.6621, - "step": 63855 - }, - { - "epoch": 1.64, - "learning_rate": 9.012118471993466e-07, - "loss": 0.5562, - "step": 63856 - }, - { - "epoch": 1.64, - "learning_rate": 9.011843121336577e-07, - "loss": 0.5503, - "step": 63857 - }, - { - "epoch": 1.64, - "learning_rate": 9.011567771436276e-07, - "loss": 0.4727, - "step": 63858 - }, - { - "epoch": 1.64, - "learning_rate": 9.01129242229277e-07, - "loss": 0.6187, - "step": 63859 - }, - { - "epoch": 1.64, - "learning_rate": 9.011017073906274e-07, - "loss": 0.6006, - "step": 63860 - }, - { - "epoch": 1.64, - "learning_rate": 9.010741726276994e-07, - "loss": 0.6436, - "step": 63861 - }, - { - "epoch": 1.64, - "learning_rate": 9.010466379405148e-07, - "loss": 0.6611, - "step": 63862 - }, - { - "epoch": 1.64, - "learning_rate": 9.010191033290943e-07, - "loss": 0.7578, - "step": 63863 - }, - { - "epoch": 1.64, - "learning_rate": 9.009915687934587e-07, - "loss": 0.6758, - "step": 63864 - }, - { - "epoch": 1.64, - "learning_rate": 9.009640343336291e-07, - "loss": 0.7939, - "step": 63865 - }, - { - "epoch": 1.64, - "learning_rate": 9.00936499949627e-07, - "loss": 0.5532, - "step": 63866 - }, - { - "epoch": 1.64, - "learning_rate": 9.009089656414731e-07, - "loss": 0.5952, - "step": 63867 - }, - { - "epoch": 1.64, - "learning_rate": 9.008814314091888e-07, - "loss": 0.6465, - "step": 63868 - }, - { - "epoch": 1.64, - "learning_rate": 9.008538972527948e-07, - "loss": 0.665, - "step": 63869 - }, - { - "epoch": 1.64, - "learning_rate": 9.008263631723128e-07, - "loss": 0.5276, - "step": 63870 - }, - { - "epoch": 1.64, - "learning_rate": 9.00798829167763e-07, - "loss": 0.5967, - "step": 63871 - }, - { - "epoch": 1.64, - "learning_rate": 9.007712952391673e-07, - "loss": 0.7051, - "step": 63872 - }, - { - "epoch": 1.64, - "learning_rate": 9.007437613865468e-07, - "loss": 0.5972, - "step": 63873 - }, - { - "epoch": 1.64, - "learning_rate": 9.007162276099218e-07, - "loss": 0.6846, - "step": 63874 - }, - { - "epoch": 1.64, - "learning_rate": 9.006886939093139e-07, - "loss": 0.5796, - "step": 63875 - }, - { - "epoch": 1.64, - "learning_rate": 9.006611602847439e-07, - "loss": 0.6035, - "step": 63876 - }, - { - "epoch": 1.64, - "learning_rate": 9.006336267362333e-07, - "loss": 0.5186, - "step": 63877 - }, - { - "epoch": 1.64, - "learning_rate": 9.006060932638029e-07, - "loss": 0.5596, - "step": 63878 - }, - { - "epoch": 1.64, - "learning_rate": 9.005785598674739e-07, - "loss": 0.5447, - "step": 63879 - }, - { - "epoch": 1.64, - "learning_rate": 9.005510265472672e-07, - "loss": 0.5308, - "step": 63880 - }, - { - "epoch": 1.64, - "learning_rate": 9.005234933032041e-07, - "loss": 0.6943, - "step": 63881 - }, - { - "epoch": 1.64, - "learning_rate": 9.004959601353055e-07, - "loss": 0.5474, - "step": 63882 - }, - { - "epoch": 1.64, - "learning_rate": 9.004684270435931e-07, - "loss": 0.5088, - "step": 63883 - }, - { - "epoch": 1.64, - "learning_rate": 9.004408940280869e-07, - "loss": 0.5674, - "step": 63884 - }, - { - "epoch": 1.64, - "learning_rate": 9.004133610888087e-07, - "loss": 0.6499, - "step": 63885 - }, - { - "epoch": 1.64, - "learning_rate": 9.003858282257791e-07, - "loss": 0.5171, - "step": 63886 - }, - { - "epoch": 1.64, - "learning_rate": 9.003582954390198e-07, - "loss": 0.3039, - "step": 63887 - }, - { - "epoch": 1.64, - "learning_rate": 9.003307627285514e-07, - "loss": 0.5312, - "step": 63888 - }, - { - "epoch": 1.64, - "learning_rate": 9.003032300943953e-07, - "loss": 0.6367, - "step": 63889 - }, - { - "epoch": 1.64, - "learning_rate": 9.002756975365723e-07, - "loss": 0.5566, - "step": 63890 - }, - { - "epoch": 1.64, - "learning_rate": 9.002481650551038e-07, - "loss": 0.6392, - "step": 63891 - }, - { - "epoch": 1.64, - "learning_rate": 9.002206326500105e-07, - "loss": 0.7275, - "step": 63892 - }, - { - "epoch": 1.64, - "learning_rate": 9.00193100321314e-07, - "loss": 0.7354, - "step": 63893 - }, - { - "epoch": 1.64, - "learning_rate": 9.001655680690349e-07, - "loss": 0.6743, - "step": 63894 - }, - { - "epoch": 1.64, - "learning_rate": 9.001380358931942e-07, - "loss": 0.6304, - "step": 63895 - }, - { - "epoch": 1.64, - "learning_rate": 9.001105037938135e-07, - "loss": 0.6245, - "step": 63896 - }, - { - "epoch": 1.64, - "learning_rate": 9.000829717709133e-07, - "loss": 0.8574, - "step": 63897 - }, - { - "epoch": 1.64, - "learning_rate": 9.000554398245152e-07, - "loss": 0.6406, - "step": 63898 - }, - { - "epoch": 1.64, - "learning_rate": 9.000279079546399e-07, - "loss": 0.7842, - "step": 63899 - }, - { - "epoch": 1.64, - "learning_rate": 9.000003761613088e-07, - "loss": 0.4658, - "step": 63900 - }, - { - "epoch": 1.64, - "learning_rate": 8.999728444445428e-07, - "loss": 0.5344, - "step": 63901 - }, - { - "epoch": 1.64, - "learning_rate": 8.999453128043628e-07, - "loss": 0.7422, - "step": 63902 - }, - { - "epoch": 1.64, - "learning_rate": 8.999177812407905e-07, - "loss": 0.5435, - "step": 63903 - }, - { - "epoch": 1.64, - "learning_rate": 8.998902497538463e-07, - "loss": 0.6914, - "step": 63904 - }, - { - "epoch": 1.64, - "learning_rate": 8.998627183435513e-07, - "loss": 0.7168, - "step": 63905 - }, - { - "epoch": 1.64, - "learning_rate": 8.998351870099271e-07, - "loss": 0.7236, - "step": 63906 - }, - { - "epoch": 1.64, - "learning_rate": 8.998076557529944e-07, - "loss": 0.5005, - "step": 63907 - }, - { - "epoch": 1.64, - "learning_rate": 8.997801245727743e-07, - "loss": 0.6982, - "step": 63908 - }, - { - "epoch": 1.64, - "learning_rate": 8.997525934692879e-07, - "loss": 0.5491, - "step": 63909 - }, - { - "epoch": 1.64, - "learning_rate": 8.997250624425565e-07, - "loss": 0.5903, - "step": 63910 - }, - { - "epoch": 1.64, - "learning_rate": 8.996975314926009e-07, - "loss": 0.5674, - "step": 63911 - }, - { - "epoch": 1.64, - "learning_rate": 8.996700006194425e-07, - "loss": 0.7031, - "step": 63912 - }, - { - "epoch": 1.64, - "learning_rate": 8.996424698231022e-07, - "loss": 0.626, - "step": 63913 - }, - { - "epoch": 1.64, - "learning_rate": 8.996149391036006e-07, - "loss": 0.5356, - "step": 63914 - }, - { - "epoch": 1.64, - "learning_rate": 8.995874084609596e-07, - "loss": 0.5581, - "step": 63915 - }, - { - "epoch": 1.64, - "learning_rate": 8.995598778951998e-07, - "loss": 0.6875, - "step": 63916 - }, - { - "epoch": 1.64, - "learning_rate": 8.995323474063423e-07, - "loss": 0.5723, - "step": 63917 - }, - { - "epoch": 1.64, - "learning_rate": 8.995048169944082e-07, - "loss": 0.4263, - "step": 63918 - }, - { - "epoch": 1.64, - "learning_rate": 8.994772866594189e-07, - "loss": 0.6509, - "step": 63919 - }, - { - "epoch": 1.64, - "learning_rate": 8.994497564013952e-07, - "loss": 0.6313, - "step": 63920 - }, - { - "epoch": 1.64, - "learning_rate": 8.994222262203579e-07, - "loss": 0.4771, - "step": 63921 - }, - { - "epoch": 1.64, - "learning_rate": 8.993946961163287e-07, - "loss": 0.647, - "step": 63922 - }, - { - "epoch": 1.64, - "learning_rate": 8.993671660893285e-07, - "loss": 0.6069, - "step": 63923 - }, - { - "epoch": 1.64, - "learning_rate": 8.993396361393778e-07, - "loss": 0.7505, - "step": 63924 - }, - { - "epoch": 1.64, - "learning_rate": 8.993121062664984e-07, - "loss": 0.5249, - "step": 63925 - }, - { - "epoch": 1.64, - "learning_rate": 8.992845764707108e-07, - "loss": 0.6436, - "step": 63926 - }, - { - "epoch": 1.64, - "learning_rate": 8.992570467520366e-07, - "loss": 0.5654, - "step": 63927 - }, - { - "epoch": 1.64, - "learning_rate": 8.992295171104963e-07, - "loss": 0.5493, - "step": 63928 - }, - { - "epoch": 1.64, - "learning_rate": 8.992019875461118e-07, - "loss": 0.5474, - "step": 63929 - }, - { - "epoch": 1.64, - "learning_rate": 8.991744580589033e-07, - "loss": 0.5715, - "step": 63930 - }, - { - "epoch": 1.64, - "learning_rate": 8.991469286488926e-07, - "loss": 0.6504, - "step": 63931 - }, - { - "epoch": 1.64, - "learning_rate": 8.991193993161002e-07, - "loss": 0.7217, - "step": 63932 - }, - { - "epoch": 1.64, - "learning_rate": 8.990918700605479e-07, - "loss": 0.8125, - "step": 63933 - }, - { - "epoch": 1.64, - "learning_rate": 8.99064340882256e-07, - "loss": 0.6333, - "step": 63934 - }, - { - "epoch": 1.64, - "learning_rate": 8.990368117812458e-07, - "loss": 0.6226, - "step": 63935 - }, - { - "epoch": 1.64, - "learning_rate": 8.990092827575386e-07, - "loss": 0.876, - "step": 63936 - }, - { - "epoch": 1.64, - "learning_rate": 8.989817538111554e-07, - "loss": 0.5942, - "step": 63937 - }, - { - "epoch": 1.64, - "learning_rate": 8.98954224942117e-07, - "loss": 0.7773, - "step": 63938 - }, - { - "epoch": 1.64, - "learning_rate": 8.98926696150445e-07, - "loss": 0.4991, - "step": 63939 - }, - { - "epoch": 1.64, - "learning_rate": 8.988991674361597e-07, - "loss": 0.5283, - "step": 63940 - }, - { - "epoch": 1.64, - "learning_rate": 8.988716387992832e-07, - "loss": 0.6343, - "step": 63941 - }, - { - "epoch": 1.64, - "learning_rate": 8.988441102398357e-07, - "loss": 0.6636, - "step": 63942 - }, - { - "epoch": 1.64, - "learning_rate": 8.988165817578389e-07, - "loss": 0.6313, - "step": 63943 - }, - { - "epoch": 1.64, - "learning_rate": 8.987890533533136e-07, - "loss": 0.5869, - "step": 63944 - }, - { - "epoch": 1.64, - "learning_rate": 8.987615250262804e-07, - "loss": 0.5586, - "step": 63945 - }, - { - "epoch": 1.64, - "learning_rate": 8.987339967767613e-07, - "loss": 0.5781, - "step": 63946 - }, - { - "epoch": 1.64, - "learning_rate": 8.987064686047766e-07, - "loss": 0.7852, - "step": 63947 - }, - { - "epoch": 1.64, - "learning_rate": 8.986789405103478e-07, - "loss": 0.416, - "step": 63948 - }, - { - "epoch": 1.64, - "learning_rate": 8.98651412493496e-07, - "loss": 0.6514, - "step": 63949 - }, - { - "epoch": 1.64, - "learning_rate": 8.986238845542421e-07, - "loss": 0.6572, - "step": 63950 - }, - { - "epoch": 1.64, - "learning_rate": 8.985963566926071e-07, - "loss": 0.5825, - "step": 63951 - }, - { - "epoch": 1.64, - "learning_rate": 8.985688289086124e-07, - "loss": 0.7168, - "step": 63952 - }, - { - "epoch": 1.64, - "learning_rate": 8.985413012022791e-07, - "loss": 0.5059, - "step": 63953 - }, - { - "epoch": 1.64, - "learning_rate": 8.985137735736278e-07, - "loss": 0.7246, - "step": 63954 - }, - { - "epoch": 1.64, - "learning_rate": 8.984862460226797e-07, - "loss": 0.5205, - "step": 63955 - }, - { - "epoch": 1.64, - "learning_rate": 8.984587185494561e-07, - "loss": 0.6182, - "step": 63956 - }, - { - "epoch": 1.64, - "learning_rate": 8.984311911539779e-07, - "loss": 0.5645, - "step": 63957 - }, - { - "epoch": 1.64, - "learning_rate": 8.984036638362664e-07, - "loss": 0.6206, - "step": 63958 - }, - { - "epoch": 1.64, - "learning_rate": 8.983761365963425e-07, - "loss": 0.5078, - "step": 63959 - }, - { - "epoch": 1.64, - "learning_rate": 8.983486094342273e-07, - "loss": 0.6982, - "step": 63960 - }, - { - "epoch": 1.64, - "learning_rate": 8.983210823499419e-07, - "loss": 0.6338, - "step": 63961 - }, - { - "epoch": 1.64, - "learning_rate": 8.982935553435074e-07, - "loss": 0.7295, - "step": 63962 - }, - { - "epoch": 1.64, - "learning_rate": 8.982660284149452e-07, - "loss": 0.8184, - "step": 63963 - }, - { - "epoch": 1.64, - "learning_rate": 8.982385015642755e-07, - "loss": 0.5718, - "step": 63964 - }, - { - "epoch": 1.64, - "learning_rate": 8.982109747915202e-07, - "loss": 0.5825, - "step": 63965 - }, - { - "epoch": 1.64, - "learning_rate": 8.981834480966997e-07, - "loss": 0.7061, - "step": 63966 - }, - { - "epoch": 1.64, - "learning_rate": 8.981559214798359e-07, - "loss": 0.6318, - "step": 63967 - }, - { - "epoch": 1.64, - "learning_rate": 8.98128394940949e-07, - "loss": 0.533, - "step": 63968 - }, - { - "epoch": 1.64, - "learning_rate": 8.981008684800608e-07, - "loss": 0.6655, - "step": 63969 - }, - { - "epoch": 1.64, - "learning_rate": 8.980733420971918e-07, - "loss": 0.5571, - "step": 63970 - }, - { - "epoch": 1.64, - "learning_rate": 8.980458157923638e-07, - "loss": 0.7246, - "step": 63971 - }, - { - "epoch": 1.64, - "learning_rate": 8.98018289565597e-07, - "loss": 0.7178, - "step": 63972 - }, - { - "epoch": 1.64, - "learning_rate": 8.979907634169137e-07, - "loss": 0.6777, - "step": 63973 - }, - { - "epoch": 1.64, - "learning_rate": 8.979632373463334e-07, - "loss": 0.6934, - "step": 63974 - }, - { - "epoch": 1.64, - "learning_rate": 8.979357113538783e-07, - "loss": 0.4824, - "step": 63975 - }, - { - "epoch": 1.64, - "learning_rate": 8.979081854395687e-07, - "loss": 0.6562, - "step": 63976 - }, - { - "epoch": 1.64, - "learning_rate": 8.978806596034265e-07, - "loss": 0.5078, - "step": 63977 - }, - { - "epoch": 1.64, - "learning_rate": 8.978531338454721e-07, - "loss": 0.5422, - "step": 63978 - }, - { - "epoch": 1.64, - "learning_rate": 8.978256081657271e-07, - "loss": 0.5895, - "step": 63979 - }, - { - "epoch": 1.64, - "learning_rate": 8.977980825642122e-07, - "loss": 0.7598, - "step": 63980 - }, - { - "epoch": 1.64, - "learning_rate": 8.977705570409487e-07, - "loss": 0.6758, - "step": 63981 - }, - { - "epoch": 1.64, - "learning_rate": 8.977430315959575e-07, - "loss": 0.3647, - "step": 63982 - }, - { - "epoch": 1.64, - "learning_rate": 8.977155062292601e-07, - "loss": 0.6128, - "step": 63983 - }, - { - "epoch": 1.64, - "learning_rate": 8.976879809408769e-07, - "loss": 0.6387, - "step": 63984 - }, - { - "epoch": 1.64, - "learning_rate": 8.976604557308293e-07, - "loss": 0.6353, - "step": 63985 - }, - { - "epoch": 1.64, - "learning_rate": 8.976329305991385e-07, - "loss": 0.6592, - "step": 63986 - }, - { - "epoch": 1.64, - "learning_rate": 8.976054055458253e-07, - "loss": 0.8291, - "step": 63987 - }, - { - "epoch": 1.64, - "learning_rate": 8.975778805709111e-07, - "loss": 0.5171, - "step": 63988 - }, - { - "epoch": 1.64, - "learning_rate": 8.975503556744166e-07, - "loss": 0.4854, - "step": 63989 - }, - { - "epoch": 1.64, - "learning_rate": 8.975228308563632e-07, - "loss": 0.6802, - "step": 63990 - }, - { - "epoch": 1.64, - "learning_rate": 8.974953061167721e-07, - "loss": 0.6953, - "step": 63991 - }, - { - "epoch": 1.64, - "learning_rate": 8.974677814556637e-07, - "loss": 0.6167, - "step": 63992 - }, - { - "epoch": 1.64, - "learning_rate": 8.9744025687306e-07, - "loss": 0.792, - "step": 63993 - }, - { - "epoch": 1.64, - "learning_rate": 8.974127323689814e-07, - "loss": 0.5854, - "step": 63994 - }, - { - "epoch": 1.64, - "learning_rate": 8.973852079434489e-07, - "loss": 0.5908, - "step": 63995 - }, - { - "epoch": 1.64, - "learning_rate": 8.97357683596484e-07, - "loss": 0.7305, - "step": 63996 - }, - { - "epoch": 1.64, - "learning_rate": 8.973301593281075e-07, - "loss": 0.6284, - "step": 63997 - }, - { - "epoch": 1.64, - "learning_rate": 8.973026351383407e-07, - "loss": 0.6572, - "step": 63998 - }, - { - "epoch": 1.64, - "learning_rate": 8.972751110272044e-07, - "loss": 0.6748, - "step": 63999 - }, - { - "epoch": 1.64, - "learning_rate": 8.972475869947199e-07, - "loss": 0.6167, - "step": 64000 - }, - { - "epoch": 1.64, - "learning_rate": 8.972200630409081e-07, - "loss": 0.3369, - "step": 64001 - }, - { - "epoch": 1.64, - "learning_rate": 8.971925391657904e-07, - "loss": 0.6929, - "step": 64002 - }, - { - "epoch": 1.64, - "learning_rate": 8.971650153693878e-07, - "loss": 0.647, - "step": 64003 - }, - { - "epoch": 1.64, - "learning_rate": 8.971374916517209e-07, - "loss": 0.5615, - "step": 64004 - }, - { - "epoch": 1.64, - "learning_rate": 8.971099680128113e-07, - "loss": 0.5139, - "step": 64005 - }, - { - "epoch": 1.64, - "learning_rate": 8.970824444526794e-07, - "loss": 0.6807, - "step": 64006 - }, - { - "epoch": 1.64, - "learning_rate": 8.970549209713471e-07, - "loss": 0.6763, - "step": 64007 - }, - { - "epoch": 1.64, - "learning_rate": 8.97027397568835e-07, - "loss": 0.7441, - "step": 64008 - }, - { - "epoch": 1.64, - "learning_rate": 8.969998742451645e-07, - "loss": 0.6377, - "step": 64009 - }, - { - "epoch": 1.64, - "learning_rate": 8.969723510003564e-07, - "loss": 0.626, - "step": 64010 - }, - { - "epoch": 1.64, - "learning_rate": 8.969448278344316e-07, - "loss": 0.5349, - "step": 64011 - }, - { - "epoch": 1.64, - "learning_rate": 8.969173047474116e-07, - "loss": 0.6553, - "step": 64012 - }, - { - "epoch": 1.64, - "learning_rate": 8.968897817393176e-07, - "loss": 0.5186, - "step": 64013 - }, - { - "epoch": 1.64, - "learning_rate": 8.968622588101699e-07, - "loss": 0.7119, - "step": 64014 - }, - { - "epoch": 1.64, - "learning_rate": 8.968347359599901e-07, - "loss": 0.6562, - "step": 64015 - }, - { - "epoch": 1.64, - "learning_rate": 8.968072131887991e-07, - "loss": 0.7881, - "step": 64016 - }, - { - "epoch": 1.64, - "learning_rate": 8.967796904966183e-07, - "loss": 0.6475, - "step": 64017 - }, - { - "epoch": 1.64, - "learning_rate": 8.967521678834683e-07, - "loss": 0.6299, - "step": 64018 - }, - { - "epoch": 1.64, - "learning_rate": 8.967246453493707e-07, - "loss": 0.6152, - "step": 64019 - }, - { - "epoch": 1.64, - "learning_rate": 8.966971228943458e-07, - "loss": 0.7607, - "step": 64020 - }, - { - "epoch": 1.64, - "learning_rate": 8.966696005184157e-07, - "loss": 0.4971, - "step": 64021 - }, - { - "epoch": 1.64, - "learning_rate": 8.966420782216006e-07, - "loss": 0.4658, - "step": 64022 - }, - { - "epoch": 1.64, - "learning_rate": 8.966145560039223e-07, - "loss": 0.624, - "step": 64023 - }, - { - "epoch": 1.64, - "learning_rate": 8.965870338654014e-07, - "loss": 0.4866, - "step": 64024 - }, - { - "epoch": 1.64, - "learning_rate": 8.965595118060587e-07, - "loss": 0.8252, - "step": 64025 - }, - { - "epoch": 1.64, - "learning_rate": 8.965319898259158e-07, - "loss": 0.7305, - "step": 64026 - }, - { - "epoch": 1.64, - "learning_rate": 8.965044679249938e-07, - "loss": 0.667, - "step": 64027 - }, - { - "epoch": 1.64, - "learning_rate": 8.964769461033133e-07, - "loss": 0.6377, - "step": 64028 - }, - { - "epoch": 1.64, - "learning_rate": 8.964494243608957e-07, - "loss": 0.6602, - "step": 64029 - }, - { - "epoch": 1.64, - "learning_rate": 8.964219026977619e-07, - "loss": 0.5317, - "step": 64030 - }, - { - "epoch": 1.64, - "learning_rate": 8.963943811139333e-07, - "loss": 0.8564, - "step": 64031 - }, - { - "epoch": 1.64, - "learning_rate": 8.963668596094305e-07, - "loss": 0.5049, - "step": 64032 - }, - { - "epoch": 1.64, - "learning_rate": 8.963393381842753e-07, - "loss": 0.6021, - "step": 64033 - }, - { - "epoch": 1.64, - "learning_rate": 8.963118168384881e-07, - "loss": 0.5139, - "step": 64034 - }, - { - "epoch": 1.64, - "learning_rate": 8.9628429557209e-07, - "loss": 0.561, - "step": 64035 - }, - { - "epoch": 1.64, - "learning_rate": 8.962567743851024e-07, - "loss": 0.6816, - "step": 64036 - }, - { - "epoch": 1.64, - "learning_rate": 8.962292532775459e-07, - "loss": 0.708, - "step": 64037 - }, - { - "epoch": 1.64, - "learning_rate": 8.962017322494423e-07, - "loss": 0.7695, - "step": 64038 - }, - { - "epoch": 1.64, - "learning_rate": 8.961742113008119e-07, - "loss": 0.6396, - "step": 64039 - }, - { - "epoch": 1.64, - "learning_rate": 8.961466904316764e-07, - "loss": 0.5635, - "step": 64040 - }, - { - "epoch": 1.64, - "learning_rate": 8.961191696420564e-07, - "loss": 0.6279, - "step": 64041 - }, - { - "epoch": 1.64, - "learning_rate": 8.960916489319734e-07, - "loss": 0.6844, - "step": 64042 - }, - { - "epoch": 1.64, - "learning_rate": 8.960641283014485e-07, - "loss": 0.7622, - "step": 64043 - }, - { - "epoch": 1.64, - "learning_rate": 8.960366077505023e-07, - "loss": 0.5918, - "step": 64044 - }, - { - "epoch": 1.64, - "learning_rate": 8.960090872791558e-07, - "loss": 0.6865, - "step": 64045 - }, - { - "epoch": 1.64, - "learning_rate": 8.959815668874305e-07, - "loss": 0.4868, - "step": 64046 - }, - { - "epoch": 1.64, - "learning_rate": 8.959540465753474e-07, - "loss": 0.6025, - "step": 64047 - }, - { - "epoch": 1.64, - "learning_rate": 8.959265263429274e-07, - "loss": 0.5195, - "step": 64048 - }, - { - "epoch": 1.64, - "learning_rate": 8.958990061901917e-07, - "loss": 0.5862, - "step": 64049 - }, - { - "epoch": 1.64, - "learning_rate": 8.958714861171614e-07, - "loss": 0.7705, - "step": 64050 - }, - { - "epoch": 1.64, - "learning_rate": 8.958439661238573e-07, - "loss": 0.6484, - "step": 64051 - }, - { - "epoch": 1.64, - "learning_rate": 8.958164462103009e-07, - "loss": 0.666, - "step": 64052 - }, - { - "epoch": 1.64, - "learning_rate": 8.957889263765134e-07, - "loss": 0.7217, - "step": 64053 - }, - { - "epoch": 1.64, - "learning_rate": 8.957614066225149e-07, - "loss": 0.6484, - "step": 64054 - }, - { - "epoch": 1.64, - "learning_rate": 8.957338869483276e-07, - "loss": 0.6514, - "step": 64055 - }, - { - "epoch": 1.64, - "learning_rate": 8.957063673539716e-07, - "loss": 0.7354, - "step": 64056 - }, - { - "epoch": 1.64, - "learning_rate": 8.956788478394688e-07, - "loss": 0.6914, - "step": 64057 - }, - { - "epoch": 1.64, - "learning_rate": 8.956513284048396e-07, - "loss": 0.583, - "step": 64058 - }, - { - "epoch": 1.64, - "learning_rate": 8.956238090501057e-07, - "loss": 0.7979, - "step": 64059 - }, - { - "epoch": 1.64, - "learning_rate": 8.955962897752876e-07, - "loss": 0.6321, - "step": 64060 - }, - { - "epoch": 1.64, - "learning_rate": 8.955687705804067e-07, - "loss": 0.6553, - "step": 64061 - }, - { - "epoch": 1.64, - "learning_rate": 8.955412514654839e-07, - "loss": 0.6294, - "step": 64062 - }, - { - "epoch": 1.64, - "learning_rate": 8.955137324305409e-07, - "loss": 0.6377, - "step": 64063 - }, - { - "epoch": 1.64, - "learning_rate": 8.954862134755978e-07, - "loss": 0.6841, - "step": 64064 - }, - { - "epoch": 1.64, - "learning_rate": 8.954586946006761e-07, - "loss": 0.7783, - "step": 64065 - }, - { - "epoch": 1.64, - "learning_rate": 8.954311758057969e-07, - "loss": 0.7637, - "step": 64066 - }, - { - "epoch": 1.64, - "learning_rate": 8.954036570909813e-07, - "loss": 0.4819, - "step": 64067 - }, - { - "epoch": 1.64, - "learning_rate": 8.953761384562499e-07, - "loss": 0.604, - "step": 64068 - }, - { - "epoch": 1.64, - "learning_rate": 8.953486199016246e-07, - "loss": 0.8096, - "step": 64069 - }, - { - "epoch": 1.64, - "learning_rate": 8.953211014271259e-07, - "loss": 0.5562, - "step": 64070 - }, - { - "epoch": 1.64, - "learning_rate": 8.952935830327751e-07, - "loss": 0.5811, - "step": 64071 - }, - { - "epoch": 1.64, - "learning_rate": 8.95266064718593e-07, - "loss": 0.6108, - "step": 64072 - }, - { - "epoch": 1.64, - "learning_rate": 8.952385464846014e-07, - "loss": 0.5188, - "step": 64073 - }, - { - "epoch": 1.64, - "learning_rate": 8.952110283308205e-07, - "loss": 0.7266, - "step": 64074 - }, - { - "epoch": 1.64, - "learning_rate": 8.951835102572716e-07, - "loss": 0.7285, - "step": 64075 - }, - { - "epoch": 1.64, - "learning_rate": 8.95155992263976e-07, - "loss": 0.566, - "step": 64076 - }, - { - "epoch": 1.64, - "learning_rate": 8.951284743509544e-07, - "loss": 0.5835, - "step": 64077 - }, - { - "epoch": 1.64, - "learning_rate": 8.951009565182283e-07, - "loss": 0.875, - "step": 64078 - }, - { - "epoch": 1.64, - "learning_rate": 8.950734387658183e-07, - "loss": 0.6562, - "step": 64079 - }, - { - "epoch": 1.64, - "learning_rate": 8.950459210937462e-07, - "loss": 0.4822, - "step": 64080 - }, - { - "epoch": 1.64, - "learning_rate": 8.950184035020321e-07, - "loss": 0.6792, - "step": 64081 - }, - { - "epoch": 1.64, - "learning_rate": 8.949908859906981e-07, - "loss": 0.7402, - "step": 64082 - }, - { - "epoch": 1.64, - "learning_rate": 8.949633685597647e-07, - "loss": 0.3672, - "step": 64083 - }, - { - "epoch": 1.64, - "learning_rate": 8.94935851209253e-07, - "loss": 0.6992, - "step": 64084 - }, - { - "epoch": 1.64, - "learning_rate": 8.949083339391837e-07, - "loss": 0.6172, - "step": 64085 - }, - { - "epoch": 1.64, - "learning_rate": 8.948808167495786e-07, - "loss": 0.5605, - "step": 64086 - }, - { - "epoch": 1.64, - "learning_rate": 8.948532996404582e-07, - "loss": 0.6904, - "step": 64087 - }, - { - "epoch": 1.64, - "learning_rate": 8.948257826118439e-07, - "loss": 0.7588, - "step": 64088 - }, - { - "epoch": 1.64, - "learning_rate": 8.947982656637566e-07, - "loss": 0.6611, - "step": 64089 - }, - { - "epoch": 1.64, - "learning_rate": 8.947707487962175e-07, - "loss": 0.6895, - "step": 64090 - }, - { - "epoch": 1.64, - "learning_rate": 8.947432320092475e-07, - "loss": 0.5669, - "step": 64091 - }, - { - "epoch": 1.64, - "learning_rate": 8.94715715302868e-07, - "loss": 0.6787, - "step": 64092 - }, - { - "epoch": 1.64, - "learning_rate": 8.946881986771e-07, - "loss": 0.6885, - "step": 64093 - }, - { - "epoch": 1.64, - "learning_rate": 8.946606821319639e-07, - "loss": 0.5078, - "step": 64094 - }, - { - "epoch": 1.64, - "learning_rate": 8.946331656674816e-07, - "loss": 0.4719, - "step": 64095 - }, - { - "epoch": 1.64, - "learning_rate": 8.946056492836736e-07, - "loss": 0.4592, - "step": 64096 - }, - { - "epoch": 1.64, - "learning_rate": 8.945781329805613e-07, - "loss": 0.6174, - "step": 64097 - }, - { - "epoch": 1.64, - "learning_rate": 8.945506167581655e-07, - "loss": 0.6177, - "step": 64098 - }, - { - "epoch": 1.64, - "learning_rate": 8.945231006165079e-07, - "loss": 0.7754, - "step": 64099 - }, - { - "epoch": 1.64, - "learning_rate": 8.944955845556088e-07, - "loss": 0.6758, - "step": 64100 - }, - { - "epoch": 1.64, - "learning_rate": 8.944680685754895e-07, - "loss": 0.3979, - "step": 64101 - }, - { - "epoch": 1.64, - "learning_rate": 8.944405526761714e-07, - "loss": 0.5977, - "step": 64102 - }, - { - "epoch": 1.64, - "learning_rate": 8.944130368576754e-07, - "loss": 0.6465, - "step": 64103 - }, - { - "epoch": 1.64, - "learning_rate": 8.943855211200222e-07, - "loss": 0.5957, - "step": 64104 - }, - { - "epoch": 1.64, - "learning_rate": 8.943580054632334e-07, - "loss": 0.5347, - "step": 64105 - }, - { - "epoch": 1.64, - "learning_rate": 8.943304898873294e-07, - "loss": 0.3381, - "step": 64106 - }, - { - "epoch": 1.64, - "learning_rate": 8.94302974392332e-07, - "loss": 0.4387, - "step": 64107 - }, - { - "epoch": 1.64, - "learning_rate": 8.942754589782617e-07, - "loss": 0.6094, - "step": 64108 - }, - { - "epoch": 1.64, - "learning_rate": 8.942479436451401e-07, - "loss": 0.667, - "step": 64109 - }, - { - "epoch": 1.64, - "learning_rate": 8.942204283929879e-07, - "loss": 0.3755, - "step": 64110 - }, - { - "epoch": 1.64, - "learning_rate": 8.941929132218262e-07, - "loss": 0.6562, - "step": 64111 - }, - { - "epoch": 1.64, - "learning_rate": 8.94165398131676e-07, - "loss": 0.625, - "step": 64112 - }, - { - "epoch": 1.64, - "learning_rate": 8.94137883122559e-07, - "loss": 0.4338, - "step": 64113 - }, - { - "epoch": 1.64, - "learning_rate": 8.941103681944955e-07, - "loss": 0.4849, - "step": 64114 - }, - { - "epoch": 1.64, - "learning_rate": 8.940828533475066e-07, - "loss": 0.6377, - "step": 64115 - }, - { - "epoch": 1.64, - "learning_rate": 8.940553385816137e-07, - "loss": 0.6841, - "step": 64116 - }, - { - "epoch": 1.64, - "learning_rate": 8.940278238968379e-07, - "loss": 0.6523, - "step": 64117 - }, - { - "epoch": 1.64, - "learning_rate": 8.940003092931999e-07, - "loss": 0.6245, - "step": 64118 - }, - { - "epoch": 1.64, - "learning_rate": 8.939727947707212e-07, - "loss": 0.6763, - "step": 64119 - }, - { - "epoch": 1.64, - "learning_rate": 8.939452803294224e-07, - "loss": 0.6467, - "step": 64120 - }, - { - "epoch": 1.64, - "learning_rate": 8.93917765969325e-07, - "loss": 0.4954, - "step": 64121 - }, - { - "epoch": 1.64, - "learning_rate": 8.938902516904497e-07, - "loss": 0.5308, - "step": 64122 - }, - { - "epoch": 1.64, - "learning_rate": 8.938627374928182e-07, - "loss": 0.6987, - "step": 64123 - }, - { - "epoch": 1.64, - "learning_rate": 8.938352233764509e-07, - "loss": 0.5625, - "step": 64124 - }, - { - "epoch": 1.64, - "learning_rate": 8.938077093413689e-07, - "loss": 0.7109, - "step": 64125 - }, - { - "epoch": 1.64, - "learning_rate": 8.937801953875937e-07, - "loss": 0.4004, - "step": 64126 - }, - { - "epoch": 1.64, - "learning_rate": 8.937526815151459e-07, - "loss": 0.4854, - "step": 64127 - }, - { - "epoch": 1.64, - "learning_rate": 8.937251677240469e-07, - "loss": 0.7344, - "step": 64128 - }, - { - "epoch": 1.64, - "learning_rate": 8.936976540143175e-07, - "loss": 0.624, - "step": 64129 - }, - { - "epoch": 1.64, - "learning_rate": 8.936701403859791e-07, - "loss": 0.5906, - "step": 64130 - }, - { - "epoch": 1.64, - "learning_rate": 8.936426268390524e-07, - "loss": 0.5288, - "step": 64131 - }, - { - "epoch": 1.64, - "learning_rate": 8.936151133735591e-07, - "loss": 0.552, - "step": 64132 - }, - { - "epoch": 1.64, - "learning_rate": 8.935875999895195e-07, - "loss": 0.4695, - "step": 64133 - }, - { - "epoch": 1.64, - "learning_rate": 8.935600866869551e-07, - "loss": 0.7627, - "step": 64134 - }, - { - "epoch": 1.64, - "learning_rate": 8.935325734658866e-07, - "loss": 0.4861, - "step": 64135 - }, - { - "epoch": 1.64, - "learning_rate": 8.935050603263356e-07, - "loss": 0.5415, - "step": 64136 - }, - { - "epoch": 1.64, - "learning_rate": 8.934775472683224e-07, - "loss": 0.5728, - "step": 64137 - }, - { - "epoch": 1.64, - "learning_rate": 8.93450034291869e-07, - "loss": 0.4638, - "step": 64138 - }, - { - "epoch": 1.64, - "learning_rate": 8.934225213969958e-07, - "loss": 0.792, - "step": 64139 - }, - { - "epoch": 1.64, - "learning_rate": 8.933950085837242e-07, - "loss": 0.7021, - "step": 64140 - }, - { - "epoch": 1.64, - "learning_rate": 8.933674958520749e-07, - "loss": 0.4536, - "step": 64141 - }, - { - "epoch": 1.64, - "learning_rate": 8.933399832020697e-07, - "loss": 0.5796, - "step": 64142 - }, - { - "epoch": 1.64, - "learning_rate": 8.93312470633729e-07, - "loss": 0.6562, - "step": 64143 - }, - { - "epoch": 1.64, - "learning_rate": 8.932849581470737e-07, - "loss": 0.6323, - "step": 64144 - }, - { - "epoch": 1.64, - "learning_rate": 8.932574457421256e-07, - "loss": 0.7617, - "step": 64145 - }, - { - "epoch": 1.64, - "learning_rate": 8.932299334189049e-07, - "loss": 0.6265, - "step": 64146 - }, - { - "epoch": 1.64, - "learning_rate": 8.932024211774335e-07, - "loss": 0.6416, - "step": 64147 - }, - { - "epoch": 1.64, - "learning_rate": 8.931749090177318e-07, - "loss": 0.6011, - "step": 64148 - }, - { - "epoch": 1.64, - "learning_rate": 8.931473969398215e-07, - "loss": 0.3865, - "step": 64149 - }, - { - "epoch": 1.64, - "learning_rate": 8.93119884943723e-07, - "loss": 0.6321, - "step": 64150 - }, - { - "epoch": 1.64, - "learning_rate": 8.93092373029458e-07, - "loss": 0.6714, - "step": 64151 - }, - { - "epoch": 1.64, - "learning_rate": 8.930648611970475e-07, - "loss": 0.5581, - "step": 64152 - }, - { - "epoch": 1.64, - "learning_rate": 8.93037349446512e-07, - "loss": 0.5833, - "step": 64153 - }, - { - "epoch": 1.64, - "learning_rate": 8.930098377778727e-07, - "loss": 0.564, - "step": 64154 - }, - { - "epoch": 1.64, - "learning_rate": 8.92982326191151e-07, - "loss": 0.5591, - "step": 64155 - }, - { - "epoch": 1.64, - "learning_rate": 8.929548146863677e-07, - "loss": 0.5513, - "step": 64156 - }, - { - "epoch": 1.64, - "learning_rate": 8.92927303263544e-07, - "loss": 0.6982, - "step": 64157 - }, - { - "epoch": 1.64, - "learning_rate": 8.928997919227009e-07, - "loss": 0.752, - "step": 64158 - }, - { - "epoch": 1.64, - "learning_rate": 8.928722806638597e-07, - "loss": 0.5358, - "step": 64159 - }, - { - "epoch": 1.64, - "learning_rate": 8.92844769487041e-07, - "loss": 0.5693, - "step": 64160 - }, - { - "epoch": 1.64, - "learning_rate": 8.928172583922664e-07, - "loss": 0.6895, - "step": 64161 - }, - { - "epoch": 1.64, - "learning_rate": 8.92789747379557e-07, - "loss": 0.5068, - "step": 64162 - }, - { - "epoch": 1.64, - "learning_rate": 8.92762236448933e-07, - "loss": 0.6602, - "step": 64163 - }, - { - "epoch": 1.64, - "learning_rate": 8.927347256004162e-07, - "loss": 0.749, - "step": 64164 - }, - { - "epoch": 1.64, - "learning_rate": 8.927072148340273e-07, - "loss": 0.6113, - "step": 64165 - }, - { - "epoch": 1.64, - "learning_rate": 8.926797041497878e-07, - "loss": 0.4634, - "step": 64166 - }, - { - "epoch": 1.64, - "learning_rate": 8.926521935477183e-07, - "loss": 0.7598, - "step": 64167 - }, - { - "epoch": 1.64, - "learning_rate": 8.926246830278403e-07, - "loss": 0.604, - "step": 64168 - }, - { - "epoch": 1.64, - "learning_rate": 8.925971725901745e-07, - "loss": 0.6914, - "step": 64169 - }, - { - "epoch": 1.64, - "learning_rate": 8.925696622347423e-07, - "loss": 0.4893, - "step": 64170 - }, - { - "epoch": 1.64, - "learning_rate": 8.925421519615642e-07, - "loss": 0.6309, - "step": 64171 - }, - { - "epoch": 1.64, - "learning_rate": 8.925146417706625e-07, - "loss": 0.5732, - "step": 64172 - }, - { - "epoch": 1.64, - "learning_rate": 8.924871316620566e-07, - "loss": 0.5649, - "step": 64173 - }, - { - "epoch": 1.64, - "learning_rate": 8.924596216357686e-07, - "loss": 0.6758, - "step": 64174 - }, - { - "epoch": 1.64, - "learning_rate": 8.924321116918191e-07, - "loss": 0.6416, - "step": 64175 - }, - { - "epoch": 1.64, - "learning_rate": 8.924046018302297e-07, - "loss": 0.5967, - "step": 64176 - }, - { - "epoch": 1.64, - "learning_rate": 8.923770920510209e-07, - "loss": 0.7236, - "step": 64177 - }, - { - "epoch": 1.64, - "learning_rate": 8.923495823542141e-07, - "loss": 0.5542, - "step": 64178 - }, - { - "epoch": 1.64, - "learning_rate": 8.923220727398302e-07, - "loss": 0.4839, - "step": 64179 - }, - { - "epoch": 1.64, - "learning_rate": 8.922945632078905e-07, - "loss": 0.5649, - "step": 64180 - }, - { - "epoch": 1.64, - "learning_rate": 8.922670537584156e-07, - "loss": 0.7295, - "step": 64181 - }, - { - "epoch": 1.65, - "learning_rate": 8.922395443914274e-07, - "loss": 0.6328, - "step": 64182 - }, - { - "epoch": 1.65, - "learning_rate": 8.922120351069462e-07, - "loss": 0.4889, - "step": 64183 - }, - { - "epoch": 1.65, - "learning_rate": 8.921845259049931e-07, - "loss": 0.4729, - "step": 64184 - }, - { - "epoch": 1.65, - "learning_rate": 8.921570167855894e-07, - "loss": 0.7119, - "step": 64185 - }, - { - "epoch": 1.65, - "learning_rate": 8.92129507748756e-07, - "loss": 0.7549, - "step": 64186 - }, - { - "epoch": 1.65, - "learning_rate": 8.921019987945144e-07, - "loss": 0.6333, - "step": 64187 - }, - { - "epoch": 1.65, - "learning_rate": 8.920744899228851e-07, - "loss": 0.7715, - "step": 64188 - }, - { - "epoch": 1.65, - "learning_rate": 8.920469811338894e-07, - "loss": 0.4742, - "step": 64189 - }, - { - "epoch": 1.65, - "learning_rate": 8.920194724275486e-07, - "loss": 0.6445, - "step": 64190 - }, - { - "epoch": 1.65, - "learning_rate": 8.919919638038832e-07, - "loss": 0.6528, - "step": 64191 - }, - { - "epoch": 1.65, - "learning_rate": 8.919644552629151e-07, - "loss": 0.5908, - "step": 64192 - }, - { - "epoch": 1.65, - "learning_rate": 8.919369468046644e-07, - "loss": 0.7314, - "step": 64193 - }, - { - "epoch": 1.65, - "learning_rate": 8.919094384291527e-07, - "loss": 0.6196, - "step": 64194 - }, - { - "epoch": 1.65, - "learning_rate": 8.918819301364011e-07, - "loss": 0.6582, - "step": 64195 - }, - { - "epoch": 1.65, - "learning_rate": 8.918544219264302e-07, - "loss": 0.7529, - "step": 64196 - }, - { - "epoch": 1.65, - "learning_rate": 8.918269137992618e-07, - "loss": 0.6548, - "step": 64197 - }, - { - "epoch": 1.65, - "learning_rate": 8.917994057549161e-07, - "loss": 0.6729, - "step": 64198 - }, - { - "epoch": 1.65, - "learning_rate": 8.91771897793415e-07, - "loss": 0.6196, - "step": 64199 - }, - { - "epoch": 1.65, - "learning_rate": 8.917443899147789e-07, - "loss": 0.4061, - "step": 64200 - }, - { - "epoch": 1.65, - "learning_rate": 8.917168821190295e-07, - "loss": 0.6445, - "step": 64201 - }, - { - "epoch": 1.65, - "learning_rate": 8.916893744061875e-07, - "loss": 0.5581, - "step": 64202 - }, - { - "epoch": 1.65, - "learning_rate": 8.916618667762737e-07, - "loss": 0.7109, - "step": 64203 - }, - { - "epoch": 1.65, - "learning_rate": 8.916343592293096e-07, - "loss": 0.8086, - "step": 64204 - }, - { - "epoch": 1.65, - "learning_rate": 8.916068517653159e-07, - "loss": 0.7803, - "step": 64205 - }, - { - "epoch": 1.65, - "learning_rate": 8.91579344384314e-07, - "loss": 0.751, - "step": 64206 - }, - { - "epoch": 1.65, - "learning_rate": 8.915518370863249e-07, - "loss": 0.5835, - "step": 64207 - }, - { - "epoch": 1.65, - "learning_rate": 8.915243298713693e-07, - "loss": 0.6299, - "step": 64208 - }, - { - "epoch": 1.65, - "learning_rate": 8.914968227394687e-07, - "loss": 0.5532, - "step": 64209 - }, - { - "epoch": 1.65, - "learning_rate": 8.914693156906438e-07, - "loss": 0.6816, - "step": 64210 - }, - { - "epoch": 1.65, - "learning_rate": 8.91441808724916e-07, - "loss": 0.7549, - "step": 64211 - }, - { - "epoch": 1.65, - "learning_rate": 8.914143018423066e-07, - "loss": 0.5947, - "step": 64212 - }, - { - "epoch": 1.65, - "learning_rate": 8.913867950428357e-07, - "loss": 0.6523, - "step": 64213 - }, - { - "epoch": 1.65, - "learning_rate": 8.913592883265253e-07, - "loss": 0.6357, - "step": 64214 - }, - { - "epoch": 1.65, - "learning_rate": 8.913317816933958e-07, - "loss": 0.6646, - "step": 64215 - }, - { - "epoch": 1.65, - "learning_rate": 8.913042751434687e-07, - "loss": 0.5974, - "step": 64216 - }, - { - "epoch": 1.65, - "learning_rate": 8.912767686767649e-07, - "loss": 0.7281, - "step": 64217 - }, - { - "epoch": 1.65, - "learning_rate": 8.912492622933055e-07, - "loss": 0.6797, - "step": 64218 - }, - { - "epoch": 1.65, - "learning_rate": 8.912217559931115e-07, - "loss": 0.6055, - "step": 64219 - }, - { - "epoch": 1.65, - "learning_rate": 8.911942497762041e-07, - "loss": 0.7021, - "step": 64220 - }, - { - "epoch": 1.65, - "learning_rate": 8.91166743642604e-07, - "loss": 0.6138, - "step": 64221 - }, - { - "epoch": 1.65, - "learning_rate": 8.91139237592333e-07, - "loss": 0.6184, - "step": 64222 - }, - { - "epoch": 1.65, - "learning_rate": 8.911117316254115e-07, - "loss": 0.4824, - "step": 64223 - }, - { - "epoch": 1.65, - "learning_rate": 8.910842257418607e-07, - "loss": 0.6831, - "step": 64224 - }, - { - "epoch": 1.65, - "learning_rate": 8.910567199417015e-07, - "loss": 0.5986, - "step": 64225 - }, - { - "epoch": 1.65, - "learning_rate": 8.910292142249553e-07, - "loss": 0.7095, - "step": 64226 - }, - { - "epoch": 1.65, - "learning_rate": 8.91001708591643e-07, - "loss": 0.559, - "step": 64227 - }, - { - "epoch": 1.65, - "learning_rate": 8.909742030417858e-07, - "loss": 0.627, - "step": 64228 - }, - { - "epoch": 1.65, - "learning_rate": 8.909466975754043e-07, - "loss": 0.5103, - "step": 64229 - }, - { - "epoch": 1.65, - "learning_rate": 8.909191921925202e-07, - "loss": 0.6436, - "step": 64230 - }, - { - "epoch": 1.65, - "learning_rate": 8.90891686893154e-07, - "loss": 0.7031, - "step": 64231 - }, - { - "epoch": 1.65, - "learning_rate": 8.908641816773276e-07, - "loss": 0.751, - "step": 64232 - }, - { - "epoch": 1.65, - "learning_rate": 8.908366765450611e-07, - "loss": 0.6929, - "step": 64233 - }, - { - "epoch": 1.65, - "learning_rate": 8.908091714963758e-07, - "loss": 0.6738, - "step": 64234 - }, - { - "epoch": 1.65, - "learning_rate": 8.907816665312932e-07, - "loss": 0.445, - "step": 64235 - }, - { - "epoch": 1.65, - "learning_rate": 8.907541616498337e-07, - "loss": 0.6289, - "step": 64236 - }, - { - "epoch": 1.65, - "learning_rate": 8.907266568520189e-07, - "loss": 0.427, - "step": 64237 - }, - { - "epoch": 1.65, - "learning_rate": 8.906991521378696e-07, - "loss": 0.5642, - "step": 64238 - }, - { - "epoch": 1.65, - "learning_rate": 8.906716475074071e-07, - "loss": 0.5898, - "step": 64239 - }, - { - "epoch": 1.65, - "learning_rate": 8.906441429606521e-07, - "loss": 0.7402, - "step": 64240 - }, - { - "epoch": 1.65, - "learning_rate": 8.906166384976259e-07, - "loss": 0.5366, - "step": 64241 - }, - { - "epoch": 1.65, - "learning_rate": 8.9058913411835e-07, - "loss": 0.7432, - "step": 64242 - }, - { - "epoch": 1.65, - "learning_rate": 8.905616298228445e-07, - "loss": 0.9053, - "step": 64243 - }, - { - "epoch": 1.65, - "learning_rate": 8.905341256111309e-07, - "loss": 0.6709, - "step": 64244 - }, - { - "epoch": 1.65, - "learning_rate": 8.905066214832303e-07, - "loss": 0.6077, - "step": 64245 - }, - { - "epoch": 1.65, - "learning_rate": 8.904791174391638e-07, - "loss": 0.6211, - "step": 64246 - }, - { - "epoch": 1.65, - "learning_rate": 8.904516134789524e-07, - "loss": 0.4768, - "step": 64247 - }, - { - "epoch": 1.65, - "learning_rate": 8.904241096026169e-07, - "loss": 0.4883, - "step": 64248 - }, - { - "epoch": 1.65, - "learning_rate": 8.903966058101789e-07, - "loss": 0.6611, - "step": 64249 - }, - { - "epoch": 1.65, - "learning_rate": 8.90369102101659e-07, - "loss": 0.6445, - "step": 64250 - }, - { - "epoch": 1.65, - "learning_rate": 8.903415984770788e-07, - "loss": 0.6726, - "step": 64251 - }, - { - "epoch": 1.65, - "learning_rate": 8.90314094936459e-07, - "loss": 0.7441, - "step": 64252 - }, - { - "epoch": 1.65, - "learning_rate": 8.902865914798204e-07, - "loss": 0.7324, - "step": 64253 - }, - { - "epoch": 1.65, - "learning_rate": 8.902590881071844e-07, - "loss": 0.7041, - "step": 64254 - }, - { - "epoch": 1.65, - "learning_rate": 8.902315848185718e-07, - "loss": 0.6265, - "step": 64255 - }, - { - "epoch": 1.65, - "learning_rate": 8.90204081614004e-07, - "loss": 0.6865, - "step": 64256 - }, - { - "epoch": 1.65, - "learning_rate": 8.901765784935017e-07, - "loss": 0.6045, - "step": 64257 - }, - { - "epoch": 1.65, - "learning_rate": 8.901490754570864e-07, - "loss": 0.8145, - "step": 64258 - }, - { - "epoch": 1.65, - "learning_rate": 8.901215725047786e-07, - "loss": 0.7373, - "step": 64259 - }, - { - "epoch": 1.65, - "learning_rate": 8.900940696365999e-07, - "loss": 0.6353, - "step": 64260 - }, - { - "epoch": 1.65, - "learning_rate": 8.900665668525709e-07, - "loss": 0.5864, - "step": 64261 - }, - { - "epoch": 1.65, - "learning_rate": 8.900390641527136e-07, - "loss": 0.6846, - "step": 64262 - }, - { - "epoch": 1.65, - "learning_rate": 8.900115615370476e-07, - "loss": 0.6572, - "step": 64263 - }, - { - "epoch": 1.65, - "learning_rate": 8.899840590055949e-07, - "loss": 0.636, - "step": 64264 - }, - { - "epoch": 1.65, - "learning_rate": 8.899565565583762e-07, - "loss": 0.7578, - "step": 64265 - }, - { - "epoch": 1.65, - "learning_rate": 8.899290541954128e-07, - "loss": 0.5474, - "step": 64266 - }, - { - "epoch": 1.65, - "learning_rate": 8.899015519167257e-07, - "loss": 0.688, - "step": 64267 - }, - { - "epoch": 1.65, - "learning_rate": 8.89874049722336e-07, - "loss": 0.6155, - "step": 64268 - }, - { - "epoch": 1.65, - "learning_rate": 8.898465476122643e-07, - "loss": 0.6377, - "step": 64269 - }, - { - "epoch": 1.65, - "learning_rate": 8.898190455865324e-07, - "loss": 0.6738, - "step": 64270 - }, - { - "epoch": 1.65, - "learning_rate": 8.897915436451607e-07, - "loss": 0.7451, - "step": 64271 - }, - { - "epoch": 1.65, - "learning_rate": 8.897640417881711e-07, - "loss": 0.5156, - "step": 64272 - }, - { - "epoch": 1.65, - "learning_rate": 8.897365400155838e-07, - "loss": 0.7012, - "step": 64273 - }, - { - "epoch": 1.65, - "learning_rate": 8.897090383274199e-07, - "loss": 0.6382, - "step": 64274 - }, - { - "epoch": 1.65, - "learning_rate": 8.89681536723701e-07, - "loss": 0.4492, - "step": 64275 - }, - { - "epoch": 1.65, - "learning_rate": 8.896540352044477e-07, - "loss": 0.5923, - "step": 64276 - }, - { - "epoch": 1.65, - "learning_rate": 8.896265337696814e-07, - "loss": 0.52, - "step": 64277 - }, - { - "epoch": 1.65, - "learning_rate": 8.895990324194228e-07, - "loss": 0.7461, - "step": 64278 - }, - { - "epoch": 1.65, - "learning_rate": 8.895715311536934e-07, - "loss": 0.5879, - "step": 64279 - }, - { - "epoch": 1.65, - "learning_rate": 8.895440299725139e-07, - "loss": 0.6035, - "step": 64280 - }, - { - "epoch": 1.65, - "learning_rate": 8.895165288759053e-07, - "loss": 0.6011, - "step": 64281 - }, - { - "epoch": 1.65, - "learning_rate": 8.894890278638891e-07, - "loss": 0.5771, - "step": 64282 - }, - { - "epoch": 1.65, - "learning_rate": 8.89461526936486e-07, - "loss": 0.6948, - "step": 64283 - }, - { - "epoch": 1.65, - "learning_rate": 8.89434026093717e-07, - "loss": 0.7422, - "step": 64284 - }, - { - "epoch": 1.65, - "learning_rate": 8.894065253356033e-07, - "loss": 0.584, - "step": 64285 - }, - { - "epoch": 1.65, - "learning_rate": 8.893790246621658e-07, - "loss": 0.7578, - "step": 64286 - }, - { - "epoch": 1.65, - "learning_rate": 8.893515240734259e-07, - "loss": 0.5342, - "step": 64287 - }, - { - "epoch": 1.65, - "learning_rate": 8.893240235694042e-07, - "loss": 0.6448, - "step": 64288 - }, - { - "epoch": 1.65, - "learning_rate": 8.892965231501224e-07, - "loss": 0.606, - "step": 64289 - }, - { - "epoch": 1.65, - "learning_rate": 8.892690228156008e-07, - "loss": 0.6597, - "step": 64290 - }, - { - "epoch": 1.65, - "learning_rate": 8.89241522565861e-07, - "loss": 0.5464, - "step": 64291 - }, - { - "epoch": 1.65, - "learning_rate": 8.892140224009242e-07, - "loss": 0.7246, - "step": 64292 - }, - { - "epoch": 1.65, - "learning_rate": 8.891865223208107e-07, - "loss": 0.5444, - "step": 64293 - }, - { - "epoch": 1.65, - "learning_rate": 8.891590223255421e-07, - "loss": 0.6841, - "step": 64294 - }, - { - "epoch": 1.65, - "learning_rate": 8.891315224151392e-07, - "loss": 0.5674, - "step": 64295 - }, - { - "epoch": 1.65, - "learning_rate": 8.891040225896234e-07, - "loss": 0.4468, - "step": 64296 - }, - { - "epoch": 1.65, - "learning_rate": 8.890765228490155e-07, - "loss": 0.5742, - "step": 64297 - }, - { - "epoch": 1.65, - "learning_rate": 8.890490231933364e-07, - "loss": 0.6611, - "step": 64298 - }, - { - "epoch": 1.65, - "learning_rate": 8.890215236226077e-07, - "loss": 0.6348, - "step": 64299 - }, - { - "epoch": 1.65, - "learning_rate": 8.889940241368496e-07, - "loss": 0.6494, - "step": 64300 - }, - { - "epoch": 1.65, - "learning_rate": 8.889665247360841e-07, - "loss": 0.7012, - "step": 64301 - }, - { - "epoch": 1.65, - "learning_rate": 8.889390254203321e-07, - "loss": 0.6396, - "step": 64302 - }, - { - "epoch": 1.65, - "learning_rate": 8.889115261896139e-07, - "loss": 0.6558, - "step": 64303 - }, - { - "epoch": 1.65, - "learning_rate": 8.888840270439512e-07, - "loss": 0.5552, - "step": 64304 - }, - { - "epoch": 1.65, - "learning_rate": 8.888565279833647e-07, - "loss": 0.6558, - "step": 64305 - }, - { - "epoch": 1.65, - "learning_rate": 8.88829029007876e-07, - "loss": 0.7695, - "step": 64306 - }, - { - "epoch": 1.65, - "learning_rate": 8.888015301175054e-07, - "loss": 0.5601, - "step": 64307 - }, - { - "epoch": 1.65, - "learning_rate": 8.887740313122746e-07, - "loss": 0.5164, - "step": 64308 - }, - { - "epoch": 1.65, - "learning_rate": 8.887465325922041e-07, - "loss": 0.7559, - "step": 64309 - }, - { - "epoch": 1.65, - "learning_rate": 8.887190339573157e-07, - "loss": 0.7227, - "step": 64310 - }, - { - "epoch": 1.65, - "learning_rate": 8.886915354076297e-07, - "loss": 0.7031, - "step": 64311 - }, - { - "epoch": 1.65, - "learning_rate": 8.886640369431678e-07, - "loss": 0.6104, - "step": 64312 - }, - { - "epoch": 1.65, - "learning_rate": 8.886365385639508e-07, - "loss": 0.6353, - "step": 64313 - }, - { - "epoch": 1.65, - "learning_rate": 8.886090402699994e-07, - "loss": 0.5659, - "step": 64314 - }, - { - "epoch": 1.65, - "learning_rate": 8.885815420613348e-07, - "loss": 0.7275, - "step": 64315 - }, - { - "epoch": 1.65, - "learning_rate": 8.885540439379783e-07, - "loss": 0.7197, - "step": 64316 - }, - { - "epoch": 1.65, - "learning_rate": 8.885265458999509e-07, - "loss": 0.7129, - "step": 64317 - }, - { - "epoch": 1.65, - "learning_rate": 8.884990479472736e-07, - "loss": 0.4475, - "step": 64318 - }, - { - "epoch": 1.65, - "learning_rate": 8.884715500799673e-07, - "loss": 0.6479, - "step": 64319 - }, - { - "epoch": 1.65, - "learning_rate": 8.884440522980534e-07, - "loss": 0.5615, - "step": 64320 - }, - { - "epoch": 1.65, - "learning_rate": 8.884165546015526e-07, - "loss": 0.4993, - "step": 64321 - }, - { - "epoch": 1.65, - "learning_rate": 8.883890569904866e-07, - "loss": 0.5938, - "step": 64322 - }, - { - "epoch": 1.65, - "learning_rate": 8.883615594648756e-07, - "loss": 0.5513, - "step": 64323 - }, - { - "epoch": 1.65, - "learning_rate": 8.883340620247409e-07, - "loss": 0.583, - "step": 64324 - }, - { - "epoch": 1.65, - "learning_rate": 8.883065646701039e-07, - "loss": 0.6401, - "step": 64325 - }, - { - "epoch": 1.65, - "learning_rate": 8.882790674009851e-07, - "loss": 0.6426, - "step": 64326 - }, - { - "epoch": 1.65, - "learning_rate": 8.882515702174062e-07, - "loss": 0.6836, - "step": 64327 - }, - { - "epoch": 1.65, - "learning_rate": 8.882240731193876e-07, - "loss": 0.5796, - "step": 64328 - }, - { - "epoch": 1.65, - "learning_rate": 8.881965761069511e-07, - "loss": 0.6248, - "step": 64329 - }, - { - "epoch": 1.65, - "learning_rate": 8.88169079180117e-07, - "loss": 0.7939, - "step": 64330 - }, - { - "epoch": 1.65, - "learning_rate": 8.881415823389069e-07, - "loss": 0.5032, - "step": 64331 - }, - { - "epoch": 1.65, - "learning_rate": 8.881140855833419e-07, - "loss": 0.6592, - "step": 64332 - }, - { - "epoch": 1.65, - "learning_rate": 8.880865889134425e-07, - "loss": 0.7773, - "step": 64333 - }, - { - "epoch": 1.65, - "learning_rate": 8.880590923292299e-07, - "loss": 0.6514, - "step": 64334 - }, - { - "epoch": 1.65, - "learning_rate": 8.880315958307256e-07, - "loss": 0.5369, - "step": 64335 - }, - { - "epoch": 1.65, - "learning_rate": 8.8800409941795e-07, - "loss": 0.7148, - "step": 64336 - }, - { - "epoch": 1.65, - "learning_rate": 8.879766030909249e-07, - "loss": 0.5385, - "step": 64337 - }, - { - "epoch": 1.65, - "learning_rate": 8.879491068496707e-07, - "loss": 0.665, - "step": 64338 - }, - { - "epoch": 1.65, - "learning_rate": 8.879216106942088e-07, - "loss": 0.6699, - "step": 64339 - }, - { - "epoch": 1.65, - "learning_rate": 8.8789411462456e-07, - "loss": 0.5664, - "step": 64340 - }, - { - "epoch": 1.65, - "learning_rate": 8.878666186407458e-07, - "loss": 0.6445, - "step": 64341 - }, - { - "epoch": 1.65, - "learning_rate": 8.878391227427872e-07, - "loss": 0.4833, - "step": 64342 - }, - { - "epoch": 1.65, - "learning_rate": 8.878116269307046e-07, - "loss": 0.8066, - "step": 64343 - }, - { - "epoch": 1.65, - "learning_rate": 8.877841312045195e-07, - "loss": 0.4019, - "step": 64344 - }, - { - "epoch": 1.65, - "learning_rate": 8.877566355642529e-07, - "loss": 0.5435, - "step": 64345 - }, - { - "epoch": 1.65, - "learning_rate": 8.877291400099262e-07, - "loss": 0.6035, - "step": 64346 - }, - { - "epoch": 1.65, - "learning_rate": 8.877016445415597e-07, - "loss": 0.4995, - "step": 64347 - }, - { - "epoch": 1.65, - "learning_rate": 8.876741491591752e-07, - "loss": 0.7939, - "step": 64348 - }, - { - "epoch": 1.65, - "learning_rate": 8.876466538627932e-07, - "loss": 0.7891, - "step": 64349 - }, - { - "epoch": 1.65, - "learning_rate": 8.876191586524352e-07, - "loss": 0.6846, - "step": 64350 - }, - { - "epoch": 1.65, - "learning_rate": 8.875916635281219e-07, - "loss": 0.6072, - "step": 64351 - }, - { - "epoch": 1.65, - "learning_rate": 8.875641684898751e-07, - "loss": 0.8018, - "step": 64352 - }, - { - "epoch": 1.65, - "learning_rate": 8.875366735377145e-07, - "loss": 0.4006, - "step": 64353 - }, - { - "epoch": 1.65, - "learning_rate": 8.875091786716622e-07, - "loss": 0.7607, - "step": 64354 - }, - { - "epoch": 1.65, - "learning_rate": 8.874816838917387e-07, - "loss": 0.7578, - "step": 64355 - }, - { - "epoch": 1.65, - "learning_rate": 8.874541891979657e-07, - "loss": 0.7295, - "step": 64356 - }, - { - "epoch": 1.65, - "learning_rate": 8.874266945903635e-07, - "loss": 0.5474, - "step": 64357 - }, - { - "epoch": 1.65, - "learning_rate": 8.873992000689536e-07, - "loss": 0.6904, - "step": 64358 - }, - { - "epoch": 1.65, - "learning_rate": 8.873717056337569e-07, - "loss": 0.3857, - "step": 64359 - }, - { - "epoch": 1.65, - "learning_rate": 8.873442112847946e-07, - "loss": 0.6172, - "step": 64360 - }, - { - "epoch": 1.65, - "learning_rate": 8.873167170220876e-07, - "loss": 0.7754, - "step": 64361 - }, - { - "epoch": 1.65, - "learning_rate": 8.872892228456573e-07, - "loss": 0.6772, - "step": 64362 - }, - { - "epoch": 1.65, - "learning_rate": 8.872617287555243e-07, - "loss": 0.6411, - "step": 64363 - }, - { - "epoch": 1.65, - "learning_rate": 8.872342347517096e-07, - "loss": 0.4902, - "step": 64364 - }, - { - "epoch": 1.65, - "learning_rate": 8.872067408342346e-07, - "loss": 0.7363, - "step": 64365 - }, - { - "epoch": 1.65, - "learning_rate": 8.871792470031201e-07, - "loss": 0.6689, - "step": 64366 - }, - { - "epoch": 1.65, - "learning_rate": 8.871517532583875e-07, - "loss": 0.7764, - "step": 64367 - }, - { - "epoch": 1.65, - "learning_rate": 8.871242596000573e-07, - "loss": 0.6768, - "step": 64368 - }, - { - "epoch": 1.65, - "learning_rate": 8.870967660281511e-07, - "loss": 0.6826, - "step": 64369 - }, - { - "epoch": 1.65, - "learning_rate": 8.870692725426897e-07, - "loss": 0.6611, - "step": 64370 - }, - { - "epoch": 1.65, - "learning_rate": 8.870417791436939e-07, - "loss": 0.7402, - "step": 64371 - }, - { - "epoch": 1.65, - "learning_rate": 8.870142858311857e-07, - "loss": 0.666, - "step": 64372 - }, - { - "epoch": 1.65, - "learning_rate": 8.86986792605185e-07, - "loss": 0.6421, - "step": 64373 - }, - { - "epoch": 1.65, - "learning_rate": 8.869592994657131e-07, - "loss": 0.6006, - "step": 64374 - }, - { - "epoch": 1.65, - "learning_rate": 8.869318064127917e-07, - "loss": 0.5552, - "step": 64375 - }, - { - "epoch": 1.65, - "learning_rate": 8.86904313446441e-07, - "loss": 0.6055, - "step": 64376 - }, - { - "epoch": 1.65, - "learning_rate": 8.868768205666827e-07, - "loss": 0.6218, - "step": 64377 - }, - { - "epoch": 1.65, - "learning_rate": 8.868493277735375e-07, - "loss": 0.5474, - "step": 64378 - }, - { - "epoch": 1.65, - "learning_rate": 8.868218350670267e-07, - "loss": 0.6157, - "step": 64379 - }, - { - "epoch": 1.65, - "learning_rate": 8.867943424471711e-07, - "loss": 0.4735, - "step": 64380 - }, - { - "epoch": 1.65, - "learning_rate": 8.86766849913992e-07, - "loss": 0.4414, - "step": 64381 - }, - { - "epoch": 1.65, - "learning_rate": 8.867393574675105e-07, - "loss": 0.5229, - "step": 64382 - }, - { - "epoch": 1.65, - "learning_rate": 8.867118651077471e-07, - "loss": 0.7988, - "step": 64383 - }, - { - "epoch": 1.65, - "learning_rate": 8.866843728347234e-07, - "loss": 0.6504, - "step": 64384 - }, - { - "epoch": 1.65, - "learning_rate": 8.8665688064846e-07, - "loss": 0.7773, - "step": 64385 - }, - { - "epoch": 1.65, - "learning_rate": 8.866293885489786e-07, - "loss": 0.5527, - "step": 64386 - }, - { - "epoch": 1.65, - "learning_rate": 8.866018965362997e-07, - "loss": 0.6895, - "step": 64387 - }, - { - "epoch": 1.65, - "learning_rate": 8.865744046104444e-07, - "loss": 0.6865, - "step": 64388 - }, - { - "epoch": 1.65, - "learning_rate": 8.86546912771434e-07, - "loss": 0.6504, - "step": 64389 - }, - { - "epoch": 1.65, - "learning_rate": 8.865194210192892e-07, - "loss": 0.7432, - "step": 64390 - }, - { - "epoch": 1.65, - "learning_rate": 8.864919293540315e-07, - "loss": 0.7012, - "step": 64391 - }, - { - "epoch": 1.65, - "learning_rate": 8.86464437775682e-07, - "loss": 0.6611, - "step": 64392 - }, - { - "epoch": 1.65, - "learning_rate": 8.86436946284261e-07, - "loss": 0.6699, - "step": 64393 - }, - { - "epoch": 1.65, - "learning_rate": 8.864094548797901e-07, - "loss": 0.6904, - "step": 64394 - }, - { - "epoch": 1.65, - "learning_rate": 8.863819635622901e-07, - "loss": 0.5076, - "step": 64395 - }, - { - "epoch": 1.65, - "learning_rate": 8.863544723317825e-07, - "loss": 0.6782, - "step": 64396 - }, - { - "epoch": 1.65, - "learning_rate": 8.863269811882877e-07, - "loss": 0.5107, - "step": 64397 - }, - { - "epoch": 1.65, - "learning_rate": 8.862994901318275e-07, - "loss": 0.5908, - "step": 64398 - }, - { - "epoch": 1.65, - "learning_rate": 8.862719991624222e-07, - "loss": 0.6562, - "step": 64399 - }, - { - "epoch": 1.65, - "learning_rate": 8.862445082800934e-07, - "loss": 0.5686, - "step": 64400 - }, - { - "epoch": 1.65, - "learning_rate": 8.862170174848619e-07, - "loss": 0.6479, - "step": 64401 - }, - { - "epoch": 1.65, - "learning_rate": 8.861895267767491e-07, - "loss": 0.6479, - "step": 64402 - }, - { - "epoch": 1.65, - "learning_rate": 8.861620361557755e-07, - "loss": 0.7197, - "step": 64403 - }, - { - "epoch": 1.65, - "learning_rate": 8.861345456219626e-07, - "loss": 0.6396, - "step": 64404 - }, - { - "epoch": 1.65, - "learning_rate": 8.861070551753308e-07, - "loss": 0.6631, - "step": 64405 - }, - { - "epoch": 1.65, - "learning_rate": 8.860795648159018e-07, - "loss": 0.6387, - "step": 64406 - }, - { - "epoch": 1.65, - "learning_rate": 8.860520745436963e-07, - "loss": 0.5039, - "step": 64407 - }, - { - "epoch": 1.65, - "learning_rate": 8.860245843587357e-07, - "loss": 0.5752, - "step": 64408 - }, - { - "epoch": 1.65, - "learning_rate": 8.859970942610406e-07, - "loss": 0.6157, - "step": 64409 - }, - { - "epoch": 1.65, - "learning_rate": 8.859696042506326e-07, - "loss": 0.689, - "step": 64410 - }, - { - "epoch": 1.65, - "learning_rate": 8.859421143275322e-07, - "loss": 0.5781, - "step": 64411 - }, - { - "epoch": 1.65, - "learning_rate": 8.85914624491761e-07, - "loss": 0.7012, - "step": 64412 - }, - { - "epoch": 1.65, - "learning_rate": 8.858871347433396e-07, - "loss": 0.6064, - "step": 64413 - }, - { - "epoch": 1.65, - "learning_rate": 8.858596450822888e-07, - "loss": 0.5151, - "step": 64414 - }, - { - "epoch": 1.65, - "learning_rate": 8.858321555086305e-07, - "loss": 0.623, - "step": 64415 - }, - { - "epoch": 1.65, - "learning_rate": 8.858046660223848e-07, - "loss": 0.8018, - "step": 64416 - }, - { - "epoch": 1.65, - "learning_rate": 8.857771766235735e-07, - "loss": 0.7188, - "step": 64417 - }, - { - "epoch": 1.65, - "learning_rate": 8.857496873122174e-07, - "loss": 0.4678, - "step": 64418 - }, - { - "epoch": 1.65, - "learning_rate": 8.857221980883374e-07, - "loss": 0.8018, - "step": 64419 - }, - { - "epoch": 1.65, - "learning_rate": 8.856947089519545e-07, - "loss": 0.6611, - "step": 64420 - }, - { - "epoch": 1.65, - "learning_rate": 8.856672199030905e-07, - "loss": 0.6104, - "step": 64421 - }, - { - "epoch": 1.65, - "learning_rate": 8.856397309417655e-07, - "loss": 0.7739, - "step": 64422 - }, - { - "epoch": 1.65, - "learning_rate": 8.856122420680008e-07, - "loss": 0.6807, - "step": 64423 - }, - { - "epoch": 1.65, - "learning_rate": 8.855847532818176e-07, - "loss": 0.7007, - "step": 64424 - }, - { - "epoch": 1.65, - "learning_rate": 8.85557264583237e-07, - "loss": 0.6719, - "step": 64425 - }, - { - "epoch": 1.65, - "learning_rate": 8.855297759722796e-07, - "loss": 0.6494, - "step": 64426 - }, - { - "epoch": 1.65, - "learning_rate": 8.855022874489671e-07, - "loss": 0.6514, - "step": 64427 - }, - { - "epoch": 1.65, - "learning_rate": 8.854747990133201e-07, - "loss": 0.5884, - "step": 64428 - }, - { - "epoch": 1.65, - "learning_rate": 8.8544731066536e-07, - "loss": 0.707, - "step": 64429 - }, - { - "epoch": 1.65, - "learning_rate": 8.854198224051073e-07, - "loss": 0.5247, - "step": 64430 - }, - { - "epoch": 1.65, - "learning_rate": 8.853923342325838e-07, - "loss": 0.6084, - "step": 64431 - }, - { - "epoch": 1.65, - "learning_rate": 8.853648461478099e-07, - "loss": 0.6606, - "step": 64432 - }, - { - "epoch": 1.65, - "learning_rate": 8.853373581508067e-07, - "loss": 0.584, - "step": 64433 - }, - { - "epoch": 1.65, - "learning_rate": 8.853098702415955e-07, - "loss": 0.7324, - "step": 64434 - }, - { - "epoch": 1.65, - "learning_rate": 8.852823824201972e-07, - "loss": 0.7393, - "step": 64435 - }, - { - "epoch": 1.65, - "learning_rate": 8.852548946866332e-07, - "loss": 0.6479, - "step": 64436 - }, - { - "epoch": 1.65, - "learning_rate": 8.852274070409238e-07, - "loss": 0.6821, - "step": 64437 - }, - { - "epoch": 1.65, - "learning_rate": 8.851999194830908e-07, - "loss": 0.5144, - "step": 64438 - }, - { - "epoch": 1.65, - "learning_rate": 8.851724320131548e-07, - "loss": 0.584, - "step": 64439 - }, - { - "epoch": 1.65, - "learning_rate": 8.851449446311372e-07, - "loss": 0.5913, - "step": 64440 - }, - { - "epoch": 1.65, - "learning_rate": 8.85117457337059e-07, - "loss": 0.8652, - "step": 64441 - }, - { - "epoch": 1.65, - "learning_rate": 8.850899701309409e-07, - "loss": 0.6517, - "step": 64442 - }, - { - "epoch": 1.65, - "learning_rate": 8.850624830128038e-07, - "loss": 0.6084, - "step": 64443 - }, - { - "epoch": 1.65, - "learning_rate": 8.850349959826694e-07, - "loss": 0.687, - "step": 64444 - }, - { - "epoch": 1.65, - "learning_rate": 8.850075090405582e-07, - "loss": 0.7686, - "step": 64445 - }, - { - "epoch": 1.65, - "learning_rate": 8.849800221864916e-07, - "loss": 0.6621, - "step": 64446 - }, - { - "epoch": 1.65, - "learning_rate": 8.849525354204903e-07, - "loss": 0.6675, - "step": 64447 - }, - { - "epoch": 1.65, - "learning_rate": 8.849250487425759e-07, - "loss": 0.5974, - "step": 64448 - }, - { - "epoch": 1.65, - "learning_rate": 8.848975621527688e-07, - "loss": 0.5737, - "step": 64449 - }, - { - "epoch": 1.65, - "learning_rate": 8.848700756510905e-07, - "loss": 0.4956, - "step": 64450 - }, - { - "epoch": 1.65, - "learning_rate": 8.848425892375621e-07, - "loss": 0.6709, - "step": 64451 - }, - { - "epoch": 1.65, - "learning_rate": 8.848151029122042e-07, - "loss": 0.6309, - "step": 64452 - }, - { - "epoch": 1.65, - "learning_rate": 8.847876166750381e-07, - "loss": 0.6021, - "step": 64453 - }, - { - "epoch": 1.65, - "learning_rate": 8.847601305260846e-07, - "loss": 0.5864, - "step": 64454 - }, - { - "epoch": 1.65, - "learning_rate": 8.847326444653653e-07, - "loss": 0.7607, - "step": 64455 - }, - { - "epoch": 1.65, - "learning_rate": 8.847051584929006e-07, - "loss": 0.6455, - "step": 64456 - }, - { - "epoch": 1.65, - "learning_rate": 8.846776726087122e-07, - "loss": 0.7891, - "step": 64457 - }, - { - "epoch": 1.65, - "learning_rate": 8.846501868128204e-07, - "loss": 0.5425, - "step": 64458 - }, - { - "epoch": 1.65, - "learning_rate": 8.846227011052471e-07, - "loss": 0.6504, - "step": 64459 - }, - { - "epoch": 1.65, - "learning_rate": 8.845952154860128e-07, - "loss": 0.6006, - "step": 64460 - }, - { - "epoch": 1.65, - "learning_rate": 8.845677299551387e-07, - "loss": 0.4795, - "step": 64461 - }, - { - "epoch": 1.65, - "learning_rate": 8.845402445126456e-07, - "loss": 0.5769, - "step": 64462 - }, - { - "epoch": 1.65, - "learning_rate": 8.845127591585547e-07, - "loss": 0.4531, - "step": 64463 - }, - { - "epoch": 1.65, - "learning_rate": 8.84485273892887e-07, - "loss": 0.5498, - "step": 64464 - }, - { - "epoch": 1.65, - "learning_rate": 8.844577887156638e-07, - "loss": 0.6172, - "step": 64465 - }, - { - "epoch": 1.65, - "learning_rate": 8.844303036269058e-07, - "loss": 0.6274, - "step": 64466 - }, - { - "epoch": 1.65, - "learning_rate": 8.844028186266343e-07, - "loss": 0.6777, - "step": 64467 - }, - { - "epoch": 1.65, - "learning_rate": 8.8437533371487e-07, - "loss": 0.6807, - "step": 64468 - }, - { - "epoch": 1.65, - "learning_rate": 8.843478488916346e-07, - "loss": 0.6172, - "step": 64469 - }, - { - "epoch": 1.65, - "learning_rate": 8.843203641569484e-07, - "loss": 0.7012, - "step": 64470 - }, - { - "epoch": 1.65, - "learning_rate": 8.842928795108332e-07, - "loss": 0.5315, - "step": 64471 - }, - { - "epoch": 1.65, - "learning_rate": 8.842653949533094e-07, - "loss": 0.6445, - "step": 64472 - }, - { - "epoch": 1.65, - "learning_rate": 8.842379104843982e-07, - "loss": 0.5386, - "step": 64473 - }, - { - "epoch": 1.65, - "learning_rate": 8.842104261041207e-07, - "loss": 0.6689, - "step": 64474 - }, - { - "epoch": 1.65, - "learning_rate": 8.841829418124978e-07, - "loss": 0.5591, - "step": 64475 - }, - { - "epoch": 1.65, - "learning_rate": 8.84155457609551e-07, - "loss": 0.5234, - "step": 64476 - }, - { - "epoch": 1.65, - "learning_rate": 8.84127973495301e-07, - "loss": 0.6665, - "step": 64477 - }, - { - "epoch": 1.65, - "learning_rate": 8.841004894697687e-07, - "loss": 0.5962, - "step": 64478 - }, - { - "epoch": 1.65, - "learning_rate": 8.840730055329755e-07, - "loss": 0.6367, - "step": 64479 - }, - { - "epoch": 1.65, - "learning_rate": 8.840455216849421e-07, - "loss": 0.6221, - "step": 64480 - }, - { - "epoch": 1.65, - "learning_rate": 8.8401803792569e-07, - "loss": 0.8145, - "step": 64481 - }, - { - "epoch": 1.65, - "learning_rate": 8.839905542552398e-07, - "loss": 0.6992, - "step": 64482 - }, - { - "epoch": 1.65, - "learning_rate": 8.839630706736125e-07, - "loss": 0.7236, - "step": 64483 - }, - { - "epoch": 1.65, - "learning_rate": 8.839355871808296e-07, - "loss": 0.6758, - "step": 64484 - }, - { - "epoch": 1.65, - "learning_rate": 8.839081037769117e-07, - "loss": 0.4636, - "step": 64485 - }, - { - "epoch": 1.65, - "learning_rate": 8.838806204618802e-07, - "loss": 0.8213, - "step": 64486 - }, - { - "epoch": 1.65, - "learning_rate": 8.838531372357557e-07, - "loss": 0.5645, - "step": 64487 - }, - { - "epoch": 1.65, - "learning_rate": 8.838256540985598e-07, - "loss": 0.7227, - "step": 64488 - }, - { - "epoch": 1.65, - "learning_rate": 8.83798171050313e-07, - "loss": 0.6934, - "step": 64489 - }, - { - "epoch": 1.65, - "learning_rate": 8.837706880910369e-07, - "loss": 0.6064, - "step": 64490 - }, - { - "epoch": 1.65, - "learning_rate": 8.837432052207523e-07, - "loss": 0.7676, - "step": 64491 - }, - { - "epoch": 1.65, - "learning_rate": 8.837157224394797e-07, - "loss": 0.5625, - "step": 64492 - }, - { - "epoch": 1.65, - "learning_rate": 8.836882397472411e-07, - "loss": 0.7031, - "step": 64493 - }, - { - "epoch": 1.65, - "learning_rate": 8.83660757144057e-07, - "loss": 0.5654, - "step": 64494 - }, - { - "epoch": 1.65, - "learning_rate": 8.836332746299481e-07, - "loss": 0.5637, - "step": 64495 - }, - { - "epoch": 1.65, - "learning_rate": 8.836057922049363e-07, - "loss": 0.7339, - "step": 64496 - }, - { - "epoch": 1.65, - "learning_rate": 8.835783098690418e-07, - "loss": 0.5134, - "step": 64497 - }, - { - "epoch": 1.65, - "learning_rate": 8.835508276222863e-07, - "loss": 0.792, - "step": 64498 - }, - { - "epoch": 1.65, - "learning_rate": 8.835233454646904e-07, - "loss": 0.5835, - "step": 64499 - }, - { - "epoch": 1.65, - "learning_rate": 8.834958633962756e-07, - "loss": 0.5259, - "step": 64500 - }, - { - "epoch": 1.65, - "learning_rate": 8.834683814170627e-07, - "loss": 0.7305, - "step": 64501 - }, - { - "epoch": 1.65, - "learning_rate": 8.834408995270725e-07, - "loss": 0.6826, - "step": 64502 - }, - { - "epoch": 1.65, - "learning_rate": 8.834134177263263e-07, - "loss": 0.6455, - "step": 64503 - }, - { - "epoch": 1.65, - "learning_rate": 8.833859360148448e-07, - "loss": 0.8037, - "step": 64504 - }, - { - "epoch": 1.65, - "learning_rate": 8.833584543926497e-07, - "loss": 0.5952, - "step": 64505 - }, - { - "epoch": 1.65, - "learning_rate": 8.833309728597613e-07, - "loss": 0.8604, - "step": 64506 - }, - { - "epoch": 1.65, - "learning_rate": 8.833034914162014e-07, - "loss": 0.6094, - "step": 64507 - }, - { - "epoch": 1.65, - "learning_rate": 8.832760100619903e-07, - "loss": 0.709, - "step": 64508 - }, - { - "epoch": 1.65, - "learning_rate": 8.832485287971496e-07, - "loss": 0.6328, - "step": 64509 - }, - { - "epoch": 1.65, - "learning_rate": 8.832210476217e-07, - "loss": 0.5293, - "step": 64510 - }, - { - "epoch": 1.65, - "learning_rate": 8.831935665356631e-07, - "loss": 0.5386, - "step": 64511 - }, - { - "epoch": 1.65, - "learning_rate": 8.831660855390593e-07, - "loss": 0.7529, - "step": 64512 - }, - { - "epoch": 1.65, - "learning_rate": 8.831386046319098e-07, - "loss": 0.6479, - "step": 64513 - }, - { - "epoch": 1.65, - "learning_rate": 8.831111238142356e-07, - "loss": 0.7026, - "step": 64514 - }, - { - "epoch": 1.65, - "learning_rate": 8.830836430860579e-07, - "loss": 0.6367, - "step": 64515 - }, - { - "epoch": 1.65, - "learning_rate": 8.830561624473976e-07, - "loss": 0.667, - "step": 64516 - }, - { - "epoch": 1.65, - "learning_rate": 8.830286818982759e-07, - "loss": 0.7119, - "step": 64517 - }, - { - "epoch": 1.65, - "learning_rate": 8.830012014387136e-07, - "loss": 0.7227, - "step": 64518 - }, - { - "epoch": 1.65, - "learning_rate": 8.829737210687321e-07, - "loss": 0.6582, - "step": 64519 - }, - { - "epoch": 1.65, - "learning_rate": 8.829462407883522e-07, - "loss": 0.7959, - "step": 64520 - }, - { - "epoch": 1.65, - "learning_rate": 8.829187605975952e-07, - "loss": 0.7412, - "step": 64521 - }, - { - "epoch": 1.65, - "learning_rate": 8.828912804964818e-07, - "loss": 0.5151, - "step": 64522 - }, - { - "epoch": 1.65, - "learning_rate": 8.828638004850328e-07, - "loss": 0.7344, - "step": 64523 - }, - { - "epoch": 1.65, - "learning_rate": 8.828363205632701e-07, - "loss": 0.6768, - "step": 64524 - }, - { - "epoch": 1.65, - "learning_rate": 8.828088407312137e-07, - "loss": 0.5542, - "step": 64525 - }, - { - "epoch": 1.65, - "learning_rate": 8.827813609888856e-07, - "loss": 0.584, - "step": 64526 - }, - { - "epoch": 1.65, - "learning_rate": 8.827538813363062e-07, - "loss": 0.8418, - "step": 64527 - }, - { - "epoch": 1.65, - "learning_rate": 8.827264017734969e-07, - "loss": 0.5063, - "step": 64528 - }, - { - "epoch": 1.65, - "learning_rate": 8.826989223004785e-07, - "loss": 0.6602, - "step": 64529 - }, - { - "epoch": 1.65, - "learning_rate": 8.826714429172723e-07, - "loss": 0.7344, - "step": 64530 - }, - { - "epoch": 1.65, - "learning_rate": 8.826439636238993e-07, - "loss": 0.623, - "step": 64531 - }, - { - "epoch": 1.65, - "learning_rate": 8.826164844203802e-07, - "loss": 0.7437, - "step": 64532 - }, - { - "epoch": 1.65, - "learning_rate": 8.825890053067362e-07, - "loss": 0.4678, - "step": 64533 - }, - { - "epoch": 1.65, - "learning_rate": 8.825615262829886e-07, - "loss": 0.7021, - "step": 64534 - }, - { - "epoch": 1.65, - "learning_rate": 8.82534047349158e-07, - "loss": 0.7007, - "step": 64535 - }, - { - "epoch": 1.65, - "learning_rate": 8.825065685052659e-07, - "loss": 0.6826, - "step": 64536 - }, - { - "epoch": 1.65, - "learning_rate": 8.824790897513328e-07, - "loss": 0.6377, - "step": 64537 - }, - { - "epoch": 1.65, - "learning_rate": 8.824516110873803e-07, - "loss": 0.7622, - "step": 64538 - }, - { - "epoch": 1.65, - "learning_rate": 8.824241325134291e-07, - "loss": 0.7158, - "step": 64539 - }, - { - "epoch": 1.65, - "learning_rate": 8.823966540295005e-07, - "loss": 0.5776, - "step": 64540 - }, - { - "epoch": 1.65, - "learning_rate": 8.823691756356155e-07, - "loss": 0.6079, - "step": 64541 - }, - { - "epoch": 1.65, - "learning_rate": 8.823416973317946e-07, - "loss": 0.6592, - "step": 64542 - }, - { - "epoch": 1.65, - "learning_rate": 8.823142191180596e-07, - "loss": 0.4427, - "step": 64543 - }, - { - "epoch": 1.65, - "learning_rate": 8.82286740994431e-07, - "loss": 0.6006, - "step": 64544 - }, - { - "epoch": 1.65, - "learning_rate": 8.8225926296093e-07, - "loss": 0.6797, - "step": 64545 - }, - { - "epoch": 1.65, - "learning_rate": 8.822317850175775e-07, - "loss": 0.6963, - "step": 64546 - }, - { - "epoch": 1.65, - "learning_rate": 8.822043071643951e-07, - "loss": 0.6113, - "step": 64547 - }, - { - "epoch": 1.65, - "learning_rate": 8.821768294014031e-07, - "loss": 0.4442, - "step": 64548 - }, - { - "epoch": 1.65, - "learning_rate": 8.821493517286231e-07, - "loss": 0.4866, - "step": 64549 - }, - { - "epoch": 1.65, - "learning_rate": 8.821218741460761e-07, - "loss": 0.6367, - "step": 64550 - }, - { - "epoch": 1.65, - "learning_rate": 8.820943966537829e-07, - "loss": 0.6245, - "step": 64551 - }, - { - "epoch": 1.65, - "learning_rate": 8.820669192517644e-07, - "loss": 0.7168, - "step": 64552 - }, - { - "epoch": 1.65, - "learning_rate": 8.820394419400418e-07, - "loss": 0.6421, - "step": 64553 - }, - { - "epoch": 1.65, - "learning_rate": 8.820119647186363e-07, - "loss": 0.4469, - "step": 64554 - }, - { - "epoch": 1.65, - "learning_rate": 8.819844875875688e-07, - "loss": 0.8711, - "step": 64555 - }, - { - "epoch": 1.65, - "learning_rate": 8.819570105468602e-07, - "loss": 0.5873, - "step": 64556 - }, - { - "epoch": 1.65, - "learning_rate": 8.819295335965319e-07, - "loss": 0.8535, - "step": 64557 - }, - { - "epoch": 1.65, - "learning_rate": 8.819020567366044e-07, - "loss": 0.7153, - "step": 64558 - }, - { - "epoch": 1.65, - "learning_rate": 8.818745799670994e-07, - "loss": 0.6021, - "step": 64559 - }, - { - "epoch": 1.65, - "learning_rate": 8.818471032880374e-07, - "loss": 0.606, - "step": 64560 - }, - { - "epoch": 1.65, - "learning_rate": 8.818196266994401e-07, - "loss": 0.665, - "step": 64561 - }, - { - "epoch": 1.65, - "learning_rate": 8.817921502013278e-07, - "loss": 0.7119, - "step": 64562 - }, - { - "epoch": 1.65, - "learning_rate": 8.817646737937216e-07, - "loss": 0.6299, - "step": 64563 - }, - { - "epoch": 1.65, - "learning_rate": 8.81737197476643e-07, - "loss": 0.4985, - "step": 64564 - }, - { - "epoch": 1.65, - "learning_rate": 8.817097212501125e-07, - "loss": 0.6445, - "step": 64565 - }, - { - "epoch": 1.65, - "learning_rate": 8.816822451141517e-07, - "loss": 0.8154, - "step": 64566 - }, - { - "epoch": 1.65, - "learning_rate": 8.816547690687813e-07, - "loss": 0.6455, - "step": 64567 - }, - { - "epoch": 1.65, - "learning_rate": 8.816272931140222e-07, - "loss": 0.6562, - "step": 64568 - }, - { - "epoch": 1.65, - "learning_rate": 8.815998172498959e-07, - "loss": 0.498, - "step": 64569 - }, - { - "epoch": 1.65, - "learning_rate": 8.81572341476423e-07, - "loss": 0.7256, - "step": 64570 - }, - { - "epoch": 1.65, - "learning_rate": 8.81544865793625e-07, - "loss": 0.4746, - "step": 64571 - }, - { - "epoch": 1.66, - "learning_rate": 8.815173902015226e-07, - "loss": 0.5016, - "step": 64572 - }, - { - "epoch": 1.66, - "learning_rate": 8.814899147001367e-07, - "loss": 0.7197, - "step": 64573 - }, - { - "epoch": 1.66, - "learning_rate": 8.814624392894886e-07, - "loss": 0.4905, - "step": 64574 - }, - { - "epoch": 1.66, - "learning_rate": 8.814349639695991e-07, - "loss": 0.6182, - "step": 64575 - }, - { - "epoch": 1.66, - "learning_rate": 8.814074887404895e-07, - "loss": 0.8154, - "step": 64576 - }, - { - "epoch": 1.66, - "learning_rate": 8.813800136021806e-07, - "loss": 0.541, - "step": 64577 - }, - { - "epoch": 1.66, - "learning_rate": 8.813525385546939e-07, - "loss": 0.5288, - "step": 64578 - }, - { - "epoch": 1.66, - "learning_rate": 8.813250635980497e-07, - "loss": 0.6631, - "step": 64579 - }, - { - "epoch": 1.66, - "learning_rate": 8.812975887322698e-07, - "loss": 0.6528, - "step": 64580 - }, - { - "epoch": 1.66, - "learning_rate": 8.81270113957375e-07, - "loss": 0.665, - "step": 64581 - }, - { - "epoch": 1.66, - "learning_rate": 8.812426392733858e-07, - "loss": 0.6895, - "step": 64582 - }, - { - "epoch": 1.66, - "learning_rate": 8.812151646803238e-07, - "loss": 0.5654, - "step": 64583 - }, - { - "epoch": 1.66, - "learning_rate": 8.811876901782099e-07, - "loss": 0.4512, - "step": 64584 - }, - { - "epoch": 1.66, - "learning_rate": 8.811602157670652e-07, - "loss": 0.4785, - "step": 64585 - }, - { - "epoch": 1.66, - "learning_rate": 8.811327414469107e-07, - "loss": 0.6406, - "step": 64586 - }, - { - "epoch": 1.66, - "learning_rate": 8.81105267217767e-07, - "loss": 0.5967, - "step": 64587 - }, - { - "epoch": 1.66, - "learning_rate": 8.810777930796559e-07, - "loss": 0.8525, - "step": 64588 - }, - { - "epoch": 1.66, - "learning_rate": 8.810503190325979e-07, - "loss": 0.7949, - "step": 64589 - }, - { - "epoch": 1.66, - "learning_rate": 8.810228450766143e-07, - "loss": 0.5654, - "step": 64590 - }, - { - "epoch": 1.66, - "learning_rate": 8.809953712117263e-07, - "loss": 0.7178, - "step": 64591 - }, - { - "epoch": 1.66, - "learning_rate": 8.809678974379543e-07, - "loss": 0.6147, - "step": 64592 - }, - { - "epoch": 1.66, - "learning_rate": 8.809404237553198e-07, - "loss": 0.6973, - "step": 64593 - }, - { - "epoch": 1.66, - "learning_rate": 8.809129501638436e-07, - "loss": 0.6782, - "step": 64594 - }, - { - "epoch": 1.66, - "learning_rate": 8.80885476663547e-07, - "loss": 0.6357, - "step": 64595 - }, - { - "epoch": 1.66, - "learning_rate": 8.808580032544509e-07, - "loss": 0.7822, - "step": 64596 - }, - { - "epoch": 1.66, - "learning_rate": 8.808305299365765e-07, - "loss": 0.5864, - "step": 64597 - }, - { - "epoch": 1.66, - "learning_rate": 8.808030567099443e-07, - "loss": 0.7568, - "step": 64598 - }, - { - "epoch": 1.66, - "learning_rate": 8.807755835745761e-07, - "loss": 0.6318, - "step": 64599 - }, - { - "epoch": 1.66, - "learning_rate": 8.807481105304922e-07, - "loss": 0.5959, - "step": 64600 - }, - { - "epoch": 1.66, - "learning_rate": 8.807206375777146e-07, - "loss": 0.6152, - "step": 64601 - }, - { - "epoch": 1.66, - "learning_rate": 8.806931647162634e-07, - "loss": 0.8203, - "step": 64602 - }, - { - "epoch": 1.66, - "learning_rate": 8.806656919461599e-07, - "loss": 0.5337, - "step": 64603 - }, - { - "epoch": 1.66, - "learning_rate": 8.806382192674251e-07, - "loss": 0.6216, - "step": 64604 - }, - { - "epoch": 1.66, - "learning_rate": 8.806107466800803e-07, - "loss": 0.5352, - "step": 64605 - }, - { - "epoch": 1.66, - "learning_rate": 8.805832741841461e-07, - "loss": 0.6406, - "step": 64606 - }, - { - "epoch": 1.66, - "learning_rate": 8.80555801779644e-07, - "loss": 0.7422, - "step": 64607 - }, - { - "epoch": 1.66, - "learning_rate": 8.805283294665947e-07, - "loss": 0.5474, - "step": 64608 - }, - { - "epoch": 1.66, - "learning_rate": 8.805008572450196e-07, - "loss": 0.5938, - "step": 64609 - }, - { - "epoch": 1.66, - "learning_rate": 8.804733851149392e-07, - "loss": 0.5269, - "step": 64610 - }, - { - "epoch": 1.66, - "learning_rate": 8.804459130763752e-07, - "loss": 0.5679, - "step": 64611 - }, - { - "epoch": 1.66, - "learning_rate": 8.804184411293482e-07, - "loss": 0.5244, - "step": 64612 - }, - { - "epoch": 1.66, - "learning_rate": 8.803909692738791e-07, - "loss": 0.6543, - "step": 64613 - }, - { - "epoch": 1.66, - "learning_rate": 8.803634975099893e-07, - "loss": 0.6001, - "step": 64614 - }, - { - "epoch": 1.66, - "learning_rate": 8.803360258376994e-07, - "loss": 0.7441, - "step": 64615 - }, - { - "epoch": 1.66, - "learning_rate": 8.80308554257031e-07, - "loss": 0.7402, - "step": 64616 - }, - { - "epoch": 1.66, - "learning_rate": 8.802810827680045e-07, - "loss": 0.5742, - "step": 64617 - }, - { - "epoch": 1.66, - "learning_rate": 8.802536113706415e-07, - "loss": 0.6152, - "step": 64618 - }, - { - "epoch": 1.66, - "learning_rate": 8.802261400649628e-07, - "loss": 0.7852, - "step": 64619 - }, - { - "epoch": 1.66, - "learning_rate": 8.801986688509894e-07, - "loss": 0.5312, - "step": 64620 - }, - { - "epoch": 1.66, - "learning_rate": 8.801711977287428e-07, - "loss": 0.4028, - "step": 64621 - }, - { - "epoch": 1.66, - "learning_rate": 8.801437266982432e-07, - "loss": 0.5176, - "step": 64622 - }, - { - "epoch": 1.66, - "learning_rate": 8.801162557595118e-07, - "loss": 0.5791, - "step": 64623 - }, - { - "epoch": 1.66, - "learning_rate": 8.800887849125702e-07, - "loss": 0.6016, - "step": 64624 - }, - { - "epoch": 1.66, - "learning_rate": 8.800613141574389e-07, - "loss": 0.8672, - "step": 64625 - }, - { - "epoch": 1.66, - "learning_rate": 8.800338434941393e-07, - "loss": 0.8735, - "step": 64626 - }, - { - "epoch": 1.66, - "learning_rate": 8.800063729226921e-07, - "loss": 0.7822, - "step": 64627 - }, - { - "epoch": 1.66, - "learning_rate": 8.799789024431188e-07, - "loss": 0.438, - "step": 64628 - }, - { - "epoch": 1.66, - "learning_rate": 8.799514320554397e-07, - "loss": 0.7451, - "step": 64629 - }, - { - "epoch": 1.66, - "learning_rate": 8.799239617596767e-07, - "loss": 0.6553, - "step": 64630 - }, - { - "epoch": 1.66, - "learning_rate": 8.798964915558505e-07, - "loss": 0.6846, - "step": 64631 - }, - { - "epoch": 1.66, - "learning_rate": 8.798690214439815e-07, - "loss": 0.8926, - "step": 64632 - }, - { - "epoch": 1.66, - "learning_rate": 8.798415514240917e-07, - "loss": 0.604, - "step": 64633 - }, - { - "epoch": 1.66, - "learning_rate": 8.798140814962014e-07, - "loss": 0.8232, - "step": 64634 - }, - { - "epoch": 1.66, - "learning_rate": 8.797866116603321e-07, - "loss": 0.6855, - "step": 64635 - }, - { - "epoch": 1.66, - "learning_rate": 8.797591419165045e-07, - "loss": 0.6152, - "step": 64636 - }, - { - "epoch": 1.66, - "learning_rate": 8.7973167226474e-07, - "loss": 0.6694, - "step": 64637 - }, - { - "epoch": 1.66, - "learning_rate": 8.797042027050592e-07, - "loss": 0.4227, - "step": 64638 - }, - { - "epoch": 1.66, - "learning_rate": 8.796767332374835e-07, - "loss": 0.6387, - "step": 64639 - }, - { - "epoch": 1.66, - "learning_rate": 8.796492638620339e-07, - "loss": 0.5159, - "step": 64640 - }, - { - "epoch": 1.66, - "learning_rate": 8.796217945787315e-07, - "loss": 0.5269, - "step": 64641 - }, - { - "epoch": 1.66, - "learning_rate": 8.795943253875968e-07, - "loss": 0.6025, - "step": 64642 - }, - { - "epoch": 1.66, - "learning_rate": 8.795668562886513e-07, - "loss": 0.6035, - "step": 64643 - }, - { - "epoch": 1.66, - "learning_rate": 8.795393872819158e-07, - "loss": 0.665, - "step": 64644 - }, - { - "epoch": 1.66, - "learning_rate": 8.795119183674116e-07, - "loss": 0.6104, - "step": 64645 - }, - { - "epoch": 1.66, - "learning_rate": 8.794844495451593e-07, - "loss": 0.6631, - "step": 64646 - }, - { - "epoch": 1.66, - "learning_rate": 8.794569808151806e-07, - "loss": 0.6714, - "step": 64647 - }, - { - "epoch": 1.66, - "learning_rate": 8.794295121774959e-07, - "loss": 0.5908, - "step": 64648 - }, - { - "epoch": 1.66, - "learning_rate": 8.794020436321266e-07, - "loss": 0.7031, - "step": 64649 - }, - { - "epoch": 1.66, - "learning_rate": 8.793745751790935e-07, - "loss": 0.6753, - "step": 64650 - }, - { - "epoch": 1.66, - "learning_rate": 8.793471068184179e-07, - "loss": 0.6235, - "step": 64651 - }, - { - "epoch": 1.66, - "learning_rate": 8.793196385501208e-07, - "loss": 0.5659, - "step": 64652 - }, - { - "epoch": 1.66, - "learning_rate": 8.792921703742227e-07, - "loss": 0.6201, - "step": 64653 - }, - { - "epoch": 1.66, - "learning_rate": 8.792647022907454e-07, - "loss": 0.8359, - "step": 64654 - }, - { - "epoch": 1.66, - "learning_rate": 8.792372342997092e-07, - "loss": 0.7305, - "step": 64655 - }, - { - "epoch": 1.66, - "learning_rate": 8.792097664011358e-07, - "loss": 0.6533, - "step": 64656 - }, - { - "epoch": 1.66, - "learning_rate": 8.791822985950459e-07, - "loss": 0.4971, - "step": 64657 - }, - { - "epoch": 1.66, - "learning_rate": 8.791548308814602e-07, - "loss": 0.707, - "step": 64658 - }, - { - "epoch": 1.66, - "learning_rate": 8.791273632604005e-07, - "loss": 0.5859, - "step": 64659 - }, - { - "epoch": 1.66, - "learning_rate": 8.790998957318871e-07, - "loss": 0.6233, - "step": 64660 - }, - { - "epoch": 1.66, - "learning_rate": 8.790724282959419e-07, - "loss": 0.7207, - "step": 64661 - }, - { - "epoch": 1.66, - "learning_rate": 8.790449609525851e-07, - "loss": 0.668, - "step": 64662 - }, - { - "epoch": 1.66, - "learning_rate": 8.790174937018377e-07, - "loss": 0.55, - "step": 64663 - }, - { - "epoch": 1.66, - "learning_rate": 8.789900265437215e-07, - "loss": 0.8936, - "step": 64664 - }, - { - "epoch": 1.66, - "learning_rate": 8.789625594782566e-07, - "loss": 0.6064, - "step": 64665 - }, - { - "epoch": 1.66, - "learning_rate": 8.789350925054648e-07, - "loss": 0.75, - "step": 64666 - }, - { - "epoch": 1.66, - "learning_rate": 8.789076256253666e-07, - "loss": 0.5903, - "step": 64667 - }, - { - "epoch": 1.66, - "learning_rate": 8.788801588379837e-07, - "loss": 0.7656, - "step": 64668 - }, - { - "epoch": 1.66, - "learning_rate": 8.788526921433363e-07, - "loss": 0.7266, - "step": 64669 - }, - { - "epoch": 1.66, - "learning_rate": 8.788252255414459e-07, - "loss": 0.6958, - "step": 64670 - }, - { - "epoch": 1.66, - "learning_rate": 8.787977590323339e-07, - "loss": 0.7393, - "step": 64671 - }, - { - "epoch": 1.66, - "learning_rate": 8.787702926160204e-07, - "loss": 0.7441, - "step": 64672 - }, - { - "epoch": 1.66, - "learning_rate": 8.787428262925269e-07, - "loss": 0.6038, - "step": 64673 - }, - { - "epoch": 1.66, - "learning_rate": 8.787153600618746e-07, - "loss": 0.666, - "step": 64674 - }, - { - "epoch": 1.66, - "learning_rate": 8.786878939240842e-07, - "loss": 0.7266, - "step": 64675 - }, - { - "epoch": 1.66, - "learning_rate": 8.786604278791772e-07, - "loss": 0.6924, - "step": 64676 - }, - { - "epoch": 1.66, - "learning_rate": 8.78632961927174e-07, - "loss": 0.5327, - "step": 64677 - }, - { - "epoch": 1.66, - "learning_rate": 8.786054960680962e-07, - "loss": 0.79, - "step": 64678 - }, - { - "epoch": 1.66, - "learning_rate": 8.785780303019644e-07, - "loss": 0.5894, - "step": 64679 - }, - { - "epoch": 1.66, - "learning_rate": 8.785505646288e-07, - "loss": 0.5684, - "step": 64680 - }, - { - "epoch": 1.66, - "learning_rate": 8.78523099048624e-07, - "loss": 0.5732, - "step": 64681 - }, - { - "epoch": 1.66, - "learning_rate": 8.784956335614569e-07, - "loss": 0.509, - "step": 64682 - }, - { - "epoch": 1.66, - "learning_rate": 8.784681681673204e-07, - "loss": 0.8623, - "step": 64683 - }, - { - "epoch": 1.66, - "learning_rate": 8.78440702866235e-07, - "loss": 0.604, - "step": 64684 - }, - { - "epoch": 1.66, - "learning_rate": 8.784132376582221e-07, - "loss": 0.5679, - "step": 64685 - }, - { - "epoch": 1.66, - "learning_rate": 8.783857725433024e-07, - "loss": 0.7988, - "step": 64686 - }, - { - "epoch": 1.66, - "learning_rate": 8.783583075214973e-07, - "loss": 0.6387, - "step": 64687 - }, - { - "epoch": 1.66, - "learning_rate": 8.783308425928275e-07, - "loss": 0.5669, - "step": 64688 - }, - { - "epoch": 1.66, - "learning_rate": 8.783033777573144e-07, - "loss": 0.5225, - "step": 64689 - }, - { - "epoch": 1.66, - "learning_rate": 8.782759130149785e-07, - "loss": 0.79, - "step": 64690 - }, - { - "epoch": 1.66, - "learning_rate": 8.782484483658417e-07, - "loss": 0.6465, - "step": 64691 - }, - { - "epoch": 1.66, - "learning_rate": 8.782209838099241e-07, - "loss": 0.6528, - "step": 64692 - }, - { - "epoch": 1.66, - "learning_rate": 8.781935193472473e-07, - "loss": 0.4194, - "step": 64693 - }, - { - "epoch": 1.66, - "learning_rate": 8.781660549778317e-07, - "loss": 0.7422, - "step": 64694 - }, - { - "epoch": 1.66, - "learning_rate": 8.781385907016991e-07, - "loss": 0.5317, - "step": 64695 - }, - { - "epoch": 1.66, - "learning_rate": 8.781111265188699e-07, - "loss": 0.6064, - "step": 64696 - }, - { - "epoch": 1.66, - "learning_rate": 8.780836624293656e-07, - "loss": 0.606, - "step": 64697 - }, - { - "epoch": 1.66, - "learning_rate": 8.780561984332069e-07, - "loss": 0.6011, - "step": 64698 - }, - { - "epoch": 1.66, - "learning_rate": 8.780287345304151e-07, - "loss": 0.6279, - "step": 64699 - }, - { - "epoch": 1.66, - "learning_rate": 8.780012707210109e-07, - "loss": 0.7178, - "step": 64700 - }, - { - "epoch": 1.66, - "learning_rate": 8.77973807005016e-07, - "loss": 0.6729, - "step": 64701 - }, - { - "epoch": 1.66, - "learning_rate": 8.779463433824507e-07, - "loss": 0.5908, - "step": 64702 - }, - { - "epoch": 1.66, - "learning_rate": 8.77918879853336e-07, - "loss": 0.7832, - "step": 64703 - }, - { - "epoch": 1.66, - "learning_rate": 8.778914164176934e-07, - "loss": 0.6108, - "step": 64704 - }, - { - "epoch": 1.66, - "learning_rate": 8.778639530755436e-07, - "loss": 0.6738, - "step": 64705 - }, - { - "epoch": 1.66, - "learning_rate": 8.77836489826908e-07, - "loss": 0.6973, - "step": 64706 - }, - { - "epoch": 1.66, - "learning_rate": 8.77809026671807e-07, - "loss": 0.8076, - "step": 64707 - }, - { - "epoch": 1.66, - "learning_rate": 8.777815636102624e-07, - "loss": 0.6641, - "step": 64708 - }, - { - "epoch": 1.66, - "learning_rate": 8.777541006422945e-07, - "loss": 0.6711, - "step": 64709 - }, - { - "epoch": 1.66, - "learning_rate": 8.77726637767925e-07, - "loss": 0.5757, - "step": 64710 - }, - { - "epoch": 1.66, - "learning_rate": 8.776991749871747e-07, - "loss": 0.542, - "step": 64711 - }, - { - "epoch": 1.66, - "learning_rate": 8.776717123000643e-07, - "loss": 0.4817, - "step": 64712 - }, - { - "epoch": 1.66, - "learning_rate": 8.776442497066149e-07, - "loss": 0.7422, - "step": 64713 - }, - { - "epoch": 1.66, - "learning_rate": 8.776167872068479e-07, - "loss": 0.7734, - "step": 64714 - }, - { - "epoch": 1.66, - "learning_rate": 8.775893248007839e-07, - "loss": 0.5913, - "step": 64715 - }, - { - "epoch": 1.66, - "learning_rate": 8.775618624884442e-07, - "loss": 0.7686, - "step": 64716 - }, - { - "epoch": 1.66, - "learning_rate": 8.775344002698496e-07, - "loss": 0.571, - "step": 64717 - }, - { - "epoch": 1.66, - "learning_rate": 8.775069381450215e-07, - "loss": 0.6309, - "step": 64718 - }, - { - "epoch": 1.66, - "learning_rate": 8.774794761139805e-07, - "loss": 0.6846, - "step": 64719 - }, - { - "epoch": 1.66, - "learning_rate": 8.774520141767483e-07, - "loss": 0.707, - "step": 64720 - }, - { - "epoch": 1.66, - "learning_rate": 8.774245523333452e-07, - "loss": 0.543, - "step": 64721 - }, - { - "epoch": 1.66, - "learning_rate": 8.773970905837922e-07, - "loss": 0.645, - "step": 64722 - }, - { - "epoch": 1.66, - "learning_rate": 8.773696289281109e-07, - "loss": 0.6519, - "step": 64723 - }, - { - "epoch": 1.66, - "learning_rate": 8.77342167366322e-07, - "loss": 0.6689, - "step": 64724 - }, - { - "epoch": 1.66, - "learning_rate": 8.773147058984465e-07, - "loss": 0.834, - "step": 64725 - }, - { - "epoch": 1.66, - "learning_rate": 8.772872445245053e-07, - "loss": 0.6748, - "step": 64726 - }, - { - "epoch": 1.66, - "learning_rate": 8.7725978324452e-07, - "loss": 0.646, - "step": 64727 - }, - { - "epoch": 1.66, - "learning_rate": 8.772323220585108e-07, - "loss": 0.6982, - "step": 64728 - }, - { - "epoch": 1.66, - "learning_rate": 8.772048609664996e-07, - "loss": 0.5708, - "step": 64729 - }, - { - "epoch": 1.66, - "learning_rate": 8.771773999685071e-07, - "loss": 0.7002, - "step": 64730 - }, - { - "epoch": 1.66, - "learning_rate": 8.77149939064554e-07, - "loss": 0.6548, - "step": 64731 - }, - { - "epoch": 1.66, - "learning_rate": 8.771224782546614e-07, - "loss": 0.5254, - "step": 64732 - }, - { - "epoch": 1.66, - "learning_rate": 8.770950175388507e-07, - "loss": 0.6733, - "step": 64733 - }, - { - "epoch": 1.66, - "learning_rate": 8.770675569171423e-07, - "loss": 0.5479, - "step": 64734 - }, - { - "epoch": 1.66, - "learning_rate": 8.770400963895579e-07, - "loss": 0.599, - "step": 64735 - }, - { - "epoch": 1.66, - "learning_rate": 8.770126359561181e-07, - "loss": 0.6641, - "step": 64736 - }, - { - "epoch": 1.66, - "learning_rate": 8.769851756168443e-07, - "loss": 0.5369, - "step": 64737 - }, - { - "epoch": 1.66, - "learning_rate": 8.76957715371757e-07, - "loss": 0.5126, - "step": 64738 - }, - { - "epoch": 1.66, - "learning_rate": 8.769302552208778e-07, - "loss": 0.6172, - "step": 64739 - }, - { - "epoch": 1.66, - "learning_rate": 8.769027951642276e-07, - "loss": 0.7061, - "step": 64740 - }, - { - "epoch": 1.66, - "learning_rate": 8.768753352018269e-07, - "loss": 0.646, - "step": 64741 - }, - { - "epoch": 1.66, - "learning_rate": 8.768478753336974e-07, - "loss": 0.5479, - "step": 64742 - }, - { - "epoch": 1.66, - "learning_rate": 8.768204155598593e-07, - "loss": 0.6938, - "step": 64743 - }, - { - "epoch": 1.66, - "learning_rate": 8.767929558803347e-07, - "loss": 0.6611, - "step": 64744 - }, - { - "epoch": 1.66, - "learning_rate": 8.767654962951437e-07, - "loss": 0.6299, - "step": 64745 - }, - { - "epoch": 1.66, - "learning_rate": 8.767380368043078e-07, - "loss": 0.481, - "step": 64746 - }, - { - "epoch": 1.66, - "learning_rate": 8.767105774078478e-07, - "loss": 0.5928, - "step": 64747 - }, - { - "epoch": 1.66, - "learning_rate": 8.76683118105785e-07, - "loss": 0.7998, - "step": 64748 - }, - { - "epoch": 1.66, - "learning_rate": 8.766556588981404e-07, - "loss": 0.6904, - "step": 64749 - }, - { - "epoch": 1.66, - "learning_rate": 8.76628199784935e-07, - "loss": 0.6528, - "step": 64750 - }, - { - "epoch": 1.66, - "learning_rate": 8.766007407661893e-07, - "loss": 0.626, - "step": 64751 - }, - { - "epoch": 1.66, - "learning_rate": 8.76573281841925e-07, - "loss": 0.7012, - "step": 64752 - }, - { - "epoch": 1.66, - "learning_rate": 8.765458230121626e-07, - "loss": 0.6953, - "step": 64753 - }, - { - "epoch": 1.66, - "learning_rate": 8.765183642769236e-07, - "loss": 0.4121, - "step": 64754 - }, - { - "epoch": 1.66, - "learning_rate": 8.764909056362286e-07, - "loss": 0.5435, - "step": 64755 - }, - { - "epoch": 1.66, - "learning_rate": 8.764634470900991e-07, - "loss": 0.7656, - "step": 64756 - }, - { - "epoch": 1.66, - "learning_rate": 8.764359886385556e-07, - "loss": 0.5903, - "step": 64757 - }, - { - "epoch": 1.66, - "learning_rate": 8.764085302816196e-07, - "loss": 0.5957, - "step": 64758 - }, - { - "epoch": 1.66, - "learning_rate": 8.763810720193118e-07, - "loss": 0.6963, - "step": 64759 - }, - { - "epoch": 1.66, - "learning_rate": 8.763536138516536e-07, - "loss": 0.4824, - "step": 64760 - }, - { - "epoch": 1.66, - "learning_rate": 8.763261557786656e-07, - "loss": 0.6372, - "step": 64761 - }, - { - "epoch": 1.66, - "learning_rate": 8.762986978003688e-07, - "loss": 0.6387, - "step": 64762 - }, - { - "epoch": 1.66, - "learning_rate": 8.762712399167846e-07, - "loss": 0.8613, - "step": 64763 - }, - { - "epoch": 1.66, - "learning_rate": 8.762437821279335e-07, - "loss": 0.6968, - "step": 64764 - }, - { - "epoch": 1.66, - "learning_rate": 8.762163244338371e-07, - "loss": 0.6895, - "step": 64765 - }, - { - "epoch": 1.66, - "learning_rate": 8.761888668345162e-07, - "loss": 0.7383, - "step": 64766 - }, - { - "epoch": 1.66, - "learning_rate": 8.761614093299916e-07, - "loss": 0.7446, - "step": 64767 - }, - { - "epoch": 1.66, - "learning_rate": 8.761339519202848e-07, - "loss": 0.5527, - "step": 64768 - }, - { - "epoch": 1.66, - "learning_rate": 8.761064946054162e-07, - "loss": 0.625, - "step": 64769 - }, - { - "epoch": 1.66, - "learning_rate": 8.760790373854076e-07, - "loss": 0.5068, - "step": 64770 - }, - { - "epoch": 1.66, - "learning_rate": 8.760515802602793e-07, - "loss": 0.6309, - "step": 64771 - }, - { - "epoch": 1.66, - "learning_rate": 8.760241232300526e-07, - "loss": 0.6582, - "step": 64772 - }, - { - "epoch": 1.66, - "learning_rate": 8.759966662947487e-07, - "loss": 0.5605, - "step": 64773 - }, - { - "epoch": 1.66, - "learning_rate": 8.75969209454388e-07, - "loss": 0.6401, - "step": 64774 - }, - { - "epoch": 1.66, - "learning_rate": 8.759417527089924e-07, - "loss": 0.4548, - "step": 64775 - }, - { - "epoch": 1.66, - "learning_rate": 8.759142960585822e-07, - "loss": 0.5903, - "step": 64776 - }, - { - "epoch": 1.66, - "learning_rate": 8.75886839503179e-07, - "loss": 0.626, - "step": 64777 - }, - { - "epoch": 1.66, - "learning_rate": 8.758593830428032e-07, - "loss": 0.7236, - "step": 64778 - }, - { - "epoch": 1.66, - "learning_rate": 8.758319266774766e-07, - "loss": 0.6587, - "step": 64779 - }, - { - "epoch": 1.66, - "learning_rate": 8.758044704072198e-07, - "loss": 0.6802, - "step": 64780 - }, - { - "epoch": 1.66, - "learning_rate": 8.757770142320536e-07, - "loss": 0.6128, - "step": 64781 - }, - { - "epoch": 1.66, - "learning_rate": 8.757495581519991e-07, - "loss": 0.6929, - "step": 64782 - }, - { - "epoch": 1.66, - "learning_rate": 8.757221021670777e-07, - "loss": 0.6836, - "step": 64783 - }, - { - "epoch": 1.66, - "learning_rate": 8.756946462773099e-07, - "loss": 0.6973, - "step": 64784 - }, - { - "epoch": 1.66, - "learning_rate": 8.756671904827172e-07, - "loss": 0.6108, - "step": 64785 - }, - { - "epoch": 1.66, - "learning_rate": 8.756397347833203e-07, - "loss": 0.5938, - "step": 64786 - }, - { - "epoch": 1.66, - "learning_rate": 8.756122791791404e-07, - "loss": 0.6353, - "step": 64787 - }, - { - "epoch": 1.66, - "learning_rate": 8.755848236701982e-07, - "loss": 0.5803, - "step": 64788 - }, - { - "epoch": 1.66, - "learning_rate": 8.755573682565154e-07, - "loss": 0.5701, - "step": 64789 - }, - { - "epoch": 1.66, - "learning_rate": 8.755299129381126e-07, - "loss": 0.5869, - "step": 64790 - }, - { - "epoch": 1.66, - "learning_rate": 8.755024577150105e-07, - "loss": 0.6328, - "step": 64791 - }, - { - "epoch": 1.66, - "learning_rate": 8.754750025872308e-07, - "loss": 0.6943, - "step": 64792 - }, - { - "epoch": 1.66, - "learning_rate": 8.754475475547937e-07, - "loss": 0.7832, - "step": 64793 - }, - { - "epoch": 1.66, - "learning_rate": 8.75420092617721e-07, - "loss": 0.7295, - "step": 64794 - }, - { - "epoch": 1.66, - "learning_rate": 8.753926377760333e-07, - "loss": 0.4084, - "step": 64795 - }, - { - "epoch": 1.66, - "learning_rate": 8.753651830297517e-07, - "loss": 0.5603, - "step": 64796 - }, - { - "epoch": 1.66, - "learning_rate": 8.753377283788972e-07, - "loss": 0.6162, - "step": 64797 - }, - { - "epoch": 1.66, - "learning_rate": 8.75310273823491e-07, - "loss": 0.593, - "step": 64798 - }, - { - "epoch": 1.66, - "learning_rate": 8.75282819363554e-07, - "loss": 0.688, - "step": 64799 - }, - { - "epoch": 1.66, - "learning_rate": 8.752553649991076e-07, - "loss": 0.5508, - "step": 64800 - }, - { - "epoch": 1.66, - "learning_rate": 8.752279107301719e-07, - "loss": 0.666, - "step": 64801 - }, - { - "epoch": 1.66, - "learning_rate": 8.752004565567687e-07, - "loss": 0.877, - "step": 64802 - }, - { - "epoch": 1.66, - "learning_rate": 8.751730024789185e-07, - "loss": 0.5889, - "step": 64803 - }, - { - "epoch": 1.66, - "learning_rate": 8.751455484966428e-07, - "loss": 0.6016, - "step": 64804 - }, - { - "epoch": 1.66, - "learning_rate": 8.751180946099621e-07, - "loss": 0.502, - "step": 64805 - }, - { - "epoch": 1.66, - "learning_rate": 8.750906408188981e-07, - "loss": 0.5509, - "step": 64806 - }, - { - "epoch": 1.66, - "learning_rate": 8.750631871234712e-07, - "loss": 0.5557, - "step": 64807 - }, - { - "epoch": 1.66, - "learning_rate": 8.750357335237029e-07, - "loss": 0.4956, - "step": 64808 - }, - { - "epoch": 1.66, - "learning_rate": 8.750082800196138e-07, - "loss": 0.6191, - "step": 64809 - }, - { - "epoch": 1.66, - "learning_rate": 8.749808266112255e-07, - "loss": 0.5967, - "step": 64810 - }, - { - "epoch": 1.66, - "learning_rate": 8.749533732985583e-07, - "loss": 0.6904, - "step": 64811 - }, - { - "epoch": 1.66, - "learning_rate": 8.749259200816335e-07, - "loss": 0.6914, - "step": 64812 - }, - { - "epoch": 1.66, - "learning_rate": 8.748984669604724e-07, - "loss": 0.7124, - "step": 64813 - }, - { - "epoch": 1.66, - "learning_rate": 8.748710139350954e-07, - "loss": 0.5244, - "step": 64814 - }, - { - "epoch": 1.66, - "learning_rate": 8.748435610055244e-07, - "loss": 0.6772, - "step": 64815 - }, - { - "epoch": 1.66, - "learning_rate": 8.748161081717795e-07, - "loss": 0.7432, - "step": 64816 - }, - { - "epoch": 1.66, - "learning_rate": 8.747886554338824e-07, - "loss": 0.6431, - "step": 64817 - }, - { - "epoch": 1.66, - "learning_rate": 8.747612027918537e-07, - "loss": 0.5659, - "step": 64818 - }, - { - "epoch": 1.66, - "learning_rate": 8.747337502457148e-07, - "loss": 0.8506, - "step": 64819 - }, - { - "epoch": 1.66, - "learning_rate": 8.747062977954867e-07, - "loss": 0.6836, - "step": 64820 - }, - { - "epoch": 1.66, - "learning_rate": 8.7467884544119e-07, - "loss": 0.6567, - "step": 64821 - }, - { - "epoch": 1.66, - "learning_rate": 8.746513931828458e-07, - "loss": 0.5664, - "step": 64822 - }, - { - "epoch": 1.66, - "learning_rate": 8.746239410204754e-07, - "loss": 0.6426, - "step": 64823 - }, - { - "epoch": 1.66, - "learning_rate": 8.745964889540995e-07, - "loss": 0.6812, - "step": 64824 - }, - { - "epoch": 1.66, - "learning_rate": 8.745690369837395e-07, - "loss": 0.6787, - "step": 64825 - }, - { - "epoch": 1.66, - "learning_rate": 8.74541585109416e-07, - "loss": 0.6807, - "step": 64826 - }, - { - "epoch": 1.66, - "learning_rate": 8.745141333311506e-07, - "loss": 0.6714, - "step": 64827 - }, - { - "epoch": 1.66, - "learning_rate": 8.744866816489635e-07, - "loss": 0.792, - "step": 64828 - }, - { - "epoch": 1.66, - "learning_rate": 8.744592300628765e-07, - "loss": 0.6196, - "step": 64829 - }, - { - "epoch": 1.66, - "learning_rate": 8.744317785729106e-07, - "loss": 0.5586, - "step": 64830 - }, - { - "epoch": 1.66, - "learning_rate": 8.744043271790859e-07, - "loss": 0.5668, - "step": 64831 - }, - { - "epoch": 1.66, - "learning_rate": 8.743768758814244e-07, - "loss": 0.6836, - "step": 64832 - }, - { - "epoch": 1.66, - "learning_rate": 8.743494246799465e-07, - "loss": 0.7861, - "step": 64833 - }, - { - "epoch": 1.66, - "learning_rate": 8.743219735746737e-07, - "loss": 0.519, - "step": 64834 - }, - { - "epoch": 1.66, - "learning_rate": 8.742945225656264e-07, - "loss": 0.8115, - "step": 64835 - }, - { - "epoch": 1.66, - "learning_rate": 8.742670716528264e-07, - "loss": 0.7007, - "step": 64836 - }, - { - "epoch": 1.66, - "learning_rate": 8.742396208362941e-07, - "loss": 0.6006, - "step": 64837 - }, - { - "epoch": 1.66, - "learning_rate": 8.742121701160508e-07, - "loss": 0.6733, - "step": 64838 - }, - { - "epoch": 1.66, - "learning_rate": 8.741847194921176e-07, - "loss": 0.6514, - "step": 64839 - }, - { - "epoch": 1.66, - "learning_rate": 8.741572689645156e-07, - "loss": 0.665, - "step": 64840 - }, - { - "epoch": 1.66, - "learning_rate": 8.741298185332651e-07, - "loss": 0.6499, - "step": 64841 - }, - { - "epoch": 1.66, - "learning_rate": 8.741023681983879e-07, - "loss": 0.7451, - "step": 64842 - }, - { - "epoch": 1.66, - "learning_rate": 8.740749179599045e-07, - "loss": 0.5413, - "step": 64843 - }, - { - "epoch": 1.66, - "learning_rate": 8.740474678178363e-07, - "loss": 0.6914, - "step": 64844 - }, - { - "epoch": 1.66, - "learning_rate": 8.740200177722039e-07, - "loss": 0.6304, - "step": 64845 - }, - { - "epoch": 1.66, - "learning_rate": 8.739925678230288e-07, - "loss": 0.5542, - "step": 64846 - }, - { - "epoch": 1.66, - "learning_rate": 8.739651179703318e-07, - "loss": 0.5459, - "step": 64847 - }, - { - "epoch": 1.66, - "learning_rate": 8.739376682141339e-07, - "loss": 0.5928, - "step": 64848 - }, - { - "epoch": 1.66, - "learning_rate": 8.73910218554456e-07, - "loss": 0.5957, - "step": 64849 - }, - { - "epoch": 1.66, - "learning_rate": 8.738827689913198e-07, - "loss": 0.6357, - "step": 64850 - }, - { - "epoch": 1.66, - "learning_rate": 8.738553195247453e-07, - "loss": 0.7656, - "step": 64851 - }, - { - "epoch": 1.66, - "learning_rate": 8.738278701547539e-07, - "loss": 0.6094, - "step": 64852 - }, - { - "epoch": 1.66, - "learning_rate": 8.738004208813669e-07, - "loss": 0.6196, - "step": 64853 - }, - { - "epoch": 1.66, - "learning_rate": 8.73772971704605e-07, - "loss": 0.6528, - "step": 64854 - }, - { - "epoch": 1.66, - "learning_rate": 8.737455226244894e-07, - "loss": 0.6128, - "step": 64855 - }, - { - "epoch": 1.66, - "learning_rate": 8.737180736410411e-07, - "loss": 0.6211, - "step": 64856 - }, - { - "epoch": 1.66, - "learning_rate": 8.736906247542808e-07, - "loss": 0.5396, - "step": 64857 - }, - { - "epoch": 1.66, - "learning_rate": 8.736631759642302e-07, - "loss": 0.5283, - "step": 64858 - }, - { - "epoch": 1.66, - "learning_rate": 8.736357272709094e-07, - "loss": 0.6238, - "step": 64859 - }, - { - "epoch": 1.66, - "learning_rate": 8.736082786743405e-07, - "loss": 0.5254, - "step": 64860 - }, - { - "epoch": 1.66, - "learning_rate": 8.735808301745436e-07, - "loss": 0.5708, - "step": 64861 - }, - { - "epoch": 1.66, - "learning_rate": 8.735533817715399e-07, - "loss": 0.7793, - "step": 64862 - }, - { - "epoch": 1.66, - "learning_rate": 8.735259334653508e-07, - "loss": 0.7021, - "step": 64863 - }, - { - "epoch": 1.66, - "learning_rate": 8.734984852559969e-07, - "loss": 0.6036, - "step": 64864 - }, - { - "epoch": 1.66, - "learning_rate": 8.734710371434996e-07, - "loss": 0.6382, - "step": 64865 - }, - { - "epoch": 1.66, - "learning_rate": 8.734435891278794e-07, - "loss": 0.4995, - "step": 64866 - }, - { - "epoch": 1.66, - "learning_rate": 8.734161412091578e-07, - "loss": 0.54, - "step": 64867 - }, - { - "epoch": 1.66, - "learning_rate": 8.733886933873556e-07, - "loss": 0.4243, - "step": 64868 - }, - { - "epoch": 1.66, - "learning_rate": 8.73361245662494e-07, - "loss": 0.6582, - "step": 64869 - }, - { - "epoch": 1.66, - "learning_rate": 8.733337980345941e-07, - "loss": 0.7686, - "step": 64870 - }, - { - "epoch": 1.66, - "learning_rate": 8.733063505036762e-07, - "loss": 0.4672, - "step": 64871 - }, - { - "epoch": 1.66, - "learning_rate": 8.73278903069762e-07, - "loss": 0.7109, - "step": 64872 - }, - { - "epoch": 1.66, - "learning_rate": 8.732514557328725e-07, - "loss": 0.5977, - "step": 64873 - }, - { - "epoch": 1.66, - "learning_rate": 8.732240084930281e-07, - "loss": 0.5366, - "step": 64874 - }, - { - "epoch": 1.66, - "learning_rate": 8.731965613502505e-07, - "loss": 0.5513, - "step": 64875 - }, - { - "epoch": 1.66, - "learning_rate": 8.731691143045603e-07, - "loss": 0.4143, - "step": 64876 - }, - { - "epoch": 1.66, - "learning_rate": 8.731416673559789e-07, - "loss": 0.5508, - "step": 64877 - }, - { - "epoch": 1.66, - "learning_rate": 8.731142205045269e-07, - "loss": 0.603, - "step": 64878 - }, - { - "epoch": 1.66, - "learning_rate": 8.730867737502257e-07, - "loss": 0.5713, - "step": 64879 - }, - { - "epoch": 1.66, - "learning_rate": 8.730593270930963e-07, - "loss": 0.6333, - "step": 64880 - }, - { - "epoch": 1.66, - "learning_rate": 8.730318805331591e-07, - "loss": 0.7119, - "step": 64881 - }, - { - "epoch": 1.66, - "learning_rate": 8.730044340704359e-07, - "loss": 0.666, - "step": 64882 - }, - { - "epoch": 1.66, - "learning_rate": 8.72976987704947e-07, - "loss": 0.6436, - "step": 64883 - }, - { - "epoch": 1.66, - "learning_rate": 8.729495414367141e-07, - "loss": 0.7324, - "step": 64884 - }, - { - "epoch": 1.66, - "learning_rate": 8.729220952657576e-07, - "loss": 0.8232, - "step": 64885 - }, - { - "epoch": 1.66, - "learning_rate": 8.72894649192099e-07, - "loss": 0.6504, - "step": 64886 - }, - { - "epoch": 1.66, - "learning_rate": 8.72867203215759e-07, - "loss": 0.5979, - "step": 64887 - }, - { - "epoch": 1.66, - "learning_rate": 8.728397573367589e-07, - "loss": 0.6152, - "step": 64888 - }, - { - "epoch": 1.66, - "learning_rate": 8.728123115551193e-07, - "loss": 0.5151, - "step": 64889 - }, - { - "epoch": 1.66, - "learning_rate": 8.727848658708621e-07, - "loss": 0.6826, - "step": 64890 - }, - { - "epoch": 1.66, - "learning_rate": 8.727574202840071e-07, - "loss": 0.5446, - "step": 64891 - }, - { - "epoch": 1.66, - "learning_rate": 8.727299747945761e-07, - "loss": 0.603, - "step": 64892 - }, - { - "epoch": 1.66, - "learning_rate": 8.727025294025896e-07, - "loss": 0.6221, - "step": 64893 - }, - { - "epoch": 1.66, - "learning_rate": 8.726750841080692e-07, - "loss": 0.5811, - "step": 64894 - }, - { - "epoch": 1.66, - "learning_rate": 8.726476389110355e-07, - "loss": 0.5493, - "step": 64895 - }, - { - "epoch": 1.66, - "learning_rate": 8.726201938115098e-07, - "loss": 0.603, - "step": 64896 - }, - { - "epoch": 1.66, - "learning_rate": 8.725927488095127e-07, - "loss": 0.6357, - "step": 64897 - }, - { - "epoch": 1.66, - "learning_rate": 8.725653039050658e-07, - "loss": 0.5764, - "step": 64898 - }, - { - "epoch": 1.66, - "learning_rate": 8.725378590981895e-07, - "loss": 0.6079, - "step": 64899 - }, - { - "epoch": 1.66, - "learning_rate": 8.725104143889055e-07, - "loss": 0.6934, - "step": 64900 - }, - { - "epoch": 1.66, - "learning_rate": 8.724829697772342e-07, - "loss": 0.6001, - "step": 64901 - }, - { - "epoch": 1.66, - "learning_rate": 8.724555252631967e-07, - "loss": 0.6665, - "step": 64902 - }, - { - "epoch": 1.66, - "learning_rate": 8.724280808468143e-07, - "loss": 0.4741, - "step": 64903 - }, - { - "epoch": 1.66, - "learning_rate": 8.724006365281076e-07, - "loss": 0.7178, - "step": 64904 - }, - { - "epoch": 1.66, - "learning_rate": 8.72373192307098e-07, - "loss": 0.6738, - "step": 64905 - }, - { - "epoch": 1.66, - "learning_rate": 8.723457481838064e-07, - "loss": 0.5212, - "step": 64906 - }, - { - "epoch": 1.66, - "learning_rate": 8.723183041582538e-07, - "loss": 0.7393, - "step": 64907 - }, - { - "epoch": 1.66, - "learning_rate": 8.72290860230461e-07, - "loss": 0.5016, - "step": 64908 - }, - { - "epoch": 1.66, - "learning_rate": 8.722634164004496e-07, - "loss": 0.5996, - "step": 64909 - }, - { - "epoch": 1.66, - "learning_rate": 8.722359726682403e-07, - "loss": 0.4175, - "step": 64910 - }, - { - "epoch": 1.66, - "learning_rate": 8.722085290338539e-07, - "loss": 0.5913, - "step": 64911 - }, - { - "epoch": 1.66, - "learning_rate": 8.721810854973112e-07, - "loss": 0.6748, - "step": 64912 - }, - { - "epoch": 1.66, - "learning_rate": 8.72153642058634e-07, - "loss": 0.647, - "step": 64913 - }, - { - "epoch": 1.66, - "learning_rate": 8.721261987178426e-07, - "loss": 0.6211, - "step": 64914 - }, - { - "epoch": 1.66, - "learning_rate": 8.720987554749585e-07, - "loss": 0.6201, - "step": 64915 - }, - { - "epoch": 1.66, - "learning_rate": 8.720713123300022e-07, - "loss": 0.3367, - "step": 64916 - }, - { - "epoch": 1.66, - "learning_rate": 8.720438692829953e-07, - "loss": 0.6606, - "step": 64917 - }, - { - "epoch": 1.66, - "learning_rate": 8.720164263339583e-07, - "loss": 0.708, - "step": 64918 - }, - { - "epoch": 1.66, - "learning_rate": 8.719889834829126e-07, - "loss": 0.3324, - "step": 64919 - }, - { - "epoch": 1.66, - "learning_rate": 8.719615407298793e-07, - "loss": 0.5801, - "step": 64920 - }, - { - "epoch": 1.66, - "learning_rate": 8.719340980748788e-07, - "loss": 0.8564, - "step": 64921 - }, - { - "epoch": 1.66, - "learning_rate": 8.719066555179326e-07, - "loss": 0.604, - "step": 64922 - }, - { - "epoch": 1.66, - "learning_rate": 8.718792130590613e-07, - "loss": 0.7402, - "step": 64923 - }, - { - "epoch": 1.66, - "learning_rate": 8.718517706982865e-07, - "loss": 0.5396, - "step": 64924 - }, - { - "epoch": 1.66, - "learning_rate": 8.718243284356287e-07, - "loss": 0.6582, - "step": 64925 - }, - { - "epoch": 1.66, - "learning_rate": 8.717968862711094e-07, - "loss": 0.6216, - "step": 64926 - }, - { - "epoch": 1.66, - "learning_rate": 8.71769444204749e-07, - "loss": 0.6904, - "step": 64927 - }, - { - "epoch": 1.66, - "learning_rate": 8.717420022365692e-07, - "loss": 0.5234, - "step": 64928 - }, - { - "epoch": 1.66, - "learning_rate": 8.717145603665904e-07, - "loss": 0.5747, - "step": 64929 - }, - { - "epoch": 1.66, - "learning_rate": 8.716871185948342e-07, - "loss": 0.6279, - "step": 64930 - }, - { - "epoch": 1.66, - "learning_rate": 8.716596769213209e-07, - "loss": 0.6641, - "step": 64931 - }, - { - "epoch": 1.66, - "learning_rate": 8.716322353460721e-07, - "loss": 0.6982, - "step": 64932 - }, - { - "epoch": 1.66, - "learning_rate": 8.716047938691084e-07, - "loss": 0.6792, - "step": 64933 - }, - { - "epoch": 1.66, - "learning_rate": 8.715773524904511e-07, - "loss": 0.667, - "step": 64934 - }, - { - "epoch": 1.66, - "learning_rate": 8.71549911210121e-07, - "loss": 0.6504, - "step": 64935 - }, - { - "epoch": 1.66, - "learning_rate": 8.715224700281394e-07, - "loss": 0.5967, - "step": 64936 - }, - { - "epoch": 1.66, - "learning_rate": 8.714950289445269e-07, - "loss": 0.4773, - "step": 64937 - }, - { - "epoch": 1.66, - "learning_rate": 8.714675879593049e-07, - "loss": 0.7803, - "step": 64938 - }, - { - "epoch": 1.66, - "learning_rate": 8.714401470724942e-07, - "loss": 0.5513, - "step": 64939 - }, - { - "epoch": 1.66, - "learning_rate": 8.714127062841162e-07, - "loss": 0.6121, - "step": 64940 - }, - { - "epoch": 1.66, - "learning_rate": 8.713852655941914e-07, - "loss": 0.4902, - "step": 64941 - }, - { - "epoch": 1.66, - "learning_rate": 8.713578250027408e-07, - "loss": 0.6885, - "step": 64942 - }, - { - "epoch": 1.66, - "learning_rate": 8.713303845097859e-07, - "loss": 0.6748, - "step": 64943 - }, - { - "epoch": 1.66, - "learning_rate": 8.71302944115347e-07, - "loss": 0.4602, - "step": 64944 - }, - { - "epoch": 1.66, - "learning_rate": 8.712755038194458e-07, - "loss": 0.3499, - "step": 64945 - }, - { - "epoch": 1.66, - "learning_rate": 8.71248063622103e-07, - "loss": 0.75, - "step": 64946 - }, - { - "epoch": 1.66, - "learning_rate": 8.712206235233395e-07, - "loss": 0.5879, - "step": 64947 - }, - { - "epoch": 1.66, - "learning_rate": 8.711931835231766e-07, - "loss": 0.4783, - "step": 64948 - }, - { - "epoch": 1.66, - "learning_rate": 8.71165743621635e-07, - "loss": 0.6665, - "step": 64949 - }, - { - "epoch": 1.66, - "learning_rate": 8.711383038187362e-07, - "loss": 0.6826, - "step": 64950 - }, - { - "epoch": 1.66, - "learning_rate": 8.711108641145008e-07, - "loss": 0.8467, - "step": 64951 - }, - { - "epoch": 1.66, - "learning_rate": 8.710834245089495e-07, - "loss": 0.8262, - "step": 64952 - }, - { - "epoch": 1.66, - "learning_rate": 8.71055985002104e-07, - "loss": 0.5732, - "step": 64953 - }, - { - "epoch": 1.66, - "learning_rate": 8.710285455939848e-07, - "loss": 0.605, - "step": 64954 - }, - { - "epoch": 1.66, - "learning_rate": 8.710011062846133e-07, - "loss": 0.6064, - "step": 64955 - }, - { - "epoch": 1.66, - "learning_rate": 8.709736670740102e-07, - "loss": 0.7109, - "step": 64956 - }, - { - "epoch": 1.66, - "learning_rate": 8.709462279621968e-07, - "loss": 0.5942, - "step": 64957 - }, - { - "epoch": 1.66, - "learning_rate": 8.709187889491936e-07, - "loss": 0.603, - "step": 64958 - }, - { - "epoch": 1.66, - "learning_rate": 8.708913500350223e-07, - "loss": 0.6611, - "step": 64959 - }, - { - "epoch": 1.66, - "learning_rate": 8.708639112197037e-07, - "loss": 0.7061, - "step": 64960 - }, - { - "epoch": 1.66, - "learning_rate": 8.708364725032583e-07, - "loss": 0.6426, - "step": 64961 - }, - { - "epoch": 1.67, - "learning_rate": 8.708090338857076e-07, - "loss": 0.5288, - "step": 64962 - }, - { - "epoch": 1.67, - "learning_rate": 8.707815953670726e-07, - "loss": 0.5923, - "step": 64963 - }, - { - "epoch": 1.67, - "learning_rate": 8.707541569473739e-07, - "loss": 0.6875, - "step": 64964 - }, - { - "epoch": 1.67, - "learning_rate": 8.70726718626633e-07, - "loss": 0.2667, - "step": 64965 - }, - { - "epoch": 1.67, - "learning_rate": 8.706992804048705e-07, - "loss": 0.6123, - "step": 64966 - }, - { - "epoch": 1.67, - "learning_rate": 8.706718422821079e-07, - "loss": 0.7188, - "step": 64967 - }, - { - "epoch": 1.67, - "learning_rate": 8.706444042583656e-07, - "loss": 0.5947, - "step": 64968 - }, - { - "epoch": 1.67, - "learning_rate": 8.706169663336652e-07, - "loss": 0.6455, - "step": 64969 - }, - { - "epoch": 1.67, - "learning_rate": 8.705895285080277e-07, - "loss": 0.6711, - "step": 64970 - }, - { - "epoch": 1.67, - "learning_rate": 8.705620907814733e-07, - "loss": 0.626, - "step": 64971 - }, - { - "epoch": 1.67, - "learning_rate": 8.705346531540238e-07, - "loss": 0.7764, - "step": 64972 - }, - { - "epoch": 1.67, - "learning_rate": 8.705072156256998e-07, - "loss": 0.6333, - "step": 64973 - }, - { - "epoch": 1.67, - "learning_rate": 8.704797781965227e-07, - "loss": 0.4651, - "step": 64974 - }, - { - "epoch": 1.67, - "learning_rate": 8.704523408665131e-07, - "loss": 0.7539, - "step": 64975 - }, - { - "epoch": 1.67, - "learning_rate": 8.704249036356923e-07, - "loss": 0.5554, - "step": 64976 - }, - { - "epoch": 1.67, - "learning_rate": 8.70397466504081e-07, - "loss": 0.7031, - "step": 64977 - }, - { - "epoch": 1.67, - "learning_rate": 8.703700294717007e-07, - "loss": 0.6997, - "step": 64978 - }, - { - "epoch": 1.67, - "learning_rate": 8.703425925385718e-07, - "loss": 0.751, - "step": 64979 - }, - { - "epoch": 1.67, - "learning_rate": 8.703151557047164e-07, - "loss": 0.6592, - "step": 64980 - }, - { - "epoch": 1.67, - "learning_rate": 8.702877189701538e-07, - "loss": 0.7393, - "step": 64981 - }, - { - "epoch": 1.67, - "learning_rate": 8.702602823349063e-07, - "loss": 0.6362, - "step": 64982 - }, - { - "epoch": 1.67, - "learning_rate": 8.702328457989945e-07, - "loss": 0.52, - "step": 64983 - }, - { - "epoch": 1.67, - "learning_rate": 8.702054093624393e-07, - "loss": 0.6196, - "step": 64984 - }, - { - "epoch": 1.67, - "learning_rate": 8.701779730252619e-07, - "loss": 0.6123, - "step": 64985 - }, - { - "epoch": 1.67, - "learning_rate": 8.701505367874834e-07, - "loss": 0.4768, - "step": 64986 - }, - { - "epoch": 1.67, - "learning_rate": 8.701231006491245e-07, - "loss": 0.7158, - "step": 64987 - }, - { - "epoch": 1.67, - "learning_rate": 8.700956646102064e-07, - "loss": 0.7373, - "step": 64988 - }, - { - "epoch": 1.67, - "learning_rate": 8.700682286707501e-07, - "loss": 0.4431, - "step": 64989 - }, - { - "epoch": 1.67, - "learning_rate": 8.700407928307769e-07, - "loss": 0.6196, - "step": 64990 - }, - { - "epoch": 1.67, - "learning_rate": 8.700133570903073e-07, - "loss": 0.7451, - "step": 64991 - }, - { - "epoch": 1.67, - "learning_rate": 8.699859214493622e-07, - "loss": 0.7812, - "step": 64992 - }, - { - "epoch": 1.67, - "learning_rate": 8.699584859079632e-07, - "loss": 0.573, - "step": 64993 - }, - { - "epoch": 1.67, - "learning_rate": 8.699310504661308e-07, - "loss": 0.4912, - "step": 64994 - }, - { - "epoch": 1.67, - "learning_rate": 8.699036151238863e-07, - "loss": 0.6177, - "step": 64995 - }, - { - "epoch": 1.67, - "learning_rate": 8.698761798812507e-07, - "loss": 0.7803, - "step": 64996 - }, - { - "epoch": 1.67, - "learning_rate": 8.698487447382447e-07, - "loss": 0.6924, - "step": 64997 - }, - { - "epoch": 1.67, - "learning_rate": 8.698213096948897e-07, - "loss": 0.7012, - "step": 64998 - }, - { - "epoch": 1.67, - "learning_rate": 8.697938747512066e-07, - "loss": 0.7021, - "step": 64999 - }, - { - "epoch": 1.67, - "learning_rate": 8.697664399072166e-07, - "loss": 0.6416, - "step": 65000 - }, - { - "epoch": 1.67, - "learning_rate": 8.697390051629402e-07, - "loss": 0.647, - "step": 65001 - }, - { - "epoch": 1.67, - "learning_rate": 8.697115705183984e-07, - "loss": 0.5986, - "step": 65002 - }, - { - "epoch": 1.67, - "learning_rate": 8.696841359736127e-07, - "loss": 0.6035, - "step": 65003 - }, - { - "epoch": 1.67, - "learning_rate": 8.696567015286037e-07, - "loss": 0.6846, - "step": 65004 - }, - { - "epoch": 1.67, - "learning_rate": 8.696292671833927e-07, - "loss": 0.5737, - "step": 65005 - }, - { - "epoch": 1.67, - "learning_rate": 8.696018329380003e-07, - "loss": 0.6299, - "step": 65006 - }, - { - "epoch": 1.67, - "learning_rate": 8.695743987924482e-07, - "loss": 0.6592, - "step": 65007 - }, - { - "epoch": 1.67, - "learning_rate": 8.695469647467567e-07, - "loss": 0.6426, - "step": 65008 - }, - { - "epoch": 1.67, - "learning_rate": 8.695195308009473e-07, - "loss": 0.6465, - "step": 65009 - }, - { - "epoch": 1.67, - "learning_rate": 8.69492096955041e-07, - "loss": 0.6621, - "step": 65010 - }, - { - "epoch": 1.67, - "learning_rate": 8.694646632090582e-07, - "loss": 0.6924, - "step": 65011 - }, - { - "epoch": 1.67, - "learning_rate": 8.694372295630204e-07, - "loss": 0.7881, - "step": 65012 - }, - { - "epoch": 1.67, - "learning_rate": 8.694097960169484e-07, - "loss": 0.7549, - "step": 65013 - }, - { - "epoch": 1.67, - "learning_rate": 8.693823625708636e-07, - "loss": 0.5713, - "step": 65014 - }, - { - "epoch": 1.67, - "learning_rate": 8.693549292247864e-07, - "loss": 0.6377, - "step": 65015 - }, - { - "epoch": 1.67, - "learning_rate": 8.693274959787383e-07, - "loss": 0.6455, - "step": 65016 - }, - { - "epoch": 1.67, - "learning_rate": 8.6930006283274e-07, - "loss": 0.6494, - "step": 65017 - }, - { - "epoch": 1.67, - "learning_rate": 8.692726297868128e-07, - "loss": 0.5, - "step": 65018 - }, - { - "epoch": 1.67, - "learning_rate": 8.692451968409777e-07, - "loss": 0.7271, - "step": 65019 - }, - { - "epoch": 1.67, - "learning_rate": 8.692177639952555e-07, - "loss": 0.6025, - "step": 65020 - }, - { - "epoch": 1.67, - "learning_rate": 8.691903312496669e-07, - "loss": 0.519, - "step": 65021 - }, - { - "epoch": 1.67, - "learning_rate": 8.691628986042335e-07, - "loss": 0.7061, - "step": 65022 - }, - { - "epoch": 1.67, - "learning_rate": 8.691354660589758e-07, - "loss": 0.5186, - "step": 65023 - }, - { - "epoch": 1.67, - "learning_rate": 8.691080336139153e-07, - "loss": 0.6206, - "step": 65024 - }, - { - "epoch": 1.67, - "learning_rate": 8.690806012690725e-07, - "loss": 0.7734, - "step": 65025 - }, - { - "epoch": 1.67, - "learning_rate": 8.690531690244689e-07, - "loss": 0.4861, - "step": 65026 - }, - { - "epoch": 1.67, - "learning_rate": 8.690257368801251e-07, - "loss": 0.4944, - "step": 65027 - }, - { - "epoch": 1.67, - "learning_rate": 8.689983048360625e-07, - "loss": 0.7686, - "step": 65028 - }, - { - "epoch": 1.67, - "learning_rate": 8.68970872892302e-07, - "loss": 0.668, - "step": 65029 - }, - { - "epoch": 1.67, - "learning_rate": 8.68943441048864e-07, - "loss": 0.5969, - "step": 65030 - }, - { - "epoch": 1.67, - "learning_rate": 8.689160093057703e-07, - "loss": 0.751, - "step": 65031 - }, - { - "epoch": 1.67, - "learning_rate": 8.688885776630414e-07, - "loss": 0.5332, - "step": 65032 - }, - { - "epoch": 1.67, - "learning_rate": 8.688611461206987e-07, - "loss": 0.4998, - "step": 65033 - }, - { - "epoch": 1.67, - "learning_rate": 8.688337146787628e-07, - "loss": 0.7998, - "step": 65034 - }, - { - "epoch": 1.67, - "learning_rate": 8.688062833372549e-07, - "loss": 0.5742, - "step": 65035 - }, - { - "epoch": 1.67, - "learning_rate": 8.687788520961961e-07, - "loss": 0.5532, - "step": 65036 - }, - { - "epoch": 1.67, - "learning_rate": 8.687514209556072e-07, - "loss": 0.4434, - "step": 65037 - }, - { - "epoch": 1.67, - "learning_rate": 8.687239899155095e-07, - "loss": 0.6855, - "step": 65038 - }, - { - "epoch": 1.67, - "learning_rate": 8.68696558975924e-07, - "loss": 0.5771, - "step": 65039 - }, - { - "epoch": 1.67, - "learning_rate": 8.68669128136871e-07, - "loss": 0.71, - "step": 65040 - }, - { - "epoch": 1.67, - "learning_rate": 8.686416973983722e-07, - "loss": 0.6445, - "step": 65041 - }, - { - "epoch": 1.67, - "learning_rate": 8.686142667604484e-07, - "loss": 0.6973, - "step": 65042 - }, - { - "epoch": 1.67, - "learning_rate": 8.685868362231206e-07, - "loss": 0.5564, - "step": 65043 - }, - { - "epoch": 1.67, - "learning_rate": 8.685594057864096e-07, - "loss": 0.6377, - "step": 65044 - }, - { - "epoch": 1.67, - "learning_rate": 8.68531975450337e-07, - "loss": 0.7119, - "step": 65045 - }, - { - "epoch": 1.67, - "learning_rate": 8.685045452149231e-07, - "loss": 0.5596, - "step": 65046 - }, - { - "epoch": 1.67, - "learning_rate": 8.684771150801895e-07, - "loss": 0.54, - "step": 65047 - }, - { - "epoch": 1.67, - "learning_rate": 8.684496850461567e-07, - "loss": 0.8135, - "step": 65048 - }, - { - "epoch": 1.67, - "learning_rate": 8.684222551128464e-07, - "loss": 0.707, - "step": 65049 - }, - { - "epoch": 1.67, - "learning_rate": 8.683948252802787e-07, - "loss": 0.6523, - "step": 65050 - }, - { - "epoch": 1.67, - "learning_rate": 8.68367395548475e-07, - "loss": 0.6992, - "step": 65051 - }, - { - "epoch": 1.67, - "learning_rate": 8.683399659174566e-07, - "loss": 0.604, - "step": 65052 - }, - { - "epoch": 1.67, - "learning_rate": 8.683125363872442e-07, - "loss": 0.7021, - "step": 65053 - }, - { - "epoch": 1.67, - "learning_rate": 8.682851069578585e-07, - "loss": 0.6807, - "step": 65054 - }, - { - "epoch": 1.67, - "learning_rate": 8.682576776293211e-07, - "loss": 0.6987, - "step": 65055 - }, - { - "epoch": 1.67, - "learning_rate": 8.682302484016526e-07, - "loss": 0.8018, - "step": 65056 - }, - { - "epoch": 1.67, - "learning_rate": 8.682028192748742e-07, - "loss": 0.5146, - "step": 65057 - }, - { - "epoch": 1.67, - "learning_rate": 8.681753902490068e-07, - "loss": 0.625, - "step": 65058 - }, - { - "epoch": 1.67, - "learning_rate": 8.681479613240718e-07, - "loss": 0.6196, - "step": 65059 - }, - { - "epoch": 1.67, - "learning_rate": 8.681205325000896e-07, - "loss": 0.6797, - "step": 65060 - }, - { - "epoch": 1.67, - "learning_rate": 8.680931037770812e-07, - "loss": 0.5229, - "step": 65061 - }, - { - "epoch": 1.67, - "learning_rate": 8.680656751550681e-07, - "loss": 0.6504, - "step": 65062 - }, - { - "epoch": 1.67, - "learning_rate": 8.68038246634071e-07, - "loss": 0.6572, - "step": 65063 - }, - { - "epoch": 1.67, - "learning_rate": 8.680108182141109e-07, - "loss": 0.7393, - "step": 65064 - }, - { - "epoch": 1.67, - "learning_rate": 8.679833898952088e-07, - "loss": 0.4739, - "step": 65065 - }, - { - "epoch": 1.67, - "learning_rate": 8.679559616773859e-07, - "loss": 0.6016, - "step": 65066 - }, - { - "epoch": 1.67, - "learning_rate": 8.679285335606628e-07, - "loss": 0.7754, - "step": 65067 - }, - { - "epoch": 1.67, - "learning_rate": 8.67901105545061e-07, - "loss": 0.6621, - "step": 65068 - }, - { - "epoch": 1.67, - "learning_rate": 8.678736776306015e-07, - "loss": 0.7822, - "step": 65069 - }, - { - "epoch": 1.67, - "learning_rate": 8.678462498173048e-07, - "loss": 0.7734, - "step": 65070 - }, - { - "epoch": 1.67, - "learning_rate": 8.678188221051919e-07, - "loss": 0.6855, - "step": 65071 - }, - { - "epoch": 1.67, - "learning_rate": 8.677913944942843e-07, - "loss": 0.5786, - "step": 65072 - }, - { - "epoch": 1.67, - "learning_rate": 8.677639669846027e-07, - "loss": 0.7646, - "step": 65073 - }, - { - "epoch": 1.67, - "learning_rate": 8.677365395761681e-07, - "loss": 0.7256, - "step": 65074 - }, - { - "epoch": 1.67, - "learning_rate": 8.677091122690015e-07, - "loss": 0.7383, - "step": 65075 - }, - { - "epoch": 1.67, - "learning_rate": 8.67681685063124e-07, - "loss": 0.5359, - "step": 65076 - }, - { - "epoch": 1.67, - "learning_rate": 8.676542579585564e-07, - "loss": 0.626, - "step": 65077 - }, - { - "epoch": 1.67, - "learning_rate": 8.676268309553202e-07, - "loss": 0.7495, - "step": 65078 - }, - { - "epoch": 1.67, - "learning_rate": 8.675994040534362e-07, - "loss": 0.6885, - "step": 65079 - }, - { - "epoch": 1.67, - "learning_rate": 8.675719772529247e-07, - "loss": 0.752, - "step": 65080 - }, - { - "epoch": 1.67, - "learning_rate": 8.675445505538076e-07, - "loss": 0.627, - "step": 65081 - }, - { - "epoch": 1.67, - "learning_rate": 8.675171239561052e-07, - "loss": 0.6758, - "step": 65082 - }, - { - "epoch": 1.67, - "learning_rate": 8.674896974598391e-07, - "loss": 0.4558, - "step": 65083 - }, - { - "epoch": 1.67, - "learning_rate": 8.674622710650299e-07, - "loss": 0.793, - "step": 65084 - }, - { - "epoch": 1.67, - "learning_rate": 8.67434844771699e-07, - "loss": 0.6367, - "step": 65085 - }, - { - "epoch": 1.67, - "learning_rate": 8.674074185798668e-07, - "loss": 0.5898, - "step": 65086 - }, - { - "epoch": 1.67, - "learning_rate": 8.67379992489555e-07, - "loss": 0.6394, - "step": 65087 - }, - { - "epoch": 1.67, - "learning_rate": 8.673525665007839e-07, - "loss": 0.7124, - "step": 65088 - }, - { - "epoch": 1.67, - "learning_rate": 8.673251406135755e-07, - "loss": 0.6362, - "step": 65089 - }, - { - "epoch": 1.67, - "learning_rate": 8.672977148279495e-07, - "loss": 0.6646, - "step": 65090 - }, - { - "epoch": 1.67, - "learning_rate": 8.672702891439279e-07, - "loss": 0.5166, - "step": 65091 - }, - { - "epoch": 1.67, - "learning_rate": 8.67242863561531e-07, - "loss": 0.502, - "step": 65092 - }, - { - "epoch": 1.67, - "learning_rate": 8.672154380807804e-07, - "loss": 0.7412, - "step": 65093 - }, - { - "epoch": 1.67, - "learning_rate": 8.671880127016963e-07, - "loss": 0.8213, - "step": 65094 - }, - { - "epoch": 1.67, - "learning_rate": 8.671605874243008e-07, - "loss": 0.5532, - "step": 65095 - }, - { - "epoch": 1.67, - "learning_rate": 8.671331622486141e-07, - "loss": 0.8242, - "step": 65096 - }, - { - "epoch": 1.67, - "learning_rate": 8.671057371746575e-07, - "loss": 0.6904, - "step": 65097 - }, - { - "epoch": 1.67, - "learning_rate": 8.670783122024519e-07, - "loss": 0.6758, - "step": 65098 - }, - { - "epoch": 1.67, - "learning_rate": 8.670508873320186e-07, - "loss": 0.7324, - "step": 65099 - }, - { - "epoch": 1.67, - "learning_rate": 8.670234625633781e-07, - "loss": 0.7812, - "step": 65100 - }, - { - "epoch": 1.67, - "learning_rate": 8.669960378965515e-07, - "loss": 0.6357, - "step": 65101 - }, - { - "epoch": 1.67, - "learning_rate": 8.669686133315601e-07, - "loss": 0.7598, - "step": 65102 - }, - { - "epoch": 1.67, - "learning_rate": 8.669411888684244e-07, - "loss": 0.5481, - "step": 65103 - }, - { - "epoch": 1.67, - "learning_rate": 8.66913764507166e-07, - "loss": 0.5483, - "step": 65104 - }, - { - "epoch": 1.67, - "learning_rate": 8.668863402478055e-07, - "loss": 0.5106, - "step": 65105 - }, - { - "epoch": 1.67, - "learning_rate": 8.668589160903641e-07, - "loss": 0.6562, - "step": 65106 - }, - { - "epoch": 1.67, - "learning_rate": 8.668314920348625e-07, - "loss": 0.6611, - "step": 65107 - }, - { - "epoch": 1.67, - "learning_rate": 8.668040680813222e-07, - "loss": 0.4812, - "step": 65108 - }, - { - "epoch": 1.67, - "learning_rate": 8.66776644229764e-07, - "loss": 0.6494, - "step": 65109 - }, - { - "epoch": 1.67, - "learning_rate": 8.667492204802087e-07, - "loss": 0.7021, - "step": 65110 - }, - { - "epoch": 1.67, - "learning_rate": 8.667217968326771e-07, - "loss": 0.4702, - "step": 65111 - }, - { - "epoch": 1.67, - "learning_rate": 8.666943732871908e-07, - "loss": 0.5146, - "step": 65112 - }, - { - "epoch": 1.67, - "learning_rate": 8.666669498437701e-07, - "loss": 0.6704, - "step": 65113 - }, - { - "epoch": 1.67, - "learning_rate": 8.666395265024367e-07, - "loss": 0.7109, - "step": 65114 - }, - { - "epoch": 1.67, - "learning_rate": 8.666121032632111e-07, - "loss": 0.708, - "step": 65115 - }, - { - "epoch": 1.67, - "learning_rate": 8.665846801261146e-07, - "loss": 0.5938, - "step": 65116 - }, - { - "epoch": 1.67, - "learning_rate": 8.66557257091168e-07, - "loss": 0.5854, - "step": 65117 - }, - { - "epoch": 1.67, - "learning_rate": 8.665298341583924e-07, - "loss": 0.7012, - "step": 65118 - }, - { - "epoch": 1.67, - "learning_rate": 8.665024113278092e-07, - "loss": 0.6592, - "step": 65119 - }, - { - "epoch": 1.67, - "learning_rate": 8.664749885994384e-07, - "loss": 0.6338, - "step": 65120 - }, - { - "epoch": 1.67, - "learning_rate": 8.664475659733018e-07, - "loss": 0.6338, - "step": 65121 - }, - { - "epoch": 1.67, - "learning_rate": 8.664201434494199e-07, - "loss": 0.6558, - "step": 65122 - }, - { - "epoch": 1.67, - "learning_rate": 8.663927210278144e-07, - "loss": 0.5688, - "step": 65123 - }, - { - "epoch": 1.67, - "learning_rate": 8.663652987085052e-07, - "loss": 0.4788, - "step": 65124 - }, - { - "epoch": 1.67, - "learning_rate": 8.663378764915146e-07, - "loss": 0.6821, - "step": 65125 - }, - { - "epoch": 1.67, - "learning_rate": 8.663104543768626e-07, - "loss": 0.613, - "step": 65126 - }, - { - "epoch": 1.67, - "learning_rate": 8.662830323645705e-07, - "loss": 0.5601, - "step": 65127 - }, - { - "epoch": 1.67, - "learning_rate": 8.662556104546596e-07, - "loss": 0.6318, - "step": 65128 - }, - { - "epoch": 1.67, - "learning_rate": 8.662281886471508e-07, - "loss": 0.6504, - "step": 65129 - }, - { - "epoch": 1.67, - "learning_rate": 8.662007669420644e-07, - "loss": 0.6865, - "step": 65130 - }, - { - "epoch": 1.67, - "learning_rate": 8.661733453394222e-07, - "loss": 0.5979, - "step": 65131 - }, - { - "epoch": 1.67, - "learning_rate": 8.661459238392448e-07, - "loss": 0.4546, - "step": 65132 - }, - { - "epoch": 1.67, - "learning_rate": 8.661185024415533e-07, - "loss": 0.5518, - "step": 65133 - }, - { - "epoch": 1.67, - "learning_rate": 8.660910811463688e-07, - "loss": 0.6738, - "step": 65134 - }, - { - "epoch": 1.67, - "learning_rate": 8.660636599537121e-07, - "loss": 0.5977, - "step": 65135 - }, - { - "epoch": 1.67, - "learning_rate": 8.660362388636042e-07, - "loss": 0.749, - "step": 65136 - }, - { - "epoch": 1.67, - "learning_rate": 8.660088178760665e-07, - "loss": 0.6206, - "step": 65137 - }, - { - "epoch": 1.67, - "learning_rate": 8.659813969911194e-07, - "loss": 0.5498, - "step": 65138 - }, - { - "epoch": 1.67, - "learning_rate": 8.659539762087846e-07, - "loss": 0.6797, - "step": 65139 - }, - { - "epoch": 1.67, - "learning_rate": 8.659265555290824e-07, - "loss": 0.584, - "step": 65140 - }, - { - "epoch": 1.67, - "learning_rate": 8.658991349520341e-07, - "loss": 0.5933, - "step": 65141 - }, - { - "epoch": 1.67, - "learning_rate": 8.658717144776607e-07, - "loss": 0.7451, - "step": 65142 - }, - { - "epoch": 1.67, - "learning_rate": 8.658442941059832e-07, - "loss": 0.7539, - "step": 65143 - }, - { - "epoch": 1.67, - "learning_rate": 8.658168738370222e-07, - "loss": 0.5215, - "step": 65144 - }, - { - "epoch": 1.67, - "learning_rate": 8.657894536707995e-07, - "loss": 0.6162, - "step": 65145 - }, - { - "epoch": 1.67, - "learning_rate": 8.657620336073353e-07, - "loss": 0.6748, - "step": 65146 - }, - { - "epoch": 1.67, - "learning_rate": 8.65734613646651e-07, - "loss": 0.5461, - "step": 65147 - }, - { - "epoch": 1.67, - "learning_rate": 8.657071937887675e-07, - "loss": 0.6191, - "step": 65148 - }, - { - "epoch": 1.67, - "learning_rate": 8.656797740337063e-07, - "loss": 0.5245, - "step": 65149 - }, - { - "epoch": 1.67, - "learning_rate": 8.656523543814876e-07, - "loss": 0.5347, - "step": 65150 - }, - { - "epoch": 1.67, - "learning_rate": 8.656249348321325e-07, - "loss": 0.7627, - "step": 65151 - }, - { - "epoch": 1.67, - "learning_rate": 8.655975153856625e-07, - "loss": 0.5513, - "step": 65152 - }, - { - "epoch": 1.67, - "learning_rate": 8.65570096042098e-07, - "loss": 0.6758, - "step": 65153 - }, - { - "epoch": 1.67, - "learning_rate": 8.655426768014607e-07, - "loss": 0.7998, - "step": 65154 - }, - { - "epoch": 1.67, - "learning_rate": 8.655152576637708e-07, - "loss": 0.6963, - "step": 65155 - }, - { - "epoch": 1.67, - "learning_rate": 8.654878386290499e-07, - "loss": 0.4182, - "step": 65156 - }, - { - "epoch": 1.67, - "learning_rate": 8.654604196973186e-07, - "loss": 0.5981, - "step": 65157 - }, - { - "epoch": 1.67, - "learning_rate": 8.654330008685983e-07, - "loss": 0.667, - "step": 65158 - }, - { - "epoch": 1.67, - "learning_rate": 8.654055821429101e-07, - "loss": 0.792, - "step": 65159 - }, - { - "epoch": 1.67, - "learning_rate": 8.653781635202742e-07, - "loss": 0.6313, - "step": 65160 - }, - { - "epoch": 1.67, - "learning_rate": 8.653507450007119e-07, - "loss": 0.6348, - "step": 65161 - }, - { - "epoch": 1.67, - "learning_rate": 8.653233265842446e-07, - "loss": 0.7285, - "step": 65162 - }, - { - "epoch": 1.67, - "learning_rate": 8.652959082708929e-07, - "loss": 0.6797, - "step": 65163 - }, - { - "epoch": 1.67, - "learning_rate": 8.652684900606779e-07, - "loss": 0.5225, - "step": 65164 - }, - { - "epoch": 1.67, - "learning_rate": 8.652410719536207e-07, - "loss": 0.5396, - "step": 65165 - }, - { - "epoch": 1.67, - "learning_rate": 8.652136539497423e-07, - "loss": 0.7949, - "step": 65166 - }, - { - "epoch": 1.67, - "learning_rate": 8.651862360490634e-07, - "loss": 0.6836, - "step": 65167 - }, - { - "epoch": 1.67, - "learning_rate": 8.651588182516054e-07, - "loss": 0.7949, - "step": 65168 - }, - { - "epoch": 1.67, - "learning_rate": 8.651314005573894e-07, - "loss": 0.5884, - "step": 65169 - }, - { - "epoch": 1.67, - "learning_rate": 8.651039829664355e-07, - "loss": 0.6816, - "step": 65170 - }, - { - "epoch": 1.67, - "learning_rate": 8.650765654787655e-07, - "loss": 0.6299, - "step": 65171 - }, - { - "epoch": 1.67, - "learning_rate": 8.650491480944e-07, - "loss": 0.5454, - "step": 65172 - }, - { - "epoch": 1.67, - "learning_rate": 8.650217308133603e-07, - "loss": 0.6494, - "step": 65173 - }, - { - "epoch": 1.67, - "learning_rate": 8.649943136356672e-07, - "loss": 0.6953, - "step": 65174 - }, - { - "epoch": 1.67, - "learning_rate": 8.649668965613419e-07, - "loss": 0.6172, - "step": 65175 - }, - { - "epoch": 1.67, - "learning_rate": 8.649394795904051e-07, - "loss": 0.6685, - "step": 65176 - }, - { - "epoch": 1.67, - "learning_rate": 8.649120627228781e-07, - "loss": 0.6006, - "step": 65177 - }, - { - "epoch": 1.67, - "learning_rate": 8.648846459587814e-07, - "loss": 0.6562, - "step": 65178 - }, - { - "epoch": 1.67, - "learning_rate": 8.648572292981371e-07, - "loss": 0.6436, - "step": 65179 - }, - { - "epoch": 1.67, - "learning_rate": 8.648298127409646e-07, - "loss": 0.5664, - "step": 65180 - }, - { - "epoch": 1.67, - "learning_rate": 8.64802396287286e-07, - "loss": 0.6416, - "step": 65181 - }, - { - "epoch": 1.67, - "learning_rate": 8.647749799371218e-07, - "loss": 0.7295, - "step": 65182 - }, - { - "epoch": 1.67, - "learning_rate": 8.647475636904934e-07, - "loss": 0.7363, - "step": 65183 - }, - { - "epoch": 1.67, - "learning_rate": 8.647201475474213e-07, - "loss": 0.6265, - "step": 65184 - }, - { - "epoch": 1.67, - "learning_rate": 8.64692731507927e-07, - "loss": 0.7588, - "step": 65185 - }, - { - "epoch": 1.67, - "learning_rate": 8.64665315572031e-07, - "loss": 0.6455, - "step": 65186 - }, - { - "epoch": 1.67, - "learning_rate": 8.646378997397548e-07, - "loss": 0.7744, - "step": 65187 - }, - { - "epoch": 1.67, - "learning_rate": 8.646104840111191e-07, - "loss": 0.5938, - "step": 65188 - }, - { - "epoch": 1.67, - "learning_rate": 8.64583068386145e-07, - "loss": 0.6831, - "step": 65189 - }, - { - "epoch": 1.67, - "learning_rate": 8.645556528648535e-07, - "loss": 0.5388, - "step": 65190 - }, - { - "epoch": 1.67, - "learning_rate": 8.645282374472651e-07, - "loss": 0.6543, - "step": 65191 - }, - { - "epoch": 1.67, - "learning_rate": 8.645008221334016e-07, - "loss": 0.7549, - "step": 65192 - }, - { - "epoch": 1.67, - "learning_rate": 8.644734069232832e-07, - "loss": 0.6777, - "step": 65193 - }, - { - "epoch": 1.67, - "learning_rate": 8.644459918169315e-07, - "loss": 0.7578, - "step": 65194 - }, - { - "epoch": 1.67, - "learning_rate": 8.644185768143671e-07, - "loss": 0.5239, - "step": 65195 - }, - { - "epoch": 1.67, - "learning_rate": 8.643911619156114e-07, - "loss": 0.8271, - "step": 65196 - }, - { - "epoch": 1.67, - "learning_rate": 8.643637471206851e-07, - "loss": 0.7207, - "step": 65197 - }, - { - "epoch": 1.67, - "learning_rate": 8.643363324296091e-07, - "loss": 0.4932, - "step": 65198 - }, - { - "epoch": 1.67, - "learning_rate": 8.643089178424051e-07, - "loss": 0.5, - "step": 65199 - }, - { - "epoch": 1.67, - "learning_rate": 8.642815033590931e-07, - "loss": 0.6396, - "step": 65200 - }, - { - "epoch": 1.67, - "learning_rate": 8.642540889796943e-07, - "loss": 0.7061, - "step": 65201 - }, - { - "epoch": 1.67, - "learning_rate": 8.642266747042302e-07, - "loss": 0.8193, - "step": 65202 - }, - { - "epoch": 1.67, - "learning_rate": 8.641992605327211e-07, - "loss": 0.6973, - "step": 65203 - }, - { - "epoch": 1.67, - "learning_rate": 8.641718464651888e-07, - "loss": 0.4221, - "step": 65204 - }, - { - "epoch": 1.67, - "learning_rate": 8.641444325016536e-07, - "loss": 0.5898, - "step": 65205 - }, - { - "epoch": 1.67, - "learning_rate": 8.641170186421371e-07, - "loss": 0.6011, - "step": 65206 - }, - { - "epoch": 1.67, - "learning_rate": 8.640896048866595e-07, - "loss": 0.6167, - "step": 65207 - }, - { - "epoch": 1.67, - "learning_rate": 8.640621912352426e-07, - "loss": 0.6934, - "step": 65208 - }, - { - "epoch": 1.67, - "learning_rate": 8.640347776879071e-07, - "loss": 0.4792, - "step": 65209 - }, - { - "epoch": 1.67, - "learning_rate": 8.640073642446737e-07, - "loss": 0.749, - "step": 65210 - }, - { - "epoch": 1.67, - "learning_rate": 8.639799509055637e-07, - "loss": 0.7188, - "step": 65211 - }, - { - "epoch": 1.67, - "learning_rate": 8.639525376705979e-07, - "loss": 0.6855, - "step": 65212 - }, - { - "epoch": 1.67, - "learning_rate": 8.639251245397973e-07, - "loss": 0.5947, - "step": 65213 - }, - { - "epoch": 1.67, - "learning_rate": 8.63897711513183e-07, - "loss": 0.6045, - "step": 65214 - }, - { - "epoch": 1.67, - "learning_rate": 8.638702985907762e-07, - "loss": 0.5991, - "step": 65215 - }, - { - "epoch": 1.67, - "learning_rate": 8.638428857725975e-07, - "loss": 0.7754, - "step": 65216 - }, - { - "epoch": 1.67, - "learning_rate": 8.638154730586679e-07, - "loss": 0.6201, - "step": 65217 - }, - { - "epoch": 1.67, - "learning_rate": 8.637880604490089e-07, - "loss": 0.6968, - "step": 65218 - }, - { - "epoch": 1.67, - "learning_rate": 8.637606479436411e-07, - "loss": 0.7612, - "step": 65219 - }, - { - "epoch": 1.67, - "learning_rate": 8.637332355425852e-07, - "loss": 0.6118, - "step": 65220 - }, - { - "epoch": 1.67, - "learning_rate": 8.637058232458627e-07, - "loss": 0.7383, - "step": 65221 - }, - { - "epoch": 1.67, - "learning_rate": 8.636784110534942e-07, - "loss": 0.7021, - "step": 65222 - }, - { - "epoch": 1.67, - "learning_rate": 8.63650998965501e-07, - "loss": 0.71, - "step": 65223 - }, - { - "epoch": 1.67, - "learning_rate": 8.636235869819038e-07, - "loss": 0.6348, - "step": 65224 - }, - { - "epoch": 1.67, - "learning_rate": 8.635961751027239e-07, - "loss": 0.5669, - "step": 65225 - }, - { - "epoch": 1.67, - "learning_rate": 8.63568763327982e-07, - "loss": 0.7119, - "step": 65226 - }, - { - "epoch": 1.67, - "learning_rate": 8.635413516576995e-07, - "loss": 0.6523, - "step": 65227 - }, - { - "epoch": 1.67, - "learning_rate": 8.635139400918968e-07, - "loss": 0.748, - "step": 65228 - }, - { - "epoch": 1.67, - "learning_rate": 8.634865286305956e-07, - "loss": 0.6934, - "step": 65229 - }, - { - "epoch": 1.67, - "learning_rate": 8.634591172738162e-07, - "loss": 0.6367, - "step": 65230 - }, - { - "epoch": 1.67, - "learning_rate": 8.634317060215798e-07, - "loss": 0.6682, - "step": 65231 - }, - { - "epoch": 1.67, - "learning_rate": 8.634042948739078e-07, - "loss": 0.5786, - "step": 65232 - }, - { - "epoch": 1.67, - "learning_rate": 8.633768838308206e-07, - "loss": 0.4668, - "step": 65233 - }, - { - "epoch": 1.67, - "learning_rate": 8.633494728923394e-07, - "loss": 0.752, - "step": 65234 - }, - { - "epoch": 1.67, - "learning_rate": 8.633220620584853e-07, - "loss": 0.4934, - "step": 65235 - }, - { - "epoch": 1.67, - "learning_rate": 8.63294651329279e-07, - "loss": 0.5688, - "step": 65236 - }, - { - "epoch": 1.67, - "learning_rate": 8.63267240704742e-07, - "loss": 0.5431, - "step": 65237 - }, - { - "epoch": 1.67, - "learning_rate": 8.632398301848948e-07, - "loss": 0.7705, - "step": 65238 - }, - { - "epoch": 1.67, - "learning_rate": 8.63212419769759e-07, - "loss": 0.6812, - "step": 65239 - }, - { - "epoch": 1.67, - "learning_rate": 8.631850094593547e-07, - "loss": 0.6982, - "step": 65240 - }, - { - "epoch": 1.67, - "learning_rate": 8.631575992537035e-07, - "loss": 0.6572, - "step": 65241 - }, - { - "epoch": 1.67, - "learning_rate": 8.631301891528262e-07, - "loss": 0.6113, - "step": 65242 - }, - { - "epoch": 1.67, - "learning_rate": 8.631027791567438e-07, - "loss": 0.6807, - "step": 65243 - }, - { - "epoch": 1.67, - "learning_rate": 8.630753692654773e-07, - "loss": 0.6548, - "step": 65244 - }, - { - "epoch": 1.67, - "learning_rate": 8.630479594790476e-07, - "loss": 0.562, - "step": 65245 - }, - { - "epoch": 1.67, - "learning_rate": 8.63020549797476e-07, - "loss": 0.5793, - "step": 65246 - }, - { - "epoch": 1.67, - "learning_rate": 8.629931402207831e-07, - "loss": 0.5708, - "step": 65247 - }, - { - "epoch": 1.67, - "learning_rate": 8.629657307489902e-07, - "loss": 0.5752, - "step": 65248 - }, - { - "epoch": 1.67, - "learning_rate": 8.629383213821183e-07, - "loss": 0.5757, - "step": 65249 - }, - { - "epoch": 1.67, - "learning_rate": 8.629109121201881e-07, - "loss": 0.4954, - "step": 65250 - }, - { - "epoch": 1.67, - "learning_rate": 8.628835029632205e-07, - "loss": 0.6523, - "step": 65251 - }, - { - "epoch": 1.67, - "learning_rate": 8.628560939112368e-07, - "loss": 0.6333, - "step": 65252 - }, - { - "epoch": 1.67, - "learning_rate": 8.628286849642577e-07, - "loss": 0.5276, - "step": 65253 - }, - { - "epoch": 1.67, - "learning_rate": 8.628012761223047e-07, - "loss": 0.7168, - "step": 65254 - }, - { - "epoch": 1.67, - "learning_rate": 8.627738673853982e-07, - "loss": 0.748, - "step": 65255 - }, - { - "epoch": 1.67, - "learning_rate": 8.627464587535596e-07, - "loss": 0.7236, - "step": 65256 - }, - { - "epoch": 1.67, - "learning_rate": 8.627190502268095e-07, - "loss": 0.7734, - "step": 65257 - }, - { - "epoch": 1.67, - "learning_rate": 8.626916418051693e-07, - "loss": 0.5679, - "step": 65258 - }, - { - "epoch": 1.67, - "learning_rate": 8.626642334886602e-07, - "loss": 0.7119, - "step": 65259 - }, - { - "epoch": 1.67, - "learning_rate": 8.62636825277302e-07, - "loss": 0.667, - "step": 65260 - }, - { - "epoch": 1.67, - "learning_rate": 8.62609417171117e-07, - "loss": 0.6523, - "step": 65261 - }, - { - "epoch": 1.67, - "learning_rate": 8.625820091701254e-07, - "loss": 0.5962, - "step": 65262 - }, - { - "epoch": 1.67, - "learning_rate": 8.625546012743485e-07, - "loss": 0.7051, - "step": 65263 - }, - { - "epoch": 1.67, - "learning_rate": 8.625271934838071e-07, - "loss": 0.6091, - "step": 65264 - }, - { - "epoch": 1.67, - "learning_rate": 8.624997857985226e-07, - "loss": 0.6602, - "step": 65265 - }, - { - "epoch": 1.67, - "learning_rate": 8.624723782185153e-07, - "loss": 0.6533, - "step": 65266 - }, - { - "epoch": 1.67, - "learning_rate": 8.624449707438069e-07, - "loss": 0.6973, - "step": 65267 - }, - { - "epoch": 1.67, - "learning_rate": 8.624175633744179e-07, - "loss": 0.6582, - "step": 65268 - }, - { - "epoch": 1.67, - "learning_rate": 8.623901561103699e-07, - "loss": 0.561, - "step": 65269 - }, - { - "epoch": 1.67, - "learning_rate": 8.623627489516829e-07, - "loss": 0.5933, - "step": 65270 - }, - { - "epoch": 1.67, - "learning_rate": 8.623353418983788e-07, - "loss": 0.6504, - "step": 65271 - }, - { - "epoch": 1.67, - "learning_rate": 8.623079349504777e-07, - "loss": 0.5825, - "step": 65272 - }, - { - "epoch": 1.67, - "learning_rate": 8.622805281080014e-07, - "loss": 0.6533, - "step": 65273 - }, - { - "epoch": 1.67, - "learning_rate": 8.622531213709704e-07, - "loss": 0.709, - "step": 65274 - }, - { - "epoch": 1.67, - "learning_rate": 8.622257147394061e-07, - "loss": 0.6533, - "step": 65275 - }, - { - "epoch": 1.67, - "learning_rate": 8.621983082133288e-07, - "loss": 0.7188, - "step": 65276 - }, - { - "epoch": 1.67, - "learning_rate": 8.621709017927605e-07, - "loss": 0.5627, - "step": 65277 - }, - { - "epoch": 1.67, - "learning_rate": 8.621434954777212e-07, - "loss": 0.6826, - "step": 65278 - }, - { - "epoch": 1.67, - "learning_rate": 8.621160892682326e-07, - "loss": 0.5017, - "step": 65279 - }, - { - "epoch": 1.67, - "learning_rate": 8.620886831643153e-07, - "loss": 0.4847, - "step": 65280 - }, - { - "epoch": 1.67, - "learning_rate": 8.6206127716599e-07, - "loss": 0.7085, - "step": 65281 - }, - { - "epoch": 1.67, - "learning_rate": 8.620338712732785e-07, - "loss": 0.7461, - "step": 65282 - }, - { - "epoch": 1.67, - "learning_rate": 8.620064654862008e-07, - "loss": 0.521, - "step": 65283 - }, - { - "epoch": 1.67, - "learning_rate": 8.619790598047788e-07, - "loss": 0.6172, - "step": 65284 - }, - { - "epoch": 1.67, - "learning_rate": 8.619516542290329e-07, - "loss": 0.7109, - "step": 65285 - }, - { - "epoch": 1.67, - "learning_rate": 8.619242487589844e-07, - "loss": 0.7832, - "step": 65286 - }, - { - "epoch": 1.67, - "learning_rate": 8.618968433946539e-07, - "loss": 0.7979, - "step": 65287 - }, - { - "epoch": 1.67, - "learning_rate": 8.61869438136063e-07, - "loss": 0.6309, - "step": 65288 - }, - { - "epoch": 1.67, - "learning_rate": 8.618420329832323e-07, - "loss": 0.6533, - "step": 65289 - }, - { - "epoch": 1.67, - "learning_rate": 8.618146279361829e-07, - "loss": 0.6279, - "step": 65290 - }, - { - "epoch": 1.67, - "learning_rate": 8.617872229949352e-07, - "loss": 0.5122, - "step": 65291 - }, - { - "epoch": 1.67, - "learning_rate": 8.61759818159511e-07, - "loss": 0.4038, - "step": 65292 - }, - { - "epoch": 1.67, - "learning_rate": 8.617324134299307e-07, - "loss": 0.6504, - "step": 65293 - }, - { - "epoch": 1.67, - "learning_rate": 8.617050088062158e-07, - "loss": 0.4727, - "step": 65294 - }, - { - "epoch": 1.67, - "learning_rate": 8.616776042883868e-07, - "loss": 0.8057, - "step": 65295 - }, - { - "epoch": 1.67, - "learning_rate": 8.61650199876465e-07, - "loss": 0.6465, - "step": 65296 - }, - { - "epoch": 1.67, - "learning_rate": 8.616227955704712e-07, - "loss": 0.5759, - "step": 65297 - }, - { - "epoch": 1.67, - "learning_rate": 8.615953913704267e-07, - "loss": 0.7354, - "step": 65298 - }, - { - "epoch": 1.67, - "learning_rate": 8.615679872763524e-07, - "loss": 0.5568, - "step": 65299 - }, - { - "epoch": 1.67, - "learning_rate": 8.615405832882686e-07, - "loss": 0.7588, - "step": 65300 - }, - { - "epoch": 1.67, - "learning_rate": 8.615131794061972e-07, - "loss": 0.7354, - "step": 65301 - }, - { - "epoch": 1.67, - "learning_rate": 8.614857756301584e-07, - "loss": 0.7783, - "step": 65302 - }, - { - "epoch": 1.67, - "learning_rate": 8.614583719601739e-07, - "loss": 0.6035, - "step": 65303 - }, - { - "epoch": 1.67, - "learning_rate": 8.614309683962642e-07, - "loss": 0.6885, - "step": 65304 - }, - { - "epoch": 1.67, - "learning_rate": 8.614035649384506e-07, - "loss": 0.665, - "step": 65305 - }, - { - "epoch": 1.67, - "learning_rate": 8.613761615867539e-07, - "loss": 0.6147, - "step": 65306 - }, - { - "epoch": 1.67, - "learning_rate": 8.613487583411947e-07, - "loss": 0.4941, - "step": 65307 - }, - { - "epoch": 1.67, - "learning_rate": 8.613213552017951e-07, - "loss": 0.5933, - "step": 65308 - }, - { - "epoch": 1.67, - "learning_rate": 8.612939521685749e-07, - "loss": 0.5742, - "step": 65309 - }, - { - "epoch": 1.67, - "learning_rate": 8.612665492415555e-07, - "loss": 0.7861, - "step": 65310 - }, - { - "epoch": 1.67, - "learning_rate": 8.612391464207581e-07, - "loss": 0.564, - "step": 65311 - }, - { - "epoch": 1.67, - "learning_rate": 8.612117437062033e-07, - "loss": 0.6299, - "step": 65312 - }, - { - "epoch": 1.67, - "learning_rate": 8.611843410979125e-07, - "loss": 0.6465, - "step": 65313 - }, - { - "epoch": 1.67, - "learning_rate": 8.611569385959062e-07, - "loss": 0.5488, - "step": 65314 - }, - { - "epoch": 1.67, - "learning_rate": 8.611295362002059e-07, - "loss": 0.4443, - "step": 65315 - }, - { - "epoch": 1.67, - "learning_rate": 8.611021339108321e-07, - "loss": 0.4495, - "step": 65316 - }, - { - "epoch": 1.67, - "learning_rate": 8.610747317278062e-07, - "loss": 0.6211, - "step": 65317 - }, - { - "epoch": 1.67, - "learning_rate": 8.610473296511493e-07, - "loss": 0.7051, - "step": 65318 - }, - { - "epoch": 1.67, - "learning_rate": 8.610199276808816e-07, - "loss": 0.7061, - "step": 65319 - }, - { - "epoch": 1.67, - "learning_rate": 8.609925258170248e-07, - "loss": 0.5918, - "step": 65320 - }, - { - "epoch": 1.67, - "learning_rate": 8.609651240595994e-07, - "loss": 0.4585, - "step": 65321 - }, - { - "epoch": 1.67, - "learning_rate": 8.609377224086267e-07, - "loss": 0.6392, - "step": 65322 - }, - { - "epoch": 1.67, - "learning_rate": 8.609103208641277e-07, - "loss": 0.6768, - "step": 65323 - }, - { - "epoch": 1.67, - "learning_rate": 8.60882919426123e-07, - "loss": 0.6111, - "step": 65324 - }, - { - "epoch": 1.67, - "learning_rate": 8.608555180946341e-07, - "loss": 0.6221, - "step": 65325 - }, - { - "epoch": 1.67, - "learning_rate": 8.608281168696816e-07, - "loss": 0.6895, - "step": 65326 - }, - { - "epoch": 1.67, - "learning_rate": 8.608007157512867e-07, - "loss": 0.5298, - "step": 65327 - }, - { - "epoch": 1.67, - "learning_rate": 8.607733147394706e-07, - "loss": 0.6528, - "step": 65328 - }, - { - "epoch": 1.67, - "learning_rate": 8.607459138342534e-07, - "loss": 0.5713, - "step": 65329 - }, - { - "epoch": 1.67, - "learning_rate": 8.60718513035657e-07, - "loss": 0.7168, - "step": 65330 - }, - { - "epoch": 1.67, - "learning_rate": 8.606911123437017e-07, - "loss": 0.5977, - "step": 65331 - }, - { - "epoch": 1.67, - "learning_rate": 8.606637117584092e-07, - "loss": 0.3945, - "step": 65332 - }, - { - "epoch": 1.67, - "learning_rate": 8.606363112797997e-07, - "loss": 0.4766, - "step": 65333 - }, - { - "epoch": 1.67, - "learning_rate": 8.606089109078949e-07, - "loss": 0.7148, - "step": 65334 - }, - { - "epoch": 1.67, - "learning_rate": 8.605815106427152e-07, - "loss": 0.5747, - "step": 65335 - }, - { - "epoch": 1.67, - "learning_rate": 8.60554110484282e-07, - "loss": 0.7578, - "step": 65336 - }, - { - "epoch": 1.67, - "learning_rate": 8.605267104326159e-07, - "loss": 0.4846, - "step": 65337 - }, - { - "epoch": 1.67, - "learning_rate": 8.604993104877386e-07, - "loss": 0.5859, - "step": 65338 - }, - { - "epoch": 1.67, - "learning_rate": 8.604719106496703e-07, - "loss": 0.5474, - "step": 65339 - }, - { - "epoch": 1.67, - "learning_rate": 8.60444510918432e-07, - "loss": 0.7422, - "step": 65340 - }, - { - "epoch": 1.67, - "learning_rate": 8.604171112940451e-07, - "loss": 0.7119, - "step": 65341 - }, - { - "epoch": 1.67, - "learning_rate": 8.603897117765305e-07, - "loss": 0.4556, - "step": 65342 - }, - { - "epoch": 1.67, - "learning_rate": 8.603623123659088e-07, - "loss": 0.6006, - "step": 65343 - }, - { - "epoch": 1.67, - "learning_rate": 8.603349130622015e-07, - "loss": 0.5962, - "step": 65344 - }, - { - "epoch": 1.67, - "learning_rate": 8.603075138654291e-07, - "loss": 0.6353, - "step": 65345 - }, - { - "epoch": 1.67, - "learning_rate": 8.602801147756132e-07, - "loss": 0.8916, - "step": 65346 - }, - { - "epoch": 1.67, - "learning_rate": 8.60252715792774e-07, - "loss": 0.6556, - "step": 65347 - }, - { - "epoch": 1.67, - "learning_rate": 8.602253169169333e-07, - "loss": 0.5037, - "step": 65348 - }, - { - "epoch": 1.67, - "learning_rate": 8.601979181481113e-07, - "loss": 0.6631, - "step": 65349 - }, - { - "epoch": 1.67, - "learning_rate": 8.601705194863294e-07, - "loss": 0.5537, - "step": 65350 - }, - { - "epoch": 1.67, - "learning_rate": 8.601431209316084e-07, - "loss": 0.6846, - "step": 65351 - }, - { - "epoch": 1.68, - "learning_rate": 8.601157224839694e-07, - "loss": 0.6045, - "step": 65352 - }, - { - "epoch": 1.68, - "learning_rate": 8.600883241434336e-07, - "loss": 0.5967, - "step": 65353 - }, - { - "epoch": 1.68, - "learning_rate": 8.600609259100213e-07, - "loss": 0.6196, - "step": 65354 - }, - { - "epoch": 1.68, - "learning_rate": 8.600335277837543e-07, - "loss": 0.5154, - "step": 65355 - }, - { - "epoch": 1.68, - "learning_rate": 8.60006129764653e-07, - "loss": 0.5449, - "step": 65356 - }, - { - "epoch": 1.68, - "learning_rate": 8.599787318527387e-07, - "loss": 0.6411, - "step": 65357 - }, - { - "epoch": 1.68, - "learning_rate": 8.599513340480325e-07, - "loss": 0.51, - "step": 65358 - }, - { - "epoch": 1.68, - "learning_rate": 8.599239363505548e-07, - "loss": 0.5151, - "step": 65359 - }, - { - "epoch": 1.68, - "learning_rate": 8.598965387603269e-07, - "loss": 0.7236, - "step": 65360 - }, - { - "epoch": 1.68, - "learning_rate": 8.598691412773698e-07, - "loss": 0.7295, - "step": 65361 - }, - { - "epoch": 1.68, - "learning_rate": 8.598417439017044e-07, - "loss": 0.8066, - "step": 65362 - }, - { - "epoch": 1.68, - "learning_rate": 8.598143466333518e-07, - "loss": 0.6221, - "step": 65363 - }, - { - "epoch": 1.68, - "learning_rate": 8.597869494723328e-07, - "loss": 0.7002, - "step": 65364 - }, - { - "epoch": 1.68, - "learning_rate": 8.597595524186687e-07, - "loss": 0.6245, - "step": 65365 - }, - { - "epoch": 1.68, - "learning_rate": 8.5973215547238e-07, - "loss": 0.748, - "step": 65366 - }, - { - "epoch": 1.68, - "learning_rate": 8.597047586334881e-07, - "loss": 0.6409, - "step": 65367 - }, - { - "epoch": 1.68, - "learning_rate": 8.596773619020141e-07, - "loss": 0.5007, - "step": 65368 - }, - { - "epoch": 1.68, - "learning_rate": 8.596499652779783e-07, - "loss": 0.5303, - "step": 65369 - }, - { - "epoch": 1.68, - "learning_rate": 8.596225687614022e-07, - "loss": 0.7129, - "step": 65370 - }, - { - "epoch": 1.68, - "learning_rate": 8.595951723523065e-07, - "loss": 0.4945, - "step": 65371 - }, - { - "epoch": 1.68, - "learning_rate": 8.595677760507125e-07, - "loss": 0.7383, - "step": 65372 - }, - { - "epoch": 1.68, - "learning_rate": 8.595403798566408e-07, - "loss": 0.5996, - "step": 65373 - }, - { - "epoch": 1.68, - "learning_rate": 8.595129837701127e-07, - "loss": 0.7178, - "step": 65374 - }, - { - "epoch": 1.68, - "learning_rate": 8.594855877911489e-07, - "loss": 0.5396, - "step": 65375 - }, - { - "epoch": 1.68, - "learning_rate": 8.594581919197708e-07, - "loss": 0.5659, - "step": 65376 - }, - { - "epoch": 1.68, - "learning_rate": 8.594307961559988e-07, - "loss": 0.7314, - "step": 65377 - }, - { - "epoch": 1.68, - "learning_rate": 8.594034004998548e-07, - "loss": 0.9614, - "step": 65378 - }, - { - "epoch": 1.68, - "learning_rate": 8.593760049513586e-07, - "loss": 0.5249, - "step": 65379 - }, - { - "epoch": 1.68, - "learning_rate": 8.593486095105319e-07, - "loss": 0.6865, - "step": 65380 - }, - { - "epoch": 1.68, - "learning_rate": 8.593212141773952e-07, - "loss": 0.5312, - "step": 65381 - }, - { - "epoch": 1.68, - "learning_rate": 8.592938189519702e-07, - "loss": 0.6665, - "step": 65382 - }, - { - "epoch": 1.68, - "learning_rate": 8.592664238342771e-07, - "loss": 0.5269, - "step": 65383 - }, - { - "epoch": 1.68, - "learning_rate": 8.592390288243374e-07, - "loss": 0.665, - "step": 65384 - }, - { - "epoch": 1.68, - "learning_rate": 8.592116339221718e-07, - "loss": 0.6904, - "step": 65385 - }, - { - "epoch": 1.68, - "learning_rate": 8.591842391278015e-07, - "loss": 0.4327, - "step": 65386 - }, - { - "epoch": 1.68, - "learning_rate": 8.591568444412471e-07, - "loss": 0.6377, - "step": 65387 - }, - { - "epoch": 1.68, - "learning_rate": 8.591294498625304e-07, - "loss": 0.6973, - "step": 65388 - }, - { - "epoch": 1.68, - "learning_rate": 8.591020553916715e-07, - "loss": 0.5996, - "step": 65389 - }, - { - "epoch": 1.68, - "learning_rate": 8.590746610286915e-07, - "loss": 0.6611, - "step": 65390 - }, - { - "epoch": 1.68, - "learning_rate": 8.590472667736117e-07, - "loss": 0.6924, - "step": 65391 - }, - { - "epoch": 1.68, - "learning_rate": 8.590198726264528e-07, - "loss": 0.5288, - "step": 65392 - }, - { - "epoch": 1.68, - "learning_rate": 8.589924785872361e-07, - "loss": 0.6597, - "step": 65393 - }, - { - "epoch": 1.68, - "learning_rate": 8.589650846559822e-07, - "loss": 0.571, - "step": 65394 - }, - { - "epoch": 1.68, - "learning_rate": 8.589376908327123e-07, - "loss": 0.6338, - "step": 65395 - }, - { - "epoch": 1.68, - "learning_rate": 8.589102971174476e-07, - "loss": 0.6013, - "step": 65396 - }, - { - "epoch": 1.68, - "learning_rate": 8.588829035102084e-07, - "loss": 0.4756, - "step": 65397 - }, - { - "epoch": 1.68, - "learning_rate": 8.588555100110164e-07, - "loss": 0.5566, - "step": 65398 - }, - { - "epoch": 1.68, - "learning_rate": 8.588281166198921e-07, - "loss": 0.5303, - "step": 65399 - }, - { - "epoch": 1.68, - "learning_rate": 8.588007233368564e-07, - "loss": 0.4475, - "step": 65400 - }, - { - "epoch": 1.68, - "learning_rate": 8.587733301619309e-07, - "loss": 0.7129, - "step": 65401 - }, - { - "epoch": 1.68, - "learning_rate": 8.587459370951358e-07, - "loss": 0.4858, - "step": 65402 - }, - { - "epoch": 1.68, - "learning_rate": 8.587185441364927e-07, - "loss": 0.6675, - "step": 65403 - }, - { - "epoch": 1.68, - "learning_rate": 8.58691151286022e-07, - "loss": 0.5747, - "step": 65404 - }, - { - "epoch": 1.68, - "learning_rate": 8.586637585437452e-07, - "loss": 0.7744, - "step": 65405 - }, - { - "epoch": 1.68, - "learning_rate": 8.58636365909683e-07, - "loss": 0.6279, - "step": 65406 - }, - { - "epoch": 1.68, - "learning_rate": 8.586089733838567e-07, - "loss": 0.5269, - "step": 65407 - }, - { - "epoch": 1.68, - "learning_rate": 8.585815809662869e-07, - "loss": 0.5266, - "step": 65408 - }, - { - "epoch": 1.68, - "learning_rate": 8.585541886569945e-07, - "loss": 0.5752, - "step": 65409 - }, - { - "epoch": 1.68, - "learning_rate": 8.585267964560007e-07, - "loss": 0.6187, - "step": 65410 - }, - { - "epoch": 1.68, - "learning_rate": 8.584994043633265e-07, - "loss": 0.6729, - "step": 65411 - }, - { - "epoch": 1.68, - "learning_rate": 8.584720123789929e-07, - "loss": 0.5024, - "step": 65412 - }, - { - "epoch": 1.68, - "learning_rate": 8.584446205030206e-07, - "loss": 0.6924, - "step": 65413 - }, - { - "epoch": 1.68, - "learning_rate": 8.584172287354307e-07, - "loss": 0.5498, - "step": 65414 - }, - { - "epoch": 1.68, - "learning_rate": 8.583898370762444e-07, - "loss": 0.5116, - "step": 65415 - }, - { - "epoch": 1.68, - "learning_rate": 8.583624455254821e-07, - "loss": 0.627, - "step": 65416 - }, - { - "epoch": 1.68, - "learning_rate": 8.583350540831655e-07, - "loss": 0.6758, - "step": 65417 - }, - { - "epoch": 1.68, - "learning_rate": 8.583076627493156e-07, - "loss": 0.6211, - "step": 65418 - }, - { - "epoch": 1.68, - "learning_rate": 8.582802715239524e-07, - "loss": 0.6504, - "step": 65419 - }, - { - "epoch": 1.68, - "learning_rate": 8.582528804070978e-07, - "loss": 0.7959, - "step": 65420 - }, - { - "epoch": 1.68, - "learning_rate": 8.582254893987721e-07, - "loss": 0.3722, - "step": 65421 - }, - { - "epoch": 1.68, - "learning_rate": 8.581980984989969e-07, - "loss": 0.6511, - "step": 65422 - }, - { - "epoch": 1.68, - "learning_rate": 8.581707077077927e-07, - "loss": 0.5479, - "step": 65423 - }, - { - "epoch": 1.68, - "learning_rate": 8.581433170251809e-07, - "loss": 0.7783, - "step": 65424 - }, - { - "epoch": 1.68, - "learning_rate": 8.58115926451182e-07, - "loss": 0.7773, - "step": 65425 - }, - { - "epoch": 1.68, - "learning_rate": 8.580885359858174e-07, - "loss": 0.6553, - "step": 65426 - }, - { - "epoch": 1.68, - "learning_rate": 8.580611456291079e-07, - "loss": 0.8027, - "step": 65427 - }, - { - "epoch": 1.68, - "learning_rate": 8.580337553810745e-07, - "loss": 0.543, - "step": 65428 - }, - { - "epoch": 1.68, - "learning_rate": 8.580063652417382e-07, - "loss": 0.6484, - "step": 65429 - }, - { - "epoch": 1.68, - "learning_rate": 8.579789752111195e-07, - "loss": 0.6211, - "step": 65430 - }, - { - "epoch": 1.68, - "learning_rate": 8.579515852892401e-07, - "loss": 0.6846, - "step": 65431 - }, - { - "epoch": 1.68, - "learning_rate": 8.579241954761206e-07, - "loss": 0.4543, - "step": 65432 - }, - { - "epoch": 1.68, - "learning_rate": 8.578968057717818e-07, - "loss": 0.7607, - "step": 65433 - }, - { - "epoch": 1.68, - "learning_rate": 8.578694161762451e-07, - "loss": 0.6494, - "step": 65434 - }, - { - "epoch": 1.68, - "learning_rate": 8.57842026689531e-07, - "loss": 0.5728, - "step": 65435 - }, - { - "epoch": 1.68, - "learning_rate": 8.57814637311661e-07, - "loss": 0.6543, - "step": 65436 - }, - { - "epoch": 1.68, - "learning_rate": 8.577872480426556e-07, - "loss": 0.6318, - "step": 65437 - }, - { - "epoch": 1.68, - "learning_rate": 8.577598588825364e-07, - "loss": 0.5293, - "step": 65438 - }, - { - "epoch": 1.68, - "learning_rate": 8.577324698313236e-07, - "loss": 0.5244, - "step": 65439 - }, - { - "epoch": 1.68, - "learning_rate": 8.577050808890383e-07, - "loss": 0.6953, - "step": 65440 - }, - { - "epoch": 1.68, - "learning_rate": 8.57677692055702e-07, - "loss": 0.6816, - "step": 65441 - }, - { - "epoch": 1.68, - "learning_rate": 8.57650303331335e-07, - "loss": 0.7148, - "step": 65442 - }, - { - "epoch": 1.68, - "learning_rate": 8.57622914715959e-07, - "loss": 0.5825, - "step": 65443 - }, - { - "epoch": 1.68, - "learning_rate": 8.575955262095943e-07, - "loss": 0.6392, - "step": 65444 - }, - { - "epoch": 1.68, - "learning_rate": 8.575681378122623e-07, - "loss": 0.6826, - "step": 65445 - }, - { - "epoch": 1.68, - "learning_rate": 8.575407495239837e-07, - "loss": 0.4434, - "step": 65446 - }, - { - "epoch": 1.68, - "learning_rate": 8.575133613447798e-07, - "loss": 0.6025, - "step": 65447 - }, - { - "epoch": 1.68, - "learning_rate": 8.574859732746715e-07, - "loss": 0.5632, - "step": 65448 - }, - { - "epoch": 1.68, - "learning_rate": 8.574585853136795e-07, - "loss": 0.5796, - "step": 65449 - }, - { - "epoch": 1.68, - "learning_rate": 8.574311974618247e-07, - "loss": 0.5713, - "step": 65450 - }, - { - "epoch": 1.68, - "learning_rate": 8.574038097191285e-07, - "loss": 0.5786, - "step": 65451 - }, - { - "epoch": 1.68, - "learning_rate": 8.573764220856115e-07, - "loss": 0.8379, - "step": 65452 - }, - { - "epoch": 1.68, - "learning_rate": 8.573490345612948e-07, - "loss": 0.624, - "step": 65453 - }, - { - "epoch": 1.68, - "learning_rate": 8.573216471461994e-07, - "loss": 0.6504, - "step": 65454 - }, - { - "epoch": 1.68, - "learning_rate": 8.572942598403463e-07, - "loss": 0.71, - "step": 65455 - }, - { - "epoch": 1.68, - "learning_rate": 8.572668726437563e-07, - "loss": 0.6909, - "step": 65456 - }, - { - "epoch": 1.68, - "learning_rate": 8.572394855564507e-07, - "loss": 0.6982, - "step": 65457 - }, - { - "epoch": 1.68, - "learning_rate": 8.572120985784504e-07, - "loss": 0.6182, - "step": 65458 - }, - { - "epoch": 1.68, - "learning_rate": 8.571847117097759e-07, - "loss": 0.6431, - "step": 65459 - }, - { - "epoch": 1.68, - "learning_rate": 8.571573249504487e-07, - "loss": 0.4893, - "step": 65460 - }, - { - "epoch": 1.68, - "learning_rate": 8.571299383004893e-07, - "loss": 0.5732, - "step": 65461 - }, - { - "epoch": 1.68, - "learning_rate": 8.571025517599193e-07, - "loss": 0.4791, - "step": 65462 - }, - { - "epoch": 1.68, - "learning_rate": 8.570751653287589e-07, - "loss": 0.8975, - "step": 65463 - }, - { - "epoch": 1.68, - "learning_rate": 8.570477790070297e-07, - "loss": 0.6787, - "step": 65464 - }, - { - "epoch": 1.68, - "learning_rate": 8.570203927947524e-07, - "loss": 0.5728, - "step": 65465 - }, - { - "epoch": 1.68, - "learning_rate": 8.56993006691948e-07, - "loss": 0.6082, - "step": 65466 - }, - { - "epoch": 1.68, - "learning_rate": 8.569656206986376e-07, - "loss": 0.5669, - "step": 65467 - }, - { - "epoch": 1.68, - "learning_rate": 8.569382348148424e-07, - "loss": 0.6953, - "step": 65468 - }, - { - "epoch": 1.68, - "learning_rate": 8.569108490405824e-07, - "loss": 0.6489, - "step": 65469 - }, - { - "epoch": 1.68, - "learning_rate": 8.568834633758795e-07, - "loss": 0.416, - "step": 65470 - }, - { - "epoch": 1.68, - "learning_rate": 8.568560778207541e-07, - "loss": 0.7061, - "step": 65471 - }, - { - "epoch": 1.68, - "learning_rate": 8.568286923752274e-07, - "loss": 0.5879, - "step": 65472 - }, - { - "epoch": 1.68, - "learning_rate": 8.568013070393205e-07, - "loss": 0.5801, - "step": 65473 - }, - { - "epoch": 1.68, - "learning_rate": 8.567739218130544e-07, - "loss": 0.7969, - "step": 65474 - }, - { - "epoch": 1.68, - "learning_rate": 8.567465366964497e-07, - "loss": 0.5161, - "step": 65475 - }, - { - "epoch": 1.68, - "learning_rate": 8.567191516895277e-07, - "loss": 0.4927, - "step": 65476 - }, - { - "epoch": 1.68, - "learning_rate": 8.566917667923092e-07, - "loss": 0.6865, - "step": 65477 - }, - { - "epoch": 1.68, - "learning_rate": 8.566643820048156e-07, - "loss": 0.6445, - "step": 65478 - }, - { - "epoch": 1.68, - "learning_rate": 8.566369973270672e-07, - "loss": 0.6875, - "step": 65479 - }, - { - "epoch": 1.68, - "learning_rate": 8.566096127590851e-07, - "loss": 0.6353, - "step": 65480 - }, - { - "epoch": 1.68, - "learning_rate": 8.565822283008906e-07, - "loss": 0.5498, - "step": 65481 - }, - { - "epoch": 1.68, - "learning_rate": 8.565548439525043e-07, - "loss": 0.5438, - "step": 65482 - }, - { - "epoch": 1.68, - "learning_rate": 8.565274597139476e-07, - "loss": 0.5098, - "step": 65483 - }, - { - "epoch": 1.68, - "learning_rate": 8.565000755852409e-07, - "loss": 0.6582, - "step": 65484 - }, - { - "epoch": 1.68, - "learning_rate": 8.564726915664059e-07, - "loss": 0.6221, - "step": 65485 - }, - { - "epoch": 1.68, - "learning_rate": 8.56445307657463e-07, - "loss": 0.6147, - "step": 65486 - }, - { - "epoch": 1.68, - "learning_rate": 8.564179238584332e-07, - "loss": 0.5881, - "step": 65487 - }, - { - "epoch": 1.68, - "learning_rate": 8.563905401693379e-07, - "loss": 0.7588, - "step": 65488 - }, - { - "epoch": 1.68, - "learning_rate": 8.563631565901978e-07, - "loss": 0.7305, - "step": 65489 - }, - { - "epoch": 1.68, - "learning_rate": 8.563357731210334e-07, - "loss": 0.7246, - "step": 65490 - }, - { - "epoch": 1.68, - "learning_rate": 8.563083897618663e-07, - "loss": 0.5483, - "step": 65491 - }, - { - "epoch": 1.68, - "learning_rate": 8.562810065127172e-07, - "loss": 0.6714, - "step": 65492 - }, - { - "epoch": 1.68, - "learning_rate": 8.562536233736071e-07, - "loss": 0.8213, - "step": 65493 - }, - { - "epoch": 1.68, - "learning_rate": 8.562262403445571e-07, - "loss": 0.6626, - "step": 65494 - }, - { - "epoch": 1.68, - "learning_rate": 8.56198857425588e-07, - "loss": 0.6953, - "step": 65495 - }, - { - "epoch": 1.68, - "learning_rate": 8.561714746167208e-07, - "loss": 0.5601, - "step": 65496 - }, - { - "epoch": 1.68, - "learning_rate": 8.561440919179765e-07, - "loss": 0.6108, - "step": 65497 - }, - { - "epoch": 1.68, - "learning_rate": 8.561167093293764e-07, - "loss": 0.7461, - "step": 65498 - }, - { - "epoch": 1.68, - "learning_rate": 8.560893268509407e-07, - "loss": 0.7148, - "step": 65499 - }, - { - "epoch": 1.68, - "learning_rate": 8.56061944482691e-07, - "loss": 0.4834, - "step": 65500 - }, - { - "epoch": 1.68, - "learning_rate": 8.560345622246478e-07, - "loss": 0.6143, - "step": 65501 - }, - { - "epoch": 1.68, - "learning_rate": 8.560071800768325e-07, - "loss": 0.7119, - "step": 65502 - }, - { - "epoch": 1.68, - "learning_rate": 8.559797980392657e-07, - "loss": 0.623, - "step": 65503 - }, - { - "epoch": 1.68, - "learning_rate": 8.559524161119688e-07, - "loss": 0.8037, - "step": 65504 - }, - { - "epoch": 1.68, - "learning_rate": 8.559250342949624e-07, - "loss": 0.543, - "step": 65505 - }, - { - "epoch": 1.68, - "learning_rate": 8.558976525882675e-07, - "loss": 0.6289, - "step": 65506 - }, - { - "epoch": 1.68, - "learning_rate": 8.558702709919052e-07, - "loss": 0.7314, - "step": 65507 - }, - { - "epoch": 1.68, - "learning_rate": 8.558428895058967e-07, - "loss": 0.6084, - "step": 65508 - }, - { - "epoch": 1.68, - "learning_rate": 8.558155081302623e-07, - "loss": 0.6011, - "step": 65509 - }, - { - "epoch": 1.68, - "learning_rate": 8.557881268650236e-07, - "loss": 0.6862, - "step": 65510 - }, - { - "epoch": 1.68, - "learning_rate": 8.55760745710201e-07, - "loss": 0.6943, - "step": 65511 - }, - { - "epoch": 1.68, - "learning_rate": 8.557333646658158e-07, - "loss": 0.3956, - "step": 65512 - }, - { - "epoch": 1.68, - "learning_rate": 8.55705983731889e-07, - "loss": 0.6123, - "step": 65513 - }, - { - "epoch": 1.68, - "learning_rate": 8.556786029084415e-07, - "loss": 0.6821, - "step": 65514 - }, - { - "epoch": 1.68, - "learning_rate": 8.556512221954941e-07, - "loss": 0.6865, - "step": 65515 - }, - { - "epoch": 1.68, - "learning_rate": 8.556238415930682e-07, - "loss": 0.7334, - "step": 65516 - }, - { - "epoch": 1.68, - "learning_rate": 8.555964611011843e-07, - "loss": 0.6904, - "step": 65517 - }, - { - "epoch": 1.68, - "learning_rate": 8.555690807198638e-07, - "loss": 0.572, - "step": 65518 - }, - { - "epoch": 1.68, - "learning_rate": 8.555417004491274e-07, - "loss": 0.6602, - "step": 65519 - }, - { - "epoch": 1.68, - "learning_rate": 8.555143202889959e-07, - "loss": 0.6182, - "step": 65520 - }, - { - "epoch": 1.68, - "learning_rate": 8.554869402394904e-07, - "loss": 0.6714, - "step": 65521 - }, - { - "epoch": 1.68, - "learning_rate": 8.554595603006321e-07, - "loss": 0.6445, - "step": 65522 - }, - { - "epoch": 1.68, - "learning_rate": 8.554321804724415e-07, - "loss": 0.6143, - "step": 65523 - }, - { - "epoch": 1.68, - "learning_rate": 8.554048007549401e-07, - "loss": 0.6008, - "step": 65524 - }, - { - "epoch": 1.68, - "learning_rate": 8.553774211481482e-07, - "loss": 0.4453, - "step": 65525 - }, - { - "epoch": 1.68, - "learning_rate": 8.553500416520876e-07, - "loss": 0.7305, - "step": 65526 - }, - { - "epoch": 1.68, - "learning_rate": 8.553226622667784e-07, - "loss": 0.6875, - "step": 65527 - }, - { - "epoch": 1.68, - "learning_rate": 8.552952829922426e-07, - "loss": 0.7051, - "step": 65528 - }, - { - "epoch": 1.68, - "learning_rate": 8.552679038285002e-07, - "loss": 0.7412, - "step": 65529 - }, - { - "epoch": 1.68, - "learning_rate": 8.552405247755724e-07, - "loss": 0.8369, - "step": 65530 - }, - { - "epoch": 1.68, - "learning_rate": 8.552131458334803e-07, - "loss": 0.7559, - "step": 65531 - }, - { - "epoch": 1.68, - "learning_rate": 8.551857670022449e-07, - "loss": 0.6709, - "step": 65532 - }, - { - "epoch": 1.68, - "learning_rate": 8.551583882818872e-07, - "loss": 0.7305, - "step": 65533 - }, - { - "epoch": 1.68, - "learning_rate": 8.551310096724278e-07, - "loss": 0.5571, - "step": 65534 - }, - { - "epoch": 1.68, - "learning_rate": 8.551036311738882e-07, - "loss": 0.5283, - "step": 65535 - }, - { - "epoch": 1.68, - "learning_rate": 8.550762527862887e-07, - "loss": 0.5432, - "step": 65536 - }, - { - "epoch": 1.68, - "learning_rate": 8.550488745096512e-07, - "loss": 0.4685, - "step": 65537 - }, - { - "epoch": 1.68, - "learning_rate": 8.55021496343996e-07, - "loss": 0.6431, - "step": 65538 - }, - { - "epoch": 1.68, - "learning_rate": 8.549941182893441e-07, - "loss": 0.7139, - "step": 65539 - }, - { - "epoch": 1.68, - "learning_rate": 8.549667403457163e-07, - "loss": 0.5513, - "step": 65540 - }, - { - "epoch": 1.68, - "learning_rate": 8.549393625131341e-07, - "loss": 0.5947, - "step": 65541 - }, - { - "epoch": 1.68, - "learning_rate": 8.549119847916177e-07, - "loss": 0.6807, - "step": 65542 - }, - { - "epoch": 1.68, - "learning_rate": 8.54884607181189e-07, - "loss": 0.6104, - "step": 65543 - }, - { - "epoch": 1.68, - "learning_rate": 8.548572296818681e-07, - "loss": 0.5947, - "step": 65544 - }, - { - "epoch": 1.68, - "learning_rate": 8.548298522936766e-07, - "loss": 0.3641, - "step": 65545 - }, - { - "epoch": 1.68, - "learning_rate": 8.54802475016635e-07, - "loss": 0.5718, - "step": 65546 - }, - { - "epoch": 1.68, - "learning_rate": 8.547750978507647e-07, - "loss": 0.6123, - "step": 65547 - }, - { - "epoch": 1.68, - "learning_rate": 8.547477207960867e-07, - "loss": 0.7046, - "step": 65548 - }, - { - "epoch": 1.68, - "learning_rate": 8.547203438526213e-07, - "loss": 0.605, - "step": 65549 - }, - { - "epoch": 1.68, - "learning_rate": 8.546929670203899e-07, - "loss": 0.7061, - "step": 65550 - }, - { - "epoch": 1.68, - "learning_rate": 8.546655902994133e-07, - "loss": 0.4492, - "step": 65551 - }, - { - "epoch": 1.68, - "learning_rate": 8.546382136897127e-07, - "loss": 0.5557, - "step": 65552 - }, - { - "epoch": 1.68, - "learning_rate": 8.546108371913089e-07, - "loss": 0.4873, - "step": 65553 - }, - { - "epoch": 1.68, - "learning_rate": 8.545834608042229e-07, - "loss": 0.5664, - "step": 65554 - }, - { - "epoch": 1.68, - "learning_rate": 8.545560845284756e-07, - "loss": 0.5605, - "step": 65555 - }, - { - "epoch": 1.68, - "learning_rate": 8.545287083640882e-07, - "loss": 0.8115, - "step": 65556 - }, - { - "epoch": 1.68, - "learning_rate": 8.545013323110812e-07, - "loss": 0.5542, - "step": 65557 - }, - { - "epoch": 1.68, - "learning_rate": 8.544739563694765e-07, - "loss": 0.3495, - "step": 65558 - }, - { - "epoch": 1.68, - "learning_rate": 8.544465805392937e-07, - "loss": 0.6758, - "step": 65559 - }, - { - "epoch": 1.68, - "learning_rate": 8.544192048205548e-07, - "loss": 0.4863, - "step": 65560 - }, - { - "epoch": 1.68, - "learning_rate": 8.543918292132803e-07, - "loss": 0.6279, - "step": 65561 - }, - { - "epoch": 1.68, - "learning_rate": 8.543644537174913e-07, - "loss": 0.5916, - "step": 65562 - }, - { - "epoch": 1.68, - "learning_rate": 8.543370783332085e-07, - "loss": 0.387, - "step": 65563 - }, - { - "epoch": 1.68, - "learning_rate": 8.543097030604534e-07, - "loss": 0.6704, - "step": 65564 - }, - { - "epoch": 1.68, - "learning_rate": 8.542823278992465e-07, - "loss": 0.7988, - "step": 65565 - }, - { - "epoch": 1.68, - "learning_rate": 8.542549528496091e-07, - "loss": 0.5358, - "step": 65566 - }, - { - "epoch": 1.68, - "learning_rate": 8.542275779115617e-07, - "loss": 0.5364, - "step": 65567 - }, - { - "epoch": 1.68, - "learning_rate": 8.542002030851261e-07, - "loss": 0.6299, - "step": 65568 - }, - { - "epoch": 1.68, - "learning_rate": 8.541728283703223e-07, - "loss": 0.7822, - "step": 65569 - }, - { - "epoch": 1.68, - "learning_rate": 8.541454537671716e-07, - "loss": 0.6885, - "step": 65570 - }, - { - "epoch": 1.68, - "learning_rate": 8.541180792756952e-07, - "loss": 0.6216, - "step": 65571 - }, - { - "epoch": 1.68, - "learning_rate": 8.540907048959136e-07, - "loss": 0.7305, - "step": 65572 - }, - { - "epoch": 1.68, - "learning_rate": 8.540633306278484e-07, - "loss": 0.687, - "step": 65573 - }, - { - "epoch": 1.68, - "learning_rate": 8.540359564715198e-07, - "loss": 0.6689, - "step": 65574 - }, - { - "epoch": 1.68, - "learning_rate": 8.540085824269495e-07, - "loss": 0.5029, - "step": 65575 - }, - { - "epoch": 1.68, - "learning_rate": 8.53981208494158e-07, - "loss": 0.4651, - "step": 65576 - }, - { - "epoch": 1.68, - "learning_rate": 8.539538346731663e-07, - "loss": 0.6792, - "step": 65577 - }, - { - "epoch": 1.68, - "learning_rate": 8.539264609639958e-07, - "loss": 0.6035, - "step": 65578 - }, - { - "epoch": 1.68, - "learning_rate": 8.538990873666669e-07, - "loss": 0.6362, - "step": 65579 - }, - { - "epoch": 1.68, - "learning_rate": 8.538717138812004e-07, - "loss": 0.4749, - "step": 65580 - }, - { - "epoch": 1.68, - "learning_rate": 8.53844340507618e-07, - "loss": 0.5825, - "step": 65581 - }, - { - "epoch": 1.68, - "learning_rate": 8.5381696724594e-07, - "loss": 0.5264, - "step": 65582 - }, - { - "epoch": 1.68, - "learning_rate": 8.537895940961878e-07, - "loss": 0.6372, - "step": 65583 - }, - { - "epoch": 1.68, - "learning_rate": 8.537622210583819e-07, - "loss": 0.5732, - "step": 65584 - }, - { - "epoch": 1.68, - "learning_rate": 8.537348481325439e-07, - "loss": 0.5913, - "step": 65585 - }, - { - "epoch": 1.68, - "learning_rate": 8.537074753186941e-07, - "loss": 0.6738, - "step": 65586 - }, - { - "epoch": 1.68, - "learning_rate": 8.536801026168541e-07, - "loss": 0.6982, - "step": 65587 - }, - { - "epoch": 1.68, - "learning_rate": 8.536527300270446e-07, - "loss": 0.5977, - "step": 65588 - }, - { - "epoch": 1.68, - "learning_rate": 8.536253575492861e-07, - "loss": 0.7109, - "step": 65589 - }, - { - "epoch": 1.68, - "learning_rate": 8.535979851836002e-07, - "loss": 0.8467, - "step": 65590 - }, - { - "epoch": 1.68, - "learning_rate": 8.535706129300073e-07, - "loss": 0.6719, - "step": 65591 - }, - { - "epoch": 1.68, - "learning_rate": 8.535432407885289e-07, - "loss": 0.6826, - "step": 65592 - }, - { - "epoch": 1.68, - "learning_rate": 8.535158687591855e-07, - "loss": 0.6279, - "step": 65593 - }, - { - "epoch": 1.68, - "learning_rate": 8.534884968419984e-07, - "loss": 0.5757, - "step": 65594 - }, - { - "epoch": 1.68, - "learning_rate": 8.534611250369885e-07, - "loss": 0.7764, - "step": 65595 - }, - { - "epoch": 1.68, - "learning_rate": 8.534337533441765e-07, - "loss": 0.561, - "step": 65596 - }, - { - "epoch": 1.68, - "learning_rate": 8.534063817635836e-07, - "loss": 0.604, - "step": 65597 - }, - { - "epoch": 1.68, - "learning_rate": 8.533790102952309e-07, - "loss": 0.4473, - "step": 65598 - }, - { - "epoch": 1.68, - "learning_rate": 8.533516389391388e-07, - "loss": 0.7051, - "step": 65599 - }, - { - "epoch": 1.68, - "learning_rate": 8.533242676953289e-07, - "loss": 0.6455, - "step": 65600 - }, - { - "epoch": 1.68, - "learning_rate": 8.532968965638217e-07, - "loss": 0.5713, - "step": 65601 - }, - { - "epoch": 1.68, - "learning_rate": 8.532695255446383e-07, - "loss": 0.5649, - "step": 65602 - }, - { - "epoch": 1.68, - "learning_rate": 8.532421546377996e-07, - "loss": 0.6924, - "step": 65603 - }, - { - "epoch": 1.68, - "learning_rate": 8.532147838433267e-07, - "loss": 0.8027, - "step": 65604 - }, - { - "epoch": 1.68, - "learning_rate": 8.531874131612406e-07, - "loss": 0.7021, - "step": 65605 - }, - { - "epoch": 1.68, - "learning_rate": 8.531600425915621e-07, - "loss": 0.5129, - "step": 65606 - }, - { - "epoch": 1.68, - "learning_rate": 8.531326721343125e-07, - "loss": 0.5364, - "step": 65607 - }, - { - "epoch": 1.68, - "learning_rate": 8.53105301789512e-07, - "loss": 0.6992, - "step": 65608 - }, - { - "epoch": 1.68, - "learning_rate": 8.530779315571823e-07, - "loss": 0.5879, - "step": 65609 - }, - { - "epoch": 1.68, - "learning_rate": 8.530505614373438e-07, - "loss": 0.625, - "step": 65610 - }, - { - "epoch": 1.68, - "learning_rate": 8.530231914300179e-07, - "loss": 0.6357, - "step": 65611 - }, - { - "epoch": 1.68, - "learning_rate": 8.529958215352255e-07, - "loss": 0.6733, - "step": 65612 - }, - { - "epoch": 1.68, - "learning_rate": 8.529684517529871e-07, - "loss": 0.6333, - "step": 65613 - }, - { - "epoch": 1.68, - "learning_rate": 8.529410820833243e-07, - "loss": 0.5618, - "step": 65614 - }, - { - "epoch": 1.68, - "learning_rate": 8.529137125262575e-07, - "loss": 0.6436, - "step": 65615 - }, - { - "epoch": 1.68, - "learning_rate": 8.528863430818081e-07, - "loss": 0.6416, - "step": 65616 - }, - { - "epoch": 1.68, - "learning_rate": 8.528589737499971e-07, - "loss": 0.6396, - "step": 65617 - }, - { - "epoch": 1.68, - "learning_rate": 8.528316045308447e-07, - "loss": 0.7676, - "step": 65618 - }, - { - "epoch": 1.68, - "learning_rate": 8.528042354243727e-07, - "loss": 0.6899, - "step": 65619 - }, - { - "epoch": 1.68, - "learning_rate": 8.527768664306016e-07, - "loss": 0.5659, - "step": 65620 - }, - { - "epoch": 1.68, - "learning_rate": 8.527494975495526e-07, - "loss": 0.7754, - "step": 65621 - }, - { - "epoch": 1.68, - "learning_rate": 8.527221287812462e-07, - "loss": 0.5343, - "step": 65622 - }, - { - "epoch": 1.68, - "learning_rate": 8.526947601257042e-07, - "loss": 0.6855, - "step": 65623 - }, - { - "epoch": 1.68, - "learning_rate": 8.526673915829466e-07, - "loss": 0.4601, - "step": 65624 - }, - { - "epoch": 1.68, - "learning_rate": 8.526400231529951e-07, - "loss": 0.7324, - "step": 65625 - }, - { - "epoch": 1.68, - "learning_rate": 8.526126548358701e-07, - "loss": 0.7041, - "step": 65626 - }, - { - "epoch": 1.68, - "learning_rate": 8.525852866315933e-07, - "loss": 0.7217, - "step": 65627 - }, - { - "epoch": 1.68, - "learning_rate": 8.525579185401849e-07, - "loss": 0.8193, - "step": 65628 - }, - { - "epoch": 1.68, - "learning_rate": 8.525305505616661e-07, - "loss": 0.6572, - "step": 65629 - }, - { - "epoch": 1.68, - "learning_rate": 8.525031826960577e-07, - "loss": 0.6064, - "step": 65630 - }, - { - "epoch": 1.68, - "learning_rate": 8.524758149433811e-07, - "loss": 0.4502, - "step": 65631 - }, - { - "epoch": 1.68, - "learning_rate": 8.524484473036567e-07, - "loss": 0.7617, - "step": 65632 - }, - { - "epoch": 1.68, - "learning_rate": 8.52421079776906e-07, - "loss": 0.6831, - "step": 65633 - }, - { - "epoch": 1.68, - "learning_rate": 8.523937123631494e-07, - "loss": 0.5571, - "step": 65634 - }, - { - "epoch": 1.68, - "learning_rate": 8.523663450624084e-07, - "loss": 0.6543, - "step": 65635 - }, - { - "epoch": 1.68, - "learning_rate": 8.523389778747035e-07, - "loss": 0.5029, - "step": 65636 - }, - { - "epoch": 1.68, - "learning_rate": 8.523116108000563e-07, - "loss": 0.627, - "step": 65637 - }, - { - "epoch": 1.68, - "learning_rate": 8.522842438384872e-07, - "loss": 0.6348, - "step": 65638 - }, - { - "epoch": 1.68, - "learning_rate": 8.522568769900168e-07, - "loss": 0.6143, - "step": 65639 - }, - { - "epoch": 1.68, - "learning_rate": 8.522295102546668e-07, - "loss": 0.7305, - "step": 65640 - }, - { - "epoch": 1.68, - "learning_rate": 8.522021436324578e-07, - "loss": 0.7803, - "step": 65641 - }, - { - "epoch": 1.68, - "learning_rate": 8.521747771234109e-07, - "loss": 0.6895, - "step": 65642 - }, - { - "epoch": 1.68, - "learning_rate": 8.521474107275468e-07, - "loss": 0.5796, - "step": 65643 - }, - { - "epoch": 1.68, - "learning_rate": 8.521200444448869e-07, - "loss": 0.4736, - "step": 65644 - }, - { - "epoch": 1.68, - "learning_rate": 8.520926782754516e-07, - "loss": 0.5659, - "step": 65645 - }, - { - "epoch": 1.68, - "learning_rate": 8.520653122192624e-07, - "loss": 0.6426, - "step": 65646 - }, - { - "epoch": 1.68, - "learning_rate": 8.520379462763402e-07, - "loss": 0.5715, - "step": 65647 - }, - { - "epoch": 1.68, - "learning_rate": 8.520105804467055e-07, - "loss": 0.5625, - "step": 65648 - }, - { - "epoch": 1.68, - "learning_rate": 8.519832147303793e-07, - "loss": 0.7227, - "step": 65649 - }, - { - "epoch": 1.68, - "learning_rate": 8.519558491273829e-07, - "loss": 0.6523, - "step": 65650 - }, - { - "epoch": 1.68, - "learning_rate": 8.51928483637737e-07, - "loss": 0.6392, - "step": 65651 - }, - { - "epoch": 1.68, - "learning_rate": 8.519011182614627e-07, - "loss": 0.667, - "step": 65652 - }, - { - "epoch": 1.68, - "learning_rate": 8.518737529985808e-07, - "loss": 0.6299, - "step": 65653 - }, - { - "epoch": 1.68, - "learning_rate": 8.518463878491126e-07, - "loss": 0.6396, - "step": 65654 - }, - { - "epoch": 1.68, - "learning_rate": 8.518190228130785e-07, - "loss": 0.748, - "step": 65655 - }, - { - "epoch": 1.68, - "learning_rate": 8.517916578905e-07, - "loss": 0.708, - "step": 65656 - }, - { - "epoch": 1.68, - "learning_rate": 8.517642930813981e-07, - "loss": 0.6792, - "step": 65657 - }, - { - "epoch": 1.68, - "learning_rate": 8.51736928385793e-07, - "loss": 0.502, - "step": 65658 - }, - { - "epoch": 1.68, - "learning_rate": 8.517095638037063e-07, - "loss": 0.7568, - "step": 65659 - }, - { - "epoch": 1.68, - "learning_rate": 8.516821993351586e-07, - "loss": 0.7358, - "step": 65660 - }, - { - "epoch": 1.68, - "learning_rate": 8.516548349801711e-07, - "loss": 0.6797, - "step": 65661 - }, - { - "epoch": 1.68, - "learning_rate": 8.516274707387646e-07, - "loss": 0.6123, - "step": 65662 - }, - { - "epoch": 1.68, - "learning_rate": 8.516001066109604e-07, - "loss": 0.8477, - "step": 65663 - }, - { - "epoch": 1.68, - "learning_rate": 8.515727425967788e-07, - "loss": 0.5391, - "step": 65664 - }, - { - "epoch": 1.68, - "learning_rate": 8.515453786962415e-07, - "loss": 0.8867, - "step": 65665 - }, - { - "epoch": 1.68, - "learning_rate": 8.515180149093686e-07, - "loss": 0.5217, - "step": 65666 - }, - { - "epoch": 1.68, - "learning_rate": 8.514906512361823e-07, - "loss": 0.8174, - "step": 65667 - }, - { - "epoch": 1.68, - "learning_rate": 8.514632876767023e-07, - "loss": 0.5137, - "step": 65668 - }, - { - "epoch": 1.68, - "learning_rate": 8.514359242309501e-07, - "loss": 0.665, - "step": 65669 - }, - { - "epoch": 1.68, - "learning_rate": 8.514085608989463e-07, - "loss": 0.7578, - "step": 65670 - }, - { - "epoch": 1.68, - "learning_rate": 8.513811976807125e-07, - "loss": 0.6357, - "step": 65671 - }, - { - "epoch": 1.68, - "learning_rate": 8.51353834576269e-07, - "loss": 0.686, - "step": 65672 - }, - { - "epoch": 1.68, - "learning_rate": 8.513264715856372e-07, - "loss": 0.7549, - "step": 65673 - }, - { - "epoch": 1.68, - "learning_rate": 8.512991087088377e-07, - "loss": 0.6445, - "step": 65674 - }, - { - "epoch": 1.68, - "learning_rate": 8.512717459458919e-07, - "loss": 0.5786, - "step": 65675 - }, - { - "epoch": 1.68, - "learning_rate": 8.512443832968202e-07, - "loss": 0.6152, - "step": 65676 - }, - { - "epoch": 1.68, - "learning_rate": 8.512170207616444e-07, - "loss": 0.7627, - "step": 65677 - }, - { - "epoch": 1.68, - "learning_rate": 8.511896583403846e-07, - "loss": 0.5471, - "step": 65678 - }, - { - "epoch": 1.68, - "learning_rate": 8.511622960330617e-07, - "loss": 0.6943, - "step": 65679 - }, - { - "epoch": 1.68, - "learning_rate": 8.511349338396974e-07, - "loss": 0.6348, - "step": 65680 - }, - { - "epoch": 1.68, - "learning_rate": 8.511075717603117e-07, - "loss": 0.7188, - "step": 65681 - }, - { - "epoch": 1.68, - "learning_rate": 8.510802097949266e-07, - "loss": 0.6738, - "step": 65682 - }, - { - "epoch": 1.68, - "learning_rate": 8.510528479435623e-07, - "loss": 0.7314, - "step": 65683 - }, - { - "epoch": 1.68, - "learning_rate": 8.510254862062401e-07, - "loss": 0.5681, - "step": 65684 - }, - { - "epoch": 1.68, - "learning_rate": 8.50998124582981e-07, - "loss": 0.5032, - "step": 65685 - }, - { - "epoch": 1.68, - "learning_rate": 8.509707630738053e-07, - "loss": 0.793, - "step": 65686 - }, - { - "epoch": 1.68, - "learning_rate": 8.509434016787351e-07, - "loss": 0.7231, - "step": 65687 - }, - { - "epoch": 1.68, - "learning_rate": 8.509160403977904e-07, - "loss": 0.6035, - "step": 65688 - }, - { - "epoch": 1.68, - "learning_rate": 8.508886792309921e-07, - "loss": 0.6367, - "step": 65689 - }, - { - "epoch": 1.68, - "learning_rate": 8.508613181783618e-07, - "loss": 0.7822, - "step": 65690 - }, - { - "epoch": 1.68, - "learning_rate": 8.508339572399199e-07, - "loss": 0.8281, - "step": 65691 - }, - { - "epoch": 1.68, - "learning_rate": 8.508065964156878e-07, - "loss": 0.6826, - "step": 65692 - }, - { - "epoch": 1.68, - "learning_rate": 8.507792357056862e-07, - "loss": 0.7715, - "step": 65693 - }, - { - "epoch": 1.68, - "learning_rate": 8.50751875109936e-07, - "loss": 0.5767, - "step": 65694 - }, - { - "epoch": 1.68, - "learning_rate": 8.507245146284581e-07, - "loss": 0.4414, - "step": 65695 - }, - { - "epoch": 1.68, - "learning_rate": 8.506971542612738e-07, - "loss": 0.6846, - "step": 65696 - }, - { - "epoch": 1.68, - "learning_rate": 8.506697940084041e-07, - "loss": 0.5933, - "step": 65697 - }, - { - "epoch": 1.68, - "learning_rate": 8.506424338698692e-07, - "loss": 0.6855, - "step": 65698 - }, - { - "epoch": 1.68, - "learning_rate": 8.506150738456907e-07, - "loss": 0.5044, - "step": 65699 - }, - { - "epoch": 1.68, - "learning_rate": 8.505877139358892e-07, - "loss": 0.5564, - "step": 65700 - }, - { - "epoch": 1.68, - "learning_rate": 8.50560354140486e-07, - "loss": 0.6382, - "step": 65701 - }, - { - "epoch": 1.68, - "learning_rate": 8.505329944595019e-07, - "loss": 0.7695, - "step": 65702 - }, - { - "epoch": 1.68, - "learning_rate": 8.505056348929575e-07, - "loss": 0.6475, - "step": 65703 - }, - { - "epoch": 1.68, - "learning_rate": 8.504782754408743e-07, - "loss": 0.7002, - "step": 65704 - }, - { - "epoch": 1.68, - "learning_rate": 8.504509161032729e-07, - "loss": 0.6143, - "step": 65705 - }, - { - "epoch": 1.68, - "learning_rate": 8.504235568801745e-07, - "loss": 0.6655, - "step": 65706 - }, - { - "epoch": 1.68, - "learning_rate": 8.503961977716002e-07, - "loss": 0.9082, - "step": 65707 - }, - { - "epoch": 1.68, - "learning_rate": 8.503688387775703e-07, - "loss": 0.7812, - "step": 65708 - }, - { - "epoch": 1.68, - "learning_rate": 8.503414798981061e-07, - "loss": 0.6719, - "step": 65709 - }, - { - "epoch": 1.68, - "learning_rate": 8.503141211332285e-07, - "loss": 0.3951, - "step": 65710 - }, - { - "epoch": 1.68, - "learning_rate": 8.502867624829585e-07, - "loss": 0.6562, - "step": 65711 - }, - { - "epoch": 1.68, - "learning_rate": 8.50259403947317e-07, - "loss": 0.917, - "step": 65712 - }, - { - "epoch": 1.68, - "learning_rate": 8.502320455263251e-07, - "loss": 0.6733, - "step": 65713 - }, - { - "epoch": 1.68, - "learning_rate": 8.502046872200035e-07, - "loss": 0.6543, - "step": 65714 - }, - { - "epoch": 1.68, - "learning_rate": 8.501773290283734e-07, - "loss": 0.6597, - "step": 65715 - }, - { - "epoch": 1.68, - "learning_rate": 8.501499709514556e-07, - "loss": 0.5615, - "step": 65716 - }, - { - "epoch": 1.68, - "learning_rate": 8.501226129892714e-07, - "loss": 0.6213, - "step": 65717 - }, - { - "epoch": 1.68, - "learning_rate": 8.500952551418412e-07, - "loss": 0.5127, - "step": 65718 - }, - { - "epoch": 1.68, - "learning_rate": 8.500678974091862e-07, - "loss": 0.501, - "step": 65719 - }, - { - "epoch": 1.68, - "learning_rate": 8.500405397913271e-07, - "loss": 0.6943, - "step": 65720 - }, - { - "epoch": 1.68, - "learning_rate": 8.500131822882852e-07, - "loss": 0.5752, - "step": 65721 - }, - { - "epoch": 1.68, - "learning_rate": 8.499858249000811e-07, - "loss": 0.6191, - "step": 65722 - }, - { - "epoch": 1.68, - "learning_rate": 8.499584676267362e-07, - "loss": 0.6233, - "step": 65723 - }, - { - "epoch": 1.68, - "learning_rate": 8.49931110468271e-07, - "loss": 0.9092, - "step": 65724 - }, - { - "epoch": 1.68, - "learning_rate": 8.499037534247068e-07, - "loss": 0.6777, - "step": 65725 - }, - { - "epoch": 1.68, - "learning_rate": 8.498763964960644e-07, - "loss": 0.7246, - "step": 65726 - }, - { - "epoch": 1.68, - "learning_rate": 8.49849039682365e-07, - "loss": 0.645, - "step": 65727 - }, - { - "epoch": 1.68, - "learning_rate": 8.498216829836291e-07, - "loss": 0.5859, - "step": 65728 - }, - { - "epoch": 1.68, - "learning_rate": 8.497943263998775e-07, - "loss": 0.5981, - "step": 65729 - }, - { - "epoch": 1.68, - "learning_rate": 8.497669699311318e-07, - "loss": 0.6299, - "step": 65730 - }, - { - "epoch": 1.68, - "learning_rate": 8.497396135774125e-07, - "loss": 0.687, - "step": 65731 - }, - { - "epoch": 1.68, - "learning_rate": 8.497122573387407e-07, - "loss": 0.6606, - "step": 65732 - }, - { - "epoch": 1.68, - "learning_rate": 8.496849012151372e-07, - "loss": 0.5479, - "step": 65733 - }, - { - "epoch": 1.68, - "learning_rate": 8.496575452066234e-07, - "loss": 0.7656, - "step": 65734 - }, - { - "epoch": 1.68, - "learning_rate": 8.496301893132195e-07, - "loss": 0.3424, - "step": 65735 - }, - { - "epoch": 1.68, - "learning_rate": 8.496028335349471e-07, - "loss": 0.6836, - "step": 65736 - }, - { - "epoch": 1.68, - "learning_rate": 8.495754778718272e-07, - "loss": 0.5796, - "step": 65737 - }, - { - "epoch": 1.68, - "learning_rate": 8.4954812232388e-07, - "loss": 0.8076, - "step": 65738 - }, - { - "epoch": 1.68, - "learning_rate": 8.49520766891127e-07, - "loss": 0.5713, - "step": 65739 - }, - { - "epoch": 1.68, - "learning_rate": 8.49493411573589e-07, - "loss": 0.6582, - "step": 65740 - }, - { - "epoch": 1.68, - "learning_rate": 8.494660563712869e-07, - "loss": 0.6177, - "step": 65741 - }, - { - "epoch": 1.69, - "learning_rate": 8.494387012842418e-07, - "loss": 0.7397, - "step": 65742 - }, - { - "epoch": 1.69, - "learning_rate": 8.494113463124743e-07, - "loss": 0.4883, - "step": 65743 - }, - { - "epoch": 1.69, - "learning_rate": 8.49383991456006e-07, - "loss": 0.6221, - "step": 65744 - }, - { - "epoch": 1.69, - "learning_rate": 8.493566367148573e-07, - "loss": 0.6016, - "step": 65745 - }, - { - "epoch": 1.69, - "learning_rate": 8.493292820890493e-07, - "loss": 0.6245, - "step": 65746 - }, - { - "epoch": 1.69, - "learning_rate": 8.493019275786033e-07, - "loss": 0.7891, - "step": 65747 - }, - { - "epoch": 1.69, - "learning_rate": 8.492745731835394e-07, - "loss": 0.5923, - "step": 65748 - }, - { - "epoch": 1.69, - "learning_rate": 8.492472189038792e-07, - "loss": 0.6826, - "step": 65749 - }, - { - "epoch": 1.69, - "learning_rate": 8.492198647396433e-07, - "loss": 0.6387, - "step": 65750 - }, - { - "epoch": 1.69, - "learning_rate": 8.491925106908531e-07, - "loss": 0.7275, - "step": 65751 - }, - { - "epoch": 1.69, - "learning_rate": 8.491651567575289e-07, - "loss": 0.832, - "step": 65752 - }, - { - "epoch": 1.69, - "learning_rate": 8.491378029396923e-07, - "loss": 0.3721, - "step": 65753 - }, - { - "epoch": 1.69, - "learning_rate": 8.491104492373638e-07, - "loss": 0.7461, - "step": 65754 - }, - { - "epoch": 1.69, - "learning_rate": 8.490830956505645e-07, - "loss": 0.6357, - "step": 65755 - }, - { - "epoch": 1.69, - "learning_rate": 8.490557421793153e-07, - "loss": 0.6133, - "step": 65756 - }, - { - "epoch": 1.69, - "learning_rate": 8.490283888236378e-07, - "loss": 0.5947, - "step": 65757 - }, - { - "epoch": 1.69, - "learning_rate": 8.490010355835516e-07, - "loss": 0.5068, - "step": 65758 - }, - { - "epoch": 1.69, - "learning_rate": 8.489736824590786e-07, - "loss": 0.6885, - "step": 65759 - }, - { - "epoch": 1.69, - "learning_rate": 8.489463294502394e-07, - "loss": 0.8184, - "step": 65760 - }, - { - "epoch": 1.69, - "learning_rate": 8.489189765570551e-07, - "loss": 0.707, - "step": 65761 - }, - { - "epoch": 1.69, - "learning_rate": 8.488916237795465e-07, - "loss": 0.8125, - "step": 65762 - }, - { - "epoch": 1.69, - "learning_rate": 8.488642711177347e-07, - "loss": 0.5701, - "step": 65763 - }, - { - "epoch": 1.69, - "learning_rate": 8.488369185716405e-07, - "loss": 0.5371, - "step": 65764 - }, - { - "epoch": 1.69, - "learning_rate": 8.488095661412852e-07, - "loss": 0.7168, - "step": 65765 - }, - { - "epoch": 1.69, - "learning_rate": 8.487822138266891e-07, - "loss": 0.6265, - "step": 65766 - }, - { - "epoch": 1.69, - "learning_rate": 8.487548616278741e-07, - "loss": 0.46, - "step": 65767 - }, - { - "epoch": 1.69, - "learning_rate": 8.487275095448602e-07, - "loss": 0.5259, - "step": 65768 - }, - { - "epoch": 1.69, - "learning_rate": 8.487001575776685e-07, - "loss": 0.8232, - "step": 65769 - }, - { - "epoch": 1.69, - "learning_rate": 8.486728057263203e-07, - "loss": 0.6543, - "step": 65770 - }, - { - "epoch": 1.69, - "learning_rate": 8.486454539908362e-07, - "loss": 0.6768, - "step": 65771 - }, - { - "epoch": 1.69, - "learning_rate": 8.486181023712375e-07, - "loss": 0.5343, - "step": 65772 - }, - { - "epoch": 1.69, - "learning_rate": 8.485907508675448e-07, - "loss": 0.6372, - "step": 65773 - }, - { - "epoch": 1.69, - "learning_rate": 8.485633994797794e-07, - "loss": 0.8125, - "step": 65774 - }, - { - "epoch": 1.69, - "learning_rate": 8.485360482079621e-07, - "loss": 0.6606, - "step": 65775 - }, - { - "epoch": 1.69, - "learning_rate": 8.485086970521135e-07, - "loss": 0.5942, - "step": 65776 - }, - { - "epoch": 1.69, - "learning_rate": 8.484813460122553e-07, - "loss": 0.4692, - "step": 65777 - }, - { - "epoch": 1.69, - "learning_rate": 8.484539950884077e-07, - "loss": 0.6426, - "step": 65778 - }, - { - "epoch": 1.69, - "learning_rate": 8.484266442805916e-07, - "loss": 0.6533, - "step": 65779 - }, - { - "epoch": 1.69, - "learning_rate": 8.483992935888287e-07, - "loss": 0.5964, - "step": 65780 - }, - { - "epoch": 1.69, - "learning_rate": 8.48371943013139e-07, - "loss": 0.5068, - "step": 65781 - }, - { - "epoch": 1.69, - "learning_rate": 8.483445925535444e-07, - "loss": 0.6855, - "step": 65782 - }, - { - "epoch": 1.69, - "learning_rate": 8.483172422100651e-07, - "loss": 0.5957, - "step": 65783 - }, - { - "epoch": 1.69, - "learning_rate": 8.482898919827224e-07, - "loss": 0.4897, - "step": 65784 - }, - { - "epoch": 1.69, - "learning_rate": 8.48262541871537e-07, - "loss": 0.7129, - "step": 65785 - }, - { - "epoch": 1.69, - "learning_rate": 8.482351918765303e-07, - "loss": 0.457, - "step": 65786 - }, - { - "epoch": 1.69, - "learning_rate": 8.48207841997723e-07, - "loss": 0.6646, - "step": 65787 - }, - { - "epoch": 1.69, - "learning_rate": 8.481804922351357e-07, - "loss": 0.7295, - "step": 65788 - }, - { - "epoch": 1.69, - "learning_rate": 8.481531425887898e-07, - "loss": 0.6733, - "step": 65789 - }, - { - "epoch": 1.69, - "learning_rate": 8.481257930587058e-07, - "loss": 0.6631, - "step": 65790 - }, - { - "epoch": 1.69, - "learning_rate": 8.48098443644905e-07, - "loss": 0.7627, - "step": 65791 - }, - { - "epoch": 1.69, - "learning_rate": 8.480710943474084e-07, - "loss": 0.6816, - "step": 65792 - }, - { - "epoch": 1.69, - "learning_rate": 8.480437451662365e-07, - "loss": 0.7012, - "step": 65793 - }, - { - "epoch": 1.69, - "learning_rate": 8.480163961014108e-07, - "loss": 0.7454, - "step": 65794 - }, - { - "epoch": 1.69, - "learning_rate": 8.479890471529516e-07, - "loss": 0.7319, - "step": 65795 - }, - { - "epoch": 1.69, - "learning_rate": 8.479616983208805e-07, - "loss": 0.4592, - "step": 65796 - }, - { - "epoch": 1.69, - "learning_rate": 8.479343496052183e-07, - "loss": 0.5879, - "step": 65797 - }, - { - "epoch": 1.69, - "learning_rate": 8.479070010059854e-07, - "loss": 0.7861, - "step": 65798 - }, - { - "epoch": 1.69, - "learning_rate": 8.478796525232034e-07, - "loss": 0.7061, - "step": 65799 - }, - { - "epoch": 1.69, - "learning_rate": 8.478523041568926e-07, - "loss": 0.6807, - "step": 65800 - }, - { - "epoch": 1.69, - "learning_rate": 8.478249559070746e-07, - "loss": 0.6729, - "step": 65801 - }, - { - "epoch": 1.69, - "learning_rate": 8.477976077737698e-07, - "loss": 0.6299, - "step": 65802 - }, - { - "epoch": 1.69, - "learning_rate": 8.477702597569996e-07, - "loss": 0.7627, - "step": 65803 - }, - { - "epoch": 1.69, - "learning_rate": 8.477429118567845e-07, - "loss": 0.6201, - "step": 65804 - }, - { - "epoch": 1.69, - "learning_rate": 8.477155640731458e-07, - "loss": 0.5421, - "step": 65805 - }, - { - "epoch": 1.69, - "learning_rate": 8.476882164061041e-07, - "loss": 0.6455, - "step": 65806 - }, - { - "epoch": 1.69, - "learning_rate": 8.47660868855681e-07, - "loss": 0.7451, - "step": 65807 - }, - { - "epoch": 1.69, - "learning_rate": 8.476335214218967e-07, - "loss": 0.6064, - "step": 65808 - }, - { - "epoch": 1.69, - "learning_rate": 8.476061741047725e-07, - "loss": 0.71, - "step": 65809 - }, - { - "epoch": 1.69, - "learning_rate": 8.475788269043289e-07, - "loss": 0.6836, - "step": 65810 - }, - { - "epoch": 1.69, - "learning_rate": 8.475514798205875e-07, - "loss": 0.5649, - "step": 65811 - }, - { - "epoch": 1.69, - "learning_rate": 8.475241328535687e-07, - "loss": 0.6572, - "step": 65812 - }, - { - "epoch": 1.69, - "learning_rate": 8.474967860032938e-07, - "loss": 0.8047, - "step": 65813 - }, - { - "epoch": 1.69, - "learning_rate": 8.474694392697834e-07, - "loss": 0.5486, - "step": 65814 - }, - { - "epoch": 1.69, - "learning_rate": 8.47442092653059e-07, - "loss": 0.8057, - "step": 65815 - }, - { - "epoch": 1.69, - "learning_rate": 8.474147461531408e-07, - "loss": 0.7227, - "step": 65816 - }, - { - "epoch": 1.69, - "learning_rate": 8.473873997700506e-07, - "loss": 0.6875, - "step": 65817 - }, - { - "epoch": 1.69, - "learning_rate": 8.473600535038086e-07, - "loss": 0.562, - "step": 65818 - }, - { - "epoch": 1.69, - "learning_rate": 8.473327073544358e-07, - "loss": 0.48, - "step": 65819 - }, - { - "epoch": 1.69, - "learning_rate": 8.473053613219535e-07, - "loss": 0.8115, - "step": 65820 - }, - { - "epoch": 1.69, - "learning_rate": 8.472780154063824e-07, - "loss": 0.6079, - "step": 65821 - }, - { - "epoch": 1.69, - "learning_rate": 8.472506696077435e-07, - "loss": 0.7256, - "step": 65822 - }, - { - "epoch": 1.69, - "learning_rate": 8.472233239260576e-07, - "loss": 0.3335, - "step": 65823 - }, - { - "epoch": 1.69, - "learning_rate": 8.471959783613461e-07, - "loss": 0.7129, - "step": 65824 - }, - { - "epoch": 1.69, - "learning_rate": 8.471686329136293e-07, - "loss": 0.7266, - "step": 65825 - }, - { - "epoch": 1.69, - "learning_rate": 8.471412875829287e-07, - "loss": 0.7212, - "step": 65826 - }, - { - "epoch": 1.69, - "learning_rate": 8.471139423692652e-07, - "loss": 0.6304, - "step": 65827 - }, - { - "epoch": 1.69, - "learning_rate": 8.470865972726593e-07, - "loss": 0.7144, - "step": 65828 - }, - { - "epoch": 1.69, - "learning_rate": 8.47059252293132e-07, - "loss": 0.8047, - "step": 65829 - }, - { - "epoch": 1.69, - "learning_rate": 8.470319074307044e-07, - "loss": 0.6807, - "step": 65830 - }, - { - "epoch": 1.69, - "learning_rate": 8.470045626853974e-07, - "loss": 0.5903, - "step": 65831 - }, - { - "epoch": 1.69, - "learning_rate": 8.469772180572322e-07, - "loss": 0.6826, - "step": 65832 - }, - { - "epoch": 1.69, - "learning_rate": 8.469498735462293e-07, - "loss": 0.7783, - "step": 65833 - }, - { - "epoch": 1.69, - "learning_rate": 8.469225291524099e-07, - "loss": 0.6826, - "step": 65834 - }, - { - "epoch": 1.69, - "learning_rate": 8.468951848757948e-07, - "loss": 0.7026, - "step": 65835 - }, - { - "epoch": 1.69, - "learning_rate": 8.468678407164052e-07, - "loss": 0.6343, - "step": 65836 - }, - { - "epoch": 1.69, - "learning_rate": 8.468404966742622e-07, - "loss": 0.5322, - "step": 65837 - }, - { - "epoch": 1.69, - "learning_rate": 8.468131527493858e-07, - "loss": 0.7344, - "step": 65838 - }, - { - "epoch": 1.69, - "learning_rate": 8.467858089417978e-07, - "loss": 0.5209, - "step": 65839 - }, - { - "epoch": 1.69, - "learning_rate": 8.467584652515185e-07, - "loss": 0.6013, - "step": 65840 - }, - { - "epoch": 1.69, - "learning_rate": 8.467311216785695e-07, - "loss": 0.6602, - "step": 65841 - }, - { - "epoch": 1.69, - "learning_rate": 8.467037782229714e-07, - "loss": 0.5405, - "step": 65842 - }, - { - "epoch": 1.69, - "learning_rate": 8.466764348847451e-07, - "loss": 0.8154, - "step": 65843 - }, - { - "epoch": 1.69, - "learning_rate": 8.466490916639116e-07, - "loss": 0.6768, - "step": 65844 - }, - { - "epoch": 1.69, - "learning_rate": 8.46621748560492e-07, - "loss": 0.7129, - "step": 65845 - }, - { - "epoch": 1.69, - "learning_rate": 8.465944055745068e-07, - "loss": 0.7412, - "step": 65846 - }, - { - "epoch": 1.69, - "learning_rate": 8.465670627059778e-07, - "loss": 0.4684, - "step": 65847 - }, - { - "epoch": 1.69, - "learning_rate": 8.465397199549249e-07, - "loss": 0.5708, - "step": 65848 - }, - { - "epoch": 1.69, - "learning_rate": 8.465123773213696e-07, - "loss": 0.519, - "step": 65849 - }, - { - "epoch": 1.69, - "learning_rate": 8.464850348053326e-07, - "loss": 0.7178, - "step": 65850 - }, - { - "epoch": 1.69, - "learning_rate": 8.464576924068349e-07, - "loss": 0.7012, - "step": 65851 - }, - { - "epoch": 1.69, - "learning_rate": 8.464303501258975e-07, - "loss": 0.5361, - "step": 65852 - }, - { - "epoch": 1.69, - "learning_rate": 8.464030079625414e-07, - "loss": 0.5293, - "step": 65853 - }, - { - "epoch": 1.69, - "learning_rate": 8.463756659167874e-07, - "loss": 0.7793, - "step": 65854 - }, - { - "epoch": 1.69, - "learning_rate": 8.463483239886565e-07, - "loss": 0.5889, - "step": 65855 - }, - { - "epoch": 1.69, - "learning_rate": 8.463209821781695e-07, - "loss": 0.6807, - "step": 65856 - }, - { - "epoch": 1.69, - "learning_rate": 8.462936404853479e-07, - "loss": 0.6089, - "step": 65857 - }, - { - "epoch": 1.69, - "learning_rate": 8.462662989102121e-07, - "loss": 0.5347, - "step": 65858 - }, - { - "epoch": 1.69, - "learning_rate": 8.462389574527826e-07, - "loss": 0.7021, - "step": 65859 - }, - { - "epoch": 1.69, - "learning_rate": 8.462116161130814e-07, - "loss": 0.688, - "step": 65860 - }, - { - "epoch": 1.69, - "learning_rate": 8.461842748911285e-07, - "loss": 0.6167, - "step": 65861 - }, - { - "epoch": 1.69, - "learning_rate": 8.461569337869454e-07, - "loss": 0.8242, - "step": 65862 - }, - { - "epoch": 1.69, - "learning_rate": 8.461295928005528e-07, - "loss": 0.6328, - "step": 65863 - }, - { - "epoch": 1.69, - "learning_rate": 8.461022519319719e-07, - "loss": 0.6709, - "step": 65864 - }, - { - "epoch": 1.69, - "learning_rate": 8.460749111812233e-07, - "loss": 0.6533, - "step": 65865 - }, - { - "epoch": 1.69, - "learning_rate": 8.460475705483278e-07, - "loss": 0.6709, - "step": 65866 - }, - { - "epoch": 1.69, - "learning_rate": 8.460202300333073e-07, - "loss": 0.4055, - "step": 65867 - }, - { - "epoch": 1.69, - "learning_rate": 8.459928896361816e-07, - "loss": 0.4274, - "step": 65868 - }, - { - "epoch": 1.69, - "learning_rate": 8.45965549356972e-07, - "loss": 0.5371, - "step": 65869 - }, - { - "epoch": 1.69, - "learning_rate": 8.459382091956996e-07, - "loss": 0.533, - "step": 65870 - }, - { - "epoch": 1.69, - "learning_rate": 8.45910869152385e-07, - "loss": 0.5486, - "step": 65871 - }, - { - "epoch": 1.69, - "learning_rate": 8.458835292270496e-07, - "loss": 0.6455, - "step": 65872 - }, - { - "epoch": 1.69, - "learning_rate": 8.458561894197138e-07, - "loss": 0.7168, - "step": 65873 - }, - { - "epoch": 1.69, - "learning_rate": 8.458288497303992e-07, - "loss": 0.6631, - "step": 65874 - }, - { - "epoch": 1.69, - "learning_rate": 8.45801510159126e-07, - "loss": 0.5669, - "step": 65875 - }, - { - "epoch": 1.69, - "learning_rate": 8.457741707059158e-07, - "loss": 0.7261, - "step": 65876 - }, - { - "epoch": 1.69, - "learning_rate": 8.457468313707895e-07, - "loss": 0.4729, - "step": 65877 - }, - { - "epoch": 1.69, - "learning_rate": 8.457194921537673e-07, - "loss": 0.6562, - "step": 65878 - }, - { - "epoch": 1.69, - "learning_rate": 8.456921530548707e-07, - "loss": 0.6934, - "step": 65879 - }, - { - "epoch": 1.69, - "learning_rate": 8.456648140741204e-07, - "loss": 0.4998, - "step": 65880 - }, - { - "epoch": 1.69, - "learning_rate": 8.456374752115376e-07, - "loss": 0.7197, - "step": 65881 - }, - { - "epoch": 1.69, - "learning_rate": 8.456101364671431e-07, - "loss": 0.397, - "step": 65882 - }, - { - "epoch": 1.69, - "learning_rate": 8.455827978409578e-07, - "loss": 0.7109, - "step": 65883 - }, - { - "epoch": 1.69, - "learning_rate": 8.455554593330025e-07, - "loss": 0.7432, - "step": 65884 - }, - { - "epoch": 1.69, - "learning_rate": 8.455281209432984e-07, - "loss": 0.7656, - "step": 65885 - }, - { - "epoch": 1.69, - "learning_rate": 8.455007826718663e-07, - "loss": 0.6316, - "step": 65886 - }, - { - "epoch": 1.69, - "learning_rate": 8.454734445187274e-07, - "loss": 0.5894, - "step": 65887 - }, - { - "epoch": 1.69, - "learning_rate": 8.454461064839021e-07, - "loss": 0.6636, - "step": 65888 - }, - { - "epoch": 1.69, - "learning_rate": 8.454187685674118e-07, - "loss": 0.7104, - "step": 65889 - }, - { - "epoch": 1.69, - "learning_rate": 8.453914307692768e-07, - "loss": 0.689, - "step": 65890 - }, - { - "epoch": 1.69, - "learning_rate": 8.45364093089519e-07, - "loss": 0.6587, - "step": 65891 - }, - { - "epoch": 1.69, - "learning_rate": 8.453367555281584e-07, - "loss": 0.7256, - "step": 65892 - }, - { - "epoch": 1.69, - "learning_rate": 8.453094180852166e-07, - "loss": 0.5913, - "step": 65893 - }, - { - "epoch": 1.69, - "learning_rate": 8.452820807607139e-07, - "loss": 0.6611, - "step": 65894 - }, - { - "epoch": 1.69, - "learning_rate": 8.45254743554672e-07, - "loss": 0.6387, - "step": 65895 - }, - { - "epoch": 1.69, - "learning_rate": 8.452274064671112e-07, - "loss": 0.5737, - "step": 65896 - }, - { - "epoch": 1.69, - "learning_rate": 8.452000694980531e-07, - "loss": 0.645, - "step": 65897 - }, - { - "epoch": 1.69, - "learning_rate": 8.451727326475179e-07, - "loss": 0.5923, - "step": 65898 - }, - { - "epoch": 1.69, - "learning_rate": 8.451453959155268e-07, - "loss": 0.5029, - "step": 65899 - }, - { - "epoch": 1.69, - "learning_rate": 8.451180593021006e-07, - "loss": 0.6602, - "step": 65900 - }, - { - "epoch": 1.69, - "learning_rate": 8.450907228072606e-07, - "loss": 0.749, - "step": 65901 - }, - { - "epoch": 1.69, - "learning_rate": 8.450633864310272e-07, - "loss": 0.6133, - "step": 65902 - }, - { - "epoch": 1.69, - "learning_rate": 8.450360501734219e-07, - "loss": 0.5879, - "step": 65903 - }, - { - "epoch": 1.69, - "learning_rate": 8.450087140344653e-07, - "loss": 0.6436, - "step": 65904 - }, - { - "epoch": 1.69, - "learning_rate": 8.449813780141784e-07, - "loss": 0.6641, - "step": 65905 - }, - { - "epoch": 1.69, - "learning_rate": 8.449540421125824e-07, - "loss": 0.6038, - "step": 65906 - }, - { - "epoch": 1.69, - "learning_rate": 8.449267063296977e-07, - "loss": 0.5698, - "step": 65907 - }, - { - "epoch": 1.69, - "learning_rate": 8.448993706655455e-07, - "loss": 0.6953, - "step": 65908 - }, - { - "epoch": 1.69, - "learning_rate": 8.448720351201466e-07, - "loss": 0.5757, - "step": 65909 - }, - { - "epoch": 1.69, - "learning_rate": 8.448446996935222e-07, - "loss": 0.6079, - "step": 65910 - }, - { - "epoch": 1.69, - "learning_rate": 8.44817364385693e-07, - "loss": 0.6514, - "step": 65911 - }, - { - "epoch": 1.69, - "learning_rate": 8.447900291966801e-07, - "loss": 0.467, - "step": 65912 - }, - { - "epoch": 1.69, - "learning_rate": 8.447626941265041e-07, - "loss": 0.6265, - "step": 65913 - }, - { - "epoch": 1.69, - "learning_rate": 8.447353591751865e-07, - "loss": 0.6084, - "step": 65914 - }, - { - "epoch": 1.69, - "learning_rate": 8.447080243427476e-07, - "loss": 0.7295, - "step": 65915 - }, - { - "epoch": 1.69, - "learning_rate": 8.446806896292094e-07, - "loss": 0.7178, - "step": 65916 - }, - { - "epoch": 1.69, - "learning_rate": 8.446533550345912e-07, - "loss": 0.6299, - "step": 65917 - }, - { - "epoch": 1.69, - "learning_rate": 8.446260205589151e-07, - "loss": 0.7373, - "step": 65918 - }, - { - "epoch": 1.69, - "learning_rate": 8.445986862022014e-07, - "loss": 0.5796, - "step": 65919 - }, - { - "epoch": 1.69, - "learning_rate": 8.445713519644717e-07, - "loss": 0.6152, - "step": 65920 - }, - { - "epoch": 1.69, - "learning_rate": 8.445440178457463e-07, - "loss": 0.7344, - "step": 65921 - }, - { - "epoch": 1.69, - "learning_rate": 8.445166838460467e-07, - "loss": 0.8486, - "step": 65922 - }, - { - "epoch": 1.69, - "learning_rate": 8.444893499653931e-07, - "loss": 0.7109, - "step": 65923 - }, - { - "epoch": 1.69, - "learning_rate": 8.444620162038073e-07, - "loss": 0.665, - "step": 65924 - }, - { - "epoch": 1.69, - "learning_rate": 8.444346825613094e-07, - "loss": 0.6753, - "step": 65925 - }, - { - "epoch": 1.69, - "learning_rate": 8.444073490379212e-07, - "loss": 0.8916, - "step": 65926 - }, - { - "epoch": 1.69, - "learning_rate": 8.443800156336629e-07, - "loss": 0.6406, - "step": 65927 - }, - { - "epoch": 1.69, - "learning_rate": 8.443526823485555e-07, - "loss": 0.873, - "step": 65928 - }, - { - "epoch": 1.69, - "learning_rate": 8.443253491826204e-07, - "loss": 0.4657, - "step": 65929 - }, - { - "epoch": 1.69, - "learning_rate": 8.442980161358779e-07, - "loss": 0.6357, - "step": 65930 - }, - { - "epoch": 1.69, - "learning_rate": 8.442706832083494e-07, - "loss": 0.6914, - "step": 65931 - }, - { - "epoch": 1.69, - "learning_rate": 8.442433504000555e-07, - "loss": 0.5171, - "step": 65932 - }, - { - "epoch": 1.69, - "learning_rate": 8.442160177110175e-07, - "loss": 0.7236, - "step": 65933 - }, - { - "epoch": 1.69, - "learning_rate": 8.441886851412559e-07, - "loss": 0.5576, - "step": 65934 - }, - { - "epoch": 1.69, - "learning_rate": 8.441613526907922e-07, - "loss": 0.6636, - "step": 65935 - }, - { - "epoch": 1.69, - "learning_rate": 8.441340203596472e-07, - "loss": 0.3677, - "step": 65936 - }, - { - "epoch": 1.69, - "learning_rate": 8.441066881478414e-07, - "loss": 0.5791, - "step": 65937 - }, - { - "epoch": 1.69, - "learning_rate": 8.440793560553956e-07, - "loss": 0.5996, - "step": 65938 - }, - { - "epoch": 1.69, - "learning_rate": 8.440520240823313e-07, - "loss": 0.6567, - "step": 65939 - }, - { - "epoch": 1.69, - "learning_rate": 8.44024692228669e-07, - "loss": 0.4696, - "step": 65940 - }, - { - "epoch": 1.69, - "learning_rate": 8.4399736049443e-07, - "loss": 0.7158, - "step": 65941 - }, - { - "epoch": 1.69, - "learning_rate": 8.439700288796349e-07, - "loss": 0.6396, - "step": 65942 - }, - { - "epoch": 1.69, - "learning_rate": 8.439426973843051e-07, - "loss": 0.5474, - "step": 65943 - }, - { - "epoch": 1.69, - "learning_rate": 8.439153660084608e-07, - "loss": 0.6758, - "step": 65944 - }, - { - "epoch": 1.69, - "learning_rate": 8.438880347521235e-07, - "loss": 0.917, - "step": 65945 - }, - { - "epoch": 1.69, - "learning_rate": 8.438607036153143e-07, - "loss": 0.6865, - "step": 65946 - }, - { - "epoch": 1.69, - "learning_rate": 8.438333725980534e-07, - "loss": 0.7637, - "step": 65947 - }, - { - "epoch": 1.69, - "learning_rate": 8.438060417003623e-07, - "loss": 0.5361, - "step": 65948 - }, - { - "epoch": 1.69, - "learning_rate": 8.437787109222614e-07, - "loss": 0.667, - "step": 65949 - }, - { - "epoch": 1.69, - "learning_rate": 8.437513802637722e-07, - "loss": 0.8057, - "step": 65950 - }, - { - "epoch": 1.69, - "learning_rate": 8.437240497249153e-07, - "loss": 0.4927, - "step": 65951 - }, - { - "epoch": 1.69, - "learning_rate": 8.436967193057118e-07, - "loss": 0.6924, - "step": 65952 - }, - { - "epoch": 1.69, - "learning_rate": 8.436693890061824e-07, - "loss": 0.6826, - "step": 65953 - }, - { - "epoch": 1.69, - "learning_rate": 8.436420588263484e-07, - "loss": 0.5601, - "step": 65954 - }, - { - "epoch": 1.69, - "learning_rate": 8.436147287662303e-07, - "loss": 0.5735, - "step": 65955 - }, - { - "epoch": 1.69, - "learning_rate": 8.435873988258495e-07, - "loss": 0.6855, - "step": 65956 - }, - { - "epoch": 1.69, - "learning_rate": 8.435600690052262e-07, - "loss": 0.5713, - "step": 65957 - }, - { - "epoch": 1.69, - "learning_rate": 8.43532739304382e-07, - "loss": 0.8066, - "step": 65958 - }, - { - "epoch": 1.69, - "learning_rate": 8.435054097233375e-07, - "loss": 0.6001, - "step": 65959 - }, - { - "epoch": 1.69, - "learning_rate": 8.434780802621138e-07, - "loss": 0.5854, - "step": 65960 - }, - { - "epoch": 1.69, - "learning_rate": 8.434507509207316e-07, - "loss": 0.5854, - "step": 65961 - }, - { - "epoch": 1.69, - "learning_rate": 8.434234216992121e-07, - "loss": 0.6191, - "step": 65962 - }, - { - "epoch": 1.69, - "learning_rate": 8.433960925975759e-07, - "loss": 0.7012, - "step": 65963 - }, - { - "epoch": 1.69, - "learning_rate": 8.433687636158443e-07, - "loss": 0.8008, - "step": 65964 - }, - { - "epoch": 1.69, - "learning_rate": 8.433414347540378e-07, - "loss": 0.6216, - "step": 65965 - }, - { - "epoch": 1.69, - "learning_rate": 8.43314106012178e-07, - "loss": 0.6094, - "step": 65966 - }, - { - "epoch": 1.69, - "learning_rate": 8.432867773902852e-07, - "loss": 0.5339, - "step": 65967 - }, - { - "epoch": 1.69, - "learning_rate": 8.432594488883803e-07, - "loss": 0.5676, - "step": 65968 - }, - { - "epoch": 1.69, - "learning_rate": 8.432321205064847e-07, - "loss": 0.4907, - "step": 65969 - }, - { - "epoch": 1.69, - "learning_rate": 8.432047922446187e-07, - "loss": 0.7432, - "step": 65970 - }, - { - "epoch": 1.69, - "learning_rate": 8.431774641028039e-07, - "loss": 0.8018, - "step": 65971 - }, - { - "epoch": 1.69, - "learning_rate": 8.431501360810609e-07, - "loss": 0.6226, - "step": 65972 - }, - { - "epoch": 1.69, - "learning_rate": 8.431228081794104e-07, - "loss": 0.6348, - "step": 65973 - }, - { - "epoch": 1.69, - "learning_rate": 8.430954803978739e-07, - "loss": 0.6611, - "step": 65974 - }, - { - "epoch": 1.69, - "learning_rate": 8.430681527364714e-07, - "loss": 0.4231, - "step": 65975 - }, - { - "epoch": 1.69, - "learning_rate": 8.430408251952251e-07, - "loss": 0.834, - "step": 65976 - }, - { - "epoch": 1.69, - "learning_rate": 8.430134977741549e-07, - "loss": 0.5742, - "step": 65977 - }, - { - "epoch": 1.69, - "learning_rate": 8.42986170473282e-07, - "loss": 0.3323, - "step": 65978 - }, - { - "epoch": 1.69, - "learning_rate": 8.429588432926274e-07, - "loss": 0.4312, - "step": 65979 - }, - { - "epoch": 1.69, - "learning_rate": 8.42931516232212e-07, - "loss": 0.7266, - "step": 65980 - }, - { - "epoch": 1.69, - "learning_rate": 8.429041892920567e-07, - "loss": 0.644, - "step": 65981 - }, - { - "epoch": 1.69, - "learning_rate": 8.428768624721823e-07, - "loss": 0.5713, - "step": 65982 - }, - { - "epoch": 1.69, - "learning_rate": 8.428495357726101e-07, - "loss": 0.6748, - "step": 65983 - }, - { - "epoch": 1.69, - "learning_rate": 8.428222091933606e-07, - "loss": 0.6143, - "step": 65984 - }, - { - "epoch": 1.69, - "learning_rate": 8.427948827344549e-07, - "loss": 0.7437, - "step": 65985 - }, - { - "epoch": 1.69, - "learning_rate": 8.427675563959145e-07, - "loss": 0.5461, - "step": 65986 - }, - { - "epoch": 1.69, - "learning_rate": 8.427402301777591e-07, - "loss": 0.6492, - "step": 65987 - }, - { - "epoch": 1.69, - "learning_rate": 8.427129040800105e-07, - "loss": 0.5713, - "step": 65988 - }, - { - "epoch": 1.69, - "learning_rate": 8.426855781026895e-07, - "loss": 0.7061, - "step": 65989 - }, - { - "epoch": 1.69, - "learning_rate": 8.426582522458165e-07, - "loss": 0.5791, - "step": 65990 - }, - { - "epoch": 1.69, - "learning_rate": 8.426309265094133e-07, - "loss": 0.7354, - "step": 65991 - }, - { - "epoch": 1.69, - "learning_rate": 8.426036008935e-07, - "loss": 0.6318, - "step": 65992 - }, - { - "epoch": 1.69, - "learning_rate": 8.425762753980982e-07, - "loss": 0.6929, - "step": 65993 - }, - { - "epoch": 1.69, - "learning_rate": 8.425489500232283e-07, - "loss": 0.7354, - "step": 65994 - }, - { - "epoch": 1.69, - "learning_rate": 8.425216247689115e-07, - "loss": 0.6606, - "step": 65995 - }, - { - "epoch": 1.69, - "learning_rate": 8.42494299635169e-07, - "loss": 0.6494, - "step": 65996 - }, - { - "epoch": 1.69, - "learning_rate": 8.424669746220208e-07, - "loss": 0.7563, - "step": 65997 - }, - { - "epoch": 1.69, - "learning_rate": 8.424396497294887e-07, - "loss": 0.7139, - "step": 65998 - }, - { - "epoch": 1.69, - "learning_rate": 8.424123249575931e-07, - "loss": 0.7549, - "step": 65999 - }, - { - "epoch": 1.69, - "learning_rate": 8.423850003063553e-07, - "loss": 0.7969, - "step": 66000 - }, - { - "epoch": 1.69, - "learning_rate": 8.42357675775796e-07, - "loss": 0.5791, - "step": 66001 - }, - { - "epoch": 1.69, - "learning_rate": 8.423303513659362e-07, - "loss": 0.7388, - "step": 66002 - }, - { - "epoch": 1.69, - "learning_rate": 8.423030270767967e-07, - "loss": 0.5034, - "step": 66003 - }, - { - "epoch": 1.69, - "learning_rate": 8.422757029083987e-07, - "loss": 0.4434, - "step": 66004 - }, - { - "epoch": 1.69, - "learning_rate": 8.422483788607627e-07, - "loss": 0.6104, - "step": 66005 - }, - { - "epoch": 1.69, - "learning_rate": 8.422210549339104e-07, - "loss": 0.6357, - "step": 66006 - }, - { - "epoch": 1.69, - "learning_rate": 8.421937311278618e-07, - "loss": 0.5605, - "step": 66007 - }, - { - "epoch": 1.69, - "learning_rate": 8.421664074426383e-07, - "loss": 0.5095, - "step": 66008 - }, - { - "epoch": 1.69, - "learning_rate": 8.421390838782605e-07, - "loss": 0.6338, - "step": 66009 - }, - { - "epoch": 1.69, - "learning_rate": 8.421117604347499e-07, - "loss": 0.6089, - "step": 66010 - }, - { - "epoch": 1.69, - "learning_rate": 8.420844371121267e-07, - "loss": 0.5093, - "step": 66011 - }, - { - "epoch": 1.69, - "learning_rate": 8.420571139104123e-07, - "loss": 0.5938, - "step": 66012 - }, - { - "epoch": 1.69, - "learning_rate": 8.420297908296275e-07, - "loss": 0.501, - "step": 66013 - }, - { - "epoch": 1.69, - "learning_rate": 8.420024678697932e-07, - "loss": 0.6057, - "step": 66014 - }, - { - "epoch": 1.69, - "learning_rate": 8.419751450309304e-07, - "loss": 0.6611, - "step": 66015 - }, - { - "epoch": 1.69, - "learning_rate": 8.419478223130603e-07, - "loss": 0.7593, - "step": 66016 - }, - { - "epoch": 1.69, - "learning_rate": 8.419204997162032e-07, - "loss": 0.6162, - "step": 66017 - }, - { - "epoch": 1.69, - "learning_rate": 8.418931772403801e-07, - "loss": 0.7637, - "step": 66018 - }, - { - "epoch": 1.69, - "learning_rate": 8.418658548856124e-07, - "loss": 0.6479, - "step": 66019 - }, - { - "epoch": 1.69, - "learning_rate": 8.418385326519205e-07, - "loss": 0.7754, - "step": 66020 - }, - { - "epoch": 1.69, - "learning_rate": 8.418112105393258e-07, - "loss": 0.5217, - "step": 66021 - }, - { - "epoch": 1.69, - "learning_rate": 8.417838885478488e-07, - "loss": 0.7217, - "step": 66022 - }, - { - "epoch": 1.69, - "learning_rate": 8.417565666775108e-07, - "loss": 0.5674, - "step": 66023 - }, - { - "epoch": 1.69, - "learning_rate": 8.417292449283322e-07, - "loss": 0.5073, - "step": 66024 - }, - { - "epoch": 1.69, - "learning_rate": 8.417019233003344e-07, - "loss": 0.7095, - "step": 66025 - }, - { - "epoch": 1.69, - "learning_rate": 8.416746017935386e-07, - "loss": 0.5786, - "step": 66026 - }, - { - "epoch": 1.69, - "learning_rate": 8.41647280407965e-07, - "loss": 0.6226, - "step": 66027 - }, - { - "epoch": 1.69, - "learning_rate": 8.416199591436344e-07, - "loss": 0.7871, - "step": 66028 - }, - { - "epoch": 1.69, - "learning_rate": 8.415926380005686e-07, - "loss": 0.5569, - "step": 66029 - }, - { - "epoch": 1.69, - "learning_rate": 8.415653169787876e-07, - "loss": 0.6582, - "step": 66030 - }, - { - "epoch": 1.69, - "learning_rate": 8.415379960783131e-07, - "loss": 0.6318, - "step": 66031 - }, - { - "epoch": 1.69, - "learning_rate": 8.415106752991655e-07, - "loss": 0.834, - "step": 66032 - }, - { - "epoch": 1.69, - "learning_rate": 8.414833546413659e-07, - "loss": 0.6475, - "step": 66033 - }, - { - "epoch": 1.69, - "learning_rate": 8.414560341049351e-07, - "loss": 0.5002, - "step": 66034 - }, - { - "epoch": 1.69, - "learning_rate": 8.414287136898943e-07, - "loss": 0.7021, - "step": 66035 - }, - { - "epoch": 1.69, - "learning_rate": 8.414013933962645e-07, - "loss": 0.7158, - "step": 66036 - }, - { - "epoch": 1.69, - "learning_rate": 8.413740732240659e-07, - "loss": 0.8291, - "step": 66037 - }, - { - "epoch": 1.69, - "learning_rate": 8.413467531733203e-07, - "loss": 0.8701, - "step": 66038 - }, - { - "epoch": 1.69, - "learning_rate": 8.413194332440477e-07, - "loss": 0.8115, - "step": 66039 - }, - { - "epoch": 1.69, - "learning_rate": 8.412921134362698e-07, - "loss": 0.5533, - "step": 66040 - }, - { - "epoch": 1.69, - "learning_rate": 8.412647937500071e-07, - "loss": 0.7354, - "step": 66041 - }, - { - "epoch": 1.69, - "learning_rate": 8.412374741852808e-07, - "loss": 0.6123, - "step": 66042 - }, - { - "epoch": 1.69, - "learning_rate": 8.412101547421116e-07, - "loss": 0.5691, - "step": 66043 - }, - { - "epoch": 1.69, - "learning_rate": 8.411828354205205e-07, - "loss": 0.4631, - "step": 66044 - }, - { - "epoch": 1.69, - "learning_rate": 8.411555162205284e-07, - "loss": 0.7295, - "step": 66045 - }, - { - "epoch": 1.69, - "learning_rate": 8.411281971421566e-07, - "loss": 0.624, - "step": 66046 - }, - { - "epoch": 1.69, - "learning_rate": 8.411008781854249e-07, - "loss": 0.7725, - "step": 66047 - }, - { - "epoch": 1.69, - "learning_rate": 8.410735593503555e-07, - "loss": 0.5879, - "step": 66048 - }, - { - "epoch": 1.69, - "learning_rate": 8.410462406369683e-07, - "loss": 0.585, - "step": 66049 - }, - { - "epoch": 1.69, - "learning_rate": 8.410189220452851e-07, - "loss": 0.6143, - "step": 66050 - }, - { - "epoch": 1.69, - "learning_rate": 8.409916035753262e-07, - "loss": 0.5781, - "step": 66051 - }, - { - "epoch": 1.69, - "learning_rate": 8.409642852271128e-07, - "loss": 0.667, - "step": 66052 - }, - { - "epoch": 1.69, - "learning_rate": 8.409369670006655e-07, - "loss": 0.627, - "step": 66053 - }, - { - "epoch": 1.69, - "learning_rate": 8.409096488960058e-07, - "loss": 0.6431, - "step": 66054 - }, - { - "epoch": 1.69, - "learning_rate": 8.40882330913154e-07, - "loss": 0.5371, - "step": 66055 - }, - { - "epoch": 1.69, - "learning_rate": 8.408550130521316e-07, - "loss": 0.5312, - "step": 66056 - }, - { - "epoch": 1.69, - "learning_rate": 8.408276953129591e-07, - "loss": 0.6001, - "step": 66057 - }, - { - "epoch": 1.69, - "learning_rate": 8.408003776956573e-07, - "loss": 0.542, - "step": 66058 - }, - { - "epoch": 1.69, - "learning_rate": 8.407730602002475e-07, - "loss": 0.7197, - "step": 66059 - }, - { - "epoch": 1.69, - "learning_rate": 8.407457428267503e-07, - "loss": 0.5889, - "step": 66060 - }, - { - "epoch": 1.69, - "learning_rate": 8.407184255751869e-07, - "loss": 0.5576, - "step": 66061 - }, - { - "epoch": 1.69, - "learning_rate": 8.406911084455781e-07, - "loss": 0.7285, - "step": 66062 - }, - { - "epoch": 1.69, - "learning_rate": 8.406637914379445e-07, - "loss": 0.5215, - "step": 66063 - }, - { - "epoch": 1.69, - "learning_rate": 8.406364745523076e-07, - "loss": 0.5459, - "step": 66064 - }, - { - "epoch": 1.69, - "learning_rate": 8.406091577886879e-07, - "loss": 0.6438, - "step": 66065 - }, - { - "epoch": 1.69, - "learning_rate": 8.405818411471067e-07, - "loss": 0.7832, - "step": 66066 - }, - { - "epoch": 1.69, - "learning_rate": 8.405545246275845e-07, - "loss": 0.6777, - "step": 66067 - }, - { - "epoch": 1.69, - "learning_rate": 8.405272082301422e-07, - "loss": 0.6025, - "step": 66068 - }, - { - "epoch": 1.69, - "learning_rate": 8.404998919548012e-07, - "loss": 0.6206, - "step": 66069 - }, - { - "epoch": 1.69, - "learning_rate": 8.404725758015817e-07, - "loss": 0.563, - "step": 66070 - }, - { - "epoch": 1.69, - "learning_rate": 8.404452597705053e-07, - "loss": 0.6172, - "step": 66071 - }, - { - "epoch": 1.69, - "learning_rate": 8.404179438615924e-07, - "loss": 0.5684, - "step": 66072 - }, - { - "epoch": 1.69, - "learning_rate": 8.403906280748643e-07, - "loss": 0.7031, - "step": 66073 - }, - { - "epoch": 1.69, - "learning_rate": 8.403633124103417e-07, - "loss": 0.6899, - "step": 66074 - }, - { - "epoch": 1.69, - "learning_rate": 8.403359968680457e-07, - "loss": 0.5874, - "step": 66075 - }, - { - "epoch": 1.69, - "learning_rate": 8.403086814479972e-07, - "loss": 0.5771, - "step": 66076 - }, - { - "epoch": 1.69, - "learning_rate": 8.402813661502166e-07, - "loss": 0.6836, - "step": 66077 - }, - { - "epoch": 1.69, - "learning_rate": 8.402540509747256e-07, - "loss": 0.6426, - "step": 66078 - }, - { - "epoch": 1.69, - "learning_rate": 8.402267359215445e-07, - "loss": 0.627, - "step": 66079 - }, - { - "epoch": 1.69, - "learning_rate": 8.401994209906944e-07, - "loss": 0.6416, - "step": 66080 - }, - { - "epoch": 1.69, - "learning_rate": 8.401721061821965e-07, - "loss": 0.6777, - "step": 66081 - }, - { - "epoch": 1.69, - "learning_rate": 8.401447914960711e-07, - "loss": 0.5054, - "step": 66082 - }, - { - "epoch": 1.69, - "learning_rate": 8.401174769323398e-07, - "loss": 0.5032, - "step": 66083 - }, - { - "epoch": 1.69, - "learning_rate": 8.400901624910228e-07, - "loss": 0.8281, - "step": 66084 - }, - { - "epoch": 1.69, - "learning_rate": 8.400628481721419e-07, - "loss": 0.5892, - "step": 66085 - }, - { - "epoch": 1.69, - "learning_rate": 8.400355339757176e-07, - "loss": 0.6904, - "step": 66086 - }, - { - "epoch": 1.69, - "learning_rate": 8.400082199017703e-07, - "loss": 0.5845, - "step": 66087 - }, - { - "epoch": 1.69, - "learning_rate": 8.399809059503216e-07, - "loss": 0.6016, - "step": 66088 - }, - { - "epoch": 1.69, - "learning_rate": 8.399535921213918e-07, - "loss": 0.8779, - "step": 66089 - }, - { - "epoch": 1.69, - "learning_rate": 8.399262784150027e-07, - "loss": 0.6318, - "step": 66090 - }, - { - "epoch": 1.69, - "learning_rate": 8.398989648311742e-07, - "loss": 0.7192, - "step": 66091 - }, - { - "epoch": 1.69, - "learning_rate": 8.39871651369928e-07, - "loss": 0.6133, - "step": 66092 - }, - { - "epoch": 1.69, - "learning_rate": 8.398443380312845e-07, - "loss": 0.6372, - "step": 66093 - }, - { - "epoch": 1.69, - "learning_rate": 8.398170248152651e-07, - "loss": 0.8135, - "step": 66094 - }, - { - "epoch": 1.69, - "learning_rate": 8.397897117218902e-07, - "loss": 0.5625, - "step": 66095 - }, - { - "epoch": 1.69, - "learning_rate": 8.397623987511813e-07, - "loss": 0.5361, - "step": 66096 - }, - { - "epoch": 1.69, - "learning_rate": 8.397350859031588e-07, - "loss": 0.7041, - "step": 66097 - }, - { - "epoch": 1.69, - "learning_rate": 8.397077731778437e-07, - "loss": 0.6562, - "step": 66098 - }, - { - "epoch": 1.69, - "learning_rate": 8.396804605752569e-07, - "loss": 0.75, - "step": 66099 - }, - { - "epoch": 1.69, - "learning_rate": 8.396531480954195e-07, - "loss": 0.5483, - "step": 66100 - }, - { - "epoch": 1.69, - "learning_rate": 8.396258357383523e-07, - "loss": 0.5396, - "step": 66101 - }, - { - "epoch": 1.69, - "learning_rate": 8.395985235040762e-07, - "loss": 0.7368, - "step": 66102 - }, - { - "epoch": 1.69, - "learning_rate": 8.39571211392612e-07, - "loss": 0.584, - "step": 66103 - }, - { - "epoch": 1.69, - "learning_rate": 8.39543899403981e-07, - "loss": 0.6904, - "step": 66104 - }, - { - "epoch": 1.69, - "learning_rate": 8.395165875382036e-07, - "loss": 0.6787, - "step": 66105 - }, - { - "epoch": 1.69, - "learning_rate": 8.394892757953014e-07, - "loss": 0.667, - "step": 66106 - }, - { - "epoch": 1.69, - "learning_rate": 8.394619641752947e-07, - "loss": 0.7773, - "step": 66107 - }, - { - "epoch": 1.69, - "learning_rate": 8.394346526782043e-07, - "loss": 0.446, - "step": 66108 - }, - { - "epoch": 1.69, - "learning_rate": 8.394073413040518e-07, - "loss": 0.6357, - "step": 66109 - }, - { - "epoch": 1.69, - "learning_rate": 8.393800300528573e-07, - "loss": 0.4493, - "step": 66110 - }, - { - "epoch": 1.69, - "learning_rate": 8.393527189246424e-07, - "loss": 0.6094, - "step": 66111 - }, - { - "epoch": 1.69, - "learning_rate": 8.393254079194276e-07, - "loss": 0.2987, - "step": 66112 - }, - { - "epoch": 1.69, - "learning_rate": 8.392980970372341e-07, - "loss": 0.4878, - "step": 66113 - }, - { - "epoch": 1.69, - "learning_rate": 8.392707862780825e-07, - "loss": 0.3899, - "step": 66114 - }, - { - "epoch": 1.69, - "learning_rate": 8.392434756419939e-07, - "loss": 0.9658, - "step": 66115 - }, - { - "epoch": 1.69, - "learning_rate": 8.392161651289896e-07, - "loss": 0.6318, - "step": 66116 - }, - { - "epoch": 1.69, - "learning_rate": 8.391888547390899e-07, - "loss": 0.6523, - "step": 66117 - }, - { - "epoch": 1.69, - "learning_rate": 8.391615444723154e-07, - "loss": 0.6841, - "step": 66118 - }, - { - "epoch": 1.69, - "learning_rate": 8.39134234328688e-07, - "loss": 0.2665, - "step": 66119 - }, - { - "epoch": 1.69, - "learning_rate": 8.391069243082278e-07, - "loss": 0.627, - "step": 66120 - }, - { - "epoch": 1.69, - "learning_rate": 8.390796144109563e-07, - "loss": 0.6099, - "step": 66121 - }, - { - "epoch": 1.69, - "learning_rate": 8.390523046368938e-07, - "loss": 0.5317, - "step": 66122 - }, - { - "epoch": 1.69, - "learning_rate": 8.390249949860619e-07, - "loss": 0.625, - "step": 66123 - }, - { - "epoch": 1.69, - "learning_rate": 8.389976854584809e-07, - "loss": 0.6812, - "step": 66124 - }, - { - "epoch": 1.69, - "learning_rate": 8.389703760541722e-07, - "loss": 0.6311, - "step": 66125 - }, - { - "epoch": 1.69, - "learning_rate": 8.389430667731566e-07, - "loss": 0.6553, - "step": 66126 - }, - { - "epoch": 1.69, - "learning_rate": 8.389157576154547e-07, - "loss": 0.5874, - "step": 66127 - }, - { - "epoch": 1.69, - "learning_rate": 8.388884485810875e-07, - "loss": 0.5151, - "step": 66128 - }, - { - "epoch": 1.69, - "learning_rate": 8.38861139670076e-07, - "loss": 0.6777, - "step": 66129 - }, - { - "epoch": 1.69, - "learning_rate": 8.388338308824412e-07, - "loss": 0.5867, - "step": 66130 - }, - { - "epoch": 1.69, - "learning_rate": 8.388065222182038e-07, - "loss": 0.528, - "step": 66131 - }, - { - "epoch": 1.69, - "learning_rate": 8.387792136773851e-07, - "loss": 0.5457, - "step": 66132 - }, - { - "epoch": 1.7, - "learning_rate": 8.387519052600054e-07, - "loss": 0.7285, - "step": 66133 - }, - { - "epoch": 1.7, - "learning_rate": 8.387245969660863e-07, - "loss": 0.5693, - "step": 66134 - }, - { - "epoch": 1.7, - "learning_rate": 8.386972887956481e-07, - "loss": 0.6587, - "step": 66135 - }, - { - "epoch": 1.7, - "learning_rate": 8.386699807487124e-07, - "loss": 0.6113, - "step": 66136 - }, - { - "epoch": 1.7, - "learning_rate": 8.386426728252994e-07, - "loss": 0.5913, - "step": 66137 - }, - { - "epoch": 1.7, - "learning_rate": 8.386153650254302e-07, - "loss": 0.5908, - "step": 66138 - }, - { - "epoch": 1.7, - "learning_rate": 8.385880573491257e-07, - "loss": 0.6157, - "step": 66139 - }, - { - "epoch": 1.7, - "learning_rate": 8.385607497964071e-07, - "loss": 0.5874, - "step": 66140 - }, - { - "epoch": 1.7, - "learning_rate": 8.385334423672948e-07, - "loss": 0.7627, - "step": 66141 - }, - { - "epoch": 1.7, - "learning_rate": 8.385061350618104e-07, - "loss": 0.7139, - "step": 66142 - }, - { - "epoch": 1.7, - "learning_rate": 8.384788278799741e-07, - "loss": 0.4014, - "step": 66143 - }, - { - "epoch": 1.7, - "learning_rate": 8.384515208218075e-07, - "loss": 0.6377, - "step": 66144 - }, - { - "epoch": 1.7, - "learning_rate": 8.384242138873308e-07, - "loss": 0.6016, - "step": 66145 - }, - { - "epoch": 1.7, - "learning_rate": 8.383969070765657e-07, - "loss": 0.5752, - "step": 66146 - }, - { - "epoch": 1.7, - "learning_rate": 8.383696003895324e-07, - "loss": 0.4167, - "step": 66147 - }, - { - "epoch": 1.7, - "learning_rate": 8.383422938262519e-07, - "loss": 0.6504, - "step": 66148 - }, - { - "epoch": 1.7, - "learning_rate": 8.383149873867455e-07, - "loss": 0.7451, - "step": 66149 - }, - { - "epoch": 1.7, - "learning_rate": 8.382876810710336e-07, - "loss": 0.8438, - "step": 66150 - }, - { - "epoch": 1.7, - "learning_rate": 8.382603748791377e-07, - "loss": 0.5781, - "step": 66151 - }, - { - "epoch": 1.7, - "learning_rate": 8.382330688110784e-07, - "loss": 0.6553, - "step": 66152 - }, - { - "epoch": 1.7, - "learning_rate": 8.382057628668763e-07, - "loss": 0.3699, - "step": 66153 - }, - { - "epoch": 1.7, - "learning_rate": 8.381784570465529e-07, - "loss": 0.5273, - "step": 66154 - }, - { - "epoch": 1.7, - "learning_rate": 8.381511513501285e-07, - "loss": 0.7139, - "step": 66155 - }, - { - "epoch": 1.7, - "learning_rate": 8.381238457776248e-07, - "loss": 0.6323, - "step": 66156 - }, - { - "epoch": 1.7, - "learning_rate": 8.38096540329062e-07, - "loss": 0.7036, - "step": 66157 - }, - { - "epoch": 1.7, - "learning_rate": 8.380692350044612e-07, - "loss": 0.6826, - "step": 66158 - }, - { - "epoch": 1.7, - "learning_rate": 8.380419298038433e-07, - "loss": 0.6895, - "step": 66159 - }, - { - "epoch": 1.7, - "learning_rate": 8.380146247272291e-07, - "loss": 0.7539, - "step": 66160 - }, - { - "epoch": 1.7, - "learning_rate": 8.379873197746399e-07, - "loss": 0.7383, - "step": 66161 - }, - { - "epoch": 1.7, - "learning_rate": 8.379600149460962e-07, - "loss": 0.6455, - "step": 66162 - }, - { - "epoch": 1.7, - "learning_rate": 8.379327102416191e-07, - "loss": 0.7148, - "step": 66163 - }, - { - "epoch": 1.7, - "learning_rate": 8.379054056612295e-07, - "loss": 0.6001, - "step": 66164 - }, - { - "epoch": 1.7, - "learning_rate": 8.378781012049483e-07, - "loss": 0.5344, - "step": 66165 - }, - { - "epoch": 1.7, - "learning_rate": 8.378507968727967e-07, - "loss": 0.4023, - "step": 66166 - }, - { - "epoch": 1.7, - "learning_rate": 8.378234926647948e-07, - "loss": 0.6943, - "step": 66167 - }, - { - "epoch": 1.7, - "learning_rate": 8.377961885809642e-07, - "loss": 0.6016, - "step": 66168 - }, - { - "epoch": 1.7, - "learning_rate": 8.377688846213256e-07, - "loss": 0.428, - "step": 66169 - }, - { - "epoch": 1.7, - "learning_rate": 8.377415807858998e-07, - "loss": 0.4912, - "step": 66170 - }, - { - "epoch": 1.7, - "learning_rate": 8.377142770747079e-07, - "loss": 0.5151, - "step": 66171 - }, - { - "epoch": 1.7, - "learning_rate": 8.376869734877706e-07, - "loss": 0.709, - "step": 66172 - }, - { - "epoch": 1.7, - "learning_rate": 8.376596700251092e-07, - "loss": 0.5737, - "step": 66173 - }, - { - "epoch": 1.7, - "learning_rate": 8.37632366686744e-07, - "loss": 0.6118, - "step": 66174 - }, - { - "epoch": 1.7, - "learning_rate": 8.376050634726964e-07, - "loss": 0.5527, - "step": 66175 - }, - { - "epoch": 1.7, - "learning_rate": 8.375777603829875e-07, - "loss": 0.5674, - "step": 66176 - }, - { - "epoch": 1.7, - "learning_rate": 8.375504574176372e-07, - "loss": 0.707, - "step": 66177 - }, - { - "epoch": 1.7, - "learning_rate": 8.375231545766674e-07, - "loss": 0.4482, - "step": 66178 - }, - { - "epoch": 1.7, - "learning_rate": 8.374958518600984e-07, - "loss": 0.6357, - "step": 66179 - }, - { - "epoch": 1.7, - "learning_rate": 8.374685492679515e-07, - "loss": 0.5498, - "step": 66180 - }, - { - "epoch": 1.7, - "learning_rate": 8.374412468002474e-07, - "loss": 0.4805, - "step": 66181 - }, - { - "epoch": 1.7, - "learning_rate": 8.374139444570072e-07, - "loss": 0.6133, - "step": 66182 - }, - { - "epoch": 1.7, - "learning_rate": 8.373866422382514e-07, - "loss": 0.3939, - "step": 66183 - }, - { - "epoch": 1.7, - "learning_rate": 8.373593401440014e-07, - "loss": 0.5399, - "step": 66184 - }, - { - "epoch": 1.7, - "learning_rate": 8.373320381742777e-07, - "loss": 0.6865, - "step": 66185 - }, - { - "epoch": 1.7, - "learning_rate": 8.373047363291018e-07, - "loss": 0.6992, - "step": 66186 - }, - { - "epoch": 1.7, - "learning_rate": 8.37277434608494e-07, - "loss": 0.6079, - "step": 66187 - }, - { - "epoch": 1.7, - "learning_rate": 8.372501330124754e-07, - "loss": 0.5, - "step": 66188 - }, - { - "epoch": 1.7, - "learning_rate": 8.372228315410666e-07, - "loss": 0.6904, - "step": 66189 - }, - { - "epoch": 1.7, - "learning_rate": 8.37195530194289e-07, - "loss": 0.6973, - "step": 66190 - }, - { - "epoch": 1.7, - "learning_rate": 8.371682289721631e-07, - "loss": 0.6562, - "step": 66191 - }, - { - "epoch": 1.7, - "learning_rate": 8.371409278747104e-07, - "loss": 0.4868, - "step": 66192 - }, - { - "epoch": 1.7, - "learning_rate": 8.371136269019509e-07, - "loss": 0.7241, - "step": 66193 - }, - { - "epoch": 1.7, - "learning_rate": 8.370863260539064e-07, - "loss": 0.6909, - "step": 66194 - }, - { - "epoch": 1.7, - "learning_rate": 8.370590253305976e-07, - "loss": 0.7188, - "step": 66195 - }, - { - "epoch": 1.7, - "learning_rate": 8.370317247320446e-07, - "loss": 0.6763, - "step": 66196 - }, - { - "epoch": 1.7, - "learning_rate": 8.370044242582693e-07, - "loss": 0.792, - "step": 66197 - }, - { - "epoch": 1.7, - "learning_rate": 8.36977123909292e-07, - "loss": 0.5811, - "step": 66198 - }, - { - "epoch": 1.7, - "learning_rate": 8.36949823685134e-07, - "loss": 0.6299, - "step": 66199 - }, - { - "epoch": 1.7, - "learning_rate": 8.36922523585816e-07, - "loss": 0.7861, - "step": 66200 - }, - { - "epoch": 1.7, - "learning_rate": 8.368952236113589e-07, - "loss": 0.5474, - "step": 66201 - }, - { - "epoch": 1.7, - "learning_rate": 8.368679237617834e-07, - "loss": 0.6196, - "step": 66202 - }, - { - "epoch": 1.7, - "learning_rate": 8.36840624037111e-07, - "loss": 0.624, - "step": 66203 - }, - { - "epoch": 1.7, - "learning_rate": 8.368133244373619e-07, - "loss": 0.5334, - "step": 66204 - }, - { - "epoch": 1.7, - "learning_rate": 8.36786024962558e-07, - "loss": 0.6543, - "step": 66205 - }, - { - "epoch": 1.7, - "learning_rate": 8.367587256127188e-07, - "loss": 0.6738, - "step": 66206 - }, - { - "epoch": 1.7, - "learning_rate": 8.367314263878664e-07, - "loss": 0.688, - "step": 66207 - }, - { - "epoch": 1.7, - "learning_rate": 8.367041272880209e-07, - "loss": 0.5875, - "step": 66208 - }, - { - "epoch": 1.7, - "learning_rate": 8.366768283132038e-07, - "loss": 0.6357, - "step": 66209 - }, - { - "epoch": 1.7, - "learning_rate": 8.366495294634354e-07, - "loss": 0.4175, - "step": 66210 - }, - { - "epoch": 1.7, - "learning_rate": 8.366222307387372e-07, - "loss": 0.5835, - "step": 66211 - }, - { - "epoch": 1.7, - "learning_rate": 8.365949321391297e-07, - "loss": 0.8076, - "step": 66212 - }, - { - "epoch": 1.7, - "learning_rate": 8.365676336646341e-07, - "loss": 0.6172, - "step": 66213 - }, - { - "epoch": 1.7, - "learning_rate": 8.365403353152709e-07, - "loss": 0.6924, - "step": 66214 - }, - { - "epoch": 1.7, - "learning_rate": 8.365130370910618e-07, - "loss": 0.6973, - "step": 66215 - }, - { - "epoch": 1.7, - "learning_rate": 8.364857389920268e-07, - "loss": 0.6299, - "step": 66216 - }, - { - "epoch": 1.7, - "learning_rate": 8.36458441018187e-07, - "loss": 0.4888, - "step": 66217 - }, - { - "epoch": 1.7, - "learning_rate": 8.364311431695638e-07, - "loss": 0.5034, - "step": 66218 - }, - { - "epoch": 1.7, - "learning_rate": 8.364038454461774e-07, - "loss": 0.5669, - "step": 66219 - }, - { - "epoch": 1.7, - "learning_rate": 8.363765478480493e-07, - "loss": 0.6279, - "step": 66220 - }, - { - "epoch": 1.7, - "learning_rate": 8.363492503751999e-07, - "loss": 0.5352, - "step": 66221 - }, - { - "epoch": 1.7, - "learning_rate": 8.363219530276505e-07, - "loss": 0.5723, - "step": 66222 - }, - { - "epoch": 1.7, - "learning_rate": 8.362946558054218e-07, - "loss": 0.8125, - "step": 66223 - }, - { - "epoch": 1.7, - "learning_rate": 8.362673587085348e-07, - "loss": 0.554, - "step": 66224 - }, - { - "epoch": 1.7, - "learning_rate": 8.362400617370107e-07, - "loss": 0.7314, - "step": 66225 - }, - { - "epoch": 1.7, - "learning_rate": 8.362127648908698e-07, - "loss": 0.624, - "step": 66226 - }, - { - "epoch": 1.7, - "learning_rate": 8.361854681701331e-07, - "loss": 0.8184, - "step": 66227 - }, - { - "epoch": 1.7, - "learning_rate": 8.361581715748218e-07, - "loss": 0.6016, - "step": 66228 - }, - { - "epoch": 1.7, - "learning_rate": 8.361308751049565e-07, - "loss": 0.5256, - "step": 66229 - }, - { - "epoch": 1.7, - "learning_rate": 8.361035787605584e-07, - "loss": 0.7012, - "step": 66230 - }, - { - "epoch": 1.7, - "learning_rate": 8.360762825416481e-07, - "loss": 0.5896, - "step": 66231 - }, - { - "epoch": 1.7, - "learning_rate": 8.360489864482467e-07, - "loss": 0.6606, - "step": 66232 - }, - { - "epoch": 1.7, - "learning_rate": 8.36021690480375e-07, - "loss": 0.6348, - "step": 66233 - }, - { - "epoch": 1.7, - "learning_rate": 8.35994394638054e-07, - "loss": 0.6406, - "step": 66234 - }, - { - "epoch": 1.7, - "learning_rate": 8.35967098921305e-07, - "loss": 0.6343, - "step": 66235 - }, - { - "epoch": 1.7, - "learning_rate": 8.359398033301479e-07, - "loss": 0.6494, - "step": 66236 - }, - { - "epoch": 1.7, - "learning_rate": 8.359125078646044e-07, - "loss": 0.8096, - "step": 66237 - }, - { - "epoch": 1.7, - "learning_rate": 8.358852125246949e-07, - "loss": 0.6108, - "step": 66238 - }, - { - "epoch": 1.7, - "learning_rate": 8.358579173104409e-07, - "loss": 0.4963, - "step": 66239 - }, - { - "epoch": 1.7, - "learning_rate": 8.358306222218625e-07, - "loss": 0.5952, - "step": 66240 - }, - { - "epoch": 1.7, - "learning_rate": 8.358033272589814e-07, - "loss": 0.7305, - "step": 66241 - }, - { - "epoch": 1.7, - "learning_rate": 8.357760324218182e-07, - "loss": 0.8154, - "step": 66242 - }, - { - "epoch": 1.7, - "learning_rate": 8.357487377103934e-07, - "loss": 0.6494, - "step": 66243 - }, - { - "epoch": 1.7, - "learning_rate": 8.357214431247285e-07, - "loss": 0.5806, - "step": 66244 - }, - { - "epoch": 1.7, - "learning_rate": 8.356941486648444e-07, - "loss": 0.5718, - "step": 66245 - }, - { - "epoch": 1.7, - "learning_rate": 8.356668543307611e-07, - "loss": 0.6252, - "step": 66246 - }, - { - "epoch": 1.7, - "learning_rate": 8.356395601225006e-07, - "loss": 0.5527, - "step": 66247 - }, - { - "epoch": 1.7, - "learning_rate": 8.35612266040083e-07, - "loss": 0.4946, - "step": 66248 - }, - { - "epoch": 1.7, - "learning_rate": 8.355849720835297e-07, - "loss": 0.5352, - "step": 66249 - }, - { - "epoch": 1.7, - "learning_rate": 8.355576782528612e-07, - "loss": 0.7646, - "step": 66250 - }, - { - "epoch": 1.7, - "learning_rate": 8.35530384548099e-07, - "loss": 0.6499, - "step": 66251 - }, - { - "epoch": 1.7, - "learning_rate": 8.355030909692633e-07, - "loss": 0.6445, - "step": 66252 - }, - { - "epoch": 1.7, - "learning_rate": 8.354757975163755e-07, - "loss": 0.7334, - "step": 66253 - }, - { - "epoch": 1.7, - "learning_rate": 8.354485041894562e-07, - "loss": 0.8311, - "step": 66254 - }, - { - "epoch": 1.7, - "learning_rate": 8.354212109885268e-07, - "loss": 0.6309, - "step": 66255 - }, - { - "epoch": 1.7, - "learning_rate": 8.353939179136076e-07, - "loss": 0.6069, - "step": 66256 - }, - { - "epoch": 1.7, - "learning_rate": 8.353666249647194e-07, - "loss": 0.7393, - "step": 66257 - }, - { - "epoch": 1.7, - "learning_rate": 8.353393321418838e-07, - "loss": 0.6104, - "step": 66258 - }, - { - "epoch": 1.7, - "learning_rate": 8.353120394451209e-07, - "loss": 0.5737, - "step": 66259 - }, - { - "epoch": 1.7, - "learning_rate": 8.352847468744524e-07, - "loss": 0.4868, - "step": 66260 - }, - { - "epoch": 1.7, - "learning_rate": 8.352574544298987e-07, - "loss": 0.6143, - "step": 66261 - }, - { - "epoch": 1.7, - "learning_rate": 8.352301621114805e-07, - "loss": 0.5557, - "step": 66262 - }, - { - "epoch": 1.7, - "learning_rate": 8.352028699192193e-07, - "loss": 0.6235, - "step": 66263 - }, - { - "epoch": 1.7, - "learning_rate": 8.351755778531355e-07, - "loss": 0.4688, - "step": 66264 - }, - { - "epoch": 1.7, - "learning_rate": 8.351482859132506e-07, - "loss": 0.624, - "step": 66265 - }, - { - "epoch": 1.7, - "learning_rate": 8.351209940995848e-07, - "loss": 0.6343, - "step": 66266 - }, - { - "epoch": 1.7, - "learning_rate": 8.35093702412159e-07, - "loss": 0.6494, - "step": 66267 - }, - { - "epoch": 1.7, - "learning_rate": 8.350664108509947e-07, - "loss": 0.6431, - "step": 66268 - }, - { - "epoch": 1.7, - "learning_rate": 8.350391194161123e-07, - "loss": 0.6875, - "step": 66269 - }, - { - "epoch": 1.7, - "learning_rate": 8.350118281075329e-07, - "loss": 0.7568, - "step": 66270 - }, - { - "epoch": 1.7, - "learning_rate": 8.349845369252773e-07, - "loss": 0.6353, - "step": 66271 - }, - { - "epoch": 1.7, - "learning_rate": 8.349572458693665e-07, - "loss": 0.6216, - "step": 66272 - }, - { - "epoch": 1.7, - "learning_rate": 8.349299549398213e-07, - "loss": 0.6387, - "step": 66273 - }, - { - "epoch": 1.7, - "learning_rate": 8.349026641366628e-07, - "loss": 0.7324, - "step": 66274 - }, - { - "epoch": 1.7, - "learning_rate": 8.34875373459912e-07, - "loss": 0.5933, - "step": 66275 - }, - { - "epoch": 1.7, - "learning_rate": 8.348480829095889e-07, - "loss": 0.5137, - "step": 66276 - }, - { - "epoch": 1.7, - "learning_rate": 8.348207924857154e-07, - "loss": 0.7432, - "step": 66277 - }, - { - "epoch": 1.7, - "learning_rate": 8.347935021883121e-07, - "loss": 0.4852, - "step": 66278 - }, - { - "epoch": 1.7, - "learning_rate": 8.347662120173995e-07, - "loss": 0.6484, - "step": 66279 - }, - { - "epoch": 1.7, - "learning_rate": 8.347389219729991e-07, - "loss": 0.6514, - "step": 66280 - }, - { - "epoch": 1.7, - "learning_rate": 8.347116320551312e-07, - "loss": 0.5781, - "step": 66281 - }, - { - "epoch": 1.7, - "learning_rate": 8.346843422638174e-07, - "loss": 0.5386, - "step": 66282 - }, - { - "epoch": 1.7, - "learning_rate": 8.346570525990777e-07, - "loss": 0.6934, - "step": 66283 - }, - { - "epoch": 1.7, - "learning_rate": 8.34629763060934e-07, - "loss": 0.7178, - "step": 66284 - }, - { - "epoch": 1.7, - "learning_rate": 8.346024736494066e-07, - "loss": 0.6553, - "step": 66285 - }, - { - "epoch": 1.7, - "learning_rate": 8.345751843645164e-07, - "loss": 0.5767, - "step": 66286 - }, - { - "epoch": 1.7, - "learning_rate": 8.345478952062843e-07, - "loss": 0.7129, - "step": 66287 - }, - { - "epoch": 1.7, - "learning_rate": 8.345206061747312e-07, - "loss": 0.6299, - "step": 66288 - }, - { - "epoch": 1.7, - "learning_rate": 8.344933172698782e-07, - "loss": 0.6724, - "step": 66289 - }, - { - "epoch": 1.7, - "learning_rate": 8.344660284917458e-07, - "loss": 0.5493, - "step": 66290 - }, - { - "epoch": 1.7, - "learning_rate": 8.344387398403554e-07, - "loss": 0.79, - "step": 66291 - }, - { - "epoch": 1.7, - "learning_rate": 8.344114513157275e-07, - "loss": 0.6855, - "step": 66292 - }, - { - "epoch": 1.7, - "learning_rate": 8.343841629178834e-07, - "loss": 0.834, - "step": 66293 - }, - { - "epoch": 1.7, - "learning_rate": 8.343568746468433e-07, - "loss": 0.7441, - "step": 66294 - }, - { - "epoch": 1.7, - "learning_rate": 8.343295865026294e-07, - "loss": 0.7393, - "step": 66295 - }, - { - "epoch": 1.7, - "learning_rate": 8.34302298485261e-07, - "loss": 0.6689, - "step": 66296 - }, - { - "epoch": 1.7, - "learning_rate": 8.342750105947599e-07, - "loss": 0.6396, - "step": 66297 - }, - { - "epoch": 1.7, - "learning_rate": 8.342477228311465e-07, - "loss": 0.6846, - "step": 66298 - }, - { - "epoch": 1.7, - "learning_rate": 8.342204351944425e-07, - "loss": 0.7529, - "step": 66299 - }, - { - "epoch": 1.7, - "learning_rate": 8.341931476846678e-07, - "loss": 0.5918, - "step": 66300 - }, - { - "epoch": 1.7, - "learning_rate": 8.34165860301844e-07, - "loss": 0.6221, - "step": 66301 - }, - { - "epoch": 1.7, - "learning_rate": 8.341385730459917e-07, - "loss": 0.6562, - "step": 66302 - }, - { - "epoch": 1.7, - "learning_rate": 8.34111285917132e-07, - "loss": 0.4323, - "step": 66303 - }, - { - "epoch": 1.7, - "learning_rate": 8.340839989152854e-07, - "loss": 0.6274, - "step": 66304 - }, - { - "epoch": 1.7, - "learning_rate": 8.340567120404735e-07, - "loss": 0.6318, - "step": 66305 - }, - { - "epoch": 1.7, - "learning_rate": 8.340294252927167e-07, - "loss": 0.7021, - "step": 66306 - }, - { - "epoch": 1.7, - "learning_rate": 8.340021386720356e-07, - "loss": 0.6611, - "step": 66307 - }, - { - "epoch": 1.7, - "learning_rate": 8.339748521784517e-07, - "loss": 0.6562, - "step": 66308 - }, - { - "epoch": 1.7, - "learning_rate": 8.339475658119852e-07, - "loss": 0.5732, - "step": 66309 - }, - { - "epoch": 1.7, - "learning_rate": 8.339202795726579e-07, - "loss": 0.7158, - "step": 66310 - }, - { - "epoch": 1.7, - "learning_rate": 8.338929934604898e-07, - "loss": 0.6367, - "step": 66311 - }, - { - "epoch": 1.7, - "learning_rate": 8.338657074755026e-07, - "loss": 0.6416, - "step": 66312 - }, - { - "epoch": 1.7, - "learning_rate": 8.338384216177163e-07, - "loss": 0.7451, - "step": 66313 - }, - { - "epoch": 1.7, - "learning_rate": 8.338111358871527e-07, - "loss": 0.6152, - "step": 66314 - }, - { - "epoch": 1.7, - "learning_rate": 8.337838502838325e-07, - "loss": 0.5271, - "step": 66315 - }, - { - "epoch": 1.7, - "learning_rate": 8.33756564807776e-07, - "loss": 0.6099, - "step": 66316 - }, - { - "epoch": 1.7, - "learning_rate": 8.337292794590044e-07, - "loss": 0.6309, - "step": 66317 - }, - { - "epoch": 1.7, - "learning_rate": 8.337019942375387e-07, - "loss": 0.615, - "step": 66318 - }, - { - "epoch": 1.7, - "learning_rate": 8.336747091433996e-07, - "loss": 0.6055, - "step": 66319 - }, - { - "epoch": 1.7, - "learning_rate": 8.336474241766085e-07, - "loss": 0.7173, - "step": 66320 - }, - { - "epoch": 1.7, - "learning_rate": 8.336201393371855e-07, - "loss": 0.5469, - "step": 66321 - }, - { - "epoch": 1.7, - "learning_rate": 8.335928546251522e-07, - "loss": 0.5815, - "step": 66322 - }, - { - "epoch": 1.7, - "learning_rate": 8.335655700405289e-07, - "loss": 0.5942, - "step": 66323 - }, - { - "epoch": 1.7, - "learning_rate": 8.335382855833371e-07, - "loss": 0.4219, - "step": 66324 - }, - { - "epoch": 1.7, - "learning_rate": 8.335110012535976e-07, - "loss": 0.5732, - "step": 66325 - }, - { - "epoch": 1.7, - "learning_rate": 8.334837170513306e-07, - "loss": 0.5283, - "step": 66326 - }, - { - "epoch": 1.7, - "learning_rate": 8.334564329765577e-07, - "loss": 0.6157, - "step": 66327 - }, - { - "epoch": 1.7, - "learning_rate": 8.334291490292993e-07, - "loss": 0.6704, - "step": 66328 - }, - { - "epoch": 1.7, - "learning_rate": 8.334018652095767e-07, - "loss": 0.7344, - "step": 66329 - }, - { - "epoch": 1.7, - "learning_rate": 8.333745815174106e-07, - "loss": 0.6963, - "step": 66330 - }, - { - "epoch": 1.7, - "learning_rate": 8.33347297952822e-07, - "loss": 0.7842, - "step": 66331 - }, - { - "epoch": 1.7, - "learning_rate": 8.333200145158314e-07, - "loss": 0.6211, - "step": 66332 - }, - { - "epoch": 1.7, - "learning_rate": 8.332927312064604e-07, - "loss": 0.5425, - "step": 66333 - }, - { - "epoch": 1.7, - "learning_rate": 8.332654480247294e-07, - "loss": 0.582, - "step": 66334 - }, - { - "epoch": 1.7, - "learning_rate": 8.332381649706597e-07, - "loss": 0.6138, - "step": 66335 - }, - { - "epoch": 1.7, - "learning_rate": 8.332108820442713e-07, - "loss": 0.5532, - "step": 66336 - }, - { - "epoch": 1.7, - "learning_rate": 8.33183599245586e-07, - "loss": 0.6396, - "step": 66337 - }, - { - "epoch": 1.7, - "learning_rate": 8.33156316574624e-07, - "loss": 0.6182, - "step": 66338 - }, - { - "epoch": 1.7, - "learning_rate": 8.331290340314069e-07, - "loss": 0.6199, - "step": 66339 - }, - { - "epoch": 1.7, - "learning_rate": 8.331017516159549e-07, - "loss": 0.5896, - "step": 66340 - }, - { - "epoch": 1.7, - "learning_rate": 8.330744693282895e-07, - "loss": 0.7666, - "step": 66341 - }, - { - "epoch": 1.7, - "learning_rate": 8.33047187168431e-07, - "loss": 0.5298, - "step": 66342 - }, - { - "epoch": 1.7, - "learning_rate": 8.330199051364009e-07, - "loss": 0.6885, - "step": 66343 - }, - { - "epoch": 1.7, - "learning_rate": 8.329926232322195e-07, - "loss": 0.5991, - "step": 66344 - }, - { - "epoch": 1.7, - "learning_rate": 8.329653414559085e-07, - "loss": 0.6113, - "step": 66345 - }, - { - "epoch": 1.7, - "learning_rate": 8.329380598074878e-07, - "loss": 0.6963, - "step": 66346 - }, - { - "epoch": 1.7, - "learning_rate": 8.329107782869787e-07, - "loss": 0.6895, - "step": 66347 - }, - { - "epoch": 1.7, - "learning_rate": 8.328834968944024e-07, - "loss": 0.751, - "step": 66348 - }, - { - "epoch": 1.7, - "learning_rate": 8.328562156297793e-07, - "loss": 0.7109, - "step": 66349 - }, - { - "epoch": 1.7, - "learning_rate": 8.328289344931306e-07, - "loss": 0.6396, - "step": 66350 - }, - { - "epoch": 1.7, - "learning_rate": 8.328016534844773e-07, - "loss": 0.4336, - "step": 66351 - }, - { - "epoch": 1.7, - "learning_rate": 8.327743726038396e-07, - "loss": 0.5508, - "step": 66352 - }, - { - "epoch": 1.7, - "learning_rate": 8.327470918512393e-07, - "loss": 0.4797, - "step": 66353 - }, - { - "epoch": 1.7, - "learning_rate": 8.327198112266967e-07, - "loss": 0.6216, - "step": 66354 - }, - { - "epoch": 1.7, - "learning_rate": 8.32692530730233e-07, - "loss": 0.6318, - "step": 66355 - }, - { - "epoch": 1.7, - "learning_rate": 8.326652503618689e-07, - "loss": 0.9189, - "step": 66356 - }, - { - "epoch": 1.7, - "learning_rate": 8.326379701216251e-07, - "loss": 0.5366, - "step": 66357 - }, - { - "epoch": 1.7, - "learning_rate": 8.326106900095229e-07, - "loss": 0.7793, - "step": 66358 - }, - { - "epoch": 1.7, - "learning_rate": 8.325834100255829e-07, - "loss": 0.7358, - "step": 66359 - }, - { - "epoch": 1.7, - "learning_rate": 8.325561301698262e-07, - "loss": 0.5986, - "step": 66360 - }, - { - "epoch": 1.7, - "learning_rate": 8.325288504422733e-07, - "loss": 0.6514, - "step": 66361 - }, - { - "epoch": 1.7, - "learning_rate": 8.325015708429455e-07, - "loss": 0.8203, - "step": 66362 - }, - { - "epoch": 1.7, - "learning_rate": 8.324742913718637e-07, - "loss": 0.667, - "step": 66363 - }, - { - "epoch": 1.7, - "learning_rate": 8.324470120290485e-07, - "loss": 0.4736, - "step": 66364 - }, - { - "epoch": 1.7, - "learning_rate": 8.324197328145212e-07, - "loss": 0.387, - "step": 66365 - }, - { - "epoch": 1.7, - "learning_rate": 8.32392453728302e-07, - "loss": 0.7422, - "step": 66366 - }, - { - "epoch": 1.7, - "learning_rate": 8.323651747704124e-07, - "loss": 0.7949, - "step": 66367 - }, - { - "epoch": 1.7, - "learning_rate": 8.323378959408731e-07, - "loss": 0.6748, - "step": 66368 - }, - { - "epoch": 1.7, - "learning_rate": 8.323106172397047e-07, - "loss": 0.6816, - "step": 66369 - }, - { - "epoch": 1.7, - "learning_rate": 8.322833386669288e-07, - "loss": 0.6084, - "step": 66370 - }, - { - "epoch": 1.7, - "learning_rate": 8.322560602225653e-07, - "loss": 0.4545, - "step": 66371 - }, - { - "epoch": 1.7, - "learning_rate": 8.322287819066361e-07, - "loss": 0.7266, - "step": 66372 - }, - { - "epoch": 1.7, - "learning_rate": 8.322015037191613e-07, - "loss": 0.6416, - "step": 66373 - }, - { - "epoch": 1.7, - "learning_rate": 8.321742256601622e-07, - "loss": 0.6245, - "step": 66374 - }, - { - "epoch": 1.7, - "learning_rate": 8.321469477296599e-07, - "loss": 0.5356, - "step": 66375 - }, - { - "epoch": 1.7, - "learning_rate": 8.321196699276744e-07, - "loss": 0.6157, - "step": 66376 - }, - { - "epoch": 1.7, - "learning_rate": 8.320923922542275e-07, - "loss": 0.5261, - "step": 66377 - }, - { - "epoch": 1.7, - "learning_rate": 8.320651147093395e-07, - "loss": 0.6143, - "step": 66378 - }, - { - "epoch": 1.7, - "learning_rate": 8.320378372930317e-07, - "loss": 0.5, - "step": 66379 - }, - { - "epoch": 1.7, - "learning_rate": 8.320105600053246e-07, - "loss": 0.5952, - "step": 66380 - }, - { - "epoch": 1.7, - "learning_rate": 8.319832828462396e-07, - "loss": 0.5396, - "step": 66381 - }, - { - "epoch": 1.7, - "learning_rate": 8.319560058157968e-07, - "loss": 0.5544, - "step": 66382 - }, - { - "epoch": 1.7, - "learning_rate": 8.31928728914018e-07, - "loss": 0.6484, - "step": 66383 - }, - { - "epoch": 1.7, - "learning_rate": 8.319014521409233e-07, - "loss": 0.668, - "step": 66384 - }, - { - "epoch": 1.7, - "learning_rate": 8.318741754965347e-07, - "loss": 0.6416, - "step": 66385 - }, - { - "epoch": 1.7, - "learning_rate": 8.318468989808717e-07, - "loss": 0.5928, - "step": 66386 - }, - { - "epoch": 1.7, - "learning_rate": 8.318196225939559e-07, - "loss": 0.6772, - "step": 66387 - }, - { - "epoch": 1.7, - "learning_rate": 8.317923463358079e-07, - "loss": 0.6274, - "step": 66388 - }, - { - "epoch": 1.7, - "learning_rate": 8.317650702064489e-07, - "loss": 0.6953, - "step": 66389 - }, - { - "epoch": 1.7, - "learning_rate": 8.317377942058996e-07, - "loss": 0.7598, - "step": 66390 - }, - { - "epoch": 1.7, - "learning_rate": 8.31710518334181e-07, - "loss": 0.7148, - "step": 66391 - }, - { - "epoch": 1.7, - "learning_rate": 8.316832425913138e-07, - "loss": 0.4584, - "step": 66392 - }, - { - "epoch": 1.7, - "learning_rate": 8.316559669773192e-07, - "loss": 0.5938, - "step": 66393 - }, - { - "epoch": 1.7, - "learning_rate": 8.316286914922176e-07, - "loss": 0.6943, - "step": 66394 - }, - { - "epoch": 1.7, - "learning_rate": 8.316014161360307e-07, - "loss": 0.5215, - "step": 66395 - }, - { - "epoch": 1.7, - "learning_rate": 8.315741409087785e-07, - "loss": 0.7598, - "step": 66396 - }, - { - "epoch": 1.7, - "learning_rate": 8.315468658104822e-07, - "loss": 0.834, - "step": 66397 - }, - { - "epoch": 1.7, - "learning_rate": 8.315195908411628e-07, - "loss": 0.5508, - "step": 66398 - }, - { - "epoch": 1.7, - "learning_rate": 8.314923160008409e-07, - "loss": 0.5664, - "step": 66399 - }, - { - "epoch": 1.7, - "learning_rate": 8.314650412895379e-07, - "loss": 0.5879, - "step": 66400 - }, - { - "epoch": 1.7, - "learning_rate": 8.314377667072741e-07, - "loss": 0.6631, - "step": 66401 - }, - { - "epoch": 1.7, - "learning_rate": 8.314104922540708e-07, - "loss": 0.6462, - "step": 66402 - }, - { - "epoch": 1.7, - "learning_rate": 8.313832179299486e-07, - "loss": 0.6719, - "step": 66403 - }, - { - "epoch": 1.7, - "learning_rate": 8.313559437349287e-07, - "loss": 0.626, - "step": 66404 - }, - { - "epoch": 1.7, - "learning_rate": 8.313286696690321e-07, - "loss": 0.6172, - "step": 66405 - }, - { - "epoch": 1.7, - "learning_rate": 8.31301395732279e-07, - "loss": 0.6035, - "step": 66406 - }, - { - "epoch": 1.7, - "learning_rate": 8.312741219246904e-07, - "loss": 0.8047, - "step": 66407 - }, - { - "epoch": 1.7, - "learning_rate": 8.312468482462878e-07, - "loss": 0.6348, - "step": 66408 - }, - { - "epoch": 1.7, - "learning_rate": 8.312195746970915e-07, - "loss": 0.709, - "step": 66409 - }, - { - "epoch": 1.7, - "learning_rate": 8.311923012771229e-07, - "loss": 0.4673, - "step": 66410 - }, - { - "epoch": 1.7, - "learning_rate": 8.311650279864024e-07, - "loss": 0.6836, - "step": 66411 - }, - { - "epoch": 1.7, - "learning_rate": 8.311377548249511e-07, - "loss": 0.6592, - "step": 66412 - }, - { - "epoch": 1.7, - "learning_rate": 8.311104817927899e-07, - "loss": 0.7109, - "step": 66413 - }, - { - "epoch": 1.7, - "learning_rate": 8.310832088899396e-07, - "loss": 0.7207, - "step": 66414 - }, - { - "epoch": 1.7, - "learning_rate": 8.310559361164214e-07, - "loss": 0.5381, - "step": 66415 - }, - { - "epoch": 1.7, - "learning_rate": 8.310286634722556e-07, - "loss": 0.5063, - "step": 66416 - }, - { - "epoch": 1.7, - "learning_rate": 8.310013909574634e-07, - "loss": 0.6045, - "step": 66417 - }, - { - "epoch": 1.7, - "learning_rate": 8.309741185720656e-07, - "loss": 0.7134, - "step": 66418 - }, - { - "epoch": 1.7, - "learning_rate": 8.309468463160833e-07, - "loss": 0.7598, - "step": 66419 - }, - { - "epoch": 1.7, - "learning_rate": 8.30919574189537e-07, - "loss": 0.4785, - "step": 66420 - }, - { - "epoch": 1.7, - "learning_rate": 8.308923021924481e-07, - "loss": 0.448, - "step": 66421 - }, - { - "epoch": 1.7, - "learning_rate": 8.308650303248369e-07, - "loss": 0.519, - "step": 66422 - }, - { - "epoch": 1.7, - "learning_rate": 8.308377585867248e-07, - "loss": 0.7393, - "step": 66423 - }, - { - "epoch": 1.7, - "learning_rate": 8.308104869781324e-07, - "loss": 0.5415, - "step": 66424 - }, - { - "epoch": 1.7, - "learning_rate": 8.30783215499081e-07, - "loss": 0.5303, - "step": 66425 - }, - { - "epoch": 1.7, - "learning_rate": 8.307559441495905e-07, - "loss": 0.6846, - "step": 66426 - }, - { - "epoch": 1.7, - "learning_rate": 8.307286729296827e-07, - "loss": 0.4192, - "step": 66427 - }, - { - "epoch": 1.7, - "learning_rate": 8.307014018393778e-07, - "loss": 0.6143, - "step": 66428 - }, - { - "epoch": 1.7, - "learning_rate": 8.306741308786975e-07, - "loss": 0.5312, - "step": 66429 - }, - { - "epoch": 1.7, - "learning_rate": 8.306468600476619e-07, - "loss": 0.6826, - "step": 66430 - }, - { - "epoch": 1.7, - "learning_rate": 8.306195893462925e-07, - "loss": 0.6367, - "step": 66431 - }, - { - "epoch": 1.7, - "learning_rate": 8.305923187746096e-07, - "loss": 0.5889, - "step": 66432 - }, - { - "epoch": 1.7, - "learning_rate": 8.305650483326346e-07, - "loss": 0.689, - "step": 66433 - }, - { - "epoch": 1.7, - "learning_rate": 8.30537778020388e-07, - "loss": 0.7246, - "step": 66434 - }, - { - "epoch": 1.7, - "learning_rate": 8.305105078378913e-07, - "loss": 0.7607, - "step": 66435 - }, - { - "epoch": 1.7, - "learning_rate": 8.304832377851645e-07, - "loss": 0.7002, - "step": 66436 - }, - { - "epoch": 1.7, - "learning_rate": 8.304559678622288e-07, - "loss": 0.7349, - "step": 66437 - }, - { - "epoch": 1.7, - "learning_rate": 8.304286980691054e-07, - "loss": 0.5635, - "step": 66438 - }, - { - "epoch": 1.7, - "learning_rate": 8.304014284058148e-07, - "loss": 0.7656, - "step": 66439 - }, - { - "epoch": 1.7, - "learning_rate": 8.303741588723781e-07, - "loss": 0.7656, - "step": 66440 - }, - { - "epoch": 1.7, - "learning_rate": 8.303468894688162e-07, - "loss": 0.585, - "step": 66441 - }, - { - "epoch": 1.7, - "learning_rate": 8.303196201951495e-07, - "loss": 0.6655, - "step": 66442 - }, - { - "epoch": 1.7, - "learning_rate": 8.302923510513996e-07, - "loss": 0.5771, - "step": 66443 - }, - { - "epoch": 1.7, - "learning_rate": 8.30265082037587e-07, - "loss": 0.7119, - "step": 66444 - }, - { - "epoch": 1.7, - "learning_rate": 8.302378131537327e-07, - "loss": 0.6582, - "step": 66445 - }, - { - "epoch": 1.7, - "learning_rate": 8.302105443998575e-07, - "loss": 0.4797, - "step": 66446 - }, - { - "epoch": 1.7, - "learning_rate": 8.301832757759821e-07, - "loss": 0.5923, - "step": 66447 - }, - { - "epoch": 1.7, - "learning_rate": 8.301560072821276e-07, - "loss": 0.5674, - "step": 66448 - }, - { - "epoch": 1.7, - "learning_rate": 8.301287389183149e-07, - "loss": 0.6797, - "step": 66449 - }, - { - "epoch": 1.7, - "learning_rate": 8.301014706845649e-07, - "loss": 0.6182, - "step": 66450 - }, - { - "epoch": 1.7, - "learning_rate": 8.30074202580898e-07, - "loss": 0.4524, - "step": 66451 - }, - { - "epoch": 1.7, - "learning_rate": 8.300469346073357e-07, - "loss": 0.5962, - "step": 66452 - }, - { - "epoch": 1.7, - "learning_rate": 8.300196667638986e-07, - "loss": 0.665, - "step": 66453 - }, - { - "epoch": 1.7, - "learning_rate": 8.299923990506079e-07, - "loss": 0.7139, - "step": 66454 - }, - { - "epoch": 1.7, - "learning_rate": 8.299651314674843e-07, - "loss": 0.7793, - "step": 66455 - }, - { - "epoch": 1.7, - "learning_rate": 8.299378640145481e-07, - "loss": 0.6309, - "step": 66456 - }, - { - "epoch": 1.7, - "learning_rate": 8.299105966918209e-07, - "loss": 0.7725, - "step": 66457 - }, - { - "epoch": 1.7, - "learning_rate": 8.298833294993235e-07, - "loss": 0.8096, - "step": 66458 - }, - { - "epoch": 1.7, - "learning_rate": 8.298560624370762e-07, - "loss": 0.6924, - "step": 66459 - }, - { - "epoch": 1.7, - "learning_rate": 8.298287955051005e-07, - "loss": 0.5662, - "step": 66460 - }, - { - "epoch": 1.7, - "learning_rate": 8.29801528703417e-07, - "loss": 0.5518, - "step": 66461 - }, - { - "epoch": 1.7, - "learning_rate": 8.297742620320468e-07, - "loss": 0.5962, - "step": 66462 - }, - { - "epoch": 1.7, - "learning_rate": 8.297469954910104e-07, - "loss": 0.5391, - "step": 66463 - }, - { - "epoch": 1.7, - "learning_rate": 8.297197290803291e-07, - "loss": 0.6069, - "step": 66464 - }, - { - "epoch": 1.7, - "learning_rate": 8.296924628000237e-07, - "loss": 0.5216, - "step": 66465 - }, - { - "epoch": 1.7, - "learning_rate": 8.296651966501147e-07, - "loss": 0.729, - "step": 66466 - }, - { - "epoch": 1.7, - "learning_rate": 8.296379306306232e-07, - "loss": 0.4922, - "step": 66467 - }, - { - "epoch": 1.7, - "learning_rate": 8.296106647415701e-07, - "loss": 0.626, - "step": 66468 - }, - { - "epoch": 1.7, - "learning_rate": 8.295833989829764e-07, - "loss": 0.625, - "step": 66469 - }, - { - "epoch": 1.7, - "learning_rate": 8.295561333548627e-07, - "loss": 0.5503, - "step": 66470 - }, - { - "epoch": 1.7, - "learning_rate": 8.295288678572502e-07, - "loss": 0.7422, - "step": 66471 - }, - { - "epoch": 1.7, - "learning_rate": 8.295016024901595e-07, - "loss": 0.522, - "step": 66472 - }, - { - "epoch": 1.7, - "learning_rate": 8.294743372536118e-07, - "loss": 0.6387, - "step": 66473 - }, - { - "epoch": 1.7, - "learning_rate": 8.294470721476273e-07, - "loss": 0.4585, - "step": 66474 - }, - { - "epoch": 1.7, - "learning_rate": 8.294198071722282e-07, - "loss": 0.522, - "step": 66475 - }, - { - "epoch": 1.7, - "learning_rate": 8.293925423274337e-07, - "loss": 0.5989, - "step": 66476 - }, - { - "epoch": 1.7, - "learning_rate": 8.293652776132658e-07, - "loss": 0.7544, - "step": 66477 - }, - { - "epoch": 1.7, - "learning_rate": 8.293380130297449e-07, - "loss": 0.7021, - "step": 66478 - }, - { - "epoch": 1.7, - "learning_rate": 8.293107485768922e-07, - "loss": 0.488, - "step": 66479 - }, - { - "epoch": 1.7, - "learning_rate": 8.292834842547282e-07, - "loss": 0.7559, - "step": 66480 - }, - { - "epoch": 1.7, - "learning_rate": 8.292562200632742e-07, - "loss": 0.7275, - "step": 66481 - }, - { - "epoch": 1.7, - "learning_rate": 8.292289560025506e-07, - "loss": 0.6504, - "step": 66482 - }, - { - "epoch": 1.7, - "learning_rate": 8.292016920725788e-07, - "loss": 0.7041, - "step": 66483 - }, - { - "epoch": 1.7, - "learning_rate": 8.291744282733792e-07, - "loss": 0.5798, - "step": 66484 - }, - { - "epoch": 1.7, - "learning_rate": 8.291471646049733e-07, - "loss": 0.5444, - "step": 66485 - }, - { - "epoch": 1.7, - "learning_rate": 8.291199010673813e-07, - "loss": 0.6514, - "step": 66486 - }, - { - "epoch": 1.7, - "learning_rate": 8.290926376606242e-07, - "loss": 0.4392, - "step": 66487 - }, - { - "epoch": 1.7, - "learning_rate": 8.290653743847231e-07, - "loss": 0.5269, - "step": 66488 - }, - { - "epoch": 1.7, - "learning_rate": 8.290381112396987e-07, - "loss": 0.6562, - "step": 66489 - }, - { - "epoch": 1.7, - "learning_rate": 8.290108482255722e-07, - "loss": 0.6709, - "step": 66490 - }, - { - "epoch": 1.7, - "learning_rate": 8.289835853423639e-07, - "loss": 0.4834, - "step": 66491 - }, - { - "epoch": 1.7, - "learning_rate": 8.289563225900953e-07, - "loss": 0.667, - "step": 66492 - }, - { - "epoch": 1.7, - "learning_rate": 8.289290599687867e-07, - "loss": 0.7275, - "step": 66493 - }, - { - "epoch": 1.7, - "learning_rate": 8.289017974784599e-07, - "loss": 0.7402, - "step": 66494 - }, - { - "epoch": 1.7, - "learning_rate": 8.288745351191345e-07, - "loss": 0.5195, - "step": 66495 - }, - { - "epoch": 1.7, - "learning_rate": 8.288472728908322e-07, - "loss": 0.7114, - "step": 66496 - }, - { - "epoch": 1.7, - "learning_rate": 8.288200107935736e-07, - "loss": 0.5796, - "step": 66497 - }, - { - "epoch": 1.7, - "learning_rate": 8.287927488273797e-07, - "loss": 0.5781, - "step": 66498 - }, - { - "epoch": 1.7, - "learning_rate": 8.287654869922711e-07, - "loss": 0.6318, - "step": 66499 - }, - { - "epoch": 1.7, - "learning_rate": 8.287382252882692e-07, - "loss": 0.7935, - "step": 66500 - }, - { - "epoch": 1.7, - "learning_rate": 8.287109637153942e-07, - "loss": 0.3816, - "step": 66501 - }, - { - "epoch": 1.7, - "learning_rate": 8.286837022736678e-07, - "loss": 0.6562, - "step": 66502 - }, - { - "epoch": 1.7, - "learning_rate": 8.286564409631101e-07, - "loss": 0.5605, - "step": 66503 - }, - { - "epoch": 1.7, - "learning_rate": 8.286291797837426e-07, - "loss": 0.5269, - "step": 66504 - }, - { - "epoch": 1.7, - "learning_rate": 8.286019187355857e-07, - "loss": 0.6279, - "step": 66505 - }, - { - "epoch": 1.7, - "learning_rate": 8.285746578186602e-07, - "loss": 0.6162, - "step": 66506 - }, - { - "epoch": 1.7, - "learning_rate": 8.285473970329875e-07, - "loss": 0.603, - "step": 66507 - }, - { - "epoch": 1.7, - "learning_rate": 8.285201363785879e-07, - "loss": 0.7646, - "step": 66508 - }, - { - "epoch": 1.7, - "learning_rate": 8.284928758554828e-07, - "loss": 0.563, - "step": 66509 - }, - { - "epoch": 1.7, - "learning_rate": 8.284656154636925e-07, - "loss": 0.6841, - "step": 66510 - }, - { - "epoch": 1.7, - "learning_rate": 8.284383552032386e-07, - "loss": 0.7178, - "step": 66511 - }, - { - "epoch": 1.7, - "learning_rate": 8.284110950741411e-07, - "loss": 0.4133, - "step": 66512 - }, - { - "epoch": 1.7, - "learning_rate": 8.283838350764217e-07, - "loss": 0.7461, - "step": 66513 - }, - { - "epoch": 1.7, - "learning_rate": 8.283565752101011e-07, - "loss": 0.8242, - "step": 66514 - }, - { - "epoch": 1.7, - "learning_rate": 8.283293154751998e-07, - "loss": 0.6777, - "step": 66515 - }, - { - "epoch": 1.7, - "learning_rate": 8.283020558717386e-07, - "loss": 0.6211, - "step": 66516 - }, - { - "epoch": 1.7, - "learning_rate": 8.282747963997387e-07, - "loss": 0.6533, - "step": 66517 - }, - { - "epoch": 1.7, - "learning_rate": 8.282475370592209e-07, - "loss": 0.479, - "step": 66518 - }, - { - "epoch": 1.7, - "learning_rate": 8.282202778502062e-07, - "loss": 0.5439, - "step": 66519 - }, - { - "epoch": 1.7, - "learning_rate": 8.281930187727151e-07, - "loss": 0.5776, - "step": 66520 - }, - { - "epoch": 1.7, - "learning_rate": 8.281657598267689e-07, - "loss": 0.5366, - "step": 66521 - }, - { - "epoch": 1.7, - "learning_rate": 8.281385010123881e-07, - "loss": 0.6738, - "step": 66522 - }, - { - "epoch": 1.71, - "learning_rate": 8.281112423295939e-07, - "loss": 0.541, - "step": 66523 - }, - { - "epoch": 1.71, - "learning_rate": 8.280839837784074e-07, - "loss": 0.6006, - "step": 66524 - }, - { - "epoch": 1.71, - "learning_rate": 8.280567253588485e-07, - "loss": 0.6113, - "step": 66525 - }, - { - "epoch": 1.71, - "learning_rate": 8.280294670709389e-07, - "loss": 0.583, - "step": 66526 - }, - { - "epoch": 1.71, - "learning_rate": 8.280022089146989e-07, - "loss": 0.5581, - "step": 66527 - }, - { - "epoch": 1.71, - "learning_rate": 8.279749508901501e-07, - "loss": 0.582, - "step": 66528 - }, - { - "epoch": 1.71, - "learning_rate": 8.279476929973128e-07, - "loss": 0.6934, - "step": 66529 - }, - { - "epoch": 1.71, - "learning_rate": 8.279204352362081e-07, - "loss": 0.4775, - "step": 66530 - }, - { - "epoch": 1.71, - "learning_rate": 8.278931776068569e-07, - "loss": 0.6709, - "step": 66531 - }, - { - "epoch": 1.71, - "learning_rate": 8.278659201092797e-07, - "loss": 0.5078, - "step": 66532 - }, - { - "epoch": 1.71, - "learning_rate": 8.278386627434979e-07, - "loss": 0.6162, - "step": 66533 - }, - { - "epoch": 1.71, - "learning_rate": 8.278114055095324e-07, - "loss": 0.7607, - "step": 66534 - }, - { - "epoch": 1.71, - "learning_rate": 8.277841484074033e-07, - "loss": 0.5205, - "step": 66535 - }, - { - "epoch": 1.71, - "learning_rate": 8.277568914371322e-07, - "loss": 0.666, - "step": 66536 - }, - { - "epoch": 1.71, - "learning_rate": 8.277296345987395e-07, - "loss": 0.8135, - "step": 66537 - }, - { - "epoch": 1.71, - "learning_rate": 8.277023778922464e-07, - "loss": 0.6646, - "step": 66538 - }, - { - "epoch": 1.71, - "learning_rate": 8.276751213176736e-07, - "loss": 0.4399, - "step": 66539 - }, - { - "epoch": 1.71, - "learning_rate": 8.276478648750421e-07, - "loss": 0.4668, - "step": 66540 - }, - { - "epoch": 1.71, - "learning_rate": 8.276206085643727e-07, - "loss": 0.7637, - "step": 66541 - }, - { - "epoch": 1.71, - "learning_rate": 8.275933523856862e-07, - "loss": 0.7617, - "step": 66542 - }, - { - "epoch": 1.71, - "learning_rate": 8.275660963390035e-07, - "loss": 0.6863, - "step": 66543 - }, - { - "epoch": 1.71, - "learning_rate": 8.275388404243459e-07, - "loss": 0.7061, - "step": 66544 - }, - { - "epoch": 1.71, - "learning_rate": 8.275115846417338e-07, - "loss": 0.7988, - "step": 66545 - }, - { - "epoch": 1.71, - "learning_rate": 8.274843289911879e-07, - "loss": 0.6421, - "step": 66546 - }, - { - "epoch": 1.71, - "learning_rate": 8.274570734727295e-07, - "loss": 0.7441, - "step": 66547 - }, - { - "epoch": 1.71, - "learning_rate": 8.274298180863792e-07, - "loss": 0.6084, - "step": 66548 - }, - { - "epoch": 1.71, - "learning_rate": 8.274025628321578e-07, - "loss": 0.6113, - "step": 66549 - }, - { - "epoch": 1.71, - "learning_rate": 8.273753077100865e-07, - "loss": 0.5215, - "step": 66550 - }, - { - "epoch": 1.71, - "learning_rate": 8.273480527201858e-07, - "loss": 0.709, - "step": 66551 - }, - { - "epoch": 1.71, - "learning_rate": 8.27320797862477e-07, - "loss": 0.7383, - "step": 66552 - }, - { - "epoch": 1.71, - "learning_rate": 8.272935431369806e-07, - "loss": 0.7168, - "step": 66553 - }, - { - "epoch": 1.71, - "learning_rate": 8.272662885437179e-07, - "loss": 0.7568, - "step": 66554 - }, - { - "epoch": 1.71, - "learning_rate": 8.272390340827091e-07, - "loss": 0.7119, - "step": 66555 - }, - { - "epoch": 1.71, - "learning_rate": 8.272117797539755e-07, - "loss": 0.7026, - "step": 66556 - }, - { - "epoch": 1.71, - "learning_rate": 8.271845255575379e-07, - "loss": 0.6758, - "step": 66557 - }, - { - "epoch": 1.71, - "learning_rate": 8.27157271493417e-07, - "loss": 0.6641, - "step": 66558 - }, - { - "epoch": 1.71, - "learning_rate": 8.271300175616341e-07, - "loss": 0.4893, - "step": 66559 - }, - { - "epoch": 1.71, - "learning_rate": 8.271027637622095e-07, - "loss": 0.7344, - "step": 66560 - }, - { - "epoch": 1.71, - "learning_rate": 8.270755100951648e-07, - "loss": 0.5344, - "step": 66561 - }, - { - "epoch": 1.71, - "learning_rate": 8.270482565605199e-07, - "loss": 0.6572, - "step": 66562 - }, - { - "epoch": 1.71, - "learning_rate": 8.270210031582966e-07, - "loss": 0.624, - "step": 66563 - }, - { - "epoch": 1.71, - "learning_rate": 8.269937498885156e-07, - "loss": 0.6357, - "step": 66564 - }, - { - "epoch": 1.71, - "learning_rate": 8.269664967511972e-07, - "loss": 0.75, - "step": 66565 - }, - { - "epoch": 1.71, - "learning_rate": 8.269392437463625e-07, - "loss": 0.5015, - "step": 66566 - }, - { - "epoch": 1.71, - "learning_rate": 8.269119908740325e-07, - "loss": 0.5134, - "step": 66567 - }, - { - "epoch": 1.71, - "learning_rate": 8.26884738134228e-07, - "loss": 0.5486, - "step": 66568 - }, - { - "epoch": 1.71, - "learning_rate": 8.2685748552697e-07, - "loss": 0.7236, - "step": 66569 - }, - { - "epoch": 1.71, - "learning_rate": 8.268302330522791e-07, - "loss": 0.6216, - "step": 66570 - }, - { - "epoch": 1.71, - "learning_rate": 8.268029807101765e-07, - "loss": 0.5798, - "step": 66571 - }, - { - "epoch": 1.71, - "learning_rate": 8.267757285006828e-07, - "loss": 0.7036, - "step": 66572 - }, - { - "epoch": 1.71, - "learning_rate": 8.26748476423819e-07, - "loss": 0.5229, - "step": 66573 - }, - { - "epoch": 1.71, - "learning_rate": 8.267212244796062e-07, - "loss": 0.7134, - "step": 66574 - }, - { - "epoch": 1.71, - "learning_rate": 8.266939726680646e-07, - "loss": 0.5781, - "step": 66575 - }, - { - "epoch": 1.71, - "learning_rate": 8.266667209892157e-07, - "loss": 0.6748, - "step": 66576 - }, - { - "epoch": 1.71, - "learning_rate": 8.266394694430798e-07, - "loss": 0.6724, - "step": 66577 - }, - { - "epoch": 1.71, - "learning_rate": 8.266122180296784e-07, - "loss": 0.7158, - "step": 66578 - }, - { - "epoch": 1.71, - "learning_rate": 8.265849667490319e-07, - "loss": 0.6975, - "step": 66579 - }, - { - "epoch": 1.71, - "learning_rate": 8.265577156011614e-07, - "loss": 0.6836, - "step": 66580 - }, - { - "epoch": 1.71, - "learning_rate": 8.265304645860874e-07, - "loss": 0.6187, - "step": 66581 - }, - { - "epoch": 1.71, - "learning_rate": 8.265032137038315e-07, - "loss": 0.584, - "step": 66582 - }, - { - "epoch": 1.71, - "learning_rate": 8.264759629544136e-07, - "loss": 0.5518, - "step": 66583 - }, - { - "epoch": 1.71, - "learning_rate": 8.26448712337856e-07, - "loss": 0.4969, - "step": 66584 - }, - { - "epoch": 1.71, - "learning_rate": 8.264214618541778e-07, - "loss": 0.6348, - "step": 66585 - }, - { - "epoch": 1.71, - "learning_rate": 8.26394211503401e-07, - "loss": 0.7974, - "step": 66586 - }, - { - "epoch": 1.71, - "learning_rate": 8.26366961285546e-07, - "loss": 0.5469, - "step": 66587 - }, - { - "epoch": 1.71, - "learning_rate": 8.26339711200634e-07, - "loss": 0.7725, - "step": 66588 - }, - { - "epoch": 1.71, - "learning_rate": 8.263124612486855e-07, - "loss": 0.6924, - "step": 66589 - }, - { - "epoch": 1.71, - "learning_rate": 8.262852114297217e-07, - "loss": 0.7285, - "step": 66590 - }, - { - "epoch": 1.71, - "learning_rate": 8.262579617437633e-07, - "loss": 0.6294, - "step": 66591 - }, - { - "epoch": 1.71, - "learning_rate": 8.262307121908312e-07, - "loss": 0.6104, - "step": 66592 - }, - { - "epoch": 1.71, - "learning_rate": 8.262034627709461e-07, - "loss": 0.5181, - "step": 66593 - }, - { - "epoch": 1.71, - "learning_rate": 8.261762134841294e-07, - "loss": 0.4778, - "step": 66594 - }, - { - "epoch": 1.71, - "learning_rate": 8.261489643304015e-07, - "loss": 0.5908, - "step": 66595 - }, - { - "epoch": 1.71, - "learning_rate": 8.26121715309783e-07, - "loss": 0.646, - "step": 66596 - }, - { - "epoch": 1.71, - "learning_rate": 8.260944664222955e-07, - "loss": 0.7471, - "step": 66597 - }, - { - "epoch": 1.71, - "learning_rate": 8.260672176679591e-07, - "loss": 0.6362, - "step": 66598 - }, - { - "epoch": 1.71, - "learning_rate": 8.260399690467953e-07, - "loss": 0.6685, - "step": 66599 - }, - { - "epoch": 1.71, - "learning_rate": 8.260127205588245e-07, - "loss": 0.7036, - "step": 66600 - }, - { - "epoch": 1.71, - "learning_rate": 8.259854722040679e-07, - "loss": 0.4072, - "step": 66601 - }, - { - "epoch": 1.71, - "learning_rate": 8.25958223982546e-07, - "loss": 0.5415, - "step": 66602 - }, - { - "epoch": 1.71, - "learning_rate": 8.259309758942802e-07, - "loss": 0.3787, - "step": 66603 - }, - { - "epoch": 1.71, - "learning_rate": 8.259037279392912e-07, - "loss": 0.5298, - "step": 66604 - }, - { - "epoch": 1.71, - "learning_rate": 8.258764801175994e-07, - "loss": 0.7158, - "step": 66605 - }, - { - "epoch": 1.71, - "learning_rate": 8.25849232429226e-07, - "loss": 0.7261, - "step": 66606 - }, - { - "epoch": 1.71, - "learning_rate": 8.258219848741918e-07, - "loss": 0.5869, - "step": 66607 - }, - { - "epoch": 1.71, - "learning_rate": 8.257947374525177e-07, - "loss": 0.6973, - "step": 66608 - }, - { - "epoch": 1.71, - "learning_rate": 8.257674901642247e-07, - "loss": 0.7041, - "step": 66609 - }, - { - "epoch": 1.71, - "learning_rate": 8.257402430093332e-07, - "loss": 0.6133, - "step": 66610 - }, - { - "epoch": 1.71, - "learning_rate": 8.257129959878647e-07, - "loss": 0.6406, - "step": 66611 - }, - { - "epoch": 1.71, - "learning_rate": 8.256857490998394e-07, - "loss": 0.366, - "step": 66612 - }, - { - "epoch": 1.71, - "learning_rate": 8.256585023452789e-07, - "loss": 0.6006, - "step": 66613 - }, - { - "epoch": 1.71, - "learning_rate": 8.256312557242039e-07, - "loss": 0.4707, - "step": 66614 - }, - { - "epoch": 1.71, - "learning_rate": 8.256040092366344e-07, - "loss": 0.4553, - "step": 66615 - }, - { - "epoch": 1.71, - "learning_rate": 8.255767628825923e-07, - "loss": 0.5859, - "step": 66616 - }, - { - "epoch": 1.71, - "learning_rate": 8.255495166620977e-07, - "loss": 0.8188, - "step": 66617 - }, - { - "epoch": 1.71, - "learning_rate": 8.255222705751721e-07, - "loss": 0.5381, - "step": 66618 - }, - { - "epoch": 1.71, - "learning_rate": 8.254950246218358e-07, - "loss": 0.4536, - "step": 66619 - }, - { - "epoch": 1.71, - "learning_rate": 8.254677788021103e-07, - "loss": 0.5439, - "step": 66620 - }, - { - "epoch": 1.71, - "learning_rate": 8.254405331160159e-07, - "loss": 0.5396, - "step": 66621 - }, - { - "epoch": 1.71, - "learning_rate": 8.254132875635736e-07, - "loss": 0.6279, - "step": 66622 - }, - { - "epoch": 1.71, - "learning_rate": 8.253860421448045e-07, - "loss": 0.6914, - "step": 66623 - }, - { - "epoch": 1.71, - "learning_rate": 8.253587968597294e-07, - "loss": 0.7085, - "step": 66624 - }, - { - "epoch": 1.71, - "learning_rate": 8.253315517083686e-07, - "loss": 0.8008, - "step": 66625 - }, - { - "epoch": 1.71, - "learning_rate": 8.253043066907438e-07, - "loss": 0.7219, - "step": 66626 - }, - { - "epoch": 1.71, - "learning_rate": 8.252770618068751e-07, - "loss": 0.6328, - "step": 66627 - }, - { - "epoch": 1.71, - "learning_rate": 8.25249817056784e-07, - "loss": 0.6553, - "step": 66628 - }, - { - "epoch": 1.71, - "learning_rate": 8.252225724404908e-07, - "loss": 0.6802, - "step": 66629 - }, - { - "epoch": 1.71, - "learning_rate": 8.251953279580169e-07, - "loss": 0.5757, - "step": 66630 - }, - { - "epoch": 1.71, - "learning_rate": 8.251680836093826e-07, - "loss": 0.5845, - "step": 66631 - }, - { - "epoch": 1.71, - "learning_rate": 8.251408393946093e-07, - "loss": 0.6719, - "step": 66632 - }, - { - "epoch": 1.71, - "learning_rate": 8.251135953137175e-07, - "loss": 0.5365, - "step": 66633 - }, - { - "epoch": 1.71, - "learning_rate": 8.250863513667285e-07, - "loss": 0.6514, - "step": 66634 - }, - { - "epoch": 1.71, - "learning_rate": 8.250591075536628e-07, - "loss": 0.6523, - "step": 66635 - }, - { - "epoch": 1.71, - "learning_rate": 8.25031863874541e-07, - "loss": 0.7061, - "step": 66636 - }, - { - "epoch": 1.71, - "learning_rate": 8.250046203293843e-07, - "loss": 0.4697, - "step": 66637 - }, - { - "epoch": 1.71, - "learning_rate": 8.249773769182137e-07, - "loss": 0.6494, - "step": 66638 - }, - { - "epoch": 1.71, - "learning_rate": 8.249501336410496e-07, - "loss": 0.7119, - "step": 66639 - }, - { - "epoch": 1.71, - "learning_rate": 8.249228904979133e-07, - "loss": 0.5352, - "step": 66640 - }, - { - "epoch": 1.71, - "learning_rate": 8.248956474888254e-07, - "loss": 0.7998, - "step": 66641 - }, - { - "epoch": 1.71, - "learning_rate": 8.248684046138071e-07, - "loss": 0.3916, - "step": 66642 - }, - { - "epoch": 1.71, - "learning_rate": 8.248411618728785e-07, - "loss": 0.6357, - "step": 66643 - }, - { - "epoch": 1.71, - "learning_rate": 8.248139192660617e-07, - "loss": 0.71, - "step": 66644 - }, - { - "epoch": 1.71, - "learning_rate": 8.247866767933765e-07, - "loss": 0.5171, - "step": 66645 - }, - { - "epoch": 1.71, - "learning_rate": 8.247594344548438e-07, - "loss": 0.7236, - "step": 66646 - }, - { - "epoch": 1.71, - "learning_rate": 8.24732192250485e-07, - "loss": 0.627, - "step": 66647 - }, - { - "epoch": 1.71, - "learning_rate": 8.247049501803206e-07, - "loss": 0.6299, - "step": 66648 - }, - { - "epoch": 1.71, - "learning_rate": 8.246777082443717e-07, - "loss": 0.6289, - "step": 66649 - }, - { - "epoch": 1.71, - "learning_rate": 8.246504664426588e-07, - "loss": 0.5405, - "step": 66650 - }, - { - "epoch": 1.71, - "learning_rate": 8.246232247752032e-07, - "loss": 0.7432, - "step": 66651 - }, - { - "epoch": 1.71, - "learning_rate": 8.245959832420253e-07, - "loss": 0.7686, - "step": 66652 - }, - { - "epoch": 1.71, - "learning_rate": 8.245687418431464e-07, - "loss": 0.7275, - "step": 66653 - }, - { - "epoch": 1.71, - "learning_rate": 8.245415005785874e-07, - "loss": 0.8096, - "step": 66654 - }, - { - "epoch": 1.71, - "learning_rate": 8.245142594483686e-07, - "loss": 0.6074, - "step": 66655 - }, - { - "epoch": 1.71, - "learning_rate": 8.24487018452511e-07, - "loss": 0.6777, - "step": 66656 - }, - { - "epoch": 1.71, - "learning_rate": 8.244597775910358e-07, - "loss": 0.5847, - "step": 66657 - }, - { - "epoch": 1.71, - "learning_rate": 8.244325368639635e-07, - "loss": 0.71, - "step": 66658 - }, - { - "epoch": 1.71, - "learning_rate": 8.244052962713154e-07, - "loss": 0.7314, - "step": 66659 - }, - { - "epoch": 1.71, - "learning_rate": 8.243780558131118e-07, - "loss": 0.7354, - "step": 66660 - }, - { - "epoch": 1.71, - "learning_rate": 8.243508154893741e-07, - "loss": 0.6992, - "step": 66661 - }, - { - "epoch": 1.71, - "learning_rate": 8.243235753001228e-07, - "loss": 0.7275, - "step": 66662 - }, - { - "epoch": 1.71, - "learning_rate": 8.242963352453789e-07, - "loss": 0.4755, - "step": 66663 - }, - { - "epoch": 1.71, - "learning_rate": 8.242690953251635e-07, - "loss": 0.7808, - "step": 66664 - }, - { - "epoch": 1.71, - "learning_rate": 8.242418555394967e-07, - "loss": 0.7324, - "step": 66665 - }, - { - "epoch": 1.71, - "learning_rate": 8.242146158884e-07, - "loss": 0.6245, - "step": 66666 - }, - { - "epoch": 1.71, - "learning_rate": 8.241873763718941e-07, - "loss": 0.5977, - "step": 66667 - }, - { - "epoch": 1.71, - "learning_rate": 8.241601369899997e-07, - "loss": 0.5747, - "step": 66668 - }, - { - "epoch": 1.71, - "learning_rate": 8.24132897742738e-07, - "loss": 0.5684, - "step": 66669 - }, - { - "epoch": 1.71, - "learning_rate": 8.241056586301296e-07, - "loss": 0.5166, - "step": 66670 - }, - { - "epoch": 1.71, - "learning_rate": 8.240784196521953e-07, - "loss": 0.5947, - "step": 66671 - }, - { - "epoch": 1.71, - "learning_rate": 8.240511808089561e-07, - "loss": 0.5654, - "step": 66672 - }, - { - "epoch": 1.71, - "learning_rate": 8.240239421004328e-07, - "loss": 0.668, - "step": 66673 - }, - { - "epoch": 1.71, - "learning_rate": 8.239967035266468e-07, - "loss": 0.7041, - "step": 66674 - }, - { - "epoch": 1.71, - "learning_rate": 8.239694650876179e-07, - "loss": 0.6797, - "step": 66675 - }, - { - "epoch": 1.71, - "learning_rate": 8.239422267833677e-07, - "loss": 0.6836, - "step": 66676 - }, - { - "epoch": 1.71, - "learning_rate": 8.239149886139165e-07, - "loss": 0.6313, - "step": 66677 - }, - { - "epoch": 1.71, - "learning_rate": 8.238877505792858e-07, - "loss": 0.5322, - "step": 66678 - }, - { - "epoch": 1.71, - "learning_rate": 8.238605126794958e-07, - "loss": 0.6426, - "step": 66679 - }, - { - "epoch": 1.71, - "learning_rate": 8.238332749145681e-07, - "loss": 0.6582, - "step": 66680 - }, - { - "epoch": 1.71, - "learning_rate": 8.23806037284523e-07, - "loss": 0.5493, - "step": 66681 - }, - { - "epoch": 1.71, - "learning_rate": 8.237787997893815e-07, - "loss": 0.5679, - "step": 66682 - }, - { - "epoch": 1.71, - "learning_rate": 8.237515624291644e-07, - "loss": 0.5725, - "step": 66683 - }, - { - "epoch": 1.71, - "learning_rate": 8.23724325203893e-07, - "loss": 0.7227, - "step": 66684 - }, - { - "epoch": 1.71, - "learning_rate": 8.236970881135876e-07, - "loss": 0.7852, - "step": 66685 - }, - { - "epoch": 1.71, - "learning_rate": 8.23669851158269e-07, - "loss": 0.5476, - "step": 66686 - }, - { - "epoch": 1.71, - "learning_rate": 8.236426143379586e-07, - "loss": 0.5879, - "step": 66687 - }, - { - "epoch": 1.71, - "learning_rate": 8.236153776526766e-07, - "loss": 0.5928, - "step": 66688 - }, - { - "epoch": 1.71, - "learning_rate": 8.235881411024444e-07, - "loss": 0.4468, - "step": 66689 - }, - { - "epoch": 1.71, - "learning_rate": 8.235609046872824e-07, - "loss": 0.6772, - "step": 66690 - }, - { - "epoch": 1.71, - "learning_rate": 8.23533668407212e-07, - "loss": 0.603, - "step": 66691 - }, - { - "epoch": 1.71, - "learning_rate": 8.235064322622535e-07, - "loss": 0.6982, - "step": 66692 - }, - { - "epoch": 1.71, - "learning_rate": 8.234791962524284e-07, - "loss": 0.583, - "step": 66693 - }, - { - "epoch": 1.71, - "learning_rate": 8.234519603777573e-07, - "loss": 0.6577, - "step": 66694 - }, - { - "epoch": 1.71, - "learning_rate": 8.234247246382606e-07, - "loss": 0.6323, - "step": 66695 - }, - { - "epoch": 1.71, - "learning_rate": 8.233974890339593e-07, - "loss": 0.6304, - "step": 66696 - }, - { - "epoch": 1.71, - "learning_rate": 8.233702535648745e-07, - "loss": 0.5853, - "step": 66697 - }, - { - "epoch": 1.71, - "learning_rate": 8.233430182310271e-07, - "loss": 0.6348, - "step": 66698 - }, - { - "epoch": 1.71, - "learning_rate": 8.233157830324378e-07, - "loss": 0.6631, - "step": 66699 - }, - { - "epoch": 1.71, - "learning_rate": 8.232885479691273e-07, - "loss": 0.5715, - "step": 66700 - }, - { - "epoch": 1.71, - "learning_rate": 8.232613130411168e-07, - "loss": 0.532, - "step": 66701 - }, - { - "epoch": 1.71, - "learning_rate": 8.232340782484268e-07, - "loss": 0.7266, - "step": 66702 - }, - { - "epoch": 1.71, - "learning_rate": 8.232068435910786e-07, - "loss": 0.71, - "step": 66703 - }, - { - "epoch": 1.71, - "learning_rate": 8.23179609069093e-07, - "loss": 0.707, - "step": 66704 - }, - { - "epoch": 1.71, - "learning_rate": 8.231523746824902e-07, - "loss": 0.6699, - "step": 66705 - }, - { - "epoch": 1.71, - "learning_rate": 8.231251404312916e-07, - "loss": 0.7466, - "step": 66706 - }, - { - "epoch": 1.71, - "learning_rate": 8.230979063155179e-07, - "loss": 0.4719, - "step": 66707 - }, - { - "epoch": 1.71, - "learning_rate": 8.230706723351901e-07, - "loss": 0.5874, - "step": 66708 - }, - { - "epoch": 1.71, - "learning_rate": 8.230434384903289e-07, - "loss": 0.5615, - "step": 66709 - }, - { - "epoch": 1.71, - "learning_rate": 8.230162047809553e-07, - "loss": 0.5078, - "step": 66710 - }, - { - "epoch": 1.71, - "learning_rate": 8.2298897120709e-07, - "loss": 0.666, - "step": 66711 - }, - { - "epoch": 1.71, - "learning_rate": 8.229617377687538e-07, - "loss": 0.4598, - "step": 66712 - }, - { - "epoch": 1.71, - "learning_rate": 8.229345044659678e-07, - "loss": 0.5581, - "step": 66713 - }, - { - "epoch": 1.71, - "learning_rate": 8.22907271298753e-07, - "loss": 0.3634, - "step": 66714 - }, - { - "epoch": 1.71, - "learning_rate": 8.228800382671294e-07, - "loss": 0.707, - "step": 66715 - }, - { - "epoch": 1.71, - "learning_rate": 8.228528053711187e-07, - "loss": 0.71, - "step": 66716 - }, - { - "epoch": 1.71, - "learning_rate": 8.228255726107412e-07, - "loss": 0.6416, - "step": 66717 - }, - { - "epoch": 1.71, - "learning_rate": 8.227983399860183e-07, - "loss": 0.7188, - "step": 66718 - }, - { - "epoch": 1.71, - "learning_rate": 8.227711074969703e-07, - "loss": 0.6123, - "step": 66719 - }, - { - "epoch": 1.71, - "learning_rate": 8.227438751436186e-07, - "loss": 0.5505, - "step": 66720 - }, - { - "epoch": 1.71, - "learning_rate": 8.227166429259835e-07, - "loss": 0.5903, - "step": 66721 - }, - { - "epoch": 1.71, - "learning_rate": 8.226894108440863e-07, - "loss": 0.6113, - "step": 66722 - }, - { - "epoch": 1.71, - "learning_rate": 8.226621788979476e-07, - "loss": 0.4746, - "step": 66723 - }, - { - "epoch": 1.71, - "learning_rate": 8.226349470875885e-07, - "loss": 0.8701, - "step": 66724 - }, - { - "epoch": 1.71, - "learning_rate": 8.226077154130296e-07, - "loss": 0.6455, - "step": 66725 - }, - { - "epoch": 1.71, - "learning_rate": 8.225804838742915e-07, - "loss": 0.7197, - "step": 66726 - }, - { - "epoch": 1.71, - "learning_rate": 8.225532524713958e-07, - "loss": 0.6006, - "step": 66727 - }, - { - "epoch": 1.71, - "learning_rate": 8.225260212043627e-07, - "loss": 0.7148, - "step": 66728 - }, - { - "epoch": 1.71, - "learning_rate": 8.224987900732131e-07, - "loss": 0.5728, - "step": 66729 - }, - { - "epoch": 1.71, - "learning_rate": 8.224715590779682e-07, - "loss": 0.6924, - "step": 66730 - }, - { - "epoch": 1.71, - "learning_rate": 8.224443282186486e-07, - "loss": 0.5381, - "step": 66731 - }, - { - "epoch": 1.71, - "learning_rate": 8.224170974952753e-07, - "loss": 0.6729, - "step": 66732 - }, - { - "epoch": 1.71, - "learning_rate": 8.223898669078688e-07, - "loss": 0.7998, - "step": 66733 - }, - { - "epoch": 1.71, - "learning_rate": 8.223626364564507e-07, - "loss": 0.5562, - "step": 66734 - }, - { - "epoch": 1.71, - "learning_rate": 8.223354061410412e-07, - "loss": 0.499, - "step": 66735 - }, - { - "epoch": 1.71, - "learning_rate": 8.22308175961661e-07, - "loss": 0.7344, - "step": 66736 - }, - { - "epoch": 1.71, - "learning_rate": 8.222809459183316e-07, - "loss": 0.6338, - "step": 66737 - }, - { - "epoch": 1.71, - "learning_rate": 8.222537160110732e-07, - "loss": 0.7178, - "step": 66738 - }, - { - "epoch": 1.71, - "learning_rate": 8.222264862399072e-07, - "loss": 0.6689, - "step": 66739 - }, - { - "epoch": 1.71, - "learning_rate": 8.22199256604854e-07, - "loss": 0.7822, - "step": 66740 - }, - { - "epoch": 1.71, - "learning_rate": 8.221720271059349e-07, - "loss": 0.4966, - "step": 66741 - }, - { - "epoch": 1.71, - "learning_rate": 8.221447977431702e-07, - "loss": 0.4877, - "step": 66742 - }, - { - "epoch": 1.71, - "learning_rate": 8.221175685165813e-07, - "loss": 0.469, - "step": 66743 - }, - { - "epoch": 1.71, - "learning_rate": 8.220903394261891e-07, - "loss": 0.8154, - "step": 66744 - }, - { - "epoch": 1.71, - "learning_rate": 8.220631104720138e-07, - "loss": 0.6616, - "step": 66745 - }, - { - "epoch": 1.71, - "learning_rate": 8.220358816540765e-07, - "loss": 0.6021, - "step": 66746 - }, - { - "epoch": 1.71, - "learning_rate": 8.220086529723982e-07, - "loss": 0.8105, - "step": 66747 - }, - { - "epoch": 1.71, - "learning_rate": 8.219814244269996e-07, - "loss": 0.7095, - "step": 66748 - }, - { - "epoch": 1.71, - "learning_rate": 8.219541960179018e-07, - "loss": 0.6128, - "step": 66749 - }, - { - "epoch": 1.71, - "learning_rate": 8.219269677451253e-07, - "loss": 0.6328, - "step": 66750 - }, - { - "epoch": 1.71, - "learning_rate": 8.218997396086913e-07, - "loss": 0.6592, - "step": 66751 - }, - { - "epoch": 1.71, - "learning_rate": 8.218725116086203e-07, - "loss": 0.5786, - "step": 66752 - }, - { - "epoch": 1.71, - "learning_rate": 8.218452837449337e-07, - "loss": 0.6973, - "step": 66753 - }, - { - "epoch": 1.71, - "learning_rate": 8.218180560176519e-07, - "loss": 0.6904, - "step": 66754 - }, - { - "epoch": 1.71, - "learning_rate": 8.217908284267955e-07, - "loss": 0.4648, - "step": 66755 - }, - { - "epoch": 1.71, - "learning_rate": 8.21763600972386e-07, - "loss": 0.6982, - "step": 66756 - }, - { - "epoch": 1.71, - "learning_rate": 8.217363736544436e-07, - "loss": 0.7109, - "step": 66757 - }, - { - "epoch": 1.71, - "learning_rate": 8.217091464729897e-07, - "loss": 0.7822, - "step": 66758 - }, - { - "epoch": 1.71, - "learning_rate": 8.216819194280447e-07, - "loss": 0.7031, - "step": 66759 - }, - { - "epoch": 1.71, - "learning_rate": 8.216546925196298e-07, - "loss": 0.7383, - "step": 66760 - }, - { - "epoch": 1.71, - "learning_rate": 8.216274657477656e-07, - "loss": 0.5874, - "step": 66761 - }, - { - "epoch": 1.71, - "learning_rate": 8.216002391124731e-07, - "loss": 0.7007, - "step": 66762 - }, - { - "epoch": 1.71, - "learning_rate": 8.21573012613773e-07, - "loss": 0.7129, - "step": 66763 - }, - { - "epoch": 1.71, - "learning_rate": 8.215457862516869e-07, - "loss": 0.5435, - "step": 66764 - }, - { - "epoch": 1.71, - "learning_rate": 8.215185600262343e-07, - "loss": 0.6572, - "step": 66765 - }, - { - "epoch": 1.71, - "learning_rate": 8.21491333937437e-07, - "loss": 0.5276, - "step": 66766 - }, - { - "epoch": 1.71, - "learning_rate": 8.214641079853153e-07, - "loss": 0.5742, - "step": 66767 - }, - { - "epoch": 1.71, - "learning_rate": 8.214368821698905e-07, - "loss": 0.5078, - "step": 66768 - }, - { - "epoch": 1.71, - "learning_rate": 8.214096564911831e-07, - "loss": 0.7695, - "step": 66769 - }, - { - "epoch": 1.71, - "learning_rate": 8.213824309492143e-07, - "loss": 0.4634, - "step": 66770 - }, - { - "epoch": 1.71, - "learning_rate": 8.213552055440046e-07, - "loss": 0.7451, - "step": 66771 - }, - { - "epoch": 1.71, - "learning_rate": 8.213279802755752e-07, - "loss": 0.7412, - "step": 66772 - }, - { - "epoch": 1.71, - "learning_rate": 8.213007551439465e-07, - "loss": 0.6191, - "step": 66773 - }, - { - "epoch": 1.71, - "learning_rate": 8.212735301491401e-07, - "loss": 0.6514, - "step": 66774 - }, - { - "epoch": 1.71, - "learning_rate": 8.212463052911761e-07, - "loss": 0.5518, - "step": 66775 - }, - { - "epoch": 1.71, - "learning_rate": 8.212190805700753e-07, - "loss": 0.6685, - "step": 66776 - }, - { - "epoch": 1.71, - "learning_rate": 8.211918559858592e-07, - "loss": 0.667, - "step": 66777 - }, - { - "epoch": 1.71, - "learning_rate": 8.211646315385479e-07, - "loss": 0.6689, - "step": 66778 - }, - { - "epoch": 1.71, - "learning_rate": 8.21137407228163e-07, - "loss": 0.4761, - "step": 66779 - }, - { - "epoch": 1.71, - "learning_rate": 8.211101830547245e-07, - "loss": 0.5122, - "step": 66780 - }, - { - "epoch": 1.71, - "learning_rate": 8.210829590182541e-07, - "loss": 0.5859, - "step": 66781 - }, - { - "epoch": 1.71, - "learning_rate": 8.21055735118772e-07, - "loss": 0.6602, - "step": 66782 - }, - { - "epoch": 1.71, - "learning_rate": 8.210285113562995e-07, - "loss": 0.5464, - "step": 66783 - }, - { - "epoch": 1.71, - "learning_rate": 8.210012877308574e-07, - "loss": 0.6587, - "step": 66784 - }, - { - "epoch": 1.71, - "learning_rate": 8.209740642424662e-07, - "loss": 0.6777, - "step": 66785 - }, - { - "epoch": 1.71, - "learning_rate": 8.209468408911469e-07, - "loss": 0.594, - "step": 66786 - }, - { - "epoch": 1.71, - "learning_rate": 8.209196176769204e-07, - "loss": 0.6953, - "step": 66787 - }, - { - "epoch": 1.71, - "learning_rate": 8.208923945998073e-07, - "loss": 0.6001, - "step": 66788 - }, - { - "epoch": 1.71, - "learning_rate": 8.20865171659829e-07, - "loss": 0.6504, - "step": 66789 - }, - { - "epoch": 1.71, - "learning_rate": 8.208379488570057e-07, - "loss": 0.5636, - "step": 66790 - }, - { - "epoch": 1.71, - "learning_rate": 8.208107261913586e-07, - "loss": 0.7686, - "step": 66791 - }, - { - "epoch": 1.71, - "learning_rate": 8.207835036629084e-07, - "loss": 0.6118, - "step": 66792 - }, - { - "epoch": 1.71, - "learning_rate": 8.207562812716766e-07, - "loss": 0.645, - "step": 66793 - }, - { - "epoch": 1.71, - "learning_rate": 8.207290590176831e-07, - "loss": 0.5962, - "step": 66794 - }, - { - "epoch": 1.71, - "learning_rate": 8.207018369009488e-07, - "loss": 0.6396, - "step": 66795 - }, - { - "epoch": 1.71, - "learning_rate": 8.206746149214954e-07, - "loss": 0.7129, - "step": 66796 - }, - { - "epoch": 1.71, - "learning_rate": 8.206473930793427e-07, - "loss": 0.6167, - "step": 66797 - }, - { - "epoch": 1.71, - "learning_rate": 8.206201713745125e-07, - "loss": 0.6934, - "step": 66798 - }, - { - "epoch": 1.71, - "learning_rate": 8.205929498070248e-07, - "loss": 0.6001, - "step": 66799 - }, - { - "epoch": 1.71, - "learning_rate": 8.20565728376901e-07, - "loss": 0.5522, - "step": 66800 - }, - { - "epoch": 1.71, - "learning_rate": 8.205385070841619e-07, - "loss": 0.7451, - "step": 66801 - }, - { - "epoch": 1.71, - "learning_rate": 8.205112859288279e-07, - "loss": 0.3633, - "step": 66802 - }, - { - "epoch": 1.71, - "learning_rate": 8.204840649109206e-07, - "loss": 0.6943, - "step": 66803 - }, - { - "epoch": 1.71, - "learning_rate": 8.204568440304602e-07, - "loss": 0.6396, - "step": 66804 - }, - { - "epoch": 1.71, - "learning_rate": 8.204296232874675e-07, - "loss": 0.7578, - "step": 66805 - }, - { - "epoch": 1.71, - "learning_rate": 8.20402402681964e-07, - "loss": 0.7041, - "step": 66806 - }, - { - "epoch": 1.71, - "learning_rate": 8.203751822139696e-07, - "loss": 0.6597, - "step": 66807 - }, - { - "epoch": 1.71, - "learning_rate": 8.203479618835061e-07, - "loss": 0.792, - "step": 66808 - }, - { - "epoch": 1.71, - "learning_rate": 8.203207416905935e-07, - "loss": 0.6479, - "step": 66809 - }, - { - "epoch": 1.71, - "learning_rate": 8.202935216352534e-07, - "loss": 0.5869, - "step": 66810 - }, - { - "epoch": 1.71, - "learning_rate": 8.202663017175061e-07, - "loss": 0.5635, - "step": 66811 - }, - { - "epoch": 1.71, - "learning_rate": 8.202390819373728e-07, - "loss": 0.5381, - "step": 66812 - }, - { - "epoch": 1.71, - "learning_rate": 8.202118622948743e-07, - "loss": 0.6992, - "step": 66813 - }, - { - "epoch": 1.71, - "learning_rate": 8.20184642790031e-07, - "loss": 0.8086, - "step": 66814 - }, - { - "epoch": 1.71, - "learning_rate": 8.201574234228642e-07, - "loss": 0.6567, - "step": 66815 - }, - { - "epoch": 1.71, - "learning_rate": 8.201302041933944e-07, - "loss": 0.7764, - "step": 66816 - }, - { - "epoch": 1.71, - "learning_rate": 8.201029851016428e-07, - "loss": 0.4706, - "step": 66817 - }, - { - "epoch": 1.71, - "learning_rate": 8.200757661476302e-07, - "loss": 0.6421, - "step": 66818 - }, - { - "epoch": 1.71, - "learning_rate": 8.20048547331377e-07, - "loss": 0.5469, - "step": 66819 - }, - { - "epoch": 1.71, - "learning_rate": 8.200213286529045e-07, - "loss": 0.792, - "step": 66820 - }, - { - "epoch": 1.71, - "learning_rate": 8.199941101122332e-07, - "loss": 0.5647, - "step": 66821 - }, - { - "epoch": 1.71, - "learning_rate": 8.199668917093845e-07, - "loss": 0.6602, - "step": 66822 - }, - { - "epoch": 1.71, - "learning_rate": 8.19939673444379e-07, - "loss": 0.542, - "step": 66823 - }, - { - "epoch": 1.71, - "learning_rate": 8.19912455317237e-07, - "loss": 0.7876, - "step": 66824 - }, - { - "epoch": 1.71, - "learning_rate": 8.198852373279798e-07, - "loss": 0.6055, - "step": 66825 - }, - { - "epoch": 1.71, - "learning_rate": 8.198580194766282e-07, - "loss": 0.6382, - "step": 66826 - }, - { - "epoch": 1.71, - "learning_rate": 8.198308017632032e-07, - "loss": 0.6216, - "step": 66827 - }, - { - "epoch": 1.71, - "learning_rate": 8.198035841877252e-07, - "loss": 0.749, - "step": 66828 - }, - { - "epoch": 1.71, - "learning_rate": 8.197763667502156e-07, - "loss": 0.4946, - "step": 66829 - }, - { - "epoch": 1.71, - "learning_rate": 8.197491494506946e-07, - "loss": 0.7461, - "step": 66830 - }, - { - "epoch": 1.71, - "learning_rate": 8.197219322891837e-07, - "loss": 0.8701, - "step": 66831 - }, - { - "epoch": 1.71, - "learning_rate": 8.196947152657032e-07, - "loss": 0.7314, - "step": 66832 - }, - { - "epoch": 1.71, - "learning_rate": 8.196674983802746e-07, - "loss": 0.6895, - "step": 66833 - }, - { - "epoch": 1.71, - "learning_rate": 8.196402816329181e-07, - "loss": 0.6357, - "step": 66834 - }, - { - "epoch": 1.71, - "learning_rate": 8.196130650236547e-07, - "loss": 0.4448, - "step": 66835 - }, - { - "epoch": 1.71, - "learning_rate": 8.195858485525052e-07, - "loss": 0.7188, - "step": 66836 - }, - { - "epoch": 1.71, - "learning_rate": 8.195586322194905e-07, - "loss": 0.6436, - "step": 66837 - }, - { - "epoch": 1.71, - "learning_rate": 8.195314160246314e-07, - "loss": 0.6362, - "step": 66838 - }, - { - "epoch": 1.71, - "learning_rate": 8.19504199967949e-07, - "loss": 0.6875, - "step": 66839 - }, - { - "epoch": 1.71, - "learning_rate": 8.194769840494636e-07, - "loss": 0.5757, - "step": 66840 - }, - { - "epoch": 1.71, - "learning_rate": 8.194497682691968e-07, - "loss": 0.6255, - "step": 66841 - }, - { - "epoch": 1.71, - "learning_rate": 8.194225526271686e-07, - "loss": 0.6172, - "step": 66842 - }, - { - "epoch": 1.71, - "learning_rate": 8.193953371234008e-07, - "loss": 0.8545, - "step": 66843 - }, - { - "epoch": 1.71, - "learning_rate": 8.193681217579134e-07, - "loss": 0.7012, - "step": 66844 - }, - { - "epoch": 1.71, - "learning_rate": 8.193409065307273e-07, - "loss": 0.6621, - "step": 66845 - }, - { - "epoch": 1.71, - "learning_rate": 8.193136914418639e-07, - "loss": 0.6309, - "step": 66846 - }, - { - "epoch": 1.71, - "learning_rate": 8.192864764913434e-07, - "loss": 0.6179, - "step": 66847 - }, - { - "epoch": 1.71, - "learning_rate": 8.192592616791871e-07, - "loss": 0.6113, - "step": 66848 - }, - { - "epoch": 1.71, - "learning_rate": 8.192320470054155e-07, - "loss": 0.6509, - "step": 66849 - }, - { - "epoch": 1.71, - "learning_rate": 8.192048324700499e-07, - "loss": 0.5776, - "step": 66850 - }, - { - "epoch": 1.71, - "learning_rate": 8.191776180731104e-07, - "loss": 0.6123, - "step": 66851 - }, - { - "epoch": 1.71, - "learning_rate": 8.191504038146188e-07, - "loss": 0.71, - "step": 66852 - }, - { - "epoch": 1.71, - "learning_rate": 8.191231896945955e-07, - "loss": 0.7549, - "step": 66853 - }, - { - "epoch": 1.71, - "learning_rate": 8.19095975713061e-07, - "loss": 0.7451, - "step": 66854 - }, - { - "epoch": 1.71, - "learning_rate": 8.190687618700362e-07, - "loss": 0.6846, - "step": 66855 - }, - { - "epoch": 1.71, - "learning_rate": 8.190415481655424e-07, - "loss": 0.6606, - "step": 66856 - }, - { - "epoch": 1.71, - "learning_rate": 8.190143345995999e-07, - "loss": 0.5161, - "step": 66857 - }, - { - "epoch": 1.71, - "learning_rate": 8.189871211722301e-07, - "loss": 0.7041, - "step": 66858 - }, - { - "epoch": 1.71, - "learning_rate": 8.189599078834533e-07, - "loss": 0.7686, - "step": 66859 - }, - { - "epoch": 1.71, - "learning_rate": 8.189326947332906e-07, - "loss": 0.6655, - "step": 66860 - }, - { - "epoch": 1.71, - "learning_rate": 8.189054817217628e-07, - "loss": 0.5386, - "step": 66861 - }, - { - "epoch": 1.71, - "learning_rate": 8.188782688488909e-07, - "loss": 0.6777, - "step": 66862 - }, - { - "epoch": 1.71, - "learning_rate": 8.188510561146957e-07, - "loss": 0.5889, - "step": 66863 - }, - { - "epoch": 1.71, - "learning_rate": 8.188238435191976e-07, - "loss": 0.7036, - "step": 66864 - }, - { - "epoch": 1.71, - "learning_rate": 8.18796631062418e-07, - "loss": 0.5801, - "step": 66865 - }, - { - "epoch": 1.71, - "learning_rate": 8.187694187443772e-07, - "loss": 0.6865, - "step": 66866 - }, - { - "epoch": 1.71, - "learning_rate": 8.187422065650966e-07, - "loss": 0.75, - "step": 66867 - }, - { - "epoch": 1.71, - "learning_rate": 8.187149945245965e-07, - "loss": 0.6636, - "step": 66868 - }, - { - "epoch": 1.71, - "learning_rate": 8.186877826228982e-07, - "loss": 0.6953, - "step": 66869 - }, - { - "epoch": 1.71, - "learning_rate": 8.186605708600221e-07, - "loss": 0.6709, - "step": 66870 - }, - { - "epoch": 1.71, - "learning_rate": 8.186333592359895e-07, - "loss": 0.5591, - "step": 66871 - }, - { - "epoch": 1.71, - "learning_rate": 8.186061477508209e-07, - "loss": 0.6816, - "step": 66872 - }, - { - "epoch": 1.71, - "learning_rate": 8.185789364045377e-07, - "loss": 0.7373, - "step": 66873 - }, - { - "epoch": 1.71, - "learning_rate": 8.185517251971596e-07, - "loss": 0.52, - "step": 66874 - }, - { - "epoch": 1.71, - "learning_rate": 8.185245141287085e-07, - "loss": 0.6875, - "step": 66875 - }, - { - "epoch": 1.71, - "learning_rate": 8.184973031992044e-07, - "loss": 0.7871, - "step": 66876 - }, - { - "epoch": 1.71, - "learning_rate": 8.18470092408669e-07, - "loss": 0.6108, - "step": 66877 - }, - { - "epoch": 1.71, - "learning_rate": 8.184428817571223e-07, - "loss": 0.7012, - "step": 66878 - }, - { - "epoch": 1.71, - "learning_rate": 8.184156712445859e-07, - "loss": 0.6851, - "step": 66879 - }, - { - "epoch": 1.71, - "learning_rate": 8.1838846087108e-07, - "loss": 0.6426, - "step": 66880 - }, - { - "epoch": 1.71, - "learning_rate": 8.183612506366258e-07, - "loss": 0.709, - "step": 66881 - }, - { - "epoch": 1.71, - "learning_rate": 8.18334040541244e-07, - "loss": 0.7803, - "step": 66882 - }, - { - "epoch": 1.71, - "learning_rate": 8.183068305849558e-07, - "loss": 0.6021, - "step": 66883 - }, - { - "epoch": 1.71, - "learning_rate": 8.182796207677815e-07, - "loss": 0.7754, - "step": 66884 - }, - { - "epoch": 1.71, - "learning_rate": 8.182524110897421e-07, - "loss": 0.7734, - "step": 66885 - }, - { - "epoch": 1.71, - "learning_rate": 8.182252015508585e-07, - "loss": 0.7158, - "step": 66886 - }, - { - "epoch": 1.71, - "learning_rate": 8.181979921511514e-07, - "loss": 0.6064, - "step": 66887 - }, - { - "epoch": 1.71, - "learning_rate": 8.181707828906419e-07, - "loss": 0.6279, - "step": 66888 - }, - { - "epoch": 1.71, - "learning_rate": 8.181435737693504e-07, - "loss": 0.7734, - "step": 66889 - }, - { - "epoch": 1.71, - "learning_rate": 8.181163647872982e-07, - "loss": 0.5959, - "step": 66890 - }, - { - "epoch": 1.71, - "learning_rate": 8.18089155944506e-07, - "loss": 0.6538, - "step": 66891 - }, - { - "epoch": 1.71, - "learning_rate": 8.180619472409944e-07, - "loss": 0.7266, - "step": 66892 - }, - { - "epoch": 1.71, - "learning_rate": 8.180347386767848e-07, - "loss": 0.5791, - "step": 66893 - }, - { - "epoch": 1.71, - "learning_rate": 8.180075302518974e-07, - "loss": 0.6318, - "step": 66894 - }, - { - "epoch": 1.71, - "learning_rate": 8.17980321966353e-07, - "loss": 0.4624, - "step": 66895 - }, - { - "epoch": 1.71, - "learning_rate": 8.17953113820173e-07, - "loss": 0.7148, - "step": 66896 - }, - { - "epoch": 1.71, - "learning_rate": 8.179259058133776e-07, - "loss": 0.7002, - "step": 66897 - }, - { - "epoch": 1.71, - "learning_rate": 8.178986979459883e-07, - "loss": 0.6514, - "step": 66898 - }, - { - "epoch": 1.71, - "learning_rate": 8.178714902180254e-07, - "loss": 0.8896, - "step": 66899 - }, - { - "epoch": 1.71, - "learning_rate": 8.1784428262951e-07, - "loss": 0.7251, - "step": 66900 - }, - { - "epoch": 1.71, - "learning_rate": 8.178170751804627e-07, - "loss": 0.48, - "step": 66901 - }, - { - "epoch": 1.71, - "learning_rate": 8.177898678709048e-07, - "loss": 0.7285, - "step": 66902 - }, - { - "epoch": 1.71, - "learning_rate": 8.17762660700857e-07, - "loss": 0.5581, - "step": 66903 - }, - { - "epoch": 1.71, - "learning_rate": 8.177354536703393e-07, - "loss": 0.71, - "step": 66904 - }, - { - "epoch": 1.71, - "learning_rate": 8.177082467793736e-07, - "loss": 0.6519, - "step": 66905 - }, - { - "epoch": 1.71, - "learning_rate": 8.176810400279801e-07, - "loss": 0.5188, - "step": 66906 - }, - { - "epoch": 1.71, - "learning_rate": 8.176538334161801e-07, - "loss": 0.6338, - "step": 66907 - }, - { - "epoch": 1.71, - "learning_rate": 8.176266269439941e-07, - "loss": 0.5786, - "step": 66908 - }, - { - "epoch": 1.71, - "learning_rate": 8.175994206114428e-07, - "loss": 0.7295, - "step": 66909 - }, - { - "epoch": 1.71, - "learning_rate": 8.175722144185475e-07, - "loss": 0.7656, - "step": 66910 - }, - { - "epoch": 1.71, - "learning_rate": 8.175450083653285e-07, - "loss": 0.582, - "step": 66911 - }, - { - "epoch": 1.71, - "learning_rate": 8.175178024518071e-07, - "loss": 0.7256, - "step": 66912 - }, - { - "epoch": 1.72, - "learning_rate": 8.174905966780041e-07, - "loss": 0.4478, - "step": 66913 - }, - { - "epoch": 1.72, - "learning_rate": 8.174633910439398e-07, - "loss": 0.7725, - "step": 66914 - }, - { - "epoch": 1.72, - "learning_rate": 8.174361855496356e-07, - "loss": 0.7607, - "step": 66915 - }, - { - "epoch": 1.72, - "learning_rate": 8.174089801951119e-07, - "loss": 0.8369, - "step": 66916 - }, - { - "epoch": 1.72, - "learning_rate": 8.1738177498039e-07, - "loss": 0.7158, - "step": 66917 - }, - { - "epoch": 1.72, - "learning_rate": 8.173545699054902e-07, - "loss": 0.5967, - "step": 66918 - }, - { - "epoch": 1.72, - "learning_rate": 8.173273649704337e-07, - "loss": 0.5933, - "step": 66919 - }, - { - "epoch": 1.72, - "learning_rate": 8.173001601752413e-07, - "loss": 0.4891, - "step": 66920 - }, - { - "epoch": 1.72, - "learning_rate": 8.172729555199338e-07, - "loss": 0.564, - "step": 66921 - }, - { - "epoch": 1.72, - "learning_rate": 8.172457510045319e-07, - "loss": 0.6831, - "step": 66922 - }, - { - "epoch": 1.72, - "learning_rate": 8.172185466290569e-07, - "loss": 0.5967, - "step": 66923 - }, - { - "epoch": 1.72, - "learning_rate": 8.171913423935289e-07, - "loss": 0.6447, - "step": 66924 - }, - { - "epoch": 1.72, - "learning_rate": 8.171641382979691e-07, - "loss": 0.626, - "step": 66925 - }, - { - "epoch": 1.72, - "learning_rate": 8.171369343423984e-07, - "loss": 0.6074, - "step": 66926 - }, - { - "epoch": 1.72, - "learning_rate": 8.171097305268375e-07, - "loss": 0.6084, - "step": 66927 - }, - { - "epoch": 1.72, - "learning_rate": 8.170825268513071e-07, - "loss": 0.7871, - "step": 66928 - }, - { - "epoch": 1.72, - "learning_rate": 8.170553233158285e-07, - "loss": 0.5977, - "step": 66929 - }, - { - "epoch": 1.72, - "learning_rate": 8.170281199204219e-07, - "loss": 0.5239, - "step": 66930 - }, - { - "epoch": 1.72, - "learning_rate": 8.170009166651087e-07, - "loss": 0.6362, - "step": 66931 - }, - { - "epoch": 1.72, - "learning_rate": 8.169737135499093e-07, - "loss": 0.6279, - "step": 66932 - }, - { - "epoch": 1.72, - "learning_rate": 8.169465105748451e-07, - "loss": 0.7061, - "step": 66933 - }, - { - "epoch": 1.72, - "learning_rate": 8.169193077399363e-07, - "loss": 0.6748, - "step": 66934 - }, - { - "epoch": 1.72, - "learning_rate": 8.168921050452037e-07, - "loss": 0.71, - "step": 66935 - }, - { - "epoch": 1.72, - "learning_rate": 8.168649024906688e-07, - "loss": 0.7656, - "step": 66936 - }, - { - "epoch": 1.72, - "learning_rate": 8.168377000763518e-07, - "loss": 0.7495, - "step": 66937 - }, - { - "epoch": 1.72, - "learning_rate": 8.168104978022738e-07, - "loss": 0.415, - "step": 66938 - }, - { - "epoch": 1.72, - "learning_rate": 8.167832956684555e-07, - "loss": 0.7344, - "step": 66939 - }, - { - "epoch": 1.72, - "learning_rate": 8.167560936749179e-07, - "loss": 0.4961, - "step": 66940 - }, - { - "epoch": 1.72, - "learning_rate": 8.167288918216816e-07, - "loss": 0.8472, - "step": 66941 - }, - { - "epoch": 1.72, - "learning_rate": 8.167016901087678e-07, - "loss": 0.7002, - "step": 66942 - }, - { - "epoch": 1.72, - "learning_rate": 8.166744885361972e-07, - "loss": 0.5854, - "step": 66943 - }, - { - "epoch": 1.72, - "learning_rate": 8.166472871039904e-07, - "loss": 0.7461, - "step": 66944 - }, - { - "epoch": 1.72, - "learning_rate": 8.166200858121681e-07, - "loss": 0.7402, - "step": 66945 - }, - { - "epoch": 1.72, - "learning_rate": 8.165928846607516e-07, - "loss": 0.6187, - "step": 66946 - }, - { - "epoch": 1.72, - "learning_rate": 8.165656836497612e-07, - "loss": 0.6641, - "step": 66947 - }, - { - "epoch": 1.72, - "learning_rate": 8.165384827792183e-07, - "loss": 0.6436, - "step": 66948 - }, - { - "epoch": 1.72, - "learning_rate": 8.165112820491433e-07, - "loss": 0.623, - "step": 66949 - }, - { - "epoch": 1.72, - "learning_rate": 8.164840814595573e-07, - "loss": 0.5371, - "step": 66950 - }, - { - "epoch": 1.72, - "learning_rate": 8.164568810104807e-07, - "loss": 0.5464, - "step": 66951 - }, - { - "epoch": 1.72, - "learning_rate": 8.16429680701935e-07, - "loss": 0.4688, - "step": 66952 - }, - { - "epoch": 1.72, - "learning_rate": 8.164024805339408e-07, - "loss": 0.7891, - "step": 66953 - }, - { - "epoch": 1.72, - "learning_rate": 8.163752805065182e-07, - "loss": 0.5732, - "step": 66954 - }, - { - "epoch": 1.72, - "learning_rate": 8.16348080619689e-07, - "loss": 0.3974, - "step": 66955 - }, - { - "epoch": 1.72, - "learning_rate": 8.163208808734735e-07, - "loss": 0.8438, - "step": 66956 - }, - { - "epoch": 1.72, - "learning_rate": 8.162936812678928e-07, - "loss": 0.7188, - "step": 66957 - }, - { - "epoch": 1.72, - "learning_rate": 8.162664818029673e-07, - "loss": 0.533, - "step": 66958 - }, - { - "epoch": 1.72, - "learning_rate": 8.162392824787184e-07, - "loss": 0.5977, - "step": 66959 - }, - { - "epoch": 1.72, - "learning_rate": 8.162120832951662e-07, - "loss": 0.7969, - "step": 66960 - }, - { - "epoch": 1.72, - "learning_rate": 8.161848842523324e-07, - "loss": 0.6685, - "step": 66961 - }, - { - "epoch": 1.72, - "learning_rate": 8.16157685350237e-07, - "loss": 0.7227, - "step": 66962 - }, - { - "epoch": 1.72, - "learning_rate": 8.16130486588902e-07, - "loss": 0.6982, - "step": 66963 - }, - { - "epoch": 1.72, - "learning_rate": 8.161032879683468e-07, - "loss": 0.6885, - "step": 66964 - }, - { - "epoch": 1.72, - "learning_rate": 8.16076089488593e-07, - "loss": 0.48, - "step": 66965 - }, - { - "epoch": 1.72, - "learning_rate": 8.160488911496611e-07, - "loss": 0.6953, - "step": 66966 - }, - { - "epoch": 1.72, - "learning_rate": 8.160216929515723e-07, - "loss": 0.6963, - "step": 66967 - }, - { - "epoch": 1.72, - "learning_rate": 8.15994494894347e-07, - "loss": 0.4879, - "step": 66968 - }, - { - "epoch": 1.72, - "learning_rate": 8.159672969780065e-07, - "loss": 0.7334, - "step": 66969 - }, - { - "epoch": 1.72, - "learning_rate": 8.159400992025711e-07, - "loss": 0.8311, - "step": 66970 - }, - { - "epoch": 1.72, - "learning_rate": 8.159129015680622e-07, - "loss": 0.6057, - "step": 66971 - }, - { - "epoch": 1.72, - "learning_rate": 8.158857040745001e-07, - "loss": 0.3887, - "step": 66972 - }, - { - "epoch": 1.72, - "learning_rate": 8.158585067219063e-07, - "loss": 0.7178, - "step": 66973 - }, - { - "epoch": 1.72, - "learning_rate": 8.158313095103009e-07, - "loss": 0.7305, - "step": 66974 - }, - { - "epoch": 1.72, - "learning_rate": 8.158041124397048e-07, - "loss": 0.4568, - "step": 66975 - }, - { - "epoch": 1.72, - "learning_rate": 8.157769155101392e-07, - "loss": 0.7168, - "step": 66976 - }, - { - "epoch": 1.72, - "learning_rate": 8.157497187216245e-07, - "loss": 0.5933, - "step": 66977 - }, - { - "epoch": 1.72, - "learning_rate": 8.157225220741821e-07, - "loss": 0.6592, - "step": 66978 - }, - { - "epoch": 1.72, - "learning_rate": 8.156953255678323e-07, - "loss": 0.7012, - "step": 66979 - }, - { - "epoch": 1.72, - "learning_rate": 8.156681292025962e-07, - "loss": 0.7656, - "step": 66980 - }, - { - "epoch": 1.72, - "learning_rate": 8.156409329784946e-07, - "loss": 0.6743, - "step": 66981 - }, - { - "epoch": 1.72, - "learning_rate": 8.156137368955481e-07, - "loss": 0.6055, - "step": 66982 - }, - { - "epoch": 1.72, - "learning_rate": 8.15586540953778e-07, - "loss": 0.7324, - "step": 66983 - }, - { - "epoch": 1.72, - "learning_rate": 8.155593451532046e-07, - "loss": 0.6289, - "step": 66984 - }, - { - "epoch": 1.72, - "learning_rate": 8.155321494938488e-07, - "loss": 0.6885, - "step": 66985 - }, - { - "epoch": 1.72, - "learning_rate": 8.155049539757317e-07, - "loss": 0.6558, - "step": 66986 - }, - { - "epoch": 1.72, - "learning_rate": 8.154777585988737e-07, - "loss": 0.6963, - "step": 66987 - }, - { - "epoch": 1.72, - "learning_rate": 8.154505633632963e-07, - "loss": 0.5708, - "step": 66988 - }, - { - "epoch": 1.72, - "learning_rate": 8.154233682690196e-07, - "loss": 0.6284, - "step": 66989 - }, - { - "epoch": 1.72, - "learning_rate": 8.15396173316065e-07, - "loss": 0.4614, - "step": 66990 - }, - { - "epoch": 1.72, - "learning_rate": 8.153689785044528e-07, - "loss": 0.6768, - "step": 66991 - }, - { - "epoch": 1.72, - "learning_rate": 8.153417838342043e-07, - "loss": 0.7744, - "step": 66992 - }, - { - "epoch": 1.72, - "learning_rate": 8.153145893053403e-07, - "loss": 0.6621, - "step": 66993 - }, - { - "epoch": 1.72, - "learning_rate": 8.15287394917881e-07, - "loss": 0.5576, - "step": 66994 - }, - { - "epoch": 1.72, - "learning_rate": 8.152602006718479e-07, - "loss": 0.6406, - "step": 66995 - }, - { - "epoch": 1.72, - "learning_rate": 8.152330065672613e-07, - "loss": 0.6592, - "step": 66996 - }, - { - "epoch": 1.72, - "learning_rate": 8.152058126041426e-07, - "loss": 0.6162, - "step": 66997 - }, - { - "epoch": 1.72, - "learning_rate": 8.151786187825121e-07, - "loss": 0.5449, - "step": 66998 - }, - { - "epoch": 1.72, - "learning_rate": 8.151514251023908e-07, - "loss": 0.627, - "step": 66999 - }, - { - "epoch": 1.72, - "learning_rate": 8.151242315637998e-07, - "loss": 0.5801, - "step": 67000 - }, - { - "epoch": 1.72, - "learning_rate": 8.150970381667595e-07, - "loss": 0.6587, - "step": 67001 - }, - { - "epoch": 1.72, - "learning_rate": 8.150698449112909e-07, - "loss": 0.6768, - "step": 67002 - }, - { - "epoch": 1.72, - "learning_rate": 8.150426517974152e-07, - "loss": 0.6714, - "step": 67003 - }, - { - "epoch": 1.72, - "learning_rate": 8.150154588251523e-07, - "loss": 0.7109, - "step": 67004 - }, - { - "epoch": 1.72, - "learning_rate": 8.149882659945238e-07, - "loss": 0.4888, - "step": 67005 - }, - { - "epoch": 1.72, - "learning_rate": 8.1496107330555e-07, - "loss": 0.6089, - "step": 67006 - }, - { - "epoch": 1.72, - "learning_rate": 8.149338807582525e-07, - "loss": 0.5518, - "step": 67007 - }, - { - "epoch": 1.72, - "learning_rate": 8.149066883526511e-07, - "loss": 0.6416, - "step": 67008 - }, - { - "epoch": 1.72, - "learning_rate": 8.148794960887675e-07, - "loss": 0.7129, - "step": 67009 - }, - { - "epoch": 1.72, - "learning_rate": 8.148523039666218e-07, - "loss": 0.7559, - "step": 67010 - }, - { - "epoch": 1.72, - "learning_rate": 8.148251119862355e-07, - "loss": 0.6641, - "step": 67011 - }, - { - "epoch": 1.72, - "learning_rate": 8.147979201476289e-07, - "loss": 0.5396, - "step": 67012 - }, - { - "epoch": 1.72, - "learning_rate": 8.147707284508234e-07, - "loss": 0.6597, - "step": 67013 - }, - { - "epoch": 1.72, - "learning_rate": 8.147435368958392e-07, - "loss": 0.7441, - "step": 67014 - }, - { - "epoch": 1.72, - "learning_rate": 8.147163454826972e-07, - "loss": 0.6611, - "step": 67015 - }, - { - "epoch": 1.72, - "learning_rate": 8.146891542114186e-07, - "loss": 0.4202, - "step": 67016 - }, - { - "epoch": 1.72, - "learning_rate": 8.146619630820239e-07, - "loss": 0.6299, - "step": 67017 - }, - { - "epoch": 1.72, - "learning_rate": 8.146347720945339e-07, - "loss": 0.7334, - "step": 67018 - }, - { - "epoch": 1.72, - "learning_rate": 8.146075812489696e-07, - "loss": 0.7734, - "step": 67019 - }, - { - "epoch": 1.72, - "learning_rate": 8.145803905453518e-07, - "loss": 0.7227, - "step": 67020 - }, - { - "epoch": 1.72, - "learning_rate": 8.145531999837012e-07, - "loss": 0.708, - "step": 67021 - }, - { - "epoch": 1.72, - "learning_rate": 8.145260095640387e-07, - "loss": 0.4767, - "step": 67022 - }, - { - "epoch": 1.72, - "learning_rate": 8.144988192863854e-07, - "loss": 0.5752, - "step": 67023 - }, - { - "epoch": 1.72, - "learning_rate": 8.144716291507616e-07, - "loss": 0.5938, - "step": 67024 - }, - { - "epoch": 1.72, - "learning_rate": 8.144444391571882e-07, - "loss": 0.6321, - "step": 67025 - }, - { - "epoch": 1.72, - "learning_rate": 8.144172493056863e-07, - "loss": 0.6758, - "step": 67026 - }, - { - "epoch": 1.72, - "learning_rate": 8.143900595962765e-07, - "loss": 0.5029, - "step": 67027 - }, - { - "epoch": 1.72, - "learning_rate": 8.143628700289797e-07, - "loss": 0.5747, - "step": 67028 - }, - { - "epoch": 1.72, - "learning_rate": 8.143356806038167e-07, - "loss": 0.5928, - "step": 67029 - }, - { - "epoch": 1.72, - "learning_rate": 8.143084913208085e-07, - "loss": 0.6167, - "step": 67030 - }, - { - "epoch": 1.72, - "learning_rate": 8.142813021799755e-07, - "loss": 0.6592, - "step": 67031 - }, - { - "epoch": 1.72, - "learning_rate": 8.142541131813389e-07, - "loss": 0.7324, - "step": 67032 - }, - { - "epoch": 1.72, - "learning_rate": 8.142269243249198e-07, - "loss": 0.6929, - "step": 67033 - }, - { - "epoch": 1.72, - "learning_rate": 8.141997356107381e-07, - "loss": 0.6494, - "step": 67034 - }, - { - "epoch": 1.72, - "learning_rate": 8.141725470388152e-07, - "loss": 0.572, - "step": 67035 - }, - { - "epoch": 1.72, - "learning_rate": 8.141453586091719e-07, - "loss": 0.6003, - "step": 67036 - }, - { - "epoch": 1.72, - "learning_rate": 8.141181703218287e-07, - "loss": 0.6431, - "step": 67037 - }, - { - "epoch": 1.72, - "learning_rate": 8.140909821768071e-07, - "loss": 0.6323, - "step": 67038 - }, - { - "epoch": 1.72, - "learning_rate": 8.14063794174127e-07, - "loss": 0.668, - "step": 67039 - }, - { - "epoch": 1.72, - "learning_rate": 8.140366063138101e-07, - "loss": 0.4912, - "step": 67040 - }, - { - "epoch": 1.72, - "learning_rate": 8.140094185958766e-07, - "loss": 0.585, - "step": 67041 - }, - { - "epoch": 1.72, - "learning_rate": 8.139822310203477e-07, - "loss": 0.7305, - "step": 67042 - }, - { - "epoch": 1.72, - "learning_rate": 8.139550435872442e-07, - "loss": 0.6367, - "step": 67043 - }, - { - "epoch": 1.72, - "learning_rate": 8.139278562965865e-07, - "loss": 0.6094, - "step": 67044 - }, - { - "epoch": 1.72, - "learning_rate": 8.139006691483958e-07, - "loss": 0.5125, - "step": 67045 - }, - { - "epoch": 1.72, - "learning_rate": 8.138734821426924e-07, - "loss": 0.5737, - "step": 67046 - }, - { - "epoch": 1.72, - "learning_rate": 8.13846295279498e-07, - "loss": 0.4315, - "step": 67047 - }, - { - "epoch": 1.72, - "learning_rate": 8.138191085588326e-07, - "loss": 0.7988, - "step": 67048 - }, - { - "epoch": 1.72, - "learning_rate": 8.137919219807177e-07, - "loss": 0.5742, - "step": 67049 - }, - { - "epoch": 1.72, - "learning_rate": 8.137647355451733e-07, - "loss": 0.6196, - "step": 67050 - }, - { - "epoch": 1.72, - "learning_rate": 8.137375492522212e-07, - "loss": 0.561, - "step": 67051 - }, - { - "epoch": 1.72, - "learning_rate": 8.137103631018813e-07, - "loss": 0.7603, - "step": 67052 - }, - { - "epoch": 1.72, - "learning_rate": 8.136831770941755e-07, - "loss": 0.7041, - "step": 67053 - }, - { - "epoch": 1.72, - "learning_rate": 8.136559912291232e-07, - "loss": 0.5718, - "step": 67054 - }, - { - "epoch": 1.72, - "learning_rate": 8.136288055067462e-07, - "loss": 0.3956, - "step": 67055 - }, - { - "epoch": 1.72, - "learning_rate": 8.136016199270647e-07, - "loss": 0.7715, - "step": 67056 - }, - { - "epoch": 1.72, - "learning_rate": 8.135744344901003e-07, - "loss": 0.5977, - "step": 67057 - }, - { - "epoch": 1.72, - "learning_rate": 8.135472491958732e-07, - "loss": 0.6689, - "step": 67058 - }, - { - "epoch": 1.72, - "learning_rate": 8.135200640444044e-07, - "loss": 0.6777, - "step": 67059 - }, - { - "epoch": 1.72, - "learning_rate": 8.134928790357147e-07, - "loss": 0.6465, - "step": 67060 - }, - { - "epoch": 1.72, - "learning_rate": 8.13465694169825e-07, - "loss": 0.6089, - "step": 67061 - }, - { - "epoch": 1.72, - "learning_rate": 8.134385094467559e-07, - "loss": 0.5898, - "step": 67062 - }, - { - "epoch": 1.72, - "learning_rate": 8.134113248665287e-07, - "loss": 0.605, - "step": 67063 - }, - { - "epoch": 1.72, - "learning_rate": 8.133841404291638e-07, - "loss": 0.5358, - "step": 67064 - }, - { - "epoch": 1.72, - "learning_rate": 8.133569561346818e-07, - "loss": 0.7559, - "step": 67065 - }, - { - "epoch": 1.72, - "learning_rate": 8.13329771983104e-07, - "loss": 0.6797, - "step": 67066 - }, - { - "epoch": 1.72, - "learning_rate": 8.133025879744507e-07, - "loss": 0.8164, - "step": 67067 - }, - { - "epoch": 1.72, - "learning_rate": 8.132754041087434e-07, - "loss": 0.7295, - "step": 67068 - }, - { - "epoch": 1.72, - "learning_rate": 8.132482203860022e-07, - "loss": 0.6143, - "step": 67069 - }, - { - "epoch": 1.72, - "learning_rate": 8.132210368062485e-07, - "loss": 0.6729, - "step": 67070 - }, - { - "epoch": 1.72, - "learning_rate": 8.131938533695029e-07, - "loss": 0.8203, - "step": 67071 - }, - { - "epoch": 1.72, - "learning_rate": 8.13166670075786e-07, - "loss": 0.5679, - "step": 67072 - }, - { - "epoch": 1.72, - "learning_rate": 8.131394869251191e-07, - "loss": 0.5535, - "step": 67073 - }, - { - "epoch": 1.72, - "learning_rate": 8.131123039175227e-07, - "loss": 0.7002, - "step": 67074 - }, - { - "epoch": 1.72, - "learning_rate": 8.130851210530172e-07, - "loss": 0.5103, - "step": 67075 - }, - { - "epoch": 1.72, - "learning_rate": 8.130579383316241e-07, - "loss": 0.5376, - "step": 67076 - }, - { - "epoch": 1.72, - "learning_rate": 8.130307557533637e-07, - "loss": 0.6587, - "step": 67077 - }, - { - "epoch": 1.72, - "learning_rate": 8.130035733182572e-07, - "loss": 0.5244, - "step": 67078 - }, - { - "epoch": 1.72, - "learning_rate": 8.129763910263252e-07, - "loss": 0.5835, - "step": 67079 - }, - { - "epoch": 1.72, - "learning_rate": 8.129492088775887e-07, - "loss": 0.6157, - "step": 67080 - }, - { - "epoch": 1.72, - "learning_rate": 8.129220268720682e-07, - "loss": 0.5898, - "step": 67081 - }, - { - "epoch": 1.72, - "learning_rate": 8.128948450097853e-07, - "loss": 0.4208, - "step": 67082 - }, - { - "epoch": 1.72, - "learning_rate": 8.128676632907597e-07, - "loss": 0.532, - "step": 67083 - }, - { - "epoch": 1.72, - "learning_rate": 8.128404817150127e-07, - "loss": 0.3574, - "step": 67084 - }, - { - "epoch": 1.72, - "learning_rate": 8.128133002825653e-07, - "loss": 0.52, - "step": 67085 - }, - { - "epoch": 1.72, - "learning_rate": 8.127861189934378e-07, - "loss": 0.5186, - "step": 67086 - }, - { - "epoch": 1.72, - "learning_rate": 8.127589378476518e-07, - "loss": 0.6592, - "step": 67087 - }, - { - "epoch": 1.72, - "learning_rate": 8.127317568452274e-07, - "loss": 0.6299, - "step": 67088 - }, - { - "epoch": 1.72, - "learning_rate": 8.127045759861858e-07, - "loss": 0.4712, - "step": 67089 - }, - { - "epoch": 1.72, - "learning_rate": 8.126773952705477e-07, - "loss": 0.5652, - "step": 67090 - }, - { - "epoch": 1.72, - "learning_rate": 8.126502146983339e-07, - "loss": 0.7114, - "step": 67091 - }, - { - "epoch": 1.72, - "learning_rate": 8.126230342695655e-07, - "loss": 0.7051, - "step": 67092 - }, - { - "epoch": 1.72, - "learning_rate": 8.125958539842628e-07, - "loss": 0.7383, - "step": 67093 - }, - { - "epoch": 1.72, - "learning_rate": 8.125686738424465e-07, - "loss": 0.6914, - "step": 67094 - }, - { - "epoch": 1.72, - "learning_rate": 8.125414938441381e-07, - "loss": 0.6523, - "step": 67095 - }, - { - "epoch": 1.72, - "learning_rate": 8.125143139893579e-07, - "loss": 0.7256, - "step": 67096 - }, - { - "epoch": 1.72, - "learning_rate": 8.124871342781269e-07, - "loss": 0.4692, - "step": 67097 - }, - { - "epoch": 1.72, - "learning_rate": 8.124599547104659e-07, - "loss": 0.6392, - "step": 67098 - }, - { - "epoch": 1.72, - "learning_rate": 8.124327752863957e-07, - "loss": 0.6436, - "step": 67099 - }, - { - "epoch": 1.72, - "learning_rate": 8.124055960059371e-07, - "loss": 0.5273, - "step": 67100 - }, - { - "epoch": 1.72, - "learning_rate": 8.12378416869111e-07, - "loss": 0.5059, - "step": 67101 - }, - { - "epoch": 1.72, - "learning_rate": 8.123512378759382e-07, - "loss": 0.6367, - "step": 67102 - }, - { - "epoch": 1.72, - "learning_rate": 8.123240590264391e-07, - "loss": 0.5151, - "step": 67103 - }, - { - "epoch": 1.72, - "learning_rate": 8.122968803206352e-07, - "loss": 0.6592, - "step": 67104 - }, - { - "epoch": 1.72, - "learning_rate": 8.122697017585466e-07, - "loss": 0.5312, - "step": 67105 - }, - { - "epoch": 1.72, - "learning_rate": 8.122425233401947e-07, - "loss": 0.6201, - "step": 67106 - }, - { - "epoch": 1.72, - "learning_rate": 8.122153450656001e-07, - "loss": 0.7061, - "step": 67107 - }, - { - "epoch": 1.72, - "learning_rate": 8.121881669347832e-07, - "loss": 0.5344, - "step": 67108 - }, - { - "epoch": 1.72, - "learning_rate": 8.121609889477657e-07, - "loss": 0.5271, - "step": 67109 - }, - { - "epoch": 1.72, - "learning_rate": 8.121338111045673e-07, - "loss": 0.5928, - "step": 67110 - }, - { - "epoch": 1.72, - "learning_rate": 8.121066334052099e-07, - "loss": 0.4517, - "step": 67111 - }, - { - "epoch": 1.72, - "learning_rate": 8.12079455849714e-07, - "loss": 0.8369, - "step": 67112 - }, - { - "epoch": 1.72, - "learning_rate": 8.120522784380997e-07, - "loss": 0.6338, - "step": 67113 - }, - { - "epoch": 1.72, - "learning_rate": 8.120251011703884e-07, - "loss": 0.5581, - "step": 67114 - }, - { - "epoch": 1.72, - "learning_rate": 8.119979240466009e-07, - "loss": 0.6792, - "step": 67115 - }, - { - "epoch": 1.72, - "learning_rate": 8.11970747066758e-07, - "loss": 0.5381, - "step": 67116 - }, - { - "epoch": 1.72, - "learning_rate": 8.119435702308803e-07, - "loss": 0.666, - "step": 67117 - }, - { - "epoch": 1.72, - "learning_rate": 8.11916393538989e-07, - "loss": 0.6033, - "step": 67118 - }, - { - "epoch": 1.72, - "learning_rate": 8.118892169911044e-07, - "loss": 0.5986, - "step": 67119 - }, - { - "epoch": 1.72, - "learning_rate": 8.118620405872478e-07, - "loss": 0.519, - "step": 67120 - }, - { - "epoch": 1.72, - "learning_rate": 8.118348643274396e-07, - "loss": 0.6484, - "step": 67121 - }, - { - "epoch": 1.72, - "learning_rate": 8.118076882117013e-07, - "loss": 0.6226, - "step": 67122 - }, - { - "epoch": 1.72, - "learning_rate": 8.117805122400529e-07, - "loss": 0.5857, - "step": 67123 - }, - { - "epoch": 1.72, - "learning_rate": 8.117533364125155e-07, - "loss": 0.7031, - "step": 67124 - }, - { - "epoch": 1.72, - "learning_rate": 8.117261607291097e-07, - "loss": 0.5903, - "step": 67125 - }, - { - "epoch": 1.72, - "learning_rate": 8.116989851898567e-07, - "loss": 0.5437, - "step": 67126 - }, - { - "epoch": 1.72, - "learning_rate": 8.116718097947769e-07, - "loss": 0.8486, - "step": 67127 - }, - { - "epoch": 1.72, - "learning_rate": 8.116446345438916e-07, - "loss": 0.5854, - "step": 67128 - }, - { - "epoch": 1.72, - "learning_rate": 8.116174594372212e-07, - "loss": 0.4541, - "step": 67129 - }, - { - "epoch": 1.72, - "learning_rate": 8.115902844747867e-07, - "loss": 0.6865, - "step": 67130 - }, - { - "epoch": 1.72, - "learning_rate": 8.115631096566088e-07, - "loss": 0.5015, - "step": 67131 - }, - { - "epoch": 1.72, - "learning_rate": 8.115359349827087e-07, - "loss": 0.6367, - "step": 67132 - }, - { - "epoch": 1.72, - "learning_rate": 8.115087604531067e-07, - "loss": 0.5146, - "step": 67133 - }, - { - "epoch": 1.72, - "learning_rate": 8.114815860678235e-07, - "loss": 0.5054, - "step": 67134 - }, - { - "epoch": 1.72, - "learning_rate": 8.114544118268804e-07, - "loss": 0.5898, - "step": 67135 - }, - { - "epoch": 1.72, - "learning_rate": 8.114272377302978e-07, - "loss": 0.7959, - "step": 67136 - }, - { - "epoch": 1.72, - "learning_rate": 8.11400063778097e-07, - "loss": 0.668, - "step": 67137 - }, - { - "epoch": 1.72, - "learning_rate": 8.113728899702981e-07, - "loss": 0.6416, - "step": 67138 - }, - { - "epoch": 1.72, - "learning_rate": 8.113457163069226e-07, - "loss": 0.6904, - "step": 67139 - }, - { - "epoch": 1.72, - "learning_rate": 8.113185427879909e-07, - "loss": 0.4801, - "step": 67140 - }, - { - "epoch": 1.72, - "learning_rate": 8.11291369413524e-07, - "loss": 0.7158, - "step": 67141 - }, - { - "epoch": 1.72, - "learning_rate": 8.112641961835429e-07, - "loss": 0.6797, - "step": 67142 - }, - { - "epoch": 1.72, - "learning_rate": 8.112370230980679e-07, - "loss": 0.5879, - "step": 67143 - }, - { - "epoch": 1.72, - "learning_rate": 8.112098501571199e-07, - "loss": 0.5945, - "step": 67144 - }, - { - "epoch": 1.72, - "learning_rate": 8.111826773607199e-07, - "loss": 0.7344, - "step": 67145 - }, - { - "epoch": 1.72, - "learning_rate": 8.111555047088885e-07, - "loss": 0.6304, - "step": 67146 - }, - { - "epoch": 1.72, - "learning_rate": 8.111283322016468e-07, - "loss": 0.7246, - "step": 67147 - }, - { - "epoch": 1.72, - "learning_rate": 8.111011598390153e-07, - "loss": 0.5879, - "step": 67148 - }, - { - "epoch": 1.72, - "learning_rate": 8.11073987621015e-07, - "loss": 0.7749, - "step": 67149 - }, - { - "epoch": 1.72, - "learning_rate": 8.110468155476668e-07, - "loss": 0.666, - "step": 67150 - }, - { - "epoch": 1.72, - "learning_rate": 8.110196436189913e-07, - "loss": 0.6152, - "step": 67151 - }, - { - "epoch": 1.72, - "learning_rate": 8.109924718350097e-07, - "loss": 0.6138, - "step": 67152 - }, - { - "epoch": 1.72, - "learning_rate": 8.109653001957421e-07, - "loss": 0.6602, - "step": 67153 - }, - { - "epoch": 1.72, - "learning_rate": 8.109381287012097e-07, - "loss": 0.7603, - "step": 67154 - }, - { - "epoch": 1.72, - "learning_rate": 8.109109573514332e-07, - "loss": 0.6465, - "step": 67155 - }, - { - "epoch": 1.72, - "learning_rate": 8.108837861464337e-07, - "loss": 0.4375, - "step": 67156 - }, - { - "epoch": 1.72, - "learning_rate": 8.108566150862314e-07, - "loss": 0.6895, - "step": 67157 - }, - { - "epoch": 1.72, - "learning_rate": 8.108294441708479e-07, - "loss": 0.6135, - "step": 67158 - }, - { - "epoch": 1.72, - "learning_rate": 8.108022734003033e-07, - "loss": 0.541, - "step": 67159 - }, - { - "epoch": 1.72, - "learning_rate": 8.107751027746191e-07, - "loss": 0.8047, - "step": 67160 - }, - { - "epoch": 1.72, - "learning_rate": 8.107479322938156e-07, - "loss": 0.6543, - "step": 67161 - }, - { - "epoch": 1.72, - "learning_rate": 8.107207619579137e-07, - "loss": 0.7188, - "step": 67162 - }, - { - "epoch": 1.72, - "learning_rate": 8.10693591766934e-07, - "loss": 0.5762, - "step": 67163 - }, - { - "epoch": 1.72, - "learning_rate": 8.106664217208978e-07, - "loss": 0.6797, - "step": 67164 - }, - { - "epoch": 1.72, - "learning_rate": 8.106392518198252e-07, - "loss": 0.6582, - "step": 67165 - }, - { - "epoch": 1.72, - "learning_rate": 8.106120820637377e-07, - "loss": 0.7402, - "step": 67166 - }, - { - "epoch": 1.72, - "learning_rate": 8.105849124526556e-07, - "loss": 0.5186, - "step": 67167 - }, - { - "epoch": 1.72, - "learning_rate": 8.105577429866002e-07, - "loss": 0.7891, - "step": 67168 - }, - { - "epoch": 1.72, - "learning_rate": 8.105305736655918e-07, - "loss": 0.5044, - "step": 67169 - }, - { - "epoch": 1.72, - "learning_rate": 8.105034044896515e-07, - "loss": 0.6499, - "step": 67170 - }, - { - "epoch": 1.72, - "learning_rate": 8.104762354587999e-07, - "loss": 0.6758, - "step": 67171 - }, - { - "epoch": 1.72, - "learning_rate": 8.104490665730585e-07, - "loss": 0.6133, - "step": 67172 - }, - { - "epoch": 1.72, - "learning_rate": 8.104218978324472e-07, - "loss": 0.4756, - "step": 67173 - }, - { - "epoch": 1.72, - "learning_rate": 8.103947292369868e-07, - "loss": 0.667, - "step": 67174 - }, - { - "epoch": 1.72, - "learning_rate": 8.103675607866989e-07, - "loss": 0.5161, - "step": 67175 - }, - { - "epoch": 1.72, - "learning_rate": 8.103403924816034e-07, - "loss": 0.6909, - "step": 67176 - }, - { - "epoch": 1.72, - "learning_rate": 8.103132243217219e-07, - "loss": 0.6938, - "step": 67177 - }, - { - "epoch": 1.72, - "learning_rate": 8.102860563070746e-07, - "loss": 0.7148, - "step": 67178 - }, - { - "epoch": 1.72, - "learning_rate": 8.102588884376827e-07, - "loss": 0.6709, - "step": 67179 - }, - { - "epoch": 1.72, - "learning_rate": 8.10231720713567e-07, - "loss": 0.5718, - "step": 67180 - }, - { - "epoch": 1.72, - "learning_rate": 8.102045531347478e-07, - "loss": 0.6445, - "step": 67181 - }, - { - "epoch": 1.72, - "learning_rate": 8.101773857012466e-07, - "loss": 0.6328, - "step": 67182 - }, - { - "epoch": 1.72, - "learning_rate": 8.101502184130837e-07, - "loss": 0.6343, - "step": 67183 - }, - { - "epoch": 1.72, - "learning_rate": 8.101230512702799e-07, - "loss": 0.6958, - "step": 67184 - }, - { - "epoch": 1.72, - "learning_rate": 8.100958842728564e-07, - "loss": 0.5537, - "step": 67185 - }, - { - "epoch": 1.72, - "learning_rate": 8.100687174208334e-07, - "loss": 0.7271, - "step": 67186 - }, - { - "epoch": 1.72, - "learning_rate": 8.100415507142323e-07, - "loss": 0.7402, - "step": 67187 - }, - { - "epoch": 1.72, - "learning_rate": 8.100143841530735e-07, - "loss": 0.6299, - "step": 67188 - }, - { - "epoch": 1.72, - "learning_rate": 8.09987217737378e-07, - "loss": 0.6289, - "step": 67189 - }, - { - "epoch": 1.72, - "learning_rate": 8.099600514671666e-07, - "loss": 0.7529, - "step": 67190 - }, - { - "epoch": 1.72, - "learning_rate": 8.099328853424601e-07, - "loss": 0.6714, - "step": 67191 - }, - { - "epoch": 1.72, - "learning_rate": 8.099057193632795e-07, - "loss": 0.6523, - "step": 67192 - }, - { - "epoch": 1.72, - "learning_rate": 8.098785535296448e-07, - "loss": 0.7676, - "step": 67193 - }, - { - "epoch": 1.72, - "learning_rate": 8.098513878415778e-07, - "loss": 0.7251, - "step": 67194 - }, - { - "epoch": 1.72, - "learning_rate": 8.098242222990985e-07, - "loss": 0.6372, - "step": 67195 - }, - { - "epoch": 1.72, - "learning_rate": 8.097970569022283e-07, - "loss": 0.5283, - "step": 67196 - }, - { - "epoch": 1.72, - "learning_rate": 8.097698916509876e-07, - "loss": 0.5391, - "step": 67197 - }, - { - "epoch": 1.72, - "learning_rate": 8.097427265453974e-07, - "loss": 0.6289, - "step": 67198 - }, - { - "epoch": 1.72, - "learning_rate": 8.097155615854785e-07, - "loss": 0.6538, - "step": 67199 - }, - { - "epoch": 1.72, - "learning_rate": 8.096883967712513e-07, - "loss": 0.583, - "step": 67200 - }, - { - "epoch": 1.72, - "learning_rate": 8.096612321027374e-07, - "loss": 0.667, - "step": 67201 - }, - { - "epoch": 1.72, - "learning_rate": 8.096340675799572e-07, - "loss": 0.8018, - "step": 67202 - }, - { - "epoch": 1.72, - "learning_rate": 8.096069032029311e-07, - "loss": 0.6558, - "step": 67203 - }, - { - "epoch": 1.72, - "learning_rate": 8.095797389716804e-07, - "loss": 0.582, - "step": 67204 - }, - { - "epoch": 1.72, - "learning_rate": 8.095525748862257e-07, - "loss": 0.55, - "step": 67205 - }, - { - "epoch": 1.72, - "learning_rate": 8.095254109465878e-07, - "loss": 0.6768, - "step": 67206 - }, - { - "epoch": 1.72, - "learning_rate": 8.094982471527873e-07, - "loss": 0.6543, - "step": 67207 - }, - { - "epoch": 1.72, - "learning_rate": 8.094710835048457e-07, - "loss": 0.5894, - "step": 67208 - }, - { - "epoch": 1.72, - "learning_rate": 8.094439200027829e-07, - "loss": 0.5983, - "step": 67209 - }, - { - "epoch": 1.72, - "learning_rate": 8.094167566466204e-07, - "loss": 0.6875, - "step": 67210 - }, - { - "epoch": 1.72, - "learning_rate": 8.093895934363785e-07, - "loss": 0.6426, - "step": 67211 - }, - { - "epoch": 1.72, - "learning_rate": 8.093624303720788e-07, - "loss": 0.749, - "step": 67212 - }, - { - "epoch": 1.72, - "learning_rate": 8.093352674537412e-07, - "loss": 0.3982, - "step": 67213 - }, - { - "epoch": 1.72, - "learning_rate": 8.093081046813868e-07, - "loss": 0.8145, - "step": 67214 - }, - { - "epoch": 1.72, - "learning_rate": 8.092809420550363e-07, - "loss": 0.6963, - "step": 67215 - }, - { - "epoch": 1.72, - "learning_rate": 8.092537795747108e-07, - "loss": 0.605, - "step": 67216 - }, - { - "epoch": 1.72, - "learning_rate": 8.092266172404305e-07, - "loss": 0.605, - "step": 67217 - }, - { - "epoch": 1.72, - "learning_rate": 8.09199455052217e-07, - "loss": 0.5007, - "step": 67218 - }, - { - "epoch": 1.72, - "learning_rate": 8.091722930100904e-07, - "loss": 0.554, - "step": 67219 - }, - { - "epoch": 1.72, - "learning_rate": 8.091451311140721e-07, - "loss": 0.4814, - "step": 67220 - }, - { - "epoch": 1.72, - "learning_rate": 8.091179693641823e-07, - "loss": 0.5942, - "step": 67221 - }, - { - "epoch": 1.72, - "learning_rate": 8.090908077604426e-07, - "loss": 0.5781, - "step": 67222 - }, - { - "epoch": 1.72, - "learning_rate": 8.09063646302873e-07, - "loss": 0.5117, - "step": 67223 - }, - { - "epoch": 1.72, - "learning_rate": 8.090364849914945e-07, - "loss": 0.6523, - "step": 67224 - }, - { - "epoch": 1.72, - "learning_rate": 8.090093238263281e-07, - "loss": 0.5786, - "step": 67225 - }, - { - "epoch": 1.72, - "learning_rate": 8.089821628073943e-07, - "loss": 0.5698, - "step": 67226 - }, - { - "epoch": 1.72, - "learning_rate": 8.089550019347142e-07, - "loss": 0.4849, - "step": 67227 - }, - { - "epoch": 1.72, - "learning_rate": 8.089278412083084e-07, - "loss": 0.6943, - "step": 67228 - }, - { - "epoch": 1.72, - "learning_rate": 8.08900680628198e-07, - "loss": 0.6348, - "step": 67229 - }, - { - "epoch": 1.72, - "learning_rate": 8.088735201944031e-07, - "loss": 0.5815, - "step": 67230 - }, - { - "epoch": 1.72, - "learning_rate": 8.088463599069454e-07, - "loss": 0.6934, - "step": 67231 - }, - { - "epoch": 1.72, - "learning_rate": 8.088191997658453e-07, - "loss": 0.5996, - "step": 67232 - }, - { - "epoch": 1.72, - "learning_rate": 8.087920397711236e-07, - "loss": 0.6885, - "step": 67233 - }, - { - "epoch": 1.72, - "learning_rate": 8.087648799228006e-07, - "loss": 0.6309, - "step": 67234 - }, - { - "epoch": 1.72, - "learning_rate": 8.087377202208978e-07, - "loss": 0.7129, - "step": 67235 - }, - { - "epoch": 1.72, - "learning_rate": 8.087105606654355e-07, - "loss": 0.6807, - "step": 67236 - }, - { - "epoch": 1.72, - "learning_rate": 8.08683401256435e-07, - "loss": 0.8564, - "step": 67237 - }, - { - "epoch": 1.72, - "learning_rate": 8.086562419939166e-07, - "loss": 0.4568, - "step": 67238 - }, - { - "epoch": 1.72, - "learning_rate": 8.086290828779015e-07, - "loss": 0.6782, - "step": 67239 - }, - { - "epoch": 1.72, - "learning_rate": 8.086019239084101e-07, - "loss": 0.4985, - "step": 67240 - }, - { - "epoch": 1.72, - "learning_rate": 8.085747650854636e-07, - "loss": 0.4873, - "step": 67241 - }, - { - "epoch": 1.72, - "learning_rate": 8.085476064090828e-07, - "loss": 0.7422, - "step": 67242 - }, - { - "epoch": 1.72, - "learning_rate": 8.08520447879288e-07, - "loss": 0.4656, - "step": 67243 - }, - { - "epoch": 1.72, - "learning_rate": 8.084932894961004e-07, - "loss": 0.6011, - "step": 67244 - }, - { - "epoch": 1.72, - "learning_rate": 8.084661312595405e-07, - "loss": 0.4176, - "step": 67245 - }, - { - "epoch": 1.72, - "learning_rate": 8.084389731696295e-07, - "loss": 0.6631, - "step": 67246 - }, - { - "epoch": 1.72, - "learning_rate": 8.084118152263877e-07, - "loss": 0.6807, - "step": 67247 - }, - { - "epoch": 1.72, - "learning_rate": 8.083846574298363e-07, - "loss": 0.6885, - "step": 67248 - }, - { - "epoch": 1.72, - "learning_rate": 8.083574997799958e-07, - "loss": 0.6421, - "step": 67249 - }, - { - "epoch": 1.72, - "learning_rate": 8.083303422768875e-07, - "loss": 0.6226, - "step": 67250 - }, - { - "epoch": 1.72, - "learning_rate": 8.083031849205315e-07, - "loss": 0.5991, - "step": 67251 - }, - { - "epoch": 1.72, - "learning_rate": 8.082760277109497e-07, - "loss": 0.4849, - "step": 67252 - }, - { - "epoch": 1.72, - "learning_rate": 8.082488706481613e-07, - "loss": 0.6357, - "step": 67253 - }, - { - "epoch": 1.72, - "learning_rate": 8.082217137321882e-07, - "loss": 0.8027, - "step": 67254 - }, - { - "epoch": 1.72, - "learning_rate": 8.081945569630508e-07, - "loss": 0.7461, - "step": 67255 - }, - { - "epoch": 1.72, - "learning_rate": 8.081674003407702e-07, - "loss": 0.7144, - "step": 67256 - }, - { - "epoch": 1.72, - "learning_rate": 8.081402438653668e-07, - "loss": 0.6914, - "step": 67257 - }, - { - "epoch": 1.72, - "learning_rate": 8.081130875368618e-07, - "loss": 0.573, - "step": 67258 - }, - { - "epoch": 1.72, - "learning_rate": 8.080859313552755e-07, - "loss": 0.7197, - "step": 67259 - }, - { - "epoch": 1.72, - "learning_rate": 8.080587753206293e-07, - "loss": 0.3683, - "step": 67260 - }, - { - "epoch": 1.72, - "learning_rate": 8.080316194329433e-07, - "loss": 0.5571, - "step": 67261 - }, - { - "epoch": 1.72, - "learning_rate": 8.080044636922392e-07, - "loss": 0.6733, - "step": 67262 - }, - { - "epoch": 1.72, - "learning_rate": 8.07977308098537e-07, - "loss": 0.6914, - "step": 67263 - }, - { - "epoch": 1.72, - "learning_rate": 8.079501526518576e-07, - "loss": 0.5298, - "step": 67264 - }, - { - "epoch": 1.72, - "learning_rate": 8.07922997352222e-07, - "loss": 0.6191, - "step": 67265 - }, - { - "epoch": 1.72, - "learning_rate": 8.078958421996509e-07, - "loss": 0.478, - "step": 67266 - }, - { - "epoch": 1.72, - "learning_rate": 8.078686871941652e-07, - "loss": 0.5864, - "step": 67267 - }, - { - "epoch": 1.72, - "learning_rate": 8.078415323357855e-07, - "loss": 0.5752, - "step": 67268 - }, - { - "epoch": 1.72, - "learning_rate": 8.078143776245327e-07, - "loss": 0.457, - "step": 67269 - }, - { - "epoch": 1.72, - "learning_rate": 8.077872230604279e-07, - "loss": 0.6807, - "step": 67270 - }, - { - "epoch": 1.72, - "learning_rate": 8.077600686434913e-07, - "loss": 0.6025, - "step": 67271 - }, - { - "epoch": 1.72, - "learning_rate": 8.077329143737443e-07, - "loss": 0.6729, - "step": 67272 - }, - { - "epoch": 1.72, - "learning_rate": 8.07705760251207e-07, - "loss": 0.7681, - "step": 67273 - }, - { - "epoch": 1.72, - "learning_rate": 8.076786062759007e-07, - "loss": 0.4907, - "step": 67274 - }, - { - "epoch": 1.72, - "learning_rate": 8.076514524478461e-07, - "loss": 0.3872, - "step": 67275 - }, - { - "epoch": 1.72, - "learning_rate": 8.076242987670637e-07, - "loss": 0.7061, - "step": 67276 - }, - { - "epoch": 1.72, - "learning_rate": 8.075971452335747e-07, - "loss": 0.6213, - "step": 67277 - }, - { - "epoch": 1.72, - "learning_rate": 8.075699918473995e-07, - "loss": 0.5381, - "step": 67278 - }, - { - "epoch": 1.72, - "learning_rate": 8.075428386085595e-07, - "loss": 0.8379, - "step": 67279 - }, - { - "epoch": 1.72, - "learning_rate": 8.075156855170747e-07, - "loss": 0.5547, - "step": 67280 - }, - { - "epoch": 1.72, - "learning_rate": 8.074885325729666e-07, - "loss": 0.6133, - "step": 67281 - }, - { - "epoch": 1.72, - "learning_rate": 8.074613797762558e-07, - "loss": 0.5542, - "step": 67282 - }, - { - "epoch": 1.72, - "learning_rate": 8.074342271269627e-07, - "loss": 0.5728, - "step": 67283 - }, - { - "epoch": 1.72, - "learning_rate": 8.074070746251083e-07, - "loss": 0.6455, - "step": 67284 - }, - { - "epoch": 1.72, - "learning_rate": 8.073799222707135e-07, - "loss": 0.5552, - "step": 67285 - }, - { - "epoch": 1.72, - "learning_rate": 8.073527700637992e-07, - "loss": 0.5295, - "step": 67286 - }, - { - "epoch": 1.72, - "learning_rate": 8.073256180043859e-07, - "loss": 0.7324, - "step": 67287 - }, - { - "epoch": 1.72, - "learning_rate": 8.072984660924944e-07, - "loss": 0.3894, - "step": 67288 - }, - { - "epoch": 1.72, - "learning_rate": 8.072713143281459e-07, - "loss": 0.6426, - "step": 67289 - }, - { - "epoch": 1.72, - "learning_rate": 8.072441627113605e-07, - "loss": 0.709, - "step": 67290 - }, - { - "epoch": 1.72, - "learning_rate": 8.072170112421597e-07, - "loss": 0.6465, - "step": 67291 - }, - { - "epoch": 1.72, - "learning_rate": 8.071898599205642e-07, - "loss": 0.625, - "step": 67292 - }, - { - "epoch": 1.72, - "learning_rate": 8.071627087465941e-07, - "loss": 0.606, - "step": 67293 - }, - { - "epoch": 1.72, - "learning_rate": 8.071355577202709e-07, - "loss": 0.6973, - "step": 67294 - }, - { - "epoch": 1.72, - "learning_rate": 8.071084068416149e-07, - "loss": 0.71, - "step": 67295 - }, - { - "epoch": 1.72, - "learning_rate": 8.070812561106472e-07, - "loss": 0.584, - "step": 67296 - }, - { - "epoch": 1.72, - "learning_rate": 8.070541055273884e-07, - "loss": 0.5654, - "step": 67297 - }, - { - "epoch": 1.72, - "learning_rate": 8.070269550918597e-07, - "loss": 0.6147, - "step": 67298 - }, - { - "epoch": 1.72, - "learning_rate": 8.069998048040813e-07, - "loss": 0.6528, - "step": 67299 - }, - { - "epoch": 1.72, - "learning_rate": 8.069726546640745e-07, - "loss": 0.6543, - "step": 67300 - }, - { - "epoch": 1.72, - "learning_rate": 8.069455046718596e-07, - "loss": 0.6719, - "step": 67301 - }, - { - "epoch": 1.72, - "learning_rate": 8.069183548274581e-07, - "loss": 0.6328, - "step": 67302 - }, - { - "epoch": 1.73, - "learning_rate": 8.068912051308901e-07, - "loss": 0.4861, - "step": 67303 - }, - { - "epoch": 1.73, - "learning_rate": 8.068640555821768e-07, - "loss": 0.7256, - "step": 67304 - }, - { - "epoch": 1.73, - "learning_rate": 8.068369061813384e-07, - "loss": 0.4995, - "step": 67305 - }, - { - "epoch": 1.73, - "learning_rate": 8.068097569283964e-07, - "loss": 0.5869, - "step": 67306 - }, - { - "epoch": 1.73, - "learning_rate": 8.06782607823371e-07, - "loss": 0.583, - "step": 67307 - }, - { - "epoch": 1.73, - "learning_rate": 8.067554588662835e-07, - "loss": 0.7461, - "step": 67308 - }, - { - "epoch": 1.73, - "learning_rate": 8.067283100571542e-07, - "loss": 0.6616, - "step": 67309 - }, - { - "epoch": 1.73, - "learning_rate": 8.067011613960045e-07, - "loss": 0.6924, - "step": 67310 - }, - { - "epoch": 1.73, - "learning_rate": 8.066740128828546e-07, - "loss": 0.5754, - "step": 67311 - }, - { - "epoch": 1.73, - "learning_rate": 8.066468645177259e-07, - "loss": 0.6133, - "step": 67312 - }, - { - "epoch": 1.73, - "learning_rate": 8.066197163006386e-07, - "loss": 0.7256, - "step": 67313 - }, - { - "epoch": 1.73, - "learning_rate": 8.065925682316135e-07, - "loss": 0.4976, - "step": 67314 - }, - { - "epoch": 1.73, - "learning_rate": 8.065654203106717e-07, - "loss": 0.6689, - "step": 67315 - }, - { - "epoch": 1.73, - "learning_rate": 8.065382725378337e-07, - "loss": 0.7178, - "step": 67316 - }, - { - "epoch": 1.73, - "learning_rate": 8.065111249131207e-07, - "loss": 0.4836, - "step": 67317 - }, - { - "epoch": 1.73, - "learning_rate": 8.064839774365531e-07, - "loss": 0.7109, - "step": 67318 - }, - { - "epoch": 1.73, - "learning_rate": 8.064568301081518e-07, - "loss": 0.6826, - "step": 67319 - }, - { - "epoch": 1.73, - "learning_rate": 8.064296829279375e-07, - "loss": 0.6787, - "step": 67320 - }, - { - "epoch": 1.73, - "learning_rate": 8.064025358959314e-07, - "loss": 0.5874, - "step": 67321 - }, - { - "epoch": 1.73, - "learning_rate": 8.063753890121541e-07, - "loss": 0.6748, - "step": 67322 - }, - { - "epoch": 1.73, - "learning_rate": 8.063482422766261e-07, - "loss": 0.5542, - "step": 67323 - }, - { - "epoch": 1.73, - "learning_rate": 8.06321095689368e-07, - "loss": 0.7432, - "step": 67324 - }, - { - "epoch": 1.73, - "learning_rate": 8.062939492504012e-07, - "loss": 0.71, - "step": 67325 - }, - { - "epoch": 1.73, - "learning_rate": 8.062668029597461e-07, - "loss": 0.7021, - "step": 67326 - }, - { - "epoch": 1.73, - "learning_rate": 8.062396568174238e-07, - "loss": 0.6309, - "step": 67327 - }, - { - "epoch": 1.73, - "learning_rate": 8.062125108234547e-07, - "loss": 0.5254, - "step": 67328 - }, - { - "epoch": 1.73, - "learning_rate": 8.061853649778598e-07, - "loss": 0.7178, - "step": 67329 - }, - { - "epoch": 1.73, - "learning_rate": 8.061582192806599e-07, - "loss": 0.5605, - "step": 67330 - }, - { - "epoch": 1.73, - "learning_rate": 8.061310737318757e-07, - "loss": 0.5708, - "step": 67331 - }, - { - "epoch": 1.73, - "learning_rate": 8.061039283315284e-07, - "loss": 0.4834, - "step": 67332 - }, - { - "epoch": 1.73, - "learning_rate": 8.060767830796379e-07, - "loss": 0.6562, - "step": 67333 - }, - { - "epoch": 1.73, - "learning_rate": 8.060496379762257e-07, - "loss": 0.7812, - "step": 67334 - }, - { - "epoch": 1.73, - "learning_rate": 8.060224930213121e-07, - "loss": 0.6865, - "step": 67335 - }, - { - "epoch": 1.73, - "learning_rate": 8.059953482149186e-07, - "loss": 0.7568, - "step": 67336 - }, - { - "epoch": 1.73, - "learning_rate": 8.059682035570651e-07, - "loss": 0.6802, - "step": 67337 - }, - { - "epoch": 1.73, - "learning_rate": 8.059410590477732e-07, - "loss": 0.6934, - "step": 67338 - }, - { - "epoch": 1.73, - "learning_rate": 8.05913914687063e-07, - "loss": 0.6948, - "step": 67339 - }, - { - "epoch": 1.73, - "learning_rate": 8.058867704749559e-07, - "loss": 0.6367, - "step": 67340 - }, - { - "epoch": 1.73, - "learning_rate": 8.058596264114719e-07, - "loss": 0.6057, - "step": 67341 - }, - { - "epoch": 1.73, - "learning_rate": 8.058324824966332e-07, - "loss": 0.7129, - "step": 67342 - }, - { - "epoch": 1.73, - "learning_rate": 8.058053387304588e-07, - "loss": 0.6555, - "step": 67343 - }, - { - "epoch": 1.73, - "learning_rate": 8.057781951129708e-07, - "loss": 0.7451, - "step": 67344 - }, - { - "epoch": 1.73, - "learning_rate": 8.05751051644189e-07, - "loss": 0.6758, - "step": 67345 - }, - { - "epoch": 1.73, - "learning_rate": 8.05723908324135e-07, - "loss": 0.5957, - "step": 67346 - }, - { - "epoch": 1.73, - "learning_rate": 8.056967651528292e-07, - "loss": 0.5088, - "step": 67347 - }, - { - "epoch": 1.73, - "learning_rate": 8.056696221302924e-07, - "loss": 0.5767, - "step": 67348 - }, - { - "epoch": 1.73, - "learning_rate": 8.056424792565454e-07, - "loss": 0.5483, - "step": 67349 - }, - { - "epoch": 1.73, - "learning_rate": 8.056153365316092e-07, - "loss": 0.4844, - "step": 67350 - }, - { - "epoch": 1.73, - "learning_rate": 8.055881939555041e-07, - "loss": 0.8154, - "step": 67351 - }, - { - "epoch": 1.73, - "learning_rate": 8.055610515282517e-07, - "loss": 0.6553, - "step": 67352 - }, - { - "epoch": 1.73, - "learning_rate": 8.055339092498721e-07, - "loss": 0.573, - "step": 67353 - }, - { - "epoch": 1.73, - "learning_rate": 8.055067671203859e-07, - "loss": 0.6807, - "step": 67354 - }, - { - "epoch": 1.73, - "learning_rate": 8.054796251398145e-07, - "loss": 0.626, - "step": 67355 - }, - { - "epoch": 1.73, - "learning_rate": 8.054524833081782e-07, - "loss": 0.6348, - "step": 67356 - }, - { - "epoch": 1.73, - "learning_rate": 8.054253416254982e-07, - "loss": 0.8086, - "step": 67357 - }, - { - "epoch": 1.73, - "learning_rate": 8.053982000917948e-07, - "loss": 0.5753, - "step": 67358 - }, - { - "epoch": 1.73, - "learning_rate": 8.053710587070894e-07, - "loss": 0.6294, - "step": 67359 - }, - { - "epoch": 1.73, - "learning_rate": 8.053439174714023e-07, - "loss": 0.6084, - "step": 67360 - }, - { - "epoch": 1.73, - "learning_rate": 8.053167763847543e-07, - "loss": 0.6323, - "step": 67361 - }, - { - "epoch": 1.73, - "learning_rate": 8.052896354471666e-07, - "loss": 0.3367, - "step": 67362 - }, - { - "epoch": 1.73, - "learning_rate": 8.052624946586595e-07, - "loss": 0.6353, - "step": 67363 - }, - { - "epoch": 1.73, - "learning_rate": 8.052353540192538e-07, - "loss": 0.6611, - "step": 67364 - }, - { - "epoch": 1.73, - "learning_rate": 8.052082135289706e-07, - "loss": 0.6333, - "step": 67365 - }, - { - "epoch": 1.73, - "learning_rate": 8.051810731878304e-07, - "loss": 0.8057, - "step": 67366 - }, - { - "epoch": 1.73, - "learning_rate": 8.051539329958541e-07, - "loss": 0.583, - "step": 67367 - }, - { - "epoch": 1.73, - "learning_rate": 8.051267929530624e-07, - "loss": 0.7012, - "step": 67368 - }, - { - "epoch": 1.73, - "learning_rate": 8.050996530594764e-07, - "loss": 0.8379, - "step": 67369 - }, - { - "epoch": 1.73, - "learning_rate": 8.050725133151164e-07, - "loss": 0.4436, - "step": 67370 - }, - { - "epoch": 1.73, - "learning_rate": 8.050453737200036e-07, - "loss": 0.4143, - "step": 67371 - }, - { - "epoch": 1.73, - "learning_rate": 8.050182342741587e-07, - "loss": 0.7363, - "step": 67372 - }, - { - "epoch": 1.73, - "learning_rate": 8.049910949776021e-07, - "loss": 0.6924, - "step": 67373 - }, - { - "epoch": 1.73, - "learning_rate": 8.049639558303549e-07, - "loss": 0.707, - "step": 67374 - }, - { - "epoch": 1.73, - "learning_rate": 8.049368168324378e-07, - "loss": 0.6904, - "step": 67375 - }, - { - "epoch": 1.73, - "learning_rate": 8.049096779838717e-07, - "loss": 0.4886, - "step": 67376 - }, - { - "epoch": 1.73, - "learning_rate": 8.048825392846774e-07, - "loss": 0.7627, - "step": 67377 - }, - { - "epoch": 1.73, - "learning_rate": 8.048554007348753e-07, - "loss": 0.604, - "step": 67378 - }, - { - "epoch": 1.73, - "learning_rate": 8.048282623344867e-07, - "loss": 0.4971, - "step": 67379 - }, - { - "epoch": 1.73, - "learning_rate": 8.048011240835318e-07, - "loss": 0.6152, - "step": 67380 - }, - { - "epoch": 1.73, - "learning_rate": 8.047739859820322e-07, - "loss": 0.5339, - "step": 67381 - }, - { - "epoch": 1.73, - "learning_rate": 8.04746848030008e-07, - "loss": 0.4279, - "step": 67382 - }, - { - "epoch": 1.73, - "learning_rate": 8.047197102274798e-07, - "loss": 0.6011, - "step": 67383 - }, - { - "epoch": 1.73, - "learning_rate": 8.046925725744692e-07, - "loss": 0.7471, - "step": 67384 - }, - { - "epoch": 1.73, - "learning_rate": 8.046654350709962e-07, - "loss": 0.9062, - "step": 67385 - }, - { - "epoch": 1.73, - "learning_rate": 8.04638297717082e-07, - "loss": 0.623, - "step": 67386 - }, - { - "epoch": 1.73, - "learning_rate": 8.046111605127471e-07, - "loss": 0.6226, - "step": 67387 - }, - { - "epoch": 1.73, - "learning_rate": 8.045840234580128e-07, - "loss": 0.6816, - "step": 67388 - }, - { - "epoch": 1.73, - "learning_rate": 8.045568865528991e-07, - "loss": 0.7783, - "step": 67389 - }, - { - "epoch": 1.73, - "learning_rate": 8.045297497974276e-07, - "loss": 0.5479, - "step": 67390 - }, - { - "epoch": 1.73, - "learning_rate": 8.045026131916188e-07, - "loss": 0.7842, - "step": 67391 - }, - { - "epoch": 1.73, - "learning_rate": 8.04475476735493e-07, - "loss": 0.3367, - "step": 67392 - }, - { - "epoch": 1.73, - "learning_rate": 8.044483404290715e-07, - "loss": 0.5977, - "step": 67393 - }, - { - "epoch": 1.73, - "learning_rate": 8.044212042723749e-07, - "loss": 0.5278, - "step": 67394 - }, - { - "epoch": 1.73, - "learning_rate": 8.043940682654238e-07, - "loss": 0.6599, - "step": 67395 - }, - { - "epoch": 1.73, - "learning_rate": 8.043669324082394e-07, - "loss": 0.7969, - "step": 67396 - }, - { - "epoch": 1.73, - "learning_rate": 8.043397967008421e-07, - "loss": 0.6118, - "step": 67397 - }, - { - "epoch": 1.73, - "learning_rate": 8.043126611432529e-07, - "loss": 0.5859, - "step": 67398 - }, - { - "epoch": 1.73, - "learning_rate": 8.042855257354923e-07, - "loss": 0.6763, - "step": 67399 - }, - { - "epoch": 1.73, - "learning_rate": 8.042583904775814e-07, - "loss": 0.7725, - "step": 67400 - }, - { - "epoch": 1.73, - "learning_rate": 8.042312553695414e-07, - "loss": 0.731, - "step": 67401 - }, - { - "epoch": 1.73, - "learning_rate": 8.042041204113918e-07, - "loss": 0.5996, - "step": 67402 - }, - { - "epoch": 1.73, - "learning_rate": 8.041769856031544e-07, - "loss": 0.5591, - "step": 67403 - }, - { - "epoch": 1.73, - "learning_rate": 8.041498509448494e-07, - "loss": 0.6494, - "step": 67404 - }, - { - "epoch": 1.73, - "learning_rate": 8.041227164364982e-07, - "loss": 0.6689, - "step": 67405 - }, - { - "epoch": 1.73, - "learning_rate": 8.04095582078121e-07, - "loss": 0.5938, - "step": 67406 - }, - { - "epoch": 1.73, - "learning_rate": 8.040684478697389e-07, - "loss": 0.4883, - "step": 67407 - }, - { - "epoch": 1.73, - "learning_rate": 8.040413138113724e-07, - "loss": 0.6348, - "step": 67408 - }, - { - "epoch": 1.73, - "learning_rate": 8.040141799030428e-07, - "loss": 0.5781, - "step": 67409 - }, - { - "epoch": 1.73, - "learning_rate": 8.039870461447702e-07, - "loss": 0.5762, - "step": 67410 - }, - { - "epoch": 1.73, - "learning_rate": 8.039599125365763e-07, - "loss": 0.5586, - "step": 67411 - }, - { - "epoch": 1.73, - "learning_rate": 8.039327790784808e-07, - "loss": 0.7075, - "step": 67412 - }, - { - "epoch": 1.73, - "learning_rate": 8.03905645770505e-07, - "loss": 0.6221, - "step": 67413 - }, - { - "epoch": 1.73, - "learning_rate": 8.038785126126694e-07, - "loss": 0.6953, - "step": 67414 - }, - { - "epoch": 1.73, - "learning_rate": 8.038513796049954e-07, - "loss": 0.6646, - "step": 67415 - }, - { - "epoch": 1.73, - "learning_rate": 8.038242467475032e-07, - "loss": 0.7314, - "step": 67416 - }, - { - "epoch": 1.73, - "learning_rate": 8.037971140402138e-07, - "loss": 0.7227, - "step": 67417 - }, - { - "epoch": 1.73, - "learning_rate": 8.037699814831477e-07, - "loss": 0.7344, - "step": 67418 - }, - { - "epoch": 1.73, - "learning_rate": 8.037428490763262e-07, - "loss": 0.4812, - "step": 67419 - }, - { - "epoch": 1.73, - "learning_rate": 8.037157168197695e-07, - "loss": 0.6021, - "step": 67420 - }, - { - "epoch": 1.73, - "learning_rate": 8.036885847134991e-07, - "loss": 0.4878, - "step": 67421 - }, - { - "epoch": 1.73, - "learning_rate": 8.036614527575352e-07, - "loss": 0.6641, - "step": 67422 - }, - { - "epoch": 1.73, - "learning_rate": 8.036343209518983e-07, - "loss": 0.5728, - "step": 67423 - }, - { - "epoch": 1.73, - "learning_rate": 8.0360718929661e-07, - "loss": 0.6543, - "step": 67424 - }, - { - "epoch": 1.73, - "learning_rate": 8.035800577916902e-07, - "loss": 0.5686, - "step": 67425 - }, - { - "epoch": 1.73, - "learning_rate": 8.035529264371605e-07, - "loss": 0.8232, - "step": 67426 - }, - { - "epoch": 1.73, - "learning_rate": 8.035257952330411e-07, - "loss": 0.8418, - "step": 67427 - }, - { - "epoch": 1.73, - "learning_rate": 8.034986641793531e-07, - "loss": 0.6274, - "step": 67428 - }, - { - "epoch": 1.73, - "learning_rate": 8.03471533276117e-07, - "loss": 0.4644, - "step": 67429 - }, - { - "epoch": 1.73, - "learning_rate": 8.034444025233537e-07, - "loss": 0.6318, - "step": 67430 - }, - { - "epoch": 1.73, - "learning_rate": 8.034172719210845e-07, - "loss": 0.7207, - "step": 67431 - }, - { - "epoch": 1.73, - "learning_rate": 8.033901414693292e-07, - "loss": 0.571, - "step": 67432 - }, - { - "epoch": 1.73, - "learning_rate": 8.033630111681089e-07, - "loss": 0.4241, - "step": 67433 - }, - { - "epoch": 1.73, - "learning_rate": 8.033358810174448e-07, - "loss": 0.5487, - "step": 67434 - }, - { - "epoch": 1.73, - "learning_rate": 8.033087510173571e-07, - "loss": 0.5913, - "step": 67435 - }, - { - "epoch": 1.73, - "learning_rate": 8.03281621167867e-07, - "loss": 0.5078, - "step": 67436 - }, - { - "epoch": 1.73, - "learning_rate": 8.032544914689949e-07, - "loss": 0.5947, - "step": 67437 - }, - { - "epoch": 1.73, - "learning_rate": 8.032273619207621e-07, - "loss": 0.6436, - "step": 67438 - }, - { - "epoch": 1.73, - "learning_rate": 8.032002325231888e-07, - "loss": 0.4116, - "step": 67439 - }, - { - "epoch": 1.73, - "learning_rate": 8.031731032762963e-07, - "loss": 0.6934, - "step": 67440 - }, - { - "epoch": 1.73, - "learning_rate": 8.031459741801052e-07, - "loss": 0.7266, - "step": 67441 - }, - { - "epoch": 1.73, - "learning_rate": 8.031188452346358e-07, - "loss": 0.6289, - "step": 67442 - }, - { - "epoch": 1.73, - "learning_rate": 8.030917164399094e-07, - "loss": 0.7231, - "step": 67443 - }, - { - "epoch": 1.73, - "learning_rate": 8.030645877959465e-07, - "loss": 0.6055, - "step": 67444 - }, - { - "epoch": 1.73, - "learning_rate": 8.030374593027682e-07, - "loss": 0.5977, - "step": 67445 - }, - { - "epoch": 1.73, - "learning_rate": 8.030103309603948e-07, - "loss": 0.7568, - "step": 67446 - }, - { - "epoch": 1.73, - "learning_rate": 8.029832027688477e-07, - "loss": 0.5901, - "step": 67447 - }, - { - "epoch": 1.73, - "learning_rate": 8.02956074728147e-07, - "loss": 0.7124, - "step": 67448 - }, - { - "epoch": 1.73, - "learning_rate": 8.02928946838314e-07, - "loss": 0.5063, - "step": 67449 - }, - { - "epoch": 1.73, - "learning_rate": 8.02901819099369e-07, - "loss": 0.54, - "step": 67450 - }, - { - "epoch": 1.73, - "learning_rate": 8.028746915113336e-07, - "loss": 0.5132, - "step": 67451 - }, - { - "epoch": 1.73, - "learning_rate": 8.028475640742273e-07, - "loss": 0.4878, - "step": 67452 - }, - { - "epoch": 1.73, - "learning_rate": 8.028204367880719e-07, - "loss": 0.5352, - "step": 67453 - }, - { - "epoch": 1.73, - "learning_rate": 8.027933096528875e-07, - "loss": 0.8701, - "step": 67454 - }, - { - "epoch": 1.73, - "learning_rate": 8.027661826686955e-07, - "loss": 0.666, - "step": 67455 - }, - { - "epoch": 1.73, - "learning_rate": 8.02739055835516e-07, - "loss": 0.4695, - "step": 67456 - }, - { - "epoch": 1.73, - "learning_rate": 8.027119291533706e-07, - "loss": 0.5449, - "step": 67457 - }, - { - "epoch": 1.73, - "learning_rate": 8.026848026222792e-07, - "loss": 0.7236, - "step": 67458 - }, - { - "epoch": 1.73, - "learning_rate": 8.026576762422632e-07, - "loss": 0.4275, - "step": 67459 - }, - { - "epoch": 1.73, - "learning_rate": 8.02630550013343e-07, - "loss": 0.5635, - "step": 67460 - }, - { - "epoch": 1.73, - "learning_rate": 8.026034239355399e-07, - "loss": 0.6182, - "step": 67461 - }, - { - "epoch": 1.73, - "learning_rate": 8.025762980088742e-07, - "loss": 0.5767, - "step": 67462 - }, - { - "epoch": 1.73, - "learning_rate": 8.025491722333664e-07, - "loss": 0.686, - "step": 67463 - }, - { - "epoch": 1.73, - "learning_rate": 8.025220466090378e-07, - "loss": 0.7314, - "step": 67464 - }, - { - "epoch": 1.73, - "learning_rate": 8.024949211359089e-07, - "loss": 0.5415, - "step": 67465 - }, - { - "epoch": 1.73, - "learning_rate": 8.024677958140007e-07, - "loss": 0.5811, - "step": 67466 - }, - { - "epoch": 1.73, - "learning_rate": 8.024406706433338e-07, - "loss": 0.6416, - "step": 67467 - }, - { - "epoch": 1.73, - "learning_rate": 8.024135456239289e-07, - "loss": 0.6714, - "step": 67468 - }, - { - "epoch": 1.73, - "learning_rate": 8.023864207558069e-07, - "loss": 0.4604, - "step": 67469 - }, - { - "epoch": 1.73, - "learning_rate": 8.023592960389884e-07, - "loss": 0.7656, - "step": 67470 - }, - { - "epoch": 1.73, - "learning_rate": 8.023321714734948e-07, - "loss": 0.542, - "step": 67471 - }, - { - "epoch": 1.73, - "learning_rate": 8.02305047059346e-07, - "loss": 0.7188, - "step": 67472 - }, - { - "epoch": 1.73, - "learning_rate": 8.02277922796563e-07, - "loss": 0.5049, - "step": 67473 - }, - { - "epoch": 1.73, - "learning_rate": 8.022507986851669e-07, - "loss": 0.562, - "step": 67474 - }, - { - "epoch": 1.73, - "learning_rate": 8.022236747251781e-07, - "loss": 0.7773, - "step": 67475 - }, - { - "epoch": 1.73, - "learning_rate": 8.021965509166178e-07, - "loss": 0.5591, - "step": 67476 - }, - { - "epoch": 1.73, - "learning_rate": 8.021694272595061e-07, - "loss": 0.7456, - "step": 67477 - }, - { - "epoch": 1.73, - "learning_rate": 8.021423037538646e-07, - "loss": 0.5835, - "step": 67478 - }, - { - "epoch": 1.73, - "learning_rate": 8.021151803997133e-07, - "loss": 0.4683, - "step": 67479 - }, - { - "epoch": 1.73, - "learning_rate": 8.020880571970735e-07, - "loss": 0.4727, - "step": 67480 - }, - { - "epoch": 1.73, - "learning_rate": 8.020609341459661e-07, - "loss": 0.5549, - "step": 67481 - }, - { - "epoch": 1.73, - "learning_rate": 8.02033811246411e-07, - "loss": 0.5894, - "step": 67482 - }, - { - "epoch": 1.73, - "learning_rate": 8.020066884984298e-07, - "loss": 0.6357, - "step": 67483 - }, - { - "epoch": 1.73, - "learning_rate": 8.01979565902043e-07, - "loss": 0.4526, - "step": 67484 - }, - { - "epoch": 1.73, - "learning_rate": 8.019524434572711e-07, - "loss": 0.7129, - "step": 67485 - }, - { - "epoch": 1.73, - "learning_rate": 8.019253211641352e-07, - "loss": 0.7285, - "step": 67486 - }, - { - "epoch": 1.73, - "learning_rate": 8.018981990226558e-07, - "loss": 0.4316, - "step": 67487 - }, - { - "epoch": 1.73, - "learning_rate": 8.018710770328543e-07, - "loss": 0.7773, - "step": 67488 - }, - { - "epoch": 1.73, - "learning_rate": 8.018439551947505e-07, - "loss": 0.6846, - "step": 67489 - }, - { - "epoch": 1.73, - "learning_rate": 8.018168335083661e-07, - "loss": 0.6416, - "step": 67490 - }, - { - "epoch": 1.73, - "learning_rate": 8.017897119737215e-07, - "loss": 0.5835, - "step": 67491 - }, - { - "epoch": 1.73, - "learning_rate": 8.01762590590837e-07, - "loss": 0.7207, - "step": 67492 - }, - { - "epoch": 1.73, - "learning_rate": 8.01735469359734e-07, - "loss": 0.748, - "step": 67493 - }, - { - "epoch": 1.73, - "learning_rate": 8.017083482804329e-07, - "loss": 0.5449, - "step": 67494 - }, - { - "epoch": 1.73, - "learning_rate": 8.016812273529548e-07, - "loss": 0.6038, - "step": 67495 - }, - { - "epoch": 1.73, - "learning_rate": 8.016541065773199e-07, - "loss": 0.6987, - "step": 67496 - }, - { - "epoch": 1.73, - "learning_rate": 8.016269859535496e-07, - "loss": 0.7598, - "step": 67497 - }, - { - "epoch": 1.73, - "learning_rate": 8.015998654816642e-07, - "loss": 0.6709, - "step": 67498 - }, - { - "epoch": 1.73, - "learning_rate": 8.015727451616849e-07, - "loss": 0.6611, - "step": 67499 - }, - { - "epoch": 1.73, - "learning_rate": 8.01545624993632e-07, - "loss": 0.5483, - "step": 67500 - }, - { - "epoch": 1.73, - "learning_rate": 8.015185049775271e-07, - "loss": 0.6421, - "step": 67501 - }, - { - "epoch": 1.73, - "learning_rate": 8.014913851133897e-07, - "loss": 0.6069, - "step": 67502 - }, - { - "epoch": 1.73, - "learning_rate": 8.014642654012416e-07, - "loss": 0.708, - "step": 67503 - }, - { - "epoch": 1.73, - "learning_rate": 8.014371458411029e-07, - "loss": 0.5278, - "step": 67504 - }, - { - "epoch": 1.73, - "learning_rate": 8.014100264329947e-07, - "loss": 0.6445, - "step": 67505 - }, - { - "epoch": 1.73, - "learning_rate": 8.013829071769377e-07, - "loss": 0.7119, - "step": 67506 - }, - { - "epoch": 1.73, - "learning_rate": 8.013557880729528e-07, - "loss": 0.6279, - "step": 67507 - }, - { - "epoch": 1.73, - "learning_rate": 8.013286691210604e-07, - "loss": 0.606, - "step": 67508 - }, - { - "epoch": 1.73, - "learning_rate": 8.013015503212817e-07, - "loss": 0.792, - "step": 67509 - }, - { - "epoch": 1.73, - "learning_rate": 8.012744316736371e-07, - "loss": 0.5869, - "step": 67510 - }, - { - "epoch": 1.73, - "learning_rate": 8.01247313178148e-07, - "loss": 0.7354, - "step": 67511 - }, - { - "epoch": 1.73, - "learning_rate": 8.012201948348343e-07, - "loss": 0.3353, - "step": 67512 - }, - { - "epoch": 1.73, - "learning_rate": 8.011930766437171e-07, - "loss": 0.5918, - "step": 67513 - }, - { - "epoch": 1.73, - "learning_rate": 8.011659586048174e-07, - "loss": 0.5688, - "step": 67514 - }, - { - "epoch": 1.73, - "learning_rate": 8.011388407181556e-07, - "loss": 0.6455, - "step": 67515 - }, - { - "epoch": 1.73, - "learning_rate": 8.011117229837529e-07, - "loss": 0.5164, - "step": 67516 - }, - { - "epoch": 1.73, - "learning_rate": 8.010846054016295e-07, - "loss": 0.6621, - "step": 67517 - }, - { - "epoch": 1.73, - "learning_rate": 8.010574879718067e-07, - "loss": 0.6221, - "step": 67518 - }, - { - "epoch": 1.73, - "learning_rate": 8.01030370694305e-07, - "loss": 0.5723, - "step": 67519 - }, - { - "epoch": 1.73, - "learning_rate": 8.010032535691451e-07, - "loss": 0.6338, - "step": 67520 - }, - { - "epoch": 1.73, - "learning_rate": 8.009761365963482e-07, - "loss": 0.6167, - "step": 67521 - }, - { - "epoch": 1.73, - "learning_rate": 8.009490197759346e-07, - "loss": 0.7109, - "step": 67522 - }, - { - "epoch": 1.73, - "learning_rate": 8.009219031079249e-07, - "loss": 0.5815, - "step": 67523 - }, - { - "epoch": 1.73, - "learning_rate": 8.008947865923404e-07, - "loss": 0.6147, - "step": 67524 - }, - { - "epoch": 1.73, - "learning_rate": 8.008676702292013e-07, - "loss": 0.5303, - "step": 67525 - }, - { - "epoch": 1.73, - "learning_rate": 8.008405540185288e-07, - "loss": 0.7676, - "step": 67526 - }, - { - "epoch": 1.73, - "learning_rate": 8.008134379603435e-07, - "loss": 0.6509, - "step": 67527 - }, - { - "epoch": 1.73, - "learning_rate": 8.007863220546663e-07, - "loss": 0.6758, - "step": 67528 - }, - { - "epoch": 1.73, - "learning_rate": 8.007592063015177e-07, - "loss": 0.4158, - "step": 67529 - }, - { - "epoch": 1.73, - "learning_rate": 8.007320907009189e-07, - "loss": 0.6396, - "step": 67530 - }, - { - "epoch": 1.73, - "learning_rate": 8.007049752528905e-07, - "loss": 0.6245, - "step": 67531 - }, - { - "epoch": 1.73, - "learning_rate": 8.006778599574526e-07, - "loss": 0.6536, - "step": 67532 - }, - { - "epoch": 1.73, - "learning_rate": 8.006507448146269e-07, - "loss": 0.7998, - "step": 67533 - }, - { - "epoch": 1.73, - "learning_rate": 8.006236298244334e-07, - "loss": 0.687, - "step": 67534 - }, - { - "epoch": 1.73, - "learning_rate": 8.005965149868935e-07, - "loss": 0.6875, - "step": 67535 - }, - { - "epoch": 1.73, - "learning_rate": 8.005694003020276e-07, - "loss": 0.6787, - "step": 67536 - }, - { - "epoch": 1.73, - "learning_rate": 8.005422857698565e-07, - "loss": 0.7549, - "step": 67537 - }, - { - "epoch": 1.73, - "learning_rate": 8.00515171390401e-07, - "loss": 0.6606, - "step": 67538 - }, - { - "epoch": 1.73, - "learning_rate": 8.004880571636819e-07, - "loss": 0.5142, - "step": 67539 - }, - { - "epoch": 1.73, - "learning_rate": 8.0046094308972e-07, - "loss": 0.627, - "step": 67540 - }, - { - "epoch": 1.73, - "learning_rate": 8.004338291685362e-07, - "loss": 0.7715, - "step": 67541 - }, - { - "epoch": 1.73, - "learning_rate": 8.004067154001505e-07, - "loss": 0.7861, - "step": 67542 - }, - { - "epoch": 1.73, - "learning_rate": 8.003796017845847e-07, - "loss": 0.4829, - "step": 67543 - }, - { - "epoch": 1.73, - "learning_rate": 8.003524883218587e-07, - "loss": 0.5298, - "step": 67544 - }, - { - "epoch": 1.73, - "learning_rate": 8.003253750119938e-07, - "loss": 0.564, - "step": 67545 - }, - { - "epoch": 1.73, - "learning_rate": 8.002982618550103e-07, - "loss": 0.7021, - "step": 67546 - }, - { - "epoch": 1.73, - "learning_rate": 8.002711488509296e-07, - "loss": 0.6533, - "step": 67547 - }, - { - "epoch": 1.73, - "learning_rate": 8.002440359997718e-07, - "loss": 0.5146, - "step": 67548 - }, - { - "epoch": 1.73, - "learning_rate": 8.002169233015581e-07, - "loss": 0.5996, - "step": 67549 - }, - { - "epoch": 1.73, - "learning_rate": 8.00189810756309e-07, - "loss": 0.7646, - "step": 67550 - }, - { - "epoch": 1.73, - "learning_rate": 8.001626983640458e-07, - "loss": 0.7207, - "step": 67551 - }, - { - "epoch": 1.73, - "learning_rate": 8.001355861247886e-07, - "loss": 0.6064, - "step": 67552 - }, - { - "epoch": 1.73, - "learning_rate": 8.001084740385582e-07, - "loss": 0.6885, - "step": 67553 - }, - { - "epoch": 1.73, - "learning_rate": 8.000813621053757e-07, - "loss": 0.6357, - "step": 67554 - }, - { - "epoch": 1.73, - "learning_rate": 8.000542503252616e-07, - "loss": 0.7012, - "step": 67555 - }, - { - "epoch": 1.73, - "learning_rate": 8.000271386982369e-07, - "loss": 0.6089, - "step": 67556 - }, - { - "epoch": 1.73, - "learning_rate": 8.000000272243222e-07, - "loss": 0.6572, - "step": 67557 - }, - { - "epoch": 1.73, - "learning_rate": 7.999729159035381e-07, - "loss": 0.6414, - "step": 67558 - }, - { - "epoch": 1.73, - "learning_rate": 7.999458047359058e-07, - "loss": 0.5249, - "step": 67559 - }, - { - "epoch": 1.73, - "learning_rate": 7.999186937214456e-07, - "loss": 0.6426, - "step": 67560 - }, - { - "epoch": 1.73, - "learning_rate": 7.998915828601788e-07, - "loss": 0.5781, - "step": 67561 - }, - { - "epoch": 1.73, - "learning_rate": 7.998644721521256e-07, - "loss": 0.665, - "step": 67562 - }, - { - "epoch": 1.73, - "learning_rate": 7.998373615973068e-07, - "loss": 0.554, - "step": 67563 - }, - { - "epoch": 1.73, - "learning_rate": 7.998102511957437e-07, - "loss": 0.4762, - "step": 67564 - }, - { - "epoch": 1.73, - "learning_rate": 7.997831409474561e-07, - "loss": 0.6538, - "step": 67565 - }, - { - "epoch": 1.73, - "learning_rate": 7.997560308524658e-07, - "loss": 0.5576, - "step": 67566 - }, - { - "epoch": 1.73, - "learning_rate": 7.99728920910793e-07, - "loss": 0.5884, - "step": 67567 - }, - { - "epoch": 1.73, - "learning_rate": 7.997018111224585e-07, - "loss": 0.6821, - "step": 67568 - }, - { - "epoch": 1.73, - "learning_rate": 7.996747014874831e-07, - "loss": 0.4702, - "step": 67569 - }, - { - "epoch": 1.73, - "learning_rate": 7.996475920058876e-07, - "loss": 0.5903, - "step": 67570 - }, - { - "epoch": 1.73, - "learning_rate": 7.996204826776931e-07, - "loss": 0.4473, - "step": 67571 - }, - { - "epoch": 1.73, - "learning_rate": 7.995933735029195e-07, - "loss": 0.6333, - "step": 67572 - }, - { - "epoch": 1.73, - "learning_rate": 7.995662644815883e-07, - "loss": 0.5273, - "step": 67573 - }, - { - "epoch": 1.73, - "learning_rate": 7.995391556137199e-07, - "loss": 0.8408, - "step": 67574 - }, - { - "epoch": 1.73, - "learning_rate": 7.995120468993349e-07, - "loss": 0.5513, - "step": 67575 - }, - { - "epoch": 1.73, - "learning_rate": 7.994849383384547e-07, - "loss": 0.8018, - "step": 67576 - }, - { - "epoch": 1.73, - "learning_rate": 7.994578299310993e-07, - "loss": 0.6494, - "step": 67577 - }, - { - "epoch": 1.73, - "learning_rate": 7.994307216772901e-07, - "loss": 0.7251, - "step": 67578 - }, - { - "epoch": 1.73, - "learning_rate": 7.994036135770473e-07, - "loss": 0.6807, - "step": 67579 - }, - { - "epoch": 1.73, - "learning_rate": 7.993765056303922e-07, - "loss": 0.7046, - "step": 67580 - }, - { - "epoch": 1.73, - "learning_rate": 7.993493978373456e-07, - "loss": 0.5537, - "step": 67581 - }, - { - "epoch": 1.73, - "learning_rate": 7.993222901979273e-07, - "loss": 0.4634, - "step": 67582 - }, - { - "epoch": 1.73, - "learning_rate": 7.992951827121591e-07, - "loss": 0.666, - "step": 67583 - }, - { - "epoch": 1.73, - "learning_rate": 7.992680753800609e-07, - "loss": 0.6602, - "step": 67584 - }, - { - "epoch": 1.73, - "learning_rate": 7.992409682016544e-07, - "loss": 0.6543, - "step": 67585 - }, - { - "epoch": 1.73, - "learning_rate": 7.992138611769595e-07, - "loss": 0.6309, - "step": 67586 - }, - { - "epoch": 1.73, - "learning_rate": 7.991867543059975e-07, - "loss": 0.7441, - "step": 67587 - }, - { - "epoch": 1.73, - "learning_rate": 7.991596475887888e-07, - "loss": 0.7139, - "step": 67588 - }, - { - "epoch": 1.73, - "learning_rate": 7.991325410253545e-07, - "loss": 0.6343, - "step": 67589 - }, - { - "epoch": 1.73, - "learning_rate": 7.99105434615715e-07, - "loss": 0.5298, - "step": 67590 - }, - { - "epoch": 1.73, - "learning_rate": 7.990783283598916e-07, - "loss": 0.4927, - "step": 67591 - }, - { - "epoch": 1.73, - "learning_rate": 7.990512222579046e-07, - "loss": 0.7363, - "step": 67592 - }, - { - "epoch": 1.73, - "learning_rate": 7.990241163097747e-07, - "loss": 0.6017, - "step": 67593 - }, - { - "epoch": 1.73, - "learning_rate": 7.989970105155227e-07, - "loss": 0.6602, - "step": 67594 - }, - { - "epoch": 1.73, - "learning_rate": 7.989699048751696e-07, - "loss": 0.5469, - "step": 67595 - }, - { - "epoch": 1.73, - "learning_rate": 7.989427993887357e-07, - "loss": 0.5591, - "step": 67596 - }, - { - "epoch": 1.73, - "learning_rate": 7.989156940562425e-07, - "loss": 0.707, - "step": 67597 - }, - { - "epoch": 1.73, - "learning_rate": 7.988885888777099e-07, - "loss": 0.604, - "step": 67598 - }, - { - "epoch": 1.73, - "learning_rate": 7.988614838531594e-07, - "loss": 0.5923, - "step": 67599 - }, - { - "epoch": 1.73, - "learning_rate": 7.988343789826111e-07, - "loss": 0.665, - "step": 67600 - }, - { - "epoch": 1.73, - "learning_rate": 7.988072742660864e-07, - "loss": 0.6543, - "step": 67601 - }, - { - "epoch": 1.73, - "learning_rate": 7.987801697036056e-07, - "loss": 0.6084, - "step": 67602 - }, - { - "epoch": 1.73, - "learning_rate": 7.987530652951895e-07, - "loss": 0.8154, - "step": 67603 - }, - { - "epoch": 1.73, - "learning_rate": 7.98725961040859e-07, - "loss": 0.6318, - "step": 67604 - }, - { - "epoch": 1.73, - "learning_rate": 7.986988569406346e-07, - "loss": 0.7764, - "step": 67605 - }, - { - "epoch": 1.73, - "learning_rate": 7.986717529945374e-07, - "loss": 0.5825, - "step": 67606 - }, - { - "epoch": 1.73, - "learning_rate": 7.986446492025878e-07, - "loss": 0.5791, - "step": 67607 - }, - { - "epoch": 1.73, - "learning_rate": 7.986175455648068e-07, - "loss": 0.6134, - "step": 67608 - }, - { - "epoch": 1.73, - "learning_rate": 7.98590442081215e-07, - "loss": 0.7637, - "step": 67609 - }, - { - "epoch": 1.73, - "learning_rate": 7.985633387518336e-07, - "loss": 0.7388, - "step": 67610 - }, - { - "epoch": 1.73, - "learning_rate": 7.98536235576683e-07, - "loss": 0.6099, - "step": 67611 - }, - { - "epoch": 1.73, - "learning_rate": 7.985091325557838e-07, - "loss": 0.5703, - "step": 67612 - }, - { - "epoch": 1.73, - "learning_rate": 7.984820296891567e-07, - "loss": 0.6006, - "step": 67613 - }, - { - "epoch": 1.73, - "learning_rate": 7.984549269768228e-07, - "loss": 0.6484, - "step": 67614 - }, - { - "epoch": 1.73, - "learning_rate": 7.984278244188025e-07, - "loss": 0.6328, - "step": 67615 - }, - { - "epoch": 1.73, - "learning_rate": 7.98400722015117e-07, - "loss": 0.5173, - "step": 67616 - }, - { - "epoch": 1.73, - "learning_rate": 7.983736197657866e-07, - "loss": 0.6592, - "step": 67617 - }, - { - "epoch": 1.73, - "learning_rate": 7.983465176708324e-07, - "loss": 0.7324, - "step": 67618 - }, - { - "epoch": 1.73, - "learning_rate": 7.983194157302747e-07, - "loss": 0.7178, - "step": 67619 - }, - { - "epoch": 1.73, - "learning_rate": 7.982923139441349e-07, - "loss": 0.5845, - "step": 67620 - }, - { - "epoch": 1.73, - "learning_rate": 7.982652123124336e-07, - "loss": 0.5518, - "step": 67621 - }, - { - "epoch": 1.73, - "learning_rate": 7.982381108351909e-07, - "loss": 0.6587, - "step": 67622 - }, - { - "epoch": 1.73, - "learning_rate": 7.982110095124282e-07, - "loss": 0.7666, - "step": 67623 - }, - { - "epoch": 1.73, - "learning_rate": 7.981839083441659e-07, - "loss": 0.502, - "step": 67624 - }, - { - "epoch": 1.73, - "learning_rate": 7.98156807330425e-07, - "loss": 0.6592, - "step": 67625 - }, - { - "epoch": 1.73, - "learning_rate": 7.98129706471226e-07, - "loss": 0.6431, - "step": 67626 - }, - { - "epoch": 1.73, - "learning_rate": 7.981026057665901e-07, - "loss": 0.6602, - "step": 67627 - }, - { - "epoch": 1.73, - "learning_rate": 7.980755052165374e-07, - "loss": 0.8125, - "step": 67628 - }, - { - "epoch": 1.73, - "learning_rate": 7.980484048210892e-07, - "loss": 0.5322, - "step": 67629 - }, - { - "epoch": 1.73, - "learning_rate": 7.980213045802662e-07, - "loss": 0.5957, - "step": 67630 - }, - { - "epoch": 1.73, - "learning_rate": 7.979942044940892e-07, - "loss": 0.6348, - "step": 67631 - }, - { - "epoch": 1.73, - "learning_rate": 7.979671045625782e-07, - "loss": 0.5986, - "step": 67632 - }, - { - "epoch": 1.73, - "learning_rate": 7.979400047857547e-07, - "loss": 0.6719, - "step": 67633 - }, - { - "epoch": 1.73, - "learning_rate": 7.979129051636392e-07, - "loss": 0.4277, - "step": 67634 - }, - { - "epoch": 1.73, - "learning_rate": 7.978858056962526e-07, - "loss": 0.5127, - "step": 67635 - }, - { - "epoch": 1.73, - "learning_rate": 7.978587063836153e-07, - "loss": 0.562, - "step": 67636 - }, - { - "epoch": 1.73, - "learning_rate": 7.978316072257486e-07, - "loss": 0.8027, - "step": 67637 - }, - { - "epoch": 1.73, - "learning_rate": 7.978045082226727e-07, - "loss": 0.6255, - "step": 67638 - }, - { - "epoch": 1.73, - "learning_rate": 7.977774093744087e-07, - "loss": 0.7217, - "step": 67639 - }, - { - "epoch": 1.73, - "learning_rate": 7.977503106809772e-07, - "loss": 0.4811, - "step": 67640 - }, - { - "epoch": 1.73, - "learning_rate": 7.977232121423994e-07, - "loss": 0.252, - "step": 67641 - }, - { - "epoch": 1.73, - "learning_rate": 7.976961137586952e-07, - "loss": 0.5956, - "step": 67642 - }, - { - "epoch": 1.73, - "learning_rate": 7.976690155298858e-07, - "loss": 0.7139, - "step": 67643 - }, - { - "epoch": 1.73, - "learning_rate": 7.97641917455992e-07, - "loss": 0.6357, - "step": 67644 - }, - { - "epoch": 1.73, - "learning_rate": 7.976148195370344e-07, - "loss": 0.6562, - "step": 67645 - }, - { - "epoch": 1.73, - "learning_rate": 7.975877217730341e-07, - "loss": 0.7168, - "step": 67646 - }, - { - "epoch": 1.73, - "learning_rate": 7.975606241640114e-07, - "loss": 0.6157, - "step": 67647 - }, - { - "epoch": 1.73, - "learning_rate": 7.97533526709987e-07, - "loss": 0.7598, - "step": 67648 - }, - { - "epoch": 1.73, - "learning_rate": 7.975064294109821e-07, - "loss": 0.5596, - "step": 67649 - }, - { - "epoch": 1.73, - "learning_rate": 7.974793322670171e-07, - "loss": 0.6992, - "step": 67650 - }, - { - "epoch": 1.73, - "learning_rate": 7.974522352781133e-07, - "loss": 0.6758, - "step": 67651 - }, - { - "epoch": 1.73, - "learning_rate": 7.974251384442906e-07, - "loss": 0.675, - "step": 67652 - }, - { - "epoch": 1.73, - "learning_rate": 7.973980417655702e-07, - "loss": 0.5532, - "step": 67653 - }, - { - "epoch": 1.73, - "learning_rate": 7.973709452419728e-07, - "loss": 0.623, - "step": 67654 - }, - { - "epoch": 1.73, - "learning_rate": 7.97343848873519e-07, - "loss": 0.7275, - "step": 67655 - }, - { - "epoch": 1.73, - "learning_rate": 7.973167526602299e-07, - "loss": 0.7549, - "step": 67656 - }, - { - "epoch": 1.73, - "learning_rate": 7.972896566021259e-07, - "loss": 0.4897, - "step": 67657 - }, - { - "epoch": 1.73, - "learning_rate": 7.97262560699228e-07, - "loss": 0.6299, - "step": 67658 - }, - { - "epoch": 1.73, - "learning_rate": 7.972354649515567e-07, - "loss": 0.4449, - "step": 67659 - }, - { - "epoch": 1.73, - "learning_rate": 7.972083693591331e-07, - "loss": 0.5293, - "step": 67660 - }, - { - "epoch": 1.73, - "learning_rate": 7.971812739219779e-07, - "loss": 0.6719, - "step": 67661 - }, - { - "epoch": 1.73, - "learning_rate": 7.971541786401112e-07, - "loss": 0.71, - "step": 67662 - }, - { - "epoch": 1.73, - "learning_rate": 7.971270835135546e-07, - "loss": 0.7344, - "step": 67663 - }, - { - "epoch": 1.73, - "learning_rate": 7.970999885423284e-07, - "loss": 0.4392, - "step": 67664 - }, - { - "epoch": 1.73, - "learning_rate": 7.970728937264531e-07, - "loss": 0.6655, - "step": 67665 - }, - { - "epoch": 1.73, - "learning_rate": 7.9704579906595e-07, - "loss": 0.4204, - "step": 67666 - }, - { - "epoch": 1.73, - "learning_rate": 7.970187045608394e-07, - "loss": 0.665, - "step": 67667 - }, - { - "epoch": 1.73, - "learning_rate": 7.969916102111425e-07, - "loss": 0.6924, - "step": 67668 - }, - { - "epoch": 1.73, - "learning_rate": 7.969645160168795e-07, - "loss": 0.8125, - "step": 67669 - }, - { - "epoch": 1.73, - "learning_rate": 7.969374219780718e-07, - "loss": 0.5566, - "step": 67670 - }, - { - "epoch": 1.73, - "learning_rate": 7.969103280947398e-07, - "loss": 0.6963, - "step": 67671 - }, - { - "epoch": 1.73, - "learning_rate": 7.96883234366904e-07, - "loss": 0.4714, - "step": 67672 - }, - { - "epoch": 1.73, - "learning_rate": 7.968561407945854e-07, - "loss": 0.6084, - "step": 67673 - }, - { - "epoch": 1.73, - "learning_rate": 7.968290473778045e-07, - "loss": 0.6755, - "step": 67674 - }, - { - "epoch": 1.73, - "learning_rate": 7.968019541165826e-07, - "loss": 0.8301, - "step": 67675 - }, - { - "epoch": 1.73, - "learning_rate": 7.967748610109399e-07, - "loss": 0.7207, - "step": 67676 - }, - { - "epoch": 1.73, - "learning_rate": 7.967477680608974e-07, - "loss": 0.519, - "step": 67677 - }, - { - "epoch": 1.73, - "learning_rate": 7.967206752664757e-07, - "loss": 0.5576, - "step": 67678 - }, - { - "epoch": 1.73, - "learning_rate": 7.966935826276957e-07, - "loss": 0.6885, - "step": 67679 - }, - { - "epoch": 1.73, - "learning_rate": 7.966664901445784e-07, - "loss": 0.6592, - "step": 67680 - }, - { - "epoch": 1.73, - "learning_rate": 7.966393978171438e-07, - "loss": 0.583, - "step": 67681 - }, - { - "epoch": 1.73, - "learning_rate": 7.966123056454133e-07, - "loss": 0.7627, - "step": 67682 - }, - { - "epoch": 1.73, - "learning_rate": 7.965852136294074e-07, - "loss": 0.5996, - "step": 67683 - }, - { - "epoch": 1.73, - "learning_rate": 7.965581217691465e-07, - "loss": 0.6785, - "step": 67684 - }, - { - "epoch": 1.73, - "learning_rate": 7.96531030064652e-07, - "loss": 0.6045, - "step": 67685 - }, - { - "epoch": 1.73, - "learning_rate": 7.965039385159441e-07, - "loss": 0.5142, - "step": 67686 - }, - { - "epoch": 1.73, - "learning_rate": 7.964768471230441e-07, - "loss": 0.5967, - "step": 67687 - }, - { - "epoch": 1.73, - "learning_rate": 7.964497558859721e-07, - "loss": 0.6279, - "step": 67688 - }, - { - "epoch": 1.73, - "learning_rate": 7.964226648047494e-07, - "loss": 0.7417, - "step": 67689 - }, - { - "epoch": 1.73, - "learning_rate": 7.963955738793967e-07, - "loss": 0.7451, - "step": 67690 - }, - { - "epoch": 1.73, - "learning_rate": 7.963684831099341e-07, - "loss": 0.5527, - "step": 67691 - }, - { - "epoch": 1.73, - "learning_rate": 7.963413924963831e-07, - "loss": 0.7861, - "step": 67692 - }, - { - "epoch": 1.74, - "learning_rate": 7.963143020387638e-07, - "loss": 0.6802, - "step": 67693 - }, - { - "epoch": 1.74, - "learning_rate": 7.962872117370976e-07, - "loss": 0.4609, - "step": 67694 - }, - { - "epoch": 1.74, - "learning_rate": 7.962601215914046e-07, - "loss": 0.8662, - "step": 67695 - }, - { - "epoch": 1.74, - "learning_rate": 7.962330316017061e-07, - "loss": 0.7295, - "step": 67696 - }, - { - "epoch": 1.74, - "learning_rate": 7.962059417680224e-07, - "loss": 0.6099, - "step": 67697 - }, - { - "epoch": 1.74, - "learning_rate": 7.961788520903746e-07, - "loss": 0.415, - "step": 67698 - }, - { - "epoch": 1.74, - "learning_rate": 7.961517625687832e-07, - "loss": 0.6934, - "step": 67699 - }, - { - "epoch": 1.74, - "learning_rate": 7.961246732032696e-07, - "loss": 0.7012, - "step": 67700 - }, - { - "epoch": 1.74, - "learning_rate": 7.960975839938533e-07, - "loss": 0.7109, - "step": 67701 - }, - { - "epoch": 1.74, - "learning_rate": 7.960704949405559e-07, - "loss": 0.6567, - "step": 67702 - }, - { - "epoch": 1.74, - "learning_rate": 7.960434060433977e-07, - "loss": 0.6465, - "step": 67703 - }, - { - "epoch": 1.74, - "learning_rate": 7.960163173024e-07, - "loss": 0.6138, - "step": 67704 - }, - { - "epoch": 1.74, - "learning_rate": 7.959892287175829e-07, - "loss": 0.8516, - "step": 67705 - }, - { - "epoch": 1.74, - "learning_rate": 7.959621402889678e-07, - "loss": 0.6182, - "step": 67706 - }, - { - "epoch": 1.74, - "learning_rate": 7.959350520165748e-07, - "loss": 0.5649, - "step": 67707 - }, - { - "epoch": 1.74, - "learning_rate": 7.959079639004252e-07, - "loss": 0.6602, - "step": 67708 - }, - { - "epoch": 1.74, - "learning_rate": 7.958808759405393e-07, - "loss": 0.6323, - "step": 67709 - }, - { - "epoch": 1.74, - "learning_rate": 7.958537881369385e-07, - "loss": 0.4602, - "step": 67710 - }, - { - "epoch": 1.74, - "learning_rate": 7.958267004896427e-07, - "loss": 0.7002, - "step": 67711 - }, - { - "epoch": 1.74, - "learning_rate": 7.957996129986728e-07, - "loss": 0.5657, - "step": 67712 - }, - { - "epoch": 1.74, - "learning_rate": 7.957725256640502e-07, - "loss": 0.6895, - "step": 67713 - }, - { - "epoch": 1.74, - "learning_rate": 7.957454384857947e-07, - "loss": 0.5066, - "step": 67714 - }, - { - "epoch": 1.74, - "learning_rate": 7.957183514639278e-07, - "loss": 0.537, - "step": 67715 - }, - { - "epoch": 1.74, - "learning_rate": 7.956912645984699e-07, - "loss": 0.6533, - "step": 67716 - }, - { - "epoch": 1.74, - "learning_rate": 7.956641778894419e-07, - "loss": 0.71, - "step": 67717 - }, - { - "epoch": 1.74, - "learning_rate": 7.956370913368642e-07, - "loss": 0.4661, - "step": 67718 - }, - { - "epoch": 1.74, - "learning_rate": 7.956100049407581e-07, - "loss": 0.5464, - "step": 67719 - }, - { - "epoch": 1.74, - "learning_rate": 7.955829187011442e-07, - "loss": 0.7129, - "step": 67720 - }, - { - "epoch": 1.74, - "learning_rate": 7.955558326180428e-07, - "loss": 0.634, - "step": 67721 - }, - { - "epoch": 1.74, - "learning_rate": 7.955287466914747e-07, - "loss": 0.7236, - "step": 67722 - }, - { - "epoch": 1.74, - "learning_rate": 7.955016609214611e-07, - "loss": 0.623, - "step": 67723 - }, - { - "epoch": 1.74, - "learning_rate": 7.954745753080222e-07, - "loss": 0.533, - "step": 67724 - }, - { - "epoch": 1.74, - "learning_rate": 7.954474898511792e-07, - "loss": 0.6846, - "step": 67725 - }, - { - "epoch": 1.74, - "learning_rate": 7.954204045509525e-07, - "loss": 0.5844, - "step": 67726 - }, - { - "epoch": 1.74, - "learning_rate": 7.953933194073632e-07, - "loss": 0.6738, - "step": 67727 - }, - { - "epoch": 1.74, - "learning_rate": 7.953662344204316e-07, - "loss": 0.7104, - "step": 67728 - }, - { - "epoch": 1.74, - "learning_rate": 7.953391495901788e-07, - "loss": 0.7021, - "step": 67729 - }, - { - "epoch": 1.74, - "learning_rate": 7.953120649166259e-07, - "loss": 0.666, - "step": 67730 - }, - { - "epoch": 1.74, - "learning_rate": 7.952849803997924e-07, - "loss": 0.5464, - "step": 67731 - }, - { - "epoch": 1.74, - "learning_rate": 7.952578960397001e-07, - "loss": 0.6572, - "step": 67732 - }, - { - "epoch": 1.74, - "learning_rate": 7.952308118363692e-07, - "loss": 0.6895, - "step": 67733 - }, - { - "epoch": 1.74, - "learning_rate": 7.95203727789821e-07, - "loss": 0.6523, - "step": 67734 - }, - { - "epoch": 1.74, - "learning_rate": 7.951766439000754e-07, - "loss": 0.5728, - "step": 67735 - }, - { - "epoch": 1.74, - "learning_rate": 7.95149560167154e-07, - "loss": 0.447, - "step": 67736 - }, - { - "epoch": 1.74, - "learning_rate": 7.951224765910771e-07, - "loss": 0.7002, - "step": 67737 - }, - { - "epoch": 1.74, - "learning_rate": 7.950953931718654e-07, - "loss": 0.6855, - "step": 67738 - }, - { - "epoch": 1.74, - "learning_rate": 7.950683099095399e-07, - "loss": 0.752, - "step": 67739 - }, - { - "epoch": 1.74, - "learning_rate": 7.950412268041214e-07, - "loss": 0.5386, - "step": 67740 - }, - { - "epoch": 1.74, - "learning_rate": 7.9501414385563e-07, - "loss": 0.7178, - "step": 67741 - }, - { - "epoch": 1.74, - "learning_rate": 7.949870610640868e-07, - "loss": 0.5203, - "step": 67742 - }, - { - "epoch": 1.74, - "learning_rate": 7.949599784295127e-07, - "loss": 0.6475, - "step": 67743 - }, - { - "epoch": 1.74, - "learning_rate": 7.949328959519283e-07, - "loss": 0.5183, - "step": 67744 - }, - { - "epoch": 1.74, - "learning_rate": 7.949058136313543e-07, - "loss": 0.4617, - "step": 67745 - }, - { - "epoch": 1.74, - "learning_rate": 7.948787314678116e-07, - "loss": 0.4321, - "step": 67746 - }, - { - "epoch": 1.74, - "learning_rate": 7.948516494613207e-07, - "loss": 0.6135, - "step": 67747 - }, - { - "epoch": 1.74, - "learning_rate": 7.948245676119026e-07, - "loss": 0.8008, - "step": 67748 - }, - { - "epoch": 1.74, - "learning_rate": 7.947974859195777e-07, - "loss": 0.624, - "step": 67749 - }, - { - "epoch": 1.74, - "learning_rate": 7.947704043843674e-07, - "loss": 0.6335, - "step": 67750 - }, - { - "epoch": 1.74, - "learning_rate": 7.947433230062918e-07, - "loss": 0.627, - "step": 67751 - }, - { - "epoch": 1.74, - "learning_rate": 7.947162417853714e-07, - "loss": 0.6816, - "step": 67752 - }, - { - "epoch": 1.74, - "learning_rate": 7.946891607216278e-07, - "loss": 0.8389, - "step": 67753 - }, - { - "epoch": 1.74, - "learning_rate": 7.946620798150807e-07, - "loss": 0.6035, - "step": 67754 - }, - { - "epoch": 1.74, - "learning_rate": 7.94634999065752e-07, - "loss": 0.3752, - "step": 67755 - }, - { - "epoch": 1.74, - "learning_rate": 7.946079184736616e-07, - "loss": 0.6836, - "step": 67756 - }, - { - "epoch": 1.74, - "learning_rate": 7.945808380388302e-07, - "loss": 0.6772, - "step": 67757 - }, - { - "epoch": 1.74, - "learning_rate": 7.945537577612792e-07, - "loss": 0.5991, - "step": 67758 - }, - { - "epoch": 1.74, - "learning_rate": 7.945266776410287e-07, - "loss": 0.5872, - "step": 67759 - }, - { - "epoch": 1.74, - "learning_rate": 7.944995976781001e-07, - "loss": 0.5854, - "step": 67760 - }, - { - "epoch": 1.74, - "learning_rate": 7.944725178725134e-07, - "loss": 0.7236, - "step": 67761 - }, - { - "epoch": 1.74, - "learning_rate": 7.944454382242896e-07, - "loss": 0.4858, - "step": 67762 - }, - { - "epoch": 1.74, - "learning_rate": 7.944183587334495e-07, - "loss": 0.4695, - "step": 67763 - }, - { - "epoch": 1.74, - "learning_rate": 7.943912794000137e-07, - "loss": 0.6318, - "step": 67764 - }, - { - "epoch": 1.74, - "learning_rate": 7.943642002240032e-07, - "loss": 0.6895, - "step": 67765 - }, - { - "epoch": 1.74, - "learning_rate": 7.943371212054384e-07, - "loss": 0.6025, - "step": 67766 - }, - { - "epoch": 1.74, - "learning_rate": 7.943100423443404e-07, - "loss": 0.6846, - "step": 67767 - }, - { - "epoch": 1.74, - "learning_rate": 7.942829636407296e-07, - "loss": 0.6436, - "step": 67768 - }, - { - "epoch": 1.74, - "learning_rate": 7.94255885094627e-07, - "loss": 0.7148, - "step": 67769 - }, - { - "epoch": 1.74, - "learning_rate": 7.942288067060536e-07, - "loss": 0.6187, - "step": 67770 - }, - { - "epoch": 1.74, - "learning_rate": 7.942017284750291e-07, - "loss": 0.7285, - "step": 67771 - }, - { - "epoch": 1.74, - "learning_rate": 7.941746504015751e-07, - "loss": 0.6504, - "step": 67772 - }, - { - "epoch": 1.74, - "learning_rate": 7.941475724857122e-07, - "loss": 0.7549, - "step": 67773 - }, - { - "epoch": 1.74, - "learning_rate": 7.941204947274608e-07, - "loss": 0.573, - "step": 67774 - }, - { - "epoch": 1.74, - "learning_rate": 7.940934171268421e-07, - "loss": 0.8271, - "step": 67775 - }, - { - "epoch": 1.74, - "learning_rate": 7.940663396838764e-07, - "loss": 0.6255, - "step": 67776 - }, - { - "epoch": 1.74, - "learning_rate": 7.940392623985848e-07, - "loss": 0.3284, - "step": 67777 - }, - { - "epoch": 1.74, - "learning_rate": 7.940121852709875e-07, - "loss": 0.6875, - "step": 67778 - }, - { - "epoch": 1.74, - "learning_rate": 7.939851083011062e-07, - "loss": 0.6416, - "step": 67779 - }, - { - "epoch": 1.74, - "learning_rate": 7.939580314889609e-07, - "loss": 0.71, - "step": 67780 - }, - { - "epoch": 1.74, - "learning_rate": 7.939309548345722e-07, - "loss": 0.5747, - "step": 67781 - }, - { - "epoch": 1.74, - "learning_rate": 7.939038783379612e-07, - "loss": 0.6016, - "step": 67782 - }, - { - "epoch": 1.74, - "learning_rate": 7.938768019991484e-07, - "loss": 0.7734, - "step": 67783 - }, - { - "epoch": 1.74, - "learning_rate": 7.938497258181549e-07, - "loss": 0.6553, - "step": 67784 - }, - { - "epoch": 1.74, - "learning_rate": 7.938226497950009e-07, - "loss": 0.708, - "step": 67785 - }, - { - "epoch": 1.74, - "learning_rate": 7.937955739297077e-07, - "loss": 0.6504, - "step": 67786 - }, - { - "epoch": 1.74, - "learning_rate": 7.937684982222954e-07, - "loss": 0.6934, - "step": 67787 - }, - { - "epoch": 1.74, - "learning_rate": 7.937414226727854e-07, - "loss": 0.6406, - "step": 67788 - }, - { - "epoch": 1.74, - "learning_rate": 7.937143472811978e-07, - "loss": 0.3868, - "step": 67789 - }, - { - "epoch": 1.74, - "learning_rate": 7.936872720475545e-07, - "loss": 0.4309, - "step": 67790 - }, - { - "epoch": 1.74, - "learning_rate": 7.936601969718744e-07, - "loss": 0.5439, - "step": 67791 - }, - { - "epoch": 1.74, - "learning_rate": 7.936331220541796e-07, - "loss": 0.7354, - "step": 67792 - }, - { - "epoch": 1.74, - "learning_rate": 7.936060472944903e-07, - "loss": 0.604, - "step": 67793 - }, - { - "epoch": 1.74, - "learning_rate": 7.935789726928275e-07, - "loss": 0.6362, - "step": 67794 - }, - { - "epoch": 1.74, - "learning_rate": 7.935518982492115e-07, - "loss": 0.5615, - "step": 67795 - }, - { - "epoch": 1.74, - "learning_rate": 7.935248239636636e-07, - "loss": 0.6143, - "step": 67796 - }, - { - "epoch": 1.74, - "learning_rate": 7.934977498362039e-07, - "loss": 0.375, - "step": 67797 - }, - { - "epoch": 1.74, - "learning_rate": 7.934706758668539e-07, - "loss": 0.5376, - "step": 67798 - }, - { - "epoch": 1.74, - "learning_rate": 7.934436020556336e-07, - "loss": 0.5312, - "step": 67799 - }, - { - "epoch": 1.74, - "learning_rate": 7.934165284025645e-07, - "loss": 0.6016, - "step": 67800 - }, - { - "epoch": 1.74, - "learning_rate": 7.933894549076666e-07, - "loss": 0.6572, - "step": 67801 - }, - { - "epoch": 1.74, - "learning_rate": 7.933623815709607e-07, - "loss": 0.7334, - "step": 67802 - }, - { - "epoch": 1.74, - "learning_rate": 7.93335308392468e-07, - "loss": 0.5815, - "step": 67803 - }, - { - "epoch": 1.74, - "learning_rate": 7.933082353722086e-07, - "loss": 0.627, - "step": 67804 - }, - { - "epoch": 1.74, - "learning_rate": 7.932811625102038e-07, - "loss": 0.5542, - "step": 67805 - }, - { - "epoch": 1.74, - "learning_rate": 7.93254089806474e-07, - "loss": 0.5728, - "step": 67806 - }, - { - "epoch": 1.74, - "learning_rate": 7.932270172610403e-07, - "loss": 0.7939, - "step": 67807 - }, - { - "epoch": 1.74, - "learning_rate": 7.931999448739228e-07, - "loss": 0.6963, - "step": 67808 - }, - { - "epoch": 1.74, - "learning_rate": 7.931728726451429e-07, - "loss": 0.6226, - "step": 67809 - }, - { - "epoch": 1.74, - "learning_rate": 7.931458005747213e-07, - "loss": 0.5237, - "step": 67810 - }, - { - "epoch": 1.74, - "learning_rate": 7.931187286626781e-07, - "loss": 0.623, - "step": 67811 - }, - { - "epoch": 1.74, - "learning_rate": 7.930916569090342e-07, - "loss": 0.645, - "step": 67812 - }, - { - "epoch": 1.74, - "learning_rate": 7.930645853138107e-07, - "loss": 0.6294, - "step": 67813 - }, - { - "epoch": 1.74, - "learning_rate": 7.93037513877028e-07, - "loss": 0.6797, - "step": 67814 - }, - { - "epoch": 1.74, - "learning_rate": 7.930104425987071e-07, - "loss": 0.6572, - "step": 67815 - }, - { - "epoch": 1.74, - "learning_rate": 7.929833714788683e-07, - "loss": 0.606, - "step": 67816 - }, - { - "epoch": 1.74, - "learning_rate": 7.92956300517533e-07, - "loss": 0.4856, - "step": 67817 - }, - { - "epoch": 1.74, - "learning_rate": 7.929292297147212e-07, - "loss": 0.6177, - "step": 67818 - }, - { - "epoch": 1.74, - "learning_rate": 7.929021590704543e-07, - "loss": 0.5403, - "step": 67819 - }, - { - "epoch": 1.74, - "learning_rate": 7.928750885847527e-07, - "loss": 0.6963, - "step": 67820 - }, - { - "epoch": 1.74, - "learning_rate": 7.928480182576369e-07, - "loss": 0.8545, - "step": 67821 - }, - { - "epoch": 1.74, - "learning_rate": 7.928209480891279e-07, - "loss": 0.6768, - "step": 67822 - }, - { - "epoch": 1.74, - "learning_rate": 7.927938780792463e-07, - "loss": 0.5874, - "step": 67823 - }, - { - "epoch": 1.74, - "learning_rate": 7.92766808228013e-07, - "loss": 0.6172, - "step": 67824 - }, - { - "epoch": 1.74, - "learning_rate": 7.927397385354485e-07, - "loss": 0.7207, - "step": 67825 - }, - { - "epoch": 1.74, - "learning_rate": 7.927126690015738e-07, - "loss": 0.6353, - "step": 67826 - }, - { - "epoch": 1.74, - "learning_rate": 7.926855996264096e-07, - "loss": 0.468, - "step": 67827 - }, - { - "epoch": 1.74, - "learning_rate": 7.926585304099762e-07, - "loss": 0.7275, - "step": 67828 - }, - { - "epoch": 1.74, - "learning_rate": 7.926314613522949e-07, - "loss": 0.6802, - "step": 67829 - }, - { - "epoch": 1.74, - "learning_rate": 7.926043924533862e-07, - "loss": 0.6401, - "step": 67830 - }, - { - "epoch": 1.74, - "learning_rate": 7.925773237132705e-07, - "loss": 0.7842, - "step": 67831 - }, - { - "epoch": 1.74, - "learning_rate": 7.92550255131969e-07, - "loss": 0.7559, - "step": 67832 - }, - { - "epoch": 1.74, - "learning_rate": 7.92523186709502e-07, - "loss": 0.6484, - "step": 67833 - }, - { - "epoch": 1.74, - "learning_rate": 7.924961184458907e-07, - "loss": 0.6235, - "step": 67834 - }, - { - "epoch": 1.74, - "learning_rate": 7.924690503411553e-07, - "loss": 0.4771, - "step": 67835 - }, - { - "epoch": 1.74, - "learning_rate": 7.924419823953171e-07, - "loss": 0.8535, - "step": 67836 - }, - { - "epoch": 1.74, - "learning_rate": 7.924149146083963e-07, - "loss": 0.7539, - "step": 67837 - }, - { - "epoch": 1.74, - "learning_rate": 7.92387846980414e-07, - "loss": 0.4558, - "step": 67838 - }, - { - "epoch": 1.74, - "learning_rate": 7.923607795113907e-07, - "loss": 0.7139, - "step": 67839 - }, - { - "epoch": 1.74, - "learning_rate": 7.923337122013475e-07, - "loss": 0.6636, - "step": 67840 - }, - { - "epoch": 1.74, - "learning_rate": 7.923066450503046e-07, - "loss": 0.8125, - "step": 67841 - }, - { - "epoch": 1.74, - "learning_rate": 7.922795780582828e-07, - "loss": 0.625, - "step": 67842 - }, - { - "epoch": 1.74, - "learning_rate": 7.922525112253033e-07, - "loss": 0.8184, - "step": 67843 - }, - { - "epoch": 1.74, - "learning_rate": 7.92225444551386e-07, - "loss": 0.4097, - "step": 67844 - }, - { - "epoch": 1.74, - "learning_rate": 7.921983780365526e-07, - "loss": 0.668, - "step": 67845 - }, - { - "epoch": 1.74, - "learning_rate": 7.921713116808233e-07, - "loss": 0.6499, - "step": 67846 - }, - { - "epoch": 1.74, - "learning_rate": 7.921442454842187e-07, - "loss": 0.6836, - "step": 67847 - }, - { - "epoch": 1.74, - "learning_rate": 7.921171794467598e-07, - "loss": 0.6904, - "step": 67848 - }, - { - "epoch": 1.74, - "learning_rate": 7.92090113568467e-07, - "loss": 0.6812, - "step": 67849 - }, - { - "epoch": 1.74, - "learning_rate": 7.920630478493617e-07, - "loss": 0.6328, - "step": 67850 - }, - { - "epoch": 1.74, - "learning_rate": 7.920359822894638e-07, - "loss": 0.7104, - "step": 67851 - }, - { - "epoch": 1.74, - "learning_rate": 7.920089168887945e-07, - "loss": 0.7354, - "step": 67852 - }, - { - "epoch": 1.74, - "learning_rate": 7.919818516473743e-07, - "loss": 0.5811, - "step": 67853 - }, - { - "epoch": 1.74, - "learning_rate": 7.919547865652239e-07, - "loss": 0.6865, - "step": 67854 - }, - { - "epoch": 1.74, - "learning_rate": 7.919277216423646e-07, - "loss": 1.0908, - "step": 67855 - }, - { - "epoch": 1.74, - "learning_rate": 7.919006568788162e-07, - "loss": 0.7319, - "step": 67856 - }, - { - "epoch": 1.74, - "learning_rate": 7.918735922746002e-07, - "loss": 0.5308, - "step": 67857 - }, - { - "epoch": 1.74, - "learning_rate": 7.918465278297368e-07, - "loss": 0.6011, - "step": 67858 - }, - { - "epoch": 1.74, - "learning_rate": 7.918194635442471e-07, - "loss": 0.7998, - "step": 67859 - }, - { - "epoch": 1.74, - "learning_rate": 7.91792399418152e-07, - "loss": 0.4629, - "step": 67860 - }, - { - "epoch": 1.74, - "learning_rate": 7.917653354514714e-07, - "loss": 0.6553, - "step": 67861 - }, - { - "epoch": 1.74, - "learning_rate": 7.917382716442267e-07, - "loss": 0.7129, - "step": 67862 - }, - { - "epoch": 1.74, - "learning_rate": 7.917112079964384e-07, - "loss": 0.5737, - "step": 67863 - }, - { - "epoch": 1.74, - "learning_rate": 7.916841445081272e-07, - "loss": 0.6396, - "step": 67864 - }, - { - "epoch": 1.74, - "learning_rate": 7.916570811793138e-07, - "loss": 0.7041, - "step": 67865 - }, - { - "epoch": 1.74, - "learning_rate": 7.91630018010019e-07, - "loss": 0.6338, - "step": 67866 - }, - { - "epoch": 1.74, - "learning_rate": 7.916029550002636e-07, - "loss": 0.6636, - "step": 67867 - }, - { - "epoch": 1.74, - "learning_rate": 7.915758921500682e-07, - "loss": 0.4731, - "step": 67868 - }, - { - "epoch": 1.74, - "learning_rate": 7.915488294594537e-07, - "loss": 0.5718, - "step": 67869 - }, - { - "epoch": 1.74, - "learning_rate": 7.915217669284409e-07, - "loss": 0.6055, - "step": 67870 - }, - { - "epoch": 1.74, - "learning_rate": 7.914947045570496e-07, - "loss": 0.6455, - "step": 67871 - }, - { - "epoch": 1.74, - "learning_rate": 7.914676423453019e-07, - "loss": 0.6963, - "step": 67872 - }, - { - "epoch": 1.74, - "learning_rate": 7.914405802932173e-07, - "loss": 0.6475, - "step": 67873 - }, - { - "epoch": 1.74, - "learning_rate": 7.914135184008173e-07, - "loss": 0.6836, - "step": 67874 - }, - { - "epoch": 1.74, - "learning_rate": 7.913864566681223e-07, - "loss": 0.7598, - "step": 67875 - }, - { - "epoch": 1.74, - "learning_rate": 7.913593950951532e-07, - "loss": 0.79, - "step": 67876 - }, - { - "epoch": 1.74, - "learning_rate": 7.913323336819304e-07, - "loss": 0.5923, - "step": 67877 - }, - { - "epoch": 1.74, - "learning_rate": 7.913052724284751e-07, - "loss": 0.7446, - "step": 67878 - }, - { - "epoch": 1.74, - "learning_rate": 7.912782113348076e-07, - "loss": 0.7402, - "step": 67879 - }, - { - "epoch": 1.74, - "learning_rate": 7.912511504009493e-07, - "loss": 0.6152, - "step": 67880 - }, - { - "epoch": 1.74, - "learning_rate": 7.912240896269198e-07, - "loss": 0.6602, - "step": 67881 - }, - { - "epoch": 1.74, - "learning_rate": 7.911970290127405e-07, - "loss": 0.7363, - "step": 67882 - }, - { - "epoch": 1.74, - "learning_rate": 7.911699685584321e-07, - "loss": 0.5771, - "step": 67883 - }, - { - "epoch": 1.74, - "learning_rate": 7.911429082640153e-07, - "loss": 0.5977, - "step": 67884 - }, - { - "epoch": 1.74, - "learning_rate": 7.911158481295106e-07, - "loss": 0.7061, - "step": 67885 - }, - { - "epoch": 1.74, - "learning_rate": 7.910887881549391e-07, - "loss": 0.6387, - "step": 67886 - }, - { - "epoch": 1.74, - "learning_rate": 7.910617283403209e-07, - "loss": 0.6885, - "step": 67887 - }, - { - "epoch": 1.74, - "learning_rate": 7.910346686856776e-07, - "loss": 0.6484, - "step": 67888 - }, - { - "epoch": 1.74, - "learning_rate": 7.910076091910291e-07, - "loss": 0.71, - "step": 67889 - }, - { - "epoch": 1.74, - "learning_rate": 7.90980549856397e-07, - "loss": 0.6885, - "step": 67890 - }, - { - "epoch": 1.74, - "learning_rate": 7.909534906818012e-07, - "loss": 0.7637, - "step": 67891 - }, - { - "epoch": 1.74, - "learning_rate": 7.909264316672625e-07, - "loss": 0.427, - "step": 67892 - }, - { - "epoch": 1.74, - "learning_rate": 7.90899372812802e-07, - "loss": 0.5176, - "step": 67893 - }, - { - "epoch": 1.74, - "learning_rate": 7.9087231411844e-07, - "loss": 0.5967, - "step": 67894 - }, - { - "epoch": 1.74, - "learning_rate": 7.908452555841978e-07, - "loss": 0.7861, - "step": 67895 - }, - { - "epoch": 1.74, - "learning_rate": 7.908181972100954e-07, - "loss": 0.5781, - "step": 67896 - }, - { - "epoch": 1.74, - "learning_rate": 7.907911389961541e-07, - "loss": 0.6318, - "step": 67897 - }, - { - "epoch": 1.74, - "learning_rate": 7.907640809423943e-07, - "loss": 0.7344, - "step": 67898 - }, - { - "epoch": 1.74, - "learning_rate": 7.90737023048837e-07, - "loss": 0.541, - "step": 67899 - }, - { - "epoch": 1.74, - "learning_rate": 7.90709965315503e-07, - "loss": 0.5767, - "step": 67900 - }, - { - "epoch": 1.74, - "learning_rate": 7.906829077424125e-07, - "loss": 0.6112, - "step": 67901 - }, - { - "epoch": 1.74, - "learning_rate": 7.906558503295863e-07, - "loss": 0.7959, - "step": 67902 - }, - { - "epoch": 1.74, - "learning_rate": 7.906287930770454e-07, - "loss": 0.6348, - "step": 67903 - }, - { - "epoch": 1.74, - "learning_rate": 7.906017359848103e-07, - "loss": 0.8193, - "step": 67904 - }, - { - "epoch": 1.74, - "learning_rate": 7.905746790529019e-07, - "loss": 0.6011, - "step": 67905 - }, - { - "epoch": 1.74, - "learning_rate": 7.905476222813408e-07, - "loss": 0.5478, - "step": 67906 - }, - { - "epoch": 1.74, - "learning_rate": 7.905205656701478e-07, - "loss": 0.7168, - "step": 67907 - }, - { - "epoch": 1.74, - "learning_rate": 7.904935092193435e-07, - "loss": 0.7432, - "step": 67908 - }, - { - "epoch": 1.74, - "learning_rate": 7.904664529289487e-07, - "loss": 0.5874, - "step": 67909 - }, - { - "epoch": 1.74, - "learning_rate": 7.904393967989845e-07, - "loss": 0.6001, - "step": 67910 - }, - { - "epoch": 1.74, - "learning_rate": 7.904123408294707e-07, - "loss": 0.6787, - "step": 67911 - }, - { - "epoch": 1.74, - "learning_rate": 7.903852850204289e-07, - "loss": 0.6519, - "step": 67912 - }, - { - "epoch": 1.74, - "learning_rate": 7.90358229371879e-07, - "loss": 0.6943, - "step": 67913 - }, - { - "epoch": 1.74, - "learning_rate": 7.903311738838425e-07, - "loss": 0.6094, - "step": 67914 - }, - { - "epoch": 1.74, - "learning_rate": 7.903041185563396e-07, - "loss": 0.6138, - "step": 67915 - }, - { - "epoch": 1.74, - "learning_rate": 7.902770633893914e-07, - "loss": 0.6323, - "step": 67916 - }, - { - "epoch": 1.74, - "learning_rate": 7.902500083830181e-07, - "loss": 0.7002, - "step": 67917 - }, - { - "epoch": 1.74, - "learning_rate": 7.902229535372411e-07, - "loss": 0.6655, - "step": 67918 - }, - { - "epoch": 1.74, - "learning_rate": 7.901958988520806e-07, - "loss": 0.6328, - "step": 67919 - }, - { - "epoch": 1.74, - "learning_rate": 7.901688443275577e-07, - "loss": 0.7627, - "step": 67920 - }, - { - "epoch": 1.74, - "learning_rate": 7.901417899636925e-07, - "loss": 0.4741, - "step": 67921 - }, - { - "epoch": 1.74, - "learning_rate": 7.901147357605063e-07, - "loss": 0.5591, - "step": 67922 - }, - { - "epoch": 1.74, - "learning_rate": 7.900876817180193e-07, - "loss": 0.5547, - "step": 67923 - }, - { - "epoch": 1.74, - "learning_rate": 7.900606278362527e-07, - "loss": 0.6318, - "step": 67924 - }, - { - "epoch": 1.74, - "learning_rate": 7.900335741152269e-07, - "loss": 0.7256, - "step": 67925 - }, - { - "epoch": 1.74, - "learning_rate": 7.900065205549629e-07, - "loss": 0.7222, - "step": 67926 - }, - { - "epoch": 1.74, - "learning_rate": 7.899794671554811e-07, - "loss": 0.6821, - "step": 67927 - }, - { - "epoch": 1.74, - "learning_rate": 7.899524139168024e-07, - "loss": 0.6064, - "step": 67928 - }, - { - "epoch": 1.74, - "learning_rate": 7.899253608389474e-07, - "loss": 0.5879, - "step": 67929 - }, - { - "epoch": 1.74, - "learning_rate": 7.898983079219375e-07, - "loss": 0.4756, - "step": 67930 - }, - { - "epoch": 1.74, - "learning_rate": 7.898712551657924e-07, - "loss": 0.6572, - "step": 67931 - }, - { - "epoch": 1.74, - "learning_rate": 7.89844202570533e-07, - "loss": 0.5518, - "step": 67932 - }, - { - "epoch": 1.74, - "learning_rate": 7.898171501361803e-07, - "loss": 0.6504, - "step": 67933 - }, - { - "epoch": 1.74, - "learning_rate": 7.89790097862755e-07, - "loss": 0.7275, - "step": 67934 - }, - { - "epoch": 1.74, - "learning_rate": 7.897630457502779e-07, - "loss": 0.5737, - "step": 67935 - }, - { - "epoch": 1.74, - "learning_rate": 7.897359937987694e-07, - "loss": 0.6396, - "step": 67936 - }, - { - "epoch": 1.74, - "learning_rate": 7.897089420082503e-07, - "loss": 0.7153, - "step": 67937 - }, - { - "epoch": 1.74, - "learning_rate": 7.896818903787417e-07, - "loss": 0.6626, - "step": 67938 - }, - { - "epoch": 1.74, - "learning_rate": 7.896548389102636e-07, - "loss": 0.6582, - "step": 67939 - }, - { - "epoch": 1.74, - "learning_rate": 7.896277876028376e-07, - "loss": 0.5659, - "step": 67940 - }, - { - "epoch": 1.74, - "learning_rate": 7.896007364564838e-07, - "loss": 0.5718, - "step": 67941 - }, - { - "epoch": 1.74, - "learning_rate": 7.895736854712228e-07, - "loss": 0.521, - "step": 67942 - }, - { - "epoch": 1.74, - "learning_rate": 7.895466346470758e-07, - "loss": 0.481, - "step": 67943 - }, - { - "epoch": 1.74, - "learning_rate": 7.895195839840629e-07, - "loss": 0.5703, - "step": 67944 - }, - { - "epoch": 1.74, - "learning_rate": 7.894925334822055e-07, - "loss": 0.6797, - "step": 67945 - }, - { - "epoch": 1.74, - "learning_rate": 7.894654831415238e-07, - "loss": 0.7227, - "step": 67946 - }, - { - "epoch": 1.74, - "learning_rate": 7.894384329620389e-07, - "loss": 0.5488, - "step": 67947 - }, - { - "epoch": 1.74, - "learning_rate": 7.894113829437711e-07, - "loss": 0.8799, - "step": 67948 - }, - { - "epoch": 1.74, - "learning_rate": 7.893843330867415e-07, - "loss": 0.7471, - "step": 67949 - }, - { - "epoch": 1.74, - "learning_rate": 7.893572833909709e-07, - "loss": 0.667, - "step": 67950 - }, - { - "epoch": 1.74, - "learning_rate": 7.893302338564793e-07, - "loss": 0.7812, - "step": 67951 - }, - { - "epoch": 1.74, - "learning_rate": 7.893031844832879e-07, - "loss": 0.5312, - "step": 67952 - }, - { - "epoch": 1.74, - "learning_rate": 7.892761352714176e-07, - "loss": 0.7744, - "step": 67953 - }, - { - "epoch": 1.74, - "learning_rate": 7.892490862208885e-07, - "loss": 0.5073, - "step": 67954 - }, - { - "epoch": 1.74, - "learning_rate": 7.89222037331722e-07, - "loss": 0.5698, - "step": 67955 - }, - { - "epoch": 1.74, - "learning_rate": 7.891949886039382e-07, - "loss": 0.5693, - "step": 67956 - }, - { - "epoch": 1.74, - "learning_rate": 7.891679400375584e-07, - "loss": 0.6553, - "step": 67957 - }, - { - "epoch": 1.74, - "learning_rate": 7.891408916326026e-07, - "loss": 0.5183, - "step": 67958 - }, - { - "epoch": 1.74, - "learning_rate": 7.891138433890923e-07, - "loss": 0.7471, - "step": 67959 - }, - { - "epoch": 1.74, - "learning_rate": 7.890867953070481e-07, - "loss": 0.6328, - "step": 67960 - }, - { - "epoch": 1.74, - "learning_rate": 7.8905974738649e-07, - "loss": 0.6597, - "step": 67961 - }, - { - "epoch": 1.74, - "learning_rate": 7.890326996274394e-07, - "loss": 0.7549, - "step": 67962 - }, - { - "epoch": 1.74, - "learning_rate": 7.890056520299164e-07, - "loss": 0.5337, - "step": 67963 - }, - { - "epoch": 1.74, - "learning_rate": 7.889786045939423e-07, - "loss": 0.6572, - "step": 67964 - }, - { - "epoch": 1.74, - "learning_rate": 7.889515573195375e-07, - "loss": 0.7441, - "step": 67965 - }, - { - "epoch": 1.74, - "learning_rate": 7.889245102067229e-07, - "loss": 0.6416, - "step": 67966 - }, - { - "epoch": 1.74, - "learning_rate": 7.888974632555189e-07, - "loss": 0.603, - "step": 67967 - }, - { - "epoch": 1.74, - "learning_rate": 7.888704164659465e-07, - "loss": 0.6787, - "step": 67968 - }, - { - "epoch": 1.74, - "learning_rate": 7.888433698380268e-07, - "loss": 0.5093, - "step": 67969 - }, - { - "epoch": 1.74, - "learning_rate": 7.888163233717796e-07, - "loss": 0.6392, - "step": 67970 - }, - { - "epoch": 1.74, - "learning_rate": 7.887892770672259e-07, - "loss": 0.7178, - "step": 67971 - }, - { - "epoch": 1.74, - "learning_rate": 7.887622309243867e-07, - "loss": 0.6035, - "step": 67972 - }, - { - "epoch": 1.74, - "learning_rate": 7.887351849432824e-07, - "loss": 0.6523, - "step": 67973 - }, - { - "epoch": 1.74, - "learning_rate": 7.887081391239341e-07, - "loss": 0.8076, - "step": 67974 - }, - { - "epoch": 1.74, - "learning_rate": 7.886810934663619e-07, - "loss": 0.644, - "step": 67975 - }, - { - "epoch": 1.74, - "learning_rate": 7.886540479705872e-07, - "loss": 0.531, - "step": 67976 - }, - { - "epoch": 1.74, - "learning_rate": 7.8862700263663e-07, - "loss": 0.6074, - "step": 67977 - }, - { - "epoch": 1.74, - "learning_rate": 7.885999574645118e-07, - "loss": 0.6582, - "step": 67978 - }, - { - "epoch": 1.74, - "learning_rate": 7.88572912454253e-07, - "loss": 0.4626, - "step": 67979 - }, - { - "epoch": 1.74, - "learning_rate": 7.885458676058739e-07, - "loss": 0.6582, - "step": 67980 - }, - { - "epoch": 1.74, - "learning_rate": 7.885188229193955e-07, - "loss": 0.5044, - "step": 67981 - }, - { - "epoch": 1.74, - "learning_rate": 7.884917783948385e-07, - "loss": 0.5811, - "step": 67982 - }, - { - "epoch": 1.74, - "learning_rate": 7.884647340322237e-07, - "loss": 0.5825, - "step": 67983 - }, - { - "epoch": 1.74, - "learning_rate": 7.884376898315717e-07, - "loss": 0.668, - "step": 67984 - }, - { - "epoch": 1.74, - "learning_rate": 7.884106457929032e-07, - "loss": 0.7217, - "step": 67985 - }, - { - "epoch": 1.74, - "learning_rate": 7.883836019162389e-07, - "loss": 0.583, - "step": 67986 - }, - { - "epoch": 1.74, - "learning_rate": 7.883565582015997e-07, - "loss": 0.71, - "step": 67987 - }, - { - "epoch": 1.74, - "learning_rate": 7.883295146490059e-07, - "loss": 0.5361, - "step": 67988 - }, - { - "epoch": 1.74, - "learning_rate": 7.883024712584792e-07, - "loss": 0.8213, - "step": 67989 - }, - { - "epoch": 1.74, - "learning_rate": 7.882754280300388e-07, - "loss": 0.6499, - "step": 67990 - }, - { - "epoch": 1.74, - "learning_rate": 7.882483849637065e-07, - "loss": 0.6914, - "step": 67991 - }, - { - "epoch": 1.74, - "learning_rate": 7.882213420595023e-07, - "loss": 0.6045, - "step": 67992 - }, - { - "epoch": 1.74, - "learning_rate": 7.881942993174477e-07, - "loss": 0.4005, - "step": 67993 - }, - { - "epoch": 1.74, - "learning_rate": 7.881672567375627e-07, - "loss": 0.5811, - "step": 67994 - }, - { - "epoch": 1.74, - "learning_rate": 7.881402143198684e-07, - "loss": 0.6016, - "step": 67995 - }, - { - "epoch": 1.74, - "learning_rate": 7.881131720643853e-07, - "loss": 0.6465, - "step": 67996 - }, - { - "epoch": 1.74, - "learning_rate": 7.880861299711343e-07, - "loss": 0.6206, - "step": 67997 - }, - { - "epoch": 1.74, - "learning_rate": 7.880590880401359e-07, - "loss": 0.7178, - "step": 67998 - }, - { - "epoch": 1.74, - "learning_rate": 7.880320462714113e-07, - "loss": 0.6631, - "step": 67999 - }, - { - "epoch": 1.74, - "learning_rate": 7.880050046649806e-07, - "loss": 0.5186, - "step": 68000 - }, - { - "epoch": 1.74, - "learning_rate": 7.879779632208645e-07, - "loss": 0.6104, - "step": 68001 - }, - { - "epoch": 1.74, - "learning_rate": 7.879509219390842e-07, - "loss": 0.7109, - "step": 68002 - }, - { - "epoch": 1.74, - "learning_rate": 7.879238808196598e-07, - "loss": 0.5667, - "step": 68003 - }, - { - "epoch": 1.74, - "learning_rate": 7.878968398626127e-07, - "loss": 0.6494, - "step": 68004 - }, - { - "epoch": 1.74, - "learning_rate": 7.878697990679629e-07, - "loss": 0.5898, - "step": 68005 - }, - { - "epoch": 1.74, - "learning_rate": 7.878427584357316e-07, - "loss": 0.5396, - "step": 68006 - }, - { - "epoch": 1.74, - "learning_rate": 7.878157179659393e-07, - "loss": 0.6377, - "step": 68007 - }, - { - "epoch": 1.74, - "learning_rate": 7.877886776586069e-07, - "loss": 0.7852, - "step": 68008 - }, - { - "epoch": 1.74, - "learning_rate": 7.877616375137551e-07, - "loss": 0.626, - "step": 68009 - }, - { - "epoch": 1.74, - "learning_rate": 7.877345975314044e-07, - "loss": 0.688, - "step": 68010 - }, - { - "epoch": 1.74, - "learning_rate": 7.877075577115751e-07, - "loss": 0.604, - "step": 68011 - }, - { - "epoch": 1.74, - "learning_rate": 7.876805180542888e-07, - "loss": 0.5244, - "step": 68012 - }, - { - "epoch": 1.74, - "learning_rate": 7.876534785595654e-07, - "loss": 0.5737, - "step": 68013 - }, - { - "epoch": 1.74, - "learning_rate": 7.876264392274263e-07, - "loss": 0.5537, - "step": 68014 - }, - { - "epoch": 1.74, - "learning_rate": 7.875994000578916e-07, - "loss": 0.6567, - "step": 68015 - }, - { - "epoch": 1.74, - "learning_rate": 7.875723610509825e-07, - "loss": 0.583, - "step": 68016 - }, - { - "epoch": 1.74, - "learning_rate": 7.875453222067192e-07, - "loss": 0.6035, - "step": 68017 - }, - { - "epoch": 1.74, - "learning_rate": 7.87518283525123e-07, - "loss": 0.5454, - "step": 68018 - }, - { - "epoch": 1.74, - "learning_rate": 7.874912450062145e-07, - "loss": 0.7573, - "step": 68019 - }, - { - "epoch": 1.74, - "learning_rate": 7.874642066500137e-07, - "loss": 0.7012, - "step": 68020 - }, - { - "epoch": 1.74, - "learning_rate": 7.87437168456542e-07, - "loss": 0.6426, - "step": 68021 - }, - { - "epoch": 1.74, - "learning_rate": 7.874101304258196e-07, - "loss": 0.6284, - "step": 68022 - }, - { - "epoch": 1.74, - "learning_rate": 7.873830925578677e-07, - "loss": 0.6377, - "step": 68023 - }, - { - "epoch": 1.74, - "learning_rate": 7.873560548527066e-07, - "loss": 0.5635, - "step": 68024 - }, - { - "epoch": 1.74, - "learning_rate": 7.873290173103575e-07, - "loss": 0.8652, - "step": 68025 - }, - { - "epoch": 1.74, - "learning_rate": 7.873019799308407e-07, - "loss": 0.7598, - "step": 68026 - }, - { - "epoch": 1.74, - "learning_rate": 7.872749427141768e-07, - "loss": 0.6621, - "step": 68027 - }, - { - "epoch": 1.74, - "learning_rate": 7.872479056603869e-07, - "loss": 0.7764, - "step": 68028 - }, - { - "epoch": 1.74, - "learning_rate": 7.872208687694918e-07, - "loss": 0.5459, - "step": 68029 - }, - { - "epoch": 1.74, - "learning_rate": 7.871938320415114e-07, - "loss": 0.345, - "step": 68030 - }, - { - "epoch": 1.74, - "learning_rate": 7.871667954764671e-07, - "loss": 0.5024, - "step": 68031 - }, - { - "epoch": 1.74, - "learning_rate": 7.871397590743792e-07, - "loss": 0.6045, - "step": 68032 - }, - { - "epoch": 1.74, - "learning_rate": 7.871127228352689e-07, - "loss": 0.7168, - "step": 68033 - }, - { - "epoch": 1.74, - "learning_rate": 7.870856867591563e-07, - "loss": 0.6377, - "step": 68034 - }, - { - "epoch": 1.74, - "learning_rate": 7.870586508460627e-07, - "loss": 0.686, - "step": 68035 - }, - { - "epoch": 1.74, - "learning_rate": 7.87031615096008e-07, - "loss": 0.6069, - "step": 68036 - }, - { - "epoch": 1.74, - "learning_rate": 7.870045795090139e-07, - "loss": 0.6335, - "step": 68037 - }, - { - "epoch": 1.74, - "learning_rate": 7.869775440851002e-07, - "loss": 0.5981, - "step": 68038 - }, - { - "epoch": 1.74, - "learning_rate": 7.869505088242886e-07, - "loss": 0.5811, - "step": 68039 - }, - { - "epoch": 1.74, - "learning_rate": 7.869234737265988e-07, - "loss": 0.5469, - "step": 68040 - }, - { - "epoch": 1.74, - "learning_rate": 7.868964387920519e-07, - "loss": 0.665, - "step": 68041 - }, - { - "epoch": 1.74, - "learning_rate": 7.868694040206687e-07, - "loss": 0.6914, - "step": 68042 - }, - { - "epoch": 1.74, - "learning_rate": 7.868423694124698e-07, - "loss": 0.7334, - "step": 68043 - }, - { - "epoch": 1.74, - "learning_rate": 7.868153349674757e-07, - "loss": 0.6328, - "step": 68044 - }, - { - "epoch": 1.74, - "learning_rate": 7.867883006857074e-07, - "loss": 0.6191, - "step": 68045 - }, - { - "epoch": 1.74, - "learning_rate": 7.867612665671855e-07, - "loss": 0.3959, - "step": 68046 - }, - { - "epoch": 1.74, - "learning_rate": 7.867342326119307e-07, - "loss": 0.6914, - "step": 68047 - }, - { - "epoch": 1.74, - "learning_rate": 7.867071988199637e-07, - "loss": 0.7129, - "step": 68048 - }, - { - "epoch": 1.74, - "learning_rate": 7.866801651913053e-07, - "loss": 0.7109, - "step": 68049 - }, - { - "epoch": 1.74, - "learning_rate": 7.866531317259761e-07, - "loss": 0.6885, - "step": 68050 - }, - { - "epoch": 1.74, - "learning_rate": 7.866260984239966e-07, - "loss": 0.6396, - "step": 68051 - }, - { - "epoch": 1.74, - "learning_rate": 7.865990652853878e-07, - "loss": 0.7266, - "step": 68052 - }, - { - "epoch": 1.74, - "learning_rate": 7.8657203231017e-07, - "loss": 0.5115, - "step": 68053 - }, - { - "epoch": 1.74, - "learning_rate": 7.865449994983645e-07, - "loss": 0.7041, - "step": 68054 - }, - { - "epoch": 1.74, - "learning_rate": 7.865179668499915e-07, - "loss": 0.6846, - "step": 68055 - }, - { - "epoch": 1.74, - "learning_rate": 7.864909343650721e-07, - "loss": 0.6919, - "step": 68056 - }, - { - "epoch": 1.74, - "learning_rate": 7.864639020436265e-07, - "loss": 0.6562, - "step": 68057 - }, - { - "epoch": 1.74, - "learning_rate": 7.864368698856758e-07, - "loss": 0.6621, - "step": 68058 - }, - { - "epoch": 1.74, - "learning_rate": 7.86409837891241e-07, - "loss": 0.6099, - "step": 68059 - }, - { - "epoch": 1.74, - "learning_rate": 7.863828060603419e-07, - "loss": 0.4417, - "step": 68060 - }, - { - "epoch": 1.74, - "learning_rate": 7.863557743929997e-07, - "loss": 0.7803, - "step": 68061 - }, - { - "epoch": 1.74, - "learning_rate": 7.863287428892351e-07, - "loss": 0.4756, - "step": 68062 - }, - { - "epoch": 1.74, - "learning_rate": 7.863017115490685e-07, - "loss": 0.7402, - "step": 68063 - }, - { - "epoch": 1.74, - "learning_rate": 7.862746803725212e-07, - "loss": 0.6719, - "step": 68064 - }, - { - "epoch": 1.74, - "learning_rate": 7.862476493596133e-07, - "loss": 0.5491, - "step": 68065 - }, - { - "epoch": 1.74, - "learning_rate": 7.86220618510366e-07, - "loss": 0.4438, - "step": 68066 - }, - { - "epoch": 1.74, - "learning_rate": 7.861935878247994e-07, - "loss": 0.6963, - "step": 68067 - }, - { - "epoch": 1.74, - "learning_rate": 7.861665573029348e-07, - "loss": 0.5903, - "step": 68068 - }, - { - "epoch": 1.74, - "learning_rate": 7.86139526944793e-07, - "loss": 0.4945, - "step": 68069 - }, - { - "epoch": 1.74, - "learning_rate": 7.861124967503937e-07, - "loss": 0.5811, - "step": 68070 - }, - { - "epoch": 1.74, - "learning_rate": 7.860854667197585e-07, - "loss": 0.4714, - "step": 68071 - }, - { - "epoch": 1.74, - "learning_rate": 7.860584368529077e-07, - "loss": 0.8369, - "step": 68072 - }, - { - "epoch": 1.74, - "learning_rate": 7.860314071498622e-07, - "loss": 0.5137, - "step": 68073 - }, - { - "epoch": 1.74, - "learning_rate": 7.860043776106425e-07, - "loss": 0.6396, - "step": 68074 - }, - { - "epoch": 1.74, - "learning_rate": 7.859773482352696e-07, - "loss": 0.707, - "step": 68075 - }, - { - "epoch": 1.74, - "learning_rate": 7.859503190237638e-07, - "loss": 0.8359, - "step": 68076 - }, - { - "epoch": 1.74, - "learning_rate": 7.859232899761462e-07, - "loss": 0.5977, - "step": 68077 - }, - { - "epoch": 1.74, - "learning_rate": 7.858962610924371e-07, - "loss": 0.6343, - "step": 68078 - }, - { - "epoch": 1.74, - "learning_rate": 7.85869232372658e-07, - "loss": 0.751, - "step": 68079 - }, - { - "epoch": 1.74, - "learning_rate": 7.858422038168283e-07, - "loss": 0.5752, - "step": 68080 - }, - { - "epoch": 1.74, - "learning_rate": 7.858151754249697e-07, - "loss": 0.6309, - "step": 68081 - }, - { - "epoch": 1.74, - "learning_rate": 7.857881471971022e-07, - "loss": 0.6885, - "step": 68082 - }, - { - "epoch": 1.75, - "learning_rate": 7.857611191332471e-07, - "loss": 0.7949, - "step": 68083 - }, - { - "epoch": 1.75, - "learning_rate": 7.857340912334249e-07, - "loss": 0.6909, - "step": 68084 - }, - { - "epoch": 1.75, - "learning_rate": 7.857070634976562e-07, - "loss": 0.561, - "step": 68085 - }, - { - "epoch": 1.75, - "learning_rate": 7.856800359259616e-07, - "loss": 0.5364, - "step": 68086 - }, - { - "epoch": 1.75, - "learning_rate": 7.856530085183621e-07, - "loss": 0.7686, - "step": 68087 - }, - { - "epoch": 1.75, - "learning_rate": 7.856259812748782e-07, - "loss": 0.5889, - "step": 68088 - }, - { - "epoch": 1.75, - "learning_rate": 7.85598954195531e-07, - "loss": 0.6255, - "step": 68089 - }, - { - "epoch": 1.75, - "learning_rate": 7.855719272803404e-07, - "loss": 0.6816, - "step": 68090 - }, - { - "epoch": 1.75, - "learning_rate": 7.855449005293276e-07, - "loss": 0.5381, - "step": 68091 - }, - { - "epoch": 1.75, - "learning_rate": 7.855178739425132e-07, - "loss": 0.5723, - "step": 68092 - }, - { - "epoch": 1.75, - "learning_rate": 7.854908475199178e-07, - "loss": 0.7227, - "step": 68093 - }, - { - "epoch": 1.75, - "learning_rate": 7.854638212615624e-07, - "loss": 0.75, - "step": 68094 - }, - { - "epoch": 1.75, - "learning_rate": 7.854367951674673e-07, - "loss": 0.7041, - "step": 68095 - }, - { - "epoch": 1.75, - "learning_rate": 7.854097692376535e-07, - "loss": 0.623, - "step": 68096 - }, - { - "epoch": 1.75, - "learning_rate": 7.853827434721414e-07, - "loss": 0.6855, - "step": 68097 - }, - { - "epoch": 1.75, - "learning_rate": 7.853557178709521e-07, - "loss": 0.689, - "step": 68098 - }, - { - "epoch": 1.75, - "learning_rate": 7.853286924341063e-07, - "loss": 0.6841, - "step": 68099 - }, - { - "epoch": 1.75, - "learning_rate": 7.853016671616242e-07, - "loss": 0.6802, - "step": 68100 - }, - { - "epoch": 1.75, - "learning_rate": 7.852746420535265e-07, - "loss": 0.5791, - "step": 68101 - }, - { - "epoch": 1.75, - "learning_rate": 7.852476171098343e-07, - "loss": 0.6465, - "step": 68102 - }, - { - "epoch": 1.75, - "learning_rate": 7.85220592330568e-07, - "loss": 0.6733, - "step": 68103 - }, - { - "epoch": 1.75, - "learning_rate": 7.851935677157486e-07, - "loss": 0.583, - "step": 68104 - }, - { - "epoch": 1.75, - "learning_rate": 7.851665432653965e-07, - "loss": 0.7285, - "step": 68105 - }, - { - "epoch": 1.75, - "learning_rate": 7.851395189795326e-07, - "loss": 0.6992, - "step": 68106 - }, - { - "epoch": 1.75, - "learning_rate": 7.851124948581773e-07, - "loss": 0.4077, - "step": 68107 - }, - { - "epoch": 1.75, - "learning_rate": 7.850854709013517e-07, - "loss": 0.5283, - "step": 68108 - }, - { - "epoch": 1.75, - "learning_rate": 7.850584471090764e-07, - "loss": 0.4645, - "step": 68109 - }, - { - "epoch": 1.75, - "learning_rate": 7.850314234813716e-07, - "loss": 0.709, - "step": 68110 - }, - { - "epoch": 1.75, - "learning_rate": 7.850044000182586e-07, - "loss": 0.5969, - "step": 68111 - }, - { - "epoch": 1.75, - "learning_rate": 7.849773767197577e-07, - "loss": 0.5864, - "step": 68112 - }, - { - "epoch": 1.75, - "learning_rate": 7.849503535858898e-07, - "loss": 0.5864, - "step": 68113 - }, - { - "epoch": 1.75, - "learning_rate": 7.849233306166754e-07, - "loss": 0.6587, - "step": 68114 - }, - { - "epoch": 1.75, - "learning_rate": 7.848963078121354e-07, - "loss": 0.6829, - "step": 68115 - }, - { - "epoch": 1.75, - "learning_rate": 7.848692851722906e-07, - "loss": 0.6641, - "step": 68116 - }, - { - "epoch": 1.75, - "learning_rate": 7.848422626971611e-07, - "loss": 0.5522, - "step": 68117 - }, - { - "epoch": 1.75, - "learning_rate": 7.848152403867684e-07, - "loss": 0.5552, - "step": 68118 - }, - { - "epoch": 1.75, - "learning_rate": 7.847882182411328e-07, - "loss": 0.7305, - "step": 68119 - }, - { - "epoch": 1.75, - "learning_rate": 7.847611962602747e-07, - "loss": 0.6162, - "step": 68120 - }, - { - "epoch": 1.75, - "learning_rate": 7.847341744442152e-07, - "loss": 0.5938, - "step": 68121 - }, - { - "epoch": 1.75, - "learning_rate": 7.847071527929747e-07, - "loss": 0.8057, - "step": 68122 - }, - { - "epoch": 1.75, - "learning_rate": 7.846801313065741e-07, - "loss": 0.5981, - "step": 68123 - }, - { - "epoch": 1.75, - "learning_rate": 7.846531099850338e-07, - "loss": 0.4714, - "step": 68124 - }, - { - "epoch": 1.75, - "learning_rate": 7.84626088828375e-07, - "loss": 0.6084, - "step": 68125 - }, - { - "epoch": 1.75, - "learning_rate": 7.845990678366179e-07, - "loss": 0.6523, - "step": 68126 - }, - { - "epoch": 1.75, - "learning_rate": 7.845720470097837e-07, - "loss": 0.665, - "step": 68127 - }, - { - "epoch": 1.75, - "learning_rate": 7.845450263478923e-07, - "loss": 0.6431, - "step": 68128 - }, - { - "epoch": 1.75, - "learning_rate": 7.845180058509655e-07, - "loss": 0.7139, - "step": 68129 - }, - { - "epoch": 1.75, - "learning_rate": 7.844909855190231e-07, - "loss": 0.6089, - "step": 68130 - }, - { - "epoch": 1.75, - "learning_rate": 7.844639653520858e-07, - "loss": 0.5869, - "step": 68131 - }, - { - "epoch": 1.75, - "learning_rate": 7.844369453501748e-07, - "loss": 0.492, - "step": 68132 - }, - { - "epoch": 1.75, - "learning_rate": 7.844099255133105e-07, - "loss": 0.6753, - "step": 68133 - }, - { - "epoch": 1.75, - "learning_rate": 7.843829058415134e-07, - "loss": 0.644, - "step": 68134 - }, - { - "epoch": 1.75, - "learning_rate": 7.843558863348045e-07, - "loss": 0.6504, - "step": 68135 - }, - { - "epoch": 1.75, - "learning_rate": 7.843288669932043e-07, - "loss": 0.6504, - "step": 68136 - }, - { - "epoch": 1.75, - "learning_rate": 7.843018478167338e-07, - "loss": 0.6694, - "step": 68137 - }, - { - "epoch": 1.75, - "learning_rate": 7.84274828805413e-07, - "loss": 0.6128, - "step": 68138 - }, - { - "epoch": 1.75, - "learning_rate": 7.842478099592638e-07, - "loss": 0.3174, - "step": 68139 - }, - { - "epoch": 1.75, - "learning_rate": 7.842207912783058e-07, - "loss": 0.5105, - "step": 68140 - }, - { - "epoch": 1.75, - "learning_rate": 7.841937727625597e-07, - "loss": 0.6016, - "step": 68141 - }, - { - "epoch": 1.75, - "learning_rate": 7.841667544120468e-07, - "loss": 0.5889, - "step": 68142 - }, - { - "epoch": 1.75, - "learning_rate": 7.841397362267873e-07, - "loss": 0.5166, - "step": 68143 - }, - { - "epoch": 1.75, - "learning_rate": 7.841127182068023e-07, - "loss": 0.4692, - "step": 68144 - }, - { - "epoch": 1.75, - "learning_rate": 7.84085700352112e-07, - "loss": 0.5498, - "step": 68145 - }, - { - "epoch": 1.75, - "learning_rate": 7.840586826627375e-07, - "loss": 0.6562, - "step": 68146 - }, - { - "epoch": 1.75, - "learning_rate": 7.840316651386992e-07, - "loss": 0.6309, - "step": 68147 - }, - { - "epoch": 1.75, - "learning_rate": 7.840046477800182e-07, - "loss": 0.7202, - "step": 68148 - }, - { - "epoch": 1.75, - "learning_rate": 7.83977630586715e-07, - "loss": 0.8574, - "step": 68149 - }, - { - "epoch": 1.75, - "learning_rate": 7.839506135588101e-07, - "loss": 0.707, - "step": 68150 - }, - { - "epoch": 1.75, - "learning_rate": 7.83923596696324e-07, - "loss": 0.7227, - "step": 68151 - }, - { - "epoch": 1.75, - "learning_rate": 7.838965799992779e-07, - "loss": 0.6016, - "step": 68152 - }, - { - "epoch": 1.75, - "learning_rate": 7.83869563467692e-07, - "loss": 0.8447, - "step": 68153 - }, - { - "epoch": 1.75, - "learning_rate": 7.838425471015875e-07, - "loss": 0.4248, - "step": 68154 - }, - { - "epoch": 1.75, - "learning_rate": 7.838155309009846e-07, - "loss": 0.7051, - "step": 68155 - }, - { - "epoch": 1.75, - "learning_rate": 7.837885148659045e-07, - "loss": 0.4003, - "step": 68156 - }, - { - "epoch": 1.75, - "learning_rate": 7.837614989963672e-07, - "loss": 0.6201, - "step": 68157 - }, - { - "epoch": 1.75, - "learning_rate": 7.837344832923941e-07, - "loss": 0.6118, - "step": 68158 - }, - { - "epoch": 1.75, - "learning_rate": 7.837074677540057e-07, - "loss": 0.4536, - "step": 68159 - }, - { - "epoch": 1.75, - "learning_rate": 7.836804523812223e-07, - "loss": 0.5183, - "step": 68160 - }, - { - "epoch": 1.75, - "learning_rate": 7.836534371740648e-07, - "loss": 0.6338, - "step": 68161 - }, - { - "epoch": 1.75, - "learning_rate": 7.836264221325539e-07, - "loss": 0.6328, - "step": 68162 - }, - { - "epoch": 1.75, - "learning_rate": 7.835994072567105e-07, - "loss": 0.6807, - "step": 68163 - }, - { - "epoch": 1.75, - "learning_rate": 7.835723925465547e-07, - "loss": 0.7041, - "step": 68164 - }, - { - "epoch": 1.75, - "learning_rate": 7.835453780021079e-07, - "loss": 0.5674, - "step": 68165 - }, - { - "epoch": 1.75, - "learning_rate": 7.835183636233903e-07, - "loss": 0.6104, - "step": 68166 - }, - { - "epoch": 1.75, - "learning_rate": 7.834913494104228e-07, - "loss": 0.6709, - "step": 68167 - }, - { - "epoch": 1.75, - "learning_rate": 7.834643353632259e-07, - "loss": 0.6816, - "step": 68168 - }, - { - "epoch": 1.75, - "learning_rate": 7.834373214818211e-07, - "loss": 0.7207, - "step": 68169 - }, - { - "epoch": 1.75, - "learning_rate": 7.834103077662276e-07, - "loss": 0.6968, - "step": 68170 - }, - { - "epoch": 1.75, - "learning_rate": 7.833832942164672e-07, - "loss": 0.6348, - "step": 68171 - }, - { - "epoch": 1.75, - "learning_rate": 7.8335628083256e-07, - "loss": 0.5542, - "step": 68172 - }, - { - "epoch": 1.75, - "learning_rate": 7.833292676145271e-07, - "loss": 0.5869, - "step": 68173 - }, - { - "epoch": 1.75, - "learning_rate": 7.833022545623889e-07, - "loss": 0.5481, - "step": 68174 - }, - { - "epoch": 1.75, - "learning_rate": 7.832752416761663e-07, - "loss": 0.7207, - "step": 68175 - }, - { - "epoch": 1.75, - "learning_rate": 7.832482289558798e-07, - "loss": 0.5957, - "step": 68176 - }, - { - "epoch": 1.75, - "learning_rate": 7.832212164015501e-07, - "loss": 0.5664, - "step": 68177 - }, - { - "epoch": 1.75, - "learning_rate": 7.831942040131981e-07, - "loss": 0.8555, - "step": 68178 - }, - { - "epoch": 1.75, - "learning_rate": 7.831671917908445e-07, - "loss": 0.5308, - "step": 68179 - }, - { - "epoch": 1.75, - "learning_rate": 7.831401797345096e-07, - "loss": 0.6807, - "step": 68180 - }, - { - "epoch": 1.75, - "learning_rate": 7.831131678442142e-07, - "loss": 0.7178, - "step": 68181 - }, - { - "epoch": 1.75, - "learning_rate": 7.830861561199793e-07, - "loss": 0.7119, - "step": 68182 - }, - { - "epoch": 1.75, - "learning_rate": 7.830591445618251e-07, - "loss": 0.7598, - "step": 68183 - }, - { - "epoch": 1.75, - "learning_rate": 7.830321331697727e-07, - "loss": 0.5439, - "step": 68184 - }, - { - "epoch": 1.75, - "learning_rate": 7.830051219438425e-07, - "loss": 0.8105, - "step": 68185 - }, - { - "epoch": 1.75, - "learning_rate": 7.829781108840554e-07, - "loss": 0.6992, - "step": 68186 - }, - { - "epoch": 1.75, - "learning_rate": 7.829510999904318e-07, - "loss": 0.6885, - "step": 68187 - }, - { - "epoch": 1.75, - "learning_rate": 7.829240892629929e-07, - "loss": 0.7681, - "step": 68188 - }, - { - "epoch": 1.75, - "learning_rate": 7.828970787017591e-07, - "loss": 0.4771, - "step": 68189 - }, - { - "epoch": 1.75, - "learning_rate": 7.82870068306751e-07, - "loss": 0.543, - "step": 68190 - }, - { - "epoch": 1.75, - "learning_rate": 7.828430580779889e-07, - "loss": 0.6592, - "step": 68191 - }, - { - "epoch": 1.75, - "learning_rate": 7.828160480154942e-07, - "loss": 0.6592, - "step": 68192 - }, - { - "epoch": 1.75, - "learning_rate": 7.82789038119287e-07, - "loss": 0.583, - "step": 68193 - }, - { - "epoch": 1.75, - "learning_rate": 7.827620283893885e-07, - "loss": 0.5742, - "step": 68194 - }, - { - "epoch": 1.75, - "learning_rate": 7.827350188258188e-07, - "loss": 0.7373, - "step": 68195 - }, - { - "epoch": 1.75, - "learning_rate": 7.827080094285993e-07, - "loss": 0.5669, - "step": 68196 - }, - { - "epoch": 1.75, - "learning_rate": 7.826810001977499e-07, - "loss": 0.5103, - "step": 68197 - }, - { - "epoch": 1.75, - "learning_rate": 7.82653991133292e-07, - "loss": 0.6616, - "step": 68198 - }, - { - "epoch": 1.75, - "learning_rate": 7.826269822352461e-07, - "loss": 0.6396, - "step": 68199 - }, - { - "epoch": 1.75, - "learning_rate": 7.825999735036324e-07, - "loss": 0.563, - "step": 68200 - }, - { - "epoch": 1.75, - "learning_rate": 7.825729649384721e-07, - "loss": 0.5472, - "step": 68201 - }, - { - "epoch": 1.75, - "learning_rate": 7.825459565397853e-07, - "loss": 0.687, - "step": 68202 - }, - { - "epoch": 1.75, - "learning_rate": 7.825189483075934e-07, - "loss": 0.7207, - "step": 68203 - }, - { - "epoch": 1.75, - "learning_rate": 7.824919402419165e-07, - "loss": 0.4476, - "step": 68204 - }, - { - "epoch": 1.75, - "learning_rate": 7.824649323427758e-07, - "loss": 0.748, - "step": 68205 - }, - { - "epoch": 1.75, - "learning_rate": 7.824379246101916e-07, - "loss": 0.5908, - "step": 68206 - }, - { - "epoch": 1.75, - "learning_rate": 7.824109170441845e-07, - "loss": 0.5562, - "step": 68207 - }, - { - "epoch": 1.75, - "learning_rate": 7.823839096447755e-07, - "loss": 0.5332, - "step": 68208 - }, - { - "epoch": 1.75, - "learning_rate": 7.823569024119855e-07, - "loss": 0.6729, - "step": 68209 - }, - { - "epoch": 1.75, - "learning_rate": 7.823298953458343e-07, - "loss": 0.6772, - "step": 68210 - }, - { - "epoch": 1.75, - "learning_rate": 7.823028884463433e-07, - "loss": 0.6113, - "step": 68211 - }, - { - "epoch": 1.75, - "learning_rate": 7.822758817135328e-07, - "loss": 0.7334, - "step": 68212 - }, - { - "epoch": 1.75, - "learning_rate": 7.822488751474239e-07, - "loss": 0.7144, - "step": 68213 - }, - { - "epoch": 1.75, - "learning_rate": 7.822218687480366e-07, - "loss": 0.6479, - "step": 68214 - }, - { - "epoch": 1.75, - "learning_rate": 7.821948625153924e-07, - "loss": 0.7354, - "step": 68215 - }, - { - "epoch": 1.75, - "learning_rate": 7.821678564495114e-07, - "loss": 0.7207, - "step": 68216 - }, - { - "epoch": 1.75, - "learning_rate": 7.821408505504146e-07, - "loss": 0.6772, - "step": 68217 - }, - { - "epoch": 1.75, - "learning_rate": 7.821138448181222e-07, - "loss": 0.6611, - "step": 68218 - }, - { - "epoch": 1.75, - "learning_rate": 7.820868392526557e-07, - "loss": 0.8555, - "step": 68219 - }, - { - "epoch": 1.75, - "learning_rate": 7.820598338540351e-07, - "loss": 0.6133, - "step": 68220 - }, - { - "epoch": 1.75, - "learning_rate": 7.820328286222812e-07, - "loss": 0.7725, - "step": 68221 - }, - { - "epoch": 1.75, - "learning_rate": 7.820058235574147e-07, - "loss": 0.5161, - "step": 68222 - }, - { - "epoch": 1.75, - "learning_rate": 7.819788186594565e-07, - "loss": 0.6245, - "step": 68223 - }, - { - "epoch": 1.75, - "learning_rate": 7.819518139284268e-07, - "loss": 0.6196, - "step": 68224 - }, - { - "epoch": 1.75, - "learning_rate": 7.819248093643468e-07, - "loss": 0.6121, - "step": 68225 - }, - { - "epoch": 1.75, - "learning_rate": 7.818978049672368e-07, - "loss": 0.707, - "step": 68226 - }, - { - "epoch": 1.75, - "learning_rate": 7.818708007371178e-07, - "loss": 0.5996, - "step": 68227 - }, - { - "epoch": 1.75, - "learning_rate": 7.8184379667401e-07, - "loss": 0.8438, - "step": 68228 - }, - { - "epoch": 1.75, - "learning_rate": 7.818167927779349e-07, - "loss": 0.6211, - "step": 68229 - }, - { - "epoch": 1.75, - "learning_rate": 7.817897890489123e-07, - "loss": 0.6709, - "step": 68230 - }, - { - "epoch": 1.75, - "learning_rate": 7.817627854869631e-07, - "loss": 0.6362, - "step": 68231 - }, - { - "epoch": 1.75, - "learning_rate": 7.817357820921083e-07, - "loss": 0.601, - "step": 68232 - }, - { - "epoch": 1.75, - "learning_rate": 7.817087788643683e-07, - "loss": 0.7339, - "step": 68233 - }, - { - "epoch": 1.75, - "learning_rate": 7.816817758037639e-07, - "loss": 0.6357, - "step": 68234 - }, - { - "epoch": 1.75, - "learning_rate": 7.816547729103155e-07, - "loss": 0.4135, - "step": 68235 - }, - { - "epoch": 1.75, - "learning_rate": 7.816277701840444e-07, - "loss": 0.6069, - "step": 68236 - }, - { - "epoch": 1.75, - "learning_rate": 7.816007676249704e-07, - "loss": 0.7012, - "step": 68237 - }, - { - "epoch": 1.75, - "learning_rate": 7.81573765233115e-07, - "loss": 0.6396, - "step": 68238 - }, - { - "epoch": 1.75, - "learning_rate": 7.815467630084988e-07, - "loss": 0.7627, - "step": 68239 - }, - { - "epoch": 1.75, - "learning_rate": 7.815197609511419e-07, - "loss": 0.4907, - "step": 68240 - }, - { - "epoch": 1.75, - "learning_rate": 7.814927590610651e-07, - "loss": 0.502, - "step": 68241 - }, - { - "epoch": 1.75, - "learning_rate": 7.814657573382894e-07, - "loss": 0.7959, - "step": 68242 - }, - { - "epoch": 1.75, - "learning_rate": 7.814387557828352e-07, - "loss": 0.6279, - "step": 68243 - }, - { - "epoch": 1.75, - "learning_rate": 7.814117543947234e-07, - "loss": 0.6895, - "step": 68244 - }, - { - "epoch": 1.75, - "learning_rate": 7.813847531739744e-07, - "loss": 0.5688, - "step": 68245 - }, - { - "epoch": 1.75, - "learning_rate": 7.813577521206092e-07, - "loss": 0.4875, - "step": 68246 - }, - { - "epoch": 1.75, - "learning_rate": 7.813307512346483e-07, - "loss": 0.6187, - "step": 68247 - }, - { - "epoch": 1.75, - "learning_rate": 7.813037505161124e-07, - "loss": 0.5996, - "step": 68248 - }, - { - "epoch": 1.75, - "learning_rate": 7.812767499650225e-07, - "loss": 0.7197, - "step": 68249 - }, - { - "epoch": 1.75, - "learning_rate": 7.812497495813984e-07, - "loss": 0.6675, - "step": 68250 - }, - { - "epoch": 1.75, - "learning_rate": 7.812227493652616e-07, - "loss": 0.6201, - "step": 68251 - }, - { - "epoch": 1.75, - "learning_rate": 7.811957493166322e-07, - "loss": 0.5942, - "step": 68252 - }, - { - "epoch": 1.75, - "learning_rate": 7.811687494355315e-07, - "loss": 0.5859, - "step": 68253 - }, - { - "epoch": 1.75, - "learning_rate": 7.811417497219794e-07, - "loss": 0.6558, - "step": 68254 - }, - { - "epoch": 1.75, - "learning_rate": 7.811147501759974e-07, - "loss": 0.5127, - "step": 68255 - }, - { - "epoch": 1.75, - "learning_rate": 7.810877507976055e-07, - "loss": 0.7168, - "step": 68256 - }, - { - "epoch": 1.75, - "learning_rate": 7.810607515868248e-07, - "loss": 0.7295, - "step": 68257 - }, - { - "epoch": 1.75, - "learning_rate": 7.810337525436758e-07, - "loss": 0.3813, - "step": 68258 - }, - { - "epoch": 1.75, - "learning_rate": 7.810067536681796e-07, - "loss": 0.5516, - "step": 68259 - }, - { - "epoch": 1.75, - "learning_rate": 7.80979754960356e-07, - "loss": 0.6631, - "step": 68260 - }, - { - "epoch": 1.75, - "learning_rate": 7.809527564202261e-07, - "loss": 0.5303, - "step": 68261 - }, - { - "epoch": 1.75, - "learning_rate": 7.809257580478106e-07, - "loss": 0.6118, - "step": 68262 - }, - { - "epoch": 1.75, - "learning_rate": 7.808987598431302e-07, - "loss": 0.7227, - "step": 68263 - }, - { - "epoch": 1.75, - "learning_rate": 7.808717618062055e-07, - "loss": 0.8096, - "step": 68264 - }, - { - "epoch": 1.75, - "learning_rate": 7.808447639370575e-07, - "loss": 0.5527, - "step": 68265 - }, - { - "epoch": 1.75, - "learning_rate": 7.808177662357062e-07, - "loss": 0.5879, - "step": 68266 - }, - { - "epoch": 1.75, - "learning_rate": 7.80790768702173e-07, - "loss": 0.7275, - "step": 68267 - }, - { - "epoch": 1.75, - "learning_rate": 7.807637713364783e-07, - "loss": 0.6421, - "step": 68268 - }, - { - "epoch": 1.75, - "learning_rate": 7.807367741386423e-07, - "loss": 0.7393, - "step": 68269 - }, - { - "epoch": 1.75, - "learning_rate": 7.807097771086864e-07, - "loss": 0.5476, - "step": 68270 - }, - { - "epoch": 1.75, - "learning_rate": 7.806827802466306e-07, - "loss": 0.6787, - "step": 68271 - }, - { - "epoch": 1.75, - "learning_rate": 7.806557835524962e-07, - "loss": 0.7422, - "step": 68272 - }, - { - "epoch": 1.75, - "learning_rate": 7.806287870263034e-07, - "loss": 0.4905, - "step": 68273 - }, - { - "epoch": 1.75, - "learning_rate": 7.806017906680732e-07, - "loss": 0.6553, - "step": 68274 - }, - { - "epoch": 1.75, - "learning_rate": 7.805747944778258e-07, - "loss": 0.5889, - "step": 68275 - }, - { - "epoch": 1.75, - "learning_rate": 7.805477984555826e-07, - "loss": 0.5552, - "step": 68276 - }, - { - "epoch": 1.75, - "learning_rate": 7.805208026013636e-07, - "loss": 0.7104, - "step": 68277 - }, - { - "epoch": 1.75, - "learning_rate": 7.804938069151903e-07, - "loss": 0.6284, - "step": 68278 - }, - { - "epoch": 1.75, - "learning_rate": 7.804668113970822e-07, - "loss": 0.6123, - "step": 68279 - }, - { - "epoch": 1.75, - "learning_rate": 7.804398160470608e-07, - "loss": 0.8096, - "step": 68280 - }, - { - "epoch": 1.75, - "learning_rate": 7.804128208651462e-07, - "loss": 0.6104, - "step": 68281 - }, - { - "epoch": 1.75, - "learning_rate": 7.803858258513598e-07, - "loss": 0.6494, - "step": 68282 - }, - { - "epoch": 1.75, - "learning_rate": 7.803588310057216e-07, - "loss": 0.6484, - "step": 68283 - }, - { - "epoch": 1.75, - "learning_rate": 7.803318363282527e-07, - "loss": 0.5962, - "step": 68284 - }, - { - "epoch": 1.75, - "learning_rate": 7.803048418189734e-07, - "loss": 0.7168, - "step": 68285 - }, - { - "epoch": 1.75, - "learning_rate": 7.802778474779049e-07, - "loss": 0.625, - "step": 68286 - }, - { - "epoch": 1.75, - "learning_rate": 7.802508533050673e-07, - "loss": 0.7275, - "step": 68287 - }, - { - "epoch": 1.75, - "learning_rate": 7.802238593004819e-07, - "loss": 0.6875, - "step": 68288 - }, - { - "epoch": 1.75, - "learning_rate": 7.801968654641688e-07, - "loss": 0.562, - "step": 68289 - }, - { - "epoch": 1.75, - "learning_rate": 7.801698717961485e-07, - "loss": 0.6885, - "step": 68290 - }, - { - "epoch": 1.75, - "learning_rate": 7.801428782964424e-07, - "loss": 0.5723, - "step": 68291 - }, - { - "epoch": 1.75, - "learning_rate": 7.801158849650706e-07, - "loss": 0.626, - "step": 68292 - }, - { - "epoch": 1.75, - "learning_rate": 7.80088891802054e-07, - "loss": 0.8223, - "step": 68293 - }, - { - "epoch": 1.75, - "learning_rate": 7.800618988074132e-07, - "loss": 0.6973, - "step": 68294 - }, - { - "epoch": 1.75, - "learning_rate": 7.80034905981169e-07, - "loss": 0.7285, - "step": 68295 - }, - { - "epoch": 1.75, - "learning_rate": 7.80007913323342e-07, - "loss": 0.5414, - "step": 68296 - }, - { - "epoch": 1.75, - "learning_rate": 7.799809208339525e-07, - "loss": 0.6592, - "step": 68297 - }, - { - "epoch": 1.75, - "learning_rate": 7.799539285130221e-07, - "loss": 0.7637, - "step": 68298 - }, - { - "epoch": 1.75, - "learning_rate": 7.799269363605705e-07, - "loss": 0.7119, - "step": 68299 - }, - { - "epoch": 1.75, - "learning_rate": 7.798999443766185e-07, - "loss": 0.5776, - "step": 68300 - }, - { - "epoch": 1.75, - "learning_rate": 7.798729525611874e-07, - "loss": 0.561, - "step": 68301 - }, - { - "epoch": 1.75, - "learning_rate": 7.798459609142971e-07, - "loss": 0.5859, - "step": 68302 - }, - { - "epoch": 1.75, - "learning_rate": 7.798189694359688e-07, - "loss": 0.666, - "step": 68303 - }, - { - "epoch": 1.75, - "learning_rate": 7.797919781262229e-07, - "loss": 0.5781, - "step": 68304 - }, - { - "epoch": 1.75, - "learning_rate": 7.797649869850802e-07, - "loss": 0.7363, - "step": 68305 - }, - { - "epoch": 1.75, - "learning_rate": 7.797379960125613e-07, - "loss": 0.5952, - "step": 68306 - }, - { - "epoch": 1.75, - "learning_rate": 7.79711005208687e-07, - "loss": 0.667, - "step": 68307 - }, - { - "epoch": 1.75, - "learning_rate": 7.796840145734781e-07, - "loss": 0.7256, - "step": 68308 - }, - { - "epoch": 1.75, - "learning_rate": 7.796570241069545e-07, - "loss": 0.5245, - "step": 68309 - }, - { - "epoch": 1.75, - "learning_rate": 7.796300338091378e-07, - "loss": 0.6509, - "step": 68310 - }, - { - "epoch": 1.75, - "learning_rate": 7.796030436800479e-07, - "loss": 0.7451, - "step": 68311 - }, - { - "epoch": 1.75, - "learning_rate": 7.795760537197059e-07, - "loss": 0.6636, - "step": 68312 - }, - { - "epoch": 1.75, - "learning_rate": 7.795490639281325e-07, - "loss": 0.4402, - "step": 68313 - }, - { - "epoch": 1.75, - "learning_rate": 7.795220743053481e-07, - "loss": 0.7646, - "step": 68314 - }, - { - "epoch": 1.75, - "learning_rate": 7.794950848513737e-07, - "loss": 0.6086, - "step": 68315 - }, - { - "epoch": 1.75, - "learning_rate": 7.794680955662295e-07, - "loss": 0.6392, - "step": 68316 - }, - { - "epoch": 1.75, - "learning_rate": 7.794411064499366e-07, - "loss": 0.5845, - "step": 68317 - }, - { - "epoch": 1.75, - "learning_rate": 7.794141175025159e-07, - "loss": 0.7002, - "step": 68318 - }, - { - "epoch": 1.75, - "learning_rate": 7.793871287239871e-07, - "loss": 0.6851, - "step": 68319 - }, - { - "epoch": 1.75, - "learning_rate": 7.793601401143717e-07, - "loss": 0.5508, - "step": 68320 - }, - { - "epoch": 1.75, - "learning_rate": 7.793331516736899e-07, - "loss": 0.6938, - "step": 68321 - }, - { - "epoch": 1.75, - "learning_rate": 7.793061634019628e-07, - "loss": 0.7471, - "step": 68322 - }, - { - "epoch": 1.75, - "learning_rate": 7.792791752992105e-07, - "loss": 0.6738, - "step": 68323 - }, - { - "epoch": 1.75, - "learning_rate": 7.792521873654543e-07, - "loss": 0.6689, - "step": 68324 - }, - { - "epoch": 1.75, - "learning_rate": 7.792251996007142e-07, - "loss": 0.6855, - "step": 68325 - }, - { - "epoch": 1.75, - "learning_rate": 7.791982120050115e-07, - "loss": 0.5479, - "step": 68326 - }, - { - "epoch": 1.75, - "learning_rate": 7.791712245783664e-07, - "loss": 0.5898, - "step": 68327 - }, - { - "epoch": 1.75, - "learning_rate": 7.791442373208001e-07, - "loss": 0.6953, - "step": 68328 - }, - { - "epoch": 1.75, - "learning_rate": 7.791172502323329e-07, - "loss": 0.5791, - "step": 68329 - }, - { - "epoch": 1.75, - "learning_rate": 7.790902633129853e-07, - "loss": 0.5342, - "step": 68330 - }, - { - "epoch": 1.75, - "learning_rate": 7.790632765627779e-07, - "loss": 0.7295, - "step": 68331 - }, - { - "epoch": 1.75, - "learning_rate": 7.790362899817317e-07, - "loss": 0.7012, - "step": 68332 - }, - { - "epoch": 1.75, - "learning_rate": 7.790093035698672e-07, - "loss": 0.5608, - "step": 68333 - }, - { - "epoch": 1.75, - "learning_rate": 7.789823173272053e-07, - "loss": 0.6606, - "step": 68334 - }, - { - "epoch": 1.75, - "learning_rate": 7.789553312537662e-07, - "loss": 0.4453, - "step": 68335 - }, - { - "epoch": 1.75, - "learning_rate": 7.789283453495712e-07, - "loss": 0.5164, - "step": 68336 - }, - { - "epoch": 1.75, - "learning_rate": 7.789013596146402e-07, - "loss": 0.6108, - "step": 68337 - }, - { - "epoch": 1.75, - "learning_rate": 7.788743740489948e-07, - "loss": 0.5283, - "step": 68338 - }, - { - "epoch": 1.75, - "learning_rate": 7.788473886526549e-07, - "loss": 0.6841, - "step": 68339 - }, - { - "epoch": 1.75, - "learning_rate": 7.788204034256411e-07, - "loss": 0.6611, - "step": 68340 - }, - { - "epoch": 1.75, - "learning_rate": 7.787934183679746e-07, - "loss": 0.6162, - "step": 68341 - }, - { - "epoch": 1.75, - "learning_rate": 7.787664334796757e-07, - "loss": 0.5381, - "step": 68342 - }, - { - "epoch": 1.75, - "learning_rate": 7.787394487607653e-07, - "loss": 0.4832, - "step": 68343 - }, - { - "epoch": 1.75, - "learning_rate": 7.787124642112637e-07, - "loss": 0.6152, - "step": 68344 - }, - { - "epoch": 1.75, - "learning_rate": 7.786854798311921e-07, - "loss": 0.7998, - "step": 68345 - }, - { - "epoch": 1.75, - "learning_rate": 7.786584956205704e-07, - "loss": 0.4814, - "step": 68346 - }, - { - "epoch": 1.75, - "learning_rate": 7.786315115794202e-07, - "loss": 0.6318, - "step": 68347 - }, - { - "epoch": 1.75, - "learning_rate": 7.786045277077617e-07, - "loss": 0.6514, - "step": 68348 - }, - { - "epoch": 1.75, - "learning_rate": 7.785775440056154e-07, - "loss": 0.5554, - "step": 68349 - }, - { - "epoch": 1.75, - "learning_rate": 7.785505604730018e-07, - "loss": 0.6201, - "step": 68350 - }, - { - "epoch": 1.75, - "learning_rate": 7.785235771099422e-07, - "loss": 0.4951, - "step": 68351 - }, - { - "epoch": 1.75, - "learning_rate": 7.784965939164566e-07, - "loss": 0.6858, - "step": 68352 - }, - { - "epoch": 1.75, - "learning_rate": 7.784696108925663e-07, - "loss": 0.6284, - "step": 68353 - }, - { - "epoch": 1.75, - "learning_rate": 7.784426280382913e-07, - "loss": 0.6982, - "step": 68354 - }, - { - "epoch": 1.75, - "learning_rate": 7.784156453536528e-07, - "loss": 0.5186, - "step": 68355 - }, - { - "epoch": 1.75, - "learning_rate": 7.783886628386711e-07, - "loss": 0.4883, - "step": 68356 - }, - { - "epoch": 1.75, - "learning_rate": 7.783616804933673e-07, - "loss": 0.6211, - "step": 68357 - }, - { - "epoch": 1.75, - "learning_rate": 7.783346983177619e-07, - "loss": 0.5693, - "step": 68358 - }, - { - "epoch": 1.75, - "learning_rate": 7.78307716311875e-07, - "loss": 0.7383, - "step": 68359 - }, - { - "epoch": 1.75, - "learning_rate": 7.782807344757278e-07, - "loss": 0.8438, - "step": 68360 - }, - { - "epoch": 1.75, - "learning_rate": 7.782537528093407e-07, - "loss": 0.5786, - "step": 68361 - }, - { - "epoch": 1.75, - "learning_rate": 7.782267713127349e-07, - "loss": 0.6323, - "step": 68362 - }, - { - "epoch": 1.75, - "learning_rate": 7.781997899859301e-07, - "loss": 0.5576, - "step": 68363 - }, - { - "epoch": 1.75, - "learning_rate": 7.781728088289481e-07, - "loss": 0.6763, - "step": 68364 - }, - { - "epoch": 1.75, - "learning_rate": 7.781458278418085e-07, - "loss": 0.8428, - "step": 68365 - }, - { - "epoch": 1.75, - "learning_rate": 7.781188470245328e-07, - "loss": 0.541, - "step": 68366 - }, - { - "epoch": 1.75, - "learning_rate": 7.780918663771409e-07, - "loss": 0.6938, - "step": 68367 - }, - { - "epoch": 1.75, - "learning_rate": 7.780648858996548e-07, - "loss": 0.5234, - "step": 68368 - }, - { - "epoch": 1.75, - "learning_rate": 7.780379055920934e-07, - "loss": 0.6323, - "step": 68369 - }, - { - "epoch": 1.75, - "learning_rate": 7.780109254544783e-07, - "loss": 0.52, - "step": 68370 - }, - { - "epoch": 1.75, - "learning_rate": 7.7798394548683e-07, - "loss": 0.8574, - "step": 68371 - }, - { - "epoch": 1.75, - "learning_rate": 7.779569656891693e-07, - "loss": 0.792, - "step": 68372 - }, - { - "epoch": 1.75, - "learning_rate": 7.779299860615165e-07, - "loss": 0.6543, - "step": 68373 - }, - { - "epoch": 1.75, - "learning_rate": 7.779030066038928e-07, - "loss": 0.7212, - "step": 68374 - }, - { - "epoch": 1.75, - "learning_rate": 7.778760273163182e-07, - "loss": 0.8467, - "step": 68375 - }, - { - "epoch": 1.75, - "learning_rate": 7.77849048198814e-07, - "loss": 0.6455, - "step": 68376 - }, - { - "epoch": 1.75, - "learning_rate": 7.778220692514003e-07, - "loss": 0.7656, - "step": 68377 - }, - { - "epoch": 1.75, - "learning_rate": 7.777950904740985e-07, - "loss": 0.6016, - "step": 68378 - }, - { - "epoch": 1.75, - "learning_rate": 7.777681118669286e-07, - "loss": 0.6846, - "step": 68379 - }, - { - "epoch": 1.75, - "learning_rate": 7.777411334299113e-07, - "loss": 0.6768, - "step": 68380 - }, - { - "epoch": 1.75, - "learning_rate": 7.777141551630675e-07, - "loss": 0.7412, - "step": 68381 - }, - { - "epoch": 1.75, - "learning_rate": 7.776871770664175e-07, - "loss": 0.7158, - "step": 68382 - }, - { - "epoch": 1.75, - "learning_rate": 7.776601991399825e-07, - "loss": 0.665, - "step": 68383 - }, - { - "epoch": 1.75, - "learning_rate": 7.776332213837826e-07, - "loss": 0.6797, - "step": 68384 - }, - { - "epoch": 1.75, - "learning_rate": 7.776062437978389e-07, - "loss": 0.6904, - "step": 68385 - }, - { - "epoch": 1.75, - "learning_rate": 7.77579266382172e-07, - "loss": 0.6182, - "step": 68386 - }, - { - "epoch": 1.75, - "learning_rate": 7.775522891368021e-07, - "loss": 0.6357, - "step": 68387 - }, - { - "epoch": 1.75, - "learning_rate": 7.775253120617506e-07, - "loss": 0.5457, - "step": 68388 - }, - { - "epoch": 1.75, - "learning_rate": 7.774983351570376e-07, - "loss": 0.6377, - "step": 68389 - }, - { - "epoch": 1.75, - "learning_rate": 7.774713584226838e-07, - "loss": 0.709, - "step": 68390 - }, - { - "epoch": 1.75, - "learning_rate": 7.774443818587098e-07, - "loss": 0.7764, - "step": 68391 - }, - { - "epoch": 1.75, - "learning_rate": 7.774174054651366e-07, - "loss": 0.7256, - "step": 68392 - }, - { - "epoch": 1.75, - "learning_rate": 7.773904292419846e-07, - "loss": 0.5327, - "step": 68393 - }, - { - "epoch": 1.75, - "learning_rate": 7.773634531892743e-07, - "loss": 0.4839, - "step": 68394 - }, - { - "epoch": 1.75, - "learning_rate": 7.773364773070269e-07, - "loss": 0.5215, - "step": 68395 - }, - { - "epoch": 1.75, - "learning_rate": 7.773095015952625e-07, - "loss": 0.7676, - "step": 68396 - }, - { - "epoch": 1.75, - "learning_rate": 7.772825260540021e-07, - "loss": 0.4886, - "step": 68397 - }, - { - "epoch": 1.75, - "learning_rate": 7.772555506832665e-07, - "loss": 0.5508, - "step": 68398 - }, - { - "epoch": 1.75, - "learning_rate": 7.772285754830756e-07, - "loss": 0.7354, - "step": 68399 - }, - { - "epoch": 1.75, - "learning_rate": 7.77201600453451e-07, - "loss": 0.4409, - "step": 68400 - }, - { - "epoch": 1.75, - "learning_rate": 7.771746255944124e-07, - "loss": 0.5747, - "step": 68401 - }, - { - "epoch": 1.75, - "learning_rate": 7.771476509059812e-07, - "loss": 0.4113, - "step": 68402 - }, - { - "epoch": 1.75, - "learning_rate": 7.771206763881779e-07, - "loss": 0.5767, - "step": 68403 - }, - { - "epoch": 1.75, - "learning_rate": 7.770937020410226e-07, - "loss": 0.5342, - "step": 68404 - }, - { - "epoch": 1.75, - "learning_rate": 7.770667278645368e-07, - "loss": 0.6182, - "step": 68405 - }, - { - "epoch": 1.75, - "learning_rate": 7.770397538587407e-07, - "loss": 0.6143, - "step": 68406 - }, - { - "epoch": 1.75, - "learning_rate": 7.77012780023655e-07, - "loss": 0.4905, - "step": 68407 - }, - { - "epoch": 1.75, - "learning_rate": 7.769858063593007e-07, - "loss": 0.5015, - "step": 68408 - }, - { - "epoch": 1.75, - "learning_rate": 7.769588328656975e-07, - "loss": 0.7246, - "step": 68409 - }, - { - "epoch": 1.75, - "learning_rate": 7.76931859542867e-07, - "loss": 0.6299, - "step": 68410 - }, - { - "epoch": 1.75, - "learning_rate": 7.769048863908293e-07, - "loss": 0.5203, - "step": 68411 - }, - { - "epoch": 1.75, - "learning_rate": 7.768779134096055e-07, - "loss": 0.6934, - "step": 68412 - }, - { - "epoch": 1.75, - "learning_rate": 7.768509405992157e-07, - "loss": 0.6216, - "step": 68413 - }, - { - "epoch": 1.75, - "learning_rate": 7.768239679596812e-07, - "loss": 0.6433, - "step": 68414 - }, - { - "epoch": 1.75, - "learning_rate": 7.767969954910221e-07, - "loss": 0.6426, - "step": 68415 - }, - { - "epoch": 1.75, - "learning_rate": 7.767700231932595e-07, - "loss": 0.6133, - "step": 68416 - }, - { - "epoch": 1.75, - "learning_rate": 7.767430510664135e-07, - "loss": 0.4834, - "step": 68417 - }, - { - "epoch": 1.75, - "learning_rate": 7.767160791105056e-07, - "loss": 0.52, - "step": 68418 - }, - { - "epoch": 1.75, - "learning_rate": 7.766891073255558e-07, - "loss": 0.5486, - "step": 68419 - }, - { - "epoch": 1.75, - "learning_rate": 7.766621357115847e-07, - "loss": 0.6865, - "step": 68420 - }, - { - "epoch": 1.75, - "learning_rate": 7.766351642686131e-07, - "loss": 0.6743, - "step": 68421 - }, - { - "epoch": 1.75, - "learning_rate": 7.766081929966619e-07, - "loss": 0.5977, - "step": 68422 - }, - { - "epoch": 1.75, - "learning_rate": 7.765812218957513e-07, - "loss": 0.6167, - "step": 68423 - }, - { - "epoch": 1.75, - "learning_rate": 7.765542509659022e-07, - "loss": 0.5986, - "step": 68424 - }, - { - "epoch": 1.75, - "learning_rate": 7.765272802071352e-07, - "loss": 0.7686, - "step": 68425 - }, - { - "epoch": 1.75, - "learning_rate": 7.765003096194711e-07, - "loss": 0.3273, - "step": 68426 - }, - { - "epoch": 1.75, - "learning_rate": 7.764733392029303e-07, - "loss": 0.5986, - "step": 68427 - }, - { - "epoch": 1.75, - "learning_rate": 7.764463689575341e-07, - "loss": 0.5876, - "step": 68428 - }, - { - "epoch": 1.75, - "learning_rate": 7.764193988833022e-07, - "loss": 0.5791, - "step": 68429 - }, - { - "epoch": 1.75, - "learning_rate": 7.763924289802557e-07, - "loss": 0.5312, - "step": 68430 - }, - { - "epoch": 1.75, - "learning_rate": 7.763654592484152e-07, - "loss": 0.562, - "step": 68431 - }, - { - "epoch": 1.75, - "learning_rate": 7.763384896878014e-07, - "loss": 0.6992, - "step": 68432 - }, - { - "epoch": 1.75, - "learning_rate": 7.763115202984351e-07, - "loss": 0.5603, - "step": 68433 - }, - { - "epoch": 1.75, - "learning_rate": 7.762845510803364e-07, - "loss": 0.6426, - "step": 68434 - }, - { - "epoch": 1.75, - "learning_rate": 7.762575820335268e-07, - "loss": 0.4414, - "step": 68435 - }, - { - "epoch": 1.75, - "learning_rate": 7.76230613158026e-07, - "loss": 0.5571, - "step": 68436 - }, - { - "epoch": 1.75, - "learning_rate": 7.762036444538556e-07, - "loss": 0.6206, - "step": 68437 - }, - { - "epoch": 1.75, - "learning_rate": 7.761766759210358e-07, - "loss": 0.6001, - "step": 68438 - }, - { - "epoch": 1.75, - "learning_rate": 7.761497075595872e-07, - "loss": 0.6289, - "step": 68439 - }, - { - "epoch": 1.75, - "learning_rate": 7.761227393695301e-07, - "loss": 0.6924, - "step": 68440 - }, - { - "epoch": 1.75, - "learning_rate": 7.760957713508858e-07, - "loss": 0.7832, - "step": 68441 - }, - { - "epoch": 1.75, - "learning_rate": 7.760688035036745e-07, - "loss": 0.6013, - "step": 68442 - }, - { - "epoch": 1.75, - "learning_rate": 7.760418358279172e-07, - "loss": 0.6182, - "step": 68443 - }, - { - "epoch": 1.75, - "learning_rate": 7.76014868323634e-07, - "loss": 0.6772, - "step": 68444 - }, - { - "epoch": 1.75, - "learning_rate": 7.759879009908463e-07, - "loss": 0.5093, - "step": 68445 - }, - { - "epoch": 1.75, - "learning_rate": 7.759609338295741e-07, - "loss": 0.625, - "step": 68446 - }, - { - "epoch": 1.75, - "learning_rate": 7.759339668398386e-07, - "loss": 0.7437, - "step": 68447 - }, - { - "epoch": 1.75, - "learning_rate": 7.759070000216604e-07, - "loss": 0.5723, - "step": 68448 - }, - { - "epoch": 1.75, - "learning_rate": 7.758800333750594e-07, - "loss": 0.6255, - "step": 68449 - }, - { - "epoch": 1.75, - "learning_rate": 7.75853066900057e-07, - "loss": 0.5967, - "step": 68450 - }, - { - "epoch": 1.75, - "learning_rate": 7.758261005966733e-07, - "loss": 0.7109, - "step": 68451 - }, - { - "epoch": 1.75, - "learning_rate": 7.757991344649295e-07, - "loss": 0.6597, - "step": 68452 - }, - { - "epoch": 1.75, - "learning_rate": 7.757721685048457e-07, - "loss": 0.5859, - "step": 68453 - }, - { - "epoch": 1.75, - "learning_rate": 7.757452027164431e-07, - "loss": 0.4956, - "step": 68454 - }, - { - "epoch": 1.75, - "learning_rate": 7.757182370997421e-07, - "loss": 0.6785, - "step": 68455 - }, - { - "epoch": 1.75, - "learning_rate": 7.756912716547632e-07, - "loss": 0.522, - "step": 68456 - }, - { - "epoch": 1.75, - "learning_rate": 7.756643063815272e-07, - "loss": 0.6562, - "step": 68457 - }, - { - "epoch": 1.75, - "learning_rate": 7.756373412800553e-07, - "loss": 0.4312, - "step": 68458 - }, - { - "epoch": 1.75, - "learning_rate": 7.75610376350367e-07, - "loss": 0.7158, - "step": 68459 - }, - { - "epoch": 1.75, - "learning_rate": 7.755834115924837e-07, - "loss": 0.7227, - "step": 68460 - }, - { - "epoch": 1.75, - "learning_rate": 7.755564470064255e-07, - "loss": 0.7871, - "step": 68461 - }, - { - "epoch": 1.75, - "learning_rate": 7.755294825922137e-07, - "loss": 0.8496, - "step": 68462 - }, - { - "epoch": 1.75, - "learning_rate": 7.755025183498685e-07, - "loss": 0.5986, - "step": 68463 - }, - { - "epoch": 1.75, - "learning_rate": 7.754755542794109e-07, - "loss": 0.6572, - "step": 68464 - }, - { - "epoch": 1.75, - "learning_rate": 7.75448590380861e-07, - "loss": 0.4089, - "step": 68465 - }, - { - "epoch": 1.75, - "learning_rate": 7.754216266542401e-07, - "loss": 0.6069, - "step": 68466 - }, - { - "epoch": 1.75, - "learning_rate": 7.753946630995684e-07, - "loss": 0.5342, - "step": 68467 - }, - { - "epoch": 1.75, - "learning_rate": 7.753676997168671e-07, - "loss": 0.6133, - "step": 68468 - }, - { - "epoch": 1.75, - "learning_rate": 7.753407365061562e-07, - "loss": 0.7705, - "step": 68469 - }, - { - "epoch": 1.75, - "learning_rate": 7.753137734674563e-07, - "loss": 0.4678, - "step": 68470 - }, - { - "epoch": 1.75, - "learning_rate": 7.752868106007885e-07, - "loss": 0.7144, - "step": 68471 - }, - { - "epoch": 1.75, - "learning_rate": 7.75259847906173e-07, - "loss": 0.5518, - "step": 68472 - }, - { - "epoch": 1.75, - "learning_rate": 7.75232885383631e-07, - "loss": 0.6426, - "step": 68473 - }, - { - "epoch": 1.76, - "learning_rate": 7.752059230331826e-07, - "loss": 0.8447, - "step": 68474 - }, - { - "epoch": 1.76, - "learning_rate": 7.75178960854849e-07, - "loss": 0.533, - "step": 68475 - }, - { - "epoch": 1.76, - "learning_rate": 7.751519988486504e-07, - "loss": 0.5693, - "step": 68476 - }, - { - "epoch": 1.76, - "learning_rate": 7.751250370146074e-07, - "loss": 0.5815, - "step": 68477 - }, - { - "epoch": 1.76, - "learning_rate": 7.750980753527413e-07, - "loss": 0.6733, - "step": 68478 - }, - { - "epoch": 1.76, - "learning_rate": 7.750711138630721e-07, - "loss": 0.5713, - "step": 68479 - }, - { - "epoch": 1.76, - "learning_rate": 7.750441525456203e-07, - "loss": 0.8271, - "step": 68480 - }, - { - "epoch": 1.76, - "learning_rate": 7.75017191400407e-07, - "loss": 0.6704, - "step": 68481 - }, - { - "epoch": 1.76, - "learning_rate": 7.749902304274526e-07, - "loss": 0.5469, - "step": 68482 - }, - { - "epoch": 1.76, - "learning_rate": 7.74963269626778e-07, - "loss": 0.6138, - "step": 68483 - }, - { - "epoch": 1.76, - "learning_rate": 7.749363089984033e-07, - "loss": 0.5859, - "step": 68484 - }, - { - "epoch": 1.76, - "learning_rate": 7.7490934854235e-07, - "loss": 0.5728, - "step": 68485 - }, - { - "epoch": 1.76, - "learning_rate": 7.74882388258638e-07, - "loss": 0.5774, - "step": 68486 - }, - { - "epoch": 1.76, - "learning_rate": 7.748554281472883e-07, - "loss": 0.6318, - "step": 68487 - }, - { - "epoch": 1.76, - "learning_rate": 7.748284682083217e-07, - "loss": 0.7554, - "step": 68488 - }, - { - "epoch": 1.76, - "learning_rate": 7.748015084417582e-07, - "loss": 0.7266, - "step": 68489 - }, - { - "epoch": 1.76, - "learning_rate": 7.74774548847619e-07, - "loss": 0.6758, - "step": 68490 - }, - { - "epoch": 1.76, - "learning_rate": 7.747475894259243e-07, - "loss": 0.6328, - "step": 68491 - }, - { - "epoch": 1.76, - "learning_rate": 7.747206301766955e-07, - "loss": 0.4814, - "step": 68492 - }, - { - "epoch": 1.76, - "learning_rate": 7.746936710999524e-07, - "loss": 0.5305, - "step": 68493 - }, - { - "epoch": 1.76, - "learning_rate": 7.74666712195716e-07, - "loss": 0.5405, - "step": 68494 - }, - { - "epoch": 1.76, - "learning_rate": 7.746397534640071e-07, - "loss": 0.6377, - "step": 68495 - }, - { - "epoch": 1.76, - "learning_rate": 7.74612794904846e-07, - "loss": 0.5796, - "step": 68496 - }, - { - "epoch": 1.76, - "learning_rate": 7.745858365182535e-07, - "loss": 0.6104, - "step": 68497 - }, - { - "epoch": 1.76, - "learning_rate": 7.745588783042508e-07, - "loss": 0.5522, - "step": 68498 - }, - { - "epoch": 1.76, - "learning_rate": 7.745319202628574e-07, - "loss": 0.6934, - "step": 68499 - }, - { - "epoch": 1.76, - "learning_rate": 7.745049623940948e-07, - "loss": 0.626, - "step": 68500 - }, - { - "epoch": 1.76, - "learning_rate": 7.744780046979832e-07, - "loss": 0.6519, - "step": 68501 - }, - { - "epoch": 1.76, - "learning_rate": 7.744510471745436e-07, - "loss": 0.5952, - "step": 68502 - }, - { - "epoch": 1.76, - "learning_rate": 7.744240898237963e-07, - "loss": 0.7129, - "step": 68503 - }, - { - "epoch": 1.76, - "learning_rate": 7.743971326457622e-07, - "loss": 0.6621, - "step": 68504 - }, - { - "epoch": 1.76, - "learning_rate": 7.743701756404617e-07, - "loss": 0.5605, - "step": 68505 - }, - { - "epoch": 1.76, - "learning_rate": 7.743432188079157e-07, - "loss": 0.5171, - "step": 68506 - }, - { - "epoch": 1.76, - "learning_rate": 7.743162621481447e-07, - "loss": 0.6543, - "step": 68507 - }, - { - "epoch": 1.76, - "learning_rate": 7.742893056611697e-07, - "loss": 0.5278, - "step": 68508 - }, - { - "epoch": 1.76, - "learning_rate": 7.742623493470107e-07, - "loss": 0.5859, - "step": 68509 - }, - { - "epoch": 1.76, - "learning_rate": 7.742353932056885e-07, - "loss": 0.4253, - "step": 68510 - }, - { - "epoch": 1.76, - "learning_rate": 7.742084372372241e-07, - "loss": 0.7432, - "step": 68511 - }, - { - "epoch": 1.76, - "learning_rate": 7.741814814416379e-07, - "loss": 0.4819, - "step": 68512 - }, - { - "epoch": 1.76, - "learning_rate": 7.741545258189503e-07, - "loss": 0.6035, - "step": 68513 - }, - { - "epoch": 1.76, - "learning_rate": 7.741275703691826e-07, - "loss": 0.4594, - "step": 68514 - }, - { - "epoch": 1.76, - "learning_rate": 7.741006150923546e-07, - "loss": 0.6592, - "step": 68515 - }, - { - "epoch": 1.76, - "learning_rate": 7.740736599884876e-07, - "loss": 0.6475, - "step": 68516 - }, - { - "epoch": 1.76, - "learning_rate": 7.740467050576019e-07, - "loss": 0.7832, - "step": 68517 - }, - { - "epoch": 1.76, - "learning_rate": 7.740197502997186e-07, - "loss": 0.6426, - "step": 68518 - }, - { - "epoch": 1.76, - "learning_rate": 7.739927957148577e-07, - "loss": 0.6494, - "step": 68519 - }, - { - "epoch": 1.76, - "learning_rate": 7.739658413030401e-07, - "loss": 0.5435, - "step": 68520 - }, - { - "epoch": 1.76, - "learning_rate": 7.739388870642867e-07, - "loss": 0.6865, - "step": 68521 - }, - { - "epoch": 1.76, - "learning_rate": 7.739119329986174e-07, - "loss": 0.3762, - "step": 68522 - }, - { - "epoch": 1.76, - "learning_rate": 7.738849791060538e-07, - "loss": 0.458, - "step": 68523 - }, - { - "epoch": 1.76, - "learning_rate": 7.738580253866158e-07, - "loss": 0.7446, - "step": 68524 - }, - { - "epoch": 1.76, - "learning_rate": 7.738310718403245e-07, - "loss": 0.5679, - "step": 68525 - }, - { - "epoch": 1.76, - "learning_rate": 7.738041184672002e-07, - "loss": 0.6758, - "step": 68526 - }, - { - "epoch": 1.76, - "learning_rate": 7.737771652672637e-07, - "loss": 0.8613, - "step": 68527 - }, - { - "epoch": 1.76, - "learning_rate": 7.737502122405362e-07, - "loss": 0.6943, - "step": 68528 - }, - { - "epoch": 1.76, - "learning_rate": 7.737232593870372e-07, - "loss": 0.5479, - "step": 68529 - }, - { - "epoch": 1.76, - "learning_rate": 7.736963067067878e-07, - "loss": 0.4258, - "step": 68530 - }, - { - "epoch": 1.76, - "learning_rate": 7.736693541998089e-07, - "loss": 0.6787, - "step": 68531 - }, - { - "epoch": 1.76, - "learning_rate": 7.73642401866121e-07, - "loss": 0.6311, - "step": 68532 - }, - { - "epoch": 1.76, - "learning_rate": 7.736154497057447e-07, - "loss": 0.6299, - "step": 68533 - }, - { - "epoch": 1.76, - "learning_rate": 7.735884977187003e-07, - "loss": 0.5732, - "step": 68534 - }, - { - "epoch": 1.76, - "learning_rate": 7.735615459050092e-07, - "loss": 0.6084, - "step": 68535 - }, - { - "epoch": 1.76, - "learning_rate": 7.735345942646913e-07, - "loss": 0.6846, - "step": 68536 - }, - { - "epoch": 1.76, - "learning_rate": 7.735076427977679e-07, - "loss": 0.6455, - "step": 68537 - }, - { - "epoch": 1.76, - "learning_rate": 7.734806915042594e-07, - "loss": 0.627, - "step": 68538 - }, - { - "epoch": 1.76, - "learning_rate": 7.734537403841859e-07, - "loss": 0.6641, - "step": 68539 - }, - { - "epoch": 1.76, - "learning_rate": 7.734267894375687e-07, - "loss": 0.6553, - "step": 68540 - }, - { - "epoch": 1.76, - "learning_rate": 7.733998386644279e-07, - "loss": 0.5498, - "step": 68541 - }, - { - "epoch": 1.76, - "learning_rate": 7.733728880647848e-07, - "loss": 0.5483, - "step": 68542 - }, - { - "epoch": 1.76, - "learning_rate": 7.733459376386592e-07, - "loss": 0.6909, - "step": 68543 - }, - { - "epoch": 1.76, - "learning_rate": 7.733189873860726e-07, - "loss": 0.5625, - "step": 68544 - }, - { - "epoch": 1.76, - "learning_rate": 7.732920373070449e-07, - "loss": 0.6982, - "step": 68545 - }, - { - "epoch": 1.76, - "learning_rate": 7.732650874015973e-07, - "loss": 0.8184, - "step": 68546 - }, - { - "epoch": 1.76, - "learning_rate": 7.7323813766975e-07, - "loss": 0.7666, - "step": 68547 - }, - { - "epoch": 1.76, - "learning_rate": 7.732111881115245e-07, - "loss": 0.3745, - "step": 68548 - }, - { - "epoch": 1.76, - "learning_rate": 7.7318423872694e-07, - "loss": 0.4338, - "step": 68549 - }, - { - "epoch": 1.76, - "learning_rate": 7.731572895160183e-07, - "loss": 0.5056, - "step": 68550 - }, - { - "epoch": 1.76, - "learning_rate": 7.731303404787793e-07, - "loss": 0.5531, - "step": 68551 - }, - { - "epoch": 1.76, - "learning_rate": 7.731033916152443e-07, - "loss": 0.707, - "step": 68552 - }, - { - "epoch": 1.76, - "learning_rate": 7.730764429254333e-07, - "loss": 0.7012, - "step": 68553 - }, - { - "epoch": 1.76, - "learning_rate": 7.730494944093674e-07, - "loss": 0.6631, - "step": 68554 - }, - { - "epoch": 1.76, - "learning_rate": 7.73022546067067e-07, - "loss": 0.5859, - "step": 68555 - }, - { - "epoch": 1.76, - "learning_rate": 7.729955978985528e-07, - "loss": 0.6499, - "step": 68556 - }, - { - "epoch": 1.76, - "learning_rate": 7.729686499038454e-07, - "loss": 0.6406, - "step": 68557 - }, - { - "epoch": 1.76, - "learning_rate": 7.729417020829658e-07, - "loss": 0.6455, - "step": 68558 - }, - { - "epoch": 1.76, - "learning_rate": 7.729147544359341e-07, - "loss": 0.6377, - "step": 68559 - }, - { - "epoch": 1.76, - "learning_rate": 7.728878069627709e-07, - "loss": 0.6992, - "step": 68560 - }, - { - "epoch": 1.76, - "learning_rate": 7.728608596634974e-07, - "loss": 0.6191, - "step": 68561 - }, - { - "epoch": 1.76, - "learning_rate": 7.728339125381336e-07, - "loss": 0.7705, - "step": 68562 - }, - { - "epoch": 1.76, - "learning_rate": 7.728069655867005e-07, - "loss": 0.7715, - "step": 68563 - }, - { - "epoch": 1.76, - "learning_rate": 7.727800188092186e-07, - "loss": 0.4717, - "step": 68564 - }, - { - "epoch": 1.76, - "learning_rate": 7.727530722057087e-07, - "loss": 0.6255, - "step": 68565 - }, - { - "epoch": 1.76, - "learning_rate": 7.727261257761915e-07, - "loss": 0.6592, - "step": 68566 - }, - { - "epoch": 1.76, - "learning_rate": 7.726991795206877e-07, - "loss": 0.5859, - "step": 68567 - }, - { - "epoch": 1.76, - "learning_rate": 7.726722334392171e-07, - "loss": 0.7017, - "step": 68568 - }, - { - "epoch": 1.76, - "learning_rate": 7.72645287531801e-07, - "loss": 0.6543, - "step": 68569 - }, - { - "epoch": 1.76, - "learning_rate": 7.7261834179846e-07, - "loss": 0.3845, - "step": 68570 - }, - { - "epoch": 1.76, - "learning_rate": 7.725913962392148e-07, - "loss": 0.6401, - "step": 68571 - }, - { - "epoch": 1.76, - "learning_rate": 7.725644508540856e-07, - "loss": 0.6145, - "step": 68572 - }, - { - "epoch": 1.76, - "learning_rate": 7.725375056430937e-07, - "loss": 0.6357, - "step": 68573 - }, - { - "epoch": 1.76, - "learning_rate": 7.725105606062591e-07, - "loss": 0.4558, - "step": 68574 - }, - { - "epoch": 1.76, - "learning_rate": 7.72483615743603e-07, - "loss": 0.667, - "step": 68575 - }, - { - "epoch": 1.76, - "learning_rate": 7.724566710551453e-07, - "loss": 0.5669, - "step": 68576 - }, - { - "epoch": 1.76, - "learning_rate": 7.724297265409077e-07, - "loss": 0.7012, - "step": 68577 - }, - { - "epoch": 1.76, - "learning_rate": 7.724027822009099e-07, - "loss": 0.6074, - "step": 68578 - }, - { - "epoch": 1.76, - "learning_rate": 7.723758380351725e-07, - "loss": 0.6035, - "step": 68579 - }, - { - "epoch": 1.76, - "learning_rate": 7.72348894043717e-07, - "loss": 0.7583, - "step": 68580 - }, - { - "epoch": 1.76, - "learning_rate": 7.72321950226563e-07, - "loss": 0.6841, - "step": 68581 - }, - { - "epoch": 1.76, - "learning_rate": 7.722950065837319e-07, - "loss": 0.6516, - "step": 68582 - }, - { - "epoch": 1.76, - "learning_rate": 7.722680631152441e-07, - "loss": 0.5718, - "step": 68583 - }, - { - "epoch": 1.76, - "learning_rate": 7.722411198211198e-07, - "loss": 0.6387, - "step": 68584 - }, - { - "epoch": 1.76, - "learning_rate": 7.722141767013803e-07, - "loss": 0.5488, - "step": 68585 - }, - { - "epoch": 1.76, - "learning_rate": 7.721872337560458e-07, - "loss": 0.5635, - "step": 68586 - }, - { - "epoch": 1.76, - "learning_rate": 7.721602909851375e-07, - "loss": 0.4854, - "step": 68587 - }, - { - "epoch": 1.76, - "learning_rate": 7.721333483886752e-07, - "loss": 0.6875, - "step": 68588 - }, - { - "epoch": 1.76, - "learning_rate": 7.721064059666798e-07, - "loss": 0.583, - "step": 68589 - }, - { - "epoch": 1.76, - "learning_rate": 7.720794637191722e-07, - "loss": 0.5898, - "step": 68590 - }, - { - "epoch": 1.76, - "learning_rate": 7.720525216461728e-07, - "loss": 0.6729, - "step": 68591 - }, - { - "epoch": 1.76, - "learning_rate": 7.720255797477025e-07, - "loss": 0.6904, - "step": 68592 - }, - { - "epoch": 1.76, - "learning_rate": 7.719986380237813e-07, - "loss": 0.7798, - "step": 68593 - }, - { - "epoch": 1.76, - "learning_rate": 7.719716964744306e-07, - "loss": 0.7002, - "step": 68594 - }, - { - "epoch": 1.76, - "learning_rate": 7.719447550996705e-07, - "loss": 0.666, - "step": 68595 - }, - { - "epoch": 1.76, - "learning_rate": 7.71917813899522e-07, - "loss": 0.5898, - "step": 68596 - }, - { - "epoch": 1.76, - "learning_rate": 7.718908728740059e-07, - "loss": 0.6836, - "step": 68597 - }, - { - "epoch": 1.76, - "learning_rate": 7.718639320231419e-07, - "loss": 0.6758, - "step": 68598 - }, - { - "epoch": 1.76, - "learning_rate": 7.718369913469514e-07, - "loss": 0.7051, - "step": 68599 - }, - { - "epoch": 1.76, - "learning_rate": 7.718100508454546e-07, - "loss": 0.627, - "step": 68600 - }, - { - "epoch": 1.76, - "learning_rate": 7.717831105186726e-07, - "loss": 0.5747, - "step": 68601 - }, - { - "epoch": 1.76, - "learning_rate": 7.717561703666259e-07, - "loss": 0.7549, - "step": 68602 - }, - { - "epoch": 1.76, - "learning_rate": 7.717292303893346e-07, - "loss": 0.6143, - "step": 68603 - }, - { - "epoch": 1.76, - "learning_rate": 7.7170229058682e-07, - "loss": 0.6514, - "step": 68604 - }, - { - "epoch": 1.76, - "learning_rate": 7.716753509591023e-07, - "loss": 0.6816, - "step": 68605 - }, - { - "epoch": 1.76, - "learning_rate": 7.716484115062026e-07, - "loss": 0.5532, - "step": 68606 - }, - { - "epoch": 1.76, - "learning_rate": 7.716214722281412e-07, - "loss": 0.8662, - "step": 68607 - }, - { - "epoch": 1.76, - "learning_rate": 7.715945331249383e-07, - "loss": 0.6709, - "step": 68608 - }, - { - "epoch": 1.76, - "learning_rate": 7.715675941966153e-07, - "loss": 0.8389, - "step": 68609 - }, - { - "epoch": 1.76, - "learning_rate": 7.715406554431923e-07, - "loss": 0.6787, - "step": 68610 - }, - { - "epoch": 1.76, - "learning_rate": 7.715137168646903e-07, - "loss": 0.6777, - "step": 68611 - }, - { - "epoch": 1.76, - "learning_rate": 7.714867784611295e-07, - "loss": 0.582, - "step": 68612 - }, - { - "epoch": 1.76, - "learning_rate": 7.714598402325309e-07, - "loss": 0.7314, - "step": 68613 - }, - { - "epoch": 1.76, - "learning_rate": 7.71432902178915e-07, - "loss": 0.5732, - "step": 68614 - }, - { - "epoch": 1.76, - "learning_rate": 7.714059643003025e-07, - "loss": 0.6165, - "step": 68615 - }, - { - "epoch": 1.76, - "learning_rate": 7.713790265967137e-07, - "loss": 0.5608, - "step": 68616 - }, - { - "epoch": 1.76, - "learning_rate": 7.713520890681699e-07, - "loss": 0.4237, - "step": 68617 - }, - { - "epoch": 1.76, - "learning_rate": 7.713251517146911e-07, - "loss": 0.8184, - "step": 68618 - }, - { - "epoch": 1.76, - "learning_rate": 7.712982145362982e-07, - "loss": 0.6187, - "step": 68619 - }, - { - "epoch": 1.76, - "learning_rate": 7.712712775330115e-07, - "loss": 0.5562, - "step": 68620 - }, - { - "epoch": 1.76, - "learning_rate": 7.712443407048519e-07, - "loss": 0.4248, - "step": 68621 - }, - { - "epoch": 1.76, - "learning_rate": 7.7121740405184e-07, - "loss": 0.6973, - "step": 68622 - }, - { - "epoch": 1.76, - "learning_rate": 7.711904675739965e-07, - "loss": 0.6328, - "step": 68623 - }, - { - "epoch": 1.76, - "learning_rate": 7.711635312713417e-07, - "loss": 0.6836, - "step": 68624 - }, - { - "epoch": 1.76, - "learning_rate": 7.711365951438968e-07, - "loss": 0.6123, - "step": 68625 - }, - { - "epoch": 1.76, - "learning_rate": 7.711096591916818e-07, - "loss": 0.5569, - "step": 68626 - }, - { - "epoch": 1.76, - "learning_rate": 7.71082723414718e-07, - "loss": 0.6304, - "step": 68627 - }, - { - "epoch": 1.76, - "learning_rate": 7.710557878130255e-07, - "loss": 0.4595, - "step": 68628 - }, - { - "epoch": 1.76, - "learning_rate": 7.710288523866248e-07, - "loss": 0.7393, - "step": 68629 - }, - { - "epoch": 1.76, - "learning_rate": 7.71001917135537e-07, - "loss": 0.5415, - "step": 68630 - }, - { - "epoch": 1.76, - "learning_rate": 7.709749820597823e-07, - "loss": 0.5737, - "step": 68631 - }, - { - "epoch": 1.76, - "learning_rate": 7.709480471593817e-07, - "loss": 0.6445, - "step": 68632 - }, - { - "epoch": 1.76, - "learning_rate": 7.709211124343555e-07, - "loss": 0.7168, - "step": 68633 - }, - { - "epoch": 1.76, - "learning_rate": 7.708941778847246e-07, - "loss": 0.6992, - "step": 68634 - }, - { - "epoch": 1.76, - "learning_rate": 7.708672435105093e-07, - "loss": 0.5391, - "step": 68635 - }, - { - "epoch": 1.76, - "learning_rate": 7.708403093117306e-07, - "loss": 0.7168, - "step": 68636 - }, - { - "epoch": 1.76, - "learning_rate": 7.708133752884093e-07, - "loss": 0.7002, - "step": 68637 - }, - { - "epoch": 1.76, - "learning_rate": 7.707864414405654e-07, - "loss": 0.6138, - "step": 68638 - }, - { - "epoch": 1.76, - "learning_rate": 7.707595077682195e-07, - "loss": 0.7041, - "step": 68639 - }, - { - "epoch": 1.76, - "learning_rate": 7.707325742713926e-07, - "loss": 0.7373, - "step": 68640 - }, - { - "epoch": 1.76, - "learning_rate": 7.707056409501051e-07, - "loss": 0.6216, - "step": 68641 - }, - { - "epoch": 1.76, - "learning_rate": 7.706787078043782e-07, - "loss": 0.6035, - "step": 68642 - }, - { - "epoch": 1.76, - "learning_rate": 7.706517748342316e-07, - "loss": 0.9268, - "step": 68643 - }, - { - "epoch": 1.76, - "learning_rate": 7.706248420396866e-07, - "loss": 0.4668, - "step": 68644 - }, - { - "epoch": 1.76, - "learning_rate": 7.705979094207635e-07, - "loss": 0.6489, - "step": 68645 - }, - { - "epoch": 1.76, - "learning_rate": 7.705709769774832e-07, - "loss": 0.7021, - "step": 68646 - }, - { - "epoch": 1.76, - "learning_rate": 7.705440447098663e-07, - "loss": 0.7852, - "step": 68647 - }, - { - "epoch": 1.76, - "learning_rate": 7.705171126179331e-07, - "loss": 0.6924, - "step": 68648 - }, - { - "epoch": 1.76, - "learning_rate": 7.704901807017044e-07, - "loss": 0.6316, - "step": 68649 - }, - { - "epoch": 1.76, - "learning_rate": 7.704632489612007e-07, - "loss": 0.6279, - "step": 68650 - }, - { - "epoch": 1.76, - "learning_rate": 7.704363173964427e-07, - "loss": 0.6177, - "step": 68651 - }, - { - "epoch": 1.76, - "learning_rate": 7.704093860074511e-07, - "loss": 0.5581, - "step": 68652 - }, - { - "epoch": 1.76, - "learning_rate": 7.703824547942465e-07, - "loss": 0.6514, - "step": 68653 - }, - { - "epoch": 1.76, - "learning_rate": 7.703555237568495e-07, - "loss": 0.6787, - "step": 68654 - }, - { - "epoch": 1.76, - "learning_rate": 7.703285928952808e-07, - "loss": 0.7129, - "step": 68655 - }, - { - "epoch": 1.76, - "learning_rate": 7.703016622095611e-07, - "loss": 0.8242, - "step": 68656 - }, - { - "epoch": 1.76, - "learning_rate": 7.702747316997109e-07, - "loss": 0.7539, - "step": 68657 - }, - { - "epoch": 1.76, - "learning_rate": 7.702478013657503e-07, - "loss": 0.4314, - "step": 68658 - }, - { - "epoch": 1.76, - "learning_rate": 7.702208712077007e-07, - "loss": 0.5981, - "step": 68659 - }, - { - "epoch": 1.76, - "learning_rate": 7.701939412255822e-07, - "loss": 0.4202, - "step": 68660 - }, - { - "epoch": 1.76, - "learning_rate": 7.701670114194159e-07, - "loss": 0.7969, - "step": 68661 - }, - { - "epoch": 1.76, - "learning_rate": 7.701400817892219e-07, - "loss": 0.7686, - "step": 68662 - }, - { - "epoch": 1.76, - "learning_rate": 7.701131523350211e-07, - "loss": 0.5254, - "step": 68663 - }, - { - "epoch": 1.76, - "learning_rate": 7.700862230568342e-07, - "loss": 0.8223, - "step": 68664 - }, - { - "epoch": 1.76, - "learning_rate": 7.700592939546817e-07, - "loss": 0.5889, - "step": 68665 - }, - { - "epoch": 1.76, - "learning_rate": 7.70032365028584e-07, - "loss": 0.6211, - "step": 68666 - }, - { - "epoch": 1.76, - "learning_rate": 7.700054362785625e-07, - "loss": 0.512, - "step": 68667 - }, - { - "epoch": 1.76, - "learning_rate": 7.69978507704637e-07, - "loss": 0.6206, - "step": 68668 - }, - { - "epoch": 1.76, - "learning_rate": 7.699515793068281e-07, - "loss": 0.668, - "step": 68669 - }, - { - "epoch": 1.76, - "learning_rate": 7.699246510851571e-07, - "loss": 0.6992, - "step": 68670 - }, - { - "epoch": 1.76, - "learning_rate": 7.698977230396437e-07, - "loss": 0.6318, - "step": 68671 - }, - { - "epoch": 1.76, - "learning_rate": 7.698707951703095e-07, - "loss": 0.5571, - "step": 68672 - }, - { - "epoch": 1.76, - "learning_rate": 7.698438674771743e-07, - "loss": 0.6426, - "step": 68673 - }, - { - "epoch": 1.76, - "learning_rate": 7.698169399602593e-07, - "loss": 0.5186, - "step": 68674 - }, - { - "epoch": 1.76, - "learning_rate": 7.69790012619585e-07, - "loss": 0.5703, - "step": 68675 - }, - { - "epoch": 1.76, - "learning_rate": 7.697630854551715e-07, - "loss": 0.6733, - "step": 68676 - }, - { - "epoch": 1.76, - "learning_rate": 7.697361584670404e-07, - "loss": 0.8164, - "step": 68677 - }, - { - "epoch": 1.76, - "learning_rate": 7.697092316552115e-07, - "loss": 0.7031, - "step": 68678 - }, - { - "epoch": 1.76, - "learning_rate": 7.696823050197055e-07, - "loss": 0.7295, - "step": 68679 - }, - { - "epoch": 1.76, - "learning_rate": 7.696553785605432e-07, - "loss": 0.6992, - "step": 68680 - }, - { - "epoch": 1.76, - "learning_rate": 7.696284522777451e-07, - "loss": 0.6113, - "step": 68681 - }, - { - "epoch": 1.76, - "learning_rate": 7.69601526171332e-07, - "loss": 0.7471, - "step": 68682 - }, - { - "epoch": 1.76, - "learning_rate": 7.695746002413243e-07, - "loss": 0.6606, - "step": 68683 - }, - { - "epoch": 1.76, - "learning_rate": 7.695476744877429e-07, - "loss": 0.6953, - "step": 68684 - }, - { - "epoch": 1.76, - "learning_rate": 7.695207489106082e-07, - "loss": 0.6494, - "step": 68685 - }, - { - "epoch": 1.76, - "learning_rate": 7.694938235099409e-07, - "loss": 0.7119, - "step": 68686 - }, - { - "epoch": 1.76, - "learning_rate": 7.694668982857618e-07, - "loss": 0.4263, - "step": 68687 - }, - { - "epoch": 1.76, - "learning_rate": 7.69439973238091e-07, - "loss": 0.7529, - "step": 68688 - }, - { - "epoch": 1.76, - "learning_rate": 7.694130483669494e-07, - "loss": 0.5435, - "step": 68689 - }, - { - "epoch": 1.76, - "learning_rate": 7.693861236723575e-07, - "loss": 0.6357, - "step": 68690 - }, - { - "epoch": 1.76, - "learning_rate": 7.693591991543364e-07, - "loss": 0.7549, - "step": 68691 - }, - { - "epoch": 1.76, - "learning_rate": 7.693322748129063e-07, - "loss": 0.5151, - "step": 68692 - }, - { - "epoch": 1.76, - "learning_rate": 7.693053506480876e-07, - "loss": 0.6162, - "step": 68693 - }, - { - "epoch": 1.76, - "learning_rate": 7.692784266599014e-07, - "loss": 0.6187, - "step": 68694 - }, - { - "epoch": 1.76, - "learning_rate": 7.692515028483679e-07, - "loss": 0.4042, - "step": 68695 - }, - { - "epoch": 1.76, - "learning_rate": 7.692245792135081e-07, - "loss": 0.791, - "step": 68696 - }, - { - "epoch": 1.76, - "learning_rate": 7.691976557553426e-07, - "loss": 0.7119, - "step": 68697 - }, - { - "epoch": 1.76, - "learning_rate": 7.691707324738915e-07, - "loss": 0.8232, - "step": 68698 - }, - { - "epoch": 1.76, - "learning_rate": 7.69143809369176e-07, - "loss": 0.6064, - "step": 68699 - }, - { - "epoch": 1.76, - "learning_rate": 7.691168864412162e-07, - "loss": 0.4612, - "step": 68700 - }, - { - "epoch": 1.76, - "learning_rate": 7.690899636900333e-07, - "loss": 0.6689, - "step": 68701 - }, - { - "epoch": 1.76, - "learning_rate": 7.690630411156473e-07, - "loss": 0.5688, - "step": 68702 - }, - { - "epoch": 1.76, - "learning_rate": 7.690361187180792e-07, - "loss": 0.6357, - "step": 68703 - }, - { - "epoch": 1.76, - "learning_rate": 7.690091964973494e-07, - "loss": 0.582, - "step": 68704 - }, - { - "epoch": 1.76, - "learning_rate": 7.689822744534789e-07, - "loss": 0.5586, - "step": 68705 - }, - { - "epoch": 1.76, - "learning_rate": 7.689553525864878e-07, - "loss": 0.5869, - "step": 68706 - }, - { - "epoch": 1.76, - "learning_rate": 7.689284308963975e-07, - "loss": 0.9199, - "step": 68707 - }, - { - "epoch": 1.76, - "learning_rate": 7.689015093832277e-07, - "loss": 0.749, - "step": 68708 - }, - { - "epoch": 1.76, - "learning_rate": 7.688745880469994e-07, - "loss": 0.6611, - "step": 68709 - }, - { - "epoch": 1.76, - "learning_rate": 7.68847666887733e-07, - "loss": 0.7881, - "step": 68710 - }, - { - "epoch": 1.76, - "learning_rate": 7.688207459054497e-07, - "loss": 0.5322, - "step": 68711 - }, - { - "epoch": 1.76, - "learning_rate": 7.687938251001694e-07, - "loss": 0.6479, - "step": 68712 - }, - { - "epoch": 1.76, - "learning_rate": 7.687669044719131e-07, - "loss": 0.5002, - "step": 68713 - }, - { - "epoch": 1.76, - "learning_rate": 7.687399840207014e-07, - "loss": 0.4712, - "step": 68714 - }, - { - "epoch": 1.76, - "learning_rate": 7.687130637465548e-07, - "loss": 0.5239, - "step": 68715 - }, - { - "epoch": 1.76, - "learning_rate": 7.68686143649494e-07, - "loss": 0.8369, - "step": 68716 - }, - { - "epoch": 1.76, - "learning_rate": 7.686592237295399e-07, - "loss": 0.7666, - "step": 68717 - }, - { - "epoch": 1.76, - "learning_rate": 7.686323039867125e-07, - "loss": 0.7271, - "step": 68718 - }, - { - "epoch": 1.76, - "learning_rate": 7.686053844210326e-07, - "loss": 0.7056, - "step": 68719 - }, - { - "epoch": 1.76, - "learning_rate": 7.685784650325211e-07, - "loss": 0.4459, - "step": 68720 - }, - { - "epoch": 1.76, - "learning_rate": 7.685515458211983e-07, - "loss": 0.7568, - "step": 68721 - }, - { - "epoch": 1.76, - "learning_rate": 7.68524626787085e-07, - "loss": 0.6504, - "step": 68722 - }, - { - "epoch": 1.76, - "learning_rate": 7.684977079302016e-07, - "loss": 0.7383, - "step": 68723 - }, - { - "epoch": 1.76, - "learning_rate": 7.684707892505692e-07, - "loss": 0.6611, - "step": 68724 - }, - { - "epoch": 1.76, - "learning_rate": 7.684438707482077e-07, - "loss": 0.4934, - "step": 68725 - }, - { - "epoch": 1.76, - "learning_rate": 7.684169524231383e-07, - "loss": 0.6445, - "step": 68726 - }, - { - "epoch": 1.76, - "learning_rate": 7.683900342753817e-07, - "loss": 0.5857, - "step": 68727 - }, - { - "epoch": 1.76, - "learning_rate": 7.68363116304958e-07, - "loss": 0.5432, - "step": 68728 - }, - { - "epoch": 1.76, - "learning_rate": 7.683361985118877e-07, - "loss": 0.8389, - "step": 68729 - }, - { - "epoch": 1.76, - "learning_rate": 7.68309280896192e-07, - "loss": 0.5479, - "step": 68730 - }, - { - "epoch": 1.76, - "learning_rate": 7.682823634578909e-07, - "loss": 0.6372, - "step": 68731 - }, - { - "epoch": 1.76, - "learning_rate": 7.682554461970056e-07, - "loss": 0.6533, - "step": 68732 - }, - { - "epoch": 1.76, - "learning_rate": 7.682285291135563e-07, - "loss": 0.3787, - "step": 68733 - }, - { - "epoch": 1.76, - "learning_rate": 7.68201612207564e-07, - "loss": 0.6455, - "step": 68734 - }, - { - "epoch": 1.76, - "learning_rate": 7.681746954790487e-07, - "loss": 0.7402, - "step": 68735 - }, - { - "epoch": 1.76, - "learning_rate": 7.681477789280317e-07, - "loss": 0.5518, - "step": 68736 - }, - { - "epoch": 1.76, - "learning_rate": 7.681208625545335e-07, - "loss": 0.6465, - "step": 68737 - }, - { - "epoch": 1.76, - "learning_rate": 7.680939463585741e-07, - "loss": 0.7783, - "step": 68738 - }, - { - "epoch": 1.76, - "learning_rate": 7.680670303401746e-07, - "loss": 0.7734, - "step": 68739 - }, - { - "epoch": 1.76, - "learning_rate": 7.680401144993554e-07, - "loss": 0.7539, - "step": 68740 - }, - { - "epoch": 1.76, - "learning_rate": 7.680131988361374e-07, - "loss": 0.6924, - "step": 68741 - }, - { - "epoch": 1.76, - "learning_rate": 7.679862833505409e-07, - "loss": 0.54, - "step": 68742 - }, - { - "epoch": 1.76, - "learning_rate": 7.679593680425867e-07, - "loss": 0.6738, - "step": 68743 - }, - { - "epoch": 1.76, - "learning_rate": 7.679324529122951e-07, - "loss": 0.603, - "step": 68744 - }, - { - "epoch": 1.76, - "learning_rate": 7.679055379596872e-07, - "loss": 0.7527, - "step": 68745 - }, - { - "epoch": 1.76, - "learning_rate": 7.678786231847835e-07, - "loss": 0.7695, - "step": 68746 - }, - { - "epoch": 1.76, - "learning_rate": 7.678517085876045e-07, - "loss": 0.6165, - "step": 68747 - }, - { - "epoch": 1.76, - "learning_rate": 7.678247941681705e-07, - "loss": 0.6504, - "step": 68748 - }, - { - "epoch": 1.76, - "learning_rate": 7.677978799265024e-07, - "loss": 0.6748, - "step": 68749 - }, - { - "epoch": 1.76, - "learning_rate": 7.677709658626208e-07, - "loss": 0.6826, - "step": 68750 - }, - { - "epoch": 1.76, - "learning_rate": 7.677440519765464e-07, - "loss": 0.707, - "step": 68751 - }, - { - "epoch": 1.76, - "learning_rate": 7.677171382682995e-07, - "loss": 0.6851, - "step": 68752 - }, - { - "epoch": 1.76, - "learning_rate": 7.676902247379011e-07, - "loss": 0.7148, - "step": 68753 - }, - { - "epoch": 1.76, - "learning_rate": 7.676633113853715e-07, - "loss": 0.6592, - "step": 68754 - }, - { - "epoch": 1.76, - "learning_rate": 7.676363982107315e-07, - "loss": 0.7148, - "step": 68755 - }, - { - "epoch": 1.76, - "learning_rate": 7.676094852140014e-07, - "loss": 0.7158, - "step": 68756 - }, - { - "epoch": 1.76, - "learning_rate": 7.675825723952026e-07, - "loss": 0.5674, - "step": 68757 - }, - { - "epoch": 1.76, - "learning_rate": 7.675556597543548e-07, - "loss": 0.7266, - "step": 68758 - }, - { - "epoch": 1.76, - "learning_rate": 7.675287472914787e-07, - "loss": 0.6758, - "step": 68759 - }, - { - "epoch": 1.76, - "learning_rate": 7.675018350065954e-07, - "loss": 0.5114, - "step": 68760 - }, - { - "epoch": 1.76, - "learning_rate": 7.67474922899725e-07, - "loss": 0.6973, - "step": 68761 - }, - { - "epoch": 1.76, - "learning_rate": 7.674480109708887e-07, - "loss": 0.6914, - "step": 68762 - }, - { - "epoch": 1.76, - "learning_rate": 7.674210992201064e-07, - "loss": 0.5151, - "step": 68763 - }, - { - "epoch": 1.76, - "learning_rate": 7.673941876473995e-07, - "loss": 0.7041, - "step": 68764 - }, - { - "epoch": 1.76, - "learning_rate": 7.67367276252788e-07, - "loss": 0.7578, - "step": 68765 - }, - { - "epoch": 1.76, - "learning_rate": 7.673403650362927e-07, - "loss": 0.5702, - "step": 68766 - }, - { - "epoch": 1.76, - "learning_rate": 7.673134539979342e-07, - "loss": 0.6641, - "step": 68767 - }, - { - "epoch": 1.76, - "learning_rate": 7.672865431377332e-07, - "loss": 0.5894, - "step": 68768 - }, - { - "epoch": 1.76, - "learning_rate": 7.672596324557099e-07, - "loss": 0.7158, - "step": 68769 - }, - { - "epoch": 1.76, - "learning_rate": 7.672327219518854e-07, - "loss": 0.499, - "step": 68770 - }, - { - "epoch": 1.76, - "learning_rate": 7.672058116262798e-07, - "loss": 0.7295, - "step": 68771 - }, - { - "epoch": 1.76, - "learning_rate": 7.671789014789144e-07, - "loss": 0.4697, - "step": 68772 - }, - { - "epoch": 1.76, - "learning_rate": 7.671519915098091e-07, - "loss": 0.6445, - "step": 68773 - }, - { - "epoch": 1.76, - "learning_rate": 7.671250817189849e-07, - "loss": 0.6348, - "step": 68774 - }, - { - "epoch": 1.76, - "learning_rate": 7.670981721064624e-07, - "loss": 0.6279, - "step": 68775 - }, - { - "epoch": 1.76, - "learning_rate": 7.670712626722621e-07, - "loss": 0.5273, - "step": 68776 - }, - { - "epoch": 1.76, - "learning_rate": 7.670443534164049e-07, - "loss": 0.6636, - "step": 68777 - }, - { - "epoch": 1.76, - "learning_rate": 7.670174443389107e-07, - "loss": 0.5444, - "step": 68778 - }, - { - "epoch": 1.76, - "learning_rate": 7.669905354398008e-07, - "loss": 0.6143, - "step": 68779 - }, - { - "epoch": 1.76, - "learning_rate": 7.669636267190952e-07, - "loss": 0.6807, - "step": 68780 - }, - { - "epoch": 1.76, - "learning_rate": 7.669367181768152e-07, - "loss": 0.4927, - "step": 68781 - }, - { - "epoch": 1.76, - "learning_rate": 7.669098098129809e-07, - "loss": 0.6431, - "step": 68782 - }, - { - "epoch": 1.76, - "learning_rate": 7.668829016276128e-07, - "loss": 0.7749, - "step": 68783 - }, - { - "epoch": 1.76, - "learning_rate": 7.66855993620732e-07, - "loss": 0.4912, - "step": 68784 - }, - { - "epoch": 1.76, - "learning_rate": 7.668290857923587e-07, - "loss": 0.8145, - "step": 68785 - }, - { - "epoch": 1.76, - "learning_rate": 7.668021781425138e-07, - "loss": 0.5093, - "step": 68786 - }, - { - "epoch": 1.76, - "learning_rate": 7.66775270671218e-07, - "loss": 0.7275, - "step": 68787 - }, - { - "epoch": 1.76, - "learning_rate": 7.667483633784913e-07, - "loss": 0.5884, - "step": 68788 - }, - { - "epoch": 1.76, - "learning_rate": 7.667214562643547e-07, - "loss": 0.5278, - "step": 68789 - }, - { - "epoch": 1.76, - "learning_rate": 7.666945493288287e-07, - "loss": 0.8076, - "step": 68790 - }, - { - "epoch": 1.76, - "learning_rate": 7.666676425719341e-07, - "loss": 0.6621, - "step": 68791 - }, - { - "epoch": 1.76, - "learning_rate": 7.66640735993691e-07, - "loss": 0.6289, - "step": 68792 - }, - { - "epoch": 1.76, - "learning_rate": 7.666138295941208e-07, - "loss": 0.5774, - "step": 68793 - }, - { - "epoch": 1.76, - "learning_rate": 7.665869233732434e-07, - "loss": 0.7188, - "step": 68794 - }, - { - "epoch": 1.76, - "learning_rate": 7.665600173310798e-07, - "loss": 0.5205, - "step": 68795 - }, - { - "epoch": 1.76, - "learning_rate": 7.665331114676503e-07, - "loss": 0.3379, - "step": 68796 - }, - { - "epoch": 1.76, - "learning_rate": 7.665062057829761e-07, - "loss": 0.7168, - "step": 68797 - }, - { - "epoch": 1.76, - "learning_rate": 7.66479300277077e-07, - "loss": 0.6348, - "step": 68798 - }, - { - "epoch": 1.76, - "learning_rate": 7.664523949499741e-07, - "loss": 0.6387, - "step": 68799 - }, - { - "epoch": 1.76, - "learning_rate": 7.664254898016877e-07, - "loss": 0.6841, - "step": 68800 - }, - { - "epoch": 1.76, - "learning_rate": 7.663985848322386e-07, - "loss": 0.6719, - "step": 68801 - }, - { - "epoch": 1.76, - "learning_rate": 7.663716800416473e-07, - "loss": 0.6768, - "step": 68802 - }, - { - "epoch": 1.76, - "learning_rate": 7.663447754299346e-07, - "loss": 0.4719, - "step": 68803 - }, - { - "epoch": 1.76, - "learning_rate": 7.663178709971207e-07, - "loss": 0.5439, - "step": 68804 - }, - { - "epoch": 1.76, - "learning_rate": 7.662909667432268e-07, - "loss": 0.5427, - "step": 68805 - }, - { - "epoch": 1.76, - "learning_rate": 7.662640626682729e-07, - "loss": 0.4548, - "step": 68806 - }, - { - "epoch": 1.76, - "learning_rate": 7.662371587722804e-07, - "loss": 0.5173, - "step": 68807 - }, - { - "epoch": 1.76, - "learning_rate": 7.662102550552689e-07, - "loss": 0.6318, - "step": 68808 - }, - { - "epoch": 1.76, - "learning_rate": 7.661833515172594e-07, - "loss": 0.6211, - "step": 68809 - }, - { - "epoch": 1.76, - "learning_rate": 7.661564481582727e-07, - "loss": 0.6245, - "step": 68810 - }, - { - "epoch": 1.76, - "learning_rate": 7.661295449783292e-07, - "loss": 0.4683, - "step": 68811 - }, - { - "epoch": 1.76, - "learning_rate": 7.661026419774496e-07, - "loss": 0.6685, - "step": 68812 - }, - { - "epoch": 1.76, - "learning_rate": 7.660757391556543e-07, - "loss": 0.7129, - "step": 68813 - }, - { - "epoch": 1.76, - "learning_rate": 7.660488365129643e-07, - "loss": 0.5461, - "step": 68814 - }, - { - "epoch": 1.76, - "learning_rate": 7.660219340493996e-07, - "loss": 0.6455, - "step": 68815 - }, - { - "epoch": 1.76, - "learning_rate": 7.659950317649815e-07, - "loss": 0.7578, - "step": 68816 - }, - { - "epoch": 1.76, - "learning_rate": 7.659681296597303e-07, - "loss": 0.6782, - "step": 68817 - }, - { - "epoch": 1.76, - "learning_rate": 7.659412277336666e-07, - "loss": 0.6895, - "step": 68818 - }, - { - "epoch": 1.76, - "learning_rate": 7.659143259868104e-07, - "loss": 0.541, - "step": 68819 - }, - { - "epoch": 1.76, - "learning_rate": 7.658874244191833e-07, - "loss": 0.6299, - "step": 68820 - }, - { - "epoch": 1.76, - "learning_rate": 7.658605230308051e-07, - "loss": 0.832, - "step": 68821 - }, - { - "epoch": 1.76, - "learning_rate": 7.65833621821697e-07, - "loss": 0.8594, - "step": 68822 - }, - { - "epoch": 1.76, - "learning_rate": 7.65806720791879e-07, - "loss": 0.6064, - "step": 68823 - }, - { - "epoch": 1.76, - "learning_rate": 7.657798199413724e-07, - "loss": 0.6528, - "step": 68824 - }, - { - "epoch": 1.76, - "learning_rate": 7.657529192701971e-07, - "loss": 0.5586, - "step": 68825 - }, - { - "epoch": 1.76, - "learning_rate": 7.657260187783743e-07, - "loss": 0.6221, - "step": 68826 - }, - { - "epoch": 1.76, - "learning_rate": 7.656991184659245e-07, - "loss": 0.6465, - "step": 68827 - }, - { - "epoch": 1.76, - "learning_rate": 7.656722183328677e-07, - "loss": 0.4785, - "step": 68828 - }, - { - "epoch": 1.76, - "learning_rate": 7.656453183792251e-07, - "loss": 0.6245, - "step": 68829 - }, - { - "epoch": 1.76, - "learning_rate": 7.656184186050168e-07, - "loss": 0.7324, - "step": 68830 - }, - { - "epoch": 1.76, - "learning_rate": 7.655915190102641e-07, - "loss": 0.6499, - "step": 68831 - }, - { - "epoch": 1.76, - "learning_rate": 7.655646195949869e-07, - "loss": 0.6582, - "step": 68832 - }, - { - "epoch": 1.76, - "learning_rate": 7.655377203592063e-07, - "loss": 0.6074, - "step": 68833 - }, - { - "epoch": 1.76, - "learning_rate": 7.655108213029424e-07, - "loss": 0.585, - "step": 68834 - }, - { - "epoch": 1.76, - "learning_rate": 7.654839224262164e-07, - "loss": 0.5488, - "step": 68835 - }, - { - "epoch": 1.76, - "learning_rate": 7.654570237290483e-07, - "loss": 0.5938, - "step": 68836 - }, - { - "epoch": 1.76, - "learning_rate": 7.654301252114597e-07, - "loss": 0.7793, - "step": 68837 - }, - { - "epoch": 1.76, - "learning_rate": 7.654032268734697e-07, - "loss": 0.5283, - "step": 68838 - }, - { - "epoch": 1.76, - "learning_rate": 7.653763287151e-07, - "loss": 0.5774, - "step": 68839 - }, - { - "epoch": 1.76, - "learning_rate": 7.653494307363706e-07, - "loss": 0.7344, - "step": 68840 - }, - { - "epoch": 1.76, - "learning_rate": 7.653225329373025e-07, - "loss": 0.6748, - "step": 68841 - }, - { - "epoch": 1.76, - "learning_rate": 7.65295635317916e-07, - "loss": 0.5664, - "step": 68842 - }, - { - "epoch": 1.76, - "learning_rate": 7.652687378782321e-07, - "loss": 0.542, - "step": 68843 - }, - { - "epoch": 1.76, - "learning_rate": 7.652418406182708e-07, - "loss": 0.7061, - "step": 68844 - }, - { - "epoch": 1.76, - "learning_rate": 7.652149435380533e-07, - "loss": 0.5107, - "step": 68845 - }, - { - "epoch": 1.76, - "learning_rate": 7.651880466375998e-07, - "loss": 0.4658, - "step": 68846 - }, - { - "epoch": 1.76, - "learning_rate": 7.651611499169313e-07, - "loss": 0.5398, - "step": 68847 - }, - { - "epoch": 1.76, - "learning_rate": 7.651342533760679e-07, - "loss": 0.6709, - "step": 68848 - }, - { - "epoch": 1.76, - "learning_rate": 7.651073570150303e-07, - "loss": 0.6006, - "step": 68849 - }, - { - "epoch": 1.76, - "learning_rate": 7.650804608338393e-07, - "loss": 0.7051, - "step": 68850 - }, - { - "epoch": 1.76, - "learning_rate": 7.650535648325151e-07, - "loss": 0.6865, - "step": 68851 - }, - { - "epoch": 1.76, - "learning_rate": 7.65026669011079e-07, - "loss": 0.4832, - "step": 68852 - }, - { - "epoch": 1.76, - "learning_rate": 7.64999773369551e-07, - "loss": 0.7261, - "step": 68853 - }, - { - "epoch": 1.76, - "learning_rate": 7.649728779079518e-07, - "loss": 0.8027, - "step": 68854 - }, - { - "epoch": 1.76, - "learning_rate": 7.649459826263023e-07, - "loss": 0.7578, - "step": 68855 - }, - { - "epoch": 1.76, - "learning_rate": 7.64919087524623e-07, - "loss": 0.7227, - "step": 68856 - }, - { - "epoch": 1.76, - "learning_rate": 7.64892192602934e-07, - "loss": 0.7773, - "step": 68857 - }, - { - "epoch": 1.76, - "learning_rate": 7.648652978612562e-07, - "loss": 0.6963, - "step": 68858 - }, - { - "epoch": 1.76, - "learning_rate": 7.648384032996102e-07, - "loss": 0.6245, - "step": 68859 - }, - { - "epoch": 1.76, - "learning_rate": 7.648115089180168e-07, - "loss": 0.5286, - "step": 68860 - }, - { - "epoch": 1.76, - "learning_rate": 7.647846147164962e-07, - "loss": 0.7422, - "step": 68861 - }, - { - "epoch": 1.76, - "learning_rate": 7.647577206950694e-07, - "loss": 0.6042, - "step": 68862 - }, - { - "epoch": 1.76, - "learning_rate": 7.647308268537567e-07, - "loss": 0.5801, - "step": 68863 - }, - { - "epoch": 1.77, - "learning_rate": 7.647039331925789e-07, - "loss": 0.7646, - "step": 68864 - }, - { - "epoch": 1.77, - "learning_rate": 7.646770397115563e-07, - "loss": 0.8799, - "step": 68865 - }, - { - "epoch": 1.77, - "learning_rate": 7.6465014641071e-07, - "loss": 0.6572, - "step": 68866 - }, - { - "epoch": 1.77, - "learning_rate": 7.646232532900601e-07, - "loss": 0.8604, - "step": 68867 - }, - { - "epoch": 1.77, - "learning_rate": 7.645963603496271e-07, - "loss": 0.623, - "step": 68868 - }, - { - "epoch": 1.77, - "learning_rate": 7.645694675894322e-07, - "loss": 0.5879, - "step": 68869 - }, - { - "epoch": 1.77, - "learning_rate": 7.645425750094954e-07, - "loss": 0.4858, - "step": 68870 - }, - { - "epoch": 1.77, - "learning_rate": 7.645156826098375e-07, - "loss": 0.6426, - "step": 68871 - }, - { - "epoch": 1.77, - "learning_rate": 7.644887903904794e-07, - "loss": 0.6924, - "step": 68872 - }, - { - "epoch": 1.77, - "learning_rate": 7.644618983514411e-07, - "loss": 0.6665, - "step": 68873 - }, - { - "epoch": 1.77, - "learning_rate": 7.644350064927436e-07, - "loss": 0.791, - "step": 68874 - }, - { - "epoch": 1.77, - "learning_rate": 7.644081148144073e-07, - "loss": 0.79, - "step": 68875 - }, - { - "epoch": 1.77, - "learning_rate": 7.643812233164533e-07, - "loss": 0.5044, - "step": 68876 - }, - { - "epoch": 1.77, - "learning_rate": 7.643543319989014e-07, - "loss": 0.5596, - "step": 68877 - }, - { - "epoch": 1.77, - "learning_rate": 7.643274408617724e-07, - "loss": 0.6465, - "step": 68878 - }, - { - "epoch": 1.77, - "learning_rate": 7.643005499050874e-07, - "loss": 0.7432, - "step": 68879 - }, - { - "epoch": 1.77, - "learning_rate": 7.642736591288663e-07, - "loss": 0.7393, - "step": 68880 - }, - { - "epoch": 1.77, - "learning_rate": 7.642467685331303e-07, - "loss": 0.522, - "step": 68881 - }, - { - "epoch": 1.77, - "learning_rate": 7.642198781178995e-07, - "loss": 0.752, - "step": 68882 - }, - { - "epoch": 1.77, - "learning_rate": 7.641929878831948e-07, - "loss": 0.7451, - "step": 68883 - }, - { - "epoch": 1.77, - "learning_rate": 7.641660978290365e-07, - "loss": 0.7236, - "step": 68884 - }, - { - "epoch": 1.77, - "learning_rate": 7.641392079554456e-07, - "loss": 0.4626, - "step": 68885 - }, - { - "epoch": 1.77, - "learning_rate": 7.641123182624427e-07, - "loss": 0.6997, - "step": 68886 - }, - { - "epoch": 1.77, - "learning_rate": 7.640854287500478e-07, - "loss": 0.7158, - "step": 68887 - }, - { - "epoch": 1.77, - "learning_rate": 7.640585394182819e-07, - "loss": 0.6104, - "step": 68888 - }, - { - "epoch": 1.77, - "learning_rate": 7.640316502671657e-07, - "loss": 0.4883, - "step": 68889 - }, - { - "epoch": 1.77, - "learning_rate": 7.640047612967192e-07, - "loss": 0.6982, - "step": 68890 - }, - { - "epoch": 1.77, - "learning_rate": 7.639778725069637e-07, - "loss": 0.6113, - "step": 68891 - }, - { - "epoch": 1.77, - "learning_rate": 7.639509838979194e-07, - "loss": 0.5195, - "step": 68892 - }, - { - "epoch": 1.77, - "learning_rate": 7.63924095469607e-07, - "loss": 0.616, - "step": 68893 - }, - { - "epoch": 1.77, - "learning_rate": 7.63897207222047e-07, - "loss": 0.7734, - "step": 68894 - }, - { - "epoch": 1.77, - "learning_rate": 7.638703191552602e-07, - "loss": 0.8438, - "step": 68895 - }, - { - "epoch": 1.77, - "learning_rate": 7.638434312692672e-07, - "loss": 0.5371, - "step": 68896 - }, - { - "epoch": 1.77, - "learning_rate": 7.638165435640881e-07, - "loss": 0.6689, - "step": 68897 - }, - { - "epoch": 1.77, - "learning_rate": 7.63789656039744e-07, - "loss": 0.6758, - "step": 68898 - }, - { - "epoch": 1.77, - "learning_rate": 7.637627686962551e-07, - "loss": 0.6738, - "step": 68899 - }, - { - "epoch": 1.77, - "learning_rate": 7.637358815336423e-07, - "loss": 0.8086, - "step": 68900 - }, - { - "epoch": 1.77, - "learning_rate": 7.637089945519259e-07, - "loss": 0.8418, - "step": 68901 - }, - { - "epoch": 1.77, - "learning_rate": 7.63682107751127e-07, - "loss": 0.6445, - "step": 68902 - }, - { - "epoch": 1.77, - "learning_rate": 7.636552211312654e-07, - "loss": 0.7236, - "step": 68903 - }, - { - "epoch": 1.77, - "learning_rate": 7.636283346923626e-07, - "loss": 0.6177, - "step": 68904 - }, - { - "epoch": 1.77, - "learning_rate": 7.636014484344383e-07, - "loss": 0.6099, - "step": 68905 - }, - { - "epoch": 1.77, - "learning_rate": 7.635745623575143e-07, - "loss": 0.564, - "step": 68906 - }, - { - "epoch": 1.77, - "learning_rate": 7.635476764616096e-07, - "loss": 0.6118, - "step": 68907 - }, - { - "epoch": 1.77, - "learning_rate": 7.635207907467458e-07, - "loss": 0.8359, - "step": 68908 - }, - { - "epoch": 1.77, - "learning_rate": 7.634939052129431e-07, - "loss": 0.6504, - "step": 68909 - }, - { - "epoch": 1.77, - "learning_rate": 7.634670198602224e-07, - "loss": 0.6758, - "step": 68910 - }, - { - "epoch": 1.77, - "learning_rate": 7.63440134688604e-07, - "loss": 0.6992, - "step": 68911 - }, - { - "epoch": 1.77, - "learning_rate": 7.634132496981088e-07, - "loss": 0.7998, - "step": 68912 - }, - { - "epoch": 1.77, - "learning_rate": 7.63386364888757e-07, - "loss": 0.7539, - "step": 68913 - }, - { - "epoch": 1.77, - "learning_rate": 7.633594802605696e-07, - "loss": 0.5776, - "step": 68914 - }, - { - "epoch": 1.77, - "learning_rate": 7.633325958135667e-07, - "loss": 0.4922, - "step": 68915 - }, - { - "epoch": 1.77, - "learning_rate": 7.633057115477696e-07, - "loss": 0.564, - "step": 68916 - }, - { - "epoch": 1.77, - "learning_rate": 7.632788274631982e-07, - "loss": 0.7051, - "step": 68917 - }, - { - "epoch": 1.77, - "learning_rate": 7.632519435598731e-07, - "loss": 0.7705, - "step": 68918 - }, - { - "epoch": 1.77, - "learning_rate": 7.632250598378152e-07, - "loss": 0.583, - "step": 68919 - }, - { - "epoch": 1.77, - "learning_rate": 7.631981762970449e-07, - "loss": 0.625, - "step": 68920 - }, - { - "epoch": 1.77, - "learning_rate": 7.631712929375832e-07, - "loss": 0.6494, - "step": 68921 - }, - { - "epoch": 1.77, - "learning_rate": 7.6314440975945e-07, - "loss": 0.728, - "step": 68922 - }, - { - "epoch": 1.77, - "learning_rate": 7.631175267626663e-07, - "loss": 0.5249, - "step": 68923 - }, - { - "epoch": 1.77, - "learning_rate": 7.630906439472527e-07, - "loss": 0.6162, - "step": 68924 - }, - { - "epoch": 1.77, - "learning_rate": 7.630637613132298e-07, - "loss": 0.5815, - "step": 68925 - }, - { - "epoch": 1.77, - "learning_rate": 7.630368788606183e-07, - "loss": 0.666, - "step": 68926 - }, - { - "epoch": 1.77, - "learning_rate": 7.630099965894384e-07, - "loss": 0.7432, - "step": 68927 - }, - { - "epoch": 1.77, - "learning_rate": 7.629831144997106e-07, - "loss": 0.729, - "step": 68928 - }, - { - "epoch": 1.77, - "learning_rate": 7.629562325914558e-07, - "loss": 0.7363, - "step": 68929 - }, - { - "epoch": 1.77, - "learning_rate": 7.629293508646943e-07, - "loss": 0.6455, - "step": 68930 - }, - { - "epoch": 1.77, - "learning_rate": 7.629024693194474e-07, - "loss": 0.6086, - "step": 68931 - }, - { - "epoch": 1.77, - "learning_rate": 7.628755879557347e-07, - "loss": 0.6709, - "step": 68932 - }, - { - "epoch": 1.77, - "learning_rate": 7.628487067735776e-07, - "loss": 0.6953, - "step": 68933 - }, - { - "epoch": 1.77, - "learning_rate": 7.62821825772996e-07, - "loss": 0.5273, - "step": 68934 - }, - { - "epoch": 1.77, - "learning_rate": 7.627949449540112e-07, - "loss": 0.707, - "step": 68935 - }, - { - "epoch": 1.77, - "learning_rate": 7.627680643166436e-07, - "loss": 0.584, - "step": 68936 - }, - { - "epoch": 1.77, - "learning_rate": 7.62741183860913e-07, - "loss": 0.563, - "step": 68937 - }, - { - "epoch": 1.77, - "learning_rate": 7.627143035868409e-07, - "loss": 0.4648, - "step": 68938 - }, - { - "epoch": 1.77, - "learning_rate": 7.626874234944473e-07, - "loss": 0.6865, - "step": 68939 - }, - { - "epoch": 1.77, - "learning_rate": 7.626605435837532e-07, - "loss": 0.5532, - "step": 68940 - }, - { - "epoch": 1.77, - "learning_rate": 7.626336638547789e-07, - "loss": 0.6904, - "step": 68941 - }, - { - "epoch": 1.77, - "learning_rate": 7.626067843075452e-07, - "loss": 0.4216, - "step": 68942 - }, - { - "epoch": 1.77, - "learning_rate": 7.625799049420724e-07, - "loss": 0.709, - "step": 68943 - }, - { - "epoch": 1.77, - "learning_rate": 7.625530257583814e-07, - "loss": 0.7285, - "step": 68944 - }, - { - "epoch": 1.77, - "learning_rate": 7.625261467564927e-07, - "loss": 0.5896, - "step": 68945 - }, - { - "epoch": 1.77, - "learning_rate": 7.62499267936427e-07, - "loss": 0.5911, - "step": 68946 - }, - { - "epoch": 1.77, - "learning_rate": 7.624723892982043e-07, - "loss": 0.6406, - "step": 68947 - }, - { - "epoch": 1.77, - "learning_rate": 7.624455108418458e-07, - "loss": 0.7891, - "step": 68948 - }, - { - "epoch": 1.77, - "learning_rate": 7.624186325673716e-07, - "loss": 0.4708, - "step": 68949 - }, - { - "epoch": 1.77, - "learning_rate": 7.623917544748028e-07, - "loss": 0.6343, - "step": 68950 - }, - { - "epoch": 1.77, - "learning_rate": 7.623648765641594e-07, - "loss": 0.5139, - "step": 68951 - }, - { - "epoch": 1.77, - "learning_rate": 7.623379988354626e-07, - "loss": 0.6182, - "step": 68952 - }, - { - "epoch": 1.77, - "learning_rate": 7.623111212887323e-07, - "loss": 0.5928, - "step": 68953 - }, - { - "epoch": 1.77, - "learning_rate": 7.622842439239898e-07, - "loss": 0.6685, - "step": 68954 - }, - { - "epoch": 1.77, - "learning_rate": 7.622573667412551e-07, - "loss": 0.6221, - "step": 68955 - }, - { - "epoch": 1.77, - "learning_rate": 7.622304897405494e-07, - "loss": 0.5781, - "step": 68956 - }, - { - "epoch": 1.77, - "learning_rate": 7.622036129218926e-07, - "loss": 0.7134, - "step": 68957 - }, - { - "epoch": 1.77, - "learning_rate": 7.621767362853055e-07, - "loss": 0.5174, - "step": 68958 - }, - { - "epoch": 1.77, - "learning_rate": 7.621498598308087e-07, - "loss": 0.8086, - "step": 68959 - }, - { - "epoch": 1.77, - "learning_rate": 7.621229835584229e-07, - "loss": 0.6885, - "step": 68960 - }, - { - "epoch": 1.77, - "learning_rate": 7.620961074681686e-07, - "loss": 0.5757, - "step": 68961 - }, - { - "epoch": 1.77, - "learning_rate": 7.620692315600664e-07, - "loss": 0.6699, - "step": 68962 - }, - { - "epoch": 1.77, - "learning_rate": 7.620423558341366e-07, - "loss": 0.5781, - "step": 68963 - }, - { - "epoch": 1.77, - "learning_rate": 7.620154802904004e-07, - "loss": 0.5349, - "step": 68964 - }, - { - "epoch": 1.77, - "learning_rate": 7.619886049288777e-07, - "loss": 0.8184, - "step": 68965 - }, - { - "epoch": 1.77, - "learning_rate": 7.619617297495898e-07, - "loss": 0.6484, - "step": 68966 - }, - { - "epoch": 1.77, - "learning_rate": 7.619348547525567e-07, - "loss": 0.5598, - "step": 68967 - }, - { - "epoch": 1.77, - "learning_rate": 7.619079799377989e-07, - "loss": 0.6758, - "step": 68968 - }, - { - "epoch": 1.77, - "learning_rate": 7.618811053053373e-07, - "loss": 0.5195, - "step": 68969 - }, - { - "epoch": 1.77, - "learning_rate": 7.618542308551923e-07, - "loss": 0.5928, - "step": 68970 - }, - { - "epoch": 1.77, - "learning_rate": 7.618273565873847e-07, - "loss": 0.708, - "step": 68971 - }, - { - "epoch": 1.77, - "learning_rate": 7.618004825019349e-07, - "loss": 0.5918, - "step": 68972 - }, - { - "epoch": 1.77, - "learning_rate": 7.617736085988636e-07, - "loss": 0.5825, - "step": 68973 - }, - { - "epoch": 1.77, - "learning_rate": 7.617467348781911e-07, - "loss": 0.375, - "step": 68974 - }, - { - "epoch": 1.77, - "learning_rate": 7.617198613399383e-07, - "loss": 0.6704, - "step": 68975 - }, - { - "epoch": 1.77, - "learning_rate": 7.61692987984126e-07, - "loss": 0.6323, - "step": 68976 - }, - { - "epoch": 1.77, - "learning_rate": 7.61666114810774e-07, - "loss": 0.6157, - "step": 68977 - }, - { - "epoch": 1.77, - "learning_rate": 7.616392418199033e-07, - "loss": 0.6582, - "step": 68978 - }, - { - "epoch": 1.77, - "learning_rate": 7.616123690115347e-07, - "loss": 0.6313, - "step": 68979 - }, - { - "epoch": 1.77, - "learning_rate": 7.615854963856882e-07, - "loss": 0.6118, - "step": 68980 - }, - { - "epoch": 1.77, - "learning_rate": 7.61558623942385e-07, - "loss": 0.5625, - "step": 68981 - }, - { - "epoch": 1.77, - "learning_rate": 7.615317516816452e-07, - "loss": 0.5947, - "step": 68982 - }, - { - "epoch": 1.77, - "learning_rate": 7.615048796034897e-07, - "loss": 0.5654, - "step": 68983 - }, - { - "epoch": 1.77, - "learning_rate": 7.614780077079388e-07, - "loss": 0.5198, - "step": 68984 - }, - { - "epoch": 1.77, - "learning_rate": 7.614511359950134e-07, - "loss": 0.6035, - "step": 68985 - }, - { - "epoch": 1.77, - "learning_rate": 7.614242644647342e-07, - "loss": 0.5048, - "step": 68986 - }, - { - "epoch": 1.77, - "learning_rate": 7.613973931171209e-07, - "loss": 0.6846, - "step": 68987 - }, - { - "epoch": 1.77, - "learning_rate": 7.61370521952195e-07, - "loss": 0.5288, - "step": 68988 - }, - { - "epoch": 1.77, - "learning_rate": 7.613436509699765e-07, - "loss": 0.6719, - "step": 68989 - }, - { - "epoch": 1.77, - "learning_rate": 7.613167801704862e-07, - "loss": 0.5337, - "step": 68990 - }, - { - "epoch": 1.77, - "learning_rate": 7.612899095537448e-07, - "loss": 0.5757, - "step": 68991 - }, - { - "epoch": 1.77, - "learning_rate": 7.612630391197727e-07, - "loss": 0.5913, - "step": 68992 - }, - { - "epoch": 1.77, - "learning_rate": 7.612361688685903e-07, - "loss": 0.666, - "step": 68993 - }, - { - "epoch": 1.77, - "learning_rate": 7.612092988002187e-07, - "loss": 0.5007, - "step": 68994 - }, - { - "epoch": 1.77, - "learning_rate": 7.611824289146779e-07, - "loss": 0.6484, - "step": 68995 - }, - { - "epoch": 1.77, - "learning_rate": 7.611555592119893e-07, - "loss": 0.5757, - "step": 68996 - }, - { - "epoch": 1.77, - "learning_rate": 7.611286896921723e-07, - "loss": 0.7345, - "step": 68997 - }, - { - "epoch": 1.77, - "learning_rate": 7.611018203552484e-07, - "loss": 0.6045, - "step": 68998 - }, - { - "epoch": 1.77, - "learning_rate": 7.610749512012375e-07, - "loss": 0.5424, - "step": 68999 - }, - { - "epoch": 1.77, - "learning_rate": 7.610480822301609e-07, - "loss": 0.5547, - "step": 69000 - }, - { - "epoch": 1.77, - "learning_rate": 7.610212134420385e-07, - "loss": 0.6401, - "step": 69001 - }, - { - "epoch": 1.77, - "learning_rate": 7.609943448368914e-07, - "loss": 0.6836, - "step": 69002 - }, - { - "epoch": 1.77, - "learning_rate": 7.609674764147397e-07, - "loss": 0.499, - "step": 69003 - }, - { - "epoch": 1.77, - "learning_rate": 7.609406081756045e-07, - "loss": 0.4883, - "step": 69004 - }, - { - "epoch": 1.77, - "learning_rate": 7.609137401195057e-07, - "loss": 0.7266, - "step": 69005 - }, - { - "epoch": 1.77, - "learning_rate": 7.608868722464648e-07, - "loss": 0.6357, - "step": 69006 - }, - { - "epoch": 1.77, - "learning_rate": 7.608600045565016e-07, - "loss": 0.6318, - "step": 69007 - }, - { - "epoch": 1.77, - "learning_rate": 7.608331370496367e-07, - "loss": 0.7744, - "step": 69008 - }, - { - "epoch": 1.77, - "learning_rate": 7.60806269725891e-07, - "loss": 0.6846, - "step": 69009 - }, - { - "epoch": 1.77, - "learning_rate": 7.607794025852849e-07, - "loss": 0.7397, - "step": 69010 - }, - { - "epoch": 1.77, - "learning_rate": 7.60752535627839e-07, - "loss": 0.7368, - "step": 69011 - }, - { - "epoch": 1.77, - "learning_rate": 7.607256688535739e-07, - "loss": 0.6289, - "step": 69012 - }, - { - "epoch": 1.77, - "learning_rate": 7.606988022625102e-07, - "loss": 0.6387, - "step": 69013 - }, - { - "epoch": 1.77, - "learning_rate": 7.606719358546682e-07, - "loss": 0.6731, - "step": 69014 - }, - { - "epoch": 1.77, - "learning_rate": 7.60645069630069e-07, - "loss": 0.7158, - "step": 69015 - }, - { - "epoch": 1.77, - "learning_rate": 7.606182035887329e-07, - "loss": 0.6768, - "step": 69016 - }, - { - "epoch": 1.77, - "learning_rate": 7.605913377306805e-07, - "loss": 0.7832, - "step": 69017 - }, - { - "epoch": 1.77, - "learning_rate": 7.60564472055932e-07, - "loss": 0.6074, - "step": 69018 - }, - { - "epoch": 1.77, - "learning_rate": 7.605376065645084e-07, - "loss": 0.5796, - "step": 69019 - }, - { - "epoch": 1.77, - "learning_rate": 7.6051074125643e-07, - "loss": 0.3811, - "step": 69020 - }, - { - "epoch": 1.77, - "learning_rate": 7.604838761317177e-07, - "loss": 0.5669, - "step": 69021 - }, - { - "epoch": 1.77, - "learning_rate": 7.604570111903916e-07, - "loss": 0.6709, - "step": 69022 - }, - { - "epoch": 1.77, - "learning_rate": 7.604301464324729e-07, - "loss": 0.7065, - "step": 69023 - }, - { - "epoch": 1.77, - "learning_rate": 7.604032818579815e-07, - "loss": 0.6543, - "step": 69024 - }, - { - "epoch": 1.77, - "learning_rate": 7.603764174669386e-07, - "loss": 0.7314, - "step": 69025 - }, - { - "epoch": 1.77, - "learning_rate": 7.603495532593647e-07, - "loss": 0.75, - "step": 69026 - }, - { - "epoch": 1.77, - "learning_rate": 7.603226892352796e-07, - "loss": 0.5715, - "step": 69027 - }, - { - "epoch": 1.77, - "learning_rate": 7.602958253947045e-07, - "loss": 0.5273, - "step": 69028 - }, - { - "epoch": 1.77, - "learning_rate": 7.602689617376598e-07, - "loss": 0.6094, - "step": 69029 - }, - { - "epoch": 1.77, - "learning_rate": 7.602420982641664e-07, - "loss": 0.6064, - "step": 69030 - }, - { - "epoch": 1.77, - "learning_rate": 7.602152349742443e-07, - "loss": 0.6514, - "step": 69031 - }, - { - "epoch": 1.77, - "learning_rate": 7.601883718679146e-07, - "loss": 0.5957, - "step": 69032 - }, - { - "epoch": 1.77, - "learning_rate": 7.601615089451974e-07, - "loss": 0.6152, - "step": 69033 - }, - { - "epoch": 1.77, - "learning_rate": 7.601346462061138e-07, - "loss": 0.6123, - "step": 69034 - }, - { - "epoch": 1.77, - "learning_rate": 7.601077836506839e-07, - "loss": 0.502, - "step": 69035 - }, - { - "epoch": 1.77, - "learning_rate": 7.600809212789289e-07, - "loss": 0.6628, - "step": 69036 - }, - { - "epoch": 1.77, - "learning_rate": 7.600540590908683e-07, - "loss": 0.5791, - "step": 69037 - }, - { - "epoch": 1.77, - "learning_rate": 7.600271970865235e-07, - "loss": 0.6699, - "step": 69038 - }, - { - "epoch": 1.77, - "learning_rate": 7.600003352659146e-07, - "loss": 0.4398, - "step": 69039 - }, - { - "epoch": 1.77, - "learning_rate": 7.599734736290627e-07, - "loss": 0.6248, - "step": 69040 - }, - { - "epoch": 1.77, - "learning_rate": 7.599466121759878e-07, - "loss": 0.6914, - "step": 69041 - }, - { - "epoch": 1.77, - "learning_rate": 7.599197509067112e-07, - "loss": 0.689, - "step": 69042 - }, - { - "epoch": 1.77, - "learning_rate": 7.598928898212524e-07, - "loss": 0.8286, - "step": 69043 - }, - { - "epoch": 1.77, - "learning_rate": 7.59866028919633e-07, - "loss": 0.6436, - "step": 69044 - }, - { - "epoch": 1.77, - "learning_rate": 7.598391682018729e-07, - "loss": 0.5264, - "step": 69045 - }, - { - "epoch": 1.77, - "learning_rate": 7.598123076679935e-07, - "loss": 0.7334, - "step": 69046 - }, - { - "epoch": 1.77, - "learning_rate": 7.597854473180143e-07, - "loss": 0.6519, - "step": 69047 - }, - { - "epoch": 1.77, - "learning_rate": 7.597585871519563e-07, - "loss": 0.5552, - "step": 69048 - }, - { - "epoch": 1.77, - "learning_rate": 7.597317271698402e-07, - "loss": 0.7871, - "step": 69049 - }, - { - "epoch": 1.77, - "learning_rate": 7.597048673716863e-07, - "loss": 0.4691, - "step": 69050 - }, - { - "epoch": 1.77, - "learning_rate": 7.596780077575156e-07, - "loss": 0.6787, - "step": 69051 - }, - { - "epoch": 1.77, - "learning_rate": 7.596511483273482e-07, - "loss": 0.582, - "step": 69052 - }, - { - "epoch": 1.77, - "learning_rate": 7.596242890812047e-07, - "loss": 0.6782, - "step": 69053 - }, - { - "epoch": 1.77, - "learning_rate": 7.595974300191063e-07, - "loss": 0.6025, - "step": 69054 - }, - { - "epoch": 1.77, - "learning_rate": 7.595705711410727e-07, - "loss": 0.7036, - "step": 69055 - }, - { - "epoch": 1.77, - "learning_rate": 7.595437124471253e-07, - "loss": 0.582, - "step": 69056 - }, - { - "epoch": 1.77, - "learning_rate": 7.59516853937284e-07, - "loss": 0.6797, - "step": 69057 - }, - { - "epoch": 1.77, - "learning_rate": 7.594899956115693e-07, - "loss": 0.7451, - "step": 69058 - }, - { - "epoch": 1.77, - "learning_rate": 7.594631374700025e-07, - "loss": 0.5752, - "step": 69059 - }, - { - "epoch": 1.77, - "learning_rate": 7.594362795126032e-07, - "loss": 0.7178, - "step": 69060 - }, - { - "epoch": 1.77, - "learning_rate": 7.594094217393929e-07, - "loss": 0.6333, - "step": 69061 - }, - { - "epoch": 1.77, - "learning_rate": 7.593825641503915e-07, - "loss": 0.6626, - "step": 69062 - }, - { - "epoch": 1.77, - "learning_rate": 7.5935570674562e-07, - "loss": 0.8037, - "step": 69063 - }, - { - "epoch": 1.77, - "learning_rate": 7.593288495250985e-07, - "loss": 0.541, - "step": 69064 - }, - { - "epoch": 1.77, - "learning_rate": 7.593019924888481e-07, - "loss": 0.5703, - "step": 69065 - }, - { - "epoch": 1.77, - "learning_rate": 7.592751356368892e-07, - "loss": 0.6934, - "step": 69066 - }, - { - "epoch": 1.77, - "learning_rate": 7.59248278969242e-07, - "loss": 0.4214, - "step": 69067 - }, - { - "epoch": 1.77, - "learning_rate": 7.592214224859275e-07, - "loss": 0.7051, - "step": 69068 - }, - { - "epoch": 1.77, - "learning_rate": 7.591945661869661e-07, - "loss": 0.5923, - "step": 69069 - }, - { - "epoch": 1.77, - "learning_rate": 7.591677100723782e-07, - "loss": 0.6357, - "step": 69070 - }, - { - "epoch": 1.77, - "learning_rate": 7.591408541421845e-07, - "loss": 0.8467, - "step": 69071 - }, - { - "epoch": 1.77, - "learning_rate": 7.591139983964054e-07, - "loss": 0.6084, - "step": 69072 - }, - { - "epoch": 1.77, - "learning_rate": 7.590871428350621e-07, - "loss": 0.644, - "step": 69073 - }, - { - "epoch": 1.77, - "learning_rate": 7.590602874581742e-07, - "loss": 0.7842, - "step": 69074 - }, - { - "epoch": 1.77, - "learning_rate": 7.590334322657631e-07, - "loss": 0.6982, - "step": 69075 - }, - { - "epoch": 1.77, - "learning_rate": 7.590065772578492e-07, - "loss": 0.5361, - "step": 69076 - }, - { - "epoch": 1.77, - "learning_rate": 7.589797224344525e-07, - "loss": 0.7383, - "step": 69077 - }, - { - "epoch": 1.77, - "learning_rate": 7.589528677955941e-07, - "loss": 0.5981, - "step": 69078 - }, - { - "epoch": 1.77, - "learning_rate": 7.589260133412942e-07, - "loss": 0.5029, - "step": 69079 - }, - { - "epoch": 1.77, - "learning_rate": 7.588991590715738e-07, - "loss": 0.7021, - "step": 69080 - }, - { - "epoch": 1.77, - "learning_rate": 7.58872304986453e-07, - "loss": 0.916, - "step": 69081 - }, - { - "epoch": 1.77, - "learning_rate": 7.588454510859528e-07, - "loss": 0.7705, - "step": 69082 - }, - { - "epoch": 1.77, - "learning_rate": 7.588185973700934e-07, - "loss": 0.7441, - "step": 69083 - }, - { - "epoch": 1.77, - "learning_rate": 7.587917438388958e-07, - "loss": 0.5654, - "step": 69084 - }, - { - "epoch": 1.77, - "learning_rate": 7.587648904923798e-07, - "loss": 0.6484, - "step": 69085 - }, - { - "epoch": 1.77, - "learning_rate": 7.587380373305673e-07, - "loss": 0.5898, - "step": 69086 - }, - { - "epoch": 1.77, - "learning_rate": 7.587111843534773e-07, - "loss": 0.5596, - "step": 69087 - }, - { - "epoch": 1.77, - "learning_rate": 7.586843315611311e-07, - "loss": 0.6118, - "step": 69088 - }, - { - "epoch": 1.77, - "learning_rate": 7.586574789535492e-07, - "loss": 0.6191, - "step": 69089 - }, - { - "epoch": 1.77, - "learning_rate": 7.586306265307523e-07, - "loss": 0.6606, - "step": 69090 - }, - { - "epoch": 1.77, - "learning_rate": 7.586037742927606e-07, - "loss": 0.5703, - "step": 69091 - }, - { - "epoch": 1.77, - "learning_rate": 7.585769222395951e-07, - "loss": 0.5137, - "step": 69092 - }, - { - "epoch": 1.77, - "learning_rate": 7.585500703712759e-07, - "loss": 0.6406, - "step": 69093 - }, - { - "epoch": 1.77, - "learning_rate": 7.585232186878242e-07, - "loss": 0.5991, - "step": 69094 - }, - { - "epoch": 1.77, - "learning_rate": 7.584963671892598e-07, - "loss": 0.6265, - "step": 69095 - }, - { - "epoch": 1.77, - "learning_rate": 7.584695158756042e-07, - "loss": 0.5806, - "step": 69096 - }, - { - "epoch": 1.77, - "learning_rate": 7.58442664746877e-07, - "loss": 0.561, - "step": 69097 - }, - { - "epoch": 1.77, - "learning_rate": 7.584158138030989e-07, - "loss": 0.7441, - "step": 69098 - }, - { - "epoch": 1.77, - "learning_rate": 7.583889630442911e-07, - "loss": 0.6895, - "step": 69099 - }, - { - "epoch": 1.77, - "learning_rate": 7.583621124704734e-07, - "loss": 0.708, - "step": 69100 - }, - { - "epoch": 1.77, - "learning_rate": 7.58335262081667e-07, - "loss": 0.6865, - "step": 69101 - }, - { - "epoch": 1.77, - "learning_rate": 7.58308411877892e-07, - "loss": 0.501, - "step": 69102 - }, - { - "epoch": 1.77, - "learning_rate": 7.582815618591694e-07, - "loss": 0.7549, - "step": 69103 - }, - { - "epoch": 1.77, - "learning_rate": 7.582547120255191e-07, - "loss": 0.6279, - "step": 69104 - }, - { - "epoch": 1.77, - "learning_rate": 7.582278623769623e-07, - "loss": 0.6611, - "step": 69105 - }, - { - "epoch": 1.77, - "learning_rate": 7.582010129135197e-07, - "loss": 0.6621, - "step": 69106 - }, - { - "epoch": 1.77, - "learning_rate": 7.581741636352111e-07, - "loss": 0.5605, - "step": 69107 - }, - { - "epoch": 1.77, - "learning_rate": 7.581473145420571e-07, - "loss": 0.6729, - "step": 69108 - }, - { - "epoch": 1.77, - "learning_rate": 7.58120465634079e-07, - "loss": 0.5723, - "step": 69109 - }, - { - "epoch": 1.77, - "learning_rate": 7.580936169112967e-07, - "loss": 0.6028, - "step": 69110 - }, - { - "epoch": 1.77, - "learning_rate": 7.580667683737312e-07, - "loss": 0.7568, - "step": 69111 - }, - { - "epoch": 1.77, - "learning_rate": 7.580399200214026e-07, - "loss": 0.4736, - "step": 69112 - }, - { - "epoch": 1.77, - "learning_rate": 7.580130718543318e-07, - "loss": 0.5376, - "step": 69113 - }, - { - "epoch": 1.77, - "learning_rate": 7.579862238725393e-07, - "loss": 0.564, - "step": 69114 - }, - { - "epoch": 1.77, - "learning_rate": 7.579593760760457e-07, - "loss": 0.6929, - "step": 69115 - }, - { - "epoch": 1.77, - "learning_rate": 7.579325284648716e-07, - "loss": 0.6094, - "step": 69116 - }, - { - "epoch": 1.77, - "learning_rate": 7.579056810390371e-07, - "loss": 0.7656, - "step": 69117 - }, - { - "epoch": 1.77, - "learning_rate": 7.578788337985633e-07, - "loss": 0.6675, - "step": 69118 - }, - { - "epoch": 1.77, - "learning_rate": 7.578519867434704e-07, - "loss": 0.604, - "step": 69119 - }, - { - "epoch": 1.77, - "learning_rate": 7.578251398737793e-07, - "loss": 0.542, - "step": 69120 - }, - { - "epoch": 1.77, - "learning_rate": 7.577982931895101e-07, - "loss": 0.6084, - "step": 69121 - }, - { - "epoch": 1.77, - "learning_rate": 7.577714466906837e-07, - "loss": 0.6924, - "step": 69122 - }, - { - "epoch": 1.77, - "learning_rate": 7.577446003773204e-07, - "loss": 0.6523, - "step": 69123 - }, - { - "epoch": 1.77, - "learning_rate": 7.577177542494412e-07, - "loss": 0.6963, - "step": 69124 - }, - { - "epoch": 1.77, - "learning_rate": 7.576909083070665e-07, - "loss": 0.8154, - "step": 69125 - }, - { - "epoch": 1.77, - "learning_rate": 7.576640625502169e-07, - "loss": 0.7988, - "step": 69126 - }, - { - "epoch": 1.77, - "learning_rate": 7.576372169789122e-07, - "loss": 0.6128, - "step": 69127 - }, - { - "epoch": 1.77, - "learning_rate": 7.576103715931739e-07, - "loss": 0.7549, - "step": 69128 - }, - { - "epoch": 1.77, - "learning_rate": 7.575835263930218e-07, - "loss": 0.4854, - "step": 69129 - }, - { - "epoch": 1.77, - "learning_rate": 7.575566813784771e-07, - "loss": 0.4802, - "step": 69130 - }, - { - "epoch": 1.77, - "learning_rate": 7.5752983654956e-07, - "loss": 0.6045, - "step": 69131 - }, - { - "epoch": 1.77, - "learning_rate": 7.575029919062914e-07, - "loss": 0.4613, - "step": 69132 - }, - { - "epoch": 1.77, - "learning_rate": 7.574761474486913e-07, - "loss": 0.6079, - "step": 69133 - }, - { - "epoch": 1.77, - "learning_rate": 7.574493031767808e-07, - "loss": 0.5361, - "step": 69134 - }, - { - "epoch": 1.77, - "learning_rate": 7.5742245909058e-07, - "loss": 0.6885, - "step": 69135 - }, - { - "epoch": 1.77, - "learning_rate": 7.573956151901101e-07, - "loss": 0.7388, - "step": 69136 - }, - { - "epoch": 1.77, - "learning_rate": 7.57368771475391e-07, - "loss": 0.4663, - "step": 69137 - }, - { - "epoch": 1.77, - "learning_rate": 7.573419279464433e-07, - "loss": 0.6182, - "step": 69138 - }, - { - "epoch": 1.77, - "learning_rate": 7.573150846032879e-07, - "loss": 0.5903, - "step": 69139 - }, - { - "epoch": 1.77, - "learning_rate": 7.572882414459449e-07, - "loss": 0.4796, - "step": 69140 - }, - { - "epoch": 1.77, - "learning_rate": 7.572613984744355e-07, - "loss": 0.7686, - "step": 69141 - }, - { - "epoch": 1.77, - "learning_rate": 7.572345556887798e-07, - "loss": 0.8164, - "step": 69142 - }, - { - "epoch": 1.77, - "learning_rate": 7.572077130889982e-07, - "loss": 0.6621, - "step": 69143 - }, - { - "epoch": 1.77, - "learning_rate": 7.571808706751117e-07, - "loss": 0.499, - "step": 69144 - }, - { - "epoch": 1.77, - "learning_rate": 7.571540284471405e-07, - "loss": 0.582, - "step": 69145 - }, - { - "epoch": 1.77, - "learning_rate": 7.571271864051056e-07, - "loss": 0.4155, - "step": 69146 - }, - { - "epoch": 1.77, - "learning_rate": 7.571003445490272e-07, - "loss": 0.7173, - "step": 69147 - }, - { - "epoch": 1.77, - "learning_rate": 7.570735028789256e-07, - "loss": 0.7725, - "step": 69148 - }, - { - "epoch": 1.77, - "learning_rate": 7.570466613948218e-07, - "loss": 0.4927, - "step": 69149 - }, - { - "epoch": 1.77, - "learning_rate": 7.570198200967362e-07, - "loss": 0.54, - "step": 69150 - }, - { - "epoch": 1.77, - "learning_rate": 7.569929789846893e-07, - "loss": 0.5552, - "step": 69151 - }, - { - "epoch": 1.77, - "learning_rate": 7.569661380587016e-07, - "loss": 0.8271, - "step": 69152 - }, - { - "epoch": 1.77, - "learning_rate": 7.56939297318794e-07, - "loss": 0.6982, - "step": 69153 - }, - { - "epoch": 1.77, - "learning_rate": 7.569124567649865e-07, - "loss": 0.5654, - "step": 69154 - }, - { - "epoch": 1.77, - "learning_rate": 7.568856163973005e-07, - "loss": 0.5459, - "step": 69155 - }, - { - "epoch": 1.77, - "learning_rate": 7.568587762157557e-07, - "loss": 0.6846, - "step": 69156 - }, - { - "epoch": 1.77, - "learning_rate": 7.568319362203728e-07, - "loss": 0.5898, - "step": 69157 - }, - { - "epoch": 1.77, - "learning_rate": 7.568050964111727e-07, - "loss": 0.793, - "step": 69158 - }, - { - "epoch": 1.77, - "learning_rate": 7.567782567881757e-07, - "loss": 0.4506, - "step": 69159 - }, - { - "epoch": 1.77, - "learning_rate": 7.567514173514023e-07, - "loss": 0.4351, - "step": 69160 - }, - { - "epoch": 1.77, - "learning_rate": 7.567245781008734e-07, - "loss": 0.729, - "step": 69161 - }, - { - "epoch": 1.77, - "learning_rate": 7.566977390366088e-07, - "loss": 0.6372, - "step": 69162 - }, - { - "epoch": 1.77, - "learning_rate": 7.5667090015863e-07, - "loss": 0.5887, - "step": 69163 - }, - { - "epoch": 1.77, - "learning_rate": 7.566440614669569e-07, - "loss": 0.6436, - "step": 69164 - }, - { - "epoch": 1.77, - "learning_rate": 7.566172229616106e-07, - "loss": 0.4547, - "step": 69165 - }, - { - "epoch": 1.77, - "learning_rate": 7.565903846426111e-07, - "loss": 0.4746, - "step": 69166 - }, - { - "epoch": 1.77, - "learning_rate": 7.56563546509979e-07, - "loss": 0.6543, - "step": 69167 - }, - { - "epoch": 1.77, - "learning_rate": 7.565367085637352e-07, - "loss": 0.668, - "step": 69168 - }, - { - "epoch": 1.77, - "learning_rate": 7.565098708038997e-07, - "loss": 0.6899, - "step": 69169 - }, - { - "epoch": 1.77, - "learning_rate": 7.564830332304938e-07, - "loss": 0.8311, - "step": 69170 - }, - { - "epoch": 1.77, - "learning_rate": 7.564561958435373e-07, - "loss": 0.7422, - "step": 69171 - }, - { - "epoch": 1.77, - "learning_rate": 7.564293586430514e-07, - "loss": 0.6812, - "step": 69172 - }, - { - "epoch": 1.77, - "learning_rate": 7.56402521629056e-07, - "loss": 0.623, - "step": 69173 - }, - { - "epoch": 1.77, - "learning_rate": 7.563756848015723e-07, - "loss": 0.6704, - "step": 69174 - }, - { - "epoch": 1.77, - "learning_rate": 7.563488481606209e-07, - "loss": 0.5903, - "step": 69175 - }, - { - "epoch": 1.77, - "learning_rate": 7.563220117062212e-07, - "loss": 0.7266, - "step": 69176 - }, - { - "epoch": 1.77, - "learning_rate": 7.562951754383951e-07, - "loss": 0.6372, - "step": 69177 - }, - { - "epoch": 1.77, - "learning_rate": 7.562683393571622e-07, - "loss": 0.5547, - "step": 69178 - }, - { - "epoch": 1.77, - "learning_rate": 7.562415034625436e-07, - "loss": 0.749, - "step": 69179 - }, - { - "epoch": 1.77, - "learning_rate": 7.562146677545596e-07, - "loss": 0.6953, - "step": 69180 - }, - { - "epoch": 1.77, - "learning_rate": 7.561878322332307e-07, - "loss": 0.5498, - "step": 69181 - }, - { - "epoch": 1.77, - "learning_rate": 7.561609968985778e-07, - "loss": 0.645, - "step": 69182 - }, - { - "epoch": 1.77, - "learning_rate": 7.561341617506211e-07, - "loss": 0.6582, - "step": 69183 - }, - { - "epoch": 1.77, - "learning_rate": 7.561073267893813e-07, - "loss": 0.6514, - "step": 69184 - }, - { - "epoch": 1.77, - "learning_rate": 7.560804920148792e-07, - "loss": 0.6885, - "step": 69185 - }, - { - "epoch": 1.77, - "learning_rate": 7.560536574271345e-07, - "loss": 0.7515, - "step": 69186 - }, - { - "epoch": 1.77, - "learning_rate": 7.560268230261687e-07, - "loss": 0.5889, - "step": 69187 - }, - { - "epoch": 1.77, - "learning_rate": 7.559999888120017e-07, - "loss": 0.4897, - "step": 69188 - }, - { - "epoch": 1.77, - "learning_rate": 7.559731547846544e-07, - "loss": 0.6128, - "step": 69189 - }, - { - "epoch": 1.77, - "learning_rate": 7.559463209441471e-07, - "loss": 0.623, - "step": 69190 - }, - { - "epoch": 1.77, - "learning_rate": 7.559194872905005e-07, - "loss": 0.6782, - "step": 69191 - }, - { - "epoch": 1.77, - "learning_rate": 7.558926538237353e-07, - "loss": 0.6777, - "step": 69192 - }, - { - "epoch": 1.77, - "learning_rate": 7.558658205438718e-07, - "loss": 0.4617, - "step": 69193 - }, - { - "epoch": 1.77, - "learning_rate": 7.558389874509305e-07, - "loss": 0.5347, - "step": 69194 - }, - { - "epoch": 1.77, - "learning_rate": 7.558121545449327e-07, - "loss": 0.4531, - "step": 69195 - }, - { - "epoch": 1.77, - "learning_rate": 7.557853218258976e-07, - "loss": 0.6504, - "step": 69196 - }, - { - "epoch": 1.77, - "learning_rate": 7.557584892938466e-07, - "loss": 0.7432, - "step": 69197 - }, - { - "epoch": 1.77, - "learning_rate": 7.557316569488e-07, - "loss": 0.6211, - "step": 69198 - }, - { - "epoch": 1.77, - "learning_rate": 7.557048247907787e-07, - "loss": 0.6326, - "step": 69199 - }, - { - "epoch": 1.77, - "learning_rate": 7.556779928198027e-07, - "loss": 0.5432, - "step": 69200 - }, - { - "epoch": 1.77, - "learning_rate": 7.55651161035893e-07, - "loss": 0.7031, - "step": 69201 - }, - { - "epoch": 1.77, - "learning_rate": 7.556243294390699e-07, - "loss": 0.6167, - "step": 69202 - }, - { - "epoch": 1.77, - "learning_rate": 7.55597498029354e-07, - "loss": 0.4595, - "step": 69203 - }, - { - "epoch": 1.77, - "learning_rate": 7.555706668067658e-07, - "loss": 0.6367, - "step": 69204 - }, - { - "epoch": 1.77, - "learning_rate": 7.555438357713262e-07, - "loss": 0.7324, - "step": 69205 - }, - { - "epoch": 1.77, - "learning_rate": 7.555170049230554e-07, - "loss": 0.5688, - "step": 69206 - }, - { - "epoch": 1.77, - "learning_rate": 7.554901742619737e-07, - "loss": 0.6958, - "step": 69207 - }, - { - "epoch": 1.77, - "learning_rate": 7.554633437881021e-07, - "loss": 0.6328, - "step": 69208 - }, - { - "epoch": 1.77, - "learning_rate": 7.554365135014609e-07, - "loss": 0.791, - "step": 69209 - }, - { - "epoch": 1.77, - "learning_rate": 7.554096834020707e-07, - "loss": 0.6782, - "step": 69210 - }, - { - "epoch": 1.77, - "learning_rate": 7.55382853489952e-07, - "loss": 0.5142, - "step": 69211 - }, - { - "epoch": 1.77, - "learning_rate": 7.553560237651256e-07, - "loss": 0.7373, - "step": 69212 - }, - { - "epoch": 1.77, - "learning_rate": 7.553291942276116e-07, - "loss": 0.6875, - "step": 69213 - }, - { - "epoch": 1.77, - "learning_rate": 7.55302364877431e-07, - "loss": 0.552, - "step": 69214 - }, - { - "epoch": 1.77, - "learning_rate": 7.552755357146044e-07, - "loss": 0.5933, - "step": 69215 - }, - { - "epoch": 1.77, - "learning_rate": 7.552487067391518e-07, - "loss": 0.7246, - "step": 69216 - }, - { - "epoch": 1.77, - "learning_rate": 7.55221877951094e-07, - "loss": 0.8877, - "step": 69217 - }, - { - "epoch": 1.77, - "learning_rate": 7.551950493504514e-07, - "loss": 0.4077, - "step": 69218 - }, - { - "epoch": 1.77, - "learning_rate": 7.551682209372447e-07, - "loss": 0.644, - "step": 69219 - }, - { - "epoch": 1.77, - "learning_rate": 7.551413927114946e-07, - "loss": 0.6133, - "step": 69220 - }, - { - "epoch": 1.77, - "learning_rate": 7.551145646732213e-07, - "loss": 0.7183, - "step": 69221 - }, - { - "epoch": 1.77, - "learning_rate": 7.550877368224458e-07, - "loss": 0.6895, - "step": 69222 - }, - { - "epoch": 1.77, - "learning_rate": 7.550609091591879e-07, - "loss": 0.6416, - "step": 69223 - }, - { - "epoch": 1.77, - "learning_rate": 7.55034081683469e-07, - "loss": 0.6885, - "step": 69224 - }, - { - "epoch": 1.77, - "learning_rate": 7.550072543953095e-07, - "loss": 0.6719, - "step": 69225 - }, - { - "epoch": 1.77, - "learning_rate": 7.549804272947292e-07, - "loss": 0.6058, - "step": 69226 - }, - { - "epoch": 1.77, - "learning_rate": 7.549536003817493e-07, - "loss": 0.5225, - "step": 69227 - }, - { - "epoch": 1.77, - "learning_rate": 7.549267736563899e-07, - "loss": 0.7031, - "step": 69228 - }, - { - "epoch": 1.77, - "learning_rate": 7.548999471186722e-07, - "loss": 0.6216, - "step": 69229 - }, - { - "epoch": 1.77, - "learning_rate": 7.548731207686159e-07, - "loss": 0.6543, - "step": 69230 - }, - { - "epoch": 1.77, - "learning_rate": 7.548462946062423e-07, - "loss": 0.5562, - "step": 69231 - }, - { - "epoch": 1.77, - "learning_rate": 7.548194686315715e-07, - "loss": 0.7451, - "step": 69232 - }, - { - "epoch": 1.77, - "learning_rate": 7.54792642844624e-07, - "loss": 0.8564, - "step": 69233 - }, - { - "epoch": 1.77, - "learning_rate": 7.547658172454209e-07, - "loss": 0.5991, - "step": 69234 - }, - { - "epoch": 1.77, - "learning_rate": 7.547389918339823e-07, - "loss": 0.5151, - "step": 69235 - }, - { - "epoch": 1.77, - "learning_rate": 7.547121666103286e-07, - "loss": 0.5918, - "step": 69236 - }, - { - "epoch": 1.77, - "learning_rate": 7.546853415744805e-07, - "loss": 0.7773, - "step": 69237 - }, - { - "epoch": 1.77, - "learning_rate": 7.546585167264586e-07, - "loss": 0.6021, - "step": 69238 - }, - { - "epoch": 1.77, - "learning_rate": 7.546316920662833e-07, - "loss": 0.6836, - "step": 69239 - }, - { - "epoch": 1.77, - "learning_rate": 7.546048675939751e-07, - "loss": 0.4785, - "step": 69240 - }, - { - "epoch": 1.77, - "learning_rate": 7.54578043309555e-07, - "loss": 0.6699, - "step": 69241 - }, - { - "epoch": 1.77, - "learning_rate": 7.54551219213043e-07, - "loss": 0.7314, - "step": 69242 - }, - { - "epoch": 1.77, - "learning_rate": 7.5452439530446e-07, - "loss": 0.5371, - "step": 69243 - }, - { - "epoch": 1.77, - "learning_rate": 7.54497571583826e-07, - "loss": 0.6566, - "step": 69244 - }, - { - "epoch": 1.77, - "learning_rate": 7.544707480511626e-07, - "loss": 0.5835, - "step": 69245 - }, - { - "epoch": 1.77, - "learning_rate": 7.544439247064893e-07, - "loss": 0.7744, - "step": 69246 - }, - { - "epoch": 1.77, - "learning_rate": 7.54417101549827e-07, - "loss": 0.6162, - "step": 69247 - }, - { - "epoch": 1.77, - "learning_rate": 7.543902785811962e-07, - "loss": 0.6006, - "step": 69248 - }, - { - "epoch": 1.77, - "learning_rate": 7.543634558006176e-07, - "loss": 0.6523, - "step": 69249 - }, - { - "epoch": 1.77, - "learning_rate": 7.543366332081114e-07, - "loss": 0.7559, - "step": 69250 - }, - { - "epoch": 1.77, - "learning_rate": 7.543098108036985e-07, - "loss": 0.5723, - "step": 69251 - }, - { - "epoch": 1.77, - "learning_rate": 7.542829885873991e-07, - "loss": 0.478, - "step": 69252 - }, - { - "epoch": 1.77, - "learning_rate": 7.54256166559234e-07, - "loss": 0.7534, - "step": 69253 - }, - { - "epoch": 1.78, - "learning_rate": 7.542293447192236e-07, - "loss": 0.5527, - "step": 69254 - }, - { - "epoch": 1.78, - "learning_rate": 7.542025230673888e-07, - "loss": 0.4822, - "step": 69255 - }, - { - "epoch": 1.78, - "learning_rate": 7.541757016037497e-07, - "loss": 0.5962, - "step": 69256 - }, - { - "epoch": 1.78, - "learning_rate": 7.541488803283267e-07, - "loss": 0.5624, - "step": 69257 - }, - { - "epoch": 1.78, - "learning_rate": 7.541220592411408e-07, - "loss": 0.4399, - "step": 69258 - }, - { - "epoch": 1.78, - "learning_rate": 7.540952383422122e-07, - "loss": 0.6147, - "step": 69259 - }, - { - "epoch": 1.78, - "learning_rate": 7.540684176315617e-07, - "loss": 0.5352, - "step": 69260 - }, - { - "epoch": 1.78, - "learning_rate": 7.540415971092096e-07, - "loss": 0.6631, - "step": 69261 - }, - { - "epoch": 1.78, - "learning_rate": 7.540147767751766e-07, - "loss": 0.6431, - "step": 69262 - }, - { - "epoch": 1.78, - "learning_rate": 7.539879566294832e-07, - "loss": 0.4443, - "step": 69263 - }, - { - "epoch": 1.78, - "learning_rate": 7.539611366721499e-07, - "loss": 0.7104, - "step": 69264 - }, - { - "epoch": 1.78, - "learning_rate": 7.539343169031975e-07, - "loss": 0.5862, - "step": 69265 - }, - { - "epoch": 1.78, - "learning_rate": 7.539074973226459e-07, - "loss": 0.4834, - "step": 69266 - }, - { - "epoch": 1.78, - "learning_rate": 7.538806779305162e-07, - "loss": 0.5742, - "step": 69267 - }, - { - "epoch": 1.78, - "learning_rate": 7.538538587268287e-07, - "loss": 0.5747, - "step": 69268 - }, - { - "epoch": 1.78, - "learning_rate": 7.538270397116038e-07, - "loss": 0.6401, - "step": 69269 - }, - { - "epoch": 1.78, - "learning_rate": 7.538002208848625e-07, - "loss": 0.6348, - "step": 69270 - }, - { - "epoch": 1.78, - "learning_rate": 7.537734022466248e-07, - "loss": 0.6758, - "step": 69271 - }, - { - "epoch": 1.78, - "learning_rate": 7.537465837969117e-07, - "loss": 0.4912, - "step": 69272 - }, - { - "epoch": 1.78, - "learning_rate": 7.537197655357433e-07, - "loss": 0.5435, - "step": 69273 - }, - { - "epoch": 1.78, - "learning_rate": 7.536929474631405e-07, - "loss": 0.7734, - "step": 69274 - }, - { - "epoch": 1.78, - "learning_rate": 7.53666129579124e-07, - "loss": 0.7441, - "step": 69275 - }, - { - "epoch": 1.78, - "learning_rate": 7.536393118837136e-07, - "loss": 0.8574, - "step": 69276 - }, - { - "epoch": 1.78, - "learning_rate": 7.536124943769303e-07, - "loss": 0.52, - "step": 69277 - }, - { - "epoch": 1.78, - "learning_rate": 7.535856770587945e-07, - "loss": 0.6689, - "step": 69278 - }, - { - "epoch": 1.78, - "learning_rate": 7.53558859929327e-07, - "loss": 0.6533, - "step": 69279 - }, - { - "epoch": 1.78, - "learning_rate": 7.535320429885478e-07, - "loss": 0.4573, - "step": 69280 - }, - { - "epoch": 1.78, - "learning_rate": 7.535052262364782e-07, - "loss": 0.5977, - "step": 69281 - }, - { - "epoch": 1.78, - "learning_rate": 7.534784096731381e-07, - "loss": 0.7471, - "step": 69282 - }, - { - "epoch": 1.78, - "learning_rate": 7.534515932985484e-07, - "loss": 0.5576, - "step": 69283 - }, - { - "epoch": 1.78, - "learning_rate": 7.534247771127293e-07, - "loss": 0.7188, - "step": 69284 - }, - { - "epoch": 1.78, - "learning_rate": 7.533979611157021e-07, - "loss": 0.6089, - "step": 69285 - }, - { - "epoch": 1.78, - "learning_rate": 7.533711453074861e-07, - "loss": 0.6372, - "step": 69286 - }, - { - "epoch": 1.78, - "learning_rate": 7.533443296881028e-07, - "loss": 0.7109, - "step": 69287 - }, - { - "epoch": 1.78, - "learning_rate": 7.533175142575721e-07, - "loss": 0.6079, - "step": 69288 - }, - { - "epoch": 1.78, - "learning_rate": 7.532906990159149e-07, - "loss": 0.7129, - "step": 69289 - }, - { - "epoch": 1.78, - "learning_rate": 7.532638839631516e-07, - "loss": 0.6763, - "step": 69290 - }, - { - "epoch": 1.78, - "learning_rate": 7.532370690993031e-07, - "loss": 0.5933, - "step": 69291 - }, - { - "epoch": 1.78, - "learning_rate": 7.532102544243893e-07, - "loss": 0.6416, - "step": 69292 - }, - { - "epoch": 1.78, - "learning_rate": 7.531834399384314e-07, - "loss": 0.6699, - "step": 69293 - }, - { - "epoch": 1.78, - "learning_rate": 7.531566256414492e-07, - "loss": 0.5094, - "step": 69294 - }, - { - "epoch": 1.78, - "learning_rate": 7.531298115334641e-07, - "loss": 0.499, - "step": 69295 - }, - { - "epoch": 1.78, - "learning_rate": 7.53102997614496e-07, - "loss": 0.5391, - "step": 69296 - }, - { - "epoch": 1.78, - "learning_rate": 7.530761838845653e-07, - "loss": 0.6602, - "step": 69297 - }, - { - "epoch": 1.78, - "learning_rate": 7.530493703436931e-07, - "loss": 0.6953, - "step": 69298 - }, - { - "epoch": 1.78, - "learning_rate": 7.530225569918993e-07, - "loss": 0.5165, - "step": 69299 - }, - { - "epoch": 1.78, - "learning_rate": 7.529957438292052e-07, - "loss": 0.5049, - "step": 69300 - }, - { - "epoch": 1.78, - "learning_rate": 7.529689308556305e-07, - "loss": 0.4843, - "step": 69301 - }, - { - "epoch": 1.78, - "learning_rate": 7.529421180711964e-07, - "loss": 0.6182, - "step": 69302 - }, - { - "epoch": 1.78, - "learning_rate": 7.52915305475923e-07, - "loss": 0.8311, - "step": 69303 - }, - { - "epoch": 1.78, - "learning_rate": 7.528884930698312e-07, - "loss": 0.5791, - "step": 69304 - }, - { - "epoch": 1.78, - "learning_rate": 7.528616808529415e-07, - "loss": 0.7334, - "step": 69305 - }, - { - "epoch": 1.78, - "learning_rate": 7.528348688252739e-07, - "loss": 0.6223, - "step": 69306 - }, - { - "epoch": 1.78, - "learning_rate": 7.528080569868492e-07, - "loss": 0.5408, - "step": 69307 - }, - { - "epoch": 1.78, - "learning_rate": 7.527812453376883e-07, - "loss": 0.6777, - "step": 69308 - }, - { - "epoch": 1.78, - "learning_rate": 7.527544338778112e-07, - "loss": 0.625, - "step": 69309 - }, - { - "epoch": 1.78, - "learning_rate": 7.527276226072386e-07, - "loss": 0.8169, - "step": 69310 - }, - { - "epoch": 1.78, - "learning_rate": 7.527008115259911e-07, - "loss": 0.6484, - "step": 69311 - }, - { - "epoch": 1.78, - "learning_rate": 7.526740006340894e-07, - "loss": 0.5552, - "step": 69312 - }, - { - "epoch": 1.78, - "learning_rate": 7.526471899315537e-07, - "loss": 0.5886, - "step": 69313 - }, - { - "epoch": 1.78, - "learning_rate": 7.526203794184048e-07, - "loss": 0.4897, - "step": 69314 - }, - { - "epoch": 1.78, - "learning_rate": 7.525935690946633e-07, - "loss": 0.792, - "step": 69315 - }, - { - "epoch": 1.78, - "learning_rate": 7.525667589603491e-07, - "loss": 0.791, - "step": 69316 - }, - { - "epoch": 1.78, - "learning_rate": 7.525399490154834e-07, - "loss": 0.7402, - "step": 69317 - }, - { - "epoch": 1.78, - "learning_rate": 7.525131392600863e-07, - "loss": 0.5674, - "step": 69318 - }, - { - "epoch": 1.78, - "learning_rate": 7.524863296941788e-07, - "loss": 0.791, - "step": 69319 - }, - { - "epoch": 1.78, - "learning_rate": 7.524595203177808e-07, - "loss": 0.6455, - "step": 69320 - }, - { - "epoch": 1.78, - "learning_rate": 7.524327111309135e-07, - "loss": 0.6926, - "step": 69321 - }, - { - "epoch": 1.78, - "learning_rate": 7.524059021335969e-07, - "loss": 0.7578, - "step": 69322 - }, - { - "epoch": 1.78, - "learning_rate": 7.523790933258516e-07, - "loss": 0.5894, - "step": 69323 - }, - { - "epoch": 1.78, - "learning_rate": 7.523522847076984e-07, - "loss": 0.709, - "step": 69324 - }, - { - "epoch": 1.78, - "learning_rate": 7.52325476279158e-07, - "loss": 0.5425, - "step": 69325 - }, - { - "epoch": 1.78, - "learning_rate": 7.5229866804025e-07, - "loss": 0.6335, - "step": 69326 - }, - { - "epoch": 1.78, - "learning_rate": 7.522718599909958e-07, - "loss": 0.5415, - "step": 69327 - }, - { - "epoch": 1.78, - "learning_rate": 7.522450521314155e-07, - "loss": 0.5469, - "step": 69328 - }, - { - "epoch": 1.78, - "learning_rate": 7.522182444615299e-07, - "loss": 0.6108, - "step": 69329 - }, - { - "epoch": 1.78, - "learning_rate": 7.521914369813594e-07, - "loss": 0.5757, - "step": 69330 - }, - { - "epoch": 1.78, - "learning_rate": 7.521646296909244e-07, - "loss": 0.6484, - "step": 69331 - }, - { - "epoch": 1.78, - "learning_rate": 7.521378225902455e-07, - "loss": 0.5439, - "step": 69332 - }, - { - "epoch": 1.78, - "learning_rate": 7.521110156793435e-07, - "loss": 0.4326, - "step": 69333 - }, - { - "epoch": 1.78, - "learning_rate": 7.520842089582386e-07, - "loss": 0.7725, - "step": 69334 - }, - { - "epoch": 1.78, - "learning_rate": 7.520574024269517e-07, - "loss": 0.4594, - "step": 69335 - }, - { - "epoch": 1.78, - "learning_rate": 7.520305960855028e-07, - "loss": 0.5566, - "step": 69336 - }, - { - "epoch": 1.78, - "learning_rate": 7.520037899339124e-07, - "loss": 0.6135, - "step": 69337 - }, - { - "epoch": 1.78, - "learning_rate": 7.519769839722017e-07, - "loss": 0.6006, - "step": 69338 - }, - { - "epoch": 1.78, - "learning_rate": 7.519501782003905e-07, - "loss": 0.7637, - "step": 69339 - }, - { - "epoch": 1.78, - "learning_rate": 7.519233726184999e-07, - "loss": 0.6533, - "step": 69340 - }, - { - "epoch": 1.78, - "learning_rate": 7.518965672265502e-07, - "loss": 0.5884, - "step": 69341 - }, - { - "epoch": 1.78, - "learning_rate": 7.518697620245616e-07, - "loss": 0.6533, - "step": 69342 - }, - { - "epoch": 1.78, - "learning_rate": 7.518429570125551e-07, - "loss": 0.6406, - "step": 69343 - }, - { - "epoch": 1.78, - "learning_rate": 7.51816152190551e-07, - "loss": 0.7539, - "step": 69344 - }, - { - "epoch": 1.78, - "learning_rate": 7.5178934755857e-07, - "loss": 0.5403, - "step": 69345 - }, - { - "epoch": 1.78, - "learning_rate": 7.517625431166325e-07, - "loss": 0.5488, - "step": 69346 - }, - { - "epoch": 1.78, - "learning_rate": 7.517357388647587e-07, - "loss": 0.6499, - "step": 69347 - }, - { - "epoch": 1.78, - "learning_rate": 7.517089348029697e-07, - "loss": 0.7188, - "step": 69348 - }, - { - "epoch": 1.78, - "learning_rate": 7.516821309312855e-07, - "loss": 0.6621, - "step": 69349 - }, - { - "epoch": 1.78, - "learning_rate": 7.51655327249727e-07, - "loss": 0.6626, - "step": 69350 - }, - { - "epoch": 1.78, - "learning_rate": 7.516285237583146e-07, - "loss": 0.644, - "step": 69351 - }, - { - "epoch": 1.78, - "learning_rate": 7.516017204570689e-07, - "loss": 0.6919, - "step": 69352 - }, - { - "epoch": 1.78, - "learning_rate": 7.515749173460101e-07, - "loss": 0.5918, - "step": 69353 - }, - { - "epoch": 1.78, - "learning_rate": 7.515481144251592e-07, - "loss": 0.7178, - "step": 69354 - }, - { - "epoch": 1.78, - "learning_rate": 7.515213116945367e-07, - "loss": 0.5212, - "step": 69355 - }, - { - "epoch": 1.78, - "learning_rate": 7.514945091541624e-07, - "loss": 0.6382, - "step": 69356 - }, - { - "epoch": 1.78, - "learning_rate": 7.514677068040578e-07, - "loss": 0.7197, - "step": 69357 - }, - { - "epoch": 1.78, - "learning_rate": 7.514409046442427e-07, - "loss": 0.5444, - "step": 69358 - }, - { - "epoch": 1.78, - "learning_rate": 7.514141026747378e-07, - "loss": 0.5752, - "step": 69359 - }, - { - "epoch": 1.78, - "learning_rate": 7.513873008955638e-07, - "loss": 0.6548, - "step": 69360 - }, - { - "epoch": 1.78, - "learning_rate": 7.513604993067409e-07, - "loss": 0.5918, - "step": 69361 - }, - { - "epoch": 1.78, - "learning_rate": 7.513336979082901e-07, - "loss": 0.6338, - "step": 69362 - }, - { - "epoch": 1.78, - "learning_rate": 7.513068967002314e-07, - "loss": 0.499, - "step": 69363 - }, - { - "epoch": 1.78, - "learning_rate": 7.512800956825859e-07, - "loss": 0.5188, - "step": 69364 - }, - { - "epoch": 1.78, - "learning_rate": 7.512532948553739e-07, - "loss": 0.689, - "step": 69365 - }, - { - "epoch": 1.78, - "learning_rate": 7.512264942186154e-07, - "loss": 0.5815, - "step": 69366 - }, - { - "epoch": 1.78, - "learning_rate": 7.511996937723316e-07, - "loss": 0.4506, - "step": 69367 - }, - { - "epoch": 1.78, - "learning_rate": 7.511728935165424e-07, - "loss": 0.7266, - "step": 69368 - }, - { - "epoch": 1.78, - "learning_rate": 7.51146093451269e-07, - "loss": 0.5508, - "step": 69369 - }, - { - "epoch": 1.78, - "learning_rate": 7.511192935765314e-07, - "loss": 0.709, - "step": 69370 - }, - { - "epoch": 1.78, - "learning_rate": 7.510924938923506e-07, - "loss": 0.5825, - "step": 69371 - }, - { - "epoch": 1.78, - "learning_rate": 7.510656943987464e-07, - "loss": 0.5972, - "step": 69372 - }, - { - "epoch": 1.78, - "learning_rate": 7.510388950957401e-07, - "loss": 0.7363, - "step": 69373 - }, - { - "epoch": 1.78, - "learning_rate": 7.510120959833517e-07, - "loss": 0.5283, - "step": 69374 - }, - { - "epoch": 1.78, - "learning_rate": 7.509852970616024e-07, - "loss": 0.5718, - "step": 69375 - }, - { - "epoch": 1.78, - "learning_rate": 7.509584983305116e-07, - "loss": 0.6924, - "step": 69376 - }, - { - "epoch": 1.78, - "learning_rate": 7.509316997901008e-07, - "loss": 0.604, - "step": 69377 - }, - { - "epoch": 1.78, - "learning_rate": 7.509049014403897e-07, - "loss": 0.7085, - "step": 69378 - }, - { - "epoch": 1.78, - "learning_rate": 7.508781032813996e-07, - "loss": 0.6475, - "step": 69379 - }, - { - "epoch": 1.78, - "learning_rate": 7.508513053131505e-07, - "loss": 0.377, - "step": 69380 - }, - { - "epoch": 1.78, - "learning_rate": 7.508245075356631e-07, - "loss": 0.624, - "step": 69381 - }, - { - "epoch": 1.78, - "learning_rate": 7.507977099489579e-07, - "loss": 0.6675, - "step": 69382 - }, - { - "epoch": 1.78, - "learning_rate": 7.507709125530557e-07, - "loss": 0.6582, - "step": 69383 - }, - { - "epoch": 1.78, - "learning_rate": 7.507441153479764e-07, - "loss": 0.5747, - "step": 69384 - }, - { - "epoch": 1.78, - "learning_rate": 7.507173183337415e-07, - "loss": 0.6729, - "step": 69385 - }, - { - "epoch": 1.78, - "learning_rate": 7.506905215103704e-07, - "loss": 0.5215, - "step": 69386 - }, - { - "epoch": 1.78, - "learning_rate": 7.50663724877884e-07, - "loss": 0.4514, - "step": 69387 - }, - { - "epoch": 1.78, - "learning_rate": 7.506369284363032e-07, - "loss": 0.5298, - "step": 69388 - }, - { - "epoch": 1.78, - "learning_rate": 7.50610132185648e-07, - "loss": 0.6348, - "step": 69389 - }, - { - "epoch": 1.78, - "learning_rate": 7.505833361259393e-07, - "loss": 0.6602, - "step": 69390 - }, - { - "epoch": 1.78, - "learning_rate": 7.505565402571973e-07, - "loss": 0.6816, - "step": 69391 - }, - { - "epoch": 1.78, - "learning_rate": 7.505297445794428e-07, - "loss": 0.7412, - "step": 69392 - }, - { - "epoch": 1.78, - "learning_rate": 7.505029490926962e-07, - "loss": 0.7227, - "step": 69393 - }, - { - "epoch": 1.78, - "learning_rate": 7.50476153796978e-07, - "loss": 0.6079, - "step": 69394 - }, - { - "epoch": 1.78, - "learning_rate": 7.504493586923091e-07, - "loss": 0.6592, - "step": 69395 - }, - { - "epoch": 1.78, - "learning_rate": 7.504225637787094e-07, - "loss": 0.7051, - "step": 69396 - }, - { - "epoch": 1.78, - "learning_rate": 7.503957690561995e-07, - "loss": 0.6592, - "step": 69397 - }, - { - "epoch": 1.78, - "learning_rate": 7.503689745248003e-07, - "loss": 0.6919, - "step": 69398 - }, - { - "epoch": 1.78, - "learning_rate": 7.503421801845318e-07, - "loss": 0.6523, - "step": 69399 - }, - { - "epoch": 1.78, - "learning_rate": 7.50315386035415e-07, - "loss": 0.5913, - "step": 69400 - }, - { - "epoch": 1.78, - "learning_rate": 7.502885920774702e-07, - "loss": 0.7422, - "step": 69401 - }, - { - "epoch": 1.78, - "learning_rate": 7.50261798310718e-07, - "loss": 0.7202, - "step": 69402 - }, - { - "epoch": 1.78, - "learning_rate": 7.502350047351786e-07, - "loss": 0.6016, - "step": 69403 - }, - { - "epoch": 1.78, - "learning_rate": 7.502082113508732e-07, - "loss": 0.7979, - "step": 69404 - }, - { - "epoch": 1.78, - "learning_rate": 7.501814181578219e-07, - "loss": 0.6836, - "step": 69405 - }, - { - "epoch": 1.78, - "learning_rate": 7.501546251560449e-07, - "loss": 0.6318, - "step": 69406 - }, - { - "epoch": 1.78, - "learning_rate": 7.501278323455631e-07, - "loss": 0.7832, - "step": 69407 - }, - { - "epoch": 1.78, - "learning_rate": 7.501010397263968e-07, - "loss": 0.686, - "step": 69408 - }, - { - "epoch": 1.78, - "learning_rate": 7.500742472985668e-07, - "loss": 0.689, - "step": 69409 - }, - { - "epoch": 1.78, - "learning_rate": 7.500474550620933e-07, - "loss": 0.6182, - "step": 69410 - }, - { - "epoch": 1.78, - "learning_rate": 7.500206630169972e-07, - "loss": 0.6128, - "step": 69411 - }, - { - "epoch": 1.78, - "learning_rate": 7.499938711632987e-07, - "loss": 0.5088, - "step": 69412 - }, - { - "epoch": 1.78, - "learning_rate": 7.499670795010183e-07, - "loss": 0.5361, - "step": 69413 - }, - { - "epoch": 1.78, - "learning_rate": 7.499402880301769e-07, - "loss": 0.5708, - "step": 69414 - }, - { - "epoch": 1.78, - "learning_rate": 7.499134967507947e-07, - "loss": 0.686, - "step": 69415 - }, - { - "epoch": 1.78, - "learning_rate": 7.49886705662892e-07, - "loss": 0.4614, - "step": 69416 - }, - { - "epoch": 1.78, - "learning_rate": 7.498599147664896e-07, - "loss": 0.6465, - "step": 69417 - }, - { - "epoch": 1.78, - "learning_rate": 7.498331240616078e-07, - "loss": 0.6357, - "step": 69418 - }, - { - "epoch": 1.78, - "learning_rate": 7.498063335482675e-07, - "loss": 0.6743, - "step": 69419 - }, - { - "epoch": 1.78, - "learning_rate": 7.497795432264888e-07, - "loss": 0.4443, - "step": 69420 - }, - { - "epoch": 1.78, - "learning_rate": 7.497527530962926e-07, - "loss": 0.4478, - "step": 69421 - }, - { - "epoch": 1.78, - "learning_rate": 7.49725963157699e-07, - "loss": 0.3788, - "step": 69422 - }, - { - "epoch": 1.78, - "learning_rate": 7.49699173410729e-07, - "loss": 0.5432, - "step": 69423 - }, - { - "epoch": 1.78, - "learning_rate": 7.496723838554025e-07, - "loss": 0.6426, - "step": 69424 - }, - { - "epoch": 1.78, - "learning_rate": 7.496455944917408e-07, - "loss": 0.5784, - "step": 69425 - }, - { - "epoch": 1.78, - "learning_rate": 7.496188053197637e-07, - "loss": 0.5796, - "step": 69426 - }, - { - "epoch": 1.78, - "learning_rate": 7.495920163394918e-07, - "loss": 0.5518, - "step": 69427 - }, - { - "epoch": 1.78, - "learning_rate": 7.495652275509461e-07, - "loss": 0.6045, - "step": 69428 - }, - { - "epoch": 1.78, - "learning_rate": 7.495384389541464e-07, - "loss": 0.5386, - "step": 69429 - }, - { - "epoch": 1.78, - "learning_rate": 7.495116505491139e-07, - "loss": 0.707, - "step": 69430 - }, - { - "epoch": 1.78, - "learning_rate": 7.494848623358688e-07, - "loss": 0.6523, - "step": 69431 - }, - { - "epoch": 1.78, - "learning_rate": 7.494580743144314e-07, - "loss": 0.4976, - "step": 69432 - }, - { - "epoch": 1.78, - "learning_rate": 7.494312864848227e-07, - "loss": 0.6377, - "step": 69433 - }, - { - "epoch": 1.78, - "learning_rate": 7.494044988470627e-07, - "loss": 0.6855, - "step": 69434 - }, - { - "epoch": 1.78, - "learning_rate": 7.493777114011726e-07, - "loss": 0.7578, - "step": 69435 - }, - { - "epoch": 1.78, - "learning_rate": 7.493509241471722e-07, - "loss": 0.6128, - "step": 69436 - }, - { - "epoch": 1.78, - "learning_rate": 7.49324137085082e-07, - "loss": 0.4553, - "step": 69437 - }, - { - "epoch": 1.78, - "learning_rate": 7.492973502149232e-07, - "loss": 0.5942, - "step": 69438 - }, - { - "epoch": 1.78, - "learning_rate": 7.492705635367156e-07, - "loss": 0.5952, - "step": 69439 - }, - { - "epoch": 1.78, - "learning_rate": 7.4924377705048e-07, - "loss": 0.5647, - "step": 69440 - }, - { - "epoch": 1.78, - "learning_rate": 7.492169907562369e-07, - "loss": 0.7783, - "step": 69441 - }, - { - "epoch": 1.78, - "learning_rate": 7.491902046540071e-07, - "loss": 0.6314, - "step": 69442 - }, - { - "epoch": 1.78, - "learning_rate": 7.491634187438105e-07, - "loss": 0.6611, - "step": 69443 - }, - { - "epoch": 1.78, - "learning_rate": 7.491366330256681e-07, - "loss": 0.5591, - "step": 69444 - }, - { - "epoch": 1.78, - "learning_rate": 7.491098474996005e-07, - "loss": 0.6494, - "step": 69445 - }, - { - "epoch": 1.78, - "learning_rate": 7.490830621656277e-07, - "loss": 0.6035, - "step": 69446 - }, - { - "epoch": 1.78, - "learning_rate": 7.490562770237703e-07, - "loss": 0.5444, - "step": 69447 - }, - { - "epoch": 1.78, - "learning_rate": 7.490294920740493e-07, - "loss": 0.6426, - "step": 69448 - }, - { - "epoch": 1.78, - "learning_rate": 7.490027073164847e-07, - "loss": 0.7026, - "step": 69449 - }, - { - "epoch": 1.78, - "learning_rate": 7.489759227510971e-07, - "loss": 0.5305, - "step": 69450 - }, - { - "epoch": 1.78, - "learning_rate": 7.489491383779071e-07, - "loss": 0.5166, - "step": 69451 - }, - { - "epoch": 1.78, - "learning_rate": 7.489223541969353e-07, - "loss": 0.7754, - "step": 69452 - }, - { - "epoch": 1.78, - "learning_rate": 7.488955702082019e-07, - "loss": 0.6807, - "step": 69453 - }, - { - "epoch": 1.78, - "learning_rate": 7.488687864117281e-07, - "loss": 0.5241, - "step": 69454 - }, - { - "epoch": 1.78, - "learning_rate": 7.488420028075337e-07, - "loss": 0.6387, - "step": 69455 - }, - { - "epoch": 1.78, - "learning_rate": 7.488152193956392e-07, - "loss": 0.6709, - "step": 69456 - }, - { - "epoch": 1.78, - "learning_rate": 7.487884361760657e-07, - "loss": 0.4626, - "step": 69457 - }, - { - "epoch": 1.78, - "learning_rate": 7.487616531488329e-07, - "loss": 0.6162, - "step": 69458 - }, - { - "epoch": 1.78, - "learning_rate": 7.48734870313962e-07, - "loss": 0.5728, - "step": 69459 - }, - { - "epoch": 1.78, - "learning_rate": 7.487080876714731e-07, - "loss": 0.6704, - "step": 69460 - }, - { - "epoch": 1.78, - "learning_rate": 7.486813052213872e-07, - "loss": 0.6924, - "step": 69461 - }, - { - "epoch": 1.78, - "learning_rate": 7.48654522963724e-07, - "loss": 0.7783, - "step": 69462 - }, - { - "epoch": 1.78, - "learning_rate": 7.486277408985049e-07, - "loss": 0.5234, - "step": 69463 - }, - { - "epoch": 1.78, - "learning_rate": 7.4860095902575e-07, - "loss": 0.6235, - "step": 69464 - }, - { - "epoch": 1.78, - "learning_rate": 7.485741773454798e-07, - "loss": 0.5244, - "step": 69465 - }, - { - "epoch": 1.78, - "learning_rate": 7.485473958577144e-07, - "loss": 0.5369, - "step": 69466 - }, - { - "epoch": 1.78, - "learning_rate": 7.485206145624749e-07, - "loss": 0.707, - "step": 69467 - }, - { - "epoch": 1.78, - "learning_rate": 7.484938334597815e-07, - "loss": 0.6963, - "step": 69468 - }, - { - "epoch": 1.78, - "learning_rate": 7.484670525496551e-07, - "loss": 0.6963, - "step": 69469 - }, - { - "epoch": 1.78, - "learning_rate": 7.484402718321155e-07, - "loss": 0.5732, - "step": 69470 - }, - { - "epoch": 1.78, - "learning_rate": 7.48413491307184e-07, - "loss": 0.5557, - "step": 69471 - }, - { - "epoch": 1.78, - "learning_rate": 7.483867109748804e-07, - "loss": 0.5649, - "step": 69472 - }, - { - "epoch": 1.78, - "learning_rate": 7.483599308352258e-07, - "loss": 0.5557, - "step": 69473 - }, - { - "epoch": 1.78, - "learning_rate": 7.483331508882405e-07, - "loss": 0.7041, - "step": 69474 - }, - { - "epoch": 1.78, - "learning_rate": 7.483063711339446e-07, - "loss": 0.4834, - "step": 69475 - }, - { - "epoch": 1.78, - "learning_rate": 7.482795915723592e-07, - "loss": 0.4556, - "step": 69476 - }, - { - "epoch": 1.78, - "learning_rate": 7.482528122035044e-07, - "loss": 0.6719, - "step": 69477 - }, - { - "epoch": 1.78, - "learning_rate": 7.482260330274009e-07, - "loss": 0.7637, - "step": 69478 - }, - { - "epoch": 1.78, - "learning_rate": 7.481992540440689e-07, - "loss": 0.6465, - "step": 69479 - }, - { - "epoch": 1.78, - "learning_rate": 7.481724752535294e-07, - "loss": 0.4971, - "step": 69480 - }, - { - "epoch": 1.78, - "learning_rate": 7.481456966558026e-07, - "loss": 0.6094, - "step": 69481 - }, - { - "epoch": 1.78, - "learning_rate": 7.481189182509092e-07, - "loss": 0.5626, - "step": 69482 - }, - { - "epoch": 1.78, - "learning_rate": 7.480921400388693e-07, - "loss": 0.7881, - "step": 69483 - }, - { - "epoch": 1.78, - "learning_rate": 7.480653620197044e-07, - "loss": 0.5217, - "step": 69484 - }, - { - "epoch": 1.78, - "learning_rate": 7.480385841934335e-07, - "loss": 0.3916, - "step": 69485 - }, - { - "epoch": 1.78, - "learning_rate": 7.480118065600781e-07, - "loss": 0.5977, - "step": 69486 - }, - { - "epoch": 1.78, - "learning_rate": 7.479850291196583e-07, - "loss": 0.5146, - "step": 69487 - }, - { - "epoch": 1.78, - "learning_rate": 7.47958251872195e-07, - "loss": 0.7373, - "step": 69488 - }, - { - "epoch": 1.78, - "learning_rate": 7.479314748177082e-07, - "loss": 0.7178, - "step": 69489 - }, - { - "epoch": 1.78, - "learning_rate": 7.47904697956219e-07, - "loss": 0.6289, - "step": 69490 - }, - { - "epoch": 1.78, - "learning_rate": 7.478779212877473e-07, - "loss": 0.6567, - "step": 69491 - }, - { - "epoch": 1.78, - "learning_rate": 7.478511448123141e-07, - "loss": 0.5845, - "step": 69492 - }, - { - "epoch": 1.78, - "learning_rate": 7.478243685299394e-07, - "loss": 0.6282, - "step": 69493 - }, - { - "epoch": 1.78, - "learning_rate": 7.477975924406446e-07, - "loss": 0.7314, - "step": 69494 - }, - { - "epoch": 1.78, - "learning_rate": 7.477708165444491e-07, - "loss": 0.5942, - "step": 69495 - }, - { - "epoch": 1.78, - "learning_rate": 7.47744040841374e-07, - "loss": 0.6846, - "step": 69496 - }, - { - "epoch": 1.78, - "learning_rate": 7.477172653314397e-07, - "loss": 0.5874, - "step": 69497 - }, - { - "epoch": 1.78, - "learning_rate": 7.476904900146666e-07, - "loss": 0.7734, - "step": 69498 - }, - { - "epoch": 1.78, - "learning_rate": 7.476637148910754e-07, - "loss": 0.5942, - "step": 69499 - }, - { - "epoch": 1.78, - "learning_rate": 7.476369399606862e-07, - "loss": 0.6162, - "step": 69500 - }, - { - "epoch": 1.78, - "learning_rate": 7.4761016522352e-07, - "loss": 0.5073, - "step": 69501 - }, - { - "epoch": 1.78, - "learning_rate": 7.475833906795972e-07, - "loss": 0.6299, - "step": 69502 - }, - { - "epoch": 1.78, - "learning_rate": 7.475566163289381e-07, - "loss": 0.6255, - "step": 69503 - }, - { - "epoch": 1.78, - "learning_rate": 7.475298421715635e-07, - "loss": 0.5303, - "step": 69504 - }, - { - "epoch": 1.78, - "learning_rate": 7.475030682074937e-07, - "loss": 0.6074, - "step": 69505 - }, - { - "epoch": 1.78, - "learning_rate": 7.474762944367487e-07, - "loss": 0.7451, - "step": 69506 - }, - { - "epoch": 1.78, - "learning_rate": 7.474495208593499e-07, - "loss": 0.7568, - "step": 69507 - }, - { - "epoch": 1.78, - "learning_rate": 7.474227474753172e-07, - "loss": 0.6338, - "step": 69508 - }, - { - "epoch": 1.78, - "learning_rate": 7.473959742846714e-07, - "loss": 0.5903, - "step": 69509 - }, - { - "epoch": 1.78, - "learning_rate": 7.473692012874326e-07, - "loss": 0.7812, - "step": 69510 - }, - { - "epoch": 1.78, - "learning_rate": 7.47342428483622e-07, - "loss": 0.688, - "step": 69511 - }, - { - "epoch": 1.78, - "learning_rate": 7.473156558732594e-07, - "loss": 0.665, - "step": 69512 - }, - { - "epoch": 1.78, - "learning_rate": 7.472888834563657e-07, - "loss": 0.6572, - "step": 69513 - }, - { - "epoch": 1.78, - "learning_rate": 7.472621112329616e-07, - "loss": 0.7217, - "step": 69514 - }, - { - "epoch": 1.78, - "learning_rate": 7.472353392030668e-07, - "loss": 0.6289, - "step": 69515 - }, - { - "epoch": 1.78, - "learning_rate": 7.472085673667026e-07, - "loss": 0.6489, - "step": 69516 - }, - { - "epoch": 1.78, - "learning_rate": 7.471817957238888e-07, - "loss": 0.5703, - "step": 69517 - }, - { - "epoch": 1.78, - "learning_rate": 7.471550242746465e-07, - "loss": 0.6914, - "step": 69518 - }, - { - "epoch": 1.78, - "learning_rate": 7.471282530189959e-07, - "loss": 0.4622, - "step": 69519 - }, - { - "epoch": 1.78, - "learning_rate": 7.471014819569577e-07, - "loss": 0.6704, - "step": 69520 - }, - { - "epoch": 1.78, - "learning_rate": 7.470747110885523e-07, - "loss": 0.7432, - "step": 69521 - }, - { - "epoch": 1.78, - "learning_rate": 7.470479404137998e-07, - "loss": 0.624, - "step": 69522 - }, - { - "epoch": 1.78, - "learning_rate": 7.470211699327214e-07, - "loss": 0.4297, - "step": 69523 - }, - { - "epoch": 1.78, - "learning_rate": 7.469943996453375e-07, - "loss": 0.5068, - "step": 69524 - }, - { - "epoch": 1.78, - "learning_rate": 7.469676295516678e-07, - "loss": 0.6357, - "step": 69525 - }, - { - "epoch": 1.78, - "learning_rate": 7.469408596517337e-07, - "loss": 0.5137, - "step": 69526 - }, - { - "epoch": 1.78, - "learning_rate": 7.46914089945555e-07, - "loss": 0.7783, - "step": 69527 - }, - { - "epoch": 1.78, - "learning_rate": 7.468873204331529e-07, - "loss": 0.5311, - "step": 69528 - }, - { - "epoch": 1.78, - "learning_rate": 7.468605511145474e-07, - "loss": 0.6616, - "step": 69529 - }, - { - "epoch": 1.78, - "learning_rate": 7.468337819897592e-07, - "loss": 0.6855, - "step": 69530 - }, - { - "epoch": 1.78, - "learning_rate": 7.468070130588085e-07, - "loss": 0.6172, - "step": 69531 - }, - { - "epoch": 1.78, - "learning_rate": 7.467802443217162e-07, - "loss": 0.5469, - "step": 69532 - }, - { - "epoch": 1.78, - "learning_rate": 7.467534757785026e-07, - "loss": 0.5703, - "step": 69533 - }, - { - "epoch": 1.78, - "learning_rate": 7.467267074291885e-07, - "loss": 0.7061, - "step": 69534 - }, - { - "epoch": 1.78, - "learning_rate": 7.46699939273794e-07, - "loss": 0.7168, - "step": 69535 - }, - { - "epoch": 1.78, - "learning_rate": 7.466731713123393e-07, - "loss": 0.7568, - "step": 69536 - }, - { - "epoch": 1.78, - "learning_rate": 7.466464035448457e-07, - "loss": 0.7749, - "step": 69537 - }, - { - "epoch": 1.78, - "learning_rate": 7.466196359713333e-07, - "loss": 0.7041, - "step": 69538 - }, - { - "epoch": 1.78, - "learning_rate": 7.465928685918224e-07, - "loss": 0.623, - "step": 69539 - }, - { - "epoch": 1.78, - "learning_rate": 7.465661014063338e-07, - "loss": 0.373, - "step": 69540 - }, - { - "epoch": 1.78, - "learning_rate": 7.465393344148876e-07, - "loss": 0.6738, - "step": 69541 - }, - { - "epoch": 1.78, - "learning_rate": 7.46512567617505e-07, - "loss": 0.7031, - "step": 69542 - }, - { - "epoch": 1.78, - "learning_rate": 7.464858010142056e-07, - "loss": 0.666, - "step": 69543 - }, - { - "epoch": 1.78, - "learning_rate": 7.46459034605011e-07, - "loss": 0.6445, - "step": 69544 - }, - { - "epoch": 1.78, - "learning_rate": 7.464322683899408e-07, - "loss": 0.4788, - "step": 69545 - }, - { - "epoch": 1.78, - "learning_rate": 7.464055023690155e-07, - "loss": 0.6016, - "step": 69546 - }, - { - "epoch": 1.78, - "learning_rate": 7.463787365422562e-07, - "loss": 0.7979, - "step": 69547 - }, - { - "epoch": 1.78, - "learning_rate": 7.463519709096826e-07, - "loss": 0.6431, - "step": 69548 - }, - { - "epoch": 1.78, - "learning_rate": 7.46325205471316e-07, - "loss": 0.751, - "step": 69549 - }, - { - "epoch": 1.78, - "learning_rate": 7.462984402271764e-07, - "loss": 0.6064, - "step": 69550 - }, - { - "epoch": 1.78, - "learning_rate": 7.462716751772844e-07, - "loss": 0.405, - "step": 69551 - }, - { - "epoch": 1.78, - "learning_rate": 7.462449103216604e-07, - "loss": 0.688, - "step": 69552 - }, - { - "epoch": 1.78, - "learning_rate": 7.462181456603253e-07, - "loss": 0.7593, - "step": 69553 - }, - { - "epoch": 1.78, - "learning_rate": 7.461913811932994e-07, - "loss": 0.7271, - "step": 69554 - }, - { - "epoch": 1.78, - "learning_rate": 7.461646169206029e-07, - "loss": 0.625, - "step": 69555 - }, - { - "epoch": 1.78, - "learning_rate": 7.461378528422562e-07, - "loss": 0.5596, - "step": 69556 - }, - { - "epoch": 1.78, - "learning_rate": 7.461110889582805e-07, - "loss": 0.7065, - "step": 69557 - }, - { - "epoch": 1.78, - "learning_rate": 7.460843252686955e-07, - "loss": 0.6504, - "step": 69558 - }, - { - "epoch": 1.78, - "learning_rate": 7.460575617735223e-07, - "loss": 0.666, - "step": 69559 - }, - { - "epoch": 1.78, - "learning_rate": 7.460307984727809e-07, - "loss": 0.6782, - "step": 69560 - }, - { - "epoch": 1.78, - "learning_rate": 7.460040353664923e-07, - "loss": 0.3838, - "step": 69561 - }, - { - "epoch": 1.78, - "learning_rate": 7.459772724546765e-07, - "loss": 0.5693, - "step": 69562 - }, - { - "epoch": 1.78, - "learning_rate": 7.459505097373544e-07, - "loss": 0.5801, - "step": 69563 - }, - { - "epoch": 1.78, - "learning_rate": 7.459237472145465e-07, - "loss": 0.7021, - "step": 69564 - }, - { - "epoch": 1.78, - "learning_rate": 7.458969848862727e-07, - "loss": 0.6836, - "step": 69565 - }, - { - "epoch": 1.78, - "learning_rate": 7.458702227525542e-07, - "loss": 0.75, - "step": 69566 - }, - { - "epoch": 1.78, - "learning_rate": 7.458434608134108e-07, - "loss": 0.6738, - "step": 69567 - }, - { - "epoch": 1.78, - "learning_rate": 7.458166990688638e-07, - "loss": 0.8369, - "step": 69568 - }, - { - "epoch": 1.78, - "learning_rate": 7.45789937518933e-07, - "loss": 0.5017, - "step": 69569 - }, - { - "epoch": 1.78, - "learning_rate": 7.457631761636393e-07, - "loss": 0.6016, - "step": 69570 - }, - { - "epoch": 1.78, - "learning_rate": 7.457364150030028e-07, - "loss": 0.6631, - "step": 69571 - }, - { - "epoch": 1.78, - "learning_rate": 7.457096540370444e-07, - "loss": 0.532, - "step": 69572 - }, - { - "epoch": 1.78, - "learning_rate": 7.456828932657843e-07, - "loss": 0.6631, - "step": 69573 - }, - { - "epoch": 1.78, - "learning_rate": 7.456561326892439e-07, - "loss": 0.6565, - "step": 69574 - }, - { - "epoch": 1.78, - "learning_rate": 7.456293723074421e-07, - "loss": 0.6689, - "step": 69575 - }, - { - "epoch": 1.78, - "learning_rate": 7.456026121204004e-07, - "loss": 0.6763, - "step": 69576 - }, - { - "epoch": 1.78, - "learning_rate": 7.45575852128139e-07, - "loss": 0.6807, - "step": 69577 - }, - { - "epoch": 1.78, - "learning_rate": 7.455490923306787e-07, - "loss": 0.6904, - "step": 69578 - }, - { - "epoch": 1.78, - "learning_rate": 7.455223327280393e-07, - "loss": 0.7334, - "step": 69579 - }, - { - "epoch": 1.78, - "learning_rate": 7.454955733202421e-07, - "loss": 0.7266, - "step": 69580 - }, - { - "epoch": 1.78, - "learning_rate": 7.454688141073071e-07, - "loss": 0.6743, - "step": 69581 - }, - { - "epoch": 1.78, - "learning_rate": 7.45442055089255e-07, - "loss": 0.6528, - "step": 69582 - }, - { - "epoch": 1.78, - "learning_rate": 7.45415296266106e-07, - "loss": 0.7168, - "step": 69583 - }, - { - "epoch": 1.78, - "learning_rate": 7.453885376378815e-07, - "loss": 0.6025, - "step": 69584 - }, - { - "epoch": 1.78, - "learning_rate": 7.453617792046007e-07, - "loss": 0.6133, - "step": 69585 - }, - { - "epoch": 1.78, - "learning_rate": 7.453350209662848e-07, - "loss": 0.6943, - "step": 69586 - }, - { - "epoch": 1.78, - "learning_rate": 7.453082629229541e-07, - "loss": 0.6553, - "step": 69587 - }, - { - "epoch": 1.78, - "learning_rate": 7.45281505074629e-07, - "loss": 0.5625, - "step": 69588 - }, - { - "epoch": 1.78, - "learning_rate": 7.452547474213304e-07, - "loss": 0.6533, - "step": 69589 - }, - { - "epoch": 1.78, - "learning_rate": 7.452279899630783e-07, - "loss": 0.7109, - "step": 69590 - }, - { - "epoch": 1.78, - "learning_rate": 7.452012326998938e-07, - "loss": 0.5679, - "step": 69591 - }, - { - "epoch": 1.78, - "learning_rate": 7.451744756317966e-07, - "loss": 0.7852, - "step": 69592 - }, - { - "epoch": 1.78, - "learning_rate": 7.451477187588077e-07, - "loss": 0.4087, - "step": 69593 - }, - { - "epoch": 1.78, - "learning_rate": 7.451209620809479e-07, - "loss": 0.6182, - "step": 69594 - }, - { - "epoch": 1.78, - "learning_rate": 7.450942055982369e-07, - "loss": 0.7578, - "step": 69595 - }, - { - "epoch": 1.78, - "learning_rate": 7.450674493106954e-07, - "loss": 0.5991, - "step": 69596 - }, - { - "epoch": 1.78, - "learning_rate": 7.450406932183443e-07, - "loss": 0.5474, - "step": 69597 - }, - { - "epoch": 1.78, - "learning_rate": 7.450139373212035e-07, - "loss": 0.6567, - "step": 69598 - }, - { - "epoch": 1.78, - "learning_rate": 7.449871816192941e-07, - "loss": 0.6865, - "step": 69599 - }, - { - "epoch": 1.78, - "learning_rate": 7.449604261126361e-07, - "loss": 0.5366, - "step": 69600 - }, - { - "epoch": 1.78, - "learning_rate": 7.449336708012503e-07, - "loss": 0.6421, - "step": 69601 - }, - { - "epoch": 1.78, - "learning_rate": 7.449069156851568e-07, - "loss": 0.6375, - "step": 69602 - }, - { - "epoch": 1.78, - "learning_rate": 7.448801607643767e-07, - "loss": 0.7256, - "step": 69603 - }, - { - "epoch": 1.78, - "learning_rate": 7.448534060389302e-07, - "loss": 0.6162, - "step": 69604 - }, - { - "epoch": 1.78, - "learning_rate": 7.448266515088374e-07, - "loss": 0.6401, - "step": 69605 - }, - { - "epoch": 1.78, - "learning_rate": 7.447998971741193e-07, - "loss": 0.6836, - "step": 69606 - }, - { - "epoch": 1.78, - "learning_rate": 7.447731430347958e-07, - "loss": 0.6758, - "step": 69607 - }, - { - "epoch": 1.78, - "learning_rate": 7.447463890908883e-07, - "loss": 0.8271, - "step": 69608 - }, - { - "epoch": 1.78, - "learning_rate": 7.447196353424164e-07, - "loss": 0.6045, - "step": 69609 - }, - { - "epoch": 1.78, - "learning_rate": 7.446928817894011e-07, - "loss": 0.5291, - "step": 69610 - }, - { - "epoch": 1.78, - "learning_rate": 7.446661284318627e-07, - "loss": 0.4719, - "step": 69611 - }, - { - "epoch": 1.78, - "learning_rate": 7.446393752698214e-07, - "loss": 0.7036, - "step": 69612 - }, - { - "epoch": 1.78, - "learning_rate": 7.446126223032984e-07, - "loss": 0.6279, - "step": 69613 - }, - { - "epoch": 1.78, - "learning_rate": 7.44585869532314e-07, - "loss": 0.8853, - "step": 69614 - }, - { - "epoch": 1.78, - "learning_rate": 7.445591169568879e-07, - "loss": 0.5464, - "step": 69615 - }, - { - "epoch": 1.78, - "learning_rate": 7.445323645770414e-07, - "loss": 0.5088, - "step": 69616 - }, - { - "epoch": 1.78, - "learning_rate": 7.445056123927945e-07, - "loss": 0.5398, - "step": 69617 - }, - { - "epoch": 1.78, - "learning_rate": 7.444788604041681e-07, - "loss": 0.5713, - "step": 69618 - }, - { - "epoch": 1.78, - "learning_rate": 7.444521086111824e-07, - "loss": 0.6182, - "step": 69619 - }, - { - "epoch": 1.78, - "learning_rate": 7.44425357013858e-07, - "loss": 0.4998, - "step": 69620 - }, - { - "epoch": 1.78, - "learning_rate": 7.443986056122152e-07, - "loss": 0.4751, - "step": 69621 - }, - { - "epoch": 1.78, - "learning_rate": 7.443718544062749e-07, - "loss": 0.3971, - "step": 69622 - }, - { - "epoch": 1.78, - "learning_rate": 7.443451033960571e-07, - "loss": 0.6816, - "step": 69623 - }, - { - "epoch": 1.78, - "learning_rate": 7.443183525815829e-07, - "loss": 0.709, - "step": 69624 - }, - { - "epoch": 1.78, - "learning_rate": 7.442916019628723e-07, - "loss": 0.5659, - "step": 69625 - }, - { - "epoch": 1.78, - "learning_rate": 7.442648515399455e-07, - "loss": 0.7266, - "step": 69626 - }, - { - "epoch": 1.78, - "learning_rate": 7.442381013128234e-07, - "loss": 0.3699, - "step": 69627 - }, - { - "epoch": 1.78, - "learning_rate": 7.442113512815266e-07, - "loss": 0.532, - "step": 69628 - }, - { - "epoch": 1.78, - "learning_rate": 7.441846014460753e-07, - "loss": 0.7358, - "step": 69629 - }, - { - "epoch": 1.78, - "learning_rate": 7.441578518064901e-07, - "loss": 0.7266, - "step": 69630 - }, - { - "epoch": 1.78, - "learning_rate": 7.441311023627915e-07, - "loss": 0.7061, - "step": 69631 - }, - { - "epoch": 1.78, - "learning_rate": 7.44104353115e-07, - "loss": 0.5933, - "step": 69632 - }, - { - "epoch": 1.78, - "learning_rate": 7.440776040631358e-07, - "loss": 0.709, - "step": 69633 - }, - { - "epoch": 1.78, - "learning_rate": 7.4405085520722e-07, - "loss": 0.5674, - "step": 69634 - }, - { - "epoch": 1.78, - "learning_rate": 7.440241065472725e-07, - "loss": 0.5835, - "step": 69635 - }, - { - "epoch": 1.78, - "learning_rate": 7.439973580833139e-07, - "loss": 0.667, - "step": 69636 - }, - { - "epoch": 1.78, - "learning_rate": 7.439706098153648e-07, - "loss": 0.7607, - "step": 69637 - }, - { - "epoch": 1.78, - "learning_rate": 7.439438617434454e-07, - "loss": 0.478, - "step": 69638 - }, - { - "epoch": 1.78, - "learning_rate": 7.439171138675768e-07, - "loss": 0.6069, - "step": 69639 - }, - { - "epoch": 1.78, - "learning_rate": 7.438903661877788e-07, - "loss": 0.6113, - "step": 69640 - }, - { - "epoch": 1.78, - "learning_rate": 7.438636187040724e-07, - "loss": 0.5547, - "step": 69641 - }, - { - "epoch": 1.78, - "learning_rate": 7.438368714164775e-07, - "loss": 0.7256, - "step": 69642 - }, - { - "epoch": 1.78, - "learning_rate": 7.438101243250153e-07, - "loss": 0.5911, - "step": 69643 - }, - { - "epoch": 1.79, - "learning_rate": 7.437833774297061e-07, - "loss": 0.5815, - "step": 69644 - }, - { - "epoch": 1.79, - "learning_rate": 7.4375663073057e-07, - "loss": 0.4531, - "step": 69645 - }, - { - "epoch": 1.79, - "learning_rate": 7.437298842276274e-07, - "loss": 0.7778, - "step": 69646 - }, - { - "epoch": 1.79, - "learning_rate": 7.437031379208992e-07, - "loss": 0.7021, - "step": 69647 - }, - { - "epoch": 1.79, - "learning_rate": 7.436763918104056e-07, - "loss": 0.6475, - "step": 69648 - }, - { - "epoch": 1.79, - "learning_rate": 7.436496458961674e-07, - "loss": 0.6621, - "step": 69649 - }, - { - "epoch": 1.79, - "learning_rate": 7.436229001782046e-07, - "loss": 0.5505, - "step": 69650 - }, - { - "epoch": 1.79, - "learning_rate": 7.435961546565383e-07, - "loss": 0.6938, - "step": 69651 - }, - { - "epoch": 1.79, - "learning_rate": 7.435694093311882e-07, - "loss": 0.6333, - "step": 69652 - }, - { - "epoch": 1.79, - "learning_rate": 7.435426642021756e-07, - "loss": 0.7217, - "step": 69653 - }, - { - "epoch": 1.79, - "learning_rate": 7.435159192695208e-07, - "loss": 0.5347, - "step": 69654 - }, - { - "epoch": 1.79, - "learning_rate": 7.434891745332436e-07, - "loss": 0.8574, - "step": 69655 - }, - { - "epoch": 1.79, - "learning_rate": 7.434624299933651e-07, - "loss": 0.7578, - "step": 69656 - }, - { - "epoch": 1.79, - "learning_rate": 7.434356856499055e-07, - "loss": 0.6455, - "step": 69657 - }, - { - "epoch": 1.79, - "learning_rate": 7.434089415028857e-07, - "loss": 0.7109, - "step": 69658 - }, - { - "epoch": 1.79, - "learning_rate": 7.433821975523255e-07, - "loss": 0.6514, - "step": 69659 - }, - { - "epoch": 1.79, - "learning_rate": 7.43355453798246e-07, - "loss": 0.5278, - "step": 69660 - }, - { - "epoch": 1.79, - "learning_rate": 7.433287102406672e-07, - "loss": 0.5117, - "step": 69661 - }, - { - "epoch": 1.79, - "learning_rate": 7.433019668796101e-07, - "loss": 0.8408, - "step": 69662 - }, - { - "epoch": 1.79, - "learning_rate": 7.432752237150945e-07, - "loss": 0.6821, - "step": 69663 - }, - { - "epoch": 1.79, - "learning_rate": 7.432484807471421e-07, - "loss": 0.7324, - "step": 69664 - }, - { - "epoch": 1.79, - "learning_rate": 7.432217379757717e-07, - "loss": 0.5972, - "step": 69665 - }, - { - "epoch": 1.79, - "learning_rate": 7.431949954010051e-07, - "loss": 0.5532, - "step": 69666 - }, - { - "epoch": 1.79, - "learning_rate": 7.431682530228618e-07, - "loss": 0.7715, - "step": 69667 - }, - { - "epoch": 1.79, - "learning_rate": 7.43141510841363e-07, - "loss": 0.7295, - "step": 69668 - }, - { - "epoch": 1.79, - "learning_rate": 7.431147688565288e-07, - "loss": 0.8525, - "step": 69669 - }, - { - "epoch": 1.79, - "learning_rate": 7.4308802706838e-07, - "loss": 0.71, - "step": 69670 - }, - { - "epoch": 1.79, - "learning_rate": 7.430612854769367e-07, - "loss": 0.7744, - "step": 69671 - }, - { - "epoch": 1.79, - "learning_rate": 7.430345440822198e-07, - "loss": 0.7031, - "step": 69672 - }, - { - "epoch": 1.79, - "learning_rate": 7.430078028842492e-07, - "loss": 0.5488, - "step": 69673 - }, - { - "epoch": 1.79, - "learning_rate": 7.429810618830462e-07, - "loss": 0.5269, - "step": 69674 - }, - { - "epoch": 1.79, - "learning_rate": 7.429543210786306e-07, - "loss": 0.5859, - "step": 69675 - }, - { - "epoch": 1.79, - "learning_rate": 7.429275804710229e-07, - "loss": 0.6079, - "step": 69676 - }, - { - "epoch": 1.79, - "learning_rate": 7.429008400602438e-07, - "loss": 0.5975, - "step": 69677 - }, - { - "epoch": 1.79, - "learning_rate": 7.428740998463136e-07, - "loss": 0.6494, - "step": 69678 - }, - { - "epoch": 1.79, - "learning_rate": 7.42847359829253e-07, - "loss": 0.5933, - "step": 69679 - }, - { - "epoch": 1.79, - "learning_rate": 7.428206200090822e-07, - "loss": 0.6082, - "step": 69680 - }, - { - "epoch": 1.79, - "learning_rate": 7.427938803858221e-07, - "loss": 0.4421, - "step": 69681 - }, - { - "epoch": 1.79, - "learning_rate": 7.427671409594926e-07, - "loss": 0.665, - "step": 69682 - }, - { - "epoch": 1.79, - "learning_rate": 7.427404017301147e-07, - "loss": 0.6885, - "step": 69683 - }, - { - "epoch": 1.79, - "learning_rate": 7.427136626977089e-07, - "loss": 0.6162, - "step": 69684 - }, - { - "epoch": 1.79, - "learning_rate": 7.42686923862295e-07, - "loss": 0.7178, - "step": 69685 - }, - { - "epoch": 1.79, - "learning_rate": 7.426601852238939e-07, - "loss": 0.5908, - "step": 69686 - }, - { - "epoch": 1.79, - "learning_rate": 7.426334467825262e-07, - "loss": 0.6631, - "step": 69687 - }, - { - "epoch": 1.79, - "learning_rate": 7.42606708538212e-07, - "loss": 0.6426, - "step": 69688 - }, - { - "epoch": 1.79, - "learning_rate": 7.425799704909723e-07, - "loss": 0.4897, - "step": 69689 - }, - { - "epoch": 1.79, - "learning_rate": 7.425532326408271e-07, - "loss": 0.8359, - "step": 69690 - }, - { - "epoch": 1.79, - "learning_rate": 7.425264949877972e-07, - "loss": 0.7012, - "step": 69691 - }, - { - "epoch": 1.79, - "learning_rate": 7.424997575319027e-07, - "loss": 0.6172, - "step": 69692 - }, - { - "epoch": 1.79, - "learning_rate": 7.424730202731644e-07, - "loss": 0.7188, - "step": 69693 - }, - { - "epoch": 1.79, - "learning_rate": 7.42446283211603e-07, - "loss": 0.7666, - "step": 69694 - }, - { - "epoch": 1.79, - "learning_rate": 7.424195463472382e-07, - "loss": 0.5156, - "step": 69695 - }, - { - "epoch": 1.79, - "learning_rate": 7.423928096800911e-07, - "loss": 0.7158, - "step": 69696 - }, - { - "epoch": 1.79, - "learning_rate": 7.423660732101818e-07, - "loss": 0.7012, - "step": 69697 - }, - { - "epoch": 1.79, - "learning_rate": 7.423393369375313e-07, - "loss": 0.6162, - "step": 69698 - }, - { - "epoch": 1.79, - "learning_rate": 7.423126008621593e-07, - "loss": 0.7588, - "step": 69699 - }, - { - "epoch": 1.79, - "learning_rate": 7.422858649840869e-07, - "loss": 0.5928, - "step": 69700 - }, - { - "epoch": 1.79, - "learning_rate": 7.422591293033344e-07, - "loss": 0.5461, - "step": 69701 - }, - { - "epoch": 1.79, - "learning_rate": 7.422323938199222e-07, - "loss": 0.79, - "step": 69702 - }, - { - "epoch": 1.79, - "learning_rate": 7.422056585338708e-07, - "loss": 0.6067, - "step": 69703 - }, - { - "epoch": 1.79, - "learning_rate": 7.42178923445201e-07, - "loss": 0.4937, - "step": 69704 - }, - { - "epoch": 1.79, - "learning_rate": 7.421521885539325e-07, - "loss": 0.54, - "step": 69705 - }, - { - "epoch": 1.79, - "learning_rate": 7.421254538600864e-07, - "loss": 0.7275, - "step": 69706 - }, - { - "epoch": 1.79, - "learning_rate": 7.420987193636828e-07, - "loss": 0.6592, - "step": 69707 - }, - { - "epoch": 1.79, - "learning_rate": 7.420719850647425e-07, - "loss": 0.7002, - "step": 69708 - }, - { - "epoch": 1.79, - "learning_rate": 7.420452509632857e-07, - "loss": 0.4304, - "step": 69709 - }, - { - "epoch": 1.79, - "learning_rate": 7.420185170593332e-07, - "loss": 0.7007, - "step": 69710 - }, - { - "epoch": 1.79, - "learning_rate": 7.419917833529049e-07, - "loss": 0.7266, - "step": 69711 - }, - { - "epoch": 1.79, - "learning_rate": 7.41965049844022e-07, - "loss": 0.5181, - "step": 69712 - }, - { - "epoch": 1.79, - "learning_rate": 7.419383165327042e-07, - "loss": 0.5452, - "step": 69713 - }, - { - "epoch": 1.79, - "learning_rate": 7.41911583418973e-07, - "loss": 0.4404, - "step": 69714 - }, - { - "epoch": 1.79, - "learning_rate": 7.418848505028479e-07, - "loss": 0.5908, - "step": 69715 - }, - { - "epoch": 1.79, - "learning_rate": 7.418581177843495e-07, - "loss": 0.6367, - "step": 69716 - }, - { - "epoch": 1.79, - "learning_rate": 7.418313852634988e-07, - "loss": 0.6533, - "step": 69717 - }, - { - "epoch": 1.79, - "learning_rate": 7.418046529403157e-07, - "loss": 0.8564, - "step": 69718 - }, - { - "epoch": 1.79, - "learning_rate": 7.417779208148209e-07, - "loss": 0.6802, - "step": 69719 - }, - { - "epoch": 1.79, - "learning_rate": 7.41751188887035e-07, - "loss": 0.6504, - "step": 69720 - }, - { - "epoch": 1.79, - "learning_rate": 7.417244571569781e-07, - "loss": 0.6553, - "step": 69721 - }, - { - "epoch": 1.79, - "learning_rate": 7.416977256246713e-07, - "loss": 0.6978, - "step": 69722 - }, - { - "epoch": 1.79, - "learning_rate": 7.416709942901343e-07, - "loss": 0.5967, - "step": 69723 - }, - { - "epoch": 1.79, - "learning_rate": 7.416442631533883e-07, - "loss": 0.6729, - "step": 69724 - }, - { - "epoch": 1.79, - "learning_rate": 7.416175322144534e-07, - "loss": 0.5386, - "step": 69725 - }, - { - "epoch": 1.79, - "learning_rate": 7.415908014733497e-07, - "loss": 0.6494, - "step": 69726 - }, - { - "epoch": 1.79, - "learning_rate": 7.415640709300983e-07, - "loss": 0.6289, - "step": 69727 - }, - { - "epoch": 1.79, - "learning_rate": 7.415373405847192e-07, - "loss": 0.5381, - "step": 69728 - }, - { - "epoch": 1.79, - "learning_rate": 7.415106104372333e-07, - "loss": 0.689, - "step": 69729 - }, - { - "epoch": 1.79, - "learning_rate": 7.414838804876607e-07, - "loss": 0.6255, - "step": 69730 - }, - { - "epoch": 1.79, - "learning_rate": 7.41457150736022e-07, - "loss": 0.7168, - "step": 69731 - }, - { - "epoch": 1.79, - "learning_rate": 7.414304211823376e-07, - "loss": 0.6895, - "step": 69732 - }, - { - "epoch": 1.79, - "learning_rate": 7.414036918266282e-07, - "loss": 0.6426, - "step": 69733 - }, - { - "epoch": 1.79, - "learning_rate": 7.413769626689144e-07, - "loss": 0.7695, - "step": 69734 - }, - { - "epoch": 1.79, - "learning_rate": 7.413502337092161e-07, - "loss": 0.6396, - "step": 69735 - }, - { - "epoch": 1.79, - "learning_rate": 7.413235049475539e-07, - "loss": 0.7314, - "step": 69736 - }, - { - "epoch": 1.79, - "learning_rate": 7.412967763839484e-07, - "loss": 0.5522, - "step": 69737 - }, - { - "epoch": 1.79, - "learning_rate": 7.412700480184201e-07, - "loss": 0.6172, - "step": 69738 - }, - { - "epoch": 1.79, - "learning_rate": 7.412433198509896e-07, - "loss": 0.7891, - "step": 69739 - }, - { - "epoch": 1.79, - "learning_rate": 7.412165918816768e-07, - "loss": 0.7207, - "step": 69740 - }, - { - "epoch": 1.79, - "learning_rate": 7.41189864110503e-07, - "loss": 0.5327, - "step": 69741 - }, - { - "epoch": 1.79, - "learning_rate": 7.411631365374877e-07, - "loss": 0.552, - "step": 69742 - }, - { - "epoch": 1.79, - "learning_rate": 7.411364091626526e-07, - "loss": 0.8086, - "step": 69743 - }, - { - "epoch": 1.79, - "learning_rate": 7.411096819860172e-07, - "loss": 0.493, - "step": 69744 - }, - { - "epoch": 1.79, - "learning_rate": 7.410829550076019e-07, - "loss": 0.5551, - "step": 69745 - }, - { - "epoch": 1.79, - "learning_rate": 7.410562282274277e-07, - "loss": 0.7891, - "step": 69746 - }, - { - "epoch": 1.79, - "learning_rate": 7.410295016455145e-07, - "loss": 0.561, - "step": 69747 - }, - { - "epoch": 1.79, - "learning_rate": 7.410027752618837e-07, - "loss": 0.5801, - "step": 69748 - }, - { - "epoch": 1.79, - "learning_rate": 7.409760490765546e-07, - "loss": 0.6592, - "step": 69749 - }, - { - "epoch": 1.79, - "learning_rate": 7.409493230895486e-07, - "loss": 0.5654, - "step": 69750 - }, - { - "epoch": 1.79, - "learning_rate": 7.409225973008855e-07, - "loss": 0.7432, - "step": 69751 - }, - { - "epoch": 1.79, - "learning_rate": 7.408958717105864e-07, - "loss": 0.4244, - "step": 69752 - }, - { - "epoch": 1.79, - "learning_rate": 7.408691463186714e-07, - "loss": 0.6069, - "step": 69753 - }, - { - "epoch": 1.79, - "learning_rate": 7.40842421125161e-07, - "loss": 0.4849, - "step": 69754 - }, - { - "epoch": 1.79, - "learning_rate": 7.408156961300753e-07, - "loss": 0.4719, - "step": 69755 - }, - { - "epoch": 1.79, - "learning_rate": 7.407889713334355e-07, - "loss": 0.5176, - "step": 69756 - }, - { - "epoch": 1.79, - "learning_rate": 7.407622467352613e-07, - "loss": 0.4352, - "step": 69757 - }, - { - "epoch": 1.79, - "learning_rate": 7.407355223355736e-07, - "loss": 0.7598, - "step": 69758 - }, - { - "epoch": 1.79, - "learning_rate": 7.407087981343927e-07, - "loss": 0.6421, - "step": 69759 - }, - { - "epoch": 1.79, - "learning_rate": 7.406820741317394e-07, - "loss": 0.7598, - "step": 69760 - }, - { - "epoch": 1.79, - "learning_rate": 7.406553503276337e-07, - "loss": 0.75, - "step": 69761 - }, - { - "epoch": 1.79, - "learning_rate": 7.406286267220965e-07, - "loss": 0.6899, - "step": 69762 - }, - { - "epoch": 1.79, - "learning_rate": 7.406019033151483e-07, - "loss": 0.6191, - "step": 69763 - }, - { - "epoch": 1.79, - "learning_rate": 7.405751801068088e-07, - "loss": 0.4777, - "step": 69764 - }, - { - "epoch": 1.79, - "learning_rate": 7.40548457097099e-07, - "loss": 0.5122, - "step": 69765 - }, - { - "epoch": 1.79, - "learning_rate": 7.405217342860392e-07, - "loss": 0.6494, - "step": 69766 - }, - { - "epoch": 1.79, - "learning_rate": 7.404950116736503e-07, - "loss": 0.5342, - "step": 69767 - }, - { - "epoch": 1.79, - "learning_rate": 7.404682892599523e-07, - "loss": 0.644, - "step": 69768 - }, - { - "epoch": 1.79, - "learning_rate": 7.404415670449657e-07, - "loss": 0.5957, - "step": 69769 - }, - { - "epoch": 1.79, - "learning_rate": 7.404148450287111e-07, - "loss": 0.6006, - "step": 69770 - }, - { - "epoch": 1.79, - "learning_rate": 7.40388123211209e-07, - "loss": 0.7017, - "step": 69771 - }, - { - "epoch": 1.79, - "learning_rate": 7.403614015924797e-07, - "loss": 0.3773, - "step": 69772 - }, - { - "epoch": 1.79, - "learning_rate": 7.403346801725443e-07, - "loss": 0.8125, - "step": 69773 - }, - { - "epoch": 1.79, - "learning_rate": 7.40307958951422e-07, - "loss": 0.4778, - "step": 69774 - }, - { - "epoch": 1.79, - "learning_rate": 7.402812379291343e-07, - "loss": 0.6162, - "step": 69775 - }, - { - "epoch": 1.79, - "learning_rate": 7.40254517105701e-07, - "loss": 0.4275, - "step": 69776 - }, - { - "epoch": 1.79, - "learning_rate": 7.40227796481143e-07, - "loss": 0.6631, - "step": 69777 - }, - { - "epoch": 1.79, - "learning_rate": 7.402010760554807e-07, - "loss": 0.708, - "step": 69778 - }, - { - "epoch": 1.79, - "learning_rate": 7.401743558287345e-07, - "loss": 0.4824, - "step": 69779 - }, - { - "epoch": 1.79, - "learning_rate": 7.401476358009246e-07, - "loss": 0.5769, - "step": 69780 - }, - { - "epoch": 1.79, - "learning_rate": 7.40120915972072e-07, - "loss": 0.561, - "step": 69781 - }, - { - "epoch": 1.79, - "learning_rate": 7.400941963421967e-07, - "loss": 0.5656, - "step": 69782 - }, - { - "epoch": 1.79, - "learning_rate": 7.400674769113197e-07, - "loss": 0.4346, - "step": 69783 - }, - { - "epoch": 1.79, - "learning_rate": 7.400407576794608e-07, - "loss": 0.4524, - "step": 69784 - }, - { - "epoch": 1.79, - "learning_rate": 7.400140386466406e-07, - "loss": 0.7256, - "step": 69785 - }, - { - "epoch": 1.79, - "learning_rate": 7.399873198128799e-07, - "loss": 0.6191, - "step": 69786 - }, - { - "epoch": 1.79, - "learning_rate": 7.399606011781987e-07, - "loss": 0.5381, - "step": 69787 - }, - { - "epoch": 1.79, - "learning_rate": 7.399338827426179e-07, - "loss": 0.7261, - "step": 69788 - }, - { - "epoch": 1.79, - "learning_rate": 7.399071645061576e-07, - "loss": 0.8467, - "step": 69789 - }, - { - "epoch": 1.79, - "learning_rate": 7.398804464688387e-07, - "loss": 0.3276, - "step": 69790 - }, - { - "epoch": 1.79, - "learning_rate": 7.398537286306814e-07, - "loss": 0.7275, - "step": 69791 - }, - { - "epoch": 1.79, - "learning_rate": 7.398270109917058e-07, - "loss": 0.6235, - "step": 69792 - }, - { - "epoch": 1.79, - "learning_rate": 7.398002935519332e-07, - "loss": 0.6582, - "step": 69793 - }, - { - "epoch": 1.79, - "learning_rate": 7.397735763113832e-07, - "loss": 0.6602, - "step": 69794 - }, - { - "epoch": 1.79, - "learning_rate": 7.397468592700766e-07, - "loss": 0.6973, - "step": 69795 - }, - { - "epoch": 1.79, - "learning_rate": 7.397201424280339e-07, - "loss": 0.7295, - "step": 69796 - }, - { - "epoch": 1.79, - "learning_rate": 7.396934257852754e-07, - "loss": 0.6426, - "step": 69797 - }, - { - "epoch": 1.79, - "learning_rate": 7.396667093418219e-07, - "loss": 0.6855, - "step": 69798 - }, - { - "epoch": 1.79, - "learning_rate": 7.396399930976934e-07, - "loss": 0.7256, - "step": 69799 - }, - { - "epoch": 1.79, - "learning_rate": 7.396132770529107e-07, - "loss": 0.6265, - "step": 69800 - }, - { - "epoch": 1.79, - "learning_rate": 7.395865612074941e-07, - "loss": 0.6938, - "step": 69801 - }, - { - "epoch": 1.79, - "learning_rate": 7.395598455614643e-07, - "loss": 0.7441, - "step": 69802 - }, - { - "epoch": 1.79, - "learning_rate": 7.395331301148417e-07, - "loss": 0.8184, - "step": 69803 - }, - { - "epoch": 1.79, - "learning_rate": 7.395064148676461e-07, - "loss": 0.6021, - "step": 69804 - }, - { - "epoch": 1.79, - "learning_rate": 7.394796998198988e-07, - "loss": 0.6758, - "step": 69805 - }, - { - "epoch": 1.79, - "learning_rate": 7.394529849716195e-07, - "loss": 0.8242, - "step": 69806 - }, - { - "epoch": 1.79, - "learning_rate": 7.394262703228295e-07, - "loss": 0.4727, - "step": 69807 - }, - { - "epoch": 1.79, - "learning_rate": 7.393995558735488e-07, - "loss": 0.4482, - "step": 69808 - }, - { - "epoch": 1.79, - "learning_rate": 7.393728416237976e-07, - "loss": 0.6069, - "step": 69809 - }, - { - "epoch": 1.79, - "learning_rate": 7.393461275735968e-07, - "loss": 0.7393, - "step": 69810 - }, - { - "epoch": 1.79, - "learning_rate": 7.393194137229666e-07, - "loss": 0.6709, - "step": 69811 - }, - { - "epoch": 1.79, - "learning_rate": 7.392927000719277e-07, - "loss": 0.5752, - "step": 69812 - }, - { - "epoch": 1.79, - "learning_rate": 7.392659866205006e-07, - "loss": 0.7627, - "step": 69813 - }, - { - "epoch": 1.79, - "learning_rate": 7.392392733687051e-07, - "loss": 0.5415, - "step": 69814 - }, - { - "epoch": 1.79, - "learning_rate": 7.392125603165622e-07, - "loss": 0.6152, - "step": 69815 - }, - { - "epoch": 1.79, - "learning_rate": 7.391858474640922e-07, - "loss": 0.6484, - "step": 69816 - }, - { - "epoch": 1.79, - "learning_rate": 7.391591348113157e-07, - "loss": 0.4443, - "step": 69817 - }, - { - "epoch": 1.79, - "learning_rate": 7.39132422358253e-07, - "loss": 0.667, - "step": 69818 - }, - { - "epoch": 1.79, - "learning_rate": 7.391057101049247e-07, - "loss": 0.561, - "step": 69819 - }, - { - "epoch": 1.79, - "learning_rate": 7.390789980513509e-07, - "loss": 0.7451, - "step": 69820 - }, - { - "epoch": 1.79, - "learning_rate": 7.390522861975527e-07, - "loss": 0.6553, - "step": 69821 - }, - { - "epoch": 1.79, - "learning_rate": 7.390255745435499e-07, - "loss": 0.562, - "step": 69822 - }, - { - "epoch": 1.79, - "learning_rate": 7.389988630893636e-07, - "loss": 0.6484, - "step": 69823 - }, - { - "epoch": 1.79, - "learning_rate": 7.389721518350137e-07, - "loss": 0.5525, - "step": 69824 - }, - { - "epoch": 1.79, - "learning_rate": 7.389454407805208e-07, - "loss": 0.8984, - "step": 69825 - }, - { - "epoch": 1.79, - "learning_rate": 7.389187299259052e-07, - "loss": 0.6094, - "step": 69826 - }, - { - "epoch": 1.79, - "learning_rate": 7.388920192711876e-07, - "loss": 0.6592, - "step": 69827 - }, - { - "epoch": 1.79, - "learning_rate": 7.388653088163883e-07, - "loss": 0.6924, - "step": 69828 - }, - { - "epoch": 1.79, - "learning_rate": 7.38838598561528e-07, - "loss": 0.667, - "step": 69829 - }, - { - "epoch": 1.79, - "learning_rate": 7.388118885066268e-07, - "loss": 0.5031, - "step": 69830 - }, - { - "epoch": 1.79, - "learning_rate": 7.387851786517054e-07, - "loss": 0.6353, - "step": 69831 - }, - { - "epoch": 1.79, - "learning_rate": 7.387584689967841e-07, - "loss": 0.6191, - "step": 69832 - }, - { - "epoch": 1.79, - "learning_rate": 7.387317595418838e-07, - "loss": 0.7021, - "step": 69833 - }, - { - "epoch": 1.79, - "learning_rate": 7.387050502870243e-07, - "loss": 0.5724, - "step": 69834 - }, - { - "epoch": 1.79, - "learning_rate": 7.386783412322262e-07, - "loss": 0.6133, - "step": 69835 - }, - { - "epoch": 1.79, - "learning_rate": 7.386516323775103e-07, - "loss": 0.7822, - "step": 69836 - }, - { - "epoch": 1.79, - "learning_rate": 7.386249237228967e-07, - "loss": 0.7373, - "step": 69837 - }, - { - "epoch": 1.79, - "learning_rate": 7.38598215268406e-07, - "loss": 0.8203, - "step": 69838 - }, - { - "epoch": 1.79, - "learning_rate": 7.385715070140586e-07, - "loss": 0.7129, - "step": 69839 - }, - { - "epoch": 1.79, - "learning_rate": 7.38544798959875e-07, - "loss": 0.6855, - "step": 69840 - }, - { - "epoch": 1.79, - "learning_rate": 7.385180911058755e-07, - "loss": 0.4854, - "step": 69841 - }, - { - "epoch": 1.79, - "learning_rate": 7.384913834520809e-07, - "loss": 0.4663, - "step": 69842 - }, - { - "epoch": 1.79, - "learning_rate": 7.384646759985116e-07, - "loss": 0.6328, - "step": 69843 - }, - { - "epoch": 1.79, - "learning_rate": 7.384379687451877e-07, - "loss": 0.7485, - "step": 69844 - }, - { - "epoch": 1.79, - "learning_rate": 7.384112616921297e-07, - "loss": 0.7041, - "step": 69845 - }, - { - "epoch": 1.79, - "learning_rate": 7.383845548393582e-07, - "loss": 0.7734, - "step": 69846 - }, - { - "epoch": 1.79, - "learning_rate": 7.383578481868935e-07, - "loss": 0.7148, - "step": 69847 - }, - { - "epoch": 1.79, - "learning_rate": 7.383311417347563e-07, - "loss": 0.6543, - "step": 69848 - }, - { - "epoch": 1.79, - "learning_rate": 7.383044354829667e-07, - "loss": 0.7334, - "step": 69849 - }, - { - "epoch": 1.79, - "learning_rate": 7.382777294315457e-07, - "loss": 0.6494, - "step": 69850 - }, - { - "epoch": 1.79, - "learning_rate": 7.382510235805131e-07, - "loss": 0.5938, - "step": 69851 - }, - { - "epoch": 1.79, - "learning_rate": 7.382243179298899e-07, - "loss": 0.6533, - "step": 69852 - }, - { - "epoch": 1.79, - "learning_rate": 7.381976124796965e-07, - "loss": 0.6104, - "step": 69853 - }, - { - "epoch": 1.79, - "learning_rate": 7.381709072299527e-07, - "loss": 0.748, - "step": 69854 - }, - { - "epoch": 1.79, - "learning_rate": 7.381442021806797e-07, - "loss": 0.5662, - "step": 69855 - }, - { - "epoch": 1.79, - "learning_rate": 7.381174973318973e-07, - "loss": 0.5635, - "step": 69856 - }, - { - "epoch": 1.79, - "learning_rate": 7.380907926836267e-07, - "loss": 0.7158, - "step": 69857 - }, - { - "epoch": 1.79, - "learning_rate": 7.380640882358875e-07, - "loss": 0.5088, - "step": 69858 - }, - { - "epoch": 1.79, - "learning_rate": 7.380373839887008e-07, - "loss": 0.5605, - "step": 69859 - }, - { - "epoch": 1.79, - "learning_rate": 7.380106799420868e-07, - "loss": 0.6606, - "step": 69860 - }, - { - "epoch": 1.79, - "learning_rate": 7.379839760960662e-07, - "loss": 0.7949, - "step": 69861 - }, - { - "epoch": 1.79, - "learning_rate": 7.379572724506589e-07, - "loss": 0.6631, - "step": 69862 - }, - { - "epoch": 1.79, - "learning_rate": 7.379305690058863e-07, - "loss": 0.5972, - "step": 69863 - }, - { - "epoch": 1.79, - "learning_rate": 7.379038657617675e-07, - "loss": 0.6392, - "step": 69864 - }, - { - "epoch": 1.79, - "learning_rate": 7.37877162718324e-07, - "loss": 0.9053, - "step": 69865 - }, - { - "epoch": 1.79, - "learning_rate": 7.378504598755757e-07, - "loss": 0.6089, - "step": 69866 - }, - { - "epoch": 1.79, - "learning_rate": 7.378237572335434e-07, - "loss": 0.55, - "step": 69867 - }, - { - "epoch": 1.79, - "learning_rate": 7.377970547922472e-07, - "loss": 0.6279, - "step": 69868 - }, - { - "epoch": 1.79, - "learning_rate": 7.377703525517079e-07, - "loss": 0.6587, - "step": 69869 - }, - { - "epoch": 1.79, - "learning_rate": 7.377436505119456e-07, - "loss": 0.4351, - "step": 69870 - }, - { - "epoch": 1.79, - "learning_rate": 7.377169486729812e-07, - "loss": 0.6973, - "step": 69871 - }, - { - "epoch": 1.79, - "learning_rate": 7.376902470348346e-07, - "loss": 0.5112, - "step": 69872 - }, - { - "epoch": 1.79, - "learning_rate": 7.376635455975271e-07, - "loss": 0.6836, - "step": 69873 - }, - { - "epoch": 1.79, - "learning_rate": 7.37636844361078e-07, - "loss": 0.769, - "step": 69874 - }, - { - "epoch": 1.79, - "learning_rate": 7.376101433255084e-07, - "loss": 0.5957, - "step": 69875 - }, - { - "epoch": 1.79, - "learning_rate": 7.375834424908388e-07, - "loss": 0.7334, - "step": 69876 - }, - { - "epoch": 1.79, - "learning_rate": 7.375567418570892e-07, - "loss": 0.6528, - "step": 69877 - }, - { - "epoch": 1.79, - "learning_rate": 7.375300414242807e-07, - "loss": 0.6592, - "step": 69878 - }, - { - "epoch": 1.79, - "learning_rate": 7.375033411924329e-07, - "loss": 0.667, - "step": 69879 - }, - { - "epoch": 1.79, - "learning_rate": 7.374766411615672e-07, - "loss": 0.7363, - "step": 69880 - }, - { - "epoch": 1.79, - "learning_rate": 7.374499413317034e-07, - "loss": 0.6812, - "step": 69881 - }, - { - "epoch": 1.79, - "learning_rate": 7.37423241702862e-07, - "loss": 0.708, - "step": 69882 - }, - { - "epoch": 1.79, - "learning_rate": 7.373965422750639e-07, - "loss": 0.5437, - "step": 69883 - }, - { - "epoch": 1.79, - "learning_rate": 7.373698430483291e-07, - "loss": 0.7402, - "step": 69884 - }, - { - "epoch": 1.79, - "learning_rate": 7.373431440226778e-07, - "loss": 0.7256, - "step": 69885 - }, - { - "epoch": 1.79, - "learning_rate": 7.373164451981309e-07, - "loss": 0.7617, - "step": 69886 - }, - { - "epoch": 1.79, - "learning_rate": 7.372897465747087e-07, - "loss": 0.5239, - "step": 69887 - }, - { - "epoch": 1.79, - "learning_rate": 7.372630481524317e-07, - "loss": 0.6284, - "step": 69888 - }, - { - "epoch": 1.79, - "learning_rate": 7.372363499313203e-07, - "loss": 0.5547, - "step": 69889 - }, - { - "epoch": 1.79, - "learning_rate": 7.37209651911395e-07, - "loss": 0.6821, - "step": 69890 - }, - { - "epoch": 1.79, - "learning_rate": 7.371829540926759e-07, - "loss": 0.7959, - "step": 69891 - }, - { - "epoch": 1.79, - "learning_rate": 7.371562564751841e-07, - "loss": 0.6626, - "step": 69892 - }, - { - "epoch": 1.79, - "learning_rate": 7.371295590589399e-07, - "loss": 0.5125, - "step": 69893 - }, - { - "epoch": 1.79, - "learning_rate": 7.37102861843963e-07, - "loss": 0.6602, - "step": 69894 - }, - { - "epoch": 1.79, - "learning_rate": 7.370761648302745e-07, - "loss": 0.6816, - "step": 69895 - }, - { - "epoch": 1.79, - "learning_rate": 7.370494680178947e-07, - "loss": 0.7295, - "step": 69896 - }, - { - "epoch": 1.79, - "learning_rate": 7.370227714068441e-07, - "loss": 0.627, - "step": 69897 - }, - { - "epoch": 1.79, - "learning_rate": 7.369960749971431e-07, - "loss": 0.6011, - "step": 69898 - }, - { - "epoch": 1.79, - "learning_rate": 7.369693787888118e-07, - "loss": 0.626, - "step": 69899 - }, - { - "epoch": 1.79, - "learning_rate": 7.369426827818714e-07, - "loss": 0.6611, - "step": 69900 - }, - { - "epoch": 1.79, - "learning_rate": 7.369159869763415e-07, - "loss": 0.6802, - "step": 69901 - }, - { - "epoch": 1.79, - "learning_rate": 7.368892913722431e-07, - "loss": 0.4232, - "step": 69902 - }, - { - "epoch": 1.79, - "learning_rate": 7.368625959695967e-07, - "loss": 0.543, - "step": 69903 - }, - { - "epoch": 1.79, - "learning_rate": 7.368359007684221e-07, - "loss": 0.4802, - "step": 69904 - }, - { - "epoch": 1.79, - "learning_rate": 7.368092057687405e-07, - "loss": 0.5532, - "step": 69905 - }, - { - "epoch": 1.79, - "learning_rate": 7.367825109705716e-07, - "loss": 0.6274, - "step": 69906 - }, - { - "epoch": 1.79, - "learning_rate": 7.367558163739367e-07, - "loss": 0.752, - "step": 69907 - }, - { - "epoch": 1.79, - "learning_rate": 7.367291219788552e-07, - "loss": 0.6064, - "step": 69908 - }, - { - "epoch": 1.79, - "learning_rate": 7.367024277853486e-07, - "loss": 0.5906, - "step": 69909 - }, - { - "epoch": 1.79, - "learning_rate": 7.366757337934365e-07, - "loss": 0.4452, - "step": 69910 - }, - { - "epoch": 1.79, - "learning_rate": 7.3664904000314e-07, - "loss": 0.5547, - "step": 69911 - }, - { - "epoch": 1.79, - "learning_rate": 7.36622346414479e-07, - "loss": 0.707, - "step": 69912 - }, - { - "epoch": 1.79, - "learning_rate": 7.365956530274744e-07, - "loss": 0.6582, - "step": 69913 - }, - { - "epoch": 1.79, - "learning_rate": 7.365689598421463e-07, - "loss": 0.6963, - "step": 69914 - }, - { - "epoch": 1.79, - "learning_rate": 7.365422668585153e-07, - "loss": 0.6094, - "step": 69915 - }, - { - "epoch": 1.79, - "learning_rate": 7.365155740766013e-07, - "loss": 0.6387, - "step": 69916 - }, - { - "epoch": 1.79, - "learning_rate": 7.364888814964258e-07, - "loss": 0.6719, - "step": 69917 - }, - { - "epoch": 1.79, - "learning_rate": 7.364621891180081e-07, - "loss": 0.7627, - "step": 69918 - }, - { - "epoch": 1.79, - "learning_rate": 7.364354969413696e-07, - "loss": 0.6172, - "step": 69919 - }, - { - "epoch": 1.79, - "learning_rate": 7.3640880496653e-07, - "loss": 0.6426, - "step": 69920 - }, - { - "epoch": 1.79, - "learning_rate": 7.363821131935104e-07, - "loss": 0.6123, - "step": 69921 - }, - { - "epoch": 1.79, - "learning_rate": 7.363554216223307e-07, - "loss": 0.5762, - "step": 69922 - }, - { - "epoch": 1.79, - "learning_rate": 7.363287302530118e-07, - "loss": 0.5249, - "step": 69923 - }, - { - "epoch": 1.79, - "learning_rate": 7.363020390855737e-07, - "loss": 0.5908, - "step": 69924 - }, - { - "epoch": 1.79, - "learning_rate": 7.362753481200367e-07, - "loss": 0.6592, - "step": 69925 - }, - { - "epoch": 1.79, - "learning_rate": 7.36248657356422e-07, - "loss": 0.6094, - "step": 69926 - }, - { - "epoch": 1.79, - "learning_rate": 7.362219667947491e-07, - "loss": 0.7314, - "step": 69927 - }, - { - "epoch": 1.79, - "learning_rate": 7.361952764350394e-07, - "loss": 0.5293, - "step": 69928 - }, - { - "epoch": 1.79, - "learning_rate": 7.361685862773124e-07, - "loss": 0.4436, - "step": 69929 - }, - { - "epoch": 1.79, - "learning_rate": 7.361418963215893e-07, - "loss": 0.6777, - "step": 69930 - }, - { - "epoch": 1.79, - "learning_rate": 7.3611520656789e-07, - "loss": 0.4849, - "step": 69931 - }, - { - "epoch": 1.79, - "learning_rate": 7.360885170162353e-07, - "loss": 0.5398, - "step": 69932 - }, - { - "epoch": 1.79, - "learning_rate": 7.360618276666457e-07, - "loss": 0.7544, - "step": 69933 - }, - { - "epoch": 1.79, - "learning_rate": 7.360351385191412e-07, - "loss": 0.5942, - "step": 69934 - }, - { - "epoch": 1.79, - "learning_rate": 7.360084495737424e-07, - "loss": 0.4827, - "step": 69935 - }, - { - "epoch": 1.79, - "learning_rate": 7.359817608304699e-07, - "loss": 0.5898, - "step": 69936 - }, - { - "epoch": 1.79, - "learning_rate": 7.359550722893438e-07, - "loss": 0.5254, - "step": 69937 - }, - { - "epoch": 1.79, - "learning_rate": 7.35928383950385e-07, - "loss": 0.604, - "step": 69938 - }, - { - "epoch": 1.79, - "learning_rate": 7.359016958136135e-07, - "loss": 0.584, - "step": 69939 - }, - { - "epoch": 1.79, - "learning_rate": 7.358750078790501e-07, - "loss": 0.5845, - "step": 69940 - }, - { - "epoch": 1.79, - "learning_rate": 7.35848320146715e-07, - "loss": 0.6846, - "step": 69941 - }, - { - "epoch": 1.79, - "learning_rate": 7.358216326166287e-07, - "loss": 0.6392, - "step": 69942 - }, - { - "epoch": 1.79, - "learning_rate": 7.35794945288812e-07, - "loss": 0.6641, - "step": 69943 - }, - { - "epoch": 1.79, - "learning_rate": 7.357682581632843e-07, - "loss": 0.667, - "step": 69944 - }, - { - "epoch": 1.79, - "learning_rate": 7.35741571240067e-07, - "loss": 0.6162, - "step": 69945 - }, - { - "epoch": 1.79, - "learning_rate": 7.357148845191801e-07, - "loss": 0.7163, - "step": 69946 - }, - { - "epoch": 1.79, - "learning_rate": 7.356881980006445e-07, - "loss": 0.6777, - "step": 69947 - }, - { - "epoch": 1.79, - "learning_rate": 7.356615116844797e-07, - "loss": 0.7197, - "step": 69948 - }, - { - "epoch": 1.79, - "learning_rate": 7.356348255707072e-07, - "loss": 0.4685, - "step": 69949 - }, - { - "epoch": 1.79, - "learning_rate": 7.356081396593467e-07, - "loss": 0.6147, - "step": 69950 - }, - { - "epoch": 1.79, - "learning_rate": 7.355814539504192e-07, - "loss": 0.6284, - "step": 69951 - }, - { - "epoch": 1.79, - "learning_rate": 7.355547684439445e-07, - "loss": 0.5752, - "step": 69952 - }, - { - "epoch": 1.79, - "learning_rate": 7.355280831399439e-07, - "loss": 0.5601, - "step": 69953 - }, - { - "epoch": 1.79, - "learning_rate": 7.355013980384369e-07, - "loss": 0.686, - "step": 69954 - }, - { - "epoch": 1.79, - "learning_rate": 7.354747131394443e-07, - "loss": 0.7734, - "step": 69955 - }, - { - "epoch": 1.79, - "learning_rate": 7.354480284429865e-07, - "loss": 0.4375, - "step": 69956 - }, - { - "epoch": 1.79, - "learning_rate": 7.354213439490842e-07, - "loss": 0.75, - "step": 69957 - }, - { - "epoch": 1.79, - "learning_rate": 7.353946596577572e-07, - "loss": 0.731, - "step": 69958 - }, - { - "epoch": 1.79, - "learning_rate": 7.353679755690267e-07, - "loss": 0.7246, - "step": 69959 - }, - { - "epoch": 1.79, - "learning_rate": 7.353412916829125e-07, - "loss": 0.6719, - "step": 69960 - }, - { - "epoch": 1.79, - "learning_rate": 7.353146079994356e-07, - "loss": 0.6816, - "step": 69961 - }, - { - "epoch": 1.79, - "learning_rate": 7.352879245186158e-07, - "loss": 0.6934, - "step": 69962 - }, - { - "epoch": 1.79, - "learning_rate": 7.352612412404744e-07, - "loss": 0.751, - "step": 69963 - }, - { - "epoch": 1.79, - "learning_rate": 7.35234558165031e-07, - "loss": 0.5215, - "step": 69964 - }, - { - "epoch": 1.79, - "learning_rate": 7.352078752923063e-07, - "loss": 0.6748, - "step": 69965 - }, - { - "epoch": 1.79, - "learning_rate": 7.351811926223209e-07, - "loss": 0.751, - "step": 69966 - }, - { - "epoch": 1.79, - "learning_rate": 7.351545101550947e-07, - "loss": 0.5537, - "step": 69967 - }, - { - "epoch": 1.79, - "learning_rate": 7.351278278906488e-07, - "loss": 0.3777, - "step": 69968 - }, - { - "epoch": 1.79, - "learning_rate": 7.351011458290031e-07, - "loss": 0.6592, - "step": 69969 - }, - { - "epoch": 1.79, - "learning_rate": 7.350744639701785e-07, - "loss": 0.4027, - "step": 69970 - }, - { - "epoch": 1.79, - "learning_rate": 7.350477823141953e-07, - "loss": 0.7666, - "step": 69971 - }, - { - "epoch": 1.79, - "learning_rate": 7.350211008610735e-07, - "loss": 0.6973, - "step": 69972 - }, - { - "epoch": 1.79, - "learning_rate": 7.349944196108345e-07, - "loss": 0.4917, - "step": 69973 - }, - { - "epoch": 1.79, - "learning_rate": 7.349677385634976e-07, - "loss": 0.4526, - "step": 69974 - }, - { - "epoch": 1.79, - "learning_rate": 7.349410577190835e-07, - "loss": 0.6162, - "step": 69975 - }, - { - "epoch": 1.79, - "learning_rate": 7.349143770776133e-07, - "loss": 0.5894, - "step": 69976 - }, - { - "epoch": 1.79, - "learning_rate": 7.348876966391067e-07, - "loss": 0.6846, - "step": 69977 - }, - { - "epoch": 1.79, - "learning_rate": 7.348610164035844e-07, - "loss": 0.7676, - "step": 69978 - }, - { - "epoch": 1.79, - "learning_rate": 7.348343363710667e-07, - "loss": 0.5903, - "step": 69979 - }, - { - "epoch": 1.79, - "learning_rate": 7.348076565415746e-07, - "loss": 0.6362, - "step": 69980 - }, - { - "epoch": 1.79, - "learning_rate": 7.347809769151277e-07, - "loss": 0.4045, - "step": 69981 - }, - { - "epoch": 1.79, - "learning_rate": 7.34754297491747e-07, - "loss": 0.5771, - "step": 69982 - }, - { - "epoch": 1.79, - "learning_rate": 7.34727618271453e-07, - "loss": 0.5889, - "step": 69983 - }, - { - "epoch": 1.79, - "learning_rate": 7.347009392542654e-07, - "loss": 0.6045, - "step": 69984 - }, - { - "epoch": 1.79, - "learning_rate": 7.346742604402053e-07, - "loss": 0.7139, - "step": 69985 - }, - { - "epoch": 1.79, - "learning_rate": 7.346475818292927e-07, - "loss": 0.5654, - "step": 69986 - }, - { - "epoch": 1.79, - "learning_rate": 7.346209034215484e-07, - "loss": 0.5762, - "step": 69987 - }, - { - "epoch": 1.79, - "learning_rate": 7.345942252169928e-07, - "loss": 0.5522, - "step": 69988 - }, - { - "epoch": 1.79, - "learning_rate": 7.345675472156461e-07, - "loss": 0.6738, - "step": 69989 - }, - { - "epoch": 1.79, - "learning_rate": 7.345408694175288e-07, - "loss": 0.6204, - "step": 69990 - }, - { - "epoch": 1.79, - "learning_rate": 7.345141918226612e-07, - "loss": 0.5371, - "step": 69991 - }, - { - "epoch": 1.79, - "learning_rate": 7.34487514431064e-07, - "loss": 0.5898, - "step": 69992 - }, - { - "epoch": 1.79, - "learning_rate": 7.344608372427579e-07, - "loss": 0.6377, - "step": 69993 - }, - { - "epoch": 1.79, - "learning_rate": 7.344341602577624e-07, - "loss": 0.5933, - "step": 69994 - }, - { - "epoch": 1.79, - "learning_rate": 7.344074834760987e-07, - "loss": 0.6528, - "step": 69995 - }, - { - "epoch": 1.79, - "learning_rate": 7.343808068977868e-07, - "loss": 0.4229, - "step": 69996 - }, - { - "epoch": 1.79, - "learning_rate": 7.343541305228475e-07, - "loss": 0.5498, - "step": 69997 - }, - { - "epoch": 1.79, - "learning_rate": 7.343274543513007e-07, - "loss": 0.6475, - "step": 69998 - }, - { - "epoch": 1.79, - "learning_rate": 7.343007783831675e-07, - "loss": 0.635, - "step": 69999 - }, - { - "epoch": 1.79, - "learning_rate": 7.342741026184676e-07, - "loss": 0.6748, - "step": 70000 - }, - { - "epoch": 1.79, - "learning_rate": 7.342474270572222e-07, - "loss": 0.4531, - "step": 70001 - }, - { - "epoch": 1.79, - "learning_rate": 7.342207516994511e-07, - "loss": 0.6675, - "step": 70002 - }, - { - "epoch": 1.79, - "learning_rate": 7.341940765451753e-07, - "loss": 0.541, - "step": 70003 - }, - { - "epoch": 1.79, - "learning_rate": 7.341674015944146e-07, - "loss": 0.71, - "step": 70004 - }, - { - "epoch": 1.79, - "learning_rate": 7.341407268471898e-07, - "loss": 0.6279, - "step": 70005 - }, - { - "epoch": 1.79, - "learning_rate": 7.34114052303521e-07, - "loss": 0.542, - "step": 70006 - }, - { - "epoch": 1.79, - "learning_rate": 7.34087377963429e-07, - "loss": 0.6123, - "step": 70007 - }, - { - "epoch": 1.79, - "learning_rate": 7.34060703826934e-07, - "loss": 0.6152, - "step": 70008 - }, - { - "epoch": 1.79, - "learning_rate": 7.340340298940565e-07, - "loss": 0.6611, - "step": 70009 - }, - { - "epoch": 1.79, - "learning_rate": 7.340073561648168e-07, - "loss": 0.7607, - "step": 70010 - }, - { - "epoch": 1.79, - "learning_rate": 7.339806826392356e-07, - "loss": 0.583, - "step": 70011 - }, - { - "epoch": 1.79, - "learning_rate": 7.339540093173331e-07, - "loss": 0.436, - "step": 70012 - }, - { - "epoch": 1.79, - "learning_rate": 7.339273361991301e-07, - "loss": 0.4478, - "step": 70013 - }, - { - "epoch": 1.79, - "learning_rate": 7.339006632846465e-07, - "loss": 0.6743, - "step": 70014 - }, - { - "epoch": 1.79, - "learning_rate": 7.338739905739027e-07, - "loss": 0.5164, - "step": 70015 - }, - { - "epoch": 1.79, - "learning_rate": 7.338473180669196e-07, - "loss": 0.5039, - "step": 70016 - }, - { - "epoch": 1.79, - "learning_rate": 7.338206457637171e-07, - "loss": 0.5361, - "step": 70017 - }, - { - "epoch": 1.79, - "learning_rate": 7.337939736643161e-07, - "loss": 0.6411, - "step": 70018 - }, - { - "epoch": 1.79, - "learning_rate": 7.337673017687365e-07, - "loss": 0.6079, - "step": 70019 - }, - { - "epoch": 1.79, - "learning_rate": 7.337406300769995e-07, - "loss": 0.6465, - "step": 70020 - }, - { - "epoch": 1.79, - "learning_rate": 7.337139585891247e-07, - "loss": 0.6445, - "step": 70021 - }, - { - "epoch": 1.79, - "learning_rate": 7.336872873051331e-07, - "loss": 0.6377, - "step": 70022 - }, - { - "epoch": 1.79, - "learning_rate": 7.336606162250451e-07, - "loss": 0.6406, - "step": 70023 - }, - { - "epoch": 1.79, - "learning_rate": 7.336339453488808e-07, - "loss": 0.7344, - "step": 70024 - }, - { - "epoch": 1.79, - "learning_rate": 7.336072746766604e-07, - "loss": 0.5073, - "step": 70025 - }, - { - "epoch": 1.79, - "learning_rate": 7.335806042084049e-07, - "loss": 0.688, - "step": 70026 - }, - { - "epoch": 1.79, - "learning_rate": 7.335539339441343e-07, - "loss": 0.7432, - "step": 70027 - }, - { - "epoch": 1.79, - "learning_rate": 7.335272638838694e-07, - "loss": 0.4583, - "step": 70028 - }, - { - "epoch": 1.79, - "learning_rate": 7.335005940276303e-07, - "loss": 0.6543, - "step": 70029 - }, - { - "epoch": 1.79, - "learning_rate": 7.334739243754376e-07, - "loss": 0.7793, - "step": 70030 - }, - { - "epoch": 1.79, - "learning_rate": 7.334472549273116e-07, - "loss": 0.4722, - "step": 70031 - }, - { - "epoch": 1.79, - "learning_rate": 7.33420585683273e-07, - "loss": 0.7451, - "step": 70032 - }, - { - "epoch": 1.79, - "learning_rate": 7.333939166433421e-07, - "loss": 0.5708, - "step": 70033 - }, - { - "epoch": 1.8, - "learning_rate": 7.333672478075388e-07, - "loss": 0.6597, - "step": 70034 - }, - { - "epoch": 1.8, - "learning_rate": 7.333405791758842e-07, - "loss": 0.6445, - "step": 70035 - }, - { - "epoch": 1.8, - "learning_rate": 7.333139107483981e-07, - "loss": 0.7129, - "step": 70036 - }, - { - "epoch": 1.8, - "learning_rate": 7.332872425251017e-07, - "loss": 0.6885, - "step": 70037 - }, - { - "epoch": 1.8, - "learning_rate": 7.332605745060147e-07, - "loss": 0.3818, - "step": 70038 - }, - { - "epoch": 1.8, - "learning_rate": 7.332339066911579e-07, - "loss": 0.5791, - "step": 70039 - }, - { - "epoch": 1.8, - "learning_rate": 7.332072390805516e-07, - "loss": 0.5337, - "step": 70040 - }, - { - "epoch": 1.8, - "learning_rate": 7.331805716742165e-07, - "loss": 0.6875, - "step": 70041 - }, - { - "epoch": 1.8, - "learning_rate": 7.331539044721728e-07, - "loss": 0.6577, - "step": 70042 - }, - { - "epoch": 1.8, - "learning_rate": 7.331272374744408e-07, - "loss": 0.5935, - "step": 70043 - }, - { - "epoch": 1.8, - "learning_rate": 7.331005706810407e-07, - "loss": 0.7007, - "step": 70044 - }, - { - "epoch": 1.8, - "learning_rate": 7.330739040919934e-07, - "loss": 0.7422, - "step": 70045 - }, - { - "epoch": 1.8, - "learning_rate": 7.330472377073191e-07, - "loss": 0.5459, - "step": 70046 - }, - { - "epoch": 1.8, - "learning_rate": 7.330205715270383e-07, - "loss": 0.4849, - "step": 70047 - }, - { - "epoch": 1.8, - "learning_rate": 7.329939055511713e-07, - "loss": 0.6523, - "step": 70048 - }, - { - "epoch": 1.8, - "learning_rate": 7.329672397797386e-07, - "loss": 0.5918, - "step": 70049 - }, - { - "epoch": 1.8, - "learning_rate": 7.329405742127606e-07, - "loss": 0.6934, - "step": 70050 - }, - { - "epoch": 1.8, - "learning_rate": 7.329139088502579e-07, - "loss": 0.6406, - "step": 70051 - }, - { - "epoch": 1.8, - "learning_rate": 7.328872436922508e-07, - "loss": 0.623, - "step": 70052 - }, - { - "epoch": 1.8, - "learning_rate": 7.328605787387594e-07, - "loss": 0.6045, - "step": 70053 - }, - { - "epoch": 1.8, - "learning_rate": 7.328339139898046e-07, - "loss": 0.709, - "step": 70054 - }, - { - "epoch": 1.8, - "learning_rate": 7.328072494454063e-07, - "loss": 0.5098, - "step": 70055 - }, - { - "epoch": 1.8, - "learning_rate": 7.327805851055853e-07, - "loss": 0.6123, - "step": 70056 - }, - { - "epoch": 1.8, - "learning_rate": 7.327539209703619e-07, - "loss": 0.6519, - "step": 70057 - }, - { - "epoch": 1.8, - "learning_rate": 7.327272570397567e-07, - "loss": 0.6616, - "step": 70058 - }, - { - "epoch": 1.8, - "learning_rate": 7.327005933137896e-07, - "loss": 0.4763, - "step": 70059 - }, - { - "epoch": 1.8, - "learning_rate": 7.326739297924818e-07, - "loss": 0.7236, - "step": 70060 - }, - { - "epoch": 1.8, - "learning_rate": 7.326472664758531e-07, - "loss": 0.707, - "step": 70061 - }, - { - "epoch": 1.8, - "learning_rate": 7.326206033639244e-07, - "loss": 0.5859, - "step": 70062 - }, - { - "epoch": 1.8, - "learning_rate": 7.325939404567153e-07, - "loss": 0.708, - "step": 70063 - }, - { - "epoch": 1.8, - "learning_rate": 7.32567277754247e-07, - "loss": 0.6196, - "step": 70064 - }, - { - "epoch": 1.8, - "learning_rate": 7.325406152565394e-07, - "loss": 0.7051, - "step": 70065 - }, - { - "epoch": 1.8, - "learning_rate": 7.325139529636133e-07, - "loss": 0.6069, - "step": 70066 - }, - { - "epoch": 1.8, - "learning_rate": 7.324872908754888e-07, - "loss": 0.6455, - "step": 70067 - }, - { - "epoch": 1.8, - "learning_rate": 7.324606289921868e-07, - "loss": 0.5229, - "step": 70068 - }, - { - "epoch": 1.8, - "learning_rate": 7.324339673137272e-07, - "loss": 0.709, - "step": 70069 - }, - { - "epoch": 1.8, - "learning_rate": 7.324073058401308e-07, - "loss": 0.6465, - "step": 70070 - }, - { - "epoch": 1.8, - "learning_rate": 7.323806445714175e-07, - "loss": 0.6216, - "step": 70071 - }, - { - "epoch": 1.8, - "learning_rate": 7.323539835076084e-07, - "loss": 0.6953, - "step": 70072 - }, - { - "epoch": 1.8, - "learning_rate": 7.323273226487234e-07, - "loss": 0.752, - "step": 70073 - }, - { - "epoch": 1.8, - "learning_rate": 7.323006619947829e-07, - "loss": 0.7725, - "step": 70074 - }, - { - "epoch": 1.8, - "learning_rate": 7.322740015458078e-07, - "loss": 0.571, - "step": 70075 - }, - { - "epoch": 1.8, - "learning_rate": 7.322473413018178e-07, - "loss": 0.6758, - "step": 70076 - }, - { - "epoch": 1.8, - "learning_rate": 7.32220681262834e-07, - "loss": 0.6331, - "step": 70077 - }, - { - "epoch": 1.8, - "learning_rate": 7.321940214288765e-07, - "loss": 0.6987, - "step": 70078 - }, - { - "epoch": 1.8, - "learning_rate": 7.321673617999654e-07, - "loss": 0.6191, - "step": 70079 - }, - { - "epoch": 1.8, - "learning_rate": 7.321407023761217e-07, - "loss": 0.6099, - "step": 70080 - }, - { - "epoch": 1.8, - "learning_rate": 7.321140431573653e-07, - "loss": 0.5723, - "step": 70081 - }, - { - "epoch": 1.8, - "learning_rate": 7.320873841437174e-07, - "loss": 0.5615, - "step": 70082 - }, - { - "epoch": 1.8, - "learning_rate": 7.320607253351976e-07, - "loss": 0.6973, - "step": 70083 - }, - { - "epoch": 1.8, - "learning_rate": 7.320340667318265e-07, - "loss": 0.5393, - "step": 70084 - }, - { - "epoch": 1.8, - "learning_rate": 7.320074083336246e-07, - "loss": 0.666, - "step": 70085 - }, - { - "epoch": 1.8, - "learning_rate": 7.319807501406122e-07, - "loss": 0.6758, - "step": 70086 - }, - { - "epoch": 1.8, - "learning_rate": 7.3195409215281e-07, - "loss": 0.4636, - "step": 70087 - }, - { - "epoch": 1.8, - "learning_rate": 7.319274343702379e-07, - "loss": 0.4233, - "step": 70088 - }, - { - "epoch": 1.8, - "learning_rate": 7.319007767929171e-07, - "loss": 0.4948, - "step": 70089 - }, - { - "epoch": 1.8, - "learning_rate": 7.318741194208672e-07, - "loss": 0.6157, - "step": 70090 - }, - { - "epoch": 1.8, - "learning_rate": 7.318474622541091e-07, - "loss": 0.564, - "step": 70091 - }, - { - "epoch": 1.8, - "learning_rate": 7.318208052926634e-07, - "loss": 0.668, - "step": 70092 - }, - { - "epoch": 1.8, - "learning_rate": 7.317941485365497e-07, - "loss": 0.5815, - "step": 70093 - }, - { - "epoch": 1.8, - "learning_rate": 7.317674919857892e-07, - "loss": 0.4631, - "step": 70094 - }, - { - "epoch": 1.8, - "learning_rate": 7.317408356404016e-07, - "loss": 0.7568, - "step": 70095 - }, - { - "epoch": 1.8, - "learning_rate": 7.31714179500408e-07, - "loss": 0.7891, - "step": 70096 - }, - { - "epoch": 1.8, - "learning_rate": 7.316875235658287e-07, - "loss": 0.6538, - "step": 70097 - }, - { - "epoch": 1.8, - "learning_rate": 7.316608678366833e-07, - "loss": 0.7285, - "step": 70098 - }, - { - "epoch": 1.8, - "learning_rate": 7.316342123129935e-07, - "loss": 0.6025, - "step": 70099 - }, - { - "epoch": 1.8, - "learning_rate": 7.316075569947786e-07, - "loss": 0.6172, - "step": 70100 - }, - { - "epoch": 1.8, - "learning_rate": 7.315809018820595e-07, - "loss": 0.6816, - "step": 70101 - }, - { - "epoch": 1.8, - "learning_rate": 7.315542469748571e-07, - "loss": 0.5107, - "step": 70102 - }, - { - "epoch": 1.8, - "learning_rate": 7.315275922731907e-07, - "loss": 0.6191, - "step": 70103 - }, - { - "epoch": 1.8, - "learning_rate": 7.315009377770816e-07, - "loss": 0.5371, - "step": 70104 - }, - { - "epoch": 1.8, - "learning_rate": 7.314742834865495e-07, - "loss": 0.5374, - "step": 70105 - }, - { - "epoch": 1.8, - "learning_rate": 7.314476294016155e-07, - "loss": 0.5898, - "step": 70106 - }, - { - "epoch": 1.8, - "learning_rate": 7.314209755222993e-07, - "loss": 0.4438, - "step": 70107 - }, - { - "epoch": 1.8, - "learning_rate": 7.313943218486221e-07, - "loss": 0.5928, - "step": 70108 - }, - { - "epoch": 1.8, - "learning_rate": 7.313676683806038e-07, - "loss": 0.5581, - "step": 70109 - }, - { - "epoch": 1.8, - "learning_rate": 7.313410151182651e-07, - "loss": 0.5879, - "step": 70110 - }, - { - "epoch": 1.8, - "learning_rate": 7.313143620616258e-07, - "loss": 0.5122, - "step": 70111 - }, - { - "epoch": 1.8, - "learning_rate": 7.312877092107074e-07, - "loss": 0.6567, - "step": 70112 - }, - { - "epoch": 1.8, - "learning_rate": 7.312610565655292e-07, - "loss": 0.7842, - "step": 70113 - }, - { - "epoch": 1.8, - "learning_rate": 7.312344041261123e-07, - "loss": 0.5498, - "step": 70114 - }, - { - "epoch": 1.8, - "learning_rate": 7.312077518924765e-07, - "loss": 0.5986, - "step": 70115 - }, - { - "epoch": 1.8, - "learning_rate": 7.311810998646428e-07, - "loss": 0.4902, - "step": 70116 - }, - { - "epoch": 1.8, - "learning_rate": 7.311544480426313e-07, - "loss": 0.6377, - "step": 70117 - }, - { - "epoch": 1.8, - "learning_rate": 7.311277964264625e-07, - "loss": 0.52, - "step": 70118 - }, - { - "epoch": 1.8, - "learning_rate": 7.311011450161566e-07, - "loss": 0.6006, - "step": 70119 - }, - { - "epoch": 1.8, - "learning_rate": 7.310744938117344e-07, - "loss": 0.6357, - "step": 70120 - }, - { - "epoch": 1.8, - "learning_rate": 7.310478428132161e-07, - "loss": 0.7207, - "step": 70121 - }, - { - "epoch": 1.8, - "learning_rate": 7.310211920206222e-07, - "loss": 0.6675, - "step": 70122 - }, - { - "epoch": 1.8, - "learning_rate": 7.30994541433973e-07, - "loss": 0.7026, - "step": 70123 - }, - { - "epoch": 1.8, - "learning_rate": 7.309678910532886e-07, - "loss": 0.6353, - "step": 70124 - }, - { - "epoch": 1.8, - "learning_rate": 7.3094124087859e-07, - "loss": 0.4524, - "step": 70125 - }, - { - "epoch": 1.8, - "learning_rate": 7.30914590909897e-07, - "loss": 0.4702, - "step": 70126 - }, - { - "epoch": 1.8, - "learning_rate": 7.308879411472306e-07, - "loss": 0.5322, - "step": 70127 - }, - { - "epoch": 1.8, - "learning_rate": 7.308612915906108e-07, - "loss": 0.6562, - "step": 70128 - }, - { - "epoch": 1.8, - "learning_rate": 7.308346422400583e-07, - "loss": 0.6167, - "step": 70129 - }, - { - "epoch": 1.8, - "learning_rate": 7.30807993095593e-07, - "loss": 0.6836, - "step": 70130 - }, - { - "epoch": 1.8, - "learning_rate": 7.30781344157236e-07, - "loss": 0.6016, - "step": 70131 - }, - { - "epoch": 1.8, - "learning_rate": 7.307546954250076e-07, - "loss": 0.6963, - "step": 70132 - }, - { - "epoch": 1.8, - "learning_rate": 7.307280468989276e-07, - "loss": 0.6343, - "step": 70133 - }, - { - "epoch": 1.8, - "learning_rate": 7.307013985790166e-07, - "loss": 0.5552, - "step": 70134 - }, - { - "epoch": 1.8, - "learning_rate": 7.306747504652954e-07, - "loss": 0.6499, - "step": 70135 - }, - { - "epoch": 1.8, - "learning_rate": 7.306481025577838e-07, - "loss": 0.5735, - "step": 70136 - }, - { - "epoch": 1.8, - "learning_rate": 7.306214548565029e-07, - "loss": 0.627, - "step": 70137 - }, - { - "epoch": 1.8, - "learning_rate": 7.305948073614725e-07, - "loss": 0.5781, - "step": 70138 - }, - { - "epoch": 1.8, - "learning_rate": 7.305681600727136e-07, - "loss": 0.6196, - "step": 70139 - }, - { - "epoch": 1.8, - "learning_rate": 7.30541512990246e-07, - "loss": 0.6167, - "step": 70140 - }, - { - "epoch": 1.8, - "learning_rate": 7.305148661140905e-07, - "loss": 0.6914, - "step": 70141 - }, - { - "epoch": 1.8, - "learning_rate": 7.304882194442677e-07, - "loss": 0.5254, - "step": 70142 - }, - { - "epoch": 1.8, - "learning_rate": 7.304615729807971e-07, - "loss": 0.626, - "step": 70143 - }, - { - "epoch": 1.8, - "learning_rate": 7.304349267237e-07, - "loss": 0.6792, - "step": 70144 - }, - { - "epoch": 1.8, - "learning_rate": 7.304082806729964e-07, - "loss": 0.6865, - "step": 70145 - }, - { - "epoch": 1.8, - "learning_rate": 7.303816348287069e-07, - "loss": 0.6855, - "step": 70146 - }, - { - "epoch": 1.8, - "learning_rate": 7.303549891908514e-07, - "loss": 0.748, - "step": 70147 - }, - { - "epoch": 1.8, - "learning_rate": 7.303283437594509e-07, - "loss": 0.5391, - "step": 70148 - }, - { - "epoch": 1.8, - "learning_rate": 7.303016985345256e-07, - "loss": 0.7549, - "step": 70149 - }, - { - "epoch": 1.8, - "learning_rate": 7.30275053516096e-07, - "loss": 0.5991, - "step": 70150 - }, - { - "epoch": 1.8, - "learning_rate": 7.302484087041825e-07, - "loss": 0.7549, - "step": 70151 - }, - { - "epoch": 1.8, - "learning_rate": 7.302217640988054e-07, - "loss": 0.6514, - "step": 70152 - }, - { - "epoch": 1.8, - "learning_rate": 7.301951196999848e-07, - "loss": 0.59, - "step": 70153 - }, - { - "epoch": 1.8, - "learning_rate": 7.301684755077415e-07, - "loss": 0.6099, - "step": 70154 - }, - { - "epoch": 1.8, - "learning_rate": 7.301418315220958e-07, - "loss": 0.5889, - "step": 70155 - }, - { - "epoch": 1.8, - "learning_rate": 7.301151877430681e-07, - "loss": 0.6113, - "step": 70156 - }, - { - "epoch": 1.8, - "learning_rate": 7.300885441706786e-07, - "loss": 0.6514, - "step": 70157 - }, - { - "epoch": 1.8, - "learning_rate": 7.300619008049481e-07, - "loss": 0.6758, - "step": 70158 - }, - { - "epoch": 1.8, - "learning_rate": 7.300352576458966e-07, - "loss": 0.6841, - "step": 70159 - }, - { - "epoch": 1.8, - "learning_rate": 7.300086146935449e-07, - "loss": 0.6143, - "step": 70160 - }, - { - "epoch": 1.8, - "learning_rate": 7.29981971947913e-07, - "loss": 0.6387, - "step": 70161 - }, - { - "epoch": 1.8, - "learning_rate": 7.299553294090219e-07, - "loss": 0.791, - "step": 70162 - }, - { - "epoch": 1.8, - "learning_rate": 7.299286870768914e-07, - "loss": 0.6538, - "step": 70163 - }, - { - "epoch": 1.8, - "learning_rate": 7.299020449515419e-07, - "loss": 0.6523, - "step": 70164 - }, - { - "epoch": 1.8, - "learning_rate": 7.298754030329941e-07, - "loss": 0.6045, - "step": 70165 - }, - { - "epoch": 1.8, - "learning_rate": 7.29848761321268e-07, - "loss": 0.7822, - "step": 70166 - }, - { - "epoch": 1.8, - "learning_rate": 7.298221198163847e-07, - "loss": 0.7207, - "step": 70167 - }, - { - "epoch": 1.8, - "learning_rate": 7.297954785183641e-07, - "loss": 0.7002, - "step": 70168 - }, - { - "epoch": 1.8, - "learning_rate": 7.297688374272264e-07, - "loss": 0.6963, - "step": 70169 - }, - { - "epoch": 1.8, - "learning_rate": 7.297421965429926e-07, - "loss": 0.5259, - "step": 70170 - }, - { - "epoch": 1.8, - "learning_rate": 7.297155558656825e-07, - "loss": 0.5396, - "step": 70171 - }, - { - "epoch": 1.8, - "learning_rate": 7.296889153953172e-07, - "loss": 0.4915, - "step": 70172 - }, - { - "epoch": 1.8, - "learning_rate": 7.296622751319165e-07, - "loss": 0.7324, - "step": 70173 - }, - { - "epoch": 1.8, - "learning_rate": 7.296356350755007e-07, - "loss": 0.7402, - "step": 70174 - }, - { - "epoch": 1.8, - "learning_rate": 7.296089952260907e-07, - "loss": 0.5757, - "step": 70175 - }, - { - "epoch": 1.8, - "learning_rate": 7.295823555837064e-07, - "loss": 0.8008, - "step": 70176 - }, - { - "epoch": 1.8, - "learning_rate": 7.295557161483688e-07, - "loss": 0.7578, - "step": 70177 - }, - { - "epoch": 1.8, - "learning_rate": 7.295290769200975e-07, - "loss": 0.4276, - "step": 70178 - }, - { - "epoch": 1.8, - "learning_rate": 7.295024378989137e-07, - "loss": 0.6318, - "step": 70179 - }, - { - "epoch": 1.8, - "learning_rate": 7.294757990848373e-07, - "loss": 0.7021, - "step": 70180 - }, - { - "epoch": 1.8, - "learning_rate": 7.29449160477889e-07, - "loss": 0.6729, - "step": 70181 - }, - { - "epoch": 1.8, - "learning_rate": 7.294225220780892e-07, - "loss": 0.6865, - "step": 70182 - }, - { - "epoch": 1.8, - "learning_rate": 7.293958838854577e-07, - "loss": 0.5201, - "step": 70183 - }, - { - "epoch": 1.8, - "learning_rate": 7.293692459000156e-07, - "loss": 0.4905, - "step": 70184 - }, - { - "epoch": 1.8, - "learning_rate": 7.293426081217828e-07, - "loss": 0.5747, - "step": 70185 - }, - { - "epoch": 1.8, - "learning_rate": 7.293159705507801e-07, - "loss": 0.6484, - "step": 70186 - }, - { - "epoch": 1.8, - "learning_rate": 7.292893331870277e-07, - "loss": 0.6294, - "step": 70187 - }, - { - "epoch": 1.8, - "learning_rate": 7.29262696030546e-07, - "loss": 0.6499, - "step": 70188 - }, - { - "epoch": 1.8, - "learning_rate": 7.292360590813555e-07, - "loss": 0.7168, - "step": 70189 - }, - { - "epoch": 1.8, - "learning_rate": 7.292094223394762e-07, - "loss": 0.6816, - "step": 70190 - }, - { - "epoch": 1.8, - "learning_rate": 7.291827858049291e-07, - "loss": 0.6104, - "step": 70191 - }, - { - "epoch": 1.8, - "learning_rate": 7.291561494777343e-07, - "loss": 0.5103, - "step": 70192 - }, - { - "epoch": 1.8, - "learning_rate": 7.29129513357912e-07, - "loss": 0.6895, - "step": 70193 - }, - { - "epoch": 1.8, - "learning_rate": 7.291028774454828e-07, - "loss": 0.7119, - "step": 70194 - }, - { - "epoch": 1.8, - "learning_rate": 7.29076241740467e-07, - "loss": 0.7666, - "step": 70195 - }, - { - "epoch": 1.8, - "learning_rate": 7.290496062428853e-07, - "loss": 0.5776, - "step": 70196 - }, - { - "epoch": 1.8, - "learning_rate": 7.290229709527575e-07, - "loss": 0.6172, - "step": 70197 - }, - { - "epoch": 1.8, - "learning_rate": 7.289963358701048e-07, - "loss": 0.6426, - "step": 70198 - }, - { - "epoch": 1.8, - "learning_rate": 7.289697009949467e-07, - "loss": 0.7344, - "step": 70199 - }, - { - "epoch": 1.8, - "learning_rate": 7.289430663273044e-07, - "loss": 0.7959, - "step": 70200 - }, - { - "epoch": 1.8, - "learning_rate": 7.289164318671976e-07, - "loss": 0.6289, - "step": 70201 - }, - { - "epoch": 1.8, - "learning_rate": 7.288897976146475e-07, - "loss": 0.6836, - "step": 70202 - }, - { - "epoch": 1.8, - "learning_rate": 7.288631635696738e-07, - "loss": 0.6665, - "step": 70203 - }, - { - "epoch": 1.8, - "learning_rate": 7.288365297322971e-07, - "loss": 0.6279, - "step": 70204 - }, - { - "epoch": 1.8, - "learning_rate": 7.288098961025375e-07, - "loss": 0.7188, - "step": 70205 - }, - { - "epoch": 1.8, - "learning_rate": 7.28783262680416e-07, - "loss": 0.6235, - "step": 70206 - }, - { - "epoch": 1.8, - "learning_rate": 7.287566294659526e-07, - "loss": 0.5723, - "step": 70207 - }, - { - "epoch": 1.8, - "learning_rate": 7.287299964591677e-07, - "loss": 0.5908, - "step": 70208 - }, - { - "epoch": 1.8, - "learning_rate": 7.287033636600819e-07, - "loss": 0.6636, - "step": 70209 - }, - { - "epoch": 1.8, - "learning_rate": 7.286767310687154e-07, - "loss": 0.603, - "step": 70210 - }, - { - "epoch": 1.8, - "learning_rate": 7.286500986850885e-07, - "loss": 0.6865, - "step": 70211 - }, - { - "epoch": 1.8, - "learning_rate": 7.286234665092223e-07, - "loss": 0.5771, - "step": 70212 - }, - { - "epoch": 1.8, - "learning_rate": 7.285968345411363e-07, - "loss": 0.543, - "step": 70213 - }, - { - "epoch": 1.8, - "learning_rate": 7.28570202780851e-07, - "loss": 0.4961, - "step": 70214 - }, - { - "epoch": 1.8, - "learning_rate": 7.285435712283873e-07, - "loss": 0.7549, - "step": 70215 - }, - { - "epoch": 1.8, - "learning_rate": 7.285169398837651e-07, - "loss": 0.4469, - "step": 70216 - }, - { - "epoch": 1.8, - "learning_rate": 7.284903087470051e-07, - "loss": 0.5469, - "step": 70217 - }, - { - "epoch": 1.8, - "learning_rate": 7.284636778181275e-07, - "loss": 0.5281, - "step": 70218 - }, - { - "epoch": 1.8, - "learning_rate": 7.284370470971528e-07, - "loss": 0.7139, - "step": 70219 - }, - { - "epoch": 1.8, - "learning_rate": 7.284104165841014e-07, - "loss": 0.5718, - "step": 70220 - }, - { - "epoch": 1.8, - "learning_rate": 7.283837862789936e-07, - "loss": 0.6592, - "step": 70221 - }, - { - "epoch": 1.8, - "learning_rate": 7.283571561818502e-07, - "loss": 0.6045, - "step": 70222 - }, - { - "epoch": 1.8, - "learning_rate": 7.283305262926911e-07, - "loss": 0.5923, - "step": 70223 - }, - { - "epoch": 1.8, - "learning_rate": 7.283038966115364e-07, - "loss": 0.6909, - "step": 70224 - }, - { - "epoch": 1.8, - "learning_rate": 7.282772671384074e-07, - "loss": 0.6992, - "step": 70225 - }, - { - "epoch": 1.8, - "learning_rate": 7.282506378733236e-07, - "loss": 0.6367, - "step": 70226 - }, - { - "epoch": 1.8, - "learning_rate": 7.282240088163061e-07, - "loss": 0.6008, - "step": 70227 - }, - { - "epoch": 1.8, - "learning_rate": 7.281973799673747e-07, - "loss": 0.7676, - "step": 70228 - }, - { - "epoch": 1.8, - "learning_rate": 7.281707513265503e-07, - "loss": 0.606, - "step": 70229 - }, - { - "epoch": 1.8, - "learning_rate": 7.281441228938529e-07, - "loss": 0.8135, - "step": 70230 - }, - { - "epoch": 1.8, - "learning_rate": 7.281174946693032e-07, - "loss": 0.7036, - "step": 70231 - }, - { - "epoch": 1.8, - "learning_rate": 7.280908666529217e-07, - "loss": 0.6211, - "step": 70232 - }, - { - "epoch": 1.8, - "learning_rate": 7.28064238844728e-07, - "loss": 0.7749, - "step": 70233 - }, - { - "epoch": 1.8, - "learning_rate": 7.280376112447433e-07, - "loss": 0.595, - "step": 70234 - }, - { - "epoch": 1.8, - "learning_rate": 7.280109838529875e-07, - "loss": 0.4766, - "step": 70235 - }, - { - "epoch": 1.8, - "learning_rate": 7.279843566694812e-07, - "loss": 0.6162, - "step": 70236 - }, - { - "epoch": 1.8, - "learning_rate": 7.279577296942448e-07, - "loss": 0.5864, - "step": 70237 - }, - { - "epoch": 1.8, - "learning_rate": 7.279311029272988e-07, - "loss": 0.5989, - "step": 70238 - }, - { - "epoch": 1.8, - "learning_rate": 7.279044763686631e-07, - "loss": 0.7075, - "step": 70239 - }, - { - "epoch": 1.8, - "learning_rate": 7.278778500183589e-07, - "loss": 0.5679, - "step": 70240 - }, - { - "epoch": 1.8, - "learning_rate": 7.278512238764059e-07, - "loss": 0.6963, - "step": 70241 - }, - { - "epoch": 1.8, - "learning_rate": 7.27824597942825e-07, - "loss": 0.6748, - "step": 70242 - }, - { - "epoch": 1.8, - "learning_rate": 7.277979722176358e-07, - "loss": 0.5254, - "step": 70243 - }, - { - "epoch": 1.8, - "learning_rate": 7.277713467008595e-07, - "loss": 0.6211, - "step": 70244 - }, - { - "epoch": 1.8, - "learning_rate": 7.277447213925159e-07, - "loss": 0.6699, - "step": 70245 - }, - { - "epoch": 1.8, - "learning_rate": 7.277180962926258e-07, - "loss": 0.6846, - "step": 70246 - }, - { - "epoch": 1.8, - "learning_rate": 7.276914714012092e-07, - "loss": 0.71, - "step": 70247 - }, - { - "epoch": 1.8, - "learning_rate": 7.276648467182871e-07, - "loss": 0.6641, - "step": 70248 - }, - { - "epoch": 1.8, - "learning_rate": 7.276382222438792e-07, - "loss": 0.5249, - "step": 70249 - }, - { - "epoch": 1.8, - "learning_rate": 7.276115979780064e-07, - "loss": 0.5112, - "step": 70250 - }, - { - "epoch": 1.8, - "learning_rate": 7.275849739206887e-07, - "loss": 0.3789, - "step": 70251 - }, - { - "epoch": 1.8, - "learning_rate": 7.27558350071947e-07, - "loss": 0.5059, - "step": 70252 - }, - { - "epoch": 1.8, - "learning_rate": 7.275317264318012e-07, - "loss": 0.5933, - "step": 70253 - }, - { - "epoch": 1.8, - "learning_rate": 7.275051030002716e-07, - "loss": 0.6338, - "step": 70254 - }, - { - "epoch": 1.8, - "learning_rate": 7.27478479777379e-07, - "loss": 0.585, - "step": 70255 - }, - { - "epoch": 1.8, - "learning_rate": 7.274518567631433e-07, - "loss": 0.5864, - "step": 70256 - }, - { - "epoch": 1.8, - "learning_rate": 7.274252339575856e-07, - "loss": 0.5962, - "step": 70257 - }, - { - "epoch": 1.8, - "learning_rate": 7.273986113607256e-07, - "loss": 0.7073, - "step": 70258 - }, - { - "epoch": 1.8, - "learning_rate": 7.27371988972584e-07, - "loss": 0.4501, - "step": 70259 - }, - { - "epoch": 1.8, - "learning_rate": 7.273453667931813e-07, - "loss": 0.6743, - "step": 70260 - }, - { - "epoch": 1.8, - "learning_rate": 7.273187448225374e-07, - "loss": 0.5342, - "step": 70261 - }, - { - "epoch": 1.8, - "learning_rate": 7.272921230606734e-07, - "loss": 0.6689, - "step": 70262 - }, - { - "epoch": 1.8, - "learning_rate": 7.272655015076093e-07, - "loss": 0.4846, - "step": 70263 - }, - { - "epoch": 1.8, - "learning_rate": 7.272388801633651e-07, - "loss": 0.5918, - "step": 70264 - }, - { - "epoch": 1.8, - "learning_rate": 7.272122590279617e-07, - "loss": 0.4517, - "step": 70265 - }, - { - "epoch": 1.8, - "learning_rate": 7.271856381014192e-07, - "loss": 0.667, - "step": 70266 - }, - { - "epoch": 1.8, - "learning_rate": 7.271590173837583e-07, - "loss": 0.6421, - "step": 70267 - }, - { - "epoch": 1.8, - "learning_rate": 7.27132396874999e-07, - "loss": 0.7549, - "step": 70268 - }, - { - "epoch": 1.8, - "learning_rate": 7.27105776575162e-07, - "loss": 0.4805, - "step": 70269 - }, - { - "epoch": 1.8, - "learning_rate": 7.270791564842673e-07, - "loss": 0.5781, - "step": 70270 - }, - { - "epoch": 1.8, - "learning_rate": 7.270525366023359e-07, - "loss": 0.6289, - "step": 70271 - }, - { - "epoch": 1.8, - "learning_rate": 7.270259169293879e-07, - "loss": 0.8623, - "step": 70272 - }, - { - "epoch": 1.8, - "learning_rate": 7.269992974654434e-07, - "loss": 0.4548, - "step": 70273 - }, - { - "epoch": 1.8, - "learning_rate": 7.269726782105231e-07, - "loss": 0.6641, - "step": 70274 - }, - { - "epoch": 1.8, - "learning_rate": 7.26946059164647e-07, - "loss": 0.5771, - "step": 70275 - }, - { - "epoch": 1.8, - "learning_rate": 7.26919440327836e-07, - "loss": 0.6367, - "step": 70276 - }, - { - "epoch": 1.8, - "learning_rate": 7.268928217001102e-07, - "loss": 0.6089, - "step": 70277 - }, - { - "epoch": 1.8, - "learning_rate": 7.268662032814899e-07, - "loss": 0.667, - "step": 70278 - }, - { - "epoch": 1.8, - "learning_rate": 7.268395850719957e-07, - "loss": 0.6602, - "step": 70279 - }, - { - "epoch": 1.8, - "learning_rate": 7.268129670716477e-07, - "loss": 0.5547, - "step": 70280 - }, - { - "epoch": 1.8, - "learning_rate": 7.267863492804666e-07, - "loss": 0.543, - "step": 70281 - }, - { - "epoch": 1.8, - "learning_rate": 7.267597316984728e-07, - "loss": 0.5923, - "step": 70282 - }, - { - "epoch": 1.8, - "learning_rate": 7.267331143256863e-07, - "loss": 0.6094, - "step": 70283 - }, - { - "epoch": 1.8, - "learning_rate": 7.267064971621277e-07, - "loss": 0.7383, - "step": 70284 - }, - { - "epoch": 1.8, - "learning_rate": 7.266798802078172e-07, - "loss": 0.7783, - "step": 70285 - }, - { - "epoch": 1.8, - "learning_rate": 7.266532634627755e-07, - "loss": 0.6787, - "step": 70286 - }, - { - "epoch": 1.8, - "learning_rate": 7.266266469270228e-07, - "loss": 0.6448, - "step": 70287 - }, - { - "epoch": 1.8, - "learning_rate": 7.266000306005796e-07, - "loss": 0.4209, - "step": 70288 - }, - { - "epoch": 1.8, - "learning_rate": 7.265734144834659e-07, - "loss": 0.7607, - "step": 70289 - }, - { - "epoch": 1.8, - "learning_rate": 7.265467985757028e-07, - "loss": 0.6533, - "step": 70290 - }, - { - "epoch": 1.8, - "learning_rate": 7.265201828773097e-07, - "loss": 0.5762, - "step": 70291 - }, - { - "epoch": 1.8, - "learning_rate": 7.264935673883084e-07, - "loss": 0.6152, - "step": 70292 - }, - { - "epoch": 1.8, - "learning_rate": 7.264669521087178e-07, - "loss": 0.7725, - "step": 70293 - }, - { - "epoch": 1.8, - "learning_rate": 7.26440337038559e-07, - "loss": 0.4767, - "step": 70294 - }, - { - "epoch": 1.8, - "learning_rate": 7.264137221778521e-07, - "loss": 0.875, - "step": 70295 - }, - { - "epoch": 1.8, - "learning_rate": 7.263871075266177e-07, - "loss": 0.5073, - "step": 70296 - }, - { - "epoch": 1.8, - "learning_rate": 7.26360493084876e-07, - "loss": 0.6982, - "step": 70297 - }, - { - "epoch": 1.8, - "learning_rate": 7.263338788526477e-07, - "loss": 0.6212, - "step": 70298 - }, - { - "epoch": 1.8, - "learning_rate": 7.263072648299528e-07, - "loss": 0.3146, - "step": 70299 - }, - { - "epoch": 1.8, - "learning_rate": 7.262806510168121e-07, - "loss": 0.559, - "step": 70300 - }, - { - "epoch": 1.8, - "learning_rate": 7.262540374132453e-07, - "loss": 0.5425, - "step": 70301 - }, - { - "epoch": 1.8, - "learning_rate": 7.262274240192737e-07, - "loss": 0.6084, - "step": 70302 - }, - { - "epoch": 1.8, - "learning_rate": 7.26200810834917e-07, - "loss": 0.6602, - "step": 70303 - }, - { - "epoch": 1.8, - "learning_rate": 7.261741978601955e-07, - "loss": 0.5552, - "step": 70304 - }, - { - "epoch": 1.8, - "learning_rate": 7.261475850951301e-07, - "loss": 0.6367, - "step": 70305 - }, - { - "epoch": 1.8, - "learning_rate": 7.261209725397406e-07, - "loss": 0.5327, - "step": 70306 - }, - { - "epoch": 1.8, - "learning_rate": 7.260943601940479e-07, - "loss": 0.4844, - "step": 70307 - }, - { - "epoch": 1.8, - "learning_rate": 7.260677480580722e-07, - "loss": 0.4421, - "step": 70308 - }, - { - "epoch": 1.8, - "learning_rate": 7.260411361318337e-07, - "loss": 0.6816, - "step": 70309 - }, - { - "epoch": 1.8, - "learning_rate": 7.260145244153528e-07, - "loss": 0.6064, - "step": 70310 - }, - { - "epoch": 1.8, - "learning_rate": 7.259879129086503e-07, - "loss": 0.6353, - "step": 70311 - }, - { - "epoch": 1.8, - "learning_rate": 7.259613016117463e-07, - "loss": 0.6538, - "step": 70312 - }, - { - "epoch": 1.8, - "learning_rate": 7.259346905246611e-07, - "loss": 0.6807, - "step": 70313 - }, - { - "epoch": 1.8, - "learning_rate": 7.259080796474146e-07, - "loss": 0.8154, - "step": 70314 - }, - { - "epoch": 1.8, - "learning_rate": 7.258814689800281e-07, - "loss": 0.6421, - "step": 70315 - }, - { - "epoch": 1.8, - "learning_rate": 7.258548585225214e-07, - "loss": 0.5225, - "step": 70316 - }, - { - "epoch": 1.8, - "learning_rate": 7.258282482749152e-07, - "loss": 0.4937, - "step": 70317 - }, - { - "epoch": 1.8, - "learning_rate": 7.258016382372294e-07, - "loss": 0.5334, - "step": 70318 - }, - { - "epoch": 1.8, - "learning_rate": 7.25775028409485e-07, - "loss": 0.5312, - "step": 70319 - }, - { - "epoch": 1.8, - "learning_rate": 7.257484187917018e-07, - "loss": 0.6597, - "step": 70320 - }, - { - "epoch": 1.8, - "learning_rate": 7.257218093839005e-07, - "loss": 0.7148, - "step": 70321 - }, - { - "epoch": 1.8, - "learning_rate": 7.256952001861019e-07, - "loss": 0.6748, - "step": 70322 - }, - { - "epoch": 1.8, - "learning_rate": 7.256685911983252e-07, - "loss": 0.8379, - "step": 70323 - }, - { - "epoch": 1.8, - "learning_rate": 7.256419824205917e-07, - "loss": 0.5608, - "step": 70324 - }, - { - "epoch": 1.8, - "learning_rate": 7.256153738529214e-07, - "loss": 0.6357, - "step": 70325 - }, - { - "epoch": 1.8, - "learning_rate": 7.25588765495335e-07, - "loss": 0.4661, - "step": 70326 - }, - { - "epoch": 1.8, - "learning_rate": 7.255621573478523e-07, - "loss": 0.4341, - "step": 70327 - }, - { - "epoch": 1.8, - "learning_rate": 7.255355494104945e-07, - "loss": 0.4458, - "step": 70328 - }, - { - "epoch": 1.8, - "learning_rate": 7.255089416832812e-07, - "loss": 0.7734, - "step": 70329 - }, - { - "epoch": 1.8, - "learning_rate": 7.25482334166233e-07, - "loss": 0.4089, - "step": 70330 - }, - { - "epoch": 1.8, - "learning_rate": 7.254557268593707e-07, - "loss": 0.6294, - "step": 70331 - }, - { - "epoch": 1.8, - "learning_rate": 7.254291197627145e-07, - "loss": 0.463, - "step": 70332 - }, - { - "epoch": 1.8, - "learning_rate": 7.25402512876284e-07, - "loss": 0.6572, - "step": 70333 - }, - { - "epoch": 1.8, - "learning_rate": 7.253759062001005e-07, - "loss": 0.6943, - "step": 70334 - }, - { - "epoch": 1.8, - "learning_rate": 7.253492997341839e-07, - "loss": 0.7803, - "step": 70335 - }, - { - "epoch": 1.8, - "learning_rate": 7.253226934785548e-07, - "loss": 0.5537, - "step": 70336 - }, - { - "epoch": 1.8, - "learning_rate": 7.252960874332335e-07, - "loss": 0.5028, - "step": 70337 - }, - { - "epoch": 1.8, - "learning_rate": 7.252694815982403e-07, - "loss": 0.4043, - "step": 70338 - }, - { - "epoch": 1.8, - "learning_rate": 7.252428759735955e-07, - "loss": 0.6758, - "step": 70339 - }, - { - "epoch": 1.8, - "learning_rate": 7.252162705593198e-07, - "loss": 0.553, - "step": 70340 - }, - { - "epoch": 1.8, - "learning_rate": 7.251896653554336e-07, - "loss": 0.6562, - "step": 70341 - }, - { - "epoch": 1.8, - "learning_rate": 7.251630603619566e-07, - "loss": 0.5542, - "step": 70342 - }, - { - "epoch": 1.8, - "learning_rate": 7.251364555789098e-07, - "loss": 0.5442, - "step": 70343 - }, - { - "epoch": 1.8, - "learning_rate": 7.251098510063131e-07, - "loss": 0.7505, - "step": 70344 - }, - { - "epoch": 1.8, - "learning_rate": 7.250832466441876e-07, - "loss": 0.5962, - "step": 70345 - }, - { - "epoch": 1.8, - "learning_rate": 7.250566424925528e-07, - "loss": 0.5608, - "step": 70346 - }, - { - "epoch": 1.8, - "learning_rate": 7.250300385514296e-07, - "loss": 0.5674, - "step": 70347 - }, - { - "epoch": 1.8, - "learning_rate": 7.250034348208383e-07, - "loss": 0.5693, - "step": 70348 - }, - { - "epoch": 1.8, - "learning_rate": 7.249768313007994e-07, - "loss": 0.7178, - "step": 70349 - }, - { - "epoch": 1.8, - "learning_rate": 7.249502279913329e-07, - "loss": 0.5615, - "step": 70350 - }, - { - "epoch": 1.8, - "learning_rate": 7.249236248924597e-07, - "loss": 0.6091, - "step": 70351 - }, - { - "epoch": 1.8, - "learning_rate": 7.248970220041994e-07, - "loss": 0.6646, - "step": 70352 - }, - { - "epoch": 1.8, - "learning_rate": 7.248704193265731e-07, - "loss": 0.666, - "step": 70353 - }, - { - "epoch": 1.8, - "learning_rate": 7.248438168596005e-07, - "loss": 0.6147, - "step": 70354 - }, - { - "epoch": 1.8, - "learning_rate": 7.248172146033027e-07, - "loss": 0.6807, - "step": 70355 - }, - { - "epoch": 1.8, - "learning_rate": 7.247906125576995e-07, - "loss": 0.7109, - "step": 70356 - }, - { - "epoch": 1.8, - "learning_rate": 7.247640107228115e-07, - "loss": 0.751, - "step": 70357 - }, - { - "epoch": 1.8, - "learning_rate": 7.247374090986589e-07, - "loss": 0.6543, - "step": 70358 - }, - { - "epoch": 1.8, - "learning_rate": 7.247108076852625e-07, - "loss": 0.6782, - "step": 70359 - }, - { - "epoch": 1.8, - "learning_rate": 7.246842064826421e-07, - "loss": 0.7378, - "step": 70360 - }, - { - "epoch": 1.8, - "learning_rate": 7.246576054908188e-07, - "loss": 0.5308, - "step": 70361 - }, - { - "epoch": 1.8, - "learning_rate": 7.246310047098123e-07, - "loss": 0.4829, - "step": 70362 - }, - { - "epoch": 1.8, - "learning_rate": 7.246044041396429e-07, - "loss": 0.4998, - "step": 70363 - }, - { - "epoch": 1.8, - "learning_rate": 7.245778037803316e-07, - "loss": 0.5698, - "step": 70364 - }, - { - "epoch": 1.8, - "learning_rate": 7.245512036318982e-07, - "loss": 0.6128, - "step": 70365 - }, - { - "epoch": 1.8, - "learning_rate": 7.245246036943633e-07, - "loss": 0.8086, - "step": 70366 - }, - { - "epoch": 1.8, - "learning_rate": 7.244980039677473e-07, - "loss": 0.6162, - "step": 70367 - }, - { - "epoch": 1.8, - "learning_rate": 7.244714044520703e-07, - "loss": 0.752, - "step": 70368 - }, - { - "epoch": 1.8, - "learning_rate": 7.244448051473531e-07, - "loss": 0.6997, - "step": 70369 - }, - { - "epoch": 1.8, - "learning_rate": 7.244182060536157e-07, - "loss": 0.7466, - "step": 70370 - }, - { - "epoch": 1.8, - "learning_rate": 7.243916071708791e-07, - "loss": 0.5898, - "step": 70371 - }, - { - "epoch": 1.8, - "learning_rate": 7.243650084991628e-07, - "loss": 0.5559, - "step": 70372 - }, - { - "epoch": 1.8, - "learning_rate": 7.243384100384873e-07, - "loss": 0.8076, - "step": 70373 - }, - { - "epoch": 1.8, - "learning_rate": 7.243118117888736e-07, - "loss": 0.5127, - "step": 70374 - }, - { - "epoch": 1.8, - "learning_rate": 7.242852137503412e-07, - "loss": 0.6934, - "step": 70375 - }, - { - "epoch": 1.8, - "learning_rate": 7.242586159229113e-07, - "loss": 0.6992, - "step": 70376 - }, - { - "epoch": 1.8, - "learning_rate": 7.242320183066038e-07, - "loss": 0.6455, - "step": 70377 - }, - { - "epoch": 1.8, - "learning_rate": 7.242054209014392e-07, - "loss": 0.7036, - "step": 70378 - }, - { - "epoch": 1.8, - "learning_rate": 7.241788237074377e-07, - "loss": 0.7773, - "step": 70379 - }, - { - "epoch": 1.8, - "learning_rate": 7.241522267246201e-07, - "loss": 0.572, - "step": 70380 - }, - { - "epoch": 1.8, - "learning_rate": 7.241256299530065e-07, - "loss": 0.3828, - "step": 70381 - }, - { - "epoch": 1.8, - "learning_rate": 7.240990333926168e-07, - "loss": 0.7095, - "step": 70382 - }, - { - "epoch": 1.8, - "learning_rate": 7.240724370434721e-07, - "loss": 0.4741, - "step": 70383 - }, - { - "epoch": 1.8, - "learning_rate": 7.240458409055923e-07, - "loss": 0.8047, - "step": 70384 - }, - { - "epoch": 1.8, - "learning_rate": 7.240192449789979e-07, - "loss": 0.7432, - "step": 70385 - }, - { - "epoch": 1.8, - "learning_rate": 7.239926492637094e-07, - "loss": 0.6934, - "step": 70386 - }, - { - "epoch": 1.8, - "learning_rate": 7.239660537597467e-07, - "loss": 0.8896, - "step": 70387 - }, - { - "epoch": 1.8, - "learning_rate": 7.239394584671308e-07, - "loss": 0.4351, - "step": 70388 - }, - { - "epoch": 1.8, - "learning_rate": 7.239128633858816e-07, - "loss": 0.3593, - "step": 70389 - }, - { - "epoch": 1.8, - "learning_rate": 7.238862685160199e-07, - "loss": 0.6172, - "step": 70390 - }, - { - "epoch": 1.8, - "learning_rate": 7.238596738575657e-07, - "loss": 0.7861, - "step": 70391 - }, - { - "epoch": 1.8, - "learning_rate": 7.238330794105394e-07, - "loss": 0.6689, - "step": 70392 - }, - { - "epoch": 1.8, - "learning_rate": 7.238064851749614e-07, - "loss": 0.7305, - "step": 70393 - }, - { - "epoch": 1.8, - "learning_rate": 7.237798911508519e-07, - "loss": 0.4209, - "step": 70394 - }, - { - "epoch": 1.8, - "learning_rate": 7.237532973382316e-07, - "loss": 0.4961, - "step": 70395 - }, - { - "epoch": 1.8, - "learning_rate": 7.237267037371206e-07, - "loss": 0.7505, - "step": 70396 - }, - { - "epoch": 1.8, - "learning_rate": 7.237001103475396e-07, - "loss": 0.6904, - "step": 70397 - }, - { - "epoch": 1.8, - "learning_rate": 7.236735171695084e-07, - "loss": 0.4932, - "step": 70398 - }, - { - "epoch": 1.8, - "learning_rate": 7.236469242030479e-07, - "loss": 0.6211, - "step": 70399 - }, - { - "epoch": 1.8, - "learning_rate": 7.23620331448178e-07, - "loss": 0.6465, - "step": 70400 - }, - { - "epoch": 1.8, - "learning_rate": 7.2359373890492e-07, - "loss": 0.7695, - "step": 70401 - }, - { - "epoch": 1.8, - "learning_rate": 7.23567146573293e-07, - "loss": 0.6396, - "step": 70402 - }, - { - "epoch": 1.8, - "learning_rate": 7.235405544533179e-07, - "loss": 0.6211, - "step": 70403 - }, - { - "epoch": 1.8, - "learning_rate": 7.235139625450152e-07, - "loss": 0.6514, - "step": 70404 - }, - { - "epoch": 1.8, - "learning_rate": 7.234873708484052e-07, - "loss": 0.708, - "step": 70405 - }, - { - "epoch": 1.8, - "learning_rate": 7.23460779363508e-07, - "loss": 0.6523, - "step": 70406 - }, - { - "epoch": 1.8, - "learning_rate": 7.234341880903443e-07, - "loss": 0.5488, - "step": 70407 - }, - { - "epoch": 1.8, - "learning_rate": 7.234075970289342e-07, - "loss": 0.5967, - "step": 70408 - }, - { - "epoch": 1.8, - "learning_rate": 7.233810061792984e-07, - "loss": 0.5234, - "step": 70409 - }, - { - "epoch": 1.8, - "learning_rate": 7.233544155414569e-07, - "loss": 0.45, - "step": 70410 - }, - { - "epoch": 1.8, - "learning_rate": 7.233278251154304e-07, - "loss": 0.6699, - "step": 70411 - }, - { - "epoch": 1.8, - "learning_rate": 7.23301234901239e-07, - "loss": 0.54, - "step": 70412 - }, - { - "epoch": 1.8, - "learning_rate": 7.232746448989029e-07, - "loss": 0.6787, - "step": 70413 - }, - { - "epoch": 1.8, - "learning_rate": 7.232480551084428e-07, - "loss": 0.6768, - "step": 70414 - }, - { - "epoch": 1.8, - "learning_rate": 7.232214655298789e-07, - "loss": 0.7402, - "step": 70415 - }, - { - "epoch": 1.8, - "learning_rate": 7.231948761632317e-07, - "loss": 0.533, - "step": 70416 - }, - { - "epoch": 1.8, - "learning_rate": 7.231682870085212e-07, - "loss": 0.604, - "step": 70417 - }, - { - "epoch": 1.8, - "learning_rate": 7.231416980657683e-07, - "loss": 0.5747, - "step": 70418 - }, - { - "epoch": 1.8, - "learning_rate": 7.231151093349928e-07, - "loss": 0.6001, - "step": 70419 - }, - { - "epoch": 1.8, - "learning_rate": 7.230885208162156e-07, - "loss": 0.6592, - "step": 70420 - }, - { - "epoch": 1.8, - "learning_rate": 7.230619325094572e-07, - "loss": 0.5146, - "step": 70421 - }, - { - "epoch": 1.8, - "learning_rate": 7.23035344414737e-07, - "loss": 0.5527, - "step": 70422 - }, - { - "epoch": 1.8, - "learning_rate": 7.230087565320758e-07, - "loss": 0.3786, - "step": 70423 - }, - { - "epoch": 1.81, - "learning_rate": 7.229821688614943e-07, - "loss": 0.5723, - "step": 70424 - }, - { - "epoch": 1.81, - "learning_rate": 7.229555814030124e-07, - "loss": 0.5703, - "step": 70425 - }, - { - "epoch": 1.81, - "learning_rate": 7.229289941566508e-07, - "loss": 0.623, - "step": 70426 - }, - { - "epoch": 1.81, - "learning_rate": 7.229024071224297e-07, - "loss": 0.3494, - "step": 70427 - }, - { - "epoch": 1.81, - "learning_rate": 7.228758203003695e-07, - "loss": 0.709, - "step": 70428 - }, - { - "epoch": 1.81, - "learning_rate": 7.228492336904904e-07, - "loss": 0.8096, - "step": 70429 - }, - { - "epoch": 1.81, - "learning_rate": 7.228226472928131e-07, - "loss": 0.5181, - "step": 70430 - }, - { - "epoch": 1.81, - "learning_rate": 7.22796061107358e-07, - "loss": 0.6621, - "step": 70431 - }, - { - "epoch": 1.81, - "learning_rate": 7.227694751341448e-07, - "loss": 0.7588, - "step": 70432 - }, - { - "epoch": 1.81, - "learning_rate": 7.227428893731945e-07, - "loss": 0.5168, - "step": 70433 - }, - { - "epoch": 1.81, - "learning_rate": 7.22716303824527e-07, - "loss": 0.665, - "step": 70434 - }, - { - "epoch": 1.81, - "learning_rate": 7.22689718488163e-07, - "loss": 0.5645, - "step": 70435 - }, - { - "epoch": 1.81, - "learning_rate": 7.226631333641227e-07, - "loss": 0.582, - "step": 70436 - }, - { - "epoch": 1.81, - "learning_rate": 7.226365484524264e-07, - "loss": 0.6562, - "step": 70437 - }, - { - "epoch": 1.81, - "learning_rate": 7.226099637530946e-07, - "loss": 0.645, - "step": 70438 - }, - { - "epoch": 1.81, - "learning_rate": 7.225833792661476e-07, - "loss": 0.7383, - "step": 70439 - }, - { - "epoch": 1.81, - "learning_rate": 7.22556794991606e-07, - "loss": 0.6606, - "step": 70440 - }, - { - "epoch": 1.81, - "learning_rate": 7.2253021092949e-07, - "loss": 0.6611, - "step": 70441 - }, - { - "epoch": 1.81, - "learning_rate": 7.225036270798193e-07, - "loss": 0.5408, - "step": 70442 - }, - { - "epoch": 1.81, - "learning_rate": 7.224770434426152e-07, - "loss": 0.6846, - "step": 70443 - }, - { - "epoch": 1.81, - "learning_rate": 7.224504600178973e-07, - "loss": 0.5349, - "step": 70444 - }, - { - "epoch": 1.81, - "learning_rate": 7.224238768056867e-07, - "loss": 0.7139, - "step": 70445 - }, - { - "epoch": 1.81, - "learning_rate": 7.22397293806003e-07, - "loss": 0.6641, - "step": 70446 - }, - { - "epoch": 1.81, - "learning_rate": 7.223707110188672e-07, - "loss": 0.5217, - "step": 70447 - }, - { - "epoch": 1.81, - "learning_rate": 7.223441284442992e-07, - "loss": 0.5918, - "step": 70448 - }, - { - "epoch": 1.81, - "learning_rate": 7.223175460823199e-07, - "loss": 0.54, - "step": 70449 - }, - { - "epoch": 1.81, - "learning_rate": 7.222909639329489e-07, - "loss": 0.5923, - "step": 70450 - }, - { - "epoch": 1.81, - "learning_rate": 7.222643819962073e-07, - "loss": 0.6367, - "step": 70451 - }, - { - "epoch": 1.81, - "learning_rate": 7.22237800272115e-07, - "loss": 0.6089, - "step": 70452 - }, - { - "epoch": 1.81, - "learning_rate": 7.222112187606921e-07, - "loss": 0.6787, - "step": 70453 - }, - { - "epoch": 1.81, - "learning_rate": 7.221846374619597e-07, - "loss": 0.6494, - "step": 70454 - }, - { - "epoch": 1.81, - "learning_rate": 7.221580563759374e-07, - "loss": 0.5967, - "step": 70455 - }, - { - "epoch": 1.81, - "learning_rate": 7.221314755026462e-07, - "loss": 0.5151, - "step": 70456 - }, - { - "epoch": 1.81, - "learning_rate": 7.22104894842106e-07, - "loss": 0.5628, - "step": 70457 - }, - { - "epoch": 1.81, - "learning_rate": 7.220783143943372e-07, - "loss": 0.6602, - "step": 70458 - }, - { - "epoch": 1.81, - "learning_rate": 7.220517341593605e-07, - "loss": 0.6621, - "step": 70459 - }, - { - "epoch": 1.81, - "learning_rate": 7.220251541371957e-07, - "loss": 0.6675, - "step": 70460 - }, - { - "epoch": 1.81, - "learning_rate": 7.219985743278641e-07, - "loss": 0.7412, - "step": 70461 - }, - { - "epoch": 1.81, - "learning_rate": 7.21971994731385e-07, - "loss": 0.5845, - "step": 70462 - }, - { - "epoch": 1.81, - "learning_rate": 7.219454153477788e-07, - "loss": 0.6296, - "step": 70463 - }, - { - "epoch": 1.81, - "learning_rate": 7.219188361770667e-07, - "loss": 0.6436, - "step": 70464 - }, - { - "epoch": 1.81, - "learning_rate": 7.218922572192682e-07, - "loss": 0.6118, - "step": 70465 - }, - { - "epoch": 1.81, - "learning_rate": 7.218656784744043e-07, - "loss": 0.7305, - "step": 70466 - }, - { - "epoch": 1.81, - "learning_rate": 7.218390999424948e-07, - "loss": 0.6426, - "step": 70467 - }, - { - "epoch": 1.81, - "learning_rate": 7.218125216235607e-07, - "loss": 0.5225, - "step": 70468 - }, - { - "epoch": 1.81, - "learning_rate": 7.217859435176215e-07, - "loss": 0.8086, - "step": 70469 - }, - { - "epoch": 1.81, - "learning_rate": 7.217593656246983e-07, - "loss": 0.5449, - "step": 70470 - }, - { - "epoch": 1.81, - "learning_rate": 7.217327879448114e-07, - "loss": 0.6104, - "step": 70471 - }, - { - "epoch": 1.81, - "learning_rate": 7.217062104779806e-07, - "loss": 0.5986, - "step": 70472 - }, - { - "epoch": 1.81, - "learning_rate": 7.216796332242265e-07, - "loss": 0.79, - "step": 70473 - }, - { - "epoch": 1.81, - "learning_rate": 7.216530561835696e-07, - "loss": 0.6865, - "step": 70474 - }, - { - "epoch": 1.81, - "learning_rate": 7.216264793560301e-07, - "loss": 0.6431, - "step": 70475 - }, - { - "epoch": 1.81, - "learning_rate": 7.215999027416286e-07, - "loss": 0.5957, - "step": 70476 - }, - { - "epoch": 1.81, - "learning_rate": 7.21573326340385e-07, - "loss": 0.623, - "step": 70477 - }, - { - "epoch": 1.81, - "learning_rate": 7.2154675015232e-07, - "loss": 0.5835, - "step": 70478 - }, - { - "epoch": 1.81, - "learning_rate": 7.215201741774537e-07, - "loss": 0.5369, - "step": 70479 - }, - { - "epoch": 1.81, - "learning_rate": 7.214935984158068e-07, - "loss": 0.7373, - "step": 70480 - }, - { - "epoch": 1.81, - "learning_rate": 7.214670228673995e-07, - "loss": 0.8545, - "step": 70481 - }, - { - "epoch": 1.81, - "learning_rate": 7.21440447532252e-07, - "loss": 0.6079, - "step": 70482 - }, - { - "epoch": 1.81, - "learning_rate": 7.214138724103848e-07, - "loss": 0.5986, - "step": 70483 - }, - { - "epoch": 1.81, - "learning_rate": 7.213872975018181e-07, - "loss": 0.6094, - "step": 70484 - }, - { - "epoch": 1.81, - "learning_rate": 7.213607228065723e-07, - "loss": 0.6655, - "step": 70485 - }, - { - "epoch": 1.81, - "learning_rate": 7.213341483246677e-07, - "loss": 0.6572, - "step": 70486 - }, - { - "epoch": 1.81, - "learning_rate": 7.21307574056125e-07, - "loss": 0.5273, - "step": 70487 - }, - { - "epoch": 1.81, - "learning_rate": 7.212810000009639e-07, - "loss": 0.6572, - "step": 70488 - }, - { - "epoch": 1.81, - "learning_rate": 7.212544261592055e-07, - "loss": 0.6543, - "step": 70489 - }, - { - "epoch": 1.81, - "learning_rate": 7.212278525308695e-07, - "loss": 0.5771, - "step": 70490 - }, - { - "epoch": 1.81, - "learning_rate": 7.212012791159771e-07, - "loss": 0.7344, - "step": 70491 - }, - { - "epoch": 1.81, - "learning_rate": 7.211747059145474e-07, - "loss": 0.6709, - "step": 70492 - }, - { - "epoch": 1.81, - "learning_rate": 7.211481329266017e-07, - "loss": 0.6099, - "step": 70493 - }, - { - "epoch": 1.81, - "learning_rate": 7.211215601521599e-07, - "loss": 0.7002, - "step": 70494 - }, - { - "epoch": 1.81, - "learning_rate": 7.210949875912426e-07, - "loss": 0.793, - "step": 70495 - }, - { - "epoch": 1.81, - "learning_rate": 7.210684152438698e-07, - "loss": 0.5693, - "step": 70496 - }, - { - "epoch": 1.81, - "learning_rate": 7.210418431100624e-07, - "loss": 0.5571, - "step": 70497 - }, - { - "epoch": 1.81, - "learning_rate": 7.210152711898402e-07, - "loss": 0.6016, - "step": 70498 - }, - { - "epoch": 1.81, - "learning_rate": 7.20988699483224e-07, - "loss": 0.4774, - "step": 70499 - }, - { - "epoch": 1.81, - "learning_rate": 7.209621279902336e-07, - "loss": 0.5492, - "step": 70500 - }, - { - "epoch": 1.81, - "learning_rate": 7.209355567108903e-07, - "loss": 0.5952, - "step": 70501 - }, - { - "epoch": 1.81, - "learning_rate": 7.209089856452134e-07, - "loss": 0.5596, - "step": 70502 - }, - { - "epoch": 1.81, - "learning_rate": 7.208824147932235e-07, - "loss": 0.5254, - "step": 70503 - }, - { - "epoch": 1.81, - "learning_rate": 7.208558441549414e-07, - "loss": 0.7637, - "step": 70504 - }, - { - "epoch": 1.81, - "learning_rate": 7.208292737303869e-07, - "loss": 0.7012, - "step": 70505 - }, - { - "epoch": 1.81, - "learning_rate": 7.208027035195807e-07, - "loss": 0.7646, - "step": 70506 - }, - { - "epoch": 1.81, - "learning_rate": 7.20776133522543e-07, - "loss": 0.3984, - "step": 70507 - }, - { - "epoch": 1.81, - "learning_rate": 7.207495637392942e-07, - "loss": 0.3967, - "step": 70508 - }, - { - "epoch": 1.81, - "learning_rate": 7.207229941698545e-07, - "loss": 0.3989, - "step": 70509 - }, - { - "epoch": 1.81, - "learning_rate": 7.206964248142446e-07, - "loss": 0.7075, - "step": 70510 - }, - { - "epoch": 1.81, - "learning_rate": 7.206698556724847e-07, - "loss": 0.6719, - "step": 70511 - }, - { - "epoch": 1.81, - "learning_rate": 7.206432867445949e-07, - "loss": 0.5649, - "step": 70512 - }, - { - "epoch": 1.81, - "learning_rate": 7.206167180305956e-07, - "loss": 0.4865, - "step": 70513 - }, - { - "epoch": 1.81, - "learning_rate": 7.205901495305073e-07, - "loss": 0.6094, - "step": 70514 - }, - { - "epoch": 1.81, - "learning_rate": 7.2056358124435e-07, - "loss": 0.2463, - "step": 70515 - }, - { - "epoch": 1.81, - "learning_rate": 7.205370131721447e-07, - "loss": 0.7607, - "step": 70516 - }, - { - "epoch": 1.81, - "learning_rate": 7.205104453139111e-07, - "loss": 0.562, - "step": 70517 - }, - { - "epoch": 1.81, - "learning_rate": 7.2048387766967e-07, - "loss": 0.7314, - "step": 70518 - }, - { - "epoch": 1.81, - "learning_rate": 7.204573102394414e-07, - "loss": 0.6956, - "step": 70519 - }, - { - "epoch": 1.81, - "learning_rate": 7.204307430232458e-07, - "loss": 0.4785, - "step": 70520 - }, - { - "epoch": 1.81, - "learning_rate": 7.20404176021104e-07, - "loss": 0.5996, - "step": 70521 - }, - { - "epoch": 1.81, - "learning_rate": 7.203776092330352e-07, - "loss": 0.5874, - "step": 70522 - }, - { - "epoch": 1.81, - "learning_rate": 7.203510426590606e-07, - "loss": 0.6206, - "step": 70523 - }, - { - "epoch": 1.81, - "learning_rate": 7.203244762992004e-07, - "loss": 0.5649, - "step": 70524 - }, - { - "epoch": 1.81, - "learning_rate": 7.20297910153475e-07, - "loss": 0.5977, - "step": 70525 - }, - { - "epoch": 1.81, - "learning_rate": 7.202713442219042e-07, - "loss": 0.6475, - "step": 70526 - }, - { - "epoch": 1.81, - "learning_rate": 7.202447785045091e-07, - "loss": 0.6572, - "step": 70527 - }, - { - "epoch": 1.81, - "learning_rate": 7.202182130013097e-07, - "loss": 0.5679, - "step": 70528 - }, - { - "epoch": 1.81, - "learning_rate": 7.201916477123264e-07, - "loss": 0.4874, - "step": 70529 - }, - { - "epoch": 1.81, - "learning_rate": 7.201650826375795e-07, - "loss": 0.7183, - "step": 70530 - }, - { - "epoch": 1.81, - "learning_rate": 7.201385177770896e-07, - "loss": 0.707, - "step": 70531 - }, - { - "epoch": 1.81, - "learning_rate": 7.201119531308762e-07, - "loss": 0.4204, - "step": 70532 - }, - { - "epoch": 1.81, - "learning_rate": 7.200853886989604e-07, - "loss": 0.5405, - "step": 70533 - }, - { - "epoch": 1.81, - "learning_rate": 7.200588244813624e-07, - "loss": 0.6436, - "step": 70534 - }, - { - "epoch": 1.81, - "learning_rate": 7.200322604781024e-07, - "loss": 0.6831, - "step": 70535 - }, - { - "epoch": 1.81, - "learning_rate": 7.200056966892007e-07, - "loss": 0.4932, - "step": 70536 - }, - { - "epoch": 1.81, - "learning_rate": 7.199791331146781e-07, - "loss": 0.6406, - "step": 70537 - }, - { - "epoch": 1.81, - "learning_rate": 7.199525697545543e-07, - "loss": 0.7803, - "step": 70538 - }, - { - "epoch": 1.81, - "learning_rate": 7.199260066088501e-07, - "loss": 0.7109, - "step": 70539 - }, - { - "epoch": 1.81, - "learning_rate": 7.198994436775856e-07, - "loss": 0.5991, - "step": 70540 - }, - { - "epoch": 1.81, - "learning_rate": 7.198728809607817e-07, - "loss": 0.5745, - "step": 70541 - }, - { - "epoch": 1.81, - "learning_rate": 7.198463184584578e-07, - "loss": 0.7451, - "step": 70542 - }, - { - "epoch": 1.81, - "learning_rate": 7.198197561706346e-07, - "loss": 0.5581, - "step": 70543 - }, - { - "epoch": 1.81, - "learning_rate": 7.197931940973327e-07, - "loss": 0.5562, - "step": 70544 - }, - { - "epoch": 1.81, - "learning_rate": 7.197666322385722e-07, - "loss": 0.4834, - "step": 70545 - }, - { - "epoch": 1.81, - "learning_rate": 7.197400705943736e-07, - "loss": 0.5317, - "step": 70546 - }, - { - "epoch": 1.81, - "learning_rate": 7.197135091647572e-07, - "loss": 0.8203, - "step": 70547 - }, - { - "epoch": 1.81, - "learning_rate": 7.196869479497429e-07, - "loss": 0.5415, - "step": 70548 - }, - { - "epoch": 1.81, - "learning_rate": 7.196603869493518e-07, - "loss": 0.5586, - "step": 70549 - }, - { - "epoch": 1.81, - "learning_rate": 7.196338261636036e-07, - "loss": 0.5227, - "step": 70550 - }, - { - "epoch": 1.81, - "learning_rate": 7.196072655925193e-07, - "loss": 0.6348, - "step": 70551 - }, - { - "epoch": 1.81, - "learning_rate": 7.195807052361185e-07, - "loss": 0.6677, - "step": 70552 - }, - { - "epoch": 1.81, - "learning_rate": 7.195541450944218e-07, - "loss": 0.6875, - "step": 70553 - }, - { - "epoch": 1.81, - "learning_rate": 7.195275851674498e-07, - "loss": 0.5217, - "step": 70554 - }, - { - "epoch": 1.81, - "learning_rate": 7.195010254552224e-07, - "loss": 0.6172, - "step": 70555 - }, - { - "epoch": 1.81, - "learning_rate": 7.194744659577602e-07, - "loss": 0.7598, - "step": 70556 - }, - { - "epoch": 1.81, - "learning_rate": 7.194479066750836e-07, - "loss": 0.4719, - "step": 70557 - }, - { - "epoch": 1.81, - "learning_rate": 7.194213476072128e-07, - "loss": 0.5989, - "step": 70558 - }, - { - "epoch": 1.81, - "learning_rate": 7.193947887541682e-07, - "loss": 0.5718, - "step": 70559 - }, - { - "epoch": 1.81, - "learning_rate": 7.193682301159701e-07, - "loss": 0.749, - "step": 70560 - }, - { - "epoch": 1.81, - "learning_rate": 7.193416716926392e-07, - "loss": 0.644, - "step": 70561 - }, - { - "epoch": 1.81, - "learning_rate": 7.193151134841951e-07, - "loss": 0.6567, - "step": 70562 - }, - { - "epoch": 1.81, - "learning_rate": 7.192885554906585e-07, - "loss": 0.6367, - "step": 70563 - }, - { - "epoch": 1.81, - "learning_rate": 7.192619977120497e-07, - "loss": 0.6543, - "step": 70564 - }, - { - "epoch": 1.81, - "learning_rate": 7.192354401483891e-07, - "loss": 0.6729, - "step": 70565 - }, - { - "epoch": 1.81, - "learning_rate": 7.192088827996971e-07, - "loss": 0.7451, - "step": 70566 - }, - { - "epoch": 1.81, - "learning_rate": 7.191823256659939e-07, - "loss": 0.665, - "step": 70567 - }, - { - "epoch": 1.81, - "learning_rate": 7.191557687473e-07, - "loss": 0.5188, - "step": 70568 - }, - { - "epoch": 1.81, - "learning_rate": 7.191292120436354e-07, - "loss": 0.6421, - "step": 70569 - }, - { - "epoch": 1.81, - "learning_rate": 7.191026555550208e-07, - "loss": 0.5767, - "step": 70570 - }, - { - "epoch": 1.81, - "learning_rate": 7.190760992814766e-07, - "loss": 0.6885, - "step": 70571 - }, - { - "epoch": 1.81, - "learning_rate": 7.190495432230226e-07, - "loss": 0.8438, - "step": 70572 - }, - { - "epoch": 1.81, - "learning_rate": 7.190229873796796e-07, - "loss": 0.5117, - "step": 70573 - }, - { - "epoch": 1.81, - "learning_rate": 7.189964317514675e-07, - "loss": 0.8115, - "step": 70574 - }, - { - "epoch": 1.81, - "learning_rate": 7.189698763384071e-07, - "loss": 0.6777, - "step": 70575 - }, - { - "epoch": 1.81, - "learning_rate": 7.189433211405185e-07, - "loss": 0.5713, - "step": 70576 - }, - { - "epoch": 1.81, - "learning_rate": 7.189167661578222e-07, - "loss": 0.624, - "step": 70577 - }, - { - "epoch": 1.81, - "learning_rate": 7.188902113903382e-07, - "loss": 0.6719, - "step": 70578 - }, - { - "epoch": 1.81, - "learning_rate": 7.188636568380872e-07, - "loss": 0.6738, - "step": 70579 - }, - { - "epoch": 1.81, - "learning_rate": 7.188371025010891e-07, - "loss": 0.7695, - "step": 70580 - }, - { - "epoch": 1.81, - "learning_rate": 7.188105483793653e-07, - "loss": 0.8086, - "step": 70581 - }, - { - "epoch": 1.81, - "learning_rate": 7.187839944729347e-07, - "loss": 0.7324, - "step": 70582 - }, - { - "epoch": 1.81, - "learning_rate": 7.187574407818184e-07, - "loss": 0.7412, - "step": 70583 - }, - { - "epoch": 1.81, - "learning_rate": 7.187308873060364e-07, - "loss": 0.5605, - "step": 70584 - }, - { - "epoch": 1.81, - "learning_rate": 7.187043340456094e-07, - "loss": 0.6533, - "step": 70585 - }, - { - "epoch": 1.81, - "learning_rate": 7.186777810005573e-07, - "loss": 0.5824, - "step": 70586 - }, - { - "epoch": 1.81, - "learning_rate": 7.186512281709011e-07, - "loss": 0.5659, - "step": 70587 - }, - { - "epoch": 1.81, - "learning_rate": 7.186246755566602e-07, - "loss": 0.6924, - "step": 70588 - }, - { - "epoch": 1.81, - "learning_rate": 7.18598123157856e-07, - "loss": 0.8564, - "step": 70589 - }, - { - "epoch": 1.81, - "learning_rate": 7.185715709745079e-07, - "loss": 0.7275, - "step": 70590 - }, - { - "epoch": 1.81, - "learning_rate": 7.185450190066372e-07, - "loss": 0.5757, - "step": 70591 - }, - { - "epoch": 1.81, - "learning_rate": 7.185184672542631e-07, - "loss": 0.5713, - "step": 70592 - }, - { - "epoch": 1.81, - "learning_rate": 7.184919157174064e-07, - "loss": 0.6313, - "step": 70593 - }, - { - "epoch": 1.81, - "learning_rate": 7.184653643960878e-07, - "loss": 0.4771, - "step": 70594 - }, - { - "epoch": 1.81, - "learning_rate": 7.18438813290327e-07, - "loss": 0.5166, - "step": 70595 - }, - { - "epoch": 1.81, - "learning_rate": 7.184122624001449e-07, - "loss": 0.618, - "step": 70596 - }, - { - "epoch": 1.81, - "learning_rate": 7.183857117255614e-07, - "loss": 0.6738, - "step": 70597 - }, - { - "epoch": 1.81, - "learning_rate": 7.183591612665971e-07, - "loss": 0.7383, - "step": 70598 - }, - { - "epoch": 1.81, - "learning_rate": 7.183326110232722e-07, - "loss": 0.793, - "step": 70599 - }, - { - "epoch": 1.81, - "learning_rate": 7.183060609956073e-07, - "loss": 0.657, - "step": 70600 - }, - { - "epoch": 1.81, - "learning_rate": 7.182795111836226e-07, - "loss": 0.7158, - "step": 70601 - }, - { - "epoch": 1.81, - "learning_rate": 7.182529615873381e-07, - "loss": 0.4766, - "step": 70602 - }, - { - "epoch": 1.81, - "learning_rate": 7.182264122067741e-07, - "loss": 0.4106, - "step": 70603 - }, - { - "epoch": 1.81, - "learning_rate": 7.181998630419514e-07, - "loss": 0.7598, - "step": 70604 - }, - { - "epoch": 1.81, - "learning_rate": 7.1817331409289e-07, - "loss": 0.6401, - "step": 70605 - }, - { - "epoch": 1.81, - "learning_rate": 7.181467653596106e-07, - "loss": 0.4761, - "step": 70606 - }, - { - "epoch": 1.81, - "learning_rate": 7.18120216842133e-07, - "loss": 0.6328, - "step": 70607 - }, - { - "epoch": 1.81, - "learning_rate": 7.180936685404779e-07, - "loss": 0.6641, - "step": 70608 - }, - { - "epoch": 1.81, - "learning_rate": 7.180671204546654e-07, - "loss": 0.7612, - "step": 70609 - }, - { - "epoch": 1.81, - "learning_rate": 7.180405725847161e-07, - "loss": 0.6108, - "step": 70610 - }, - { - "epoch": 1.81, - "learning_rate": 7.180140249306503e-07, - "loss": 0.7271, - "step": 70611 - }, - { - "epoch": 1.81, - "learning_rate": 7.179874774924879e-07, - "loss": 0.6807, - "step": 70612 - }, - { - "epoch": 1.81, - "learning_rate": 7.179609302702498e-07, - "loss": 0.6846, - "step": 70613 - }, - { - "epoch": 1.81, - "learning_rate": 7.179343832639557e-07, - "loss": 0.6914, - "step": 70614 - }, - { - "epoch": 1.81, - "learning_rate": 7.179078364736265e-07, - "loss": 0.5314, - "step": 70615 - }, - { - "epoch": 1.81, - "learning_rate": 7.178812898992821e-07, - "loss": 0.6055, - "step": 70616 - }, - { - "epoch": 1.81, - "learning_rate": 7.178547435409432e-07, - "loss": 0.6309, - "step": 70617 - }, - { - "epoch": 1.81, - "learning_rate": 7.178281973986297e-07, - "loss": 0.7041, - "step": 70618 - }, - { - "epoch": 1.81, - "learning_rate": 7.178016514723626e-07, - "loss": 0.8301, - "step": 70619 - }, - { - "epoch": 1.81, - "learning_rate": 7.177751057621617e-07, - "loss": 0.7988, - "step": 70620 - }, - { - "epoch": 1.81, - "learning_rate": 7.177485602680475e-07, - "loss": 0.6367, - "step": 70621 - }, - { - "epoch": 1.81, - "learning_rate": 7.1772201499004e-07, - "loss": 0.7466, - "step": 70622 - }, - { - "epoch": 1.81, - "learning_rate": 7.176954699281599e-07, - "loss": 0.4572, - "step": 70623 - }, - { - "epoch": 1.81, - "learning_rate": 7.176689250824273e-07, - "loss": 0.5693, - "step": 70624 - }, - { - "epoch": 1.81, - "learning_rate": 7.176423804528626e-07, - "loss": 0.5482, - "step": 70625 - }, - { - "epoch": 1.81, - "learning_rate": 7.176158360394862e-07, - "loss": 0.4497, - "step": 70626 - }, - { - "epoch": 1.81, - "learning_rate": 7.175892918423183e-07, - "loss": 0.5579, - "step": 70627 - }, - { - "epoch": 1.81, - "learning_rate": 7.175627478613792e-07, - "loss": 0.6685, - "step": 70628 - }, - { - "epoch": 1.81, - "learning_rate": 7.175362040966897e-07, - "loss": 0.5928, - "step": 70629 - }, - { - "epoch": 1.81, - "learning_rate": 7.175096605482698e-07, - "loss": 0.6992, - "step": 70630 - }, - { - "epoch": 1.81, - "learning_rate": 7.174831172161393e-07, - "loss": 0.6104, - "step": 70631 - }, - { - "epoch": 1.81, - "learning_rate": 7.174565741003193e-07, - "loss": 0.6553, - "step": 70632 - }, - { - "epoch": 1.81, - "learning_rate": 7.174300312008295e-07, - "loss": 0.499, - "step": 70633 - }, - { - "epoch": 1.81, - "learning_rate": 7.174034885176908e-07, - "loss": 0.5078, - "step": 70634 - }, - { - "epoch": 1.81, - "learning_rate": 7.173769460509231e-07, - "loss": 0.5366, - "step": 70635 - }, - { - "epoch": 1.81, - "learning_rate": 7.17350403800547e-07, - "loss": 0.6265, - "step": 70636 - }, - { - "epoch": 1.81, - "learning_rate": 7.173238617665827e-07, - "loss": 0.5913, - "step": 70637 - }, - { - "epoch": 1.81, - "learning_rate": 7.172973199490505e-07, - "loss": 0.5591, - "step": 70638 - }, - { - "epoch": 1.81, - "learning_rate": 7.172707783479705e-07, - "loss": 0.5303, - "step": 70639 - }, - { - "epoch": 1.81, - "learning_rate": 7.172442369633639e-07, - "loss": 0.6128, - "step": 70640 - }, - { - "epoch": 1.81, - "learning_rate": 7.172176957952498e-07, - "loss": 0.8516, - "step": 70641 - }, - { - "epoch": 1.81, - "learning_rate": 7.171911548436494e-07, - "loss": 0.5216, - "step": 70642 - }, - { - "epoch": 1.81, - "learning_rate": 7.171646141085824e-07, - "loss": 0.7432, - "step": 70643 - }, - { - "epoch": 1.81, - "learning_rate": 7.171380735900699e-07, - "loss": 0.7373, - "step": 70644 - }, - { - "epoch": 1.81, - "learning_rate": 7.171115332881313e-07, - "loss": 0.5112, - "step": 70645 - }, - { - "epoch": 1.81, - "learning_rate": 7.170849932027876e-07, - "loss": 0.6221, - "step": 70646 - }, - { - "epoch": 1.81, - "learning_rate": 7.170584533340589e-07, - "loss": 0.5972, - "step": 70647 - }, - { - "epoch": 1.81, - "learning_rate": 7.170319136819656e-07, - "loss": 0.437, - "step": 70648 - }, - { - "epoch": 1.81, - "learning_rate": 7.170053742465278e-07, - "loss": 0.6465, - "step": 70649 - }, - { - "epoch": 1.81, - "learning_rate": 7.169788350277663e-07, - "loss": 0.6616, - "step": 70650 - }, - { - "epoch": 1.81, - "learning_rate": 7.169522960257009e-07, - "loss": 0.606, - "step": 70651 - }, - { - "epoch": 1.81, - "learning_rate": 7.16925757240352e-07, - "loss": 0.6338, - "step": 70652 - }, - { - "epoch": 1.81, - "learning_rate": 7.168992186717402e-07, - "loss": 0.4312, - "step": 70653 - }, - { - "epoch": 1.81, - "learning_rate": 7.168726803198857e-07, - "loss": 0.4712, - "step": 70654 - }, - { - "epoch": 1.81, - "learning_rate": 7.168461421848085e-07, - "loss": 0.8076, - "step": 70655 - }, - { - "epoch": 1.81, - "learning_rate": 7.168196042665293e-07, - "loss": 0.6987, - "step": 70656 - }, - { - "epoch": 1.81, - "learning_rate": 7.167930665650683e-07, - "loss": 0.7366, - "step": 70657 - }, - { - "epoch": 1.81, - "learning_rate": 7.167665290804459e-07, - "loss": 0.6875, - "step": 70658 - }, - { - "epoch": 1.81, - "learning_rate": 7.167399918126822e-07, - "loss": 0.512, - "step": 70659 - }, - { - "epoch": 1.81, - "learning_rate": 7.16713454761798e-07, - "loss": 0.5155, - "step": 70660 - }, - { - "epoch": 1.81, - "learning_rate": 7.166869179278132e-07, - "loss": 0.6035, - "step": 70661 - }, - { - "epoch": 1.81, - "learning_rate": 7.166603813107479e-07, - "loss": 0.6382, - "step": 70662 - }, - { - "epoch": 1.81, - "learning_rate": 7.16633844910623e-07, - "loss": 0.6064, - "step": 70663 - }, - { - "epoch": 1.81, - "learning_rate": 7.166073087274582e-07, - "loss": 0.6274, - "step": 70664 - }, - { - "epoch": 1.81, - "learning_rate": 7.165807727612745e-07, - "loss": 0.5503, - "step": 70665 - }, - { - "epoch": 1.81, - "learning_rate": 7.165542370120915e-07, - "loss": 0.5629, - "step": 70666 - }, - { - "epoch": 1.81, - "learning_rate": 7.165277014799303e-07, - "loss": 0.485, - "step": 70667 - }, - { - "epoch": 1.81, - "learning_rate": 7.165011661648104e-07, - "loss": 0.71, - "step": 70668 - }, - { - "epoch": 1.81, - "learning_rate": 7.164746310667529e-07, - "loss": 0.5366, - "step": 70669 - }, - { - "epoch": 1.81, - "learning_rate": 7.164480961857777e-07, - "loss": 0.6562, - "step": 70670 - }, - { - "epoch": 1.81, - "learning_rate": 7.164215615219052e-07, - "loss": 0.5649, - "step": 70671 - }, - { - "epoch": 1.81, - "learning_rate": 7.163950270751553e-07, - "loss": 0.5957, - "step": 70672 - }, - { - "epoch": 1.81, - "learning_rate": 7.163684928455491e-07, - "loss": 0.7271, - "step": 70673 - }, - { - "epoch": 1.81, - "learning_rate": 7.163419588331061e-07, - "loss": 0.5615, - "step": 70674 - }, - { - "epoch": 1.81, - "learning_rate": 7.163154250378474e-07, - "loss": 0.5247, - "step": 70675 - }, - { - "epoch": 1.81, - "learning_rate": 7.162888914597925e-07, - "loss": 0.5479, - "step": 70676 - }, - { - "epoch": 1.81, - "learning_rate": 7.162623580989625e-07, - "loss": 0.6807, - "step": 70677 - }, - { - "epoch": 1.81, - "learning_rate": 7.162358249553772e-07, - "loss": 0.7432, - "step": 70678 - }, - { - "epoch": 1.81, - "learning_rate": 7.162092920290572e-07, - "loss": 0.6113, - "step": 70679 - }, - { - "epoch": 1.81, - "learning_rate": 7.16182759320023e-07, - "loss": 0.5703, - "step": 70680 - }, - { - "epoch": 1.81, - "learning_rate": 7.16156226828294e-07, - "loss": 0.7041, - "step": 70681 - }, - { - "epoch": 1.81, - "learning_rate": 7.161296945538915e-07, - "loss": 0.5625, - "step": 70682 - }, - { - "epoch": 1.81, - "learning_rate": 7.161031624968353e-07, - "loss": 0.5852, - "step": 70683 - }, - { - "epoch": 1.81, - "learning_rate": 7.160766306571458e-07, - "loss": 0.6187, - "step": 70684 - }, - { - "epoch": 1.81, - "learning_rate": 7.160500990348433e-07, - "loss": 0.6123, - "step": 70685 - }, - { - "epoch": 1.81, - "learning_rate": 7.160235676299484e-07, - "loss": 0.6729, - "step": 70686 - }, - { - "epoch": 1.81, - "learning_rate": 7.15997036442481e-07, - "loss": 0.5742, - "step": 70687 - }, - { - "epoch": 1.81, - "learning_rate": 7.159705054724618e-07, - "loss": 0.7432, - "step": 70688 - }, - { - "epoch": 1.81, - "learning_rate": 7.159439747199107e-07, - "loss": 0.7515, - "step": 70689 - }, - { - "epoch": 1.81, - "learning_rate": 7.15917444184849e-07, - "loss": 0.752, - "step": 70690 - }, - { - "epoch": 1.81, - "learning_rate": 7.158909138672955e-07, - "loss": 0.6226, - "step": 70691 - }, - { - "epoch": 1.81, - "learning_rate": 7.158643837672714e-07, - "loss": 0.5681, - "step": 70692 - }, - { - "epoch": 1.81, - "learning_rate": 7.158378538847968e-07, - "loss": 0.5896, - "step": 70693 - }, - { - "epoch": 1.81, - "learning_rate": 7.158113242198922e-07, - "loss": 0.665, - "step": 70694 - }, - { - "epoch": 1.81, - "learning_rate": 7.157847947725777e-07, - "loss": 0.7793, - "step": 70695 - }, - { - "epoch": 1.81, - "learning_rate": 7.157582655428739e-07, - "loss": 0.5145, - "step": 70696 - }, - { - "epoch": 1.81, - "learning_rate": 7.157317365308006e-07, - "loss": 0.7061, - "step": 70697 - }, - { - "epoch": 1.81, - "learning_rate": 7.157052077363788e-07, - "loss": 0.5823, - "step": 70698 - }, - { - "epoch": 1.81, - "learning_rate": 7.156786791596281e-07, - "loss": 0.7344, - "step": 70699 - }, - { - "epoch": 1.81, - "learning_rate": 7.156521508005697e-07, - "loss": 0.6543, - "step": 70700 - }, - { - "epoch": 1.81, - "learning_rate": 7.156256226592231e-07, - "loss": 0.6162, - "step": 70701 - }, - { - "epoch": 1.81, - "learning_rate": 7.155990947356088e-07, - "loss": 0.52, - "step": 70702 - }, - { - "epoch": 1.81, - "learning_rate": 7.155725670297473e-07, - "loss": 0.5972, - "step": 70703 - }, - { - "epoch": 1.81, - "learning_rate": 7.155460395416585e-07, - "loss": 0.4755, - "step": 70704 - }, - { - "epoch": 1.81, - "learning_rate": 7.155195122713633e-07, - "loss": 0.6172, - "step": 70705 - }, - { - "epoch": 1.81, - "learning_rate": 7.154929852188816e-07, - "loss": 0.6797, - "step": 70706 - }, - { - "epoch": 1.81, - "learning_rate": 7.15466458384234e-07, - "loss": 0.7285, - "step": 70707 - }, - { - "epoch": 1.81, - "learning_rate": 7.154399317674404e-07, - "loss": 0.4541, - "step": 70708 - }, - { - "epoch": 1.81, - "learning_rate": 7.154134053685216e-07, - "loss": 0.8516, - "step": 70709 - }, - { - "epoch": 1.81, - "learning_rate": 7.15386879187498e-07, - "loss": 0.5508, - "step": 70710 - }, - { - "epoch": 1.81, - "learning_rate": 7.153603532243891e-07, - "loss": 0.5864, - "step": 70711 - }, - { - "epoch": 1.81, - "learning_rate": 7.153338274792157e-07, - "loss": 0.6196, - "step": 70712 - }, - { - "epoch": 1.81, - "learning_rate": 7.153073019519982e-07, - "loss": 0.7402, - "step": 70713 - }, - { - "epoch": 1.81, - "learning_rate": 7.152807766427567e-07, - "loss": 0.5526, - "step": 70714 - }, - { - "epoch": 1.81, - "learning_rate": 7.152542515515116e-07, - "loss": 0.5986, - "step": 70715 - }, - { - "epoch": 1.81, - "learning_rate": 7.152277266782834e-07, - "loss": 0.5894, - "step": 70716 - }, - { - "epoch": 1.81, - "learning_rate": 7.152012020230921e-07, - "loss": 0.584, - "step": 70717 - }, - { - "epoch": 1.81, - "learning_rate": 7.151746775859581e-07, - "loss": 0.5752, - "step": 70718 - }, - { - "epoch": 1.81, - "learning_rate": 7.15148153366902e-07, - "loss": 0.6257, - "step": 70719 - }, - { - "epoch": 1.81, - "learning_rate": 7.151216293659439e-07, - "loss": 0.7622, - "step": 70720 - }, - { - "epoch": 1.81, - "learning_rate": 7.150951055831038e-07, - "loss": 0.6367, - "step": 70721 - }, - { - "epoch": 1.81, - "learning_rate": 7.150685820184023e-07, - "loss": 0.8203, - "step": 70722 - }, - { - "epoch": 1.81, - "learning_rate": 7.150420586718598e-07, - "loss": 0.6846, - "step": 70723 - }, - { - "epoch": 1.81, - "learning_rate": 7.150155355434963e-07, - "loss": 0.5625, - "step": 70724 - }, - { - "epoch": 1.81, - "learning_rate": 7.149890126333325e-07, - "loss": 0.4924, - "step": 70725 - }, - { - "epoch": 1.81, - "learning_rate": 7.149624899413884e-07, - "loss": 0.6411, - "step": 70726 - }, - { - "epoch": 1.81, - "learning_rate": 7.149359674676844e-07, - "loss": 0.5146, - "step": 70727 - }, - { - "epoch": 1.81, - "learning_rate": 7.149094452122408e-07, - "loss": 0.7349, - "step": 70728 - }, - { - "epoch": 1.81, - "learning_rate": 7.148829231750781e-07, - "loss": 0.7109, - "step": 70729 - }, - { - "epoch": 1.81, - "learning_rate": 7.148564013562167e-07, - "loss": 0.6719, - "step": 70730 - }, - { - "epoch": 1.81, - "learning_rate": 7.148298797556762e-07, - "loss": 0.4082, - "step": 70731 - }, - { - "epoch": 1.81, - "learning_rate": 7.148033583734775e-07, - "loss": 0.623, - "step": 70732 - }, - { - "epoch": 1.81, - "learning_rate": 7.147768372096405e-07, - "loss": 0.792, - "step": 70733 - }, - { - "epoch": 1.81, - "learning_rate": 7.14750316264186e-07, - "loss": 0.7607, - "step": 70734 - }, - { - "epoch": 1.81, - "learning_rate": 7.147237955371339e-07, - "loss": 0.5776, - "step": 70735 - }, - { - "epoch": 1.81, - "learning_rate": 7.14697275028505e-07, - "loss": 0.6108, - "step": 70736 - }, - { - "epoch": 1.81, - "learning_rate": 7.146707547383188e-07, - "loss": 0.8252, - "step": 70737 - }, - { - "epoch": 1.81, - "learning_rate": 7.146442346665964e-07, - "loss": 0.4653, - "step": 70738 - }, - { - "epoch": 1.81, - "learning_rate": 7.146177148133577e-07, - "loss": 0.6914, - "step": 70739 - }, - { - "epoch": 1.81, - "learning_rate": 7.145911951786234e-07, - "loss": 0.626, - "step": 70740 - }, - { - "epoch": 1.81, - "learning_rate": 7.145646757624133e-07, - "loss": 0.5996, - "step": 70741 - }, - { - "epoch": 1.81, - "learning_rate": 7.145381565647477e-07, - "loss": 0.5571, - "step": 70742 - }, - { - "epoch": 1.81, - "learning_rate": 7.145116375856472e-07, - "loss": 0.7783, - "step": 70743 - }, - { - "epoch": 1.81, - "learning_rate": 7.144851188251322e-07, - "loss": 0.563, - "step": 70744 - }, - { - "epoch": 1.81, - "learning_rate": 7.144586002832226e-07, - "loss": 0.8096, - "step": 70745 - }, - { - "epoch": 1.81, - "learning_rate": 7.14432081959939e-07, - "loss": 0.6074, - "step": 70746 - }, - { - "epoch": 1.81, - "learning_rate": 7.144055638553015e-07, - "loss": 0.5811, - "step": 70747 - }, - { - "epoch": 1.81, - "learning_rate": 7.143790459693307e-07, - "loss": 0.7061, - "step": 70748 - }, - { - "epoch": 1.81, - "learning_rate": 7.143525283020466e-07, - "loss": 0.6309, - "step": 70749 - }, - { - "epoch": 1.81, - "learning_rate": 7.1432601085347e-07, - "loss": 0.6831, - "step": 70750 - }, - { - "epoch": 1.81, - "learning_rate": 7.142994936236206e-07, - "loss": 0.7637, - "step": 70751 - }, - { - "epoch": 1.81, - "learning_rate": 7.142729766125189e-07, - "loss": 0.6587, - "step": 70752 - }, - { - "epoch": 1.81, - "learning_rate": 7.142464598201851e-07, - "loss": 0.6343, - "step": 70753 - }, - { - "epoch": 1.81, - "learning_rate": 7.142199432466397e-07, - "loss": 0.4646, - "step": 70754 - }, - { - "epoch": 1.81, - "learning_rate": 7.141934268919031e-07, - "loss": 0.4778, - "step": 70755 - }, - { - "epoch": 1.81, - "learning_rate": 7.141669107559953e-07, - "loss": 0.6172, - "step": 70756 - }, - { - "epoch": 1.81, - "learning_rate": 7.141403948389369e-07, - "loss": 0.459, - "step": 70757 - }, - { - "epoch": 1.81, - "learning_rate": 7.141138791407478e-07, - "loss": 0.6152, - "step": 70758 - }, - { - "epoch": 1.81, - "learning_rate": 7.140873636614488e-07, - "loss": 0.4519, - "step": 70759 - }, - { - "epoch": 1.81, - "learning_rate": 7.140608484010602e-07, - "loss": 0.4971, - "step": 70760 - }, - { - "epoch": 1.81, - "learning_rate": 7.140343333596017e-07, - "loss": 0.7871, - "step": 70761 - }, - { - "epoch": 1.81, - "learning_rate": 7.140078185370941e-07, - "loss": 0.6279, - "step": 70762 - }, - { - "epoch": 1.81, - "learning_rate": 7.139813039335576e-07, - "loss": 0.709, - "step": 70763 - }, - { - "epoch": 1.81, - "learning_rate": 7.139547895490121e-07, - "loss": 0.7207, - "step": 70764 - }, - { - "epoch": 1.81, - "learning_rate": 7.139282753834786e-07, - "loss": 0.6475, - "step": 70765 - }, - { - "epoch": 1.81, - "learning_rate": 7.139017614369769e-07, - "loss": 0.6445, - "step": 70766 - }, - { - "epoch": 1.81, - "learning_rate": 7.138752477095276e-07, - "loss": 0.5112, - "step": 70767 - }, - { - "epoch": 1.81, - "learning_rate": 7.138487342011508e-07, - "loss": 0.5991, - "step": 70768 - }, - { - "epoch": 1.81, - "learning_rate": 7.138222209118668e-07, - "loss": 0.3817, - "step": 70769 - }, - { - "epoch": 1.81, - "learning_rate": 7.137957078416964e-07, - "loss": 0.7305, - "step": 70770 - }, - { - "epoch": 1.81, - "learning_rate": 7.13769194990659e-07, - "loss": 0.6655, - "step": 70771 - }, - { - "epoch": 1.81, - "learning_rate": 7.137426823587756e-07, - "loss": 0.6924, - "step": 70772 - }, - { - "epoch": 1.81, - "learning_rate": 7.137161699460659e-07, - "loss": 0.6504, - "step": 70773 - }, - { - "epoch": 1.81, - "learning_rate": 7.13689657752551e-07, - "loss": 0.4985, - "step": 70774 - }, - { - "epoch": 1.81, - "learning_rate": 7.136631457782504e-07, - "loss": 0.6846, - "step": 70775 - }, - { - "epoch": 1.81, - "learning_rate": 7.136366340231849e-07, - "loss": 0.5376, - "step": 70776 - }, - { - "epoch": 1.81, - "learning_rate": 7.136101224873747e-07, - "loss": 0.6211, - "step": 70777 - }, - { - "epoch": 1.81, - "learning_rate": 7.135836111708401e-07, - "loss": 0.8584, - "step": 70778 - }, - { - "epoch": 1.81, - "learning_rate": 7.135571000736012e-07, - "loss": 0.6553, - "step": 70779 - }, - { - "epoch": 1.81, - "learning_rate": 7.135305891956791e-07, - "loss": 0.5039, - "step": 70780 - }, - { - "epoch": 1.81, - "learning_rate": 7.135040785370927e-07, - "loss": 0.5532, - "step": 70781 - }, - { - "epoch": 1.81, - "learning_rate": 7.134775680978634e-07, - "loss": 0.5005, - "step": 70782 - }, - { - "epoch": 1.81, - "learning_rate": 7.13451057878011e-07, - "loss": 0.7588, - "step": 70783 - }, - { - "epoch": 1.81, - "learning_rate": 7.13424547877556e-07, - "loss": 0.5093, - "step": 70784 - }, - { - "epoch": 1.81, - "learning_rate": 7.133980380965186e-07, - "loss": 0.6367, - "step": 70785 - }, - { - "epoch": 1.81, - "learning_rate": 7.133715285349191e-07, - "loss": 0.6865, - "step": 70786 - }, - { - "epoch": 1.81, - "learning_rate": 7.133450191927779e-07, - "loss": 0.5664, - "step": 70787 - }, - { - "epoch": 1.81, - "learning_rate": 7.133185100701153e-07, - "loss": 0.7275, - "step": 70788 - }, - { - "epoch": 1.81, - "learning_rate": 7.132920011669514e-07, - "loss": 0.6479, - "step": 70789 - }, - { - "epoch": 1.81, - "learning_rate": 7.13265492483307e-07, - "loss": 0.5806, - "step": 70790 - }, - { - "epoch": 1.81, - "learning_rate": 7.132389840192018e-07, - "loss": 0.7842, - "step": 70791 - }, - { - "epoch": 1.81, - "learning_rate": 7.132124757746561e-07, - "loss": 0.6221, - "step": 70792 - }, - { - "epoch": 1.81, - "learning_rate": 7.131859677496908e-07, - "loss": 0.8545, - "step": 70793 - }, - { - "epoch": 1.81, - "learning_rate": 7.131594599443254e-07, - "loss": 0.6768, - "step": 70794 - }, - { - "epoch": 1.81, - "learning_rate": 7.131329523585809e-07, - "loss": 0.6348, - "step": 70795 - }, - { - "epoch": 1.81, - "learning_rate": 7.131064449924771e-07, - "loss": 0.6958, - "step": 70796 - }, - { - "epoch": 1.81, - "learning_rate": 7.130799378460347e-07, - "loss": 0.5645, - "step": 70797 - }, - { - "epoch": 1.81, - "learning_rate": 7.130534309192736e-07, - "loss": 0.7705, - "step": 70798 - }, - { - "epoch": 1.81, - "learning_rate": 7.130269242122144e-07, - "loss": 0.5776, - "step": 70799 - }, - { - "epoch": 1.81, - "learning_rate": 7.130004177248777e-07, - "loss": 0.6855, - "step": 70800 - }, - { - "epoch": 1.81, - "learning_rate": 7.12973911457283e-07, - "loss": 0.708, - "step": 70801 - }, - { - "epoch": 1.81, - "learning_rate": 7.129474054094509e-07, - "loss": 0.5439, - "step": 70802 - }, - { - "epoch": 1.81, - "learning_rate": 7.12920899581402e-07, - "loss": 0.7412, - "step": 70803 - }, - { - "epoch": 1.81, - "learning_rate": 7.12894393973156e-07, - "loss": 0.6216, - "step": 70804 - }, - { - "epoch": 1.81, - "learning_rate": 7.128678885847339e-07, - "loss": 0.5615, - "step": 70805 - }, - { - "epoch": 1.81, - "learning_rate": 7.128413834161554e-07, - "loss": 0.5615, - "step": 70806 - }, - { - "epoch": 1.81, - "learning_rate": 7.128148784674412e-07, - "loss": 0.6562, - "step": 70807 - }, - { - "epoch": 1.81, - "learning_rate": 7.127883737386113e-07, - "loss": 0.6367, - "step": 70808 - }, - { - "epoch": 1.81, - "learning_rate": 7.127618692296864e-07, - "loss": 0.5718, - "step": 70809 - }, - { - "epoch": 1.81, - "learning_rate": 7.127353649406867e-07, - "loss": 0.6272, - "step": 70810 - }, - { - "epoch": 1.81, - "learning_rate": 7.127088608716319e-07, - "loss": 0.5342, - "step": 70811 - }, - { - "epoch": 1.81, - "learning_rate": 7.126823570225429e-07, - "loss": 0.6709, - "step": 70812 - }, - { - "epoch": 1.81, - "learning_rate": 7.126558533934396e-07, - "loss": 0.7363, - "step": 70813 - }, - { - "epoch": 1.81, - "learning_rate": 7.126293499843427e-07, - "loss": 0.5837, - "step": 70814 - }, - { - "epoch": 1.82, - "learning_rate": 7.12602846795272e-07, - "loss": 0.5674, - "step": 70815 - }, - { - "epoch": 1.82, - "learning_rate": 7.125763438262485e-07, - "loss": 0.6128, - "step": 70816 - }, - { - "epoch": 1.82, - "learning_rate": 7.12549841077292e-07, - "loss": 0.5645, - "step": 70817 - }, - { - "epoch": 1.82, - "learning_rate": 7.125233385484226e-07, - "loss": 0.6973, - "step": 70818 - }, - { - "epoch": 1.82, - "learning_rate": 7.124968362396611e-07, - "loss": 0.5332, - "step": 70819 - }, - { - "epoch": 1.82, - "learning_rate": 7.124703341510278e-07, - "loss": 0.4814, - "step": 70820 - }, - { - "epoch": 1.82, - "learning_rate": 7.124438322825423e-07, - "loss": 0.7275, - "step": 70821 - }, - { - "epoch": 1.82, - "learning_rate": 7.124173306342255e-07, - "loss": 0.6099, - "step": 70822 - }, - { - "epoch": 1.82, - "learning_rate": 7.123908292060973e-07, - "loss": 0.6846, - "step": 70823 - }, - { - "epoch": 1.82, - "learning_rate": 7.123643279981786e-07, - "loss": 0.5781, - "step": 70824 - }, - { - "epoch": 1.82, - "learning_rate": 7.12337827010489e-07, - "loss": 0.5066, - "step": 70825 - }, - { - "epoch": 1.82, - "learning_rate": 7.123113262430492e-07, - "loss": 0.394, - "step": 70826 - }, - { - "epoch": 1.82, - "learning_rate": 7.122848256958792e-07, - "loss": 0.6299, - "step": 70827 - }, - { - "epoch": 1.82, - "learning_rate": 7.122583253689998e-07, - "loss": 0.7314, - "step": 70828 - }, - { - "epoch": 1.82, - "learning_rate": 7.122318252624307e-07, - "loss": 0.5608, - "step": 70829 - }, - { - "epoch": 1.82, - "learning_rate": 7.122053253761928e-07, - "loss": 0.6807, - "step": 70830 - }, - { - "epoch": 1.82, - "learning_rate": 7.12178825710306e-07, - "loss": 0.6611, - "step": 70831 - }, - { - "epoch": 1.82, - "learning_rate": 7.121523262647903e-07, - "loss": 0.6147, - "step": 70832 - }, - { - "epoch": 1.82, - "learning_rate": 7.121258270396666e-07, - "loss": 0.8848, - "step": 70833 - }, - { - "epoch": 1.82, - "learning_rate": 7.12099328034955e-07, - "loss": 0.4941, - "step": 70834 - }, - { - "epoch": 1.82, - "learning_rate": 7.120728292506754e-07, - "loss": 0.7656, - "step": 70835 - }, - { - "epoch": 1.82, - "learning_rate": 7.120463306868487e-07, - "loss": 0.7188, - "step": 70836 - }, - { - "epoch": 1.82, - "learning_rate": 7.120198323434945e-07, - "loss": 0.4399, - "step": 70837 - }, - { - "epoch": 1.82, - "learning_rate": 7.119933342206337e-07, - "loss": 0.7988, - "step": 70838 - }, - { - "epoch": 1.82, - "learning_rate": 7.119668363182864e-07, - "loss": 0.6455, - "step": 70839 - }, - { - "epoch": 1.82, - "learning_rate": 7.119403386364731e-07, - "loss": 0.5947, - "step": 70840 - }, - { - "epoch": 1.82, - "learning_rate": 7.119138411752136e-07, - "loss": 0.5371, - "step": 70841 - }, - { - "epoch": 1.82, - "learning_rate": 7.118873439345282e-07, - "loss": 0.5659, - "step": 70842 - }, - { - "epoch": 1.82, - "learning_rate": 7.118608469144376e-07, - "loss": 0.5664, - "step": 70843 - }, - { - "epoch": 1.82, - "learning_rate": 7.118343501149617e-07, - "loss": 0.6011, - "step": 70844 - }, - { - "epoch": 1.82, - "learning_rate": 7.118078535361214e-07, - "loss": 0.6211, - "step": 70845 - }, - { - "epoch": 1.82, - "learning_rate": 7.117813571779361e-07, - "loss": 0.5654, - "step": 70846 - }, - { - "epoch": 1.82, - "learning_rate": 7.117548610404269e-07, - "loss": 0.5596, - "step": 70847 - }, - { - "epoch": 1.82, - "learning_rate": 7.117283651236135e-07, - "loss": 0.7764, - "step": 70848 - }, - { - "epoch": 1.82, - "learning_rate": 7.117018694275168e-07, - "loss": 0.5928, - "step": 70849 - }, - { - "epoch": 1.82, - "learning_rate": 7.116753739521569e-07, - "loss": 0.6509, - "step": 70850 - }, - { - "epoch": 1.82, - "learning_rate": 7.116488786975532e-07, - "loss": 0.7217, - "step": 70851 - }, - { - "epoch": 1.82, - "learning_rate": 7.116223836637272e-07, - "loss": 0.707, - "step": 70852 - }, - { - "epoch": 1.82, - "learning_rate": 7.115958888506986e-07, - "loss": 0.4626, - "step": 70853 - }, - { - "epoch": 1.82, - "learning_rate": 7.115693942584875e-07, - "loss": 0.5261, - "step": 70854 - }, - { - "epoch": 1.82, - "learning_rate": 7.115428998871147e-07, - "loss": 0.6343, - "step": 70855 - }, - { - "epoch": 1.82, - "learning_rate": 7.115164057366e-07, - "loss": 0.5747, - "step": 70856 - }, - { - "epoch": 1.82, - "learning_rate": 7.114899118069642e-07, - "loss": 0.6406, - "step": 70857 - }, - { - "epoch": 1.82, - "learning_rate": 7.114634180982271e-07, - "loss": 0.5913, - "step": 70858 - }, - { - "epoch": 1.82, - "learning_rate": 7.114369246104093e-07, - "loss": 0.6963, - "step": 70859 - }, - { - "epoch": 1.82, - "learning_rate": 7.114104313435312e-07, - "loss": 0.3267, - "step": 70860 - }, - { - "epoch": 1.82, - "learning_rate": 7.113839382976126e-07, - "loss": 0.6514, - "step": 70861 - }, - { - "epoch": 1.82, - "learning_rate": 7.113574454726741e-07, - "loss": 0.7871, - "step": 70862 - }, - { - "epoch": 1.82, - "learning_rate": 7.113309528687356e-07, - "loss": 0.6846, - "step": 70863 - }, - { - "epoch": 1.82, - "learning_rate": 7.113044604858182e-07, - "loss": 0.6479, - "step": 70864 - }, - { - "epoch": 1.82, - "learning_rate": 7.112779683239414e-07, - "loss": 0.7148, - "step": 70865 - }, - { - "epoch": 1.82, - "learning_rate": 7.112514763831259e-07, - "loss": 0.7627, - "step": 70866 - }, - { - "epoch": 1.82, - "learning_rate": 7.112249846633917e-07, - "loss": 0.6934, - "step": 70867 - }, - { - "epoch": 1.82, - "learning_rate": 7.111984931647597e-07, - "loss": 0.751, - "step": 70868 - }, - { - "epoch": 1.82, - "learning_rate": 7.111720018872493e-07, - "loss": 0.7432, - "step": 70869 - }, - { - "epoch": 1.82, - "learning_rate": 7.111455108308818e-07, - "loss": 0.603, - "step": 70870 - }, - { - "epoch": 1.82, - "learning_rate": 7.111190199956763e-07, - "loss": 0.6953, - "step": 70871 - }, - { - "epoch": 1.82, - "learning_rate": 7.11092529381654e-07, - "loss": 0.5986, - "step": 70872 - }, - { - "epoch": 1.82, - "learning_rate": 7.110660389888345e-07, - "loss": 0.7129, - "step": 70873 - }, - { - "epoch": 1.82, - "learning_rate": 7.110395488172388e-07, - "loss": 0.6304, - "step": 70874 - }, - { - "epoch": 1.82, - "learning_rate": 7.110130588668865e-07, - "loss": 0.5239, - "step": 70875 - }, - { - "epoch": 1.82, - "learning_rate": 7.109865691377985e-07, - "loss": 0.502, - "step": 70876 - }, - { - "epoch": 1.82, - "learning_rate": 7.109600796299946e-07, - "loss": 0.584, - "step": 70877 - }, - { - "epoch": 1.82, - "learning_rate": 7.109335903434955e-07, - "loss": 0.6667, - "step": 70878 - }, - { - "epoch": 1.82, - "learning_rate": 7.10907101278321e-07, - "loss": 0.7725, - "step": 70879 - }, - { - "epoch": 1.82, - "learning_rate": 7.108806124344921e-07, - "loss": 0.624, - "step": 70880 - }, - { - "epoch": 1.82, - "learning_rate": 7.108541238120284e-07, - "loss": 0.5322, - "step": 70881 - }, - { - "epoch": 1.82, - "learning_rate": 7.108276354109501e-07, - "loss": 0.6968, - "step": 70882 - }, - { - "epoch": 1.82, - "learning_rate": 7.108011472312782e-07, - "loss": 0.5303, - "step": 70883 - }, - { - "epoch": 1.82, - "learning_rate": 7.107746592730322e-07, - "loss": 0.6567, - "step": 70884 - }, - { - "epoch": 1.82, - "learning_rate": 7.107481715362329e-07, - "loss": 0.4507, - "step": 70885 - }, - { - "epoch": 1.82, - "learning_rate": 7.107216840209003e-07, - "loss": 0.5701, - "step": 70886 - }, - { - "epoch": 1.82, - "learning_rate": 7.106951967270551e-07, - "loss": 0.7744, - "step": 70887 - }, - { - "epoch": 1.82, - "learning_rate": 7.106687096547169e-07, - "loss": 0.8223, - "step": 70888 - }, - { - "epoch": 1.82, - "learning_rate": 7.106422228039068e-07, - "loss": 0.6826, - "step": 70889 - }, - { - "epoch": 1.82, - "learning_rate": 7.106157361746446e-07, - "loss": 0.46, - "step": 70890 - }, - { - "epoch": 1.82, - "learning_rate": 7.105892497669505e-07, - "loss": 0.6992, - "step": 70891 - }, - { - "epoch": 1.82, - "learning_rate": 7.105627635808447e-07, - "loss": 0.4951, - "step": 70892 - }, - { - "epoch": 1.82, - "learning_rate": 7.10536277616348e-07, - "loss": 0.5474, - "step": 70893 - }, - { - "epoch": 1.82, - "learning_rate": 7.1050979187348e-07, - "loss": 0.6167, - "step": 70894 - }, - { - "epoch": 1.82, - "learning_rate": 7.104833063522618e-07, - "loss": 0.6411, - "step": 70895 - }, - { - "epoch": 1.82, - "learning_rate": 7.104568210527126e-07, - "loss": 0.625, - "step": 70896 - }, - { - "epoch": 1.82, - "learning_rate": 7.104303359748538e-07, - "loss": 0.7783, - "step": 70897 - }, - { - "epoch": 1.82, - "learning_rate": 7.104038511187049e-07, - "loss": 0.6287, - "step": 70898 - }, - { - "epoch": 1.82, - "learning_rate": 7.103773664842867e-07, - "loss": 0.7227, - "step": 70899 - }, - { - "epoch": 1.82, - "learning_rate": 7.103508820716194e-07, - "loss": 0.4171, - "step": 70900 - }, - { - "epoch": 1.82, - "learning_rate": 7.103243978807227e-07, - "loss": 0.5425, - "step": 70901 - }, - { - "epoch": 1.82, - "learning_rate": 7.102979139116176e-07, - "loss": 0.6458, - "step": 70902 - }, - { - "epoch": 1.82, - "learning_rate": 7.102714301643237e-07, - "loss": 0.5986, - "step": 70903 - }, - { - "epoch": 1.82, - "learning_rate": 7.102449466388619e-07, - "loss": 0.6064, - "step": 70904 - }, - { - "epoch": 1.82, - "learning_rate": 7.10218463335252e-07, - "loss": 0.5923, - "step": 70905 - }, - { - "epoch": 1.82, - "learning_rate": 7.101919802535148e-07, - "loss": 0.6934, - "step": 70906 - }, - { - "epoch": 1.82, - "learning_rate": 7.101654973936702e-07, - "loss": 0.6714, - "step": 70907 - }, - { - "epoch": 1.82, - "learning_rate": 7.101390147557382e-07, - "loss": 0.6807, - "step": 70908 - }, - { - "epoch": 1.82, - "learning_rate": 7.101125323397399e-07, - "loss": 0.6699, - "step": 70909 - }, - { - "epoch": 1.82, - "learning_rate": 7.100860501456953e-07, - "loss": 0.7881, - "step": 70910 - }, - { - "epoch": 1.82, - "learning_rate": 7.100595681736239e-07, - "loss": 0.644, - "step": 70911 - }, - { - "epoch": 1.82, - "learning_rate": 7.100330864235469e-07, - "loss": 0.627, - "step": 70912 - }, - { - "epoch": 1.82, - "learning_rate": 7.100066048954838e-07, - "loss": 0.6401, - "step": 70913 - }, - { - "epoch": 1.82, - "learning_rate": 7.099801235894557e-07, - "loss": 0.71, - "step": 70914 - }, - { - "epoch": 1.82, - "learning_rate": 7.099536425054822e-07, - "loss": 0.6152, - "step": 70915 - }, - { - "epoch": 1.82, - "learning_rate": 7.099271616435842e-07, - "loss": 0.5488, - "step": 70916 - }, - { - "epoch": 1.82, - "learning_rate": 7.099006810037813e-07, - "loss": 0.6611, - "step": 70917 - }, - { - "epoch": 1.82, - "learning_rate": 7.098742005860944e-07, - "loss": 0.6846, - "step": 70918 - }, - { - "epoch": 1.82, - "learning_rate": 7.098477203905432e-07, - "loss": 0.7617, - "step": 70919 - }, - { - "epoch": 1.82, - "learning_rate": 7.098212404171486e-07, - "loss": 0.5098, - "step": 70920 - }, - { - "epoch": 1.82, - "learning_rate": 7.097947606659304e-07, - "loss": 0.6226, - "step": 70921 - }, - { - "epoch": 1.82, - "learning_rate": 7.09768281136909e-07, - "loss": 0.7178, - "step": 70922 - }, - { - "epoch": 1.82, - "learning_rate": 7.097418018301046e-07, - "loss": 0.6772, - "step": 70923 - }, - { - "epoch": 1.82, - "learning_rate": 7.097153227455378e-07, - "loss": 0.5513, - "step": 70924 - }, - { - "epoch": 1.82, - "learning_rate": 7.096888438832283e-07, - "loss": 0.3379, - "step": 70925 - }, - { - "epoch": 1.82, - "learning_rate": 7.096623652431969e-07, - "loss": 0.5793, - "step": 70926 - }, - { - "epoch": 1.82, - "learning_rate": 7.096358868254635e-07, - "loss": 0.6094, - "step": 70927 - }, - { - "epoch": 1.82, - "learning_rate": 7.096094086300487e-07, - "loss": 0.6934, - "step": 70928 - }, - { - "epoch": 1.82, - "learning_rate": 7.095829306569729e-07, - "loss": 0.5127, - "step": 70929 - }, - { - "epoch": 1.82, - "learning_rate": 7.095564529062556e-07, - "loss": 0.5933, - "step": 70930 - }, - { - "epoch": 1.82, - "learning_rate": 7.095299753779178e-07, - "loss": 0.8057, - "step": 70931 - }, - { - "epoch": 1.82, - "learning_rate": 7.095034980719794e-07, - "loss": 0.7075, - "step": 70932 - }, - { - "epoch": 1.82, - "learning_rate": 7.094770209884611e-07, - "loss": 0.4583, - "step": 70933 - }, - { - "epoch": 1.82, - "learning_rate": 7.094505441273824e-07, - "loss": 0.7422, - "step": 70934 - }, - { - "epoch": 1.82, - "learning_rate": 7.094240674887645e-07, - "loss": 0.6484, - "step": 70935 - }, - { - "epoch": 1.82, - "learning_rate": 7.093975910726269e-07, - "loss": 0.7568, - "step": 70936 - }, - { - "epoch": 1.82, - "learning_rate": 7.093711148789905e-07, - "loss": 0.519, - "step": 70937 - }, - { - "epoch": 1.82, - "learning_rate": 7.09344638907875e-07, - "loss": 0.76, - "step": 70938 - }, - { - "epoch": 1.82, - "learning_rate": 7.093181631593014e-07, - "loss": 0.6406, - "step": 70939 - }, - { - "epoch": 1.82, - "learning_rate": 7.092916876332893e-07, - "loss": 0.6016, - "step": 70940 - }, - { - "epoch": 1.82, - "learning_rate": 7.09265212329859e-07, - "loss": 0.5776, - "step": 70941 - }, - { - "epoch": 1.82, - "learning_rate": 7.092387372490311e-07, - "loss": 0.5269, - "step": 70942 - }, - { - "epoch": 1.82, - "learning_rate": 7.092122623908259e-07, - "loss": 0.7168, - "step": 70943 - }, - { - "epoch": 1.82, - "learning_rate": 7.091857877552631e-07, - "loss": 0.6289, - "step": 70944 - }, - { - "epoch": 1.82, - "learning_rate": 7.091593133423637e-07, - "loss": 0.7012, - "step": 70945 - }, - { - "epoch": 1.82, - "learning_rate": 7.091328391521473e-07, - "loss": 0.5293, - "step": 70946 - }, - { - "epoch": 1.82, - "learning_rate": 7.091063651846348e-07, - "loss": 0.665, - "step": 70947 - }, - { - "epoch": 1.82, - "learning_rate": 7.090798914398459e-07, - "loss": 0.6611, - "step": 70948 - }, - { - "epoch": 1.82, - "learning_rate": 7.090534179178017e-07, - "loss": 0.6865, - "step": 70949 - }, - { - "epoch": 1.82, - "learning_rate": 7.090269446185217e-07, - "loss": 0.7217, - "step": 70950 - }, - { - "epoch": 1.82, - "learning_rate": 7.090004715420261e-07, - "loss": 0.6299, - "step": 70951 - }, - { - "epoch": 1.82, - "learning_rate": 7.089739986883356e-07, - "loss": 0.5767, - "step": 70952 - }, - { - "epoch": 1.82, - "learning_rate": 7.089475260574703e-07, - "loss": 0.5454, - "step": 70953 - }, - { - "epoch": 1.82, - "learning_rate": 7.089210536494506e-07, - "loss": 0.5552, - "step": 70954 - }, - { - "epoch": 1.82, - "learning_rate": 7.088945814642964e-07, - "loss": 0.5594, - "step": 70955 - }, - { - "epoch": 1.82, - "learning_rate": 7.088681095020285e-07, - "loss": 0.7158, - "step": 70956 - }, - { - "epoch": 1.82, - "learning_rate": 7.088416377626667e-07, - "loss": 0.749, - "step": 70957 - }, - { - "epoch": 1.82, - "learning_rate": 7.088151662462318e-07, - "loss": 0.6584, - "step": 70958 - }, - { - "epoch": 1.82, - "learning_rate": 7.087886949527438e-07, - "loss": 0.5508, - "step": 70959 - }, - { - "epoch": 1.82, - "learning_rate": 7.087622238822227e-07, - "loss": 0.5625, - "step": 70960 - }, - { - "epoch": 1.82, - "learning_rate": 7.087357530346888e-07, - "loss": 0.4946, - "step": 70961 - }, - { - "epoch": 1.82, - "learning_rate": 7.087092824101628e-07, - "loss": 0.5615, - "step": 70962 - }, - { - "epoch": 1.82, - "learning_rate": 7.086828120086644e-07, - "loss": 0.627, - "step": 70963 - }, - { - "epoch": 1.82, - "learning_rate": 7.086563418302145e-07, - "loss": 0.6475, - "step": 70964 - }, - { - "epoch": 1.82, - "learning_rate": 7.086298718748327e-07, - "loss": 0.364, - "step": 70965 - }, - { - "epoch": 1.82, - "learning_rate": 7.086034021425399e-07, - "loss": 0.7109, - "step": 70966 - }, - { - "epoch": 1.82, - "learning_rate": 7.085769326333558e-07, - "loss": 0.7559, - "step": 70967 - }, - { - "epoch": 1.82, - "learning_rate": 7.085504633473012e-07, - "loss": 0.7979, - "step": 70968 - }, - { - "epoch": 1.82, - "learning_rate": 7.085239942843964e-07, - "loss": 0.5225, - "step": 70969 - }, - { - "epoch": 1.82, - "learning_rate": 7.084975254446608e-07, - "loss": 0.6562, - "step": 70970 - }, - { - "epoch": 1.82, - "learning_rate": 7.084710568281155e-07, - "loss": 0.6602, - "step": 70971 - }, - { - "epoch": 1.82, - "learning_rate": 7.084445884347803e-07, - "loss": 0.5144, - "step": 70972 - }, - { - "epoch": 1.82, - "learning_rate": 7.084181202646759e-07, - "loss": 0.7314, - "step": 70973 - }, - { - "epoch": 1.82, - "learning_rate": 7.083916523178222e-07, - "loss": 0.8613, - "step": 70974 - }, - { - "epoch": 1.82, - "learning_rate": 7.083651845942398e-07, - "loss": 0.5098, - "step": 70975 - }, - { - "epoch": 1.82, - "learning_rate": 7.083387170939486e-07, - "loss": 0.3721, - "step": 70976 - }, - { - "epoch": 1.82, - "learning_rate": 7.08312249816969e-07, - "loss": 0.5786, - "step": 70977 - }, - { - "epoch": 1.82, - "learning_rate": 7.082857827633213e-07, - "loss": 0.6841, - "step": 70978 - }, - { - "epoch": 1.82, - "learning_rate": 7.082593159330263e-07, - "loss": 0.5962, - "step": 70979 - }, - { - "epoch": 1.82, - "learning_rate": 7.082328493261031e-07, - "loss": 0.6206, - "step": 70980 - }, - { - "epoch": 1.82, - "learning_rate": 7.082063829425729e-07, - "loss": 0.5293, - "step": 70981 - }, - { - "epoch": 1.82, - "learning_rate": 7.081799167824554e-07, - "loss": 0.5693, - "step": 70982 - }, - { - "epoch": 1.82, - "learning_rate": 7.081534508457713e-07, - "loss": 0.7314, - "step": 70983 - }, - { - "epoch": 1.82, - "learning_rate": 7.081269851325404e-07, - "loss": 0.6436, - "step": 70984 - }, - { - "epoch": 1.82, - "learning_rate": 7.081005196427836e-07, - "loss": 0.7598, - "step": 70985 - }, - { - "epoch": 1.82, - "learning_rate": 7.080740543765205e-07, - "loss": 0.5874, - "step": 70986 - }, - { - "epoch": 1.82, - "learning_rate": 7.080475893337718e-07, - "loss": 0.7979, - "step": 70987 - }, - { - "epoch": 1.82, - "learning_rate": 7.080211245145576e-07, - "loss": 0.6577, - "step": 70988 - }, - { - "epoch": 1.82, - "learning_rate": 7.079946599188987e-07, - "loss": 0.5664, - "step": 70989 - }, - { - "epoch": 1.82, - "learning_rate": 7.079681955468144e-07, - "loss": 0.5437, - "step": 70990 - }, - { - "epoch": 1.82, - "learning_rate": 7.079417313983254e-07, - "loss": 0.6738, - "step": 70991 - }, - { - "epoch": 1.82, - "learning_rate": 7.079152674734521e-07, - "loss": 0.54, - "step": 70992 - }, - { - "epoch": 1.82, - "learning_rate": 7.078888037722144e-07, - "loss": 0.6196, - "step": 70993 - }, - { - "epoch": 1.82, - "learning_rate": 7.078623402946331e-07, - "loss": 0.7324, - "step": 70994 - }, - { - "epoch": 1.82, - "learning_rate": 7.07835877040728e-07, - "loss": 0.6143, - "step": 70995 - }, - { - "epoch": 1.82, - "learning_rate": 7.078094140105197e-07, - "loss": 0.7314, - "step": 70996 - }, - { - "epoch": 1.82, - "learning_rate": 7.077829512040283e-07, - "loss": 0.7852, - "step": 70997 - }, - { - "epoch": 1.82, - "learning_rate": 7.077564886212739e-07, - "loss": 0.6748, - "step": 70998 - }, - { - "epoch": 1.82, - "learning_rate": 7.077300262622772e-07, - "loss": 0.7285, - "step": 70999 - }, - { - "epoch": 1.82, - "learning_rate": 7.077035641270581e-07, - "loss": 0.6963, - "step": 71000 - }, - { - "epoch": 1.82, - "learning_rate": 7.076771022156367e-07, - "loss": 0.5269, - "step": 71001 - }, - { - "epoch": 1.82, - "learning_rate": 7.076506405280336e-07, - "loss": 0.6504, - "step": 71002 - }, - { - "epoch": 1.82, - "learning_rate": 7.076241790642689e-07, - "loss": 0.7471, - "step": 71003 - }, - { - "epoch": 1.82, - "learning_rate": 7.07597717824363e-07, - "loss": 0.6431, - "step": 71004 - }, - { - "epoch": 1.82, - "learning_rate": 7.075712568083361e-07, - "loss": 0.5513, - "step": 71005 - }, - { - "epoch": 1.82, - "learning_rate": 7.075447960162084e-07, - "loss": 0.4443, - "step": 71006 - }, - { - "epoch": 1.82, - "learning_rate": 7.075183354480001e-07, - "loss": 0.5825, - "step": 71007 - }, - { - "epoch": 1.82, - "learning_rate": 7.074918751037317e-07, - "loss": 0.6621, - "step": 71008 - }, - { - "epoch": 1.82, - "learning_rate": 7.074654149834236e-07, - "loss": 0.6587, - "step": 71009 - }, - { - "epoch": 1.82, - "learning_rate": 7.074389550870954e-07, - "loss": 0.6797, - "step": 71010 - }, - { - "epoch": 1.82, - "learning_rate": 7.07412495414768e-07, - "loss": 0.7002, - "step": 71011 - }, - { - "epoch": 1.82, - "learning_rate": 7.073860359664609e-07, - "loss": 0.7383, - "step": 71012 - }, - { - "epoch": 1.82, - "learning_rate": 7.073595767421954e-07, - "loss": 0.748, - "step": 71013 - }, - { - "epoch": 1.82, - "learning_rate": 7.073331177419907e-07, - "loss": 0.5693, - "step": 71014 - }, - { - "epoch": 1.82, - "learning_rate": 7.073066589658681e-07, - "loss": 0.5459, - "step": 71015 - }, - { - "epoch": 1.82, - "learning_rate": 7.072802004138472e-07, - "loss": 0.7676, - "step": 71016 - }, - { - "epoch": 1.82, - "learning_rate": 7.072537420859481e-07, - "loss": 0.4183, - "step": 71017 - }, - { - "epoch": 1.82, - "learning_rate": 7.072272839821916e-07, - "loss": 0.5259, - "step": 71018 - }, - { - "epoch": 1.82, - "learning_rate": 7.072008261025981e-07, - "loss": 0.6558, - "step": 71019 - }, - { - "epoch": 1.82, - "learning_rate": 7.071743684471868e-07, - "loss": 0.6689, - "step": 71020 - }, - { - "epoch": 1.82, - "learning_rate": 7.071479110159789e-07, - "loss": 0.793, - "step": 71021 - }, - { - "epoch": 1.82, - "learning_rate": 7.071214538089943e-07, - "loss": 0.7275, - "step": 71022 - }, - { - "epoch": 1.82, - "learning_rate": 7.070949968262534e-07, - "loss": 0.7363, - "step": 71023 - }, - { - "epoch": 1.82, - "learning_rate": 7.070685400677762e-07, - "loss": 0.7334, - "step": 71024 - }, - { - "epoch": 1.82, - "learning_rate": 7.070420835335833e-07, - "loss": 0.3972, - "step": 71025 - }, - { - "epoch": 1.82, - "learning_rate": 7.070156272236946e-07, - "loss": 0.6777, - "step": 71026 - }, - { - "epoch": 1.82, - "learning_rate": 7.06989171138131e-07, - "loss": 0.5884, - "step": 71027 - }, - { - "epoch": 1.82, - "learning_rate": 7.069627152769119e-07, - "loss": 0.6211, - "step": 71028 - }, - { - "epoch": 1.82, - "learning_rate": 7.069362596400585e-07, - "loss": 0.7085, - "step": 71029 - }, - { - "epoch": 1.82, - "learning_rate": 7.069098042275903e-07, - "loss": 0.5977, - "step": 71030 - }, - { - "epoch": 1.82, - "learning_rate": 7.068833490395275e-07, - "loss": 0.6279, - "step": 71031 - }, - { - "epoch": 1.82, - "learning_rate": 7.068568940758908e-07, - "loss": 0.427, - "step": 71032 - }, - { - "epoch": 1.82, - "learning_rate": 7.068304393367005e-07, - "loss": 0.4592, - "step": 71033 - }, - { - "epoch": 1.82, - "learning_rate": 7.068039848219763e-07, - "loss": 0.519, - "step": 71034 - }, - { - "epoch": 1.82, - "learning_rate": 7.067775305317391e-07, - "loss": 0.4492, - "step": 71035 - }, - { - "epoch": 1.82, - "learning_rate": 7.067510764660086e-07, - "loss": 0.8262, - "step": 71036 - }, - { - "epoch": 1.82, - "learning_rate": 7.067246226248056e-07, - "loss": 0.5742, - "step": 71037 - }, - { - "epoch": 1.82, - "learning_rate": 7.066981690081497e-07, - "loss": 0.5483, - "step": 71038 - }, - { - "epoch": 1.82, - "learning_rate": 7.06671715616062e-07, - "loss": 0.6812, - "step": 71039 - }, - { - "epoch": 1.82, - "learning_rate": 7.066452624485622e-07, - "loss": 0.6104, - "step": 71040 - }, - { - "epoch": 1.82, - "learning_rate": 7.066188095056702e-07, - "loss": 0.4399, - "step": 71041 - }, - { - "epoch": 1.82, - "learning_rate": 7.065923567874072e-07, - "loss": 0.7383, - "step": 71042 - }, - { - "epoch": 1.82, - "learning_rate": 7.065659042937924e-07, - "loss": 0.5161, - "step": 71043 - }, - { - "epoch": 1.82, - "learning_rate": 7.065394520248471e-07, - "loss": 0.6177, - "step": 71044 - }, - { - "epoch": 1.82, - "learning_rate": 7.065129999805906e-07, - "loss": 0.5647, - "step": 71045 - }, - { - "epoch": 1.82, - "learning_rate": 7.06486548161044e-07, - "loss": 0.5659, - "step": 71046 - }, - { - "epoch": 1.82, - "learning_rate": 7.064600965662268e-07, - "loss": 0.562, - "step": 71047 - }, - { - "epoch": 1.82, - "learning_rate": 7.064336451961599e-07, - "loss": 0.7627, - "step": 71048 - }, - { - "epoch": 1.82, - "learning_rate": 7.064071940508635e-07, - "loss": 0.6211, - "step": 71049 - }, - { - "epoch": 1.82, - "learning_rate": 7.063807431303573e-07, - "loss": 0.7744, - "step": 71050 - }, - { - "epoch": 1.82, - "learning_rate": 7.063542924346618e-07, - "loss": 0.5652, - "step": 71051 - }, - { - "epoch": 1.82, - "learning_rate": 7.063278419637973e-07, - "loss": 0.7773, - "step": 71052 - }, - { - "epoch": 1.82, - "learning_rate": 7.063013917177841e-07, - "loss": 0.8066, - "step": 71053 - }, - { - "epoch": 1.82, - "learning_rate": 7.062749416966425e-07, - "loss": 0.7256, - "step": 71054 - }, - { - "epoch": 1.82, - "learning_rate": 7.062484919003924e-07, - "loss": 0.5879, - "step": 71055 - }, - { - "epoch": 1.82, - "learning_rate": 7.062220423290545e-07, - "loss": 0.9297, - "step": 71056 - }, - { - "epoch": 1.82, - "learning_rate": 7.061955929826489e-07, - "loss": 0.5815, - "step": 71057 - }, - { - "epoch": 1.82, - "learning_rate": 7.061691438611959e-07, - "loss": 0.5452, - "step": 71058 - }, - { - "epoch": 1.82, - "learning_rate": 7.061426949647159e-07, - "loss": 0.6836, - "step": 71059 - }, - { - "epoch": 1.82, - "learning_rate": 7.061162462932284e-07, - "loss": 0.7568, - "step": 71060 - }, - { - "epoch": 1.82, - "learning_rate": 7.060897978467546e-07, - "loss": 0.7285, - "step": 71061 - }, - { - "epoch": 1.82, - "learning_rate": 7.06063349625314e-07, - "loss": 0.5532, - "step": 71062 - }, - { - "epoch": 1.82, - "learning_rate": 7.060369016289274e-07, - "loss": 0.8428, - "step": 71063 - }, - { - "epoch": 1.82, - "learning_rate": 7.060104538576146e-07, - "loss": 0.6924, - "step": 71064 - }, - { - "epoch": 1.82, - "learning_rate": 7.059840063113962e-07, - "loss": 0.6538, - "step": 71065 - }, - { - "epoch": 1.82, - "learning_rate": 7.059575589902923e-07, - "loss": 0.5947, - "step": 71066 - }, - { - "epoch": 1.82, - "learning_rate": 7.059311118943233e-07, - "loss": 0.6592, - "step": 71067 - }, - { - "epoch": 1.82, - "learning_rate": 7.05904665023509e-07, - "loss": 0.4854, - "step": 71068 - }, - { - "epoch": 1.82, - "learning_rate": 7.058782183778709e-07, - "loss": 0.5002, - "step": 71069 - }, - { - "epoch": 1.82, - "learning_rate": 7.058517719574275e-07, - "loss": 0.7178, - "step": 71070 - }, - { - "epoch": 1.82, - "learning_rate": 7.058253257622e-07, - "loss": 0.6514, - "step": 71071 - }, - { - "epoch": 1.82, - "learning_rate": 7.057988797922086e-07, - "loss": 0.5767, - "step": 71072 - }, - { - "epoch": 1.82, - "learning_rate": 7.057724340474734e-07, - "loss": 0.6982, - "step": 71073 - }, - { - "epoch": 1.82, - "learning_rate": 7.057459885280145e-07, - "loss": 0.6846, - "step": 71074 - }, - { - "epoch": 1.82, - "learning_rate": 7.057195432338527e-07, - "loss": 0.6992, - "step": 71075 - }, - { - "epoch": 1.82, - "learning_rate": 7.056930981650078e-07, - "loss": 0.6372, - "step": 71076 - }, - { - "epoch": 1.82, - "learning_rate": 7.056666533215001e-07, - "loss": 0.5558, - "step": 71077 - }, - { - "epoch": 1.82, - "learning_rate": 7.056402087033499e-07, - "loss": 0.7529, - "step": 71078 - }, - { - "epoch": 1.82, - "learning_rate": 7.056137643105779e-07, - "loss": 0.5688, - "step": 71079 - }, - { - "epoch": 1.82, - "learning_rate": 7.055873201432035e-07, - "loss": 0.6514, - "step": 71080 - }, - { - "epoch": 1.82, - "learning_rate": 7.055608762012472e-07, - "loss": 0.5566, - "step": 71081 - }, - { - "epoch": 1.82, - "learning_rate": 7.055344324847299e-07, - "loss": 0.5811, - "step": 71082 - }, - { - "epoch": 1.82, - "learning_rate": 7.055079889936708e-07, - "loss": 0.603, - "step": 71083 - }, - { - "epoch": 1.82, - "learning_rate": 7.05481545728091e-07, - "loss": 0.7275, - "step": 71084 - }, - { - "epoch": 1.82, - "learning_rate": 7.054551026880103e-07, - "loss": 0.5603, - "step": 71085 - }, - { - "epoch": 1.82, - "learning_rate": 7.054286598734491e-07, - "loss": 0.6987, - "step": 71086 - }, - { - "epoch": 1.82, - "learning_rate": 7.054022172844278e-07, - "loss": 0.771, - "step": 71087 - }, - { - "epoch": 1.82, - "learning_rate": 7.053757749209664e-07, - "loss": 0.6416, - "step": 71088 - }, - { - "epoch": 1.82, - "learning_rate": 7.053493327830853e-07, - "loss": 0.5653, - "step": 71089 - }, - { - "epoch": 1.82, - "learning_rate": 7.053228908708047e-07, - "loss": 0.666, - "step": 71090 - }, - { - "epoch": 1.82, - "learning_rate": 7.052964491841445e-07, - "loss": 0.5934, - "step": 71091 - }, - { - "epoch": 1.82, - "learning_rate": 7.052700077231255e-07, - "loss": 0.646, - "step": 71092 - }, - { - "epoch": 1.82, - "learning_rate": 7.052435664877675e-07, - "loss": 0.6304, - "step": 71093 - }, - { - "epoch": 1.82, - "learning_rate": 7.052171254780912e-07, - "loss": 0.6313, - "step": 71094 - }, - { - "epoch": 1.82, - "learning_rate": 7.051906846941162e-07, - "loss": 0.7402, - "step": 71095 - }, - { - "epoch": 1.82, - "learning_rate": 7.051642441358636e-07, - "loss": 0.6162, - "step": 71096 - }, - { - "epoch": 1.82, - "learning_rate": 7.051378038033529e-07, - "loss": 0.7891, - "step": 71097 - }, - { - "epoch": 1.82, - "learning_rate": 7.051113636966047e-07, - "loss": 0.7422, - "step": 71098 - }, - { - "epoch": 1.82, - "learning_rate": 7.050849238156396e-07, - "loss": 0.5635, - "step": 71099 - }, - { - "epoch": 1.82, - "learning_rate": 7.050584841604767e-07, - "loss": 0.6445, - "step": 71100 - }, - { - "epoch": 1.82, - "learning_rate": 7.050320447311374e-07, - "loss": 0.6738, - "step": 71101 - }, - { - "epoch": 1.82, - "learning_rate": 7.050056055276412e-07, - "loss": 0.5249, - "step": 71102 - }, - { - "epoch": 1.82, - "learning_rate": 7.049791665500089e-07, - "loss": 0.5193, - "step": 71103 - }, - { - "epoch": 1.82, - "learning_rate": 7.049527277982602e-07, - "loss": 0.7119, - "step": 71104 - }, - { - "epoch": 1.82, - "learning_rate": 7.049262892724159e-07, - "loss": 0.6855, - "step": 71105 - }, - { - "epoch": 1.82, - "learning_rate": 7.048998509724959e-07, - "loss": 0.6113, - "step": 71106 - }, - { - "epoch": 1.82, - "learning_rate": 7.048734128985204e-07, - "loss": 0.6543, - "step": 71107 - }, - { - "epoch": 1.82, - "learning_rate": 7.048469750505099e-07, - "loss": 0.6455, - "step": 71108 - }, - { - "epoch": 1.82, - "learning_rate": 7.048205374284848e-07, - "loss": 0.6235, - "step": 71109 - }, - { - "epoch": 1.82, - "learning_rate": 7.047941000324645e-07, - "loss": 0.4824, - "step": 71110 - }, - { - "epoch": 1.82, - "learning_rate": 7.047676628624701e-07, - "loss": 0.6865, - "step": 71111 - }, - { - "epoch": 1.82, - "learning_rate": 7.047412259185213e-07, - "loss": 0.7637, - "step": 71112 - }, - { - "epoch": 1.82, - "learning_rate": 7.047147892006388e-07, - "loss": 0.7041, - "step": 71113 - }, - { - "epoch": 1.82, - "learning_rate": 7.046883527088423e-07, - "loss": 0.7246, - "step": 71114 - }, - { - "epoch": 1.82, - "learning_rate": 7.046619164431526e-07, - "loss": 0.5676, - "step": 71115 - }, - { - "epoch": 1.82, - "learning_rate": 7.046354804035894e-07, - "loss": 0.6221, - "step": 71116 - }, - { - "epoch": 1.82, - "learning_rate": 7.046090445901736e-07, - "loss": 0.6602, - "step": 71117 - }, - { - "epoch": 1.82, - "learning_rate": 7.045826090029247e-07, - "loss": 0.5415, - "step": 71118 - }, - { - "epoch": 1.82, - "learning_rate": 7.045561736418639e-07, - "loss": 0.7061, - "step": 71119 - }, - { - "epoch": 1.82, - "learning_rate": 7.045297385070106e-07, - "loss": 0.6602, - "step": 71120 - }, - { - "epoch": 1.82, - "learning_rate": 7.045033035983851e-07, - "loss": 0.5928, - "step": 71121 - }, - { - "epoch": 1.82, - "learning_rate": 7.044768689160078e-07, - "loss": 0.6958, - "step": 71122 - }, - { - "epoch": 1.82, - "learning_rate": 7.044504344598994e-07, - "loss": 0.6128, - "step": 71123 - }, - { - "epoch": 1.82, - "learning_rate": 7.044240002300791e-07, - "loss": 0.5767, - "step": 71124 - }, - { - "epoch": 1.82, - "learning_rate": 7.043975662265682e-07, - "loss": 0.7065, - "step": 71125 - }, - { - "epoch": 1.82, - "learning_rate": 7.043711324493862e-07, - "loss": 0.6787, - "step": 71126 - }, - { - "epoch": 1.82, - "learning_rate": 7.043446988985538e-07, - "loss": 0.5342, - "step": 71127 - }, - { - "epoch": 1.82, - "learning_rate": 7.043182655740909e-07, - "loss": 0.5244, - "step": 71128 - }, - { - "epoch": 1.82, - "learning_rate": 7.042918324760184e-07, - "loss": 0.5557, - "step": 71129 - }, - { - "epoch": 1.82, - "learning_rate": 7.042653996043558e-07, - "loss": 0.8008, - "step": 71130 - }, - { - "epoch": 1.82, - "learning_rate": 7.042389669591233e-07, - "loss": 0.6162, - "step": 71131 - }, - { - "epoch": 1.82, - "learning_rate": 7.042125345403418e-07, - "loss": 0.4187, - "step": 71132 - }, - { - "epoch": 1.82, - "learning_rate": 7.041861023480308e-07, - "loss": 0.5366, - "step": 71133 - }, - { - "epoch": 1.82, - "learning_rate": 7.041596703822111e-07, - "loss": 0.8281, - "step": 71134 - }, - { - "epoch": 1.82, - "learning_rate": 7.041332386429026e-07, - "loss": 0.6267, - "step": 71135 - }, - { - "epoch": 1.82, - "learning_rate": 7.04106807130126e-07, - "loss": 0.7578, - "step": 71136 - }, - { - "epoch": 1.82, - "learning_rate": 7.040803758439006e-07, - "loss": 0.6167, - "step": 71137 - }, - { - "epoch": 1.82, - "learning_rate": 7.040539447842479e-07, - "loss": 0.6235, - "step": 71138 - }, - { - "epoch": 1.82, - "learning_rate": 7.040275139511875e-07, - "loss": 0.6035, - "step": 71139 - }, - { - "epoch": 1.82, - "learning_rate": 7.040010833447394e-07, - "loss": 0.5181, - "step": 71140 - }, - { - "epoch": 1.82, - "learning_rate": 7.039746529649239e-07, - "loss": 0.6064, - "step": 71141 - }, - { - "epoch": 1.82, - "learning_rate": 7.039482228117616e-07, - "loss": 0.7578, - "step": 71142 - }, - { - "epoch": 1.82, - "learning_rate": 7.039217928852724e-07, - "loss": 0.6523, - "step": 71143 - }, - { - "epoch": 1.82, - "learning_rate": 7.038953631854767e-07, - "loss": 0.615, - "step": 71144 - }, - { - "epoch": 1.82, - "learning_rate": 7.038689337123946e-07, - "loss": 0.6079, - "step": 71145 - }, - { - "epoch": 1.82, - "learning_rate": 7.038425044660465e-07, - "loss": 0.615, - "step": 71146 - }, - { - "epoch": 1.82, - "learning_rate": 7.038160754464527e-07, - "loss": 0.6133, - "step": 71147 - }, - { - "epoch": 1.82, - "learning_rate": 7.037896466536333e-07, - "loss": 0.5625, - "step": 71148 - }, - { - "epoch": 1.82, - "learning_rate": 7.037632180876087e-07, - "loss": 0.5095, - "step": 71149 - }, - { - "epoch": 1.82, - "learning_rate": 7.037367897483987e-07, - "loss": 0.6079, - "step": 71150 - }, - { - "epoch": 1.82, - "learning_rate": 7.037103616360239e-07, - "loss": 0.7539, - "step": 71151 - }, - { - "epoch": 1.82, - "learning_rate": 7.036839337505043e-07, - "loss": 0.6875, - "step": 71152 - }, - { - "epoch": 1.82, - "learning_rate": 7.036575060918606e-07, - "loss": 0.7871, - "step": 71153 - }, - { - "epoch": 1.82, - "learning_rate": 7.036310786601124e-07, - "loss": 0.6895, - "step": 71154 - }, - { - "epoch": 1.82, - "learning_rate": 7.036046514552805e-07, - "loss": 0.7031, - "step": 71155 - }, - { - "epoch": 1.82, - "learning_rate": 7.035782244773847e-07, - "loss": 0.6406, - "step": 71156 - }, - { - "epoch": 1.82, - "learning_rate": 7.035517977264456e-07, - "loss": 0.5669, - "step": 71157 - }, - { - "epoch": 1.82, - "learning_rate": 7.035253712024831e-07, - "loss": 0.4261, - "step": 71158 - }, - { - "epoch": 1.82, - "learning_rate": 7.034989449055181e-07, - "loss": 0.5454, - "step": 71159 - }, - { - "epoch": 1.82, - "learning_rate": 7.034725188355697e-07, - "loss": 0.7539, - "step": 71160 - }, - { - "epoch": 1.82, - "learning_rate": 7.034460929926591e-07, - "loss": 0.5728, - "step": 71161 - }, - { - "epoch": 1.82, - "learning_rate": 7.034196673768058e-07, - "loss": 0.6318, - "step": 71162 - }, - { - "epoch": 1.82, - "learning_rate": 7.033932419880309e-07, - "loss": 0.7021, - "step": 71163 - }, - { - "epoch": 1.82, - "learning_rate": 7.033668168263538e-07, - "loss": 0.8242, - "step": 71164 - }, - { - "epoch": 1.82, - "learning_rate": 7.033403918917952e-07, - "loss": 0.6323, - "step": 71165 - }, - { - "epoch": 1.82, - "learning_rate": 7.033139671843751e-07, - "loss": 0.6445, - "step": 71166 - }, - { - "epoch": 1.82, - "learning_rate": 7.032875427041141e-07, - "loss": 0.5654, - "step": 71167 - }, - { - "epoch": 1.82, - "learning_rate": 7.03261118451032e-07, - "loss": 0.6582, - "step": 71168 - }, - { - "epoch": 1.82, - "learning_rate": 7.032346944251495e-07, - "loss": 0.5601, - "step": 71169 - }, - { - "epoch": 1.82, - "learning_rate": 7.032082706264864e-07, - "loss": 0.7246, - "step": 71170 - }, - { - "epoch": 1.82, - "learning_rate": 7.031818470550629e-07, - "loss": 0.6426, - "step": 71171 - }, - { - "epoch": 1.82, - "learning_rate": 7.031554237108997e-07, - "loss": 0.6077, - "step": 71172 - }, - { - "epoch": 1.82, - "learning_rate": 7.031290005940163e-07, - "loss": 0.5864, - "step": 71173 - }, - { - "epoch": 1.82, - "learning_rate": 7.031025777044338e-07, - "loss": 0.6113, - "step": 71174 - }, - { - "epoch": 1.82, - "learning_rate": 7.030761550421718e-07, - "loss": 0.7988, - "step": 71175 - }, - { - "epoch": 1.82, - "learning_rate": 7.030497326072509e-07, - "loss": 0.6655, - "step": 71176 - }, - { - "epoch": 1.82, - "learning_rate": 7.030233103996908e-07, - "loss": 0.6755, - "step": 71177 - }, - { - "epoch": 1.82, - "learning_rate": 7.029968884195125e-07, - "loss": 0.645, - "step": 71178 - }, - { - "epoch": 1.82, - "learning_rate": 7.029704666667359e-07, - "loss": 0.6143, - "step": 71179 - }, - { - "epoch": 1.82, - "learning_rate": 7.029440451413811e-07, - "loss": 0.6416, - "step": 71180 - }, - { - "epoch": 1.82, - "learning_rate": 7.02917623843468e-07, - "loss": 0.6367, - "step": 71181 - }, - { - "epoch": 1.82, - "learning_rate": 7.028912027730175e-07, - "loss": 0.7593, - "step": 71182 - }, - { - "epoch": 1.82, - "learning_rate": 7.028647819300493e-07, - "loss": 0.6943, - "step": 71183 - }, - { - "epoch": 1.82, - "learning_rate": 7.028383613145842e-07, - "loss": 0.6084, - "step": 71184 - }, - { - "epoch": 1.82, - "learning_rate": 7.028119409266417e-07, - "loss": 0.7842, - "step": 71185 - }, - { - "epoch": 1.82, - "learning_rate": 7.027855207662429e-07, - "loss": 0.5693, - "step": 71186 - }, - { - "epoch": 1.82, - "learning_rate": 7.027591008334072e-07, - "loss": 0.6641, - "step": 71187 - }, - { - "epoch": 1.82, - "learning_rate": 7.027326811281554e-07, - "loss": 0.6719, - "step": 71188 - }, - { - "epoch": 1.82, - "learning_rate": 7.027062616505078e-07, - "loss": 0.6245, - "step": 71189 - }, - { - "epoch": 1.82, - "learning_rate": 7.026798424004838e-07, - "loss": 0.8369, - "step": 71190 - }, - { - "epoch": 1.82, - "learning_rate": 7.026534233781045e-07, - "loss": 0.7568, - "step": 71191 - }, - { - "epoch": 1.82, - "learning_rate": 7.026270045833896e-07, - "loss": 0.4941, - "step": 71192 - }, - { - "epoch": 1.82, - "learning_rate": 7.026005860163596e-07, - "loss": 0.5601, - "step": 71193 - }, - { - "epoch": 1.82, - "learning_rate": 7.025741676770344e-07, - "loss": 0.5894, - "step": 71194 - }, - { - "epoch": 1.82, - "learning_rate": 7.02547749565435e-07, - "loss": 0.6636, - "step": 71195 - }, - { - "epoch": 1.82, - "learning_rate": 7.025213316815808e-07, - "loss": 0.8184, - "step": 71196 - }, - { - "epoch": 1.82, - "learning_rate": 7.024949140254923e-07, - "loss": 0.5801, - "step": 71197 - }, - { - "epoch": 1.82, - "learning_rate": 7.024684965971899e-07, - "loss": 0.752, - "step": 71198 - }, - { - "epoch": 1.82, - "learning_rate": 7.02442079396694e-07, - "loss": 0.6963, - "step": 71199 - }, - { - "epoch": 1.82, - "learning_rate": 7.024156624240241e-07, - "loss": 0.6963, - "step": 71200 - }, - { - "epoch": 1.82, - "learning_rate": 7.023892456792009e-07, - "loss": 0.5708, - "step": 71201 - }, - { - "epoch": 1.82, - "learning_rate": 7.023628291622445e-07, - "loss": 0.6816, - "step": 71202 - }, - { - "epoch": 1.82, - "learning_rate": 7.023364128731752e-07, - "loss": 0.667, - "step": 71203 - }, - { - "epoch": 1.82, - "learning_rate": 7.023099968120133e-07, - "loss": 0.5264, - "step": 71204 - }, - { - "epoch": 1.83, - "learning_rate": 7.02283580978779e-07, - "loss": 0.6436, - "step": 71205 - }, - { - "epoch": 1.83, - "learning_rate": 7.022571653734924e-07, - "loss": 0.595, - "step": 71206 - }, - { - "epoch": 1.83, - "learning_rate": 7.022307499961737e-07, - "loss": 0.5079, - "step": 71207 - }, - { - "epoch": 1.83, - "learning_rate": 7.022043348468433e-07, - "loss": 0.584, - "step": 71208 - }, - { - "epoch": 1.83, - "learning_rate": 7.021779199255216e-07, - "loss": 0.5234, - "step": 71209 - }, - { - "epoch": 1.83, - "learning_rate": 7.021515052322285e-07, - "loss": 0.6904, - "step": 71210 - }, - { - "epoch": 1.83, - "learning_rate": 7.02125090766984e-07, - "loss": 0.6484, - "step": 71211 - }, - { - "epoch": 1.83, - "learning_rate": 7.020986765298089e-07, - "loss": 0.5308, - "step": 71212 - }, - { - "epoch": 1.83, - "learning_rate": 7.020722625207231e-07, - "loss": 0.707, - "step": 71213 - }, - { - "epoch": 1.83, - "learning_rate": 7.020458487397467e-07, - "loss": 0.6035, - "step": 71214 - }, - { - "epoch": 1.83, - "learning_rate": 7.020194351869003e-07, - "loss": 0.6562, - "step": 71215 - }, - { - "epoch": 1.83, - "learning_rate": 7.019930218622035e-07, - "loss": 0.4878, - "step": 71216 - }, - { - "epoch": 1.83, - "learning_rate": 7.019666087656773e-07, - "loss": 0.6597, - "step": 71217 - }, - { - "epoch": 1.83, - "learning_rate": 7.019401958973414e-07, - "loss": 0.604, - "step": 71218 - }, - { - "epoch": 1.83, - "learning_rate": 7.019137832572166e-07, - "loss": 0.7021, - "step": 71219 - }, - { - "epoch": 1.83, - "learning_rate": 7.018873708453226e-07, - "loss": 0.6201, - "step": 71220 - }, - { - "epoch": 1.83, - "learning_rate": 7.018609586616793e-07, - "loss": 0.6802, - "step": 71221 - }, - { - "epoch": 1.83, - "learning_rate": 7.018345467063077e-07, - "loss": 0.5801, - "step": 71222 - }, - { - "epoch": 1.83, - "learning_rate": 7.018081349792274e-07, - "loss": 0.5596, - "step": 71223 - }, - { - "epoch": 1.83, - "learning_rate": 7.017817234804592e-07, - "loss": 0.5957, - "step": 71224 - }, - { - "epoch": 1.83, - "learning_rate": 7.017553122100227e-07, - "loss": 0.4199, - "step": 71225 - }, - { - "epoch": 1.83, - "learning_rate": 7.017289011679388e-07, - "loss": 0.54, - "step": 71226 - }, - { - "epoch": 1.83, - "learning_rate": 7.01702490354227e-07, - "loss": 0.678, - "step": 71227 - }, - { - "epoch": 1.83, - "learning_rate": 7.016760797689084e-07, - "loss": 0.6709, - "step": 71228 - }, - { - "epoch": 1.83, - "learning_rate": 7.016496694120024e-07, - "loss": 0.835, - "step": 71229 - }, - { - "epoch": 1.83, - "learning_rate": 7.016232592835296e-07, - "loss": 0.7686, - "step": 71230 - }, - { - "epoch": 1.83, - "learning_rate": 7.0159684938351e-07, - "loss": 0.5913, - "step": 71231 - }, - { - "epoch": 1.83, - "learning_rate": 7.015704397119641e-07, - "loss": 0.5073, - "step": 71232 - }, - { - "epoch": 1.83, - "learning_rate": 7.015440302689118e-07, - "loss": 0.7109, - "step": 71233 - }, - { - "epoch": 1.83, - "learning_rate": 7.015176210543738e-07, - "loss": 0.5098, - "step": 71234 - }, - { - "epoch": 1.83, - "learning_rate": 7.014912120683697e-07, - "loss": 0.6318, - "step": 71235 - }, - { - "epoch": 1.83, - "learning_rate": 7.014648033109203e-07, - "loss": 0.6445, - "step": 71236 - }, - { - "epoch": 1.83, - "learning_rate": 7.014383947820455e-07, - "loss": 0.6875, - "step": 71237 - }, - { - "epoch": 1.83, - "learning_rate": 7.014119864817658e-07, - "loss": 0.6113, - "step": 71238 - }, - { - "epoch": 1.83, - "learning_rate": 7.01385578410101e-07, - "loss": 0.7627, - "step": 71239 - }, - { - "epoch": 1.83, - "learning_rate": 7.013591705670715e-07, - "loss": 0.6509, - "step": 71240 - }, - { - "epoch": 1.83, - "learning_rate": 7.013327629526977e-07, - "loss": 0.4802, - "step": 71241 - }, - { - "epoch": 1.83, - "learning_rate": 7.013063555669993e-07, - "loss": 0.6729, - "step": 71242 - }, - { - "epoch": 1.83, - "learning_rate": 7.012799484099974e-07, - "loss": 0.7773, - "step": 71243 - }, - { - "epoch": 1.83, - "learning_rate": 7.012535414817113e-07, - "loss": 0.5537, - "step": 71244 - }, - { - "epoch": 1.83, - "learning_rate": 7.012271347821619e-07, - "loss": 0.5781, - "step": 71245 - }, - { - "epoch": 1.83, - "learning_rate": 7.012007283113689e-07, - "loss": 0.6357, - "step": 71246 - }, - { - "epoch": 1.83, - "learning_rate": 7.011743220693529e-07, - "loss": 0.4514, - "step": 71247 - }, - { - "epoch": 1.83, - "learning_rate": 7.011479160561344e-07, - "loss": 0.5918, - "step": 71248 - }, - { - "epoch": 1.83, - "learning_rate": 7.011215102717328e-07, - "loss": 0.6157, - "step": 71249 - }, - { - "epoch": 1.83, - "learning_rate": 7.010951047161687e-07, - "loss": 0.5571, - "step": 71250 - }, - { - "epoch": 1.83, - "learning_rate": 7.010686993894624e-07, - "loss": 0.4269, - "step": 71251 - }, - { - "epoch": 1.83, - "learning_rate": 7.010422942916336e-07, - "loss": 0.6584, - "step": 71252 - }, - { - "epoch": 1.83, - "learning_rate": 7.010158894227036e-07, - "loss": 0.6445, - "step": 71253 - }, - { - "epoch": 1.83, - "learning_rate": 7.009894847826916e-07, - "loss": 0.6445, - "step": 71254 - }, - { - "epoch": 1.83, - "learning_rate": 7.009630803716184e-07, - "loss": 0.4875, - "step": 71255 - }, - { - "epoch": 1.83, - "learning_rate": 7.009366761895038e-07, - "loss": 0.7017, - "step": 71256 - }, - { - "epoch": 1.83, - "learning_rate": 7.009102722363685e-07, - "loss": 0.834, - "step": 71257 - }, - { - "epoch": 1.83, - "learning_rate": 7.008838685122327e-07, - "loss": 0.8193, - "step": 71258 - }, - { - "epoch": 1.83, - "learning_rate": 7.008574650171157e-07, - "loss": 0.6616, - "step": 71259 - }, - { - "epoch": 1.83, - "learning_rate": 7.008310617510389e-07, - "loss": 0.7002, - "step": 71260 - }, - { - "epoch": 1.83, - "learning_rate": 7.008046587140218e-07, - "loss": 0.6553, - "step": 71261 - }, - { - "epoch": 1.83, - "learning_rate": 7.007782559060847e-07, - "loss": 0.6807, - "step": 71262 - }, - { - "epoch": 1.83, - "learning_rate": 7.00751853327248e-07, - "loss": 0.7285, - "step": 71263 - }, - { - "epoch": 1.83, - "learning_rate": 7.00725450977532e-07, - "loss": 0.7959, - "step": 71264 - }, - { - "epoch": 1.83, - "learning_rate": 7.006990488569564e-07, - "loss": 0.6416, - "step": 71265 - }, - { - "epoch": 1.83, - "learning_rate": 7.006726469655422e-07, - "loss": 0.6182, - "step": 71266 - }, - { - "epoch": 1.83, - "learning_rate": 7.006462453033089e-07, - "loss": 0.6475, - "step": 71267 - }, - { - "epoch": 1.83, - "learning_rate": 7.006198438702775e-07, - "loss": 0.5654, - "step": 71268 - }, - { - "epoch": 1.83, - "learning_rate": 7.005934426664673e-07, - "loss": 0.6953, - "step": 71269 - }, - { - "epoch": 1.83, - "learning_rate": 7.005670416918991e-07, - "loss": 0.5669, - "step": 71270 - }, - { - "epoch": 1.83, - "learning_rate": 7.005406409465926e-07, - "loss": 0.8037, - "step": 71271 - }, - { - "epoch": 1.83, - "learning_rate": 7.005142404305688e-07, - "loss": 0.4171, - "step": 71272 - }, - { - "epoch": 1.83, - "learning_rate": 7.00487840143847e-07, - "loss": 0.6104, - "step": 71273 - }, - { - "epoch": 1.83, - "learning_rate": 7.004614400864483e-07, - "loss": 0.6309, - "step": 71274 - }, - { - "epoch": 1.83, - "learning_rate": 7.004350402583922e-07, - "loss": 0.5942, - "step": 71275 - }, - { - "epoch": 1.83, - "learning_rate": 7.004086406596994e-07, - "loss": 0.5837, - "step": 71276 - }, - { - "epoch": 1.83, - "learning_rate": 7.003822412903898e-07, - "loss": 0.6572, - "step": 71277 - }, - { - "epoch": 1.83, - "learning_rate": 7.003558421504842e-07, - "loss": 0.5996, - "step": 71278 - }, - { - "epoch": 1.83, - "learning_rate": 7.00329443240002e-07, - "loss": 0.6602, - "step": 71279 - }, - { - "epoch": 1.83, - "learning_rate": 7.003030445589637e-07, - "loss": 0.6133, - "step": 71280 - }, - { - "epoch": 1.83, - "learning_rate": 7.002766461073897e-07, - "loss": 0.6924, - "step": 71281 - }, - { - "epoch": 1.83, - "learning_rate": 7.002502478852998e-07, - "loss": 0.7236, - "step": 71282 - }, - { - "epoch": 1.83, - "learning_rate": 7.002238498927149e-07, - "loss": 0.4683, - "step": 71283 - }, - { - "epoch": 1.83, - "learning_rate": 7.001974521296545e-07, - "loss": 0.5046, - "step": 71284 - }, - { - "epoch": 1.83, - "learning_rate": 7.001710545961394e-07, - "loss": 0.4714, - "step": 71285 - }, - { - "epoch": 1.83, - "learning_rate": 7.001446572921894e-07, - "loss": 0.5669, - "step": 71286 - }, - { - "epoch": 1.83, - "learning_rate": 7.001182602178247e-07, - "loss": 0.7656, - "step": 71287 - }, - { - "epoch": 1.83, - "learning_rate": 7.000918633730661e-07, - "loss": 0.6416, - "step": 71288 - }, - { - "epoch": 1.83, - "learning_rate": 7.000654667579332e-07, - "loss": 0.6064, - "step": 71289 - }, - { - "epoch": 1.83, - "learning_rate": 7.000390703724461e-07, - "loss": 0.582, - "step": 71290 - }, - { - "epoch": 1.83, - "learning_rate": 7.000126742166256e-07, - "loss": 0.6621, - "step": 71291 - }, - { - "epoch": 1.83, - "learning_rate": 6.999862782904913e-07, - "loss": 0.7568, - "step": 71292 - }, - { - "epoch": 1.83, - "learning_rate": 6.99959882594064e-07, - "loss": 0.627, - "step": 71293 - }, - { - "epoch": 1.83, - "learning_rate": 6.999334871273634e-07, - "loss": 0.7607, - "step": 71294 - }, - { - "epoch": 1.83, - "learning_rate": 6.9990709189041e-07, - "loss": 0.5265, - "step": 71295 - }, - { - "epoch": 1.83, - "learning_rate": 6.998806968832238e-07, - "loss": 0.7207, - "step": 71296 - }, - { - "epoch": 1.83, - "learning_rate": 6.998543021058254e-07, - "loss": 0.6299, - "step": 71297 - }, - { - "epoch": 1.83, - "learning_rate": 6.998279075582349e-07, - "loss": 0.6455, - "step": 71298 - }, - { - "epoch": 1.83, - "learning_rate": 6.998015132404721e-07, - "loss": 0.6445, - "step": 71299 - }, - { - "epoch": 1.83, - "learning_rate": 6.997751191525576e-07, - "loss": 0.416, - "step": 71300 - }, - { - "epoch": 1.83, - "learning_rate": 6.997487252945113e-07, - "loss": 0.6816, - "step": 71301 - }, - { - "epoch": 1.83, - "learning_rate": 6.997223316663539e-07, - "loss": 0.6963, - "step": 71302 - }, - { - "epoch": 1.83, - "learning_rate": 6.996959382681051e-07, - "loss": 0.5554, - "step": 71303 - }, - { - "epoch": 1.83, - "learning_rate": 6.996695450997851e-07, - "loss": 0.5681, - "step": 71304 - }, - { - "epoch": 1.83, - "learning_rate": 6.996431521614147e-07, - "loss": 0.604, - "step": 71305 - }, - { - "epoch": 1.83, - "learning_rate": 6.996167594530134e-07, - "loss": 0.6201, - "step": 71306 - }, - { - "epoch": 1.83, - "learning_rate": 6.99590366974602e-07, - "loss": 0.7451, - "step": 71307 - }, - { - "epoch": 1.83, - "learning_rate": 6.995639747262005e-07, - "loss": 0.708, - "step": 71308 - }, - { - "epoch": 1.83, - "learning_rate": 6.995375827078289e-07, - "loss": 0.7134, - "step": 71309 - }, - { - "epoch": 1.83, - "learning_rate": 6.995111909195076e-07, - "loss": 0.5872, - "step": 71310 - }, - { - "epoch": 1.83, - "learning_rate": 6.994847993612566e-07, - "loss": 0.5498, - "step": 71311 - }, - { - "epoch": 1.83, - "learning_rate": 6.994584080330965e-07, - "loss": 0.7568, - "step": 71312 - }, - { - "epoch": 1.83, - "learning_rate": 6.99432016935047e-07, - "loss": 0.6177, - "step": 71313 - }, - { - "epoch": 1.83, - "learning_rate": 6.994056260671288e-07, - "loss": 0.6758, - "step": 71314 - }, - { - "epoch": 1.83, - "learning_rate": 6.993792354293617e-07, - "loss": 0.5571, - "step": 71315 - }, - { - "epoch": 1.83, - "learning_rate": 6.993528450217663e-07, - "loss": 0.7422, - "step": 71316 - }, - { - "epoch": 1.83, - "learning_rate": 6.993264548443625e-07, - "loss": 0.6172, - "step": 71317 - }, - { - "epoch": 1.83, - "learning_rate": 6.99300064897171e-07, - "loss": 0.5469, - "step": 71318 - }, - { - "epoch": 1.83, - "learning_rate": 6.992736751802113e-07, - "loss": 0.5737, - "step": 71319 - }, - { - "epoch": 1.83, - "learning_rate": 6.992472856935039e-07, - "loss": 0.5448, - "step": 71320 - }, - { - "epoch": 1.83, - "learning_rate": 6.992208964370689e-07, - "loss": 0.6592, - "step": 71321 - }, - { - "epoch": 1.83, - "learning_rate": 6.991945074109268e-07, - "loss": 0.6187, - "step": 71322 - }, - { - "epoch": 1.83, - "learning_rate": 6.991681186150974e-07, - "loss": 0.5752, - "step": 71323 - }, - { - "epoch": 1.83, - "learning_rate": 6.991417300496014e-07, - "loss": 0.6841, - "step": 71324 - }, - { - "epoch": 1.83, - "learning_rate": 6.991153417144585e-07, - "loss": 0.5391, - "step": 71325 - }, - { - "epoch": 1.83, - "learning_rate": 6.990889536096893e-07, - "loss": 0.6753, - "step": 71326 - }, - { - "epoch": 1.83, - "learning_rate": 6.990625657353137e-07, - "loss": 0.6924, - "step": 71327 - }, - { - "epoch": 1.83, - "learning_rate": 6.990361780913527e-07, - "loss": 0.5813, - "step": 71328 - }, - { - "epoch": 1.83, - "learning_rate": 6.990097906778253e-07, - "loss": 0.6006, - "step": 71329 - }, - { - "epoch": 1.83, - "learning_rate": 6.989834034947523e-07, - "loss": 0.4529, - "step": 71330 - }, - { - "epoch": 1.83, - "learning_rate": 6.989570165421538e-07, - "loss": 0.7461, - "step": 71331 - }, - { - "epoch": 1.83, - "learning_rate": 6.989306298200501e-07, - "loss": 0.6885, - "step": 71332 - }, - { - "epoch": 1.83, - "learning_rate": 6.989042433284615e-07, - "loss": 0.7422, - "step": 71333 - }, - { - "epoch": 1.83, - "learning_rate": 6.988778570674079e-07, - "loss": 0.5369, - "step": 71334 - }, - { - "epoch": 1.83, - "learning_rate": 6.9885147103691e-07, - "loss": 0.7139, - "step": 71335 - }, - { - "epoch": 1.83, - "learning_rate": 6.988250852369872e-07, - "loss": 0.7725, - "step": 71336 - }, - { - "epoch": 1.83, - "learning_rate": 6.987986996676606e-07, - "loss": 0.5674, - "step": 71337 - }, - { - "epoch": 1.83, - "learning_rate": 6.987723143289501e-07, - "loss": 0.5283, - "step": 71338 - }, - { - "epoch": 1.83, - "learning_rate": 6.987459292208757e-07, - "loss": 0.7275, - "step": 71339 - }, - { - "epoch": 1.83, - "learning_rate": 6.987195443434574e-07, - "loss": 0.6641, - "step": 71340 - }, - { - "epoch": 1.83, - "learning_rate": 6.986931596967159e-07, - "loss": 0.5332, - "step": 71341 - }, - { - "epoch": 1.83, - "learning_rate": 6.98666775280671e-07, - "loss": 0.6548, - "step": 71342 - }, - { - "epoch": 1.83, - "learning_rate": 6.986403910953431e-07, - "loss": 0.6982, - "step": 71343 - }, - { - "epoch": 1.83, - "learning_rate": 6.986140071407525e-07, - "loss": 0.6797, - "step": 71344 - }, - { - "epoch": 1.83, - "learning_rate": 6.985876234169193e-07, - "loss": 0.6777, - "step": 71345 - }, - { - "epoch": 1.83, - "learning_rate": 6.985612399238636e-07, - "loss": 0.5759, - "step": 71346 - }, - { - "epoch": 1.83, - "learning_rate": 6.985348566616059e-07, - "loss": 0.4485, - "step": 71347 - }, - { - "epoch": 1.83, - "learning_rate": 6.985084736301662e-07, - "loss": 0.6455, - "step": 71348 - }, - { - "epoch": 1.83, - "learning_rate": 6.984820908295646e-07, - "loss": 0.5151, - "step": 71349 - }, - { - "epoch": 1.83, - "learning_rate": 6.984557082598214e-07, - "loss": 0.7109, - "step": 71350 - }, - { - "epoch": 1.83, - "learning_rate": 6.984293259209567e-07, - "loss": 0.5723, - "step": 71351 - }, - { - "epoch": 1.83, - "learning_rate": 6.98402943812991e-07, - "loss": 0.5381, - "step": 71352 - }, - { - "epoch": 1.83, - "learning_rate": 6.98376561935944e-07, - "loss": 0.6064, - "step": 71353 - }, - { - "epoch": 1.83, - "learning_rate": 6.983501802898365e-07, - "loss": 0.6016, - "step": 71354 - }, - { - "epoch": 1.83, - "learning_rate": 6.983237988746881e-07, - "loss": 0.6953, - "step": 71355 - }, - { - "epoch": 1.83, - "learning_rate": 6.982974176905197e-07, - "loss": 0.7036, - "step": 71356 - }, - { - "epoch": 1.83, - "learning_rate": 6.982710367373506e-07, - "loss": 0.4917, - "step": 71357 - }, - { - "epoch": 1.83, - "learning_rate": 6.982446560152022e-07, - "loss": 0.6615, - "step": 71358 - }, - { - "epoch": 1.83, - "learning_rate": 6.982182755240935e-07, - "loss": 0.6558, - "step": 71359 - }, - { - "epoch": 1.83, - "learning_rate": 6.981918952640453e-07, - "loss": 0.5249, - "step": 71360 - }, - { - "epoch": 1.83, - "learning_rate": 6.981655152350776e-07, - "loss": 0.6631, - "step": 71361 - }, - { - "epoch": 1.83, - "learning_rate": 6.981391354372107e-07, - "loss": 0.8154, - "step": 71362 - }, - { - "epoch": 1.83, - "learning_rate": 6.981127558704647e-07, - "loss": 0.7227, - "step": 71363 - }, - { - "epoch": 1.83, - "learning_rate": 6.980863765348602e-07, - "loss": 0.5018, - "step": 71364 - }, - { - "epoch": 1.83, - "learning_rate": 6.980599974304167e-07, - "loss": 0.6514, - "step": 71365 - }, - { - "epoch": 1.83, - "learning_rate": 6.980336185571549e-07, - "loss": 0.6519, - "step": 71366 - }, - { - "epoch": 1.83, - "learning_rate": 6.980072399150948e-07, - "loss": 0.6514, - "step": 71367 - }, - { - "epoch": 1.83, - "learning_rate": 6.979808615042571e-07, - "loss": 0.7549, - "step": 71368 - }, - { - "epoch": 1.83, - "learning_rate": 6.979544833246614e-07, - "loss": 0.8271, - "step": 71369 - }, - { - "epoch": 1.83, - "learning_rate": 6.979281053763278e-07, - "loss": 0.6226, - "step": 71370 - }, - { - "epoch": 1.83, - "learning_rate": 6.979017276592768e-07, - "loss": 0.5044, - "step": 71371 - }, - { - "epoch": 1.83, - "learning_rate": 6.978753501735285e-07, - "loss": 0.5356, - "step": 71372 - }, - { - "epoch": 1.83, - "learning_rate": 6.978489729191034e-07, - "loss": 0.6592, - "step": 71373 - }, - { - "epoch": 1.83, - "learning_rate": 6.978225958960211e-07, - "loss": 0.7285, - "step": 71374 - }, - { - "epoch": 1.83, - "learning_rate": 6.977962191043025e-07, - "loss": 0.6094, - "step": 71375 - }, - { - "epoch": 1.83, - "learning_rate": 6.977698425439674e-07, - "loss": 0.6201, - "step": 71376 - }, - { - "epoch": 1.83, - "learning_rate": 6.977434662150359e-07, - "loss": 0.7158, - "step": 71377 - }, - { - "epoch": 1.83, - "learning_rate": 6.977170901175286e-07, - "loss": 0.5798, - "step": 71378 - }, - { - "epoch": 1.83, - "learning_rate": 6.976907142514652e-07, - "loss": 0.7598, - "step": 71379 - }, - { - "epoch": 1.83, - "learning_rate": 6.976643386168662e-07, - "loss": 0.5527, - "step": 71380 - }, - { - "epoch": 1.83, - "learning_rate": 6.976379632137516e-07, - "loss": 0.7705, - "step": 71381 - }, - { - "epoch": 1.83, - "learning_rate": 6.976115880421416e-07, - "loss": 0.5798, - "step": 71382 - }, - { - "epoch": 1.83, - "learning_rate": 6.975852131020567e-07, - "loss": 0.6597, - "step": 71383 - }, - { - "epoch": 1.83, - "learning_rate": 6.975588383935167e-07, - "loss": 0.7412, - "step": 71384 - }, - { - "epoch": 1.83, - "learning_rate": 6.975324639165423e-07, - "loss": 0.6724, - "step": 71385 - }, - { - "epoch": 1.83, - "learning_rate": 6.975060896711531e-07, - "loss": 0.6416, - "step": 71386 - }, - { - "epoch": 1.83, - "learning_rate": 6.974797156573698e-07, - "loss": 0.5464, - "step": 71387 - }, - { - "epoch": 1.83, - "learning_rate": 6.974533418752124e-07, - "loss": 0.6602, - "step": 71388 - }, - { - "epoch": 1.83, - "learning_rate": 6.97426968324701e-07, - "loss": 0.4913, - "step": 71389 - }, - { - "epoch": 1.83, - "learning_rate": 6.974005950058557e-07, - "loss": 0.8086, - "step": 71390 - }, - { - "epoch": 1.83, - "learning_rate": 6.973742219186969e-07, - "loss": 0.8945, - "step": 71391 - }, - { - "epoch": 1.83, - "learning_rate": 6.973478490632447e-07, - "loss": 0.5349, - "step": 71392 - }, - { - "epoch": 1.83, - "learning_rate": 6.973214764395196e-07, - "loss": 0.4771, - "step": 71393 - }, - { - "epoch": 1.83, - "learning_rate": 6.972951040475412e-07, - "loss": 0.5471, - "step": 71394 - }, - { - "epoch": 1.83, - "learning_rate": 6.972687318873303e-07, - "loss": 0.6045, - "step": 71395 - }, - { - "epoch": 1.83, - "learning_rate": 6.972423599589066e-07, - "loss": 0.6426, - "step": 71396 - }, - { - "epoch": 1.83, - "learning_rate": 6.972159882622906e-07, - "loss": 0.4121, - "step": 71397 - }, - { - "epoch": 1.83, - "learning_rate": 6.971896167975027e-07, - "loss": 0.5854, - "step": 71398 - }, - { - "epoch": 1.83, - "learning_rate": 6.971632455645623e-07, - "loss": 0.7295, - "step": 71399 - }, - { - "epoch": 1.83, - "learning_rate": 6.971368745634903e-07, - "loss": 0.4087, - "step": 71400 - }, - { - "epoch": 1.83, - "learning_rate": 6.971105037943065e-07, - "loss": 0.7363, - "step": 71401 - }, - { - "epoch": 1.83, - "learning_rate": 6.970841332570314e-07, - "loss": 0.7383, - "step": 71402 - }, - { - "epoch": 1.83, - "learning_rate": 6.97057762951685e-07, - "loss": 0.6533, - "step": 71403 - }, - { - "epoch": 1.83, - "learning_rate": 6.970313928782876e-07, - "loss": 0.5723, - "step": 71404 - }, - { - "epoch": 1.83, - "learning_rate": 6.970050230368591e-07, - "loss": 0.6885, - "step": 71405 - }, - { - "epoch": 1.83, - "learning_rate": 6.969786534274203e-07, - "loss": 0.7246, - "step": 71406 - }, - { - "epoch": 1.83, - "learning_rate": 6.969522840499906e-07, - "loss": 0.7588, - "step": 71407 - }, - { - "epoch": 1.83, - "learning_rate": 6.969259149045912e-07, - "loss": 0.7896, - "step": 71408 - }, - { - "epoch": 1.83, - "learning_rate": 6.968995459912415e-07, - "loss": 0.707, - "step": 71409 - }, - { - "epoch": 1.83, - "learning_rate": 6.968731773099616e-07, - "loss": 0.5547, - "step": 71410 - }, - { - "epoch": 1.83, - "learning_rate": 6.968468088607719e-07, - "loss": 0.5688, - "step": 71411 - }, - { - "epoch": 1.83, - "learning_rate": 6.96820440643693e-07, - "loss": 0.6531, - "step": 71412 - }, - { - "epoch": 1.83, - "learning_rate": 6.967940726587444e-07, - "loss": 0.5796, - "step": 71413 - }, - { - "epoch": 1.83, - "learning_rate": 6.967677049059469e-07, - "loss": 0.6699, - "step": 71414 - }, - { - "epoch": 1.83, - "learning_rate": 6.967413373853202e-07, - "loss": 0.5527, - "step": 71415 - }, - { - "epoch": 1.83, - "learning_rate": 6.96714970096885e-07, - "loss": 0.6243, - "step": 71416 - }, - { - "epoch": 1.83, - "learning_rate": 6.966886030406609e-07, - "loss": 0.5439, - "step": 71417 - }, - { - "epoch": 1.83, - "learning_rate": 6.966622362166689e-07, - "loss": 0.6553, - "step": 71418 - }, - { - "epoch": 1.83, - "learning_rate": 6.966358696249283e-07, - "loss": 0.8652, - "step": 71419 - }, - { - "epoch": 1.83, - "learning_rate": 6.966095032654597e-07, - "loss": 0.5864, - "step": 71420 - }, - { - "epoch": 1.83, - "learning_rate": 6.965831371382833e-07, - "loss": 0.7119, - "step": 71421 - }, - { - "epoch": 1.83, - "learning_rate": 6.965567712434191e-07, - "loss": 0.707, - "step": 71422 - }, - { - "epoch": 1.83, - "learning_rate": 6.965304055808876e-07, - "loss": 0.6807, - "step": 71423 - }, - { - "epoch": 1.83, - "learning_rate": 6.965040401507085e-07, - "loss": 0.541, - "step": 71424 - }, - { - "epoch": 1.83, - "learning_rate": 6.964776749529027e-07, - "loss": 0.7363, - "step": 71425 - }, - { - "epoch": 1.83, - "learning_rate": 6.964513099874895e-07, - "loss": 0.509, - "step": 71426 - }, - { - "epoch": 1.83, - "learning_rate": 6.964249452544902e-07, - "loss": 0.7207, - "step": 71427 - }, - { - "epoch": 1.83, - "learning_rate": 6.963985807539242e-07, - "loss": 0.6855, - "step": 71428 - }, - { - "epoch": 1.83, - "learning_rate": 6.963722164858117e-07, - "loss": 0.5127, - "step": 71429 - }, - { - "epoch": 1.83, - "learning_rate": 6.963458524501731e-07, - "loss": 0.525, - "step": 71430 - }, - { - "epoch": 1.83, - "learning_rate": 6.963194886470285e-07, - "loss": 0.5015, - "step": 71431 - }, - { - "epoch": 1.83, - "learning_rate": 6.962931250763979e-07, - "loss": 0.3411, - "step": 71432 - }, - { - "epoch": 1.83, - "learning_rate": 6.962667617383019e-07, - "loss": 0.7471, - "step": 71433 - }, - { - "epoch": 1.83, - "learning_rate": 6.962403986327603e-07, - "loss": 0.6895, - "step": 71434 - }, - { - "epoch": 1.83, - "learning_rate": 6.962140357597936e-07, - "loss": 0.6211, - "step": 71435 - }, - { - "epoch": 1.83, - "learning_rate": 6.961876731194218e-07, - "loss": 0.5928, - "step": 71436 - }, - { - "epoch": 1.83, - "learning_rate": 6.961613107116652e-07, - "loss": 0.5063, - "step": 71437 - }, - { - "epoch": 1.83, - "learning_rate": 6.96134948536544e-07, - "loss": 0.5654, - "step": 71438 - }, - { - "epoch": 1.83, - "learning_rate": 6.961085865940781e-07, - "loss": 0.7637, - "step": 71439 - }, - { - "epoch": 1.83, - "learning_rate": 6.960822248842881e-07, - "loss": 0.6328, - "step": 71440 - }, - { - "epoch": 1.83, - "learning_rate": 6.960558634071936e-07, - "loss": 0.6074, - "step": 71441 - }, - { - "epoch": 1.83, - "learning_rate": 6.960295021628156e-07, - "loss": 0.4888, - "step": 71442 - }, - { - "epoch": 1.83, - "learning_rate": 6.960031411511733e-07, - "loss": 0.6089, - "step": 71443 - }, - { - "epoch": 1.83, - "learning_rate": 6.959767803722878e-07, - "loss": 0.5073, - "step": 71444 - }, - { - "epoch": 1.83, - "learning_rate": 6.959504198261787e-07, - "loss": 0.6553, - "step": 71445 - }, - { - "epoch": 1.83, - "learning_rate": 6.959240595128666e-07, - "loss": 0.6067, - "step": 71446 - }, - { - "epoch": 1.83, - "learning_rate": 6.958976994323712e-07, - "loss": 0.7148, - "step": 71447 - }, - { - "epoch": 1.83, - "learning_rate": 6.958713395847136e-07, - "loss": 0.5781, - "step": 71448 - }, - { - "epoch": 1.83, - "learning_rate": 6.958449799699126e-07, - "loss": 0.5049, - "step": 71449 - }, - { - "epoch": 1.83, - "learning_rate": 6.958186205879896e-07, - "loss": 0.5991, - "step": 71450 - }, - { - "epoch": 1.83, - "learning_rate": 6.957922614389639e-07, - "loss": 0.7754, - "step": 71451 - }, - { - "epoch": 1.83, - "learning_rate": 6.957659025228562e-07, - "loss": 0.5334, - "step": 71452 - }, - { - "epoch": 1.83, - "learning_rate": 6.957395438396865e-07, - "loss": 0.6377, - "step": 71453 - }, - { - "epoch": 1.83, - "learning_rate": 6.957131853894752e-07, - "loss": 0.8252, - "step": 71454 - }, - { - "epoch": 1.83, - "learning_rate": 6.956868271722422e-07, - "loss": 0.5801, - "step": 71455 - }, - { - "epoch": 1.83, - "learning_rate": 6.956604691880079e-07, - "loss": 0.623, - "step": 71456 - }, - { - "epoch": 1.83, - "learning_rate": 6.956341114367922e-07, - "loss": 0.5877, - "step": 71457 - }, - { - "epoch": 1.83, - "learning_rate": 6.956077539186158e-07, - "loss": 0.6865, - "step": 71458 - }, - { - "epoch": 1.83, - "learning_rate": 6.955813966334985e-07, - "loss": 0.4045, - "step": 71459 - }, - { - "epoch": 1.83, - "learning_rate": 6.955550395814602e-07, - "loss": 0.624, - "step": 71460 - }, - { - "epoch": 1.83, - "learning_rate": 6.955286827625217e-07, - "loss": 0.7861, - "step": 71461 - }, - { - "epoch": 1.83, - "learning_rate": 6.955023261767026e-07, - "loss": 0.668, - "step": 71462 - }, - { - "epoch": 1.83, - "learning_rate": 6.954759698240236e-07, - "loss": 0.7422, - "step": 71463 - }, - { - "epoch": 1.83, - "learning_rate": 6.954496137045045e-07, - "loss": 0.5449, - "step": 71464 - }, - { - "epoch": 1.83, - "learning_rate": 6.954232578181658e-07, - "loss": 0.7314, - "step": 71465 - }, - { - "epoch": 1.83, - "learning_rate": 6.953969021650275e-07, - "loss": 0.8271, - "step": 71466 - }, - { - "epoch": 1.83, - "learning_rate": 6.953705467451096e-07, - "loss": 0.5117, - "step": 71467 - }, - { - "epoch": 1.83, - "learning_rate": 6.953441915584329e-07, - "loss": 0.6099, - "step": 71468 - }, - { - "epoch": 1.83, - "learning_rate": 6.953178366050168e-07, - "loss": 0.6216, - "step": 71469 - }, - { - "epoch": 1.83, - "learning_rate": 6.952914818848817e-07, - "loss": 0.6182, - "step": 71470 - }, - { - "epoch": 1.83, - "learning_rate": 6.952651273980481e-07, - "loss": 0.5728, - "step": 71471 - }, - { - "epoch": 1.83, - "learning_rate": 6.95238773144536e-07, - "loss": 0.7021, - "step": 71472 - }, - { - "epoch": 1.83, - "learning_rate": 6.952124191243654e-07, - "loss": 0.7832, - "step": 71473 - }, - { - "epoch": 1.83, - "learning_rate": 6.951860653375565e-07, - "loss": 0.6099, - "step": 71474 - }, - { - "epoch": 1.83, - "learning_rate": 6.951597117841301e-07, - "loss": 0.4258, - "step": 71475 - }, - { - "epoch": 1.83, - "learning_rate": 6.951333584641055e-07, - "loss": 0.6538, - "step": 71476 - }, - { - "epoch": 1.83, - "learning_rate": 6.951070053775034e-07, - "loss": 0.5435, - "step": 71477 - }, - { - "epoch": 1.83, - "learning_rate": 6.950806525243441e-07, - "loss": 0.5645, - "step": 71478 - }, - { - "epoch": 1.83, - "learning_rate": 6.950542999046471e-07, - "loss": 0.4731, - "step": 71479 - }, - { - "epoch": 1.83, - "learning_rate": 6.950279475184333e-07, - "loss": 0.5698, - "step": 71480 - }, - { - "epoch": 1.83, - "learning_rate": 6.950015953657222e-07, - "loss": 0.6455, - "step": 71481 - }, - { - "epoch": 1.83, - "learning_rate": 6.949752434465348e-07, - "loss": 0.6357, - "step": 71482 - }, - { - "epoch": 1.83, - "learning_rate": 6.949488917608907e-07, - "loss": 0.5786, - "step": 71483 - }, - { - "epoch": 1.83, - "learning_rate": 6.949225403088099e-07, - "loss": 0.5737, - "step": 71484 - }, - { - "epoch": 1.83, - "learning_rate": 6.948961890903132e-07, - "loss": 0.6738, - "step": 71485 - }, - { - "epoch": 1.83, - "learning_rate": 6.948698381054203e-07, - "loss": 0.5625, - "step": 71486 - }, - { - "epoch": 1.83, - "learning_rate": 6.948434873541517e-07, - "loss": 0.5449, - "step": 71487 - }, - { - "epoch": 1.83, - "learning_rate": 6.948171368365275e-07, - "loss": 0.6494, - "step": 71488 - }, - { - "epoch": 1.83, - "learning_rate": 6.947907865525675e-07, - "loss": 0.6328, - "step": 71489 - }, - { - "epoch": 1.83, - "learning_rate": 6.947644365022924e-07, - "loss": 0.5889, - "step": 71490 - }, - { - "epoch": 1.83, - "learning_rate": 6.947380866857219e-07, - "loss": 0.4119, - "step": 71491 - }, - { - "epoch": 1.83, - "learning_rate": 6.947117371028766e-07, - "loss": 0.7432, - "step": 71492 - }, - { - "epoch": 1.83, - "learning_rate": 6.946853877537761e-07, - "loss": 0.6553, - "step": 71493 - }, - { - "epoch": 1.83, - "learning_rate": 6.946590386384414e-07, - "loss": 0.5332, - "step": 71494 - }, - { - "epoch": 1.83, - "learning_rate": 6.946326897568919e-07, - "loss": 0.7832, - "step": 71495 - }, - { - "epoch": 1.83, - "learning_rate": 6.946063411091485e-07, - "loss": 0.6274, - "step": 71496 - }, - { - "epoch": 1.83, - "learning_rate": 6.945799926952306e-07, - "loss": 0.5757, - "step": 71497 - }, - { - "epoch": 1.83, - "learning_rate": 6.945536445151592e-07, - "loss": 0.5859, - "step": 71498 - }, - { - "epoch": 1.83, - "learning_rate": 6.945272965689539e-07, - "loss": 0.5925, - "step": 71499 - }, - { - "epoch": 1.83, - "learning_rate": 6.945009488566349e-07, - "loss": 0.6316, - "step": 71500 - }, - { - "epoch": 1.83, - "learning_rate": 6.944746013782223e-07, - "loss": 0.7383, - "step": 71501 - }, - { - "epoch": 1.83, - "learning_rate": 6.944482541337366e-07, - "loss": 0.5508, - "step": 71502 - }, - { - "epoch": 1.83, - "learning_rate": 6.944219071231978e-07, - "loss": 0.7725, - "step": 71503 - }, - { - "epoch": 1.83, - "learning_rate": 6.943955603466263e-07, - "loss": 0.6885, - "step": 71504 - }, - { - "epoch": 1.83, - "learning_rate": 6.943692138040416e-07, - "loss": 0.6519, - "step": 71505 - }, - { - "epoch": 1.83, - "learning_rate": 6.943428674954648e-07, - "loss": 0.5635, - "step": 71506 - }, - { - "epoch": 1.83, - "learning_rate": 6.943165214209152e-07, - "loss": 0.4011, - "step": 71507 - }, - { - "epoch": 1.83, - "learning_rate": 6.942901755804139e-07, - "loss": 0.7314, - "step": 71508 - }, - { - "epoch": 1.83, - "learning_rate": 6.942638299739804e-07, - "loss": 0.5334, - "step": 71509 - }, - { - "epoch": 1.83, - "learning_rate": 6.942374846016348e-07, - "loss": 0.79, - "step": 71510 - }, - { - "epoch": 1.83, - "learning_rate": 6.942111394633976e-07, - "loss": 0.7222, - "step": 71511 - }, - { - "epoch": 1.83, - "learning_rate": 6.941847945592887e-07, - "loss": 0.7295, - "step": 71512 - }, - { - "epoch": 1.83, - "learning_rate": 6.941584498893287e-07, - "loss": 0.5952, - "step": 71513 - }, - { - "epoch": 1.83, - "learning_rate": 6.941321054535374e-07, - "loss": 0.4471, - "step": 71514 - }, - { - "epoch": 1.83, - "learning_rate": 6.941057612519351e-07, - "loss": 0.7178, - "step": 71515 - }, - { - "epoch": 1.83, - "learning_rate": 6.940794172845419e-07, - "loss": 0.5361, - "step": 71516 - }, - { - "epoch": 1.83, - "learning_rate": 6.940530735513783e-07, - "loss": 0.7383, - "step": 71517 - }, - { - "epoch": 1.83, - "learning_rate": 6.940267300524641e-07, - "loss": 0.606, - "step": 71518 - }, - { - "epoch": 1.83, - "learning_rate": 6.940003867878195e-07, - "loss": 0.55, - "step": 71519 - }, - { - "epoch": 1.83, - "learning_rate": 6.939740437574645e-07, - "loss": 0.6479, - "step": 71520 - }, - { - "epoch": 1.83, - "learning_rate": 6.939477009614197e-07, - "loss": 0.707, - "step": 71521 - }, - { - "epoch": 1.83, - "learning_rate": 6.93921358399705e-07, - "loss": 0.7188, - "step": 71522 - }, - { - "epoch": 1.83, - "learning_rate": 6.938950160723407e-07, - "loss": 0.5732, - "step": 71523 - }, - { - "epoch": 1.83, - "learning_rate": 6.938686739793468e-07, - "loss": 0.522, - "step": 71524 - }, - { - "epoch": 1.83, - "learning_rate": 6.938423321207439e-07, - "loss": 0.5759, - "step": 71525 - }, - { - "epoch": 1.83, - "learning_rate": 6.938159904965514e-07, - "loss": 0.709, - "step": 71526 - }, - { - "epoch": 1.83, - "learning_rate": 6.937896491067904e-07, - "loss": 0.6816, - "step": 71527 - }, - { - "epoch": 1.83, - "learning_rate": 6.937633079514804e-07, - "loss": 0.5195, - "step": 71528 - }, - { - "epoch": 1.83, - "learning_rate": 6.937369670306416e-07, - "loss": 0.6499, - "step": 71529 - }, - { - "epoch": 1.83, - "learning_rate": 6.937106263442945e-07, - "loss": 0.7803, - "step": 71530 - }, - { - "epoch": 1.83, - "learning_rate": 6.936842858924588e-07, - "loss": 0.5146, - "step": 71531 - }, - { - "epoch": 1.83, - "learning_rate": 6.936579456751552e-07, - "loss": 0.6982, - "step": 71532 - }, - { - "epoch": 1.83, - "learning_rate": 6.936316056924034e-07, - "loss": 0.6245, - "step": 71533 - }, - { - "epoch": 1.83, - "learning_rate": 6.936052659442242e-07, - "loss": 0.5984, - "step": 71534 - }, - { - "epoch": 1.83, - "learning_rate": 6.935789264306369e-07, - "loss": 0.6416, - "step": 71535 - }, - { - "epoch": 1.83, - "learning_rate": 6.935525871516625e-07, - "loss": 0.5127, - "step": 71536 - }, - { - "epoch": 1.83, - "learning_rate": 6.93526248107321e-07, - "loss": 0.5322, - "step": 71537 - }, - { - "epoch": 1.83, - "learning_rate": 6.934999092976319e-07, - "loss": 0.6709, - "step": 71538 - }, - { - "epoch": 1.83, - "learning_rate": 6.934735707226159e-07, - "loss": 0.5894, - "step": 71539 - }, - { - "epoch": 1.83, - "learning_rate": 6.934472323822932e-07, - "loss": 0.582, - "step": 71540 - }, - { - "epoch": 1.83, - "learning_rate": 6.934208942766837e-07, - "loss": 0.6797, - "step": 71541 - }, - { - "epoch": 1.83, - "learning_rate": 6.933945564058079e-07, - "loss": 0.6289, - "step": 71542 - }, - { - "epoch": 1.83, - "learning_rate": 6.933682187696855e-07, - "loss": 0.6289, - "step": 71543 - }, - { - "epoch": 1.83, - "learning_rate": 6.933418813683372e-07, - "loss": 0.8223, - "step": 71544 - }, - { - "epoch": 1.83, - "learning_rate": 6.933155442017829e-07, - "loss": 0.6191, - "step": 71545 - }, - { - "epoch": 1.83, - "learning_rate": 6.932892072700427e-07, - "loss": 0.5466, - "step": 71546 - }, - { - "epoch": 1.83, - "learning_rate": 6.932628705731373e-07, - "loss": 0.5249, - "step": 71547 - }, - { - "epoch": 1.83, - "learning_rate": 6.932365341110859e-07, - "loss": 0.7681, - "step": 71548 - }, - { - "epoch": 1.83, - "learning_rate": 6.932101978839093e-07, - "loss": 0.7891, - "step": 71549 - }, - { - "epoch": 1.83, - "learning_rate": 6.931838618916274e-07, - "loss": 0.5884, - "step": 71550 - }, - { - "epoch": 1.83, - "learning_rate": 6.931575261342608e-07, - "loss": 0.7783, - "step": 71551 - }, - { - "epoch": 1.83, - "learning_rate": 6.931311906118291e-07, - "loss": 0.3604, - "step": 71552 - }, - { - "epoch": 1.83, - "learning_rate": 6.931048553243531e-07, - "loss": 0.8389, - "step": 71553 - }, - { - "epoch": 1.83, - "learning_rate": 6.930785202718521e-07, - "loss": 0.6025, - "step": 71554 - }, - { - "epoch": 1.83, - "learning_rate": 6.930521854543472e-07, - "loss": 0.5591, - "step": 71555 - }, - { - "epoch": 1.83, - "learning_rate": 6.93025850871858e-07, - "loss": 0.6968, - "step": 71556 - }, - { - "epoch": 1.83, - "learning_rate": 6.92999516524405e-07, - "loss": 0.6133, - "step": 71557 - }, - { - "epoch": 1.83, - "learning_rate": 6.929731824120077e-07, - "loss": 0.5728, - "step": 71558 - }, - { - "epoch": 1.83, - "learning_rate": 6.929468485346871e-07, - "loss": 0.4868, - "step": 71559 - }, - { - "epoch": 1.83, - "learning_rate": 6.929205148924628e-07, - "loss": 0.5635, - "step": 71560 - }, - { - "epoch": 1.83, - "learning_rate": 6.928941814853551e-07, - "loss": 0.5298, - "step": 71561 - }, - { - "epoch": 1.83, - "learning_rate": 6.928678483133842e-07, - "loss": 0.6196, - "step": 71562 - }, - { - "epoch": 1.83, - "learning_rate": 6.928415153765703e-07, - "loss": 0.4097, - "step": 71563 - }, - { - "epoch": 1.83, - "learning_rate": 6.928151826749335e-07, - "loss": 0.6797, - "step": 71564 - }, - { - "epoch": 1.83, - "learning_rate": 6.92788850208494e-07, - "loss": 0.5328, - "step": 71565 - }, - { - "epoch": 1.83, - "learning_rate": 6.92762517977272e-07, - "loss": 0.6055, - "step": 71566 - }, - { - "epoch": 1.83, - "learning_rate": 6.927361859812879e-07, - "loss": 0.6177, - "step": 71567 - }, - { - "epoch": 1.83, - "learning_rate": 6.927098542205614e-07, - "loss": 0.7095, - "step": 71568 - }, - { - "epoch": 1.83, - "learning_rate": 6.926835226951124e-07, - "loss": 0.6533, - "step": 71569 - }, - { - "epoch": 1.83, - "learning_rate": 6.926571914049619e-07, - "loss": 0.7354, - "step": 71570 - }, - { - "epoch": 1.83, - "learning_rate": 6.926308603501295e-07, - "loss": 0.6309, - "step": 71571 - }, - { - "epoch": 1.83, - "learning_rate": 6.926045295306357e-07, - "loss": 0.4572, - "step": 71572 - }, - { - "epoch": 1.83, - "learning_rate": 6.925781989465005e-07, - "loss": 0.7354, - "step": 71573 - }, - { - "epoch": 1.83, - "learning_rate": 6.925518685977436e-07, - "loss": 0.624, - "step": 71574 - }, - { - "epoch": 1.83, - "learning_rate": 6.92525538484386e-07, - "loss": 0.5889, - "step": 71575 - }, - { - "epoch": 1.83, - "learning_rate": 6.924992086064472e-07, - "loss": 0.6377, - "step": 71576 - }, - { - "epoch": 1.83, - "learning_rate": 6.924728789639481e-07, - "loss": 0.6904, - "step": 71577 - }, - { - "epoch": 1.83, - "learning_rate": 6.924465495569082e-07, - "loss": 0.6396, - "step": 71578 - }, - { - "epoch": 1.83, - "learning_rate": 6.924202203853475e-07, - "loss": 0.6216, - "step": 71579 - }, - { - "epoch": 1.83, - "learning_rate": 6.923938914492868e-07, - "loss": 0.4771, - "step": 71580 - }, - { - "epoch": 1.83, - "learning_rate": 6.923675627487457e-07, - "loss": 0.7432, - "step": 71581 - }, - { - "epoch": 1.83, - "learning_rate": 6.923412342837448e-07, - "loss": 0.7227, - "step": 71582 - }, - { - "epoch": 1.83, - "learning_rate": 6.923149060543039e-07, - "loss": 0.6963, - "step": 71583 - }, - { - "epoch": 1.83, - "learning_rate": 6.922885780604435e-07, - "loss": 0.5908, - "step": 71584 - }, - { - "epoch": 1.83, - "learning_rate": 6.922622503021833e-07, - "loss": 0.4656, - "step": 71585 - }, - { - "epoch": 1.83, - "learning_rate": 6.922359227795441e-07, - "loss": 0.6636, - "step": 71586 - }, - { - "epoch": 1.83, - "learning_rate": 6.922095954925458e-07, - "loss": 0.4858, - "step": 71587 - }, - { - "epoch": 1.83, - "learning_rate": 6.921832684412081e-07, - "loss": 0.5476, - "step": 71588 - }, - { - "epoch": 1.83, - "learning_rate": 6.921569416255518e-07, - "loss": 0.4795, - "step": 71589 - }, - { - "epoch": 1.83, - "learning_rate": 6.921306150455967e-07, - "loss": 0.5212, - "step": 71590 - }, - { - "epoch": 1.83, - "learning_rate": 6.921042887013629e-07, - "loss": 0.6777, - "step": 71591 - }, - { - "epoch": 1.83, - "learning_rate": 6.920779625928708e-07, - "loss": 0.5881, - "step": 71592 - }, - { - "epoch": 1.83, - "learning_rate": 6.920516367201402e-07, - "loss": 0.5957, - "step": 71593 - }, - { - "epoch": 1.83, - "learning_rate": 6.920253110831917e-07, - "loss": 0.6675, - "step": 71594 - }, - { - "epoch": 1.84, - "learning_rate": 6.919989856820451e-07, - "loss": 0.6709, - "step": 71595 - }, - { - "epoch": 1.84, - "learning_rate": 6.91972660516721e-07, - "loss": 0.6777, - "step": 71596 - }, - { - "epoch": 1.84, - "learning_rate": 6.919463355872395e-07, - "loss": 0.6738, - "step": 71597 - }, - { - "epoch": 1.84, - "learning_rate": 6.9192001089362e-07, - "loss": 0.7354, - "step": 71598 - }, - { - "epoch": 1.84, - "learning_rate": 6.918936864358835e-07, - "loss": 0.4158, - "step": 71599 - }, - { - "epoch": 1.84, - "learning_rate": 6.918673622140495e-07, - "loss": 0.6177, - "step": 71600 - }, - { - "epoch": 1.84, - "learning_rate": 6.918410382281388e-07, - "loss": 0.5645, - "step": 71601 - }, - { - "epoch": 1.84, - "learning_rate": 6.91814714478171e-07, - "loss": 0.7275, - "step": 71602 - }, - { - "epoch": 1.84, - "learning_rate": 6.917883909641666e-07, - "loss": 0.6572, - "step": 71603 - }, - { - "epoch": 1.84, - "learning_rate": 6.917620676861455e-07, - "loss": 0.3787, - "step": 71604 - }, - { - "epoch": 1.84, - "learning_rate": 6.917357446441284e-07, - "loss": 0.6123, - "step": 71605 - }, - { - "epoch": 1.84, - "learning_rate": 6.917094218381347e-07, - "loss": 0.543, - "step": 71606 - }, - { - "epoch": 1.84, - "learning_rate": 6.916830992681853e-07, - "loss": 0.4561, - "step": 71607 - }, - { - "epoch": 1.84, - "learning_rate": 6.916567769342999e-07, - "loss": 0.6709, - "step": 71608 - }, - { - "epoch": 1.84, - "learning_rate": 6.916304548364986e-07, - "loss": 0.5474, - "step": 71609 - }, - { - "epoch": 1.84, - "learning_rate": 6.916041329748015e-07, - "loss": 0.5332, - "step": 71610 - }, - { - "epoch": 1.84, - "learning_rate": 6.915778113492292e-07, - "loss": 0.5737, - "step": 71611 - }, - { - "epoch": 1.84, - "learning_rate": 6.915514899598014e-07, - "loss": 0.6963, - "step": 71612 - }, - { - "epoch": 1.84, - "learning_rate": 6.915251688065386e-07, - "loss": 0.4854, - "step": 71613 - }, - { - "epoch": 1.84, - "learning_rate": 6.914988478894605e-07, - "loss": 0.5706, - "step": 71614 - }, - { - "epoch": 1.84, - "learning_rate": 6.914725272085879e-07, - "loss": 0.5176, - "step": 71615 - }, - { - "epoch": 1.84, - "learning_rate": 6.914462067639404e-07, - "loss": 0.6943, - "step": 71616 - }, - { - "epoch": 1.84, - "learning_rate": 6.914198865555387e-07, - "loss": 0.6045, - "step": 71617 - }, - { - "epoch": 1.84, - "learning_rate": 6.913935665834024e-07, - "loss": 0.605, - "step": 71618 - }, - { - "epoch": 1.84, - "learning_rate": 6.913672468475517e-07, - "loss": 0.7373, - "step": 71619 - }, - { - "epoch": 1.84, - "learning_rate": 6.913409273480071e-07, - "loss": 0.6484, - "step": 71620 - }, - { - "epoch": 1.84, - "learning_rate": 6.913146080847882e-07, - "loss": 0.667, - "step": 71621 - }, - { - "epoch": 1.84, - "learning_rate": 6.912882890579159e-07, - "loss": 0.5913, - "step": 71622 - }, - { - "epoch": 1.84, - "learning_rate": 6.912619702674096e-07, - "loss": 0.834, - "step": 71623 - }, - { - "epoch": 1.84, - "learning_rate": 6.912356517132902e-07, - "loss": 0.5532, - "step": 71624 - }, - { - "epoch": 1.84, - "learning_rate": 6.912093333955771e-07, - "loss": 0.6729, - "step": 71625 - }, - { - "epoch": 1.84, - "learning_rate": 6.911830153142911e-07, - "loss": 0.6821, - "step": 71626 - }, - { - "epoch": 1.84, - "learning_rate": 6.911566974694522e-07, - "loss": 0.5322, - "step": 71627 - }, - { - "epoch": 1.84, - "learning_rate": 6.911303798610804e-07, - "loss": 0.6489, - "step": 71628 - }, - { - "epoch": 1.84, - "learning_rate": 6.911040624891955e-07, - "loss": 0.6426, - "step": 71629 - }, - { - "epoch": 1.84, - "learning_rate": 6.910777453538183e-07, - "loss": 0.6514, - "step": 71630 - }, - { - "epoch": 1.84, - "learning_rate": 6.910514284549683e-07, - "loss": 0.728, - "step": 71631 - }, - { - "epoch": 1.84, - "learning_rate": 6.910251117926664e-07, - "loss": 0.4597, - "step": 71632 - }, - { - "epoch": 1.84, - "learning_rate": 6.90998795366932e-07, - "loss": 0.6606, - "step": 71633 - }, - { - "epoch": 1.84, - "learning_rate": 6.90972479177786e-07, - "loss": 0.4585, - "step": 71634 - }, - { - "epoch": 1.84, - "learning_rate": 6.909461632252477e-07, - "loss": 0.7402, - "step": 71635 - }, - { - "epoch": 1.84, - "learning_rate": 6.909198475093383e-07, - "loss": 0.6851, - "step": 71636 - }, - { - "epoch": 1.84, - "learning_rate": 6.908935320300773e-07, - "loss": 0.5247, - "step": 71637 - }, - { - "epoch": 1.84, - "learning_rate": 6.908672167874845e-07, - "loss": 0.6333, - "step": 71638 - }, - { - "epoch": 1.84, - "learning_rate": 6.908409017815809e-07, - "loss": 0.339, - "step": 71639 - }, - { - "epoch": 1.84, - "learning_rate": 6.908145870123857e-07, - "loss": 0.6499, - "step": 71640 - }, - { - "epoch": 1.84, - "learning_rate": 6.907882724799199e-07, - "loss": 0.4492, - "step": 71641 - }, - { - "epoch": 1.84, - "learning_rate": 6.907619581842031e-07, - "loss": 0.5601, - "step": 71642 - }, - { - "epoch": 1.84, - "learning_rate": 6.907356441252558e-07, - "loss": 0.6611, - "step": 71643 - }, - { - "epoch": 1.84, - "learning_rate": 6.907093303030978e-07, - "loss": 0.79, - "step": 71644 - }, - { - "epoch": 1.84, - "learning_rate": 6.906830167177497e-07, - "loss": 0.7456, - "step": 71645 - }, - { - "epoch": 1.84, - "learning_rate": 6.906567033692313e-07, - "loss": 0.5903, - "step": 71646 - }, - { - "epoch": 1.84, - "learning_rate": 6.90630390257563e-07, - "loss": 0.625, - "step": 71647 - }, - { - "epoch": 1.84, - "learning_rate": 6.906040773827646e-07, - "loss": 0.7148, - "step": 71648 - }, - { - "epoch": 1.84, - "learning_rate": 6.905777647448565e-07, - "loss": 0.6328, - "step": 71649 - }, - { - "epoch": 1.84, - "learning_rate": 6.905514523438586e-07, - "loss": 0.8652, - "step": 71650 - }, - { - "epoch": 1.84, - "learning_rate": 6.905251401797913e-07, - "loss": 0.8994, - "step": 71651 - }, - { - "epoch": 1.84, - "learning_rate": 6.904988282526747e-07, - "loss": 0.4536, - "step": 71652 - }, - { - "epoch": 1.84, - "learning_rate": 6.904725165625289e-07, - "loss": 0.5425, - "step": 71653 - }, - { - "epoch": 1.84, - "learning_rate": 6.90446205109374e-07, - "loss": 0.4907, - "step": 71654 - }, - { - "epoch": 1.84, - "learning_rate": 6.904198938932304e-07, - "loss": 0.6255, - "step": 71655 - }, - { - "epoch": 1.84, - "learning_rate": 6.903935829141179e-07, - "loss": 0.5182, - "step": 71656 - }, - { - "epoch": 1.84, - "learning_rate": 6.90367272172057e-07, - "loss": 0.5249, - "step": 71657 - }, - { - "epoch": 1.84, - "learning_rate": 6.903409616670677e-07, - "loss": 0.7881, - "step": 71658 - }, - { - "epoch": 1.84, - "learning_rate": 6.903146513991697e-07, - "loss": 0.6792, - "step": 71659 - }, - { - "epoch": 1.84, - "learning_rate": 6.902883413683838e-07, - "loss": 0.7617, - "step": 71660 - }, - { - "epoch": 1.84, - "learning_rate": 6.902620315747296e-07, - "loss": 0.7598, - "step": 71661 - }, - { - "epoch": 1.84, - "learning_rate": 6.902357220182278e-07, - "loss": 0.6108, - "step": 71662 - }, - { - "epoch": 1.84, - "learning_rate": 6.902094126988982e-07, - "loss": 0.6924, - "step": 71663 - }, - { - "epoch": 1.84, - "learning_rate": 6.901831036167609e-07, - "loss": 0.6133, - "step": 71664 - }, - { - "epoch": 1.84, - "learning_rate": 6.901567947718363e-07, - "loss": 0.5557, - "step": 71665 - }, - { - "epoch": 1.84, - "learning_rate": 6.901304861641442e-07, - "loss": 0.6592, - "step": 71666 - }, - { - "epoch": 1.84, - "learning_rate": 6.901041777937053e-07, - "loss": 0.5552, - "step": 71667 - }, - { - "epoch": 1.84, - "learning_rate": 6.900778696605392e-07, - "loss": 0.6465, - "step": 71668 - }, - { - "epoch": 1.84, - "learning_rate": 6.900515617646661e-07, - "loss": 0.6431, - "step": 71669 - }, - { - "epoch": 1.84, - "learning_rate": 6.900252541061064e-07, - "loss": 0.603, - "step": 71670 - }, - { - "epoch": 1.84, - "learning_rate": 6.899989466848799e-07, - "loss": 0.8018, - "step": 71671 - }, - { - "epoch": 1.84, - "learning_rate": 6.899726395010072e-07, - "loss": 0.6455, - "step": 71672 - }, - { - "epoch": 1.84, - "learning_rate": 6.899463325545079e-07, - "loss": 0.5479, - "step": 71673 - }, - { - "epoch": 1.84, - "learning_rate": 6.899200258454028e-07, - "loss": 0.6621, - "step": 71674 - }, - { - "epoch": 1.84, - "learning_rate": 6.898937193737113e-07, - "loss": 0.7568, - "step": 71675 - }, - { - "epoch": 1.84, - "learning_rate": 6.898674131394541e-07, - "loss": 0.6797, - "step": 71676 - }, - { - "epoch": 1.84, - "learning_rate": 6.898411071426516e-07, - "loss": 0.6426, - "step": 71677 - }, - { - "epoch": 1.84, - "learning_rate": 6.898148013833229e-07, - "loss": 0.5869, - "step": 71678 - }, - { - "epoch": 1.84, - "learning_rate": 6.89788495861489e-07, - "loss": 0.6621, - "step": 71679 - }, - { - "epoch": 1.84, - "learning_rate": 6.897621905771695e-07, - "loss": 0.7373, - "step": 71680 - }, - { - "epoch": 1.84, - "learning_rate": 6.897358855303852e-07, - "loss": 0.5784, - "step": 71681 - }, - { - "epoch": 1.84, - "learning_rate": 6.89709580721156e-07, - "loss": 0.4042, - "step": 71682 - }, - { - "epoch": 1.84, - "learning_rate": 6.896832761495013e-07, - "loss": 0.7178, - "step": 71683 - }, - { - "epoch": 1.84, - "learning_rate": 6.896569718154422e-07, - "loss": 0.7607, - "step": 71684 - }, - { - "epoch": 1.84, - "learning_rate": 6.896306677189985e-07, - "loss": 0.6738, - "step": 71685 - }, - { - "epoch": 1.84, - "learning_rate": 6.896043638601903e-07, - "loss": 0.4578, - "step": 71686 - }, - { - "epoch": 1.84, - "learning_rate": 6.89578060239038e-07, - "loss": 0.7749, - "step": 71687 - }, - { - "epoch": 1.84, - "learning_rate": 6.895517568555611e-07, - "loss": 0.6855, - "step": 71688 - }, - { - "epoch": 1.84, - "learning_rate": 6.895254537097803e-07, - "loss": 0.6504, - "step": 71689 - }, - { - "epoch": 1.84, - "learning_rate": 6.894991508017155e-07, - "loss": 0.6797, - "step": 71690 - }, - { - "epoch": 1.84, - "learning_rate": 6.894728481313871e-07, - "loss": 0.4255, - "step": 71691 - }, - { - "epoch": 1.84, - "learning_rate": 6.894465456988148e-07, - "loss": 0.3347, - "step": 71692 - }, - { - "epoch": 1.84, - "learning_rate": 6.894202435040193e-07, - "loss": 0.6973, - "step": 71693 - }, - { - "epoch": 1.84, - "learning_rate": 6.893939415470201e-07, - "loss": 0.5918, - "step": 71694 - }, - { - "epoch": 1.84, - "learning_rate": 6.89367639827838e-07, - "loss": 0.6426, - "step": 71695 - }, - { - "epoch": 1.84, - "learning_rate": 6.893413383464925e-07, - "loss": 0.6631, - "step": 71696 - }, - { - "epoch": 1.84, - "learning_rate": 6.893150371030045e-07, - "loss": 0.709, - "step": 71697 - }, - { - "epoch": 1.84, - "learning_rate": 6.892887360973936e-07, - "loss": 0.5439, - "step": 71698 - }, - { - "epoch": 1.84, - "learning_rate": 6.892624353296798e-07, - "loss": 0.7061, - "step": 71699 - }, - { - "epoch": 1.84, - "learning_rate": 6.892361347998835e-07, - "loss": 0.7051, - "step": 71700 - }, - { - "epoch": 1.84, - "learning_rate": 6.892098345080249e-07, - "loss": 0.6356, - "step": 71701 - }, - { - "epoch": 1.84, - "learning_rate": 6.891835344541239e-07, - "loss": 0.5403, - "step": 71702 - }, - { - "epoch": 1.84, - "learning_rate": 6.891572346382009e-07, - "loss": 0.6104, - "step": 71703 - }, - { - "epoch": 1.84, - "learning_rate": 6.891309350602758e-07, - "loss": 0.6172, - "step": 71704 - }, - { - "epoch": 1.84, - "learning_rate": 6.891046357203689e-07, - "loss": 0.7451, - "step": 71705 - }, - { - "epoch": 1.84, - "learning_rate": 6.890783366185003e-07, - "loss": 0.624, - "step": 71706 - }, - { - "epoch": 1.84, - "learning_rate": 6.890520377546902e-07, - "loss": 0.7051, - "step": 71707 - }, - { - "epoch": 1.84, - "learning_rate": 6.890257391289586e-07, - "loss": 0.5664, - "step": 71708 - }, - { - "epoch": 1.84, - "learning_rate": 6.889994407413256e-07, - "loss": 0.6689, - "step": 71709 - }, - { - "epoch": 1.84, - "learning_rate": 6.889731425918117e-07, - "loss": 0.5796, - "step": 71710 - }, - { - "epoch": 1.84, - "learning_rate": 6.889468446804363e-07, - "loss": 0.6914, - "step": 71711 - }, - { - "epoch": 1.84, - "learning_rate": 6.889205470072204e-07, - "loss": 0.8262, - "step": 71712 - }, - { - "epoch": 1.84, - "learning_rate": 6.888942495721834e-07, - "loss": 0.5723, - "step": 71713 - }, - { - "epoch": 1.84, - "learning_rate": 6.88867952375346e-07, - "loss": 0.5183, - "step": 71714 - }, - { - "epoch": 1.84, - "learning_rate": 6.88841655416728e-07, - "loss": 0.604, - "step": 71715 - }, - { - "epoch": 1.84, - "learning_rate": 6.888153586963498e-07, - "loss": 0.7666, - "step": 71716 - }, - { - "epoch": 1.84, - "learning_rate": 6.887890622142316e-07, - "loss": 0.7568, - "step": 71717 - }, - { - "epoch": 1.84, - "learning_rate": 6.887627659703929e-07, - "loss": 0.6924, - "step": 71718 - }, - { - "epoch": 1.84, - "learning_rate": 6.887364699648542e-07, - "loss": 0.7236, - "step": 71719 - }, - { - "epoch": 1.84, - "learning_rate": 6.88710174197636e-07, - "loss": 0.7207, - "step": 71720 - }, - { - "epoch": 1.84, - "learning_rate": 6.886838786687576e-07, - "loss": 0.6719, - "step": 71721 - }, - { - "epoch": 1.84, - "learning_rate": 6.886575833782401e-07, - "loss": 0.666, - "step": 71722 - }, - { - "epoch": 1.84, - "learning_rate": 6.886312883261029e-07, - "loss": 0.6343, - "step": 71723 - }, - { - "epoch": 1.84, - "learning_rate": 6.886049935123666e-07, - "loss": 0.7246, - "step": 71724 - }, - { - "epoch": 1.84, - "learning_rate": 6.885786989370508e-07, - "loss": 0.542, - "step": 71725 - }, - { - "epoch": 1.84, - "learning_rate": 6.885524046001763e-07, - "loss": 0.5798, - "step": 71726 - }, - { - "epoch": 1.84, - "learning_rate": 6.885261105017633e-07, - "loss": 0.5125, - "step": 71727 - }, - { - "epoch": 1.84, - "learning_rate": 6.884998166418308e-07, - "loss": 0.5576, - "step": 71728 - }, - { - "epoch": 1.84, - "learning_rate": 6.884735230204e-07, - "loss": 0.6162, - "step": 71729 - }, - { - "epoch": 1.84, - "learning_rate": 6.884472296374905e-07, - "loss": 0.5359, - "step": 71730 - }, - { - "epoch": 1.84, - "learning_rate": 6.884209364931229e-07, - "loss": 0.5879, - "step": 71731 - }, - { - "epoch": 1.84, - "learning_rate": 6.883946435873167e-07, - "loss": 0.7051, - "step": 71732 - }, - { - "epoch": 1.84, - "learning_rate": 6.883683509200926e-07, - "loss": 0.7031, - "step": 71733 - }, - { - "epoch": 1.84, - "learning_rate": 6.883420584914706e-07, - "loss": 0.6992, - "step": 71734 - }, - { - "epoch": 1.84, - "learning_rate": 6.883157663014707e-07, - "loss": 0.6592, - "step": 71735 - }, - { - "epoch": 1.84, - "learning_rate": 6.882894743501131e-07, - "loss": 0.665, - "step": 71736 - }, - { - "epoch": 1.84, - "learning_rate": 6.882631826374181e-07, - "loss": 0.6309, - "step": 71737 - }, - { - "epoch": 1.84, - "learning_rate": 6.882368911634053e-07, - "loss": 0.5439, - "step": 71738 - }, - { - "epoch": 1.84, - "learning_rate": 6.882105999280954e-07, - "loss": 0.7998, - "step": 71739 - }, - { - "epoch": 1.84, - "learning_rate": 6.881843089315081e-07, - "loss": 0.605, - "step": 71740 - }, - { - "epoch": 1.84, - "learning_rate": 6.881580181736639e-07, - "loss": 0.5684, - "step": 71741 - }, - { - "epoch": 1.84, - "learning_rate": 6.881317276545826e-07, - "loss": 0.5967, - "step": 71742 - }, - { - "epoch": 1.84, - "learning_rate": 6.881054373742848e-07, - "loss": 0.5195, - "step": 71743 - }, - { - "epoch": 1.84, - "learning_rate": 6.8807914733279e-07, - "loss": 0.6963, - "step": 71744 - }, - { - "epoch": 1.84, - "learning_rate": 6.880528575301188e-07, - "loss": 0.7266, - "step": 71745 - }, - { - "epoch": 1.84, - "learning_rate": 6.880265679662911e-07, - "loss": 0.7031, - "step": 71746 - }, - { - "epoch": 1.84, - "learning_rate": 6.880002786413275e-07, - "loss": 0.6426, - "step": 71747 - }, - { - "epoch": 1.84, - "learning_rate": 6.879739895552475e-07, - "loss": 0.6758, - "step": 71748 - }, - { - "epoch": 1.84, - "learning_rate": 6.879477007080713e-07, - "loss": 0.5811, - "step": 71749 - }, - { - "epoch": 1.84, - "learning_rate": 6.879214120998193e-07, - "loss": 0.7842, - "step": 71750 - }, - { - "epoch": 1.84, - "learning_rate": 6.878951237305115e-07, - "loss": 0.5957, - "step": 71751 - }, - { - "epoch": 1.84, - "learning_rate": 6.878688356001681e-07, - "loss": 0.4551, - "step": 71752 - }, - { - "epoch": 1.84, - "learning_rate": 6.878425477088092e-07, - "loss": 0.5715, - "step": 71753 - }, - { - "epoch": 1.84, - "learning_rate": 6.878162600564548e-07, - "loss": 0.7168, - "step": 71754 - }, - { - "epoch": 1.84, - "learning_rate": 6.877899726431253e-07, - "loss": 0.6431, - "step": 71755 - }, - { - "epoch": 1.84, - "learning_rate": 6.877636854688405e-07, - "loss": 0.7354, - "step": 71756 - }, - { - "epoch": 1.84, - "learning_rate": 6.87737398533621e-07, - "loss": 0.668, - "step": 71757 - }, - { - "epoch": 1.84, - "learning_rate": 6.877111118374863e-07, - "loss": 0.6309, - "step": 71758 - }, - { - "epoch": 1.84, - "learning_rate": 6.876848253804568e-07, - "loss": 0.6963, - "step": 71759 - }, - { - "epoch": 1.84, - "learning_rate": 6.876585391625529e-07, - "loss": 0.5991, - "step": 71760 - }, - { - "epoch": 1.84, - "learning_rate": 6.876322531837943e-07, - "loss": 0.5459, - "step": 71761 - }, - { - "epoch": 1.84, - "learning_rate": 6.876059674442014e-07, - "loss": 0.6279, - "step": 71762 - }, - { - "epoch": 1.84, - "learning_rate": 6.875796819437942e-07, - "loss": 0.6992, - "step": 71763 - }, - { - "epoch": 1.84, - "learning_rate": 6.87553396682593e-07, - "loss": 0.6851, - "step": 71764 - }, - { - "epoch": 1.84, - "learning_rate": 6.875271116606175e-07, - "loss": 0.6328, - "step": 71765 - }, - { - "epoch": 1.84, - "learning_rate": 6.875008268778884e-07, - "loss": 0.835, - "step": 71766 - }, - { - "epoch": 1.84, - "learning_rate": 6.874745423344258e-07, - "loss": 0.7256, - "step": 71767 - }, - { - "epoch": 1.84, - "learning_rate": 6.874482580302491e-07, - "loss": 0.6729, - "step": 71768 - }, - { - "epoch": 1.84, - "learning_rate": 6.874219739653792e-07, - "loss": 0.6211, - "step": 71769 - }, - { - "epoch": 1.84, - "learning_rate": 6.873956901398356e-07, - "loss": 0.667, - "step": 71770 - }, - { - "epoch": 1.84, - "learning_rate": 6.873694065536391e-07, - "loss": 0.6479, - "step": 71771 - }, - { - "epoch": 1.84, - "learning_rate": 6.873431232068092e-07, - "loss": 0.6641, - "step": 71772 - }, - { - "epoch": 1.84, - "learning_rate": 6.873168400993663e-07, - "loss": 0.5938, - "step": 71773 - }, - { - "epoch": 1.84, - "learning_rate": 6.872905572313306e-07, - "loss": 0.4219, - "step": 71774 - }, - { - "epoch": 1.84, - "learning_rate": 6.872642746027221e-07, - "loss": 0.6416, - "step": 71775 - }, - { - "epoch": 1.84, - "learning_rate": 6.872379922135612e-07, - "loss": 0.561, - "step": 71776 - }, - { - "epoch": 1.84, - "learning_rate": 6.872117100638679e-07, - "loss": 0.5591, - "step": 71777 - }, - { - "epoch": 1.84, - "learning_rate": 6.871854281536617e-07, - "loss": 0.5962, - "step": 71778 - }, - { - "epoch": 1.84, - "learning_rate": 6.871591464829635e-07, - "loss": 0.5605, - "step": 71779 - }, - { - "epoch": 1.84, - "learning_rate": 6.871328650517929e-07, - "loss": 0.5327, - "step": 71780 - }, - { - "epoch": 1.84, - "learning_rate": 6.871065838601706e-07, - "loss": 0.5542, - "step": 71781 - }, - { - "epoch": 1.84, - "learning_rate": 6.870803029081162e-07, - "loss": 0.7129, - "step": 71782 - }, - { - "epoch": 1.84, - "learning_rate": 6.870540221956501e-07, - "loss": 0.6646, - "step": 71783 - }, - { - "epoch": 1.84, - "learning_rate": 6.870277417227924e-07, - "loss": 0.6392, - "step": 71784 - }, - { - "epoch": 1.84, - "learning_rate": 6.870014614895631e-07, - "loss": 0.5381, - "step": 71785 - }, - { - "epoch": 1.84, - "learning_rate": 6.869751814959822e-07, - "loss": 0.8242, - "step": 71786 - }, - { - "epoch": 1.84, - "learning_rate": 6.869489017420704e-07, - "loss": 0.4761, - "step": 71787 - }, - { - "epoch": 1.84, - "learning_rate": 6.869226222278475e-07, - "loss": 0.5552, - "step": 71788 - }, - { - "epoch": 1.84, - "learning_rate": 6.868963429533334e-07, - "loss": 0.5254, - "step": 71789 - }, - { - "epoch": 1.84, - "learning_rate": 6.86870063918548e-07, - "loss": 0.8135, - "step": 71790 - }, - { - "epoch": 1.84, - "learning_rate": 6.868437851235123e-07, - "loss": 0.7017, - "step": 71791 - }, - { - "epoch": 1.84, - "learning_rate": 6.868175065682454e-07, - "loss": 0.707, - "step": 71792 - }, - { - "epoch": 1.84, - "learning_rate": 6.867912282527684e-07, - "loss": 0.5645, - "step": 71793 - }, - { - "epoch": 1.84, - "learning_rate": 6.867649501771006e-07, - "loss": 0.6216, - "step": 71794 - }, - { - "epoch": 1.84, - "learning_rate": 6.867386723412627e-07, - "loss": 0.4746, - "step": 71795 - }, - { - "epoch": 1.84, - "learning_rate": 6.867123947452744e-07, - "loss": 0.9297, - "step": 71796 - }, - { - "epoch": 1.84, - "learning_rate": 6.866861173891565e-07, - "loss": 0.5928, - "step": 71797 - }, - { - "epoch": 1.84, - "learning_rate": 6.866598402729283e-07, - "loss": 0.4189, - "step": 71798 - }, - { - "epoch": 1.84, - "learning_rate": 6.866335633966101e-07, - "loss": 0.5659, - "step": 71799 - }, - { - "epoch": 1.84, - "learning_rate": 6.866072867602224e-07, - "loss": 0.6392, - "step": 71800 - }, - { - "epoch": 1.84, - "learning_rate": 6.865810103637849e-07, - "loss": 0.6245, - "step": 71801 - }, - { - "epoch": 1.84, - "learning_rate": 6.865547342073181e-07, - "loss": 0.4849, - "step": 71802 - }, - { - "epoch": 1.84, - "learning_rate": 6.865284582908417e-07, - "loss": 0.7383, - "step": 71803 - }, - { - "epoch": 1.84, - "learning_rate": 6.865021826143762e-07, - "loss": 0.4551, - "step": 71804 - }, - { - "epoch": 1.84, - "learning_rate": 6.864759071779415e-07, - "loss": 0.6392, - "step": 71805 - }, - { - "epoch": 1.84, - "learning_rate": 6.864496319815578e-07, - "loss": 0.5684, - "step": 71806 - }, - { - "epoch": 1.84, - "learning_rate": 6.864233570252455e-07, - "loss": 0.8037, - "step": 71807 - }, - { - "epoch": 1.84, - "learning_rate": 6.863970823090244e-07, - "loss": 0.6836, - "step": 71808 - }, - { - "epoch": 1.84, - "learning_rate": 6.863708078329143e-07, - "loss": 0.6992, - "step": 71809 - }, - { - "epoch": 1.84, - "learning_rate": 6.863445335969356e-07, - "loss": 0.3436, - "step": 71810 - }, - { - "epoch": 1.84, - "learning_rate": 6.863182596011085e-07, - "loss": 0.5715, - "step": 71811 - }, - { - "epoch": 1.84, - "learning_rate": 6.862919858454533e-07, - "loss": 0.4187, - "step": 71812 - }, - { - "epoch": 1.84, - "learning_rate": 6.862657123299897e-07, - "loss": 0.6157, - "step": 71813 - }, - { - "epoch": 1.84, - "learning_rate": 6.862394390547381e-07, - "loss": 0.6318, - "step": 71814 - }, - { - "epoch": 1.84, - "learning_rate": 6.862131660197185e-07, - "loss": 0.6514, - "step": 71815 - }, - { - "epoch": 1.84, - "learning_rate": 6.861868932249513e-07, - "loss": 0.8379, - "step": 71816 - }, - { - "epoch": 1.84, - "learning_rate": 6.861606206704562e-07, - "loss": 0.6348, - "step": 71817 - }, - { - "epoch": 1.84, - "learning_rate": 6.861343483562534e-07, - "loss": 0.7617, - "step": 71818 - }, - { - "epoch": 1.84, - "learning_rate": 6.861080762823633e-07, - "loss": 0.8174, - "step": 71819 - }, - { - "epoch": 1.84, - "learning_rate": 6.860818044488053e-07, - "loss": 0.6582, - "step": 71820 - }, - { - "epoch": 1.84, - "learning_rate": 6.860555328556006e-07, - "loss": 0.542, - "step": 71821 - }, - { - "epoch": 1.84, - "learning_rate": 6.860292615027683e-07, - "loss": 0.4926, - "step": 71822 - }, - { - "epoch": 1.84, - "learning_rate": 6.860029903903293e-07, - "loss": 0.6709, - "step": 71823 - }, - { - "epoch": 1.84, - "learning_rate": 6.859767195183031e-07, - "loss": 0.5469, - "step": 71824 - }, - { - "epoch": 1.84, - "learning_rate": 6.859504488867103e-07, - "loss": 0.5522, - "step": 71825 - }, - { - "epoch": 1.84, - "learning_rate": 6.85924178495571e-07, - "loss": 0.4966, - "step": 71826 - }, - { - "epoch": 1.84, - "learning_rate": 6.85897908344905e-07, - "loss": 0.7861, - "step": 71827 - }, - { - "epoch": 1.84, - "learning_rate": 6.858716384347322e-07, - "loss": 0.6689, - "step": 71828 - }, - { - "epoch": 1.84, - "learning_rate": 6.858453687650734e-07, - "loss": 0.6641, - "step": 71829 - }, - { - "epoch": 1.84, - "learning_rate": 6.85819099335948e-07, - "loss": 0.6377, - "step": 71830 - }, - { - "epoch": 1.84, - "learning_rate": 6.857928301473767e-07, - "loss": 0.3616, - "step": 71831 - }, - { - "epoch": 1.84, - "learning_rate": 6.857665611993793e-07, - "loss": 0.584, - "step": 71832 - }, - { - "epoch": 1.84, - "learning_rate": 6.85740292491976e-07, - "loss": 0.7939, - "step": 71833 - }, - { - "epoch": 1.84, - "learning_rate": 6.857140240251868e-07, - "loss": 0.7236, - "step": 71834 - }, - { - "epoch": 1.84, - "learning_rate": 6.856877557990321e-07, - "loss": 0.6367, - "step": 71835 - }, - { - "epoch": 1.84, - "learning_rate": 6.856614878135321e-07, - "loss": 0.5615, - "step": 71836 - }, - { - "epoch": 1.84, - "learning_rate": 6.856352200687062e-07, - "loss": 0.6855, - "step": 71837 - }, - { - "epoch": 1.84, - "learning_rate": 6.856089525645752e-07, - "loss": 0.6094, - "step": 71838 - }, - { - "epoch": 1.84, - "learning_rate": 6.855826853011587e-07, - "loss": 0.563, - "step": 71839 - }, - { - "epoch": 1.84, - "learning_rate": 6.855564182784774e-07, - "loss": 0.6943, - "step": 71840 - }, - { - "epoch": 1.84, - "learning_rate": 6.855301514965508e-07, - "loss": 0.6416, - "step": 71841 - }, - { - "epoch": 1.84, - "learning_rate": 6.855038849553994e-07, - "loss": 0.5991, - "step": 71842 - }, - { - "epoch": 1.84, - "learning_rate": 6.854776186550431e-07, - "loss": 0.6465, - "step": 71843 - }, - { - "epoch": 1.84, - "learning_rate": 6.854513525955024e-07, - "loss": 0.6274, - "step": 71844 - }, - { - "epoch": 1.84, - "learning_rate": 6.854250867767971e-07, - "loss": 0.6528, - "step": 71845 - }, - { - "epoch": 1.84, - "learning_rate": 6.853988211989475e-07, - "loss": 0.5483, - "step": 71846 - }, - { - "epoch": 1.84, - "learning_rate": 6.853725558619731e-07, - "loss": 0.6943, - "step": 71847 - }, - { - "epoch": 1.84, - "learning_rate": 6.853462907658949e-07, - "loss": 0.6348, - "step": 71848 - }, - { - "epoch": 1.84, - "learning_rate": 6.853200259107321e-07, - "loss": 0.7007, - "step": 71849 - }, - { - "epoch": 1.84, - "learning_rate": 6.852937612965057e-07, - "loss": 0.6895, - "step": 71850 - }, - { - "epoch": 1.84, - "learning_rate": 6.852674969232352e-07, - "loss": 0.5518, - "step": 71851 - }, - { - "epoch": 1.84, - "learning_rate": 6.852412327909409e-07, - "loss": 0.5562, - "step": 71852 - }, - { - "epoch": 1.84, - "learning_rate": 6.852149688996429e-07, - "loss": 0.5789, - "step": 71853 - }, - { - "epoch": 1.84, - "learning_rate": 6.851887052493614e-07, - "loss": 0.667, - "step": 71854 - }, - { - "epoch": 1.84, - "learning_rate": 6.851624418401163e-07, - "loss": 0.7812, - "step": 71855 - }, - { - "epoch": 1.84, - "learning_rate": 6.851361786719283e-07, - "loss": 0.6826, - "step": 71856 - }, - { - "epoch": 1.84, - "learning_rate": 6.851099157448168e-07, - "loss": 0.4934, - "step": 71857 - }, - { - "epoch": 1.84, - "learning_rate": 6.850836530588019e-07, - "loss": 0.6172, - "step": 71858 - }, - { - "epoch": 1.84, - "learning_rate": 6.850573906139042e-07, - "loss": 0.397, - "step": 71859 - }, - { - "epoch": 1.84, - "learning_rate": 6.850311284101434e-07, - "loss": 0.7549, - "step": 71860 - }, - { - "epoch": 1.84, - "learning_rate": 6.8500486644754e-07, - "loss": 0.6099, - "step": 71861 - }, - { - "epoch": 1.84, - "learning_rate": 6.849786047261139e-07, - "loss": 0.5889, - "step": 71862 - }, - { - "epoch": 1.84, - "learning_rate": 6.849523432458848e-07, - "loss": 0.5996, - "step": 71863 - }, - { - "epoch": 1.84, - "learning_rate": 6.849260820068736e-07, - "loss": 0.4919, - "step": 71864 - }, - { - "epoch": 1.84, - "learning_rate": 6.848998210090999e-07, - "loss": 0.7305, - "step": 71865 - }, - { - "epoch": 1.84, - "learning_rate": 6.848735602525842e-07, - "loss": 0.6108, - "step": 71866 - }, - { - "epoch": 1.84, - "learning_rate": 6.84847299737346e-07, - "loss": 0.7129, - "step": 71867 - }, - { - "epoch": 1.84, - "learning_rate": 6.848210394634057e-07, - "loss": 0.7119, - "step": 71868 - }, - { - "epoch": 1.84, - "learning_rate": 6.847947794307836e-07, - "loss": 0.7422, - "step": 71869 - }, - { - "epoch": 1.84, - "learning_rate": 6.847685196394994e-07, - "loss": 0.6191, - "step": 71870 - }, - { - "epoch": 1.84, - "learning_rate": 6.847422600895736e-07, - "loss": 0.4531, - "step": 71871 - }, - { - "epoch": 1.84, - "learning_rate": 6.847160007810261e-07, - "loss": 0.5967, - "step": 71872 - }, - { - "epoch": 1.84, - "learning_rate": 6.846897417138772e-07, - "loss": 0.5004, - "step": 71873 - }, - { - "epoch": 1.84, - "learning_rate": 6.846634828881465e-07, - "loss": 0.5166, - "step": 71874 - }, - { - "epoch": 1.84, - "learning_rate": 6.84637224303855e-07, - "loss": 0.5312, - "step": 71875 - }, - { - "epoch": 1.84, - "learning_rate": 6.846109659610223e-07, - "loss": 0.6895, - "step": 71876 - }, - { - "epoch": 1.84, - "learning_rate": 6.84584707859668e-07, - "loss": 0.6572, - "step": 71877 - }, - { - "epoch": 1.84, - "learning_rate": 6.84558449999813e-07, - "loss": 0.624, - "step": 71878 - }, - { - "epoch": 1.84, - "learning_rate": 6.845321923814771e-07, - "loss": 0.7363, - "step": 71879 - }, - { - "epoch": 1.84, - "learning_rate": 6.845059350046803e-07, - "loss": 0.4333, - "step": 71880 - }, - { - "epoch": 1.84, - "learning_rate": 6.844796778694427e-07, - "loss": 0.584, - "step": 71881 - }, - { - "epoch": 1.84, - "learning_rate": 6.844534209757844e-07, - "loss": 0.4863, - "step": 71882 - }, - { - "epoch": 1.84, - "learning_rate": 6.84427164323726e-07, - "loss": 0.8262, - "step": 71883 - }, - { - "epoch": 1.84, - "learning_rate": 6.844009079132869e-07, - "loss": 0.5225, - "step": 71884 - }, - { - "epoch": 1.84, - "learning_rate": 6.843746517444876e-07, - "loss": 0.7969, - "step": 71885 - }, - { - "epoch": 1.84, - "learning_rate": 6.843483958173484e-07, - "loss": 0.6367, - "step": 71886 - }, - { - "epoch": 1.84, - "learning_rate": 6.843221401318889e-07, - "loss": 0.7344, - "step": 71887 - }, - { - "epoch": 1.84, - "learning_rate": 6.842958846881293e-07, - "loss": 0.6118, - "step": 71888 - }, - { - "epoch": 1.84, - "learning_rate": 6.842696294860898e-07, - "loss": 0.8428, - "step": 71889 - }, - { - "epoch": 1.84, - "learning_rate": 6.842433745257908e-07, - "loss": 0.5112, - "step": 71890 - }, - { - "epoch": 1.84, - "learning_rate": 6.842171198072517e-07, - "loss": 0.5815, - "step": 71891 - }, - { - "epoch": 1.84, - "learning_rate": 6.841908653304933e-07, - "loss": 0.6211, - "step": 71892 - }, - { - "epoch": 1.84, - "learning_rate": 6.841646110955354e-07, - "loss": 0.75, - "step": 71893 - }, - { - "epoch": 1.84, - "learning_rate": 6.841383571023982e-07, - "loss": 0.6797, - "step": 71894 - }, - { - "epoch": 1.84, - "learning_rate": 6.841121033511015e-07, - "loss": 0.6025, - "step": 71895 - }, - { - "epoch": 1.84, - "learning_rate": 6.840858498416664e-07, - "loss": 0.5977, - "step": 71896 - }, - { - "epoch": 1.84, - "learning_rate": 6.840595965741115e-07, - "loss": 0.4937, - "step": 71897 - }, - { - "epoch": 1.84, - "learning_rate": 6.840333435484578e-07, - "loss": 0.46, - "step": 71898 - }, - { - "epoch": 1.84, - "learning_rate": 6.840070907647253e-07, - "loss": 0.8057, - "step": 71899 - }, - { - "epoch": 1.84, - "learning_rate": 6.83980838222934e-07, - "loss": 0.624, - "step": 71900 - }, - { - "epoch": 1.84, - "learning_rate": 6.83954585923104e-07, - "loss": 0.7393, - "step": 71901 - }, - { - "epoch": 1.84, - "learning_rate": 6.839283338652555e-07, - "loss": 0.7061, - "step": 71902 - }, - { - "epoch": 1.84, - "learning_rate": 6.839020820494083e-07, - "loss": 0.574, - "step": 71903 - }, - { - "epoch": 1.84, - "learning_rate": 6.838758304755831e-07, - "loss": 0.7075, - "step": 71904 - }, - { - "epoch": 1.84, - "learning_rate": 6.838495791437993e-07, - "loss": 0.5332, - "step": 71905 - }, - { - "epoch": 1.84, - "learning_rate": 6.838233280540778e-07, - "loss": 0.7002, - "step": 71906 - }, - { - "epoch": 1.84, - "learning_rate": 6.837970772064381e-07, - "loss": 0.4966, - "step": 71907 - }, - { - "epoch": 1.84, - "learning_rate": 6.837708266009002e-07, - "loss": 0.6743, - "step": 71908 - }, - { - "epoch": 1.84, - "learning_rate": 6.837445762374845e-07, - "loss": 0.749, - "step": 71909 - }, - { - "epoch": 1.84, - "learning_rate": 6.83718326116211e-07, - "loss": 0.6543, - "step": 71910 - }, - { - "epoch": 1.84, - "learning_rate": 6.836920762371e-07, - "loss": 0.6865, - "step": 71911 - }, - { - "epoch": 1.84, - "learning_rate": 6.836658266001713e-07, - "loss": 0.5815, - "step": 71912 - }, - { - "epoch": 1.84, - "learning_rate": 6.836395772054452e-07, - "loss": 0.6675, - "step": 71913 - }, - { - "epoch": 1.84, - "learning_rate": 6.836133280529415e-07, - "loss": 0.6729, - "step": 71914 - }, - { - "epoch": 1.84, - "learning_rate": 6.835870791426809e-07, - "loss": 0.5566, - "step": 71915 - }, - { - "epoch": 1.84, - "learning_rate": 6.835608304746833e-07, - "loss": 0.5083, - "step": 71916 - }, - { - "epoch": 1.84, - "learning_rate": 6.835345820489684e-07, - "loss": 0.6865, - "step": 71917 - }, - { - "epoch": 1.84, - "learning_rate": 6.835083338655562e-07, - "loss": 0.8174, - "step": 71918 - }, - { - "epoch": 1.84, - "learning_rate": 6.834820859244675e-07, - "loss": 0.4978, - "step": 71919 - }, - { - "epoch": 1.84, - "learning_rate": 6.834558382257216e-07, - "loss": 0.6104, - "step": 71920 - }, - { - "epoch": 1.84, - "learning_rate": 6.834295907693392e-07, - "loss": 0.7432, - "step": 71921 - }, - { - "epoch": 1.84, - "learning_rate": 6.834033435553403e-07, - "loss": 0.6758, - "step": 71922 - }, - { - "epoch": 1.84, - "learning_rate": 6.833770965837448e-07, - "loss": 0.6675, - "step": 71923 - }, - { - "epoch": 1.84, - "learning_rate": 6.833508498545729e-07, - "loss": 0.481, - "step": 71924 - }, - { - "epoch": 1.84, - "learning_rate": 6.833246033678448e-07, - "loss": 0.5518, - "step": 71925 - }, - { - "epoch": 1.84, - "learning_rate": 6.832983571235808e-07, - "loss": 0.7959, - "step": 71926 - }, - { - "epoch": 1.84, - "learning_rate": 6.832721111218001e-07, - "loss": 0.6743, - "step": 71927 - }, - { - "epoch": 1.84, - "learning_rate": 6.832458653625237e-07, - "loss": 0.6377, - "step": 71928 - }, - { - "epoch": 1.84, - "learning_rate": 6.832196198457712e-07, - "loss": 0.6484, - "step": 71929 - }, - { - "epoch": 1.84, - "learning_rate": 6.83193374571563e-07, - "loss": 0.6953, - "step": 71930 - }, - { - "epoch": 1.84, - "learning_rate": 6.831671295399189e-07, - "loss": 0.6572, - "step": 71931 - }, - { - "epoch": 1.84, - "learning_rate": 6.831408847508593e-07, - "loss": 0.6128, - "step": 71932 - }, - { - "epoch": 1.84, - "learning_rate": 6.83114640204404e-07, - "loss": 0.625, - "step": 71933 - }, - { - "epoch": 1.84, - "learning_rate": 6.830883959005736e-07, - "loss": 0.5781, - "step": 71934 - }, - { - "epoch": 1.84, - "learning_rate": 6.830621518393875e-07, - "loss": 0.7441, - "step": 71935 - }, - { - "epoch": 1.84, - "learning_rate": 6.830359080208666e-07, - "loss": 0.7012, - "step": 71936 - }, - { - "epoch": 1.84, - "learning_rate": 6.8300966444503e-07, - "loss": 0.4656, - "step": 71937 - }, - { - "epoch": 1.84, - "learning_rate": 6.829834211118986e-07, - "loss": 0.9277, - "step": 71938 - }, - { - "epoch": 1.84, - "learning_rate": 6.829571780214921e-07, - "loss": 0.5957, - "step": 71939 - }, - { - "epoch": 1.84, - "learning_rate": 6.829309351738308e-07, - "loss": 0.7393, - "step": 71940 - }, - { - "epoch": 1.84, - "learning_rate": 6.829046925689346e-07, - "loss": 0.5449, - "step": 71941 - }, - { - "epoch": 1.84, - "learning_rate": 6.828784502068238e-07, - "loss": 0.6914, - "step": 71942 - }, - { - "epoch": 1.84, - "learning_rate": 6.828522080875181e-07, - "loss": 0.627, - "step": 71943 - }, - { - "epoch": 1.84, - "learning_rate": 6.828259662110383e-07, - "loss": 0.4475, - "step": 71944 - }, - { - "epoch": 1.84, - "learning_rate": 6.827997245774037e-07, - "loss": 0.6816, - "step": 71945 - }, - { - "epoch": 1.84, - "learning_rate": 6.827734831866352e-07, - "loss": 0.7812, - "step": 71946 - }, - { - "epoch": 1.84, - "learning_rate": 6.827472420387523e-07, - "loss": 0.6045, - "step": 71947 - }, - { - "epoch": 1.84, - "learning_rate": 6.827210011337751e-07, - "loss": 0.5146, - "step": 71948 - }, - { - "epoch": 1.84, - "learning_rate": 6.82694760471724e-07, - "loss": 0.6953, - "step": 71949 - }, - { - "epoch": 1.84, - "learning_rate": 6.826685200526186e-07, - "loss": 0.7793, - "step": 71950 - }, - { - "epoch": 1.84, - "learning_rate": 6.826422798764797e-07, - "loss": 0.6992, - "step": 71951 - }, - { - "epoch": 1.84, - "learning_rate": 6.826160399433269e-07, - "loss": 0.623, - "step": 71952 - }, - { - "epoch": 1.84, - "learning_rate": 6.825898002531803e-07, - "loss": 0.6719, - "step": 71953 - }, - { - "epoch": 1.84, - "learning_rate": 6.825635608060603e-07, - "loss": 0.6309, - "step": 71954 - }, - { - "epoch": 1.84, - "learning_rate": 6.825373216019865e-07, - "loss": 0.5884, - "step": 71955 - }, - { - "epoch": 1.84, - "learning_rate": 6.825110826409797e-07, - "loss": 0.7344, - "step": 71956 - }, - { - "epoch": 1.84, - "learning_rate": 6.824848439230592e-07, - "loss": 0.5674, - "step": 71957 - }, - { - "epoch": 1.84, - "learning_rate": 6.824586054482455e-07, - "loss": 0.7544, - "step": 71958 - }, - { - "epoch": 1.84, - "learning_rate": 6.824323672165588e-07, - "loss": 0.4609, - "step": 71959 - }, - { - "epoch": 1.84, - "learning_rate": 6.824061292280187e-07, - "loss": 0.6768, - "step": 71960 - }, - { - "epoch": 1.84, - "learning_rate": 6.823798914826461e-07, - "loss": 0.5635, - "step": 71961 - }, - { - "epoch": 1.84, - "learning_rate": 6.823536539804602e-07, - "loss": 0.6738, - "step": 71962 - }, - { - "epoch": 1.84, - "learning_rate": 6.823274167214817e-07, - "loss": 0.6548, - "step": 71963 - }, - { - "epoch": 1.84, - "learning_rate": 6.823011797057303e-07, - "loss": 0.584, - "step": 71964 - }, - { - "epoch": 1.84, - "learning_rate": 6.822749429332267e-07, - "loss": 0.5879, - "step": 71965 - }, - { - "epoch": 1.84, - "learning_rate": 6.822487064039904e-07, - "loss": 0.6084, - "step": 71966 - }, - { - "epoch": 1.84, - "learning_rate": 6.822224701180414e-07, - "loss": 0.7021, - "step": 71967 - }, - { - "epoch": 1.84, - "learning_rate": 6.821962340754004e-07, - "loss": 0.584, - "step": 71968 - }, - { - "epoch": 1.84, - "learning_rate": 6.821699982760869e-07, - "loss": 0.6006, - "step": 71969 - }, - { - "epoch": 1.84, - "learning_rate": 6.821437627201212e-07, - "loss": 0.582, - "step": 71970 - }, - { - "epoch": 1.84, - "learning_rate": 6.821175274075235e-07, - "loss": 0.5576, - "step": 71971 - }, - { - "epoch": 1.84, - "learning_rate": 6.820912923383136e-07, - "loss": 0.6348, - "step": 71972 - }, - { - "epoch": 1.84, - "learning_rate": 6.82065057512512e-07, - "loss": 0.7881, - "step": 71973 - }, - { - "epoch": 1.84, - "learning_rate": 6.820388229301384e-07, - "loss": 0.7041, - "step": 71974 - }, - { - "epoch": 1.84, - "learning_rate": 6.820125885912132e-07, - "loss": 0.666, - "step": 71975 - }, - { - "epoch": 1.84, - "learning_rate": 6.819863544957566e-07, - "loss": 0.4943, - "step": 71976 - }, - { - "epoch": 1.84, - "learning_rate": 6.81960120643788e-07, - "loss": 0.626, - "step": 71977 - }, - { - "epoch": 1.84, - "learning_rate": 6.819338870353281e-07, - "loss": 0.5532, - "step": 71978 - }, - { - "epoch": 1.84, - "learning_rate": 6.819076536703966e-07, - "loss": 0.5605, - "step": 71979 - }, - { - "epoch": 1.84, - "learning_rate": 6.81881420549014e-07, - "loss": 0.6033, - "step": 71980 - }, - { - "epoch": 1.84, - "learning_rate": 6.818551876712e-07, - "loss": 0.8535, - "step": 71981 - }, - { - "epoch": 1.84, - "learning_rate": 6.818289550369749e-07, - "loss": 0.6143, - "step": 71982 - }, - { - "epoch": 1.84, - "learning_rate": 6.818027226463587e-07, - "loss": 0.5767, - "step": 71983 - }, - { - "epoch": 1.84, - "learning_rate": 6.817764904993717e-07, - "loss": 0.5742, - "step": 71984 - }, - { - "epoch": 1.85, - "learning_rate": 6.817502585960335e-07, - "loss": 0.6631, - "step": 71985 - }, - { - "epoch": 1.85, - "learning_rate": 6.817240269363652e-07, - "loss": 0.3938, - "step": 71986 - }, - { - "epoch": 1.85, - "learning_rate": 6.816977955203855e-07, - "loss": 0.4531, - "step": 71987 - }, - { - "epoch": 1.85, - "learning_rate": 6.816715643481155e-07, - "loss": 0.707, - "step": 71988 - }, - { - "epoch": 1.85, - "learning_rate": 6.816453334195747e-07, - "loss": 0.6211, - "step": 71989 - }, - { - "epoch": 1.85, - "learning_rate": 6.816191027347835e-07, - "loss": 0.5486, - "step": 71990 - }, - { - "epoch": 1.85, - "learning_rate": 6.815928722937619e-07, - "loss": 0.5894, - "step": 71991 - }, - { - "epoch": 1.85, - "learning_rate": 6.815666420965301e-07, - "loss": 0.666, - "step": 71992 - }, - { - "epoch": 1.85, - "learning_rate": 6.815404121431076e-07, - "loss": 0.7461, - "step": 71993 - }, - { - "epoch": 1.85, - "learning_rate": 6.815141824335155e-07, - "loss": 0.5216, - "step": 71994 - }, - { - "epoch": 1.85, - "learning_rate": 6.81487952967773e-07, - "loss": 0.6152, - "step": 71995 - }, - { - "epoch": 1.85, - "learning_rate": 6.814617237459011e-07, - "loss": 0.7944, - "step": 71996 - }, - { - "epoch": 1.85, - "learning_rate": 6.814354947679191e-07, - "loss": 0.7275, - "step": 71997 - }, - { - "epoch": 1.85, - "learning_rate": 6.814092660338471e-07, - "loss": 0.4966, - "step": 71998 - }, - { - "epoch": 1.85, - "learning_rate": 6.813830375437054e-07, - "loss": 0.5352, - "step": 71999 - }, - { - "epoch": 1.85, - "learning_rate": 6.813568092975139e-07, - "loss": 0.6914, - "step": 72000 - }, - { - "epoch": 1.85, - "learning_rate": 6.813305812952932e-07, - "loss": 0.5698, - "step": 72001 - }, - { - "epoch": 1.85, - "learning_rate": 6.813043535370626e-07, - "loss": 0.6689, - "step": 72002 - }, - { - "epoch": 1.85, - "learning_rate": 6.81278126022843e-07, - "loss": 0.6182, - "step": 72003 - }, - { - "epoch": 1.85, - "learning_rate": 6.812518987526537e-07, - "loss": 0.5825, - "step": 72004 - }, - { - "epoch": 1.85, - "learning_rate": 6.812256717265155e-07, - "loss": 0.7329, - "step": 72005 - }, - { - "epoch": 1.85, - "learning_rate": 6.811994449444483e-07, - "loss": 0.403, - "step": 72006 - }, - { - "epoch": 1.85, - "learning_rate": 6.811732184064718e-07, - "loss": 0.6594, - "step": 72007 - }, - { - "epoch": 1.85, - "learning_rate": 6.811469921126063e-07, - "loss": 0.5713, - "step": 72008 - }, - { - "epoch": 1.85, - "learning_rate": 6.811207660628718e-07, - "loss": 0.6953, - "step": 72009 - }, - { - "epoch": 1.85, - "learning_rate": 6.810945402572884e-07, - "loss": 0.5952, - "step": 72010 - }, - { - "epoch": 1.85, - "learning_rate": 6.810683146958764e-07, - "loss": 0.4596, - "step": 72011 - }, - { - "epoch": 1.85, - "learning_rate": 6.810420893786557e-07, - "loss": 0.6787, - "step": 72012 - }, - { - "epoch": 1.85, - "learning_rate": 6.810158643056464e-07, - "loss": 0.5884, - "step": 72013 - }, - { - "epoch": 1.85, - "learning_rate": 6.809896394768685e-07, - "loss": 0.6992, - "step": 72014 - }, - { - "epoch": 1.85, - "learning_rate": 6.809634148923423e-07, - "loss": 0.5386, - "step": 72015 - }, - { - "epoch": 1.85, - "learning_rate": 6.80937190552088e-07, - "loss": 0.7705, - "step": 72016 - }, - { - "epoch": 1.85, - "learning_rate": 6.80910966456125e-07, - "loss": 0.5146, - "step": 72017 - }, - { - "epoch": 1.85, - "learning_rate": 6.808847426044739e-07, - "loss": 0.4995, - "step": 72018 - }, - { - "epoch": 1.85, - "learning_rate": 6.808585189971546e-07, - "loss": 0.6206, - "step": 72019 - }, - { - "epoch": 1.85, - "learning_rate": 6.808322956341874e-07, - "loss": 0.635, - "step": 72020 - }, - { - "epoch": 1.85, - "learning_rate": 6.808060725155921e-07, - "loss": 0.718, - "step": 72021 - }, - { - "epoch": 1.85, - "learning_rate": 6.80779849641389e-07, - "loss": 0.5549, - "step": 72022 - }, - { - "epoch": 1.85, - "learning_rate": 6.807536270115981e-07, - "loss": 0.5674, - "step": 72023 - }, - { - "epoch": 1.85, - "learning_rate": 6.807274046262395e-07, - "loss": 0.3816, - "step": 72024 - }, - { - "epoch": 1.85, - "learning_rate": 6.807011824853333e-07, - "loss": 0.7437, - "step": 72025 - }, - { - "epoch": 1.85, - "learning_rate": 6.806749605888998e-07, - "loss": 0.4771, - "step": 72026 - }, - { - "epoch": 1.85, - "learning_rate": 6.806487389369582e-07, - "loss": 0.6289, - "step": 72027 - }, - { - "epoch": 1.85, - "learning_rate": 6.806225175295295e-07, - "loss": 0.9443, - "step": 72028 - }, - { - "epoch": 1.85, - "learning_rate": 6.805962963666331e-07, - "loss": 0.6846, - "step": 72029 - }, - { - "epoch": 1.85, - "learning_rate": 6.805700754482899e-07, - "loss": 0.5627, - "step": 72030 - }, - { - "epoch": 1.85, - "learning_rate": 6.805438547745191e-07, - "loss": 0.6914, - "step": 72031 - }, - { - "epoch": 1.85, - "learning_rate": 6.805176343453415e-07, - "loss": 0.6631, - "step": 72032 - }, - { - "epoch": 1.85, - "learning_rate": 6.804914141607766e-07, - "loss": 0.4561, - "step": 72033 - }, - { - "epoch": 1.85, - "learning_rate": 6.804651942208449e-07, - "loss": 0.7021, - "step": 72034 - }, - { - "epoch": 1.85, - "learning_rate": 6.804389745255661e-07, - "loss": 0.6973, - "step": 72035 - }, - { - "epoch": 1.85, - "learning_rate": 6.80412755074961e-07, - "loss": 0.4999, - "step": 72036 - }, - { - "epoch": 1.85, - "learning_rate": 6.80386535869049e-07, - "loss": 0.6582, - "step": 72037 - }, - { - "epoch": 1.85, - "learning_rate": 6.8036031690785e-07, - "loss": 0.5742, - "step": 72038 - }, - { - "epoch": 1.85, - "learning_rate": 6.803340981913845e-07, - "loss": 0.7861, - "step": 72039 - }, - { - "epoch": 1.85, - "learning_rate": 6.803078797196724e-07, - "loss": 0.6074, - "step": 72040 - }, - { - "epoch": 1.85, - "learning_rate": 6.802816614927341e-07, - "loss": 0.6807, - "step": 72041 - }, - { - "epoch": 1.85, - "learning_rate": 6.802554435105894e-07, - "loss": 0.4827, - "step": 72042 - }, - { - "epoch": 1.85, - "learning_rate": 6.802292257732583e-07, - "loss": 0.5864, - "step": 72043 - }, - { - "epoch": 1.85, - "learning_rate": 6.80203008280761e-07, - "loss": 0.6426, - "step": 72044 - }, - { - "epoch": 1.85, - "learning_rate": 6.801767910331176e-07, - "loss": 0.7129, - "step": 72045 - }, - { - "epoch": 1.85, - "learning_rate": 6.801505740303483e-07, - "loss": 0.7314, - "step": 72046 - }, - { - "epoch": 1.85, - "learning_rate": 6.801243572724728e-07, - "loss": 0.5811, - "step": 72047 - }, - { - "epoch": 1.85, - "learning_rate": 6.800981407595112e-07, - "loss": 0.6271, - "step": 72048 - }, - { - "epoch": 1.85, - "learning_rate": 6.80071924491484e-07, - "loss": 0.4873, - "step": 72049 - }, - { - "epoch": 1.85, - "learning_rate": 6.800457084684108e-07, - "loss": 0.6445, - "step": 72050 - }, - { - "epoch": 1.85, - "learning_rate": 6.80019492690312e-07, - "loss": 0.6206, - "step": 72051 - }, - { - "epoch": 1.85, - "learning_rate": 6.799932771572074e-07, - "loss": 0.7197, - "step": 72052 - }, - { - "epoch": 1.85, - "learning_rate": 6.799670618691175e-07, - "loss": 0.6152, - "step": 72053 - }, - { - "epoch": 1.85, - "learning_rate": 6.799408468260619e-07, - "loss": 0.6343, - "step": 72054 - }, - { - "epoch": 1.85, - "learning_rate": 6.799146320280611e-07, - "loss": 0.6465, - "step": 72055 - }, - { - "epoch": 1.85, - "learning_rate": 6.798884174751351e-07, - "loss": 0.6406, - "step": 72056 - }, - { - "epoch": 1.85, - "learning_rate": 6.798622031673035e-07, - "loss": 0.5859, - "step": 72057 - }, - { - "epoch": 1.85, - "learning_rate": 6.798359891045868e-07, - "loss": 0.9307, - "step": 72058 - }, - { - "epoch": 1.85, - "learning_rate": 6.798097752870049e-07, - "loss": 0.5825, - "step": 72059 - }, - { - "epoch": 1.85, - "learning_rate": 6.797835617145779e-07, - "loss": 0.1942, - "step": 72060 - }, - { - "epoch": 1.85, - "learning_rate": 6.79757348387326e-07, - "loss": 0.6782, - "step": 72061 - }, - { - "epoch": 1.85, - "learning_rate": 6.797311353052691e-07, - "loss": 0.5708, - "step": 72062 - }, - { - "epoch": 1.85, - "learning_rate": 6.797049224684272e-07, - "loss": 0.474, - "step": 72063 - }, - { - "epoch": 1.85, - "learning_rate": 6.796787098768206e-07, - "loss": 0.4849, - "step": 72064 - }, - { - "epoch": 1.85, - "learning_rate": 6.796524975304695e-07, - "loss": 0.6631, - "step": 72065 - }, - { - "epoch": 1.85, - "learning_rate": 6.796262854293939e-07, - "loss": 0.7188, - "step": 72066 - }, - { - "epoch": 1.85, - "learning_rate": 6.796000735736132e-07, - "loss": 0.6621, - "step": 72067 - }, - { - "epoch": 1.85, - "learning_rate": 6.795738619631483e-07, - "loss": 0.584, - "step": 72068 - }, - { - "epoch": 1.85, - "learning_rate": 6.795476505980188e-07, - "loss": 0.7383, - "step": 72069 - }, - { - "epoch": 1.85, - "learning_rate": 6.795214394782451e-07, - "loss": 0.48, - "step": 72070 - }, - { - "epoch": 1.85, - "learning_rate": 6.794952286038469e-07, - "loss": 0.6978, - "step": 72071 - }, - { - "epoch": 1.85, - "learning_rate": 6.794690179748446e-07, - "loss": 0.4983, - "step": 72072 - }, - { - "epoch": 1.85, - "learning_rate": 6.79442807591258e-07, - "loss": 0.6396, - "step": 72073 - }, - { - "epoch": 1.85, - "learning_rate": 6.794165974531074e-07, - "loss": 0.7197, - "step": 72074 - }, - { - "epoch": 1.85, - "learning_rate": 6.793903875604127e-07, - "loss": 0.6221, - "step": 72075 - }, - { - "epoch": 1.85, - "learning_rate": 6.793641779131947e-07, - "loss": 0.7065, - "step": 72076 - }, - { - "epoch": 1.85, - "learning_rate": 6.793379685114719e-07, - "loss": 0.5474, - "step": 72077 - }, - { - "epoch": 1.85, - "learning_rate": 6.793117593552657e-07, - "loss": 0.6147, - "step": 72078 - }, - { - "epoch": 1.85, - "learning_rate": 6.792855504445955e-07, - "loss": 0.668, - "step": 72079 - }, - { - "epoch": 1.85, - "learning_rate": 6.792593417794819e-07, - "loss": 0.7031, - "step": 72080 - }, - { - "epoch": 1.85, - "learning_rate": 6.792331333599443e-07, - "loss": 0.6182, - "step": 72081 - }, - { - "epoch": 1.85, - "learning_rate": 6.792069251860035e-07, - "loss": 0.6621, - "step": 72082 - }, - { - "epoch": 1.85, - "learning_rate": 6.791807172576789e-07, - "loss": 0.4097, - "step": 72083 - }, - { - "epoch": 1.85, - "learning_rate": 6.791545095749912e-07, - "loss": 0.5762, - "step": 72084 - }, - { - "epoch": 1.85, - "learning_rate": 6.791283021379599e-07, - "loss": 0.6875, - "step": 72085 - }, - { - "epoch": 1.85, - "learning_rate": 6.791020949466055e-07, - "loss": 0.4912, - "step": 72086 - }, - { - "epoch": 1.85, - "learning_rate": 6.790758880009479e-07, - "loss": 0.5928, - "step": 72087 - }, - { - "epoch": 1.85, - "learning_rate": 6.790496813010069e-07, - "loss": 0.5127, - "step": 72088 - }, - { - "epoch": 1.85, - "learning_rate": 6.790234748468029e-07, - "loss": 0.5928, - "step": 72089 - }, - { - "epoch": 1.85, - "learning_rate": 6.789972686383558e-07, - "loss": 0.5767, - "step": 72090 - }, - { - "epoch": 1.85, - "learning_rate": 6.78971062675686e-07, - "loss": 0.6436, - "step": 72091 - }, - { - "epoch": 1.85, - "learning_rate": 6.789448569588128e-07, - "loss": 0.6445, - "step": 72092 - }, - { - "epoch": 1.85, - "learning_rate": 6.789186514877572e-07, - "loss": 0.5986, - "step": 72093 - }, - { - "epoch": 1.85, - "learning_rate": 6.788924462625385e-07, - "loss": 0.5586, - "step": 72094 - }, - { - "epoch": 1.85, - "learning_rate": 6.788662412831774e-07, - "loss": 0.6533, - "step": 72095 - }, - { - "epoch": 1.85, - "learning_rate": 6.788400365496937e-07, - "loss": 0.6152, - "step": 72096 - }, - { - "epoch": 1.85, - "learning_rate": 6.788138320621073e-07, - "loss": 0.6213, - "step": 72097 - }, - { - "epoch": 1.85, - "learning_rate": 6.787876278204382e-07, - "loss": 0.5542, - "step": 72098 - }, - { - "epoch": 1.85, - "learning_rate": 6.787614238247069e-07, - "loss": 0.5347, - "step": 72099 - }, - { - "epoch": 1.85, - "learning_rate": 6.787352200749328e-07, - "loss": 0.48, - "step": 72100 - }, - { - "epoch": 1.85, - "learning_rate": 6.787090165711368e-07, - "loss": 0.5083, - "step": 72101 - }, - { - "epoch": 1.85, - "learning_rate": 6.786828133133382e-07, - "loss": 0.5618, - "step": 72102 - }, - { - "epoch": 1.85, - "learning_rate": 6.786566103015576e-07, - "loss": 0.6455, - "step": 72103 - }, - { - "epoch": 1.85, - "learning_rate": 6.786304075358146e-07, - "loss": 0.4907, - "step": 72104 - }, - { - "epoch": 1.85, - "learning_rate": 6.786042050161299e-07, - "loss": 0.4834, - "step": 72105 - }, - { - "epoch": 1.85, - "learning_rate": 6.785780027425233e-07, - "loss": 0.6133, - "step": 72106 - }, - { - "epoch": 1.85, - "learning_rate": 6.785518007150144e-07, - "loss": 0.7734, - "step": 72107 - }, - { - "epoch": 1.85, - "learning_rate": 6.785255989336236e-07, - "loss": 0.538, - "step": 72108 - }, - { - "epoch": 1.85, - "learning_rate": 6.78499397398371e-07, - "loss": 0.5981, - "step": 72109 - }, - { - "epoch": 1.85, - "learning_rate": 6.784731961092767e-07, - "loss": 0.7373, - "step": 72110 - }, - { - "epoch": 1.85, - "learning_rate": 6.784469950663605e-07, - "loss": 0.7007, - "step": 72111 - }, - { - "epoch": 1.85, - "learning_rate": 6.78420794269643e-07, - "loss": 0.7119, - "step": 72112 - }, - { - "epoch": 1.85, - "learning_rate": 6.783945937191436e-07, - "loss": 0.6279, - "step": 72113 - }, - { - "epoch": 1.85, - "learning_rate": 6.783683934148827e-07, - "loss": 0.5635, - "step": 72114 - }, - { - "epoch": 1.85, - "learning_rate": 6.783421933568807e-07, - "loss": 0.4153, - "step": 72115 - }, - { - "epoch": 1.85, - "learning_rate": 6.783159935451572e-07, - "loss": 0.431, - "step": 72116 - }, - { - "epoch": 1.85, - "learning_rate": 6.782897939797319e-07, - "loss": 0.627, - "step": 72117 - }, - { - "epoch": 1.85, - "learning_rate": 6.782635946606257e-07, - "loss": 0.6426, - "step": 72118 - }, - { - "epoch": 1.85, - "learning_rate": 6.78237395587858e-07, - "loss": 0.7334, - "step": 72119 - }, - { - "epoch": 1.85, - "learning_rate": 6.782111967614495e-07, - "loss": 0.6953, - "step": 72120 - }, - { - "epoch": 1.85, - "learning_rate": 6.781849981814193e-07, - "loss": 0.4045, - "step": 72121 - }, - { - "epoch": 1.85, - "learning_rate": 6.781587998477887e-07, - "loss": 0.5488, - "step": 72122 - }, - { - "epoch": 1.85, - "learning_rate": 6.781326017605766e-07, - "loss": 0.5894, - "step": 72123 - }, - { - "epoch": 1.85, - "learning_rate": 6.781064039198039e-07, - "loss": 0.6777, - "step": 72124 - }, - { - "epoch": 1.85, - "learning_rate": 6.780802063254904e-07, - "loss": 0.5144, - "step": 72125 - }, - { - "epoch": 1.85, - "learning_rate": 6.780540089776559e-07, - "loss": 0.5483, - "step": 72126 - }, - { - "epoch": 1.85, - "learning_rate": 6.780278118763207e-07, - "loss": 0.6387, - "step": 72127 - }, - { - "epoch": 1.85, - "learning_rate": 6.780016150215046e-07, - "loss": 0.5122, - "step": 72128 - }, - { - "epoch": 1.85, - "learning_rate": 6.77975418413228e-07, - "loss": 0.7075, - "step": 72129 - }, - { - "epoch": 1.85, - "learning_rate": 6.779492220515109e-07, - "loss": 0.6558, - "step": 72130 - }, - { - "epoch": 1.85, - "learning_rate": 6.779230259363731e-07, - "loss": 0.6934, - "step": 72131 - }, - { - "epoch": 1.85, - "learning_rate": 6.778968300678349e-07, - "loss": 0.8057, - "step": 72132 - }, - { - "epoch": 1.85, - "learning_rate": 6.778706344459163e-07, - "loss": 0.6133, - "step": 72133 - }, - { - "epoch": 1.85, - "learning_rate": 6.778444390706375e-07, - "loss": 0.71, - "step": 72134 - }, - { - "epoch": 1.85, - "learning_rate": 6.778182439420184e-07, - "loss": 0.5015, - "step": 72135 - }, - { - "epoch": 1.85, - "learning_rate": 6.777920490600788e-07, - "loss": 0.5278, - "step": 72136 - }, - { - "epoch": 1.85, - "learning_rate": 6.777658544248392e-07, - "loss": 0.665, - "step": 72137 - }, - { - "epoch": 1.85, - "learning_rate": 6.777396600363193e-07, - "loss": 0.6289, - "step": 72138 - }, - { - "epoch": 1.85, - "learning_rate": 6.777134658945393e-07, - "loss": 0.7441, - "step": 72139 - }, - { - "epoch": 1.85, - "learning_rate": 6.776872719995195e-07, - "loss": 0.4614, - "step": 72140 - }, - { - "epoch": 1.85, - "learning_rate": 6.776610783512796e-07, - "loss": 0.4663, - "step": 72141 - }, - { - "epoch": 1.85, - "learning_rate": 6.776348849498397e-07, - "loss": 0.7773, - "step": 72142 - }, - { - "epoch": 1.85, - "learning_rate": 6.776086917952202e-07, - "loss": 0.5244, - "step": 72143 - }, - { - "epoch": 1.85, - "learning_rate": 6.775824988874406e-07, - "loss": 0.7305, - "step": 72144 - }, - { - "epoch": 1.85, - "learning_rate": 6.775563062265217e-07, - "loss": 0.6875, - "step": 72145 - }, - { - "epoch": 1.85, - "learning_rate": 6.775301138124829e-07, - "loss": 0.624, - "step": 72146 - }, - { - "epoch": 1.85, - "learning_rate": 6.775039216453442e-07, - "loss": 0.3892, - "step": 72147 - }, - { - "epoch": 1.85, - "learning_rate": 6.774777297251261e-07, - "loss": 0.5801, - "step": 72148 - }, - { - "epoch": 1.85, - "learning_rate": 6.774515380518486e-07, - "loss": 0.5425, - "step": 72149 - }, - { - "epoch": 1.85, - "learning_rate": 6.774253466255315e-07, - "loss": 0.6113, - "step": 72150 - }, - { - "epoch": 1.85, - "learning_rate": 6.773991554461951e-07, - "loss": 0.6602, - "step": 72151 - }, - { - "epoch": 1.85, - "learning_rate": 6.77372964513859e-07, - "loss": 0.6309, - "step": 72152 - }, - { - "epoch": 1.85, - "learning_rate": 6.773467738285439e-07, - "loss": 0.6758, - "step": 72153 - }, - { - "epoch": 1.85, - "learning_rate": 6.773205833902693e-07, - "loss": 0.6592, - "step": 72154 - }, - { - "epoch": 1.85, - "learning_rate": 6.772943931990559e-07, - "loss": 0.5018, - "step": 72155 - }, - { - "epoch": 1.85, - "learning_rate": 6.772682032549232e-07, - "loss": 0.6357, - "step": 72156 - }, - { - "epoch": 1.85, - "learning_rate": 6.772420135578911e-07, - "loss": 0.5083, - "step": 72157 - }, - { - "epoch": 1.85, - "learning_rate": 6.772158241079801e-07, - "loss": 0.6201, - "step": 72158 - }, - { - "epoch": 1.85, - "learning_rate": 6.771896349052102e-07, - "loss": 0.6738, - "step": 72159 - }, - { - "epoch": 1.85, - "learning_rate": 6.771634459496012e-07, - "loss": 0.6309, - "step": 72160 - }, - { - "epoch": 1.85, - "learning_rate": 6.771372572411734e-07, - "loss": 0.7139, - "step": 72161 - }, - { - "epoch": 1.85, - "learning_rate": 6.771110687799468e-07, - "loss": 0.6807, - "step": 72162 - }, - { - "epoch": 1.85, - "learning_rate": 6.770848805659413e-07, - "loss": 0.499, - "step": 72163 - }, - { - "epoch": 1.85, - "learning_rate": 6.77058692599177e-07, - "loss": 0.7451, - "step": 72164 - }, - { - "epoch": 1.85, - "learning_rate": 6.770325048796745e-07, - "loss": 0.7559, - "step": 72165 - }, - { - "epoch": 1.85, - "learning_rate": 6.770063174074531e-07, - "loss": 0.6592, - "step": 72166 - }, - { - "epoch": 1.85, - "learning_rate": 6.769801301825329e-07, - "loss": 0.7578, - "step": 72167 - }, - { - "epoch": 1.85, - "learning_rate": 6.769539432049343e-07, - "loss": 0.5806, - "step": 72168 - }, - { - "epoch": 1.85, - "learning_rate": 6.76927756474677e-07, - "loss": 0.6621, - "step": 72169 - }, - { - "epoch": 1.85, - "learning_rate": 6.769015699917815e-07, - "loss": 0.5825, - "step": 72170 - }, - { - "epoch": 1.85, - "learning_rate": 6.768753837562674e-07, - "loss": 0.5085, - "step": 72171 - }, - { - "epoch": 1.85, - "learning_rate": 6.768491977681552e-07, - "loss": 0.5522, - "step": 72172 - }, - { - "epoch": 1.85, - "learning_rate": 6.768230120274645e-07, - "loss": 0.5962, - "step": 72173 - }, - { - "epoch": 1.85, - "learning_rate": 6.767968265342157e-07, - "loss": 0.8477, - "step": 72174 - }, - { - "epoch": 1.85, - "learning_rate": 6.767706412884289e-07, - "loss": 0.6377, - "step": 72175 - }, - { - "epoch": 1.85, - "learning_rate": 6.767444562901236e-07, - "loss": 0.4, - "step": 72176 - }, - { - "epoch": 1.85, - "learning_rate": 6.767182715393205e-07, - "loss": 0.5615, - "step": 72177 - }, - { - "epoch": 1.85, - "learning_rate": 6.76692087036039e-07, - "loss": 0.5874, - "step": 72178 - }, - { - "epoch": 1.85, - "learning_rate": 6.766659027802999e-07, - "loss": 0.6304, - "step": 72179 - }, - { - "epoch": 1.85, - "learning_rate": 6.766397187721224e-07, - "loss": 0.6343, - "step": 72180 - }, - { - "epoch": 1.85, - "learning_rate": 6.766135350115274e-07, - "loss": 0.5796, - "step": 72181 - }, - { - "epoch": 1.85, - "learning_rate": 6.765873514985343e-07, - "loss": 0.52, - "step": 72182 - }, - { - "epoch": 1.85, - "learning_rate": 6.765611682331636e-07, - "loss": 0.5525, - "step": 72183 - }, - { - "epoch": 1.85, - "learning_rate": 6.765349852154349e-07, - "loss": 0.5918, - "step": 72184 - }, - { - "epoch": 1.85, - "learning_rate": 6.765088024453691e-07, - "loss": 0.6362, - "step": 72185 - }, - { - "epoch": 1.85, - "learning_rate": 6.76482619922985e-07, - "loss": 0.6221, - "step": 72186 - }, - { - "epoch": 1.85, - "learning_rate": 6.764564376483035e-07, - "loss": 0.6455, - "step": 72187 - }, - { - "epoch": 1.85, - "learning_rate": 6.764302556213442e-07, - "loss": 0.5659, - "step": 72188 - }, - { - "epoch": 1.85, - "learning_rate": 6.764040738421277e-07, - "loss": 0.7861, - "step": 72189 - }, - { - "epoch": 1.85, - "learning_rate": 6.763778923106733e-07, - "loss": 0.5981, - "step": 72190 - }, - { - "epoch": 1.85, - "learning_rate": 6.763517110270019e-07, - "loss": 0.4326, - "step": 72191 - }, - { - "epoch": 1.85, - "learning_rate": 6.763255299911328e-07, - "loss": 0.5728, - "step": 72192 - }, - { - "epoch": 1.85, - "learning_rate": 6.762993492030866e-07, - "loss": 0.4995, - "step": 72193 - }, - { - "epoch": 1.85, - "learning_rate": 6.762731686628829e-07, - "loss": 0.5723, - "step": 72194 - }, - { - "epoch": 1.85, - "learning_rate": 6.762469883705424e-07, - "loss": 0.6006, - "step": 72195 - }, - { - "epoch": 1.85, - "learning_rate": 6.762208083260843e-07, - "loss": 0.6216, - "step": 72196 - }, - { - "epoch": 1.85, - "learning_rate": 6.76194628529529e-07, - "loss": 0.7324, - "step": 72197 - }, - { - "epoch": 1.85, - "learning_rate": 6.761684489808967e-07, - "loss": 0.6167, - "step": 72198 - }, - { - "epoch": 1.85, - "learning_rate": 6.761422696802073e-07, - "loss": 0.6074, - "step": 72199 - }, - { - "epoch": 1.85, - "learning_rate": 6.761160906274808e-07, - "loss": 0.6445, - "step": 72200 - }, - { - "epoch": 1.85, - "learning_rate": 6.760899118227373e-07, - "loss": 0.582, - "step": 72201 - }, - { - "epoch": 1.85, - "learning_rate": 6.760637332659971e-07, - "loss": 0.5103, - "step": 72202 - }, - { - "epoch": 1.85, - "learning_rate": 6.760375549572796e-07, - "loss": 0.479, - "step": 72203 - }, - { - "epoch": 1.85, - "learning_rate": 6.760113768966057e-07, - "loss": 0.6885, - "step": 72204 - }, - { - "epoch": 1.85, - "learning_rate": 6.759851990839951e-07, - "loss": 0.5352, - "step": 72205 - }, - { - "epoch": 1.85, - "learning_rate": 6.759590215194675e-07, - "loss": 0.6318, - "step": 72206 - }, - { - "epoch": 1.85, - "learning_rate": 6.75932844203043e-07, - "loss": 0.498, - "step": 72207 - }, - { - "epoch": 1.85, - "learning_rate": 6.75906667134742e-07, - "loss": 0.6299, - "step": 72208 - }, - { - "epoch": 1.85, - "learning_rate": 6.758804903145841e-07, - "loss": 0.6436, - "step": 72209 - }, - { - "epoch": 1.85, - "learning_rate": 6.758543137425898e-07, - "loss": 0.5034, - "step": 72210 - }, - { - "epoch": 1.85, - "learning_rate": 6.758281374187789e-07, - "loss": 0.627, - "step": 72211 - }, - { - "epoch": 1.85, - "learning_rate": 6.758019613431716e-07, - "loss": 0.5159, - "step": 72212 - }, - { - "epoch": 1.85, - "learning_rate": 6.757757855157877e-07, - "loss": 0.6265, - "step": 72213 - }, - { - "epoch": 1.85, - "learning_rate": 6.757496099366476e-07, - "loss": 0.667, - "step": 72214 - }, - { - "epoch": 1.85, - "learning_rate": 6.757234346057712e-07, - "loss": 0.7324, - "step": 72215 - }, - { - "epoch": 1.85, - "learning_rate": 6.75697259523178e-07, - "loss": 0.6045, - "step": 72216 - }, - { - "epoch": 1.85, - "learning_rate": 6.756710846888888e-07, - "loss": 0.6689, - "step": 72217 - }, - { - "epoch": 1.85, - "learning_rate": 6.756449101029231e-07, - "loss": 0.6475, - "step": 72218 - }, - { - "epoch": 1.85, - "learning_rate": 6.756187357653014e-07, - "loss": 0.8057, - "step": 72219 - }, - { - "epoch": 1.85, - "learning_rate": 6.755925616760433e-07, - "loss": 0.5098, - "step": 72220 - }, - { - "epoch": 1.85, - "learning_rate": 6.755663878351693e-07, - "loss": 0.6641, - "step": 72221 - }, - { - "epoch": 1.85, - "learning_rate": 6.755402142426991e-07, - "loss": 0.4058, - "step": 72222 - }, - { - "epoch": 1.85, - "learning_rate": 6.755140408986529e-07, - "loss": 0.6992, - "step": 72223 - }, - { - "epoch": 1.85, - "learning_rate": 6.754878678030505e-07, - "loss": 0.7188, - "step": 72224 - }, - { - "epoch": 1.85, - "learning_rate": 6.754616949559126e-07, - "loss": 0.4904, - "step": 72225 - }, - { - "epoch": 1.85, - "learning_rate": 6.754355223572582e-07, - "loss": 0.6665, - "step": 72226 - }, - { - "epoch": 1.85, - "learning_rate": 6.754093500071082e-07, - "loss": 0.7207, - "step": 72227 - }, - { - "epoch": 1.85, - "learning_rate": 6.75383177905482e-07, - "loss": 0.7021, - "step": 72228 - }, - { - "epoch": 1.85, - "learning_rate": 6.753570060524003e-07, - "loss": 0.5737, - "step": 72229 - }, - { - "epoch": 1.85, - "learning_rate": 6.753308344478826e-07, - "loss": 0.637, - "step": 72230 - }, - { - "epoch": 1.85, - "learning_rate": 6.753046630919493e-07, - "loss": 0.4878, - "step": 72231 - }, - { - "epoch": 1.85, - "learning_rate": 6.752784919846201e-07, - "loss": 0.5542, - "step": 72232 - }, - { - "epoch": 1.85, - "learning_rate": 6.752523211259155e-07, - "loss": 0.5391, - "step": 72233 - }, - { - "epoch": 1.85, - "learning_rate": 6.752261505158549e-07, - "loss": 0.5688, - "step": 72234 - }, - { - "epoch": 1.85, - "learning_rate": 6.751999801544595e-07, - "loss": 0.5654, - "step": 72235 - }, - { - "epoch": 1.85, - "learning_rate": 6.751738100417479e-07, - "loss": 0.5557, - "step": 72236 - }, - { - "epoch": 1.85, - "learning_rate": 6.751476401777408e-07, - "loss": 0.7617, - "step": 72237 - }, - { - "epoch": 1.85, - "learning_rate": 6.751214705624584e-07, - "loss": 0.7559, - "step": 72238 - }, - { - "epoch": 1.85, - "learning_rate": 6.750953011959204e-07, - "loss": 0.623, - "step": 72239 - }, - { - "epoch": 1.85, - "learning_rate": 6.75069132078147e-07, - "loss": 0.6777, - "step": 72240 - }, - { - "epoch": 1.85, - "learning_rate": 6.750429632091584e-07, - "loss": 0.6953, - "step": 72241 - }, - { - "epoch": 1.85, - "learning_rate": 6.75016794588974e-07, - "loss": 0.6587, - "step": 72242 - }, - { - "epoch": 1.85, - "learning_rate": 6.749906262176147e-07, - "loss": 0.7109, - "step": 72243 - }, - { - "epoch": 1.85, - "learning_rate": 6.749644580950999e-07, - "loss": 0.5513, - "step": 72244 - }, - { - "epoch": 1.85, - "learning_rate": 6.749382902214503e-07, - "loss": 0.632, - "step": 72245 - }, - { - "epoch": 1.85, - "learning_rate": 6.749121225966853e-07, - "loss": 0.5181, - "step": 72246 - }, - { - "epoch": 1.85, - "learning_rate": 6.74885955220825e-07, - "loss": 0.6934, - "step": 72247 - }, - { - "epoch": 1.85, - "learning_rate": 6.748597880938896e-07, - "loss": 0.5186, - "step": 72248 - }, - { - "epoch": 1.85, - "learning_rate": 6.748336212158989e-07, - "loss": 0.6279, - "step": 72249 - }, - { - "epoch": 1.85, - "learning_rate": 6.748074545868736e-07, - "loss": 0.7354, - "step": 72250 - }, - { - "epoch": 1.85, - "learning_rate": 6.747812882068329e-07, - "loss": 0.6377, - "step": 72251 - }, - { - "epoch": 1.85, - "learning_rate": 6.747551220757974e-07, - "loss": 0.6885, - "step": 72252 - }, - { - "epoch": 1.85, - "learning_rate": 6.747289561937868e-07, - "loss": 0.8076, - "step": 72253 - }, - { - "epoch": 1.85, - "learning_rate": 6.747027905608216e-07, - "loss": 0.5942, - "step": 72254 - }, - { - "epoch": 1.85, - "learning_rate": 6.746766251769216e-07, - "loss": 0.6641, - "step": 72255 - }, - { - "epoch": 1.85, - "learning_rate": 6.746504600421065e-07, - "loss": 0.6099, - "step": 72256 - }, - { - "epoch": 1.85, - "learning_rate": 6.746242951563963e-07, - "loss": 0.6641, - "step": 72257 - }, - { - "epoch": 1.85, - "learning_rate": 6.745981305198117e-07, - "loss": 0.6162, - "step": 72258 - }, - { - "epoch": 1.85, - "learning_rate": 6.745719661323721e-07, - "loss": 0.6213, - "step": 72259 - }, - { - "epoch": 1.85, - "learning_rate": 6.74545801994098e-07, - "loss": 0.6953, - "step": 72260 - }, - { - "epoch": 1.85, - "learning_rate": 6.745196381050089e-07, - "loss": 0.7695, - "step": 72261 - }, - { - "epoch": 1.85, - "learning_rate": 6.744934744651255e-07, - "loss": 0.7451, - "step": 72262 - }, - { - "epoch": 1.85, - "learning_rate": 6.744673110744672e-07, - "loss": 0.8271, - "step": 72263 - }, - { - "epoch": 1.85, - "learning_rate": 6.744411479330545e-07, - "loss": 0.6123, - "step": 72264 - }, - { - "epoch": 1.85, - "learning_rate": 6.744149850409076e-07, - "loss": 0.5061, - "step": 72265 - }, - { - "epoch": 1.85, - "learning_rate": 6.743888223980455e-07, - "loss": 0.7695, - "step": 72266 - }, - { - "epoch": 1.85, - "learning_rate": 6.743626600044893e-07, - "loss": 0.6079, - "step": 72267 - }, - { - "epoch": 1.85, - "learning_rate": 6.743364978602584e-07, - "loss": 0.3853, - "step": 72268 - }, - { - "epoch": 1.85, - "learning_rate": 6.743103359653732e-07, - "loss": 0.5908, - "step": 72269 - }, - { - "epoch": 1.85, - "learning_rate": 6.742841743198535e-07, - "loss": 0.6846, - "step": 72270 - }, - { - "epoch": 1.85, - "learning_rate": 6.742580129237196e-07, - "loss": 0.4497, - "step": 72271 - }, - { - "epoch": 1.85, - "learning_rate": 6.742318517769911e-07, - "loss": 0.5127, - "step": 72272 - }, - { - "epoch": 1.85, - "learning_rate": 6.742056908796884e-07, - "loss": 0.6992, - "step": 72273 - }, - { - "epoch": 1.85, - "learning_rate": 6.741795302318314e-07, - "loss": 0.5464, - "step": 72274 - }, - { - "epoch": 1.85, - "learning_rate": 6.741533698334408e-07, - "loss": 0.5869, - "step": 72275 - }, - { - "epoch": 1.85, - "learning_rate": 6.741272096845354e-07, - "loss": 0.6094, - "step": 72276 - }, - { - "epoch": 1.85, - "learning_rate": 6.741010497851358e-07, - "loss": 0.6562, - "step": 72277 - }, - { - "epoch": 1.85, - "learning_rate": 6.74074890135262e-07, - "loss": 0.6079, - "step": 72278 - }, - { - "epoch": 1.85, - "learning_rate": 6.740487307349343e-07, - "loss": 0.5122, - "step": 72279 - }, - { - "epoch": 1.85, - "learning_rate": 6.740225715841721e-07, - "loss": 0.3499, - "step": 72280 - }, - { - "epoch": 1.85, - "learning_rate": 6.739964126829963e-07, - "loss": 0.7139, - "step": 72281 - }, - { - "epoch": 1.85, - "learning_rate": 6.73970254031426e-07, - "loss": 0.5991, - "step": 72282 - }, - { - "epoch": 1.85, - "learning_rate": 6.73944095629482e-07, - "loss": 0.5159, - "step": 72283 - }, - { - "epoch": 1.85, - "learning_rate": 6.739179374771837e-07, - "loss": 0.6914, - "step": 72284 - }, - { - "epoch": 1.85, - "learning_rate": 6.73891779574552e-07, - "loss": 0.749, - "step": 72285 - }, - { - "epoch": 1.85, - "learning_rate": 6.738656219216061e-07, - "loss": 0.7656, - "step": 72286 - }, - { - "epoch": 1.85, - "learning_rate": 6.738394645183662e-07, - "loss": 0.3787, - "step": 72287 - }, - { - "epoch": 1.85, - "learning_rate": 6.738133073648525e-07, - "loss": 0.7334, - "step": 72288 - }, - { - "epoch": 1.85, - "learning_rate": 6.737871504610848e-07, - "loss": 0.7256, - "step": 72289 - }, - { - "epoch": 1.85, - "learning_rate": 6.737609938070833e-07, - "loss": 0.667, - "step": 72290 - }, - { - "epoch": 1.85, - "learning_rate": 6.737348374028681e-07, - "loss": 0.5234, - "step": 72291 - }, - { - "epoch": 1.85, - "learning_rate": 6.737086812484592e-07, - "loss": 0.5002, - "step": 72292 - }, - { - "epoch": 1.85, - "learning_rate": 6.736825253438764e-07, - "loss": 0.75, - "step": 72293 - }, - { - "epoch": 1.85, - "learning_rate": 6.7365636968914e-07, - "loss": 0.4915, - "step": 72294 - }, - { - "epoch": 1.85, - "learning_rate": 6.736302142842702e-07, - "loss": 0.6436, - "step": 72295 - }, - { - "epoch": 1.85, - "learning_rate": 6.736040591292865e-07, - "loss": 0.437, - "step": 72296 - }, - { - "epoch": 1.85, - "learning_rate": 6.735779042242089e-07, - "loss": 0.6523, - "step": 72297 - }, - { - "epoch": 1.85, - "learning_rate": 6.73551749569058e-07, - "loss": 0.6182, - "step": 72298 - }, - { - "epoch": 1.85, - "learning_rate": 6.735255951638532e-07, - "loss": 0.6284, - "step": 72299 - }, - { - "epoch": 1.85, - "learning_rate": 6.734994410086153e-07, - "loss": 0.6265, - "step": 72300 - }, - { - "epoch": 1.85, - "learning_rate": 6.734732871033634e-07, - "loss": 0.668, - "step": 72301 - }, - { - "epoch": 1.85, - "learning_rate": 6.734471334481182e-07, - "loss": 0.5464, - "step": 72302 - }, - { - "epoch": 1.85, - "learning_rate": 6.734209800428994e-07, - "loss": 0.7344, - "step": 72303 - }, - { - "epoch": 1.85, - "learning_rate": 6.733948268877273e-07, - "loss": 0.7803, - "step": 72304 - }, - { - "epoch": 1.85, - "learning_rate": 6.73368673982622e-07, - "loss": 0.5859, - "step": 72305 - }, - { - "epoch": 1.85, - "learning_rate": 6.73342521327603e-07, - "loss": 0.5728, - "step": 72306 - }, - { - "epoch": 1.85, - "learning_rate": 6.733163689226906e-07, - "loss": 0.6133, - "step": 72307 - }, - { - "epoch": 1.85, - "learning_rate": 6.732902167679047e-07, - "loss": 0.6284, - "step": 72308 - }, - { - "epoch": 1.85, - "learning_rate": 6.732640648632657e-07, - "loss": 0.6953, - "step": 72309 - }, - { - "epoch": 1.85, - "learning_rate": 6.73237913208793e-07, - "loss": 0.6768, - "step": 72310 - }, - { - "epoch": 1.85, - "learning_rate": 6.732117618045074e-07, - "loss": 0.6226, - "step": 72311 - }, - { - "epoch": 1.85, - "learning_rate": 6.731856106504285e-07, - "loss": 0.5443, - "step": 72312 - }, - { - "epoch": 1.85, - "learning_rate": 6.731594597465762e-07, - "loss": 0.6289, - "step": 72313 - }, - { - "epoch": 1.85, - "learning_rate": 6.731333090929707e-07, - "loss": 0.4641, - "step": 72314 - }, - { - "epoch": 1.85, - "learning_rate": 6.731071586896324e-07, - "loss": 0.5935, - "step": 72315 - }, - { - "epoch": 1.85, - "learning_rate": 6.730810085365804e-07, - "loss": 0.6738, - "step": 72316 - }, - { - "epoch": 1.85, - "learning_rate": 6.730548586338355e-07, - "loss": 0.6377, - "step": 72317 - }, - { - "epoch": 1.85, - "learning_rate": 6.730287089814173e-07, - "loss": 0.5405, - "step": 72318 - }, - { - "epoch": 1.85, - "learning_rate": 6.73002559579346e-07, - "loss": 0.6577, - "step": 72319 - }, - { - "epoch": 1.85, - "learning_rate": 6.729764104276416e-07, - "loss": 0.5342, - "step": 72320 - }, - { - "epoch": 1.85, - "learning_rate": 6.729502615263242e-07, - "loss": 0.5596, - "step": 72321 - }, - { - "epoch": 1.85, - "learning_rate": 6.729241128754135e-07, - "loss": 0.7031, - "step": 72322 - }, - { - "epoch": 1.85, - "learning_rate": 6.728979644749302e-07, - "loss": 0.6182, - "step": 72323 - }, - { - "epoch": 1.85, - "learning_rate": 6.728718163248934e-07, - "loss": 0.5918, - "step": 72324 - }, - { - "epoch": 1.85, - "learning_rate": 6.728456684253241e-07, - "loss": 0.6201, - "step": 72325 - }, - { - "epoch": 1.85, - "learning_rate": 6.728195207762418e-07, - "loss": 0.5015, - "step": 72326 - }, - { - "epoch": 1.85, - "learning_rate": 6.727933733776663e-07, - "loss": 0.7217, - "step": 72327 - }, - { - "epoch": 1.85, - "learning_rate": 6.727672262296179e-07, - "loss": 0.6084, - "step": 72328 - }, - { - "epoch": 1.85, - "learning_rate": 6.727410793321166e-07, - "loss": 0.7148, - "step": 72329 - }, - { - "epoch": 1.85, - "learning_rate": 6.727149326851824e-07, - "loss": 0.686, - "step": 72330 - }, - { - "epoch": 1.85, - "learning_rate": 6.726887862888354e-07, - "loss": 0.709, - "step": 72331 - }, - { - "epoch": 1.85, - "learning_rate": 6.726626401430953e-07, - "loss": 0.4263, - "step": 72332 - }, - { - "epoch": 1.85, - "learning_rate": 6.726364942479827e-07, - "loss": 0.7207, - "step": 72333 - }, - { - "epoch": 1.85, - "learning_rate": 6.726103486035171e-07, - "loss": 0.6934, - "step": 72334 - }, - { - "epoch": 1.85, - "learning_rate": 6.725842032097189e-07, - "loss": 0.624, - "step": 72335 - }, - { - "epoch": 1.85, - "learning_rate": 6.72558058066608e-07, - "loss": 0.6553, - "step": 72336 - }, - { - "epoch": 1.85, - "learning_rate": 6.725319131742038e-07, - "loss": 0.7046, - "step": 72337 - }, - { - "epoch": 1.85, - "learning_rate": 6.725057685325273e-07, - "loss": 0.5062, - "step": 72338 - }, - { - "epoch": 1.85, - "learning_rate": 6.724796241415978e-07, - "loss": 0.6431, - "step": 72339 - }, - { - "epoch": 1.85, - "learning_rate": 6.724534800014358e-07, - "loss": 0.5957, - "step": 72340 - }, - { - "epoch": 1.85, - "learning_rate": 6.724273361120609e-07, - "loss": 0.5601, - "step": 72341 - }, - { - "epoch": 1.85, - "learning_rate": 6.724011924734936e-07, - "loss": 0.5449, - "step": 72342 - }, - { - "epoch": 1.85, - "learning_rate": 6.723750490857533e-07, - "loss": 0.5278, - "step": 72343 - }, - { - "epoch": 1.85, - "learning_rate": 6.723489059488607e-07, - "loss": 0.4077, - "step": 72344 - }, - { - "epoch": 1.85, - "learning_rate": 6.723227630628356e-07, - "loss": 0.3584, - "step": 72345 - }, - { - "epoch": 1.85, - "learning_rate": 6.722966204276977e-07, - "loss": 0.6973, - "step": 72346 - }, - { - "epoch": 1.85, - "learning_rate": 6.722704780434669e-07, - "loss": 0.5469, - "step": 72347 - }, - { - "epoch": 1.85, - "learning_rate": 6.722443359101639e-07, - "loss": 0.6729, - "step": 72348 - }, - { - "epoch": 1.85, - "learning_rate": 6.722181940278081e-07, - "loss": 0.7686, - "step": 72349 - }, - { - "epoch": 1.85, - "learning_rate": 6.7219205239642e-07, - "loss": 0.75, - "step": 72350 - }, - { - "epoch": 1.85, - "learning_rate": 6.721659110160191e-07, - "loss": 0.7803, - "step": 72351 - }, - { - "epoch": 1.85, - "learning_rate": 6.721397698866257e-07, - "loss": 0.6201, - "step": 72352 - }, - { - "epoch": 1.85, - "learning_rate": 6.721136290082599e-07, - "loss": 0.6152, - "step": 72353 - }, - { - "epoch": 1.85, - "learning_rate": 6.720874883809418e-07, - "loss": 0.4314, - "step": 72354 - }, - { - "epoch": 1.85, - "learning_rate": 6.720613480046914e-07, - "loss": 0.6147, - "step": 72355 - }, - { - "epoch": 1.85, - "learning_rate": 6.720352078795281e-07, - "loss": 0.6904, - "step": 72356 - }, - { - "epoch": 1.85, - "learning_rate": 6.720090680054725e-07, - "loss": 0.793, - "step": 72357 - }, - { - "epoch": 1.85, - "learning_rate": 6.719829283825444e-07, - "loss": 0.7021, - "step": 72358 - }, - { - "epoch": 1.85, - "learning_rate": 6.71956789010764e-07, - "loss": 0.6357, - "step": 72359 - }, - { - "epoch": 1.85, - "learning_rate": 6.71930649890151e-07, - "loss": 0.4707, - "step": 72360 - }, - { - "epoch": 1.85, - "learning_rate": 6.719045110207259e-07, - "loss": 0.7822, - "step": 72361 - }, - { - "epoch": 1.85, - "learning_rate": 6.718783724025081e-07, - "loss": 0.5244, - "step": 72362 - }, - { - "epoch": 1.85, - "learning_rate": 6.718522340355182e-07, - "loss": 0.5996, - "step": 72363 - }, - { - "epoch": 1.85, - "learning_rate": 6.718260959197759e-07, - "loss": 0.71, - "step": 72364 - }, - { - "epoch": 1.85, - "learning_rate": 6.717999580553017e-07, - "loss": 0.5701, - "step": 72365 - }, - { - "epoch": 1.85, - "learning_rate": 6.717738204421146e-07, - "loss": 0.5991, - "step": 72366 - }, - { - "epoch": 1.85, - "learning_rate": 6.717476830802354e-07, - "loss": 0.5459, - "step": 72367 - }, - { - "epoch": 1.85, - "learning_rate": 6.717215459696838e-07, - "loss": 0.6543, - "step": 72368 - }, - { - "epoch": 1.85, - "learning_rate": 6.7169540911048e-07, - "loss": 0.5728, - "step": 72369 - }, - { - "epoch": 1.85, - "learning_rate": 6.716692725026438e-07, - "loss": 0.4938, - "step": 72370 - }, - { - "epoch": 1.85, - "learning_rate": 6.716431361461955e-07, - "loss": 0.5396, - "step": 72371 - }, - { - "epoch": 1.85, - "learning_rate": 6.716170000411548e-07, - "loss": 0.4902, - "step": 72372 - }, - { - "epoch": 1.85, - "learning_rate": 6.715908641875419e-07, - "loss": 0.6523, - "step": 72373 - }, - { - "epoch": 1.85, - "learning_rate": 6.715647285853768e-07, - "loss": 0.6875, - "step": 72374 - }, - { - "epoch": 1.86, - "learning_rate": 6.715385932346798e-07, - "loss": 0.5908, - "step": 72375 - }, - { - "epoch": 1.86, - "learning_rate": 6.715124581354704e-07, - "loss": 0.6602, - "step": 72376 - }, - { - "epoch": 1.86, - "learning_rate": 6.714863232877685e-07, - "loss": 0.6196, - "step": 72377 - }, - { - "epoch": 1.86, - "learning_rate": 6.714601886915947e-07, - "loss": 0.5996, - "step": 72378 - }, - { - "epoch": 1.86, - "learning_rate": 6.714340543469685e-07, - "loss": 0.4058, - "step": 72379 - }, - { - "epoch": 1.86, - "learning_rate": 6.714079202539105e-07, - "loss": 0.5723, - "step": 72380 - }, - { - "epoch": 1.86, - "learning_rate": 6.713817864124401e-07, - "loss": 0.5405, - "step": 72381 - }, - { - "epoch": 1.86, - "learning_rate": 6.713556528225775e-07, - "loss": 0.6543, - "step": 72382 - }, - { - "epoch": 1.86, - "learning_rate": 6.713295194843428e-07, - "loss": 0.5952, - "step": 72383 - }, - { - "epoch": 1.86, - "learning_rate": 6.713033863977561e-07, - "loss": 0.6909, - "step": 72384 - }, - { - "epoch": 1.86, - "learning_rate": 6.712772535628375e-07, - "loss": 0.6787, - "step": 72385 - }, - { - "epoch": 1.86, - "learning_rate": 6.712511209796066e-07, - "loss": 0.6855, - "step": 72386 - }, - { - "epoch": 1.86, - "learning_rate": 6.712249886480834e-07, - "loss": 0.6436, - "step": 72387 - }, - { - "epoch": 1.86, - "learning_rate": 6.711988565682883e-07, - "loss": 0.6362, - "step": 72388 - }, - { - "epoch": 1.86, - "learning_rate": 6.711727247402409e-07, - "loss": 0.603, - "step": 72389 - }, - { - "epoch": 1.86, - "learning_rate": 6.711465931639616e-07, - "loss": 0.6704, - "step": 72390 - }, - { - "epoch": 1.86, - "learning_rate": 6.711204618394701e-07, - "loss": 0.5063, - "step": 72391 - }, - { - "epoch": 1.86, - "learning_rate": 6.710943307667866e-07, - "loss": 0.6797, - "step": 72392 - }, - { - "epoch": 1.86, - "learning_rate": 6.710681999459311e-07, - "loss": 0.5791, - "step": 72393 - }, - { - "epoch": 1.86, - "learning_rate": 6.710420693769237e-07, - "loss": 0.6597, - "step": 72394 - }, - { - "epoch": 1.86, - "learning_rate": 6.710159390597842e-07, - "loss": 0.5111, - "step": 72395 - }, - { - "epoch": 1.86, - "learning_rate": 6.709898089945325e-07, - "loss": 0.6338, - "step": 72396 - }, - { - "epoch": 1.86, - "learning_rate": 6.709636791811889e-07, - "loss": 0.6328, - "step": 72397 - }, - { - "epoch": 1.86, - "learning_rate": 6.709375496197731e-07, - "loss": 0.6675, - "step": 72398 - }, - { - "epoch": 1.86, - "learning_rate": 6.709114203103055e-07, - "loss": 0.7456, - "step": 72399 - }, - { - "epoch": 1.86, - "learning_rate": 6.708852912528057e-07, - "loss": 0.6592, - "step": 72400 - }, - { - "epoch": 1.86, - "learning_rate": 6.708591624472942e-07, - "loss": 0.5566, - "step": 72401 - }, - { - "epoch": 1.86, - "learning_rate": 6.708330338937904e-07, - "loss": 0.7295, - "step": 72402 - }, - { - "epoch": 1.86, - "learning_rate": 6.708069055923146e-07, - "loss": 0.6279, - "step": 72403 - }, - { - "epoch": 1.86, - "learning_rate": 6.707807775428873e-07, - "loss": 0.6777, - "step": 72404 - }, - { - "epoch": 1.86, - "learning_rate": 6.707546497455276e-07, - "loss": 0.6353, - "step": 72405 - }, - { - "epoch": 1.86, - "learning_rate": 6.707285222002559e-07, - "loss": 0.564, - "step": 72406 - }, - { - "epoch": 1.86, - "learning_rate": 6.707023949070924e-07, - "loss": 0.5684, - "step": 72407 - }, - { - "epoch": 1.86, - "learning_rate": 6.706762678660567e-07, - "loss": 0.7627, - "step": 72408 - }, - { - "epoch": 1.86, - "learning_rate": 6.706501410771693e-07, - "loss": 0.583, - "step": 72409 - }, - { - "epoch": 1.86, - "learning_rate": 6.706240145404498e-07, - "loss": 0.7568, - "step": 72410 - }, - { - "epoch": 1.86, - "learning_rate": 6.705978882559184e-07, - "loss": 0.5776, - "step": 72411 - }, - { - "epoch": 1.86, - "learning_rate": 6.705717622235949e-07, - "loss": 0.6479, - "step": 72412 - }, - { - "epoch": 1.86, - "learning_rate": 6.705456364434996e-07, - "loss": 0.5845, - "step": 72413 - }, - { - "epoch": 1.86, - "learning_rate": 6.705195109156527e-07, - "loss": 0.4561, - "step": 72414 - }, - { - "epoch": 1.86, - "learning_rate": 6.704933856400733e-07, - "loss": 0.5708, - "step": 72415 - }, - { - "epoch": 1.86, - "learning_rate": 6.704672606167823e-07, - "loss": 0.6973, - "step": 72416 - }, - { - "epoch": 1.86, - "learning_rate": 6.704411358457991e-07, - "loss": 0.4966, - "step": 72417 - }, - { - "epoch": 1.86, - "learning_rate": 6.70415011327144e-07, - "loss": 0.6426, - "step": 72418 - }, - { - "epoch": 1.86, - "learning_rate": 6.703888870608373e-07, - "loss": 0.6187, - "step": 72419 - }, - { - "epoch": 1.86, - "learning_rate": 6.703627630468983e-07, - "loss": 0.7188, - "step": 72420 - }, - { - "epoch": 1.86, - "learning_rate": 6.703366392853476e-07, - "loss": 0.5962, - "step": 72421 - }, - { - "epoch": 1.86, - "learning_rate": 6.703105157762048e-07, - "loss": 0.7676, - "step": 72422 - }, - { - "epoch": 1.86, - "learning_rate": 6.702843925194902e-07, - "loss": 0.7852, - "step": 72423 - }, - { - "epoch": 1.86, - "learning_rate": 6.702582695152239e-07, - "loss": 0.4451, - "step": 72424 - }, - { - "epoch": 1.86, - "learning_rate": 6.702321467634253e-07, - "loss": 0.7073, - "step": 72425 - }, - { - "epoch": 1.86, - "learning_rate": 6.70206024264115e-07, - "loss": 0.4739, - "step": 72426 - }, - { - "epoch": 1.86, - "learning_rate": 6.701799020173127e-07, - "loss": 0.6758, - "step": 72427 - }, - { - "epoch": 1.86, - "learning_rate": 6.701537800230385e-07, - "loss": 0.6089, - "step": 72428 - }, - { - "epoch": 1.86, - "learning_rate": 6.701276582813122e-07, - "loss": 0.7363, - "step": 72429 - }, - { - "epoch": 1.86, - "learning_rate": 6.701015367921543e-07, - "loss": 0.5386, - "step": 72430 - }, - { - "epoch": 1.86, - "learning_rate": 6.700754155555841e-07, - "loss": 0.6787, - "step": 72431 - }, - { - "epoch": 1.86, - "learning_rate": 6.700492945716223e-07, - "loss": 0.3884, - "step": 72432 - }, - { - "epoch": 1.86, - "learning_rate": 6.700231738402884e-07, - "loss": 0.6348, - "step": 72433 - }, - { - "epoch": 1.86, - "learning_rate": 6.699970533616031e-07, - "loss": 0.7393, - "step": 72434 - }, - { - "epoch": 1.86, - "learning_rate": 6.699709331355854e-07, - "loss": 0.71, - "step": 72435 - }, - { - "epoch": 1.86, - "learning_rate": 6.699448131622558e-07, - "loss": 0.6465, - "step": 72436 - }, - { - "epoch": 1.86, - "learning_rate": 6.699186934416343e-07, - "loss": 0.7158, - "step": 72437 - }, - { - "epoch": 1.86, - "learning_rate": 6.698925739737411e-07, - "loss": 0.5649, - "step": 72438 - }, - { - "epoch": 1.86, - "learning_rate": 6.698664547585956e-07, - "loss": 0.5659, - "step": 72439 - }, - { - "epoch": 1.86, - "learning_rate": 6.698403357962183e-07, - "loss": 0.5698, - "step": 72440 - }, - { - "epoch": 1.86, - "learning_rate": 6.698142170866291e-07, - "loss": 0.7227, - "step": 72441 - }, - { - "epoch": 1.86, - "learning_rate": 6.69788098629848e-07, - "loss": 0.7314, - "step": 72442 - }, - { - "epoch": 1.86, - "learning_rate": 6.697619804258949e-07, - "loss": 0.7188, - "step": 72443 - }, - { - "epoch": 1.86, - "learning_rate": 6.697358624747903e-07, - "loss": 0.5253, - "step": 72444 - }, - { - "epoch": 1.86, - "learning_rate": 6.697097447765534e-07, - "loss": 0.7075, - "step": 72445 - }, - { - "epoch": 1.86, - "learning_rate": 6.696836273312045e-07, - "loss": 0.6099, - "step": 72446 - }, - { - "epoch": 1.86, - "learning_rate": 6.696575101387638e-07, - "loss": 0.5579, - "step": 72447 - }, - { - "epoch": 1.86, - "learning_rate": 6.69631393199251e-07, - "loss": 0.7739, - "step": 72448 - }, - { - "epoch": 1.86, - "learning_rate": 6.696052765126864e-07, - "loss": 0.5381, - "step": 72449 - }, - { - "epoch": 1.86, - "learning_rate": 6.695791600790897e-07, - "loss": 0.6416, - "step": 72450 - }, - { - "epoch": 1.86, - "learning_rate": 6.695530438984811e-07, - "loss": 0.748, - "step": 72451 - }, - { - "epoch": 1.86, - "learning_rate": 6.695269279708803e-07, - "loss": 0.6309, - "step": 72452 - }, - { - "epoch": 1.86, - "learning_rate": 6.695008122963081e-07, - "loss": 0.4941, - "step": 72453 - }, - { - "epoch": 1.86, - "learning_rate": 6.694746968747839e-07, - "loss": 0.6055, - "step": 72454 - }, - { - "epoch": 1.86, - "learning_rate": 6.694485817063276e-07, - "loss": 0.6514, - "step": 72455 - }, - { - "epoch": 1.86, - "learning_rate": 6.694224667909589e-07, - "loss": 0.7666, - "step": 72456 - }, - { - "epoch": 1.86, - "learning_rate": 6.693963521286986e-07, - "loss": 0.422, - "step": 72457 - }, - { - "epoch": 1.86, - "learning_rate": 6.693702377195661e-07, - "loss": 0.4949, - "step": 72458 - }, - { - "epoch": 1.86, - "learning_rate": 6.693441235635817e-07, - "loss": 0.6865, - "step": 72459 - }, - { - "epoch": 1.86, - "learning_rate": 6.693180096607653e-07, - "loss": 0.6396, - "step": 72460 - }, - { - "epoch": 1.86, - "learning_rate": 6.692918960111369e-07, - "loss": 0.6328, - "step": 72461 - }, - { - "epoch": 1.86, - "learning_rate": 6.692657826147164e-07, - "loss": 0.5317, - "step": 72462 - }, - { - "epoch": 1.86, - "learning_rate": 6.692396694715241e-07, - "loss": 0.5537, - "step": 72463 - }, - { - "epoch": 1.86, - "learning_rate": 6.692135565815799e-07, - "loss": 0.6787, - "step": 72464 - }, - { - "epoch": 1.86, - "learning_rate": 6.691874439449033e-07, - "loss": 0.4907, - "step": 72465 - }, - { - "epoch": 1.86, - "learning_rate": 6.691613315615149e-07, - "loss": 0.6299, - "step": 72466 - }, - { - "epoch": 1.86, - "learning_rate": 6.691352194314342e-07, - "loss": 0.8018, - "step": 72467 - }, - { - "epoch": 1.86, - "learning_rate": 6.691091075546817e-07, - "loss": 0.8047, - "step": 72468 - }, - { - "epoch": 1.86, - "learning_rate": 6.69082995931277e-07, - "loss": 0.4463, - "step": 72469 - }, - { - "epoch": 1.86, - "learning_rate": 6.690568845612403e-07, - "loss": 0.4878, - "step": 72470 - }, - { - "epoch": 1.86, - "learning_rate": 6.690307734445913e-07, - "loss": 0.6914, - "step": 72471 - }, - { - "epoch": 1.86, - "learning_rate": 6.690046625813506e-07, - "loss": 0.4956, - "step": 72472 - }, - { - "epoch": 1.86, - "learning_rate": 6.689785519715375e-07, - "loss": 0.6323, - "step": 72473 - }, - { - "epoch": 1.86, - "learning_rate": 6.689524416151729e-07, - "loss": 0.6562, - "step": 72474 - }, - { - "epoch": 1.86, - "learning_rate": 6.689263315122755e-07, - "loss": 0.5186, - "step": 72475 - }, - { - "epoch": 1.86, - "learning_rate": 6.689002216628663e-07, - "loss": 0.5969, - "step": 72476 - }, - { - "epoch": 1.86, - "learning_rate": 6.688741120669648e-07, - "loss": 0.7329, - "step": 72477 - }, - { - "epoch": 1.86, - "learning_rate": 6.688480027245913e-07, - "loss": 0.7031, - "step": 72478 - }, - { - "epoch": 1.86, - "learning_rate": 6.688218936357654e-07, - "loss": 0.6084, - "step": 72479 - }, - { - "epoch": 1.86, - "learning_rate": 6.687957848005077e-07, - "loss": 0.7109, - "step": 72480 - }, - { - "epoch": 1.86, - "learning_rate": 6.687696762188375e-07, - "loss": 0.7363, - "step": 72481 - }, - { - "epoch": 1.86, - "learning_rate": 6.687435678907754e-07, - "loss": 0.5862, - "step": 72482 - }, - { - "epoch": 1.86, - "learning_rate": 6.68717459816341e-07, - "loss": 0.6797, - "step": 72483 - }, - { - "epoch": 1.86, - "learning_rate": 6.686913519955547e-07, - "loss": 0.7061, - "step": 72484 - }, - { - "epoch": 1.86, - "learning_rate": 6.68665244428436e-07, - "loss": 0.666, - "step": 72485 - }, - { - "epoch": 1.86, - "learning_rate": 6.686391371150049e-07, - "loss": 0.5879, - "step": 72486 - }, - { - "epoch": 1.86, - "learning_rate": 6.686130300552818e-07, - "loss": 0.5918, - "step": 72487 - }, - { - "epoch": 1.86, - "learning_rate": 6.685869232492862e-07, - "loss": 0.5889, - "step": 72488 - }, - { - "epoch": 1.86, - "learning_rate": 6.685608166970387e-07, - "loss": 0.6562, - "step": 72489 - }, - { - "epoch": 1.86, - "learning_rate": 6.685347103985586e-07, - "loss": 0.6816, - "step": 72490 - }, - { - "epoch": 1.86, - "learning_rate": 6.685086043538665e-07, - "loss": 0.6855, - "step": 72491 - }, - { - "epoch": 1.86, - "learning_rate": 6.684824985629821e-07, - "loss": 0.6787, - "step": 72492 - }, - { - "epoch": 1.86, - "learning_rate": 6.684563930259253e-07, - "loss": 0.5024, - "step": 72493 - }, - { - "epoch": 1.86, - "learning_rate": 6.684302877427164e-07, - "loss": 0.5303, - "step": 72494 - }, - { - "epoch": 1.86, - "learning_rate": 6.68404182713375e-07, - "loss": 0.5913, - "step": 72495 - }, - { - "epoch": 1.86, - "learning_rate": 6.683780779379212e-07, - "loss": 0.478, - "step": 72496 - }, - { - "epoch": 1.86, - "learning_rate": 6.683519734163751e-07, - "loss": 0.8115, - "step": 72497 - }, - { - "epoch": 1.86, - "learning_rate": 6.683258691487567e-07, - "loss": 0.8516, - "step": 72498 - }, - { - "epoch": 1.86, - "learning_rate": 6.68299765135086e-07, - "loss": 0.4941, - "step": 72499 - }, - { - "epoch": 1.86, - "learning_rate": 6.682736613753826e-07, - "loss": 0.7891, - "step": 72500 - }, - { - "epoch": 1.86, - "learning_rate": 6.682475578696671e-07, - "loss": 0.6958, - "step": 72501 - }, - { - "epoch": 1.86, - "learning_rate": 6.68221454617959e-07, - "loss": 0.5457, - "step": 72502 - }, - { - "epoch": 1.86, - "learning_rate": 6.681953516202787e-07, - "loss": 0.5081, - "step": 72503 - }, - { - "epoch": 1.86, - "learning_rate": 6.681692488766461e-07, - "loss": 0.6455, - "step": 72504 - }, - { - "epoch": 1.86, - "learning_rate": 6.681431463870809e-07, - "loss": 0.6489, - "step": 72505 - }, - { - "epoch": 1.86, - "learning_rate": 6.681170441516031e-07, - "loss": 0.5795, - "step": 72506 - }, - { - "epoch": 1.86, - "learning_rate": 6.680909421702327e-07, - "loss": 0.708, - "step": 72507 - }, - { - "epoch": 1.86, - "learning_rate": 6.6806484044299e-07, - "loss": 0.5077, - "step": 72508 - }, - { - "epoch": 1.86, - "learning_rate": 6.680387389698949e-07, - "loss": 0.3953, - "step": 72509 - }, - { - "epoch": 1.86, - "learning_rate": 6.680126377509669e-07, - "loss": 0.6665, - "step": 72510 - }, - { - "epoch": 1.86, - "learning_rate": 6.679865367862268e-07, - "loss": 0.7363, - "step": 72511 - }, - { - "epoch": 1.86, - "learning_rate": 6.679604360756939e-07, - "loss": 0.6523, - "step": 72512 - }, - { - "epoch": 1.86, - "learning_rate": 6.679343356193885e-07, - "loss": 0.7402, - "step": 72513 - }, - { - "epoch": 1.86, - "learning_rate": 6.679082354173307e-07, - "loss": 0.6006, - "step": 72514 - }, - { - "epoch": 1.86, - "learning_rate": 6.678821354695399e-07, - "loss": 0.7002, - "step": 72515 - }, - { - "epoch": 1.86, - "learning_rate": 6.678560357760367e-07, - "loss": 0.708, - "step": 72516 - }, - { - "epoch": 1.86, - "learning_rate": 6.678299363368407e-07, - "loss": 0.7109, - "step": 72517 - }, - { - "epoch": 1.86, - "learning_rate": 6.678038371519721e-07, - "loss": 0.5308, - "step": 72518 - }, - { - "epoch": 1.86, - "learning_rate": 6.677777382214508e-07, - "loss": 0.6621, - "step": 72519 - }, - { - "epoch": 1.86, - "learning_rate": 6.67751639545297e-07, - "loss": 0.6455, - "step": 72520 - }, - { - "epoch": 1.86, - "learning_rate": 6.677255411235303e-07, - "loss": 0.6104, - "step": 72521 - }, - { - "epoch": 1.86, - "learning_rate": 6.67699442956171e-07, - "loss": 0.7207, - "step": 72522 - }, - { - "epoch": 1.86, - "learning_rate": 6.676733450432388e-07, - "loss": 0.5693, - "step": 72523 - }, - { - "epoch": 1.86, - "learning_rate": 6.676472473847542e-07, - "loss": 0.5435, - "step": 72524 - }, - { - "epoch": 1.86, - "learning_rate": 6.676211499807367e-07, - "loss": 0.627, - "step": 72525 - }, - { - "epoch": 1.86, - "learning_rate": 6.67595052831206e-07, - "loss": 0.6165, - "step": 72526 - }, - { - "epoch": 1.86, - "learning_rate": 6.675689559361829e-07, - "loss": 0.7026, - "step": 72527 - }, - { - "epoch": 1.86, - "learning_rate": 6.675428592956869e-07, - "loss": 0.4971, - "step": 72528 - }, - { - "epoch": 1.86, - "learning_rate": 6.675167629097378e-07, - "loss": 0.6174, - "step": 72529 - }, - { - "epoch": 1.86, - "learning_rate": 6.67490666778356e-07, - "loss": 0.6904, - "step": 72530 - }, - { - "epoch": 1.86, - "learning_rate": 6.674645709015613e-07, - "loss": 0.6914, - "step": 72531 - }, - { - "epoch": 1.86, - "learning_rate": 6.674384752793737e-07, - "loss": 0.5244, - "step": 72532 - }, - { - "epoch": 1.86, - "learning_rate": 6.674123799118129e-07, - "loss": 0.5688, - "step": 72533 - }, - { - "epoch": 1.86, - "learning_rate": 6.673862847988998e-07, - "loss": 0.499, - "step": 72534 - }, - { - "epoch": 1.86, - "learning_rate": 6.673601899406533e-07, - "loss": 0.6362, - "step": 72535 - }, - { - "epoch": 1.86, - "learning_rate": 6.673340953370939e-07, - "loss": 0.5764, - "step": 72536 - }, - { - "epoch": 1.86, - "learning_rate": 6.673080009882414e-07, - "loss": 0.5898, - "step": 72537 - }, - { - "epoch": 1.86, - "learning_rate": 6.672819068941158e-07, - "loss": 0.7119, - "step": 72538 - }, - { - "epoch": 1.86, - "learning_rate": 6.672558130547372e-07, - "loss": 0.5725, - "step": 72539 - }, - { - "epoch": 1.86, - "learning_rate": 6.672297194701255e-07, - "loss": 0.5645, - "step": 72540 - }, - { - "epoch": 1.86, - "learning_rate": 6.672036261403009e-07, - "loss": 0.5492, - "step": 72541 - }, - { - "epoch": 1.86, - "learning_rate": 6.671775330652829e-07, - "loss": 0.5366, - "step": 72542 - }, - { - "epoch": 1.86, - "learning_rate": 6.671514402450919e-07, - "loss": 0.793, - "step": 72543 - }, - { - "epoch": 1.86, - "learning_rate": 6.67125347679748e-07, - "loss": 0.4509, - "step": 72544 - }, - { - "epoch": 1.86, - "learning_rate": 6.670992553692708e-07, - "loss": 0.6104, - "step": 72545 - }, - { - "epoch": 1.86, - "learning_rate": 6.670731633136801e-07, - "loss": 0.5771, - "step": 72546 - }, - { - "epoch": 1.86, - "learning_rate": 6.670470715129963e-07, - "loss": 0.626, - "step": 72547 - }, - { - "epoch": 1.86, - "learning_rate": 6.670209799672393e-07, - "loss": 0.6348, - "step": 72548 - }, - { - "epoch": 1.86, - "learning_rate": 6.66994888676429e-07, - "loss": 0.6279, - "step": 72549 - }, - { - "epoch": 1.86, - "learning_rate": 6.669687976405853e-07, - "loss": 0.4951, - "step": 72550 - }, - { - "epoch": 1.86, - "learning_rate": 6.669427068597284e-07, - "loss": 0.8623, - "step": 72551 - }, - { - "epoch": 1.86, - "learning_rate": 6.66916616333878e-07, - "loss": 0.6885, - "step": 72552 - }, - { - "epoch": 1.86, - "learning_rate": 6.668905260630544e-07, - "loss": 0.5444, - "step": 72553 - }, - { - "epoch": 1.86, - "learning_rate": 6.668644360472778e-07, - "loss": 0.6519, - "step": 72554 - }, - { - "epoch": 1.86, - "learning_rate": 6.668383462865671e-07, - "loss": 0.6846, - "step": 72555 - }, - { - "epoch": 1.86, - "learning_rate": 6.668122567809433e-07, - "loss": 0.7666, - "step": 72556 - }, - { - "epoch": 1.86, - "learning_rate": 6.667861675304258e-07, - "loss": 0.7012, - "step": 72557 - }, - { - "epoch": 1.86, - "learning_rate": 6.667600785350351e-07, - "loss": 0.4573, - "step": 72558 - }, - { - "epoch": 1.86, - "learning_rate": 6.667339897947906e-07, - "loss": 0.5539, - "step": 72559 - }, - { - "epoch": 1.86, - "learning_rate": 6.667079013097127e-07, - "loss": 0.5806, - "step": 72560 - }, - { - "epoch": 1.86, - "learning_rate": 6.666818130798211e-07, - "loss": 0.5981, - "step": 72561 - }, - { - "epoch": 1.86, - "learning_rate": 6.666557251051361e-07, - "loss": 0.7324, - "step": 72562 - }, - { - "epoch": 1.86, - "learning_rate": 6.666296373856772e-07, - "loss": 0.4966, - "step": 72563 - }, - { - "epoch": 1.86, - "learning_rate": 6.666035499214655e-07, - "loss": 0.5232, - "step": 72564 - }, - { - "epoch": 1.86, - "learning_rate": 6.665774627125193e-07, - "loss": 0.6934, - "step": 72565 - }, - { - "epoch": 1.86, - "learning_rate": 6.665513757588597e-07, - "loss": 0.623, - "step": 72566 - }, - { - "epoch": 1.86, - "learning_rate": 6.665252890605062e-07, - "loss": 0.5616, - "step": 72567 - }, - { - "epoch": 1.86, - "learning_rate": 6.664992026174791e-07, - "loss": 0.5869, - "step": 72568 - }, - { - "epoch": 1.86, - "learning_rate": 6.664731164297981e-07, - "loss": 0.4741, - "step": 72569 - }, - { - "epoch": 1.86, - "learning_rate": 6.664470304974834e-07, - "loss": 0.4473, - "step": 72570 - }, - { - "epoch": 1.86, - "learning_rate": 6.664209448205546e-07, - "loss": 0.5197, - "step": 72571 - }, - { - "epoch": 1.86, - "learning_rate": 6.663948593990324e-07, - "loss": 0.623, - "step": 72572 - }, - { - "epoch": 1.86, - "learning_rate": 6.663687742329361e-07, - "loss": 0.606, - "step": 72573 - }, - { - "epoch": 1.86, - "learning_rate": 6.663426893222861e-07, - "loss": 0.6084, - "step": 72574 - }, - { - "epoch": 1.86, - "learning_rate": 6.66316604667102e-07, - "loss": 0.6406, - "step": 72575 - }, - { - "epoch": 1.86, - "learning_rate": 6.662905202674037e-07, - "loss": 0.5752, - "step": 72576 - }, - { - "epoch": 1.86, - "learning_rate": 6.662644361232117e-07, - "loss": 0.5947, - "step": 72577 - }, - { - "epoch": 1.86, - "learning_rate": 6.662383522345454e-07, - "loss": 0.7363, - "step": 72578 - }, - { - "epoch": 1.86, - "learning_rate": 6.662122686014254e-07, - "loss": 0.6104, - "step": 72579 - }, - { - "epoch": 1.86, - "learning_rate": 6.66186185223871e-07, - "loss": 0.6323, - "step": 72580 - }, - { - "epoch": 1.86, - "learning_rate": 6.661601021019027e-07, - "loss": 0.7075, - "step": 72581 - }, - { - "epoch": 1.86, - "learning_rate": 6.661340192355403e-07, - "loss": 0.5674, - "step": 72582 - }, - { - "epoch": 1.86, - "learning_rate": 6.661079366248034e-07, - "loss": 0.7529, - "step": 72583 - }, - { - "epoch": 1.86, - "learning_rate": 6.660818542697129e-07, - "loss": 0.6377, - "step": 72584 - }, - { - "epoch": 1.86, - "learning_rate": 6.660557721702878e-07, - "loss": 0.6372, - "step": 72585 - }, - { - "epoch": 1.86, - "learning_rate": 6.660296903265483e-07, - "loss": 0.623, - "step": 72586 - }, - { - "epoch": 1.86, - "learning_rate": 6.660036087385146e-07, - "loss": 0.7812, - "step": 72587 - }, - { - "epoch": 1.86, - "learning_rate": 6.659775274062065e-07, - "loss": 0.5723, - "step": 72588 - }, - { - "epoch": 1.86, - "learning_rate": 6.659514463296443e-07, - "loss": 0.5391, - "step": 72589 - }, - { - "epoch": 1.86, - "learning_rate": 6.659253655088475e-07, - "loss": 0.4863, - "step": 72590 - }, - { - "epoch": 1.86, - "learning_rate": 6.658992849438363e-07, - "loss": 0.668, - "step": 72591 - }, - { - "epoch": 1.86, - "learning_rate": 6.658732046346307e-07, - "loss": 0.8318, - "step": 72592 - }, - { - "epoch": 1.86, - "learning_rate": 6.658471245812507e-07, - "loss": 0.7617, - "step": 72593 - }, - { - "epoch": 1.86, - "learning_rate": 6.658210447837163e-07, - "loss": 0.6313, - "step": 72594 - }, - { - "epoch": 1.86, - "learning_rate": 6.657949652420472e-07, - "loss": 0.6611, - "step": 72595 - }, - { - "epoch": 1.86, - "learning_rate": 6.657688859562636e-07, - "loss": 0.5864, - "step": 72596 - }, - { - "epoch": 1.86, - "learning_rate": 6.657428069263851e-07, - "loss": 0.6074, - "step": 72597 - }, - { - "epoch": 1.86, - "learning_rate": 6.657167281524323e-07, - "loss": 0.6885, - "step": 72598 - }, - { - "epoch": 1.86, - "learning_rate": 6.656906496344246e-07, - "loss": 0.6772, - "step": 72599 - }, - { - "epoch": 1.86, - "learning_rate": 6.656645713723823e-07, - "loss": 0.7227, - "step": 72600 - }, - { - "epoch": 1.86, - "learning_rate": 6.656384933663255e-07, - "loss": 0.7222, - "step": 72601 - }, - { - "epoch": 1.86, - "learning_rate": 6.656124156162735e-07, - "loss": 0.667, - "step": 72602 - }, - { - "epoch": 1.86, - "learning_rate": 6.65586338122247e-07, - "loss": 0.6816, - "step": 72603 - }, - { - "epoch": 1.86, - "learning_rate": 6.655602608842658e-07, - "loss": 0.7705, - "step": 72604 - }, - { - "epoch": 1.86, - "learning_rate": 6.655341839023494e-07, - "loss": 0.6299, - "step": 72605 - }, - { - "epoch": 1.86, - "learning_rate": 6.655081071765183e-07, - "loss": 0.667, - "step": 72606 - }, - { - "epoch": 1.86, - "learning_rate": 6.65482030706792e-07, - "loss": 0.6523, - "step": 72607 - }, - { - "epoch": 1.86, - "learning_rate": 6.654559544931909e-07, - "loss": 0.6479, - "step": 72608 - }, - { - "epoch": 1.86, - "learning_rate": 6.654298785357347e-07, - "loss": 0.7168, - "step": 72609 - }, - { - "epoch": 1.86, - "learning_rate": 6.654038028344435e-07, - "loss": 0.6367, - "step": 72610 - }, - { - "epoch": 1.86, - "learning_rate": 6.653777273893373e-07, - "loss": 0.5669, - "step": 72611 - }, - { - "epoch": 1.86, - "learning_rate": 6.653516522004359e-07, - "loss": 0.5569, - "step": 72612 - }, - { - "epoch": 1.86, - "learning_rate": 6.653255772677593e-07, - "loss": 0.5625, - "step": 72613 - }, - { - "epoch": 1.86, - "learning_rate": 6.65299502591328e-07, - "loss": 0.6973, - "step": 72614 - }, - { - "epoch": 1.86, - "learning_rate": 6.652734281711612e-07, - "loss": 0.5093, - "step": 72615 - }, - { - "epoch": 1.86, - "learning_rate": 6.652473540072787e-07, - "loss": 0.7051, - "step": 72616 - }, - { - "epoch": 1.86, - "learning_rate": 6.652212800997015e-07, - "loss": 0.5913, - "step": 72617 - }, - { - "epoch": 1.86, - "learning_rate": 6.651952064484488e-07, - "loss": 0.5488, - "step": 72618 - }, - { - "epoch": 1.86, - "learning_rate": 6.651691330535405e-07, - "loss": 0.7241, - "step": 72619 - }, - { - "epoch": 1.86, - "learning_rate": 6.65143059914997e-07, - "loss": 0.4707, - "step": 72620 - }, - { - "epoch": 1.86, - "learning_rate": 6.651169870328379e-07, - "loss": 0.5001, - "step": 72621 - }, - { - "epoch": 1.86, - "learning_rate": 6.650909144070836e-07, - "loss": 0.5977, - "step": 72622 - }, - { - "epoch": 1.86, - "learning_rate": 6.650648420377534e-07, - "loss": 0.6553, - "step": 72623 - }, - { - "epoch": 1.86, - "learning_rate": 6.650387699248681e-07, - "loss": 0.6367, - "step": 72624 - }, - { - "epoch": 1.86, - "learning_rate": 6.650126980684471e-07, - "loss": 0.3621, - "step": 72625 - }, - { - "epoch": 1.86, - "learning_rate": 6.649866264685102e-07, - "loss": 0.6436, - "step": 72626 - }, - { - "epoch": 1.86, - "learning_rate": 6.649605551250779e-07, - "loss": 0.5352, - "step": 72627 - }, - { - "epoch": 1.86, - "learning_rate": 6.649344840381697e-07, - "loss": 0.4587, - "step": 72628 - }, - { - "epoch": 1.86, - "learning_rate": 6.64908413207806e-07, - "loss": 0.7383, - "step": 72629 - }, - { - "epoch": 1.86, - "learning_rate": 6.648823426340063e-07, - "loss": 0.6553, - "step": 72630 - }, - { - "epoch": 1.86, - "learning_rate": 6.648562723167907e-07, - "loss": 0.7207, - "step": 72631 - }, - { - "epoch": 1.86, - "learning_rate": 6.648302022561793e-07, - "loss": 0.6816, - "step": 72632 - }, - { - "epoch": 1.86, - "learning_rate": 6.648041324521923e-07, - "loss": 0.4636, - "step": 72633 - }, - { - "epoch": 1.86, - "learning_rate": 6.647780629048494e-07, - "loss": 0.6035, - "step": 72634 - }, - { - "epoch": 1.86, - "learning_rate": 6.647519936141704e-07, - "loss": 0.73, - "step": 72635 - }, - { - "epoch": 1.86, - "learning_rate": 6.647259245801751e-07, - "loss": 0.6123, - "step": 72636 - }, - { - "epoch": 1.86, - "learning_rate": 6.64699855802884e-07, - "loss": 0.7598, - "step": 72637 - }, - { - "epoch": 1.86, - "learning_rate": 6.646737872823166e-07, - "loss": 0.6348, - "step": 72638 - }, - { - "epoch": 1.86, - "learning_rate": 6.646477190184932e-07, - "loss": 0.5322, - "step": 72639 - }, - { - "epoch": 1.86, - "learning_rate": 6.646216510114335e-07, - "loss": 0.6738, - "step": 72640 - }, - { - "epoch": 1.86, - "learning_rate": 6.645955832611579e-07, - "loss": 0.5957, - "step": 72641 - }, - { - "epoch": 1.86, - "learning_rate": 6.645695157676856e-07, - "loss": 0.7646, - "step": 72642 - }, - { - "epoch": 1.86, - "learning_rate": 6.645434485310373e-07, - "loss": 0.6631, - "step": 72643 - }, - { - "epoch": 1.86, - "learning_rate": 6.645173815512328e-07, - "loss": 0.7188, - "step": 72644 - }, - { - "epoch": 1.86, - "learning_rate": 6.644913148282916e-07, - "loss": 0.5757, - "step": 72645 - }, - { - "epoch": 1.86, - "learning_rate": 6.644652483622342e-07, - "loss": 0.2648, - "step": 72646 - }, - { - "epoch": 1.86, - "learning_rate": 6.6443918215308e-07, - "loss": 0.49, - "step": 72647 - }, - { - "epoch": 1.86, - "learning_rate": 6.644131162008496e-07, - "loss": 0.6021, - "step": 72648 - }, - { - "epoch": 1.86, - "learning_rate": 6.643870505055624e-07, - "loss": 0.8311, - "step": 72649 - }, - { - "epoch": 1.86, - "learning_rate": 6.643609850672388e-07, - "loss": 0.6562, - "step": 72650 - }, - { - "epoch": 1.86, - "learning_rate": 6.643349198858983e-07, - "loss": 0.6479, - "step": 72651 - }, - { - "epoch": 1.86, - "learning_rate": 6.643088549615614e-07, - "loss": 0.6621, - "step": 72652 - }, - { - "epoch": 1.86, - "learning_rate": 6.642827902942476e-07, - "loss": 0.6587, - "step": 72653 - }, - { - "epoch": 1.86, - "learning_rate": 6.642567258839776e-07, - "loss": 0.6494, - "step": 72654 - }, - { - "epoch": 1.86, - "learning_rate": 6.642306617307702e-07, - "loss": 0.5764, - "step": 72655 - }, - { - "epoch": 1.86, - "learning_rate": 6.642045978346461e-07, - "loss": 0.7375, - "step": 72656 - }, - { - "epoch": 1.86, - "learning_rate": 6.64178534195625e-07, - "loss": 0.6953, - "step": 72657 - }, - { - "epoch": 1.86, - "learning_rate": 6.641524708137271e-07, - "loss": 0.5991, - "step": 72658 - }, - { - "epoch": 1.86, - "learning_rate": 6.641264076889718e-07, - "loss": 0.6328, - "step": 72659 - }, - { - "epoch": 1.86, - "learning_rate": 6.6410034482138e-07, - "loss": 0.6348, - "step": 72660 - }, - { - "epoch": 1.86, - "learning_rate": 6.640742822109707e-07, - "loss": 0.5576, - "step": 72661 - }, - { - "epoch": 1.86, - "learning_rate": 6.640482198577646e-07, - "loss": 0.2839, - "step": 72662 - }, - { - "epoch": 1.86, - "learning_rate": 6.64022157761781e-07, - "loss": 0.5571, - "step": 72663 - }, - { - "epoch": 1.86, - "learning_rate": 6.639960959230407e-07, - "loss": 0.6758, - "step": 72664 - }, - { - "epoch": 1.86, - "learning_rate": 6.639700343415629e-07, - "loss": 0.5918, - "step": 72665 - }, - { - "epoch": 1.86, - "learning_rate": 6.639439730173677e-07, - "loss": 0.7705, - "step": 72666 - }, - { - "epoch": 1.86, - "learning_rate": 6.639179119504752e-07, - "loss": 0.7188, - "step": 72667 - }, - { - "epoch": 1.86, - "learning_rate": 6.638918511409051e-07, - "loss": 0.6465, - "step": 72668 - }, - { - "epoch": 1.86, - "learning_rate": 6.638657905886778e-07, - "loss": 0.583, - "step": 72669 - }, - { - "epoch": 1.86, - "learning_rate": 6.638397302938128e-07, - "loss": 0.7061, - "step": 72670 - }, - { - "epoch": 1.86, - "learning_rate": 6.638136702563306e-07, - "loss": 0.7637, - "step": 72671 - }, - { - "epoch": 1.86, - "learning_rate": 6.637876104762507e-07, - "loss": 0.5796, - "step": 72672 - }, - { - "epoch": 1.86, - "learning_rate": 6.637615509535928e-07, - "loss": 0.6377, - "step": 72673 - }, - { - "epoch": 1.86, - "learning_rate": 6.637354916883778e-07, - "loss": 0.583, - "step": 72674 - }, - { - "epoch": 1.86, - "learning_rate": 6.63709432680625e-07, - "loss": 0.3926, - "step": 72675 - }, - { - "epoch": 1.86, - "learning_rate": 6.63683373930354e-07, - "loss": 0.5391, - "step": 72676 - }, - { - "epoch": 1.86, - "learning_rate": 6.636573154375854e-07, - "loss": 0.6299, - "step": 72677 - }, - { - "epoch": 1.86, - "learning_rate": 6.636312572023388e-07, - "loss": 0.4751, - "step": 72678 - }, - { - "epoch": 1.86, - "learning_rate": 6.636051992246345e-07, - "loss": 0.7344, - "step": 72679 - }, - { - "epoch": 1.86, - "learning_rate": 6.63579141504492e-07, - "loss": 0.5386, - "step": 72680 - }, - { - "epoch": 1.86, - "learning_rate": 6.635530840419317e-07, - "loss": 0.6992, - "step": 72681 - }, - { - "epoch": 1.86, - "learning_rate": 6.63527026836973e-07, - "loss": 0.5151, - "step": 72682 - }, - { - "epoch": 1.86, - "learning_rate": 6.635009698896366e-07, - "loss": 0.6387, - "step": 72683 - }, - { - "epoch": 1.86, - "learning_rate": 6.63474913199942e-07, - "loss": 0.5312, - "step": 72684 - }, - { - "epoch": 1.86, - "learning_rate": 6.634488567679088e-07, - "loss": 0.6289, - "step": 72685 - }, - { - "epoch": 1.86, - "learning_rate": 6.634228005935578e-07, - "loss": 0.5479, - "step": 72686 - }, - { - "epoch": 1.86, - "learning_rate": 6.633967446769081e-07, - "loss": 0.7637, - "step": 72687 - }, - { - "epoch": 1.86, - "learning_rate": 6.633706890179802e-07, - "loss": 0.5801, - "step": 72688 - }, - { - "epoch": 1.86, - "learning_rate": 6.633446336167938e-07, - "loss": 0.7793, - "step": 72689 - }, - { - "epoch": 1.86, - "learning_rate": 6.63318578473369e-07, - "loss": 0.502, - "step": 72690 - }, - { - "epoch": 1.86, - "learning_rate": 6.632925235877258e-07, - "loss": 0.5989, - "step": 72691 - }, - { - "epoch": 1.86, - "learning_rate": 6.632664689598839e-07, - "loss": 0.5151, - "step": 72692 - }, - { - "epoch": 1.86, - "learning_rate": 6.632404145898634e-07, - "loss": 0.5405, - "step": 72693 - }, - { - "epoch": 1.86, - "learning_rate": 6.632143604776845e-07, - "loss": 0.7969, - "step": 72694 - }, - { - "epoch": 1.86, - "learning_rate": 6.631883066233666e-07, - "loss": 0.5181, - "step": 72695 - }, - { - "epoch": 1.86, - "learning_rate": 6.6316225302693e-07, - "loss": 0.5952, - "step": 72696 - }, - { - "epoch": 1.86, - "learning_rate": 6.631361996883944e-07, - "loss": 0.668, - "step": 72697 - }, - { - "epoch": 1.86, - "learning_rate": 6.631101466077799e-07, - "loss": 0.5503, - "step": 72698 - }, - { - "epoch": 1.86, - "learning_rate": 6.630840937851065e-07, - "loss": 0.6738, - "step": 72699 - }, - { - "epoch": 1.86, - "learning_rate": 6.630580412203945e-07, - "loss": 0.6299, - "step": 72700 - }, - { - "epoch": 1.86, - "learning_rate": 6.630319889136629e-07, - "loss": 0.5896, - "step": 72701 - }, - { - "epoch": 1.86, - "learning_rate": 6.630059368649326e-07, - "loss": 0.6553, - "step": 72702 - }, - { - "epoch": 1.86, - "learning_rate": 6.629798850742234e-07, - "loss": 0.4983, - "step": 72703 - }, - { - "epoch": 1.86, - "learning_rate": 6.629538335415545e-07, - "loss": 0.6934, - "step": 72704 - }, - { - "epoch": 1.86, - "learning_rate": 6.629277822669466e-07, - "loss": 0.6016, - "step": 72705 - }, - { - "epoch": 1.86, - "learning_rate": 6.629017312504192e-07, - "loss": 0.6914, - "step": 72706 - }, - { - "epoch": 1.86, - "learning_rate": 6.628756804919926e-07, - "loss": 0.5796, - "step": 72707 - }, - { - "epoch": 1.86, - "learning_rate": 6.628496299916867e-07, - "loss": 0.6221, - "step": 72708 - }, - { - "epoch": 1.86, - "learning_rate": 6.628235797495209e-07, - "loss": 0.5127, - "step": 72709 - }, - { - "epoch": 1.86, - "learning_rate": 6.62797529765516e-07, - "loss": 0.7009, - "step": 72710 - }, - { - "epoch": 1.86, - "learning_rate": 6.627714800396913e-07, - "loss": 0.7715, - "step": 72711 - }, - { - "epoch": 1.86, - "learning_rate": 6.627454305720672e-07, - "loss": 0.5884, - "step": 72712 - }, - { - "epoch": 1.86, - "learning_rate": 6.627193813626634e-07, - "loss": 0.6738, - "step": 72713 - }, - { - "epoch": 1.86, - "learning_rate": 6.626933324114998e-07, - "loss": 0.3793, - "step": 72714 - }, - { - "epoch": 1.86, - "learning_rate": 6.626672837185964e-07, - "loss": 0.7051, - "step": 72715 - }, - { - "epoch": 1.86, - "learning_rate": 6.62641235283973e-07, - "loss": 0.53, - "step": 72716 - }, - { - "epoch": 1.86, - "learning_rate": 6.626151871076498e-07, - "loss": 0.6099, - "step": 72717 - }, - { - "epoch": 1.86, - "learning_rate": 6.625891391896466e-07, - "loss": 0.5244, - "step": 72718 - }, - { - "epoch": 1.86, - "learning_rate": 6.625630915299834e-07, - "loss": 0.5703, - "step": 72719 - }, - { - "epoch": 1.86, - "learning_rate": 6.625370441286799e-07, - "loss": 0.6113, - "step": 72720 - }, - { - "epoch": 1.86, - "learning_rate": 6.625109969857567e-07, - "loss": 0.7314, - "step": 72721 - }, - { - "epoch": 1.86, - "learning_rate": 6.62484950101233e-07, - "loss": 0.6914, - "step": 72722 - }, - { - "epoch": 1.86, - "learning_rate": 6.624589034751294e-07, - "loss": 0.6479, - "step": 72723 - }, - { - "epoch": 1.86, - "learning_rate": 6.624328571074654e-07, - "loss": 0.5288, - "step": 72724 - }, - { - "epoch": 1.86, - "learning_rate": 6.62406810998261e-07, - "loss": 0.7266, - "step": 72725 - }, - { - "epoch": 1.86, - "learning_rate": 6.62380765147536e-07, - "loss": 0.6777, - "step": 72726 - }, - { - "epoch": 1.86, - "learning_rate": 6.623547195553105e-07, - "loss": 0.7334, - "step": 72727 - }, - { - "epoch": 1.86, - "learning_rate": 6.623286742216045e-07, - "loss": 0.6436, - "step": 72728 - }, - { - "epoch": 1.86, - "learning_rate": 6.623026291464381e-07, - "loss": 0.6138, - "step": 72729 - }, - { - "epoch": 1.86, - "learning_rate": 6.622765843298308e-07, - "loss": 0.5007, - "step": 72730 - }, - { - "epoch": 1.86, - "learning_rate": 6.62250539771803e-07, - "loss": 0.5212, - "step": 72731 - }, - { - "epoch": 1.86, - "learning_rate": 6.622244954723743e-07, - "loss": 0.5923, - "step": 72732 - }, - { - "epoch": 1.86, - "learning_rate": 6.621984514315651e-07, - "loss": 0.6094, - "step": 72733 - }, - { - "epoch": 1.86, - "learning_rate": 6.621724076493947e-07, - "loss": 0.7383, - "step": 72734 - }, - { - "epoch": 1.86, - "learning_rate": 6.621463641258833e-07, - "loss": 0.52, - "step": 72735 - }, - { - "epoch": 1.86, - "learning_rate": 6.62120320861051e-07, - "loss": 0.7446, - "step": 72736 - }, - { - "epoch": 1.86, - "learning_rate": 6.620942778549176e-07, - "loss": 0.6765, - "step": 72737 - }, - { - "epoch": 1.86, - "learning_rate": 6.62068235107503e-07, - "loss": 0.6147, - "step": 72738 - }, - { - "epoch": 1.86, - "learning_rate": 6.620421926188274e-07, - "loss": 0.6689, - "step": 72739 - }, - { - "epoch": 1.86, - "learning_rate": 6.620161503889105e-07, - "loss": 0.6562, - "step": 72740 - }, - { - "epoch": 1.86, - "learning_rate": 6.619901084177721e-07, - "loss": 0.666, - "step": 72741 - }, - { - "epoch": 1.86, - "learning_rate": 6.619640667054326e-07, - "loss": 0.8018, - "step": 72742 - }, - { - "epoch": 1.86, - "learning_rate": 6.619380252519118e-07, - "loss": 0.5845, - "step": 72743 - }, - { - "epoch": 1.86, - "learning_rate": 6.619119840572294e-07, - "loss": 0.5898, - "step": 72744 - }, - { - "epoch": 1.86, - "learning_rate": 6.618859431214052e-07, - "loss": 0.4019, - "step": 72745 - }, - { - "epoch": 1.86, - "learning_rate": 6.618599024444596e-07, - "loss": 0.6738, - "step": 72746 - }, - { - "epoch": 1.86, - "learning_rate": 6.618338620264122e-07, - "loss": 0.5337, - "step": 72747 - }, - { - "epoch": 1.86, - "learning_rate": 6.61807821867283e-07, - "loss": 0.6138, - "step": 72748 - }, - { - "epoch": 1.86, - "learning_rate": 6.61781781967092e-07, - "loss": 0.6211, - "step": 72749 - }, - { - "epoch": 1.86, - "learning_rate": 6.617557423258593e-07, - "loss": 0.6919, - "step": 72750 - }, - { - "epoch": 1.86, - "learning_rate": 6.617297029436045e-07, - "loss": 0.6118, - "step": 72751 - }, - { - "epoch": 1.86, - "learning_rate": 6.617036638203479e-07, - "loss": 0.6494, - "step": 72752 - }, - { - "epoch": 1.86, - "learning_rate": 6.616776249561094e-07, - "loss": 0.6504, - "step": 72753 - }, - { - "epoch": 1.86, - "learning_rate": 6.616515863509085e-07, - "loss": 0.6572, - "step": 72754 - }, - { - "epoch": 1.86, - "learning_rate": 6.616255480047655e-07, - "loss": 0.7231, - "step": 72755 - }, - { - "epoch": 1.86, - "learning_rate": 6.615995099177001e-07, - "loss": 0.7354, - "step": 72756 - }, - { - "epoch": 1.86, - "learning_rate": 6.615734720897326e-07, - "loss": 0.5935, - "step": 72757 - }, - { - "epoch": 1.86, - "learning_rate": 6.615474345208824e-07, - "loss": 0.6182, - "step": 72758 - }, - { - "epoch": 1.86, - "learning_rate": 6.615213972111701e-07, - "loss": 0.6343, - "step": 72759 - }, - { - "epoch": 1.86, - "learning_rate": 6.614953601606153e-07, - "loss": 0.5747, - "step": 72760 - }, - { - "epoch": 1.86, - "learning_rate": 6.614693233692379e-07, - "loss": 0.6011, - "step": 72761 - }, - { - "epoch": 1.86, - "learning_rate": 6.614432868370577e-07, - "loss": 0.8232, - "step": 72762 - }, - { - "epoch": 1.86, - "learning_rate": 6.614172505640954e-07, - "loss": 0.5654, - "step": 72763 - }, - { - "epoch": 1.86, - "learning_rate": 6.613912145503697e-07, - "loss": 0.4834, - "step": 72764 - }, - { - "epoch": 1.87, - "learning_rate": 6.613651787959016e-07, - "loss": 0.5537, - "step": 72765 - }, - { - "epoch": 1.87, - "learning_rate": 6.613391433007103e-07, - "loss": 0.5396, - "step": 72766 - }, - { - "epoch": 1.87, - "learning_rate": 6.613131080648161e-07, - "loss": 0.6924, - "step": 72767 - }, - { - "epoch": 1.87, - "learning_rate": 6.612870730882387e-07, - "loss": 0.6265, - "step": 72768 - }, - { - "epoch": 1.87, - "learning_rate": 6.612610383709987e-07, - "loss": 0.5967, - "step": 72769 - }, - { - "epoch": 1.87, - "learning_rate": 6.61235003913115e-07, - "loss": 0.5635, - "step": 72770 - }, - { - "epoch": 1.87, - "learning_rate": 6.612089697146084e-07, - "loss": 0.6448, - "step": 72771 - }, - { - "epoch": 1.87, - "learning_rate": 6.611829357754983e-07, - "loss": 0.8379, - "step": 72772 - }, - { - "epoch": 1.87, - "learning_rate": 6.611569020958054e-07, - "loss": 0.5952, - "step": 72773 - }, - { - "epoch": 1.87, - "learning_rate": 6.611308686755488e-07, - "loss": 0.7109, - "step": 72774 - }, - { - "epoch": 1.87, - "learning_rate": 6.611048355147484e-07, - "loss": 0.7061, - "step": 72775 - }, - { - "epoch": 1.87, - "learning_rate": 6.610788026134247e-07, - "loss": 0.5256, - "step": 72776 - }, - { - "epoch": 1.87, - "learning_rate": 6.610527699715973e-07, - "loss": 0.4905, - "step": 72777 - }, - { - "epoch": 1.87, - "learning_rate": 6.610267375892862e-07, - "loss": 0.6729, - "step": 72778 - }, - { - "epoch": 1.87, - "learning_rate": 6.610007054665112e-07, - "loss": 0.5112, - "step": 72779 - }, - { - "epoch": 1.87, - "learning_rate": 6.609746736032927e-07, - "loss": 0.5962, - "step": 72780 - }, - { - "epoch": 1.87, - "learning_rate": 6.609486419996501e-07, - "loss": 0.5493, - "step": 72781 - }, - { - "epoch": 1.87, - "learning_rate": 6.609226106556037e-07, - "loss": 0.6641, - "step": 72782 - }, - { - "epoch": 1.87, - "learning_rate": 6.608965795711733e-07, - "loss": 0.5388, - "step": 72783 - }, - { - "epoch": 1.87, - "learning_rate": 6.608705487463788e-07, - "loss": 0.8301, - "step": 72784 - }, - { - "epoch": 1.87, - "learning_rate": 6.608445181812399e-07, - "loss": 0.7266, - "step": 72785 - }, - { - "epoch": 1.87, - "learning_rate": 6.608184878757767e-07, - "loss": 0.5632, - "step": 72786 - }, - { - "epoch": 1.87, - "learning_rate": 6.607924578300092e-07, - "loss": 0.7432, - "step": 72787 - }, - { - "epoch": 1.87, - "learning_rate": 6.607664280439576e-07, - "loss": 0.6426, - "step": 72788 - }, - { - "epoch": 1.87, - "learning_rate": 6.607403985176412e-07, - "loss": 0.6196, - "step": 72789 - }, - { - "epoch": 1.87, - "learning_rate": 6.607143692510806e-07, - "loss": 0.5183, - "step": 72790 - }, - { - "epoch": 1.87, - "learning_rate": 6.606883402442951e-07, - "loss": 0.7227, - "step": 72791 - }, - { - "epoch": 1.87, - "learning_rate": 6.606623114973052e-07, - "loss": 0.5376, - "step": 72792 - }, - { - "epoch": 1.87, - "learning_rate": 6.606362830101307e-07, - "loss": 0.6777, - "step": 72793 - }, - { - "epoch": 1.87, - "learning_rate": 6.606102547827911e-07, - "loss": 0.6411, - "step": 72794 - }, - { - "epoch": 1.87, - "learning_rate": 6.605842268153068e-07, - "loss": 0.5161, - "step": 72795 - }, - { - "epoch": 1.87, - "learning_rate": 6.605581991076972e-07, - "loss": 0.6943, - "step": 72796 - }, - { - "epoch": 1.87, - "learning_rate": 6.60532171659983e-07, - "loss": 0.5386, - "step": 72797 - }, - { - "epoch": 1.87, - "learning_rate": 6.605061444721835e-07, - "loss": 0.3782, - "step": 72798 - }, - { - "epoch": 1.87, - "learning_rate": 6.604801175443188e-07, - "loss": 0.5801, - "step": 72799 - }, - { - "epoch": 1.87, - "learning_rate": 6.604540908764089e-07, - "loss": 0.7295, - "step": 72800 - }, - { - "epoch": 1.87, - "learning_rate": 6.604280644684736e-07, - "loss": 0.6445, - "step": 72801 - }, - { - "epoch": 1.87, - "learning_rate": 6.604020383205331e-07, - "loss": 0.7437, - "step": 72802 - }, - { - "epoch": 1.87, - "learning_rate": 6.603760124326074e-07, - "loss": 0.6641, - "step": 72803 - }, - { - "epoch": 1.87, - "learning_rate": 6.603499868047157e-07, - "loss": 0.71, - "step": 72804 - }, - { - "epoch": 1.87, - "learning_rate": 6.603239614368787e-07, - "loss": 0.615, - "step": 72805 - }, - { - "epoch": 1.87, - "learning_rate": 6.602979363291157e-07, - "loss": 0.623, - "step": 72806 - }, - { - "epoch": 1.87, - "learning_rate": 6.602719114814472e-07, - "loss": 0.535, - "step": 72807 - }, - { - "epoch": 1.87, - "learning_rate": 6.602458868938927e-07, - "loss": 0.7168, - "step": 72808 - }, - { - "epoch": 1.87, - "learning_rate": 6.602198625664723e-07, - "loss": 0.6885, - "step": 72809 - }, - { - "epoch": 1.87, - "learning_rate": 6.601938384992061e-07, - "loss": 0.6353, - "step": 72810 - }, - { - "epoch": 1.87, - "learning_rate": 6.601678146921137e-07, - "loss": 0.4685, - "step": 72811 - }, - { - "epoch": 1.87, - "learning_rate": 6.601417911452151e-07, - "loss": 0.5566, - "step": 72812 - }, - { - "epoch": 1.87, - "learning_rate": 6.601157678585307e-07, - "loss": 0.7188, - "step": 72813 - }, - { - "epoch": 1.87, - "learning_rate": 6.6008974483208e-07, - "loss": 0.6572, - "step": 72814 - }, - { - "epoch": 1.87, - "learning_rate": 6.600637220658828e-07, - "loss": 0.7656, - "step": 72815 - }, - { - "epoch": 1.87, - "learning_rate": 6.600376995599591e-07, - "loss": 0.5088, - "step": 72816 - }, - { - "epoch": 1.87, - "learning_rate": 6.600116773143288e-07, - "loss": 0.7451, - "step": 72817 - }, - { - "epoch": 1.87, - "learning_rate": 6.599856553290119e-07, - "loss": 0.6089, - "step": 72818 - }, - { - "epoch": 1.87, - "learning_rate": 6.599596336040287e-07, - "loss": 0.4497, - "step": 72819 - }, - { - "epoch": 1.87, - "learning_rate": 6.599336121393983e-07, - "loss": 0.479, - "step": 72820 - }, - { - "epoch": 1.87, - "learning_rate": 6.599075909351415e-07, - "loss": 0.4338, - "step": 72821 - }, - { - "epoch": 1.87, - "learning_rate": 6.598815699912776e-07, - "loss": 0.7764, - "step": 72822 - }, - { - "epoch": 1.87, - "learning_rate": 6.598555493078271e-07, - "loss": 0.5742, - "step": 72823 - }, - { - "epoch": 1.87, - "learning_rate": 6.598295288848092e-07, - "loss": 0.7334, - "step": 72824 - }, - { - "epoch": 1.87, - "learning_rate": 6.598035087222442e-07, - "loss": 0.5493, - "step": 72825 - }, - { - "epoch": 1.87, - "learning_rate": 6.597774888201521e-07, - "loss": 0.6787, - "step": 72826 - }, - { - "epoch": 1.87, - "learning_rate": 6.597514691785527e-07, - "loss": 0.585, - "step": 72827 - }, - { - "epoch": 1.87, - "learning_rate": 6.597254497974661e-07, - "loss": 0.5352, - "step": 72828 - }, - { - "epoch": 1.87, - "learning_rate": 6.596994306769118e-07, - "loss": 0.6943, - "step": 72829 - }, - { - "epoch": 1.87, - "learning_rate": 6.596734118169102e-07, - "loss": 0.6255, - "step": 72830 - }, - { - "epoch": 1.87, - "learning_rate": 6.596473932174809e-07, - "loss": 0.6113, - "step": 72831 - }, - { - "epoch": 1.87, - "learning_rate": 6.596213748786441e-07, - "loss": 0.5369, - "step": 72832 - }, - { - "epoch": 1.87, - "learning_rate": 6.595953568004198e-07, - "loss": 0.6982, - "step": 72833 - }, - { - "epoch": 1.87, - "learning_rate": 6.595693389828274e-07, - "loss": 0.6055, - "step": 72834 - }, - { - "epoch": 1.87, - "learning_rate": 6.595433214258869e-07, - "loss": 0.5996, - "step": 72835 - }, - { - "epoch": 1.87, - "learning_rate": 6.595173041296187e-07, - "loss": 0.5496, - "step": 72836 - }, - { - "epoch": 1.87, - "learning_rate": 6.594912870940421e-07, - "loss": 0.623, - "step": 72837 - }, - { - "epoch": 1.87, - "learning_rate": 6.594652703191777e-07, - "loss": 0.666, - "step": 72838 - }, - { - "epoch": 1.87, - "learning_rate": 6.594392538050449e-07, - "loss": 0.5923, - "step": 72839 - }, - { - "epoch": 1.87, - "learning_rate": 6.594132375516639e-07, - "loss": 0.749, - "step": 72840 - }, - { - "epoch": 1.87, - "learning_rate": 6.593872215590544e-07, - "loss": 0.5527, - "step": 72841 - }, - { - "epoch": 1.87, - "learning_rate": 6.593612058272366e-07, - "loss": 0.6196, - "step": 72842 - }, - { - "epoch": 1.87, - "learning_rate": 6.593351903562306e-07, - "loss": 0.7197, - "step": 72843 - }, - { - "epoch": 1.87, - "learning_rate": 6.593091751460553e-07, - "loss": 0.6938, - "step": 72844 - }, - { - "epoch": 1.87, - "learning_rate": 6.592831601967316e-07, - "loss": 0.5894, - "step": 72845 - }, - { - "epoch": 1.87, - "learning_rate": 6.592571455082791e-07, - "loss": 0.6616, - "step": 72846 - }, - { - "epoch": 1.87, - "learning_rate": 6.592311310807178e-07, - "loss": 0.6553, - "step": 72847 - }, - { - "epoch": 1.87, - "learning_rate": 6.592051169140673e-07, - "loss": 0.5273, - "step": 72848 - }, - { - "epoch": 1.87, - "learning_rate": 6.591791030083481e-07, - "loss": 0.9189, - "step": 72849 - }, - { - "epoch": 1.87, - "learning_rate": 6.591530893635795e-07, - "loss": 0.6792, - "step": 72850 - }, - { - "epoch": 1.87, - "learning_rate": 6.59127075979782e-07, - "loss": 0.5725, - "step": 72851 - }, - { - "epoch": 1.87, - "learning_rate": 6.591010628569749e-07, - "loss": 0.5498, - "step": 72852 - }, - { - "epoch": 1.87, - "learning_rate": 6.590750499951792e-07, - "loss": 0.7207, - "step": 72853 - }, - { - "epoch": 1.87, - "learning_rate": 6.590490373944133e-07, - "loss": 0.4761, - "step": 72854 - }, - { - "epoch": 1.87, - "learning_rate": 6.590230250546982e-07, - "loss": 0.5864, - "step": 72855 - }, - { - "epoch": 1.87, - "learning_rate": 6.589970129760531e-07, - "loss": 0.6797, - "step": 72856 - }, - { - "epoch": 1.87, - "learning_rate": 6.589710011584988e-07, - "loss": 0.4883, - "step": 72857 - }, - { - "epoch": 1.87, - "learning_rate": 6.589449896020543e-07, - "loss": 0.6943, - "step": 72858 - }, - { - "epoch": 1.87, - "learning_rate": 6.589189783067401e-07, - "loss": 0.6504, - "step": 72859 - }, - { - "epoch": 1.87, - "learning_rate": 6.588929672725759e-07, - "loss": 0.7764, - "step": 72860 - }, - { - "epoch": 1.87, - "learning_rate": 6.588669564995819e-07, - "loss": 0.5869, - "step": 72861 - }, - { - "epoch": 1.87, - "learning_rate": 6.588409459877776e-07, - "loss": 0.666, - "step": 72862 - }, - { - "epoch": 1.87, - "learning_rate": 6.588149357371833e-07, - "loss": 0.5303, - "step": 72863 - }, - { - "epoch": 1.87, - "learning_rate": 6.587889257478186e-07, - "loss": 0.6328, - "step": 72864 - }, - { - "epoch": 1.87, - "learning_rate": 6.587629160197034e-07, - "loss": 0.6641, - "step": 72865 - }, - { - "epoch": 1.87, - "learning_rate": 6.587369065528579e-07, - "loss": 0.6387, - "step": 72866 - }, - { - "epoch": 1.87, - "learning_rate": 6.587108973473017e-07, - "loss": 0.5205, - "step": 72867 - }, - { - "epoch": 1.87, - "learning_rate": 6.586848884030549e-07, - "loss": 0.6689, - "step": 72868 - }, - { - "epoch": 1.87, - "learning_rate": 6.586588797201373e-07, - "loss": 0.7471, - "step": 72869 - }, - { - "epoch": 1.87, - "learning_rate": 6.586328712985691e-07, - "loss": 0.5962, - "step": 72870 - }, - { - "epoch": 1.87, - "learning_rate": 6.586068631383701e-07, - "loss": 0.4563, - "step": 72871 - }, - { - "epoch": 1.87, - "learning_rate": 6.5858085523956e-07, - "loss": 0.4651, - "step": 72872 - }, - { - "epoch": 1.87, - "learning_rate": 6.585548476021589e-07, - "loss": 0.5105, - "step": 72873 - }, - { - "epoch": 1.87, - "learning_rate": 6.585288402261868e-07, - "loss": 0.7266, - "step": 72874 - }, - { - "epoch": 1.87, - "learning_rate": 6.585028331116631e-07, - "loss": 0.6533, - "step": 72875 - }, - { - "epoch": 1.87, - "learning_rate": 6.584768262586082e-07, - "loss": 0.464, - "step": 72876 - }, - { - "epoch": 1.87, - "learning_rate": 6.584508196670419e-07, - "loss": 0.6216, - "step": 72877 - }, - { - "epoch": 1.87, - "learning_rate": 6.584248133369841e-07, - "loss": 0.7295, - "step": 72878 - }, - { - "epoch": 1.87, - "learning_rate": 6.583988072684546e-07, - "loss": 0.605, - "step": 72879 - }, - { - "epoch": 1.87, - "learning_rate": 6.583728014614737e-07, - "loss": 0.7026, - "step": 72880 - }, - { - "epoch": 1.87, - "learning_rate": 6.583467959160607e-07, - "loss": 0.7773, - "step": 72881 - }, - { - "epoch": 1.87, - "learning_rate": 6.583207906322361e-07, - "loss": 0.6455, - "step": 72882 - }, - { - "epoch": 1.87, - "learning_rate": 6.582947856100198e-07, - "loss": 0.5537, - "step": 72883 - }, - { - "epoch": 1.87, - "learning_rate": 6.582687808494312e-07, - "loss": 0.665, - "step": 72884 - }, - { - "epoch": 1.87, - "learning_rate": 6.582427763504905e-07, - "loss": 0.6191, - "step": 72885 - }, - { - "epoch": 1.87, - "learning_rate": 6.582167721132174e-07, - "loss": 0.4097, - "step": 72886 - }, - { - "epoch": 1.87, - "learning_rate": 6.581907681376322e-07, - "loss": 0.7061, - "step": 72887 - }, - { - "epoch": 1.87, - "learning_rate": 6.581647644237547e-07, - "loss": 0.6113, - "step": 72888 - }, - { - "epoch": 1.87, - "learning_rate": 6.581387609716044e-07, - "loss": 0.6709, - "step": 72889 - }, - { - "epoch": 1.87, - "learning_rate": 6.581127577812018e-07, - "loss": 0.7578, - "step": 72890 - }, - { - "epoch": 1.87, - "learning_rate": 6.580867548525664e-07, - "loss": 0.5547, - "step": 72891 - }, - { - "epoch": 1.87, - "learning_rate": 6.580607521857183e-07, - "loss": 0.4016, - "step": 72892 - }, - { - "epoch": 1.87, - "learning_rate": 6.580347497806776e-07, - "loss": 0.5879, - "step": 72893 - }, - { - "epoch": 1.87, - "learning_rate": 6.580087476374636e-07, - "loss": 0.5601, - "step": 72894 - }, - { - "epoch": 1.87, - "learning_rate": 6.579827457560969e-07, - "loss": 0.7266, - "step": 72895 - }, - { - "epoch": 1.87, - "learning_rate": 6.579567441365968e-07, - "loss": 0.6934, - "step": 72896 - }, - { - "epoch": 1.87, - "learning_rate": 6.579307427789835e-07, - "loss": 0.625, - "step": 72897 - }, - { - "epoch": 1.87, - "learning_rate": 6.579047416832769e-07, - "loss": 0.7012, - "step": 72898 - }, - { - "epoch": 1.87, - "learning_rate": 6.578787408494971e-07, - "loss": 0.4702, - "step": 72899 - }, - { - "epoch": 1.87, - "learning_rate": 6.578527402776636e-07, - "loss": 0.8262, - "step": 72900 - }, - { - "epoch": 1.87, - "learning_rate": 6.578267399677967e-07, - "loss": 0.7305, - "step": 72901 - }, - { - "epoch": 1.87, - "learning_rate": 6.578007399199159e-07, - "loss": 0.6382, - "step": 72902 - }, - { - "epoch": 1.87, - "learning_rate": 6.577747401340418e-07, - "loss": 0.7529, - "step": 72903 - }, - { - "epoch": 1.87, - "learning_rate": 6.577487406101937e-07, - "loss": 0.8042, - "step": 72904 - }, - { - "epoch": 1.87, - "learning_rate": 6.577227413483915e-07, - "loss": 0.4878, - "step": 72905 - }, - { - "epoch": 1.87, - "learning_rate": 6.576967423486553e-07, - "loss": 0.4431, - "step": 72906 - }, - { - "epoch": 1.87, - "learning_rate": 6.576707436110049e-07, - "loss": 0.7524, - "step": 72907 - }, - { - "epoch": 1.87, - "learning_rate": 6.576447451354602e-07, - "loss": 0.6484, - "step": 72908 - }, - { - "epoch": 1.87, - "learning_rate": 6.576187469220413e-07, - "loss": 0.4956, - "step": 72909 - }, - { - "epoch": 1.87, - "learning_rate": 6.575927489707679e-07, - "loss": 0.584, - "step": 72910 - }, - { - "epoch": 1.87, - "learning_rate": 6.575667512816601e-07, - "loss": 0.6094, - "step": 72911 - }, - { - "epoch": 1.87, - "learning_rate": 6.575407538547375e-07, - "loss": 0.8506, - "step": 72912 - }, - { - "epoch": 1.87, - "learning_rate": 6.575147566900207e-07, - "loss": 0.4673, - "step": 72913 - }, - { - "epoch": 1.87, - "learning_rate": 6.574887597875287e-07, - "loss": 0.749, - "step": 72914 - }, - { - "epoch": 1.87, - "learning_rate": 6.574627631472817e-07, - "loss": 0.5801, - "step": 72915 - }, - { - "epoch": 1.87, - "learning_rate": 6.574367667693e-07, - "loss": 0.668, - "step": 72916 - }, - { - "epoch": 1.87, - "learning_rate": 6.57410770653603e-07, - "loss": 0.6904, - "step": 72917 - }, - { - "epoch": 1.87, - "learning_rate": 6.573847748002111e-07, - "loss": 0.7422, - "step": 72918 - }, - { - "epoch": 1.87, - "learning_rate": 6.573587792091435e-07, - "loss": 0.6431, - "step": 72919 - }, - { - "epoch": 1.87, - "learning_rate": 6.573327838804208e-07, - "loss": 0.5645, - "step": 72920 - }, - { - "epoch": 1.87, - "learning_rate": 6.573067888140624e-07, - "loss": 0.7412, - "step": 72921 - }, - { - "epoch": 1.87, - "learning_rate": 6.572807940100887e-07, - "loss": 0.8018, - "step": 72922 - }, - { - "epoch": 1.87, - "learning_rate": 6.572547994685196e-07, - "loss": 0.6895, - "step": 72923 - }, - { - "epoch": 1.87, - "learning_rate": 6.572288051893744e-07, - "loss": 0.6777, - "step": 72924 - }, - { - "epoch": 1.87, - "learning_rate": 6.572028111726732e-07, - "loss": 0.7754, - "step": 72925 - }, - { - "epoch": 1.87, - "learning_rate": 6.571768174184363e-07, - "loss": 0.6416, - "step": 72926 - }, - { - "epoch": 1.87, - "learning_rate": 6.571508239266832e-07, - "loss": 0.7134, - "step": 72927 - }, - { - "epoch": 1.87, - "learning_rate": 6.57124830697434e-07, - "loss": 0.4634, - "step": 72928 - }, - { - "epoch": 1.87, - "learning_rate": 6.570988377307084e-07, - "loss": 0.7559, - "step": 72929 - }, - { - "epoch": 1.87, - "learning_rate": 6.570728450265266e-07, - "loss": 0.5898, - "step": 72930 - }, - { - "epoch": 1.87, - "learning_rate": 6.570468525849083e-07, - "loss": 0.6377, - "step": 72931 - }, - { - "epoch": 1.87, - "learning_rate": 6.570208604058736e-07, - "loss": 0.668, - "step": 72932 - }, - { - "epoch": 1.87, - "learning_rate": 6.569948684894425e-07, - "loss": 0.6865, - "step": 72933 - }, - { - "epoch": 1.87, - "learning_rate": 6.569688768356341e-07, - "loss": 0.5981, - "step": 72934 - }, - { - "epoch": 1.87, - "learning_rate": 6.56942885444469e-07, - "loss": 0.6304, - "step": 72935 - }, - { - "epoch": 1.87, - "learning_rate": 6.56916894315967e-07, - "loss": 0.7656, - "step": 72936 - }, - { - "epoch": 1.87, - "learning_rate": 6.56890903450148e-07, - "loss": 0.5898, - "step": 72937 - }, - { - "epoch": 1.87, - "learning_rate": 6.568649128470318e-07, - "loss": 0.5591, - "step": 72938 - }, - { - "epoch": 1.87, - "learning_rate": 6.568389225066384e-07, - "loss": 0.7515, - "step": 72939 - }, - { - "epoch": 1.87, - "learning_rate": 6.568129324289875e-07, - "loss": 0.6265, - "step": 72940 - }, - { - "epoch": 1.87, - "learning_rate": 6.567869426140995e-07, - "loss": 0.7388, - "step": 72941 - }, - { - "epoch": 1.87, - "learning_rate": 6.567609530619935e-07, - "loss": 0.5747, - "step": 72942 - }, - { - "epoch": 1.87, - "learning_rate": 6.567349637726906e-07, - "loss": 0.541, - "step": 72943 - }, - { - "epoch": 1.87, - "learning_rate": 6.567089747462095e-07, - "loss": 0.6079, - "step": 72944 - }, - { - "epoch": 1.87, - "learning_rate": 6.566829859825706e-07, - "loss": 0.6709, - "step": 72945 - }, - { - "epoch": 1.87, - "learning_rate": 6.566569974817935e-07, - "loss": 0.7188, - "step": 72946 - }, - { - "epoch": 1.87, - "learning_rate": 6.566310092438987e-07, - "loss": 0.6714, - "step": 72947 - }, - { - "epoch": 1.87, - "learning_rate": 6.566050212689054e-07, - "loss": 0.6641, - "step": 72948 - }, - { - "epoch": 1.87, - "learning_rate": 6.565790335568342e-07, - "loss": 0.6079, - "step": 72949 - }, - { - "epoch": 1.87, - "learning_rate": 6.565530461077042e-07, - "loss": 0.7339, - "step": 72950 - }, - { - "epoch": 1.87, - "learning_rate": 6.565270589215362e-07, - "loss": 0.6943, - "step": 72951 - }, - { - "epoch": 1.87, - "learning_rate": 6.565010719983493e-07, - "loss": 0.5405, - "step": 72952 - }, - { - "epoch": 1.87, - "learning_rate": 6.564750853381642e-07, - "loss": 0.6851, - "step": 72953 - }, - { - "epoch": 1.87, - "learning_rate": 6.564490989410001e-07, - "loss": 0.5151, - "step": 72954 - }, - { - "epoch": 1.87, - "learning_rate": 6.564231128068769e-07, - "loss": 0.6797, - "step": 72955 - }, - { - "epoch": 1.87, - "learning_rate": 6.563971269358148e-07, - "loss": 0.7119, - "step": 72956 - }, - { - "epoch": 1.87, - "learning_rate": 6.563711413278336e-07, - "loss": 0.8271, - "step": 72957 - }, - { - "epoch": 1.87, - "learning_rate": 6.563451559829534e-07, - "loss": 0.4683, - "step": 72958 - }, - { - "epoch": 1.87, - "learning_rate": 6.563191709011937e-07, - "loss": 0.6396, - "step": 72959 - }, - { - "epoch": 1.87, - "learning_rate": 6.562931860825749e-07, - "loss": 0.6416, - "step": 72960 - }, - { - "epoch": 1.87, - "learning_rate": 6.562672015271164e-07, - "loss": 0.8184, - "step": 72961 - }, - { - "epoch": 1.87, - "learning_rate": 6.562412172348383e-07, - "loss": 0.731, - "step": 72962 - }, - { - "epoch": 1.87, - "learning_rate": 6.562152332057608e-07, - "loss": 0.5073, - "step": 72963 - }, - { - "epoch": 1.87, - "learning_rate": 6.561892494399033e-07, - "loss": 0.6816, - "step": 72964 - }, - { - "epoch": 1.87, - "learning_rate": 6.561632659372856e-07, - "loss": 0.7158, - "step": 72965 - }, - { - "epoch": 1.87, - "learning_rate": 6.561372826979281e-07, - "loss": 0.6519, - "step": 72966 - }, - { - "epoch": 1.87, - "learning_rate": 6.561112997218503e-07, - "loss": 0.6904, - "step": 72967 - }, - { - "epoch": 1.87, - "learning_rate": 6.560853170090725e-07, - "loss": 0.7197, - "step": 72968 - }, - { - "epoch": 1.87, - "learning_rate": 6.560593345596142e-07, - "loss": 0.7227, - "step": 72969 - }, - { - "epoch": 1.87, - "learning_rate": 6.560333523734956e-07, - "loss": 0.519, - "step": 72970 - }, - { - "epoch": 1.87, - "learning_rate": 6.560073704507363e-07, - "loss": 0.4561, - "step": 72971 - }, - { - "epoch": 1.87, - "learning_rate": 6.559813887913565e-07, - "loss": 0.6147, - "step": 72972 - }, - { - "epoch": 1.87, - "learning_rate": 6.559554073953761e-07, - "loss": 0.5532, - "step": 72973 - }, - { - "epoch": 1.87, - "learning_rate": 6.559294262628144e-07, - "loss": 0.5171, - "step": 72974 - }, - { - "epoch": 1.87, - "learning_rate": 6.559034453936921e-07, - "loss": 0.3677, - "step": 72975 - }, - { - "epoch": 1.87, - "learning_rate": 6.558774647880282e-07, - "loss": 0.7568, - "step": 72976 - }, - { - "epoch": 1.87, - "learning_rate": 6.558514844458434e-07, - "loss": 0.6709, - "step": 72977 - }, - { - "epoch": 1.87, - "learning_rate": 6.558255043671575e-07, - "loss": 0.4902, - "step": 72978 - }, - { - "epoch": 1.87, - "learning_rate": 6.557995245519899e-07, - "loss": 0.6021, - "step": 72979 - }, - { - "epoch": 1.87, - "learning_rate": 6.557735450003607e-07, - "loss": 0.667, - "step": 72980 - }, - { - "epoch": 1.87, - "learning_rate": 6.5574756571229e-07, - "loss": 0.6284, - "step": 72981 - }, - { - "epoch": 1.87, - "learning_rate": 6.557215866877976e-07, - "loss": 0.751, - "step": 72982 - }, - { - "epoch": 1.87, - "learning_rate": 6.556956079269036e-07, - "loss": 0.6172, - "step": 72983 - }, - { - "epoch": 1.87, - "learning_rate": 6.556696294296274e-07, - "loss": 0.7051, - "step": 72984 - }, - { - "epoch": 1.87, - "learning_rate": 6.556436511959891e-07, - "loss": 0.6484, - "step": 72985 - }, - { - "epoch": 1.87, - "learning_rate": 6.556176732260085e-07, - "loss": 0.5757, - "step": 72986 - }, - { - "epoch": 1.87, - "learning_rate": 6.555916955197058e-07, - "loss": 0.6543, - "step": 72987 - }, - { - "epoch": 1.87, - "learning_rate": 6.555657180771006e-07, - "loss": 0.4897, - "step": 72988 - }, - { - "epoch": 1.87, - "learning_rate": 6.555397408982129e-07, - "loss": 0.7109, - "step": 72989 - }, - { - "epoch": 1.87, - "learning_rate": 6.555137639830626e-07, - "loss": 0.7246, - "step": 72990 - }, - { - "epoch": 1.87, - "learning_rate": 6.554877873316696e-07, - "loss": 0.606, - "step": 72991 - }, - { - "epoch": 1.87, - "learning_rate": 6.554618109440536e-07, - "loss": 0.5371, - "step": 72992 - }, - { - "epoch": 1.87, - "learning_rate": 6.554358348202351e-07, - "loss": 0.6246, - "step": 72993 - }, - { - "epoch": 1.87, - "learning_rate": 6.554098589602333e-07, - "loss": 0.6797, - "step": 72994 - }, - { - "epoch": 1.87, - "learning_rate": 6.553838833640684e-07, - "loss": 0.7607, - "step": 72995 - }, - { - "epoch": 1.87, - "learning_rate": 6.553579080317598e-07, - "loss": 0.583, - "step": 72996 - }, - { - "epoch": 1.87, - "learning_rate": 6.553319329633282e-07, - "loss": 0.7764, - "step": 72997 - }, - { - "epoch": 1.87, - "learning_rate": 6.553059581587929e-07, - "loss": 0.5552, - "step": 72998 - }, - { - "epoch": 1.87, - "learning_rate": 6.552799836181741e-07, - "loss": 0.6162, - "step": 72999 - }, - { - "epoch": 1.87, - "learning_rate": 6.552540093414913e-07, - "loss": 0.5366, - "step": 73000 - }, - { - "epoch": 1.87, - "learning_rate": 6.552280353287649e-07, - "loss": 0.6738, - "step": 73001 - }, - { - "epoch": 1.87, - "learning_rate": 6.552020615800149e-07, - "loss": 0.6426, - "step": 73002 - }, - { - "epoch": 1.87, - "learning_rate": 6.551760880952603e-07, - "loss": 0.7192, - "step": 73003 - }, - { - "epoch": 1.87, - "learning_rate": 6.551501148745218e-07, - "loss": 0.5874, - "step": 73004 - }, - { - "epoch": 1.87, - "learning_rate": 6.551241419178186e-07, - "loss": 0.6826, - "step": 73005 - }, - { - "epoch": 1.87, - "learning_rate": 6.550981692251713e-07, - "loss": 0.4592, - "step": 73006 - }, - { - "epoch": 1.87, - "learning_rate": 6.550721967965993e-07, - "loss": 0.4948, - "step": 73007 - }, - { - "epoch": 1.87, - "learning_rate": 6.550462246321228e-07, - "loss": 0.6904, - "step": 73008 - }, - { - "epoch": 1.87, - "learning_rate": 6.550202527317615e-07, - "loss": 0.6895, - "step": 73009 - }, - { - "epoch": 1.87, - "learning_rate": 6.549942810955353e-07, - "loss": 0.5996, - "step": 73010 - }, - { - "epoch": 1.87, - "learning_rate": 6.549683097234641e-07, - "loss": 0.6294, - "step": 73011 - }, - { - "epoch": 1.87, - "learning_rate": 6.549423386155684e-07, - "loss": 0.7188, - "step": 73012 - }, - { - "epoch": 1.87, - "learning_rate": 6.549163677718668e-07, - "loss": 0.7217, - "step": 73013 - }, - { - "epoch": 1.87, - "learning_rate": 6.5489039719238e-07, - "loss": 0.6626, - "step": 73014 - }, - { - "epoch": 1.87, - "learning_rate": 6.548644268771276e-07, - "loss": 0.5952, - "step": 73015 - }, - { - "epoch": 1.87, - "learning_rate": 6.548384568261299e-07, - "loss": 0.7178, - "step": 73016 - }, - { - "epoch": 1.87, - "learning_rate": 6.548124870394062e-07, - "loss": 0.7344, - "step": 73017 - }, - { - "epoch": 1.87, - "learning_rate": 6.547865175169771e-07, - "loss": 0.6978, - "step": 73018 - }, - { - "epoch": 1.87, - "learning_rate": 6.547605482588618e-07, - "loss": 0.5879, - "step": 73019 - }, - { - "epoch": 1.87, - "learning_rate": 6.547345792650807e-07, - "loss": 0.6357, - "step": 73020 - }, - { - "epoch": 1.87, - "learning_rate": 6.547086105356532e-07, - "loss": 0.6182, - "step": 73021 - }, - { - "epoch": 1.87, - "learning_rate": 6.546826420705999e-07, - "loss": 0.5808, - "step": 73022 - }, - { - "epoch": 1.87, - "learning_rate": 6.546566738699399e-07, - "loss": 0.6343, - "step": 73023 - }, - { - "epoch": 1.87, - "learning_rate": 6.546307059336933e-07, - "loss": 0.6279, - "step": 73024 - }, - { - "epoch": 1.87, - "learning_rate": 6.546047382618803e-07, - "loss": 0.7939, - "step": 73025 - }, - { - "epoch": 1.87, - "learning_rate": 6.545787708545204e-07, - "loss": 0.6982, - "step": 73026 - }, - { - "epoch": 1.87, - "learning_rate": 6.545528037116338e-07, - "loss": 0.5859, - "step": 73027 - }, - { - "epoch": 1.87, - "learning_rate": 6.5452683683324e-07, - "loss": 0.6133, - "step": 73028 - }, - { - "epoch": 1.87, - "learning_rate": 6.545008702193594e-07, - "loss": 0.7031, - "step": 73029 - }, - { - "epoch": 1.87, - "learning_rate": 6.544749038700112e-07, - "loss": 0.5161, - "step": 73030 - }, - { - "epoch": 1.87, - "learning_rate": 6.544489377852162e-07, - "loss": 0.6147, - "step": 73031 - }, - { - "epoch": 1.87, - "learning_rate": 6.544229719649938e-07, - "loss": 0.6506, - "step": 73032 - }, - { - "epoch": 1.87, - "learning_rate": 6.543970064093636e-07, - "loss": 0.7227, - "step": 73033 - }, - { - "epoch": 1.87, - "learning_rate": 6.543710411183457e-07, - "loss": 0.6455, - "step": 73034 - }, - { - "epoch": 1.87, - "learning_rate": 6.543450760919599e-07, - "loss": 0.5193, - "step": 73035 - }, - { - "epoch": 1.87, - "learning_rate": 6.543191113302261e-07, - "loss": 0.5071, - "step": 73036 - }, - { - "epoch": 1.87, - "learning_rate": 6.542931468331645e-07, - "loss": 0.6646, - "step": 73037 - }, - { - "epoch": 1.87, - "learning_rate": 6.542671826007946e-07, - "loss": 0.5537, - "step": 73038 - }, - { - "epoch": 1.87, - "learning_rate": 6.542412186331365e-07, - "loss": 0.6699, - "step": 73039 - }, - { - "epoch": 1.87, - "learning_rate": 6.542152549302098e-07, - "loss": 0.7705, - "step": 73040 - }, - { - "epoch": 1.87, - "learning_rate": 6.541892914920348e-07, - "loss": 0.6011, - "step": 73041 - }, - { - "epoch": 1.87, - "learning_rate": 6.541633283186315e-07, - "loss": 0.5327, - "step": 73042 - }, - { - "epoch": 1.87, - "learning_rate": 6.541373654100189e-07, - "loss": 0.7324, - "step": 73043 - }, - { - "epoch": 1.87, - "learning_rate": 6.541114027662178e-07, - "loss": 0.7402, - "step": 73044 - }, - { - "epoch": 1.87, - "learning_rate": 6.540854403872472e-07, - "loss": 0.7305, - "step": 73045 - }, - { - "epoch": 1.87, - "learning_rate": 6.540594782731279e-07, - "loss": 0.6787, - "step": 73046 - }, - { - "epoch": 1.87, - "learning_rate": 6.54033516423879e-07, - "loss": 0.6987, - "step": 73047 - }, - { - "epoch": 1.87, - "learning_rate": 6.54007554839521e-07, - "loss": 0.5684, - "step": 73048 - }, - { - "epoch": 1.87, - "learning_rate": 6.539815935200733e-07, - "loss": 0.6572, - "step": 73049 - }, - { - "epoch": 1.87, - "learning_rate": 6.539556324655562e-07, - "loss": 0.6123, - "step": 73050 - }, - { - "epoch": 1.87, - "learning_rate": 6.539296716759894e-07, - "loss": 0.7256, - "step": 73051 - }, - { - "epoch": 1.87, - "learning_rate": 6.539037111513929e-07, - "loss": 0.7754, - "step": 73052 - }, - { - "epoch": 1.87, - "learning_rate": 6.53877750891786e-07, - "loss": 0.5615, - "step": 73053 - }, - { - "epoch": 1.87, - "learning_rate": 6.538517908971892e-07, - "loss": 0.6025, - "step": 73054 - }, - { - "epoch": 1.87, - "learning_rate": 6.538258311676219e-07, - "loss": 0.7383, - "step": 73055 - }, - { - "epoch": 1.87, - "learning_rate": 6.537998717031045e-07, - "loss": 0.6543, - "step": 73056 - }, - { - "epoch": 1.87, - "learning_rate": 6.537739125036564e-07, - "loss": 0.5923, - "step": 73057 - }, - { - "epoch": 1.87, - "learning_rate": 6.53747953569298e-07, - "loss": 0.5806, - "step": 73058 - }, - { - "epoch": 1.87, - "learning_rate": 6.537219949000486e-07, - "loss": 0.6777, - "step": 73059 - }, - { - "epoch": 1.87, - "learning_rate": 6.536960364959285e-07, - "loss": 0.7686, - "step": 73060 - }, - { - "epoch": 1.87, - "learning_rate": 6.536700783569572e-07, - "loss": 0.6387, - "step": 73061 - }, - { - "epoch": 1.87, - "learning_rate": 6.536441204831554e-07, - "loss": 0.6543, - "step": 73062 - }, - { - "epoch": 1.87, - "learning_rate": 6.536181628745418e-07, - "loss": 0.5049, - "step": 73063 - }, - { - "epoch": 1.87, - "learning_rate": 6.53592205531137e-07, - "loss": 0.7529, - "step": 73064 - }, - { - "epoch": 1.87, - "learning_rate": 6.535662484529608e-07, - "loss": 0.751, - "step": 73065 - }, - { - "epoch": 1.87, - "learning_rate": 6.535402916400328e-07, - "loss": 0.4752, - "step": 73066 - }, - { - "epoch": 1.87, - "learning_rate": 6.535143350923732e-07, - "loss": 0.6128, - "step": 73067 - }, - { - "epoch": 1.87, - "learning_rate": 6.534883788100019e-07, - "loss": 0.7524, - "step": 73068 - }, - { - "epoch": 1.87, - "learning_rate": 6.534624227929382e-07, - "loss": 0.6553, - "step": 73069 - }, - { - "epoch": 1.87, - "learning_rate": 6.534364670412026e-07, - "loss": 0.6748, - "step": 73070 - }, - { - "epoch": 1.87, - "learning_rate": 6.534105115548147e-07, - "loss": 0.4878, - "step": 73071 - }, - { - "epoch": 1.87, - "learning_rate": 6.533845563337949e-07, - "loss": 0.6279, - "step": 73072 - }, - { - "epoch": 1.87, - "learning_rate": 6.533586013781622e-07, - "loss": 0.5688, - "step": 73073 - }, - { - "epoch": 1.87, - "learning_rate": 6.533326466879368e-07, - "loss": 0.6416, - "step": 73074 - }, - { - "epoch": 1.87, - "learning_rate": 6.533066922631388e-07, - "loss": 0.4858, - "step": 73075 - }, - { - "epoch": 1.87, - "learning_rate": 6.532807381037879e-07, - "loss": 0.8701, - "step": 73076 - }, - { - "epoch": 1.87, - "learning_rate": 6.53254784209904e-07, - "loss": 0.6226, - "step": 73077 - }, - { - "epoch": 1.87, - "learning_rate": 6.532288305815068e-07, - "loss": 0.6055, - "step": 73078 - }, - { - "epoch": 1.87, - "learning_rate": 6.532028772186166e-07, - "loss": 0.5859, - "step": 73079 - }, - { - "epoch": 1.87, - "learning_rate": 6.531769241212526e-07, - "loss": 0.5715, - "step": 73080 - }, - { - "epoch": 1.87, - "learning_rate": 6.531509712894357e-07, - "loss": 0.6802, - "step": 73081 - }, - { - "epoch": 1.87, - "learning_rate": 6.531250187231849e-07, - "loss": 0.3105, - "step": 73082 - }, - { - "epoch": 1.87, - "learning_rate": 6.530990664225202e-07, - "loss": 0.5066, - "step": 73083 - }, - { - "epoch": 1.87, - "learning_rate": 6.530731143874617e-07, - "loss": 0.5715, - "step": 73084 - }, - { - "epoch": 1.87, - "learning_rate": 6.530471626180291e-07, - "loss": 0.793, - "step": 73085 - }, - { - "epoch": 1.87, - "learning_rate": 6.530212111142423e-07, - "loss": 0.5571, - "step": 73086 - }, - { - "epoch": 1.87, - "learning_rate": 6.529952598761213e-07, - "loss": 0.5376, - "step": 73087 - }, - { - "epoch": 1.87, - "learning_rate": 6.529693089036858e-07, - "loss": 0.8291, - "step": 73088 - }, - { - "epoch": 1.87, - "learning_rate": 6.529433581969558e-07, - "loss": 0.5723, - "step": 73089 - }, - { - "epoch": 1.87, - "learning_rate": 6.529174077559509e-07, - "loss": 0.521, - "step": 73090 - }, - { - "epoch": 1.87, - "learning_rate": 6.528914575806914e-07, - "loss": 0.5474, - "step": 73091 - }, - { - "epoch": 1.87, - "learning_rate": 6.528655076711973e-07, - "loss": 0.6826, - "step": 73092 - }, - { - "epoch": 1.87, - "learning_rate": 6.528395580274875e-07, - "loss": 0.7871, - "step": 73093 - }, - { - "epoch": 1.87, - "learning_rate": 6.528136086495829e-07, - "loss": 0.7646, - "step": 73094 - }, - { - "epoch": 1.87, - "learning_rate": 6.527876595375026e-07, - "loss": 0.5576, - "step": 73095 - }, - { - "epoch": 1.87, - "learning_rate": 6.52761710691267e-07, - "loss": 0.6621, - "step": 73096 - }, - { - "epoch": 1.87, - "learning_rate": 6.527357621108957e-07, - "loss": 0.8037, - "step": 73097 - }, - { - "epoch": 1.87, - "learning_rate": 6.527098137964089e-07, - "loss": 0.5957, - "step": 73098 - }, - { - "epoch": 1.87, - "learning_rate": 6.526838657478259e-07, - "loss": 0.5596, - "step": 73099 - }, - { - "epoch": 1.87, - "learning_rate": 6.526579179651672e-07, - "loss": 0.6128, - "step": 73100 - }, - { - "epoch": 1.87, - "learning_rate": 6.526319704484521e-07, - "loss": 0.5469, - "step": 73101 - }, - { - "epoch": 1.87, - "learning_rate": 6.526060231977011e-07, - "loss": 0.5586, - "step": 73102 - }, - { - "epoch": 1.87, - "learning_rate": 6.525800762129336e-07, - "loss": 0.5684, - "step": 73103 - }, - { - "epoch": 1.87, - "learning_rate": 6.525541294941694e-07, - "loss": 0.4819, - "step": 73104 - }, - { - "epoch": 1.87, - "learning_rate": 6.525281830414284e-07, - "loss": 0.4351, - "step": 73105 - }, - { - "epoch": 1.87, - "learning_rate": 6.525022368547308e-07, - "loss": 0.7217, - "step": 73106 - }, - { - "epoch": 1.87, - "learning_rate": 6.524762909340961e-07, - "loss": 0.6112, - "step": 73107 - }, - { - "epoch": 1.87, - "learning_rate": 6.524503452795446e-07, - "loss": 0.5796, - "step": 73108 - }, - { - "epoch": 1.87, - "learning_rate": 6.524243998910956e-07, - "loss": 0.6128, - "step": 73109 - }, - { - "epoch": 1.87, - "learning_rate": 6.523984547687693e-07, - "loss": 0.6289, - "step": 73110 - }, - { - "epoch": 1.87, - "learning_rate": 6.523725099125856e-07, - "loss": 0.7803, - "step": 73111 - }, - { - "epoch": 1.87, - "learning_rate": 6.523465653225645e-07, - "loss": 0.4839, - "step": 73112 - }, - { - "epoch": 1.87, - "learning_rate": 6.523206209987256e-07, - "loss": 0.6006, - "step": 73113 - }, - { - "epoch": 1.87, - "learning_rate": 6.522946769410884e-07, - "loss": 0.5435, - "step": 73114 - }, - { - "epoch": 1.87, - "learning_rate": 6.522687331496734e-07, - "loss": 0.5122, - "step": 73115 - }, - { - "epoch": 1.87, - "learning_rate": 6.522427896245002e-07, - "loss": 0.7002, - "step": 73116 - }, - { - "epoch": 1.87, - "learning_rate": 6.522168463655888e-07, - "loss": 0.7188, - "step": 73117 - }, - { - "epoch": 1.87, - "learning_rate": 6.521909033729588e-07, - "loss": 0.6611, - "step": 73118 - }, - { - "epoch": 1.87, - "learning_rate": 6.521649606466304e-07, - "loss": 0.7119, - "step": 73119 - }, - { - "epoch": 1.87, - "learning_rate": 6.521390181866231e-07, - "loss": 0.833, - "step": 73120 - }, - { - "epoch": 1.87, - "learning_rate": 6.521130759929572e-07, - "loss": 0.7559, - "step": 73121 - }, - { - "epoch": 1.87, - "learning_rate": 6.520871340656527e-07, - "loss": 0.6509, - "step": 73122 - }, - { - "epoch": 1.87, - "learning_rate": 6.520611924047286e-07, - "loss": 0.6484, - "step": 73123 - }, - { - "epoch": 1.87, - "learning_rate": 6.520352510102052e-07, - "loss": 0.7373, - "step": 73124 - }, - { - "epoch": 1.87, - "learning_rate": 6.520093098821025e-07, - "loss": 0.7256, - "step": 73125 - }, - { - "epoch": 1.87, - "learning_rate": 6.519833690204401e-07, - "loss": 0.3957, - "step": 73126 - }, - { - "epoch": 1.87, - "learning_rate": 6.519574284252383e-07, - "loss": 0.7061, - "step": 73127 - }, - { - "epoch": 1.87, - "learning_rate": 6.519314880965164e-07, - "loss": 0.605, - "step": 73128 - }, - { - "epoch": 1.87, - "learning_rate": 6.519055480342947e-07, - "loss": 0.623, - "step": 73129 - }, - { - "epoch": 1.87, - "learning_rate": 6.518796082385929e-07, - "loss": 0.5977, - "step": 73130 - }, - { - "epoch": 1.87, - "learning_rate": 6.518536687094309e-07, - "loss": 0.584, - "step": 73131 - }, - { - "epoch": 1.87, - "learning_rate": 6.518277294468289e-07, - "loss": 0.7637, - "step": 73132 - }, - { - "epoch": 1.87, - "learning_rate": 6.51801790450806e-07, - "loss": 0.5757, - "step": 73133 - }, - { - "epoch": 1.87, - "learning_rate": 6.517758517213825e-07, - "loss": 0.7402, - "step": 73134 - }, - { - "epoch": 1.87, - "learning_rate": 6.517499132585782e-07, - "loss": 0.7046, - "step": 73135 - }, - { - "epoch": 1.87, - "learning_rate": 6.517239750624131e-07, - "loss": 0.7637, - "step": 73136 - }, - { - "epoch": 1.87, - "learning_rate": 6.516980371329066e-07, - "loss": 0.7031, - "step": 73137 - }, - { - "epoch": 1.87, - "learning_rate": 6.516720994700793e-07, - "loss": 0.4678, - "step": 73138 - }, - { - "epoch": 1.87, - "learning_rate": 6.516461620739503e-07, - "loss": 0.562, - "step": 73139 - }, - { - "epoch": 1.87, - "learning_rate": 6.516202249445401e-07, - "loss": 0.5093, - "step": 73140 - }, - { - "epoch": 1.87, - "learning_rate": 6.515942880818683e-07, - "loss": 0.7251, - "step": 73141 - }, - { - "epoch": 1.87, - "learning_rate": 6.515683514859549e-07, - "loss": 0.6582, - "step": 73142 - }, - { - "epoch": 1.87, - "learning_rate": 6.515424151568192e-07, - "loss": 0.7144, - "step": 73143 - }, - { - "epoch": 1.87, - "learning_rate": 6.515164790944816e-07, - "loss": 0.5574, - "step": 73144 - }, - { - "epoch": 1.87, - "learning_rate": 6.514905432989617e-07, - "loss": 0.564, - "step": 73145 - }, - { - "epoch": 1.87, - "learning_rate": 6.514646077702796e-07, - "loss": 0.7446, - "step": 73146 - }, - { - "epoch": 1.87, - "learning_rate": 6.514386725084548e-07, - "loss": 0.6826, - "step": 73147 - }, - { - "epoch": 1.87, - "learning_rate": 6.514127375135076e-07, - "loss": 0.6436, - "step": 73148 - }, - { - "epoch": 1.87, - "learning_rate": 6.513868027854575e-07, - "loss": 0.4497, - "step": 73149 - }, - { - "epoch": 1.87, - "learning_rate": 6.513608683243247e-07, - "loss": 0.6279, - "step": 73150 - }, - { - "epoch": 1.87, - "learning_rate": 6.513349341301286e-07, - "loss": 0.6284, - "step": 73151 - }, - { - "epoch": 1.87, - "learning_rate": 6.513090002028897e-07, - "loss": 0.7383, - "step": 73152 - }, - { - "epoch": 1.87, - "learning_rate": 6.512830665426272e-07, - "loss": 0.7051, - "step": 73153 - }, - { - "epoch": 1.87, - "learning_rate": 6.512571331493612e-07, - "loss": 0.6191, - "step": 73154 - }, - { - "epoch": 1.88, - "learning_rate": 6.512312000231117e-07, - "loss": 0.751, - "step": 73155 - }, - { - "epoch": 1.88, - "learning_rate": 6.512052671638981e-07, - "loss": 0.6748, - "step": 73156 - }, - { - "epoch": 1.88, - "learning_rate": 6.511793345717409e-07, - "loss": 0.6436, - "step": 73157 - }, - { - "epoch": 1.88, - "learning_rate": 6.511534022466598e-07, - "loss": 0.5356, - "step": 73158 - }, - { - "epoch": 1.88, - "learning_rate": 6.511274701886741e-07, - "loss": 0.7119, - "step": 73159 - }, - { - "epoch": 1.88, - "learning_rate": 6.511015383978042e-07, - "loss": 0.6387, - "step": 73160 - }, - { - "epoch": 1.88, - "learning_rate": 6.510756068740697e-07, - "loss": 0.6465, - "step": 73161 - }, - { - "epoch": 1.88, - "learning_rate": 6.51049675617491e-07, - "loss": 0.6484, - "step": 73162 - }, - { - "epoch": 1.88, - "learning_rate": 6.510237446280873e-07, - "loss": 0.6328, - "step": 73163 - }, - { - "epoch": 1.88, - "learning_rate": 6.509978139058784e-07, - "loss": 0.5557, - "step": 73164 - }, - { - "epoch": 1.88, - "learning_rate": 6.509718834508848e-07, - "loss": 0.6973, - "step": 73165 - }, - { - "epoch": 1.88, - "learning_rate": 6.509459532631256e-07, - "loss": 0.6465, - "step": 73166 - }, - { - "epoch": 1.88, - "learning_rate": 6.509200233426214e-07, - "loss": 0.5635, - "step": 73167 - }, - { - "epoch": 1.88, - "learning_rate": 6.508940936893914e-07, - "loss": 0.6187, - "step": 73168 - }, - { - "epoch": 1.88, - "learning_rate": 6.508681643034559e-07, - "loss": 0.5918, - "step": 73169 - }, - { - "epoch": 1.88, - "learning_rate": 6.508422351848344e-07, - "loss": 0.4517, - "step": 73170 - }, - { - "epoch": 1.88, - "learning_rate": 6.508163063335472e-07, - "loss": 0.6914, - "step": 73171 - }, - { - "epoch": 1.88, - "learning_rate": 6.507903777496141e-07, - "loss": 0.75, - "step": 73172 - }, - { - "epoch": 1.88, - "learning_rate": 6.507644494330544e-07, - "loss": 0.5488, - "step": 73173 - }, - { - "epoch": 1.88, - "learning_rate": 6.507385213838883e-07, - "loss": 0.7783, - "step": 73174 - }, - { - "epoch": 1.88, - "learning_rate": 6.507125936021358e-07, - "loss": 0.6465, - "step": 73175 - }, - { - "epoch": 1.88, - "learning_rate": 6.506866660878164e-07, - "loss": 0.6216, - "step": 73176 - }, - { - "epoch": 1.88, - "learning_rate": 6.506607388409504e-07, - "loss": 0.6172, - "step": 73177 - }, - { - "epoch": 1.88, - "learning_rate": 6.506348118615572e-07, - "loss": 0.5483, - "step": 73178 - }, - { - "epoch": 1.88, - "learning_rate": 6.50608885149657e-07, - "loss": 0.7832, - "step": 73179 - }, - { - "epoch": 1.88, - "learning_rate": 6.505829587052693e-07, - "loss": 0.5718, - "step": 73180 - }, - { - "epoch": 1.88, - "learning_rate": 6.505570325284144e-07, - "loss": 0.5344, - "step": 73181 - }, - { - "epoch": 1.88, - "learning_rate": 6.505311066191121e-07, - "loss": 0.48, - "step": 73182 - }, - { - "epoch": 1.88, - "learning_rate": 6.505051809773816e-07, - "loss": 0.5918, - "step": 73183 - }, - { - "epoch": 1.88, - "learning_rate": 6.504792556032435e-07, - "loss": 0.7178, - "step": 73184 - }, - { - "epoch": 1.88, - "learning_rate": 6.50453330496717e-07, - "loss": 0.5757, - "step": 73185 - }, - { - "epoch": 1.88, - "learning_rate": 6.504274056578228e-07, - "loss": 0.4709, - "step": 73186 - }, - { - "epoch": 1.88, - "learning_rate": 6.504014810865799e-07, - "loss": 0.5366, - "step": 73187 - }, - { - "epoch": 1.88, - "learning_rate": 6.503755567830087e-07, - "loss": 0.7412, - "step": 73188 - }, - { - "epoch": 1.88, - "learning_rate": 6.503496327471286e-07, - "loss": 0.5759, - "step": 73189 - }, - { - "epoch": 1.88, - "learning_rate": 6.503237089789601e-07, - "loss": 0.5486, - "step": 73190 - }, - { - "epoch": 1.88, - "learning_rate": 6.502977854785223e-07, - "loss": 0.6333, - "step": 73191 - }, - { - "epoch": 1.88, - "learning_rate": 6.502718622458359e-07, - "loss": 0.8115, - "step": 73192 - }, - { - "epoch": 1.88, - "learning_rate": 6.502459392809199e-07, - "loss": 0.5938, - "step": 73193 - }, - { - "epoch": 1.88, - "learning_rate": 6.502200165837947e-07, - "loss": 0.4142, - "step": 73194 - }, - { - "epoch": 1.88, - "learning_rate": 6.501940941544796e-07, - "loss": 0.6655, - "step": 73195 - }, - { - "epoch": 1.88, - "learning_rate": 6.50168171992995e-07, - "loss": 0.7041, - "step": 73196 - }, - { - "epoch": 1.88, - "learning_rate": 6.501422500993605e-07, - "loss": 0.834, - "step": 73197 - }, - { - "epoch": 1.88, - "learning_rate": 6.50116328473596e-07, - "loss": 0.5856, - "step": 73198 - }, - { - "epoch": 1.88, - "learning_rate": 6.500904071157213e-07, - "loss": 0.5259, - "step": 73199 - }, - { - "epoch": 1.88, - "learning_rate": 6.500644860257564e-07, - "loss": 0.6313, - "step": 73200 - }, - { - "epoch": 1.88, - "learning_rate": 6.500385652037208e-07, - "loss": 0.5471, - "step": 73201 - }, - { - "epoch": 1.88, - "learning_rate": 6.500126446496351e-07, - "loss": 0.7539, - "step": 73202 - }, - { - "epoch": 1.88, - "learning_rate": 6.499867243635184e-07, - "loss": 0.7236, - "step": 73203 - }, - { - "epoch": 1.88, - "learning_rate": 6.499608043453904e-07, - "loss": 0.6235, - "step": 73204 - }, - { - "epoch": 1.88, - "learning_rate": 6.499348845952717e-07, - "loss": 0.8154, - "step": 73205 - }, - { - "epoch": 1.88, - "learning_rate": 6.499089651131815e-07, - "loss": 0.7012, - "step": 73206 - }, - { - "epoch": 1.88, - "learning_rate": 6.498830458991402e-07, - "loss": 0.4778, - "step": 73207 - }, - { - "epoch": 1.88, - "learning_rate": 6.498571269531669e-07, - "loss": 0.7734, - "step": 73208 - }, - { - "epoch": 1.88, - "learning_rate": 6.498312082752824e-07, - "loss": 0.6279, - "step": 73209 - }, - { - "epoch": 1.88, - "learning_rate": 6.498052898655057e-07, - "loss": 0.7607, - "step": 73210 - }, - { - "epoch": 1.88, - "learning_rate": 6.497793717238571e-07, - "loss": 0.533, - "step": 73211 - }, - { - "epoch": 1.88, - "learning_rate": 6.497534538503567e-07, - "loss": 0.7598, - "step": 73212 - }, - { - "epoch": 1.88, - "learning_rate": 6.497275362450237e-07, - "loss": 0.5806, - "step": 73213 - }, - { - "epoch": 1.88, - "learning_rate": 6.497016189078781e-07, - "loss": 0.7627, - "step": 73214 - }, - { - "epoch": 1.88, - "learning_rate": 6.496757018389399e-07, - "loss": 0.6387, - "step": 73215 - }, - { - "epoch": 1.88, - "learning_rate": 6.496497850382288e-07, - "loss": 0.5977, - "step": 73216 - }, - { - "epoch": 1.88, - "learning_rate": 6.496238685057649e-07, - "loss": 0.5737, - "step": 73217 - }, - { - "epoch": 1.88, - "learning_rate": 6.495979522415677e-07, - "loss": 0.7314, - "step": 73218 - }, - { - "epoch": 1.88, - "learning_rate": 6.495720362456576e-07, - "loss": 0.7734, - "step": 73219 - }, - { - "epoch": 1.88, - "learning_rate": 6.495461205180537e-07, - "loss": 0.584, - "step": 73220 - }, - { - "epoch": 1.88, - "learning_rate": 6.495202050587765e-07, - "loss": 0.6045, - "step": 73221 - }, - { - "epoch": 1.88, - "learning_rate": 6.494942898678457e-07, - "loss": 0.6396, - "step": 73222 - }, - { - "epoch": 1.88, - "learning_rate": 6.494683749452808e-07, - "loss": 0.6885, - "step": 73223 - }, - { - "epoch": 1.88, - "learning_rate": 6.494424602911018e-07, - "loss": 0.6201, - "step": 73224 - }, - { - "epoch": 1.88, - "learning_rate": 6.494165459053285e-07, - "loss": 0.5488, - "step": 73225 - }, - { - "epoch": 1.88, - "learning_rate": 6.49390631787981e-07, - "loss": 0.6504, - "step": 73226 - }, - { - "epoch": 1.88, - "learning_rate": 6.493647179390786e-07, - "loss": 0.5718, - "step": 73227 - }, - { - "epoch": 1.88, - "learning_rate": 6.49338804358642e-07, - "loss": 0.6016, - "step": 73228 - }, - { - "epoch": 1.88, - "learning_rate": 6.493128910466903e-07, - "loss": 0.4812, - "step": 73229 - }, - { - "epoch": 1.88, - "learning_rate": 6.492869780032438e-07, - "loss": 0.5796, - "step": 73230 - }, - { - "epoch": 1.88, - "learning_rate": 6.492610652283219e-07, - "loss": 0.6973, - "step": 73231 - }, - { - "epoch": 1.88, - "learning_rate": 6.49235152721945e-07, - "loss": 0.5562, - "step": 73232 - }, - { - "epoch": 1.88, - "learning_rate": 6.492092404841324e-07, - "loss": 0.4819, - "step": 73233 - }, - { - "epoch": 1.88, - "learning_rate": 6.491833285149042e-07, - "loss": 0.5122, - "step": 73234 - }, - { - "epoch": 1.88, - "learning_rate": 6.4915741681428e-07, - "loss": 0.6416, - "step": 73235 - }, - { - "epoch": 1.88, - "learning_rate": 6.491315053822802e-07, - "loss": 0.5776, - "step": 73236 - }, - { - "epoch": 1.88, - "learning_rate": 6.491055942189237e-07, - "loss": 0.6011, - "step": 73237 - }, - { - "epoch": 1.88, - "learning_rate": 6.490796833242313e-07, - "loss": 0.5376, - "step": 73238 - }, - { - "epoch": 1.88, - "learning_rate": 6.490537726982224e-07, - "loss": 0.7461, - "step": 73239 - }, - { - "epoch": 1.88, - "learning_rate": 6.490278623409169e-07, - "loss": 0.793, - "step": 73240 - }, - { - "epoch": 1.88, - "learning_rate": 6.490019522523345e-07, - "loss": 0.4685, - "step": 73241 - }, - { - "epoch": 1.88, - "learning_rate": 6.489760424324957e-07, - "loss": 0.5508, - "step": 73242 - }, - { - "epoch": 1.88, - "learning_rate": 6.489501328814194e-07, - "loss": 0.6714, - "step": 73243 - }, - { - "epoch": 1.88, - "learning_rate": 6.489242235991257e-07, - "loss": 0.6973, - "step": 73244 - }, - { - "epoch": 1.88, - "learning_rate": 6.488983145856348e-07, - "loss": 0.582, - "step": 73245 - }, - { - "epoch": 1.88, - "learning_rate": 6.488724058409661e-07, - "loss": 0.7178, - "step": 73246 - }, - { - "epoch": 1.88, - "learning_rate": 6.488464973651399e-07, - "loss": 0.5361, - "step": 73247 - }, - { - "epoch": 1.88, - "learning_rate": 6.488205891581758e-07, - "loss": 0.4722, - "step": 73248 - }, - { - "epoch": 1.88, - "learning_rate": 6.487946812200933e-07, - "loss": 0.5649, - "step": 73249 - }, - { - "epoch": 1.88, - "learning_rate": 6.487687735509128e-07, - "loss": 0.6816, - "step": 73250 - }, - { - "epoch": 1.88, - "learning_rate": 6.487428661506538e-07, - "loss": 0.6289, - "step": 73251 - }, - { - "epoch": 1.88, - "learning_rate": 6.487169590193365e-07, - "loss": 0.7295, - "step": 73252 - }, - { - "epoch": 1.88, - "learning_rate": 6.486910521569804e-07, - "loss": 0.6953, - "step": 73253 - }, - { - "epoch": 1.88, - "learning_rate": 6.486651455636052e-07, - "loss": 0.667, - "step": 73254 - }, - { - "epoch": 1.88, - "learning_rate": 6.486392392392311e-07, - "loss": 0.7129, - "step": 73255 - }, - { - "epoch": 1.88, - "learning_rate": 6.486133331838775e-07, - "loss": 0.3975, - "step": 73256 - }, - { - "epoch": 1.88, - "learning_rate": 6.485874273975649e-07, - "loss": 0.5171, - "step": 73257 - }, - { - "epoch": 1.88, - "learning_rate": 6.485615218803124e-07, - "loss": 0.4629, - "step": 73258 - }, - { - "epoch": 1.88, - "learning_rate": 6.485356166321404e-07, - "loss": 0.585, - "step": 73259 - }, - { - "epoch": 1.88, - "learning_rate": 6.485097116530683e-07, - "loss": 0.7207, - "step": 73260 - }, - { - "epoch": 1.88, - "learning_rate": 6.484838069431165e-07, - "loss": 0.7588, - "step": 73261 - }, - { - "epoch": 1.88, - "learning_rate": 6.484579025023045e-07, - "loss": 0.6426, - "step": 73262 - }, - { - "epoch": 1.88, - "learning_rate": 6.484319983306518e-07, - "loss": 0.3848, - "step": 73263 - }, - { - "epoch": 1.88, - "learning_rate": 6.484060944281788e-07, - "loss": 0.6738, - "step": 73264 - }, - { - "epoch": 1.88, - "learning_rate": 6.483801907949048e-07, - "loss": 0.7295, - "step": 73265 - }, - { - "epoch": 1.88, - "learning_rate": 6.483542874308502e-07, - "loss": 0.668, - "step": 73266 - }, - { - "epoch": 1.88, - "learning_rate": 6.483283843360345e-07, - "loss": 0.645, - "step": 73267 - }, - { - "epoch": 1.88, - "learning_rate": 6.483024815104774e-07, - "loss": 0.833, - "step": 73268 - }, - { - "epoch": 1.88, - "learning_rate": 6.482765789541991e-07, - "loss": 0.6973, - "step": 73269 - }, - { - "epoch": 1.88, - "learning_rate": 6.482506766672191e-07, - "loss": 0.6602, - "step": 73270 - }, - { - "epoch": 1.88, - "learning_rate": 6.482247746495575e-07, - "loss": 0.8447, - "step": 73271 - }, - { - "epoch": 1.88, - "learning_rate": 6.481988729012343e-07, - "loss": 0.5337, - "step": 73272 - }, - { - "epoch": 1.88, - "learning_rate": 6.481729714222686e-07, - "loss": 0.6816, - "step": 73273 - }, - { - "epoch": 1.88, - "learning_rate": 6.481470702126809e-07, - "loss": 0.6152, - "step": 73274 - }, - { - "epoch": 1.88, - "learning_rate": 6.481211692724906e-07, - "loss": 0.7656, - "step": 73275 - }, - { - "epoch": 1.88, - "learning_rate": 6.480952686017179e-07, - "loss": 0.6406, - "step": 73276 - }, - { - "epoch": 1.88, - "learning_rate": 6.480693682003824e-07, - "loss": 0.4062, - "step": 73277 - }, - { - "epoch": 1.88, - "learning_rate": 6.480434680685041e-07, - "loss": 0.5596, - "step": 73278 - }, - { - "epoch": 1.88, - "learning_rate": 6.480175682061026e-07, - "loss": 0.4443, - "step": 73279 - }, - { - "epoch": 1.88, - "learning_rate": 6.479916686131979e-07, - "loss": 0.6494, - "step": 73280 - }, - { - "epoch": 1.88, - "learning_rate": 6.479657692898097e-07, - "loss": 0.4412, - "step": 73281 - }, - { - "epoch": 1.88, - "learning_rate": 6.479398702359585e-07, - "loss": 0.6528, - "step": 73282 - }, - { - "epoch": 1.88, - "learning_rate": 6.47913971451663e-07, - "loss": 0.5409, - "step": 73283 - }, - { - "epoch": 1.88, - "learning_rate": 6.478880729369438e-07, - "loss": 0.6367, - "step": 73284 - }, - { - "epoch": 1.88, - "learning_rate": 6.478621746918203e-07, - "loss": 0.5505, - "step": 73285 - }, - { - "epoch": 1.88, - "learning_rate": 6.478362767163128e-07, - "loss": 0.6436, - "step": 73286 - }, - { - "epoch": 1.88, - "learning_rate": 6.478103790104406e-07, - "loss": 0.457, - "step": 73287 - }, - { - "epoch": 1.88, - "learning_rate": 6.47784481574224e-07, - "loss": 0.5942, - "step": 73288 - }, - { - "epoch": 1.88, - "learning_rate": 6.477585844076822e-07, - "loss": 0.5674, - "step": 73289 - }, - { - "epoch": 1.88, - "learning_rate": 6.47732687510836e-07, - "loss": 0.6582, - "step": 73290 - }, - { - "epoch": 1.88, - "learning_rate": 6.477067908837047e-07, - "loss": 0.5112, - "step": 73291 - }, - { - "epoch": 1.88, - "learning_rate": 6.476808945263078e-07, - "loss": 0.6392, - "step": 73292 - }, - { - "epoch": 1.88, - "learning_rate": 6.476549984386656e-07, - "loss": 0.7021, - "step": 73293 - }, - { - "epoch": 1.88, - "learning_rate": 6.476291026207976e-07, - "loss": 0.7002, - "step": 73294 - }, - { - "epoch": 1.88, - "learning_rate": 6.47603207072724e-07, - "loss": 0.585, - "step": 73295 - }, - { - "epoch": 1.88, - "learning_rate": 6.475773117944641e-07, - "loss": 0.54, - "step": 73296 - }, - { - "epoch": 1.88, - "learning_rate": 6.475514167860383e-07, - "loss": 0.5522, - "step": 73297 - }, - { - "epoch": 1.88, - "learning_rate": 6.47525522047466e-07, - "loss": 0.6375, - "step": 73298 - }, - { - "epoch": 1.88, - "learning_rate": 6.474996275787674e-07, - "loss": 0.5422, - "step": 73299 - }, - { - "epoch": 1.88, - "learning_rate": 6.47473733379962e-07, - "loss": 0.8408, - "step": 73300 - }, - { - "epoch": 1.88, - "learning_rate": 6.474478394510703e-07, - "loss": 0.4768, - "step": 73301 - }, - { - "epoch": 1.88, - "learning_rate": 6.474219457921109e-07, - "loss": 0.7104, - "step": 73302 - }, - { - "epoch": 1.88, - "learning_rate": 6.473960524031046e-07, - "loss": 0.5327, - "step": 73303 - }, - { - "epoch": 1.88, - "learning_rate": 6.473701592840708e-07, - "loss": 0.6064, - "step": 73304 - }, - { - "epoch": 1.88, - "learning_rate": 6.473442664350294e-07, - "loss": 0.752, - "step": 73305 - }, - { - "epoch": 1.88, - "learning_rate": 6.473183738560002e-07, - "loss": 0.502, - "step": 73306 - }, - { - "epoch": 1.88, - "learning_rate": 6.472924815470035e-07, - "loss": 0.6143, - "step": 73307 - }, - { - "epoch": 1.88, - "learning_rate": 6.472665895080583e-07, - "loss": 0.5874, - "step": 73308 - }, - { - "epoch": 1.88, - "learning_rate": 6.472406977391851e-07, - "loss": 0.6846, - "step": 73309 - }, - { - "epoch": 1.88, - "learning_rate": 6.472148062404032e-07, - "loss": 0.8076, - "step": 73310 - }, - { - "epoch": 1.88, - "learning_rate": 6.471889150117334e-07, - "loss": 0.6074, - "step": 73311 - }, - { - "epoch": 1.88, - "learning_rate": 6.471630240531943e-07, - "loss": 0.4858, - "step": 73312 - }, - { - "epoch": 1.88, - "learning_rate": 6.471371333648062e-07, - "loss": 0.7266, - "step": 73313 - }, - { - "epoch": 1.88, - "learning_rate": 6.471112429465892e-07, - "loss": 0.5276, - "step": 73314 - }, - { - "epoch": 1.88, - "learning_rate": 6.470853527985627e-07, - "loss": 0.6489, - "step": 73315 - }, - { - "epoch": 1.88, - "learning_rate": 6.470594629207468e-07, - "loss": 0.8096, - "step": 73316 - }, - { - "epoch": 1.88, - "learning_rate": 6.470335733131611e-07, - "loss": 0.6377, - "step": 73317 - }, - { - "epoch": 1.88, - "learning_rate": 6.470076839758257e-07, - "loss": 0.5698, - "step": 73318 - }, - { - "epoch": 1.88, - "learning_rate": 6.469817949087602e-07, - "loss": 0.4629, - "step": 73319 - }, - { - "epoch": 1.88, - "learning_rate": 6.469559061119847e-07, - "loss": 0.6899, - "step": 73320 - }, - { - "epoch": 1.88, - "learning_rate": 6.469300175855189e-07, - "loss": 0.6665, - "step": 73321 - }, - { - "epoch": 1.88, - "learning_rate": 6.469041293293825e-07, - "loss": 0.6978, - "step": 73322 - }, - { - "epoch": 1.88, - "learning_rate": 6.468782413435951e-07, - "loss": 0.6108, - "step": 73323 - }, - { - "epoch": 1.88, - "learning_rate": 6.46852353628177e-07, - "loss": 0.6963, - "step": 73324 - }, - { - "epoch": 1.88, - "learning_rate": 6.468264661831475e-07, - "loss": 0.4211, - "step": 73325 - }, - { - "epoch": 1.88, - "learning_rate": 6.468005790085272e-07, - "loss": 0.834, - "step": 73326 - }, - { - "epoch": 1.88, - "learning_rate": 6.46774692104335e-07, - "loss": 0.4854, - "step": 73327 - }, - { - "epoch": 1.88, - "learning_rate": 6.467488054705915e-07, - "loss": 0.5557, - "step": 73328 - }, - { - "epoch": 1.88, - "learning_rate": 6.46722919107316e-07, - "loss": 0.5728, - "step": 73329 - }, - { - "epoch": 1.88, - "learning_rate": 6.466970330145288e-07, - "loss": 0.6025, - "step": 73330 - }, - { - "epoch": 1.88, - "learning_rate": 6.466711471922495e-07, - "loss": 0.6855, - "step": 73331 - }, - { - "epoch": 1.88, - "learning_rate": 6.466452616404974e-07, - "loss": 0.8311, - "step": 73332 - }, - { - "epoch": 1.88, - "learning_rate": 6.466193763592931e-07, - "loss": 0.7441, - "step": 73333 - }, - { - "epoch": 1.88, - "learning_rate": 6.465934913486558e-07, - "loss": 0.6318, - "step": 73334 - }, - { - "epoch": 1.88, - "learning_rate": 6.465676066086059e-07, - "loss": 0.364, - "step": 73335 - }, - { - "epoch": 1.88, - "learning_rate": 6.465417221391627e-07, - "loss": 0.7065, - "step": 73336 - }, - { - "epoch": 1.88, - "learning_rate": 6.465158379403465e-07, - "loss": 0.5386, - "step": 73337 - }, - { - "epoch": 1.88, - "learning_rate": 6.464899540121768e-07, - "loss": 0.6699, - "step": 73338 - }, - { - "epoch": 1.88, - "learning_rate": 6.464640703546733e-07, - "loss": 0.7754, - "step": 73339 - }, - { - "epoch": 1.88, - "learning_rate": 6.464381869678563e-07, - "loss": 0.5996, - "step": 73340 - }, - { - "epoch": 1.88, - "learning_rate": 6.464123038517454e-07, - "loss": 0.5503, - "step": 73341 - }, - { - "epoch": 1.88, - "learning_rate": 6.463864210063599e-07, - "loss": 0.7109, - "step": 73342 - }, - { - "epoch": 1.88, - "learning_rate": 6.463605384317204e-07, - "loss": 0.7764, - "step": 73343 - }, - { - "epoch": 1.88, - "learning_rate": 6.463346561278461e-07, - "loss": 0.8223, - "step": 73344 - }, - { - "epoch": 1.88, - "learning_rate": 6.463087740947573e-07, - "loss": 0.6826, - "step": 73345 - }, - { - "epoch": 1.88, - "learning_rate": 6.462828923324735e-07, - "loss": 0.6694, - "step": 73346 - }, - { - "epoch": 1.88, - "learning_rate": 6.462570108410145e-07, - "loss": 0.6396, - "step": 73347 - }, - { - "epoch": 1.88, - "learning_rate": 6.462311296204004e-07, - "loss": 0.7148, - "step": 73348 - }, - { - "epoch": 1.88, - "learning_rate": 6.46205248670651e-07, - "loss": 0.8818, - "step": 73349 - }, - { - "epoch": 1.88, - "learning_rate": 6.461793679917858e-07, - "loss": 0.6533, - "step": 73350 - }, - { - "epoch": 1.88, - "learning_rate": 6.461534875838251e-07, - "loss": 0.5173, - "step": 73351 - }, - { - "epoch": 1.88, - "learning_rate": 6.461276074467881e-07, - "loss": 0.668, - "step": 73352 - }, - { - "epoch": 1.88, - "learning_rate": 6.461017275806948e-07, - "loss": 0.7041, - "step": 73353 - }, - { - "epoch": 1.88, - "learning_rate": 6.460758479855654e-07, - "loss": 0.5286, - "step": 73354 - }, - { - "epoch": 1.88, - "learning_rate": 6.460499686614192e-07, - "loss": 0.6592, - "step": 73355 - }, - { - "epoch": 1.88, - "learning_rate": 6.460240896082765e-07, - "loss": 0.6641, - "step": 73356 - }, - { - "epoch": 1.88, - "learning_rate": 6.459982108261568e-07, - "loss": 0.4723, - "step": 73357 - }, - { - "epoch": 1.88, - "learning_rate": 6.459723323150799e-07, - "loss": 0.6621, - "step": 73358 - }, - { - "epoch": 1.88, - "learning_rate": 6.459464540750658e-07, - "loss": 0.6104, - "step": 73359 - }, - { - "epoch": 1.88, - "learning_rate": 6.45920576106134e-07, - "loss": 0.7998, - "step": 73360 - }, - { - "epoch": 1.88, - "learning_rate": 6.458946984083051e-07, - "loss": 0.7842, - "step": 73361 - }, - { - "epoch": 1.88, - "learning_rate": 6.45868820981598e-07, - "loss": 0.5771, - "step": 73362 - }, - { - "epoch": 1.88, - "learning_rate": 6.458429438260326e-07, - "loss": 0.5238, - "step": 73363 - }, - { - "epoch": 1.88, - "learning_rate": 6.458170669416294e-07, - "loss": 0.5542, - "step": 73364 - }, - { - "epoch": 1.88, - "learning_rate": 6.457911903284074e-07, - "loss": 0.6201, - "step": 73365 - }, - { - "epoch": 1.88, - "learning_rate": 6.457653139863872e-07, - "loss": 0.5225, - "step": 73366 - }, - { - "epoch": 1.88, - "learning_rate": 6.457394379155878e-07, - "loss": 0.6191, - "step": 73367 - }, - { - "epoch": 1.88, - "learning_rate": 6.457135621160296e-07, - "loss": 0.8135, - "step": 73368 - }, - { - "epoch": 1.88, - "learning_rate": 6.456876865877323e-07, - "loss": 0.5073, - "step": 73369 - }, - { - "epoch": 1.88, - "learning_rate": 6.456618113307157e-07, - "loss": 0.4872, - "step": 73370 - }, - { - "epoch": 1.88, - "learning_rate": 6.456359363449997e-07, - "loss": 0.6152, - "step": 73371 - }, - { - "epoch": 1.88, - "learning_rate": 6.456100616306036e-07, - "loss": 0.7056, - "step": 73372 - }, - { - "epoch": 1.88, - "learning_rate": 6.455841871875478e-07, - "loss": 0.7168, - "step": 73373 - }, - { - "epoch": 1.88, - "learning_rate": 6.45558313015852e-07, - "loss": 0.7227, - "step": 73374 - }, - { - "epoch": 1.88, - "learning_rate": 6.455324391155354e-07, - "loss": 0.5786, - "step": 73375 - }, - { - "epoch": 1.88, - "learning_rate": 6.455065654866187e-07, - "loss": 0.7065, - "step": 73376 - }, - { - "epoch": 1.88, - "learning_rate": 6.454806921291211e-07, - "loss": 0.6377, - "step": 73377 - }, - { - "epoch": 1.88, - "learning_rate": 6.45454819043063e-07, - "loss": 0.709, - "step": 73378 - }, - { - "epoch": 1.88, - "learning_rate": 6.454289462284635e-07, - "loss": 0.6729, - "step": 73379 - }, - { - "epoch": 1.88, - "learning_rate": 6.454030736853429e-07, - "loss": 0.4507, - "step": 73380 - }, - { - "epoch": 1.88, - "learning_rate": 6.45377201413721e-07, - "loss": 0.6875, - "step": 73381 - }, - { - "epoch": 1.88, - "learning_rate": 6.453513294136172e-07, - "loss": 0.7637, - "step": 73382 - }, - { - "epoch": 1.88, - "learning_rate": 6.453254576850519e-07, - "loss": 0.5747, - "step": 73383 - }, - { - "epoch": 1.88, - "learning_rate": 6.452995862280441e-07, - "loss": 0.4875, - "step": 73384 - }, - { - "epoch": 1.88, - "learning_rate": 6.452737150426146e-07, - "loss": 0.6523, - "step": 73385 - }, - { - "epoch": 1.88, - "learning_rate": 6.452478441287823e-07, - "loss": 0.5962, - "step": 73386 - }, - { - "epoch": 1.88, - "learning_rate": 6.452219734865677e-07, - "loss": 0.5903, - "step": 73387 - }, - { - "epoch": 1.88, - "learning_rate": 6.451961031159901e-07, - "loss": 0.6387, - "step": 73388 - }, - { - "epoch": 1.88, - "learning_rate": 6.451702330170696e-07, - "loss": 0.5649, - "step": 73389 - }, - { - "epoch": 1.88, - "learning_rate": 6.451443631898259e-07, - "loss": 0.5244, - "step": 73390 - }, - { - "epoch": 1.88, - "learning_rate": 6.451184936342795e-07, - "loss": 0.5691, - "step": 73391 - }, - { - "epoch": 1.88, - "learning_rate": 6.450926243504489e-07, - "loss": 0.6113, - "step": 73392 - }, - { - "epoch": 1.88, - "learning_rate": 6.450667553383546e-07, - "loss": 0.7012, - "step": 73393 - }, - { - "epoch": 1.88, - "learning_rate": 6.450408865980163e-07, - "loss": 0.6084, - "step": 73394 - }, - { - "epoch": 1.88, - "learning_rate": 6.45015018129454e-07, - "loss": 0.4329, - "step": 73395 - }, - { - "epoch": 1.88, - "learning_rate": 6.449891499326872e-07, - "loss": 0.6289, - "step": 73396 - }, - { - "epoch": 1.88, - "learning_rate": 6.449632820077362e-07, - "loss": 0.5203, - "step": 73397 - }, - { - "epoch": 1.88, - "learning_rate": 6.449374143546202e-07, - "loss": 0.6499, - "step": 73398 - }, - { - "epoch": 1.88, - "learning_rate": 6.449115469733595e-07, - "loss": 0.5742, - "step": 73399 - }, - { - "epoch": 1.88, - "learning_rate": 6.448856798639735e-07, - "loss": 0.6182, - "step": 73400 - }, - { - "epoch": 1.88, - "learning_rate": 6.448598130264827e-07, - "loss": 0.5918, - "step": 73401 - }, - { - "epoch": 1.88, - "learning_rate": 6.44833946460906e-07, - "loss": 0.5503, - "step": 73402 - }, - { - "epoch": 1.88, - "learning_rate": 6.448080801672635e-07, - "loss": 0.5938, - "step": 73403 - }, - { - "epoch": 1.88, - "learning_rate": 6.447822141455754e-07, - "loss": 0.6074, - "step": 73404 - }, - { - "epoch": 1.88, - "learning_rate": 6.44756348395861e-07, - "loss": 0.5542, - "step": 73405 - }, - { - "epoch": 1.88, - "learning_rate": 6.447304829181404e-07, - "loss": 0.4692, - "step": 73406 - }, - { - "epoch": 1.88, - "learning_rate": 6.447046177124333e-07, - "loss": 0.7607, - "step": 73407 - }, - { - "epoch": 1.88, - "learning_rate": 6.446787527787596e-07, - "loss": 0.3619, - "step": 73408 - }, - { - "epoch": 1.88, - "learning_rate": 6.446528881171389e-07, - "loss": 0.5212, - "step": 73409 - }, - { - "epoch": 1.88, - "learning_rate": 6.446270237275915e-07, - "loss": 0.6719, - "step": 73410 - }, - { - "epoch": 1.88, - "learning_rate": 6.446011596101368e-07, - "loss": 0.6382, - "step": 73411 - }, - { - "epoch": 1.88, - "learning_rate": 6.445752957647945e-07, - "loss": 0.5791, - "step": 73412 - }, - { - "epoch": 1.88, - "learning_rate": 6.445494321915845e-07, - "loss": 0.5762, - "step": 73413 - }, - { - "epoch": 1.88, - "learning_rate": 6.445235688905268e-07, - "loss": 0.7178, - "step": 73414 - }, - { - "epoch": 1.88, - "learning_rate": 6.444977058616407e-07, - "loss": 0.7588, - "step": 73415 - }, - { - "epoch": 1.88, - "learning_rate": 6.444718431049467e-07, - "loss": 0.6797, - "step": 73416 - }, - { - "epoch": 1.88, - "learning_rate": 6.444459806204641e-07, - "loss": 0.627, - "step": 73417 - }, - { - "epoch": 1.88, - "learning_rate": 6.44420118408213e-07, - "loss": 0.6143, - "step": 73418 - }, - { - "epoch": 1.88, - "learning_rate": 6.44394256468213e-07, - "loss": 0.6221, - "step": 73419 - }, - { - "epoch": 1.88, - "learning_rate": 6.443683948004839e-07, - "loss": 0.5376, - "step": 73420 - }, - { - "epoch": 1.88, - "learning_rate": 6.44342533405046e-07, - "loss": 0.7305, - "step": 73421 - }, - { - "epoch": 1.88, - "learning_rate": 6.443166722819182e-07, - "loss": 0.4888, - "step": 73422 - }, - { - "epoch": 1.88, - "learning_rate": 6.44290811431121e-07, - "loss": 0.6548, - "step": 73423 - }, - { - "epoch": 1.88, - "learning_rate": 6.442649508526736e-07, - "loss": 0.4561, - "step": 73424 - }, - { - "epoch": 1.88, - "learning_rate": 6.442390905465965e-07, - "loss": 0.5139, - "step": 73425 - }, - { - "epoch": 1.88, - "learning_rate": 6.44213230512909e-07, - "loss": 0.6577, - "step": 73426 - }, - { - "epoch": 1.88, - "learning_rate": 6.441873707516312e-07, - "loss": 0.668, - "step": 73427 - }, - { - "epoch": 1.88, - "learning_rate": 6.441615112627826e-07, - "loss": 0.627, - "step": 73428 - }, - { - "epoch": 1.88, - "learning_rate": 6.441356520463835e-07, - "loss": 0.2308, - "step": 73429 - }, - { - "epoch": 1.88, - "learning_rate": 6.44109793102453e-07, - "loss": 0.708, - "step": 73430 - }, - { - "epoch": 1.88, - "learning_rate": 6.440839344310118e-07, - "loss": 0.6354, - "step": 73431 - }, - { - "epoch": 1.88, - "learning_rate": 6.440580760320786e-07, - "loss": 0.7871, - "step": 73432 - }, - { - "epoch": 1.88, - "learning_rate": 6.440322179056741e-07, - "loss": 0.5664, - "step": 73433 - }, - { - "epoch": 1.88, - "learning_rate": 6.440063600518175e-07, - "loss": 0.6357, - "step": 73434 - }, - { - "epoch": 1.88, - "learning_rate": 6.439805024705291e-07, - "loss": 0.769, - "step": 73435 - }, - { - "epoch": 1.88, - "learning_rate": 6.439546451618282e-07, - "loss": 0.6484, - "step": 73436 - }, - { - "epoch": 1.88, - "learning_rate": 6.439287881257352e-07, - "loss": 0.6816, - "step": 73437 - }, - { - "epoch": 1.88, - "learning_rate": 6.43902931362269e-07, - "loss": 0.6729, - "step": 73438 - }, - { - "epoch": 1.88, - "learning_rate": 6.438770748714505e-07, - "loss": 0.6699, - "step": 73439 - }, - { - "epoch": 1.88, - "learning_rate": 6.438512186532986e-07, - "loss": 0.6626, - "step": 73440 - }, - { - "epoch": 1.88, - "learning_rate": 6.438253627078339e-07, - "loss": 0.5413, - "step": 73441 - }, - { - "epoch": 1.88, - "learning_rate": 6.437995070350754e-07, - "loss": 0.5659, - "step": 73442 - }, - { - "epoch": 1.88, - "learning_rate": 6.437736516350433e-07, - "loss": 0.7568, - "step": 73443 - }, - { - "epoch": 1.88, - "learning_rate": 6.437477965077573e-07, - "loss": 0.5513, - "step": 73444 - }, - { - "epoch": 1.88, - "learning_rate": 6.437219416532372e-07, - "loss": 0.4735, - "step": 73445 - }, - { - "epoch": 1.88, - "learning_rate": 6.436960870715029e-07, - "loss": 0.5645, - "step": 73446 - }, - { - "epoch": 1.88, - "learning_rate": 6.436702327625742e-07, - "loss": 0.6909, - "step": 73447 - }, - { - "epoch": 1.88, - "learning_rate": 6.436443787264706e-07, - "loss": 0.5566, - "step": 73448 - }, - { - "epoch": 1.88, - "learning_rate": 6.436185249632122e-07, - "loss": 0.6221, - "step": 73449 - }, - { - "epoch": 1.88, - "learning_rate": 6.435926714728187e-07, - "loss": 0.6855, - "step": 73450 - }, - { - "epoch": 1.88, - "learning_rate": 6.435668182553102e-07, - "loss": 0.7393, - "step": 73451 - }, - { - "epoch": 1.88, - "learning_rate": 6.43540965310706e-07, - "loss": 0.502, - "step": 73452 - }, - { - "epoch": 1.88, - "learning_rate": 6.435151126390259e-07, - "loss": 0.6826, - "step": 73453 - }, - { - "epoch": 1.88, - "learning_rate": 6.434892602402902e-07, - "loss": 0.6655, - "step": 73454 - }, - { - "epoch": 1.88, - "learning_rate": 6.43463408114518e-07, - "loss": 0.6284, - "step": 73455 - }, - { - "epoch": 1.88, - "learning_rate": 6.434375562617298e-07, - "loss": 0.7607, - "step": 73456 - }, - { - "epoch": 1.88, - "learning_rate": 6.434117046819447e-07, - "loss": 0.4937, - "step": 73457 - }, - { - "epoch": 1.88, - "learning_rate": 6.433858533751833e-07, - "loss": 0.6182, - "step": 73458 - }, - { - "epoch": 1.88, - "learning_rate": 6.433600023414645e-07, - "loss": 0.6748, - "step": 73459 - }, - { - "epoch": 1.88, - "learning_rate": 6.43334151580809e-07, - "loss": 0.6807, - "step": 73460 - }, - { - "epoch": 1.88, - "learning_rate": 6.433083010932362e-07, - "loss": 0.7354, - "step": 73461 - }, - { - "epoch": 1.88, - "learning_rate": 6.432824508787655e-07, - "loss": 0.5703, - "step": 73462 - }, - { - "epoch": 1.88, - "learning_rate": 6.432566009374171e-07, - "loss": 0.4487, - "step": 73463 - }, - { - "epoch": 1.88, - "learning_rate": 6.432307512692108e-07, - "loss": 0.5107, - "step": 73464 - }, - { - "epoch": 1.88, - "learning_rate": 6.432049018741661e-07, - "loss": 0.5125, - "step": 73465 - }, - { - "epoch": 1.88, - "learning_rate": 6.431790527523032e-07, - "loss": 0.6963, - "step": 73466 - }, - { - "epoch": 1.88, - "learning_rate": 6.431532039036414e-07, - "loss": 0.6177, - "step": 73467 - }, - { - "epoch": 1.88, - "learning_rate": 6.431273553282012e-07, - "loss": 0.6641, - "step": 73468 - }, - { - "epoch": 1.88, - "learning_rate": 6.431015070260017e-07, - "loss": 0.8887, - "step": 73469 - }, - { - "epoch": 1.88, - "learning_rate": 6.430756589970631e-07, - "loss": 0.7354, - "step": 73470 - }, - { - "epoch": 1.88, - "learning_rate": 6.430498112414052e-07, - "loss": 0.8076, - "step": 73471 - }, - { - "epoch": 1.88, - "learning_rate": 6.430239637590473e-07, - "loss": 0.5566, - "step": 73472 - }, - { - "epoch": 1.88, - "learning_rate": 6.429981165500098e-07, - "loss": 0.582, - "step": 73473 - }, - { - "epoch": 1.88, - "learning_rate": 6.42972269614312e-07, - "loss": 0.6465, - "step": 73474 - }, - { - "epoch": 1.88, - "learning_rate": 6.429464229519741e-07, - "loss": 0.6157, - "step": 73475 - }, - { - "epoch": 1.88, - "learning_rate": 6.429205765630155e-07, - "loss": 0.7593, - "step": 73476 - }, - { - "epoch": 1.88, - "learning_rate": 6.428947304474563e-07, - "loss": 0.5635, - "step": 73477 - }, - { - "epoch": 1.88, - "learning_rate": 6.428688846053162e-07, - "loss": 0.624, - "step": 73478 - }, - { - "epoch": 1.88, - "learning_rate": 6.428430390366151e-07, - "loss": 0.6924, - "step": 73479 - }, - { - "epoch": 1.88, - "learning_rate": 6.428171937413725e-07, - "loss": 0.8018, - "step": 73480 - }, - { - "epoch": 1.88, - "learning_rate": 6.427913487196089e-07, - "loss": 0.6597, - "step": 73481 - }, - { - "epoch": 1.88, - "learning_rate": 6.427655039713428e-07, - "loss": 0.6436, - "step": 73482 - }, - { - "epoch": 1.88, - "learning_rate": 6.427396594965951e-07, - "loss": 0.6777, - "step": 73483 - }, - { - "epoch": 1.88, - "learning_rate": 6.427138152953848e-07, - "loss": 0.4271, - "step": 73484 - }, - { - "epoch": 1.88, - "learning_rate": 6.426879713677326e-07, - "loss": 0.585, - "step": 73485 - }, - { - "epoch": 1.88, - "learning_rate": 6.426621277136575e-07, - "loss": 0.563, - "step": 73486 - }, - { - "epoch": 1.88, - "learning_rate": 6.426362843331796e-07, - "loss": 0.7617, - "step": 73487 - }, - { - "epoch": 1.88, - "learning_rate": 6.426104412263187e-07, - "loss": 0.4236, - "step": 73488 - }, - { - "epoch": 1.88, - "learning_rate": 6.425845983930947e-07, - "loss": 0.6875, - "step": 73489 - }, - { - "epoch": 1.88, - "learning_rate": 6.425587558335268e-07, - "loss": 0.5864, - "step": 73490 - }, - { - "epoch": 1.88, - "learning_rate": 6.425329135476359e-07, - "loss": 0.6514, - "step": 73491 - }, - { - "epoch": 1.88, - "learning_rate": 6.425070715354408e-07, - "loss": 0.5698, - "step": 73492 - }, - { - "epoch": 1.88, - "learning_rate": 6.424812297969615e-07, - "loss": 0.7559, - "step": 73493 - }, - { - "epoch": 1.88, - "learning_rate": 6.424553883322179e-07, - "loss": 0.3063, - "step": 73494 - }, - { - "epoch": 1.88, - "learning_rate": 6.424295471412297e-07, - "loss": 0.5562, - "step": 73495 - }, - { - "epoch": 1.88, - "learning_rate": 6.424037062240169e-07, - "loss": 0.6965, - "step": 73496 - }, - { - "epoch": 1.88, - "learning_rate": 6.423778655805989e-07, - "loss": 0.8184, - "step": 73497 - }, - { - "epoch": 1.88, - "learning_rate": 6.42352025210996e-07, - "loss": 0.5745, - "step": 73498 - }, - { - "epoch": 1.88, - "learning_rate": 6.423261851152275e-07, - "loss": 0.7383, - "step": 73499 - }, - { - "epoch": 1.88, - "learning_rate": 6.423003452933137e-07, - "loss": 0.6406, - "step": 73500 - }, - { - "epoch": 1.88, - "learning_rate": 6.42274505745274e-07, - "loss": 0.7422, - "step": 73501 - }, - { - "epoch": 1.88, - "learning_rate": 6.422486664711284e-07, - "loss": 0.4399, - "step": 73502 - }, - { - "epoch": 1.88, - "learning_rate": 6.422228274708962e-07, - "loss": 0.6084, - "step": 73503 - }, - { - "epoch": 1.88, - "learning_rate": 6.421969887445977e-07, - "loss": 0.668, - "step": 73504 - }, - { - "epoch": 1.88, - "learning_rate": 6.421711502922523e-07, - "loss": 0.5659, - "step": 73505 - }, - { - "epoch": 1.88, - "learning_rate": 6.421453121138802e-07, - "loss": 0.6807, - "step": 73506 - }, - { - "epoch": 1.88, - "learning_rate": 6.421194742095009e-07, - "loss": 0.5923, - "step": 73507 - }, - { - "epoch": 1.88, - "learning_rate": 6.420936365791343e-07, - "loss": 0.6846, - "step": 73508 - }, - { - "epoch": 1.88, - "learning_rate": 6.420677992228e-07, - "loss": 0.6831, - "step": 73509 - }, - { - "epoch": 1.88, - "learning_rate": 6.420419621405182e-07, - "loss": 0.5408, - "step": 73510 - }, - { - "epoch": 1.88, - "learning_rate": 6.420161253323084e-07, - "loss": 0.5663, - "step": 73511 - }, - { - "epoch": 1.88, - "learning_rate": 6.419902887981903e-07, - "loss": 0.6553, - "step": 73512 - }, - { - "epoch": 1.88, - "learning_rate": 6.419644525381837e-07, - "loss": 0.71, - "step": 73513 - }, - { - "epoch": 1.88, - "learning_rate": 6.419386165523084e-07, - "loss": 0.5161, - "step": 73514 - }, - { - "epoch": 1.88, - "learning_rate": 6.419127808405844e-07, - "loss": 0.6621, - "step": 73515 - }, - { - "epoch": 1.88, - "learning_rate": 6.418869454030311e-07, - "loss": 0.709, - "step": 73516 - }, - { - "epoch": 1.88, - "learning_rate": 6.418611102396687e-07, - "loss": 0.6416, - "step": 73517 - }, - { - "epoch": 1.88, - "learning_rate": 6.418352753505167e-07, - "loss": 0.7061, - "step": 73518 - }, - { - "epoch": 1.88, - "learning_rate": 6.418094407355949e-07, - "loss": 0.665, - "step": 73519 - }, - { - "epoch": 1.88, - "learning_rate": 6.417836063949235e-07, - "loss": 0.6445, - "step": 73520 - }, - { - "epoch": 1.88, - "learning_rate": 6.417577723285219e-07, - "loss": 0.6924, - "step": 73521 - }, - { - "epoch": 1.88, - "learning_rate": 6.417319385364095e-07, - "loss": 0.6455, - "step": 73522 - }, - { - "epoch": 1.88, - "learning_rate": 6.417061050186068e-07, - "loss": 0.4741, - "step": 73523 - }, - { - "epoch": 1.88, - "learning_rate": 6.416802717751328e-07, - "loss": 0.7803, - "step": 73524 - }, - { - "epoch": 1.88, - "learning_rate": 6.416544388060081e-07, - "loss": 0.6255, - "step": 73525 - }, - { - "epoch": 1.88, - "learning_rate": 6.41628606111252e-07, - "loss": 0.5625, - "step": 73526 - }, - { - "epoch": 1.88, - "learning_rate": 6.416027736908846e-07, - "loss": 0.6523, - "step": 73527 - }, - { - "epoch": 1.88, - "learning_rate": 6.415769415449251e-07, - "loss": 0.6938, - "step": 73528 - }, - { - "epoch": 1.88, - "learning_rate": 6.41551109673394e-07, - "loss": 0.7314, - "step": 73529 - }, - { - "epoch": 1.88, - "learning_rate": 6.415252780763105e-07, - "loss": 0.3878, - "step": 73530 - }, - { - "epoch": 1.88, - "learning_rate": 6.414994467536949e-07, - "loss": 0.5786, - "step": 73531 - }, - { - "epoch": 1.88, - "learning_rate": 6.414736157055667e-07, - "loss": 0.832, - "step": 73532 - }, - { - "epoch": 1.88, - "learning_rate": 6.414477849319453e-07, - "loss": 0.5424, - "step": 73533 - }, - { - "epoch": 1.88, - "learning_rate": 6.414219544328512e-07, - "loss": 0.4399, - "step": 73534 - }, - { - "epoch": 1.88, - "learning_rate": 6.413961242083034e-07, - "loss": 0.5684, - "step": 73535 - }, - { - "epoch": 1.88, - "learning_rate": 6.413702942583225e-07, - "loss": 0.709, - "step": 73536 - }, - { - "epoch": 1.88, - "learning_rate": 6.413444645829278e-07, - "loss": 0.4976, - "step": 73537 - }, - { - "epoch": 1.88, - "learning_rate": 6.413186351821389e-07, - "loss": 0.6963, - "step": 73538 - }, - { - "epoch": 1.88, - "learning_rate": 6.412928060559761e-07, - "loss": 0.4893, - "step": 73539 - }, - { - "epoch": 1.88, - "learning_rate": 6.412669772044588e-07, - "loss": 0.5869, - "step": 73540 - }, - { - "epoch": 1.88, - "learning_rate": 6.41241148627607e-07, - "loss": 0.5237, - "step": 73541 - }, - { - "epoch": 1.88, - "learning_rate": 6.412153203254404e-07, - "loss": 0.6982, - "step": 73542 - }, - { - "epoch": 1.88, - "learning_rate": 6.411894922979785e-07, - "loss": 0.7114, - "step": 73543 - }, - { - "epoch": 1.88, - "learning_rate": 6.411636645452414e-07, - "loss": 0.429, - "step": 73544 - }, - { - "epoch": 1.88, - "learning_rate": 6.411378370672486e-07, - "loss": 0.7998, - "step": 73545 - }, - { - "epoch": 1.89, - "learning_rate": 6.411120098640203e-07, - "loss": 0.5688, - "step": 73546 - }, - { - "epoch": 1.89, - "learning_rate": 6.410861829355759e-07, - "loss": 0.438, - "step": 73547 - }, - { - "epoch": 1.89, - "learning_rate": 6.410603562819354e-07, - "loss": 0.6123, - "step": 73548 - }, - { - "epoch": 1.89, - "learning_rate": 6.410345299031184e-07, - "loss": 0.6782, - "step": 73549 - }, - { - "epoch": 1.89, - "learning_rate": 6.410087037991449e-07, - "loss": 0.7197, - "step": 73550 - }, - { - "epoch": 1.89, - "learning_rate": 6.409828779700346e-07, - "loss": 0.6934, - "step": 73551 - }, - { - "epoch": 1.89, - "learning_rate": 6.40957052415807e-07, - "loss": 0.5889, - "step": 73552 - }, - { - "epoch": 1.89, - "learning_rate": 6.409312271364822e-07, - "loss": 0.5107, - "step": 73553 - }, - { - "epoch": 1.89, - "learning_rate": 6.409054021320797e-07, - "loss": 0.5576, - "step": 73554 - }, - { - "epoch": 1.89, - "learning_rate": 6.408795774026194e-07, - "loss": 0.749, - "step": 73555 - }, - { - "epoch": 1.89, - "learning_rate": 6.408537529481213e-07, - "loss": 0.6968, - "step": 73556 - }, - { - "epoch": 1.89, - "learning_rate": 6.408279287686047e-07, - "loss": 0.5166, - "step": 73557 - }, - { - "epoch": 1.89, - "learning_rate": 6.408021048640899e-07, - "loss": 0.5532, - "step": 73558 - }, - { - "epoch": 1.89, - "learning_rate": 6.407762812345962e-07, - "loss": 0.5825, - "step": 73559 - }, - { - "epoch": 1.89, - "learning_rate": 6.407504578801437e-07, - "loss": 0.6768, - "step": 73560 - }, - { - "epoch": 1.89, - "learning_rate": 6.407246348007522e-07, - "loss": 0.7158, - "step": 73561 - }, - { - "epoch": 1.89, - "learning_rate": 6.406988119964412e-07, - "loss": 0.4843, - "step": 73562 - }, - { - "epoch": 1.89, - "learning_rate": 6.406729894672306e-07, - "loss": 0.6748, - "step": 73563 - }, - { - "epoch": 1.89, - "learning_rate": 6.406471672131399e-07, - "loss": 0.6816, - "step": 73564 - }, - { - "epoch": 1.89, - "learning_rate": 6.406213452341896e-07, - "loss": 0.6421, - "step": 73565 - }, - { - "epoch": 1.89, - "learning_rate": 6.405955235303986e-07, - "loss": 0.6963, - "step": 73566 - }, - { - "epoch": 1.89, - "learning_rate": 6.405697021017873e-07, - "loss": 0.6035, - "step": 73567 - }, - { - "epoch": 1.89, - "learning_rate": 6.405438809483751e-07, - "loss": 0.7598, - "step": 73568 - }, - { - "epoch": 1.89, - "learning_rate": 6.405180600701821e-07, - "loss": 0.6665, - "step": 73569 - }, - { - "epoch": 1.89, - "learning_rate": 6.404922394672277e-07, - "loss": 0.6787, - "step": 73570 - }, - { - "epoch": 1.89, - "learning_rate": 6.404664191395325e-07, - "loss": 0.6865, - "step": 73571 - }, - { - "epoch": 1.89, - "learning_rate": 6.404405990871149e-07, - "loss": 0.4917, - "step": 73572 - }, - { - "epoch": 1.89, - "learning_rate": 6.404147793099957e-07, - "loss": 0.5801, - "step": 73573 - }, - { - "epoch": 1.89, - "learning_rate": 6.403889598081942e-07, - "loss": 0.418, - "step": 73574 - }, - { - "epoch": 1.89, - "learning_rate": 6.403631405817304e-07, - "loss": 0.6836, - "step": 73575 - }, - { - "epoch": 1.89, - "learning_rate": 6.403373216306241e-07, - "loss": 0.4673, - "step": 73576 - }, - { - "epoch": 1.89, - "learning_rate": 6.403115029548949e-07, - "loss": 0.6963, - "step": 73577 - }, - { - "epoch": 1.89, - "learning_rate": 6.402856845545625e-07, - "loss": 0.6611, - "step": 73578 - }, - { - "epoch": 1.89, - "learning_rate": 6.40259866429647e-07, - "loss": 0.5957, - "step": 73579 - }, - { - "epoch": 1.89, - "learning_rate": 6.402340485801678e-07, - "loss": 0.5151, - "step": 73580 - }, - { - "epoch": 1.89, - "learning_rate": 6.402082310061454e-07, - "loss": 0.6758, - "step": 73581 - }, - { - "epoch": 1.89, - "learning_rate": 6.401824137075986e-07, - "loss": 0.6929, - "step": 73582 - }, - { - "epoch": 1.89, - "learning_rate": 6.401565966845475e-07, - "loss": 0.6035, - "step": 73583 - }, - { - "epoch": 1.89, - "learning_rate": 6.401307799370122e-07, - "loss": 0.6016, - "step": 73584 - }, - { - "epoch": 1.89, - "learning_rate": 6.401049634650118e-07, - "loss": 0.6055, - "step": 73585 - }, - { - "epoch": 1.89, - "learning_rate": 6.400791472685668e-07, - "loss": 0.6387, - "step": 73586 - }, - { - "epoch": 1.89, - "learning_rate": 6.400533313476965e-07, - "loss": 0.6392, - "step": 73587 - }, - { - "epoch": 1.89, - "learning_rate": 6.400275157024209e-07, - "loss": 0.8164, - "step": 73588 - }, - { - "epoch": 1.89, - "learning_rate": 6.400017003327596e-07, - "loss": 0.5835, - "step": 73589 - }, - { - "epoch": 1.89, - "learning_rate": 6.399758852387329e-07, - "loss": 0.7314, - "step": 73590 - }, - { - "epoch": 1.89, - "learning_rate": 6.399500704203596e-07, - "loss": 0.7412, - "step": 73591 - }, - { - "epoch": 1.89, - "learning_rate": 6.399242558776603e-07, - "loss": 0.6475, - "step": 73592 - }, - { - "epoch": 1.89, - "learning_rate": 6.398984416106541e-07, - "loss": 0.6318, - "step": 73593 - }, - { - "epoch": 1.89, - "learning_rate": 6.398726276193613e-07, - "loss": 0.6387, - "step": 73594 - }, - { - "epoch": 1.89, - "learning_rate": 6.398468139038013e-07, - "loss": 0.6218, - "step": 73595 - }, - { - "epoch": 1.89, - "learning_rate": 6.398210004639941e-07, - "loss": 0.7305, - "step": 73596 - }, - { - "epoch": 1.89, - "learning_rate": 6.397951872999594e-07, - "loss": 0.667, - "step": 73597 - }, - { - "epoch": 1.89, - "learning_rate": 6.397693744117171e-07, - "loss": 0.6235, - "step": 73598 - }, - { - "epoch": 1.89, - "learning_rate": 6.397435617992866e-07, - "loss": 0.7114, - "step": 73599 - }, - { - "epoch": 1.89, - "learning_rate": 6.397177494626883e-07, - "loss": 0.4692, - "step": 73600 - }, - { - "epoch": 1.89, - "learning_rate": 6.396919374019413e-07, - "loss": 0.5654, - "step": 73601 - }, - { - "epoch": 1.89, - "learning_rate": 6.396661256170654e-07, - "loss": 0.5991, - "step": 73602 - }, - { - "epoch": 1.89, - "learning_rate": 6.39640314108081e-07, - "loss": 0.5547, - "step": 73603 - }, - { - "epoch": 1.89, - "learning_rate": 6.39614502875007e-07, - "loss": 0.5728, - "step": 73604 - }, - { - "epoch": 1.89, - "learning_rate": 6.395886919178639e-07, - "loss": 0.7979, - "step": 73605 - }, - { - "epoch": 1.89, - "learning_rate": 6.39562881236671e-07, - "loss": 0.7959, - "step": 73606 - }, - { - "epoch": 1.89, - "learning_rate": 6.395370708314485e-07, - "loss": 0.6562, - "step": 73607 - }, - { - "epoch": 1.89, - "learning_rate": 6.395112607022155e-07, - "loss": 0.6562, - "step": 73608 - }, - { - "epoch": 1.89, - "learning_rate": 6.394854508489924e-07, - "loss": 0.5635, - "step": 73609 - }, - { - "epoch": 1.89, - "learning_rate": 6.39459641271799e-07, - "loss": 0.6382, - "step": 73610 - }, - { - "epoch": 1.89, - "learning_rate": 6.394338319706545e-07, - "loss": 0.5308, - "step": 73611 - }, - { - "epoch": 1.89, - "learning_rate": 6.394080229455787e-07, - "loss": 0.5305, - "step": 73612 - }, - { - "epoch": 1.89, - "learning_rate": 6.393822141965919e-07, - "loss": 0.7319, - "step": 73613 - }, - { - "epoch": 1.89, - "learning_rate": 6.393564057237133e-07, - "loss": 0.709, - "step": 73614 - }, - { - "epoch": 1.89, - "learning_rate": 6.393305975269631e-07, - "loss": 0.7148, - "step": 73615 - }, - { - "epoch": 1.89, - "learning_rate": 6.393047896063608e-07, - "loss": 0.6416, - "step": 73616 - }, - { - "epoch": 1.89, - "learning_rate": 6.392789819619262e-07, - "loss": 0.5806, - "step": 73617 - }, - { - "epoch": 1.89, - "learning_rate": 6.392531745936791e-07, - "loss": 0.6069, - "step": 73618 - }, - { - "epoch": 1.89, - "learning_rate": 6.392273675016394e-07, - "loss": 0.6143, - "step": 73619 - }, - { - "epoch": 1.89, - "learning_rate": 6.39201560685827e-07, - "loss": 0.4692, - "step": 73620 - }, - { - "epoch": 1.89, - "learning_rate": 6.391757541462608e-07, - "loss": 0.7344, - "step": 73621 - }, - { - "epoch": 1.89, - "learning_rate": 6.391499478829614e-07, - "loss": 0.6226, - "step": 73622 - }, - { - "epoch": 1.89, - "learning_rate": 6.391241418959481e-07, - "loss": 0.4333, - "step": 73623 - }, - { - "epoch": 1.89, - "learning_rate": 6.390983361852411e-07, - "loss": 0.5469, - "step": 73624 - }, - { - "epoch": 1.89, - "learning_rate": 6.390725307508597e-07, - "loss": 0.5669, - "step": 73625 - }, - { - "epoch": 1.89, - "learning_rate": 6.39046725592824e-07, - "loss": 0.6758, - "step": 73626 - }, - { - "epoch": 1.89, - "learning_rate": 6.390209207111536e-07, - "loss": 0.5576, - "step": 73627 - }, - { - "epoch": 1.89, - "learning_rate": 6.389951161058682e-07, - "loss": 0.7686, - "step": 73628 - }, - { - "epoch": 1.89, - "learning_rate": 6.389693117769879e-07, - "loss": 0.6006, - "step": 73629 - }, - { - "epoch": 1.89, - "learning_rate": 6.389435077245322e-07, - "loss": 0.5332, - "step": 73630 - }, - { - "epoch": 1.89, - "learning_rate": 6.389177039485205e-07, - "loss": 0.3975, - "step": 73631 - }, - { - "epoch": 1.89, - "learning_rate": 6.388919004489732e-07, - "loss": 0.6646, - "step": 73632 - }, - { - "epoch": 1.89, - "learning_rate": 6.388660972259095e-07, - "loss": 0.7729, - "step": 73633 - }, - { - "epoch": 1.89, - "learning_rate": 6.388402942793496e-07, - "loss": 0.6475, - "step": 73634 - }, - { - "epoch": 1.89, - "learning_rate": 6.38814491609313e-07, - "loss": 0.6562, - "step": 73635 - }, - { - "epoch": 1.89, - "learning_rate": 6.387886892158196e-07, - "loss": 0.5815, - "step": 73636 - }, - { - "epoch": 1.89, - "learning_rate": 6.387628870988891e-07, - "loss": 0.3828, - "step": 73637 - }, - { - "epoch": 1.89, - "learning_rate": 6.387370852585412e-07, - "loss": 0.6841, - "step": 73638 - }, - { - "epoch": 1.89, - "learning_rate": 6.387112836947956e-07, - "loss": 0.665, - "step": 73639 - }, - { - "epoch": 1.89, - "learning_rate": 6.386854824076725e-07, - "loss": 0.6338, - "step": 73640 - }, - { - "epoch": 1.89, - "learning_rate": 6.386596813971912e-07, - "loss": 0.6089, - "step": 73641 - }, - { - "epoch": 1.89, - "learning_rate": 6.386338806633713e-07, - "loss": 0.5962, - "step": 73642 - }, - { - "epoch": 1.89, - "learning_rate": 6.38608080206233e-07, - "loss": 0.7041, - "step": 73643 - }, - { - "epoch": 1.89, - "learning_rate": 6.385822800257961e-07, - "loss": 0.603, - "step": 73644 - }, - { - "epoch": 1.89, - "learning_rate": 6.385564801220797e-07, - "loss": 0.5464, - "step": 73645 - }, - { - "epoch": 1.89, - "learning_rate": 6.385306804951043e-07, - "loss": 0.6279, - "step": 73646 - }, - { - "epoch": 1.89, - "learning_rate": 6.385048811448889e-07, - "loss": 0.5083, - "step": 73647 - }, - { - "epoch": 1.89, - "learning_rate": 6.384790820714542e-07, - "loss": 0.7676, - "step": 73648 - }, - { - "epoch": 1.89, - "learning_rate": 6.38453283274819e-07, - "loss": 0.6484, - "step": 73649 - }, - { - "epoch": 1.89, - "learning_rate": 6.384274847550042e-07, - "loss": 0.7627, - "step": 73650 - }, - { - "epoch": 1.89, - "learning_rate": 6.384016865120284e-07, - "loss": 0.6177, - "step": 73651 - }, - { - "epoch": 1.89, - "learning_rate": 6.383758885459117e-07, - "loss": 0.6479, - "step": 73652 - }, - { - "epoch": 1.89, - "learning_rate": 6.383500908566741e-07, - "loss": 0.793, - "step": 73653 - }, - { - "epoch": 1.89, - "learning_rate": 6.38324293444335e-07, - "loss": 0.5723, - "step": 73654 - }, - { - "epoch": 1.89, - "learning_rate": 6.382984963089147e-07, - "loss": 0.625, - "step": 73655 - }, - { - "epoch": 1.89, - "learning_rate": 6.382726994504322e-07, - "loss": 0.6299, - "step": 73656 - }, - { - "epoch": 1.89, - "learning_rate": 6.38246902868908e-07, - "loss": 0.6797, - "step": 73657 - }, - { - "epoch": 1.89, - "learning_rate": 6.382211065643612e-07, - "loss": 0.6484, - "step": 73658 - }, - { - "epoch": 1.89, - "learning_rate": 6.381953105368121e-07, - "loss": 0.5947, - "step": 73659 - }, - { - "epoch": 1.89, - "learning_rate": 6.381695147862805e-07, - "loss": 0.6582, - "step": 73660 - }, - { - "epoch": 1.89, - "learning_rate": 6.381437193127856e-07, - "loss": 0.7734, - "step": 73661 - }, - { - "epoch": 1.89, - "learning_rate": 6.381179241163473e-07, - "loss": 0.5789, - "step": 73662 - }, - { - "epoch": 1.89, - "learning_rate": 6.380921291969856e-07, - "loss": 0.624, - "step": 73663 - }, - { - "epoch": 1.89, - "learning_rate": 6.380663345547199e-07, - "loss": 0.7578, - "step": 73664 - }, - { - "epoch": 1.89, - "learning_rate": 6.380405401895703e-07, - "loss": 0.6855, - "step": 73665 - }, - { - "epoch": 1.89, - "learning_rate": 6.380147461015564e-07, - "loss": 0.7061, - "step": 73666 - }, - { - "epoch": 1.89, - "learning_rate": 6.379889522906979e-07, - "loss": 0.451, - "step": 73667 - }, - { - "epoch": 1.89, - "learning_rate": 6.379631587570147e-07, - "loss": 0.7793, - "step": 73668 - }, - { - "epoch": 1.89, - "learning_rate": 6.379373655005265e-07, - "loss": 0.7222, - "step": 73669 - }, - { - "epoch": 1.89, - "learning_rate": 6.379115725212532e-07, - "loss": 0.5112, - "step": 73670 - }, - { - "epoch": 1.89, - "learning_rate": 6.37885779819214e-07, - "loss": 0.6201, - "step": 73671 - }, - { - "epoch": 1.89, - "learning_rate": 6.378599873944292e-07, - "loss": 0.8799, - "step": 73672 - }, - { - "epoch": 1.89, - "learning_rate": 6.378341952469182e-07, - "loss": 0.749, - "step": 73673 - }, - { - "epoch": 1.89, - "learning_rate": 6.37808403376701e-07, - "loss": 0.7236, - "step": 73674 - }, - { - "epoch": 1.89, - "learning_rate": 6.377826117837973e-07, - "loss": 0.6538, - "step": 73675 - }, - { - "epoch": 1.89, - "learning_rate": 6.377568204682267e-07, - "loss": 0.5908, - "step": 73676 - }, - { - "epoch": 1.89, - "learning_rate": 6.377310294300089e-07, - "loss": 0.6914, - "step": 73677 - }, - { - "epoch": 1.89, - "learning_rate": 6.377052386691642e-07, - "loss": 0.6489, - "step": 73678 - }, - { - "epoch": 1.89, - "learning_rate": 6.376794481857115e-07, - "loss": 0.5718, - "step": 73679 - }, - { - "epoch": 1.89, - "learning_rate": 6.376536579796716e-07, - "loss": 0.6001, - "step": 73680 - }, - { - "epoch": 1.89, - "learning_rate": 6.376278680510632e-07, - "loss": 0.5786, - "step": 73681 - }, - { - "epoch": 1.89, - "learning_rate": 6.376020783999066e-07, - "loss": 0.5923, - "step": 73682 - }, - { - "epoch": 1.89, - "learning_rate": 6.375762890262213e-07, - "loss": 0.7354, - "step": 73683 - }, - { - "epoch": 1.89, - "learning_rate": 6.375504999300272e-07, - "loss": 0.5649, - "step": 73684 - }, - { - "epoch": 1.89, - "learning_rate": 6.37524711111344e-07, - "loss": 0.6343, - "step": 73685 - }, - { - "epoch": 1.89, - "learning_rate": 6.374989225701915e-07, - "loss": 0.7256, - "step": 73686 - }, - { - "epoch": 1.89, - "learning_rate": 6.374731343065893e-07, - "loss": 0.5898, - "step": 73687 - }, - { - "epoch": 1.89, - "learning_rate": 6.374473463205574e-07, - "loss": 0.5588, - "step": 73688 - }, - { - "epoch": 1.89, - "learning_rate": 6.374215586121152e-07, - "loss": 0.8115, - "step": 73689 - }, - { - "epoch": 1.89, - "learning_rate": 6.373957711812832e-07, - "loss": 0.6416, - "step": 73690 - }, - { - "epoch": 1.89, - "learning_rate": 6.373699840280802e-07, - "loss": 0.6992, - "step": 73691 - }, - { - "epoch": 1.89, - "learning_rate": 6.373441971525262e-07, - "loss": 0.6855, - "step": 73692 - }, - { - "epoch": 1.89, - "learning_rate": 6.373184105546412e-07, - "loss": 0.6284, - "step": 73693 - }, - { - "epoch": 1.89, - "learning_rate": 6.372926242344447e-07, - "loss": 0.7148, - "step": 73694 - }, - { - "epoch": 1.89, - "learning_rate": 6.372668381919567e-07, - "loss": 0.5645, - "step": 73695 - }, - { - "epoch": 1.89, - "learning_rate": 6.372410524271966e-07, - "loss": 0.5354, - "step": 73696 - }, - { - "epoch": 1.89, - "learning_rate": 6.372152669401847e-07, - "loss": 0.6685, - "step": 73697 - }, - { - "epoch": 1.89, - "learning_rate": 6.3718948173094e-07, - "loss": 0.6553, - "step": 73698 - }, - { - "epoch": 1.89, - "learning_rate": 6.371636967994829e-07, - "loss": 0.6611, - "step": 73699 - }, - { - "epoch": 1.89, - "learning_rate": 6.371379121458331e-07, - "loss": 0.437, - "step": 73700 - }, - { - "epoch": 1.89, - "learning_rate": 6.371121277700098e-07, - "loss": 0.4724, - "step": 73701 - }, - { - "epoch": 1.89, - "learning_rate": 6.370863436720331e-07, - "loss": 0.4368, - "step": 73702 - }, - { - "epoch": 1.89, - "learning_rate": 6.370605598519226e-07, - "loss": 0.6772, - "step": 73703 - }, - { - "epoch": 1.89, - "learning_rate": 6.370347763096982e-07, - "loss": 0.6504, - "step": 73704 - }, - { - "epoch": 1.89, - "learning_rate": 6.370089930453796e-07, - "loss": 0.4858, - "step": 73705 - }, - { - "epoch": 1.89, - "learning_rate": 6.369832100589864e-07, - "loss": 0.666, - "step": 73706 - }, - { - "epoch": 1.89, - "learning_rate": 6.369574273505387e-07, - "loss": 0.5869, - "step": 73707 - }, - { - "epoch": 1.89, - "learning_rate": 6.369316449200557e-07, - "loss": 0.7129, - "step": 73708 - }, - { - "epoch": 1.89, - "learning_rate": 6.369058627675576e-07, - "loss": 0.7207, - "step": 73709 - }, - { - "epoch": 1.89, - "learning_rate": 6.368800808930644e-07, - "loss": 0.6011, - "step": 73710 - }, - { - "epoch": 1.89, - "learning_rate": 6.368542992965949e-07, - "loss": 0.6763, - "step": 73711 - }, - { - "epoch": 1.89, - "learning_rate": 6.368285179781696e-07, - "loss": 0.7129, - "step": 73712 - }, - { - "epoch": 1.89, - "learning_rate": 6.368027369378077e-07, - "loss": 0.5898, - "step": 73713 - }, - { - "epoch": 1.89, - "learning_rate": 6.367769561755296e-07, - "loss": 0.7764, - "step": 73714 - }, - { - "epoch": 1.89, - "learning_rate": 6.367511756913544e-07, - "loss": 0.5825, - "step": 73715 - }, - { - "epoch": 1.89, - "learning_rate": 6.367253954853023e-07, - "loss": 0.6387, - "step": 73716 - }, - { - "epoch": 1.89, - "learning_rate": 6.36699615557393e-07, - "loss": 0.5029, - "step": 73717 - }, - { - "epoch": 1.89, - "learning_rate": 6.366738359076458e-07, - "loss": 0.5437, - "step": 73718 - }, - { - "epoch": 1.89, - "learning_rate": 6.366480565360809e-07, - "loss": 0.5083, - "step": 73719 - }, - { - "epoch": 1.89, - "learning_rate": 6.366222774427182e-07, - "loss": 0.479, - "step": 73720 - }, - { - "epoch": 1.89, - "learning_rate": 6.365964986275764e-07, - "loss": 0.6963, - "step": 73721 - }, - { - "epoch": 1.89, - "learning_rate": 6.365707200906765e-07, - "loss": 0.4619, - "step": 73722 - }, - { - "epoch": 1.89, - "learning_rate": 6.365449418320374e-07, - "loss": 0.7773, - "step": 73723 - }, - { - "epoch": 1.89, - "learning_rate": 6.365191638516793e-07, - "loss": 0.585, - "step": 73724 - }, - { - "epoch": 1.89, - "learning_rate": 6.364933861496216e-07, - "loss": 0.6475, - "step": 73725 - }, - { - "epoch": 1.89, - "learning_rate": 6.364676087258842e-07, - "loss": 0.7168, - "step": 73726 - }, - { - "epoch": 1.89, - "learning_rate": 6.364418315804869e-07, - "loss": 0.7222, - "step": 73727 - }, - { - "epoch": 1.89, - "learning_rate": 6.364160547134493e-07, - "loss": 0.5361, - "step": 73728 - }, - { - "epoch": 1.89, - "learning_rate": 6.363902781247913e-07, - "loss": 0.6572, - "step": 73729 - }, - { - "epoch": 1.89, - "learning_rate": 6.363645018145329e-07, - "loss": 0.6982, - "step": 73730 - }, - { - "epoch": 1.89, - "learning_rate": 6.363387257826931e-07, - "loss": 0.5811, - "step": 73731 - }, - { - "epoch": 1.89, - "learning_rate": 6.363129500292919e-07, - "loss": 0.4814, - "step": 73732 - }, - { - "epoch": 1.89, - "learning_rate": 6.362871745543494e-07, - "loss": 0.5576, - "step": 73733 - }, - { - "epoch": 1.89, - "learning_rate": 6.362613993578851e-07, - "loss": 0.7012, - "step": 73734 - }, - { - "epoch": 1.89, - "learning_rate": 6.362356244399184e-07, - "loss": 0.6475, - "step": 73735 - }, - { - "epoch": 1.89, - "learning_rate": 6.362098498004696e-07, - "loss": 0.6504, - "step": 73736 - }, - { - "epoch": 1.89, - "learning_rate": 6.36184075439558e-07, - "loss": 0.4807, - "step": 73737 - }, - { - "epoch": 1.89, - "learning_rate": 6.361583013572038e-07, - "loss": 0.6396, - "step": 73738 - }, - { - "epoch": 1.89, - "learning_rate": 6.361325275534262e-07, - "loss": 0.6011, - "step": 73739 - }, - { - "epoch": 1.89, - "learning_rate": 6.361067540282457e-07, - "loss": 0.752, - "step": 73740 - }, - { - "epoch": 1.89, - "learning_rate": 6.360809807816811e-07, - "loss": 0.665, - "step": 73741 - }, - { - "epoch": 1.89, - "learning_rate": 6.360552078137525e-07, - "loss": 0.7324, - "step": 73742 - }, - { - "epoch": 1.89, - "learning_rate": 6.360294351244799e-07, - "loss": 0.6089, - "step": 73743 - }, - { - "epoch": 1.89, - "learning_rate": 6.360036627138825e-07, - "loss": 0.6196, - "step": 73744 - }, - { - "epoch": 1.89, - "learning_rate": 6.359778905819808e-07, - "loss": 0.5337, - "step": 73745 - }, - { - "epoch": 1.89, - "learning_rate": 6.359521187287937e-07, - "loss": 0.6885, - "step": 73746 - }, - { - "epoch": 1.89, - "learning_rate": 6.359263471543415e-07, - "loss": 0.7007, - "step": 73747 - }, - { - "epoch": 1.89, - "learning_rate": 6.359005758586436e-07, - "loss": 0.709, - "step": 73748 - }, - { - "epoch": 1.89, - "learning_rate": 6.358748048417201e-07, - "loss": 0.6211, - "step": 73749 - }, - { - "epoch": 1.89, - "learning_rate": 6.358490341035908e-07, - "loss": 0.7773, - "step": 73750 - }, - { - "epoch": 1.89, - "learning_rate": 6.358232636442749e-07, - "loss": 0.5967, - "step": 73751 - }, - { - "epoch": 1.89, - "learning_rate": 6.357974934637922e-07, - "loss": 0.541, - "step": 73752 - }, - { - "epoch": 1.89, - "learning_rate": 6.357717235621627e-07, - "loss": 0.6172, - "step": 73753 - }, - { - "epoch": 1.89, - "learning_rate": 6.357459539394059e-07, - "loss": 0.6846, - "step": 73754 - }, - { - "epoch": 1.89, - "learning_rate": 6.35720184595542e-07, - "loss": 0.2909, - "step": 73755 - }, - { - "epoch": 1.89, - "learning_rate": 6.356944155305901e-07, - "loss": 0.5, - "step": 73756 - }, - { - "epoch": 1.89, - "learning_rate": 6.356686467445704e-07, - "loss": 0.6875, - "step": 73757 - }, - { - "epoch": 1.89, - "learning_rate": 6.356428782375023e-07, - "loss": 0.6914, - "step": 73758 - }, - { - "epoch": 1.89, - "learning_rate": 6.356171100094059e-07, - "loss": 0.7373, - "step": 73759 - }, - { - "epoch": 1.89, - "learning_rate": 6.35591342060301e-07, - "loss": 0.3826, - "step": 73760 - }, - { - "epoch": 1.89, - "learning_rate": 6.355655743902064e-07, - "loss": 0.791, - "step": 73761 - }, - { - "epoch": 1.89, - "learning_rate": 6.355398069991429e-07, - "loss": 0.5856, - "step": 73762 - }, - { - "epoch": 1.89, - "learning_rate": 6.355140398871296e-07, - "loss": 0.5254, - "step": 73763 - }, - { - "epoch": 1.89, - "learning_rate": 6.354882730541866e-07, - "loss": 0.5813, - "step": 73764 - }, - { - "epoch": 1.89, - "learning_rate": 6.354625065003333e-07, - "loss": 0.6392, - "step": 73765 - }, - { - "epoch": 1.89, - "learning_rate": 6.354367402255898e-07, - "loss": 0.7705, - "step": 73766 - }, - { - "epoch": 1.89, - "learning_rate": 6.354109742299754e-07, - "loss": 0.6445, - "step": 73767 - }, - { - "epoch": 1.89, - "learning_rate": 6.353852085135101e-07, - "loss": 0.665, - "step": 73768 - }, - { - "epoch": 1.89, - "learning_rate": 6.353594430762137e-07, - "loss": 0.6436, - "step": 73769 - }, - { - "epoch": 1.89, - "learning_rate": 6.353336779181062e-07, - "loss": 0.7339, - "step": 73770 - }, - { - "epoch": 1.89, - "learning_rate": 6.353079130392063e-07, - "loss": 0.7598, - "step": 73771 - }, - { - "epoch": 1.89, - "learning_rate": 6.352821484395346e-07, - "loss": 0.5432, - "step": 73772 - }, - { - "epoch": 1.89, - "learning_rate": 6.352563841191106e-07, - "loss": 0.666, - "step": 73773 - }, - { - "epoch": 1.89, - "learning_rate": 6.352306200779539e-07, - "loss": 0.5923, - "step": 73774 - }, - { - "epoch": 1.89, - "learning_rate": 6.352048563160843e-07, - "loss": 0.593, - "step": 73775 - }, - { - "epoch": 1.89, - "learning_rate": 6.351790928335218e-07, - "loss": 0.4641, - "step": 73776 - }, - { - "epoch": 1.89, - "learning_rate": 6.351533296302856e-07, - "loss": 0.4824, - "step": 73777 - }, - { - "epoch": 1.89, - "learning_rate": 6.35127566706396e-07, - "loss": 0.5762, - "step": 73778 - }, - { - "epoch": 1.89, - "learning_rate": 6.351018040618721e-07, - "loss": 0.7275, - "step": 73779 - }, - { - "epoch": 1.89, - "learning_rate": 6.350760416967346e-07, - "loss": 0.6494, - "step": 73780 - }, - { - "epoch": 1.89, - "learning_rate": 6.350502796110023e-07, - "loss": 0.8096, - "step": 73781 - }, - { - "epoch": 1.89, - "learning_rate": 6.350245178046949e-07, - "loss": 0.7246, - "step": 73782 - }, - { - "epoch": 1.89, - "learning_rate": 6.349987562778327e-07, - "loss": 0.5757, - "step": 73783 - }, - { - "epoch": 1.89, - "learning_rate": 6.34972995030435e-07, - "loss": 0.5244, - "step": 73784 - }, - { - "epoch": 1.89, - "learning_rate": 6.349472340625219e-07, - "loss": 0.6611, - "step": 73785 - }, - { - "epoch": 1.89, - "learning_rate": 6.349214733741129e-07, - "loss": 0.5732, - "step": 73786 - }, - { - "epoch": 1.89, - "learning_rate": 6.348957129652277e-07, - "loss": 0.644, - "step": 73787 - }, - { - "epoch": 1.89, - "learning_rate": 6.348699528358859e-07, - "loss": 0.6353, - "step": 73788 - }, - { - "epoch": 1.89, - "learning_rate": 6.348441929861074e-07, - "loss": 0.6543, - "step": 73789 - }, - { - "epoch": 1.89, - "learning_rate": 6.348184334159124e-07, - "loss": 0.4268, - "step": 73790 - }, - { - "epoch": 1.89, - "learning_rate": 6.347926741253201e-07, - "loss": 0.6484, - "step": 73791 - }, - { - "epoch": 1.89, - "learning_rate": 6.347669151143497e-07, - "loss": 0.7002, - "step": 73792 - }, - { - "epoch": 1.89, - "learning_rate": 6.347411563830218e-07, - "loss": 0.7627, - "step": 73793 - }, - { - "epoch": 1.89, - "learning_rate": 6.347153979313555e-07, - "loss": 0.6025, - "step": 73794 - }, - { - "epoch": 1.89, - "learning_rate": 6.346896397593711e-07, - "loss": 0.4805, - "step": 73795 - }, - { - "epoch": 1.89, - "learning_rate": 6.346638818670879e-07, - "loss": 0.6992, - "step": 73796 - }, - { - "epoch": 1.89, - "learning_rate": 6.34638124254526e-07, - "loss": 0.7334, - "step": 73797 - }, - { - "epoch": 1.89, - "learning_rate": 6.346123669217045e-07, - "loss": 0.5938, - "step": 73798 - }, - { - "epoch": 1.89, - "learning_rate": 6.345866098686439e-07, - "loss": 0.6787, - "step": 73799 - }, - { - "epoch": 1.89, - "learning_rate": 6.345608530953636e-07, - "loss": 0.5994, - "step": 73800 - }, - { - "epoch": 1.89, - "learning_rate": 6.345350966018829e-07, - "loss": 0.6694, - "step": 73801 - }, - { - "epoch": 1.89, - "learning_rate": 6.345093403882221e-07, - "loss": 0.5767, - "step": 73802 - }, - { - "epoch": 1.89, - "learning_rate": 6.344835844544005e-07, - "loss": 0.624, - "step": 73803 - }, - { - "epoch": 1.89, - "learning_rate": 6.344578288004382e-07, - "loss": 0.5693, - "step": 73804 - }, - { - "epoch": 1.89, - "learning_rate": 6.344320734263546e-07, - "loss": 0.6042, - "step": 73805 - }, - { - "epoch": 1.89, - "learning_rate": 6.344063183321695e-07, - "loss": 0.5977, - "step": 73806 - }, - { - "epoch": 1.89, - "learning_rate": 6.34380563517903e-07, - "loss": 0.4648, - "step": 73807 - }, - { - "epoch": 1.89, - "learning_rate": 6.34354808983574e-07, - "loss": 0.6016, - "step": 73808 - }, - { - "epoch": 1.89, - "learning_rate": 6.343290547292031e-07, - "loss": 0.5186, - "step": 73809 - }, - { - "epoch": 1.89, - "learning_rate": 6.343033007548097e-07, - "loss": 0.6592, - "step": 73810 - }, - { - "epoch": 1.89, - "learning_rate": 6.342775470604131e-07, - "loss": 0.7148, - "step": 73811 - }, - { - "epoch": 1.89, - "learning_rate": 6.342517936460337e-07, - "loss": 0.5376, - "step": 73812 - }, - { - "epoch": 1.89, - "learning_rate": 6.342260405116906e-07, - "loss": 0.6753, - "step": 73813 - }, - { - "epoch": 1.89, - "learning_rate": 6.34200287657404e-07, - "loss": 0.667, - "step": 73814 - }, - { - "epoch": 1.89, - "learning_rate": 6.341745350831931e-07, - "loss": 0.7607, - "step": 73815 - }, - { - "epoch": 1.89, - "learning_rate": 6.341487827890782e-07, - "loss": 0.6743, - "step": 73816 - }, - { - "epoch": 1.89, - "learning_rate": 6.341230307750787e-07, - "loss": 0.563, - "step": 73817 - }, - { - "epoch": 1.89, - "learning_rate": 6.340972790412144e-07, - "loss": 0.6533, - "step": 73818 - }, - { - "epoch": 1.89, - "learning_rate": 6.340715275875049e-07, - "loss": 0.5505, - "step": 73819 - }, - { - "epoch": 1.89, - "learning_rate": 6.340457764139703e-07, - "loss": 0.5728, - "step": 73820 - }, - { - "epoch": 1.89, - "learning_rate": 6.340200255206299e-07, - "loss": 0.5889, - "step": 73821 - }, - { - "epoch": 1.89, - "learning_rate": 6.339942749075032e-07, - "loss": 0.6104, - "step": 73822 - }, - { - "epoch": 1.89, - "learning_rate": 6.339685245746106e-07, - "loss": 0.5894, - "step": 73823 - }, - { - "epoch": 1.89, - "learning_rate": 6.339427745219714e-07, - "loss": 0.5869, - "step": 73824 - }, - { - "epoch": 1.89, - "learning_rate": 6.339170247496053e-07, - "loss": 0.6099, - "step": 73825 - }, - { - "epoch": 1.89, - "learning_rate": 6.338912752575322e-07, - "loss": 0.6069, - "step": 73826 - }, - { - "epoch": 1.89, - "learning_rate": 6.338655260457715e-07, - "loss": 0.7168, - "step": 73827 - }, - { - "epoch": 1.89, - "learning_rate": 6.338397771143434e-07, - "loss": 0.6492, - "step": 73828 - }, - { - "epoch": 1.89, - "learning_rate": 6.338140284632671e-07, - "loss": 0.5469, - "step": 73829 - }, - { - "epoch": 1.89, - "learning_rate": 6.337882800925629e-07, - "loss": 0.7627, - "step": 73830 - }, - { - "epoch": 1.89, - "learning_rate": 6.337625320022501e-07, - "loss": 0.5396, - "step": 73831 - }, - { - "epoch": 1.89, - "learning_rate": 6.337367841923483e-07, - "loss": 0.7041, - "step": 73832 - }, - { - "epoch": 1.89, - "learning_rate": 6.337110366628775e-07, - "loss": 0.7188, - "step": 73833 - }, - { - "epoch": 1.89, - "learning_rate": 6.336852894138571e-07, - "loss": 0.5469, - "step": 73834 - }, - { - "epoch": 1.89, - "learning_rate": 6.336595424453073e-07, - "loss": 0.5039, - "step": 73835 - }, - { - "epoch": 1.89, - "learning_rate": 6.336337957572474e-07, - "loss": 0.6992, - "step": 73836 - }, - { - "epoch": 1.89, - "learning_rate": 6.336080493496974e-07, - "loss": 0.5503, - "step": 73837 - }, - { - "epoch": 1.89, - "learning_rate": 6.335823032226766e-07, - "loss": 0.5317, - "step": 73838 - }, - { - "epoch": 1.89, - "learning_rate": 6.335565573762053e-07, - "loss": 0.7383, - "step": 73839 - }, - { - "epoch": 1.89, - "learning_rate": 6.335308118103031e-07, - "loss": 0.6582, - "step": 73840 - }, - { - "epoch": 1.89, - "learning_rate": 6.335050665249892e-07, - "loss": 0.6514, - "step": 73841 - }, - { - "epoch": 1.89, - "learning_rate": 6.334793215202834e-07, - "loss": 0.6421, - "step": 73842 - }, - { - "epoch": 1.89, - "learning_rate": 6.334535767962059e-07, - "loss": 0.748, - "step": 73843 - }, - { - "epoch": 1.89, - "learning_rate": 6.33427832352776e-07, - "loss": 0.5938, - "step": 73844 - }, - { - "epoch": 1.89, - "learning_rate": 6.334020881900136e-07, - "loss": 0.8506, - "step": 73845 - }, - { - "epoch": 1.89, - "learning_rate": 6.333763443079383e-07, - "loss": 0.709, - "step": 73846 - }, - { - "epoch": 1.89, - "learning_rate": 6.333506007065701e-07, - "loss": 0.666, - "step": 73847 - }, - { - "epoch": 1.89, - "learning_rate": 6.333248573859281e-07, - "loss": 0.6924, - "step": 73848 - }, - { - "epoch": 1.89, - "learning_rate": 6.332991143460327e-07, - "loss": 0.4695, - "step": 73849 - }, - { - "epoch": 1.89, - "learning_rate": 6.332733715869036e-07, - "loss": 0.5908, - "step": 73850 - }, - { - "epoch": 1.89, - "learning_rate": 6.332476291085597e-07, - "loss": 0.6514, - "step": 73851 - }, - { - "epoch": 1.89, - "learning_rate": 6.332218869110215e-07, - "loss": 0.5918, - "step": 73852 - }, - { - "epoch": 1.89, - "learning_rate": 6.331961449943082e-07, - "loss": 0.5569, - "step": 73853 - }, - { - "epoch": 1.89, - "learning_rate": 6.331704033584399e-07, - "loss": 0.6475, - "step": 73854 - }, - { - "epoch": 1.89, - "learning_rate": 6.331446620034359e-07, - "loss": 0.6851, - "step": 73855 - }, - { - "epoch": 1.89, - "learning_rate": 6.331189209293166e-07, - "loss": 0.5962, - "step": 73856 - }, - { - "epoch": 1.89, - "learning_rate": 6.330931801361008e-07, - "loss": 0.6699, - "step": 73857 - }, - { - "epoch": 1.89, - "learning_rate": 6.330674396238091e-07, - "loss": 0.6826, - "step": 73858 - }, - { - "epoch": 1.89, - "learning_rate": 6.330416993924605e-07, - "loss": 0.4995, - "step": 73859 - }, - { - "epoch": 1.89, - "learning_rate": 6.330159594420756e-07, - "loss": 0.6396, - "step": 73860 - }, - { - "epoch": 1.89, - "learning_rate": 6.329902197726729e-07, - "loss": 0.5591, - "step": 73861 - }, - { - "epoch": 1.89, - "learning_rate": 6.329644803842728e-07, - "loss": 0.4783, - "step": 73862 - }, - { - "epoch": 1.89, - "learning_rate": 6.329387412768949e-07, - "loss": 0.5806, - "step": 73863 - }, - { - "epoch": 1.89, - "learning_rate": 6.329130024505591e-07, - "loss": 0.5791, - "step": 73864 - }, - { - "epoch": 1.89, - "learning_rate": 6.328872639052846e-07, - "loss": 0.6543, - "step": 73865 - }, - { - "epoch": 1.89, - "learning_rate": 6.328615256410918e-07, - "loss": 0.5742, - "step": 73866 - }, - { - "epoch": 1.89, - "learning_rate": 6.32835787658e-07, - "loss": 0.667, - "step": 73867 - }, - { - "epoch": 1.89, - "learning_rate": 6.328100499560289e-07, - "loss": 0.4858, - "step": 73868 - }, - { - "epoch": 1.89, - "learning_rate": 6.32784312535198e-07, - "loss": 0.8369, - "step": 73869 - }, - { - "epoch": 1.89, - "learning_rate": 6.327585753955278e-07, - "loss": 0.5728, - "step": 73870 - }, - { - "epoch": 1.89, - "learning_rate": 6.327328385370373e-07, - "loss": 0.5142, - "step": 73871 - }, - { - "epoch": 1.89, - "learning_rate": 6.327071019597461e-07, - "loss": 0.6689, - "step": 73872 - }, - { - "epoch": 1.89, - "learning_rate": 6.326813656636745e-07, - "loss": 0.6221, - "step": 73873 - }, - { - "epoch": 1.89, - "learning_rate": 6.326556296488414e-07, - "loss": 0.5281, - "step": 73874 - }, - { - "epoch": 1.89, - "learning_rate": 6.326298939152675e-07, - "loss": 0.5552, - "step": 73875 - }, - { - "epoch": 1.89, - "learning_rate": 6.326041584629716e-07, - "loss": 0.4291, - "step": 73876 - }, - { - "epoch": 1.89, - "learning_rate": 6.325784232919742e-07, - "loss": 0.4771, - "step": 73877 - }, - { - "epoch": 1.89, - "learning_rate": 6.325526884022943e-07, - "loss": 0.7119, - "step": 73878 - }, - { - "epoch": 1.89, - "learning_rate": 6.325269537939522e-07, - "loss": 0.7188, - "step": 73879 - }, - { - "epoch": 1.89, - "learning_rate": 6.325012194669673e-07, - "loss": 0.6382, - "step": 73880 - }, - { - "epoch": 1.89, - "learning_rate": 6.324754854213592e-07, - "loss": 0.5249, - "step": 73881 - }, - { - "epoch": 1.89, - "learning_rate": 6.324497516571477e-07, - "loss": 0.5852, - "step": 73882 - }, - { - "epoch": 1.89, - "learning_rate": 6.324240181743526e-07, - "loss": 0.6132, - "step": 73883 - }, - { - "epoch": 1.89, - "learning_rate": 6.323982849729932e-07, - "loss": 0.709, - "step": 73884 - }, - { - "epoch": 1.89, - "learning_rate": 6.323725520530898e-07, - "loss": 0.6021, - "step": 73885 - }, - { - "epoch": 1.89, - "learning_rate": 6.323468194146618e-07, - "loss": 0.7979, - "step": 73886 - }, - { - "epoch": 1.89, - "learning_rate": 6.323210870577289e-07, - "loss": 0.4873, - "step": 73887 - }, - { - "epoch": 1.89, - "learning_rate": 6.322953549823109e-07, - "loss": 0.603, - "step": 73888 - }, - { - "epoch": 1.89, - "learning_rate": 6.322696231884277e-07, - "loss": 0.71, - "step": 73889 - }, - { - "epoch": 1.89, - "learning_rate": 6.322438916760985e-07, - "loss": 0.4685, - "step": 73890 - }, - { - "epoch": 1.89, - "learning_rate": 6.32218160445343e-07, - "loss": 0.7881, - "step": 73891 - }, - { - "epoch": 1.89, - "learning_rate": 6.321924294961814e-07, - "loss": 0.4695, - "step": 73892 - }, - { - "epoch": 1.89, - "learning_rate": 6.321666988286329e-07, - "loss": 0.689, - "step": 73893 - }, - { - "epoch": 1.89, - "learning_rate": 6.321409684427178e-07, - "loss": 0.4839, - "step": 73894 - }, - { - "epoch": 1.89, - "learning_rate": 6.321152383384552e-07, - "loss": 0.6729, - "step": 73895 - }, - { - "epoch": 1.89, - "learning_rate": 6.320895085158652e-07, - "loss": 0.6938, - "step": 73896 - }, - { - "epoch": 1.89, - "learning_rate": 6.320637789749673e-07, - "loss": 0.6133, - "step": 73897 - }, - { - "epoch": 1.89, - "learning_rate": 6.320380497157811e-07, - "loss": 0.5525, - "step": 73898 - }, - { - "epoch": 1.89, - "learning_rate": 6.320123207383269e-07, - "loss": 0.647, - "step": 73899 - }, - { - "epoch": 1.89, - "learning_rate": 6.319865920426238e-07, - "loss": 0.7539, - "step": 73900 - }, - { - "epoch": 1.89, - "learning_rate": 6.319608636286912e-07, - "loss": 0.5629, - "step": 73901 - }, - { - "epoch": 1.89, - "learning_rate": 6.319351354965496e-07, - "loss": 0.6201, - "step": 73902 - }, - { - "epoch": 1.89, - "learning_rate": 6.319094076462181e-07, - "loss": 0.564, - "step": 73903 - }, - { - "epoch": 1.89, - "learning_rate": 6.318836800777168e-07, - "loss": 0.6768, - "step": 73904 - }, - { - "epoch": 1.89, - "learning_rate": 6.318579527910651e-07, - "loss": 0.7549, - "step": 73905 - }, - { - "epoch": 1.89, - "learning_rate": 6.318322257862831e-07, - "loss": 0.5645, - "step": 73906 - }, - { - "epoch": 1.89, - "learning_rate": 6.3180649906339e-07, - "loss": 0.5251, - "step": 73907 - }, - { - "epoch": 1.89, - "learning_rate": 6.317807726224058e-07, - "loss": 0.4036, - "step": 73908 - }, - { - "epoch": 1.89, - "learning_rate": 6.317550464633505e-07, - "loss": 0.6396, - "step": 73909 - }, - { - "epoch": 1.89, - "learning_rate": 6.317293205862429e-07, - "loss": 0.5815, - "step": 73910 - }, - { - "epoch": 1.89, - "learning_rate": 6.317035949911035e-07, - "loss": 0.6953, - "step": 73911 - }, - { - "epoch": 1.89, - "learning_rate": 6.316778696779515e-07, - "loss": 0.7832, - "step": 73912 - }, - { - "epoch": 1.89, - "learning_rate": 6.31652144646807e-07, - "loss": 0.7197, - "step": 73913 - }, - { - "epoch": 1.89, - "learning_rate": 6.316264198976896e-07, - "loss": 0.5244, - "step": 73914 - }, - { - "epoch": 1.89, - "learning_rate": 6.316006954306186e-07, - "loss": 0.7764, - "step": 73915 - }, - { - "epoch": 1.89, - "learning_rate": 6.315749712456144e-07, - "loss": 0.7549, - "step": 73916 - }, - { - "epoch": 1.89, - "learning_rate": 6.31549247342696e-07, - "loss": 0.5256, - "step": 73917 - }, - { - "epoch": 1.89, - "learning_rate": 6.315235237218834e-07, - "loss": 0.7539, - "step": 73918 - }, - { - "epoch": 1.89, - "learning_rate": 6.314978003831968e-07, - "loss": 0.7441, - "step": 73919 - }, - { - "epoch": 1.89, - "learning_rate": 6.314720773266549e-07, - "loss": 0.751, - "step": 73920 - }, - { - "epoch": 1.89, - "learning_rate": 6.314463545522779e-07, - "loss": 0.7568, - "step": 73921 - }, - { - "epoch": 1.89, - "learning_rate": 6.314206320600854e-07, - "loss": 0.6816, - "step": 73922 - }, - { - "epoch": 1.89, - "learning_rate": 6.313949098500975e-07, - "loss": 0.4771, - "step": 73923 - }, - { - "epoch": 1.89, - "learning_rate": 6.313691879223333e-07, - "loss": 0.8701, - "step": 73924 - }, - { - "epoch": 1.89, - "learning_rate": 6.313434662768129e-07, - "loss": 0.6631, - "step": 73925 - }, - { - "epoch": 1.89, - "learning_rate": 6.313177449135556e-07, - "loss": 0.5918, - "step": 73926 - }, - { - "epoch": 1.89, - "learning_rate": 6.312920238325816e-07, - "loss": 0.7319, - "step": 73927 - }, - { - "epoch": 1.89, - "learning_rate": 6.312663030339103e-07, - "loss": 0.5889, - "step": 73928 - }, - { - "epoch": 1.89, - "learning_rate": 6.312405825175617e-07, - "loss": 0.5659, - "step": 73929 - }, - { - "epoch": 1.89, - "learning_rate": 6.31214862283555e-07, - "loss": 0.6885, - "step": 73930 - }, - { - "epoch": 1.89, - "learning_rate": 6.311891423319103e-07, - "loss": 0.6348, - "step": 73931 - }, - { - "epoch": 1.89, - "learning_rate": 6.311634226626467e-07, - "loss": 0.5688, - "step": 73932 - }, - { - "epoch": 1.89, - "learning_rate": 6.311377032757846e-07, - "loss": 0.661, - "step": 73933 - }, - { - "epoch": 1.89, - "learning_rate": 6.311119841713432e-07, - "loss": 0.4653, - "step": 73934 - }, - { - "epoch": 1.89, - "learning_rate": 6.310862653493425e-07, - "loss": 0.7236, - "step": 73935 - }, - { - "epoch": 1.9, - "learning_rate": 6.31060546809802e-07, - "loss": 0.6333, - "step": 73936 - }, - { - "epoch": 1.9, - "learning_rate": 6.310348285527416e-07, - "loss": 0.604, - "step": 73937 - }, - { - "epoch": 1.9, - "learning_rate": 6.310091105781808e-07, - "loss": 0.6226, - "step": 73938 - }, - { - "epoch": 1.9, - "learning_rate": 6.309833928861397e-07, - "loss": 0.7412, - "step": 73939 - }, - { - "epoch": 1.9, - "learning_rate": 6.309576754766374e-07, - "loss": 0.667, - "step": 73940 - }, - { - "epoch": 1.9, - "learning_rate": 6.309319583496936e-07, - "loss": 0.5391, - "step": 73941 - }, - { - "epoch": 1.9, - "learning_rate": 6.309062415053285e-07, - "loss": 0.6621, - "step": 73942 - }, - { - "epoch": 1.9, - "learning_rate": 6.308805249435613e-07, - "loss": 0.7354, - "step": 73943 - }, - { - "epoch": 1.9, - "learning_rate": 6.30854808664412e-07, - "loss": 0.9414, - "step": 73944 - }, - { - "epoch": 1.9, - "learning_rate": 6.308290926679002e-07, - "loss": 0.5786, - "step": 73945 - }, - { - "epoch": 1.9, - "learning_rate": 6.308033769540457e-07, - "loss": 0.4644, - "step": 73946 - }, - { - "epoch": 1.9, - "learning_rate": 6.30777661522868e-07, - "loss": 0.6475, - "step": 73947 - }, - { - "epoch": 1.9, - "learning_rate": 6.307519463743868e-07, - "loss": 0.5498, - "step": 73948 - }, - { - "epoch": 1.9, - "learning_rate": 6.307262315086221e-07, - "loss": 0.6567, - "step": 73949 - }, - { - "epoch": 1.9, - "learning_rate": 6.307005169255934e-07, - "loss": 0.7412, - "step": 73950 - }, - { - "epoch": 1.9, - "learning_rate": 6.306748026253199e-07, - "loss": 0.4592, - "step": 73951 - }, - { - "epoch": 1.9, - "learning_rate": 6.30649088607822e-07, - "loss": 0.6885, - "step": 73952 - }, - { - "epoch": 1.9, - "learning_rate": 6.306233748731189e-07, - "loss": 0.6074, - "step": 73953 - }, - { - "epoch": 1.9, - "learning_rate": 6.305976614212307e-07, - "loss": 0.5571, - "step": 73954 - }, - { - "epoch": 1.9, - "learning_rate": 6.305719482521768e-07, - "loss": 0.6191, - "step": 73955 - }, - { - "epoch": 1.9, - "learning_rate": 6.305462353659769e-07, - "loss": 0.5278, - "step": 73956 - }, - { - "epoch": 1.9, - "learning_rate": 6.305205227626508e-07, - "loss": 0.6333, - "step": 73957 - }, - { - "epoch": 1.9, - "learning_rate": 6.304948104422183e-07, - "loss": 0.793, - "step": 73958 - }, - { - "epoch": 1.9, - "learning_rate": 6.304690984046991e-07, - "loss": 0.7686, - "step": 73959 - }, - { - "epoch": 1.9, - "learning_rate": 6.304433866501123e-07, - "loss": 0.6934, - "step": 73960 - }, - { - "epoch": 1.9, - "learning_rate": 6.304176751784782e-07, - "loss": 0.645, - "step": 73961 - }, - { - "epoch": 1.9, - "learning_rate": 6.303919639898162e-07, - "loss": 0.7393, - "step": 73962 - }, - { - "epoch": 1.9, - "learning_rate": 6.303662530841463e-07, - "loss": 0.533, - "step": 73963 - }, - { - "epoch": 1.9, - "learning_rate": 6.303405424614876e-07, - "loss": 0.6221, - "step": 73964 - }, - { - "epoch": 1.9, - "learning_rate": 6.303148321218603e-07, - "loss": 0.6553, - "step": 73965 - }, - { - "epoch": 1.9, - "learning_rate": 6.30289122065284e-07, - "loss": 0.6045, - "step": 73966 - }, - { - "epoch": 1.9, - "learning_rate": 6.302634122917783e-07, - "loss": 0.6768, - "step": 73967 - }, - { - "epoch": 1.9, - "learning_rate": 6.302377028013628e-07, - "loss": 0.7734, - "step": 73968 - }, - { - "epoch": 1.9, - "learning_rate": 6.302119935940578e-07, - "loss": 0.6562, - "step": 73969 - }, - { - "epoch": 1.9, - "learning_rate": 6.30186284669882e-07, - "loss": 0.5918, - "step": 73970 - }, - { - "epoch": 1.9, - "learning_rate": 6.301605760288556e-07, - "loss": 0.6572, - "step": 73971 - }, - { - "epoch": 1.9, - "learning_rate": 6.301348676709981e-07, - "loss": 0.7227, - "step": 73972 - }, - { - "epoch": 1.9, - "learning_rate": 6.301091595963296e-07, - "loss": 0.7852, - "step": 73973 - }, - { - "epoch": 1.9, - "learning_rate": 6.300834518048692e-07, - "loss": 0.5635, - "step": 73974 - }, - { - "epoch": 1.9, - "learning_rate": 6.300577442966372e-07, - "loss": 0.5903, - "step": 73975 - }, - { - "epoch": 1.9, - "learning_rate": 6.300320370716528e-07, - "loss": 0.708, - "step": 73976 - }, - { - "epoch": 1.9, - "learning_rate": 6.30006330129936e-07, - "loss": 0.7471, - "step": 73977 - }, - { - "epoch": 1.9, - "learning_rate": 6.299806234715062e-07, - "loss": 0.6086, - "step": 73978 - }, - { - "epoch": 1.9, - "learning_rate": 6.299549170963834e-07, - "loss": 0.5286, - "step": 73979 - }, - { - "epoch": 1.9, - "learning_rate": 6.299292110045871e-07, - "loss": 0.5879, - "step": 73980 - }, - { - "epoch": 1.9, - "learning_rate": 6.299035051961367e-07, - "loss": 0.625, - "step": 73981 - }, - { - "epoch": 1.9, - "learning_rate": 6.298777996710525e-07, - "loss": 0.6191, - "step": 73982 - }, - { - "epoch": 1.9, - "learning_rate": 6.298520944293534e-07, - "loss": 0.3274, - "step": 73983 - }, - { - "epoch": 1.9, - "learning_rate": 6.2982638947106e-07, - "loss": 0.3811, - "step": 73984 - }, - { - "epoch": 1.9, - "learning_rate": 6.298006847961912e-07, - "loss": 0.6133, - "step": 73985 - }, - { - "epoch": 1.9, - "learning_rate": 6.297749804047672e-07, - "loss": 0.5225, - "step": 73986 - }, - { - "epoch": 1.9, - "learning_rate": 6.297492762968075e-07, - "loss": 0.6143, - "step": 73987 - }, - { - "epoch": 1.9, - "learning_rate": 6.297235724723316e-07, - "loss": 0.6167, - "step": 73988 - }, - { - "epoch": 1.9, - "learning_rate": 6.296978689313597e-07, - "loss": 0.6562, - "step": 73989 - }, - { - "epoch": 1.9, - "learning_rate": 6.296721656739108e-07, - "loss": 0.6953, - "step": 73990 - }, - { - "epoch": 1.9, - "learning_rate": 6.296464627000048e-07, - "loss": 0.7412, - "step": 73991 - }, - { - "epoch": 1.9, - "learning_rate": 6.296207600096616e-07, - "loss": 0.5254, - "step": 73992 - }, - { - "epoch": 1.9, - "learning_rate": 6.295950576029005e-07, - "loss": 0.583, - "step": 73993 - }, - { - "epoch": 1.9, - "learning_rate": 6.295693554797419e-07, - "loss": 0.6111, - "step": 73994 - }, - { - "epoch": 1.9, - "learning_rate": 6.295436536402046e-07, - "loss": 0.5415, - "step": 73995 - }, - { - "epoch": 1.9, - "learning_rate": 6.295179520843089e-07, - "loss": 0.6118, - "step": 73996 - }, - { - "epoch": 1.9, - "learning_rate": 6.294922508120741e-07, - "loss": 0.4399, - "step": 73997 - }, - { - "epoch": 1.9, - "learning_rate": 6.294665498235203e-07, - "loss": 0.6234, - "step": 73998 - }, - { - "epoch": 1.9, - "learning_rate": 6.294408491186671e-07, - "loss": 0.7148, - "step": 73999 - }, - { - "epoch": 1.9, - "learning_rate": 6.294151486975335e-07, - "loss": 0.7412, - "step": 74000 - }, - { - "epoch": 1.9, - "learning_rate": 6.293894485601399e-07, - "loss": 0.5084, - "step": 74001 - }, - { - "epoch": 1.9, - "learning_rate": 6.293637487065058e-07, - "loss": 0.6875, - "step": 74002 - }, - { - "epoch": 1.9, - "learning_rate": 6.293380491366508e-07, - "loss": 0.6172, - "step": 74003 - }, - { - "epoch": 1.9, - "learning_rate": 6.293123498505946e-07, - "loss": 0.6089, - "step": 74004 - }, - { - "epoch": 1.9, - "learning_rate": 6.292866508483568e-07, - "loss": 0.6631, - "step": 74005 - }, - { - "epoch": 1.9, - "learning_rate": 6.292609521299573e-07, - "loss": 0.7158, - "step": 74006 - }, - { - "epoch": 1.9, - "learning_rate": 6.292352536954156e-07, - "loss": 0.6177, - "step": 74007 - }, - { - "epoch": 1.9, - "learning_rate": 6.292095555447514e-07, - "loss": 0.4089, - "step": 74008 - }, - { - "epoch": 1.9, - "learning_rate": 6.291838576779847e-07, - "loss": 0.8145, - "step": 74009 - }, - { - "epoch": 1.9, - "learning_rate": 6.291581600951343e-07, - "loss": 0.6069, - "step": 74010 - }, - { - "epoch": 1.9, - "learning_rate": 6.291324627962209e-07, - "loss": 0.5601, - "step": 74011 - }, - { - "epoch": 1.9, - "learning_rate": 6.291067657812634e-07, - "loss": 0.7305, - "step": 74012 - }, - { - "epoch": 1.9, - "learning_rate": 6.290810690502819e-07, - "loss": 0.6006, - "step": 74013 - }, - { - "epoch": 1.9, - "learning_rate": 6.290553726032959e-07, - "loss": 0.4431, - "step": 74014 - }, - { - "epoch": 1.9, - "learning_rate": 6.290296764403253e-07, - "loss": 0.6157, - "step": 74015 - }, - { - "epoch": 1.9, - "learning_rate": 6.290039805613895e-07, - "loss": 0.6602, - "step": 74016 - }, - { - "epoch": 1.9, - "learning_rate": 6.289782849665084e-07, - "loss": 0.5349, - "step": 74017 - }, - { - "epoch": 1.9, - "learning_rate": 6.289525896557014e-07, - "loss": 0.644, - "step": 74018 - }, - { - "epoch": 1.9, - "learning_rate": 6.289268946289887e-07, - "loss": 0.481, - "step": 74019 - }, - { - "epoch": 1.9, - "learning_rate": 6.289011998863895e-07, - "loss": 0.6099, - "step": 74020 - }, - { - "epoch": 1.9, - "learning_rate": 6.288755054279234e-07, - "loss": 0.6113, - "step": 74021 - }, - { - "epoch": 1.9, - "learning_rate": 6.288498112536103e-07, - "loss": 0.6948, - "step": 74022 - }, - { - "epoch": 1.9, - "learning_rate": 6.2882411736347e-07, - "loss": 0.6318, - "step": 74023 - }, - { - "epoch": 1.9, - "learning_rate": 6.287984237575218e-07, - "loss": 0.7329, - "step": 74024 - }, - { - "epoch": 1.9, - "learning_rate": 6.287727304357857e-07, - "loss": 0.7109, - "step": 74025 - }, - { - "epoch": 1.9, - "learning_rate": 6.287470373982811e-07, - "loss": 0.9287, - "step": 74026 - }, - { - "epoch": 1.9, - "learning_rate": 6.287213446450279e-07, - "loss": 0.6689, - "step": 74027 - }, - { - "epoch": 1.9, - "learning_rate": 6.286956521760455e-07, - "loss": 0.7285, - "step": 74028 - }, - { - "epoch": 1.9, - "learning_rate": 6.286699599913544e-07, - "loss": 0.6982, - "step": 74029 - }, - { - "epoch": 1.9, - "learning_rate": 6.286442680909734e-07, - "loss": 0.7734, - "step": 74030 - }, - { - "epoch": 1.9, - "learning_rate": 6.28618576474922e-07, - "loss": 0.707, - "step": 74031 - }, - { - "epoch": 1.9, - "learning_rate": 6.285928851432205e-07, - "loss": 0.6387, - "step": 74032 - }, - { - "epoch": 1.9, - "learning_rate": 6.285671940958883e-07, - "loss": 0.7207, - "step": 74033 - }, - { - "epoch": 1.9, - "learning_rate": 6.285415033329453e-07, - "loss": 0.6802, - "step": 74034 - }, - { - "epoch": 1.9, - "learning_rate": 6.285158128544107e-07, - "loss": 0.7363, - "step": 74035 - }, - { - "epoch": 1.9, - "learning_rate": 6.284901226603048e-07, - "loss": 0.5801, - "step": 74036 - }, - { - "epoch": 1.9, - "learning_rate": 6.284644327506466e-07, - "loss": 0.7812, - "step": 74037 - }, - { - "epoch": 1.9, - "learning_rate": 6.284387431254563e-07, - "loss": 0.6709, - "step": 74038 - }, - { - "epoch": 1.9, - "learning_rate": 6.284130537847536e-07, - "loss": 0.5488, - "step": 74039 - }, - { - "epoch": 1.9, - "learning_rate": 6.283873647285578e-07, - "loss": 0.6606, - "step": 74040 - }, - { - "epoch": 1.9, - "learning_rate": 6.283616759568883e-07, - "loss": 0.6748, - "step": 74041 - }, - { - "epoch": 1.9, - "learning_rate": 6.283359874697656e-07, - "loss": 0.6895, - "step": 74042 - }, - { - "epoch": 1.9, - "learning_rate": 6.283102992672087e-07, - "loss": 0.5371, - "step": 74043 - }, - { - "epoch": 1.9, - "learning_rate": 6.282846113492377e-07, - "loss": 0.6709, - "step": 74044 - }, - { - "epoch": 1.9, - "learning_rate": 6.282589237158717e-07, - "loss": 0.7236, - "step": 74045 - }, - { - "epoch": 1.9, - "learning_rate": 6.282332363671312e-07, - "loss": 0.6973, - "step": 74046 - }, - { - "epoch": 1.9, - "learning_rate": 6.282075493030352e-07, - "loss": 0.5442, - "step": 74047 - }, - { - "epoch": 1.9, - "learning_rate": 6.281818625236037e-07, - "loss": 0.5601, - "step": 74048 - }, - { - "epoch": 1.9, - "learning_rate": 6.281561760288565e-07, - "loss": 0.5066, - "step": 74049 - }, - { - "epoch": 1.9, - "learning_rate": 6.281304898188126e-07, - "loss": 0.7119, - "step": 74050 - }, - { - "epoch": 1.9, - "learning_rate": 6.281048038934922e-07, - "loss": 0.6621, - "step": 74051 - }, - { - "epoch": 1.9, - "learning_rate": 6.280791182529147e-07, - "loss": 0.5664, - "step": 74052 - }, - { - "epoch": 1.9, - "learning_rate": 6.280534328971001e-07, - "loss": 0.5586, - "step": 74053 - }, - { - "epoch": 1.9, - "learning_rate": 6.280277478260678e-07, - "loss": 0.6465, - "step": 74054 - }, - { - "epoch": 1.9, - "learning_rate": 6.280020630398377e-07, - "loss": 0.7407, - "step": 74055 - }, - { - "epoch": 1.9, - "learning_rate": 6.279763785384291e-07, - "loss": 0.5752, - "step": 74056 - }, - { - "epoch": 1.9, - "learning_rate": 6.27950694321862e-07, - "loss": 0.521, - "step": 74057 - }, - { - "epoch": 1.9, - "learning_rate": 6.279250103901559e-07, - "loss": 0.5503, - "step": 74058 - }, - { - "epoch": 1.9, - "learning_rate": 6.27899326743331e-07, - "loss": 0.4269, - "step": 74059 - }, - { - "epoch": 1.9, - "learning_rate": 6.278736433814058e-07, - "loss": 0.5073, - "step": 74060 - }, - { - "epoch": 1.9, - "learning_rate": 6.27847960304401e-07, - "loss": 0.6992, - "step": 74061 - }, - { - "epoch": 1.9, - "learning_rate": 6.278222775123357e-07, - "loss": 0.7188, - "step": 74062 - }, - { - "epoch": 1.9, - "learning_rate": 6.277965950052299e-07, - "loss": 0.6924, - "step": 74063 - }, - { - "epoch": 1.9, - "learning_rate": 6.277709127831029e-07, - "loss": 0.498, - "step": 74064 - }, - { - "epoch": 1.9, - "learning_rate": 6.277452308459749e-07, - "loss": 0.6841, - "step": 74065 - }, - { - "epoch": 1.9, - "learning_rate": 6.277195491938649e-07, - "loss": 0.7002, - "step": 74066 - }, - { - "epoch": 1.9, - "learning_rate": 6.276938678267933e-07, - "loss": 0.646, - "step": 74067 - }, - { - "epoch": 1.9, - "learning_rate": 6.276681867447791e-07, - "loss": 0.6875, - "step": 74068 - }, - { - "epoch": 1.9, - "learning_rate": 6.276425059478427e-07, - "loss": 0.4581, - "step": 74069 - }, - { - "epoch": 1.9, - "learning_rate": 6.27616825436003e-07, - "loss": 0.5806, - "step": 74070 - }, - { - "epoch": 1.9, - "learning_rate": 6.275911452092799e-07, - "loss": 0.7383, - "step": 74071 - }, - { - "epoch": 1.9, - "learning_rate": 6.275654652676933e-07, - "loss": 0.7227, - "step": 74072 - }, - { - "epoch": 1.9, - "learning_rate": 6.275397856112625e-07, - "loss": 0.4426, - "step": 74073 - }, - { - "epoch": 1.9, - "learning_rate": 6.275141062400076e-07, - "loss": 0.6699, - "step": 74074 - }, - { - "epoch": 1.9, - "learning_rate": 6.274884271539477e-07, - "loss": 0.6855, - "step": 74075 - }, - { - "epoch": 1.9, - "learning_rate": 6.274627483531029e-07, - "loss": 0.7568, - "step": 74076 - }, - { - "epoch": 1.9, - "learning_rate": 6.274370698374932e-07, - "loss": 0.6943, - "step": 74077 - }, - { - "epoch": 1.9, - "learning_rate": 6.274113916071371e-07, - "loss": 0.6348, - "step": 74078 - }, - { - "epoch": 1.9, - "learning_rate": 6.273857136620556e-07, - "loss": 0.7012, - "step": 74079 - }, - { - "epoch": 1.9, - "learning_rate": 6.273600360022675e-07, - "loss": 0.5874, - "step": 74080 - }, - { - "epoch": 1.9, - "learning_rate": 6.273343586277925e-07, - "loss": 0.5723, - "step": 74081 - }, - { - "epoch": 1.9, - "learning_rate": 6.273086815386505e-07, - "loss": 0.6299, - "step": 74082 - }, - { - "epoch": 1.9, - "learning_rate": 6.272830047348612e-07, - "loss": 0.6343, - "step": 74083 - }, - { - "epoch": 1.9, - "learning_rate": 6.272573282164441e-07, - "loss": 0.6084, - "step": 74084 - }, - { - "epoch": 1.9, - "learning_rate": 6.272316519834188e-07, - "loss": 0.5039, - "step": 74085 - }, - { - "epoch": 1.9, - "learning_rate": 6.272059760358052e-07, - "loss": 0.5259, - "step": 74086 - }, - { - "epoch": 1.9, - "learning_rate": 6.271803003736229e-07, - "loss": 0.6357, - "step": 74087 - }, - { - "epoch": 1.9, - "learning_rate": 6.271546249968915e-07, - "loss": 0.614, - "step": 74088 - }, - { - "epoch": 1.9, - "learning_rate": 6.271289499056309e-07, - "loss": 0.6934, - "step": 74089 - }, - { - "epoch": 1.9, - "learning_rate": 6.271032750998601e-07, - "loss": 0.7451, - "step": 74090 - }, - { - "epoch": 1.9, - "learning_rate": 6.270776005795995e-07, - "loss": 0.5732, - "step": 74091 - }, - { - "epoch": 1.9, - "learning_rate": 6.270519263448682e-07, - "loss": 0.6123, - "step": 74092 - }, - { - "epoch": 1.9, - "learning_rate": 6.270262523956861e-07, - "loss": 0.5808, - "step": 74093 - }, - { - "epoch": 1.9, - "learning_rate": 6.270005787320729e-07, - "loss": 0.6777, - "step": 74094 - }, - { - "epoch": 1.9, - "learning_rate": 6.26974905354048e-07, - "loss": 0.6509, - "step": 74095 - }, - { - "epoch": 1.9, - "learning_rate": 6.269492322616317e-07, - "loss": 0.5889, - "step": 74096 - }, - { - "epoch": 1.9, - "learning_rate": 6.269235594548427e-07, - "loss": 0.5903, - "step": 74097 - }, - { - "epoch": 1.9, - "learning_rate": 6.268978869337016e-07, - "loss": 0.4268, - "step": 74098 - }, - { - "epoch": 1.9, - "learning_rate": 6.268722146982279e-07, - "loss": 0.4805, - "step": 74099 - }, - { - "epoch": 1.9, - "learning_rate": 6.268465427484404e-07, - "loss": 0.707, - "step": 74100 - }, - { - "epoch": 1.9, - "learning_rate": 6.268208710843597e-07, - "loss": 0.5645, - "step": 74101 - }, - { - "epoch": 1.9, - "learning_rate": 6.267951997060047e-07, - "loss": 0.7051, - "step": 74102 - }, - { - "epoch": 1.9, - "learning_rate": 6.267695286133958e-07, - "loss": 0.5996, - "step": 74103 - }, - { - "epoch": 1.9, - "learning_rate": 6.26743857806552e-07, - "loss": 0.5676, - "step": 74104 - }, - { - "epoch": 1.9, - "learning_rate": 6.267181872854936e-07, - "loss": 0.686, - "step": 74105 - }, - { - "epoch": 1.9, - "learning_rate": 6.266925170502396e-07, - "loss": 0.5254, - "step": 74106 - }, - { - "epoch": 1.9, - "learning_rate": 6.266668471008104e-07, - "loss": 0.5034, - "step": 74107 - }, - { - "epoch": 1.9, - "learning_rate": 6.266411774372247e-07, - "loss": 0.7578, - "step": 74108 - }, - { - "epoch": 1.9, - "learning_rate": 6.266155080595032e-07, - "loss": 0.5913, - "step": 74109 - }, - { - "epoch": 1.9, - "learning_rate": 6.265898389676649e-07, - "loss": 0.6287, - "step": 74110 - }, - { - "epoch": 1.9, - "learning_rate": 6.265641701617294e-07, - "loss": 0.6826, - "step": 74111 - }, - { - "epoch": 1.9, - "learning_rate": 6.265385016417167e-07, - "loss": 0.6768, - "step": 74112 - }, - { - "epoch": 1.9, - "learning_rate": 6.265128334076463e-07, - "loss": 0.5752, - "step": 74113 - }, - { - "epoch": 1.9, - "learning_rate": 6.264871654595376e-07, - "loss": 0.5835, - "step": 74114 - }, - { - "epoch": 1.9, - "learning_rate": 6.264614977974107e-07, - "loss": 0.7549, - "step": 74115 - }, - { - "epoch": 1.9, - "learning_rate": 6.26435830421285e-07, - "loss": 0.5127, - "step": 74116 - }, - { - "epoch": 1.9, - "learning_rate": 6.264101633311803e-07, - "loss": 0.5747, - "step": 74117 - }, - { - "epoch": 1.9, - "learning_rate": 6.26384496527116e-07, - "loss": 0.4912, - "step": 74118 - }, - { - "epoch": 1.9, - "learning_rate": 6.263588300091123e-07, - "loss": 0.5503, - "step": 74119 - }, - { - "epoch": 1.9, - "learning_rate": 6.263331637771883e-07, - "loss": 0.6152, - "step": 74120 - }, - { - "epoch": 1.9, - "learning_rate": 6.263074978313636e-07, - "loss": 0.5688, - "step": 74121 - }, - { - "epoch": 1.9, - "learning_rate": 6.262818321716582e-07, - "loss": 0.4856, - "step": 74122 - }, - { - "epoch": 1.9, - "learning_rate": 6.262561667980914e-07, - "loss": 0.6025, - "step": 74123 - }, - { - "epoch": 1.9, - "learning_rate": 6.262305017106833e-07, - "loss": 0.7041, - "step": 74124 - }, - { - "epoch": 1.9, - "learning_rate": 6.262048369094532e-07, - "loss": 0.3745, - "step": 74125 - }, - { - "epoch": 1.9, - "learning_rate": 6.26179172394421e-07, - "loss": 0.6519, - "step": 74126 - }, - { - "epoch": 1.9, - "learning_rate": 6.26153508165606e-07, - "loss": 0.7549, - "step": 74127 - }, - { - "epoch": 1.9, - "learning_rate": 6.261278442230284e-07, - "loss": 0.6406, - "step": 74128 - }, - { - "epoch": 1.9, - "learning_rate": 6.261021805667075e-07, - "loss": 0.6436, - "step": 74129 - }, - { - "epoch": 1.9, - "learning_rate": 6.260765171966629e-07, - "loss": 0.6323, - "step": 74130 - }, - { - "epoch": 1.9, - "learning_rate": 6.260508541129141e-07, - "loss": 0.5737, - "step": 74131 - }, - { - "epoch": 1.9, - "learning_rate": 6.260251913154813e-07, - "loss": 0.5908, - "step": 74132 - }, - { - "epoch": 1.9, - "learning_rate": 6.259995288043834e-07, - "loss": 0.4248, - "step": 74133 - }, - { - "epoch": 1.9, - "learning_rate": 6.259738665796408e-07, - "loss": 0.5842, - "step": 74134 - }, - { - "epoch": 1.9, - "learning_rate": 6.259482046412725e-07, - "loss": 0.6709, - "step": 74135 - }, - { - "epoch": 1.9, - "learning_rate": 6.259225429892987e-07, - "loss": 0.5818, - "step": 74136 - }, - { - "epoch": 1.9, - "learning_rate": 6.258968816237387e-07, - "loss": 0.5054, - "step": 74137 - }, - { - "epoch": 1.9, - "learning_rate": 6.258712205446123e-07, - "loss": 0.6797, - "step": 74138 - }, - { - "epoch": 1.9, - "learning_rate": 6.258455597519394e-07, - "loss": 0.5325, - "step": 74139 - }, - { - "epoch": 1.9, - "learning_rate": 6.25819899245739e-07, - "loss": 0.6797, - "step": 74140 - }, - { - "epoch": 1.9, - "learning_rate": 6.257942390260312e-07, - "loss": 0.6338, - "step": 74141 - }, - { - "epoch": 1.9, - "learning_rate": 6.257685790928353e-07, - "loss": 0.7344, - "step": 74142 - }, - { - "epoch": 1.9, - "learning_rate": 6.257429194461717e-07, - "loss": 0.5757, - "step": 74143 - }, - { - "epoch": 1.9, - "learning_rate": 6.25717260086059e-07, - "loss": 0.6943, - "step": 74144 - }, - { - "epoch": 1.9, - "learning_rate": 6.256916010125177e-07, - "loss": 0.6572, - "step": 74145 - }, - { - "epoch": 1.9, - "learning_rate": 6.256659422255669e-07, - "loss": 0.7275, - "step": 74146 - }, - { - "epoch": 1.9, - "learning_rate": 6.256402837252268e-07, - "loss": 0.6128, - "step": 74147 - }, - { - "epoch": 1.9, - "learning_rate": 6.256146255115162e-07, - "loss": 0.708, - "step": 74148 - }, - { - "epoch": 1.9, - "learning_rate": 6.255889675844562e-07, - "loss": 0.593, - "step": 74149 - }, - { - "epoch": 1.9, - "learning_rate": 6.255633099440648e-07, - "loss": 0.748, - "step": 74150 - }, - { - "epoch": 1.9, - "learning_rate": 6.255376525903626e-07, - "loss": 0.6348, - "step": 74151 - }, - { - "epoch": 1.9, - "learning_rate": 6.255119955233687e-07, - "loss": 0.4338, - "step": 74152 - }, - { - "epoch": 1.9, - "learning_rate": 6.254863387431033e-07, - "loss": 0.521, - "step": 74153 - }, - { - "epoch": 1.9, - "learning_rate": 6.254606822495855e-07, - "loss": 0.7163, - "step": 74154 - }, - { - "epoch": 1.9, - "learning_rate": 6.254350260428356e-07, - "loss": 0.6514, - "step": 74155 - }, - { - "epoch": 1.9, - "learning_rate": 6.254093701228727e-07, - "loss": 0.6182, - "step": 74156 - }, - { - "epoch": 1.9, - "learning_rate": 6.253837144897167e-07, - "loss": 0.575, - "step": 74157 - }, - { - "epoch": 1.9, - "learning_rate": 6.253580591433869e-07, - "loss": 0.6021, - "step": 74158 - }, - { - "epoch": 1.9, - "learning_rate": 6.253324040839038e-07, - "loss": 0.6523, - "step": 74159 - }, - { - "epoch": 1.9, - "learning_rate": 6.253067493112861e-07, - "loss": 0.4763, - "step": 74160 - }, - { - "epoch": 1.9, - "learning_rate": 6.252810948255536e-07, - "loss": 0.3882, - "step": 74161 - }, - { - "epoch": 1.9, - "learning_rate": 6.252554406267265e-07, - "loss": 0.8906, - "step": 74162 - }, - { - "epoch": 1.9, - "learning_rate": 6.252297867148237e-07, - "loss": 0.5908, - "step": 74163 - }, - { - "epoch": 1.9, - "learning_rate": 6.252041330898655e-07, - "loss": 0.6191, - "step": 74164 - }, - { - "epoch": 1.9, - "learning_rate": 6.251784797518709e-07, - "loss": 0.5605, - "step": 74165 - }, - { - "epoch": 1.9, - "learning_rate": 6.251528267008603e-07, - "loss": 0.6611, - "step": 74166 - }, - { - "epoch": 1.9, - "learning_rate": 6.251271739368529e-07, - "loss": 0.5957, - "step": 74167 - }, - { - "epoch": 1.9, - "learning_rate": 6.251015214598681e-07, - "loss": 0.7109, - "step": 74168 - }, - { - "epoch": 1.9, - "learning_rate": 6.250758692699264e-07, - "loss": 0.3484, - "step": 74169 - }, - { - "epoch": 1.9, - "learning_rate": 6.250502173670466e-07, - "loss": 0.6206, - "step": 74170 - }, - { - "epoch": 1.9, - "learning_rate": 6.250245657512482e-07, - "loss": 0.6719, - "step": 74171 - }, - { - "epoch": 1.9, - "learning_rate": 6.249989144225518e-07, - "loss": 0.5601, - "step": 74172 - }, - { - "epoch": 1.9, - "learning_rate": 6.249732633809761e-07, - "loss": 0.5903, - "step": 74173 - }, - { - "epoch": 1.9, - "learning_rate": 6.249476126265412e-07, - "loss": 0.4106, - "step": 74174 - }, - { - "epoch": 1.9, - "learning_rate": 6.249219621592667e-07, - "loss": 0.7207, - "step": 74175 - }, - { - "epoch": 1.9, - "learning_rate": 6.248963119791723e-07, - "loss": 0.5107, - "step": 74176 - }, - { - "epoch": 1.9, - "learning_rate": 6.248706620862773e-07, - "loss": 0.6328, - "step": 74177 - }, - { - "epoch": 1.9, - "learning_rate": 6.248450124806022e-07, - "loss": 0.6738, - "step": 74178 - }, - { - "epoch": 1.9, - "learning_rate": 6.248193631621656e-07, - "loss": 0.6465, - "step": 74179 - }, - { - "epoch": 1.9, - "learning_rate": 6.247937141309874e-07, - "loss": 0.6875, - "step": 74180 - }, - { - "epoch": 1.9, - "learning_rate": 6.247680653870877e-07, - "loss": 0.7197, - "step": 74181 - }, - { - "epoch": 1.9, - "learning_rate": 6.247424169304855e-07, - "loss": 0.5845, - "step": 74182 - }, - { - "epoch": 1.9, - "learning_rate": 6.247167687612011e-07, - "loss": 0.6622, - "step": 74183 - }, - { - "epoch": 1.9, - "learning_rate": 6.246911208792536e-07, - "loss": 0.5066, - "step": 74184 - }, - { - "epoch": 1.9, - "learning_rate": 6.246654732846629e-07, - "loss": 0.5454, - "step": 74185 - }, - { - "epoch": 1.9, - "learning_rate": 6.246398259774487e-07, - "loss": 0.5671, - "step": 74186 - }, - { - "epoch": 1.9, - "learning_rate": 6.246141789576304e-07, - "loss": 0.5615, - "step": 74187 - }, - { - "epoch": 1.9, - "learning_rate": 6.24588532225228e-07, - "loss": 0.6572, - "step": 74188 - }, - { - "epoch": 1.9, - "learning_rate": 6.245628857802609e-07, - "loss": 0.6211, - "step": 74189 - }, - { - "epoch": 1.9, - "learning_rate": 6.245372396227484e-07, - "loss": 0.4089, - "step": 74190 - }, - { - "epoch": 1.9, - "learning_rate": 6.245115937527106e-07, - "loss": 0.8613, - "step": 74191 - }, - { - "epoch": 1.9, - "learning_rate": 6.24485948170167e-07, - "loss": 0.5811, - "step": 74192 - }, - { - "epoch": 1.9, - "learning_rate": 6.244603028751373e-07, - "loss": 0.5542, - "step": 74193 - }, - { - "epoch": 1.9, - "learning_rate": 6.24434657867641e-07, - "loss": 0.6348, - "step": 74194 - }, - { - "epoch": 1.9, - "learning_rate": 6.244090131476978e-07, - "loss": 0.5801, - "step": 74195 - }, - { - "epoch": 1.9, - "learning_rate": 6.243833687153273e-07, - "loss": 0.7021, - "step": 74196 - }, - { - "epoch": 1.9, - "learning_rate": 6.243577245705494e-07, - "loss": 0.4941, - "step": 74197 - }, - { - "epoch": 1.9, - "learning_rate": 6.243320807133836e-07, - "loss": 0.6597, - "step": 74198 - }, - { - "epoch": 1.9, - "learning_rate": 6.243064371438492e-07, - "loss": 0.7432, - "step": 74199 - }, - { - "epoch": 1.9, - "learning_rate": 6.242807938619663e-07, - "loss": 0.6206, - "step": 74200 - }, - { - "epoch": 1.9, - "learning_rate": 6.242551508677541e-07, - "loss": 0.6768, - "step": 74201 - }, - { - "epoch": 1.9, - "learning_rate": 6.242295081612325e-07, - "loss": 0.5874, - "step": 74202 - }, - { - "epoch": 1.9, - "learning_rate": 6.242038657424211e-07, - "loss": 0.5493, - "step": 74203 - }, - { - "epoch": 1.9, - "learning_rate": 6.241782236113396e-07, - "loss": 0.3569, - "step": 74204 - }, - { - "epoch": 1.9, - "learning_rate": 6.241525817680073e-07, - "loss": 0.6304, - "step": 74205 - }, - { - "epoch": 1.9, - "learning_rate": 6.241269402124443e-07, - "loss": 0.6396, - "step": 74206 - }, - { - "epoch": 1.9, - "learning_rate": 6.2410129894467e-07, - "loss": 0.6963, - "step": 74207 - }, - { - "epoch": 1.9, - "learning_rate": 6.240756579647044e-07, - "loss": 0.6338, - "step": 74208 - }, - { - "epoch": 1.9, - "learning_rate": 6.240500172725662e-07, - "loss": 0.6494, - "step": 74209 - }, - { - "epoch": 1.9, - "learning_rate": 6.24024376868276e-07, - "loss": 0.6924, - "step": 74210 - }, - { - "epoch": 1.9, - "learning_rate": 6.239987367518526e-07, - "loss": 0.6338, - "step": 74211 - }, - { - "epoch": 1.9, - "learning_rate": 6.239730969233165e-07, - "loss": 0.7358, - "step": 74212 - }, - { - "epoch": 1.9, - "learning_rate": 6.239474573826866e-07, - "loss": 0.5327, - "step": 74213 - }, - { - "epoch": 1.9, - "learning_rate": 6.239218181299833e-07, - "loss": 0.6699, - "step": 74214 - }, - { - "epoch": 1.9, - "learning_rate": 6.238961791652253e-07, - "loss": 0.6836, - "step": 74215 - }, - { - "epoch": 1.9, - "learning_rate": 6.238705404884329e-07, - "loss": 0.7568, - "step": 74216 - }, - { - "epoch": 1.9, - "learning_rate": 6.238449020996254e-07, - "loss": 0.5845, - "step": 74217 - }, - { - "epoch": 1.9, - "learning_rate": 6.238192639988229e-07, - "loss": 0.425, - "step": 74218 - }, - { - "epoch": 1.9, - "learning_rate": 6.237936261860446e-07, - "loss": 0.5696, - "step": 74219 - }, - { - "epoch": 1.9, - "learning_rate": 6.237679886613102e-07, - "loss": 0.5928, - "step": 74220 - }, - { - "epoch": 1.9, - "learning_rate": 6.237423514246392e-07, - "loss": 0.7803, - "step": 74221 - }, - { - "epoch": 1.9, - "learning_rate": 6.237167144760514e-07, - "loss": 0.6328, - "step": 74222 - }, - { - "epoch": 1.9, - "learning_rate": 6.236910778155663e-07, - "loss": 0.8232, - "step": 74223 - }, - { - "epoch": 1.9, - "learning_rate": 6.236654414432039e-07, - "loss": 0.6387, - "step": 74224 - }, - { - "epoch": 1.9, - "learning_rate": 6.236398053589833e-07, - "loss": 0.6318, - "step": 74225 - }, - { - "epoch": 1.9, - "learning_rate": 6.236141695629246e-07, - "loss": 0.7441, - "step": 74226 - }, - { - "epoch": 1.9, - "learning_rate": 6.23588534055047e-07, - "loss": 0.6514, - "step": 74227 - }, - { - "epoch": 1.9, - "learning_rate": 6.235628988353708e-07, - "loss": 0.6055, - "step": 74228 - }, - { - "epoch": 1.9, - "learning_rate": 6.235372639039149e-07, - "loss": 0.5664, - "step": 74229 - }, - { - "epoch": 1.9, - "learning_rate": 6.235116292606993e-07, - "loss": 0.6099, - "step": 74230 - }, - { - "epoch": 1.9, - "learning_rate": 6.234859949057434e-07, - "loss": 0.6052, - "step": 74231 - }, - { - "epoch": 1.9, - "learning_rate": 6.234603608390668e-07, - "loss": 0.5991, - "step": 74232 - }, - { - "epoch": 1.9, - "learning_rate": 6.234347270606897e-07, - "loss": 0.6099, - "step": 74233 - }, - { - "epoch": 1.9, - "learning_rate": 6.234090935706308e-07, - "loss": 0.6387, - "step": 74234 - }, - { - "epoch": 1.9, - "learning_rate": 6.233834603689108e-07, - "loss": 0.553, - "step": 74235 - }, - { - "epoch": 1.9, - "learning_rate": 6.233578274555482e-07, - "loss": 0.6758, - "step": 74236 - }, - { - "epoch": 1.9, - "learning_rate": 6.233321948305637e-07, - "loss": 0.6641, - "step": 74237 - }, - { - "epoch": 1.9, - "learning_rate": 6.233065624939764e-07, - "loss": 0.6343, - "step": 74238 - }, - { - "epoch": 1.9, - "learning_rate": 6.232809304458059e-07, - "loss": 0.6367, - "step": 74239 - }, - { - "epoch": 1.9, - "learning_rate": 6.232552986860716e-07, - "loss": 0.4219, - "step": 74240 - }, - { - "epoch": 1.9, - "learning_rate": 6.232296672147936e-07, - "loss": 0.7012, - "step": 74241 - }, - { - "epoch": 1.9, - "learning_rate": 6.232040360319911e-07, - "loss": 0.5051, - "step": 74242 - }, - { - "epoch": 1.9, - "learning_rate": 6.231784051376842e-07, - "loss": 0.6538, - "step": 74243 - }, - { - "epoch": 1.9, - "learning_rate": 6.231527745318919e-07, - "loss": 0.564, - "step": 74244 - }, - { - "epoch": 1.9, - "learning_rate": 6.231271442146347e-07, - "loss": 0.668, - "step": 74245 - }, - { - "epoch": 1.9, - "learning_rate": 6.231015141859312e-07, - "loss": 0.667, - "step": 74246 - }, - { - "epoch": 1.9, - "learning_rate": 6.230758844458019e-07, - "loss": 0.5747, - "step": 74247 - }, - { - "epoch": 1.9, - "learning_rate": 6.230502549942662e-07, - "loss": 0.4698, - "step": 74248 - }, - { - "epoch": 1.9, - "learning_rate": 6.230246258313434e-07, - "loss": 0.7676, - "step": 74249 - }, - { - "epoch": 1.9, - "learning_rate": 6.229989969570533e-07, - "loss": 0.5454, - "step": 74250 - }, - { - "epoch": 1.9, - "learning_rate": 6.229733683714153e-07, - "loss": 0.6553, - "step": 74251 - }, - { - "epoch": 1.9, - "learning_rate": 6.229477400744496e-07, - "loss": 0.7046, - "step": 74252 - }, - { - "epoch": 1.9, - "learning_rate": 6.229221120661751e-07, - "loss": 0.6802, - "step": 74253 - }, - { - "epoch": 1.9, - "learning_rate": 6.228964843466123e-07, - "loss": 0.54, - "step": 74254 - }, - { - "epoch": 1.9, - "learning_rate": 6.228708569157799e-07, - "loss": 0.8535, - "step": 74255 - }, - { - "epoch": 1.9, - "learning_rate": 6.228452297736982e-07, - "loss": 0.7031, - "step": 74256 - }, - { - "epoch": 1.9, - "learning_rate": 6.228196029203865e-07, - "loss": 0.6777, - "step": 74257 - }, - { - "epoch": 1.9, - "learning_rate": 6.227939763558647e-07, - "loss": 0.6421, - "step": 74258 - }, - { - "epoch": 1.9, - "learning_rate": 6.227683500801518e-07, - "loss": 0.5811, - "step": 74259 - }, - { - "epoch": 1.9, - "learning_rate": 6.227427240932681e-07, - "loss": 0.6143, - "step": 74260 - }, - { - "epoch": 1.9, - "learning_rate": 6.227170983952327e-07, - "loss": 0.6553, - "step": 74261 - }, - { - "epoch": 1.9, - "learning_rate": 6.226914729860657e-07, - "loss": 0.5781, - "step": 74262 - }, - { - "epoch": 1.9, - "learning_rate": 6.226658478657862e-07, - "loss": 0.6042, - "step": 74263 - }, - { - "epoch": 1.9, - "learning_rate": 6.226402230344144e-07, - "loss": 0.6763, - "step": 74264 - }, - { - "epoch": 1.9, - "learning_rate": 6.226145984919695e-07, - "loss": 0.6445, - "step": 74265 - }, - { - "epoch": 1.9, - "learning_rate": 6.225889742384713e-07, - "loss": 0.3785, - "step": 74266 - }, - { - "epoch": 1.9, - "learning_rate": 6.225633502739393e-07, - "loss": 0.7451, - "step": 74267 - }, - { - "epoch": 1.9, - "learning_rate": 6.225377265983935e-07, - "loss": 0.5654, - "step": 74268 - }, - { - "epoch": 1.9, - "learning_rate": 6.22512103211853e-07, - "loss": 0.6592, - "step": 74269 - }, - { - "epoch": 1.9, - "learning_rate": 6.224864801143374e-07, - "loss": 0.5684, - "step": 74270 - }, - { - "epoch": 1.9, - "learning_rate": 6.224608573058668e-07, - "loss": 0.6797, - "step": 74271 - }, - { - "epoch": 1.9, - "learning_rate": 6.224352347864604e-07, - "loss": 0.6777, - "step": 74272 - }, - { - "epoch": 1.9, - "learning_rate": 6.224096125561382e-07, - "loss": 0.5317, - "step": 74273 - }, - { - "epoch": 1.9, - "learning_rate": 6.223839906149194e-07, - "loss": 0.6611, - "step": 74274 - }, - { - "epoch": 1.9, - "learning_rate": 6.223583689628238e-07, - "loss": 0.6904, - "step": 74275 - }, - { - "epoch": 1.9, - "learning_rate": 6.223327475998712e-07, - "loss": 0.6611, - "step": 74276 - }, - { - "epoch": 1.9, - "learning_rate": 6.223071265260809e-07, - "loss": 0.7314, - "step": 74277 - }, - { - "epoch": 1.9, - "learning_rate": 6.222815057414729e-07, - "loss": 0.6392, - "step": 74278 - }, - { - "epoch": 1.9, - "learning_rate": 6.222558852460666e-07, - "loss": 0.5962, - "step": 74279 - }, - { - "epoch": 1.9, - "learning_rate": 6.222302650398812e-07, - "loss": 0.7422, - "step": 74280 - }, - { - "epoch": 1.9, - "learning_rate": 6.222046451229371e-07, - "loss": 0.6694, - "step": 74281 - }, - { - "epoch": 1.9, - "learning_rate": 6.221790254952532e-07, - "loss": 0.6431, - "step": 74282 - }, - { - "epoch": 1.9, - "learning_rate": 6.221534061568497e-07, - "loss": 0.7188, - "step": 74283 - }, - { - "epoch": 1.9, - "learning_rate": 6.221277871077457e-07, - "loss": 0.6807, - "step": 74284 - }, - { - "epoch": 1.9, - "learning_rate": 6.221021683479612e-07, - "loss": 0.6514, - "step": 74285 - }, - { - "epoch": 1.9, - "learning_rate": 6.220765498775156e-07, - "loss": 0.6602, - "step": 74286 - }, - { - "epoch": 1.9, - "learning_rate": 6.220509316964288e-07, - "loss": 0.5645, - "step": 74287 - }, - { - "epoch": 1.9, - "learning_rate": 6.220253138047205e-07, - "loss": 0.6914, - "step": 74288 - }, - { - "epoch": 1.9, - "learning_rate": 6.219996962024096e-07, - "loss": 0.6577, - "step": 74289 - }, - { - "epoch": 1.9, - "learning_rate": 6.219740788895163e-07, - "loss": 0.6895, - "step": 74290 - }, - { - "epoch": 1.9, - "learning_rate": 6.2194846186606e-07, - "loss": 0.6304, - "step": 74291 - }, - { - "epoch": 1.9, - "learning_rate": 6.219228451320604e-07, - "loss": 0.6494, - "step": 74292 - }, - { - "epoch": 1.9, - "learning_rate": 6.218972286875372e-07, - "loss": 0.5435, - "step": 74293 - }, - { - "epoch": 1.9, - "learning_rate": 6.218716125325097e-07, - "loss": 0.5566, - "step": 74294 - }, - { - "epoch": 1.9, - "learning_rate": 6.218459966669979e-07, - "loss": 0.4165, - "step": 74295 - }, - { - "epoch": 1.9, - "learning_rate": 6.218203810910209e-07, - "loss": 0.6646, - "step": 74296 - }, - { - "epoch": 1.9, - "learning_rate": 6.217947658045991e-07, - "loss": 0.6816, - "step": 74297 - }, - { - "epoch": 1.9, - "learning_rate": 6.217691508077517e-07, - "loss": 0.7007, - "step": 74298 - }, - { - "epoch": 1.9, - "learning_rate": 6.217435361004979e-07, - "loss": 0.5537, - "step": 74299 - }, - { - "epoch": 1.9, - "learning_rate": 6.217179216828579e-07, - "loss": 0.6953, - "step": 74300 - }, - { - "epoch": 1.9, - "learning_rate": 6.216923075548509e-07, - "loss": 0.3933, - "step": 74301 - }, - { - "epoch": 1.9, - "learning_rate": 6.216666937164969e-07, - "loss": 0.7686, - "step": 74302 - }, - { - "epoch": 1.9, - "learning_rate": 6.216410801678152e-07, - "loss": 0.7988, - "step": 74303 - }, - { - "epoch": 1.9, - "learning_rate": 6.216154669088255e-07, - "loss": 0.6484, - "step": 74304 - }, - { - "epoch": 1.9, - "learning_rate": 6.215898539395474e-07, - "loss": 0.543, - "step": 74305 - }, - { - "epoch": 1.9, - "learning_rate": 6.215642412600006e-07, - "loss": 0.4124, - "step": 74306 - }, - { - "epoch": 1.9, - "learning_rate": 6.215386288702047e-07, - "loss": 0.6016, - "step": 74307 - }, - { - "epoch": 1.9, - "learning_rate": 6.215130167701794e-07, - "loss": 0.6318, - "step": 74308 - }, - { - "epoch": 1.9, - "learning_rate": 6.214874049599442e-07, - "loss": 0.6855, - "step": 74309 - }, - { - "epoch": 1.9, - "learning_rate": 6.214617934395186e-07, - "loss": 0.6523, - "step": 74310 - }, - { - "epoch": 1.9, - "learning_rate": 6.214361822089221e-07, - "loss": 0.5923, - "step": 74311 - }, - { - "epoch": 1.9, - "learning_rate": 6.214105712681748e-07, - "loss": 0.498, - "step": 74312 - }, - { - "epoch": 1.9, - "learning_rate": 6.213849606172957e-07, - "loss": 0.71, - "step": 74313 - }, - { - "epoch": 1.9, - "learning_rate": 6.21359350256305e-07, - "loss": 0.6602, - "step": 74314 - }, - { - "epoch": 1.9, - "learning_rate": 6.213337401852217e-07, - "loss": 0.6367, - "step": 74315 - }, - { - "epoch": 1.9, - "learning_rate": 6.213081304040662e-07, - "loss": 0.7158, - "step": 74316 - }, - { - "epoch": 1.9, - "learning_rate": 6.212825209128571e-07, - "loss": 0.6062, - "step": 74317 - }, - { - "epoch": 1.9, - "learning_rate": 6.212569117116153e-07, - "loss": 0.604, - "step": 74318 - }, - { - "epoch": 1.9, - "learning_rate": 6.212313028003593e-07, - "loss": 0.6396, - "step": 74319 - }, - { - "epoch": 1.9, - "learning_rate": 6.212056941791088e-07, - "loss": 0.666, - "step": 74320 - }, - { - "epoch": 1.9, - "learning_rate": 6.211800858478841e-07, - "loss": 0.6377, - "step": 74321 - }, - { - "epoch": 1.9, - "learning_rate": 6.211544778067039e-07, - "loss": 0.4697, - "step": 74322 - }, - { - "epoch": 1.9, - "learning_rate": 6.211288700555887e-07, - "loss": 0.6719, - "step": 74323 - }, - { - "epoch": 1.9, - "learning_rate": 6.211032625945576e-07, - "loss": 0.6528, - "step": 74324 - }, - { - "epoch": 1.9, - "learning_rate": 6.210776554236303e-07, - "loss": 0.5574, - "step": 74325 - }, - { - "epoch": 1.91, - "learning_rate": 6.210520485428263e-07, - "loss": 0.4536, - "step": 74326 - }, - { - "epoch": 1.91, - "learning_rate": 6.210264419521656e-07, - "loss": 0.7236, - "step": 74327 - }, - { - "epoch": 1.91, - "learning_rate": 6.210008356516676e-07, - "loss": 0.6084, - "step": 74328 - }, - { - "epoch": 1.91, - "learning_rate": 6.209752296413517e-07, - "loss": 0.7861, - "step": 74329 - }, - { - "epoch": 1.91, - "learning_rate": 6.209496239212372e-07, - "loss": 0.6689, - "step": 74330 - }, - { - "epoch": 1.91, - "learning_rate": 6.209240184913447e-07, - "loss": 0.6377, - "step": 74331 - }, - { - "epoch": 1.91, - "learning_rate": 6.208984133516929e-07, - "loss": 0.4048, - "step": 74332 - }, - { - "epoch": 1.91, - "learning_rate": 6.208728085023021e-07, - "loss": 0.5945, - "step": 74333 - }, - { - "epoch": 1.91, - "learning_rate": 6.208472039431912e-07, - "loss": 0.6582, - "step": 74334 - }, - { - "epoch": 1.91, - "learning_rate": 6.208215996743803e-07, - "loss": 0.7754, - "step": 74335 - }, - { - "epoch": 1.91, - "learning_rate": 6.207959956958888e-07, - "loss": 0.6333, - "step": 74336 - }, - { - "epoch": 1.91, - "learning_rate": 6.207703920077365e-07, - "loss": 0.6758, - "step": 74337 - }, - { - "epoch": 1.91, - "learning_rate": 6.20744788609943e-07, - "loss": 0.7051, - "step": 74338 - }, - { - "epoch": 1.91, - "learning_rate": 6.207191855025276e-07, - "loss": 0.6021, - "step": 74339 - }, - { - "epoch": 1.91, - "learning_rate": 6.206935826855101e-07, - "loss": 0.8379, - "step": 74340 - }, - { - "epoch": 1.91, - "learning_rate": 6.206679801589099e-07, - "loss": 0.4919, - "step": 74341 - }, - { - "epoch": 1.91, - "learning_rate": 6.20642377922747e-07, - "loss": 0.3822, - "step": 74342 - }, - { - "epoch": 1.91, - "learning_rate": 6.206167759770407e-07, - "loss": 0.6084, - "step": 74343 - }, - { - "epoch": 1.91, - "learning_rate": 6.205911743218106e-07, - "loss": 0.6274, - "step": 74344 - }, - { - "epoch": 1.91, - "learning_rate": 6.205655729570765e-07, - "loss": 0.6523, - "step": 74345 - }, - { - "epoch": 1.91, - "learning_rate": 6.205399718828579e-07, - "loss": 0.647, - "step": 74346 - }, - { - "epoch": 1.91, - "learning_rate": 6.205143710991743e-07, - "loss": 0.6509, - "step": 74347 - }, - { - "epoch": 1.91, - "learning_rate": 6.20488770606046e-07, - "loss": 0.4719, - "step": 74348 - }, - { - "epoch": 1.91, - "learning_rate": 6.204631704034914e-07, - "loss": 0.6475, - "step": 74349 - }, - { - "epoch": 1.91, - "learning_rate": 6.204375704915308e-07, - "loss": 0.5366, - "step": 74350 - }, - { - "epoch": 1.91, - "learning_rate": 6.204119708701836e-07, - "loss": 0.4897, - "step": 74351 - }, - { - "epoch": 1.91, - "learning_rate": 6.203863715394697e-07, - "loss": 0.6729, - "step": 74352 - }, - { - "epoch": 1.91, - "learning_rate": 6.203607724994082e-07, - "loss": 0.5967, - "step": 74353 - }, - { - "epoch": 1.91, - "learning_rate": 6.203351737500193e-07, - "loss": 0.635, - "step": 74354 - }, - { - "epoch": 1.91, - "learning_rate": 6.203095752913221e-07, - "loss": 0.5386, - "step": 74355 - }, - { - "epoch": 1.91, - "learning_rate": 6.202839771233366e-07, - "loss": 0.6211, - "step": 74356 - }, - { - "epoch": 1.91, - "learning_rate": 6.202583792460819e-07, - "loss": 0.8125, - "step": 74357 - }, - { - "epoch": 1.91, - "learning_rate": 6.202327816595784e-07, - "loss": 0.5254, - "step": 74358 - }, - { - "epoch": 1.91, - "learning_rate": 6.20207184363845e-07, - "loss": 0.6494, - "step": 74359 - }, - { - "epoch": 1.91, - "learning_rate": 6.201815873589012e-07, - "loss": 0.6646, - "step": 74360 - }, - { - "epoch": 1.91, - "learning_rate": 6.201559906447672e-07, - "loss": 0.5796, - "step": 74361 - }, - { - "epoch": 1.91, - "learning_rate": 6.20130394221462e-07, - "loss": 0.6714, - "step": 74362 - }, - { - "epoch": 1.91, - "learning_rate": 6.201047980890057e-07, - "loss": 0.5796, - "step": 74363 - }, - { - "epoch": 1.91, - "learning_rate": 6.200792022474175e-07, - "loss": 0.6836, - "step": 74364 - }, - { - "epoch": 1.91, - "learning_rate": 6.200536066967175e-07, - "loss": 0.5085, - "step": 74365 - }, - { - "epoch": 1.91, - "learning_rate": 6.200280114369249e-07, - "loss": 0.6943, - "step": 74366 - }, - { - "epoch": 1.91, - "learning_rate": 6.20002416468059e-07, - "loss": 0.6128, - "step": 74367 - }, - { - "epoch": 1.91, - "learning_rate": 6.199768217901405e-07, - "loss": 0.5532, - "step": 74368 - }, - { - "epoch": 1.91, - "learning_rate": 6.19951227403188e-07, - "loss": 0.6436, - "step": 74369 - }, - { - "epoch": 1.91, - "learning_rate": 6.199256333072211e-07, - "loss": 0.5715, - "step": 74370 - }, - { - "epoch": 1.91, - "learning_rate": 6.199000395022597e-07, - "loss": 0.5654, - "step": 74371 - }, - { - "epoch": 1.91, - "learning_rate": 6.198744459883234e-07, - "loss": 0.5979, - "step": 74372 - }, - { - "epoch": 1.91, - "learning_rate": 6.198488527654319e-07, - "loss": 0.7109, - "step": 74373 - }, - { - "epoch": 1.91, - "learning_rate": 6.198232598336044e-07, - "loss": 0.5547, - "step": 74374 - }, - { - "epoch": 1.91, - "learning_rate": 6.19797667192861e-07, - "loss": 0.6987, - "step": 74375 - }, - { - "epoch": 1.91, - "learning_rate": 6.197720748432208e-07, - "loss": 0.7305, - "step": 74376 - }, - { - "epoch": 1.91, - "learning_rate": 6.197464827847038e-07, - "loss": 0.5723, - "step": 74377 - }, - { - "epoch": 1.91, - "learning_rate": 6.197208910173297e-07, - "loss": 0.5903, - "step": 74378 - }, - { - "epoch": 1.91, - "learning_rate": 6.196952995411175e-07, - "loss": 0.668, - "step": 74379 - }, - { - "epoch": 1.91, - "learning_rate": 6.196697083560872e-07, - "loss": 0.5571, - "step": 74380 - }, - { - "epoch": 1.91, - "learning_rate": 6.196441174622582e-07, - "loss": 0.6426, - "step": 74381 - }, - { - "epoch": 1.91, - "learning_rate": 6.196185268596503e-07, - "loss": 0.8018, - "step": 74382 - }, - { - "epoch": 1.91, - "learning_rate": 6.195929365482831e-07, - "loss": 0.6484, - "step": 74383 - }, - { - "epoch": 1.91, - "learning_rate": 6.195673465281759e-07, - "loss": 0.4929, - "step": 74384 - }, - { - "epoch": 1.91, - "learning_rate": 6.195417567993486e-07, - "loss": 0.5996, - "step": 74385 - }, - { - "epoch": 1.91, - "learning_rate": 6.195161673618207e-07, - "loss": 0.7705, - "step": 74386 - }, - { - "epoch": 1.91, - "learning_rate": 6.194905782156117e-07, - "loss": 0.4285, - "step": 74387 - }, - { - "epoch": 1.91, - "learning_rate": 6.194649893607416e-07, - "loss": 0.5938, - "step": 74388 - }, - { - "epoch": 1.91, - "learning_rate": 6.194394007972293e-07, - "loss": 0.6875, - "step": 74389 - }, - { - "epoch": 1.91, - "learning_rate": 6.19413812525095e-07, - "loss": 0.7725, - "step": 74390 - }, - { - "epoch": 1.91, - "learning_rate": 6.193882245443577e-07, - "loss": 0.4868, - "step": 74391 - }, - { - "epoch": 1.91, - "learning_rate": 6.193626368550376e-07, - "loss": 0.5806, - "step": 74392 - }, - { - "epoch": 1.91, - "learning_rate": 6.193370494571537e-07, - "loss": 0.4178, - "step": 74393 - }, - { - "epoch": 1.91, - "learning_rate": 6.193114623507263e-07, - "loss": 0.71, - "step": 74394 - }, - { - "epoch": 1.91, - "learning_rate": 6.192858755357743e-07, - "loss": 0.6548, - "step": 74395 - }, - { - "epoch": 1.91, - "learning_rate": 6.192602890123179e-07, - "loss": 0.7031, - "step": 74396 - }, - { - "epoch": 1.91, - "learning_rate": 6.192347027803761e-07, - "loss": 0.5068, - "step": 74397 - }, - { - "epoch": 1.91, - "learning_rate": 6.192091168399691e-07, - "loss": 0.3925, - "step": 74398 - }, - { - "epoch": 1.91, - "learning_rate": 6.191835311911162e-07, - "loss": 0.6973, - "step": 74399 - }, - { - "epoch": 1.91, - "learning_rate": 6.191579458338368e-07, - "loss": 0.6562, - "step": 74400 - }, - { - "epoch": 1.91, - "learning_rate": 6.191323607681505e-07, - "loss": 0.7354, - "step": 74401 - }, - { - "epoch": 1.91, - "learning_rate": 6.191067759940772e-07, - "loss": 0.6387, - "step": 74402 - }, - { - "epoch": 1.91, - "learning_rate": 6.19081191511636e-07, - "loss": 0.4043, - "step": 74403 - }, - { - "epoch": 1.91, - "learning_rate": 6.190556073208472e-07, - "loss": 0.7236, - "step": 74404 - }, - { - "epoch": 1.91, - "learning_rate": 6.190300234217299e-07, - "loss": 0.5225, - "step": 74405 - }, - { - "epoch": 1.91, - "learning_rate": 6.190044398143038e-07, - "loss": 0.5444, - "step": 74406 - }, - { - "epoch": 1.91, - "learning_rate": 6.189788564985883e-07, - "loss": 0.7773, - "step": 74407 - }, - { - "epoch": 1.91, - "learning_rate": 6.189532734746037e-07, - "loss": 0.6338, - "step": 74408 - }, - { - "epoch": 1.91, - "learning_rate": 6.189276907423689e-07, - "loss": 0.6289, - "step": 74409 - }, - { - "epoch": 1.91, - "learning_rate": 6.189021083019032e-07, - "loss": 0.7744, - "step": 74410 - }, - { - "epoch": 1.91, - "learning_rate": 6.18876526153227e-07, - "loss": 0.5669, - "step": 74411 - }, - { - "epoch": 1.91, - "learning_rate": 6.188509442963592e-07, - "loss": 0.6836, - "step": 74412 - }, - { - "epoch": 1.91, - "learning_rate": 6.1882536273132e-07, - "loss": 0.5347, - "step": 74413 - }, - { - "epoch": 1.91, - "learning_rate": 6.187997814581285e-07, - "loss": 0.7373, - "step": 74414 - }, - { - "epoch": 1.91, - "learning_rate": 6.187742004768046e-07, - "loss": 0.6191, - "step": 74415 - }, - { - "epoch": 1.91, - "learning_rate": 6.187486197873677e-07, - "loss": 0.5537, - "step": 74416 - }, - { - "epoch": 1.91, - "learning_rate": 6.187230393898375e-07, - "loss": 0.5791, - "step": 74417 - }, - { - "epoch": 1.91, - "learning_rate": 6.186974592842338e-07, - "loss": 0.6602, - "step": 74418 - }, - { - "epoch": 1.91, - "learning_rate": 6.186718794705758e-07, - "loss": 0.6182, - "step": 74419 - }, - { - "epoch": 1.91, - "learning_rate": 6.186462999488829e-07, - "loss": 0.6387, - "step": 74420 - }, - { - "epoch": 1.91, - "learning_rate": 6.186207207191751e-07, - "loss": 0.7378, - "step": 74421 - }, - { - "epoch": 1.91, - "learning_rate": 6.185951417814719e-07, - "loss": 0.5996, - "step": 74422 - }, - { - "epoch": 1.91, - "learning_rate": 6.185695631357931e-07, - "loss": 0.668, - "step": 74423 - }, - { - "epoch": 1.91, - "learning_rate": 6.185439847821576e-07, - "loss": 0.6196, - "step": 74424 - }, - { - "epoch": 1.91, - "learning_rate": 6.185184067205858e-07, - "loss": 0.6685, - "step": 74425 - }, - { - "epoch": 1.91, - "learning_rate": 6.184928289510967e-07, - "loss": 0.6084, - "step": 74426 - }, - { - "epoch": 1.91, - "learning_rate": 6.184672514737101e-07, - "loss": 0.5522, - "step": 74427 - }, - { - "epoch": 1.91, - "learning_rate": 6.184416742884459e-07, - "loss": 0.6577, - "step": 74428 - }, - { - "epoch": 1.91, - "learning_rate": 6.184160973953232e-07, - "loss": 0.7158, - "step": 74429 - }, - { - "epoch": 1.91, - "learning_rate": 6.183905207943617e-07, - "loss": 0.8486, - "step": 74430 - }, - { - "epoch": 1.91, - "learning_rate": 6.183649444855809e-07, - "loss": 0.6914, - "step": 74431 - }, - { - "epoch": 1.91, - "learning_rate": 6.183393684690007e-07, - "loss": 0.6353, - "step": 74432 - }, - { - "epoch": 1.91, - "learning_rate": 6.183137927446402e-07, - "loss": 0.5532, - "step": 74433 - }, - { - "epoch": 1.91, - "learning_rate": 6.182882173125197e-07, - "loss": 0.5273, - "step": 74434 - }, - { - "epoch": 1.91, - "learning_rate": 6.18262642172658e-07, - "loss": 0.5459, - "step": 74435 - }, - { - "epoch": 1.91, - "learning_rate": 6.182370673250752e-07, - "loss": 0.7002, - "step": 74436 - }, - { - "epoch": 1.91, - "learning_rate": 6.182114927697907e-07, - "loss": 0.5439, - "step": 74437 - }, - { - "epoch": 1.91, - "learning_rate": 6.181859185068245e-07, - "loss": 0.5566, - "step": 74438 - }, - { - "epoch": 1.91, - "learning_rate": 6.181603445361954e-07, - "loss": 0.6753, - "step": 74439 - }, - { - "epoch": 1.91, - "learning_rate": 6.181347708579234e-07, - "loss": 0.6685, - "step": 74440 - }, - { - "epoch": 1.91, - "learning_rate": 6.181091974720279e-07, - "loss": 0.5903, - "step": 74441 - }, - { - "epoch": 1.91, - "learning_rate": 6.180836243785289e-07, - "loss": 0.8291, - "step": 74442 - }, - { - "epoch": 1.91, - "learning_rate": 6.180580515774454e-07, - "loss": 0.5889, - "step": 74443 - }, - { - "epoch": 1.91, - "learning_rate": 6.180324790687976e-07, - "loss": 0.4854, - "step": 74444 - }, - { - "epoch": 1.91, - "learning_rate": 6.180069068526043e-07, - "loss": 0.5571, - "step": 74445 - }, - { - "epoch": 1.91, - "learning_rate": 6.179813349288861e-07, - "loss": 0.8027, - "step": 74446 - }, - { - "epoch": 1.91, - "learning_rate": 6.179557632976618e-07, - "loss": 0.6729, - "step": 74447 - }, - { - "epoch": 1.91, - "learning_rate": 6.179301919589514e-07, - "loss": 0.6416, - "step": 74448 - }, - { - "epoch": 1.91, - "learning_rate": 6.179046209127741e-07, - "loss": 0.6016, - "step": 74449 - }, - { - "epoch": 1.91, - "learning_rate": 6.178790501591495e-07, - "loss": 0.8164, - "step": 74450 - }, - { - "epoch": 1.91, - "learning_rate": 6.178534796980976e-07, - "loss": 0.7305, - "step": 74451 - }, - { - "epoch": 1.91, - "learning_rate": 6.178279095296375e-07, - "loss": 0.5913, - "step": 74452 - }, - { - "epoch": 1.91, - "learning_rate": 6.178023396537891e-07, - "loss": 0.5342, - "step": 74453 - }, - { - "epoch": 1.91, - "learning_rate": 6.177767700705719e-07, - "loss": 0.6089, - "step": 74454 - }, - { - "epoch": 1.91, - "learning_rate": 6.177512007800054e-07, - "loss": 0.6421, - "step": 74455 - }, - { - "epoch": 1.91, - "learning_rate": 6.177256317821093e-07, - "loss": 0.4812, - "step": 74456 - }, - { - "epoch": 1.91, - "learning_rate": 6.177000630769029e-07, - "loss": 0.5354, - "step": 74457 - }, - { - "epoch": 1.91, - "learning_rate": 6.176744946644066e-07, - "loss": 0.5541, - "step": 74458 - }, - { - "epoch": 1.91, - "learning_rate": 6.17648926544639e-07, - "loss": 0.6396, - "step": 74459 - }, - { - "epoch": 1.91, - "learning_rate": 6.176233587176197e-07, - "loss": 0.6729, - "step": 74460 - }, - { - "epoch": 1.91, - "learning_rate": 6.175977911833689e-07, - "loss": 0.7036, - "step": 74461 - }, - { - "epoch": 1.91, - "learning_rate": 6.175722239419058e-07, - "loss": 0.7041, - "step": 74462 - }, - { - "epoch": 1.91, - "learning_rate": 6.175466569932502e-07, - "loss": 0.5552, - "step": 74463 - }, - { - "epoch": 1.91, - "learning_rate": 6.175210903374213e-07, - "loss": 0.6167, - "step": 74464 - }, - { - "epoch": 1.91, - "learning_rate": 6.174955239744392e-07, - "loss": 0.7705, - "step": 74465 - }, - { - "epoch": 1.91, - "learning_rate": 6.174699579043229e-07, - "loss": 0.5063, - "step": 74466 - }, - { - "epoch": 1.91, - "learning_rate": 6.174443921270924e-07, - "loss": 0.7842, - "step": 74467 - }, - { - "epoch": 1.91, - "learning_rate": 6.174188266427676e-07, - "loss": 0.7412, - "step": 74468 - }, - { - "epoch": 1.91, - "learning_rate": 6.173932614513669e-07, - "loss": 0.5776, - "step": 74469 - }, - { - "epoch": 1.91, - "learning_rate": 6.173676965529109e-07, - "loss": 0.6494, - "step": 74470 - }, - { - "epoch": 1.91, - "learning_rate": 6.173421319474188e-07, - "loss": 0.7236, - "step": 74471 - }, - { - "epoch": 1.91, - "learning_rate": 6.173165676349102e-07, - "loss": 0.5864, - "step": 74472 - }, - { - "epoch": 1.91, - "learning_rate": 6.172910036154049e-07, - "loss": 0.7305, - "step": 74473 - }, - { - "epoch": 1.91, - "learning_rate": 6.17265439888922e-07, - "loss": 0.7617, - "step": 74474 - }, - { - "epoch": 1.91, - "learning_rate": 6.172398764554816e-07, - "loss": 0.5854, - "step": 74475 - }, - { - "epoch": 1.91, - "learning_rate": 6.172143133151027e-07, - "loss": 0.7285, - "step": 74476 - }, - { - "epoch": 1.91, - "learning_rate": 6.171887504678058e-07, - "loss": 0.498, - "step": 74477 - }, - { - "epoch": 1.91, - "learning_rate": 6.171631879136096e-07, - "loss": 0.543, - "step": 74478 - }, - { - "epoch": 1.91, - "learning_rate": 6.171376256525335e-07, - "loss": 0.689, - "step": 74479 - }, - { - "epoch": 1.91, - "learning_rate": 6.171120636845981e-07, - "loss": 0.7139, - "step": 74480 - }, - { - "epoch": 1.91, - "learning_rate": 6.170865020098219e-07, - "loss": 0.6187, - "step": 74481 - }, - { - "epoch": 1.91, - "learning_rate": 6.170609406282255e-07, - "loss": 0.6172, - "step": 74482 - }, - { - "epoch": 1.91, - "learning_rate": 6.170353795398273e-07, - "loss": 0.4465, - "step": 74483 - }, - { - "epoch": 1.91, - "learning_rate": 6.17009818744648e-07, - "loss": 0.7178, - "step": 74484 - }, - { - "epoch": 1.91, - "learning_rate": 6.169842582427063e-07, - "loss": 0.5269, - "step": 74485 - }, - { - "epoch": 1.91, - "learning_rate": 6.169586980340224e-07, - "loss": 0.7256, - "step": 74486 - }, - { - "epoch": 1.91, - "learning_rate": 6.169331381186159e-07, - "loss": 0.5493, - "step": 74487 - }, - { - "epoch": 1.91, - "learning_rate": 6.169075784965057e-07, - "loss": 0.5801, - "step": 74488 - }, - { - "epoch": 1.91, - "learning_rate": 6.168820191677117e-07, - "loss": 0.6899, - "step": 74489 - }, - { - "epoch": 1.91, - "learning_rate": 6.168564601322537e-07, - "loss": 0.6484, - "step": 74490 - }, - { - "epoch": 1.91, - "learning_rate": 6.168309013901509e-07, - "loss": 0.6172, - "step": 74491 - }, - { - "epoch": 1.91, - "learning_rate": 6.168053429414233e-07, - "loss": 0.6963, - "step": 74492 - }, - { - "epoch": 1.91, - "learning_rate": 6.167797847860898e-07, - "loss": 0.6035, - "step": 74493 - }, - { - "epoch": 1.91, - "learning_rate": 6.167542269241709e-07, - "loss": 0.7109, - "step": 74494 - }, - { - "epoch": 1.91, - "learning_rate": 6.167286693556852e-07, - "loss": 0.6577, - "step": 74495 - }, - { - "epoch": 1.91, - "learning_rate": 6.167031120806531e-07, - "loss": 0.479, - "step": 74496 - }, - { - "epoch": 1.91, - "learning_rate": 6.16677555099094e-07, - "loss": 0.6733, - "step": 74497 - }, - { - "epoch": 1.91, - "learning_rate": 6.166519984110269e-07, - "loss": 0.709, - "step": 74498 - }, - { - "epoch": 1.91, - "learning_rate": 6.166264420164719e-07, - "loss": 0.5669, - "step": 74499 - }, - { - "epoch": 1.91, - "learning_rate": 6.166008859154481e-07, - "loss": 0.5723, - "step": 74500 - }, - { - "epoch": 1.91, - "learning_rate": 6.165753301079757e-07, - "loss": 0.5898, - "step": 74501 - }, - { - "epoch": 1.91, - "learning_rate": 6.165497745940736e-07, - "loss": 0.6504, - "step": 74502 - }, - { - "epoch": 1.91, - "learning_rate": 6.165242193737621e-07, - "loss": 0.5854, - "step": 74503 - }, - { - "epoch": 1.91, - "learning_rate": 6.1649866444706e-07, - "loss": 0.6553, - "step": 74504 - }, - { - "epoch": 1.91, - "learning_rate": 6.164731098139875e-07, - "loss": 0.7402, - "step": 74505 - }, - { - "epoch": 1.91, - "learning_rate": 6.164475554745637e-07, - "loss": 0.6077, - "step": 74506 - }, - { - "epoch": 1.91, - "learning_rate": 6.164220014288091e-07, - "loss": 0.6436, - "step": 74507 - }, - { - "epoch": 1.91, - "learning_rate": 6.163964476767418e-07, - "loss": 0.6914, - "step": 74508 - }, - { - "epoch": 1.91, - "learning_rate": 6.163708942183823e-07, - "loss": 0.6421, - "step": 74509 - }, - { - "epoch": 1.91, - "learning_rate": 6.163453410537498e-07, - "loss": 0.6973, - "step": 74510 - }, - { - "epoch": 1.91, - "learning_rate": 6.163197881828642e-07, - "loss": 0.519, - "step": 74511 - }, - { - "epoch": 1.91, - "learning_rate": 6.162942356057447e-07, - "loss": 0.4932, - "step": 74512 - }, - { - "epoch": 1.91, - "learning_rate": 6.162686833224114e-07, - "loss": 0.7236, - "step": 74513 - }, - { - "epoch": 1.91, - "learning_rate": 6.162431313328831e-07, - "loss": 0.8545, - "step": 74514 - }, - { - "epoch": 1.91, - "learning_rate": 6.162175796371801e-07, - "loss": 0.6641, - "step": 74515 - }, - { - "epoch": 1.91, - "learning_rate": 6.161920282353214e-07, - "loss": 0.5244, - "step": 74516 - }, - { - "epoch": 1.91, - "learning_rate": 6.161664771273272e-07, - "loss": 0.8438, - "step": 74517 - }, - { - "epoch": 1.91, - "learning_rate": 6.161409263132167e-07, - "loss": 0.5356, - "step": 74518 - }, - { - "epoch": 1.91, - "learning_rate": 6.16115375793009e-07, - "loss": 0.7188, - "step": 74519 - }, - { - "epoch": 1.91, - "learning_rate": 6.160898255667244e-07, - "loss": 0.5474, - "step": 74520 - }, - { - "epoch": 1.91, - "learning_rate": 6.160642756343819e-07, - "loss": 0.7139, - "step": 74521 - }, - { - "epoch": 1.91, - "learning_rate": 6.160387259960016e-07, - "loss": 0.6416, - "step": 74522 - }, - { - "epoch": 1.91, - "learning_rate": 6.160131766516026e-07, - "loss": 0.5002, - "step": 74523 - }, - { - "epoch": 1.91, - "learning_rate": 6.159876276012048e-07, - "loss": 0.3545, - "step": 74524 - }, - { - "epoch": 1.91, - "learning_rate": 6.159620788448275e-07, - "loss": 0.5947, - "step": 74525 - }, - { - "epoch": 1.91, - "learning_rate": 6.159365303824905e-07, - "loss": 0.5635, - "step": 74526 - }, - { - "epoch": 1.91, - "learning_rate": 6.159109822142135e-07, - "loss": 0.6934, - "step": 74527 - }, - { - "epoch": 1.91, - "learning_rate": 6.158854343400155e-07, - "loss": 0.6235, - "step": 74528 - }, - { - "epoch": 1.91, - "learning_rate": 6.158598867599163e-07, - "loss": 0.583, - "step": 74529 - }, - { - "epoch": 1.91, - "learning_rate": 6.158343394739356e-07, - "loss": 0.5117, - "step": 74530 - }, - { - "epoch": 1.91, - "learning_rate": 6.158087924820927e-07, - "loss": 0.6562, - "step": 74531 - }, - { - "epoch": 1.91, - "learning_rate": 6.157832457844076e-07, - "loss": 0.4722, - "step": 74532 - }, - { - "epoch": 1.91, - "learning_rate": 6.157576993808992e-07, - "loss": 0.7168, - "step": 74533 - }, - { - "epoch": 1.91, - "learning_rate": 6.15732153271588e-07, - "loss": 0.6357, - "step": 74534 - }, - { - "epoch": 1.91, - "learning_rate": 6.157066074564927e-07, - "loss": 0.6602, - "step": 74535 - }, - { - "epoch": 1.91, - "learning_rate": 6.156810619356332e-07, - "loss": 0.4004, - "step": 74536 - }, - { - "epoch": 1.91, - "learning_rate": 6.156555167090293e-07, - "loss": 0.6108, - "step": 74537 - }, - { - "epoch": 1.91, - "learning_rate": 6.156299717767002e-07, - "loss": 0.5522, - "step": 74538 - }, - { - "epoch": 1.91, - "learning_rate": 6.156044271386655e-07, - "loss": 0.6855, - "step": 74539 - }, - { - "epoch": 1.91, - "learning_rate": 6.155788827949446e-07, - "loss": 0.5327, - "step": 74540 - }, - { - "epoch": 1.91, - "learning_rate": 6.155533387455575e-07, - "loss": 0.749, - "step": 74541 - }, - { - "epoch": 1.91, - "learning_rate": 6.155277949905233e-07, - "loss": 0.6299, - "step": 74542 - }, - { - "epoch": 1.91, - "learning_rate": 6.15502251529862e-07, - "loss": 0.6528, - "step": 74543 - }, - { - "epoch": 1.91, - "learning_rate": 6.154767083635929e-07, - "loss": 0.4307, - "step": 74544 - }, - { - "epoch": 1.91, - "learning_rate": 6.154511654917356e-07, - "loss": 0.4058, - "step": 74545 - }, - { - "epoch": 1.91, - "learning_rate": 6.154256229143098e-07, - "loss": 0.5269, - "step": 74546 - }, - { - "epoch": 1.91, - "learning_rate": 6.154000806313351e-07, - "loss": 0.7178, - "step": 74547 - }, - { - "epoch": 1.91, - "learning_rate": 6.153745386428304e-07, - "loss": 0.4888, - "step": 74548 - }, - { - "epoch": 1.91, - "learning_rate": 6.153489969488159e-07, - "loss": 0.5731, - "step": 74549 - }, - { - "epoch": 1.91, - "learning_rate": 6.153234555493109e-07, - "loss": 0.8184, - "step": 74550 - }, - { - "epoch": 1.91, - "learning_rate": 6.152979144443352e-07, - "loss": 0.707, - "step": 74551 - }, - { - "epoch": 1.91, - "learning_rate": 6.15272373633908e-07, - "loss": 0.709, - "step": 74552 - }, - { - "epoch": 1.91, - "learning_rate": 6.152468331180493e-07, - "loss": 0.5698, - "step": 74553 - }, - { - "epoch": 1.91, - "learning_rate": 6.152212928967781e-07, - "loss": 0.6719, - "step": 74554 - }, - { - "epoch": 1.91, - "learning_rate": 6.151957529701146e-07, - "loss": 0.6201, - "step": 74555 - }, - { - "epoch": 1.91, - "learning_rate": 6.151702133380776e-07, - "loss": 0.7236, - "step": 74556 - }, - { - "epoch": 1.91, - "learning_rate": 6.151446740006877e-07, - "loss": 0.6116, - "step": 74557 - }, - { - "epoch": 1.91, - "learning_rate": 6.151191349579636e-07, - "loss": 0.623, - "step": 74558 - }, - { - "epoch": 1.91, - "learning_rate": 6.150935962099247e-07, - "loss": 0.7568, - "step": 74559 - }, - { - "epoch": 1.91, - "learning_rate": 6.150680577565913e-07, - "loss": 0.6826, - "step": 74560 - }, - { - "epoch": 1.91, - "learning_rate": 6.150425195979824e-07, - "loss": 0.6016, - "step": 74561 - }, - { - "epoch": 1.91, - "learning_rate": 6.150169817341179e-07, - "loss": 0.6719, - "step": 74562 - }, - { - "epoch": 1.91, - "learning_rate": 6.149914441650172e-07, - "loss": 0.6079, - "step": 74563 - }, - { - "epoch": 1.91, - "learning_rate": 6.149659068906996e-07, - "loss": 0.4456, - "step": 74564 - }, - { - "epoch": 1.91, - "learning_rate": 6.14940369911185e-07, - "loss": 0.8311, - "step": 74565 - }, - { - "epoch": 1.91, - "learning_rate": 6.149148332264929e-07, - "loss": 0.7607, - "step": 74566 - }, - { - "epoch": 1.91, - "learning_rate": 6.14889296836643e-07, - "loss": 0.5437, - "step": 74567 - }, - { - "epoch": 1.91, - "learning_rate": 6.148637607416546e-07, - "loss": 0.6111, - "step": 74568 - }, - { - "epoch": 1.91, - "learning_rate": 6.148382249415471e-07, - "loss": 0.5928, - "step": 74569 - }, - { - "epoch": 1.91, - "learning_rate": 6.148126894363403e-07, - "loss": 0.6182, - "step": 74570 - }, - { - "epoch": 1.91, - "learning_rate": 6.147871542260536e-07, - "loss": 0.5952, - "step": 74571 - }, - { - "epoch": 1.91, - "learning_rate": 6.147616193107071e-07, - "loss": 0.6543, - "step": 74572 - }, - { - "epoch": 1.91, - "learning_rate": 6.147360846903193e-07, - "loss": 0.5562, - "step": 74573 - }, - { - "epoch": 1.91, - "learning_rate": 6.147105503649109e-07, - "loss": 0.5129, - "step": 74574 - }, - { - "epoch": 1.91, - "learning_rate": 6.146850163345005e-07, - "loss": 0.6699, - "step": 74575 - }, - { - "epoch": 1.91, - "learning_rate": 6.146594825991084e-07, - "loss": 0.6045, - "step": 74576 - }, - { - "epoch": 1.91, - "learning_rate": 6.14633949158754e-07, - "loss": 0.6338, - "step": 74577 - }, - { - "epoch": 1.91, - "learning_rate": 6.146084160134561e-07, - "loss": 0.7754, - "step": 74578 - }, - { - "epoch": 1.91, - "learning_rate": 6.145828831632353e-07, - "loss": 0.6855, - "step": 74579 - }, - { - "epoch": 1.91, - "learning_rate": 6.145573506081106e-07, - "loss": 0.6143, - "step": 74580 - }, - { - "epoch": 1.91, - "learning_rate": 6.145318183481012e-07, - "loss": 0.75, - "step": 74581 - }, - { - "epoch": 1.91, - "learning_rate": 6.145062863832273e-07, - "loss": 0.4277, - "step": 74582 - }, - { - "epoch": 1.91, - "learning_rate": 6.144807547135082e-07, - "loss": 0.4888, - "step": 74583 - }, - { - "epoch": 1.91, - "learning_rate": 6.144552233389635e-07, - "loss": 0.6411, - "step": 74584 - }, - { - "epoch": 1.91, - "learning_rate": 6.144296922596127e-07, - "loss": 0.6216, - "step": 74585 - }, - { - "epoch": 1.91, - "learning_rate": 6.144041614754753e-07, - "loss": 0.7012, - "step": 74586 - }, - { - "epoch": 1.91, - "learning_rate": 6.143786309865712e-07, - "loss": 0.4536, - "step": 74587 - }, - { - "epoch": 1.91, - "learning_rate": 6.143531007929193e-07, - "loss": 0.6313, - "step": 74588 - }, - { - "epoch": 1.91, - "learning_rate": 6.143275708945397e-07, - "loss": 0.6538, - "step": 74589 - }, - { - "epoch": 1.91, - "learning_rate": 6.143020412914514e-07, - "loss": 0.6367, - "step": 74590 - }, - { - "epoch": 1.91, - "learning_rate": 6.142765119836748e-07, - "loss": 0.5945, - "step": 74591 - }, - { - "epoch": 1.91, - "learning_rate": 6.142509829712286e-07, - "loss": 0.6621, - "step": 74592 - }, - { - "epoch": 1.91, - "learning_rate": 6.142254542541327e-07, - "loss": 0.7207, - "step": 74593 - }, - { - "epoch": 1.91, - "learning_rate": 6.141999258324066e-07, - "loss": 0.5818, - "step": 74594 - }, - { - "epoch": 1.91, - "learning_rate": 6.1417439770607e-07, - "loss": 0.6499, - "step": 74595 - }, - { - "epoch": 1.91, - "learning_rate": 6.141488698751423e-07, - "loss": 0.6284, - "step": 74596 - }, - { - "epoch": 1.91, - "learning_rate": 6.141233423396434e-07, - "loss": 0.666, - "step": 74597 - }, - { - "epoch": 1.91, - "learning_rate": 6.140978150995921e-07, - "loss": 0.7207, - "step": 74598 - }, - { - "epoch": 1.91, - "learning_rate": 6.140722881550084e-07, - "loss": 0.6499, - "step": 74599 - }, - { - "epoch": 1.91, - "learning_rate": 6.140467615059118e-07, - "loss": 0.2649, - "step": 74600 - }, - { - "epoch": 1.91, - "learning_rate": 6.14021235152322e-07, - "loss": 0.6055, - "step": 74601 - }, - { - "epoch": 1.91, - "learning_rate": 6.139957090942581e-07, - "loss": 0.4177, - "step": 74602 - }, - { - "epoch": 1.91, - "learning_rate": 6.139701833317403e-07, - "loss": 0.6289, - "step": 74603 - }, - { - "epoch": 1.91, - "learning_rate": 6.139446578647873e-07, - "loss": 0.4768, - "step": 74604 - }, - { - "epoch": 1.91, - "learning_rate": 6.139191326934196e-07, - "loss": 0.5198, - "step": 74605 - }, - { - "epoch": 1.91, - "learning_rate": 6.13893607817656e-07, - "loss": 0.5645, - "step": 74606 - }, - { - "epoch": 1.91, - "learning_rate": 6.138680832375167e-07, - "loss": 0.7021, - "step": 74607 - }, - { - "epoch": 1.91, - "learning_rate": 6.138425589530205e-07, - "loss": 0.3096, - "step": 74608 - }, - { - "epoch": 1.91, - "learning_rate": 6.138170349641874e-07, - "loss": 0.8047, - "step": 74609 - }, - { - "epoch": 1.91, - "learning_rate": 6.137915112710367e-07, - "loss": 0.6899, - "step": 74610 - }, - { - "epoch": 1.91, - "learning_rate": 6.137659878735881e-07, - "loss": 0.5107, - "step": 74611 - }, - { - "epoch": 1.91, - "learning_rate": 6.137404647718613e-07, - "loss": 0.6782, - "step": 74612 - }, - { - "epoch": 1.91, - "learning_rate": 6.137149419658754e-07, - "loss": 0.6537, - "step": 74613 - }, - { - "epoch": 1.91, - "learning_rate": 6.136894194556505e-07, - "loss": 0.6895, - "step": 74614 - }, - { - "epoch": 1.91, - "learning_rate": 6.136638972412055e-07, - "loss": 0.8135, - "step": 74615 - }, - { - "epoch": 1.91, - "learning_rate": 6.136383753225605e-07, - "loss": 0.6689, - "step": 74616 - }, - { - "epoch": 1.91, - "learning_rate": 6.136128536997352e-07, - "loss": 0.5679, - "step": 74617 - }, - { - "epoch": 1.91, - "learning_rate": 6.135873323727485e-07, - "loss": 0.5752, - "step": 74618 - }, - { - "epoch": 1.91, - "learning_rate": 6.1356181134162e-07, - "loss": 0.6133, - "step": 74619 - }, - { - "epoch": 1.91, - "learning_rate": 6.135362906063697e-07, - "loss": 0.7686, - "step": 74620 - }, - { - "epoch": 1.91, - "learning_rate": 6.135107701670166e-07, - "loss": 0.6121, - "step": 74621 - }, - { - "epoch": 1.91, - "learning_rate": 6.134852500235808e-07, - "loss": 0.6855, - "step": 74622 - }, - { - "epoch": 1.91, - "learning_rate": 6.134597301760813e-07, - "loss": 0.7646, - "step": 74623 - }, - { - "epoch": 1.91, - "learning_rate": 6.134342106245381e-07, - "loss": 0.4302, - "step": 74624 - }, - { - "epoch": 1.91, - "learning_rate": 6.134086913689704e-07, - "loss": 0.6631, - "step": 74625 - }, - { - "epoch": 1.91, - "learning_rate": 6.133831724093981e-07, - "loss": 0.6382, - "step": 74626 - }, - { - "epoch": 1.91, - "learning_rate": 6.133576537458407e-07, - "loss": 0.6128, - "step": 74627 - }, - { - "epoch": 1.91, - "learning_rate": 6.133321353783172e-07, - "loss": 0.6069, - "step": 74628 - }, - { - "epoch": 1.91, - "learning_rate": 6.133066173068477e-07, - "loss": 0.6768, - "step": 74629 - }, - { - "epoch": 1.91, - "learning_rate": 6.132810995314513e-07, - "loss": 0.79, - "step": 74630 - }, - { - "epoch": 1.91, - "learning_rate": 6.132555820521482e-07, - "loss": 0.6904, - "step": 74631 - }, - { - "epoch": 1.91, - "learning_rate": 6.13230064868957e-07, - "loss": 0.7275, - "step": 74632 - }, - { - "epoch": 1.91, - "learning_rate": 6.132045479818982e-07, - "loss": 0.5776, - "step": 74633 - }, - { - "epoch": 1.91, - "learning_rate": 6.131790313909904e-07, - "loss": 0.5234, - "step": 74634 - }, - { - "epoch": 1.91, - "learning_rate": 6.13153515096254e-07, - "loss": 0.6108, - "step": 74635 - }, - { - "epoch": 1.91, - "learning_rate": 6.131279990977081e-07, - "loss": 0.501, - "step": 74636 - }, - { - "epoch": 1.91, - "learning_rate": 6.131024833953727e-07, - "loss": 0.6274, - "step": 74637 - }, - { - "epoch": 1.91, - "learning_rate": 6.130769679892665e-07, - "loss": 0.5684, - "step": 74638 - }, - { - "epoch": 1.91, - "learning_rate": 6.130514528794095e-07, - "loss": 0.6016, - "step": 74639 - }, - { - "epoch": 1.91, - "learning_rate": 6.130259380658212e-07, - "loss": 0.6221, - "step": 74640 - }, - { - "epoch": 1.91, - "learning_rate": 6.130004235485211e-07, - "loss": 0.5249, - "step": 74641 - }, - { - "epoch": 1.91, - "learning_rate": 6.129749093275287e-07, - "loss": 0.5747, - "step": 74642 - }, - { - "epoch": 1.91, - "learning_rate": 6.129493954028639e-07, - "loss": 0.5337, - "step": 74643 - }, - { - "epoch": 1.91, - "learning_rate": 6.129238817745457e-07, - "loss": 0.6367, - "step": 74644 - }, - { - "epoch": 1.91, - "learning_rate": 6.128983684425941e-07, - "loss": 0.6533, - "step": 74645 - }, - { - "epoch": 1.91, - "learning_rate": 6.128728554070281e-07, - "loss": 0.6069, - "step": 74646 - }, - { - "epoch": 1.91, - "learning_rate": 6.128473426678681e-07, - "loss": 0.5811, - "step": 74647 - }, - { - "epoch": 1.91, - "learning_rate": 6.128218302251329e-07, - "loss": 0.4968, - "step": 74648 - }, - { - "epoch": 1.91, - "learning_rate": 6.127963180788419e-07, - "loss": 0.7324, - "step": 74649 - }, - { - "epoch": 1.91, - "learning_rate": 6.127708062290152e-07, - "loss": 0.6758, - "step": 74650 - }, - { - "epoch": 1.91, - "learning_rate": 6.127452946756719e-07, - "loss": 0.7373, - "step": 74651 - }, - { - "epoch": 1.91, - "learning_rate": 6.12719783418832e-07, - "loss": 0.7666, - "step": 74652 - }, - { - "epoch": 1.91, - "learning_rate": 6.126942724585147e-07, - "loss": 0.5933, - "step": 74653 - }, - { - "epoch": 1.91, - "learning_rate": 6.126687617947393e-07, - "loss": 0.6484, - "step": 74654 - }, - { - "epoch": 1.91, - "learning_rate": 6.12643251427526e-07, - "loss": 0.5874, - "step": 74655 - }, - { - "epoch": 1.91, - "learning_rate": 6.126177413568935e-07, - "loss": 0.7764, - "step": 74656 - }, - { - "epoch": 1.91, - "learning_rate": 6.125922315828624e-07, - "loss": 0.5664, - "step": 74657 - }, - { - "epoch": 1.91, - "learning_rate": 6.125667221054513e-07, - "loss": 0.6245, - "step": 74658 - }, - { - "epoch": 1.91, - "learning_rate": 6.125412129246799e-07, - "loss": 0.6455, - "step": 74659 - }, - { - "epoch": 1.91, - "learning_rate": 6.12515704040568e-07, - "loss": 0.4595, - "step": 74660 - }, - { - "epoch": 1.91, - "learning_rate": 6.124901954531349e-07, - "loss": 0.6265, - "step": 74661 - }, - { - "epoch": 1.91, - "learning_rate": 6.124646871624004e-07, - "loss": 0.5776, - "step": 74662 - }, - { - "epoch": 1.91, - "learning_rate": 6.124391791683836e-07, - "loss": 0.5884, - "step": 74663 - }, - { - "epoch": 1.91, - "learning_rate": 6.124136714711046e-07, - "loss": 0.5215, - "step": 74664 - }, - { - "epoch": 1.91, - "learning_rate": 6.123881640705823e-07, - "loss": 0.6055, - "step": 74665 - }, - { - "epoch": 1.91, - "learning_rate": 6.12362656966837e-07, - "loss": 0.6523, - "step": 74666 - }, - { - "epoch": 1.91, - "learning_rate": 6.123371501598879e-07, - "loss": 0.7173, - "step": 74667 - }, - { - "epoch": 1.91, - "learning_rate": 6.123116436497539e-07, - "loss": 0.4802, - "step": 74668 - }, - { - "epoch": 1.91, - "learning_rate": 6.122861374364554e-07, - "loss": 0.7822, - "step": 74669 - }, - { - "epoch": 1.91, - "learning_rate": 6.122606315200114e-07, - "loss": 0.6826, - "step": 74670 - }, - { - "epoch": 1.91, - "learning_rate": 6.122351259004415e-07, - "loss": 0.6279, - "step": 74671 - }, - { - "epoch": 1.91, - "learning_rate": 6.122096205777656e-07, - "loss": 0.5889, - "step": 74672 - }, - { - "epoch": 1.91, - "learning_rate": 6.121841155520027e-07, - "loss": 0.5635, - "step": 74673 - }, - { - "epoch": 1.91, - "learning_rate": 6.121586108231728e-07, - "loss": 0.7285, - "step": 74674 - }, - { - "epoch": 1.91, - "learning_rate": 6.12133106391295e-07, - "loss": 0.6914, - "step": 74675 - }, - { - "epoch": 1.91, - "learning_rate": 6.121076022563892e-07, - "loss": 0.7104, - "step": 74676 - }, - { - "epoch": 1.91, - "learning_rate": 6.120820984184751e-07, - "loss": 0.5122, - "step": 74677 - }, - { - "epoch": 1.91, - "learning_rate": 6.120565948775714e-07, - "loss": 0.5684, - "step": 74678 - }, - { - "epoch": 1.91, - "learning_rate": 6.120310916336983e-07, - "loss": 0.7051, - "step": 74679 - }, - { - "epoch": 1.91, - "learning_rate": 6.120055886868751e-07, - "loss": 0.6777, - "step": 74680 - }, - { - "epoch": 1.91, - "learning_rate": 6.119800860371214e-07, - "loss": 0.6372, - "step": 74681 - }, - { - "epoch": 1.91, - "learning_rate": 6.119545836844566e-07, - "loss": 0.5859, - "step": 74682 - }, - { - "epoch": 1.91, - "learning_rate": 6.119290816289006e-07, - "loss": 0.5942, - "step": 74683 - }, - { - "epoch": 1.91, - "learning_rate": 6.119035798704723e-07, - "loss": 0.6182, - "step": 74684 - }, - { - "epoch": 1.91, - "learning_rate": 6.118780784091919e-07, - "loss": 0.6304, - "step": 74685 - }, - { - "epoch": 1.91, - "learning_rate": 6.118525772450784e-07, - "loss": 0.5405, - "step": 74686 - }, - { - "epoch": 1.91, - "learning_rate": 6.118270763781519e-07, - "loss": 0.542, - "step": 74687 - }, - { - "epoch": 1.91, - "learning_rate": 6.118015758084314e-07, - "loss": 0.7812, - "step": 74688 - }, - { - "epoch": 1.91, - "learning_rate": 6.117760755359365e-07, - "loss": 0.6504, - "step": 74689 - }, - { - "epoch": 1.91, - "learning_rate": 6.117505755606867e-07, - "loss": 0.5674, - "step": 74690 - }, - { - "epoch": 1.91, - "learning_rate": 6.117250758827018e-07, - "loss": 0.6523, - "step": 74691 - }, - { - "epoch": 1.91, - "learning_rate": 6.11699576502001e-07, - "loss": 0.6289, - "step": 74692 - }, - { - "epoch": 1.91, - "learning_rate": 6.116740774186041e-07, - "loss": 0.6709, - "step": 74693 - }, - { - "epoch": 1.91, - "learning_rate": 6.116485786325302e-07, - "loss": 0.7002, - "step": 74694 - }, - { - "epoch": 1.91, - "learning_rate": 6.116230801437996e-07, - "loss": 0.6631, - "step": 74695 - }, - { - "epoch": 1.91, - "learning_rate": 6.115975819524311e-07, - "loss": 0.6621, - "step": 74696 - }, - { - "epoch": 1.91, - "learning_rate": 6.115720840584447e-07, - "loss": 0.7197, - "step": 74697 - }, - { - "epoch": 1.91, - "learning_rate": 6.115465864618596e-07, - "loss": 0.5146, - "step": 74698 - }, - { - "epoch": 1.91, - "learning_rate": 6.115210891626952e-07, - "loss": 0.4893, - "step": 74699 - }, - { - "epoch": 1.91, - "learning_rate": 6.114955921609715e-07, - "loss": 0.749, - "step": 74700 - }, - { - "epoch": 1.91, - "learning_rate": 6.114700954567074e-07, - "loss": 0.6108, - "step": 74701 - }, - { - "epoch": 1.91, - "learning_rate": 6.11444599049923e-07, - "loss": 0.6074, - "step": 74702 - }, - { - "epoch": 1.91, - "learning_rate": 6.114191029406376e-07, - "loss": 0.5183, - "step": 74703 - }, - { - "epoch": 1.91, - "learning_rate": 6.113936071288707e-07, - "loss": 0.5884, - "step": 74704 - }, - { - "epoch": 1.91, - "learning_rate": 6.113681116146419e-07, - "loss": 0.6689, - "step": 74705 - }, - { - "epoch": 1.91, - "learning_rate": 6.113426163979707e-07, - "loss": 0.7432, - "step": 74706 - }, - { - "epoch": 1.91, - "learning_rate": 6.113171214788768e-07, - "loss": 0.6934, - "step": 74707 - }, - { - "epoch": 1.91, - "learning_rate": 6.112916268573793e-07, - "loss": 0.5444, - "step": 74708 - }, - { - "epoch": 1.91, - "learning_rate": 6.112661325334978e-07, - "loss": 0.5913, - "step": 74709 - }, - { - "epoch": 1.91, - "learning_rate": 6.11240638507252e-07, - "loss": 0.7285, - "step": 74710 - }, - { - "epoch": 1.91, - "learning_rate": 6.112151447786614e-07, - "loss": 0.688, - "step": 74711 - }, - { - "epoch": 1.91, - "learning_rate": 6.111896513477455e-07, - "loss": 0.6709, - "step": 74712 - }, - { - "epoch": 1.91, - "learning_rate": 6.111641582145236e-07, - "loss": 0.7441, - "step": 74713 - }, - { - "epoch": 1.91, - "learning_rate": 6.111386653790157e-07, - "loss": 0.5571, - "step": 74714 - }, - { - "epoch": 1.91, - "learning_rate": 6.111131728412408e-07, - "loss": 0.7227, - "step": 74715 - }, - { - "epoch": 1.92, - "learning_rate": 6.110876806012189e-07, - "loss": 0.6592, - "step": 74716 - }, - { - "epoch": 1.92, - "learning_rate": 6.110621886589695e-07, - "loss": 0.6343, - "step": 74717 - }, - { - "epoch": 1.92, - "learning_rate": 6.110366970145115e-07, - "loss": 0.5179, - "step": 74718 - }, - { - "epoch": 1.92, - "learning_rate": 6.110112056678649e-07, - "loss": 0.5132, - "step": 74719 - }, - { - "epoch": 1.92, - "learning_rate": 6.109857146190491e-07, - "loss": 0.5815, - "step": 74720 - }, - { - "epoch": 1.92, - "learning_rate": 6.109602238680838e-07, - "loss": 0.6196, - "step": 74721 - }, - { - "epoch": 1.92, - "learning_rate": 6.109347334149881e-07, - "loss": 0.4355, - "step": 74722 - }, - { - "epoch": 1.92, - "learning_rate": 6.10909243259782e-07, - "loss": 0.6089, - "step": 74723 - }, - { - "epoch": 1.92, - "learning_rate": 6.108837534024845e-07, - "loss": 0.6904, - "step": 74724 - }, - { - "epoch": 1.92, - "learning_rate": 6.108582638431158e-07, - "loss": 0.8193, - "step": 74725 - }, - { - "epoch": 1.92, - "learning_rate": 6.10832774581695e-07, - "loss": 0.6748, - "step": 74726 - }, - { - "epoch": 1.92, - "learning_rate": 6.108072856182418e-07, - "loss": 0.689, - "step": 74727 - }, - { - "epoch": 1.92, - "learning_rate": 6.107817969527752e-07, - "loss": 0.5322, - "step": 74728 - }, - { - "epoch": 1.92, - "learning_rate": 6.107563085853153e-07, - "loss": 0.6455, - "step": 74729 - }, - { - "epoch": 1.92, - "learning_rate": 6.107308205158811e-07, - "loss": 0.6826, - "step": 74730 - }, - { - "epoch": 1.92, - "learning_rate": 6.107053327444926e-07, - "loss": 0.6104, - "step": 74731 - }, - { - "epoch": 1.92, - "learning_rate": 6.106798452711691e-07, - "loss": 0.7192, - "step": 74732 - }, - { - "epoch": 1.92, - "learning_rate": 6.106543580959303e-07, - "loss": 0.5354, - "step": 74733 - }, - { - "epoch": 1.92, - "learning_rate": 6.106288712187952e-07, - "loss": 0.6592, - "step": 74734 - }, - { - "epoch": 1.92, - "learning_rate": 6.10603384639784e-07, - "loss": 0.7383, - "step": 74735 - }, - { - "epoch": 1.92, - "learning_rate": 6.105778983589156e-07, - "loss": 0.6768, - "step": 74736 - }, - { - "epoch": 1.92, - "learning_rate": 6.105524123762102e-07, - "loss": 0.7744, - "step": 74737 - }, - { - "epoch": 1.92, - "learning_rate": 6.105269266916869e-07, - "loss": 0.5527, - "step": 74738 - }, - { - "epoch": 1.92, - "learning_rate": 6.105014413053649e-07, - "loss": 0.6226, - "step": 74739 - }, - { - "epoch": 1.92, - "learning_rate": 6.104759562172641e-07, - "loss": 0.6846, - "step": 74740 - }, - { - "epoch": 1.92, - "learning_rate": 6.10450471427404e-07, - "loss": 0.6479, - "step": 74741 - }, - { - "epoch": 1.92, - "learning_rate": 6.10424986935804e-07, - "loss": 0.467, - "step": 74742 - }, - { - "epoch": 1.92, - "learning_rate": 6.10399502742484e-07, - "loss": 0.5811, - "step": 74743 - }, - { - "epoch": 1.92, - "learning_rate": 6.103740188474626e-07, - "loss": 0.9297, - "step": 74744 - }, - { - "epoch": 1.92, - "learning_rate": 6.103485352507604e-07, - "loss": 0.6401, - "step": 74745 - }, - { - "epoch": 1.92, - "learning_rate": 6.103230519523961e-07, - "loss": 0.5288, - "step": 74746 - }, - { - "epoch": 1.92, - "learning_rate": 6.1029756895239e-07, - "loss": 0.5596, - "step": 74747 - }, - { - "epoch": 1.92, - "learning_rate": 6.102720862507608e-07, - "loss": 0.8369, - "step": 74748 - }, - { - "epoch": 1.92, - "learning_rate": 6.102466038475282e-07, - "loss": 0.7158, - "step": 74749 - }, - { - "epoch": 1.92, - "learning_rate": 6.10221121742712e-07, - "loss": 0.6309, - "step": 74750 - }, - { - "epoch": 1.92, - "learning_rate": 6.101956399363315e-07, - "loss": 0.7676, - "step": 74751 - }, - { - "epoch": 1.92, - "learning_rate": 6.101701584284062e-07, - "loss": 0.6992, - "step": 74752 - }, - { - "epoch": 1.92, - "learning_rate": 6.101446772189557e-07, - "loss": 0.749, - "step": 74753 - }, - { - "epoch": 1.92, - "learning_rate": 6.101191963079998e-07, - "loss": 0.6973, - "step": 74754 - }, - { - "epoch": 1.92, - "learning_rate": 6.100937156955574e-07, - "loss": 0.5386, - "step": 74755 - }, - { - "epoch": 1.92, - "learning_rate": 6.100682353816484e-07, - "loss": 0.7705, - "step": 74756 - }, - { - "epoch": 1.92, - "learning_rate": 6.100427553662926e-07, - "loss": 0.4871, - "step": 74757 - }, - { - "epoch": 1.92, - "learning_rate": 6.100172756495085e-07, - "loss": 0.7148, - "step": 74758 - }, - { - "epoch": 1.92, - "learning_rate": 6.099917962313167e-07, - "loss": 0.7725, - "step": 74759 - }, - { - "epoch": 1.92, - "learning_rate": 6.099663171117362e-07, - "loss": 0.5889, - "step": 74760 - }, - { - "epoch": 1.92, - "learning_rate": 6.099408382907862e-07, - "loss": 0.5815, - "step": 74761 - }, - { - "epoch": 1.92, - "learning_rate": 6.099153597684868e-07, - "loss": 0.6504, - "step": 74762 - }, - { - "epoch": 1.92, - "learning_rate": 6.098898815448572e-07, - "loss": 0.5337, - "step": 74763 - }, - { - "epoch": 1.92, - "learning_rate": 6.098644036199171e-07, - "loss": 0.6743, - "step": 74764 - }, - { - "epoch": 1.92, - "learning_rate": 6.098389259936857e-07, - "loss": 0.7256, - "step": 74765 - }, - { - "epoch": 1.92, - "learning_rate": 6.098134486661829e-07, - "loss": 0.7725, - "step": 74766 - }, - { - "epoch": 1.92, - "learning_rate": 6.097879716374281e-07, - "loss": 0.7188, - "step": 74767 - }, - { - "epoch": 1.92, - "learning_rate": 6.097624949074404e-07, - "loss": 0.4939, - "step": 74768 - }, - { - "epoch": 1.92, - "learning_rate": 6.097370184762398e-07, - "loss": 0.4236, - "step": 74769 - }, - { - "epoch": 1.92, - "learning_rate": 6.097115423438455e-07, - "loss": 0.5908, - "step": 74770 - }, - { - "epoch": 1.92, - "learning_rate": 6.096860665102772e-07, - "loss": 0.603, - "step": 74771 - }, - { - "epoch": 1.92, - "learning_rate": 6.096605909755543e-07, - "loss": 0.8271, - "step": 74772 - }, - { - "epoch": 1.92, - "learning_rate": 6.096351157396964e-07, - "loss": 0.6318, - "step": 74773 - }, - { - "epoch": 1.92, - "learning_rate": 6.096096408027227e-07, - "loss": 0.7021, - "step": 74774 - }, - { - "epoch": 1.92, - "learning_rate": 6.095841661646533e-07, - "loss": 0.667, - "step": 74775 - }, - { - "epoch": 1.92, - "learning_rate": 6.095586918255074e-07, - "loss": 0.4966, - "step": 74776 - }, - { - "epoch": 1.92, - "learning_rate": 6.095332177853041e-07, - "loss": 0.6504, - "step": 74777 - }, - { - "epoch": 1.92, - "learning_rate": 6.095077440440635e-07, - "loss": 0.5674, - "step": 74778 - }, - { - "epoch": 1.92, - "learning_rate": 6.09482270601805e-07, - "loss": 0.47, - "step": 74779 - }, - { - "epoch": 1.92, - "learning_rate": 6.094567974585475e-07, - "loss": 0.6553, - "step": 74780 - }, - { - "epoch": 1.92, - "learning_rate": 6.094313246143112e-07, - "loss": 0.6885, - "step": 74781 - }, - { - "epoch": 1.92, - "learning_rate": 6.094058520691154e-07, - "loss": 0.7305, - "step": 74782 - }, - { - "epoch": 1.92, - "learning_rate": 6.093803798229797e-07, - "loss": 0.6343, - "step": 74783 - }, - { - "epoch": 1.92, - "learning_rate": 6.093549078759232e-07, - "loss": 0.5203, - "step": 74784 - }, - { - "epoch": 1.92, - "learning_rate": 6.093294362279659e-07, - "loss": 0.4421, - "step": 74785 - }, - { - "epoch": 1.92, - "learning_rate": 6.093039648791273e-07, - "loss": 0.6562, - "step": 74786 - }, - { - "epoch": 1.92, - "learning_rate": 6.092784938294261e-07, - "loss": 0.5613, - "step": 74787 - }, - { - "epoch": 1.92, - "learning_rate": 6.092530230788829e-07, - "loss": 0.5244, - "step": 74788 - }, - { - "epoch": 1.92, - "learning_rate": 6.092275526275163e-07, - "loss": 0.5005, - "step": 74789 - }, - { - "epoch": 1.92, - "learning_rate": 6.092020824753466e-07, - "loss": 0.5327, - "step": 74790 - }, - { - "epoch": 1.92, - "learning_rate": 6.091766126223925e-07, - "loss": 0.4995, - "step": 74791 - }, - { - "epoch": 1.92, - "learning_rate": 6.091511430686742e-07, - "loss": 0.7637, - "step": 74792 - }, - { - "epoch": 1.92, - "learning_rate": 6.091256738142106e-07, - "loss": 0.7295, - "step": 74793 - }, - { - "epoch": 1.92, - "learning_rate": 6.091002048590219e-07, - "loss": 0.7051, - "step": 74794 - }, - { - "epoch": 1.92, - "learning_rate": 6.090747362031267e-07, - "loss": 0.5503, - "step": 74795 - }, - { - "epoch": 1.92, - "learning_rate": 6.090492678465459e-07, - "loss": 0.7666, - "step": 74796 - }, - { - "epoch": 1.92, - "learning_rate": 6.090237997892973e-07, - "loss": 0.7302, - "step": 74797 - }, - { - "epoch": 1.92, - "learning_rate": 6.089983320314015e-07, - "loss": 0.8047, - "step": 74798 - }, - { - "epoch": 1.92, - "learning_rate": 6.089728645728774e-07, - "loss": 0.6143, - "step": 74799 - }, - { - "epoch": 1.92, - "learning_rate": 6.089473974137451e-07, - "loss": 0.5439, - "step": 74800 - }, - { - "epoch": 1.92, - "learning_rate": 6.089219305540235e-07, - "loss": 0.7725, - "step": 74801 - }, - { - "epoch": 1.92, - "learning_rate": 6.088964639937326e-07, - "loss": 0.6865, - "step": 74802 - }, - { - "epoch": 1.92, - "learning_rate": 6.088709977328916e-07, - "loss": 0.6494, - "step": 74803 - }, - { - "epoch": 1.92, - "learning_rate": 6.088455317715202e-07, - "loss": 0.5928, - "step": 74804 - }, - { - "epoch": 1.92, - "learning_rate": 6.088200661096377e-07, - "loss": 0.4731, - "step": 74805 - }, - { - "epoch": 1.92, - "learning_rate": 6.08794600747264e-07, - "loss": 0.6538, - "step": 74806 - }, - { - "epoch": 1.92, - "learning_rate": 6.08769135684418e-07, - "loss": 0.6094, - "step": 74807 - }, - { - "epoch": 1.92, - "learning_rate": 6.087436709211194e-07, - "loss": 0.8145, - "step": 74808 - }, - { - "epoch": 1.92, - "learning_rate": 6.08718206457388e-07, - "loss": 0.668, - "step": 74809 - }, - { - "epoch": 1.92, - "learning_rate": 6.086927422932428e-07, - "loss": 0.6313, - "step": 74810 - }, - { - "epoch": 1.92, - "learning_rate": 6.086672784287039e-07, - "loss": 0.6504, - "step": 74811 - }, - { - "epoch": 1.92, - "learning_rate": 6.086418148637902e-07, - "loss": 0.6904, - "step": 74812 - }, - { - "epoch": 1.92, - "learning_rate": 6.086163515985216e-07, - "loss": 0.6323, - "step": 74813 - }, - { - "epoch": 1.92, - "learning_rate": 6.085908886329173e-07, - "loss": 0.5898, - "step": 74814 - }, - { - "epoch": 1.92, - "learning_rate": 6.085654259669972e-07, - "loss": 0.4922, - "step": 74815 - }, - { - "epoch": 1.92, - "learning_rate": 6.085399636007808e-07, - "loss": 0.5244, - "step": 74816 - }, - { - "epoch": 1.92, - "learning_rate": 6.08514501534287e-07, - "loss": 0.6914, - "step": 74817 - }, - { - "epoch": 1.92, - "learning_rate": 6.084890397675355e-07, - "loss": 0.4858, - "step": 74818 - }, - { - "epoch": 1.92, - "learning_rate": 6.084635783005461e-07, - "loss": 0.6372, - "step": 74819 - }, - { - "epoch": 1.92, - "learning_rate": 6.084381171333382e-07, - "loss": 0.498, - "step": 74820 - }, - { - "epoch": 1.92, - "learning_rate": 6.084126562659311e-07, - "loss": 0.749, - "step": 74821 - }, - { - "epoch": 1.92, - "learning_rate": 6.083871956983444e-07, - "loss": 0.6196, - "step": 74822 - }, - { - "epoch": 1.92, - "learning_rate": 6.083617354305976e-07, - "loss": 0.6382, - "step": 74823 - }, - { - "epoch": 1.92, - "learning_rate": 6.083362754627104e-07, - "loss": 0.6543, - "step": 74824 - }, - { - "epoch": 1.92, - "learning_rate": 6.08310815794702e-07, - "loss": 0.489, - "step": 74825 - }, - { - "epoch": 1.92, - "learning_rate": 6.082853564265923e-07, - "loss": 0.5244, - "step": 74826 - }, - { - "epoch": 1.92, - "learning_rate": 6.082598973584001e-07, - "loss": 0.7119, - "step": 74827 - }, - { - "epoch": 1.92, - "learning_rate": 6.082344385901455e-07, - "loss": 0.5591, - "step": 74828 - }, - { - "epoch": 1.92, - "learning_rate": 6.082089801218475e-07, - "loss": 0.5029, - "step": 74829 - }, - { - "epoch": 1.92, - "learning_rate": 6.081835219535261e-07, - "loss": 0.542, - "step": 74830 - }, - { - "epoch": 1.92, - "learning_rate": 6.081580640852003e-07, - "loss": 0.6099, - "step": 74831 - }, - { - "epoch": 1.92, - "learning_rate": 6.081326065168902e-07, - "loss": 0.4808, - "step": 74832 - }, - { - "epoch": 1.92, - "learning_rate": 6.081071492486147e-07, - "loss": 0.7852, - "step": 74833 - }, - { - "epoch": 1.92, - "learning_rate": 6.080816922803936e-07, - "loss": 0.7891, - "step": 74834 - }, - { - "epoch": 1.92, - "learning_rate": 6.080562356122465e-07, - "loss": 0.5098, - "step": 74835 - }, - { - "epoch": 1.92, - "learning_rate": 6.080307792441928e-07, - "loss": 0.5112, - "step": 74836 - }, - { - "epoch": 1.92, - "learning_rate": 6.080053231762515e-07, - "loss": 0.5918, - "step": 74837 - }, - { - "epoch": 1.92, - "learning_rate": 6.079798674084427e-07, - "loss": 0.3398, - "step": 74838 - }, - { - "epoch": 1.92, - "learning_rate": 6.079544119407856e-07, - "loss": 0.6626, - "step": 74839 - }, - { - "epoch": 1.92, - "learning_rate": 6.079289567732999e-07, - "loss": 0.4956, - "step": 74840 - }, - { - "epoch": 1.92, - "learning_rate": 6.079035019060048e-07, - "loss": 0.6445, - "step": 74841 - }, - { - "epoch": 1.92, - "learning_rate": 6.078780473389202e-07, - "loss": 0.6738, - "step": 74842 - }, - { - "epoch": 1.92, - "learning_rate": 6.07852593072065e-07, - "loss": 0.6924, - "step": 74843 - }, - { - "epoch": 1.92, - "learning_rate": 6.078271391054594e-07, - "loss": 0.7725, - "step": 74844 - }, - { - "epoch": 1.92, - "learning_rate": 6.078016854391223e-07, - "loss": 0.5972, - "step": 74845 - }, - { - "epoch": 1.92, - "learning_rate": 6.077762320730737e-07, - "loss": 0.5024, - "step": 74846 - }, - { - "epoch": 1.92, - "learning_rate": 6.077507790073328e-07, - "loss": 0.6113, - "step": 74847 - }, - { - "epoch": 1.92, - "learning_rate": 6.077253262419187e-07, - "loss": 0.562, - "step": 74848 - }, - { - "epoch": 1.92, - "learning_rate": 6.076998737768516e-07, - "loss": 0.5908, - "step": 74849 - }, - { - "epoch": 1.92, - "learning_rate": 6.076744216121505e-07, - "loss": 0.5923, - "step": 74850 - }, - { - "epoch": 1.92, - "learning_rate": 6.076489697478351e-07, - "loss": 0.6289, - "step": 74851 - }, - { - "epoch": 1.92, - "learning_rate": 6.076235181839248e-07, - "loss": 0.6777, - "step": 74852 - }, - { - "epoch": 1.92, - "learning_rate": 6.075980669204392e-07, - "loss": 0.6235, - "step": 74853 - }, - { - "epoch": 1.92, - "learning_rate": 6.075726159573977e-07, - "loss": 0.7109, - "step": 74854 - }, - { - "epoch": 1.92, - "learning_rate": 6.075471652948198e-07, - "loss": 0.6484, - "step": 74855 - }, - { - "epoch": 1.92, - "learning_rate": 6.075217149327252e-07, - "loss": 0.6104, - "step": 74856 - }, - { - "epoch": 1.92, - "learning_rate": 6.074962648711331e-07, - "loss": 0.6611, - "step": 74857 - }, - { - "epoch": 1.92, - "learning_rate": 6.074708151100627e-07, - "loss": 0.4219, - "step": 74858 - }, - { - "epoch": 1.92, - "learning_rate": 6.074453656495342e-07, - "loss": 0.4839, - "step": 74859 - }, - { - "epoch": 1.92, - "learning_rate": 6.074199164895664e-07, - "loss": 0.3911, - "step": 74860 - }, - { - "epoch": 1.92, - "learning_rate": 6.073944676301794e-07, - "loss": 0.6934, - "step": 74861 - }, - { - "epoch": 1.92, - "learning_rate": 6.073690190713922e-07, - "loss": 0.6963, - "step": 74862 - }, - { - "epoch": 1.92, - "learning_rate": 6.073435708132249e-07, - "loss": 0.5229, - "step": 74863 - }, - { - "epoch": 1.92, - "learning_rate": 6.073181228556961e-07, - "loss": 0.6494, - "step": 74864 - }, - { - "epoch": 1.92, - "learning_rate": 6.072926751988259e-07, - "loss": 0.5771, - "step": 74865 - }, - { - "epoch": 1.92, - "learning_rate": 6.072672278426341e-07, - "loss": 0.833, - "step": 74866 - }, - { - "epoch": 1.92, - "learning_rate": 6.072417807871392e-07, - "loss": 0.749, - "step": 74867 - }, - { - "epoch": 1.92, - "learning_rate": 6.072163340323613e-07, - "loss": 0.7236, - "step": 74868 - }, - { - "epoch": 1.92, - "learning_rate": 6.0719088757832e-07, - "loss": 0.7002, - "step": 74869 - }, - { - "epoch": 1.92, - "learning_rate": 6.071654414250342e-07, - "loss": 0.4536, - "step": 74870 - }, - { - "epoch": 1.92, - "learning_rate": 6.071399955725241e-07, - "loss": 0.7178, - "step": 74871 - }, - { - "epoch": 1.92, - "learning_rate": 6.071145500208086e-07, - "loss": 0.79, - "step": 74872 - }, - { - "epoch": 1.92, - "learning_rate": 6.070891047699075e-07, - "loss": 0.6416, - "step": 74873 - }, - { - "epoch": 1.92, - "learning_rate": 6.070636598198401e-07, - "loss": 0.6147, - "step": 74874 - }, - { - "epoch": 1.92, - "learning_rate": 6.070382151706261e-07, - "loss": 0.6406, - "step": 74875 - }, - { - "epoch": 1.92, - "learning_rate": 6.070127708222852e-07, - "loss": 0.5264, - "step": 74876 - }, - { - "epoch": 1.92, - "learning_rate": 6.069873267748363e-07, - "loss": 0.6465, - "step": 74877 - }, - { - "epoch": 1.92, - "learning_rate": 6.06961883028299e-07, - "loss": 0.4355, - "step": 74878 - }, - { - "epoch": 1.92, - "learning_rate": 6.069364395826928e-07, - "loss": 0.5044, - "step": 74879 - }, - { - "epoch": 1.92, - "learning_rate": 6.069109964380376e-07, - "loss": 0.4756, - "step": 74880 - }, - { - "epoch": 1.92, - "learning_rate": 6.068855535943523e-07, - "loss": 0.3749, - "step": 74881 - }, - { - "epoch": 1.92, - "learning_rate": 6.068601110516569e-07, - "loss": 0.7651, - "step": 74882 - }, - { - "epoch": 1.92, - "learning_rate": 6.068346688099703e-07, - "loss": 0.6748, - "step": 74883 - }, - { - "epoch": 1.92, - "learning_rate": 6.068092268693128e-07, - "loss": 0.5942, - "step": 74884 - }, - { - "epoch": 1.92, - "learning_rate": 6.067837852297031e-07, - "loss": 0.6543, - "step": 74885 - }, - { - "epoch": 1.92, - "learning_rate": 6.067583438911614e-07, - "loss": 0.5308, - "step": 74886 - }, - { - "epoch": 1.92, - "learning_rate": 6.067329028537063e-07, - "loss": 0.5869, - "step": 74887 - }, - { - "epoch": 1.92, - "learning_rate": 6.067074621173578e-07, - "loss": 0.5957, - "step": 74888 - }, - { - "epoch": 1.92, - "learning_rate": 6.066820216821354e-07, - "loss": 0.6973, - "step": 74889 - }, - { - "epoch": 1.92, - "learning_rate": 6.066565815480585e-07, - "loss": 0.6768, - "step": 74890 - }, - { - "epoch": 1.92, - "learning_rate": 6.066311417151461e-07, - "loss": 0.5103, - "step": 74891 - }, - { - "epoch": 1.92, - "learning_rate": 6.066057021834188e-07, - "loss": 0.3967, - "step": 74892 - }, - { - "epoch": 1.92, - "learning_rate": 6.06580262952895e-07, - "loss": 0.6475, - "step": 74893 - }, - { - "epoch": 1.92, - "learning_rate": 6.065548240235948e-07, - "loss": 0.6504, - "step": 74894 - }, - { - "epoch": 1.92, - "learning_rate": 6.065293853955373e-07, - "loss": 0.6416, - "step": 74895 - }, - { - "epoch": 1.92, - "learning_rate": 6.065039470687426e-07, - "loss": 0.5503, - "step": 74896 - }, - { - "epoch": 1.92, - "learning_rate": 6.064785090432295e-07, - "loss": 0.6523, - "step": 74897 - }, - { - "epoch": 1.92, - "learning_rate": 6.064530713190174e-07, - "loss": 0.6899, - "step": 74898 - }, - { - "epoch": 1.92, - "learning_rate": 6.064276338961264e-07, - "loss": 0.479, - "step": 74899 - }, - { - "epoch": 1.92, - "learning_rate": 6.064021967745756e-07, - "loss": 0.7646, - "step": 74900 - }, - { - "epoch": 1.92, - "learning_rate": 6.063767599543846e-07, - "loss": 0.7188, - "step": 74901 - }, - { - "epoch": 1.92, - "learning_rate": 6.063513234355726e-07, - "loss": 0.5977, - "step": 74902 - }, - { - "epoch": 1.92, - "learning_rate": 6.063258872181596e-07, - "loss": 0.6396, - "step": 74903 - }, - { - "epoch": 1.92, - "learning_rate": 6.063004513021645e-07, - "loss": 0.667, - "step": 74904 - }, - { - "epoch": 1.92, - "learning_rate": 6.062750156876072e-07, - "loss": 0.6553, - "step": 74905 - }, - { - "epoch": 1.92, - "learning_rate": 6.062495803745072e-07, - "loss": 0.6646, - "step": 74906 - }, - { - "epoch": 1.92, - "learning_rate": 6.062241453628837e-07, - "loss": 0.4686, - "step": 74907 - }, - { - "epoch": 1.92, - "learning_rate": 6.06198710652756e-07, - "loss": 0.4355, - "step": 74908 - }, - { - "epoch": 1.92, - "learning_rate": 6.061732762441441e-07, - "loss": 0.707, - "step": 74909 - }, - { - "epoch": 1.92, - "learning_rate": 6.061478421370669e-07, - "loss": 0.4397, - "step": 74910 - }, - { - "epoch": 1.92, - "learning_rate": 6.061224083315443e-07, - "loss": 0.8457, - "step": 74911 - }, - { - "epoch": 1.92, - "learning_rate": 6.060969748275957e-07, - "loss": 0.6455, - "step": 74912 - }, - { - "epoch": 1.92, - "learning_rate": 6.060715416252407e-07, - "loss": 0.7529, - "step": 74913 - }, - { - "epoch": 1.92, - "learning_rate": 6.060461087244984e-07, - "loss": 0.6895, - "step": 74914 - }, - { - "epoch": 1.92, - "learning_rate": 6.060206761253886e-07, - "loss": 0.5718, - "step": 74915 - }, - { - "epoch": 1.92, - "learning_rate": 6.059952438279308e-07, - "loss": 0.7051, - "step": 74916 - }, - { - "epoch": 1.92, - "learning_rate": 6.05969811832144e-07, - "loss": 0.7302, - "step": 74917 - }, - { - "epoch": 1.92, - "learning_rate": 6.059443801380482e-07, - "loss": 0.6851, - "step": 74918 - }, - { - "epoch": 1.92, - "learning_rate": 6.059189487456624e-07, - "loss": 0.5479, - "step": 74919 - }, - { - "epoch": 1.92, - "learning_rate": 6.058935176550066e-07, - "loss": 0.6147, - "step": 74920 - }, - { - "epoch": 1.92, - "learning_rate": 6.058680868660999e-07, - "loss": 0.5042, - "step": 74921 - }, - { - "epoch": 1.92, - "learning_rate": 6.05842656378962e-07, - "loss": 0.6616, - "step": 74922 - }, - { - "epoch": 1.92, - "learning_rate": 6.058172261936124e-07, - "loss": 0.5093, - "step": 74923 - }, - { - "epoch": 1.92, - "learning_rate": 6.057917963100699e-07, - "loss": 0.7314, - "step": 74924 - }, - { - "epoch": 1.92, - "learning_rate": 6.05766366728355e-07, - "loss": 0.8672, - "step": 74925 - }, - { - "epoch": 1.92, - "learning_rate": 6.057409374484867e-07, - "loss": 0.6865, - "step": 74926 - }, - { - "epoch": 1.92, - "learning_rate": 6.057155084704841e-07, - "loss": 0.4279, - "step": 74927 - }, - { - "epoch": 1.92, - "learning_rate": 6.056900797943672e-07, - "loss": 0.6226, - "step": 74928 - }, - { - "epoch": 1.92, - "learning_rate": 6.05664651420155e-07, - "loss": 0.5361, - "step": 74929 - }, - { - "epoch": 1.92, - "learning_rate": 6.056392233478676e-07, - "loss": 0.6846, - "step": 74930 - }, - { - "epoch": 1.92, - "learning_rate": 6.056137955775238e-07, - "loss": 0.7803, - "step": 74931 - }, - { - "epoch": 1.92, - "learning_rate": 6.055883681091436e-07, - "loss": 0.6406, - "step": 74932 - }, - { - "epoch": 1.92, - "learning_rate": 6.05562940942746e-07, - "loss": 0.6758, - "step": 74933 - }, - { - "epoch": 1.92, - "learning_rate": 6.05537514078351e-07, - "loss": 0.6465, - "step": 74934 - }, - { - "epoch": 1.92, - "learning_rate": 6.055120875159775e-07, - "loss": 0.553, - "step": 74935 - }, - { - "epoch": 1.92, - "learning_rate": 6.054866612556457e-07, - "loss": 0.457, - "step": 74936 - }, - { - "epoch": 1.92, - "learning_rate": 6.054612352973745e-07, - "loss": 0.4512, - "step": 74937 - }, - { - "epoch": 1.92, - "learning_rate": 6.054358096411831e-07, - "loss": 0.6172, - "step": 74938 - }, - { - "epoch": 1.92, - "learning_rate": 6.054103842870918e-07, - "loss": 0.5543, - "step": 74939 - }, - { - "epoch": 1.92, - "learning_rate": 6.053849592351192e-07, - "loss": 0.4702, - "step": 74940 - }, - { - "epoch": 1.92, - "learning_rate": 6.053595344852855e-07, - "loss": 0.6865, - "step": 74941 - }, - { - "epoch": 1.92, - "learning_rate": 6.0533411003761e-07, - "loss": 0.6846, - "step": 74942 - }, - { - "epoch": 1.92, - "learning_rate": 6.053086858921117e-07, - "loss": 0.709, - "step": 74943 - }, - { - "epoch": 1.92, - "learning_rate": 6.052832620488105e-07, - "loss": 0.6582, - "step": 74944 - }, - { - "epoch": 1.92, - "learning_rate": 6.052578385077256e-07, - "loss": 0.5762, - "step": 74945 - }, - { - "epoch": 1.92, - "learning_rate": 6.052324152688772e-07, - "loss": 0.5239, - "step": 74946 - }, - { - "epoch": 1.92, - "learning_rate": 6.052069923322838e-07, - "loss": 0.791, - "step": 74947 - }, - { - "epoch": 1.92, - "learning_rate": 6.051815696979651e-07, - "loss": 0.4484, - "step": 74948 - }, - { - "epoch": 1.92, - "learning_rate": 6.051561473659409e-07, - "loss": 0.6899, - "step": 74949 - }, - { - "epoch": 1.92, - "learning_rate": 6.051307253362304e-07, - "loss": 0.5254, - "step": 74950 - }, - { - "epoch": 1.92, - "learning_rate": 6.051053036088531e-07, - "loss": 0.6147, - "step": 74951 - }, - { - "epoch": 1.92, - "learning_rate": 6.050798821838285e-07, - "loss": 0.6633, - "step": 74952 - }, - { - "epoch": 1.92, - "learning_rate": 6.050544610611762e-07, - "loss": 0.5864, - "step": 74953 - }, - { - "epoch": 1.92, - "learning_rate": 6.050290402409154e-07, - "loss": 0.6348, - "step": 74954 - }, - { - "epoch": 1.92, - "learning_rate": 6.050036197230659e-07, - "loss": 0.6533, - "step": 74955 - }, - { - "epoch": 1.92, - "learning_rate": 6.049781995076471e-07, - "loss": 0.7471, - "step": 74956 - }, - { - "epoch": 1.92, - "learning_rate": 6.04952779594678e-07, - "loss": 0.7158, - "step": 74957 - }, - { - "epoch": 1.92, - "learning_rate": 6.049273599841785e-07, - "loss": 0.6616, - "step": 74958 - }, - { - "epoch": 1.92, - "learning_rate": 6.049019406761679e-07, - "loss": 0.6826, - "step": 74959 - }, - { - "epoch": 1.92, - "learning_rate": 6.048765216706657e-07, - "loss": 0.6187, - "step": 74960 - }, - { - "epoch": 1.92, - "learning_rate": 6.048511029676916e-07, - "loss": 0.5806, - "step": 74961 - }, - { - "epoch": 1.92, - "learning_rate": 6.048256845672645e-07, - "loss": 0.6567, - "step": 74962 - }, - { - "epoch": 1.92, - "learning_rate": 6.048002664694045e-07, - "loss": 0.6377, - "step": 74963 - }, - { - "epoch": 1.92, - "learning_rate": 6.047748486741304e-07, - "loss": 0.5706, - "step": 74964 - }, - { - "epoch": 1.92, - "learning_rate": 6.047494311814625e-07, - "loss": 0.6338, - "step": 74965 - }, - { - "epoch": 1.92, - "learning_rate": 6.047240139914199e-07, - "loss": 0.4956, - "step": 74966 - }, - { - "epoch": 1.92, - "learning_rate": 6.046985971040213e-07, - "loss": 0.5913, - "step": 74967 - }, - { - "epoch": 1.92, - "learning_rate": 6.046731805192873e-07, - "loss": 0.6475, - "step": 74968 - }, - { - "epoch": 1.92, - "learning_rate": 6.046477642372365e-07, - "loss": 0.6274, - "step": 74969 - }, - { - "epoch": 1.92, - "learning_rate": 6.046223482578889e-07, - "loss": 0.5254, - "step": 74970 - }, - { - "epoch": 1.92, - "learning_rate": 6.045969325812637e-07, - "loss": 0.4977, - "step": 74971 - }, - { - "epoch": 1.92, - "learning_rate": 6.045715172073807e-07, - "loss": 0.7461, - "step": 74972 - }, - { - "epoch": 1.92, - "learning_rate": 6.045461021362587e-07, - "loss": 0.5718, - "step": 74973 - }, - { - "epoch": 1.92, - "learning_rate": 6.045206873679179e-07, - "loss": 0.6367, - "step": 74974 - }, - { - "epoch": 1.92, - "learning_rate": 6.044952729023773e-07, - "loss": 0.667, - "step": 74975 - }, - { - "epoch": 1.92, - "learning_rate": 6.04469858739657e-07, - "loss": 0.6562, - "step": 74976 - }, - { - "epoch": 1.92, - "learning_rate": 6.044444448797753e-07, - "loss": 0.543, - "step": 74977 - }, - { - "epoch": 1.92, - "learning_rate": 6.044190313227526e-07, - "loss": 0.6221, - "step": 74978 - }, - { - "epoch": 1.92, - "learning_rate": 6.043936180686078e-07, - "loss": 0.6245, - "step": 74979 - }, - { - "epoch": 1.92, - "learning_rate": 6.043682051173608e-07, - "loss": 0.5005, - "step": 74980 - }, - { - "epoch": 1.92, - "learning_rate": 6.043427924690307e-07, - "loss": 0.5708, - "step": 74981 - }, - { - "epoch": 1.92, - "learning_rate": 6.043173801236373e-07, - "loss": 0.5669, - "step": 74982 - }, - { - "epoch": 1.92, - "learning_rate": 6.042919680811997e-07, - "loss": 0.4675, - "step": 74983 - }, - { - "epoch": 1.92, - "learning_rate": 6.042665563417378e-07, - "loss": 0.5815, - "step": 74984 - }, - { - "epoch": 1.92, - "learning_rate": 6.042411449052704e-07, - "loss": 0.6455, - "step": 74985 - }, - { - "epoch": 1.92, - "learning_rate": 6.04215733771818e-07, - "loss": 0.5149, - "step": 74986 - }, - { - "epoch": 1.92, - "learning_rate": 6.041903229413991e-07, - "loss": 0.5654, - "step": 74987 - }, - { - "epoch": 1.92, - "learning_rate": 6.041649124140334e-07, - "loss": 0.6128, - "step": 74988 - }, - { - "epoch": 1.92, - "learning_rate": 6.041395021897405e-07, - "loss": 0.5552, - "step": 74989 - }, - { - "epoch": 1.92, - "learning_rate": 6.041140922685396e-07, - "loss": 0.4468, - "step": 74990 - }, - { - "epoch": 1.92, - "learning_rate": 6.040886826504506e-07, - "loss": 0.6377, - "step": 74991 - }, - { - "epoch": 1.92, - "learning_rate": 6.040632733354923e-07, - "loss": 0.5591, - "step": 74992 - }, - { - "epoch": 1.92, - "learning_rate": 6.040378643236849e-07, - "loss": 0.6953, - "step": 74993 - }, - { - "epoch": 1.92, - "learning_rate": 6.040124556150473e-07, - "loss": 0.582, - "step": 74994 - }, - { - "epoch": 1.92, - "learning_rate": 6.039870472095993e-07, - "loss": 0.6987, - "step": 74995 - }, - { - "epoch": 1.92, - "learning_rate": 6.039616391073605e-07, - "loss": 0.667, - "step": 74996 - }, - { - "epoch": 1.92, - "learning_rate": 6.039362313083498e-07, - "loss": 0.7256, - "step": 74997 - }, - { - "epoch": 1.92, - "learning_rate": 6.039108238125867e-07, - "loss": 0.494, - "step": 74998 - }, - { - "epoch": 1.92, - "learning_rate": 6.038854166200911e-07, - "loss": 0.7432, - "step": 74999 - }, - { - "epoch": 1.92, - "learning_rate": 6.03860009730882e-07, - "loss": 0.7031, - "step": 75000 - }, - { - "epoch": 1.92, - "learning_rate": 6.038346031449792e-07, - "loss": 0.6494, - "step": 75001 - }, - { - "epoch": 1.92, - "learning_rate": 6.03809196862402e-07, - "loss": 0.6001, - "step": 75002 - }, - { - "epoch": 1.92, - "learning_rate": 6.0378379088317e-07, - "loss": 0.7686, - "step": 75003 - }, - { - "epoch": 1.92, - "learning_rate": 6.037583852073023e-07, - "loss": 0.6719, - "step": 75004 - }, - { - "epoch": 1.92, - "learning_rate": 6.037329798348189e-07, - "loss": 0.5889, - "step": 75005 - }, - { - "epoch": 1.92, - "learning_rate": 6.037075747657389e-07, - "loss": 0.6562, - "step": 75006 - }, - { - "epoch": 1.92, - "learning_rate": 6.036821700000816e-07, - "loss": 0.6436, - "step": 75007 - }, - { - "epoch": 1.92, - "learning_rate": 6.036567655378668e-07, - "loss": 0.7549, - "step": 75008 - }, - { - "epoch": 1.92, - "learning_rate": 6.036313613791135e-07, - "loss": 0.6313, - "step": 75009 - }, - { - "epoch": 1.92, - "learning_rate": 6.036059575238418e-07, - "loss": 0.6841, - "step": 75010 - }, - { - "epoch": 1.92, - "learning_rate": 6.035805539720704e-07, - "loss": 0.48, - "step": 75011 - }, - { - "epoch": 1.92, - "learning_rate": 6.035551507238195e-07, - "loss": 0.5811, - "step": 75012 - }, - { - "epoch": 1.92, - "learning_rate": 6.035297477791079e-07, - "loss": 0.6523, - "step": 75013 - }, - { - "epoch": 1.92, - "learning_rate": 6.035043451379556e-07, - "loss": 0.6074, - "step": 75014 - }, - { - "epoch": 1.92, - "learning_rate": 6.034789428003818e-07, - "loss": 0.7329, - "step": 75015 - }, - { - "epoch": 1.92, - "learning_rate": 6.03453540766406e-07, - "loss": 0.7471, - "step": 75016 - }, - { - "epoch": 1.92, - "learning_rate": 6.034281390360474e-07, - "loss": 0.4795, - "step": 75017 - }, - { - "epoch": 1.92, - "learning_rate": 6.034027376093258e-07, - "loss": 0.6523, - "step": 75018 - }, - { - "epoch": 1.92, - "learning_rate": 6.033773364862602e-07, - "loss": 0.6748, - "step": 75019 - }, - { - "epoch": 1.92, - "learning_rate": 6.033519356668706e-07, - "loss": 0.6968, - "step": 75020 - }, - { - "epoch": 1.92, - "learning_rate": 6.033265351511759e-07, - "loss": 0.5688, - "step": 75021 - }, - { - "epoch": 1.92, - "learning_rate": 6.033011349391961e-07, - "loss": 0.4169, - "step": 75022 - }, - { - "epoch": 1.92, - "learning_rate": 6.032757350309501e-07, - "loss": 0.4905, - "step": 75023 - }, - { - "epoch": 1.92, - "learning_rate": 6.03250335426458e-07, - "loss": 0.5542, - "step": 75024 - }, - { - "epoch": 1.92, - "learning_rate": 6.032249361257385e-07, - "loss": 0.458, - "step": 75025 - }, - { - "epoch": 1.92, - "learning_rate": 6.031995371288119e-07, - "loss": 0.5439, - "step": 75026 - }, - { - "epoch": 1.92, - "learning_rate": 6.03174138435697e-07, - "loss": 0.6406, - "step": 75027 - }, - { - "epoch": 1.92, - "learning_rate": 6.031487400464132e-07, - "loss": 0.5522, - "step": 75028 - }, - { - "epoch": 1.92, - "learning_rate": 6.031233419609802e-07, - "loss": 0.5781, - "step": 75029 - }, - { - "epoch": 1.92, - "learning_rate": 6.030979441794174e-07, - "loss": 0.6323, - "step": 75030 - }, - { - "epoch": 1.92, - "learning_rate": 6.030725467017444e-07, - "loss": 0.5591, - "step": 75031 - }, - { - "epoch": 1.92, - "learning_rate": 6.030471495279805e-07, - "loss": 0.5576, - "step": 75032 - }, - { - "epoch": 1.92, - "learning_rate": 6.030217526581449e-07, - "loss": 0.749, - "step": 75033 - }, - { - "epoch": 1.92, - "learning_rate": 6.029963560922576e-07, - "loss": 0.3771, - "step": 75034 - }, - { - "epoch": 1.92, - "learning_rate": 6.029709598303374e-07, - "loss": 0.6709, - "step": 75035 - }, - { - "epoch": 1.92, - "learning_rate": 6.029455638724046e-07, - "loss": 0.7144, - "step": 75036 - }, - { - "epoch": 1.92, - "learning_rate": 6.029201682184779e-07, - "loss": 0.8125, - "step": 75037 - }, - { - "epoch": 1.92, - "learning_rate": 6.028947728685767e-07, - "loss": 0.3254, - "step": 75038 - }, - { - "epoch": 1.92, - "learning_rate": 6.028693778227209e-07, - "loss": 0.6133, - "step": 75039 - }, - { - "epoch": 1.92, - "learning_rate": 6.028439830809296e-07, - "loss": 0.5962, - "step": 75040 - }, - { - "epoch": 1.92, - "learning_rate": 6.028185886432227e-07, - "loss": 0.6831, - "step": 75041 - }, - { - "epoch": 1.92, - "learning_rate": 6.027931945096189e-07, - "loss": 0.6885, - "step": 75042 - }, - { - "epoch": 1.92, - "learning_rate": 6.027678006801385e-07, - "loss": 0.6826, - "step": 75043 - }, - { - "epoch": 1.92, - "learning_rate": 6.027424071548003e-07, - "loss": 0.8037, - "step": 75044 - }, - { - "epoch": 1.92, - "learning_rate": 6.027170139336241e-07, - "loss": 0.6523, - "step": 75045 - }, - { - "epoch": 1.92, - "learning_rate": 6.026916210166295e-07, - "loss": 0.7598, - "step": 75046 - }, - { - "epoch": 1.92, - "learning_rate": 6.026662284038353e-07, - "loss": 0.667, - "step": 75047 - }, - { - "epoch": 1.92, - "learning_rate": 6.026408360952613e-07, - "loss": 0.7275, - "step": 75048 - }, - { - "epoch": 1.92, - "learning_rate": 6.02615444090927e-07, - "loss": 0.6235, - "step": 75049 - }, - { - "epoch": 1.92, - "learning_rate": 6.025900523908517e-07, - "loss": 0.6274, - "step": 75050 - }, - { - "epoch": 1.92, - "learning_rate": 6.025646609950551e-07, - "loss": 0.6416, - "step": 75051 - }, - { - "epoch": 1.92, - "learning_rate": 6.025392699035562e-07, - "loss": 0.3041, - "step": 75052 - }, - { - "epoch": 1.92, - "learning_rate": 6.025138791163748e-07, - "loss": 0.5859, - "step": 75053 - }, - { - "epoch": 1.92, - "learning_rate": 6.024884886335303e-07, - "loss": 0.5693, - "step": 75054 - }, - { - "epoch": 1.92, - "learning_rate": 6.024630984550422e-07, - "loss": 0.6377, - "step": 75055 - }, - { - "epoch": 1.92, - "learning_rate": 6.024377085809301e-07, - "loss": 0.6338, - "step": 75056 - }, - { - "epoch": 1.92, - "learning_rate": 6.024123190112124e-07, - "loss": 0.7168, - "step": 75057 - }, - { - "epoch": 1.92, - "learning_rate": 6.023869297459099e-07, - "loss": 0.634, - "step": 75058 - }, - { - "epoch": 1.92, - "learning_rate": 6.023615407850411e-07, - "loss": 0.6128, - "step": 75059 - }, - { - "epoch": 1.92, - "learning_rate": 6.02336152128626e-07, - "loss": 0.6523, - "step": 75060 - }, - { - "epoch": 1.92, - "learning_rate": 6.023107637766836e-07, - "loss": 0.5693, - "step": 75061 - }, - { - "epoch": 1.92, - "learning_rate": 6.022853757292338e-07, - "loss": 0.7061, - "step": 75062 - }, - { - "epoch": 1.92, - "learning_rate": 6.022599879862955e-07, - "loss": 0.4993, - "step": 75063 - }, - { - "epoch": 1.92, - "learning_rate": 6.022346005478887e-07, - "loss": 0.7373, - "step": 75064 - }, - { - "epoch": 1.92, - "learning_rate": 6.022092134140329e-07, - "loss": 0.7012, - "step": 75065 - }, - { - "epoch": 1.92, - "learning_rate": 6.021838265847469e-07, - "loss": 0.3555, - "step": 75066 - }, - { - "epoch": 1.92, - "learning_rate": 6.021584400600501e-07, - "loss": 0.6592, - "step": 75067 - }, - { - "epoch": 1.92, - "learning_rate": 6.021330538399627e-07, - "loss": 0.5811, - "step": 75068 - }, - { - "epoch": 1.92, - "learning_rate": 6.021076679245035e-07, - "loss": 0.6416, - "step": 75069 - }, - { - "epoch": 1.92, - "learning_rate": 6.020822823136924e-07, - "loss": 0.6138, - "step": 75070 - }, - { - "epoch": 1.92, - "learning_rate": 6.020568970075484e-07, - "loss": 0.6147, - "step": 75071 - }, - { - "epoch": 1.92, - "learning_rate": 6.020315120060911e-07, - "loss": 0.7686, - "step": 75072 - }, - { - "epoch": 1.92, - "learning_rate": 6.020061273093399e-07, - "loss": 0.6245, - "step": 75073 - }, - { - "epoch": 1.92, - "learning_rate": 6.019807429173147e-07, - "loss": 0.5947, - "step": 75074 - }, - { - "epoch": 1.92, - "learning_rate": 6.019553588300346e-07, - "loss": 0.5327, - "step": 75075 - }, - { - "epoch": 1.92, - "learning_rate": 6.019299750475186e-07, - "loss": 0.5817, - "step": 75076 - }, - { - "epoch": 1.92, - "learning_rate": 6.019045915697867e-07, - "loss": 0.7061, - "step": 75077 - }, - { - "epoch": 1.92, - "learning_rate": 6.018792083968578e-07, - "loss": 0.623, - "step": 75078 - }, - { - "epoch": 1.92, - "learning_rate": 6.018538255287521e-07, - "loss": 0.4399, - "step": 75079 - }, - { - "epoch": 1.92, - "learning_rate": 6.018284429654883e-07, - "loss": 0.6606, - "step": 75080 - }, - { - "epoch": 1.92, - "learning_rate": 6.018030607070865e-07, - "loss": 0.6465, - "step": 75081 - }, - { - "epoch": 1.92, - "learning_rate": 6.017776787535653e-07, - "loss": 0.5815, - "step": 75082 - }, - { - "epoch": 1.92, - "learning_rate": 6.017522971049451e-07, - "loss": 0.4644, - "step": 75083 - }, - { - "epoch": 1.92, - "learning_rate": 6.017269157612446e-07, - "loss": 0.4678, - "step": 75084 - }, - { - "epoch": 1.92, - "learning_rate": 6.01701534722484e-07, - "loss": 0.7158, - "step": 75085 - }, - { - "epoch": 1.92, - "learning_rate": 6.016761539886816e-07, - "loss": 0.6367, - "step": 75086 - }, - { - "epoch": 1.92, - "learning_rate": 6.016507735598577e-07, - "loss": 0.542, - "step": 75087 - }, - { - "epoch": 1.92, - "learning_rate": 6.016253934360314e-07, - "loss": 0.6631, - "step": 75088 - }, - { - "epoch": 1.92, - "learning_rate": 6.016000136172224e-07, - "loss": 0.6912, - "step": 75089 - }, - { - "epoch": 1.92, - "learning_rate": 6.015746341034496e-07, - "loss": 0.6528, - "step": 75090 - }, - { - "epoch": 1.92, - "learning_rate": 6.01549254894733e-07, - "loss": 0.5054, - "step": 75091 - }, - { - "epoch": 1.92, - "learning_rate": 6.015238759910916e-07, - "loss": 0.5266, - "step": 75092 - }, - { - "epoch": 1.92, - "learning_rate": 6.014984973925454e-07, - "loss": 0.5928, - "step": 75093 - }, - { - "epoch": 1.92, - "learning_rate": 6.014731190991131e-07, - "loss": 0.6191, - "step": 75094 - }, - { - "epoch": 1.92, - "learning_rate": 6.014477411108151e-07, - "loss": 0.5447, - "step": 75095 - }, - { - "epoch": 1.92, - "learning_rate": 6.0142236342767e-07, - "loss": 0.5544, - "step": 75096 - }, - { - "epoch": 1.92, - "learning_rate": 6.013969860496972e-07, - "loss": 0.2887, - "step": 75097 - }, - { - "epoch": 1.92, - "learning_rate": 6.013716089769166e-07, - "loss": 0.6631, - "step": 75098 - }, - { - "epoch": 1.92, - "learning_rate": 6.013462322093472e-07, - "loss": 0.7002, - "step": 75099 - }, - { - "epoch": 1.92, - "learning_rate": 6.013208557470089e-07, - "loss": 0.5479, - "step": 75100 - }, - { - "epoch": 1.92, - "learning_rate": 6.012954795899206e-07, - "loss": 0.7334, - "step": 75101 - }, - { - "epoch": 1.92, - "learning_rate": 6.012701037381024e-07, - "loss": 0.6982, - "step": 75102 - }, - { - "epoch": 1.92, - "learning_rate": 6.01244728191573e-07, - "loss": 0.6885, - "step": 75103 - }, - { - "epoch": 1.92, - "learning_rate": 6.012193529503524e-07, - "loss": 0.6611, - "step": 75104 - }, - { - "epoch": 1.92, - "learning_rate": 6.011939780144602e-07, - "loss": 0.7378, - "step": 75105 - }, - { - "epoch": 1.93, - "learning_rate": 6.011686033839149e-07, - "loss": 0.5933, - "step": 75106 - }, - { - "epoch": 1.93, - "learning_rate": 6.011432290587365e-07, - "loss": 0.7217, - "step": 75107 - }, - { - "epoch": 1.93, - "learning_rate": 6.011178550389444e-07, - "loss": 0.5208, - "step": 75108 - }, - { - "epoch": 1.93, - "learning_rate": 6.01092481324558e-07, - "loss": 0.4487, - "step": 75109 - }, - { - "epoch": 1.93, - "learning_rate": 6.010671079155969e-07, - "loss": 0.6211, - "step": 75110 - }, - { - "epoch": 1.93, - "learning_rate": 6.010417348120802e-07, - "loss": 0.6348, - "step": 75111 - }, - { - "epoch": 1.93, - "learning_rate": 6.010163620140276e-07, - "loss": 0.6543, - "step": 75112 - }, - { - "epoch": 1.93, - "learning_rate": 6.009909895214582e-07, - "loss": 0.5645, - "step": 75113 - }, - { - "epoch": 1.93, - "learning_rate": 6.00965617334392e-07, - "loss": 0.7139, - "step": 75114 - }, - { - "epoch": 1.93, - "learning_rate": 6.009402454528483e-07, - "loss": 0.6074, - "step": 75115 - }, - { - "epoch": 1.93, - "learning_rate": 6.009148738768457e-07, - "loss": 0.5991, - "step": 75116 - }, - { - "epoch": 1.93, - "learning_rate": 6.008895026064046e-07, - "loss": 0.666, - "step": 75117 - }, - { - "epoch": 1.93, - "learning_rate": 6.008641316415437e-07, - "loss": 0.4978, - "step": 75118 - }, - { - "epoch": 1.93, - "learning_rate": 6.008387609822832e-07, - "loss": 0.7107, - "step": 75119 - }, - { - "epoch": 1.93, - "learning_rate": 6.008133906286417e-07, - "loss": 0.5796, - "step": 75120 - }, - { - "epoch": 1.93, - "learning_rate": 6.007880205806394e-07, - "loss": 0.5942, - "step": 75121 - }, - { - "epoch": 1.93, - "learning_rate": 6.007626508382952e-07, - "loss": 0.6113, - "step": 75122 - }, - { - "epoch": 1.93, - "learning_rate": 6.007372814016286e-07, - "loss": 0.5347, - "step": 75123 - }, - { - "epoch": 1.93, - "learning_rate": 6.007119122706593e-07, - "loss": 0.6855, - "step": 75124 - }, - { - "epoch": 1.93, - "learning_rate": 6.006865434454067e-07, - "loss": 0.6616, - "step": 75125 - }, - { - "epoch": 1.93, - "learning_rate": 6.006611749258896e-07, - "loss": 0.6475, - "step": 75126 - }, - { - "epoch": 1.93, - "learning_rate": 6.006358067121281e-07, - "loss": 0.9131, - "step": 75127 - }, - { - "epoch": 1.93, - "learning_rate": 6.006104388041412e-07, - "loss": 0.6504, - "step": 75128 - }, - { - "epoch": 1.93, - "learning_rate": 6.005850712019487e-07, - "loss": 0.5981, - "step": 75129 - }, - { - "epoch": 1.93, - "learning_rate": 6.005597039055698e-07, - "loss": 0.6338, - "step": 75130 - }, - { - "epoch": 1.93, - "learning_rate": 6.00534336915024e-07, - "loss": 0.5298, - "step": 75131 - }, - { - "epoch": 1.93, - "learning_rate": 6.005089702303305e-07, - "loss": 0.6992, - "step": 75132 - }, - { - "epoch": 1.93, - "learning_rate": 6.004836038515092e-07, - "loss": 0.4644, - "step": 75133 - }, - { - "epoch": 1.93, - "learning_rate": 6.00458237778579e-07, - "loss": 0.4264, - "step": 75134 - }, - { - "epoch": 1.93, - "learning_rate": 6.004328720115599e-07, - "loss": 0.748, - "step": 75135 - }, - { - "epoch": 1.93, - "learning_rate": 6.004075065504707e-07, - "loss": 0.4724, - "step": 75136 - }, - { - "epoch": 1.93, - "learning_rate": 6.003821413953312e-07, - "loss": 0.6943, - "step": 75137 - }, - { - "epoch": 1.93, - "learning_rate": 6.003567765461608e-07, - "loss": 0.7266, - "step": 75138 - }, - { - "epoch": 1.93, - "learning_rate": 6.003314120029787e-07, - "loss": 0.6592, - "step": 75139 - }, - { - "epoch": 1.93, - "learning_rate": 6.003060477658044e-07, - "loss": 0.7471, - "step": 75140 - }, - { - "epoch": 1.93, - "learning_rate": 6.002806838346575e-07, - "loss": 0.6152, - "step": 75141 - }, - { - "epoch": 1.93, - "learning_rate": 6.00255320209557e-07, - "loss": 0.6182, - "step": 75142 - }, - { - "epoch": 1.93, - "learning_rate": 6.002299568905231e-07, - "loss": 0.4609, - "step": 75143 - }, - { - "epoch": 1.93, - "learning_rate": 6.002045938775743e-07, - "loss": 0.5679, - "step": 75144 - }, - { - "epoch": 1.93, - "learning_rate": 6.00179231170731e-07, - "loss": 0.7773, - "step": 75145 - }, - { - "epoch": 1.93, - "learning_rate": 6.001538687700119e-07, - "loss": 0.5854, - "step": 75146 - }, - { - "epoch": 1.93, - "learning_rate": 6.001285066754362e-07, - "loss": 0.6028, - "step": 75147 - }, - { - "epoch": 1.93, - "learning_rate": 6.001031448870241e-07, - "loss": 0.6201, - "step": 75148 - }, - { - "epoch": 1.93, - "learning_rate": 6.000777834047944e-07, - "loss": 0.493, - "step": 75149 - }, - { - "epoch": 1.93, - "learning_rate": 6.000524222287668e-07, - "loss": 0.6968, - "step": 75150 - }, - { - "epoch": 1.93, - "learning_rate": 6.000270613589607e-07, - "loss": 0.6943, - "step": 75151 - }, - { - "epoch": 1.93, - "learning_rate": 6.000017007953955e-07, - "loss": 0.6016, - "step": 75152 - }, - { - "epoch": 1.93, - "learning_rate": 5.999763405380905e-07, - "loss": 0.7656, - "step": 75153 - }, - { - "epoch": 1.93, - "learning_rate": 5.999509805870655e-07, - "loss": 0.5542, - "step": 75154 - }, - { - "epoch": 1.93, - "learning_rate": 5.999256209423397e-07, - "loss": 0.585, - "step": 75155 - }, - { - "epoch": 1.93, - "learning_rate": 5.999002616039323e-07, - "loss": 0.6069, - "step": 75156 - }, - { - "epoch": 1.93, - "learning_rate": 5.998749025718627e-07, - "loss": 0.6953, - "step": 75157 - }, - { - "epoch": 1.93, - "learning_rate": 5.998495438461507e-07, - "loss": 0.5493, - "step": 75158 - }, - { - "epoch": 1.93, - "learning_rate": 5.998241854268153e-07, - "loss": 0.665, - "step": 75159 - }, - { - "epoch": 1.93, - "learning_rate": 5.997988273138763e-07, - "loss": 0.6777, - "step": 75160 - }, - { - "epoch": 1.93, - "learning_rate": 5.997734695073527e-07, - "loss": 0.6448, - "step": 75161 - }, - { - "epoch": 1.93, - "learning_rate": 5.997481120072642e-07, - "loss": 0.6875, - "step": 75162 - }, - { - "epoch": 1.93, - "learning_rate": 5.997227548136303e-07, - "loss": 0.709, - "step": 75163 - }, - { - "epoch": 1.93, - "learning_rate": 5.996973979264704e-07, - "loss": 0.5142, - "step": 75164 - }, - { - "epoch": 1.93, - "learning_rate": 5.996720413458038e-07, - "loss": 0.5239, - "step": 75165 - }, - { - "epoch": 1.93, - "learning_rate": 5.996466850716497e-07, - "loss": 0.7959, - "step": 75166 - }, - { - "epoch": 1.93, - "learning_rate": 5.996213291040277e-07, - "loss": 0.6357, - "step": 75167 - }, - { - "epoch": 1.93, - "learning_rate": 5.995959734429573e-07, - "loss": 0.6055, - "step": 75168 - }, - { - "epoch": 1.93, - "learning_rate": 5.995706180884579e-07, - "loss": 0.6162, - "step": 75169 - }, - { - "epoch": 1.93, - "learning_rate": 5.995452630405488e-07, - "loss": 0.6113, - "step": 75170 - }, - { - "epoch": 1.93, - "learning_rate": 5.995199082992495e-07, - "loss": 0.6934, - "step": 75171 - }, - { - "epoch": 1.93, - "learning_rate": 5.994945538645792e-07, - "loss": 0.5815, - "step": 75172 - }, - { - "epoch": 1.93, - "learning_rate": 5.99469199736558e-07, - "loss": 0.7129, - "step": 75173 - }, - { - "epoch": 1.93, - "learning_rate": 5.994438459152042e-07, - "loss": 0.4111, - "step": 75174 - }, - { - "epoch": 1.93, - "learning_rate": 5.994184924005388e-07, - "loss": 0.6562, - "step": 75175 - }, - { - "epoch": 1.93, - "learning_rate": 5.993931391925795e-07, - "loss": 0.3896, - "step": 75176 - }, - { - "epoch": 1.93, - "learning_rate": 5.993677862913466e-07, - "loss": 0.5938, - "step": 75177 - }, - { - "epoch": 1.93, - "learning_rate": 5.993424336968591e-07, - "loss": 0.6719, - "step": 75178 - }, - { - "epoch": 1.93, - "learning_rate": 5.993170814091371e-07, - "loss": 0.7373, - "step": 75179 - }, - { - "epoch": 1.93, - "learning_rate": 5.992917294281992e-07, - "loss": 0.6377, - "step": 75180 - }, - { - "epoch": 1.93, - "learning_rate": 5.992663777540654e-07, - "loss": 0.5986, - "step": 75181 - }, - { - "epoch": 1.93, - "learning_rate": 5.992410263867548e-07, - "loss": 0.6709, - "step": 75182 - }, - { - "epoch": 1.93, - "learning_rate": 5.992156753262872e-07, - "loss": 0.5977, - "step": 75183 - }, - { - "epoch": 1.93, - "learning_rate": 5.991903245726813e-07, - "loss": 0.6343, - "step": 75184 - }, - { - "epoch": 1.93, - "learning_rate": 5.991649741259574e-07, - "loss": 0.5405, - "step": 75185 - }, - { - "epoch": 1.93, - "learning_rate": 5.991396239861344e-07, - "loss": 0.6162, - "step": 75186 - }, - { - "epoch": 1.93, - "learning_rate": 5.991142741532313e-07, - "loss": 0.6221, - "step": 75187 - }, - { - "epoch": 1.93, - "learning_rate": 5.990889246272683e-07, - "loss": 0.6372, - "step": 75188 - }, - { - "epoch": 1.93, - "learning_rate": 5.990635754082645e-07, - "loss": 0.668, - "step": 75189 - }, - { - "epoch": 1.93, - "learning_rate": 5.990382264962393e-07, - "loss": 0.5007, - "step": 75190 - }, - { - "epoch": 1.93, - "learning_rate": 5.990128778912118e-07, - "loss": 0.7031, - "step": 75191 - }, - { - "epoch": 1.93, - "learning_rate": 5.98987529593202e-07, - "loss": 0.6689, - "step": 75192 - }, - { - "epoch": 1.93, - "learning_rate": 5.989621816022288e-07, - "loss": 0.7007, - "step": 75193 - }, - { - "epoch": 1.93, - "learning_rate": 5.989368339183119e-07, - "loss": 0.7324, - "step": 75194 - }, - { - "epoch": 1.93, - "learning_rate": 5.98911486541471e-07, - "loss": 0.5513, - "step": 75195 - }, - { - "epoch": 1.93, - "learning_rate": 5.988861394717248e-07, - "loss": 0.4648, - "step": 75196 - }, - { - "epoch": 1.93, - "learning_rate": 5.98860792709093e-07, - "loss": 0.5737, - "step": 75197 - }, - { - "epoch": 1.93, - "learning_rate": 5.988354462535951e-07, - "loss": 0.7031, - "step": 75198 - }, - { - "epoch": 1.93, - "learning_rate": 5.988101001052504e-07, - "loss": 0.7334, - "step": 75199 - }, - { - "epoch": 1.93, - "learning_rate": 5.987847542640784e-07, - "loss": 0.6738, - "step": 75200 - }, - { - "epoch": 1.93, - "learning_rate": 5.987594087300983e-07, - "loss": 0.4111, - "step": 75201 - }, - { - "epoch": 1.93, - "learning_rate": 5.987340635033299e-07, - "loss": 0.8379, - "step": 75202 - }, - { - "epoch": 1.93, - "learning_rate": 5.987087185837921e-07, - "loss": 0.6152, - "step": 75203 - }, - { - "epoch": 1.93, - "learning_rate": 5.986833739715049e-07, - "loss": 0.6523, - "step": 75204 - }, - { - "epoch": 1.93, - "learning_rate": 5.986580296664876e-07, - "loss": 0.5566, - "step": 75205 - }, - { - "epoch": 1.93, - "learning_rate": 5.986326856687589e-07, - "loss": 0.6768, - "step": 75206 - }, - { - "epoch": 1.93, - "learning_rate": 5.986073419783389e-07, - "loss": 0.623, - "step": 75207 - }, - { - "epoch": 1.93, - "learning_rate": 5.985819985952467e-07, - "loss": 0.7109, - "step": 75208 - }, - { - "epoch": 1.93, - "learning_rate": 5.985566555195019e-07, - "loss": 0.5991, - "step": 75209 - }, - { - "epoch": 1.93, - "learning_rate": 5.985313127511236e-07, - "loss": 0.5192, - "step": 75210 - }, - { - "epoch": 1.93, - "learning_rate": 5.985059702901316e-07, - "loss": 0.563, - "step": 75211 - }, - { - "epoch": 1.93, - "learning_rate": 5.984806281365453e-07, - "loss": 0.6772, - "step": 75212 - }, - { - "epoch": 1.93, - "learning_rate": 5.984552862903835e-07, - "loss": 0.7441, - "step": 75213 - }, - { - "epoch": 1.93, - "learning_rate": 5.984299447516664e-07, - "loss": 0.5781, - "step": 75214 - }, - { - "epoch": 1.93, - "learning_rate": 5.984046035204132e-07, - "loss": 0.6514, - "step": 75215 - }, - { - "epoch": 1.93, - "learning_rate": 5.983792625966426e-07, - "loss": 0.7676, - "step": 75216 - }, - { - "epoch": 1.93, - "learning_rate": 5.983539219803748e-07, - "loss": 0.6553, - "step": 75217 - }, - { - "epoch": 1.93, - "learning_rate": 5.983285816716288e-07, - "loss": 0.4656, - "step": 75218 - }, - { - "epoch": 1.93, - "learning_rate": 5.983032416704243e-07, - "loss": 0.5752, - "step": 75219 - }, - { - "epoch": 1.93, - "learning_rate": 5.982779019767803e-07, - "loss": 0.7422, - "step": 75220 - }, - { - "epoch": 1.93, - "learning_rate": 5.982525625907167e-07, - "loss": 0.426, - "step": 75221 - }, - { - "epoch": 1.93, - "learning_rate": 5.982272235122523e-07, - "loss": 0.562, - "step": 75222 - }, - { - "epoch": 1.93, - "learning_rate": 5.982018847414072e-07, - "loss": 0.75, - "step": 75223 - }, - { - "epoch": 1.93, - "learning_rate": 5.981765462782002e-07, - "loss": 0.5684, - "step": 75224 - }, - { - "epoch": 1.93, - "learning_rate": 5.981512081226513e-07, - "loss": 0.6041, - "step": 75225 - }, - { - "epoch": 1.93, - "learning_rate": 5.981258702747794e-07, - "loss": 0.6875, - "step": 75226 - }, - { - "epoch": 1.93, - "learning_rate": 5.981005327346038e-07, - "loss": 0.5034, - "step": 75227 - }, - { - "epoch": 1.93, - "learning_rate": 5.980751955021444e-07, - "loss": 0.623, - "step": 75228 - }, - { - "epoch": 1.93, - "learning_rate": 5.980498585774203e-07, - "loss": 0.646, - "step": 75229 - }, - { - "epoch": 1.93, - "learning_rate": 5.980245219604507e-07, - "loss": 0.5801, - "step": 75230 - }, - { - "epoch": 1.93, - "learning_rate": 5.979991856512554e-07, - "loss": 0.6909, - "step": 75231 - }, - { - "epoch": 1.93, - "learning_rate": 5.979738496498536e-07, - "loss": 0.7334, - "step": 75232 - }, - { - "epoch": 1.93, - "learning_rate": 5.979485139562648e-07, - "loss": 0.6973, - "step": 75233 - }, - { - "epoch": 1.93, - "learning_rate": 5.979231785705081e-07, - "loss": 0.5957, - "step": 75234 - }, - { - "epoch": 1.93, - "learning_rate": 5.978978434926036e-07, - "loss": 0.7637, - "step": 75235 - }, - { - "epoch": 1.93, - "learning_rate": 5.978725087225702e-07, - "loss": 0.4849, - "step": 75236 - }, - { - "epoch": 1.93, - "learning_rate": 5.97847174260427e-07, - "loss": 0.5693, - "step": 75237 - }, - { - "epoch": 1.93, - "learning_rate": 5.978218401061938e-07, - "loss": 0.5482, - "step": 75238 - }, - { - "epoch": 1.93, - "learning_rate": 5.977965062598899e-07, - "loss": 0.7344, - "step": 75239 - }, - { - "epoch": 1.93, - "learning_rate": 5.977711727215349e-07, - "loss": 0.5107, - "step": 75240 - }, - { - "epoch": 1.93, - "learning_rate": 5.977458394911477e-07, - "loss": 0.3691, - "step": 75241 - }, - { - "epoch": 1.93, - "learning_rate": 5.977205065687483e-07, - "loss": 0.5996, - "step": 75242 - }, - { - "epoch": 1.93, - "learning_rate": 5.976951739543557e-07, - "loss": 0.6035, - "step": 75243 - }, - { - "epoch": 1.93, - "learning_rate": 5.976698416479894e-07, - "loss": 0.7476, - "step": 75244 - }, - { - "epoch": 1.93, - "learning_rate": 5.976445096496692e-07, - "loss": 0.7192, - "step": 75245 - }, - { - "epoch": 1.93, - "learning_rate": 5.976191779594138e-07, - "loss": 0.5801, - "step": 75246 - }, - { - "epoch": 1.93, - "learning_rate": 5.975938465772425e-07, - "loss": 0.6375, - "step": 75247 - }, - { - "epoch": 1.93, - "learning_rate": 5.975685155031755e-07, - "loss": 0.5776, - "step": 75248 - }, - { - "epoch": 1.93, - "learning_rate": 5.975431847372317e-07, - "loss": 0.4504, - "step": 75249 - }, - { - "epoch": 1.93, - "learning_rate": 5.975178542794306e-07, - "loss": 0.6489, - "step": 75250 - }, - { - "epoch": 1.93, - "learning_rate": 5.974925241297915e-07, - "loss": 0.6787, - "step": 75251 - }, - { - "epoch": 1.93, - "learning_rate": 5.974671942883339e-07, - "loss": 0.6177, - "step": 75252 - }, - { - "epoch": 1.93, - "learning_rate": 5.974418647550771e-07, - "loss": 0.5317, - "step": 75253 - }, - { - "epoch": 1.93, - "learning_rate": 5.974165355300406e-07, - "loss": 0.7568, - "step": 75254 - }, - { - "epoch": 1.93, - "learning_rate": 5.973912066132442e-07, - "loss": 0.6797, - "step": 75255 - }, - { - "epoch": 1.93, - "learning_rate": 5.973658780047062e-07, - "loss": 0.408, - "step": 75256 - }, - { - "epoch": 1.93, - "learning_rate": 5.97340549704447e-07, - "loss": 0.5439, - "step": 75257 - }, - { - "epoch": 1.93, - "learning_rate": 5.973152217124853e-07, - "loss": 0.5801, - "step": 75258 - }, - { - "epoch": 1.93, - "learning_rate": 5.972898940288411e-07, - "loss": 0.5684, - "step": 75259 - }, - { - "epoch": 1.93, - "learning_rate": 5.972645666535332e-07, - "loss": 0.6826, - "step": 75260 - }, - { - "epoch": 1.93, - "learning_rate": 5.972392395865817e-07, - "loss": 0.5674, - "step": 75261 - }, - { - "epoch": 1.93, - "learning_rate": 5.972139128280051e-07, - "loss": 0.5767, - "step": 75262 - }, - { - "epoch": 1.93, - "learning_rate": 5.971885863778238e-07, - "loss": 0.6494, - "step": 75263 - }, - { - "epoch": 1.93, - "learning_rate": 5.971632602360563e-07, - "loss": 0.5752, - "step": 75264 - }, - { - "epoch": 1.93, - "learning_rate": 5.97137934402723e-07, - "loss": 0.6533, - "step": 75265 - }, - { - "epoch": 1.93, - "learning_rate": 5.971126088778421e-07, - "loss": 0.7812, - "step": 75266 - }, - { - "epoch": 1.93, - "learning_rate": 5.970872836614338e-07, - "loss": 0.4956, - "step": 75267 - }, - { - "epoch": 1.93, - "learning_rate": 5.970619587535168e-07, - "loss": 0.5654, - "step": 75268 - }, - { - "epoch": 1.93, - "learning_rate": 5.970366341541114e-07, - "loss": 0.6143, - "step": 75269 - }, - { - "epoch": 1.93, - "learning_rate": 5.970113098632363e-07, - "loss": 0.7896, - "step": 75270 - }, - { - "epoch": 1.93, - "learning_rate": 5.969859858809112e-07, - "loss": 0.6528, - "step": 75271 - }, - { - "epoch": 1.93, - "learning_rate": 5.969606622071551e-07, - "loss": 0.6284, - "step": 75272 - }, - { - "epoch": 1.93, - "learning_rate": 5.969353388419879e-07, - "loss": 0.5626, - "step": 75273 - }, - { - "epoch": 1.93, - "learning_rate": 5.969100157854287e-07, - "loss": 0.687, - "step": 75274 - }, - { - "epoch": 1.93, - "learning_rate": 5.968846930374975e-07, - "loss": 0.6523, - "step": 75275 - }, - { - "epoch": 1.93, - "learning_rate": 5.968593705982127e-07, - "loss": 0.5796, - "step": 75276 - }, - { - "epoch": 1.93, - "learning_rate": 5.968340484675943e-07, - "loss": 0.6079, - "step": 75277 - }, - { - "epoch": 1.93, - "learning_rate": 5.968087266456614e-07, - "loss": 0.5793, - "step": 75278 - }, - { - "epoch": 1.93, - "learning_rate": 5.967834051324334e-07, - "loss": 0.5107, - "step": 75279 - }, - { - "epoch": 1.93, - "learning_rate": 5.9675808392793e-07, - "loss": 0.5295, - "step": 75280 - }, - { - "epoch": 1.93, - "learning_rate": 5.967327630321701e-07, - "loss": 0.5933, - "step": 75281 - }, - { - "epoch": 1.93, - "learning_rate": 5.967074424451737e-07, - "loss": 0.7617, - "step": 75282 - }, - { - "epoch": 1.93, - "learning_rate": 5.966821221669597e-07, - "loss": 0.7617, - "step": 75283 - }, - { - "epoch": 1.93, - "learning_rate": 5.966568021975478e-07, - "loss": 0.5581, - "step": 75284 - }, - { - "epoch": 1.93, - "learning_rate": 5.966314825369574e-07, - "loss": 0.5601, - "step": 75285 - }, - { - "epoch": 1.93, - "learning_rate": 5.966061631852076e-07, - "loss": 0.4663, - "step": 75286 - }, - { - "epoch": 1.93, - "learning_rate": 5.965808441423177e-07, - "loss": 0.7695, - "step": 75287 - }, - { - "epoch": 1.93, - "learning_rate": 5.965555254083074e-07, - "loss": 0.6646, - "step": 75288 - }, - { - "epoch": 1.93, - "learning_rate": 5.965302069831959e-07, - "loss": 0.6392, - "step": 75289 - }, - { - "epoch": 1.93, - "learning_rate": 5.965048888670029e-07, - "loss": 0.5054, - "step": 75290 - }, - { - "epoch": 1.93, - "learning_rate": 5.964795710597472e-07, - "loss": 0.4314, - "step": 75291 - }, - { - "epoch": 1.93, - "learning_rate": 5.96454253561449e-07, - "loss": 0.5581, - "step": 75292 - }, - { - "epoch": 1.93, - "learning_rate": 5.964289363721267e-07, - "loss": 0.5674, - "step": 75293 - }, - { - "epoch": 1.93, - "learning_rate": 5.964036194918006e-07, - "loss": 0.4548, - "step": 75294 - }, - { - "epoch": 1.93, - "learning_rate": 5.963783029204898e-07, - "loss": 0.7207, - "step": 75295 - }, - { - "epoch": 1.93, - "learning_rate": 5.963529866582134e-07, - "loss": 0.6943, - "step": 75296 - }, - { - "epoch": 1.93, - "learning_rate": 5.963276707049909e-07, - "loss": 0.5239, - "step": 75297 - }, - { - "epoch": 1.93, - "learning_rate": 5.963023550608416e-07, - "loss": 0.6045, - "step": 75298 - }, - { - "epoch": 1.93, - "learning_rate": 5.962770397257852e-07, - "loss": 0.6113, - "step": 75299 - }, - { - "epoch": 1.93, - "learning_rate": 5.962517246998408e-07, - "loss": 0.6299, - "step": 75300 - }, - { - "epoch": 1.93, - "learning_rate": 5.96226409983028e-07, - "loss": 0.624, - "step": 75301 - }, - { - "epoch": 1.93, - "learning_rate": 5.962010955753661e-07, - "loss": 0.7178, - "step": 75302 - }, - { - "epoch": 1.93, - "learning_rate": 5.961757814768742e-07, - "loss": 0.5933, - "step": 75303 - }, - { - "epoch": 1.93, - "learning_rate": 5.961504676875722e-07, - "loss": 0.7061, - "step": 75304 - }, - { - "epoch": 1.93, - "learning_rate": 5.961251542074794e-07, - "loss": 0.5078, - "step": 75305 - }, - { - "epoch": 1.93, - "learning_rate": 5.960998410366147e-07, - "loss": 0.5062, - "step": 75306 - }, - { - "epoch": 1.93, - "learning_rate": 5.960745281749979e-07, - "loss": 0.5933, - "step": 75307 - }, - { - "epoch": 1.93, - "learning_rate": 5.960492156226481e-07, - "loss": 0.5771, - "step": 75308 - }, - { - "epoch": 1.93, - "learning_rate": 5.96023903379585e-07, - "loss": 0.5308, - "step": 75309 - }, - { - "epoch": 1.93, - "learning_rate": 5.959985914458276e-07, - "loss": 0.6689, - "step": 75310 - }, - { - "epoch": 1.93, - "learning_rate": 5.959732798213956e-07, - "loss": 0.5825, - "step": 75311 - }, - { - "epoch": 1.93, - "learning_rate": 5.959479685063083e-07, - "loss": 0.6348, - "step": 75312 - }, - { - "epoch": 1.93, - "learning_rate": 5.959226575005852e-07, - "loss": 0.6201, - "step": 75313 - }, - { - "epoch": 1.93, - "learning_rate": 5.958973468042453e-07, - "loss": 0.7197, - "step": 75314 - }, - { - "epoch": 1.93, - "learning_rate": 5.958720364173087e-07, - "loss": 0.6865, - "step": 75315 - }, - { - "epoch": 1.93, - "learning_rate": 5.958467263397939e-07, - "loss": 0.5652, - "step": 75316 - }, - { - "epoch": 1.93, - "learning_rate": 5.958214165717206e-07, - "loss": 0.8242, - "step": 75317 - }, - { - "epoch": 1.93, - "learning_rate": 5.957961071131086e-07, - "loss": 0.6304, - "step": 75318 - }, - { - "epoch": 1.93, - "learning_rate": 5.957707979639768e-07, - "loss": 0.4639, - "step": 75319 - }, - { - "epoch": 1.93, - "learning_rate": 5.957454891243445e-07, - "loss": 0.5972, - "step": 75320 - }, - { - "epoch": 1.93, - "learning_rate": 5.957201805942314e-07, - "loss": 0.6479, - "step": 75321 - }, - { - "epoch": 1.93, - "learning_rate": 5.956948723736567e-07, - "loss": 0.6777, - "step": 75322 - }, - { - "epoch": 1.93, - "learning_rate": 5.9566956446264e-07, - "loss": 0.5662, - "step": 75323 - }, - { - "epoch": 1.93, - "learning_rate": 5.956442568612003e-07, - "loss": 0.6494, - "step": 75324 - }, - { - "epoch": 1.93, - "learning_rate": 5.956189495693577e-07, - "loss": 0.6676, - "step": 75325 - }, - { - "epoch": 1.93, - "learning_rate": 5.955936425871308e-07, - "loss": 0.6919, - "step": 75326 - }, - { - "epoch": 1.93, - "learning_rate": 5.955683359145391e-07, - "loss": 0.5415, - "step": 75327 - }, - { - "epoch": 1.93, - "learning_rate": 5.955430295516023e-07, - "loss": 0.4222, - "step": 75328 - }, - { - "epoch": 1.93, - "learning_rate": 5.955177234983394e-07, - "loss": 0.574, - "step": 75329 - }, - { - "epoch": 1.93, - "learning_rate": 5.954924177547702e-07, - "loss": 0.7266, - "step": 75330 - }, - { - "epoch": 1.93, - "learning_rate": 5.954671123209137e-07, - "loss": 0.5674, - "step": 75331 - }, - { - "epoch": 1.93, - "learning_rate": 5.954418071967895e-07, - "loss": 0.6086, - "step": 75332 - }, - { - "epoch": 1.93, - "learning_rate": 5.954165023824167e-07, - "loss": 0.6821, - "step": 75333 - }, - { - "epoch": 1.93, - "learning_rate": 5.953911978778152e-07, - "loss": 0.6387, - "step": 75334 - }, - { - "epoch": 1.93, - "learning_rate": 5.953658936830042e-07, - "loss": 0.6401, - "step": 75335 - }, - { - "epoch": 1.93, - "learning_rate": 5.953405897980029e-07, - "loss": 0.7129, - "step": 75336 - }, - { - "epoch": 1.93, - "learning_rate": 5.953152862228302e-07, - "loss": 0.6211, - "step": 75337 - }, - { - "epoch": 1.93, - "learning_rate": 5.952899829575063e-07, - "loss": 0.4875, - "step": 75338 - }, - { - "epoch": 1.93, - "learning_rate": 5.952646800020501e-07, - "loss": 0.6313, - "step": 75339 - }, - { - "epoch": 1.93, - "learning_rate": 5.952393773564813e-07, - "loss": 0.6387, - "step": 75340 - }, - { - "epoch": 1.93, - "learning_rate": 5.952140750208189e-07, - "loss": 0.6423, - "step": 75341 - }, - { - "epoch": 1.93, - "learning_rate": 5.951887729950826e-07, - "loss": 0.6816, - "step": 75342 - }, - { - "epoch": 1.93, - "learning_rate": 5.951634712792915e-07, - "loss": 0.7422, - "step": 75343 - }, - { - "epoch": 1.93, - "learning_rate": 5.951381698734655e-07, - "loss": 0.5142, - "step": 75344 - }, - { - "epoch": 1.93, - "learning_rate": 5.951128687776235e-07, - "loss": 0.4788, - "step": 75345 - }, - { - "epoch": 1.93, - "learning_rate": 5.950875679917847e-07, - "loss": 0.7549, - "step": 75346 - }, - { - "epoch": 1.93, - "learning_rate": 5.950622675159689e-07, - "loss": 0.6367, - "step": 75347 - }, - { - "epoch": 1.93, - "learning_rate": 5.950369673501952e-07, - "loss": 0.7021, - "step": 75348 - }, - { - "epoch": 1.93, - "learning_rate": 5.950116674944831e-07, - "loss": 0.6528, - "step": 75349 - }, - { - "epoch": 1.93, - "learning_rate": 5.949863679488518e-07, - "loss": 0.7188, - "step": 75350 - }, - { - "epoch": 1.93, - "learning_rate": 5.949610687133211e-07, - "loss": 0.5046, - "step": 75351 - }, - { - "epoch": 1.93, - "learning_rate": 5.949357697879097e-07, - "loss": 0.519, - "step": 75352 - }, - { - "epoch": 1.93, - "learning_rate": 5.949104711726377e-07, - "loss": 0.7197, - "step": 75353 - }, - { - "epoch": 1.93, - "learning_rate": 5.94885172867524e-07, - "loss": 0.6006, - "step": 75354 - }, - { - "epoch": 1.93, - "learning_rate": 5.948598748725886e-07, - "loss": 0.4858, - "step": 75355 - }, - { - "epoch": 1.93, - "learning_rate": 5.948345771878496e-07, - "loss": 0.7812, - "step": 75356 - }, - { - "epoch": 1.93, - "learning_rate": 5.948092798133275e-07, - "loss": 0.7454, - "step": 75357 - }, - { - "epoch": 1.93, - "learning_rate": 5.947839827490412e-07, - "loss": 0.6089, - "step": 75358 - }, - { - "epoch": 1.93, - "learning_rate": 5.947586859950102e-07, - "loss": 0.3855, - "step": 75359 - }, - { - "epoch": 1.93, - "learning_rate": 5.947333895512537e-07, - "loss": 0.6523, - "step": 75360 - }, - { - "epoch": 1.93, - "learning_rate": 5.947080934177915e-07, - "loss": 0.4526, - "step": 75361 - }, - { - "epoch": 1.93, - "learning_rate": 5.946827975946425e-07, - "loss": 0.4893, - "step": 75362 - }, - { - "epoch": 1.93, - "learning_rate": 5.946575020818263e-07, - "loss": 0.6333, - "step": 75363 - }, - { - "epoch": 1.93, - "learning_rate": 5.946322068793623e-07, - "loss": 0.4192, - "step": 75364 - }, - { - "epoch": 1.93, - "learning_rate": 5.946069119872696e-07, - "loss": 0.6611, - "step": 75365 - }, - { - "epoch": 1.93, - "learning_rate": 5.945816174055679e-07, - "loss": 0.6577, - "step": 75366 - }, - { - "epoch": 1.93, - "learning_rate": 5.945563231342763e-07, - "loss": 0.6714, - "step": 75367 - }, - { - "epoch": 1.93, - "learning_rate": 5.945310291734142e-07, - "loss": 0.6553, - "step": 75368 - }, - { - "epoch": 1.93, - "learning_rate": 5.945057355230011e-07, - "loss": 0.5605, - "step": 75369 - }, - { - "epoch": 1.93, - "learning_rate": 5.944804421830565e-07, - "loss": 0.7246, - "step": 75370 - }, - { - "epoch": 1.93, - "learning_rate": 5.944551491535993e-07, - "loss": 0.6509, - "step": 75371 - }, - { - "epoch": 1.93, - "learning_rate": 5.944298564346493e-07, - "loss": 0.54, - "step": 75372 - }, - { - "epoch": 1.93, - "learning_rate": 5.944045640262256e-07, - "loss": 0.4839, - "step": 75373 - }, - { - "epoch": 1.93, - "learning_rate": 5.943792719283483e-07, - "loss": 0.5264, - "step": 75374 - }, - { - "epoch": 1.93, - "learning_rate": 5.943539801410354e-07, - "loss": 0.791, - "step": 75375 - }, - { - "epoch": 1.93, - "learning_rate": 5.943286886643072e-07, - "loss": 0.6343, - "step": 75376 - }, - { - "epoch": 1.93, - "learning_rate": 5.94303397498183e-07, - "loss": 0.4971, - "step": 75377 - }, - { - "epoch": 1.93, - "learning_rate": 5.942781066426819e-07, - "loss": 0.6309, - "step": 75378 - }, - { - "epoch": 1.93, - "learning_rate": 5.942528160978233e-07, - "loss": 0.7192, - "step": 75379 - }, - { - "epoch": 1.93, - "learning_rate": 5.942275258636269e-07, - "loss": 0.5439, - "step": 75380 - }, - { - "epoch": 1.93, - "learning_rate": 5.942022359401115e-07, - "loss": 0.5352, - "step": 75381 - }, - { - "epoch": 1.93, - "learning_rate": 5.941769463272971e-07, - "loss": 0.6445, - "step": 75382 - }, - { - "epoch": 1.93, - "learning_rate": 5.941516570252026e-07, - "loss": 0.5332, - "step": 75383 - }, - { - "epoch": 1.93, - "learning_rate": 5.941263680338477e-07, - "loss": 0.5938, - "step": 75384 - }, - { - "epoch": 1.93, - "learning_rate": 5.941010793532517e-07, - "loss": 0.4448, - "step": 75385 - }, - { - "epoch": 1.93, - "learning_rate": 5.940757909834333e-07, - "loss": 0.6201, - "step": 75386 - }, - { - "epoch": 1.93, - "learning_rate": 5.940505029244129e-07, - "loss": 0.6582, - "step": 75387 - }, - { - "epoch": 1.93, - "learning_rate": 5.940252151762088e-07, - "loss": 0.6377, - "step": 75388 - }, - { - "epoch": 1.93, - "learning_rate": 5.939999277388414e-07, - "loss": 0.6531, - "step": 75389 - }, - { - "epoch": 1.93, - "learning_rate": 5.939746406123294e-07, - "loss": 0.7334, - "step": 75390 - }, - { - "epoch": 1.93, - "learning_rate": 5.939493537966924e-07, - "loss": 0.4561, - "step": 75391 - }, - { - "epoch": 1.93, - "learning_rate": 5.939240672919499e-07, - "loss": 0.6855, - "step": 75392 - }, - { - "epoch": 1.93, - "learning_rate": 5.938987810981208e-07, - "loss": 0.6836, - "step": 75393 - }, - { - "epoch": 1.93, - "learning_rate": 5.938734952152251e-07, - "loss": 0.6616, - "step": 75394 - }, - { - "epoch": 1.93, - "learning_rate": 5.938482096432815e-07, - "loss": 0.6719, - "step": 75395 - }, - { - "epoch": 1.93, - "learning_rate": 5.938229243823097e-07, - "loss": 0.8438, - "step": 75396 - }, - { - "epoch": 1.93, - "learning_rate": 5.937976394323289e-07, - "loss": 0.709, - "step": 75397 - }, - { - "epoch": 1.93, - "learning_rate": 5.937723547933585e-07, - "loss": 0.7695, - "step": 75398 - }, - { - "epoch": 1.93, - "learning_rate": 5.937470704654181e-07, - "loss": 0.6152, - "step": 75399 - }, - { - "epoch": 1.93, - "learning_rate": 5.937217864485268e-07, - "loss": 0.6177, - "step": 75400 - }, - { - "epoch": 1.93, - "learning_rate": 5.936965027427042e-07, - "loss": 0.71, - "step": 75401 - }, - { - "epoch": 1.93, - "learning_rate": 5.936712193479693e-07, - "loss": 0.6699, - "step": 75402 - }, - { - "epoch": 1.93, - "learning_rate": 5.936459362643418e-07, - "loss": 0.585, - "step": 75403 - }, - { - "epoch": 1.93, - "learning_rate": 5.936206534918411e-07, - "loss": 0.8301, - "step": 75404 - }, - { - "epoch": 1.93, - "learning_rate": 5.935953710304862e-07, - "loss": 0.6719, - "step": 75405 - }, - { - "epoch": 1.93, - "learning_rate": 5.935700888802966e-07, - "loss": 0.6753, - "step": 75406 - }, - { - "epoch": 1.93, - "learning_rate": 5.935448070412916e-07, - "loss": 0.6099, - "step": 75407 - }, - { - "epoch": 1.93, - "learning_rate": 5.935195255134909e-07, - "loss": 0.7256, - "step": 75408 - }, - { - "epoch": 1.93, - "learning_rate": 5.934942442969135e-07, - "loss": 0.7119, - "step": 75409 - }, - { - "epoch": 1.93, - "learning_rate": 5.934689633915785e-07, - "loss": 0.4937, - "step": 75410 - }, - { - "epoch": 1.93, - "learning_rate": 5.934436827975063e-07, - "loss": 0.5542, - "step": 75411 - }, - { - "epoch": 1.93, - "learning_rate": 5.934184025147151e-07, - "loss": 0.6313, - "step": 75412 - }, - { - "epoch": 1.93, - "learning_rate": 5.933931225432248e-07, - "loss": 0.751, - "step": 75413 - }, - { - "epoch": 1.93, - "learning_rate": 5.933678428830551e-07, - "loss": 0.5435, - "step": 75414 - }, - { - "epoch": 1.93, - "learning_rate": 5.933425635342244e-07, - "loss": 0.5469, - "step": 75415 - }, - { - "epoch": 1.93, - "learning_rate": 5.933172844967529e-07, - "loss": 0.7607, - "step": 75416 - }, - { - "epoch": 1.93, - "learning_rate": 5.932920057706594e-07, - "loss": 0.5547, - "step": 75417 - }, - { - "epoch": 1.93, - "learning_rate": 5.932667273559638e-07, - "loss": 0.6562, - "step": 75418 - }, - { - "epoch": 1.93, - "learning_rate": 5.93241449252685e-07, - "loss": 0.7129, - "step": 75419 - }, - { - "epoch": 1.93, - "learning_rate": 5.932161714608426e-07, - "loss": 0.5537, - "step": 75420 - }, - { - "epoch": 1.93, - "learning_rate": 5.931908939804557e-07, - "loss": 0.6484, - "step": 75421 - }, - { - "epoch": 1.93, - "learning_rate": 5.93165616811544e-07, - "loss": 0.6182, - "step": 75422 - }, - { - "epoch": 1.93, - "learning_rate": 5.931403399541265e-07, - "loss": 0.7803, - "step": 75423 - }, - { - "epoch": 1.93, - "learning_rate": 5.931150634082232e-07, - "loss": 0.623, - "step": 75424 - }, - { - "epoch": 1.93, - "learning_rate": 5.930897871738528e-07, - "loss": 0.7676, - "step": 75425 - }, - { - "epoch": 1.93, - "learning_rate": 5.930645112510346e-07, - "loss": 0.432, - "step": 75426 - }, - { - "epoch": 1.93, - "learning_rate": 5.930392356397882e-07, - "loss": 0.5073, - "step": 75427 - }, - { - "epoch": 1.93, - "learning_rate": 5.930139603401331e-07, - "loss": 0.6304, - "step": 75428 - }, - { - "epoch": 1.93, - "learning_rate": 5.929886853520882e-07, - "loss": 0.6072, - "step": 75429 - }, - { - "epoch": 1.93, - "learning_rate": 5.929634106756735e-07, - "loss": 0.6274, - "step": 75430 - }, - { - "epoch": 1.93, - "learning_rate": 5.929381363109078e-07, - "loss": 0.8145, - "step": 75431 - }, - { - "epoch": 1.93, - "learning_rate": 5.929128622578108e-07, - "loss": 0.7041, - "step": 75432 - }, - { - "epoch": 1.93, - "learning_rate": 5.928875885164015e-07, - "loss": 0.5996, - "step": 75433 - }, - { - "epoch": 1.93, - "learning_rate": 5.928623150866998e-07, - "loss": 0.6348, - "step": 75434 - }, - { - "epoch": 1.93, - "learning_rate": 5.928370419687247e-07, - "loss": 0.6211, - "step": 75435 - }, - { - "epoch": 1.93, - "learning_rate": 5.928117691624952e-07, - "loss": 0.7129, - "step": 75436 - }, - { - "epoch": 1.93, - "learning_rate": 5.927864966680312e-07, - "loss": 0.6895, - "step": 75437 - }, - { - "epoch": 1.93, - "learning_rate": 5.927612244853517e-07, - "loss": 0.522, - "step": 75438 - }, - { - "epoch": 1.93, - "learning_rate": 5.927359526144764e-07, - "loss": 0.5024, - "step": 75439 - }, - { - "epoch": 1.93, - "learning_rate": 5.927106810554241e-07, - "loss": 0.7041, - "step": 75440 - }, - { - "epoch": 1.93, - "learning_rate": 5.926854098082149e-07, - "loss": 0.6187, - "step": 75441 - }, - { - "epoch": 1.93, - "learning_rate": 5.926601388728675e-07, - "loss": 0.6719, - "step": 75442 - }, - { - "epoch": 1.93, - "learning_rate": 5.926348682494018e-07, - "loss": 0.6436, - "step": 75443 - }, - { - "epoch": 1.93, - "learning_rate": 5.926095979378369e-07, - "loss": 0.6074, - "step": 75444 - }, - { - "epoch": 1.93, - "learning_rate": 5.92584327938192e-07, - "loss": 0.5903, - "step": 75445 - }, - { - "epoch": 1.93, - "learning_rate": 5.925590582504863e-07, - "loss": 0.5894, - "step": 75446 - }, - { - "epoch": 1.93, - "learning_rate": 5.925337888747395e-07, - "loss": 0.6343, - "step": 75447 - }, - { - "epoch": 1.93, - "learning_rate": 5.925085198109708e-07, - "loss": 0.5386, - "step": 75448 - }, - { - "epoch": 1.93, - "learning_rate": 5.924832510591996e-07, - "loss": 0.6875, - "step": 75449 - }, - { - "epoch": 1.93, - "learning_rate": 5.924579826194451e-07, - "loss": 0.7295, - "step": 75450 - }, - { - "epoch": 1.93, - "learning_rate": 5.924327144917272e-07, - "loss": 0.5205, - "step": 75451 - }, - { - "epoch": 1.93, - "learning_rate": 5.924074466760645e-07, - "loss": 0.6812, - "step": 75452 - }, - { - "epoch": 1.93, - "learning_rate": 5.923821791724767e-07, - "loss": 0.626, - "step": 75453 - }, - { - "epoch": 1.93, - "learning_rate": 5.923569119809835e-07, - "loss": 0.668, - "step": 75454 - }, - { - "epoch": 1.93, - "learning_rate": 5.923316451016033e-07, - "loss": 0.537, - "step": 75455 - }, - { - "epoch": 1.93, - "learning_rate": 5.923063785343565e-07, - "loss": 0.592, - "step": 75456 - }, - { - "epoch": 1.93, - "learning_rate": 5.922811122792617e-07, - "loss": 0.6973, - "step": 75457 - }, - { - "epoch": 1.93, - "learning_rate": 5.922558463363385e-07, - "loss": 0.498, - "step": 75458 - }, - { - "epoch": 1.93, - "learning_rate": 5.922305807056063e-07, - "loss": 0.7021, - "step": 75459 - }, - { - "epoch": 1.93, - "learning_rate": 5.922053153870842e-07, - "loss": 0.4595, - "step": 75460 - }, - { - "epoch": 1.93, - "learning_rate": 5.921800503807919e-07, - "loss": 0.6152, - "step": 75461 - }, - { - "epoch": 1.93, - "learning_rate": 5.921547856867488e-07, - "loss": 0.6025, - "step": 75462 - }, - { - "epoch": 1.93, - "learning_rate": 5.921295213049736e-07, - "loss": 0.6279, - "step": 75463 - }, - { - "epoch": 1.93, - "learning_rate": 5.921042572354868e-07, - "loss": 0.4834, - "step": 75464 - }, - { - "epoch": 1.93, - "learning_rate": 5.920789934783063e-07, - "loss": 0.6338, - "step": 75465 - }, - { - "epoch": 1.93, - "learning_rate": 5.920537300334526e-07, - "loss": 0.5503, - "step": 75466 - }, - { - "epoch": 1.93, - "learning_rate": 5.920284669009442e-07, - "loss": 0.6436, - "step": 75467 - }, - { - "epoch": 1.93, - "learning_rate": 5.920032040808012e-07, - "loss": 0.6201, - "step": 75468 - }, - { - "epoch": 1.93, - "learning_rate": 5.919779415730422e-07, - "loss": 0.666, - "step": 75469 - }, - { - "epoch": 1.93, - "learning_rate": 5.919526793776872e-07, - "loss": 0.7881, - "step": 75470 - }, - { - "epoch": 1.93, - "learning_rate": 5.91927417494755e-07, - "loss": 0.6562, - "step": 75471 - }, - { - "epoch": 1.93, - "learning_rate": 5.919021559242656e-07, - "loss": 0.6904, - "step": 75472 - }, - { - "epoch": 1.93, - "learning_rate": 5.918768946662377e-07, - "loss": 0.585, - "step": 75473 - }, - { - "epoch": 1.93, - "learning_rate": 5.918516337206912e-07, - "loss": 0.6187, - "step": 75474 - }, - { - "epoch": 1.93, - "learning_rate": 5.91826373087645e-07, - "loss": 0.5488, - "step": 75475 - }, - { - "epoch": 1.93, - "learning_rate": 5.918011127671184e-07, - "loss": 0.5615, - "step": 75476 - }, - { - "epoch": 1.93, - "learning_rate": 5.91775852759131e-07, - "loss": 0.5269, - "step": 75477 - }, - { - "epoch": 1.93, - "learning_rate": 5.91750593063702e-07, - "loss": 0.6807, - "step": 75478 - }, - { - "epoch": 1.93, - "learning_rate": 5.91725333680851e-07, - "loss": 0.585, - "step": 75479 - }, - { - "epoch": 1.93, - "learning_rate": 5.917000746105968e-07, - "loss": 0.7412, - "step": 75480 - }, - { - "epoch": 1.93, - "learning_rate": 5.916748158529594e-07, - "loss": 0.5046, - "step": 75481 - }, - { - "epoch": 1.93, - "learning_rate": 5.916495574079577e-07, - "loss": 0.6528, - "step": 75482 - }, - { - "epoch": 1.93, - "learning_rate": 5.916242992756111e-07, - "loss": 0.6934, - "step": 75483 - }, - { - "epoch": 1.93, - "learning_rate": 5.915990414559393e-07, - "loss": 0.457, - "step": 75484 - }, - { - "epoch": 1.93, - "learning_rate": 5.915737839489611e-07, - "loss": 0.7168, - "step": 75485 - }, - { - "epoch": 1.93, - "learning_rate": 5.91548526754696e-07, - "loss": 0.6631, - "step": 75486 - }, - { - "epoch": 1.93, - "learning_rate": 5.915232698731636e-07, - "loss": 0.5635, - "step": 75487 - }, - { - "epoch": 1.93, - "learning_rate": 5.914980133043827e-07, - "loss": 0.8467, - "step": 75488 - }, - { - "epoch": 1.93, - "learning_rate": 5.914727570483732e-07, - "loss": 0.5143, - "step": 75489 - }, - { - "epoch": 1.93, - "learning_rate": 5.914475011051543e-07, - "loss": 0.6628, - "step": 75490 - }, - { - "epoch": 1.93, - "learning_rate": 5.914222454747453e-07, - "loss": 0.5273, - "step": 75491 - }, - { - "epoch": 1.93, - "learning_rate": 5.913969901571651e-07, - "loss": 0.6484, - "step": 75492 - }, - { - "epoch": 1.93, - "learning_rate": 5.913717351524339e-07, - "loss": 0.5977, - "step": 75493 - }, - { - "epoch": 1.93, - "learning_rate": 5.913464804605708e-07, - "loss": 0.6045, - "step": 75494 - }, - { - "epoch": 1.93, - "learning_rate": 5.913212260815943e-07, - "loss": 0.4956, - "step": 75495 - }, - { - "epoch": 1.94, - "learning_rate": 5.912959720155246e-07, - "loss": 0.624, - "step": 75496 - }, - { - "epoch": 1.94, - "learning_rate": 5.912707182623807e-07, - "loss": 0.7451, - "step": 75497 - }, - { - "epoch": 1.94, - "learning_rate": 5.912454648221821e-07, - "loss": 0.603, - "step": 75498 - }, - { - "epoch": 1.94, - "learning_rate": 5.912202116949481e-07, - "loss": 0.7007, - "step": 75499 - }, - { - "epoch": 1.94, - "learning_rate": 5.911949588806977e-07, - "loss": 0.5571, - "step": 75500 - }, - { - "epoch": 1.94, - "learning_rate": 5.911697063794509e-07, - "loss": 0.6597, - "step": 75501 - }, - { - "epoch": 1.94, - "learning_rate": 5.911444541912263e-07, - "loss": 0.5649, - "step": 75502 - }, - { - "epoch": 1.94, - "learning_rate": 5.911192023160438e-07, - "loss": 0.6353, - "step": 75503 - }, - { - "epoch": 1.94, - "learning_rate": 5.910939507539229e-07, - "loss": 0.5498, - "step": 75504 - }, - { - "epoch": 1.94, - "learning_rate": 5.91068699504882e-07, - "loss": 0.6504, - "step": 75505 - }, - { - "epoch": 1.94, - "learning_rate": 5.910434485689413e-07, - "loss": 0.6533, - "step": 75506 - }, - { - "epoch": 1.94, - "learning_rate": 5.910181979461195e-07, - "loss": 0.6982, - "step": 75507 - }, - { - "epoch": 1.94, - "learning_rate": 5.909929476364366e-07, - "loss": 0.7148, - "step": 75508 - }, - { - "epoch": 1.94, - "learning_rate": 5.909676976399111e-07, - "loss": 0.6094, - "step": 75509 - }, - { - "epoch": 1.94, - "learning_rate": 5.909424479565635e-07, - "loss": 0.7197, - "step": 75510 - }, - { - "epoch": 1.94, - "learning_rate": 5.909171985864119e-07, - "loss": 0.5942, - "step": 75511 - }, - { - "epoch": 1.94, - "learning_rate": 5.908919495294764e-07, - "loss": 0.5708, - "step": 75512 - }, - { - "epoch": 1.94, - "learning_rate": 5.908667007857761e-07, - "loss": 0.6123, - "step": 75513 - }, - { - "epoch": 1.94, - "learning_rate": 5.908414523553307e-07, - "loss": 0.6201, - "step": 75514 - }, - { - "epoch": 1.94, - "learning_rate": 5.908162042381588e-07, - "loss": 0.6597, - "step": 75515 - }, - { - "epoch": 1.94, - "learning_rate": 5.907909564342803e-07, - "loss": 0.5527, - "step": 75516 - }, - { - "epoch": 1.94, - "learning_rate": 5.907657089437142e-07, - "loss": 0.7188, - "step": 75517 - }, - { - "epoch": 1.94, - "learning_rate": 5.9074046176648e-07, - "loss": 0.6191, - "step": 75518 - }, - { - "epoch": 1.94, - "learning_rate": 5.907152149025969e-07, - "loss": 0.7627, - "step": 75519 - }, - { - "epoch": 1.94, - "learning_rate": 5.906899683520846e-07, - "loss": 0.4459, - "step": 75520 - }, - { - "epoch": 1.94, - "learning_rate": 5.906647221149619e-07, - "loss": 0.5859, - "step": 75521 - }, - { - "epoch": 1.94, - "learning_rate": 5.906394761912487e-07, - "loss": 0.6416, - "step": 75522 - }, - { - "epoch": 1.94, - "learning_rate": 5.906142305809638e-07, - "loss": 0.5591, - "step": 75523 - }, - { - "epoch": 1.94, - "learning_rate": 5.90588985284127e-07, - "loss": 0.5087, - "step": 75524 - }, - { - "epoch": 1.94, - "learning_rate": 5.905637403007572e-07, - "loss": 0.5693, - "step": 75525 - }, - { - "epoch": 1.94, - "learning_rate": 5.905384956308738e-07, - "loss": 0.6543, - "step": 75526 - }, - { - "epoch": 1.94, - "learning_rate": 5.905132512744966e-07, - "loss": 0.5, - "step": 75527 - }, - { - "epoch": 1.94, - "learning_rate": 5.904880072316443e-07, - "loss": 0.5913, - "step": 75528 - }, - { - "epoch": 1.94, - "learning_rate": 5.904627635023366e-07, - "loss": 0.543, - "step": 75529 - }, - { - "epoch": 1.94, - "learning_rate": 5.904375200865925e-07, - "loss": 0.5874, - "step": 75530 - }, - { - "epoch": 1.94, - "learning_rate": 5.904122769844318e-07, - "loss": 0.6514, - "step": 75531 - }, - { - "epoch": 1.94, - "learning_rate": 5.903870341958735e-07, - "loss": 0.708, - "step": 75532 - }, - { - "epoch": 1.94, - "learning_rate": 5.903617917209371e-07, - "loss": 0.5967, - "step": 75533 - }, - { - "epoch": 1.94, - "learning_rate": 5.903365495596421e-07, - "loss": 0.3521, - "step": 75534 - }, - { - "epoch": 1.94, - "learning_rate": 5.903113077120073e-07, - "loss": 0.5946, - "step": 75535 - }, - { - "epoch": 1.94, - "learning_rate": 5.902860661780522e-07, - "loss": 0.6641, - "step": 75536 - }, - { - "epoch": 1.94, - "learning_rate": 5.902608249577962e-07, - "loss": 0.7148, - "step": 75537 - }, - { - "epoch": 1.94, - "learning_rate": 5.902355840512587e-07, - "loss": 0.6973, - "step": 75538 - }, - { - "epoch": 1.94, - "learning_rate": 5.902103434584591e-07, - "loss": 0.7881, - "step": 75539 - }, - { - "epoch": 1.94, - "learning_rate": 5.901851031794162e-07, - "loss": 0.9854, - "step": 75540 - }, - { - "epoch": 1.94, - "learning_rate": 5.901598632141502e-07, - "loss": 0.481, - "step": 75541 - }, - { - "epoch": 1.94, - "learning_rate": 5.901346235626796e-07, - "loss": 0.4386, - "step": 75542 - }, - { - "epoch": 1.94, - "learning_rate": 5.901093842250244e-07, - "loss": 0.8652, - "step": 75543 - }, - { - "epoch": 1.94, - "learning_rate": 5.900841452012037e-07, - "loss": 0.6348, - "step": 75544 - }, - { - "epoch": 1.94, - "learning_rate": 5.900589064912362e-07, - "loss": 0.6099, - "step": 75545 - }, - { - "epoch": 1.94, - "learning_rate": 5.900336680951421e-07, - "loss": 0.6265, - "step": 75546 - }, - { - "epoch": 1.94, - "learning_rate": 5.900084300129402e-07, - "loss": 0.7178, - "step": 75547 - }, - { - "epoch": 1.94, - "learning_rate": 5.899831922446501e-07, - "loss": 0.7217, - "step": 75548 - }, - { - "epoch": 1.94, - "learning_rate": 5.899579547902909e-07, - "loss": 0.585, - "step": 75549 - }, - { - "epoch": 1.94, - "learning_rate": 5.899327176498822e-07, - "loss": 0.6309, - "step": 75550 - }, - { - "epoch": 1.94, - "learning_rate": 5.89907480823443e-07, - "loss": 0.5347, - "step": 75551 - }, - { - "epoch": 1.94, - "learning_rate": 5.898822443109928e-07, - "loss": 0.4399, - "step": 75552 - }, - { - "epoch": 1.94, - "learning_rate": 5.89857008112551e-07, - "loss": 0.5317, - "step": 75553 - }, - { - "epoch": 1.94, - "learning_rate": 5.898317722281372e-07, - "loss": 0.6201, - "step": 75554 - }, - { - "epoch": 1.94, - "learning_rate": 5.898065366577698e-07, - "loss": 0.6797, - "step": 75555 - }, - { - "epoch": 1.94, - "learning_rate": 5.897813014014689e-07, - "loss": 0.7339, - "step": 75556 - }, - { - "epoch": 1.94, - "learning_rate": 5.897560664592535e-07, - "loss": 0.6602, - "step": 75557 - }, - { - "epoch": 1.94, - "learning_rate": 5.897308318311431e-07, - "loss": 0.5291, - "step": 75558 - }, - { - "epoch": 1.94, - "learning_rate": 5.897055975171567e-07, - "loss": 0.4624, - "step": 75559 - }, - { - "epoch": 1.94, - "learning_rate": 5.896803635173142e-07, - "loss": 0.6367, - "step": 75560 - }, - { - "epoch": 1.94, - "learning_rate": 5.896551298316342e-07, - "loss": 0.4941, - "step": 75561 - }, - { - "epoch": 1.94, - "learning_rate": 5.896298964601367e-07, - "loss": 0.6074, - "step": 75562 - }, - { - "epoch": 1.94, - "learning_rate": 5.896046634028404e-07, - "loss": 0.6328, - "step": 75563 - }, - { - "epoch": 1.94, - "learning_rate": 5.895794306597656e-07, - "loss": 0.605, - "step": 75564 - }, - { - "epoch": 1.94, - "learning_rate": 5.895541982309305e-07, - "loss": 0.6157, - "step": 75565 - }, - { - "epoch": 1.94, - "learning_rate": 5.895289661163549e-07, - "loss": 0.751, - "step": 75566 - }, - { - "epoch": 1.94, - "learning_rate": 5.895037343160582e-07, - "loss": 0.5903, - "step": 75567 - }, - { - "epoch": 1.94, - "learning_rate": 5.894785028300593e-07, - "loss": 0.326, - "step": 75568 - }, - { - "epoch": 1.94, - "learning_rate": 5.894532716583782e-07, - "loss": 0.7617, - "step": 75569 - }, - { - "epoch": 1.94, - "learning_rate": 5.894280408010334e-07, - "loss": 0.6313, - "step": 75570 - }, - { - "epoch": 1.94, - "learning_rate": 5.894028102580451e-07, - "loss": 0.666, - "step": 75571 - }, - { - "epoch": 1.94, - "learning_rate": 5.893775800294323e-07, - "loss": 0.5742, - "step": 75572 - }, - { - "epoch": 1.94, - "learning_rate": 5.893523501152138e-07, - "loss": 0.4209, - "step": 75573 - }, - { - "epoch": 1.94, - "learning_rate": 5.893271205154097e-07, - "loss": 0.4971, - "step": 75574 - }, - { - "epoch": 1.94, - "learning_rate": 5.893018912300389e-07, - "loss": 0.5464, - "step": 75575 - }, - { - "epoch": 1.94, - "learning_rate": 5.892766622591205e-07, - "loss": 0.626, - "step": 75576 - }, - { - "epoch": 1.94, - "learning_rate": 5.892514336026741e-07, - "loss": 0.6094, - "step": 75577 - }, - { - "epoch": 1.94, - "learning_rate": 5.89226205260719e-07, - "loss": 0.6895, - "step": 75578 - }, - { - "epoch": 1.94, - "learning_rate": 5.892009772332746e-07, - "loss": 0.6377, - "step": 75579 - }, - { - "epoch": 1.94, - "learning_rate": 5.8917574952036e-07, - "loss": 0.5315, - "step": 75580 - }, - { - "epoch": 1.94, - "learning_rate": 5.891505221219948e-07, - "loss": 0.6182, - "step": 75581 - }, - { - "epoch": 1.94, - "learning_rate": 5.89125295038198e-07, - "loss": 0.5601, - "step": 75582 - }, - { - "epoch": 1.94, - "learning_rate": 5.891000682689892e-07, - "loss": 0.606, - "step": 75583 - }, - { - "epoch": 1.94, - "learning_rate": 5.890748418143878e-07, - "loss": 0.6733, - "step": 75584 - }, - { - "epoch": 1.94, - "learning_rate": 5.890496156744125e-07, - "loss": 0.6377, - "step": 75585 - }, - { - "epoch": 1.94, - "learning_rate": 5.890243898490832e-07, - "loss": 0.5393, - "step": 75586 - }, - { - "epoch": 1.94, - "learning_rate": 5.889991643384189e-07, - "loss": 0.6924, - "step": 75587 - }, - { - "epoch": 1.94, - "learning_rate": 5.889739391424391e-07, - "loss": 0.7476, - "step": 75588 - }, - { - "epoch": 1.94, - "learning_rate": 5.889487142611631e-07, - "loss": 0.5605, - "step": 75589 - }, - { - "epoch": 1.94, - "learning_rate": 5.889234896946101e-07, - "loss": 0.5081, - "step": 75590 - }, - { - "epoch": 1.94, - "learning_rate": 5.888982654427996e-07, - "loss": 0.667, - "step": 75591 - }, - { - "epoch": 1.94, - "learning_rate": 5.888730415057506e-07, - "loss": 0.6191, - "step": 75592 - }, - { - "epoch": 1.94, - "learning_rate": 5.888478178834828e-07, - "loss": 0.7207, - "step": 75593 - }, - { - "epoch": 1.94, - "learning_rate": 5.888225945760154e-07, - "loss": 0.4307, - "step": 75594 - }, - { - "epoch": 1.94, - "learning_rate": 5.887973715833674e-07, - "loss": 0.4771, - "step": 75595 - }, - { - "epoch": 1.94, - "learning_rate": 5.887721489055586e-07, - "loss": 0.666, - "step": 75596 - }, - { - "epoch": 1.94, - "learning_rate": 5.887469265426078e-07, - "loss": 0.5132, - "step": 75597 - }, - { - "epoch": 1.94, - "learning_rate": 5.887217044945346e-07, - "loss": 0.6064, - "step": 75598 - }, - { - "epoch": 1.94, - "learning_rate": 5.886964827613582e-07, - "loss": 0.6221, - "step": 75599 - }, - { - "epoch": 1.94, - "learning_rate": 5.886712613430982e-07, - "loss": 0.832, - "step": 75600 - }, - { - "epoch": 1.94, - "learning_rate": 5.886460402397735e-07, - "loss": 0.6021, - "step": 75601 - }, - { - "epoch": 1.94, - "learning_rate": 5.886208194514038e-07, - "loss": 0.647, - "step": 75602 - }, - { - "epoch": 1.94, - "learning_rate": 5.88595598978008e-07, - "loss": 0.592, - "step": 75603 - }, - { - "epoch": 1.94, - "learning_rate": 5.885703788196061e-07, - "loss": 0.6802, - "step": 75604 - }, - { - "epoch": 1.94, - "learning_rate": 5.885451589762167e-07, - "loss": 0.6216, - "step": 75605 - }, - { - "epoch": 1.94, - "learning_rate": 5.885199394478591e-07, - "loss": 0.6528, - "step": 75606 - }, - { - "epoch": 1.94, - "learning_rate": 5.884947202345531e-07, - "loss": 0.7393, - "step": 75607 - }, - { - "epoch": 1.94, - "learning_rate": 5.884695013363179e-07, - "loss": 0.7471, - "step": 75608 - }, - { - "epoch": 1.94, - "learning_rate": 5.884442827531723e-07, - "loss": 0.5532, - "step": 75609 - }, - { - "epoch": 1.94, - "learning_rate": 5.884190644851364e-07, - "loss": 0.6636, - "step": 75610 - }, - { - "epoch": 1.94, - "learning_rate": 5.883938465322287e-07, - "loss": 0.5857, - "step": 75611 - }, - { - "epoch": 1.94, - "learning_rate": 5.883686288944692e-07, - "loss": 0.6045, - "step": 75612 - }, - { - "epoch": 1.94, - "learning_rate": 5.883434115718766e-07, - "loss": 0.5723, - "step": 75613 - }, - { - "epoch": 1.94, - "learning_rate": 5.883181945644711e-07, - "loss": 0.6313, - "step": 75614 - }, - { - "epoch": 1.94, - "learning_rate": 5.88292977872271e-07, - "loss": 0.7305, - "step": 75615 - }, - { - "epoch": 1.94, - "learning_rate": 5.88267761495296e-07, - "loss": 0.7715, - "step": 75616 - }, - { - "epoch": 1.94, - "learning_rate": 5.882425454335656e-07, - "loss": 0.5786, - "step": 75617 - }, - { - "epoch": 1.94, - "learning_rate": 5.882173296870987e-07, - "loss": 0.6338, - "step": 75618 - }, - { - "epoch": 1.94, - "learning_rate": 5.881921142559151e-07, - "loss": 0.5806, - "step": 75619 - }, - { - "epoch": 1.94, - "learning_rate": 5.881668991400337e-07, - "loss": 0.6201, - "step": 75620 - }, - { - "epoch": 1.94, - "learning_rate": 5.881416843394742e-07, - "loss": 0.6992, - "step": 75621 - }, - { - "epoch": 1.94, - "learning_rate": 5.881164698542553e-07, - "loss": 0.7959, - "step": 75622 - }, - { - "epoch": 1.94, - "learning_rate": 5.880912556843971e-07, - "loss": 0.5188, - "step": 75623 - }, - { - "epoch": 1.94, - "learning_rate": 5.880660418299186e-07, - "loss": 0.54, - "step": 75624 - }, - { - "epoch": 1.94, - "learning_rate": 5.880408282908388e-07, - "loss": 0.4346, - "step": 75625 - }, - { - "epoch": 1.94, - "learning_rate": 5.880156150671769e-07, - "loss": 0.6416, - "step": 75626 - }, - { - "epoch": 1.94, - "learning_rate": 5.879904021589528e-07, - "loss": 0.5562, - "step": 75627 - }, - { - "epoch": 1.94, - "learning_rate": 5.879651895661853e-07, - "loss": 0.7139, - "step": 75628 - }, - { - "epoch": 1.94, - "learning_rate": 5.87939977288894e-07, - "loss": 0.707, - "step": 75629 - }, - { - "epoch": 1.94, - "learning_rate": 5.879147653270981e-07, - "loss": 0.5605, - "step": 75630 - }, - { - "epoch": 1.94, - "learning_rate": 5.878895536808169e-07, - "loss": 0.7021, - "step": 75631 - }, - { - "epoch": 1.94, - "learning_rate": 5.878643423500698e-07, - "loss": 0.6943, - "step": 75632 - }, - { - "epoch": 1.94, - "learning_rate": 5.878391313348759e-07, - "loss": 0.7656, - "step": 75633 - }, - { - "epoch": 1.94, - "learning_rate": 5.87813920635255e-07, - "loss": 0.6367, - "step": 75634 - }, - { - "epoch": 1.94, - "learning_rate": 5.877887102512256e-07, - "loss": 0.5537, - "step": 75635 - }, - { - "epoch": 1.94, - "learning_rate": 5.877635001828077e-07, - "loss": 0.6504, - "step": 75636 - }, - { - "epoch": 1.94, - "learning_rate": 5.877382904300201e-07, - "loss": 0.5293, - "step": 75637 - }, - { - "epoch": 1.94, - "learning_rate": 5.877130809928824e-07, - "loss": 0.6362, - "step": 75638 - }, - { - "epoch": 1.94, - "learning_rate": 5.876878718714138e-07, - "loss": 0.6606, - "step": 75639 - }, - { - "epoch": 1.94, - "learning_rate": 5.876626630656338e-07, - "loss": 0.5034, - "step": 75640 - }, - { - "epoch": 1.94, - "learning_rate": 5.876374545755613e-07, - "loss": 0.5845, - "step": 75641 - }, - { - "epoch": 1.94, - "learning_rate": 5.876122464012161e-07, - "loss": 0.7178, - "step": 75642 - }, - { - "epoch": 1.94, - "learning_rate": 5.875870385426169e-07, - "loss": 0.582, - "step": 75643 - }, - { - "epoch": 1.94, - "learning_rate": 5.87561830999784e-07, - "loss": 0.7007, - "step": 75644 - }, - { - "epoch": 1.94, - "learning_rate": 5.875366237727355e-07, - "loss": 0.6543, - "step": 75645 - }, - { - "epoch": 1.94, - "learning_rate": 5.875114168614914e-07, - "loss": 0.5098, - "step": 75646 - }, - { - "epoch": 1.94, - "learning_rate": 5.874862102660707e-07, - "loss": 0.5845, - "step": 75647 - }, - { - "epoch": 1.94, - "learning_rate": 5.874610039864931e-07, - "loss": 0.6787, - "step": 75648 - }, - { - "epoch": 1.94, - "learning_rate": 5.874357980227773e-07, - "loss": 0.6631, - "step": 75649 - }, - { - "epoch": 1.94, - "learning_rate": 5.874105923749431e-07, - "loss": 0.5332, - "step": 75650 - }, - { - "epoch": 1.94, - "learning_rate": 5.873853870430097e-07, - "loss": 0.7334, - "step": 75651 - }, - { - "epoch": 1.94, - "learning_rate": 5.873601820269962e-07, - "loss": 0.5723, - "step": 75652 - }, - { - "epoch": 1.94, - "learning_rate": 5.87334977326922e-07, - "loss": 0.7153, - "step": 75653 - }, - { - "epoch": 1.94, - "learning_rate": 5.873097729428069e-07, - "loss": 0.5767, - "step": 75654 - }, - { - "epoch": 1.94, - "learning_rate": 5.872845688746695e-07, - "loss": 0.5884, - "step": 75655 - }, - { - "epoch": 1.94, - "learning_rate": 5.872593651225291e-07, - "loss": 0.5542, - "step": 75656 - }, - { - "epoch": 1.94, - "learning_rate": 5.872341616864054e-07, - "loss": 0.6138, - "step": 75657 - }, - { - "epoch": 1.94, - "learning_rate": 5.872089585663174e-07, - "loss": 0.5942, - "step": 75658 - }, - { - "epoch": 1.94, - "learning_rate": 5.871837557622846e-07, - "loss": 0.6279, - "step": 75659 - }, - { - "epoch": 1.94, - "learning_rate": 5.87158553274326e-07, - "loss": 0.7607, - "step": 75660 - }, - { - "epoch": 1.94, - "learning_rate": 5.871333511024615e-07, - "loss": 0.3912, - "step": 75661 - }, - { - "epoch": 1.94, - "learning_rate": 5.871081492467099e-07, - "loss": 0.4185, - "step": 75662 - }, - { - "epoch": 1.94, - "learning_rate": 5.870829477070906e-07, - "loss": 0.5806, - "step": 75663 - }, - { - "epoch": 1.94, - "learning_rate": 5.870577464836229e-07, - "loss": 0.5659, - "step": 75664 - }, - { - "epoch": 1.94, - "learning_rate": 5.870325455763259e-07, - "loss": 0.563, - "step": 75665 - }, - { - "epoch": 1.94, - "learning_rate": 5.870073449852191e-07, - "loss": 0.6382, - "step": 75666 - }, - { - "epoch": 1.94, - "learning_rate": 5.86982144710322e-07, - "loss": 0.4446, - "step": 75667 - }, - { - "epoch": 1.94, - "learning_rate": 5.869569447516535e-07, - "loss": 0.5708, - "step": 75668 - }, - { - "epoch": 1.94, - "learning_rate": 5.869317451092333e-07, - "loss": 0.5391, - "step": 75669 - }, - { - "epoch": 1.94, - "learning_rate": 5.869065457830802e-07, - "loss": 0.7993, - "step": 75670 - }, - { - "epoch": 1.94, - "learning_rate": 5.868813467732139e-07, - "loss": 0.6484, - "step": 75671 - }, - { - "epoch": 1.94, - "learning_rate": 5.868561480796534e-07, - "loss": 0.6406, - "step": 75672 - }, - { - "epoch": 1.94, - "learning_rate": 5.868309497024187e-07, - "loss": 0.6172, - "step": 75673 - }, - { - "epoch": 1.94, - "learning_rate": 5.868057516415281e-07, - "loss": 0.7686, - "step": 75674 - }, - { - "epoch": 1.94, - "learning_rate": 5.867805538970012e-07, - "loss": 0.6924, - "step": 75675 - }, - { - "epoch": 1.94, - "learning_rate": 5.867553564688576e-07, - "loss": 0.627, - "step": 75676 - }, - { - "epoch": 1.94, - "learning_rate": 5.867301593571164e-07, - "loss": 0.666, - "step": 75677 - }, - { - "epoch": 1.94, - "learning_rate": 5.867049625617971e-07, - "loss": 0.6016, - "step": 75678 - }, - { - "epoch": 1.94, - "learning_rate": 5.866797660829186e-07, - "loss": 0.5679, - "step": 75679 - }, - { - "epoch": 1.94, - "learning_rate": 5.866545699205003e-07, - "loss": 0.3542, - "step": 75680 - }, - { - "epoch": 1.94, - "learning_rate": 5.866293740745618e-07, - "loss": 0.563, - "step": 75681 - }, - { - "epoch": 1.94, - "learning_rate": 5.866041785451221e-07, - "loss": 0.6895, - "step": 75682 - }, - { - "epoch": 1.94, - "learning_rate": 5.865789833322008e-07, - "loss": 0.708, - "step": 75683 - }, - { - "epoch": 1.94, - "learning_rate": 5.86553788435817e-07, - "loss": 0.6382, - "step": 75684 - }, - { - "epoch": 1.94, - "learning_rate": 5.865285938559895e-07, - "loss": 0.4395, - "step": 75685 - }, - { - "epoch": 1.94, - "learning_rate": 5.865033995927382e-07, - "loss": 0.7373, - "step": 75686 - }, - { - "epoch": 1.94, - "learning_rate": 5.864782056460822e-07, - "loss": 0.6689, - "step": 75687 - }, - { - "epoch": 1.94, - "learning_rate": 5.864530120160409e-07, - "loss": 0.7725, - "step": 75688 - }, - { - "epoch": 1.94, - "learning_rate": 5.864278187026334e-07, - "loss": 0.7002, - "step": 75689 - }, - { - "epoch": 1.94, - "learning_rate": 5.864026257058794e-07, - "loss": 0.645, - "step": 75690 - }, - { - "epoch": 1.94, - "learning_rate": 5.863774330257975e-07, - "loss": 0.6025, - "step": 75691 - }, - { - "epoch": 1.94, - "learning_rate": 5.863522406624077e-07, - "loss": 0.4135, - "step": 75692 - }, - { - "epoch": 1.94, - "learning_rate": 5.863270486157293e-07, - "loss": 0.6118, - "step": 75693 - }, - { - "epoch": 1.94, - "learning_rate": 5.863018568857805e-07, - "loss": 0.6382, - "step": 75694 - }, - { - "epoch": 1.94, - "learning_rate": 5.862766654725818e-07, - "loss": 0.4839, - "step": 75695 - }, - { - "epoch": 1.94, - "learning_rate": 5.862514743761517e-07, - "loss": 0.6729, - "step": 75696 - }, - { - "epoch": 1.94, - "learning_rate": 5.862262835965102e-07, - "loss": 0.7148, - "step": 75697 - }, - { - "epoch": 1.94, - "learning_rate": 5.86201093133676e-07, - "loss": 0.6523, - "step": 75698 - }, - { - "epoch": 1.94, - "learning_rate": 5.861759029876685e-07, - "loss": 0.5464, - "step": 75699 - }, - { - "epoch": 1.94, - "learning_rate": 5.861507131585074e-07, - "loss": 0.8037, - "step": 75700 - }, - { - "epoch": 1.94, - "learning_rate": 5.861255236462112e-07, - "loss": 0.5498, - "step": 75701 - }, - { - "epoch": 1.94, - "learning_rate": 5.861003344508002e-07, - "loss": 0.6689, - "step": 75702 - }, - { - "epoch": 1.94, - "learning_rate": 5.860751455722931e-07, - "loss": 0.6992, - "step": 75703 - }, - { - "epoch": 1.94, - "learning_rate": 5.860499570107089e-07, - "loss": 0.6992, - "step": 75704 - }, - { - "epoch": 1.94, - "learning_rate": 5.860247687660673e-07, - "loss": 0.7627, - "step": 75705 - }, - { - "epoch": 1.94, - "learning_rate": 5.859995808383875e-07, - "loss": 0.6689, - "step": 75706 - }, - { - "epoch": 1.94, - "learning_rate": 5.859743932276889e-07, - "loss": 0.5613, - "step": 75707 - }, - { - "epoch": 1.94, - "learning_rate": 5.859492059339904e-07, - "loss": 0.6357, - "step": 75708 - }, - { - "epoch": 1.94, - "learning_rate": 5.859240189573118e-07, - "loss": 0.646, - "step": 75709 - }, - { - "epoch": 1.94, - "learning_rate": 5.858988322976719e-07, - "loss": 0.4102, - "step": 75710 - }, - { - "epoch": 1.94, - "learning_rate": 5.858736459550905e-07, - "loss": 0.6729, - "step": 75711 - }, - { - "epoch": 1.94, - "learning_rate": 5.858484599295864e-07, - "loss": 0.6543, - "step": 75712 - }, - { - "epoch": 1.94, - "learning_rate": 5.858232742211795e-07, - "loss": 0.4817, - "step": 75713 - }, - { - "epoch": 1.94, - "learning_rate": 5.857980888298884e-07, - "loss": 0.7676, - "step": 75714 - }, - { - "epoch": 1.94, - "learning_rate": 5.857729037557327e-07, - "loss": 0.7344, - "step": 75715 - }, - { - "epoch": 1.94, - "learning_rate": 5.857477189987314e-07, - "loss": 0.7666, - "step": 75716 - }, - { - "epoch": 1.94, - "learning_rate": 5.857225345589043e-07, - "loss": 0.7793, - "step": 75717 - }, - { - "epoch": 1.94, - "learning_rate": 5.856973504362701e-07, - "loss": 0.4387, - "step": 75718 - }, - { - "epoch": 1.94, - "learning_rate": 5.856721666308486e-07, - "loss": 0.6836, - "step": 75719 - }, - { - "epoch": 1.94, - "learning_rate": 5.856469831426588e-07, - "loss": 0.4746, - "step": 75720 - }, - { - "epoch": 1.94, - "learning_rate": 5.856217999717202e-07, - "loss": 0.6313, - "step": 75721 - }, - { - "epoch": 1.94, - "learning_rate": 5.855966171180518e-07, - "loss": 0.5518, - "step": 75722 - }, - { - "epoch": 1.94, - "learning_rate": 5.855714345816733e-07, - "loss": 0.6284, - "step": 75723 - }, - { - "epoch": 1.94, - "learning_rate": 5.855462523626035e-07, - "loss": 0.3071, - "step": 75724 - }, - { - "epoch": 1.94, - "learning_rate": 5.855210704608617e-07, - "loss": 0.5205, - "step": 75725 - }, - { - "epoch": 1.94, - "learning_rate": 5.854958888764675e-07, - "loss": 0.7852, - "step": 75726 - }, - { - "epoch": 1.94, - "learning_rate": 5.854707076094399e-07, - "loss": 0.7861, - "step": 75727 - }, - { - "epoch": 1.94, - "learning_rate": 5.854455266597986e-07, - "loss": 0.6553, - "step": 75728 - }, - { - "epoch": 1.94, - "learning_rate": 5.854203460275622e-07, - "loss": 0.7451, - "step": 75729 - }, - { - "epoch": 1.94, - "learning_rate": 5.853951657127507e-07, - "loss": 0.627, - "step": 75730 - }, - { - "epoch": 1.94, - "learning_rate": 5.853699857153829e-07, - "loss": 0.5942, - "step": 75731 - }, - { - "epoch": 1.94, - "learning_rate": 5.853448060354784e-07, - "loss": 0.3667, - "step": 75732 - }, - { - "epoch": 1.94, - "learning_rate": 5.853196266730565e-07, - "loss": 0.4402, - "step": 75733 - }, - { - "epoch": 1.94, - "learning_rate": 5.85294447628136e-07, - "loss": 0.7031, - "step": 75734 - }, - { - "epoch": 1.94, - "learning_rate": 5.852692689007365e-07, - "loss": 0.8857, - "step": 75735 - }, - { - "epoch": 1.94, - "learning_rate": 5.852440904908773e-07, - "loss": 0.626, - "step": 75736 - }, - { - "epoch": 1.94, - "learning_rate": 5.852189123985773e-07, - "loss": 0.7432, - "step": 75737 - }, - { - "epoch": 1.94, - "learning_rate": 5.851937346238566e-07, - "loss": 0.6821, - "step": 75738 - }, - { - "epoch": 1.94, - "learning_rate": 5.851685571667337e-07, - "loss": 0.7021, - "step": 75739 - }, - { - "epoch": 1.94, - "learning_rate": 5.851433800272283e-07, - "loss": 0.6562, - "step": 75740 - }, - { - "epoch": 1.94, - "learning_rate": 5.851182032053592e-07, - "loss": 0.6582, - "step": 75741 - }, - { - "epoch": 1.94, - "learning_rate": 5.850930267011465e-07, - "loss": 0.4833, - "step": 75742 - }, - { - "epoch": 1.94, - "learning_rate": 5.850678505146089e-07, - "loss": 0.5981, - "step": 75743 - }, - { - "epoch": 1.94, - "learning_rate": 5.850426746457657e-07, - "loss": 0.6504, - "step": 75744 - }, - { - "epoch": 1.94, - "learning_rate": 5.850174990946362e-07, - "loss": 0.5425, - "step": 75745 - }, - { - "epoch": 1.94, - "learning_rate": 5.849923238612395e-07, - "loss": 0.6948, - "step": 75746 - }, - { - "epoch": 1.94, - "learning_rate": 5.849671489455953e-07, - "loss": 0.8047, - "step": 75747 - }, - { - "epoch": 1.94, - "learning_rate": 5.849419743477226e-07, - "loss": 0.519, - "step": 75748 - }, - { - "epoch": 1.94, - "learning_rate": 5.849168000676409e-07, - "loss": 0.6162, - "step": 75749 - }, - { - "epoch": 1.94, - "learning_rate": 5.848916261053691e-07, - "loss": 0.6025, - "step": 75750 - }, - { - "epoch": 1.94, - "learning_rate": 5.84866452460927e-07, - "loss": 0.623, - "step": 75751 - }, - { - "epoch": 1.94, - "learning_rate": 5.848412791343334e-07, - "loss": 0.5443, - "step": 75752 - }, - { - "epoch": 1.94, - "learning_rate": 5.848161061256081e-07, - "loss": 0.7197, - "step": 75753 - }, - { - "epoch": 1.94, - "learning_rate": 5.847909334347694e-07, - "loss": 0.6396, - "step": 75754 - }, - { - "epoch": 1.94, - "learning_rate": 5.847657610618376e-07, - "loss": 0.5159, - "step": 75755 - }, - { - "epoch": 1.94, - "learning_rate": 5.847405890068313e-07, - "loss": 0.4595, - "step": 75756 - }, - { - "epoch": 1.94, - "learning_rate": 5.847154172697702e-07, - "loss": 0.6101, - "step": 75757 - }, - { - "epoch": 1.94, - "learning_rate": 5.846902458506732e-07, - "loss": 0.7188, - "step": 75758 - }, - { - "epoch": 1.94, - "learning_rate": 5.8466507474956e-07, - "loss": 0.3779, - "step": 75759 - }, - { - "epoch": 1.94, - "learning_rate": 5.846399039664495e-07, - "loss": 0.5786, - "step": 75760 - }, - { - "epoch": 1.94, - "learning_rate": 5.846147335013614e-07, - "loss": 0.6572, - "step": 75761 - }, - { - "epoch": 1.94, - "learning_rate": 5.845895633543143e-07, - "loss": 0.7119, - "step": 75762 - }, - { - "epoch": 1.94, - "learning_rate": 5.845643935253283e-07, - "loss": 0.6738, - "step": 75763 - }, - { - "epoch": 1.94, - "learning_rate": 5.845392240144223e-07, - "loss": 0.5415, - "step": 75764 - }, - { - "epoch": 1.94, - "learning_rate": 5.84514054821615e-07, - "loss": 0.5227, - "step": 75765 - }, - { - "epoch": 1.94, - "learning_rate": 5.844888859469266e-07, - "loss": 0.6553, - "step": 75766 - }, - { - "epoch": 1.94, - "learning_rate": 5.844637173903756e-07, - "loss": 0.6191, - "step": 75767 - }, - { - "epoch": 1.94, - "learning_rate": 5.844385491519819e-07, - "loss": 0.6543, - "step": 75768 - }, - { - "epoch": 1.94, - "learning_rate": 5.844133812317642e-07, - "loss": 0.4963, - "step": 75769 - }, - { - "epoch": 1.94, - "learning_rate": 5.843882136297424e-07, - "loss": 0.8564, - "step": 75770 - }, - { - "epoch": 1.94, - "learning_rate": 5.843630463459355e-07, - "loss": 0.6709, - "step": 75771 - }, - { - "epoch": 1.94, - "learning_rate": 5.843378793803623e-07, - "loss": 0.7461, - "step": 75772 - }, - { - "epoch": 1.94, - "learning_rate": 5.84312712733043e-07, - "loss": 0.6118, - "step": 75773 - }, - { - "epoch": 1.94, - "learning_rate": 5.842875464039961e-07, - "loss": 0.7041, - "step": 75774 - }, - { - "epoch": 1.94, - "learning_rate": 5.842623803932408e-07, - "loss": 0.5239, - "step": 75775 - }, - { - "epoch": 1.94, - "learning_rate": 5.84237214700797e-07, - "loss": 0.4886, - "step": 75776 - }, - { - "epoch": 1.94, - "learning_rate": 5.842120493266835e-07, - "loss": 0.6396, - "step": 75777 - }, - { - "epoch": 1.94, - "learning_rate": 5.841868842709199e-07, - "loss": 0.7666, - "step": 75778 - }, - { - "epoch": 1.94, - "learning_rate": 5.841617195335249e-07, - "loss": 0.7559, - "step": 75779 - }, - { - "epoch": 1.94, - "learning_rate": 5.841365551145185e-07, - "loss": 0.4878, - "step": 75780 - }, - { - "epoch": 1.94, - "learning_rate": 5.841113910139195e-07, - "loss": 0.6157, - "step": 75781 - }, - { - "epoch": 1.94, - "learning_rate": 5.840862272317473e-07, - "loss": 0.6958, - "step": 75782 - }, - { - "epoch": 1.94, - "learning_rate": 5.840610637680214e-07, - "loss": 0.6611, - "step": 75783 - }, - { - "epoch": 1.94, - "learning_rate": 5.840359006227606e-07, - "loss": 0.5142, - "step": 75784 - }, - { - "epoch": 1.94, - "learning_rate": 5.840107377959844e-07, - "loss": 0.7373, - "step": 75785 - }, - { - "epoch": 1.94, - "learning_rate": 5.839855752877119e-07, - "loss": 0.6836, - "step": 75786 - }, - { - "epoch": 1.94, - "learning_rate": 5.839604130979628e-07, - "loss": 0.6509, - "step": 75787 - }, - { - "epoch": 1.94, - "learning_rate": 5.839352512267559e-07, - "loss": 0.5396, - "step": 75788 - }, - { - "epoch": 1.94, - "learning_rate": 5.839100896741105e-07, - "loss": 0.6548, - "step": 75789 - }, - { - "epoch": 1.94, - "learning_rate": 5.838849284400462e-07, - "loss": 0.6709, - "step": 75790 - }, - { - "epoch": 1.94, - "learning_rate": 5.83859767524582e-07, - "loss": 0.5801, - "step": 75791 - }, - { - "epoch": 1.94, - "learning_rate": 5.838346069277371e-07, - "loss": 0.5728, - "step": 75792 - }, - { - "epoch": 1.94, - "learning_rate": 5.838094466495313e-07, - "loss": 0.6729, - "step": 75793 - }, - { - "epoch": 1.94, - "learning_rate": 5.837842866899836e-07, - "loss": 0.4056, - "step": 75794 - }, - { - "epoch": 1.94, - "learning_rate": 5.837591270491127e-07, - "loss": 0.6572, - "step": 75795 - }, - { - "epoch": 1.94, - "learning_rate": 5.837339677269383e-07, - "loss": 0.709, - "step": 75796 - }, - { - "epoch": 1.94, - "learning_rate": 5.837088087234796e-07, - "loss": 0.5156, - "step": 75797 - }, - { - "epoch": 1.94, - "learning_rate": 5.836836500387563e-07, - "loss": 0.6191, - "step": 75798 - }, - { - "epoch": 1.94, - "learning_rate": 5.83658491672787e-07, - "loss": 0.4673, - "step": 75799 - }, - { - "epoch": 1.94, - "learning_rate": 5.836333336255912e-07, - "loss": 0.5693, - "step": 75800 - }, - { - "epoch": 1.94, - "learning_rate": 5.836081758971882e-07, - "loss": 0.5142, - "step": 75801 - }, - { - "epoch": 1.94, - "learning_rate": 5.835830184875976e-07, - "loss": 0.562, - "step": 75802 - }, - { - "epoch": 1.94, - "learning_rate": 5.835578613968385e-07, - "loss": 0.575, - "step": 75803 - }, - { - "epoch": 1.94, - "learning_rate": 5.835327046249295e-07, - "loss": 0.7236, - "step": 75804 - }, - { - "epoch": 1.94, - "learning_rate": 5.835075481718903e-07, - "loss": 0.8018, - "step": 75805 - }, - { - "epoch": 1.94, - "learning_rate": 5.834823920377407e-07, - "loss": 0.6802, - "step": 75806 - }, - { - "epoch": 1.94, - "learning_rate": 5.834572362224992e-07, - "loss": 0.4214, - "step": 75807 - }, - { - "epoch": 1.94, - "learning_rate": 5.834320807261852e-07, - "loss": 0.71, - "step": 75808 - }, - { - "epoch": 1.94, - "learning_rate": 5.834069255488181e-07, - "loss": 0.4207, - "step": 75809 - }, - { - "epoch": 1.94, - "learning_rate": 5.833817706904177e-07, - "loss": 0.6616, - "step": 75810 - }, - { - "epoch": 1.94, - "learning_rate": 5.83356616151002e-07, - "loss": 0.5337, - "step": 75811 - }, - { - "epoch": 1.94, - "learning_rate": 5.833314619305911e-07, - "loss": 0.624, - "step": 75812 - }, - { - "epoch": 1.94, - "learning_rate": 5.833063080292046e-07, - "loss": 0.5747, - "step": 75813 - }, - { - "epoch": 1.94, - "learning_rate": 5.83281154446861e-07, - "loss": 0.6172, - "step": 75814 - }, - { - "epoch": 1.94, - "learning_rate": 5.832560011835803e-07, - "loss": 0.5051, - "step": 75815 - }, - { - "epoch": 1.94, - "learning_rate": 5.832308482393806e-07, - "loss": 0.522, - "step": 75816 - }, - { - "epoch": 1.94, - "learning_rate": 5.832056956142822e-07, - "loss": 0.5664, - "step": 75817 - }, - { - "epoch": 1.94, - "learning_rate": 5.831805433083039e-07, - "loss": 0.5695, - "step": 75818 - }, - { - "epoch": 1.94, - "learning_rate": 5.831553913214655e-07, - "loss": 0.8105, - "step": 75819 - }, - { - "epoch": 1.94, - "learning_rate": 5.831302396537854e-07, - "loss": 0.5596, - "step": 75820 - }, - { - "epoch": 1.94, - "learning_rate": 5.831050883052834e-07, - "loss": 0.707, - "step": 75821 - }, - { - "epoch": 1.94, - "learning_rate": 5.830799372759785e-07, - "loss": 0.6221, - "step": 75822 - }, - { - "epoch": 1.94, - "learning_rate": 5.830547865658911e-07, - "loss": 0.4919, - "step": 75823 - }, - { - "epoch": 1.94, - "learning_rate": 5.830296361750386e-07, - "loss": 0.509, - "step": 75824 - }, - { - "epoch": 1.94, - "learning_rate": 5.830044861034411e-07, - "loss": 0.4536, - "step": 75825 - }, - { - "epoch": 1.94, - "learning_rate": 5.82979336351118e-07, - "loss": 0.791, - "step": 75826 - }, - { - "epoch": 1.94, - "learning_rate": 5.829541869180887e-07, - "loss": 0.5352, - "step": 75827 - }, - { - "epoch": 1.94, - "learning_rate": 5.82929037804372e-07, - "loss": 0.6406, - "step": 75828 - }, - { - "epoch": 1.94, - "learning_rate": 5.829038890099872e-07, - "loss": 0.6162, - "step": 75829 - }, - { - "epoch": 1.94, - "learning_rate": 5.828787405349537e-07, - "loss": 0.666, - "step": 75830 - }, - { - "epoch": 1.94, - "learning_rate": 5.828535923792914e-07, - "loss": 0.7559, - "step": 75831 - }, - { - "epoch": 1.94, - "learning_rate": 5.828284445430183e-07, - "loss": 0.6274, - "step": 75832 - }, - { - "epoch": 1.94, - "learning_rate": 5.828032970261547e-07, - "loss": 0.9492, - "step": 75833 - }, - { - "epoch": 1.94, - "learning_rate": 5.827781498287191e-07, - "loss": 0.5581, - "step": 75834 - }, - { - "epoch": 1.94, - "learning_rate": 5.82753002950731e-07, - "loss": 0.5591, - "step": 75835 - }, - { - "epoch": 1.94, - "learning_rate": 5.827278563922102e-07, - "loss": 0.6304, - "step": 75836 - }, - { - "epoch": 1.94, - "learning_rate": 5.827027101531751e-07, - "loss": 0.6523, - "step": 75837 - }, - { - "epoch": 1.94, - "learning_rate": 5.826775642336453e-07, - "loss": 0.564, - "step": 75838 - }, - { - "epoch": 1.94, - "learning_rate": 5.826524186336401e-07, - "loss": 0.6865, - "step": 75839 - }, - { - "epoch": 1.94, - "learning_rate": 5.826272733531793e-07, - "loss": 0.4863, - "step": 75840 - }, - { - "epoch": 1.94, - "learning_rate": 5.826021283922811e-07, - "loss": 0.6453, - "step": 75841 - }, - { - "epoch": 1.94, - "learning_rate": 5.825769837509652e-07, - "loss": 0.7354, - "step": 75842 - }, - { - "epoch": 1.94, - "learning_rate": 5.825518394292513e-07, - "loss": 0.4583, - "step": 75843 - }, - { - "epoch": 1.94, - "learning_rate": 5.825266954271584e-07, - "loss": 0.5693, - "step": 75844 - }, - { - "epoch": 1.94, - "learning_rate": 5.825015517447052e-07, - "loss": 0.5054, - "step": 75845 - }, - { - "epoch": 1.94, - "learning_rate": 5.824764083819112e-07, - "loss": 0.6885, - "step": 75846 - }, - { - "epoch": 1.94, - "learning_rate": 5.82451265338796e-07, - "loss": 0.8838, - "step": 75847 - }, - { - "epoch": 1.94, - "learning_rate": 5.824261226153789e-07, - "loss": 0.5469, - "step": 75848 - }, - { - "epoch": 1.94, - "learning_rate": 5.824009802116786e-07, - "loss": 0.8281, - "step": 75849 - }, - { - "epoch": 1.94, - "learning_rate": 5.823758381277146e-07, - "loss": 0.5581, - "step": 75850 - }, - { - "epoch": 1.94, - "learning_rate": 5.823506963635063e-07, - "loss": 0.4688, - "step": 75851 - }, - { - "epoch": 1.94, - "learning_rate": 5.823255549190733e-07, - "loss": 0.6147, - "step": 75852 - }, - { - "epoch": 1.94, - "learning_rate": 5.823004137944344e-07, - "loss": 0.7129, - "step": 75853 - }, - { - "epoch": 1.94, - "learning_rate": 5.822752729896084e-07, - "loss": 0.4068, - "step": 75854 - }, - { - "epoch": 1.94, - "learning_rate": 5.822501325046151e-07, - "loss": 0.4951, - "step": 75855 - }, - { - "epoch": 1.94, - "learning_rate": 5.822249923394735e-07, - "loss": 0.5449, - "step": 75856 - }, - { - "epoch": 1.94, - "learning_rate": 5.821998524942036e-07, - "loss": 0.7197, - "step": 75857 - }, - { - "epoch": 1.94, - "learning_rate": 5.821747129688237e-07, - "loss": 0.7422, - "step": 75858 - }, - { - "epoch": 1.94, - "learning_rate": 5.821495737633532e-07, - "loss": 0.3264, - "step": 75859 - }, - { - "epoch": 1.94, - "learning_rate": 5.82124434877812e-07, - "loss": 0.3811, - "step": 75860 - }, - { - "epoch": 1.94, - "learning_rate": 5.820992963122187e-07, - "loss": 0.6392, - "step": 75861 - }, - { - "epoch": 1.94, - "learning_rate": 5.820741580665925e-07, - "loss": 0.5271, - "step": 75862 - }, - { - "epoch": 1.94, - "learning_rate": 5.820490201409534e-07, - "loss": 0.5732, - "step": 75863 - }, - { - "epoch": 1.94, - "learning_rate": 5.820238825353199e-07, - "loss": 0.502, - "step": 75864 - }, - { - "epoch": 1.94, - "learning_rate": 5.819987452497117e-07, - "loss": 0.5811, - "step": 75865 - }, - { - "epoch": 1.94, - "learning_rate": 5.819736082841476e-07, - "loss": 0.5991, - "step": 75866 - }, - { - "epoch": 1.94, - "learning_rate": 5.819484716386469e-07, - "loss": 0.5308, - "step": 75867 - }, - { - "epoch": 1.94, - "learning_rate": 5.819233353132291e-07, - "loss": 0.5, - "step": 75868 - }, - { - "epoch": 1.94, - "learning_rate": 5.818981993079139e-07, - "loss": 0.5591, - "step": 75869 - }, - { - "epoch": 1.94, - "learning_rate": 5.818730636227195e-07, - "loss": 0.4521, - "step": 75870 - }, - { - "epoch": 1.94, - "learning_rate": 5.818479282576656e-07, - "loss": 0.5942, - "step": 75871 - }, - { - "epoch": 1.94, - "learning_rate": 5.818227932127717e-07, - "loss": 0.5747, - "step": 75872 - }, - { - "epoch": 1.94, - "learning_rate": 5.817976584880571e-07, - "loss": 0.8018, - "step": 75873 - }, - { - "epoch": 1.94, - "learning_rate": 5.817725240835409e-07, - "loss": 0.6104, - "step": 75874 - }, - { - "epoch": 1.94, - "learning_rate": 5.817473899992417e-07, - "loss": 0.5762, - "step": 75875 - }, - { - "epoch": 1.94, - "learning_rate": 5.817222562351796e-07, - "loss": 0.5913, - "step": 75876 - }, - { - "epoch": 1.94, - "learning_rate": 5.816971227913736e-07, - "loss": 0.5308, - "step": 75877 - }, - { - "epoch": 1.94, - "learning_rate": 5.816719896678427e-07, - "loss": 0.5464, - "step": 75878 - }, - { - "epoch": 1.94, - "learning_rate": 5.816468568646062e-07, - "loss": 0.6539, - "step": 75879 - }, - { - "epoch": 1.94, - "learning_rate": 5.816217243816835e-07, - "loss": 0.5557, - "step": 75880 - }, - { - "epoch": 1.94, - "learning_rate": 5.815965922190943e-07, - "loss": 0.6367, - "step": 75881 - }, - { - "epoch": 1.94, - "learning_rate": 5.815714603768569e-07, - "loss": 0.7451, - "step": 75882 - }, - { - "epoch": 1.94, - "learning_rate": 5.815463288549913e-07, - "loss": 0.5367, - "step": 75883 - }, - { - "epoch": 1.94, - "learning_rate": 5.815211976535162e-07, - "loss": 0.582, - "step": 75884 - }, - { - "epoch": 1.94, - "learning_rate": 5.814960667724509e-07, - "loss": 0.6138, - "step": 75885 - }, - { - "epoch": 1.94, - "learning_rate": 5.814709362118153e-07, - "loss": 0.6055, - "step": 75886 - }, - { - "epoch": 1.95, - "learning_rate": 5.814458059716278e-07, - "loss": 0.5305, - "step": 75887 - }, - { - "epoch": 1.95, - "learning_rate": 5.814206760519078e-07, - "loss": 0.4893, - "step": 75888 - }, - { - "epoch": 1.95, - "learning_rate": 5.813955464526749e-07, - "loss": 0.7039, - "step": 75889 - }, - { - "epoch": 1.95, - "learning_rate": 5.813704171739486e-07, - "loss": 0.6211, - "step": 75890 - }, - { - "epoch": 1.95, - "learning_rate": 5.813452882157473e-07, - "loss": 0.6523, - "step": 75891 - }, - { - "epoch": 1.95, - "learning_rate": 5.813201595780908e-07, - "loss": 0.4622, - "step": 75892 - }, - { - "epoch": 1.95, - "learning_rate": 5.812950312609983e-07, - "loss": 0.6797, - "step": 75893 - }, - { - "epoch": 1.95, - "learning_rate": 5.812699032644892e-07, - "loss": 0.6367, - "step": 75894 - }, - { - "epoch": 1.95, - "learning_rate": 5.81244775588582e-07, - "loss": 0.501, - "step": 75895 - }, - { - "epoch": 1.95, - "learning_rate": 5.812196482332964e-07, - "loss": 0.6221, - "step": 75896 - }, - { - "epoch": 1.95, - "learning_rate": 5.811945211986516e-07, - "loss": 0.6514, - "step": 75897 - }, - { - "epoch": 1.95, - "learning_rate": 5.811693944846674e-07, - "loss": 0.4612, - "step": 75898 - }, - { - "epoch": 1.95, - "learning_rate": 5.81144268091362e-07, - "loss": 0.7793, - "step": 75899 - }, - { - "epoch": 1.95, - "learning_rate": 5.811191420187553e-07, - "loss": 0.4712, - "step": 75900 - }, - { - "epoch": 1.95, - "learning_rate": 5.810940162668664e-07, - "loss": 0.791, - "step": 75901 - }, - { - "epoch": 1.95, - "learning_rate": 5.81068890835715e-07, - "loss": 0.6943, - "step": 75902 - }, - { - "epoch": 1.95, - "learning_rate": 5.810437657253199e-07, - "loss": 0.5625, - "step": 75903 - }, - { - "epoch": 1.95, - "learning_rate": 5.810186409356998e-07, - "loss": 0.6777, - "step": 75904 - }, - { - "epoch": 1.95, - "learning_rate": 5.809935164668744e-07, - "loss": 0.6748, - "step": 75905 - }, - { - "epoch": 1.95, - "learning_rate": 5.809683923188633e-07, - "loss": 0.6162, - "step": 75906 - }, - { - "epoch": 1.95, - "learning_rate": 5.809432684916855e-07, - "loss": 0.4971, - "step": 75907 - }, - { - "epoch": 1.95, - "learning_rate": 5.8091814498536e-07, - "loss": 0.667, - "step": 75908 - }, - { - "epoch": 1.95, - "learning_rate": 5.808930217999062e-07, - "loss": 0.5571, - "step": 75909 - }, - { - "epoch": 1.95, - "learning_rate": 5.808678989353432e-07, - "loss": 0.8145, - "step": 75910 - }, - { - "epoch": 1.95, - "learning_rate": 5.808427763916908e-07, - "loss": 0.4998, - "step": 75911 - }, - { - "epoch": 1.95, - "learning_rate": 5.808176541689675e-07, - "loss": 0.6182, - "step": 75912 - }, - { - "epoch": 1.95, - "learning_rate": 5.807925322671932e-07, - "loss": 0.707, - "step": 75913 - }, - { - "epoch": 1.95, - "learning_rate": 5.807674106863863e-07, - "loss": 0.833, - "step": 75914 - }, - { - "epoch": 1.95, - "learning_rate": 5.80742289426567e-07, - "loss": 0.6699, - "step": 75915 - }, - { - "epoch": 1.95, - "learning_rate": 5.807171684877537e-07, - "loss": 0.3777, - "step": 75916 - }, - { - "epoch": 1.95, - "learning_rate": 5.80692047869966e-07, - "loss": 0.4114, - "step": 75917 - }, - { - "epoch": 1.95, - "learning_rate": 5.80666927573223e-07, - "loss": 0.7588, - "step": 75918 - }, - { - "epoch": 1.95, - "learning_rate": 5.806418075975445e-07, - "loss": 0.6255, - "step": 75919 - }, - { - "epoch": 1.95, - "learning_rate": 5.806166879429488e-07, - "loss": 0.6655, - "step": 75920 - }, - { - "epoch": 1.95, - "learning_rate": 5.805915686094558e-07, - "loss": 0.5771, - "step": 75921 - }, - { - "epoch": 1.95, - "learning_rate": 5.805664495970845e-07, - "loss": 0.606, - "step": 75922 - }, - { - "epoch": 1.95, - "learning_rate": 5.805413309058544e-07, - "loss": 0.6387, - "step": 75923 - }, - { - "epoch": 1.95, - "learning_rate": 5.805162125357848e-07, - "loss": 0.6807, - "step": 75924 - }, - { - "epoch": 1.95, - "learning_rate": 5.804910944868941e-07, - "loss": 0.793, - "step": 75925 - }, - { - "epoch": 1.95, - "learning_rate": 5.80465976759202e-07, - "loss": 0.7451, - "step": 75926 - }, - { - "epoch": 1.95, - "learning_rate": 5.804408593527279e-07, - "loss": 0.5879, - "step": 75927 - }, - { - "epoch": 1.95, - "learning_rate": 5.804157422674913e-07, - "loss": 0.626, - "step": 75928 - }, - { - "epoch": 1.95, - "learning_rate": 5.80390625503511e-07, - "loss": 0.667, - "step": 75929 - }, - { - "epoch": 1.95, - "learning_rate": 5.803655090608059e-07, - "loss": 0.5713, - "step": 75930 - }, - { - "epoch": 1.95, - "learning_rate": 5.803403929393957e-07, - "loss": 0.7119, - "step": 75931 - }, - { - "epoch": 1.95, - "learning_rate": 5.803152771393001e-07, - "loss": 0.6328, - "step": 75932 - }, - { - "epoch": 1.95, - "learning_rate": 5.802901616605375e-07, - "loss": 0.6572, - "step": 75933 - }, - { - "epoch": 1.95, - "learning_rate": 5.802650465031273e-07, - "loss": 0.4995, - "step": 75934 - }, - { - "epoch": 1.95, - "learning_rate": 5.802399316670889e-07, - "loss": 0.4304, - "step": 75935 - }, - { - "epoch": 1.95, - "learning_rate": 5.802148171524417e-07, - "loss": 0.6201, - "step": 75936 - }, - { - "epoch": 1.95, - "learning_rate": 5.801897029592044e-07, - "loss": 0.5262, - "step": 75937 - }, - { - "epoch": 1.95, - "learning_rate": 5.801645890873965e-07, - "loss": 0.7842, - "step": 75938 - }, - { - "epoch": 1.95, - "learning_rate": 5.801394755370373e-07, - "loss": 0.5615, - "step": 75939 - }, - { - "epoch": 1.95, - "learning_rate": 5.801143623081465e-07, - "loss": 0.7305, - "step": 75940 - }, - { - "epoch": 1.95, - "learning_rate": 5.800892494007423e-07, - "loss": 0.7339, - "step": 75941 - }, - { - "epoch": 1.95, - "learning_rate": 5.800641368148444e-07, - "loss": 0.6729, - "step": 75942 - }, - { - "epoch": 1.95, - "learning_rate": 5.800390245504726e-07, - "loss": 0.5503, - "step": 75943 - }, - { - "epoch": 1.95, - "learning_rate": 5.80013912607645e-07, - "loss": 0.7568, - "step": 75944 - }, - { - "epoch": 1.95, - "learning_rate": 5.799888009863822e-07, - "loss": 0.6953, - "step": 75945 - }, - { - "epoch": 1.95, - "learning_rate": 5.79963689686702e-07, - "loss": 0.4664, - "step": 75946 - }, - { - "epoch": 1.95, - "learning_rate": 5.799385787086244e-07, - "loss": 0.7607, - "step": 75947 - }, - { - "epoch": 1.95, - "learning_rate": 5.799134680521684e-07, - "loss": 0.563, - "step": 75948 - }, - { - "epoch": 1.95, - "learning_rate": 5.798883577173539e-07, - "loss": 0.833, - "step": 75949 - }, - { - "epoch": 1.95, - "learning_rate": 5.798632477041991e-07, - "loss": 0.6641, - "step": 75950 - }, - { - "epoch": 1.95, - "learning_rate": 5.798381380127236e-07, - "loss": 0.7031, - "step": 75951 - }, - { - "epoch": 1.95, - "learning_rate": 5.798130286429472e-07, - "loss": 0.6118, - "step": 75952 - }, - { - "epoch": 1.95, - "learning_rate": 5.797879195948887e-07, - "loss": 0.751, - "step": 75953 - }, - { - "epoch": 1.95, - "learning_rate": 5.797628108685667e-07, - "loss": 0.6228, - "step": 75954 - }, - { - "epoch": 1.95, - "learning_rate": 5.797377024640012e-07, - "loss": 0.7969, - "step": 75955 - }, - { - "epoch": 1.95, - "learning_rate": 5.79712594381211e-07, - "loss": 0.6636, - "step": 75956 - }, - { - "epoch": 1.95, - "learning_rate": 5.79687486620216e-07, - "loss": 0.6689, - "step": 75957 - }, - { - "epoch": 1.95, - "learning_rate": 5.796623791810347e-07, - "loss": 0.6631, - "step": 75958 - }, - { - "epoch": 1.95, - "learning_rate": 5.796372720636865e-07, - "loss": 0.707, - "step": 75959 - }, - { - "epoch": 1.95, - "learning_rate": 5.796121652681906e-07, - "loss": 0.708, - "step": 75960 - }, - { - "epoch": 1.95, - "learning_rate": 5.79587058794567e-07, - "loss": 0.4731, - "step": 75961 - }, - { - "epoch": 1.95, - "learning_rate": 5.795619526428341e-07, - "loss": 0.6143, - "step": 75962 - }, - { - "epoch": 1.95, - "learning_rate": 5.795368468130109e-07, - "loss": 0.5244, - "step": 75963 - }, - { - "epoch": 1.95, - "learning_rate": 5.795117413051169e-07, - "loss": 0.5212, - "step": 75964 - }, - { - "epoch": 1.95, - "learning_rate": 5.794866361191714e-07, - "loss": 0.5513, - "step": 75965 - }, - { - "epoch": 1.95, - "learning_rate": 5.794615312551942e-07, - "loss": 0.71, - "step": 75966 - }, - { - "epoch": 1.95, - "learning_rate": 5.794364267132037e-07, - "loss": 0.6104, - "step": 75967 - }, - { - "epoch": 1.95, - "learning_rate": 5.794113224932191e-07, - "loss": 0.5854, - "step": 75968 - }, - { - "epoch": 1.95, - "learning_rate": 5.793862185952604e-07, - "loss": 0.6387, - "step": 75969 - }, - { - "epoch": 1.95, - "learning_rate": 5.79361115019346e-07, - "loss": 0.6235, - "step": 75970 - }, - { - "epoch": 1.95, - "learning_rate": 5.793360117654955e-07, - "loss": 0.5283, - "step": 75971 - }, - { - "epoch": 1.95, - "learning_rate": 5.793109088337285e-07, - "loss": 0.791, - "step": 75972 - }, - { - "epoch": 1.95, - "learning_rate": 5.792858062240631e-07, - "loss": 0.7412, - "step": 75973 - }, - { - "epoch": 1.95, - "learning_rate": 5.792607039365198e-07, - "loss": 0.7002, - "step": 75974 - }, - { - "epoch": 1.95, - "learning_rate": 5.792356019711169e-07, - "loss": 0.5908, - "step": 75975 - }, - { - "epoch": 1.95, - "learning_rate": 5.792105003278739e-07, - "loss": 0.5647, - "step": 75976 - }, - { - "epoch": 1.95, - "learning_rate": 5.791853990068101e-07, - "loss": 0.6191, - "step": 75977 - }, - { - "epoch": 1.95, - "learning_rate": 5.791602980079449e-07, - "loss": 0.7305, - "step": 75978 - }, - { - "epoch": 1.95, - "learning_rate": 5.791351973312971e-07, - "loss": 0.6621, - "step": 75979 - }, - { - "epoch": 1.95, - "learning_rate": 5.79110096976886e-07, - "loss": 0.4565, - "step": 75980 - }, - { - "epoch": 1.95, - "learning_rate": 5.790849969447311e-07, - "loss": 0.583, - "step": 75981 - }, - { - "epoch": 1.95, - "learning_rate": 5.790598972348518e-07, - "loss": 0.6809, - "step": 75982 - }, - { - "epoch": 1.95, - "learning_rate": 5.790347978472669e-07, - "loss": 0.6455, - "step": 75983 - }, - { - "epoch": 1.95, - "learning_rate": 5.790096987819954e-07, - "loss": 0.5952, - "step": 75984 - }, - { - "epoch": 1.95, - "learning_rate": 5.789846000390568e-07, - "loss": 0.6387, - "step": 75985 - }, - { - "epoch": 1.95, - "learning_rate": 5.789595016184708e-07, - "loss": 0.8271, - "step": 75986 - }, - { - "epoch": 1.95, - "learning_rate": 5.789344035202557e-07, - "loss": 0.5781, - "step": 75987 - }, - { - "epoch": 1.95, - "learning_rate": 5.789093057444311e-07, - "loss": 0.7031, - "step": 75988 - }, - { - "epoch": 1.95, - "learning_rate": 5.788842082910164e-07, - "loss": 0.5017, - "step": 75989 - }, - { - "epoch": 1.95, - "learning_rate": 5.78859111160031e-07, - "loss": 0.6836, - "step": 75990 - }, - { - "epoch": 1.95, - "learning_rate": 5.788340143514934e-07, - "loss": 0.709, - "step": 75991 - }, - { - "epoch": 1.95, - "learning_rate": 5.788089178654236e-07, - "loss": 0.6465, - "step": 75992 - }, - { - "epoch": 1.95, - "learning_rate": 5.787838217018401e-07, - "loss": 0.6753, - "step": 75993 - }, - { - "epoch": 1.95, - "learning_rate": 5.787587258607625e-07, - "loss": 0.6162, - "step": 75994 - }, - { - "epoch": 1.95, - "learning_rate": 5.787336303422103e-07, - "loss": 0.71, - "step": 75995 - }, - { - "epoch": 1.95, - "learning_rate": 5.78708535146202e-07, - "loss": 0.666, - "step": 75996 - }, - { - "epoch": 1.95, - "learning_rate": 5.786834402727572e-07, - "loss": 0.6282, - "step": 75997 - }, - { - "epoch": 1.95, - "learning_rate": 5.786583457218952e-07, - "loss": 0.6074, - "step": 75998 - }, - { - "epoch": 1.95, - "learning_rate": 5.786332514936355e-07, - "loss": 0.5522, - "step": 75999 - }, - { - "epoch": 1.95, - "learning_rate": 5.786081575879965e-07, - "loss": 0.6432, - "step": 76000 - }, - { - "epoch": 1.95, - "learning_rate": 5.78583064004998e-07, - "loss": 0.5576, - "step": 76001 - }, - { - "epoch": 1.95, - "learning_rate": 5.785579707446593e-07, - "loss": 0.7744, - "step": 76002 - }, - { - "epoch": 1.95, - "learning_rate": 5.785328778069993e-07, - "loss": 0.3103, - "step": 76003 - }, - { - "epoch": 1.95, - "learning_rate": 5.785077851920371e-07, - "loss": 0.6162, - "step": 76004 - }, - { - "epoch": 1.95, - "learning_rate": 5.784826928997921e-07, - "loss": 0.6401, - "step": 76005 - }, - { - "epoch": 1.95, - "learning_rate": 5.784576009302835e-07, - "loss": 0.6416, - "step": 76006 - }, - { - "epoch": 1.95, - "learning_rate": 5.784325092835309e-07, - "loss": 0.5818, - "step": 76007 - }, - { - "epoch": 1.95, - "learning_rate": 5.784074179595526e-07, - "loss": 0.7422, - "step": 76008 - }, - { - "epoch": 1.95, - "learning_rate": 5.783823269583685e-07, - "loss": 0.8398, - "step": 76009 - }, - { - "epoch": 1.95, - "learning_rate": 5.783572362799978e-07, - "loss": 0.7012, - "step": 76010 - }, - { - "epoch": 1.95, - "learning_rate": 5.783321459244597e-07, - "loss": 0.833, - "step": 76011 - }, - { - "epoch": 1.95, - "learning_rate": 5.783070558917736e-07, - "loss": 0.5537, - "step": 76012 - }, - { - "epoch": 1.95, - "learning_rate": 5.782819661819577e-07, - "loss": 0.5835, - "step": 76013 - }, - { - "epoch": 1.95, - "learning_rate": 5.78256876795032e-07, - "loss": 0.7754, - "step": 76014 - }, - { - "epoch": 1.95, - "learning_rate": 5.782317877310156e-07, - "loss": 0.6382, - "step": 76015 - }, - { - "epoch": 1.95, - "learning_rate": 5.782066989899281e-07, - "loss": 0.7256, - "step": 76016 - }, - { - "epoch": 1.95, - "learning_rate": 5.78181610571788e-07, - "loss": 0.4604, - "step": 76017 - }, - { - "epoch": 1.95, - "learning_rate": 5.781565224766149e-07, - "loss": 0.5903, - "step": 76018 - }, - { - "epoch": 1.95, - "learning_rate": 5.78131434704428e-07, - "loss": 0.562, - "step": 76019 - }, - { - "epoch": 1.95, - "learning_rate": 5.781063472552468e-07, - "loss": 0.4475, - "step": 76020 - }, - { - "epoch": 1.95, - "learning_rate": 5.780812601290896e-07, - "loss": 0.5044, - "step": 76021 - }, - { - "epoch": 1.95, - "learning_rate": 5.780561733259768e-07, - "loss": 0.6292, - "step": 76022 - }, - { - "epoch": 1.95, - "learning_rate": 5.780310868459265e-07, - "loss": 0.6616, - "step": 76023 - }, - { - "epoch": 1.95, - "learning_rate": 5.780060006889588e-07, - "loss": 0.5771, - "step": 76024 - }, - { - "epoch": 1.95, - "learning_rate": 5.779809148550921e-07, - "loss": 0.4622, - "step": 76025 - }, - { - "epoch": 1.95, - "learning_rate": 5.77955829344346e-07, - "loss": 0.54, - "step": 76026 - }, - { - "epoch": 1.95, - "learning_rate": 5.779307441567397e-07, - "loss": 0.4917, - "step": 76027 - }, - { - "epoch": 1.95, - "learning_rate": 5.779056592922929e-07, - "loss": 0.5771, - "step": 76028 - }, - { - "epoch": 1.95, - "learning_rate": 5.778805747510238e-07, - "loss": 0.5732, - "step": 76029 - }, - { - "epoch": 1.95, - "learning_rate": 5.778554905329522e-07, - "loss": 0.4766, - "step": 76030 - }, - { - "epoch": 1.95, - "learning_rate": 5.778304066380972e-07, - "loss": 0.708, - "step": 76031 - }, - { - "epoch": 1.95, - "learning_rate": 5.778053230664786e-07, - "loss": 0.5493, - "step": 76032 - }, - { - "epoch": 1.95, - "learning_rate": 5.777802398181148e-07, - "loss": 0.7202, - "step": 76033 - }, - { - "epoch": 1.95, - "learning_rate": 5.77755156893025e-07, - "loss": 0.4607, - "step": 76034 - }, - { - "epoch": 1.95, - "learning_rate": 5.777300742912288e-07, - "loss": 0.5284, - "step": 76035 - }, - { - "epoch": 1.95, - "learning_rate": 5.77704992012745e-07, - "loss": 0.5508, - "step": 76036 - }, - { - "epoch": 1.95, - "learning_rate": 5.776799100575936e-07, - "loss": 0.7363, - "step": 76037 - }, - { - "epoch": 1.95, - "learning_rate": 5.776548284257929e-07, - "loss": 0.5913, - "step": 76038 - }, - { - "epoch": 1.95, - "learning_rate": 5.776297471173626e-07, - "loss": 0.6455, - "step": 76039 - }, - { - "epoch": 1.95, - "learning_rate": 5.77604666132322e-07, - "loss": 0.5142, - "step": 76040 - }, - { - "epoch": 1.95, - "learning_rate": 5.775795854706896e-07, - "loss": 0.7041, - "step": 76041 - }, - { - "epoch": 1.95, - "learning_rate": 5.775545051324856e-07, - "loss": 0.875, - "step": 76042 - }, - { - "epoch": 1.95, - "learning_rate": 5.775294251177283e-07, - "loss": 0.6465, - "step": 76043 - }, - { - "epoch": 1.95, - "learning_rate": 5.775043454264373e-07, - "loss": 0.603, - "step": 76044 - }, - { - "epoch": 1.95, - "learning_rate": 5.774792660586322e-07, - "loss": 0.5283, - "step": 76045 - }, - { - "epoch": 1.95, - "learning_rate": 5.774541870143314e-07, - "loss": 0.6392, - "step": 76046 - }, - { - "epoch": 1.95, - "learning_rate": 5.774291082935545e-07, - "loss": 0.5762, - "step": 76047 - }, - { - "epoch": 1.95, - "learning_rate": 5.774040298963206e-07, - "loss": 0.687, - "step": 76048 - }, - { - "epoch": 1.95, - "learning_rate": 5.773789518226495e-07, - "loss": 0.5469, - "step": 76049 - }, - { - "epoch": 1.95, - "learning_rate": 5.773538740725594e-07, - "loss": 0.6611, - "step": 76050 - }, - { - "epoch": 1.95, - "learning_rate": 5.773287966460703e-07, - "loss": 0.8037, - "step": 76051 - }, - { - "epoch": 1.95, - "learning_rate": 5.773037195432011e-07, - "loss": 0.606, - "step": 76052 - }, - { - "epoch": 1.95, - "learning_rate": 5.772786427639709e-07, - "loss": 0.4766, - "step": 76053 - }, - { - "epoch": 1.95, - "learning_rate": 5.772535663083993e-07, - "loss": 0.7549, - "step": 76054 - }, - { - "epoch": 1.95, - "learning_rate": 5.772284901765048e-07, - "loss": 0.5293, - "step": 76055 - }, - { - "epoch": 1.95, - "learning_rate": 5.772034143683071e-07, - "loss": 0.5493, - "step": 76056 - }, - { - "epoch": 1.95, - "learning_rate": 5.771783388838256e-07, - "loss": 0.5288, - "step": 76057 - }, - { - "epoch": 1.95, - "learning_rate": 5.771532637230788e-07, - "loss": 0.6143, - "step": 76058 - }, - { - "epoch": 1.95, - "learning_rate": 5.771281888860864e-07, - "loss": 0.4795, - "step": 76059 - }, - { - "epoch": 1.95, - "learning_rate": 5.771031143728673e-07, - "loss": 0.5146, - "step": 76060 - }, - { - "epoch": 1.95, - "learning_rate": 5.770780401834414e-07, - "loss": 0.6221, - "step": 76061 - }, - { - "epoch": 1.95, - "learning_rate": 5.770529663178275e-07, - "loss": 0.6641, - "step": 76062 - }, - { - "epoch": 1.95, - "learning_rate": 5.770278927760443e-07, - "loss": 0.7578, - "step": 76063 - }, - { - "epoch": 1.95, - "learning_rate": 5.770028195581114e-07, - "loss": 0.5522, - "step": 76064 - }, - { - "epoch": 1.95, - "learning_rate": 5.769777466640478e-07, - "loss": 0.5527, - "step": 76065 - }, - { - "epoch": 1.95, - "learning_rate": 5.769526740938734e-07, - "loss": 0.6655, - "step": 76066 - }, - { - "epoch": 1.95, - "learning_rate": 5.769276018476065e-07, - "loss": 0.6279, - "step": 76067 - }, - { - "epoch": 1.95, - "learning_rate": 5.769025299252667e-07, - "loss": 0.4587, - "step": 76068 - }, - { - "epoch": 1.95, - "learning_rate": 5.768774583268732e-07, - "loss": 0.708, - "step": 76069 - }, - { - "epoch": 1.95, - "learning_rate": 5.768523870524454e-07, - "loss": 0.6289, - "step": 76070 - }, - { - "epoch": 1.95, - "learning_rate": 5.76827316102002e-07, - "loss": 0.4746, - "step": 76071 - }, - { - "epoch": 1.95, - "learning_rate": 5.768022454755629e-07, - "loss": 0.5112, - "step": 76072 - }, - { - "epoch": 1.95, - "learning_rate": 5.767771751731464e-07, - "loss": 0.5986, - "step": 76073 - }, - { - "epoch": 1.95, - "learning_rate": 5.767521051947721e-07, - "loss": 0.7373, - "step": 76074 - }, - { - "epoch": 1.95, - "learning_rate": 5.767270355404599e-07, - "loss": 0.5391, - "step": 76075 - }, - { - "epoch": 1.95, - "learning_rate": 5.767019662102277e-07, - "loss": 0.5317, - "step": 76076 - }, - { - "epoch": 1.95, - "learning_rate": 5.766768972040954e-07, - "loss": 0.6067, - "step": 76077 - }, - { - "epoch": 1.95, - "learning_rate": 5.766518285220825e-07, - "loss": 0.6807, - "step": 76078 - }, - { - "epoch": 1.95, - "learning_rate": 5.766267601642075e-07, - "loss": 0.7178, - "step": 76079 - }, - { - "epoch": 1.95, - "learning_rate": 5.766016921304899e-07, - "loss": 0.4617, - "step": 76080 - }, - { - "epoch": 1.95, - "learning_rate": 5.765766244209489e-07, - "loss": 0.5818, - "step": 76081 - }, - { - "epoch": 1.95, - "learning_rate": 5.765515570356041e-07, - "loss": 0.5383, - "step": 76082 - }, - { - "epoch": 1.95, - "learning_rate": 5.765264899744744e-07, - "loss": 0.7178, - "step": 76083 - }, - { - "epoch": 1.95, - "learning_rate": 5.765014232375784e-07, - "loss": 0.6587, - "step": 76084 - }, - { - "epoch": 1.95, - "learning_rate": 5.764763568249358e-07, - "loss": 0.6743, - "step": 76085 - }, - { - "epoch": 1.95, - "learning_rate": 5.764512907365658e-07, - "loss": 0.7744, - "step": 76086 - }, - { - "epoch": 1.95, - "learning_rate": 5.764262249724881e-07, - "loss": 0.5315, - "step": 76087 - }, - { - "epoch": 1.95, - "learning_rate": 5.764011595327207e-07, - "loss": 0.5547, - "step": 76088 - }, - { - "epoch": 1.95, - "learning_rate": 5.763760944172835e-07, - "loss": 0.873, - "step": 76089 - }, - { - "epoch": 1.95, - "learning_rate": 5.763510296261957e-07, - "loss": 0.5581, - "step": 76090 - }, - { - "epoch": 1.95, - "learning_rate": 5.76325965159477e-07, - "loss": 0.5757, - "step": 76091 - }, - { - "epoch": 1.95, - "learning_rate": 5.763009010171458e-07, - "loss": 0.7861, - "step": 76092 - }, - { - "epoch": 1.95, - "learning_rate": 5.762758371992213e-07, - "loss": 0.6978, - "step": 76093 - }, - { - "epoch": 1.95, - "learning_rate": 5.762507737057227e-07, - "loss": 0.52, - "step": 76094 - }, - { - "epoch": 1.95, - "learning_rate": 5.7622571053667e-07, - "loss": 0.5903, - "step": 76095 - }, - { - "epoch": 1.95, - "learning_rate": 5.762006476920813e-07, - "loss": 0.5857, - "step": 76096 - }, - { - "epoch": 1.95, - "learning_rate": 5.761755851719763e-07, - "loss": 0.4719, - "step": 76097 - }, - { - "epoch": 1.95, - "learning_rate": 5.761505229763741e-07, - "loss": 0.7715, - "step": 76098 - }, - { - "epoch": 1.95, - "learning_rate": 5.761254611052944e-07, - "loss": 0.6475, - "step": 76099 - }, - { - "epoch": 1.95, - "learning_rate": 5.761003995587556e-07, - "loss": 0.5776, - "step": 76100 - }, - { - "epoch": 1.95, - "learning_rate": 5.760753383367771e-07, - "loss": 0.6997, - "step": 76101 - }, - { - "epoch": 1.95, - "learning_rate": 5.760502774393788e-07, - "loss": 0.6641, - "step": 76102 - }, - { - "epoch": 1.95, - "learning_rate": 5.760252168665787e-07, - "loss": 0.5449, - "step": 76103 - }, - { - "epoch": 1.95, - "learning_rate": 5.760001566183972e-07, - "loss": 0.5278, - "step": 76104 - }, - { - "epoch": 1.95, - "learning_rate": 5.759750966948523e-07, - "loss": 0.5149, - "step": 76105 - }, - { - "epoch": 1.95, - "learning_rate": 5.759500370959639e-07, - "loss": 0.6753, - "step": 76106 - }, - { - "epoch": 1.95, - "learning_rate": 5.75924977821751e-07, - "loss": 0.5439, - "step": 76107 - }, - { - "epoch": 1.95, - "learning_rate": 5.758999188722333e-07, - "loss": 0.6709, - "step": 76108 - }, - { - "epoch": 1.95, - "learning_rate": 5.75874860247429e-07, - "loss": 0.6543, - "step": 76109 - }, - { - "epoch": 1.95, - "learning_rate": 5.758498019473579e-07, - "loss": 0.5518, - "step": 76110 - }, - { - "epoch": 1.95, - "learning_rate": 5.758247439720392e-07, - "loss": 0.6919, - "step": 76111 - }, - { - "epoch": 1.95, - "learning_rate": 5.757996863214927e-07, - "loss": 0.7402, - "step": 76112 - }, - { - "epoch": 1.95, - "learning_rate": 5.757746289957362e-07, - "loss": 0.583, - "step": 76113 - }, - { - "epoch": 1.95, - "learning_rate": 5.757495719947894e-07, - "loss": 0.6953, - "step": 76114 - }, - { - "epoch": 1.95, - "learning_rate": 5.757245153186716e-07, - "loss": 0.5818, - "step": 76115 - }, - { - "epoch": 1.95, - "learning_rate": 5.756994589674025e-07, - "loss": 0.6973, - "step": 76116 - }, - { - "epoch": 1.95, - "learning_rate": 5.756744029410004e-07, - "loss": 0.6514, - "step": 76117 - }, - { - "epoch": 1.95, - "learning_rate": 5.75649347239485e-07, - "loss": 0.5527, - "step": 76118 - }, - { - "epoch": 1.95, - "learning_rate": 5.756242918628753e-07, - "loss": 0.6611, - "step": 76119 - }, - { - "epoch": 1.95, - "learning_rate": 5.755992368111911e-07, - "loss": 0.5676, - "step": 76120 - }, - { - "epoch": 1.95, - "learning_rate": 5.755741820844504e-07, - "loss": 0.6475, - "step": 76121 - }, - { - "epoch": 1.95, - "learning_rate": 5.755491276826736e-07, - "loss": 0.6355, - "step": 76122 - }, - { - "epoch": 1.95, - "learning_rate": 5.755240736058789e-07, - "loss": 0.7959, - "step": 76123 - }, - { - "epoch": 1.95, - "learning_rate": 5.754990198540857e-07, - "loss": 0.5996, - "step": 76124 - }, - { - "epoch": 1.95, - "learning_rate": 5.754739664273141e-07, - "loss": 0.5728, - "step": 76125 - }, - { - "epoch": 1.95, - "learning_rate": 5.75448913325582e-07, - "loss": 0.6309, - "step": 76126 - }, - { - "epoch": 1.95, - "learning_rate": 5.754238605489091e-07, - "loss": 0.6226, - "step": 76127 - }, - { - "epoch": 1.95, - "learning_rate": 5.753988080973147e-07, - "loss": 0.6792, - "step": 76128 - }, - { - "epoch": 1.95, - "learning_rate": 5.753737559708182e-07, - "loss": 0.5693, - "step": 76129 - }, - { - "epoch": 1.95, - "learning_rate": 5.753487041694382e-07, - "loss": 0.7744, - "step": 76130 - }, - { - "epoch": 1.95, - "learning_rate": 5.753236526931942e-07, - "loss": 0.4854, - "step": 76131 - }, - { - "epoch": 1.95, - "learning_rate": 5.752986015421058e-07, - "loss": 0.6787, - "step": 76132 - }, - { - "epoch": 1.95, - "learning_rate": 5.752735507161917e-07, - "loss": 0.7236, - "step": 76133 - }, - { - "epoch": 1.95, - "learning_rate": 5.752485002154705e-07, - "loss": 0.4492, - "step": 76134 - }, - { - "epoch": 1.95, - "learning_rate": 5.752234500399622e-07, - "loss": 0.6025, - "step": 76135 - }, - { - "epoch": 1.95, - "learning_rate": 5.751984001896858e-07, - "loss": 0.7598, - "step": 76136 - }, - { - "epoch": 1.95, - "learning_rate": 5.751733506646607e-07, - "loss": 0.562, - "step": 76137 - }, - { - "epoch": 1.95, - "learning_rate": 5.751483014649056e-07, - "loss": 0.6963, - "step": 76138 - }, - { - "epoch": 1.95, - "learning_rate": 5.751232525904398e-07, - "loss": 0.6719, - "step": 76139 - }, - { - "epoch": 1.95, - "learning_rate": 5.750982040412826e-07, - "loss": 0.5342, - "step": 76140 - }, - { - "epoch": 1.95, - "learning_rate": 5.750731558174535e-07, - "loss": 0.6758, - "step": 76141 - }, - { - "epoch": 1.95, - "learning_rate": 5.750481079189715e-07, - "loss": 0.6455, - "step": 76142 - }, - { - "epoch": 1.95, - "learning_rate": 5.750230603458552e-07, - "loss": 0.4878, - "step": 76143 - }, - { - "epoch": 1.95, - "learning_rate": 5.749980130981241e-07, - "loss": 0.6313, - "step": 76144 - }, - { - "epoch": 1.95, - "learning_rate": 5.749729661757976e-07, - "loss": 0.5903, - "step": 76145 - }, - { - "epoch": 1.95, - "learning_rate": 5.749479195788951e-07, - "loss": 0.584, - "step": 76146 - }, - { - "epoch": 1.95, - "learning_rate": 5.749228733074349e-07, - "loss": 0.6641, - "step": 76147 - }, - { - "epoch": 1.95, - "learning_rate": 5.748978273614368e-07, - "loss": 0.6484, - "step": 76148 - }, - { - "epoch": 1.95, - "learning_rate": 5.748727817409205e-07, - "loss": 0.7598, - "step": 76149 - }, - { - "epoch": 1.95, - "learning_rate": 5.748477364459039e-07, - "loss": 0.4956, - "step": 76150 - }, - { - "epoch": 1.95, - "learning_rate": 5.748226914764069e-07, - "loss": 0.7065, - "step": 76151 - }, - { - "epoch": 1.95, - "learning_rate": 5.747976468324491e-07, - "loss": 0.6758, - "step": 76152 - }, - { - "epoch": 1.95, - "learning_rate": 5.747726025140486e-07, - "loss": 0.6758, - "step": 76153 - }, - { - "epoch": 1.95, - "learning_rate": 5.747475585212258e-07, - "loss": 0.6416, - "step": 76154 - }, - { - "epoch": 1.95, - "learning_rate": 5.747225148539987e-07, - "loss": 0.7793, - "step": 76155 - }, - { - "epoch": 1.95, - "learning_rate": 5.74697471512387e-07, - "loss": 0.5332, - "step": 76156 - }, - { - "epoch": 1.95, - "learning_rate": 5.746724284964099e-07, - "loss": 0.5193, - "step": 76157 - }, - { - "epoch": 1.95, - "learning_rate": 5.74647385806087e-07, - "loss": 0.6753, - "step": 76158 - }, - { - "epoch": 1.95, - "learning_rate": 5.746223434414366e-07, - "loss": 0.4722, - "step": 76159 - }, - { - "epoch": 1.95, - "learning_rate": 5.745973014024784e-07, - "loss": 0.7178, - "step": 76160 - }, - { - "epoch": 1.95, - "learning_rate": 5.745722596892315e-07, - "loss": 0.6372, - "step": 76161 - }, - { - "epoch": 1.95, - "learning_rate": 5.745472183017154e-07, - "loss": 0.7192, - "step": 76162 - }, - { - "epoch": 1.95, - "learning_rate": 5.745221772399489e-07, - "loss": 0.6602, - "step": 76163 - }, - { - "epoch": 1.95, - "learning_rate": 5.744971365039508e-07, - "loss": 0.7637, - "step": 76164 - }, - { - "epoch": 1.95, - "learning_rate": 5.744720960937407e-07, - "loss": 0.2976, - "step": 76165 - }, - { - "epoch": 1.95, - "learning_rate": 5.744470560093382e-07, - "loss": 0.5718, - "step": 76166 - }, - { - "epoch": 1.95, - "learning_rate": 5.744220162507615e-07, - "loss": 0.7695, - "step": 76167 - }, - { - "epoch": 1.95, - "learning_rate": 5.743969768180304e-07, - "loss": 0.5923, - "step": 76168 - }, - { - "epoch": 1.95, - "learning_rate": 5.74371937711164e-07, - "loss": 0.623, - "step": 76169 - }, - { - "epoch": 1.95, - "learning_rate": 5.743468989301818e-07, - "loss": 0.6133, - "step": 76170 - }, - { - "epoch": 1.95, - "learning_rate": 5.743218604751021e-07, - "loss": 0.5854, - "step": 76171 - }, - { - "epoch": 1.95, - "learning_rate": 5.742968223459452e-07, - "loss": 0.5396, - "step": 76172 - }, - { - "epoch": 1.95, - "learning_rate": 5.742717845427289e-07, - "loss": 0.6348, - "step": 76173 - }, - { - "epoch": 1.95, - "learning_rate": 5.742467470654735e-07, - "loss": 0.7871, - "step": 76174 - }, - { - "epoch": 1.95, - "learning_rate": 5.742217099141979e-07, - "loss": 0.6943, - "step": 76175 - }, - { - "epoch": 1.95, - "learning_rate": 5.741966730889209e-07, - "loss": 0.5601, - "step": 76176 - }, - { - "epoch": 1.95, - "learning_rate": 5.74171636589662e-07, - "loss": 0.6426, - "step": 76177 - }, - { - "epoch": 1.95, - "learning_rate": 5.741466004164401e-07, - "loss": 0.7188, - "step": 76178 - }, - { - "epoch": 1.95, - "learning_rate": 5.741215645692752e-07, - "loss": 0.771, - "step": 76179 - }, - { - "epoch": 1.95, - "learning_rate": 5.740965290481852e-07, - "loss": 0.6396, - "step": 76180 - }, - { - "epoch": 1.95, - "learning_rate": 5.740714938531901e-07, - "loss": 0.564, - "step": 76181 - }, - { - "epoch": 1.95, - "learning_rate": 5.740464589843091e-07, - "loss": 0.6851, - "step": 76182 - }, - { - "epoch": 1.95, - "learning_rate": 5.740214244415613e-07, - "loss": 0.7461, - "step": 76183 - }, - { - "epoch": 1.95, - "learning_rate": 5.739963902249651e-07, - "loss": 0.7002, - "step": 76184 - }, - { - "epoch": 1.95, - "learning_rate": 5.739713563345405e-07, - "loss": 0.6328, - "step": 76185 - }, - { - "epoch": 1.95, - "learning_rate": 5.739463227703063e-07, - "loss": 0.6841, - "step": 76186 - }, - { - "epoch": 1.95, - "learning_rate": 5.739212895322822e-07, - "loss": 0.8096, - "step": 76187 - }, - { - "epoch": 1.95, - "learning_rate": 5.738962566204868e-07, - "loss": 0.7271, - "step": 76188 - }, - { - "epoch": 1.95, - "learning_rate": 5.738712240349393e-07, - "loss": 0.7236, - "step": 76189 - }, - { - "epoch": 1.95, - "learning_rate": 5.73846191775659e-07, - "loss": 0.5615, - "step": 76190 - }, - { - "epoch": 1.95, - "learning_rate": 5.738211598426654e-07, - "loss": 0.6885, - "step": 76191 - }, - { - "epoch": 1.95, - "learning_rate": 5.737961282359773e-07, - "loss": 0.5752, - "step": 76192 - }, - { - "epoch": 1.95, - "learning_rate": 5.737710969556138e-07, - "loss": 0.5923, - "step": 76193 - }, - { - "epoch": 1.95, - "learning_rate": 5.737460660015938e-07, - "loss": 0.6621, - "step": 76194 - }, - { - "epoch": 1.95, - "learning_rate": 5.737210353739372e-07, - "loss": 0.6602, - "step": 76195 - }, - { - "epoch": 1.95, - "learning_rate": 5.73696005072663e-07, - "loss": 0.6836, - "step": 76196 - }, - { - "epoch": 1.95, - "learning_rate": 5.736709750977897e-07, - "loss": 0.7295, - "step": 76197 - }, - { - "epoch": 1.95, - "learning_rate": 5.736459454493371e-07, - "loss": 0.6128, - "step": 76198 - }, - { - "epoch": 1.95, - "learning_rate": 5.736209161273242e-07, - "loss": 0.7056, - "step": 76199 - }, - { - "epoch": 1.95, - "learning_rate": 5.735958871317703e-07, - "loss": 0.6729, - "step": 76200 - }, - { - "epoch": 1.95, - "learning_rate": 5.735708584626942e-07, - "loss": 0.5762, - "step": 76201 - }, - { - "epoch": 1.95, - "learning_rate": 5.735458301201157e-07, - "loss": 0.6216, - "step": 76202 - }, - { - "epoch": 1.95, - "learning_rate": 5.735208021040532e-07, - "loss": 0.593, - "step": 76203 - }, - { - "epoch": 1.95, - "learning_rate": 5.734957744145266e-07, - "loss": 0.5786, - "step": 76204 - }, - { - "epoch": 1.95, - "learning_rate": 5.734707470515542e-07, - "loss": 0.6484, - "step": 76205 - }, - { - "epoch": 1.95, - "learning_rate": 5.734457200151557e-07, - "loss": 0.6963, - "step": 76206 - }, - { - "epoch": 1.95, - "learning_rate": 5.734206933053501e-07, - "loss": 0.7461, - "step": 76207 - }, - { - "epoch": 1.95, - "learning_rate": 5.733956669221571e-07, - "loss": 0.6299, - "step": 76208 - }, - { - "epoch": 1.95, - "learning_rate": 5.73370640865595e-07, - "loss": 0.5834, - "step": 76209 - }, - { - "epoch": 1.95, - "learning_rate": 5.733456151356835e-07, - "loss": 0.6162, - "step": 76210 - }, - { - "epoch": 1.95, - "learning_rate": 5.733205897324416e-07, - "loss": 0.6436, - "step": 76211 - }, - { - "epoch": 1.95, - "learning_rate": 5.732955646558888e-07, - "loss": 0.709, - "step": 76212 - }, - { - "epoch": 1.95, - "learning_rate": 5.73270539906044e-07, - "loss": 0.5908, - "step": 76213 - }, - { - "epoch": 1.95, - "learning_rate": 5.732455154829261e-07, - "loss": 0.6548, - "step": 76214 - }, - { - "epoch": 1.95, - "learning_rate": 5.732204913865544e-07, - "loss": 0.7578, - "step": 76215 - }, - { - "epoch": 1.95, - "learning_rate": 5.731954676169479e-07, - "loss": 0.6338, - "step": 76216 - }, - { - "epoch": 1.95, - "learning_rate": 5.731704441741267e-07, - "loss": 0.6572, - "step": 76217 - }, - { - "epoch": 1.95, - "learning_rate": 5.731454210581088e-07, - "loss": 0.585, - "step": 76218 - }, - { - "epoch": 1.95, - "learning_rate": 5.731203982689137e-07, - "loss": 0.5369, - "step": 76219 - }, - { - "epoch": 1.95, - "learning_rate": 5.730953758065613e-07, - "loss": 0.5271, - "step": 76220 - }, - { - "epoch": 1.95, - "learning_rate": 5.730703536710695e-07, - "loss": 0.7178, - "step": 76221 - }, - { - "epoch": 1.95, - "learning_rate": 5.730453318624587e-07, - "loss": 0.6836, - "step": 76222 - }, - { - "epoch": 1.95, - "learning_rate": 5.73020310380747e-07, - "loss": 0.624, - "step": 76223 - }, - { - "epoch": 1.95, - "learning_rate": 5.72995289225954e-07, - "loss": 0.6267, - "step": 76224 - }, - { - "epoch": 1.95, - "learning_rate": 5.729702683980992e-07, - "loss": 0.4958, - "step": 76225 - }, - { - "epoch": 1.95, - "learning_rate": 5.729452478972011e-07, - "loss": 0.5366, - "step": 76226 - }, - { - "epoch": 1.95, - "learning_rate": 5.729202277232792e-07, - "loss": 0.6787, - "step": 76227 - }, - { - "epoch": 1.95, - "learning_rate": 5.728952078763526e-07, - "loss": 0.6895, - "step": 76228 - }, - { - "epoch": 1.95, - "learning_rate": 5.728701883564409e-07, - "loss": 0.46, - "step": 76229 - }, - { - "epoch": 1.95, - "learning_rate": 5.728451691635625e-07, - "loss": 0.791, - "step": 76230 - }, - { - "epoch": 1.95, - "learning_rate": 5.728201502977369e-07, - "loss": 0.6538, - "step": 76231 - }, - { - "epoch": 1.95, - "learning_rate": 5.727951317589836e-07, - "loss": 0.5542, - "step": 76232 - }, - { - "epoch": 1.95, - "learning_rate": 5.727701135473211e-07, - "loss": 0.6592, - "step": 76233 - }, - { - "epoch": 1.95, - "learning_rate": 5.727450956627693e-07, - "loss": 0.5845, - "step": 76234 - }, - { - "epoch": 1.95, - "learning_rate": 5.727200781053465e-07, - "loss": 0.6851, - "step": 76235 - }, - { - "epoch": 1.95, - "learning_rate": 5.726950608750723e-07, - "loss": 0.6353, - "step": 76236 - }, - { - "epoch": 1.95, - "learning_rate": 5.726700439719659e-07, - "loss": 0.4795, - "step": 76237 - }, - { - "epoch": 1.95, - "learning_rate": 5.726450273960467e-07, - "loss": 0.6553, - "step": 76238 - }, - { - "epoch": 1.95, - "learning_rate": 5.726200111473331e-07, - "loss": 0.7129, - "step": 76239 - }, - { - "epoch": 1.95, - "learning_rate": 5.725949952258449e-07, - "loss": 0.9033, - "step": 76240 - }, - { - "epoch": 1.95, - "learning_rate": 5.725699796316012e-07, - "loss": 0.5867, - "step": 76241 - }, - { - "epoch": 1.95, - "learning_rate": 5.725449643646212e-07, - "loss": 0.4976, - "step": 76242 - }, - { - "epoch": 1.95, - "learning_rate": 5.725199494249236e-07, - "loss": 0.5566, - "step": 76243 - }, - { - "epoch": 1.95, - "learning_rate": 5.724949348125275e-07, - "loss": 0.5703, - "step": 76244 - }, - { - "epoch": 1.95, - "learning_rate": 5.724699205274526e-07, - "loss": 0.7119, - "step": 76245 - }, - { - "epoch": 1.95, - "learning_rate": 5.724449065697181e-07, - "loss": 0.4985, - "step": 76246 - }, - { - "epoch": 1.95, - "learning_rate": 5.724198929393425e-07, - "loss": 0.4556, - "step": 76247 - }, - { - "epoch": 1.95, - "learning_rate": 5.723948796363453e-07, - "loss": 0.7021, - "step": 76248 - }, - { - "epoch": 1.95, - "learning_rate": 5.723698666607457e-07, - "loss": 0.6787, - "step": 76249 - }, - { - "epoch": 1.95, - "learning_rate": 5.723448540125633e-07, - "loss": 0.7012, - "step": 76250 - }, - { - "epoch": 1.95, - "learning_rate": 5.723198416918168e-07, - "loss": 0.4834, - "step": 76251 - }, - { - "epoch": 1.95, - "learning_rate": 5.722948296985249e-07, - "loss": 0.7607, - "step": 76252 - }, - { - "epoch": 1.95, - "learning_rate": 5.72269818032707e-07, - "loss": 0.7354, - "step": 76253 - }, - { - "epoch": 1.95, - "learning_rate": 5.722448066943827e-07, - "loss": 0.707, - "step": 76254 - }, - { - "epoch": 1.95, - "learning_rate": 5.722197956835712e-07, - "loss": 0.624, - "step": 76255 - }, - { - "epoch": 1.95, - "learning_rate": 5.721947850002909e-07, - "loss": 0.3051, - "step": 76256 - }, - { - "epoch": 1.95, - "learning_rate": 5.721697746445613e-07, - "loss": 0.5493, - "step": 76257 - }, - { - "epoch": 1.95, - "learning_rate": 5.721447646164021e-07, - "loss": 0.4824, - "step": 76258 - }, - { - "epoch": 1.95, - "learning_rate": 5.721197549158317e-07, - "loss": 0.708, - "step": 76259 - }, - { - "epoch": 1.95, - "learning_rate": 5.720947455428693e-07, - "loss": 0.7627, - "step": 76260 - }, - { - "epoch": 1.95, - "learning_rate": 5.720697364975349e-07, - "loss": 0.6396, - "step": 76261 - }, - { - "epoch": 1.95, - "learning_rate": 5.720447277798464e-07, - "loss": 0.6328, - "step": 76262 - }, - { - "epoch": 1.95, - "learning_rate": 5.720197193898242e-07, - "loss": 0.4656, - "step": 76263 - }, - { - "epoch": 1.95, - "learning_rate": 5.719947113274863e-07, - "loss": 0.6162, - "step": 76264 - }, - { - "epoch": 1.95, - "learning_rate": 5.719697035928523e-07, - "loss": 0.5586, - "step": 76265 - }, - { - "epoch": 1.95, - "learning_rate": 5.719446961859415e-07, - "loss": 0.541, - "step": 76266 - }, - { - "epoch": 1.95, - "learning_rate": 5.719196891067734e-07, - "loss": 0.514, - "step": 76267 - }, - { - "epoch": 1.95, - "learning_rate": 5.718946823553663e-07, - "loss": 0.6982, - "step": 76268 - }, - { - "epoch": 1.95, - "learning_rate": 5.718696759317398e-07, - "loss": 0.4802, - "step": 76269 - }, - { - "epoch": 1.95, - "learning_rate": 5.718446698359129e-07, - "loss": 0.6543, - "step": 76270 - }, - { - "epoch": 1.95, - "learning_rate": 5.718196640679054e-07, - "loss": 0.5066, - "step": 76271 - }, - { - "epoch": 1.95, - "learning_rate": 5.717946586277357e-07, - "loss": 0.6855, - "step": 76272 - }, - { - "epoch": 1.95, - "learning_rate": 5.717696535154228e-07, - "loss": 0.519, - "step": 76273 - }, - { - "epoch": 1.95, - "learning_rate": 5.717446487309863e-07, - "loss": 0.5811, - "step": 76274 - }, - { - "epoch": 1.95, - "learning_rate": 5.717196442744454e-07, - "loss": 0.5303, - "step": 76275 - }, - { - "epoch": 1.95, - "learning_rate": 5.71694640145819e-07, - "loss": 0.8125, - "step": 76276 - }, - { - "epoch": 1.96, - "learning_rate": 5.716696363451262e-07, - "loss": 0.4849, - "step": 76277 - }, - { - "epoch": 1.96, - "learning_rate": 5.716446328723861e-07, - "loss": 0.4553, - "step": 76278 - }, - { - "epoch": 1.96, - "learning_rate": 5.716196297276185e-07, - "loss": 0.6943, - "step": 76279 - }, - { - "epoch": 1.96, - "learning_rate": 5.715946269108416e-07, - "loss": 0.6885, - "step": 76280 - }, - { - "epoch": 1.96, - "learning_rate": 5.715696244220754e-07, - "loss": 0.5811, - "step": 76281 - }, - { - "epoch": 1.96, - "learning_rate": 5.715446222613384e-07, - "loss": 0.4639, - "step": 76282 - }, - { - "epoch": 1.96, - "learning_rate": 5.715196204286499e-07, - "loss": 0.627, - "step": 76283 - }, - { - "epoch": 1.96, - "learning_rate": 5.714946189240295e-07, - "loss": 0.6504, - "step": 76284 - }, - { - "epoch": 1.96, - "learning_rate": 5.714696177474956e-07, - "loss": 0.5247, - "step": 76285 - }, - { - "epoch": 1.96, - "learning_rate": 5.714446168990677e-07, - "loss": 0.665, - "step": 76286 - }, - { - "epoch": 1.96, - "learning_rate": 5.714196163787648e-07, - "loss": 0.5455, - "step": 76287 - }, - { - "epoch": 1.96, - "learning_rate": 5.713946161866068e-07, - "loss": 0.7598, - "step": 76288 - }, - { - "epoch": 1.96, - "learning_rate": 5.713696163226117e-07, - "loss": 0.45, - "step": 76289 - }, - { - "epoch": 1.96, - "learning_rate": 5.713446167867993e-07, - "loss": 0.5854, - "step": 76290 - }, - { - "epoch": 1.96, - "learning_rate": 5.713196175791889e-07, - "loss": 0.7061, - "step": 76291 - }, - { - "epoch": 1.96, - "learning_rate": 5.712946186997993e-07, - "loss": 0.5183, - "step": 76292 - }, - { - "epoch": 1.96, - "learning_rate": 5.712696201486496e-07, - "loss": 0.6543, - "step": 76293 - }, - { - "epoch": 1.96, - "learning_rate": 5.712446219257587e-07, - "loss": 0.5669, - "step": 76294 - }, - { - "epoch": 1.96, - "learning_rate": 5.712196240311462e-07, - "loss": 0.75, - "step": 76295 - }, - { - "epoch": 1.96, - "learning_rate": 5.711946264648316e-07, - "loss": 0.6064, - "step": 76296 - }, - { - "epoch": 1.96, - "learning_rate": 5.711696292268331e-07, - "loss": 0.6953, - "step": 76297 - }, - { - "epoch": 1.96, - "learning_rate": 5.711446323171703e-07, - "loss": 0.6816, - "step": 76298 - }, - { - "epoch": 1.96, - "learning_rate": 5.711196357358623e-07, - "loss": 0.575, - "step": 76299 - }, - { - "epoch": 1.96, - "learning_rate": 5.710946394829288e-07, - "loss": 0.6519, - "step": 76300 - }, - { - "epoch": 1.96, - "learning_rate": 5.710696435583883e-07, - "loss": 0.7383, - "step": 76301 - }, - { - "epoch": 1.96, - "learning_rate": 5.710446479622597e-07, - "loss": 0.6345, - "step": 76302 - }, - { - "epoch": 1.96, - "learning_rate": 5.710196526945623e-07, - "loss": 0.3068, - "step": 76303 - }, - { - "epoch": 1.96, - "learning_rate": 5.709946577553157e-07, - "loss": 0.536, - "step": 76304 - }, - { - "epoch": 1.96, - "learning_rate": 5.709696631445391e-07, - "loss": 0.6631, - "step": 76305 - }, - { - "epoch": 1.96, - "learning_rate": 5.709446688622508e-07, - "loss": 0.6782, - "step": 76306 - }, - { - "epoch": 1.96, - "learning_rate": 5.709196749084705e-07, - "loss": 0.5273, - "step": 76307 - }, - { - "epoch": 1.96, - "learning_rate": 5.708946812832172e-07, - "loss": 0.6582, - "step": 76308 - }, - { - "epoch": 1.96, - "learning_rate": 5.708696879865107e-07, - "loss": 0.7144, - "step": 76309 - }, - { - "epoch": 1.96, - "learning_rate": 5.70844695018369e-07, - "loss": 0.5322, - "step": 76310 - }, - { - "epoch": 1.96, - "learning_rate": 5.708197023788122e-07, - "loss": 0.7061, - "step": 76311 - }, - { - "epoch": 1.96, - "learning_rate": 5.707947100678585e-07, - "loss": 0.6738, - "step": 76312 - }, - { - "epoch": 1.96, - "learning_rate": 5.707697180855283e-07, - "loss": 0.6582, - "step": 76313 - }, - { - "epoch": 1.96, - "learning_rate": 5.707447264318392e-07, - "loss": 0.5322, - "step": 76314 - }, - { - "epoch": 1.96, - "learning_rate": 5.707197351068114e-07, - "loss": 0.4272, - "step": 76315 - }, - { - "epoch": 1.96, - "learning_rate": 5.706947441104636e-07, - "loss": 0.6274, - "step": 76316 - }, - { - "epoch": 1.96, - "learning_rate": 5.706697534428156e-07, - "loss": 0.6123, - "step": 76317 - }, - { - "epoch": 1.96, - "learning_rate": 5.706447631038856e-07, - "loss": 0.6289, - "step": 76318 - }, - { - "epoch": 1.96, - "learning_rate": 5.70619773093693e-07, - "loss": 0.6743, - "step": 76319 - }, - { - "epoch": 1.96, - "learning_rate": 5.705947834122573e-07, - "loss": 0.707, - "step": 76320 - }, - { - "epoch": 1.96, - "learning_rate": 5.705697940595978e-07, - "loss": 0.6172, - "step": 76321 - }, - { - "epoch": 1.96, - "learning_rate": 5.705448050357333e-07, - "loss": 0.4956, - "step": 76322 - }, - { - "epoch": 1.96, - "learning_rate": 5.705198163406823e-07, - "loss": 0.5723, - "step": 76323 - }, - { - "epoch": 1.96, - "learning_rate": 5.704948279744648e-07, - "loss": 0.5889, - "step": 76324 - }, - { - "epoch": 1.96, - "learning_rate": 5.704698399370995e-07, - "loss": 0.7798, - "step": 76325 - }, - { - "epoch": 1.96, - "learning_rate": 5.704448522286061e-07, - "loss": 0.4175, - "step": 76326 - }, - { - "epoch": 1.96, - "learning_rate": 5.704198648490029e-07, - "loss": 0.7588, - "step": 76327 - }, - { - "epoch": 1.96, - "learning_rate": 5.703948777983095e-07, - "loss": 0.6611, - "step": 76328 - }, - { - "epoch": 1.96, - "learning_rate": 5.703698910765453e-07, - "loss": 0.4756, - "step": 76329 - }, - { - "epoch": 1.96, - "learning_rate": 5.703449046837288e-07, - "loss": 0.7891, - "step": 76330 - }, - { - "epoch": 1.96, - "learning_rate": 5.703199186198799e-07, - "loss": 0.6123, - "step": 76331 - }, - { - "epoch": 1.96, - "learning_rate": 5.702949328850169e-07, - "loss": 0.5437, - "step": 76332 - }, - { - "epoch": 1.96, - "learning_rate": 5.702699474791592e-07, - "loss": 0.5449, - "step": 76333 - }, - { - "epoch": 1.96, - "learning_rate": 5.702449624023265e-07, - "loss": 0.7393, - "step": 76334 - }, - { - "epoch": 1.96, - "learning_rate": 5.702199776545371e-07, - "loss": 0.5288, - "step": 76335 - }, - { - "epoch": 1.96, - "learning_rate": 5.701949932358105e-07, - "loss": 0.4708, - "step": 76336 - }, - { - "epoch": 1.96, - "learning_rate": 5.701700091461657e-07, - "loss": 0.6641, - "step": 76337 - }, - { - "epoch": 1.96, - "learning_rate": 5.701450253856225e-07, - "loss": 0.6562, - "step": 76338 - }, - { - "epoch": 1.96, - "learning_rate": 5.701200419541989e-07, - "loss": 0.5479, - "step": 76339 - }, - { - "epoch": 1.96, - "learning_rate": 5.700950588519148e-07, - "loss": 0.7354, - "step": 76340 - }, - { - "epoch": 1.96, - "learning_rate": 5.700700760787896e-07, - "loss": 0.6621, - "step": 76341 - }, - { - "epoch": 1.96, - "learning_rate": 5.700450936348414e-07, - "loss": 0.5952, - "step": 76342 - }, - { - "epoch": 1.96, - "learning_rate": 5.700201115200905e-07, - "loss": 0.4946, - "step": 76343 - }, - { - "epoch": 1.96, - "learning_rate": 5.699951297345549e-07, - "loss": 0.7422, - "step": 76344 - }, - { - "epoch": 1.96, - "learning_rate": 5.699701482782542e-07, - "loss": 0.665, - "step": 76345 - }, - { - "epoch": 1.96, - "learning_rate": 5.699451671512081e-07, - "loss": 0.7842, - "step": 76346 - }, - { - "epoch": 1.96, - "learning_rate": 5.699201863534348e-07, - "loss": 0.6045, - "step": 76347 - }, - { - "epoch": 1.96, - "learning_rate": 5.698952058849538e-07, - "loss": 0.6475, - "step": 76348 - }, - { - "epoch": 1.96, - "learning_rate": 5.698702257457842e-07, - "loss": 0.6714, - "step": 76349 - }, - { - "epoch": 1.96, - "learning_rate": 5.698452459359456e-07, - "loss": 0.5635, - "step": 76350 - }, - { - "epoch": 1.96, - "learning_rate": 5.698202664554568e-07, - "loss": 0.751, - "step": 76351 - }, - { - "epoch": 1.96, - "learning_rate": 5.697952873043365e-07, - "loss": 0.605, - "step": 76352 - }, - { - "epoch": 1.96, - "learning_rate": 5.69770308482604e-07, - "loss": 0.3298, - "step": 76353 - }, - { - "epoch": 1.96, - "learning_rate": 5.697453299902787e-07, - "loss": 0.6543, - "step": 76354 - }, - { - "epoch": 1.96, - "learning_rate": 5.6972035182738e-07, - "loss": 0.8066, - "step": 76355 - }, - { - "epoch": 1.96, - "learning_rate": 5.696953739939262e-07, - "loss": 0.7539, - "step": 76356 - }, - { - "epoch": 1.96, - "learning_rate": 5.69670396489937e-07, - "loss": 0.606, - "step": 76357 - }, - { - "epoch": 1.96, - "learning_rate": 5.696454193154312e-07, - "loss": 0.6724, - "step": 76358 - }, - { - "epoch": 1.96, - "learning_rate": 5.696204424704285e-07, - "loss": 0.5645, - "step": 76359 - }, - { - "epoch": 1.96, - "learning_rate": 5.695954659549475e-07, - "loss": 0.6235, - "step": 76360 - }, - { - "epoch": 1.96, - "learning_rate": 5.695704897690077e-07, - "loss": 0.7031, - "step": 76361 - }, - { - "epoch": 1.96, - "learning_rate": 5.695455139126275e-07, - "loss": 0.6289, - "step": 76362 - }, - { - "epoch": 1.96, - "learning_rate": 5.695205383858271e-07, - "loss": 0.7539, - "step": 76363 - }, - { - "epoch": 1.96, - "learning_rate": 5.694955631886245e-07, - "loss": 0.6777, - "step": 76364 - }, - { - "epoch": 1.96, - "learning_rate": 5.694705883210393e-07, - "loss": 0.7803, - "step": 76365 - }, - { - "epoch": 1.96, - "learning_rate": 5.694456137830907e-07, - "loss": 0.4316, - "step": 76366 - }, - { - "epoch": 1.96, - "learning_rate": 5.694206395747983e-07, - "loss": 0.7349, - "step": 76367 - }, - { - "epoch": 1.96, - "learning_rate": 5.693956656961802e-07, - "loss": 0.7939, - "step": 76368 - }, - { - "epoch": 1.96, - "learning_rate": 5.69370692147256e-07, - "loss": 0.6855, - "step": 76369 - }, - { - "epoch": 1.96, - "learning_rate": 5.69345718928045e-07, - "loss": 0.6499, - "step": 76370 - }, - { - "epoch": 1.96, - "learning_rate": 5.693207460385668e-07, - "loss": 0.6904, - "step": 76371 - }, - { - "epoch": 1.96, - "learning_rate": 5.692957734788395e-07, - "loss": 0.7461, - "step": 76372 - }, - { - "epoch": 1.96, - "learning_rate": 5.692708012488824e-07, - "loss": 0.4565, - "step": 76373 - }, - { - "epoch": 1.96, - "learning_rate": 5.692458293487148e-07, - "loss": 0.5996, - "step": 76374 - }, - { - "epoch": 1.96, - "learning_rate": 5.692208577783558e-07, - "loss": 0.5718, - "step": 76375 - }, - { - "epoch": 1.96, - "learning_rate": 5.69195886537825e-07, - "loss": 0.6035, - "step": 76376 - }, - { - "epoch": 1.96, - "learning_rate": 5.691709156271409e-07, - "loss": 0.6167, - "step": 76377 - }, - { - "epoch": 1.96, - "learning_rate": 5.691459450463226e-07, - "loss": 0.6143, - "step": 76378 - }, - { - "epoch": 1.96, - "learning_rate": 5.691209747953896e-07, - "loss": 0.6313, - "step": 76379 - }, - { - "epoch": 1.96, - "learning_rate": 5.690960048743612e-07, - "loss": 0.55, - "step": 76380 - }, - { - "epoch": 1.96, - "learning_rate": 5.69071035283256e-07, - "loss": 0.6758, - "step": 76381 - }, - { - "epoch": 1.96, - "learning_rate": 5.690460660220931e-07, - "loss": 0.5581, - "step": 76382 - }, - { - "epoch": 1.96, - "learning_rate": 5.690210970908918e-07, - "loss": 0.4736, - "step": 76383 - }, - { - "epoch": 1.96, - "learning_rate": 5.689961284896715e-07, - "loss": 0.7383, - "step": 76384 - }, - { - "epoch": 1.96, - "learning_rate": 5.689711602184507e-07, - "loss": 0.666, - "step": 76385 - }, - { - "epoch": 1.96, - "learning_rate": 5.689461922772489e-07, - "loss": 0.4299, - "step": 76386 - }, - { - "epoch": 1.96, - "learning_rate": 5.689212246660852e-07, - "loss": 0.6533, - "step": 76387 - }, - { - "epoch": 1.96, - "learning_rate": 5.688962573849791e-07, - "loss": 0.6572, - "step": 76388 - }, - { - "epoch": 1.96, - "learning_rate": 5.688712904339487e-07, - "loss": 0.5532, - "step": 76389 - }, - { - "epoch": 1.96, - "learning_rate": 5.688463238130141e-07, - "loss": 0.6167, - "step": 76390 - }, - { - "epoch": 1.96, - "learning_rate": 5.688213575221942e-07, - "loss": 0.5942, - "step": 76391 - }, - { - "epoch": 1.96, - "learning_rate": 5.687963915615076e-07, - "loss": 0.5898, - "step": 76392 - }, - { - "epoch": 1.96, - "learning_rate": 5.687714259309742e-07, - "loss": 0.5879, - "step": 76393 - }, - { - "epoch": 1.96, - "learning_rate": 5.687464606306122e-07, - "loss": 0.5557, - "step": 76394 - }, - { - "epoch": 1.96, - "learning_rate": 5.687214956604413e-07, - "loss": 0.6787, - "step": 76395 - }, - { - "epoch": 1.96, - "learning_rate": 5.686965310204806e-07, - "loss": 0.6855, - "step": 76396 - }, - { - "epoch": 1.96, - "learning_rate": 5.686715667107493e-07, - "loss": 0.5105, - "step": 76397 - }, - { - "epoch": 1.96, - "learning_rate": 5.686466027312662e-07, - "loss": 0.6812, - "step": 76398 - }, - { - "epoch": 1.96, - "learning_rate": 5.686216390820504e-07, - "loss": 0.5654, - "step": 76399 - }, - { - "epoch": 1.96, - "learning_rate": 5.685966757631213e-07, - "loss": 0.6138, - "step": 76400 - }, - { - "epoch": 1.96, - "learning_rate": 5.685717127744986e-07, - "loss": 0.5986, - "step": 76401 - }, - { - "epoch": 1.96, - "learning_rate": 5.685467501161998e-07, - "loss": 0.5947, - "step": 76402 - }, - { - "epoch": 1.96, - "learning_rate": 5.685217877882451e-07, - "loss": 0.6592, - "step": 76403 - }, - { - "epoch": 1.96, - "learning_rate": 5.684968257906532e-07, - "loss": 0.6992, - "step": 76404 - }, - { - "epoch": 1.96, - "learning_rate": 5.684718641234442e-07, - "loss": 0.8682, - "step": 76405 - }, - { - "epoch": 1.96, - "learning_rate": 5.684469027866359e-07, - "loss": 0.5171, - "step": 76406 - }, - { - "epoch": 1.96, - "learning_rate": 5.684219417802478e-07, - "loss": 0.7822, - "step": 76407 - }, - { - "epoch": 1.96, - "learning_rate": 5.683969811042993e-07, - "loss": 0.5869, - "step": 76408 - }, - { - "epoch": 1.96, - "learning_rate": 5.683720207588098e-07, - "loss": 0.4561, - "step": 76409 - }, - { - "epoch": 1.96, - "learning_rate": 5.683470607437975e-07, - "loss": 0.5913, - "step": 76410 - }, - { - "epoch": 1.96, - "learning_rate": 5.683221010592825e-07, - "loss": 0.5288, - "step": 76411 - }, - { - "epoch": 1.96, - "learning_rate": 5.68297141705283e-07, - "loss": 0.5007, - "step": 76412 - }, - { - "epoch": 1.96, - "learning_rate": 5.682721826818186e-07, - "loss": 0.6074, - "step": 76413 - }, - { - "epoch": 1.96, - "learning_rate": 5.682472239889085e-07, - "loss": 0.6748, - "step": 76414 - }, - { - "epoch": 1.96, - "learning_rate": 5.682222656265714e-07, - "loss": 0.5879, - "step": 76415 - }, - { - "epoch": 1.96, - "learning_rate": 5.681973075948268e-07, - "loss": 0.5435, - "step": 76416 - }, - { - "epoch": 1.96, - "learning_rate": 5.681723498936934e-07, - "loss": 0.7432, - "step": 76417 - }, - { - "epoch": 1.96, - "learning_rate": 5.681473925231913e-07, - "loss": 0.5645, - "step": 76418 - }, - { - "epoch": 1.96, - "learning_rate": 5.681224354833383e-07, - "loss": 0.6392, - "step": 76419 - }, - { - "epoch": 1.96, - "learning_rate": 5.680974787741539e-07, - "loss": 0.6611, - "step": 76420 - }, - { - "epoch": 1.96, - "learning_rate": 5.680725223956581e-07, - "loss": 0.6963, - "step": 76421 - }, - { - "epoch": 1.96, - "learning_rate": 5.680475663478692e-07, - "loss": 0.645, - "step": 76422 - }, - { - "epoch": 1.96, - "learning_rate": 5.680226106308059e-07, - "loss": 0.7812, - "step": 76423 - }, - { - "epoch": 1.96, - "learning_rate": 5.679976552444881e-07, - "loss": 0.6348, - "step": 76424 - }, - { - "epoch": 1.96, - "learning_rate": 5.679727001889344e-07, - "loss": 0.4902, - "step": 76425 - }, - { - "epoch": 1.96, - "learning_rate": 5.679477454641646e-07, - "loss": 0.4763, - "step": 76426 - }, - { - "epoch": 1.96, - "learning_rate": 5.679227910701969e-07, - "loss": 0.7529, - "step": 76427 - }, - { - "epoch": 1.96, - "learning_rate": 5.67897837007051e-07, - "loss": 0.5468, - "step": 76428 - }, - { - "epoch": 1.96, - "learning_rate": 5.678728832747457e-07, - "loss": 0.7949, - "step": 76429 - }, - { - "epoch": 1.96, - "learning_rate": 5.678479298733008e-07, - "loss": 0.7231, - "step": 76430 - }, - { - "epoch": 1.96, - "learning_rate": 5.678229768027347e-07, - "loss": 0.7256, - "step": 76431 - }, - { - "epoch": 1.96, - "learning_rate": 5.677980240630664e-07, - "loss": 0.502, - "step": 76432 - }, - { - "epoch": 1.96, - "learning_rate": 5.677730716543152e-07, - "loss": 0.501, - "step": 76433 - }, - { - "epoch": 1.96, - "learning_rate": 5.677481195765004e-07, - "loss": 0.7207, - "step": 76434 - }, - { - "epoch": 1.96, - "learning_rate": 5.677231678296412e-07, - "loss": 0.5815, - "step": 76435 - }, - { - "epoch": 1.96, - "learning_rate": 5.676982164137563e-07, - "loss": 0.5083, - "step": 76436 - }, - { - "epoch": 1.96, - "learning_rate": 5.67673265328865e-07, - "loss": 0.6133, - "step": 76437 - }, - { - "epoch": 1.96, - "learning_rate": 5.676483145749866e-07, - "loss": 0.5962, - "step": 76438 - }, - { - "epoch": 1.96, - "learning_rate": 5.676233641521397e-07, - "loss": 0.2526, - "step": 76439 - }, - { - "epoch": 1.96, - "learning_rate": 5.675984140603438e-07, - "loss": 0.6582, - "step": 76440 - }, - { - "epoch": 1.96, - "learning_rate": 5.675734642996183e-07, - "loss": 0.5905, - "step": 76441 - }, - { - "epoch": 1.96, - "learning_rate": 5.675485148699815e-07, - "loss": 0.7065, - "step": 76442 - }, - { - "epoch": 1.96, - "learning_rate": 5.675235657714533e-07, - "loss": 0.666, - "step": 76443 - }, - { - "epoch": 1.96, - "learning_rate": 5.674986170040519e-07, - "loss": 0.6875, - "step": 76444 - }, - { - "epoch": 1.96, - "learning_rate": 5.674736685677969e-07, - "loss": 0.5938, - "step": 76445 - }, - { - "epoch": 1.96, - "learning_rate": 5.674487204627076e-07, - "loss": 0.4949, - "step": 76446 - }, - { - "epoch": 1.96, - "learning_rate": 5.674237726888034e-07, - "loss": 0.5356, - "step": 76447 - }, - { - "epoch": 1.96, - "learning_rate": 5.673988252461023e-07, - "loss": 0.5752, - "step": 76448 - }, - { - "epoch": 1.96, - "learning_rate": 5.673738781346241e-07, - "loss": 0.7578, - "step": 76449 - }, - { - "epoch": 1.96, - "learning_rate": 5.673489313543879e-07, - "loss": 0.6738, - "step": 76450 - }, - { - "epoch": 1.96, - "learning_rate": 5.67323984905413e-07, - "loss": 0.4731, - "step": 76451 - }, - { - "epoch": 1.96, - "learning_rate": 5.672990387877184e-07, - "loss": 0.5957, - "step": 76452 - }, - { - "epoch": 1.96, - "learning_rate": 5.672740930013224e-07, - "loss": 0.8057, - "step": 76453 - }, - { - "epoch": 1.96, - "learning_rate": 5.67249147546245e-07, - "loss": 0.5112, - "step": 76454 - }, - { - "epoch": 1.96, - "learning_rate": 5.672242024225053e-07, - "loss": 0.6577, - "step": 76455 - }, - { - "epoch": 1.96, - "learning_rate": 5.671992576301217e-07, - "loss": 0.7451, - "step": 76456 - }, - { - "epoch": 1.96, - "learning_rate": 5.671743131691138e-07, - "loss": 0.7373, - "step": 76457 - }, - { - "epoch": 1.96, - "learning_rate": 5.671493690395005e-07, - "loss": 0.5938, - "step": 76458 - }, - { - "epoch": 1.96, - "learning_rate": 5.671244252413016e-07, - "loss": 0.8135, - "step": 76459 - }, - { - "epoch": 1.96, - "learning_rate": 5.67099481774535e-07, - "loss": 0.4883, - "step": 76460 - }, - { - "epoch": 1.96, - "learning_rate": 5.67074538639221e-07, - "loss": 0.7031, - "step": 76461 - }, - { - "epoch": 1.96, - "learning_rate": 5.670495958353777e-07, - "loss": 0.625, - "step": 76462 - }, - { - "epoch": 1.96, - "learning_rate": 5.670246533630246e-07, - "loss": 0.5034, - "step": 76463 - }, - { - "epoch": 1.96, - "learning_rate": 5.669997112221811e-07, - "loss": 0.6104, - "step": 76464 - }, - { - "epoch": 1.96, - "learning_rate": 5.669747694128657e-07, - "loss": 0.6392, - "step": 76465 - }, - { - "epoch": 1.96, - "learning_rate": 5.669498279350979e-07, - "loss": 0.5122, - "step": 76466 - }, - { - "epoch": 1.96, - "learning_rate": 5.669248867888966e-07, - "loss": 0.7529, - "step": 76467 - }, - { - "epoch": 1.96, - "learning_rate": 5.668999459742815e-07, - "loss": 0.6592, - "step": 76468 - }, - { - "epoch": 1.96, - "learning_rate": 5.668750054912706e-07, - "loss": 0.4417, - "step": 76469 - }, - { - "epoch": 1.96, - "learning_rate": 5.668500653398838e-07, - "loss": 0.6294, - "step": 76470 - }, - { - "epoch": 1.96, - "learning_rate": 5.668251255201403e-07, - "loss": 0.5957, - "step": 76471 - }, - { - "epoch": 1.96, - "learning_rate": 5.668001860320588e-07, - "loss": 0.7012, - "step": 76472 - }, - { - "epoch": 1.96, - "learning_rate": 5.667752468756582e-07, - "loss": 0.7676, - "step": 76473 - }, - { - "epoch": 1.96, - "learning_rate": 5.667503080509579e-07, - "loss": 0.4302, - "step": 76474 - }, - { - "epoch": 1.96, - "learning_rate": 5.66725369557977e-07, - "loss": 0.6079, - "step": 76475 - }, - { - "epoch": 1.96, - "learning_rate": 5.667004313967348e-07, - "loss": 0.6416, - "step": 76476 - }, - { - "epoch": 1.96, - "learning_rate": 5.666754935672498e-07, - "loss": 0.7295, - "step": 76477 - }, - { - "epoch": 1.96, - "learning_rate": 5.666505560695415e-07, - "loss": 0.5419, - "step": 76478 - }, - { - "epoch": 1.96, - "learning_rate": 5.666256189036289e-07, - "loss": 0.6572, - "step": 76479 - }, - { - "epoch": 1.96, - "learning_rate": 5.666006820695315e-07, - "loss": 0.5571, - "step": 76480 - }, - { - "epoch": 1.96, - "learning_rate": 5.665757455672681e-07, - "loss": 0.6787, - "step": 76481 - }, - { - "epoch": 1.96, - "learning_rate": 5.665508093968574e-07, - "loss": 0.5806, - "step": 76482 - }, - { - "epoch": 1.96, - "learning_rate": 5.665258735583187e-07, - "loss": 0.6743, - "step": 76483 - }, - { - "epoch": 1.96, - "learning_rate": 5.665009380516712e-07, - "loss": 0.7588, - "step": 76484 - }, - { - "epoch": 1.96, - "learning_rate": 5.664760028769345e-07, - "loss": 0.6094, - "step": 76485 - }, - { - "epoch": 1.96, - "learning_rate": 5.664510680341266e-07, - "loss": 0.563, - "step": 76486 - }, - { - "epoch": 1.96, - "learning_rate": 5.664261335232674e-07, - "loss": 0.6143, - "step": 76487 - }, - { - "epoch": 1.96, - "learning_rate": 5.664011993443755e-07, - "loss": 0.5957, - "step": 76488 - }, - { - "epoch": 1.96, - "learning_rate": 5.663762654974709e-07, - "loss": 0.7031, - "step": 76489 - }, - { - "epoch": 1.96, - "learning_rate": 5.663513319825717e-07, - "loss": 0.6787, - "step": 76490 - }, - { - "epoch": 1.96, - "learning_rate": 5.663263987996976e-07, - "loss": 0.5237, - "step": 76491 - }, - { - "epoch": 1.96, - "learning_rate": 5.66301465948867e-07, - "loss": 0.6162, - "step": 76492 - }, - { - "epoch": 1.96, - "learning_rate": 5.662765334300999e-07, - "loss": 0.5503, - "step": 76493 - }, - { - "epoch": 1.96, - "learning_rate": 5.662516012434146e-07, - "loss": 0.4863, - "step": 76494 - }, - { - "epoch": 1.96, - "learning_rate": 5.662266693888303e-07, - "loss": 0.6958, - "step": 76495 - }, - { - "epoch": 1.96, - "learning_rate": 5.662017378663665e-07, - "loss": 0.5942, - "step": 76496 - }, - { - "epoch": 1.96, - "learning_rate": 5.661768066760424e-07, - "loss": 0.5059, - "step": 76497 - }, - { - "epoch": 1.96, - "learning_rate": 5.661518758178763e-07, - "loss": 0.5947, - "step": 76498 - }, - { - "epoch": 1.96, - "learning_rate": 5.661269452918879e-07, - "loss": 0.79, - "step": 76499 - }, - { - "epoch": 1.96, - "learning_rate": 5.661020150980961e-07, - "loss": 0.6445, - "step": 76500 - }, - { - "epoch": 1.96, - "learning_rate": 5.660770852365205e-07, - "loss": 0.5664, - "step": 76501 - }, - { - "epoch": 1.96, - "learning_rate": 5.660521557071796e-07, - "loss": 0.4646, - "step": 76502 - }, - { - "epoch": 1.96, - "learning_rate": 5.660272265100922e-07, - "loss": 0.5557, - "step": 76503 - }, - { - "epoch": 1.96, - "learning_rate": 5.660022976452779e-07, - "loss": 0.3943, - "step": 76504 - }, - { - "epoch": 1.96, - "learning_rate": 5.659773691127555e-07, - "loss": 0.707, - "step": 76505 - }, - { - "epoch": 1.96, - "learning_rate": 5.659524409125448e-07, - "loss": 0.5864, - "step": 76506 - }, - { - "epoch": 1.96, - "learning_rate": 5.65927513044664e-07, - "loss": 0.5276, - "step": 76507 - }, - { - "epoch": 1.96, - "learning_rate": 5.659025855091324e-07, - "loss": 0.6211, - "step": 76508 - }, - { - "epoch": 1.96, - "learning_rate": 5.658776583059698e-07, - "loss": 0.7666, - "step": 76509 - }, - { - "epoch": 1.96, - "learning_rate": 5.658527314351942e-07, - "loss": 0.5854, - "step": 76510 - }, - { - "epoch": 1.96, - "learning_rate": 5.658278048968257e-07, - "loss": 0.5098, - "step": 76511 - }, - { - "epoch": 1.96, - "learning_rate": 5.658028786908824e-07, - "loss": 0.6499, - "step": 76512 - }, - { - "epoch": 1.96, - "learning_rate": 5.657779528173839e-07, - "loss": 0.6636, - "step": 76513 - }, - { - "epoch": 1.96, - "learning_rate": 5.657530272763498e-07, - "loss": 0.6113, - "step": 76514 - }, - { - "epoch": 1.96, - "learning_rate": 5.65728102067798e-07, - "loss": 0.5908, - "step": 76515 - }, - { - "epoch": 1.96, - "learning_rate": 5.657031771917483e-07, - "loss": 0.5328, - "step": 76516 - }, - { - "epoch": 1.96, - "learning_rate": 5.656782526482197e-07, - "loss": 0.5796, - "step": 76517 - }, - { - "epoch": 1.96, - "learning_rate": 5.656533284372318e-07, - "loss": 0.7617, - "step": 76518 - }, - { - "epoch": 1.96, - "learning_rate": 5.656284045588027e-07, - "loss": 0.5605, - "step": 76519 - }, - { - "epoch": 1.96, - "learning_rate": 5.656034810129519e-07, - "loss": 0.5586, - "step": 76520 - }, - { - "epoch": 1.96, - "learning_rate": 5.65578557799699e-07, - "loss": 0.7354, - "step": 76521 - }, - { - "epoch": 1.96, - "learning_rate": 5.655536349190622e-07, - "loss": 0.5752, - "step": 76522 - }, - { - "epoch": 1.96, - "learning_rate": 5.655287123710615e-07, - "loss": 0.8037, - "step": 76523 - }, - { - "epoch": 1.96, - "learning_rate": 5.65503790155715e-07, - "loss": 0.6885, - "step": 76524 - }, - { - "epoch": 1.96, - "learning_rate": 5.654788682730423e-07, - "loss": 0.6875, - "step": 76525 - }, - { - "epoch": 1.96, - "learning_rate": 5.654539467230628e-07, - "loss": 0.5112, - "step": 76526 - }, - { - "epoch": 1.96, - "learning_rate": 5.654290255057949e-07, - "loss": 0.5498, - "step": 76527 - }, - { - "epoch": 1.96, - "learning_rate": 5.654041046212579e-07, - "loss": 0.6299, - "step": 76528 - }, - { - "epoch": 1.96, - "learning_rate": 5.65379184069471e-07, - "loss": 0.709, - "step": 76529 - }, - { - "epoch": 1.96, - "learning_rate": 5.653542638504538e-07, - "loss": 0.5508, - "step": 76530 - }, - { - "epoch": 1.96, - "learning_rate": 5.653293439642249e-07, - "loss": 0.6221, - "step": 76531 - }, - { - "epoch": 1.96, - "learning_rate": 5.653044244108027e-07, - "loss": 0.5698, - "step": 76532 - }, - { - "epoch": 1.96, - "learning_rate": 5.652795051902071e-07, - "loss": 0.6621, - "step": 76533 - }, - { - "epoch": 1.96, - "learning_rate": 5.65254586302457e-07, - "loss": 0.708, - "step": 76534 - }, - { - "epoch": 1.96, - "learning_rate": 5.652296677475718e-07, - "loss": 0.5479, - "step": 76535 - }, - { - "epoch": 1.96, - "learning_rate": 5.652047495255698e-07, - "loss": 0.6948, - "step": 76536 - }, - { - "epoch": 1.96, - "learning_rate": 5.651798316364706e-07, - "loss": 0.6885, - "step": 76537 - }, - { - "epoch": 1.96, - "learning_rate": 5.651549140802933e-07, - "loss": 0.7969, - "step": 76538 - }, - { - "epoch": 1.96, - "learning_rate": 5.651299968570571e-07, - "loss": 0.8223, - "step": 76539 - }, - { - "epoch": 1.96, - "learning_rate": 5.651050799667807e-07, - "loss": 0.4761, - "step": 76540 - }, - { - "epoch": 1.96, - "learning_rate": 5.650801634094835e-07, - "loss": 0.6484, - "step": 76541 - }, - { - "epoch": 1.96, - "learning_rate": 5.650552471851841e-07, - "loss": 0.5181, - "step": 76542 - }, - { - "epoch": 1.96, - "learning_rate": 5.650303312939024e-07, - "loss": 0.4188, - "step": 76543 - }, - { - "epoch": 1.96, - "learning_rate": 5.650054157356565e-07, - "loss": 0.6353, - "step": 76544 - }, - { - "epoch": 1.96, - "learning_rate": 5.64980500510466e-07, - "loss": 0.5269, - "step": 76545 - }, - { - "epoch": 1.96, - "learning_rate": 5.649555856183499e-07, - "loss": 0.6221, - "step": 76546 - }, - { - "epoch": 1.96, - "learning_rate": 5.649306710593275e-07, - "loss": 0.7119, - "step": 76547 - }, - { - "epoch": 1.96, - "learning_rate": 5.649057568334175e-07, - "loss": 0.624, - "step": 76548 - }, - { - "epoch": 1.96, - "learning_rate": 5.648808429406391e-07, - "loss": 0.5654, - "step": 76549 - }, - { - "epoch": 1.96, - "learning_rate": 5.648559293810119e-07, - "loss": 0.4025, - "step": 76550 - }, - { - "epoch": 1.96, - "learning_rate": 5.648310161545541e-07, - "loss": 0.7305, - "step": 76551 - }, - { - "epoch": 1.96, - "learning_rate": 5.648061032612855e-07, - "loss": 0.67, - "step": 76552 - }, - { - "epoch": 1.96, - "learning_rate": 5.647811907012245e-07, - "loss": 0.5811, - "step": 76553 - }, - { - "epoch": 1.96, - "learning_rate": 5.647562784743904e-07, - "loss": 0.7998, - "step": 76554 - }, - { - "epoch": 1.96, - "learning_rate": 5.647313665808027e-07, - "loss": 0.6841, - "step": 76555 - }, - { - "epoch": 1.96, - "learning_rate": 5.647064550204803e-07, - "loss": 0.5918, - "step": 76556 - }, - { - "epoch": 1.96, - "learning_rate": 5.64681543793442e-07, - "loss": 0.6709, - "step": 76557 - }, - { - "epoch": 1.96, - "learning_rate": 5.646566328997067e-07, - "loss": 0.8232, - "step": 76558 - }, - { - "epoch": 1.96, - "learning_rate": 5.64631722339294e-07, - "loss": 0.6533, - "step": 76559 - }, - { - "epoch": 1.96, - "learning_rate": 5.646068121122236e-07, - "loss": 0.813, - "step": 76560 - }, - { - "epoch": 1.96, - "learning_rate": 5.64581902218513e-07, - "loss": 0.5967, - "step": 76561 - }, - { - "epoch": 1.96, - "learning_rate": 5.645569926581819e-07, - "loss": 0.6929, - "step": 76562 - }, - { - "epoch": 1.96, - "learning_rate": 5.645320834312494e-07, - "loss": 0.6631, - "step": 76563 - }, - { - "epoch": 1.96, - "learning_rate": 5.645071745377352e-07, - "loss": 0.6025, - "step": 76564 - }, - { - "epoch": 1.96, - "learning_rate": 5.644822659776574e-07, - "loss": 0.5103, - "step": 76565 - }, - { - "epoch": 1.96, - "learning_rate": 5.644573577510355e-07, - "loss": 0.4298, - "step": 76566 - }, - { - "epoch": 1.96, - "learning_rate": 5.644324498578885e-07, - "loss": 0.5413, - "step": 76567 - }, - { - "epoch": 1.96, - "learning_rate": 5.644075422982362e-07, - "loss": 0.4941, - "step": 76568 - }, - { - "epoch": 1.96, - "learning_rate": 5.643826350720964e-07, - "loss": 0.2236, - "step": 76569 - }, - { - "epoch": 1.96, - "learning_rate": 5.643577281794892e-07, - "loss": 0.6299, - "step": 76570 - }, - { - "epoch": 1.96, - "learning_rate": 5.643328216204329e-07, - "loss": 0.6099, - "step": 76571 - }, - { - "epoch": 1.96, - "learning_rate": 5.643079153949469e-07, - "loss": 0.6074, - "step": 76572 - }, - { - "epoch": 1.96, - "learning_rate": 5.642830095030507e-07, - "loss": 0.6479, - "step": 76573 - }, - { - "epoch": 1.96, - "learning_rate": 5.642581039447624e-07, - "loss": 0.5516, - "step": 76574 - }, - { - "epoch": 1.96, - "learning_rate": 5.642331987201019e-07, - "loss": 0.5977, - "step": 76575 - }, - { - "epoch": 1.96, - "learning_rate": 5.64208293829088e-07, - "loss": 0.5703, - "step": 76576 - }, - { - "epoch": 1.96, - "learning_rate": 5.641833892717401e-07, - "loss": 0.5103, - "step": 76577 - }, - { - "epoch": 1.96, - "learning_rate": 5.641584850480764e-07, - "loss": 0.688, - "step": 76578 - }, - { - "epoch": 1.96, - "learning_rate": 5.641335811581166e-07, - "loss": 0.6426, - "step": 76579 - }, - { - "epoch": 1.96, - "learning_rate": 5.641086776018801e-07, - "loss": 0.5234, - "step": 76580 - }, - { - "epoch": 1.96, - "learning_rate": 5.640837743793856e-07, - "loss": 0.7178, - "step": 76581 - }, - { - "epoch": 1.96, - "learning_rate": 5.640588714906516e-07, - "loss": 0.7363, - "step": 76582 - }, - { - "epoch": 1.96, - "learning_rate": 5.640339689356977e-07, - "loss": 0.5449, - "step": 76583 - }, - { - "epoch": 1.96, - "learning_rate": 5.64009066714543e-07, - "loss": 0.5854, - "step": 76584 - }, - { - "epoch": 1.96, - "learning_rate": 5.639841648272068e-07, - "loss": 0.4961, - "step": 76585 - }, - { - "epoch": 1.96, - "learning_rate": 5.639592632737075e-07, - "loss": 0.7061, - "step": 76586 - }, - { - "epoch": 1.96, - "learning_rate": 5.639343620540647e-07, - "loss": 0.5356, - "step": 76587 - }, - { - "epoch": 1.96, - "learning_rate": 5.639094611682972e-07, - "loss": 0.5967, - "step": 76588 - }, - { - "epoch": 1.96, - "learning_rate": 5.638845606164245e-07, - "loss": 0.5293, - "step": 76589 - }, - { - "epoch": 1.96, - "learning_rate": 5.638596603984656e-07, - "loss": 0.5781, - "step": 76590 - }, - { - "epoch": 1.96, - "learning_rate": 5.638347605144386e-07, - "loss": 0.5591, - "step": 76591 - }, - { - "epoch": 1.96, - "learning_rate": 5.638098609643633e-07, - "loss": 0.6406, - "step": 76592 - }, - { - "epoch": 1.96, - "learning_rate": 5.637849617482588e-07, - "loss": 0.4321, - "step": 76593 - }, - { - "epoch": 1.96, - "learning_rate": 5.637600628661446e-07, - "loss": 0.5894, - "step": 76594 - }, - { - "epoch": 1.96, - "learning_rate": 5.637351643180388e-07, - "loss": 0.4649, - "step": 76595 - }, - { - "epoch": 1.96, - "learning_rate": 5.637102661039609e-07, - "loss": 0.4824, - "step": 76596 - }, - { - "epoch": 1.96, - "learning_rate": 5.6368536822393e-07, - "loss": 0.584, - "step": 76597 - }, - { - "epoch": 1.96, - "learning_rate": 5.636604706779656e-07, - "loss": 0.605, - "step": 76598 - }, - { - "epoch": 1.96, - "learning_rate": 5.636355734660858e-07, - "loss": 0.6377, - "step": 76599 - }, - { - "epoch": 1.96, - "learning_rate": 5.636106765883106e-07, - "loss": 0.4424, - "step": 76600 - }, - { - "epoch": 1.96, - "learning_rate": 5.635857800446583e-07, - "loss": 0.7197, - "step": 76601 - }, - { - "epoch": 1.96, - "learning_rate": 5.635608838351486e-07, - "loss": 0.75, - "step": 76602 - }, - { - "epoch": 1.96, - "learning_rate": 5.635359879598001e-07, - "loss": 0.4219, - "step": 76603 - }, - { - "epoch": 1.96, - "learning_rate": 5.635110924186317e-07, - "loss": 0.7891, - "step": 76604 - }, - { - "epoch": 1.96, - "learning_rate": 5.63486197211663e-07, - "loss": 0.7788, - "step": 76605 - }, - { - "epoch": 1.96, - "learning_rate": 5.634613023389132e-07, - "loss": 0.5713, - "step": 76606 - }, - { - "epoch": 1.96, - "learning_rate": 5.634364078004006e-07, - "loss": 0.6897, - "step": 76607 - }, - { - "epoch": 1.96, - "learning_rate": 5.634115135961447e-07, - "loss": 0.4546, - "step": 76608 - }, - { - "epoch": 1.96, - "learning_rate": 5.633866197261646e-07, - "loss": 0.5361, - "step": 76609 - }, - { - "epoch": 1.96, - "learning_rate": 5.633617261904795e-07, - "loss": 0.6631, - "step": 76610 - }, - { - "epoch": 1.96, - "learning_rate": 5.633368329891084e-07, - "loss": 0.605, - "step": 76611 - }, - { - "epoch": 1.96, - "learning_rate": 5.633119401220696e-07, - "loss": 0.6982, - "step": 76612 - }, - { - "epoch": 1.96, - "learning_rate": 5.63287047589383e-07, - "loss": 0.6958, - "step": 76613 - }, - { - "epoch": 1.96, - "learning_rate": 5.632621553910674e-07, - "loss": 0.6035, - "step": 76614 - }, - { - "epoch": 1.96, - "learning_rate": 5.632372635271422e-07, - "loss": 0.6738, - "step": 76615 - }, - { - "epoch": 1.96, - "learning_rate": 5.632123719976258e-07, - "loss": 0.521, - "step": 76616 - }, - { - "epoch": 1.96, - "learning_rate": 5.631874808025375e-07, - "loss": 0.7583, - "step": 76617 - }, - { - "epoch": 1.96, - "learning_rate": 5.63162589941897e-07, - "loss": 0.6729, - "step": 76618 - }, - { - "epoch": 1.96, - "learning_rate": 5.631376994157223e-07, - "loss": 0.7402, - "step": 76619 - }, - { - "epoch": 1.96, - "learning_rate": 5.631128092240335e-07, - "loss": 0.509, - "step": 76620 - }, - { - "epoch": 1.96, - "learning_rate": 5.630879193668487e-07, - "loss": 0.7329, - "step": 76621 - }, - { - "epoch": 1.96, - "learning_rate": 5.630630298441873e-07, - "loss": 0.5579, - "step": 76622 - }, - { - "epoch": 1.96, - "learning_rate": 5.63038140656069e-07, - "loss": 0.5864, - "step": 76623 - }, - { - "epoch": 1.96, - "learning_rate": 5.630132518025117e-07, - "loss": 0.5452, - "step": 76624 - }, - { - "epoch": 1.96, - "learning_rate": 5.629883632835352e-07, - "loss": 0.5737, - "step": 76625 - }, - { - "epoch": 1.96, - "learning_rate": 5.629634750991583e-07, - "loss": 0.6685, - "step": 76626 - }, - { - "epoch": 1.96, - "learning_rate": 5.629385872494006e-07, - "loss": 0.5991, - "step": 76627 - }, - { - "epoch": 1.96, - "learning_rate": 5.629136997342804e-07, - "loss": 0.5991, - "step": 76628 - }, - { - "epoch": 1.96, - "learning_rate": 5.628888125538172e-07, - "loss": 0.7627, - "step": 76629 - }, - { - "epoch": 1.96, - "learning_rate": 5.628639257080301e-07, - "loss": 0.6768, - "step": 76630 - }, - { - "epoch": 1.96, - "learning_rate": 5.628390391969378e-07, - "loss": 0.5522, - "step": 76631 - }, - { - "epoch": 1.96, - "learning_rate": 5.628141530205597e-07, - "loss": 0.875, - "step": 76632 - }, - { - "epoch": 1.96, - "learning_rate": 5.627892671789145e-07, - "loss": 0.4773, - "step": 76633 - }, - { - "epoch": 1.96, - "learning_rate": 5.627643816720214e-07, - "loss": 0.6504, - "step": 76634 - }, - { - "epoch": 1.96, - "learning_rate": 5.627394964998999e-07, - "loss": 0.7256, - "step": 76635 - }, - { - "epoch": 1.96, - "learning_rate": 5.627146116625683e-07, - "loss": 0.7041, - "step": 76636 - }, - { - "epoch": 1.96, - "learning_rate": 5.62689727160046e-07, - "loss": 0.6089, - "step": 76637 - }, - { - "epoch": 1.96, - "learning_rate": 5.626648429923519e-07, - "loss": 0.75, - "step": 76638 - }, - { - "epoch": 1.96, - "learning_rate": 5.626399591595059e-07, - "loss": 0.6621, - "step": 76639 - }, - { - "epoch": 1.96, - "learning_rate": 5.626150756615262e-07, - "loss": 0.5215, - "step": 76640 - }, - { - "epoch": 1.96, - "learning_rate": 5.625901924984318e-07, - "loss": 0.5061, - "step": 76641 - }, - { - "epoch": 1.96, - "learning_rate": 5.625653096702418e-07, - "loss": 0.5487, - "step": 76642 - }, - { - "epoch": 1.96, - "learning_rate": 5.625404271769754e-07, - "loss": 0.625, - "step": 76643 - }, - { - "epoch": 1.96, - "learning_rate": 5.625155450186522e-07, - "loss": 0.501, - "step": 76644 - }, - { - "epoch": 1.96, - "learning_rate": 5.624906631952902e-07, - "loss": 0.5605, - "step": 76645 - }, - { - "epoch": 1.96, - "learning_rate": 5.624657817069092e-07, - "loss": 0.6611, - "step": 76646 - }, - { - "epoch": 1.96, - "learning_rate": 5.624409005535278e-07, - "loss": 0.6475, - "step": 76647 - }, - { - "epoch": 1.96, - "learning_rate": 5.624160197351657e-07, - "loss": 0.5947, - "step": 76648 - }, - { - "epoch": 1.96, - "learning_rate": 5.623911392518414e-07, - "loss": 0.7588, - "step": 76649 - }, - { - "epoch": 1.96, - "learning_rate": 5.623662591035742e-07, - "loss": 0.6357, - "step": 76650 - }, - { - "epoch": 1.96, - "learning_rate": 5.623413792903828e-07, - "loss": 0.7339, - "step": 76651 - }, - { - "epoch": 1.96, - "learning_rate": 5.623164998122867e-07, - "loss": 0.7046, - "step": 76652 - }, - { - "epoch": 1.96, - "learning_rate": 5.622916206693045e-07, - "loss": 0.5225, - "step": 76653 - }, - { - "epoch": 1.96, - "learning_rate": 5.622667418614554e-07, - "loss": 0.7402, - "step": 76654 - }, - { - "epoch": 1.96, - "learning_rate": 5.622418633887586e-07, - "loss": 0.5791, - "step": 76655 - }, - { - "epoch": 1.96, - "learning_rate": 5.622169852512334e-07, - "loss": 0.7783, - "step": 76656 - }, - { - "epoch": 1.96, - "learning_rate": 5.621921074488982e-07, - "loss": 0.7183, - "step": 76657 - }, - { - "epoch": 1.96, - "learning_rate": 5.621672299817724e-07, - "loss": 0.7188, - "step": 76658 - }, - { - "epoch": 1.96, - "learning_rate": 5.621423528498747e-07, - "loss": 0.5728, - "step": 76659 - }, - { - "epoch": 1.96, - "learning_rate": 5.621174760532253e-07, - "loss": 0.7227, - "step": 76660 - }, - { - "epoch": 1.96, - "learning_rate": 5.620925995918422e-07, - "loss": 0.8545, - "step": 76661 - }, - { - "epoch": 1.96, - "learning_rate": 5.620677234657442e-07, - "loss": 0.5615, - "step": 76662 - }, - { - "epoch": 1.96, - "learning_rate": 5.620428476749509e-07, - "loss": 0.665, - "step": 76663 - }, - { - "epoch": 1.96, - "learning_rate": 5.620179722194813e-07, - "loss": 0.7441, - "step": 76664 - }, - { - "epoch": 1.96, - "learning_rate": 5.619930970993548e-07, - "loss": 0.5923, - "step": 76665 - }, - { - "epoch": 1.96, - "learning_rate": 5.619682223145895e-07, - "loss": 0.7979, - "step": 76666 - }, - { - "epoch": 1.97, - "learning_rate": 5.619433478652052e-07, - "loss": 0.4624, - "step": 76667 - }, - { - "epoch": 1.97, - "learning_rate": 5.619184737512206e-07, - "loss": 0.4714, - "step": 76668 - }, - { - "epoch": 1.97, - "learning_rate": 5.618935999726553e-07, - "loss": 0.3795, - "step": 76669 - }, - { - "epoch": 1.97, - "learning_rate": 5.618687265295279e-07, - "loss": 0.7041, - "step": 76670 - }, - { - "epoch": 1.97, - "learning_rate": 5.61843853421857e-07, - "loss": 0.6152, - "step": 76671 - }, - { - "epoch": 1.97, - "learning_rate": 5.618189806496623e-07, - "loss": 0.5244, - "step": 76672 - }, - { - "epoch": 1.97, - "learning_rate": 5.617941082129629e-07, - "loss": 0.543, - "step": 76673 - }, - { - "epoch": 1.97, - "learning_rate": 5.617692361117773e-07, - "loss": 0.6973, - "step": 76674 - }, - { - "epoch": 1.97, - "learning_rate": 5.617443643461248e-07, - "loss": 0.4561, - "step": 76675 - }, - { - "epoch": 1.97, - "learning_rate": 5.617194929160245e-07, - "loss": 0.563, - "step": 76676 - }, - { - "epoch": 1.97, - "learning_rate": 5.616946218214959e-07, - "loss": 0.686, - "step": 76677 - }, - { - "epoch": 1.97, - "learning_rate": 5.616697510625571e-07, - "loss": 0.6768, - "step": 76678 - }, - { - "epoch": 1.97, - "learning_rate": 5.616448806392275e-07, - "loss": 0.5337, - "step": 76679 - }, - { - "epoch": 1.97, - "learning_rate": 5.61620010551527e-07, - "loss": 0.344, - "step": 76680 - }, - { - "epoch": 1.97, - "learning_rate": 5.615951407994732e-07, - "loss": 0.6826, - "step": 76681 - }, - { - "epoch": 1.97, - "learning_rate": 5.615702713830863e-07, - "loss": 0.5981, - "step": 76682 - }, - { - "epoch": 1.97, - "learning_rate": 5.615454023023844e-07, - "loss": 0.8037, - "step": 76683 - }, - { - "epoch": 1.97, - "learning_rate": 5.615205335573873e-07, - "loss": 0.71, - "step": 76684 - }, - { - "epoch": 1.97, - "learning_rate": 5.614956651481135e-07, - "loss": 0.5957, - "step": 76685 - }, - { - "epoch": 1.97, - "learning_rate": 5.614707970745829e-07, - "loss": 0.5659, - "step": 76686 - }, - { - "epoch": 1.97, - "learning_rate": 5.614459293368134e-07, - "loss": 0.7852, - "step": 76687 - }, - { - "epoch": 1.97, - "learning_rate": 5.614210619348247e-07, - "loss": 0.6641, - "step": 76688 - }, - { - "epoch": 1.97, - "learning_rate": 5.613961948686361e-07, - "loss": 0.709, - "step": 76689 - }, - { - "epoch": 1.97, - "learning_rate": 5.613713281382662e-07, - "loss": 0.5874, - "step": 76690 - }, - { - "epoch": 1.97, - "learning_rate": 5.613464617437338e-07, - "loss": 0.7002, - "step": 76691 - }, - { - "epoch": 1.97, - "learning_rate": 5.613215956850581e-07, - "loss": 0.4722, - "step": 76692 - }, - { - "epoch": 1.97, - "learning_rate": 5.612967299622584e-07, - "loss": 0.5635, - "step": 76693 - }, - { - "epoch": 1.97, - "learning_rate": 5.61271864575354e-07, - "loss": 0.6499, - "step": 76694 - }, - { - "epoch": 1.97, - "learning_rate": 5.612469995243632e-07, - "loss": 0.5859, - "step": 76695 - }, - { - "epoch": 1.97, - "learning_rate": 5.612221348093053e-07, - "loss": 0.647, - "step": 76696 - }, - { - "epoch": 1.97, - "learning_rate": 5.611972704301995e-07, - "loss": 0.707, - "step": 76697 - }, - { - "epoch": 1.97, - "learning_rate": 5.611724063870651e-07, - "loss": 0.7197, - "step": 76698 - }, - { - "epoch": 1.97, - "learning_rate": 5.611475426799204e-07, - "loss": 0.3895, - "step": 76699 - }, - { - "epoch": 1.97, - "learning_rate": 5.611226793087855e-07, - "loss": 0.5698, - "step": 76700 - }, - { - "epoch": 1.97, - "learning_rate": 5.610978162736782e-07, - "loss": 0.6816, - "step": 76701 - }, - { - "epoch": 1.97, - "learning_rate": 5.61072953574618e-07, - "loss": 0.5552, - "step": 76702 - }, - { - "epoch": 1.97, - "learning_rate": 5.610480912116247e-07, - "loss": 0.477, - "step": 76703 - }, - { - "epoch": 1.97, - "learning_rate": 5.610232291847161e-07, - "loss": 0.8164, - "step": 76704 - }, - { - "epoch": 1.97, - "learning_rate": 5.609983674939118e-07, - "loss": 0.5835, - "step": 76705 - }, - { - "epoch": 1.97, - "learning_rate": 5.609735061392314e-07, - "loss": 0.5503, - "step": 76706 - }, - { - "epoch": 1.97, - "learning_rate": 5.60948645120693e-07, - "loss": 0.4946, - "step": 76707 - }, - { - "epoch": 1.97, - "learning_rate": 5.60923784438316e-07, - "loss": 0.8047, - "step": 76708 - }, - { - "epoch": 1.97, - "learning_rate": 5.608989240921195e-07, - "loss": 0.521, - "step": 76709 - }, - { - "epoch": 1.97, - "learning_rate": 5.608740640821227e-07, - "loss": 0.4736, - "step": 76710 - }, - { - "epoch": 1.97, - "learning_rate": 5.608492044083448e-07, - "loss": 0.7822, - "step": 76711 - }, - { - "epoch": 1.97, - "learning_rate": 5.608243450708039e-07, - "loss": 0.6592, - "step": 76712 - }, - { - "epoch": 1.97, - "learning_rate": 5.607994860695195e-07, - "loss": 0.5359, - "step": 76713 - }, - { - "epoch": 1.97, - "learning_rate": 5.607746274045109e-07, - "loss": 0.6865, - "step": 76714 - }, - { - "epoch": 1.97, - "learning_rate": 5.607497690757972e-07, - "loss": 0.7305, - "step": 76715 - }, - { - "epoch": 1.97, - "learning_rate": 5.607249110833969e-07, - "loss": 0.6162, - "step": 76716 - }, - { - "epoch": 1.97, - "learning_rate": 5.607000534273294e-07, - "loss": 0.5898, - "step": 76717 - }, - { - "epoch": 1.97, - "learning_rate": 5.606751961076136e-07, - "loss": 0.5806, - "step": 76718 - }, - { - "epoch": 1.97, - "learning_rate": 5.60650339124269e-07, - "loss": 0.6179, - "step": 76719 - }, - { - "epoch": 1.97, - "learning_rate": 5.606254824773143e-07, - "loss": 0.6719, - "step": 76720 - }, - { - "epoch": 1.97, - "learning_rate": 5.60600626166768e-07, - "loss": 0.4124, - "step": 76721 - }, - { - "epoch": 1.97, - "learning_rate": 5.605757701926496e-07, - "loss": 0.8906, - "step": 76722 - }, - { - "epoch": 1.97, - "learning_rate": 5.605509145549785e-07, - "loss": 0.7207, - "step": 76723 - }, - { - "epoch": 1.97, - "learning_rate": 5.60526059253773e-07, - "loss": 0.751, - "step": 76724 - }, - { - "epoch": 1.97, - "learning_rate": 5.605012042890524e-07, - "loss": 0.3896, - "step": 76725 - }, - { - "epoch": 1.97, - "learning_rate": 5.60476349660836e-07, - "loss": 0.6376, - "step": 76726 - }, - { - "epoch": 1.97, - "learning_rate": 5.60451495369143e-07, - "loss": 0.5952, - "step": 76727 - }, - { - "epoch": 1.97, - "learning_rate": 5.604266414139915e-07, - "loss": 0.6865, - "step": 76728 - }, - { - "epoch": 1.97, - "learning_rate": 5.604017877954013e-07, - "loss": 0.6733, - "step": 76729 - }, - { - "epoch": 1.97, - "learning_rate": 5.603769345133915e-07, - "loss": 0.6528, - "step": 76730 - }, - { - "epoch": 1.97, - "learning_rate": 5.603520815679806e-07, - "loss": 0.5574, - "step": 76731 - }, - { - "epoch": 1.97, - "learning_rate": 5.603272289591883e-07, - "loss": 0.7988, - "step": 76732 - }, - { - "epoch": 1.97, - "learning_rate": 5.603023766870328e-07, - "loss": 0.5762, - "step": 76733 - }, - { - "epoch": 1.97, - "learning_rate": 5.602775247515334e-07, - "loss": 0.3634, - "step": 76734 - }, - { - "epoch": 1.97, - "learning_rate": 5.602526731527094e-07, - "loss": 0.6553, - "step": 76735 - }, - { - "epoch": 1.97, - "learning_rate": 5.6022782189058e-07, - "loss": 0.6582, - "step": 76736 - }, - { - "epoch": 1.97, - "learning_rate": 5.602029709651637e-07, - "loss": 0.6816, - "step": 76737 - }, - { - "epoch": 1.97, - "learning_rate": 5.601781203764797e-07, - "loss": 0.603, - "step": 76738 - }, - { - "epoch": 1.97, - "learning_rate": 5.60153270124547e-07, - "loss": 0.6328, - "step": 76739 - }, - { - "epoch": 1.97, - "learning_rate": 5.601284202093853e-07, - "loss": 0.6524, - "step": 76740 - }, - { - "epoch": 1.97, - "learning_rate": 5.601035706310128e-07, - "loss": 0.667, - "step": 76741 - }, - { - "epoch": 1.97, - "learning_rate": 5.600787213894486e-07, - "loss": 0.7998, - "step": 76742 - }, - { - "epoch": 1.97, - "learning_rate": 5.60053872484712e-07, - "loss": 0.7075, - "step": 76743 - }, - { - "epoch": 1.97, - "learning_rate": 5.60029023916822e-07, - "loss": 0.6377, - "step": 76744 - }, - { - "epoch": 1.97, - "learning_rate": 5.600041756857973e-07, - "loss": 0.4976, - "step": 76745 - }, - { - "epoch": 1.97, - "learning_rate": 5.599793277916571e-07, - "loss": 0.5234, - "step": 76746 - }, - { - "epoch": 1.97, - "learning_rate": 5.599544802344206e-07, - "loss": 0.6309, - "step": 76747 - }, - { - "epoch": 1.97, - "learning_rate": 5.59929633014107e-07, - "loss": 0.7002, - "step": 76748 - }, - { - "epoch": 1.97, - "learning_rate": 5.599047861307348e-07, - "loss": 0.5815, - "step": 76749 - }, - { - "epoch": 1.97, - "learning_rate": 5.598799395843236e-07, - "loss": 0.5269, - "step": 76750 - }, - { - "epoch": 1.97, - "learning_rate": 5.598550933748916e-07, - "loss": 0.5752, - "step": 76751 - }, - { - "epoch": 1.97, - "learning_rate": 5.598302475024583e-07, - "loss": 0.5115, - "step": 76752 - }, - { - "epoch": 1.97, - "learning_rate": 5.598054019670432e-07, - "loss": 0.5417, - "step": 76753 - }, - { - "epoch": 1.97, - "learning_rate": 5.597805567686646e-07, - "loss": 0.4683, - "step": 76754 - }, - { - "epoch": 1.97, - "learning_rate": 5.597557119073417e-07, - "loss": 0.8467, - "step": 76755 - }, - { - "epoch": 1.97, - "learning_rate": 5.597308673830936e-07, - "loss": 0.625, - "step": 76756 - }, - { - "epoch": 1.97, - "learning_rate": 5.597060231959396e-07, - "loss": 0.5374, - "step": 76757 - }, - { - "epoch": 1.97, - "learning_rate": 5.596811793458982e-07, - "loss": 0.6685, - "step": 76758 - }, - { - "epoch": 1.97, - "learning_rate": 5.596563358329886e-07, - "loss": 0.6016, - "step": 76759 - }, - { - "epoch": 1.97, - "learning_rate": 5.596314926572305e-07, - "loss": 0.5479, - "step": 76760 - }, - { - "epoch": 1.97, - "learning_rate": 5.596066498186422e-07, - "loss": 0.5674, - "step": 76761 - }, - { - "epoch": 1.97, - "learning_rate": 5.595818073172423e-07, - "loss": 0.748, - "step": 76762 - }, - { - "epoch": 1.97, - "learning_rate": 5.595569651530506e-07, - "loss": 0.6011, - "step": 76763 - }, - { - "epoch": 1.97, - "learning_rate": 5.595321233260857e-07, - "loss": 0.6104, - "step": 76764 - }, - { - "epoch": 1.97, - "learning_rate": 5.59507281836367e-07, - "loss": 0.4882, - "step": 76765 - }, - { - "epoch": 1.97, - "learning_rate": 5.594824406839134e-07, - "loss": 0.3604, - "step": 76766 - }, - { - "epoch": 1.97, - "learning_rate": 5.594575998687434e-07, - "loss": 0.5764, - "step": 76767 - }, - { - "epoch": 1.97, - "learning_rate": 5.594327593908767e-07, - "loss": 0.5132, - "step": 76768 - }, - { - "epoch": 1.97, - "learning_rate": 5.594079192503325e-07, - "loss": 0.5718, - "step": 76769 - }, - { - "epoch": 1.97, - "learning_rate": 5.593830794471292e-07, - "loss": 0.6318, - "step": 76770 - }, - { - "epoch": 1.97, - "learning_rate": 5.593582399812859e-07, - "loss": 0.5781, - "step": 76771 - }, - { - "epoch": 1.97, - "learning_rate": 5.593334008528216e-07, - "loss": 0.6748, - "step": 76772 - }, - { - "epoch": 1.97, - "learning_rate": 5.593085620617554e-07, - "loss": 0.7197, - "step": 76773 - }, - { - "epoch": 1.97, - "learning_rate": 5.592837236081067e-07, - "loss": 0.5208, - "step": 76774 - }, - { - "epoch": 1.97, - "learning_rate": 5.59258885491894e-07, - "loss": 0.6963, - "step": 76775 - }, - { - "epoch": 1.97, - "learning_rate": 5.592340477131363e-07, - "loss": 0.646, - "step": 76776 - }, - { - "epoch": 1.97, - "learning_rate": 5.592092102718529e-07, - "loss": 0.3879, - "step": 76777 - }, - { - "epoch": 1.97, - "learning_rate": 5.591843731680632e-07, - "loss": 0.6787, - "step": 76778 - }, - { - "epoch": 1.97, - "learning_rate": 5.591595364017854e-07, - "loss": 0.5625, - "step": 76779 - }, - { - "epoch": 1.97, - "learning_rate": 5.591346999730391e-07, - "loss": 0.5215, - "step": 76780 - }, - { - "epoch": 1.97, - "learning_rate": 5.591098638818428e-07, - "loss": 0.7754, - "step": 76781 - }, - { - "epoch": 1.97, - "learning_rate": 5.590850281282162e-07, - "loss": 0.5737, - "step": 76782 - }, - { - "epoch": 1.97, - "learning_rate": 5.590601927121775e-07, - "loss": 0.6777, - "step": 76783 - }, - { - "epoch": 1.97, - "learning_rate": 5.590353576337461e-07, - "loss": 0.5144, - "step": 76784 - }, - { - "epoch": 1.97, - "learning_rate": 5.590105228929412e-07, - "loss": 0.4541, - "step": 76785 - }, - { - "epoch": 1.97, - "learning_rate": 5.589856884897819e-07, - "loss": 0.7812, - "step": 76786 - }, - { - "epoch": 1.97, - "learning_rate": 5.589608544242866e-07, - "loss": 0.6387, - "step": 76787 - }, - { - "epoch": 1.97, - "learning_rate": 5.589360206964747e-07, - "loss": 0.5979, - "step": 76788 - }, - { - "epoch": 1.97, - "learning_rate": 5.589111873063652e-07, - "loss": 0.6914, - "step": 76789 - }, - { - "epoch": 1.97, - "learning_rate": 5.588863542539776e-07, - "loss": 0.4382, - "step": 76790 - }, - { - "epoch": 1.97, - "learning_rate": 5.588615215393304e-07, - "loss": 0.6338, - "step": 76791 - }, - { - "epoch": 1.97, - "learning_rate": 5.588366891624423e-07, - "loss": 0.5732, - "step": 76792 - }, - { - "epoch": 1.97, - "learning_rate": 5.588118571233325e-07, - "loss": 0.584, - "step": 76793 - }, - { - "epoch": 1.97, - "learning_rate": 5.587870254220204e-07, - "loss": 0.6553, - "step": 76794 - }, - { - "epoch": 1.97, - "learning_rate": 5.58762194058525e-07, - "loss": 0.5918, - "step": 76795 - }, - { - "epoch": 1.97, - "learning_rate": 5.587373630328648e-07, - "loss": 0.6211, - "step": 76796 - }, - { - "epoch": 1.97, - "learning_rate": 5.58712532345059e-07, - "loss": 0.7188, - "step": 76797 - }, - { - "epoch": 1.97, - "learning_rate": 5.586877019951272e-07, - "loss": 0.3022, - "step": 76798 - }, - { - "epoch": 1.97, - "learning_rate": 5.586628719830875e-07, - "loss": 0.5942, - "step": 76799 - }, - { - "epoch": 1.97, - "learning_rate": 5.586380423089598e-07, - "loss": 0.5674, - "step": 76800 - }, - { - "epoch": 1.97, - "learning_rate": 5.586132129727623e-07, - "loss": 0.7549, - "step": 76801 - }, - { - "epoch": 1.97, - "learning_rate": 5.585883839745142e-07, - "loss": 0.6162, - "step": 76802 - }, - { - "epoch": 1.97, - "learning_rate": 5.585635553142352e-07, - "loss": 0.6421, - "step": 76803 - }, - { - "epoch": 1.97, - "learning_rate": 5.585387269919435e-07, - "loss": 0.5317, - "step": 76804 - }, - { - "epoch": 1.97, - "learning_rate": 5.585138990076582e-07, - "loss": 0.6748, - "step": 76805 - }, - { - "epoch": 1.97, - "learning_rate": 5.584890713613986e-07, - "loss": 0.3796, - "step": 76806 - }, - { - "epoch": 1.97, - "learning_rate": 5.58464244053184e-07, - "loss": 0.7471, - "step": 76807 - }, - { - "epoch": 1.97, - "learning_rate": 5.584394170830327e-07, - "loss": 0.6777, - "step": 76808 - }, - { - "epoch": 1.97, - "learning_rate": 5.584145904509638e-07, - "loss": 0.71, - "step": 76809 - }, - { - "epoch": 1.97, - "learning_rate": 5.583897641569971e-07, - "loss": 0.4844, - "step": 76810 - }, - { - "epoch": 1.97, - "learning_rate": 5.583649382011506e-07, - "loss": 0.6594, - "step": 76811 - }, - { - "epoch": 1.97, - "learning_rate": 5.583401125834443e-07, - "loss": 0.4932, - "step": 76812 - }, - { - "epoch": 1.97, - "learning_rate": 5.583152873038961e-07, - "loss": 0.7104, - "step": 76813 - }, - { - "epoch": 1.97, - "learning_rate": 5.582904623625258e-07, - "loss": 0.6846, - "step": 76814 - }, - { - "epoch": 1.97, - "learning_rate": 5.582656377593523e-07, - "loss": 0.6968, - "step": 76815 - }, - { - "epoch": 1.97, - "learning_rate": 5.582408134943943e-07, - "loss": 0.6328, - "step": 76816 - }, - { - "epoch": 1.97, - "learning_rate": 5.582159895676708e-07, - "loss": 0.6406, - "step": 76817 - }, - { - "epoch": 1.97, - "learning_rate": 5.581911659792012e-07, - "loss": 0.541, - "step": 76818 - }, - { - "epoch": 1.97, - "learning_rate": 5.581663427290046e-07, - "loss": 0.5962, - "step": 76819 - }, - { - "epoch": 1.97, - "learning_rate": 5.581415198170998e-07, - "loss": 0.5996, - "step": 76820 - }, - { - "epoch": 1.97, - "learning_rate": 5.581166972435051e-07, - "loss": 0.7344, - "step": 76821 - }, - { - "epoch": 1.97, - "learning_rate": 5.580918750082404e-07, - "loss": 0.562, - "step": 76822 - }, - { - "epoch": 1.97, - "learning_rate": 5.580670531113243e-07, - "loss": 0.5996, - "step": 76823 - }, - { - "epoch": 1.97, - "learning_rate": 5.580422315527764e-07, - "loss": 0.6685, - "step": 76824 - }, - { - "epoch": 1.97, - "learning_rate": 5.580174103326148e-07, - "loss": 0.6318, - "step": 76825 - }, - { - "epoch": 1.97, - "learning_rate": 5.57992589450859e-07, - "loss": 0.7832, - "step": 76826 - }, - { - "epoch": 1.97, - "learning_rate": 5.579677689075279e-07, - "loss": 0.709, - "step": 76827 - }, - { - "epoch": 1.97, - "learning_rate": 5.57942948702641e-07, - "loss": 0.5801, - "step": 76828 - }, - { - "epoch": 1.97, - "learning_rate": 5.579181288362163e-07, - "loss": 0.6807, - "step": 76829 - }, - { - "epoch": 1.97, - "learning_rate": 5.578933093082739e-07, - "loss": 0.5198, - "step": 76830 - }, - { - "epoch": 1.97, - "learning_rate": 5.578684901188319e-07, - "loss": 0.665, - "step": 76831 - }, - { - "epoch": 1.97, - "learning_rate": 5.5784367126791e-07, - "loss": 0.5557, - "step": 76832 - }, - { - "epoch": 1.97, - "learning_rate": 5.578188527555265e-07, - "loss": 0.8174, - "step": 76833 - }, - { - "epoch": 1.97, - "learning_rate": 5.577940345817007e-07, - "loss": 0.4609, - "step": 76834 - }, - { - "epoch": 1.97, - "learning_rate": 5.577692167464517e-07, - "loss": 0.5557, - "step": 76835 - }, - { - "epoch": 1.97, - "learning_rate": 5.57744399249799e-07, - "loss": 0.752, - "step": 76836 - }, - { - "epoch": 1.97, - "learning_rate": 5.577195820917605e-07, - "loss": 0.6479, - "step": 76837 - }, - { - "epoch": 1.97, - "learning_rate": 5.576947652723559e-07, - "loss": 0.8135, - "step": 76838 - }, - { - "epoch": 1.97, - "learning_rate": 5.576699487916043e-07, - "loss": 0.6953, - "step": 76839 - }, - { - "epoch": 1.97, - "learning_rate": 5.576451326495243e-07, - "loss": 0.6729, - "step": 76840 - }, - { - "epoch": 1.97, - "learning_rate": 5.576203168461354e-07, - "loss": 0.6929, - "step": 76841 - }, - { - "epoch": 1.97, - "learning_rate": 5.575955013814559e-07, - "loss": 0.7471, - "step": 76842 - }, - { - "epoch": 1.97, - "learning_rate": 5.575706862555052e-07, - "loss": 0.7129, - "step": 76843 - }, - { - "epoch": 1.97, - "learning_rate": 5.575458714683021e-07, - "loss": 0.7314, - "step": 76844 - }, - { - "epoch": 1.97, - "learning_rate": 5.575210570198664e-07, - "loss": 0.6104, - "step": 76845 - }, - { - "epoch": 1.97, - "learning_rate": 5.57496242910216e-07, - "loss": 0.5918, - "step": 76846 - }, - { - "epoch": 1.97, - "learning_rate": 5.574714291393706e-07, - "loss": 0.748, - "step": 76847 - }, - { - "epoch": 1.97, - "learning_rate": 5.574466157073485e-07, - "loss": 0.458, - "step": 76848 - }, - { - "epoch": 1.97, - "learning_rate": 5.574218026141704e-07, - "loss": 0.5032, - "step": 76849 - }, - { - "epoch": 1.97, - "learning_rate": 5.57396989859853e-07, - "loss": 0.5989, - "step": 76850 - }, - { - "epoch": 1.97, - "learning_rate": 5.573721774444165e-07, - "loss": 0.7583, - "step": 76851 - }, - { - "epoch": 1.97, - "learning_rate": 5.573473653678798e-07, - "loss": 0.6641, - "step": 76852 - }, - { - "epoch": 1.97, - "learning_rate": 5.573225536302623e-07, - "loss": 0.7002, - "step": 76853 - }, - { - "epoch": 1.97, - "learning_rate": 5.572977422315821e-07, - "loss": 0.6533, - "step": 76854 - }, - { - "epoch": 1.97, - "learning_rate": 5.572729311718586e-07, - "loss": 0.5601, - "step": 76855 - }, - { - "epoch": 1.97, - "learning_rate": 5.572481204511109e-07, - "loss": 0.6562, - "step": 76856 - }, - { - "epoch": 1.97, - "learning_rate": 5.572233100693584e-07, - "loss": 0.6387, - "step": 76857 - }, - { - "epoch": 1.97, - "learning_rate": 5.571985000266193e-07, - "loss": 0.5981, - "step": 76858 - }, - { - "epoch": 1.97, - "learning_rate": 5.571736903229132e-07, - "loss": 0.7109, - "step": 76859 - }, - { - "epoch": 1.97, - "learning_rate": 5.571488809582585e-07, - "loss": 0.5977, - "step": 76860 - }, - { - "epoch": 1.97, - "learning_rate": 5.571240719326746e-07, - "loss": 0.5898, - "step": 76861 - }, - { - "epoch": 1.97, - "learning_rate": 5.570992632461808e-07, - "loss": 0.6597, - "step": 76862 - }, - { - "epoch": 1.97, - "learning_rate": 5.570744548987954e-07, - "loss": 0.5042, - "step": 76863 - }, - { - "epoch": 1.97, - "learning_rate": 5.570496468905375e-07, - "loss": 0.7598, - "step": 76864 - }, - { - "epoch": 1.97, - "learning_rate": 5.570248392214265e-07, - "loss": 0.7085, - "step": 76865 - }, - { - "epoch": 1.97, - "learning_rate": 5.570000318914816e-07, - "loss": 0.5933, - "step": 76866 - }, - { - "epoch": 1.97, - "learning_rate": 5.56975224900721e-07, - "loss": 0.4553, - "step": 76867 - }, - { - "epoch": 1.97, - "learning_rate": 5.569504182491641e-07, - "loss": 0.45, - "step": 76868 - }, - { - "epoch": 1.97, - "learning_rate": 5.569256119368302e-07, - "loss": 0.7461, - "step": 76869 - }, - { - "epoch": 1.97, - "learning_rate": 5.569008059637381e-07, - "loss": 0.583, - "step": 76870 - }, - { - "epoch": 1.97, - "learning_rate": 5.568760003299062e-07, - "loss": 0.7104, - "step": 76871 - }, - { - "epoch": 1.97, - "learning_rate": 5.56851195035354e-07, - "loss": 0.7607, - "step": 76872 - }, - { - "epoch": 1.97, - "learning_rate": 5.568263900801005e-07, - "loss": 0.5176, - "step": 76873 - }, - { - "epoch": 1.97, - "learning_rate": 5.56801585464165e-07, - "loss": 0.6875, - "step": 76874 - }, - { - "epoch": 1.97, - "learning_rate": 5.567767811875659e-07, - "loss": 0.5811, - "step": 76875 - }, - { - "epoch": 1.97, - "learning_rate": 5.567519772503221e-07, - "loss": 0.5874, - "step": 76876 - }, - { - "epoch": 1.97, - "learning_rate": 5.567271736524533e-07, - "loss": 0.5436, - "step": 76877 - }, - { - "epoch": 1.97, - "learning_rate": 5.567023703939783e-07, - "loss": 0.5388, - "step": 76878 - }, - { - "epoch": 1.97, - "learning_rate": 5.56677567474916e-07, - "loss": 0.5718, - "step": 76879 - }, - { - "epoch": 1.97, - "learning_rate": 5.56652764895285e-07, - "loss": 0.4988, - "step": 76880 - }, - { - "epoch": 1.97, - "learning_rate": 5.566279626551045e-07, - "loss": 0.5779, - "step": 76881 - }, - { - "epoch": 1.97, - "learning_rate": 5.566031607543935e-07, - "loss": 0.5996, - "step": 76882 - }, - { - "epoch": 1.97, - "learning_rate": 5.565783591931714e-07, - "loss": 0.7939, - "step": 76883 - }, - { - "epoch": 1.97, - "learning_rate": 5.565535579714567e-07, - "loss": 0.5198, - "step": 76884 - }, - { - "epoch": 1.97, - "learning_rate": 5.565287570892685e-07, - "loss": 0.7812, - "step": 76885 - }, - { - "epoch": 1.97, - "learning_rate": 5.565039565466261e-07, - "loss": 0.6963, - "step": 76886 - }, - { - "epoch": 1.97, - "learning_rate": 5.56479156343548e-07, - "loss": 0.3719, - "step": 76887 - }, - { - "epoch": 1.97, - "learning_rate": 5.564543564800533e-07, - "loss": 0.6489, - "step": 76888 - }, - { - "epoch": 1.97, - "learning_rate": 5.564295569561614e-07, - "loss": 0.793, - "step": 76889 - }, - { - "epoch": 1.97, - "learning_rate": 5.564047577718907e-07, - "loss": 0.6084, - "step": 76890 - }, - { - "epoch": 1.97, - "learning_rate": 5.56379958927261e-07, - "loss": 0.6494, - "step": 76891 - }, - { - "epoch": 1.97, - "learning_rate": 5.563551604222902e-07, - "loss": 0.5435, - "step": 76892 - }, - { - "epoch": 1.97, - "learning_rate": 5.563303622569979e-07, - "loss": 0.6479, - "step": 76893 - }, - { - "epoch": 1.97, - "learning_rate": 5.563055644314032e-07, - "loss": 0.6465, - "step": 76894 - }, - { - "epoch": 1.97, - "learning_rate": 5.562807669455252e-07, - "loss": 0.6084, - "step": 76895 - }, - { - "epoch": 1.97, - "learning_rate": 5.562559697993821e-07, - "loss": 0.6111, - "step": 76896 - }, - { - "epoch": 1.97, - "learning_rate": 5.562311729929936e-07, - "loss": 0.5789, - "step": 76897 - }, - { - "epoch": 1.97, - "learning_rate": 5.562063765263783e-07, - "loss": 0.6484, - "step": 76898 - }, - { - "epoch": 1.97, - "learning_rate": 5.561815803995559e-07, - "loss": 0.7725, - "step": 76899 - }, - { - "epoch": 1.97, - "learning_rate": 5.561567846125448e-07, - "loss": 0.5596, - "step": 76900 - }, - { - "epoch": 1.97, - "learning_rate": 5.561319891653637e-07, - "loss": 0.6284, - "step": 76901 - }, - { - "epoch": 1.97, - "learning_rate": 5.561071940580318e-07, - "loss": 0.5615, - "step": 76902 - }, - { - "epoch": 1.97, - "learning_rate": 5.560823992905684e-07, - "loss": 0.5085, - "step": 76903 - }, - { - "epoch": 1.97, - "learning_rate": 5.560576048629925e-07, - "loss": 0.5342, - "step": 76904 - }, - { - "epoch": 1.97, - "learning_rate": 5.560328107753226e-07, - "loss": 0.6514, - "step": 76905 - }, - { - "epoch": 1.97, - "learning_rate": 5.560080170275779e-07, - "loss": 0.6904, - "step": 76906 - }, - { - "epoch": 1.97, - "learning_rate": 5.559832236197779e-07, - "loss": 0.6313, - "step": 76907 - }, - { - "epoch": 1.97, - "learning_rate": 5.559584305519407e-07, - "loss": 0.5269, - "step": 76908 - }, - { - "epoch": 1.97, - "learning_rate": 5.559336378240862e-07, - "loss": 0.5242, - "step": 76909 - }, - { - "epoch": 1.97, - "learning_rate": 5.559088454362324e-07, - "loss": 0.54, - "step": 76910 - }, - { - "epoch": 1.97, - "learning_rate": 5.558840533883987e-07, - "loss": 0.6299, - "step": 76911 - }, - { - "epoch": 1.97, - "learning_rate": 5.558592616806047e-07, - "loss": 0.5718, - "step": 76912 - }, - { - "epoch": 1.97, - "learning_rate": 5.558344703128684e-07, - "loss": 0.6665, - "step": 76913 - }, - { - "epoch": 1.97, - "learning_rate": 5.558096792852091e-07, - "loss": 0.7461, - "step": 76914 - }, - { - "epoch": 1.97, - "learning_rate": 5.557848885976462e-07, - "loss": 0.5552, - "step": 76915 - }, - { - "epoch": 1.97, - "learning_rate": 5.557600982501985e-07, - "loss": 0.6387, - "step": 76916 - }, - { - "epoch": 1.97, - "learning_rate": 5.557353082428846e-07, - "loss": 0.5342, - "step": 76917 - }, - { - "epoch": 1.97, - "learning_rate": 5.557105185757237e-07, - "loss": 0.6426, - "step": 76918 - }, - { - "epoch": 1.97, - "learning_rate": 5.556857292487353e-07, - "loss": 0.5, - "step": 76919 - }, - { - "epoch": 1.97, - "learning_rate": 5.556609402619374e-07, - "loss": 0.6453, - "step": 76920 - }, - { - "epoch": 1.97, - "learning_rate": 5.556361516153499e-07, - "loss": 0.4128, - "step": 76921 - }, - { - "epoch": 1.97, - "learning_rate": 5.55611363308991e-07, - "loss": 0.5352, - "step": 76922 - }, - { - "epoch": 1.97, - "learning_rate": 5.555865753428801e-07, - "loss": 0.7764, - "step": 76923 - }, - { - "epoch": 1.97, - "learning_rate": 5.555617877170365e-07, - "loss": 0.4731, - "step": 76924 - }, - { - "epoch": 1.97, - "learning_rate": 5.555370004314784e-07, - "loss": 0.6191, - "step": 76925 - }, - { - "epoch": 1.97, - "learning_rate": 5.555122134862251e-07, - "loss": 0.71, - "step": 76926 - }, - { - "epoch": 1.97, - "learning_rate": 5.554874268812957e-07, - "loss": 0.6392, - "step": 76927 - }, - { - "epoch": 1.97, - "learning_rate": 5.554626406167096e-07, - "loss": 0.668, - "step": 76928 - }, - { - "epoch": 1.97, - "learning_rate": 5.554378546924853e-07, - "loss": 0.7988, - "step": 76929 - }, - { - "epoch": 1.97, - "learning_rate": 5.554130691086414e-07, - "loss": 0.6465, - "step": 76930 - }, - { - "epoch": 1.97, - "learning_rate": 5.553882838651972e-07, - "loss": 0.3818, - "step": 76931 - }, - { - "epoch": 1.97, - "learning_rate": 5.553634989621718e-07, - "loss": 0.6958, - "step": 76932 - }, - { - "epoch": 1.97, - "learning_rate": 5.553387143995844e-07, - "loss": 0.6421, - "step": 76933 - }, - { - "epoch": 1.97, - "learning_rate": 5.553139301774534e-07, - "loss": 0.6943, - "step": 76934 - }, - { - "epoch": 1.97, - "learning_rate": 5.552891462957981e-07, - "loss": 0.481, - "step": 76935 - }, - { - "epoch": 1.97, - "learning_rate": 5.552643627546375e-07, - "loss": 0.7432, - "step": 76936 - }, - { - "epoch": 1.97, - "learning_rate": 5.552395795539908e-07, - "loss": 0.4428, - "step": 76937 - }, - { - "epoch": 1.97, - "learning_rate": 5.552147966938765e-07, - "loss": 0.5747, - "step": 76938 - }, - { - "epoch": 1.97, - "learning_rate": 5.55190014174314e-07, - "loss": 0.6572, - "step": 76939 - }, - { - "epoch": 1.97, - "learning_rate": 5.551652319953217e-07, - "loss": 0.7666, - "step": 76940 - }, - { - "epoch": 1.97, - "learning_rate": 5.551404501569193e-07, - "loss": 0.6147, - "step": 76941 - }, - { - "epoch": 1.97, - "learning_rate": 5.551156686591251e-07, - "loss": 0.6094, - "step": 76942 - }, - { - "epoch": 1.97, - "learning_rate": 5.550908875019583e-07, - "loss": 0.6436, - "step": 76943 - }, - { - "epoch": 1.97, - "learning_rate": 5.550661066854379e-07, - "loss": 0.5479, - "step": 76944 - }, - { - "epoch": 1.97, - "learning_rate": 5.550413262095834e-07, - "loss": 0.6426, - "step": 76945 - }, - { - "epoch": 1.97, - "learning_rate": 5.55016546074413e-07, - "loss": 0.665, - "step": 76946 - }, - { - "epoch": 1.97, - "learning_rate": 5.549917662799457e-07, - "loss": 0.7109, - "step": 76947 - }, - { - "epoch": 1.97, - "learning_rate": 5.549669868262009e-07, - "loss": 0.4946, - "step": 76948 - }, - { - "epoch": 1.97, - "learning_rate": 5.549422077131978e-07, - "loss": 0.5474, - "step": 76949 - }, - { - "epoch": 1.97, - "learning_rate": 5.54917428940955e-07, - "loss": 0.5811, - "step": 76950 - }, - { - "epoch": 1.97, - "learning_rate": 5.54892650509491e-07, - "loss": 0.6504, - "step": 76951 - }, - { - "epoch": 1.97, - "learning_rate": 5.548678724188254e-07, - "loss": 0.6709, - "step": 76952 - }, - { - "epoch": 1.97, - "learning_rate": 5.548430946689768e-07, - "loss": 0.3877, - "step": 76953 - }, - { - "epoch": 1.97, - "learning_rate": 5.548183172599648e-07, - "loss": 0.6953, - "step": 76954 - }, - { - "epoch": 1.97, - "learning_rate": 5.547935401918077e-07, - "loss": 0.4966, - "step": 76955 - }, - { - "epoch": 1.97, - "learning_rate": 5.547687634645246e-07, - "loss": 0.6504, - "step": 76956 - }, - { - "epoch": 1.97, - "learning_rate": 5.547439870781345e-07, - "loss": 0.6982, - "step": 76957 - }, - { - "epoch": 1.97, - "learning_rate": 5.54719211032657e-07, - "loss": 0.5251, - "step": 76958 - }, - { - "epoch": 1.97, - "learning_rate": 5.546944353281106e-07, - "loss": 0.6113, - "step": 76959 - }, - { - "epoch": 1.97, - "learning_rate": 5.546696599645137e-07, - "loss": 0.6357, - "step": 76960 - }, - { - "epoch": 1.97, - "learning_rate": 5.546448849418856e-07, - "loss": 0.7627, - "step": 76961 - }, - { - "epoch": 1.97, - "learning_rate": 5.546201102602461e-07, - "loss": 0.6572, - "step": 76962 - }, - { - "epoch": 1.97, - "learning_rate": 5.545953359196129e-07, - "loss": 0.7422, - "step": 76963 - }, - { - "epoch": 1.97, - "learning_rate": 5.545705619200056e-07, - "loss": 0.4785, - "step": 76964 - }, - { - "epoch": 1.97, - "learning_rate": 5.545457882614433e-07, - "loss": 0.521, - "step": 76965 - }, - { - "epoch": 1.97, - "learning_rate": 5.54521014943945e-07, - "loss": 0.7373, - "step": 76966 - }, - { - "epoch": 1.97, - "learning_rate": 5.544962419675292e-07, - "loss": 0.5654, - "step": 76967 - }, - { - "epoch": 1.97, - "learning_rate": 5.544714693322152e-07, - "loss": 0.5615, - "step": 76968 - }, - { - "epoch": 1.97, - "learning_rate": 5.544466970380222e-07, - "loss": 0.6035, - "step": 76969 - }, - { - "epoch": 1.97, - "learning_rate": 5.544219250849685e-07, - "loss": 0.6191, - "step": 76970 - }, - { - "epoch": 1.97, - "learning_rate": 5.543971534730738e-07, - "loss": 0.7051, - "step": 76971 - }, - { - "epoch": 1.97, - "learning_rate": 5.543723822023564e-07, - "loss": 0.7295, - "step": 76972 - }, - { - "epoch": 1.97, - "learning_rate": 5.543476112728356e-07, - "loss": 0.8623, - "step": 76973 - }, - { - "epoch": 1.97, - "learning_rate": 5.543228406845302e-07, - "loss": 0.6689, - "step": 76974 - }, - { - "epoch": 1.97, - "learning_rate": 5.542980704374598e-07, - "loss": 0.623, - "step": 76975 - }, - { - "epoch": 1.97, - "learning_rate": 5.542733005316424e-07, - "loss": 0.6758, - "step": 76976 - }, - { - "epoch": 1.97, - "learning_rate": 5.542485309670974e-07, - "loss": 0.7666, - "step": 76977 - }, - { - "epoch": 1.97, - "learning_rate": 5.542237617438445e-07, - "loss": 0.5957, - "step": 76978 - }, - { - "epoch": 1.97, - "learning_rate": 5.541989928619017e-07, - "loss": 0.5566, - "step": 76979 - }, - { - "epoch": 1.97, - "learning_rate": 5.541742243212879e-07, - "loss": 0.6924, - "step": 76980 - }, - { - "epoch": 1.97, - "learning_rate": 5.541494561220224e-07, - "loss": 0.5718, - "step": 76981 - }, - { - "epoch": 1.97, - "learning_rate": 5.541246882641241e-07, - "loss": 0.5312, - "step": 76982 - }, - { - "epoch": 1.97, - "learning_rate": 5.540999207476125e-07, - "loss": 0.3888, - "step": 76983 - }, - { - "epoch": 1.97, - "learning_rate": 5.540751535725056e-07, - "loss": 0.4756, - "step": 76984 - }, - { - "epoch": 1.97, - "learning_rate": 5.54050386738823e-07, - "loss": 0.6978, - "step": 76985 - }, - { - "epoch": 1.97, - "learning_rate": 5.540256202465833e-07, - "loss": 0.2551, - "step": 76986 - }, - { - "epoch": 1.97, - "learning_rate": 5.540008540958063e-07, - "loss": 0.6392, - "step": 76987 - }, - { - "epoch": 1.97, - "learning_rate": 5.539760882865098e-07, - "loss": 0.6753, - "step": 76988 - }, - { - "epoch": 1.97, - "learning_rate": 5.539513228187138e-07, - "loss": 0.5372, - "step": 76989 - }, - { - "epoch": 1.97, - "learning_rate": 5.539265576924363e-07, - "loss": 0.6387, - "step": 76990 - }, - { - "epoch": 1.97, - "learning_rate": 5.539017929076968e-07, - "loss": 0.525, - "step": 76991 - }, - { - "epoch": 1.97, - "learning_rate": 5.538770284645145e-07, - "loss": 0.667, - "step": 76992 - }, - { - "epoch": 1.97, - "learning_rate": 5.538522643629077e-07, - "loss": 0.6787, - "step": 76993 - }, - { - "epoch": 1.97, - "learning_rate": 5.538275006028956e-07, - "loss": 0.5654, - "step": 76994 - }, - { - "epoch": 1.97, - "learning_rate": 5.538027371844977e-07, - "loss": 0.6377, - "step": 76995 - }, - { - "epoch": 1.97, - "learning_rate": 5.537779741077324e-07, - "loss": 0.5723, - "step": 76996 - }, - { - "epoch": 1.97, - "learning_rate": 5.537532113726185e-07, - "loss": 0.5981, - "step": 76997 - }, - { - "epoch": 1.97, - "learning_rate": 5.537284489791752e-07, - "loss": 0.6074, - "step": 76998 - }, - { - "epoch": 1.97, - "learning_rate": 5.537036869274221e-07, - "loss": 0.6521, - "step": 76999 - }, - { - "epoch": 1.97, - "learning_rate": 5.536789252173774e-07, - "loss": 0.4858, - "step": 77000 - }, - { - "epoch": 1.97, - "learning_rate": 5.5365416384906e-07, - "loss": 0.4443, - "step": 77001 - }, - { - "epoch": 1.97, - "learning_rate": 5.536294028224889e-07, - "loss": 0.6035, - "step": 77002 - }, - { - "epoch": 1.97, - "learning_rate": 5.536046421376833e-07, - "loss": 0.7705, - "step": 77003 - }, - { - "epoch": 1.97, - "learning_rate": 5.535798817946625e-07, - "loss": 0.6133, - "step": 77004 - }, - { - "epoch": 1.97, - "learning_rate": 5.535551217934447e-07, - "loss": 0.7012, - "step": 77005 - }, - { - "epoch": 1.97, - "learning_rate": 5.535303621340492e-07, - "loss": 0.6309, - "step": 77006 - }, - { - "epoch": 1.97, - "learning_rate": 5.53505602816495e-07, - "loss": 0.7944, - "step": 77007 - }, - { - "epoch": 1.97, - "learning_rate": 5.534808438408014e-07, - "loss": 0.7002, - "step": 77008 - }, - { - "epoch": 1.97, - "learning_rate": 5.534560852069869e-07, - "loss": 0.6943, - "step": 77009 - }, - { - "epoch": 1.97, - "learning_rate": 5.534313269150703e-07, - "loss": 0.6509, - "step": 77010 - }, - { - "epoch": 1.97, - "learning_rate": 5.534065689650708e-07, - "loss": 0.7949, - "step": 77011 - }, - { - "epoch": 1.97, - "learning_rate": 5.533818113570077e-07, - "loss": 0.5728, - "step": 77012 - }, - { - "epoch": 1.97, - "learning_rate": 5.533570540908992e-07, - "loss": 0.7207, - "step": 77013 - }, - { - "epoch": 1.97, - "learning_rate": 5.533322971667646e-07, - "loss": 0.7764, - "step": 77014 - }, - { - "epoch": 1.97, - "learning_rate": 5.533075405846231e-07, - "loss": 0.6572, - "step": 77015 - }, - { - "epoch": 1.97, - "learning_rate": 5.532827843444936e-07, - "loss": 0.6846, - "step": 77016 - }, - { - "epoch": 1.97, - "learning_rate": 5.532580284463947e-07, - "loss": 0.6182, - "step": 77017 - }, - { - "epoch": 1.97, - "learning_rate": 5.532332728903456e-07, - "loss": 0.6431, - "step": 77018 - }, - { - "epoch": 1.97, - "learning_rate": 5.532085176763657e-07, - "loss": 0.5869, - "step": 77019 - }, - { - "epoch": 1.97, - "learning_rate": 5.531837628044728e-07, - "loss": 0.4917, - "step": 77020 - }, - { - "epoch": 1.97, - "learning_rate": 5.531590082746873e-07, - "loss": 0.5366, - "step": 77021 - }, - { - "epoch": 1.97, - "learning_rate": 5.531342540870267e-07, - "loss": 0.5227, - "step": 77022 - }, - { - "epoch": 1.97, - "learning_rate": 5.531095002415109e-07, - "loss": 0.6436, - "step": 77023 - }, - { - "epoch": 1.97, - "learning_rate": 5.530847467381585e-07, - "loss": 0.5994, - "step": 77024 - }, - { - "epoch": 1.97, - "learning_rate": 5.530599935769891e-07, - "loss": 0.4883, - "step": 77025 - }, - { - "epoch": 1.97, - "learning_rate": 5.530352407580206e-07, - "loss": 0.6738, - "step": 77026 - }, - { - "epoch": 1.97, - "learning_rate": 5.530104882812724e-07, - "loss": 0.5015, - "step": 77027 - }, - { - "epoch": 1.97, - "learning_rate": 5.529857361467636e-07, - "loss": 0.6228, - "step": 77028 - }, - { - "epoch": 1.97, - "learning_rate": 5.529609843545137e-07, - "loss": 0.6943, - "step": 77029 - }, - { - "epoch": 1.97, - "learning_rate": 5.529362329045404e-07, - "loss": 0.6206, - "step": 77030 - }, - { - "epoch": 1.97, - "learning_rate": 5.529114817968632e-07, - "loss": 0.7109, - "step": 77031 - }, - { - "epoch": 1.97, - "learning_rate": 5.528867310315013e-07, - "loss": 0.6035, - "step": 77032 - }, - { - "epoch": 1.97, - "learning_rate": 5.528619806084737e-07, - "loss": 0.6953, - "step": 77033 - }, - { - "epoch": 1.97, - "learning_rate": 5.528372305277986e-07, - "loss": 0.7007, - "step": 77034 - }, - { - "epoch": 1.97, - "learning_rate": 5.528124807894957e-07, - "loss": 0.6621, - "step": 77035 - }, - { - "epoch": 1.97, - "learning_rate": 5.527877313935836e-07, - "loss": 0.3552, - "step": 77036 - }, - { - "epoch": 1.97, - "learning_rate": 5.527629823400819e-07, - "loss": 0.6396, - "step": 77037 - }, - { - "epoch": 1.97, - "learning_rate": 5.527382336290085e-07, - "loss": 0.5215, - "step": 77038 - }, - { - "epoch": 1.97, - "learning_rate": 5.527134852603832e-07, - "loss": 0.5703, - "step": 77039 - }, - { - "epoch": 1.97, - "learning_rate": 5.526887372342243e-07, - "loss": 0.5386, - "step": 77040 - }, - { - "epoch": 1.97, - "learning_rate": 5.526639895505511e-07, - "loss": 0.5911, - "step": 77041 - }, - { - "epoch": 1.97, - "learning_rate": 5.52639242209383e-07, - "loss": 0.7334, - "step": 77042 - }, - { - "epoch": 1.97, - "learning_rate": 5.526144952107378e-07, - "loss": 0.519, - "step": 77043 - }, - { - "epoch": 1.97, - "learning_rate": 5.525897485546354e-07, - "loss": 0.5273, - "step": 77044 - }, - { - "epoch": 1.97, - "learning_rate": 5.525650022410943e-07, - "loss": 0.9131, - "step": 77045 - }, - { - "epoch": 1.97, - "learning_rate": 5.52540256270134e-07, - "loss": 0.6465, - "step": 77046 - }, - { - "epoch": 1.97, - "learning_rate": 5.525155106417727e-07, - "loss": 0.4917, - "step": 77047 - }, - { - "epoch": 1.97, - "learning_rate": 5.524907653560297e-07, - "loss": 0.6777, - "step": 77048 - }, - { - "epoch": 1.97, - "learning_rate": 5.524660204129243e-07, - "loss": 0.5942, - "step": 77049 - }, - { - "epoch": 1.97, - "learning_rate": 5.52441275812475e-07, - "loss": 0.7041, - "step": 77050 - }, - { - "epoch": 1.97, - "learning_rate": 5.524165315547007e-07, - "loss": 0.6748, - "step": 77051 - }, - { - "epoch": 1.97, - "learning_rate": 5.523917876396203e-07, - "loss": 0.6562, - "step": 77052 - }, - { - "epoch": 1.97, - "learning_rate": 5.523670440672529e-07, - "loss": 0.8428, - "step": 77053 - }, - { - "epoch": 1.97, - "learning_rate": 5.523423008376179e-07, - "loss": 0.7158, - "step": 77054 - }, - { - "epoch": 1.97, - "learning_rate": 5.523175579507334e-07, - "loss": 0.6919, - "step": 77055 - }, - { - "epoch": 1.97, - "learning_rate": 5.522928154066189e-07, - "loss": 0.5325, - "step": 77056 - }, - { - "epoch": 1.98, - "learning_rate": 5.522680732052932e-07, - "loss": 0.6387, - "step": 77057 - }, - { - "epoch": 1.98, - "learning_rate": 5.522433313467753e-07, - "loss": 0.5669, - "step": 77058 - }, - { - "epoch": 1.98, - "learning_rate": 5.522185898310844e-07, - "loss": 0.668, - "step": 77059 - }, - { - "epoch": 1.98, - "learning_rate": 5.521938486582387e-07, - "loss": 0.6387, - "step": 77060 - }, - { - "epoch": 1.98, - "learning_rate": 5.521691078282576e-07, - "loss": 0.5737, - "step": 77061 - }, - { - "epoch": 1.98, - "learning_rate": 5.5214436734116e-07, - "loss": 0.5684, - "step": 77062 - }, - { - "epoch": 1.98, - "learning_rate": 5.521196271969653e-07, - "loss": 0.834, - "step": 77063 - }, - { - "epoch": 1.98, - "learning_rate": 5.520948873956914e-07, - "loss": 0.5713, - "step": 77064 - }, - { - "epoch": 1.98, - "learning_rate": 5.520701479373582e-07, - "loss": 0.6938, - "step": 77065 - }, - { - "epoch": 1.98, - "learning_rate": 5.52045408821984e-07, - "loss": 0.5295, - "step": 77066 - }, - { - "epoch": 1.98, - "learning_rate": 5.520206700495885e-07, - "loss": 0.5789, - "step": 77067 - }, - { - "epoch": 1.98, - "learning_rate": 5.519959316201898e-07, - "loss": 0.6035, - "step": 77068 - }, - { - "epoch": 1.98, - "learning_rate": 5.519711935338077e-07, - "loss": 0.625, - "step": 77069 - }, - { - "epoch": 1.98, - "learning_rate": 5.519464557904601e-07, - "loss": 0.615, - "step": 77070 - }, - { - "epoch": 1.98, - "learning_rate": 5.51921718390167e-07, - "loss": 0.5249, - "step": 77071 - }, - { - "epoch": 1.98, - "learning_rate": 5.518969813329463e-07, - "loss": 0.6865, - "step": 77072 - }, - { - "epoch": 1.98, - "learning_rate": 5.518722446188178e-07, - "loss": 0.7578, - "step": 77073 - }, - { - "epoch": 1.98, - "learning_rate": 5.518475082477998e-07, - "loss": 0.3537, - "step": 77074 - }, - { - "epoch": 1.98, - "learning_rate": 5.518227722199121e-07, - "loss": 0.5996, - "step": 77075 - }, - { - "epoch": 1.98, - "learning_rate": 5.517980365351727e-07, - "loss": 0.6533, - "step": 77076 - }, - { - "epoch": 1.98, - "learning_rate": 5.517733011936008e-07, - "loss": 0.5376, - "step": 77077 - }, - { - "epoch": 1.98, - "learning_rate": 5.517485661952156e-07, - "loss": 0.5142, - "step": 77078 - }, - { - "epoch": 1.98, - "learning_rate": 5.517238315400363e-07, - "loss": 0.5737, - "step": 77079 - }, - { - "epoch": 1.98, - "learning_rate": 5.516990972280814e-07, - "loss": 0.2742, - "step": 77080 - }, - { - "epoch": 1.98, - "learning_rate": 5.516743632593694e-07, - "loss": 0.6924, - "step": 77081 - }, - { - "epoch": 1.98, - "learning_rate": 5.5164962963392e-07, - "loss": 0.6641, - "step": 77082 - }, - { - "epoch": 1.98, - "learning_rate": 5.516248963517515e-07, - "loss": 0.7725, - "step": 77083 - }, - { - "epoch": 1.98, - "learning_rate": 5.51600163412884e-07, - "loss": 0.6636, - "step": 77084 - }, - { - "epoch": 1.98, - "learning_rate": 5.515754308173351e-07, - "loss": 0.6338, - "step": 77085 - }, - { - "epoch": 1.98, - "learning_rate": 5.515506985651241e-07, - "loss": 0.6235, - "step": 77086 - }, - { - "epoch": 1.98, - "learning_rate": 5.515259666562706e-07, - "loss": 0.5854, - "step": 77087 - }, - { - "epoch": 1.98, - "learning_rate": 5.515012350907926e-07, - "loss": 0.5981, - "step": 77088 - }, - { - "epoch": 1.98, - "learning_rate": 5.5147650386871e-07, - "loss": 0.6416, - "step": 77089 - }, - { - "epoch": 1.98, - "learning_rate": 5.514517729900408e-07, - "loss": 0.5267, - "step": 77090 - }, - { - "epoch": 1.98, - "learning_rate": 5.514270424548044e-07, - "loss": 0.6255, - "step": 77091 - }, - { - "epoch": 1.98, - "learning_rate": 5.514023122630199e-07, - "loss": 0.6206, - "step": 77092 - }, - { - "epoch": 1.98, - "learning_rate": 5.513775824147058e-07, - "loss": 0.6245, - "step": 77093 - }, - { - "epoch": 1.98, - "learning_rate": 5.513528529098812e-07, - "loss": 0.6465, - "step": 77094 - }, - { - "epoch": 1.98, - "learning_rate": 5.51328123748565e-07, - "loss": 0.6904, - "step": 77095 - }, - { - "epoch": 1.98, - "learning_rate": 5.513033949307767e-07, - "loss": 0.6357, - "step": 77096 - }, - { - "epoch": 1.98, - "learning_rate": 5.512786664565343e-07, - "loss": 0.665, - "step": 77097 - }, - { - "epoch": 1.98, - "learning_rate": 5.512539383258574e-07, - "loss": 0.5625, - "step": 77098 - }, - { - "epoch": 1.98, - "learning_rate": 5.512292105387649e-07, - "loss": 0.5713, - "step": 77099 - }, - { - "epoch": 1.98, - "learning_rate": 5.512044830952753e-07, - "loss": 0.6641, - "step": 77100 - }, - { - "epoch": 1.98, - "learning_rate": 5.511797559954081e-07, - "loss": 0.4601, - "step": 77101 - }, - { - "epoch": 1.98, - "learning_rate": 5.511550292391816e-07, - "loss": 0.6196, - "step": 77102 - }, - { - "epoch": 1.98, - "learning_rate": 5.51130302826615e-07, - "loss": 0.5566, - "step": 77103 - }, - { - "epoch": 1.98, - "learning_rate": 5.511055767577277e-07, - "loss": 0.6934, - "step": 77104 - }, - { - "epoch": 1.98, - "learning_rate": 5.510808510325378e-07, - "loss": 0.6201, - "step": 77105 - }, - { - "epoch": 1.98, - "learning_rate": 5.510561256510647e-07, - "loss": 0.7305, - "step": 77106 - }, - { - "epoch": 1.98, - "learning_rate": 5.510314006133272e-07, - "loss": 0.5735, - "step": 77107 - }, - { - "epoch": 1.98, - "learning_rate": 5.510066759193447e-07, - "loss": 0.4673, - "step": 77108 - }, - { - "epoch": 1.98, - "learning_rate": 5.509819515691359e-07, - "loss": 0.6543, - "step": 77109 - }, - { - "epoch": 1.98, - "learning_rate": 5.50957227562719e-07, - "loss": 0.6289, - "step": 77110 - }, - { - "epoch": 1.98, - "learning_rate": 5.509325039001136e-07, - "loss": 0.5212, - "step": 77111 - }, - { - "epoch": 1.98, - "learning_rate": 5.509077805813385e-07, - "loss": 0.5913, - "step": 77112 - }, - { - "epoch": 1.98, - "learning_rate": 5.508830576064131e-07, - "loss": 0.6709, - "step": 77113 - }, - { - "epoch": 1.98, - "learning_rate": 5.508583349753555e-07, - "loss": 0.7549, - "step": 77114 - }, - { - "epoch": 1.98, - "learning_rate": 5.50833612688185e-07, - "loss": 0.582, - "step": 77115 - }, - { - "epoch": 1.98, - "learning_rate": 5.508088907449204e-07, - "loss": 0.6758, - "step": 77116 - }, - { - "epoch": 1.98, - "learning_rate": 5.507841691455815e-07, - "loss": 0.7539, - "step": 77117 - }, - { - "epoch": 1.98, - "learning_rate": 5.507594478901858e-07, - "loss": 0.3563, - "step": 77118 - }, - { - "epoch": 1.98, - "learning_rate": 5.507347269787534e-07, - "loss": 0.7012, - "step": 77119 - }, - { - "epoch": 1.98, - "learning_rate": 5.507100064113025e-07, - "loss": 0.4678, - "step": 77120 - }, - { - "epoch": 1.98, - "learning_rate": 5.506852861878526e-07, - "loss": 0.397, - "step": 77121 - }, - { - "epoch": 1.98, - "learning_rate": 5.506605663084219e-07, - "loss": 0.7407, - "step": 77122 - }, - { - "epoch": 1.98, - "learning_rate": 5.506358467730299e-07, - "loss": 0.6953, - "step": 77123 - }, - { - "epoch": 1.98, - "learning_rate": 5.506111275816951e-07, - "loss": 0.7568, - "step": 77124 - }, - { - "epoch": 1.98, - "learning_rate": 5.505864087344373e-07, - "loss": 0.5464, - "step": 77125 - }, - { - "epoch": 1.98, - "learning_rate": 5.505616902312743e-07, - "loss": 0.6758, - "step": 77126 - }, - { - "epoch": 1.98, - "learning_rate": 5.505369720722257e-07, - "loss": 0.6108, - "step": 77127 - }, - { - "epoch": 1.98, - "learning_rate": 5.505122542573102e-07, - "loss": 0.7305, - "step": 77128 - }, - { - "epoch": 1.98, - "learning_rate": 5.504875367865471e-07, - "loss": 0.7432, - "step": 77129 - }, - { - "epoch": 1.98, - "learning_rate": 5.50462819659955e-07, - "loss": 0.6895, - "step": 77130 - }, - { - "epoch": 1.98, - "learning_rate": 5.504381028775527e-07, - "loss": 0.6514, - "step": 77131 - }, - { - "epoch": 1.98, - "learning_rate": 5.50413386439359e-07, - "loss": 0.6279, - "step": 77132 - }, - { - "epoch": 1.98, - "learning_rate": 5.503886703453933e-07, - "loss": 0.5259, - "step": 77133 - }, - { - "epoch": 1.98, - "learning_rate": 5.503639545956746e-07, - "loss": 0.4927, - "step": 77134 - }, - { - "epoch": 1.98, - "learning_rate": 5.503392391902211e-07, - "loss": 0.6104, - "step": 77135 - }, - { - "epoch": 1.98, - "learning_rate": 5.503145241290524e-07, - "loss": 0.7383, - "step": 77136 - }, - { - "epoch": 1.98, - "learning_rate": 5.50289809412187e-07, - "loss": 0.6978, - "step": 77137 - }, - { - "epoch": 1.98, - "learning_rate": 5.502650950396448e-07, - "loss": 0.6514, - "step": 77138 - }, - { - "epoch": 1.98, - "learning_rate": 5.502403810114433e-07, - "loss": 0.7422, - "step": 77139 - }, - { - "epoch": 1.98, - "learning_rate": 5.50215667327602e-07, - "loss": 0.6777, - "step": 77140 - }, - { - "epoch": 1.98, - "learning_rate": 5.501909539881398e-07, - "loss": 0.6333, - "step": 77141 - }, - { - "epoch": 1.98, - "learning_rate": 5.501662409930761e-07, - "loss": 0.584, - "step": 77142 - }, - { - "epoch": 1.98, - "learning_rate": 5.501415283424291e-07, - "loss": 0.5605, - "step": 77143 - }, - { - "epoch": 1.98, - "learning_rate": 5.501168160362179e-07, - "loss": 0.5718, - "step": 77144 - }, - { - "epoch": 1.98, - "learning_rate": 5.500921040744617e-07, - "loss": 0.8623, - "step": 77145 - }, - { - "epoch": 1.98, - "learning_rate": 5.500673924571797e-07, - "loss": 0.7217, - "step": 77146 - }, - { - "epoch": 1.98, - "learning_rate": 5.5004268118439e-07, - "loss": 0.5684, - "step": 77147 - }, - { - "epoch": 1.98, - "learning_rate": 5.500179702561123e-07, - "loss": 0.709, - "step": 77148 - }, - { - "epoch": 1.98, - "learning_rate": 5.499932596723647e-07, - "loss": 0.7695, - "step": 77149 - }, - { - "epoch": 1.98, - "learning_rate": 5.499685494331667e-07, - "loss": 0.7148, - "step": 77150 - }, - { - "epoch": 1.98, - "learning_rate": 5.499438395385374e-07, - "loss": 0.7236, - "step": 77151 - }, - { - "epoch": 1.98, - "learning_rate": 5.499191299884951e-07, - "loss": 0.7656, - "step": 77152 - }, - { - "epoch": 1.98, - "learning_rate": 5.498944207830589e-07, - "loss": 0.7217, - "step": 77153 - }, - { - "epoch": 1.98, - "learning_rate": 5.498697119222479e-07, - "loss": 0.6143, - "step": 77154 - }, - { - "epoch": 1.98, - "learning_rate": 5.498450034060814e-07, - "loss": 0.5962, - "step": 77155 - }, - { - "epoch": 1.98, - "learning_rate": 5.498202952345774e-07, - "loss": 0.7393, - "step": 77156 - }, - { - "epoch": 1.98, - "learning_rate": 5.497955874077553e-07, - "loss": 0.6816, - "step": 77157 - }, - { - "epoch": 1.98, - "learning_rate": 5.497708799256346e-07, - "loss": 0.5503, - "step": 77158 - }, - { - "epoch": 1.98, - "learning_rate": 5.497461727882334e-07, - "loss": 0.6887, - "step": 77159 - }, - { - "epoch": 1.98, - "learning_rate": 5.497214659955706e-07, - "loss": 0.6182, - "step": 77160 - }, - { - "epoch": 1.98, - "learning_rate": 5.496967595476654e-07, - "loss": 0.5029, - "step": 77161 - }, - { - "epoch": 1.98, - "learning_rate": 5.496720534445365e-07, - "loss": 0.603, - "step": 77162 - }, - { - "epoch": 1.98, - "learning_rate": 5.496473476862035e-07, - "loss": 0.6279, - "step": 77163 - }, - { - "epoch": 1.98, - "learning_rate": 5.496226422726844e-07, - "loss": 0.7422, - "step": 77164 - }, - { - "epoch": 1.98, - "learning_rate": 5.495979372039986e-07, - "loss": 0.6611, - "step": 77165 - }, - { - "epoch": 1.98, - "learning_rate": 5.49573232480165e-07, - "loss": 0.4907, - "step": 77166 - }, - { - "epoch": 1.98, - "learning_rate": 5.495485281012027e-07, - "loss": 0.6152, - "step": 77167 - }, - { - "epoch": 1.98, - "learning_rate": 5.495238240671304e-07, - "loss": 0.5903, - "step": 77168 - }, - { - "epoch": 1.98, - "learning_rate": 5.494991203779666e-07, - "loss": 0.5129, - "step": 77169 - }, - { - "epoch": 1.98, - "learning_rate": 5.494744170337307e-07, - "loss": 0.4463, - "step": 77170 - }, - { - "epoch": 1.98, - "learning_rate": 5.494497140344415e-07, - "loss": 0.3987, - "step": 77171 - }, - { - "epoch": 1.98, - "learning_rate": 5.494250113801183e-07, - "loss": 0.6484, - "step": 77172 - }, - { - "epoch": 1.98, - "learning_rate": 5.494003090707793e-07, - "loss": 0.7236, - "step": 77173 - }, - { - "epoch": 1.98, - "learning_rate": 5.493756071064437e-07, - "loss": 0.5713, - "step": 77174 - }, - { - "epoch": 1.98, - "learning_rate": 5.49350905487131e-07, - "loss": 0.5098, - "step": 77175 - }, - { - "epoch": 1.98, - "learning_rate": 5.49326204212859e-07, - "loss": 0.5698, - "step": 77176 - }, - { - "epoch": 1.98, - "learning_rate": 5.493015032836473e-07, - "loss": 0.6064, - "step": 77177 - }, - { - "epoch": 1.98, - "learning_rate": 5.492768026995152e-07, - "loss": 0.7168, - "step": 77178 - }, - { - "epoch": 1.98, - "learning_rate": 5.492521024604805e-07, - "loss": 0.6475, - "step": 77179 - }, - { - "epoch": 1.98, - "learning_rate": 5.492274025665633e-07, - "loss": 0.6196, - "step": 77180 - }, - { - "epoch": 1.98, - "learning_rate": 5.492027030177816e-07, - "loss": 0.6973, - "step": 77181 - }, - { - "epoch": 1.98, - "learning_rate": 5.491780038141547e-07, - "loss": 0.5511, - "step": 77182 - }, - { - "epoch": 1.98, - "learning_rate": 5.491533049557013e-07, - "loss": 0.6699, - "step": 77183 - }, - { - "epoch": 1.98, - "learning_rate": 5.49128606442441e-07, - "loss": 0.6045, - "step": 77184 - }, - { - "epoch": 1.98, - "learning_rate": 5.491039082743917e-07, - "loss": 0.5703, - "step": 77185 - }, - { - "epoch": 1.98, - "learning_rate": 5.490792104515729e-07, - "loss": 0.5801, - "step": 77186 - }, - { - "epoch": 1.98, - "learning_rate": 5.490545129740033e-07, - "loss": 0.5298, - "step": 77187 - }, - { - "epoch": 1.98, - "learning_rate": 5.490298158417024e-07, - "loss": 0.5967, - "step": 77188 - }, - { - "epoch": 1.98, - "learning_rate": 5.490051190546886e-07, - "loss": 0.5859, - "step": 77189 - }, - { - "epoch": 1.98, - "learning_rate": 5.489804226129805e-07, - "loss": 0.6299, - "step": 77190 - }, - { - "epoch": 1.98, - "learning_rate": 5.489557265165974e-07, - "loss": 0.7109, - "step": 77191 - }, - { - "epoch": 1.98, - "learning_rate": 5.489310307655584e-07, - "loss": 0.4836, - "step": 77192 - }, - { - "epoch": 1.98, - "learning_rate": 5.489063353598818e-07, - "loss": 0.6836, - "step": 77193 - }, - { - "epoch": 1.98, - "learning_rate": 5.48881640299587e-07, - "loss": 0.6348, - "step": 77194 - }, - { - "epoch": 1.98, - "learning_rate": 5.488569455846928e-07, - "loss": 0.7905, - "step": 77195 - }, - { - "epoch": 1.98, - "learning_rate": 5.488322512152184e-07, - "loss": 0.437, - "step": 77196 - }, - { - "epoch": 1.98, - "learning_rate": 5.488075571911818e-07, - "loss": 0.5488, - "step": 77197 - }, - { - "epoch": 1.98, - "learning_rate": 5.487828635126033e-07, - "loss": 0.626, - "step": 77198 - }, - { - "epoch": 1.98, - "learning_rate": 5.487581701795003e-07, - "loss": 0.575, - "step": 77199 - }, - { - "epoch": 1.98, - "learning_rate": 5.487334771918926e-07, - "loss": 0.6533, - "step": 77200 - }, - { - "epoch": 1.98, - "learning_rate": 5.487087845497993e-07, - "loss": 0.4927, - "step": 77201 - }, - { - "epoch": 1.98, - "learning_rate": 5.486840922532385e-07, - "loss": 0.6058, - "step": 77202 - }, - { - "epoch": 1.98, - "learning_rate": 5.486594003022295e-07, - "loss": 0.667, - "step": 77203 - }, - { - "epoch": 1.98, - "learning_rate": 5.486347086967913e-07, - "loss": 0.5737, - "step": 77204 - }, - { - "epoch": 1.98, - "learning_rate": 5.486100174369432e-07, - "loss": 0.573, - "step": 77205 - }, - { - "epoch": 1.98, - "learning_rate": 5.485853265227031e-07, - "loss": 0.7114, - "step": 77206 - }, - { - "epoch": 1.98, - "learning_rate": 5.485606359540907e-07, - "loss": 0.6396, - "step": 77207 - }, - { - "epoch": 1.98, - "learning_rate": 5.485359457311247e-07, - "loss": 0.6475, - "step": 77208 - }, - { - "epoch": 1.98, - "learning_rate": 5.485112558538243e-07, - "loss": 0.6958, - "step": 77209 - }, - { - "epoch": 1.98, - "learning_rate": 5.484865663222076e-07, - "loss": 0.5474, - "step": 77210 - }, - { - "epoch": 1.98, - "learning_rate": 5.484618771362939e-07, - "loss": 0.873, - "step": 77211 - }, - { - "epoch": 1.98, - "learning_rate": 5.484371882961022e-07, - "loss": 0.4346, - "step": 77212 - }, - { - "epoch": 1.98, - "learning_rate": 5.484124998016517e-07, - "loss": 0.7227, - "step": 77213 - }, - { - "epoch": 1.98, - "learning_rate": 5.483878116529608e-07, - "loss": 0.5977, - "step": 77214 - }, - { - "epoch": 1.98, - "learning_rate": 5.483631238500484e-07, - "loss": 0.5269, - "step": 77215 - }, - { - "epoch": 1.98, - "learning_rate": 5.483384363929336e-07, - "loss": 0.5432, - "step": 77216 - }, - { - "epoch": 1.98, - "learning_rate": 5.483137492816357e-07, - "loss": 0.5942, - "step": 77217 - }, - { - "epoch": 1.98, - "learning_rate": 5.482890625161733e-07, - "loss": 0.7549, - "step": 77218 - }, - { - "epoch": 1.98, - "learning_rate": 5.482643760965648e-07, - "loss": 0.4741, - "step": 77219 - }, - { - "epoch": 1.98, - "learning_rate": 5.482396900228294e-07, - "loss": 0.6309, - "step": 77220 - }, - { - "epoch": 1.98, - "learning_rate": 5.48215004294986e-07, - "loss": 0.6533, - "step": 77221 - }, - { - "epoch": 1.98, - "learning_rate": 5.481903189130542e-07, - "loss": 0.7275, - "step": 77222 - }, - { - "epoch": 1.98, - "learning_rate": 5.481656338770519e-07, - "loss": 0.5219, - "step": 77223 - }, - { - "epoch": 1.98, - "learning_rate": 5.481409491869982e-07, - "loss": 0.667, - "step": 77224 - }, - { - "epoch": 1.98, - "learning_rate": 5.481162648429123e-07, - "loss": 0.5431, - "step": 77225 - }, - { - "epoch": 1.98, - "learning_rate": 5.480915808448135e-07, - "loss": 0.5464, - "step": 77226 - }, - { - "epoch": 1.98, - "learning_rate": 5.480668971927196e-07, - "loss": 0.519, - "step": 77227 - }, - { - "epoch": 1.98, - "learning_rate": 5.480422138866507e-07, - "loss": 0.7197, - "step": 77228 - }, - { - "epoch": 1.98, - "learning_rate": 5.480175309266247e-07, - "loss": 0.4556, - "step": 77229 - }, - { - "epoch": 1.98, - "learning_rate": 5.47992848312661e-07, - "loss": 0.6416, - "step": 77230 - }, - { - "epoch": 1.98, - "learning_rate": 5.479681660447782e-07, - "loss": 0.7002, - "step": 77231 - }, - { - "epoch": 1.98, - "learning_rate": 5.479434841229954e-07, - "loss": 0.5225, - "step": 77232 - }, - { - "epoch": 1.98, - "learning_rate": 5.479188025473315e-07, - "loss": 0.7949, - "step": 77233 - }, - { - "epoch": 1.98, - "learning_rate": 5.478941213178057e-07, - "loss": 0.7051, - "step": 77234 - }, - { - "epoch": 1.98, - "learning_rate": 5.478694404344363e-07, - "loss": 0.5889, - "step": 77235 - }, - { - "epoch": 1.98, - "learning_rate": 5.478447598972424e-07, - "loss": 0.5239, - "step": 77236 - }, - { - "epoch": 1.98, - "learning_rate": 5.47820079706243e-07, - "loss": 0.4941, - "step": 77237 - }, - { - "epoch": 1.98, - "learning_rate": 5.477953998614573e-07, - "loss": 0.4749, - "step": 77238 - }, - { - "epoch": 1.98, - "learning_rate": 5.477707203629039e-07, - "loss": 0.6484, - "step": 77239 - }, - { - "epoch": 1.98, - "learning_rate": 5.477460412106014e-07, - "loss": 0.615, - "step": 77240 - }, - { - "epoch": 1.98, - "learning_rate": 5.477213624045689e-07, - "loss": 0.6523, - "step": 77241 - }, - { - "epoch": 1.98, - "learning_rate": 5.476966839448252e-07, - "loss": 0.6406, - "step": 77242 - }, - { - "epoch": 1.98, - "learning_rate": 5.4767200583139e-07, - "loss": 0.666, - "step": 77243 - }, - { - "epoch": 1.98, - "learning_rate": 5.476473280642809e-07, - "loss": 0.3945, - "step": 77244 - }, - { - "epoch": 1.98, - "learning_rate": 5.476226506435176e-07, - "loss": 0.522, - "step": 77245 - }, - { - "epoch": 1.98, - "learning_rate": 5.475979735691187e-07, - "loss": 0.9072, - "step": 77246 - }, - { - "epoch": 1.98, - "learning_rate": 5.475732968411038e-07, - "loss": 0.6826, - "step": 77247 - }, - { - "epoch": 1.98, - "learning_rate": 5.475486204594912e-07, - "loss": 0.6602, - "step": 77248 - }, - { - "epoch": 1.98, - "learning_rate": 5.475239444242993e-07, - "loss": 0.4819, - "step": 77249 - }, - { - "epoch": 1.98, - "learning_rate": 5.474992687355476e-07, - "loss": 0.7246, - "step": 77250 - }, - { - "epoch": 1.98, - "learning_rate": 5.474745933932552e-07, - "loss": 0.511, - "step": 77251 - }, - { - "epoch": 1.98, - "learning_rate": 5.474499183974404e-07, - "loss": 0.751, - "step": 77252 - }, - { - "epoch": 1.98, - "learning_rate": 5.474252437481224e-07, - "loss": 0.6587, - "step": 77253 - }, - { - "epoch": 1.98, - "learning_rate": 5.474005694453199e-07, - "loss": 0.7104, - "step": 77254 - }, - { - "epoch": 1.98, - "learning_rate": 5.473758954890526e-07, - "loss": 0.6289, - "step": 77255 - }, - { - "epoch": 1.98, - "learning_rate": 5.473512218793384e-07, - "loss": 0.5615, - "step": 77256 - }, - { - "epoch": 1.98, - "learning_rate": 5.473265486161963e-07, - "loss": 0.6611, - "step": 77257 - }, - { - "epoch": 1.98, - "learning_rate": 5.473018756996459e-07, - "loss": 0.8057, - "step": 77258 - }, - { - "epoch": 1.98, - "learning_rate": 5.472772031297054e-07, - "loss": 0.6147, - "step": 77259 - }, - { - "epoch": 1.98, - "learning_rate": 5.472525309063942e-07, - "loss": 0.7168, - "step": 77260 - }, - { - "epoch": 1.98, - "learning_rate": 5.472278590297306e-07, - "loss": 0.3347, - "step": 77261 - }, - { - "epoch": 1.98, - "learning_rate": 5.472031874997338e-07, - "loss": 0.6719, - "step": 77262 - }, - { - "epoch": 1.98, - "learning_rate": 5.471785163164226e-07, - "loss": 0.4277, - "step": 77263 - }, - { - "epoch": 1.98, - "learning_rate": 5.471538454798165e-07, - "loss": 0.5652, - "step": 77264 - }, - { - "epoch": 1.98, - "learning_rate": 5.471291749899335e-07, - "loss": 0.5962, - "step": 77265 - }, - { - "epoch": 1.98, - "learning_rate": 5.471045048467929e-07, - "loss": 0.6362, - "step": 77266 - }, - { - "epoch": 1.98, - "learning_rate": 5.470798350504137e-07, - "loss": 0.4558, - "step": 77267 - }, - { - "epoch": 1.98, - "learning_rate": 5.470551656008149e-07, - "loss": 0.5801, - "step": 77268 - }, - { - "epoch": 1.98, - "learning_rate": 5.470304964980146e-07, - "loss": 0.5273, - "step": 77269 - }, - { - "epoch": 1.98, - "learning_rate": 5.470058277420323e-07, - "loss": 0.5122, - "step": 77270 - }, - { - "epoch": 1.98, - "learning_rate": 5.469811593328868e-07, - "loss": 0.6997, - "step": 77271 - }, - { - "epoch": 1.98, - "learning_rate": 5.469564912705973e-07, - "loss": 0.6836, - "step": 77272 - }, - { - "epoch": 1.98, - "learning_rate": 5.469318235551821e-07, - "loss": 0.6272, - "step": 77273 - }, - { - "epoch": 1.98, - "learning_rate": 5.469071561866603e-07, - "loss": 0.6699, - "step": 77274 - }, - { - "epoch": 1.98, - "learning_rate": 5.468824891650508e-07, - "loss": 0.6797, - "step": 77275 - }, - { - "epoch": 1.98, - "learning_rate": 5.46857822490373e-07, - "loss": 0.7012, - "step": 77276 - }, - { - "epoch": 1.98, - "learning_rate": 5.46833156162645e-07, - "loss": 0.7646, - "step": 77277 - }, - { - "epoch": 1.98, - "learning_rate": 5.468084901818863e-07, - "loss": 0.834, - "step": 77278 - }, - { - "epoch": 1.98, - "learning_rate": 5.467838245481153e-07, - "loss": 0.7871, - "step": 77279 - }, - { - "epoch": 1.98, - "learning_rate": 5.467591592613509e-07, - "loss": 0.5361, - "step": 77280 - }, - { - "epoch": 1.98, - "learning_rate": 5.467344943216127e-07, - "loss": 0.8242, - "step": 77281 - }, - { - "epoch": 1.98, - "learning_rate": 5.467098297289185e-07, - "loss": 0.6738, - "step": 77282 - }, - { - "epoch": 1.98, - "learning_rate": 5.466851654832878e-07, - "loss": 0.6277, - "step": 77283 - }, - { - "epoch": 1.98, - "learning_rate": 5.466605015847398e-07, - "loss": 0.5669, - "step": 77284 - }, - { - "epoch": 1.98, - "learning_rate": 5.466358380332927e-07, - "loss": 0.6284, - "step": 77285 - }, - { - "epoch": 1.98, - "learning_rate": 5.466111748289657e-07, - "loss": 0.5552, - "step": 77286 - }, - { - "epoch": 1.98, - "learning_rate": 5.465865119717777e-07, - "loss": 0.6328, - "step": 77287 - }, - { - "epoch": 1.98, - "learning_rate": 5.465618494617478e-07, - "loss": 0.5496, - "step": 77288 - }, - { - "epoch": 1.98, - "learning_rate": 5.465371872988946e-07, - "loss": 0.7148, - "step": 77289 - }, - { - "epoch": 1.98, - "learning_rate": 5.465125254832368e-07, - "loss": 0.6289, - "step": 77290 - }, - { - "epoch": 1.98, - "learning_rate": 5.464878640147935e-07, - "loss": 0.5825, - "step": 77291 - }, - { - "epoch": 1.98, - "learning_rate": 5.464632028935837e-07, - "loss": 0.5264, - "step": 77292 - }, - { - "epoch": 1.98, - "learning_rate": 5.464385421196263e-07, - "loss": 0.5437, - "step": 77293 - }, - { - "epoch": 1.98, - "learning_rate": 5.464138816929398e-07, - "loss": 0.5386, - "step": 77294 - }, - { - "epoch": 1.98, - "learning_rate": 5.463892216135433e-07, - "loss": 0.5276, - "step": 77295 - }, - { - "epoch": 1.98, - "learning_rate": 5.463645618814557e-07, - "loss": 0.4785, - "step": 77296 - }, - { - "epoch": 1.98, - "learning_rate": 5.463399024966964e-07, - "loss": 0.7207, - "step": 77297 - }, - { - "epoch": 1.98, - "learning_rate": 5.463152434592836e-07, - "loss": 0.4358, - "step": 77298 - }, - { - "epoch": 1.98, - "learning_rate": 5.46290584769236e-07, - "loss": 0.6938, - "step": 77299 - }, - { - "epoch": 1.98, - "learning_rate": 5.46265926426573e-07, - "loss": 0.4707, - "step": 77300 - }, - { - "epoch": 1.98, - "learning_rate": 5.462412684313136e-07, - "loss": 0.5117, - "step": 77301 - }, - { - "epoch": 1.98, - "learning_rate": 5.462166107834759e-07, - "loss": 0.6953, - "step": 77302 - }, - { - "epoch": 1.98, - "learning_rate": 5.461919534830795e-07, - "loss": 0.6235, - "step": 77303 - }, - { - "epoch": 1.98, - "learning_rate": 5.461672965301428e-07, - "loss": 0.7969, - "step": 77304 - }, - { - "epoch": 1.98, - "learning_rate": 5.461426399246856e-07, - "loss": 0.4142, - "step": 77305 - }, - { - "epoch": 1.98, - "learning_rate": 5.461179836667254e-07, - "loss": 0.7871, - "step": 77306 - }, - { - "epoch": 1.98, - "learning_rate": 5.46093327756282e-07, - "loss": 0.6235, - "step": 77307 - }, - { - "epoch": 1.98, - "learning_rate": 5.460686721933745e-07, - "loss": 0.6377, - "step": 77308 - }, - { - "epoch": 1.98, - "learning_rate": 5.460440169780208e-07, - "loss": 0.5347, - "step": 77309 - }, - { - "epoch": 1.98, - "learning_rate": 5.460193621102409e-07, - "loss": 0.5886, - "step": 77310 - }, - { - "epoch": 1.98, - "learning_rate": 5.459947075900526e-07, - "loss": 0.5557, - "step": 77311 - }, - { - "epoch": 1.98, - "learning_rate": 5.459700534174752e-07, - "loss": 0.562, - "step": 77312 - }, - { - "epoch": 1.98, - "learning_rate": 5.459453995925278e-07, - "loss": 0.6133, - "step": 77313 - }, - { - "epoch": 1.98, - "learning_rate": 5.459207461152294e-07, - "loss": 0.6499, - "step": 77314 - }, - { - "epoch": 1.98, - "learning_rate": 5.458960929855983e-07, - "loss": 0.7529, - "step": 77315 - }, - { - "epoch": 1.98, - "learning_rate": 5.458714402036536e-07, - "loss": 0.4699, - "step": 77316 - }, - { - "epoch": 1.98, - "learning_rate": 5.458467877694144e-07, - "loss": 0.6885, - "step": 77317 - }, - { - "epoch": 1.98, - "learning_rate": 5.458221356829001e-07, - "loss": 0.5562, - "step": 77318 - }, - { - "epoch": 1.98, - "learning_rate": 5.457974839441281e-07, - "loss": 0.52, - "step": 77319 - }, - { - "epoch": 1.98, - "learning_rate": 5.457728325531181e-07, - "loss": 0.353, - "step": 77320 - }, - { - "epoch": 1.98, - "learning_rate": 5.457481815098889e-07, - "loss": 0.7314, - "step": 77321 - }, - { - "epoch": 1.98, - "learning_rate": 5.457235308144601e-07, - "loss": 0.5615, - "step": 77322 - }, - { - "epoch": 1.98, - "learning_rate": 5.456988804668492e-07, - "loss": 0.7217, - "step": 77323 - }, - { - "epoch": 1.98, - "learning_rate": 5.456742304670759e-07, - "loss": 0.6582, - "step": 77324 - }, - { - "epoch": 1.98, - "learning_rate": 5.45649580815159e-07, - "loss": 0.5679, - "step": 77325 - }, - { - "epoch": 1.98, - "learning_rate": 5.456249315111177e-07, - "loss": 0.8516, - "step": 77326 - }, - { - "epoch": 1.98, - "learning_rate": 5.4560028255497e-07, - "loss": 0.6992, - "step": 77327 - }, - { - "epoch": 1.98, - "learning_rate": 5.455756339467356e-07, - "loss": 0.48, - "step": 77328 - }, - { - "epoch": 1.98, - "learning_rate": 5.455509856864328e-07, - "loss": 0.7217, - "step": 77329 - }, - { - "epoch": 1.98, - "learning_rate": 5.455263377740809e-07, - "loss": 0.707, - "step": 77330 - }, - { - "epoch": 1.98, - "learning_rate": 5.455016902096987e-07, - "loss": 0.4633, - "step": 77331 - }, - { - "epoch": 1.98, - "learning_rate": 5.454770429933047e-07, - "loss": 0.519, - "step": 77332 - }, - { - "epoch": 1.98, - "learning_rate": 5.454523961249179e-07, - "loss": 0.5396, - "step": 77333 - }, - { - "epoch": 1.98, - "learning_rate": 5.454277496045573e-07, - "loss": 0.5693, - "step": 77334 - }, - { - "epoch": 1.98, - "learning_rate": 5.454031034322424e-07, - "loss": 0.5283, - "step": 77335 - }, - { - "epoch": 1.98, - "learning_rate": 5.453784576079907e-07, - "loss": 0.3632, - "step": 77336 - }, - { - "epoch": 1.98, - "learning_rate": 5.453538121318221e-07, - "loss": 0.7744, - "step": 77337 - }, - { - "epoch": 1.98, - "learning_rate": 5.453291670037554e-07, - "loss": 0.6377, - "step": 77338 - }, - { - "epoch": 1.98, - "learning_rate": 5.453045222238093e-07, - "loss": 0.5151, - "step": 77339 - }, - { - "epoch": 1.98, - "learning_rate": 5.452798777920022e-07, - "loss": 0.7715, - "step": 77340 - }, - { - "epoch": 1.98, - "learning_rate": 5.452552337083536e-07, - "loss": 0.563, - "step": 77341 - }, - { - "epoch": 1.98, - "learning_rate": 5.452305899728819e-07, - "loss": 0.4612, - "step": 77342 - }, - { - "epoch": 1.98, - "learning_rate": 5.452059465856067e-07, - "loss": 0.7334, - "step": 77343 - }, - { - "epoch": 1.98, - "learning_rate": 5.45181303546546e-07, - "loss": 0.6616, - "step": 77344 - }, - { - "epoch": 1.98, - "learning_rate": 5.451566608557191e-07, - "loss": 0.6699, - "step": 77345 - }, - { - "epoch": 1.98, - "learning_rate": 5.451320185131447e-07, - "loss": 0.5947, - "step": 77346 - }, - { - "epoch": 1.98, - "learning_rate": 5.451073765188424e-07, - "loss": 0.5708, - "step": 77347 - }, - { - "epoch": 1.98, - "learning_rate": 5.450827348728304e-07, - "loss": 0.4886, - "step": 77348 - }, - { - "epoch": 1.98, - "learning_rate": 5.450580935751271e-07, - "loss": 0.7783, - "step": 77349 - }, - { - "epoch": 1.98, - "learning_rate": 5.45033452625752e-07, - "loss": 0.6143, - "step": 77350 - }, - { - "epoch": 1.98, - "learning_rate": 5.450088120247238e-07, - "loss": 0.5083, - "step": 77351 - }, - { - "epoch": 1.98, - "learning_rate": 5.44984171772062e-07, - "loss": 0.8047, - "step": 77352 - }, - { - "epoch": 1.98, - "learning_rate": 5.449595318677844e-07, - "loss": 0.627, - "step": 77353 - }, - { - "epoch": 1.98, - "learning_rate": 5.449348923119104e-07, - "loss": 0.7021, - "step": 77354 - }, - { - "epoch": 1.98, - "learning_rate": 5.449102531044592e-07, - "loss": 0.5977, - "step": 77355 - }, - { - "epoch": 1.98, - "learning_rate": 5.448856142454487e-07, - "loss": 0.6084, - "step": 77356 - }, - { - "epoch": 1.98, - "learning_rate": 5.448609757348986e-07, - "loss": 0.6699, - "step": 77357 - }, - { - "epoch": 1.98, - "learning_rate": 5.448363375728279e-07, - "loss": 0.6675, - "step": 77358 - }, - { - "epoch": 1.98, - "learning_rate": 5.448116997592546e-07, - "loss": 0.6724, - "step": 77359 - }, - { - "epoch": 1.98, - "learning_rate": 5.447870622941985e-07, - "loss": 0.4236, - "step": 77360 - }, - { - "epoch": 1.98, - "learning_rate": 5.447624251776777e-07, - "loss": 0.8408, - "step": 77361 - }, - { - "epoch": 1.98, - "learning_rate": 5.447377884097112e-07, - "loss": 0.5161, - "step": 77362 - }, - { - "epoch": 1.98, - "learning_rate": 5.447131519903181e-07, - "loss": 0.543, - "step": 77363 - }, - { - "epoch": 1.98, - "learning_rate": 5.446885159195176e-07, - "loss": 0.7373, - "step": 77364 - }, - { - "epoch": 1.98, - "learning_rate": 5.446638801973278e-07, - "loss": 0.6094, - "step": 77365 - }, - { - "epoch": 1.98, - "learning_rate": 5.44639244823768e-07, - "loss": 0.6306, - "step": 77366 - }, - { - "epoch": 1.98, - "learning_rate": 5.446146097988569e-07, - "loss": 0.4473, - "step": 77367 - }, - { - "epoch": 1.98, - "learning_rate": 5.445899751226139e-07, - "loss": 0.6313, - "step": 77368 - }, - { - "epoch": 1.98, - "learning_rate": 5.445653407950574e-07, - "loss": 0.585, - "step": 77369 - }, - { - "epoch": 1.98, - "learning_rate": 5.445407068162058e-07, - "loss": 0.4501, - "step": 77370 - }, - { - "epoch": 1.98, - "learning_rate": 5.445160731860785e-07, - "loss": 0.6494, - "step": 77371 - }, - { - "epoch": 1.98, - "learning_rate": 5.444914399046947e-07, - "loss": 0.7041, - "step": 77372 - }, - { - "epoch": 1.98, - "learning_rate": 5.444668069720726e-07, - "loss": 0.5259, - "step": 77373 - }, - { - "epoch": 1.98, - "learning_rate": 5.444421743882311e-07, - "loss": 0.6577, - "step": 77374 - }, - { - "epoch": 1.98, - "learning_rate": 5.444175421531893e-07, - "loss": 0.6504, - "step": 77375 - }, - { - "epoch": 1.98, - "learning_rate": 5.443929102669666e-07, - "loss": 0.5508, - "step": 77376 - }, - { - "epoch": 1.98, - "learning_rate": 5.443682787295808e-07, - "loss": 0.8145, - "step": 77377 - }, - { - "epoch": 1.98, - "learning_rate": 5.443436475410517e-07, - "loss": 0.707, - "step": 77378 - }, - { - "epoch": 1.98, - "learning_rate": 5.443190167013972e-07, - "loss": 0.6587, - "step": 77379 - }, - { - "epoch": 1.98, - "learning_rate": 5.442943862106369e-07, - "loss": 0.5723, - "step": 77380 - }, - { - "epoch": 1.98, - "learning_rate": 5.442697560687897e-07, - "loss": 0.4524, - "step": 77381 - }, - { - "epoch": 1.98, - "learning_rate": 5.442451262758737e-07, - "loss": 0.542, - "step": 77382 - }, - { - "epoch": 1.98, - "learning_rate": 5.442204968319084e-07, - "loss": 0.6111, - "step": 77383 - }, - { - "epoch": 1.98, - "learning_rate": 5.441958677369124e-07, - "loss": 0.6377, - "step": 77384 - }, - { - "epoch": 1.98, - "learning_rate": 5.44171238990905e-07, - "loss": 0.6572, - "step": 77385 - }, - { - "epoch": 1.98, - "learning_rate": 5.441466105939046e-07, - "loss": 0.7783, - "step": 77386 - }, - { - "epoch": 1.98, - "learning_rate": 5.4412198254593e-07, - "loss": 0.6172, - "step": 77387 - }, - { - "epoch": 1.98, - "learning_rate": 5.440973548470006e-07, - "loss": 0.5981, - "step": 77388 - }, - { - "epoch": 1.98, - "learning_rate": 5.440727274971348e-07, - "loss": 0.5089, - "step": 77389 - }, - { - "epoch": 1.98, - "learning_rate": 5.440481004963515e-07, - "loss": 0.4863, - "step": 77390 - }, - { - "epoch": 1.98, - "learning_rate": 5.440234738446693e-07, - "loss": 0.5737, - "step": 77391 - }, - { - "epoch": 1.98, - "learning_rate": 5.439988475421075e-07, - "loss": 0.7559, - "step": 77392 - }, - { - "epoch": 1.98, - "learning_rate": 5.439742215886851e-07, - "loss": 0.6089, - "step": 77393 - }, - { - "epoch": 1.98, - "learning_rate": 5.439495959844203e-07, - "loss": 0.5903, - "step": 77394 - }, - { - "epoch": 1.98, - "learning_rate": 5.439249707293324e-07, - "loss": 0.5654, - "step": 77395 - }, - { - "epoch": 1.98, - "learning_rate": 5.439003458234401e-07, - "loss": 0.5693, - "step": 77396 - }, - { - "epoch": 1.98, - "learning_rate": 5.438757212667629e-07, - "loss": 0.6123, - "step": 77397 - }, - { - "epoch": 1.98, - "learning_rate": 5.438510970593188e-07, - "loss": 0.5398, - "step": 77398 - }, - { - "epoch": 1.98, - "learning_rate": 5.438264732011268e-07, - "loss": 0.6758, - "step": 77399 - }, - { - "epoch": 1.98, - "learning_rate": 5.438018496922059e-07, - "loss": 0.6611, - "step": 77400 - }, - { - "epoch": 1.98, - "learning_rate": 5.437772265325748e-07, - "loss": 0.6641, - "step": 77401 - }, - { - "epoch": 1.98, - "learning_rate": 5.437526037222528e-07, - "loss": 0.5757, - "step": 77402 - }, - { - "epoch": 1.98, - "learning_rate": 5.437279812612583e-07, - "loss": 0.7539, - "step": 77403 - }, - { - "epoch": 1.98, - "learning_rate": 5.437033591496101e-07, - "loss": 0.667, - "step": 77404 - }, - { - "epoch": 1.98, - "learning_rate": 5.436787373873276e-07, - "loss": 0.6953, - "step": 77405 - }, - { - "epoch": 1.98, - "learning_rate": 5.436541159744293e-07, - "loss": 0.4512, - "step": 77406 - }, - { - "epoch": 1.98, - "learning_rate": 5.436294949109339e-07, - "loss": 0.6777, - "step": 77407 - }, - { - "epoch": 1.98, - "learning_rate": 5.436048741968606e-07, - "loss": 0.5339, - "step": 77408 - }, - { - "epoch": 1.98, - "learning_rate": 5.435802538322278e-07, - "loss": 0.5557, - "step": 77409 - }, - { - "epoch": 1.98, - "learning_rate": 5.43555633817055e-07, - "loss": 0.8867, - "step": 77410 - }, - { - "epoch": 1.98, - "learning_rate": 5.435310141513604e-07, - "loss": 0.6113, - "step": 77411 - }, - { - "epoch": 1.98, - "learning_rate": 5.43506394835163e-07, - "loss": 0.8477, - "step": 77412 - }, - { - "epoch": 1.98, - "learning_rate": 5.434817758684818e-07, - "loss": 0.6431, - "step": 77413 - }, - { - "epoch": 1.98, - "learning_rate": 5.434571572513359e-07, - "loss": 0.8354, - "step": 77414 - }, - { - "epoch": 1.98, - "learning_rate": 5.434325389837436e-07, - "loss": 0.6123, - "step": 77415 - }, - { - "epoch": 1.98, - "learning_rate": 5.434079210657238e-07, - "loss": 0.7852, - "step": 77416 - }, - { - "epoch": 1.98, - "learning_rate": 5.433833034972957e-07, - "loss": 0.6328, - "step": 77417 - }, - { - "epoch": 1.98, - "learning_rate": 5.433586862784785e-07, - "loss": 0.6323, - "step": 77418 - }, - { - "epoch": 1.98, - "learning_rate": 5.433340694092905e-07, - "loss": 0.5576, - "step": 77419 - }, - { - "epoch": 1.98, - "learning_rate": 5.433094528897501e-07, - "loss": 0.363, - "step": 77420 - }, - { - "epoch": 1.98, - "learning_rate": 5.432848367198768e-07, - "loss": 0.3209, - "step": 77421 - }, - { - "epoch": 1.98, - "learning_rate": 5.432602208996891e-07, - "loss": 0.7588, - "step": 77422 - }, - { - "epoch": 1.98, - "learning_rate": 5.432356054292067e-07, - "loss": 0.6719, - "step": 77423 - }, - { - "epoch": 1.98, - "learning_rate": 5.432109903084471e-07, - "loss": 0.7026, - "step": 77424 - }, - { - "epoch": 1.98, - "learning_rate": 5.431863755374302e-07, - "loss": 0.6621, - "step": 77425 - }, - { - "epoch": 1.98, - "learning_rate": 5.431617611161742e-07, - "loss": 0.5767, - "step": 77426 - }, - { - "epoch": 1.98, - "learning_rate": 5.431371470446987e-07, - "loss": 0.6724, - "step": 77427 - }, - { - "epoch": 1.98, - "learning_rate": 5.431125333230222e-07, - "loss": 0.4878, - "step": 77428 - }, - { - "epoch": 1.98, - "learning_rate": 5.430879199511629e-07, - "loss": 0.4692, - "step": 77429 - }, - { - "epoch": 1.98, - "learning_rate": 5.430633069291401e-07, - "loss": 0.582, - "step": 77430 - }, - { - "epoch": 1.98, - "learning_rate": 5.430386942569734e-07, - "loss": 0.6279, - "step": 77431 - }, - { - "epoch": 1.98, - "learning_rate": 5.430140819346803e-07, - "loss": 0.6597, - "step": 77432 - }, - { - "epoch": 1.98, - "learning_rate": 5.429894699622803e-07, - "loss": 0.5659, - "step": 77433 - }, - { - "epoch": 1.98, - "learning_rate": 5.429648583397924e-07, - "loss": 0.5488, - "step": 77434 - }, - { - "epoch": 1.98, - "learning_rate": 5.429402470672356e-07, - "loss": 0.6748, - "step": 77435 - }, - { - "epoch": 1.98, - "learning_rate": 5.429156361446281e-07, - "loss": 0.5913, - "step": 77436 - }, - { - "epoch": 1.98, - "learning_rate": 5.428910255719894e-07, - "loss": 0.7842, - "step": 77437 - }, - { - "epoch": 1.98, - "learning_rate": 5.428664153493376e-07, - "loss": 0.6484, - "step": 77438 - }, - { - "epoch": 1.98, - "learning_rate": 5.428418054766921e-07, - "loss": 0.573, - "step": 77439 - }, - { - "epoch": 1.98, - "learning_rate": 5.428171959540719e-07, - "loss": 0.5605, - "step": 77440 - }, - { - "epoch": 1.98, - "learning_rate": 5.427925867814953e-07, - "loss": 0.5916, - "step": 77441 - }, - { - "epoch": 1.98, - "learning_rate": 5.427679779589812e-07, - "loss": 0.6133, - "step": 77442 - }, - { - "epoch": 1.98, - "learning_rate": 5.427433694865487e-07, - "loss": 0.6982, - "step": 77443 - }, - { - "epoch": 1.98, - "learning_rate": 5.427187613642171e-07, - "loss": 0.7188, - "step": 77444 - }, - { - "epoch": 1.98, - "learning_rate": 5.426941535920042e-07, - "loss": 0.71, - "step": 77445 - }, - { - "epoch": 1.98, - "learning_rate": 5.426695461699293e-07, - "loss": 0.3694, - "step": 77446 - }, - { - "epoch": 1.99, - "learning_rate": 5.426449390980118e-07, - "loss": 0.6313, - "step": 77447 - }, - { - "epoch": 1.99, - "learning_rate": 5.4262033237627e-07, - "loss": 0.4385, - "step": 77448 - }, - { - "epoch": 1.99, - "learning_rate": 5.425957260047225e-07, - "loss": 0.6245, - "step": 77449 - }, - { - "epoch": 1.99, - "learning_rate": 5.425711199833883e-07, - "loss": 0.7266, - "step": 77450 - }, - { - "epoch": 1.99, - "learning_rate": 5.425465143122863e-07, - "loss": 0.4424, - "step": 77451 - }, - { - "epoch": 1.99, - "learning_rate": 5.425219089914359e-07, - "loss": 0.6465, - "step": 77452 - }, - { - "epoch": 1.99, - "learning_rate": 5.42497304020855e-07, - "loss": 0.5132, - "step": 77453 - }, - { - "epoch": 1.99, - "learning_rate": 5.424726994005628e-07, - "loss": 0.646, - "step": 77454 - }, - { - "epoch": 1.99, - "learning_rate": 5.424480951305783e-07, - "loss": 0.6699, - "step": 77455 - }, - { - "epoch": 1.99, - "learning_rate": 5.424234912109207e-07, - "loss": 0.6196, - "step": 77456 - }, - { - "epoch": 1.99, - "learning_rate": 5.423988876416084e-07, - "loss": 0.6768, - "step": 77457 - }, - { - "epoch": 1.99, - "learning_rate": 5.423742844226598e-07, - "loss": 0.2644, - "step": 77458 - }, - { - "epoch": 1.99, - "learning_rate": 5.423496815540942e-07, - "loss": 0.6118, - "step": 77459 - }, - { - "epoch": 1.99, - "learning_rate": 5.423250790359304e-07, - "loss": 0.406, - "step": 77460 - }, - { - "epoch": 1.99, - "learning_rate": 5.423004768681876e-07, - "loss": 0.6328, - "step": 77461 - }, - { - "epoch": 1.99, - "learning_rate": 5.422758750508838e-07, - "loss": 0.7812, - "step": 77462 - }, - { - "epoch": 1.99, - "learning_rate": 5.422512735840384e-07, - "loss": 0.5962, - "step": 77463 - }, - { - "epoch": 1.99, - "learning_rate": 5.422266724676706e-07, - "loss": 0.3366, - "step": 77464 - }, - { - "epoch": 1.99, - "learning_rate": 5.422020717017983e-07, - "loss": 0.7158, - "step": 77465 - }, - { - "epoch": 1.99, - "learning_rate": 5.421774712864409e-07, - "loss": 0.5972, - "step": 77466 - }, - { - "epoch": 1.99, - "learning_rate": 5.421528712216175e-07, - "loss": 0.5586, - "step": 77467 - }, - { - "epoch": 1.99, - "learning_rate": 5.421282715073462e-07, - "loss": 0.6738, - "step": 77468 - }, - { - "epoch": 1.99, - "learning_rate": 5.421036721436466e-07, - "loss": 0.6587, - "step": 77469 - }, - { - "epoch": 1.99, - "learning_rate": 5.420790731305368e-07, - "loss": 0.7188, - "step": 77470 - }, - { - "epoch": 1.99, - "learning_rate": 5.42054474468036e-07, - "loss": 0.5344, - "step": 77471 - }, - { - "epoch": 1.99, - "learning_rate": 5.42029876156163e-07, - "loss": 0.5662, - "step": 77472 - }, - { - "epoch": 1.99, - "learning_rate": 5.420052781949372e-07, - "loss": 0.5908, - "step": 77473 - }, - { - "epoch": 1.99, - "learning_rate": 5.419806805843763e-07, - "loss": 0.4761, - "step": 77474 - }, - { - "epoch": 1.99, - "learning_rate": 5.419560833244999e-07, - "loss": 0.6782, - "step": 77475 - }, - { - "epoch": 1.99, - "learning_rate": 5.419314864153266e-07, - "loss": 0.708, - "step": 77476 - }, - { - "epoch": 1.99, - "learning_rate": 5.419068898568757e-07, - "loss": 0.5996, - "step": 77477 - }, - { - "epoch": 1.99, - "learning_rate": 5.418822936491656e-07, - "loss": 0.5894, - "step": 77478 - }, - { - "epoch": 1.99, - "learning_rate": 5.418576977922149e-07, - "loss": 0.6924, - "step": 77479 - }, - { - "epoch": 1.99, - "learning_rate": 5.418331022860426e-07, - "loss": 0.7471, - "step": 77480 - }, - { - "epoch": 1.99, - "learning_rate": 5.41808507130668e-07, - "loss": 0.5391, - "step": 77481 - }, - { - "epoch": 1.99, - "learning_rate": 5.417839123261091e-07, - "loss": 0.7324, - "step": 77482 - }, - { - "epoch": 1.99, - "learning_rate": 5.417593178723852e-07, - "loss": 0.5864, - "step": 77483 - }, - { - "epoch": 1.99, - "learning_rate": 5.417347237695152e-07, - "loss": 0.4648, - "step": 77484 - }, - { - "epoch": 1.99, - "learning_rate": 5.417101300175182e-07, - "loss": 0.7354, - "step": 77485 - }, - { - "epoch": 1.99, - "learning_rate": 5.416855366164123e-07, - "loss": 0.6997, - "step": 77486 - }, - { - "epoch": 1.99, - "learning_rate": 5.416609435662172e-07, - "loss": 0.6777, - "step": 77487 - }, - { - "epoch": 1.99, - "learning_rate": 5.416363508669508e-07, - "loss": 0.6382, - "step": 77488 - }, - { - "epoch": 1.99, - "learning_rate": 5.416117585186324e-07, - "loss": 0.6357, - "step": 77489 - }, - { - "epoch": 1.99, - "learning_rate": 5.41587166521281e-07, - "loss": 0.5415, - "step": 77490 - }, - { - "epoch": 1.99, - "learning_rate": 5.415625748749151e-07, - "loss": 0.6348, - "step": 77491 - }, - { - "epoch": 1.99, - "learning_rate": 5.415379835795534e-07, - "loss": 0.5791, - "step": 77492 - }, - { - "epoch": 1.99, - "learning_rate": 5.415133926352151e-07, - "loss": 0.457, - "step": 77493 - }, - { - "epoch": 1.99, - "learning_rate": 5.414888020419193e-07, - "loss": 0.5962, - "step": 77494 - }, - { - "epoch": 1.99, - "learning_rate": 5.414642117996841e-07, - "loss": 0.7637, - "step": 77495 - }, - { - "epoch": 1.99, - "learning_rate": 5.414396219085287e-07, - "loss": 0.7871, - "step": 77496 - }, - { - "epoch": 1.99, - "learning_rate": 5.414150323684721e-07, - "loss": 0.5674, - "step": 77497 - }, - { - "epoch": 1.99, - "learning_rate": 5.41390443179533e-07, - "loss": 0.4844, - "step": 77498 - }, - { - "epoch": 1.99, - "learning_rate": 5.413658543417299e-07, - "loss": 0.572, - "step": 77499 - }, - { - "epoch": 1.99, - "learning_rate": 5.413412658550818e-07, - "loss": 0.5977, - "step": 77500 - }, - { - "epoch": 1.99, - "learning_rate": 5.413166777196076e-07, - "loss": 0.6475, - "step": 77501 - }, - { - "epoch": 1.99, - "learning_rate": 5.412920899353264e-07, - "loss": 0.6367, - "step": 77502 - }, - { - "epoch": 1.99, - "learning_rate": 5.412675025022565e-07, - "loss": 0.6494, - "step": 77503 - }, - { - "epoch": 1.99, - "learning_rate": 5.41242915420417e-07, - "loss": 0.5537, - "step": 77504 - }, - { - "epoch": 1.99, - "learning_rate": 5.412183286898266e-07, - "loss": 0.7959, - "step": 77505 - }, - { - "epoch": 1.99, - "learning_rate": 5.411937423105047e-07, - "loss": 0.5447, - "step": 77506 - }, - { - "epoch": 1.99, - "learning_rate": 5.411691562824696e-07, - "loss": 0.5601, - "step": 77507 - }, - { - "epoch": 1.99, - "learning_rate": 5.411445706057398e-07, - "loss": 0.5403, - "step": 77508 - }, - { - "epoch": 1.99, - "learning_rate": 5.411199852803345e-07, - "loss": 0.5043, - "step": 77509 - }, - { - "epoch": 1.99, - "learning_rate": 5.410954003062725e-07, - "loss": 0.4541, - "step": 77510 - }, - { - "epoch": 1.99, - "learning_rate": 5.410708156835732e-07, - "loss": 0.4397, - "step": 77511 - }, - { - "epoch": 1.99, - "learning_rate": 5.410462314122544e-07, - "loss": 0.562, - "step": 77512 - }, - { - "epoch": 1.99, - "learning_rate": 5.410216474923352e-07, - "loss": 0.6943, - "step": 77513 - }, - { - "epoch": 1.99, - "learning_rate": 5.409970639238348e-07, - "loss": 0.6177, - "step": 77514 - }, - { - "epoch": 1.99, - "learning_rate": 5.409724807067723e-07, - "loss": 0.6377, - "step": 77515 - }, - { - "epoch": 1.99, - "learning_rate": 5.409478978411655e-07, - "loss": 0.7017, - "step": 77516 - }, - { - "epoch": 1.99, - "learning_rate": 5.409233153270344e-07, - "loss": 0.6709, - "step": 77517 - }, - { - "epoch": 1.99, - "learning_rate": 5.408987331643966e-07, - "loss": 0.5337, - "step": 77518 - }, - { - "epoch": 1.99, - "learning_rate": 5.40874151353272e-07, - "loss": 0.4304, - "step": 77519 - }, - { - "epoch": 1.99, - "learning_rate": 5.408495698936786e-07, - "loss": 0.509, - "step": 77520 - }, - { - "epoch": 1.99, - "learning_rate": 5.408249887856355e-07, - "loss": 0.6294, - "step": 77521 - }, - { - "epoch": 1.99, - "learning_rate": 5.408004080291617e-07, - "loss": 0.647, - "step": 77522 - }, - { - "epoch": 1.99, - "learning_rate": 5.407758276242762e-07, - "loss": 0.6543, - "step": 77523 - }, - { - "epoch": 1.99, - "learning_rate": 5.407512475709972e-07, - "loss": 0.3071, - "step": 77524 - }, - { - "epoch": 1.99, - "learning_rate": 5.407266678693438e-07, - "loss": 0.6348, - "step": 77525 - }, - { - "epoch": 1.99, - "learning_rate": 5.40702088519335e-07, - "loss": 0.6172, - "step": 77526 - }, - { - "epoch": 1.99, - "learning_rate": 5.406775095209898e-07, - "loss": 0.554, - "step": 77527 - }, - { - "epoch": 1.99, - "learning_rate": 5.406529308743266e-07, - "loss": 0.5251, - "step": 77528 - }, - { - "epoch": 1.99, - "learning_rate": 5.406283525793641e-07, - "loss": 0.6006, - "step": 77529 - }, - { - "epoch": 1.99, - "learning_rate": 5.406037746361214e-07, - "loss": 0.5483, - "step": 77530 - }, - { - "epoch": 1.99, - "learning_rate": 5.40579197044617e-07, - "loss": 0.6953, - "step": 77531 - }, - { - "epoch": 1.99, - "learning_rate": 5.405546198048706e-07, - "loss": 0.6719, - "step": 77532 - }, - { - "epoch": 1.99, - "learning_rate": 5.405300429169e-07, - "loss": 0.6323, - "step": 77533 - }, - { - "epoch": 1.99, - "learning_rate": 5.405054663807242e-07, - "loss": 0.6514, - "step": 77534 - }, - { - "epoch": 1.99, - "learning_rate": 5.404808901963629e-07, - "loss": 0.6118, - "step": 77535 - }, - { - "epoch": 1.99, - "learning_rate": 5.404563143638337e-07, - "loss": 0.5005, - "step": 77536 - }, - { - "epoch": 1.99, - "learning_rate": 5.404317388831566e-07, - "loss": 0.5264, - "step": 77537 - }, - { - "epoch": 1.99, - "learning_rate": 5.40407163754349e-07, - "loss": 0.5947, - "step": 77538 - }, - { - "epoch": 1.99, - "learning_rate": 5.403825889774307e-07, - "loss": 0.6934, - "step": 77539 - }, - { - "epoch": 1.99, - "learning_rate": 5.403580145524207e-07, - "loss": 0.8203, - "step": 77540 - }, - { - "epoch": 1.99, - "learning_rate": 5.403334404793371e-07, - "loss": 0.5659, - "step": 77541 - }, - { - "epoch": 1.99, - "learning_rate": 5.40308866758199e-07, - "loss": 0.4422, - "step": 77542 - }, - { - "epoch": 1.99, - "learning_rate": 5.402842933890252e-07, - "loss": 0.6235, - "step": 77543 - }, - { - "epoch": 1.99, - "learning_rate": 5.402597203718351e-07, - "loss": 0.707, - "step": 77544 - }, - { - "epoch": 1.99, - "learning_rate": 5.402351477066466e-07, - "loss": 0.5084, - "step": 77545 - }, - { - "epoch": 1.99, - "learning_rate": 5.402105753934788e-07, - "loss": 0.7314, - "step": 77546 - }, - { - "epoch": 1.99, - "learning_rate": 5.401860034323511e-07, - "loss": 0.4905, - "step": 77547 - }, - { - "epoch": 1.99, - "learning_rate": 5.401614318232814e-07, - "loss": 0.6904, - "step": 77548 - }, - { - "epoch": 1.99, - "learning_rate": 5.401368605662893e-07, - "loss": 0.7383, - "step": 77549 - }, - { - "epoch": 1.99, - "learning_rate": 5.40112289661393e-07, - "loss": 0.7559, - "step": 77550 - }, - { - "epoch": 1.99, - "learning_rate": 5.400877191086115e-07, - "loss": 0.583, - "step": 77551 - }, - { - "epoch": 1.99, - "learning_rate": 5.40063148907964e-07, - "loss": 0.7002, - "step": 77552 - }, - { - "epoch": 1.99, - "learning_rate": 5.400385790594686e-07, - "loss": 0.7432, - "step": 77553 - }, - { - "epoch": 1.99, - "learning_rate": 5.400140095631447e-07, - "loss": 0.6348, - "step": 77554 - }, - { - "epoch": 1.99, - "learning_rate": 5.399894404190107e-07, - "loss": 0.5957, - "step": 77555 - }, - { - "epoch": 1.99, - "learning_rate": 5.399648716270862e-07, - "loss": 0.5229, - "step": 77556 - }, - { - "epoch": 1.99, - "learning_rate": 5.399403031873893e-07, - "loss": 0.522, - "step": 77557 - }, - { - "epoch": 1.99, - "learning_rate": 5.399157350999386e-07, - "loss": 0.6953, - "step": 77558 - }, - { - "epoch": 1.99, - "learning_rate": 5.398911673647534e-07, - "loss": 0.5742, - "step": 77559 - }, - { - "epoch": 1.99, - "learning_rate": 5.398665999818523e-07, - "loss": 0.7056, - "step": 77560 - }, - { - "epoch": 1.99, - "learning_rate": 5.398420329512545e-07, - "loss": 0.6172, - "step": 77561 - }, - { - "epoch": 1.99, - "learning_rate": 5.398174662729782e-07, - "loss": 0.8154, - "step": 77562 - }, - { - "epoch": 1.99, - "learning_rate": 5.397928999470424e-07, - "loss": 0.6025, - "step": 77563 - }, - { - "epoch": 1.99, - "learning_rate": 5.397683339734661e-07, - "loss": 0.668, - "step": 77564 - }, - { - "epoch": 1.99, - "learning_rate": 5.397437683522685e-07, - "loss": 0.5317, - "step": 77565 - }, - { - "epoch": 1.99, - "learning_rate": 5.397192030834675e-07, - "loss": 0.4374, - "step": 77566 - }, - { - "epoch": 1.99, - "learning_rate": 5.396946381670826e-07, - "loss": 0.5771, - "step": 77567 - }, - { - "epoch": 1.99, - "learning_rate": 5.39670073603132e-07, - "loss": 0.6602, - "step": 77568 - }, - { - "epoch": 1.99, - "learning_rate": 5.396455093916349e-07, - "loss": 0.625, - "step": 77569 - }, - { - "epoch": 1.99, - "learning_rate": 5.396209455326103e-07, - "loss": 0.4783, - "step": 77570 - }, - { - "epoch": 1.99, - "learning_rate": 5.395963820260767e-07, - "loss": 0.5957, - "step": 77571 - }, - { - "epoch": 1.99, - "learning_rate": 5.395718188720529e-07, - "loss": 0.6411, - "step": 77572 - }, - { - "epoch": 1.99, - "learning_rate": 5.395472560705579e-07, - "loss": 0.6475, - "step": 77573 - }, - { - "epoch": 1.99, - "learning_rate": 5.395226936216102e-07, - "loss": 0.6377, - "step": 77574 - }, - { - "epoch": 1.99, - "learning_rate": 5.394981315252288e-07, - "loss": 0.4078, - "step": 77575 - }, - { - "epoch": 1.99, - "learning_rate": 5.394735697814325e-07, - "loss": 0.5981, - "step": 77576 - }, - { - "epoch": 1.99, - "learning_rate": 5.394490083902406e-07, - "loss": 0.6641, - "step": 77577 - }, - { - "epoch": 1.99, - "learning_rate": 5.394244473516713e-07, - "loss": 0.624, - "step": 77578 - }, - { - "epoch": 1.99, - "learning_rate": 5.393998866657432e-07, - "loss": 0.6099, - "step": 77579 - }, - { - "epoch": 1.99, - "learning_rate": 5.393753263324753e-07, - "loss": 0.6787, - "step": 77580 - }, - { - "epoch": 1.99, - "learning_rate": 5.393507663518866e-07, - "loss": 0.5869, - "step": 77581 - }, - { - "epoch": 1.99, - "learning_rate": 5.393262067239963e-07, - "loss": 0.6104, - "step": 77582 - }, - { - "epoch": 1.99, - "learning_rate": 5.393016474488222e-07, - "loss": 0.5713, - "step": 77583 - }, - { - "epoch": 1.99, - "learning_rate": 5.392770885263837e-07, - "loss": 0.6318, - "step": 77584 - }, - { - "epoch": 1.99, - "learning_rate": 5.392525299566997e-07, - "loss": 0.5752, - "step": 77585 - }, - { - "epoch": 1.99, - "learning_rate": 5.392279717397891e-07, - "loss": 0.6777, - "step": 77586 - }, - { - "epoch": 1.99, - "learning_rate": 5.392034138756704e-07, - "loss": 0.7695, - "step": 77587 - }, - { - "epoch": 1.99, - "learning_rate": 5.391788563643623e-07, - "loss": 0.7275, - "step": 77588 - }, - { - "epoch": 1.99, - "learning_rate": 5.391542992058835e-07, - "loss": 0.6626, - "step": 77589 - }, - { - "epoch": 1.99, - "learning_rate": 5.391297424002536e-07, - "loss": 0.6157, - "step": 77590 - }, - { - "epoch": 1.99, - "learning_rate": 5.391051859474904e-07, - "loss": 0.5293, - "step": 77591 - }, - { - "epoch": 1.99, - "learning_rate": 5.390806298476133e-07, - "loss": 0.6689, - "step": 77592 - }, - { - "epoch": 1.99, - "learning_rate": 5.390560741006408e-07, - "loss": 0.563, - "step": 77593 - }, - { - "epoch": 1.99, - "learning_rate": 5.390315187065924e-07, - "loss": 0.52, - "step": 77594 - }, - { - "epoch": 1.99, - "learning_rate": 5.390069636654859e-07, - "loss": 0.6836, - "step": 77595 - }, - { - "epoch": 1.99, - "learning_rate": 5.389824089773405e-07, - "loss": 0.584, - "step": 77596 - }, - { - "epoch": 1.99, - "learning_rate": 5.389578546421755e-07, - "loss": 0.6167, - "step": 77597 - }, - { - "epoch": 1.99, - "learning_rate": 5.38933300660009e-07, - "loss": 0.6494, - "step": 77598 - }, - { - "epoch": 1.99, - "learning_rate": 5.389087470308604e-07, - "loss": 0.6812, - "step": 77599 - }, - { - "epoch": 1.99, - "learning_rate": 5.388841937547478e-07, - "loss": 0.5444, - "step": 77600 - }, - { - "epoch": 1.99, - "learning_rate": 5.388596408316903e-07, - "loss": 0.791, - "step": 77601 - }, - { - "epoch": 1.99, - "learning_rate": 5.388350882617068e-07, - "loss": 0.6553, - "step": 77602 - }, - { - "epoch": 1.99, - "learning_rate": 5.388105360448165e-07, - "loss": 0.5908, - "step": 77603 - }, - { - "epoch": 1.99, - "learning_rate": 5.387859841810374e-07, - "loss": 0.626, - "step": 77604 - }, - { - "epoch": 1.99, - "learning_rate": 5.387614326703886e-07, - "loss": 0.7793, - "step": 77605 - }, - { - "epoch": 1.99, - "learning_rate": 5.38736881512889e-07, - "loss": 0.4219, - "step": 77606 - }, - { - "epoch": 1.99, - "learning_rate": 5.387123307085581e-07, - "loss": 0.549, - "step": 77607 - }, - { - "epoch": 1.99, - "learning_rate": 5.386877802574132e-07, - "loss": 0.5474, - "step": 77608 - }, - { - "epoch": 1.99, - "learning_rate": 5.386632301594738e-07, - "loss": 0.6875, - "step": 77609 - }, - { - "epoch": 1.99, - "learning_rate": 5.386386804147587e-07, - "loss": 0.6396, - "step": 77610 - }, - { - "epoch": 1.99, - "learning_rate": 5.386141310232872e-07, - "loss": 0.6865, - "step": 77611 - }, - { - "epoch": 1.99, - "learning_rate": 5.385895819850774e-07, - "loss": 0.8105, - "step": 77612 - }, - { - "epoch": 1.99, - "learning_rate": 5.385650333001483e-07, - "loss": 0.543, - "step": 77613 - }, - { - "epoch": 1.99, - "learning_rate": 5.385404849685186e-07, - "loss": 0.6567, - "step": 77614 - }, - { - "epoch": 1.99, - "learning_rate": 5.385159369902077e-07, - "loss": 0.6426, - "step": 77615 - }, - { - "epoch": 1.99, - "learning_rate": 5.384913893652334e-07, - "loss": 0.4976, - "step": 77616 - }, - { - "epoch": 1.99, - "learning_rate": 5.384668420936156e-07, - "loss": 0.7783, - "step": 77617 - }, - { - "epoch": 1.99, - "learning_rate": 5.384422951753721e-07, - "loss": 0.6113, - "step": 77618 - }, - { - "epoch": 1.99, - "learning_rate": 5.384177486105221e-07, - "loss": 0.7949, - "step": 77619 - }, - { - "epoch": 1.99, - "learning_rate": 5.383932023990847e-07, - "loss": 0.6143, - "step": 77620 - }, - { - "epoch": 1.99, - "learning_rate": 5.383686565410781e-07, - "loss": 0.4849, - "step": 77621 - }, - { - "epoch": 1.99, - "learning_rate": 5.383441110365214e-07, - "loss": 0.6514, - "step": 77622 - }, - { - "epoch": 1.99, - "learning_rate": 5.383195658854333e-07, - "loss": 0.6641, - "step": 77623 - }, - { - "epoch": 1.99, - "learning_rate": 5.382950210878332e-07, - "loss": 0.5542, - "step": 77624 - }, - { - "epoch": 1.99, - "learning_rate": 5.382704766437389e-07, - "loss": 0.6284, - "step": 77625 - }, - { - "epoch": 1.99, - "learning_rate": 5.382459325531696e-07, - "loss": 0.6299, - "step": 77626 - }, - { - "epoch": 1.99, - "learning_rate": 5.382213888161447e-07, - "loss": 0.5728, - "step": 77627 - }, - { - "epoch": 1.99, - "learning_rate": 5.381968454326824e-07, - "loss": 0.5239, - "step": 77628 - }, - { - "epoch": 1.99, - "learning_rate": 5.381723024028011e-07, - "loss": 0.592, - "step": 77629 - }, - { - "epoch": 1.99, - "learning_rate": 5.381477597265201e-07, - "loss": 0.7051, - "step": 77630 - }, - { - "epoch": 1.99, - "learning_rate": 5.381232174038581e-07, - "loss": 0.5601, - "step": 77631 - }, - { - "epoch": 1.99, - "learning_rate": 5.380986754348343e-07, - "loss": 0.5276, - "step": 77632 - }, - { - "epoch": 1.99, - "learning_rate": 5.380741338194666e-07, - "loss": 0.8984, - "step": 77633 - }, - { - "epoch": 1.99, - "learning_rate": 5.380495925577745e-07, - "loss": 0.7607, - "step": 77634 - }, - { - "epoch": 1.99, - "learning_rate": 5.380250516497764e-07, - "loss": 0.5259, - "step": 77635 - }, - { - "epoch": 1.99, - "learning_rate": 5.380005110954919e-07, - "loss": 0.5864, - "step": 77636 - }, - { - "epoch": 1.99, - "learning_rate": 5.37975970894939e-07, - "loss": 0.6431, - "step": 77637 - }, - { - "epoch": 1.99, - "learning_rate": 5.379514310481362e-07, - "loss": 0.6943, - "step": 77638 - }, - { - "epoch": 1.99, - "learning_rate": 5.379268915551028e-07, - "loss": 0.6719, - "step": 77639 - }, - { - "epoch": 1.99, - "learning_rate": 5.379023524158575e-07, - "loss": 0.5046, - "step": 77640 - }, - { - "epoch": 1.99, - "learning_rate": 5.378778136304196e-07, - "loss": 0.4834, - "step": 77641 - }, - { - "epoch": 1.99, - "learning_rate": 5.37853275198807e-07, - "loss": 0.8223, - "step": 77642 - }, - { - "epoch": 1.99, - "learning_rate": 5.378287371210389e-07, - "loss": 0.606, - "step": 77643 - }, - { - "epoch": 1.99, - "learning_rate": 5.378041993971345e-07, - "loss": 0.624, - "step": 77644 - }, - { - "epoch": 1.99, - "learning_rate": 5.377796620271118e-07, - "loss": 0.5122, - "step": 77645 - }, - { - "epoch": 1.99, - "learning_rate": 5.377551250109898e-07, - "loss": 0.6201, - "step": 77646 - }, - { - "epoch": 1.99, - "learning_rate": 5.377305883487879e-07, - "loss": 0.5781, - "step": 77647 - }, - { - "epoch": 1.99, - "learning_rate": 5.377060520405241e-07, - "loss": 0.7705, - "step": 77648 - }, - { - "epoch": 1.99, - "learning_rate": 5.376815160862179e-07, - "loss": 0.6143, - "step": 77649 - }, - { - "epoch": 1.99, - "learning_rate": 5.376569804858874e-07, - "loss": 0.438, - "step": 77650 - }, - { - "epoch": 1.99, - "learning_rate": 5.376324452395515e-07, - "loss": 0.624, - "step": 77651 - }, - { - "epoch": 1.99, - "learning_rate": 5.376079103472293e-07, - "loss": 0.6738, - "step": 77652 - }, - { - "epoch": 1.99, - "learning_rate": 5.375833758089399e-07, - "loss": 0.5078, - "step": 77653 - }, - { - "epoch": 1.99, - "learning_rate": 5.375588416247011e-07, - "loss": 0.7031, - "step": 77654 - }, - { - "epoch": 1.99, - "learning_rate": 5.375343077945323e-07, - "loss": 0.6396, - "step": 77655 - }, - { - "epoch": 1.99, - "learning_rate": 5.375097743184522e-07, - "loss": 0.6387, - "step": 77656 - }, - { - "epoch": 1.99, - "learning_rate": 5.374852411964801e-07, - "loss": 0.7529, - "step": 77657 - }, - { - "epoch": 1.99, - "learning_rate": 5.374607084286343e-07, - "loss": 0.707, - "step": 77658 - }, - { - "epoch": 1.99, - "learning_rate": 5.37436176014933e-07, - "loss": 0.7393, - "step": 77659 - }, - { - "epoch": 1.99, - "learning_rate": 5.374116439553956e-07, - "loss": 0.6846, - "step": 77660 - }, - { - "epoch": 1.99, - "learning_rate": 5.373871122500413e-07, - "loss": 0.7246, - "step": 77661 - }, - { - "epoch": 1.99, - "learning_rate": 5.37362580898888e-07, - "loss": 0.7109, - "step": 77662 - }, - { - "epoch": 1.99, - "learning_rate": 5.373380499019549e-07, - "loss": 0.6597, - "step": 77663 - }, - { - "epoch": 1.99, - "learning_rate": 5.373135192592606e-07, - "loss": 0.6025, - "step": 77664 - }, - { - "epoch": 1.99, - "learning_rate": 5.372889889708248e-07, - "loss": 0.5171, - "step": 77665 - }, - { - "epoch": 1.99, - "learning_rate": 5.372644590366648e-07, - "loss": 0.7004, - "step": 77666 - }, - { - "epoch": 1.99, - "learning_rate": 5.372399294568008e-07, - "loss": 0.449, - "step": 77667 - }, - { - "epoch": 1.99, - "learning_rate": 5.372154002312503e-07, - "loss": 0.6245, - "step": 77668 - }, - { - "epoch": 1.99, - "learning_rate": 5.371908713600328e-07, - "loss": 0.4824, - "step": 77669 - }, - { - "epoch": 1.99, - "learning_rate": 5.371663428431674e-07, - "loss": 0.4662, - "step": 77670 - }, - { - "epoch": 1.99, - "learning_rate": 5.371418146806719e-07, - "loss": 0.6396, - "step": 77671 - }, - { - "epoch": 1.99, - "learning_rate": 5.371172868725658e-07, - "loss": 0.6299, - "step": 77672 - }, - { - "epoch": 1.99, - "learning_rate": 5.370927594188676e-07, - "loss": 0.5469, - "step": 77673 - }, - { - "epoch": 1.99, - "learning_rate": 5.370682323195967e-07, - "loss": 0.6699, - "step": 77674 - }, - { - "epoch": 1.99, - "learning_rate": 5.37043705574771e-07, - "loss": 0.7949, - "step": 77675 - }, - { - "epoch": 1.99, - "learning_rate": 5.370191791844095e-07, - "loss": 0.5325, - "step": 77676 - }, - { - "epoch": 1.99, - "learning_rate": 5.369946531485316e-07, - "loss": 0.7412, - "step": 77677 - }, - { - "epoch": 1.99, - "learning_rate": 5.369701274671556e-07, - "loss": 0.6543, - "step": 77678 - }, - { - "epoch": 1.99, - "learning_rate": 5.369456021402998e-07, - "loss": 0.533, - "step": 77679 - }, - { - "epoch": 1.99, - "learning_rate": 5.369210771679835e-07, - "loss": 0.5176, - "step": 77680 - }, - { - "epoch": 1.99, - "learning_rate": 5.368965525502255e-07, - "loss": 0.4816, - "step": 77681 - }, - { - "epoch": 1.99, - "learning_rate": 5.368720282870449e-07, - "loss": 0.8022, - "step": 77682 - }, - { - "epoch": 1.99, - "learning_rate": 5.368475043784598e-07, - "loss": 0.7085, - "step": 77683 - }, - { - "epoch": 1.99, - "learning_rate": 5.368229808244891e-07, - "loss": 0.647, - "step": 77684 - }, - { - "epoch": 1.99, - "learning_rate": 5.367984576251516e-07, - "loss": 0.4319, - "step": 77685 - }, - { - "epoch": 1.99, - "learning_rate": 5.367739347804669e-07, - "loss": 0.6074, - "step": 77686 - }, - { - "epoch": 1.99, - "learning_rate": 5.36749412290453e-07, - "loss": 0.5918, - "step": 77687 - }, - { - "epoch": 1.99, - "learning_rate": 5.367248901551284e-07, - "loss": 0.7114, - "step": 77688 - }, - { - "epoch": 1.99, - "learning_rate": 5.367003683745122e-07, - "loss": 0.6924, - "step": 77689 - }, - { - "epoch": 1.99, - "learning_rate": 5.366758469486233e-07, - "loss": 0.7559, - "step": 77690 - }, - { - "epoch": 1.99, - "learning_rate": 5.366513258774807e-07, - "loss": 0.8516, - "step": 77691 - }, - { - "epoch": 1.99, - "learning_rate": 5.366268051611026e-07, - "loss": 0.6475, - "step": 77692 - }, - { - "epoch": 1.99, - "learning_rate": 5.366022847995079e-07, - "loss": 0.582, - "step": 77693 - }, - { - "epoch": 1.99, - "learning_rate": 5.365777647927157e-07, - "loss": 0.707, - "step": 77694 - }, - { - "epoch": 1.99, - "learning_rate": 5.365532451407449e-07, - "loss": 0.6616, - "step": 77695 - }, - { - "epoch": 1.99, - "learning_rate": 5.365287258436136e-07, - "loss": 0.7437, - "step": 77696 - }, - { - "epoch": 1.99, - "learning_rate": 5.365042069013413e-07, - "loss": 0.5894, - "step": 77697 - }, - { - "epoch": 1.99, - "learning_rate": 5.36479688313946e-07, - "loss": 0.6455, - "step": 77698 - }, - { - "epoch": 1.99, - "learning_rate": 5.364551700814473e-07, - "loss": 0.6426, - "step": 77699 - }, - { - "epoch": 1.99, - "learning_rate": 5.364306522038632e-07, - "loss": 0.6035, - "step": 77700 - }, - { - "epoch": 1.99, - "learning_rate": 5.364061346812128e-07, - "loss": 0.5637, - "step": 77701 - }, - { - "epoch": 1.99, - "learning_rate": 5.36381617513515e-07, - "loss": 0.5757, - "step": 77702 - }, - { - "epoch": 1.99, - "learning_rate": 5.363571007007888e-07, - "loss": 0.5801, - "step": 77703 - }, - { - "epoch": 1.99, - "learning_rate": 5.363325842430522e-07, - "loss": 0.6826, - "step": 77704 - }, - { - "epoch": 1.99, - "learning_rate": 5.363080681403245e-07, - "loss": 0.4089, - "step": 77705 - }, - { - "epoch": 1.99, - "learning_rate": 5.362835523926243e-07, - "loss": 0.5908, - "step": 77706 - }, - { - "epoch": 1.99, - "learning_rate": 5.362590369999709e-07, - "loss": 0.7139, - "step": 77707 - }, - { - "epoch": 1.99, - "learning_rate": 5.362345219623828e-07, - "loss": 0.5435, - "step": 77708 - }, - { - "epoch": 1.99, - "learning_rate": 5.362100072798778e-07, - "loss": 0.5439, - "step": 77709 - }, - { - "epoch": 1.99, - "learning_rate": 5.361854929524759e-07, - "loss": 0.479, - "step": 77710 - }, - { - "epoch": 1.99, - "learning_rate": 5.361609789801953e-07, - "loss": 0.6973, - "step": 77711 - }, - { - "epoch": 1.99, - "learning_rate": 5.361364653630552e-07, - "loss": 0.7241, - "step": 77712 - }, - { - "epoch": 1.99, - "learning_rate": 5.361119521010738e-07, - "loss": 0.6157, - "step": 77713 - }, - { - "epoch": 1.99, - "learning_rate": 5.3608743919427e-07, - "loss": 0.4366, - "step": 77714 - }, - { - "epoch": 1.99, - "learning_rate": 5.360629266426633e-07, - "loss": 0.6479, - "step": 77715 - }, - { - "epoch": 1.99, - "learning_rate": 5.360384144462714e-07, - "loss": 0.5645, - "step": 77716 - }, - { - "epoch": 1.99, - "learning_rate": 5.36013902605114e-07, - "loss": 0.5439, - "step": 77717 - }, - { - "epoch": 1.99, - "learning_rate": 5.359893911192091e-07, - "loss": 0.6641, - "step": 77718 - }, - { - "epoch": 1.99, - "learning_rate": 5.359648799885755e-07, - "loss": 0.688, - "step": 77719 - }, - { - "epoch": 1.99, - "learning_rate": 5.35940369213233e-07, - "loss": 0.6914, - "step": 77720 - }, - { - "epoch": 1.99, - "learning_rate": 5.359158587931989e-07, - "loss": 0.6855, - "step": 77721 - }, - { - "epoch": 1.99, - "learning_rate": 5.358913487284929e-07, - "loss": 0.7686, - "step": 77722 - }, - { - "epoch": 1.99, - "learning_rate": 5.358668390191334e-07, - "loss": 0.5527, - "step": 77723 - }, - { - "epoch": 1.99, - "learning_rate": 5.358423296651398e-07, - "loss": 0.5925, - "step": 77724 - }, - { - "epoch": 1.99, - "learning_rate": 5.3581782066653e-07, - "loss": 0.6768, - "step": 77725 - }, - { - "epoch": 1.99, - "learning_rate": 5.357933120233236e-07, - "loss": 0.6211, - "step": 77726 - }, - { - "epoch": 1.99, - "learning_rate": 5.357688037355385e-07, - "loss": 0.564, - "step": 77727 - }, - { - "epoch": 1.99, - "learning_rate": 5.357442958031938e-07, - "loss": 0.562, - "step": 77728 - }, - { - "epoch": 1.99, - "learning_rate": 5.357197882263087e-07, - "loss": 0.6665, - "step": 77729 - }, - { - "epoch": 1.99, - "learning_rate": 5.356952810049014e-07, - "loss": 0.7324, - "step": 77730 - }, - { - "epoch": 1.99, - "learning_rate": 5.356707741389908e-07, - "loss": 0.6885, - "step": 77731 - }, - { - "epoch": 1.99, - "learning_rate": 5.356462676285957e-07, - "loss": 0.5381, - "step": 77732 - }, - { - "epoch": 1.99, - "learning_rate": 5.356217614737353e-07, - "loss": 0.5681, - "step": 77733 - }, - { - "epoch": 1.99, - "learning_rate": 5.355972556744274e-07, - "loss": 0.5967, - "step": 77734 - }, - { - "epoch": 1.99, - "learning_rate": 5.355727502306917e-07, - "loss": 0.6846, - "step": 77735 - }, - { - "epoch": 1.99, - "learning_rate": 5.355482451425467e-07, - "loss": 0.7793, - "step": 77736 - }, - { - "epoch": 1.99, - "learning_rate": 5.355237404100111e-07, - "loss": 0.5879, - "step": 77737 - }, - { - "epoch": 1.99, - "learning_rate": 5.354992360331033e-07, - "loss": 0.4175, - "step": 77738 - }, - { - "epoch": 1.99, - "learning_rate": 5.354747320118424e-07, - "loss": 0.5781, - "step": 77739 - }, - { - "epoch": 1.99, - "learning_rate": 5.35450228346247e-07, - "loss": 0.6157, - "step": 77740 - }, - { - "epoch": 1.99, - "learning_rate": 5.354257250363366e-07, - "loss": 0.6841, - "step": 77741 - }, - { - "epoch": 1.99, - "learning_rate": 5.354012220821287e-07, - "loss": 0.7021, - "step": 77742 - }, - { - "epoch": 1.99, - "learning_rate": 5.353767194836429e-07, - "loss": 0.6846, - "step": 77743 - }, - { - "epoch": 1.99, - "learning_rate": 5.353522172408977e-07, - "loss": 0.6621, - "step": 77744 - }, - { - "epoch": 1.99, - "learning_rate": 5.353277153539124e-07, - "loss": 0.6533, - "step": 77745 - }, - { - "epoch": 1.99, - "learning_rate": 5.353032138227054e-07, - "loss": 0.3726, - "step": 77746 - }, - { - "epoch": 1.99, - "learning_rate": 5.352787126472947e-07, - "loss": 0.4663, - "step": 77747 - }, - { - "epoch": 1.99, - "learning_rate": 5.352542118277e-07, - "loss": 0.6626, - "step": 77748 - }, - { - "epoch": 1.99, - "learning_rate": 5.352297113639395e-07, - "loss": 0.4814, - "step": 77749 - }, - { - "epoch": 1.99, - "learning_rate": 5.352052112560328e-07, - "loss": 0.5896, - "step": 77750 - }, - { - "epoch": 1.99, - "learning_rate": 5.351807115039977e-07, - "loss": 0.4675, - "step": 77751 - }, - { - "epoch": 1.99, - "learning_rate": 5.351562121078534e-07, - "loss": 0.562, - "step": 77752 - }, - { - "epoch": 1.99, - "learning_rate": 5.35131713067619e-07, - "loss": 0.6699, - "step": 77753 - }, - { - "epoch": 1.99, - "learning_rate": 5.351072143833125e-07, - "loss": 0.6631, - "step": 77754 - }, - { - "epoch": 1.99, - "learning_rate": 5.350827160549528e-07, - "loss": 0.6797, - "step": 77755 - }, - { - "epoch": 1.99, - "learning_rate": 5.350582180825595e-07, - "loss": 0.6069, - "step": 77756 - }, - { - "epoch": 1.99, - "learning_rate": 5.350337204661503e-07, - "loss": 0.4756, - "step": 77757 - }, - { - "epoch": 1.99, - "learning_rate": 5.350092232057447e-07, - "loss": 0.6929, - "step": 77758 - }, - { - "epoch": 1.99, - "learning_rate": 5.349847263013609e-07, - "loss": 0.6223, - "step": 77759 - }, - { - "epoch": 1.99, - "learning_rate": 5.349602297530178e-07, - "loss": 0.5869, - "step": 77760 - }, - { - "epoch": 1.99, - "learning_rate": 5.349357335607343e-07, - "loss": 0.7295, - "step": 77761 - }, - { - "epoch": 1.99, - "learning_rate": 5.349112377245296e-07, - "loss": 0.6826, - "step": 77762 - }, - { - "epoch": 1.99, - "learning_rate": 5.348867422444216e-07, - "loss": 0.6094, - "step": 77763 - }, - { - "epoch": 1.99, - "learning_rate": 5.348622471204294e-07, - "loss": 0.5029, - "step": 77764 - }, - { - "epoch": 1.99, - "learning_rate": 5.348377523525716e-07, - "loss": 0.5737, - "step": 77765 - }, - { - "epoch": 1.99, - "learning_rate": 5.348132579408678e-07, - "loss": 0.792, - "step": 77766 - }, - { - "epoch": 1.99, - "learning_rate": 5.347887638853359e-07, - "loss": 0.7168, - "step": 77767 - }, - { - "epoch": 1.99, - "learning_rate": 5.347642701859946e-07, - "loss": 0.6973, - "step": 77768 - }, - { - "epoch": 1.99, - "learning_rate": 5.347397768428629e-07, - "loss": 0.7832, - "step": 77769 - }, - { - "epoch": 1.99, - "learning_rate": 5.347152838559598e-07, - "loss": 0.6333, - "step": 77770 - }, - { - "epoch": 1.99, - "learning_rate": 5.346907912253036e-07, - "loss": 0.6396, - "step": 77771 - }, - { - "epoch": 1.99, - "learning_rate": 5.346662989509131e-07, - "loss": 0.7285, - "step": 77772 - }, - { - "epoch": 1.99, - "learning_rate": 5.346418070328074e-07, - "loss": 0.5414, - "step": 77773 - }, - { - "epoch": 1.99, - "learning_rate": 5.346173154710054e-07, - "loss": 0.7764, - "step": 77774 - }, - { - "epoch": 1.99, - "learning_rate": 5.345928242655251e-07, - "loss": 0.8076, - "step": 77775 - }, - { - "epoch": 1.99, - "learning_rate": 5.345683334163861e-07, - "loss": 0.5205, - "step": 77776 - }, - { - "epoch": 1.99, - "learning_rate": 5.345438429236062e-07, - "loss": 0.5845, - "step": 77777 - }, - { - "epoch": 1.99, - "learning_rate": 5.345193527872049e-07, - "loss": 0.5256, - "step": 77778 - }, - { - "epoch": 1.99, - "learning_rate": 5.344948630072011e-07, - "loss": 0.6208, - "step": 77779 - }, - { - "epoch": 1.99, - "learning_rate": 5.344703735836126e-07, - "loss": 0.5669, - "step": 77780 - }, - { - "epoch": 1.99, - "learning_rate": 5.344458845164588e-07, - "loss": 0.7134, - "step": 77781 - }, - { - "epoch": 1.99, - "learning_rate": 5.344213958057584e-07, - "loss": 0.6543, - "step": 77782 - }, - { - "epoch": 1.99, - "learning_rate": 5.343969074515305e-07, - "loss": 0.6895, - "step": 77783 - }, - { - "epoch": 1.99, - "learning_rate": 5.343724194537931e-07, - "loss": 0.9097, - "step": 77784 - }, - { - "epoch": 1.99, - "learning_rate": 5.343479318125654e-07, - "loss": 0.5679, - "step": 77785 - }, - { - "epoch": 1.99, - "learning_rate": 5.343234445278664e-07, - "loss": 0.5845, - "step": 77786 - }, - { - "epoch": 1.99, - "learning_rate": 5.342989575997145e-07, - "loss": 0.5967, - "step": 77787 - }, - { - "epoch": 1.99, - "learning_rate": 5.342744710281282e-07, - "loss": 0.7021, - "step": 77788 - }, - { - "epoch": 1.99, - "learning_rate": 5.342499848131264e-07, - "loss": 0.6479, - "step": 77789 - }, - { - "epoch": 1.99, - "learning_rate": 5.342254989547281e-07, - "loss": 0.4297, - "step": 77790 - }, - { - "epoch": 1.99, - "learning_rate": 5.342010134529521e-07, - "loss": 0.4536, - "step": 77791 - }, - { - "epoch": 1.99, - "learning_rate": 5.341765283078167e-07, - "loss": 0.6719, - "step": 77792 - }, - { - "epoch": 1.99, - "learning_rate": 5.34152043519341e-07, - "loss": 0.5107, - "step": 77793 - }, - { - "epoch": 1.99, - "learning_rate": 5.341275590875435e-07, - "loss": 0.6548, - "step": 77794 - }, - { - "epoch": 1.99, - "learning_rate": 5.341030750124436e-07, - "loss": 0.6826, - "step": 77795 - }, - { - "epoch": 1.99, - "learning_rate": 5.340785912940595e-07, - "loss": 0.4045, - "step": 77796 - }, - { - "epoch": 1.99, - "learning_rate": 5.340541079324097e-07, - "loss": 0.6836, - "step": 77797 - }, - { - "epoch": 1.99, - "learning_rate": 5.340296249275131e-07, - "loss": 0.5835, - "step": 77798 - }, - { - "epoch": 1.99, - "learning_rate": 5.340051422793886e-07, - "loss": 0.668, - "step": 77799 - }, - { - "epoch": 1.99, - "learning_rate": 5.339806599880554e-07, - "loss": 0.7578, - "step": 77800 - }, - { - "epoch": 1.99, - "learning_rate": 5.339561780535314e-07, - "loss": 0.4971, - "step": 77801 - }, - { - "epoch": 1.99, - "learning_rate": 5.339316964758357e-07, - "loss": 0.3479, - "step": 77802 - }, - { - "epoch": 1.99, - "learning_rate": 5.339072152549871e-07, - "loss": 0.5264, - "step": 77803 - }, - { - "epoch": 1.99, - "learning_rate": 5.338827343910046e-07, - "loss": 0.7139, - "step": 77804 - }, - { - "epoch": 1.99, - "learning_rate": 5.338582538839065e-07, - "loss": 0.666, - "step": 77805 - }, - { - "epoch": 1.99, - "learning_rate": 5.338337737337119e-07, - "loss": 0.6143, - "step": 77806 - }, - { - "epoch": 1.99, - "learning_rate": 5.33809293940439e-07, - "loss": 0.6807, - "step": 77807 - }, - { - "epoch": 1.99, - "learning_rate": 5.337848145041073e-07, - "loss": 0.6523, - "step": 77808 - }, - { - "epoch": 1.99, - "learning_rate": 5.337603354247346e-07, - "loss": 0.6963, - "step": 77809 - }, - { - "epoch": 1.99, - "learning_rate": 5.337358567023403e-07, - "loss": 0.8076, - "step": 77810 - }, - { - "epoch": 1.99, - "learning_rate": 5.33711378336943e-07, - "loss": 0.5547, - "step": 77811 - }, - { - "epoch": 1.99, - "learning_rate": 5.336869003285617e-07, - "loss": 0.668, - "step": 77812 - }, - { - "epoch": 1.99, - "learning_rate": 5.336624226772148e-07, - "loss": 0.5579, - "step": 77813 - }, - { - "epoch": 1.99, - "learning_rate": 5.336379453829209e-07, - "loss": 0.6924, - "step": 77814 - }, - { - "epoch": 1.99, - "learning_rate": 5.336134684456992e-07, - "loss": 0.584, - "step": 77815 - }, - { - "epoch": 1.99, - "learning_rate": 5.335889918655685e-07, - "loss": 0.7041, - "step": 77816 - }, - { - "epoch": 1.99, - "learning_rate": 5.335645156425472e-07, - "loss": 0.6279, - "step": 77817 - }, - { - "epoch": 1.99, - "learning_rate": 5.335400397766539e-07, - "loss": 0.6885, - "step": 77818 - }, - { - "epoch": 1.99, - "learning_rate": 5.335155642679072e-07, - "loss": 0.6387, - "step": 77819 - }, - { - "epoch": 1.99, - "learning_rate": 5.334910891163265e-07, - "loss": 0.5029, - "step": 77820 - }, - { - "epoch": 1.99, - "learning_rate": 5.334666143219304e-07, - "loss": 0.6943, - "step": 77821 - }, - { - "epoch": 1.99, - "learning_rate": 5.334421398847373e-07, - "loss": 0.6357, - "step": 77822 - }, - { - "epoch": 1.99, - "learning_rate": 5.33417665804766e-07, - "loss": 0.5591, - "step": 77823 - }, - { - "epoch": 1.99, - "learning_rate": 5.333931920820356e-07, - "loss": 0.5303, - "step": 77824 - }, - { - "epoch": 1.99, - "learning_rate": 5.333687187165643e-07, - "loss": 0.5498, - "step": 77825 - }, - { - "epoch": 1.99, - "learning_rate": 5.333442457083715e-07, - "loss": 0.6753, - "step": 77826 - }, - { - "epoch": 1.99, - "learning_rate": 5.333197730574752e-07, - "loss": 0.5693, - "step": 77827 - }, - { - "epoch": 1.99, - "learning_rate": 5.332953007638944e-07, - "loss": 0.6855, - "step": 77828 - }, - { - "epoch": 1.99, - "learning_rate": 5.332708288276484e-07, - "loss": 0.4822, - "step": 77829 - }, - { - "epoch": 1.99, - "learning_rate": 5.332463572487551e-07, - "loss": 0.4009, - "step": 77830 - }, - { - "epoch": 1.99, - "learning_rate": 5.332218860272335e-07, - "loss": 0.6382, - "step": 77831 - }, - { - "epoch": 1.99, - "learning_rate": 5.331974151631024e-07, - "loss": 0.6963, - "step": 77832 - }, - { - "epoch": 1.99, - "learning_rate": 5.331729446563811e-07, - "loss": 0.6895, - "step": 77833 - }, - { - "epoch": 1.99, - "learning_rate": 5.331484745070873e-07, - "loss": 0.6616, - "step": 77834 - }, - { - "epoch": 1.99, - "learning_rate": 5.331240047152404e-07, - "loss": 0.666, - "step": 77835 - }, - { - "epoch": 1.99, - "learning_rate": 5.330995352808594e-07, - "loss": 0.5493, - "step": 77836 - }, - { - "epoch": 2.0, - "learning_rate": 5.33075066203962e-07, - "loss": 0.5923, - "step": 77837 - }, - { - "epoch": 2.0, - "learning_rate": 5.33050597484568e-07, - "loss": 0.6025, - "step": 77838 - }, - { - "epoch": 2.0, - "learning_rate": 5.330261291226954e-07, - "loss": 0.626, - "step": 77839 - }, - { - "epoch": 2.0, - "learning_rate": 5.330016611183632e-07, - "loss": 0.5688, - "step": 77840 - }, - { - "epoch": 2.0, - "learning_rate": 5.329771934715906e-07, - "loss": 0.7881, - "step": 77841 - }, - { - "epoch": 2.0, - "learning_rate": 5.329527261823954e-07, - "loss": 0.6357, - "step": 77842 - }, - { - "epoch": 2.0, - "learning_rate": 5.329282592507969e-07, - "loss": 0.7026, - "step": 77843 - }, - { - "epoch": 2.0, - "learning_rate": 5.329037926768136e-07, - "loss": 0.4946, - "step": 77844 - }, - { - "epoch": 2.0, - "learning_rate": 5.32879326460465e-07, - "loss": 0.5747, - "step": 77845 - }, - { - "epoch": 2.0, - "learning_rate": 5.32854860601769e-07, - "loss": 0.5571, - "step": 77846 - }, - { - "epoch": 2.0, - "learning_rate": 5.328303951007442e-07, - "loss": 0.7549, - "step": 77847 - }, - { - "epoch": 2.0, - "learning_rate": 5.328059299574098e-07, - "loss": 0.5144, - "step": 77848 - }, - { - "epoch": 2.0, - "learning_rate": 5.327814651717843e-07, - "loss": 0.792, - "step": 77849 - }, - { - "epoch": 2.0, - "learning_rate": 5.327570007438871e-07, - "loss": 0.6138, - "step": 77850 - }, - { - "epoch": 2.0, - "learning_rate": 5.327325366737359e-07, - "loss": 0.5035, - "step": 77851 - }, - { - "epoch": 2.0, - "learning_rate": 5.327080729613497e-07, - "loss": 0.8301, - "step": 77852 - }, - { - "epoch": 2.0, - "learning_rate": 5.326836096067477e-07, - "loss": 0.7725, - "step": 77853 - }, - { - "epoch": 2.0, - "learning_rate": 5.326591466099488e-07, - "loss": 0.6504, - "step": 77854 - }, - { - "epoch": 2.0, - "learning_rate": 5.326346839709708e-07, - "loss": 0.5898, - "step": 77855 - }, - { - "epoch": 2.0, - "learning_rate": 5.326102216898334e-07, - "loss": 0.7393, - "step": 77856 - }, - { - "epoch": 2.0, - "learning_rate": 5.325857597665544e-07, - "loss": 0.5576, - "step": 77857 - }, - { - "epoch": 2.0, - "learning_rate": 5.325612982011534e-07, - "loss": 0.6865, - "step": 77858 - }, - { - "epoch": 2.0, - "learning_rate": 5.325368369936483e-07, - "loss": 0.6208, - "step": 77859 - }, - { - "epoch": 2.0, - "learning_rate": 5.325123761440583e-07, - "loss": 0.6553, - "step": 77860 - }, - { - "epoch": 2.0, - "learning_rate": 5.32487915652402e-07, - "loss": 0.563, - "step": 77861 - }, - { - "epoch": 2.0, - "learning_rate": 5.324634555186986e-07, - "loss": 0.668, - "step": 77862 - }, - { - "epoch": 2.0, - "learning_rate": 5.324389957429662e-07, - "loss": 0.7969, - "step": 77863 - }, - { - "epoch": 2.0, - "learning_rate": 5.324145363252237e-07, - "loss": 0.501, - "step": 77864 - }, - { - "epoch": 2.0, - "learning_rate": 5.323900772654899e-07, - "loss": 0.6748, - "step": 77865 - }, - { - "epoch": 2.0, - "learning_rate": 5.323656185637837e-07, - "loss": 0.582, - "step": 77866 - }, - { - "epoch": 2.0, - "learning_rate": 5.323411602201238e-07, - "loss": 0.7529, - "step": 77867 - }, - { - "epoch": 2.0, - "learning_rate": 5.323167022345285e-07, - "loss": 0.6553, - "step": 77868 - }, - { - "epoch": 2.0, - "learning_rate": 5.322922446070166e-07, - "loss": 0.5688, - "step": 77869 - }, - { - "epoch": 2.0, - "learning_rate": 5.322677873376071e-07, - "loss": 0.5898, - "step": 77870 - }, - { - "epoch": 2.0, - "learning_rate": 5.322433304263191e-07, - "loss": 0.6797, - "step": 77871 - }, - { - "epoch": 2.0, - "learning_rate": 5.322188738731703e-07, - "loss": 0.5088, - "step": 77872 - }, - { - "epoch": 2.0, - "learning_rate": 5.321944176781801e-07, - "loss": 0.6104, - "step": 77873 - }, - { - "epoch": 2.0, - "learning_rate": 5.321699618413673e-07, - "loss": 0.5356, - "step": 77874 - }, - { - "epoch": 2.0, - "learning_rate": 5.321455063627507e-07, - "loss": 0.4834, - "step": 77875 - }, - { - "epoch": 2.0, - "learning_rate": 5.321210512423486e-07, - "loss": 0.5139, - "step": 77876 - }, - { - "epoch": 2.0, - "learning_rate": 5.320965964801798e-07, - "loss": 0.5737, - "step": 77877 - }, - { - "epoch": 2.0, - "learning_rate": 5.320721420762629e-07, - "loss": 0.5469, - "step": 77878 - }, - { - "epoch": 2.0, - "learning_rate": 5.320476880306173e-07, - "loss": 0.5881, - "step": 77879 - }, - { - "epoch": 2.0, - "learning_rate": 5.320232343432609e-07, - "loss": 0.7422, - "step": 77880 - }, - { - "epoch": 2.0, - "learning_rate": 5.319987810142128e-07, - "loss": 0.6777, - "step": 77881 - }, - { - "epoch": 2.0, - "learning_rate": 5.319743280434917e-07, - "loss": 0.5546, - "step": 77882 - }, - { - "epoch": 2.0, - "learning_rate": 5.319498754311167e-07, - "loss": 0.624, - "step": 77883 - }, - { - "epoch": 2.0, - "learning_rate": 5.319254231771058e-07, - "loss": 0.623, - "step": 77884 - }, - { - "epoch": 2.0, - "learning_rate": 5.319009712814781e-07, - "loss": 0.6318, - "step": 77885 - }, - { - "epoch": 2.0, - "learning_rate": 5.318765197442527e-07, - "loss": 0.5859, - "step": 77886 - }, - { - "epoch": 2.0, - "learning_rate": 5.318520685654475e-07, - "loss": 0.5762, - "step": 77887 - }, - { - "epoch": 2.0, - "learning_rate": 5.31827617745082e-07, - "loss": 0.5381, - "step": 77888 - }, - { - "epoch": 2.0, - "learning_rate": 5.318031672831742e-07, - "loss": 0.5127, - "step": 77889 - }, - { - "epoch": 2.0, - "learning_rate": 5.317787171797432e-07, - "loss": 0.5723, - "step": 77890 - }, - { - "epoch": 2.0, - "learning_rate": 5.317542674348078e-07, - "loss": 0.749, - "step": 77891 - }, - { - "epoch": 2.0, - "learning_rate": 5.31729818048387e-07, - "loss": 0.6245, - "step": 77892 - }, - { - "epoch": 2.0, - "learning_rate": 5.317053690204985e-07, - "loss": 0.6758, - "step": 77893 - }, - { - "epoch": 2.0, - "learning_rate": 5.316809203511618e-07, - "loss": 0.5664, - "step": 77894 - }, - { - "epoch": 2.0, - "learning_rate": 5.316564720403956e-07, - "loss": 0.5298, - "step": 77895 - }, - { - "epoch": 2.0, - "learning_rate": 5.316320240882193e-07, - "loss": 0.6416, - "step": 77896 - }, - { - "epoch": 2.0, - "learning_rate": 5.3160757649465e-07, - "loss": 0.437, - "step": 77897 - }, - { - "epoch": 2.0, - "learning_rate": 5.315831292597072e-07, - "loss": 0.707, - "step": 77898 - }, - { - "epoch": 2.0, - "learning_rate": 5.315586823834096e-07, - "loss": 0.5288, - "step": 77899 - }, - { - "epoch": 2.0, - "learning_rate": 5.315342358657764e-07, - "loss": 0.5352, - "step": 77900 - }, - { - "epoch": 2.0, - "learning_rate": 5.315097897068255e-07, - "loss": 0.4922, - "step": 77901 - }, - { - "epoch": 2.0, - "learning_rate": 5.314853439065761e-07, - "loss": 0.6973, - "step": 77902 - }, - { - "epoch": 2.0, - "learning_rate": 5.314608984650469e-07, - "loss": 0.3765, - "step": 77903 - }, - { - "epoch": 2.0, - "learning_rate": 5.314364533822566e-07, - "loss": 0.6943, - "step": 77904 - }, - { - "epoch": 2.0, - "learning_rate": 5.314120086582237e-07, - "loss": 0.5933, - "step": 77905 - }, - { - "epoch": 2.0, - "learning_rate": 5.313875642929675e-07, - "loss": 0.3682, - "step": 77906 - }, - { - "epoch": 2.0, - "learning_rate": 5.313631202865059e-07, - "loss": 0.6025, - "step": 77907 - }, - { - "epoch": 2.0, - "learning_rate": 5.313386766388579e-07, - "loss": 0.6226, - "step": 77908 - }, - { - "epoch": 2.0, - "learning_rate": 5.313142333500429e-07, - "loss": 0.5596, - "step": 77909 - }, - { - "epoch": 2.0, - "learning_rate": 5.312897904200785e-07, - "loss": 0.5249, - "step": 77910 - }, - { - "epoch": 2.0, - "learning_rate": 5.31265347848984e-07, - "loss": 0.4507, - "step": 77911 - }, - { - "epoch": 2.0, - "learning_rate": 5.31240905636778e-07, - "loss": 0.6758, - "step": 77912 - }, - { - "epoch": 2.0, - "learning_rate": 5.312164637834797e-07, - "loss": 0.5771, - "step": 77913 - }, - { - "epoch": 2.0, - "learning_rate": 5.311920222891071e-07, - "loss": 0.6177, - "step": 77914 - }, - { - "epoch": 2.0, - "learning_rate": 5.311675811536791e-07, - "loss": 0.667, - "step": 77915 - }, - { - "epoch": 2.0, - "learning_rate": 5.311431403772151e-07, - "loss": 0.5938, - "step": 77916 - }, - { - "epoch": 2.0, - "learning_rate": 5.311186999597331e-07, - "loss": 0.7441, - "step": 77917 - }, - { - "epoch": 2.0, - "learning_rate": 5.310942599012515e-07, - "loss": 0.5164, - "step": 77918 - }, - { - "epoch": 2.0, - "learning_rate": 5.310698202017896e-07, - "loss": 0.6855, - "step": 77919 - }, - { - "epoch": 2.0, - "learning_rate": 5.310453808613659e-07, - "loss": 0.4844, - "step": 77920 - }, - { - "epoch": 2.0, - "learning_rate": 5.310209418799996e-07, - "loss": 0.7261, - "step": 77921 - }, - { - "epoch": 2.0, - "learning_rate": 5.309965032577086e-07, - "loss": 0.5583, - "step": 77922 - }, - { - "epoch": 2.0, - "learning_rate": 5.309720649945119e-07, - "loss": 0.5669, - "step": 77923 - }, - { - "epoch": 2.0, - "learning_rate": 5.309476270904285e-07, - "loss": 0.4583, - "step": 77924 - }, - { - "epoch": 2.0, - "learning_rate": 5.309231895454773e-07, - "loss": 0.5864, - "step": 77925 - }, - { - "epoch": 2.0, - "learning_rate": 5.308987523596767e-07, - "loss": 0.5811, - "step": 77926 - }, - { - "epoch": 2.0, - "learning_rate": 5.308743155330449e-07, - "loss": 0.7334, - "step": 77927 - }, - { - "epoch": 2.0, - "learning_rate": 5.308498790656009e-07, - "loss": 0.5996, - "step": 77928 - }, - { - "epoch": 2.0, - "learning_rate": 5.308254429573638e-07, - "loss": 0.7246, - "step": 77929 - }, - { - "epoch": 2.0, - "learning_rate": 5.308010072083523e-07, - "loss": 0.3831, - "step": 77930 - }, - { - "epoch": 2.0, - "learning_rate": 5.307765718185846e-07, - "loss": 0.6221, - "step": 77931 - }, - { - "epoch": 2.0, - "learning_rate": 5.307521367880796e-07, - "loss": 0.5891, - "step": 77932 - }, - { - "epoch": 2.0, - "learning_rate": 5.307277021168567e-07, - "loss": 0.6377, - "step": 77933 - }, - { - "epoch": 2.0, - "learning_rate": 5.307032678049335e-07, - "loss": 0.52, - "step": 77934 - }, - { - "epoch": 2.0, - "learning_rate": 5.306788338523294e-07, - "loss": 0.5801, - "step": 77935 - }, - { - "epoch": 2.0, - "learning_rate": 5.30654400259063e-07, - "loss": 0.7056, - "step": 77936 - }, - { - "epoch": 2.0, - "learning_rate": 5.306299670251529e-07, - "loss": 0.5796, - "step": 77937 - }, - { - "epoch": 2.0, - "learning_rate": 5.306055341506179e-07, - "loss": 0.6011, - "step": 77938 - }, - { - "epoch": 2.0, - "learning_rate": 5.305811016354765e-07, - "loss": 0.5596, - "step": 77939 - }, - { - "epoch": 2.0, - "learning_rate": 5.305566694797476e-07, - "loss": 0.644, - "step": 77940 - }, - { - "epoch": 2.0, - "learning_rate": 5.305322376834498e-07, - "loss": 0.7285, - "step": 77941 - }, - { - "epoch": 2.0, - "learning_rate": 5.305078062466022e-07, - "loss": 0.6133, - "step": 77942 - }, - { - "epoch": 2.0, - "learning_rate": 5.304833751692228e-07, - "loss": 0.6147, - "step": 77943 - }, - { - "epoch": 2.0, - "learning_rate": 5.304589444513308e-07, - "loss": 0.5122, - "step": 77944 - }, - { - "epoch": 2.0, - "learning_rate": 5.304345140929447e-07, - "loss": 0.5391, - "step": 77945 - }, - { - "epoch": 2.0, - "learning_rate": 5.304100840940837e-07, - "loss": 0.7666, - "step": 77946 - }, - { - "epoch": 2.0, - "learning_rate": 5.303856544547663e-07, - "loss": 0.7588, - "step": 77947 - }, - { - "epoch": 2.0, - "learning_rate": 5.303612251750103e-07, - "loss": 0.5664, - "step": 77948 - }, - { - "epoch": 2.0, - "learning_rate": 5.303367962548353e-07, - "loss": 0.5894, - "step": 77949 - }, - { - "epoch": 2.0, - "learning_rate": 5.303123676942603e-07, - "loss": 0.502, - "step": 77950 - }, - { - "epoch": 2.0, - "learning_rate": 5.30287939493303e-07, - "loss": 0.7266, - "step": 77951 - }, - { - "epoch": 2.0, - "learning_rate": 5.302635116519827e-07, - "loss": 0.7148, - "step": 77952 - }, - { - "epoch": 2.0, - "learning_rate": 5.302390841703179e-07, - "loss": 0.5723, - "step": 77953 - }, - { - "epoch": 2.0, - "learning_rate": 5.302146570483279e-07, - "loss": 0.6362, - "step": 77954 - }, - { - "epoch": 2.0, - "learning_rate": 5.301902302860306e-07, - "loss": 0.5718, - "step": 77955 - }, - { - "epoch": 2.0, - "learning_rate": 5.301658038834454e-07, - "loss": 0.7017, - "step": 77956 - }, - { - "epoch": 2.0, - "learning_rate": 5.301413778405901e-07, - "loss": 0.7026, - "step": 77957 - }, - { - "epoch": 2.0, - "learning_rate": 5.301169521574841e-07, - "loss": 0.5894, - "step": 77958 - }, - { - "epoch": 2.0, - "learning_rate": 5.300925268341463e-07, - "loss": 0.8467, - "step": 77959 - }, - { - "epoch": 2.0, - "learning_rate": 5.300681018705946e-07, - "loss": 0.7046, - "step": 77960 - }, - { - "epoch": 2.0, - "learning_rate": 5.300436772668481e-07, - "loss": 0.5105, - "step": 77961 - }, - { - "epoch": 2.0, - "learning_rate": 5.300192530229258e-07, - "loss": 0.624, - "step": 77962 - }, - { - "epoch": 2.0, - "learning_rate": 5.299948291388463e-07, - "loss": 0.6455, - "step": 77963 - }, - { - "epoch": 2.0, - "learning_rate": 5.299704056146279e-07, - "loss": 0.7393, - "step": 77964 - }, - { - "epoch": 2.0, - "learning_rate": 5.299459824502894e-07, - "loss": 0.7393, - "step": 77965 - }, - { - "epoch": 2.0, - "learning_rate": 5.299215596458502e-07, - "loss": 0.4507, - "step": 77966 - }, - { - "epoch": 2.0, - "learning_rate": 5.298971372013283e-07, - "loss": 0.582, - "step": 77967 - }, - { - "epoch": 2.0, - "learning_rate": 5.298727151167423e-07, - "loss": 0.5176, - "step": 77968 - }, - { - "epoch": 2.0, - "learning_rate": 5.298482933921111e-07, - "loss": 0.7246, - "step": 77969 - }, - { - "epoch": 2.0, - "learning_rate": 5.298238720274535e-07, - "loss": 0.707, - "step": 77970 - }, - { - "epoch": 2.0, - "learning_rate": 5.297994510227884e-07, - "loss": 0.6196, - "step": 77971 - }, - { - "epoch": 2.0, - "learning_rate": 5.297750303781339e-07, - "loss": 0.4736, - "step": 77972 - }, - { - "epoch": 2.0, - "learning_rate": 5.297506100935089e-07, - "loss": 0.5908, - "step": 77973 - }, - { - "epoch": 2.0, - "learning_rate": 5.297261901689325e-07, - "loss": 0.7344, - "step": 77974 - }, - { - "epoch": 2.0, - "learning_rate": 5.297017706044234e-07, - "loss": 0.5977, - "step": 77975 - }, - { - "epoch": 2.0, - "learning_rate": 5.296773514000001e-07, - "loss": 0.5825, - "step": 77976 - }, - { - "epoch": 2.0, - "learning_rate": 5.296529325556806e-07, - "loss": 0.5464, - "step": 77977 - }, - { - "epoch": 2.0, - "learning_rate": 5.296285140714845e-07, - "loss": 0.6992, - "step": 77978 - }, - { - "epoch": 2.0, - "learning_rate": 5.296040959474302e-07, - "loss": 0.6616, - "step": 77979 - }, - { - "epoch": 2.0, - "learning_rate": 5.295796781835366e-07, - "loss": 0.6694, - "step": 77980 - }, - { - "epoch": 2.0, - "learning_rate": 5.295552607798219e-07, - "loss": 0.6875, - "step": 77981 - }, - { - "epoch": 2.0, - "learning_rate": 5.29530843736305e-07, - "loss": 0.5757, - "step": 77982 - }, - { - "epoch": 2.0, - "learning_rate": 5.29506427053005e-07, - "loss": 0.6685, - "step": 77983 - }, - { - "epoch": 2.0, - "learning_rate": 5.294820107299405e-07, - "loss": 0.604, - "step": 77984 - }, - { - "epoch": 2.0, - "learning_rate": 5.294575947671296e-07, - "loss": 0.6211, - "step": 77985 - }, - { - "epoch": 2.0, - "learning_rate": 5.294331791645919e-07, - "loss": 0.5271, - "step": 77986 - }, - { - "epoch": 2.0, - "learning_rate": 5.29408763922345e-07, - "loss": 0.583, - "step": 77987 - }, - { - "epoch": 2.0, - "learning_rate": 5.293843490404086e-07, - "loss": 0.7217, - "step": 77988 - }, - { - "epoch": 2.0, - "learning_rate": 5.293599345188007e-07, - "loss": 0.5024, - "step": 77989 - }, - { - "epoch": 2.0, - "learning_rate": 5.293355203575402e-07, - "loss": 0.645, - "step": 77990 - }, - { - "epoch": 2.0, - "learning_rate": 5.293111065566458e-07, - "loss": 0.7148, - "step": 77991 - }, - { - "epoch": 2.0, - "learning_rate": 5.292866931161367e-07, - "loss": 0.835, - "step": 77992 - }, - { - "epoch": 2.0, - "learning_rate": 5.292622800360306e-07, - "loss": 0.6465, - "step": 77993 - }, - { - "epoch": 2.0, - "learning_rate": 5.292378673163469e-07, - "loss": 0.709, - "step": 77994 - }, - { - "epoch": 2.0, - "learning_rate": 5.292134549571039e-07, - "loss": 0.7129, - "step": 77995 - }, - { - "epoch": 2.0, - "learning_rate": 5.291890429583211e-07, - "loss": 0.8311, - "step": 77996 - }, - { - "epoch": 2.0, - "learning_rate": 5.291646313200165e-07, - "loss": 0.3918, - "step": 77997 - }, - { - "epoch": 2.0, - "learning_rate": 5.291402200422086e-07, - "loss": 0.6187, - "step": 77998 - }, - { - "epoch": 2.0, - "learning_rate": 5.291158091249164e-07, - "loss": 0.6047, - "step": 77999 - }, - { - "epoch": 2.0, - "learning_rate": 5.290913985681584e-07, - "loss": 0.4841, - "step": 78000 - }, - { - "epoch": 2.0, - "learning_rate": 5.29066988371954e-07, - "loss": 0.6318, - "step": 78001 - }, - { - "epoch": 2.0, - "learning_rate": 5.290425785363209e-07, - "loss": 0.6235, - "step": 78002 - }, - { - "epoch": 2.0, - "learning_rate": 5.290181690612783e-07, - "loss": 0.7383, - "step": 78003 - }, - { - "epoch": 2.0, - "learning_rate": 5.289937599468452e-07, - "loss": 0.6357, - "step": 78004 - }, - { - "epoch": 2.0, - "learning_rate": 5.289693511930396e-07, - "loss": 0.6973, - "step": 78005 - }, - { - "epoch": 2.0, - "learning_rate": 5.289449427998806e-07, - "loss": 0.7168, - "step": 78006 - }, - { - "epoch": 2.0, - "learning_rate": 5.289205347673867e-07, - "loss": 0.5439, - "step": 78007 - }, - { - "epoch": 2.0, - "learning_rate": 5.288961270955766e-07, - "loss": 0.6318, - "step": 78008 - }, - { - "epoch": 2.0, - "learning_rate": 5.288717197844695e-07, - "loss": 0.6797, - "step": 78009 - }, - { - "epoch": 2.0, - "learning_rate": 5.288473128340833e-07, - "loss": 0.7441, - "step": 78010 - }, - { - "epoch": 2.0, - "learning_rate": 5.28822906244437e-07, - "loss": 0.4835, - "step": 78011 - }, - { - "epoch": 2.0, - "learning_rate": 5.287985000155493e-07, - "loss": 0.6924, - "step": 78012 - }, - { - "epoch": 2.0, - "learning_rate": 5.287740941474394e-07, - "loss": 0.6274, - "step": 78013 - }, - { - "epoch": 2.0, - "learning_rate": 5.287496886401251e-07, - "loss": 0.6543, - "step": 78014 - }, - { - "epoch": 2.0, - "learning_rate": 5.287252834936253e-07, - "loss": 0.688, - "step": 78015 - }, - { - "epoch": 2.0, - "learning_rate": 5.287008787079595e-07, - "loss": 0.6445, - "step": 78016 - }, - { - "epoch": 2.0, - "learning_rate": 5.286764742831453e-07, - "loss": 0.3557, - "step": 78017 - }, - { - "epoch": 2.0, - "learning_rate": 5.286520702192022e-07, - "loss": 0.5977, - "step": 78018 - }, - { - "epoch": 2.0, - "learning_rate": 5.286276665161482e-07, - "loss": 0.5996, - "step": 78019 - }, - { - "epoch": 2.0, - "learning_rate": 5.286032631740023e-07, - "loss": 0.5674, - "step": 78020 - }, - { - "epoch": 2.0, - "learning_rate": 5.285788601927836e-07, - "loss": 0.6108, - "step": 78021 - }, - { - "epoch": 2.0, - "learning_rate": 5.285544575725101e-07, - "loss": 0.6543, - "step": 78022 - }, - { - "epoch": 2.0, - "learning_rate": 5.285300553132006e-07, - "loss": 0.5542, - "step": 78023 - }, - { - "epoch": 2.0, - "learning_rate": 5.28505653414874e-07, - "loss": 0.7598, - "step": 78024 - }, - { - "epoch": 2.0, - "learning_rate": 5.284812518775494e-07, - "loss": 0.8291, - "step": 78025 - }, - { - "epoch": 2.0, - "learning_rate": 5.28456850701245e-07, - "loss": 0.707, - "step": 78026 - }, - { - "epoch": 2.0, - "learning_rate": 5.284324498859792e-07, - "loss": 0.7422, - "step": 78027 - }, - { - "epoch": 2.0, - "learning_rate": 5.284080494317709e-07, - "loss": 0.7637, - "step": 78028 - }, - { - "epoch": 2.0, - "learning_rate": 5.283836493386388e-07, - "loss": 0.7324, - "step": 78029 - }, - { - "epoch": 2.0, - "learning_rate": 5.283592496066021e-07, - "loss": 0.6748, - "step": 78030 - }, - { - "epoch": 2.0, - "learning_rate": 5.283348502356785e-07, - "loss": 0.6123, - "step": 78031 - }, - { - "epoch": 2.0, - "learning_rate": 5.283104512258876e-07, - "loss": 0.6738, - "step": 78032 - }, - { - "epoch": 2.0, - "learning_rate": 5.282860525772474e-07, - "loss": 0.4316, - "step": 78033 - }, - { - "epoch": 2.0, - "learning_rate": 5.282616542897773e-07, - "loss": 0.5317, - "step": 78034 - }, - { - "epoch": 2.0, - "learning_rate": 5.282372563634957e-07, - "loss": 0.2528, - "step": 78035 - }, - { - "epoch": 2.0, - "learning_rate": 5.282128587984207e-07, - "loss": 0.4692, - "step": 78036 - }, - { - "epoch": 2.0, - "learning_rate": 5.281884615945713e-07, - "loss": 0.4561, - "step": 78037 - }, - { - "epoch": 2.0, - "learning_rate": 5.281640647519667e-07, - "loss": 0.3325, - "step": 78038 - }, - { - "epoch": 2.0, - "learning_rate": 5.28139668270625e-07, - "loss": 0.4868, - "step": 78039 - }, - { - "epoch": 2.0, - "learning_rate": 5.281152721505649e-07, - "loss": 0.491, - "step": 78040 - }, - { - "epoch": 2.0, - "learning_rate": 5.280908763918053e-07, - "loss": 0.3757, - "step": 78041 - }, - { - "epoch": 2.0, - "learning_rate": 5.280664809943651e-07, - "loss": 0.4419, - "step": 78042 - }, - { - "epoch": 2.0, - "learning_rate": 5.280420859582624e-07, - "loss": 0.298, - "step": 78043 - }, - { - "epoch": 2.0, - "learning_rate": 5.280176912835161e-07, - "loss": 0.603, - "step": 78044 - }, - { - "epoch": 2.0, - "learning_rate": 5.279932969701454e-07, - "loss": 0.4521, - "step": 78045 - }, - { - "epoch": 2.0, - "learning_rate": 5.279689030181681e-07, - "loss": 0.4775, - "step": 78046 - }, - { - "epoch": 2.0, - "learning_rate": 5.279445094276038e-07, - "loss": 0.3804, - "step": 78047 - }, - { - "epoch": 2.0, - "learning_rate": 5.279201161984701e-07, - "loss": 0.5171, - "step": 78048 - }, - { - "epoch": 2.0, - "learning_rate": 5.278957233307864e-07, - "loss": 0.4331, - "step": 78049 - }, - { - "epoch": 2.0, - "learning_rate": 5.278713308245713e-07, - "loss": 0.519, - "step": 78050 - }, - { - "epoch": 2.0, - "learning_rate": 5.278469386798436e-07, - "loss": 0.4927, - "step": 78051 - }, - { - "epoch": 2.0, - "learning_rate": 5.278225468966215e-07, - "loss": 0.5303, - "step": 78052 - }, - { - "epoch": 2.0, - "learning_rate": 5.27798155474924e-07, - "loss": 0.5957, - "step": 78053 - }, - { - "epoch": 2.0, - "learning_rate": 5.277737644147698e-07, - "loss": 0.448, - "step": 78054 - }, - { - "epoch": 2.0, - "learning_rate": 5.277493737161782e-07, - "loss": 0.4421, - "step": 78055 - }, - { - "epoch": 2.0, - "learning_rate": 5.277249833791664e-07, - "loss": 0.4062, - "step": 78056 - }, - { - "epoch": 2.0, - "learning_rate": 5.277005934037539e-07, - "loss": 0.4736, - "step": 78057 - }, - { - "epoch": 2.0, - "learning_rate": 5.276762037899594e-07, - "loss": 0.5078, - "step": 78058 - }, - { - "epoch": 2.0, - "learning_rate": 5.276518145378017e-07, - "loss": 0.5005, - "step": 78059 - }, - { - "epoch": 2.0, - "learning_rate": 5.27627425647299e-07, - "loss": 0.4453, - "step": 78060 - }, - { - "epoch": 2.0, - "learning_rate": 5.276030371184703e-07, - "loss": 0.5425, - "step": 78061 - }, - { - "epoch": 2.0, - "learning_rate": 5.275786489513343e-07, - "loss": 0.5029, - "step": 78062 - }, - { - "epoch": 2.0, - "learning_rate": 5.275542611459098e-07, - "loss": 0.4268, - "step": 78063 - }, - { - "epoch": 2.0, - "learning_rate": 5.275298737022152e-07, - "loss": 0.4824, - "step": 78064 - }, - { - "epoch": 2.0, - "learning_rate": 5.275054866202692e-07, - "loss": 0.4678, - "step": 78065 - }, - { - "epoch": 2.0, - "learning_rate": 5.274810999000905e-07, - "loss": 0.4834, - "step": 78066 - }, - { - "epoch": 2.0, - "learning_rate": 5.274567135416976e-07, - "loss": 0.4829, - "step": 78067 - }, - { - "epoch": 2.0, - "learning_rate": 5.274323275451099e-07, - "loss": 0.4746, - "step": 78068 - }, - { - "epoch": 2.0, - "learning_rate": 5.274079419103451e-07, - "loss": 0.3428, - "step": 78069 - }, - { - "epoch": 2.0, - "learning_rate": 5.273835566374222e-07, - "loss": 0.4971, - "step": 78070 - }, - { - "epoch": 2.0, - "learning_rate": 5.273591717263601e-07, - "loss": 0.4116, - "step": 78071 - }, - { - "epoch": 2.0, - "learning_rate": 5.273347871771777e-07, - "loss": 0.4033, - "step": 78072 - }, - { - "epoch": 2.0, - "learning_rate": 5.273104029898929e-07, - "loss": 0.4004, - "step": 78073 - }, - { - "epoch": 2.0, - "learning_rate": 5.272860191645249e-07, - "loss": 0.3368, - "step": 78074 - }, - { - "epoch": 2.0, - "learning_rate": 5.272616357010926e-07, - "loss": 0.4941, - "step": 78075 - }, - { - "epoch": 2.0, - "learning_rate": 5.272372525996142e-07, - "loss": 0.4116, - "step": 78076 - }, - { - "epoch": 2.0, - "learning_rate": 5.272128698601083e-07, - "loss": 0.3885, - "step": 78077 - }, - { - "epoch": 2.0, - "learning_rate": 5.271884874825936e-07, - "loss": 0.4219, - "step": 78078 - }, - { - "epoch": 2.0, - "learning_rate": 5.27164105467089e-07, - "loss": 0.3994, - "step": 78079 - }, - { - "epoch": 2.0, - "learning_rate": 5.271397238136135e-07, - "loss": 0.4431, - "step": 78080 - }, - { - "epoch": 2.0, - "learning_rate": 5.271153425221851e-07, - "loss": 0.3655, - "step": 78081 - }, - { - "epoch": 2.0, - "learning_rate": 5.270909615928225e-07, - "loss": 0.4717, - "step": 78082 - }, - { - "epoch": 2.0, - "learning_rate": 5.270665810255448e-07, - "loss": 0.4053, - "step": 78083 - }, - { - "epoch": 2.0, - "learning_rate": 5.270422008203708e-07, - "loss": 0.2834, - "step": 78084 - }, - { - "epoch": 2.0, - "learning_rate": 5.270178209773188e-07, - "loss": 0.3918, - "step": 78085 - }, - { - "epoch": 2.0, - "learning_rate": 5.269934414964073e-07, - "loss": 0.4204, - "step": 78086 - }, - { - "epoch": 2.0, - "learning_rate": 5.269690623776548e-07, - "loss": 0.4399, - "step": 78087 - }, - { - "epoch": 2.0, - "learning_rate": 5.269446836210807e-07, - "loss": 0.397, - "step": 78088 - }, - { - "epoch": 2.0, - "learning_rate": 5.269203052267034e-07, - "loss": 0.3647, - "step": 78089 - }, - { - "epoch": 2.0, - "learning_rate": 5.268959271945413e-07, - "loss": 0.5059, - "step": 78090 - }, - { - "epoch": 2.0, - "learning_rate": 5.268715495246133e-07, - "loss": 0.481, - "step": 78091 - }, - { - "epoch": 2.0, - "learning_rate": 5.268471722169377e-07, - "loss": 0.3955, - "step": 78092 - }, - { - "epoch": 2.0, - "learning_rate": 5.268227952715341e-07, - "loss": 0.3887, - "step": 78093 - }, - { - "epoch": 2.0, - "learning_rate": 5.267984186884201e-07, - "loss": 0.4668, - "step": 78094 - }, - { - "epoch": 2.0, - "learning_rate": 5.267740424676151e-07, - "loss": 0.4087, - "step": 78095 - }, - { - "epoch": 2.0, - "learning_rate": 5.267496666091371e-07, - "loss": 0.4761, - "step": 78096 - }, - { - "epoch": 2.0, - "learning_rate": 5.267252911130054e-07, - "loss": 0.3792, - "step": 78097 - }, - { - "epoch": 2.0, - "learning_rate": 5.267009159792382e-07, - "loss": 0.4546, - "step": 78098 - }, - { - "epoch": 2.0, - "learning_rate": 5.266765412078542e-07, - "loss": 0.2788, - "step": 78099 - }, - { - "epoch": 2.0, - "learning_rate": 5.266521667988723e-07, - "loss": 0.501, - "step": 78100 - }, - { - "epoch": 2.0, - "learning_rate": 5.266277927523114e-07, - "loss": 0.4751, - "step": 78101 - }, - { - "epoch": 2.0, - "learning_rate": 5.266034190681894e-07, - "loss": 0.355, - "step": 78102 - }, - { - "epoch": 2.0, - "learning_rate": 5.265790457465256e-07, - "loss": 0.3735, - "step": 78103 - }, - { - "epoch": 2.0, - "learning_rate": 5.265546727873383e-07, - "loss": 0.2698, - "step": 78104 - }, - { - "epoch": 2.0, - "learning_rate": 5.265303001906468e-07, - "loss": 0.3696, - "step": 78105 - }, - { - "epoch": 2.0, - "learning_rate": 5.26505927956469e-07, - "loss": 0.3317, - "step": 78106 - }, - { - "epoch": 2.0, - "learning_rate": 5.264815560848236e-07, - "loss": 0.3982, - "step": 78107 - }, - { - "epoch": 2.0, - "learning_rate": 5.264571845757297e-07, - "loss": 0.4165, - "step": 78108 - }, - { - "epoch": 2.0, - "learning_rate": 5.264328134292055e-07, - "loss": 0.4966, - "step": 78109 - }, - { - "epoch": 2.0, - "learning_rate": 5.264084426452705e-07, - "loss": 0.4023, - "step": 78110 - }, - { - "epoch": 2.0, - "learning_rate": 5.263840722239424e-07, - "loss": 0.439, - "step": 78111 - }, - { - "epoch": 2.0, - "learning_rate": 5.2635970216524e-07, - "loss": 0.4658, - "step": 78112 - }, - { - "epoch": 2.0, - "learning_rate": 5.263353324691829e-07, - "loss": 0.4307, - "step": 78113 - }, - { - "epoch": 2.0, - "learning_rate": 5.263109631357884e-07, - "loss": 0.4531, - "step": 78114 - }, - { - "epoch": 2.0, - "learning_rate": 5.262865941650763e-07, - "loss": 0.3076, - "step": 78115 - }, - { - "epoch": 2.0, - "learning_rate": 5.262622255570644e-07, - "loss": 0.3187, - "step": 78116 - }, - { - "epoch": 2.0, - "learning_rate": 5.262378573117717e-07, - "loss": 0.5376, - "step": 78117 - }, - { - "epoch": 2.0, - "learning_rate": 5.262134894292174e-07, - "loss": 0.302, - "step": 78118 - }, - { - "epoch": 2.0, - "learning_rate": 5.26189121909419e-07, - "loss": 0.4541, - "step": 78119 - }, - { - "epoch": 2.0, - "learning_rate": 5.26164754752396e-07, - "loss": 0.3804, - "step": 78120 - }, - { - "epoch": 2.0, - "learning_rate": 5.261403879581668e-07, - "loss": 0.4678, - "step": 78121 - }, - { - "epoch": 2.0, - "learning_rate": 5.261160215267506e-07, - "loss": 0.2551, - "step": 78122 - }, - { - "epoch": 2.0, - "learning_rate": 5.260916554581651e-07, - "loss": 0.4377, - "step": 78123 - }, - { - "epoch": 2.0, - "learning_rate": 5.260672897524294e-07, - "loss": 0.4534, - "step": 78124 - }, - { - "epoch": 2.0, - "learning_rate": 5.260429244095625e-07, - "loss": 0.5771, - "step": 78125 - }, - { - "epoch": 2.0, - "learning_rate": 5.260185594295825e-07, - "loss": 0.4453, - "step": 78126 - }, - { - "epoch": 2.0, - "learning_rate": 5.259941948125088e-07, - "loss": 0.4919, - "step": 78127 - }, - { - "epoch": 2.0, - "learning_rate": 5.259698305583589e-07, - "loss": 0.3728, - "step": 78128 - }, - { - "epoch": 2.0, - "learning_rate": 5.259454666671523e-07, - "loss": 0.5352, - "step": 78129 - }, - { - "epoch": 2.0, - "learning_rate": 5.259211031389077e-07, - "loss": 0.3974, - "step": 78130 - }, - { - "epoch": 2.0, - "learning_rate": 5.258967399736431e-07, - "loss": 0.4629, - "step": 78131 - }, - { - "epoch": 2.0, - "learning_rate": 5.258723771713778e-07, - "loss": 0.3584, - "step": 78132 - }, - { - "epoch": 2.0, - "learning_rate": 5.258480147321301e-07, - "loss": 0.4458, - "step": 78133 - }, - { - "epoch": 2.0, - "learning_rate": 5.25823652655919e-07, - "loss": 0.3635, - "step": 78134 - }, - { - "epoch": 2.0, - "learning_rate": 5.257992909427631e-07, - "loss": 0.4307, - "step": 78135 - }, - { - "epoch": 2.0, - "learning_rate": 5.257749295926803e-07, - "loss": 0.4602, - "step": 78136 - }, - { - "epoch": 2.0, - "learning_rate": 5.2575056860569e-07, - "loss": 0.3545, - "step": 78137 - }, - { - "epoch": 2.0, - "learning_rate": 5.257262079818108e-07, - "loss": 0.4172, - "step": 78138 - }, - { - "epoch": 2.0, - "learning_rate": 5.257018477210614e-07, - "loss": 0.4292, - "step": 78139 - }, - { - "epoch": 2.0, - "learning_rate": 5.2567748782346e-07, - "loss": 0.4927, - "step": 78140 - }, - { - "epoch": 2.0, - "learning_rate": 5.256531282890256e-07, - "loss": 0.3938, - "step": 78141 - }, - { - "epoch": 2.0, - "learning_rate": 5.256287691177765e-07, - "loss": 0.4976, - "step": 78142 - }, - { - "epoch": 2.0, - "learning_rate": 5.256044103097323e-07, - "loss": 0.3514, - "step": 78143 - }, - { - "epoch": 2.0, - "learning_rate": 5.255800518649105e-07, - "loss": 0.3755, - "step": 78144 - }, - { - "epoch": 2.0, - "learning_rate": 5.255556937833308e-07, - "loss": 0.3921, - "step": 78145 - }, - { - "epoch": 2.0, - "learning_rate": 5.255313360650107e-07, - "loss": 0.3545, - "step": 78146 - }, - { - "epoch": 2.0, - "learning_rate": 5.255069787099699e-07, - "loss": 0.4082, - "step": 78147 - }, - { - "epoch": 2.0, - "learning_rate": 5.254826217182262e-07, - "loss": 0.3723, - "step": 78148 - }, - { - "epoch": 2.0, - "learning_rate": 5.254582650897985e-07, - "loss": 0.4307, - "step": 78149 - }, - { - "epoch": 2.0, - "learning_rate": 5.254339088247057e-07, - "loss": 0.5298, - "step": 78150 - }, - { - "epoch": 2.0, - "learning_rate": 5.254095529229668e-07, - "loss": 0.2917, - "step": 78151 - }, - { - "epoch": 2.0, - "learning_rate": 5.253851973845995e-07, - "loss": 0.5732, - "step": 78152 - }, - { - "epoch": 2.0, - "learning_rate": 5.25360842209623e-07, - "loss": 0.4048, - "step": 78153 - }, - { - "epoch": 2.0, - "learning_rate": 5.253364873980559e-07, - "loss": 0.4658, - "step": 78154 - }, - { - "epoch": 2.0, - "learning_rate": 5.253121329499171e-07, - "loss": 0.5146, - "step": 78155 - }, - { - "epoch": 2.0, - "learning_rate": 5.25287778865225e-07, - "loss": 0.5723, - "step": 78156 - }, - { - "epoch": 2.0, - "learning_rate": 5.252634251439979e-07, - "loss": 0.4355, - "step": 78157 - }, - { - "epoch": 2.0, - "learning_rate": 5.252390717862547e-07, - "loss": 0.3872, - "step": 78158 - }, - { - "epoch": 2.0, - "learning_rate": 5.252147187920141e-07, - "loss": 0.5107, - "step": 78159 - }, - { - "epoch": 2.0, - "learning_rate": 5.251903661612953e-07, - "loss": 0.2463, - "step": 78160 - }, - { - "epoch": 2.0, - "learning_rate": 5.251660138941158e-07, - "loss": 0.5508, - "step": 78161 - }, - { - "epoch": 2.0, - "learning_rate": 5.25141661990495e-07, - "loss": 0.4663, - "step": 78162 - }, - { - "epoch": 2.0, - "learning_rate": 5.251173104504513e-07, - "loss": 0.4751, - "step": 78163 - }, - { - "epoch": 2.0, - "learning_rate": 5.250929592740039e-07, - "loss": 0.3884, - "step": 78164 - }, - { - "epoch": 2.0, - "learning_rate": 5.250686084611711e-07, - "loss": 0.3831, - "step": 78165 - }, - { - "epoch": 2.0, - "learning_rate": 5.250442580119708e-07, - "loss": 0.4253, - "step": 78166 - }, - { - "epoch": 2.0, - "learning_rate": 5.250199079264223e-07, - "loss": 0.4326, - "step": 78167 - }, - { - "epoch": 2.0, - "learning_rate": 5.249955582045447e-07, - "loss": 0.2772, - "step": 78168 - }, - { - "epoch": 2.0, - "learning_rate": 5.249712088463559e-07, - "loss": 0.4365, - "step": 78169 - }, - { - "epoch": 2.0, - "learning_rate": 5.249468598518746e-07, - "loss": 0.4316, - "step": 78170 - }, - { - "epoch": 2.0, - "learning_rate": 5.249225112211197e-07, - "loss": 0.4365, - "step": 78171 - }, - { - "epoch": 2.0, - "learning_rate": 5.248981629541101e-07, - "loss": 0.377, - "step": 78172 - }, - { - "epoch": 2.0, - "learning_rate": 5.248738150508638e-07, - "loss": 0.4399, - "step": 78173 - }, - { - "epoch": 2.0, - "learning_rate": 5.248494675113999e-07, - "loss": 0.3857, - "step": 78174 - }, - { - "epoch": 2.0, - "learning_rate": 5.248251203357372e-07, - "loss": 0.3704, - "step": 78175 - }, - { - "epoch": 2.0, - "learning_rate": 5.248007735238937e-07, - "loss": 0.2454, - "step": 78176 - }, - { - "epoch": 2.0, - "learning_rate": 5.247764270758886e-07, - "loss": 0.4395, - "step": 78177 - }, - { - "epoch": 2.0, - "learning_rate": 5.247520809917402e-07, - "loss": 0.5127, - "step": 78178 - }, - { - "epoch": 2.0, - "learning_rate": 5.247277352714672e-07, - "loss": 0.4127, - "step": 78179 - }, - { - "epoch": 2.0, - "learning_rate": 5.247033899150882e-07, - "loss": 0.395, - "step": 78180 - }, - { - "epoch": 2.0, - "learning_rate": 5.246790449226225e-07, - "loss": 0.2844, - "step": 78181 - }, - { - "epoch": 2.0, - "learning_rate": 5.246547002940878e-07, - "loss": 0.5435, - "step": 78182 - }, - { - "epoch": 2.0, - "learning_rate": 5.24630356029503e-07, - "loss": 0.1517, - "step": 78183 - }, - { - "epoch": 2.0, - "learning_rate": 5.246060121288873e-07, - "loss": 0.4287, - "step": 78184 - }, - { - "epoch": 2.0, - "learning_rate": 5.24581668592259e-07, - "loss": 0.3926, - "step": 78185 - }, - { - "epoch": 2.0, - "learning_rate": 5.245573254196362e-07, - "loss": 0.4087, - "step": 78186 - }, - { - "epoch": 2.0, - "learning_rate": 5.24532982611038e-07, - "loss": 0.3584, - "step": 78187 - }, - { - "epoch": 2.0, - "learning_rate": 5.245086401664832e-07, - "loss": 0.4497, - "step": 78188 - }, - { - "epoch": 2.0, - "learning_rate": 5.244842980859905e-07, - "loss": 0.4495, - "step": 78189 - }, - { - "epoch": 2.0, - "learning_rate": 5.24459956369578e-07, - "loss": 0.4722, - "step": 78190 - }, - { - "epoch": 2.0, - "learning_rate": 5.244356150172647e-07, - "loss": 0.394, - "step": 78191 - }, - { - "epoch": 2.0, - "learning_rate": 5.244112740290689e-07, - "loss": 0.3804, - "step": 78192 - }, - { - "epoch": 2.0, - "learning_rate": 5.243869334050101e-07, - "loss": 0.4238, - "step": 78193 - }, - { - "epoch": 2.0, - "learning_rate": 5.24362593145106e-07, - "loss": 0.3882, - "step": 78194 - }, - { - "epoch": 2.0, - "learning_rate": 5.24338253249376e-07, - "loss": 0.4092, - "step": 78195 - }, - { - "epoch": 2.0, - "learning_rate": 5.243139137178378e-07, - "loss": 0.5234, - "step": 78196 - }, - { - "epoch": 2.0, - "learning_rate": 5.242895745505107e-07, - "loss": 0.4238, - "step": 78197 - }, - { - "epoch": 2.0, - "learning_rate": 5.242652357474135e-07, - "loss": 0.4067, - "step": 78198 - }, - { - "epoch": 2.0, - "learning_rate": 5.242408973085642e-07, - "loss": 0.3896, - "step": 78199 - }, - { - "epoch": 2.0, - "learning_rate": 5.242165592339817e-07, - "loss": 0.4438, - "step": 78200 - }, - { - "epoch": 2.0, - "learning_rate": 5.241922215236852e-07, - "loss": 0.3044, - "step": 78201 - }, - { - "epoch": 2.0, - "learning_rate": 5.241678841776923e-07, - "loss": 0.3755, - "step": 78202 - }, - { - "epoch": 2.0, - "learning_rate": 5.241435471960223e-07, - "loss": 0.4459, - "step": 78203 - }, - { - "epoch": 2.0, - "learning_rate": 5.241192105786935e-07, - "loss": 0.3599, - "step": 78204 - }, - { - "epoch": 2.0, - "learning_rate": 5.240948743257254e-07, - "loss": 0.48, - "step": 78205 - }, - { - "epoch": 2.0, - "learning_rate": 5.240705384371359e-07, - "loss": 0.3394, - "step": 78206 - }, - { - "epoch": 2.0, - "learning_rate": 5.240462029129433e-07, - "loss": 0.4226, - "step": 78207 - }, - { - "epoch": 2.0, - "learning_rate": 5.240218677531664e-07, - "loss": 0.2361, - "step": 78208 - }, - { - "epoch": 2.0, - "learning_rate": 5.239975329578245e-07, - "loss": 0.4756, - "step": 78209 - }, - { - "epoch": 2.0, - "learning_rate": 5.239731985269359e-07, - "loss": 0.4443, - "step": 78210 - }, - { - "epoch": 2.0, - "learning_rate": 5.239488644605188e-07, - "loss": 0.3853, - "step": 78211 - }, - { - "epoch": 2.0, - "learning_rate": 5.239245307585922e-07, - "loss": 0.3284, - "step": 78212 - }, - { - "epoch": 2.0, - "learning_rate": 5.239001974211748e-07, - "loss": 0.4146, - "step": 78213 - }, - { - "epoch": 2.0, - "learning_rate": 5.238758644482853e-07, - "loss": 0.302, - "step": 78214 - }, - { - "epoch": 2.0, - "learning_rate": 5.238515318399422e-07, - "loss": 0.4492, - "step": 78215 - }, - { - "epoch": 2.0, - "learning_rate": 5.238271995961639e-07, - "loss": 0.3931, - "step": 78216 - }, - { - "epoch": 2.0, - "learning_rate": 5.23802867716969e-07, - "loss": 0.3782, - "step": 78217 - }, - { - "epoch": 2.0, - "learning_rate": 5.237785362023767e-07, - "loss": 0.3159, - "step": 78218 - }, - { - "epoch": 2.0, - "learning_rate": 5.23754205052405e-07, - "loss": 0.4565, - "step": 78219 - }, - { - "epoch": 2.0, - "learning_rate": 5.237298742670728e-07, - "loss": 0.3599, - "step": 78220 - }, - { - "epoch": 2.0, - "learning_rate": 5.237055438463989e-07, - "loss": 0.4351, - "step": 78221 - }, - { - "epoch": 2.0, - "learning_rate": 5.236812137904019e-07, - "loss": 0.4226, - "step": 78222 - }, - { - "epoch": 2.0, - "learning_rate": 5.236568840991e-07, - "loss": 0.415, - "step": 78223 - }, - { - "epoch": 2.0, - "learning_rate": 5.236325547725121e-07, - "loss": 0.3713, - "step": 78224 - }, - { - "epoch": 2.0, - "learning_rate": 5.236082258106574e-07, - "loss": 0.3457, - "step": 78225 - }, - { - "epoch": 2.0, - "learning_rate": 5.235838972135533e-07, - "loss": 0.4497, - "step": 78226 - }, - { - "epoch": 2.0, - "learning_rate": 5.235595689812195e-07, - "loss": 0.3303, - "step": 78227 - }, - { - "epoch": 2.01, - "learning_rate": 5.235352411136741e-07, - "loss": 0.5103, - "step": 78228 - }, - { - "epoch": 2.01, - "learning_rate": 5.235109136109357e-07, - "loss": 0.3788, - "step": 78229 - }, - { - "epoch": 2.01, - "learning_rate": 5.234865864730231e-07, - "loss": 0.3574, - "step": 78230 - }, - { - "epoch": 2.01, - "learning_rate": 5.234622596999554e-07, - "loss": 0.438, - "step": 78231 - }, - { - "epoch": 2.01, - "learning_rate": 5.234379332917502e-07, - "loss": 0.3907, - "step": 78232 - }, - { - "epoch": 2.01, - "learning_rate": 5.234136072484268e-07, - "loss": 0.4336, - "step": 78233 - }, - { - "epoch": 2.01, - "learning_rate": 5.233892815700036e-07, - "loss": 0.4243, - "step": 78234 - }, - { - "epoch": 2.01, - "learning_rate": 5.233649562564997e-07, - "loss": 0.625, - "step": 78235 - }, - { - "epoch": 2.01, - "learning_rate": 5.233406313079334e-07, - "loss": 0.3159, - "step": 78236 - }, - { - "epoch": 2.01, - "learning_rate": 5.233163067243226e-07, - "loss": 0.4414, - "step": 78237 - }, - { - "epoch": 2.01, - "learning_rate": 5.23291982505687e-07, - "loss": 0.3918, - "step": 78238 - }, - { - "epoch": 2.01, - "learning_rate": 5.23267658652045e-07, - "loss": 0.4395, - "step": 78239 - }, - { - "epoch": 2.01, - "learning_rate": 5.232433351634147e-07, - "loss": 0.4565, - "step": 78240 - }, - { - "epoch": 2.01, - "learning_rate": 5.23219012039815e-07, - "loss": 0.3557, - "step": 78241 - }, - { - "epoch": 2.01, - "learning_rate": 5.231946892812645e-07, - "loss": 0.3911, - "step": 78242 - }, - { - "epoch": 2.01, - "learning_rate": 5.231703668877824e-07, - "loss": 0.3875, - "step": 78243 - }, - { - "epoch": 2.01, - "learning_rate": 5.231460448593864e-07, - "loss": 0.3394, - "step": 78244 - }, - { - "epoch": 2.01, - "learning_rate": 5.23121723196096e-07, - "loss": 0.361, - "step": 78245 - }, - { - "epoch": 2.01, - "learning_rate": 5.230974018979288e-07, - "loss": 0.4106, - "step": 78246 - }, - { - "epoch": 2.01, - "learning_rate": 5.230730809649042e-07, - "loss": 0.3354, - "step": 78247 - }, - { - "epoch": 2.01, - "learning_rate": 5.230487603970409e-07, - "loss": 0.4111, - "step": 78248 - }, - { - "epoch": 2.01, - "learning_rate": 5.230244401943568e-07, - "loss": 0.5405, - "step": 78249 - }, - { - "epoch": 2.01, - "learning_rate": 5.230001203568711e-07, - "loss": 0.4121, - "step": 78250 - }, - { - "epoch": 2.01, - "learning_rate": 5.229758008846021e-07, - "loss": 0.4883, - "step": 78251 - }, - { - "epoch": 2.01, - "learning_rate": 5.229514817775692e-07, - "loss": 0.406, - "step": 78252 - }, - { - "epoch": 2.01, - "learning_rate": 5.229271630357899e-07, - "loss": 0.4976, - "step": 78253 - }, - { - "epoch": 2.01, - "learning_rate": 5.229028446592834e-07, - "loss": 0.4482, - "step": 78254 - }, - { - "epoch": 2.01, - "learning_rate": 5.228785266480685e-07, - "loss": 0.5229, - "step": 78255 - }, - { - "epoch": 2.01, - "learning_rate": 5.228542090021637e-07, - "loss": 0.4502, - "step": 78256 - }, - { - "epoch": 2.01, - "learning_rate": 5.22829891721587e-07, - "loss": 0.3556, - "step": 78257 - }, - { - "epoch": 2.01, - "learning_rate": 5.228055748063576e-07, - "loss": 0.5015, - "step": 78258 - }, - { - "epoch": 2.01, - "learning_rate": 5.22781258256494e-07, - "loss": 0.3311, - "step": 78259 - }, - { - "epoch": 2.01, - "learning_rate": 5.227569420720152e-07, - "loss": 0.4963, - "step": 78260 - }, - { - "epoch": 2.01, - "learning_rate": 5.227326262529393e-07, - "loss": 0.4893, - "step": 78261 - }, - { - "epoch": 2.01, - "learning_rate": 5.227083107992847e-07, - "loss": 0.4653, - "step": 78262 - }, - { - "epoch": 2.01, - "learning_rate": 5.226839957110707e-07, - "loss": 0.4688, - "step": 78263 - }, - { - "epoch": 2.01, - "learning_rate": 5.226596809883159e-07, - "loss": 0.439, - "step": 78264 - }, - { - "epoch": 2.01, - "learning_rate": 5.226353666310385e-07, - "loss": 0.3685, - "step": 78265 - }, - { - "epoch": 2.01, - "learning_rate": 5.226110526392571e-07, - "loss": 0.3721, - "step": 78266 - }, - { - "epoch": 2.01, - "learning_rate": 5.225867390129904e-07, - "loss": 0.5068, - "step": 78267 - }, - { - "epoch": 2.01, - "learning_rate": 5.22562425752257e-07, - "loss": 0.3914, - "step": 78268 - }, - { - "epoch": 2.01, - "learning_rate": 5.225381128570761e-07, - "loss": 0.3552, - "step": 78269 - }, - { - "epoch": 2.01, - "learning_rate": 5.225138003274653e-07, - "loss": 0.4023, - "step": 78270 - }, - { - "epoch": 2.01, - "learning_rate": 5.224894881634438e-07, - "loss": 0.3076, - "step": 78271 - }, - { - "epoch": 2.01, - "learning_rate": 5.224651763650301e-07, - "loss": 0.4596, - "step": 78272 - }, - { - "epoch": 2.01, - "learning_rate": 5.224408649322433e-07, - "loss": 0.4731, - "step": 78273 - }, - { - "epoch": 2.01, - "learning_rate": 5.224165538651011e-07, - "loss": 0.52, - "step": 78274 - }, - { - "epoch": 2.01, - "learning_rate": 5.223922431636229e-07, - "loss": 0.5659, - "step": 78275 - }, - { - "epoch": 2.01, - "learning_rate": 5.223679328278269e-07, - "loss": 0.4146, - "step": 78276 - }, - { - "epoch": 2.01, - "learning_rate": 5.22343622857732e-07, - "loss": 0.3315, - "step": 78277 - }, - { - "epoch": 2.01, - "learning_rate": 5.223193132533563e-07, - "loss": 0.5737, - "step": 78278 - }, - { - "epoch": 2.01, - "learning_rate": 5.222950040147187e-07, - "loss": 0.3867, - "step": 78279 - }, - { - "epoch": 2.01, - "learning_rate": 5.222706951418378e-07, - "loss": 0.4194, - "step": 78280 - }, - { - "epoch": 2.01, - "learning_rate": 5.222463866347328e-07, - "loss": 0.5786, - "step": 78281 - }, - { - "epoch": 2.01, - "learning_rate": 5.222220784934213e-07, - "loss": 0.5259, - "step": 78282 - }, - { - "epoch": 2.01, - "learning_rate": 5.221977707179224e-07, - "loss": 0.355, - "step": 78283 - }, - { - "epoch": 2.01, - "learning_rate": 5.221734633082546e-07, - "loss": 0.3086, - "step": 78284 - }, - { - "epoch": 2.01, - "learning_rate": 5.221491562644371e-07, - "loss": 0.3877, - "step": 78285 - }, - { - "epoch": 2.01, - "learning_rate": 5.22124849586488e-07, - "loss": 0.4259, - "step": 78286 - }, - { - "epoch": 2.01, - "learning_rate": 5.221005432744256e-07, - "loss": 0.3643, - "step": 78287 - }, - { - "epoch": 2.01, - "learning_rate": 5.220762373282688e-07, - "loss": 0.3862, - "step": 78288 - }, - { - "epoch": 2.01, - "learning_rate": 5.22051931748036e-07, - "loss": 0.4277, - "step": 78289 - }, - { - "epoch": 2.01, - "learning_rate": 5.220276265337469e-07, - "loss": 0.4707, - "step": 78290 - }, - { - "epoch": 2.01, - "learning_rate": 5.220033216854184e-07, - "loss": 0.3848, - "step": 78291 - }, - { - "epoch": 2.01, - "learning_rate": 5.219790172030704e-07, - "loss": 0.4722, - "step": 78292 - }, - { - "epoch": 2.01, - "learning_rate": 5.219547130867212e-07, - "loss": 0.4409, - "step": 78293 - }, - { - "epoch": 2.01, - "learning_rate": 5.219304093363891e-07, - "loss": 0.5356, - "step": 78294 - }, - { - "epoch": 2.01, - "learning_rate": 5.219061059520932e-07, - "loss": 0.3457, - "step": 78295 - }, - { - "epoch": 2.01, - "learning_rate": 5.218818029338514e-07, - "loss": 0.4697, - "step": 78296 - }, - { - "epoch": 2.01, - "learning_rate": 5.218575002816827e-07, - "loss": 0.3975, - "step": 78297 - }, - { - "epoch": 2.01, - "learning_rate": 5.218331979956062e-07, - "loss": 0.4248, - "step": 78298 - }, - { - "epoch": 2.01, - "learning_rate": 5.218088960756397e-07, - "loss": 0.3457, - "step": 78299 - }, - { - "epoch": 2.01, - "learning_rate": 5.21784594521802e-07, - "loss": 0.5015, - "step": 78300 - }, - { - "epoch": 2.01, - "learning_rate": 5.217602933341119e-07, - "loss": 0.5278, - "step": 78301 - }, - { - "epoch": 2.01, - "learning_rate": 5.217359925125884e-07, - "loss": 0.4556, - "step": 78302 - }, - { - "epoch": 2.01, - "learning_rate": 5.21711692057249e-07, - "loss": 0.4375, - "step": 78303 - }, - { - "epoch": 2.01, - "learning_rate": 5.216873919681133e-07, - "loss": 0.5195, - "step": 78304 - }, - { - "epoch": 2.01, - "learning_rate": 5.216630922451999e-07, - "loss": 0.4531, - "step": 78305 - }, - { - "epoch": 2.01, - "learning_rate": 5.216387928885266e-07, - "loss": 0.4712, - "step": 78306 - }, - { - "epoch": 2.01, - "learning_rate": 5.216144938981128e-07, - "loss": 0.459, - "step": 78307 - }, - { - "epoch": 2.01, - "learning_rate": 5.215901952739765e-07, - "loss": 0.2781, - "step": 78308 - }, - { - "epoch": 2.01, - "learning_rate": 5.215658970161365e-07, - "loss": 0.4282, - "step": 78309 - }, - { - "epoch": 2.01, - "learning_rate": 5.21541599124612e-07, - "loss": 0.375, - "step": 78310 - }, - { - "epoch": 2.01, - "learning_rate": 5.215173015994207e-07, - "loss": 0.4541, - "step": 78311 - }, - { - "epoch": 2.01, - "learning_rate": 5.214930044405817e-07, - "loss": 0.4385, - "step": 78312 - }, - { - "epoch": 2.01, - "learning_rate": 5.214687076481133e-07, - "loss": 0.3127, - "step": 78313 - }, - { - "epoch": 2.01, - "learning_rate": 5.214444112220346e-07, - "loss": 0.4001, - "step": 78314 - }, - { - "epoch": 2.01, - "learning_rate": 5.214201151623642e-07, - "loss": 0.5186, - "step": 78315 - }, - { - "epoch": 2.01, - "learning_rate": 5.2139581946912e-07, - "loss": 0.3094, - "step": 78316 - }, - { - "epoch": 2.01, - "learning_rate": 5.213715241423207e-07, - "loss": 0.3958, - "step": 78317 - }, - { - "epoch": 2.01, - "learning_rate": 5.213472291819855e-07, - "loss": 0.417, - "step": 78318 - }, - { - "epoch": 2.01, - "learning_rate": 5.213229345881331e-07, - "loss": 0.4495, - "step": 78319 - }, - { - "epoch": 2.01, - "learning_rate": 5.212986403607812e-07, - "loss": 0.259, - "step": 78320 - }, - { - "epoch": 2.01, - "learning_rate": 5.212743464999489e-07, - "loss": 0.406, - "step": 78321 - }, - { - "epoch": 2.01, - "learning_rate": 5.21250053005655e-07, - "loss": 0.4111, - "step": 78322 - }, - { - "epoch": 2.01, - "learning_rate": 5.212257598779181e-07, - "loss": 0.5415, - "step": 78323 - }, - { - "epoch": 2.01, - "learning_rate": 5.212014671167568e-07, - "loss": 0.3224, - "step": 78324 - }, - { - "epoch": 2.01, - "learning_rate": 5.211771747221892e-07, - "loss": 0.2822, - "step": 78325 - }, - { - "epoch": 2.01, - "learning_rate": 5.21152882694234e-07, - "loss": 0.376, - "step": 78326 - }, - { - "epoch": 2.01, - "learning_rate": 5.211285910329105e-07, - "loss": 0.3643, - "step": 78327 - }, - { - "epoch": 2.01, - "learning_rate": 5.211042997382364e-07, - "loss": 0.3276, - "step": 78328 - }, - { - "epoch": 2.01, - "learning_rate": 5.210800088102307e-07, - "loss": 0.5005, - "step": 78329 - }, - { - "epoch": 2.01, - "learning_rate": 5.210557182489121e-07, - "loss": 0.5151, - "step": 78330 - }, - { - "epoch": 2.01, - "learning_rate": 5.210314280542995e-07, - "loss": 0.3347, - "step": 78331 - }, - { - "epoch": 2.01, - "learning_rate": 5.210071382264108e-07, - "loss": 0.4585, - "step": 78332 - }, - { - "epoch": 2.01, - "learning_rate": 5.209828487652646e-07, - "loss": 0.4683, - "step": 78333 - }, - { - "epoch": 2.01, - "learning_rate": 5.209585596708806e-07, - "loss": 0.4521, - "step": 78334 - }, - { - "epoch": 2.01, - "learning_rate": 5.209342709432758e-07, - "loss": 0.3255, - "step": 78335 - }, - { - "epoch": 2.01, - "learning_rate": 5.209099825824703e-07, - "loss": 0.5591, - "step": 78336 - }, - { - "epoch": 2.01, - "learning_rate": 5.208856945884814e-07, - "loss": 0.478, - "step": 78337 - }, - { - "epoch": 2.01, - "learning_rate": 5.208614069613284e-07, - "loss": 0.3513, - "step": 78338 - }, - { - "epoch": 2.01, - "learning_rate": 5.208371197010298e-07, - "loss": 0.48, - "step": 78339 - }, - { - "epoch": 2.01, - "learning_rate": 5.208128328076046e-07, - "loss": 0.4009, - "step": 78340 - }, - { - "epoch": 2.01, - "learning_rate": 5.207885462810706e-07, - "loss": 0.4883, - "step": 78341 - }, - { - "epoch": 2.01, - "learning_rate": 5.207642601214467e-07, - "loss": 0.5176, - "step": 78342 - }, - { - "epoch": 2.01, - "learning_rate": 5.207399743287516e-07, - "loss": 0.3972, - "step": 78343 - }, - { - "epoch": 2.01, - "learning_rate": 5.207156889030047e-07, - "loss": 0.5098, - "step": 78344 - }, - { - "epoch": 2.01, - "learning_rate": 5.206914038442229e-07, - "loss": 0.4985, - "step": 78345 - }, - { - "epoch": 2.01, - "learning_rate": 5.206671191524257e-07, - "loss": 0.3117, - "step": 78346 - }, - { - "epoch": 2.01, - "learning_rate": 5.206428348276315e-07, - "loss": 0.3259, - "step": 78347 - }, - { - "epoch": 2.01, - "learning_rate": 5.206185508698596e-07, - "loss": 0.479, - "step": 78348 - }, - { - "epoch": 2.01, - "learning_rate": 5.205942672791276e-07, - "loss": 0.3542, - "step": 78349 - }, - { - "epoch": 2.01, - "learning_rate": 5.205699840554545e-07, - "loss": 0.3572, - "step": 78350 - }, - { - "epoch": 2.01, - "learning_rate": 5.20545701198859e-07, - "loss": 0.3229, - "step": 78351 - }, - { - "epoch": 2.01, - "learning_rate": 5.205214187093598e-07, - "loss": 0.4795, - "step": 78352 - }, - { - "epoch": 2.01, - "learning_rate": 5.204971365869751e-07, - "loss": 0.4055, - "step": 78353 - }, - { - "epoch": 2.01, - "learning_rate": 5.204728548317241e-07, - "loss": 0.4194, - "step": 78354 - }, - { - "epoch": 2.01, - "learning_rate": 5.204485734436245e-07, - "loss": 0.3347, - "step": 78355 - }, - { - "epoch": 2.01, - "learning_rate": 5.204242924226953e-07, - "loss": 0.4824, - "step": 78356 - }, - { - "epoch": 2.01, - "learning_rate": 5.204000117689557e-07, - "loss": 0.4829, - "step": 78357 - }, - { - "epoch": 2.01, - "learning_rate": 5.203757314824235e-07, - "loss": 0.4302, - "step": 78358 - }, - { - "epoch": 2.01, - "learning_rate": 5.203514515631173e-07, - "loss": 0.386, - "step": 78359 - }, - { - "epoch": 2.01, - "learning_rate": 5.20327172011056e-07, - "loss": 0.3938, - "step": 78360 - }, - { - "epoch": 2.01, - "learning_rate": 5.203028928262585e-07, - "loss": 0.3851, - "step": 78361 - }, - { - "epoch": 2.01, - "learning_rate": 5.202786140087427e-07, - "loss": 0.4199, - "step": 78362 - }, - { - "epoch": 2.01, - "learning_rate": 5.202543355585276e-07, - "loss": 0.3608, - "step": 78363 - }, - { - "epoch": 2.01, - "learning_rate": 5.202300574756319e-07, - "loss": 0.437, - "step": 78364 - }, - { - "epoch": 2.01, - "learning_rate": 5.202057797600741e-07, - "loss": 0.3745, - "step": 78365 - }, - { - "epoch": 2.01, - "learning_rate": 5.201815024118721e-07, - "loss": 0.3384, - "step": 78366 - }, - { - "epoch": 2.01, - "learning_rate": 5.201572254310452e-07, - "loss": 0.4189, - "step": 78367 - }, - { - "epoch": 2.01, - "learning_rate": 5.201329488176119e-07, - "loss": 0.4014, - "step": 78368 - }, - { - "epoch": 2.01, - "learning_rate": 5.201086725715911e-07, - "loss": 0.4712, - "step": 78369 - }, - { - "epoch": 2.01, - "learning_rate": 5.200843966930005e-07, - "loss": 0.5366, - "step": 78370 - }, - { - "epoch": 2.01, - "learning_rate": 5.200601211818594e-07, - "loss": 0.395, - "step": 78371 - }, - { - "epoch": 2.01, - "learning_rate": 5.200358460381861e-07, - "loss": 0.3218, - "step": 78372 - }, - { - "epoch": 2.01, - "learning_rate": 5.200115712619997e-07, - "loss": 0.2944, - "step": 78373 - }, - { - "epoch": 2.01, - "learning_rate": 5.199872968533183e-07, - "loss": 0.3787, - "step": 78374 - }, - { - "epoch": 2.01, - "learning_rate": 5.199630228121602e-07, - "loss": 0.3656, - "step": 78375 - }, - { - "epoch": 2.01, - "learning_rate": 5.199387491385443e-07, - "loss": 0.4077, - "step": 78376 - }, - { - "epoch": 2.01, - "learning_rate": 5.199144758324894e-07, - "loss": 0.3892, - "step": 78377 - }, - { - "epoch": 2.01, - "learning_rate": 5.198902028940142e-07, - "loss": 0.4746, - "step": 78378 - }, - { - "epoch": 2.01, - "learning_rate": 5.198659303231366e-07, - "loss": 0.3911, - "step": 78379 - }, - { - "epoch": 2.01, - "learning_rate": 5.198416581198755e-07, - "loss": 0.4805, - "step": 78380 - }, - { - "epoch": 2.01, - "learning_rate": 5.1981738628425e-07, - "loss": 0.3213, - "step": 78381 - }, - { - "epoch": 2.01, - "learning_rate": 5.197931148162778e-07, - "loss": 0.4565, - "step": 78382 - }, - { - "epoch": 2.01, - "learning_rate": 5.19768843715978e-07, - "loss": 0.2996, - "step": 78383 - }, - { - "epoch": 2.01, - "learning_rate": 5.197445729833696e-07, - "loss": 0.5024, - "step": 78384 - }, - { - "epoch": 2.01, - "learning_rate": 5.197203026184702e-07, - "loss": 0.4717, - "step": 78385 - }, - { - "epoch": 2.01, - "learning_rate": 5.196960326212994e-07, - "loss": 0.4277, - "step": 78386 - }, - { - "epoch": 2.01, - "learning_rate": 5.196717629918748e-07, - "loss": 0.4177, - "step": 78387 - }, - { - "epoch": 2.01, - "learning_rate": 5.196474937302153e-07, - "loss": 0.4248, - "step": 78388 - }, - { - "epoch": 2.01, - "learning_rate": 5.196232248363397e-07, - "loss": 0.2826, - "step": 78389 - }, - { - "epoch": 2.01, - "learning_rate": 5.19598956310267e-07, - "loss": 0.5049, - "step": 78390 - }, - { - "epoch": 2.01, - "learning_rate": 5.195746881520148e-07, - "loss": 0.3979, - "step": 78391 - }, - { - "epoch": 2.01, - "learning_rate": 5.195504203616023e-07, - "loss": 0.3676, - "step": 78392 - }, - { - "epoch": 2.01, - "learning_rate": 5.195261529390478e-07, - "loss": 0.4375, - "step": 78393 - }, - { - "epoch": 2.01, - "learning_rate": 5.195018858843705e-07, - "loss": 0.4736, - "step": 78394 - }, - { - "epoch": 2.01, - "learning_rate": 5.194776191975885e-07, - "loss": 0.4224, - "step": 78395 - }, - { - "epoch": 2.01, - "learning_rate": 5.1945335287872e-07, - "loss": 0.4182, - "step": 78396 - }, - { - "epoch": 2.01, - "learning_rate": 5.19429086927784e-07, - "loss": 0.4028, - "step": 78397 - }, - { - "epoch": 2.01, - "learning_rate": 5.19404821344799e-07, - "loss": 0.4697, - "step": 78398 - }, - { - "epoch": 2.01, - "learning_rate": 5.193805561297839e-07, - "loss": 0.4094, - "step": 78399 - }, - { - "epoch": 2.01, - "learning_rate": 5.193562912827569e-07, - "loss": 0.4258, - "step": 78400 - }, - { - "epoch": 2.01, - "learning_rate": 5.193320268037364e-07, - "loss": 0.3555, - "step": 78401 - }, - { - "epoch": 2.01, - "learning_rate": 5.193077626927418e-07, - "loss": 0.5117, - "step": 78402 - }, - { - "epoch": 2.01, - "learning_rate": 5.192834989497909e-07, - "loss": 0.5576, - "step": 78403 - }, - { - "epoch": 2.01, - "learning_rate": 5.192592355749027e-07, - "loss": 0.5127, - "step": 78404 - }, - { - "epoch": 2.01, - "learning_rate": 5.192349725680952e-07, - "loss": 0.4497, - "step": 78405 - }, - { - "epoch": 2.01, - "learning_rate": 5.192107099293875e-07, - "loss": 0.46, - "step": 78406 - }, - { - "epoch": 2.01, - "learning_rate": 5.191864476587984e-07, - "loss": 0.5381, - "step": 78407 - }, - { - "epoch": 2.01, - "learning_rate": 5.191621857563458e-07, - "loss": 0.4966, - "step": 78408 - }, - { - "epoch": 2.01, - "learning_rate": 5.191379242220484e-07, - "loss": 0.5332, - "step": 78409 - }, - { - "epoch": 2.01, - "learning_rate": 5.191136630559252e-07, - "loss": 0.3877, - "step": 78410 - }, - { - "epoch": 2.01, - "learning_rate": 5.190894022579948e-07, - "loss": 0.498, - "step": 78411 - }, - { - "epoch": 2.01, - "learning_rate": 5.190651418282752e-07, - "loss": 0.4072, - "step": 78412 - }, - { - "epoch": 2.01, - "learning_rate": 5.190408817667852e-07, - "loss": 0.3403, - "step": 78413 - }, - { - "epoch": 2.01, - "learning_rate": 5.190166220735441e-07, - "loss": 0.4663, - "step": 78414 - }, - { - "epoch": 2.01, - "learning_rate": 5.189923627485692e-07, - "loss": 0.4429, - "step": 78415 - }, - { - "epoch": 2.01, - "learning_rate": 5.189681037918805e-07, - "loss": 0.4507, - "step": 78416 - }, - { - "epoch": 2.01, - "learning_rate": 5.189438452034952e-07, - "loss": 0.5024, - "step": 78417 - }, - { - "epoch": 2.01, - "learning_rate": 5.189195869834324e-07, - "loss": 0.4883, - "step": 78418 - }, - { - "epoch": 2.01, - "learning_rate": 5.188953291317112e-07, - "loss": 0.4878, - "step": 78419 - }, - { - "epoch": 2.01, - "learning_rate": 5.188710716483493e-07, - "loss": 0.4824, - "step": 78420 - }, - { - "epoch": 2.01, - "learning_rate": 5.188468145333657e-07, - "loss": 0.5835, - "step": 78421 - }, - { - "epoch": 2.01, - "learning_rate": 5.18822557786779e-07, - "loss": 0.397, - "step": 78422 - }, - { - "epoch": 2.01, - "learning_rate": 5.187983014086082e-07, - "loss": 0.459, - "step": 78423 - }, - { - "epoch": 2.01, - "learning_rate": 5.187740453988714e-07, - "loss": 0.4468, - "step": 78424 - }, - { - "epoch": 2.01, - "learning_rate": 5.187497897575867e-07, - "loss": 0.4861, - "step": 78425 - }, - { - "epoch": 2.01, - "learning_rate": 5.187255344847731e-07, - "loss": 0.4756, - "step": 78426 - }, - { - "epoch": 2.01, - "learning_rate": 5.187012795804494e-07, - "loss": 0.4951, - "step": 78427 - }, - { - "epoch": 2.01, - "learning_rate": 5.186770250446344e-07, - "loss": 0.4849, - "step": 78428 - }, - { - "epoch": 2.01, - "learning_rate": 5.186527708773457e-07, - "loss": 0.4194, - "step": 78429 - }, - { - "epoch": 2.01, - "learning_rate": 5.186285170786025e-07, - "loss": 0.3706, - "step": 78430 - }, - { - "epoch": 2.01, - "learning_rate": 5.186042636484233e-07, - "loss": 0.4546, - "step": 78431 - }, - { - "epoch": 2.01, - "learning_rate": 5.185800105868272e-07, - "loss": 0.4922, - "step": 78432 - }, - { - "epoch": 2.01, - "learning_rate": 5.185557578938317e-07, - "loss": 0.3339, - "step": 78433 - }, - { - "epoch": 2.01, - "learning_rate": 5.185315055694566e-07, - "loss": 0.3643, - "step": 78434 - }, - { - "epoch": 2.01, - "learning_rate": 5.185072536137191e-07, - "loss": 0.4599, - "step": 78435 - }, - { - "epoch": 2.01, - "learning_rate": 5.184830020266389e-07, - "loss": 0.3054, - "step": 78436 - }, - { - "epoch": 2.01, - "learning_rate": 5.184587508082338e-07, - "loss": 0.4219, - "step": 78437 - }, - { - "epoch": 2.01, - "learning_rate": 5.184344999585226e-07, - "loss": 0.2299, - "step": 78438 - }, - { - "epoch": 2.01, - "learning_rate": 5.184102494775241e-07, - "loss": 0.5078, - "step": 78439 - }, - { - "epoch": 2.01, - "learning_rate": 5.18385999365257e-07, - "loss": 0.4985, - "step": 78440 - }, - { - "epoch": 2.01, - "learning_rate": 5.183617496217393e-07, - "loss": 0.4319, - "step": 78441 - }, - { - "epoch": 2.01, - "learning_rate": 5.183375002469899e-07, - "loss": 0.4062, - "step": 78442 - }, - { - "epoch": 2.01, - "learning_rate": 5.183132512410271e-07, - "loss": 0.373, - "step": 78443 - }, - { - "epoch": 2.01, - "learning_rate": 5.182890026038702e-07, - "loss": 0.4717, - "step": 78444 - }, - { - "epoch": 2.01, - "learning_rate": 5.182647543355374e-07, - "loss": 0.2192, - "step": 78445 - }, - { - "epoch": 2.01, - "learning_rate": 5.182405064360466e-07, - "loss": 0.4229, - "step": 78446 - }, - { - "epoch": 2.01, - "learning_rate": 5.182162589054169e-07, - "loss": 0.4038, - "step": 78447 - }, - { - "epoch": 2.01, - "learning_rate": 5.181920117436669e-07, - "loss": 0.4434, - "step": 78448 - }, - { - "epoch": 2.01, - "learning_rate": 5.181677649508154e-07, - "loss": 0.4939, - "step": 78449 - }, - { - "epoch": 2.01, - "learning_rate": 5.181435185268803e-07, - "loss": 0.458, - "step": 78450 - }, - { - "epoch": 2.01, - "learning_rate": 5.181192724718808e-07, - "loss": 0.4546, - "step": 78451 - }, - { - "epoch": 2.01, - "learning_rate": 5.18095026785835e-07, - "loss": 0.4817, - "step": 78452 - }, - { - "epoch": 2.01, - "learning_rate": 5.180707814687622e-07, - "loss": 0.3473, - "step": 78453 - }, - { - "epoch": 2.01, - "learning_rate": 5.180465365206804e-07, - "loss": 0.4985, - "step": 78454 - }, - { - "epoch": 2.01, - "learning_rate": 5.180222919416076e-07, - "loss": 0.322, - "step": 78455 - }, - { - "epoch": 2.01, - "learning_rate": 5.179980477315632e-07, - "loss": 0.4124, - "step": 78456 - }, - { - "epoch": 2.01, - "learning_rate": 5.179738038905659e-07, - "loss": 0.5259, - "step": 78457 - }, - { - "epoch": 2.01, - "learning_rate": 5.179495604186335e-07, - "loss": 0.3767, - "step": 78458 - }, - { - "epoch": 2.01, - "learning_rate": 5.179253173157848e-07, - "loss": 0.3936, - "step": 78459 - }, - { - "epoch": 2.01, - "learning_rate": 5.179010745820387e-07, - "loss": 0.4751, - "step": 78460 - }, - { - "epoch": 2.01, - "learning_rate": 5.178768322174138e-07, - "loss": 0.4165, - "step": 78461 - }, - { - "epoch": 2.01, - "learning_rate": 5.178525902219282e-07, - "loss": 0.3887, - "step": 78462 - }, - { - "epoch": 2.01, - "learning_rate": 5.178283485956008e-07, - "loss": 0.4287, - "step": 78463 - }, - { - "epoch": 2.01, - "learning_rate": 5.178041073384502e-07, - "loss": 0.3582, - "step": 78464 - }, - { - "epoch": 2.01, - "learning_rate": 5.177798664504946e-07, - "loss": 0.2697, - "step": 78465 - }, - { - "epoch": 2.01, - "learning_rate": 5.177556259317531e-07, - "loss": 0.3721, - "step": 78466 - }, - { - "epoch": 2.01, - "learning_rate": 5.177313857822437e-07, - "loss": 0.3696, - "step": 78467 - }, - { - "epoch": 2.01, - "learning_rate": 5.17707146001985e-07, - "loss": 0.4487, - "step": 78468 - }, - { - "epoch": 2.01, - "learning_rate": 5.176829065909958e-07, - "loss": 0.4062, - "step": 78469 - }, - { - "epoch": 2.01, - "learning_rate": 5.176586675492951e-07, - "loss": 0.2988, - "step": 78470 - }, - { - "epoch": 2.01, - "learning_rate": 5.176344288769006e-07, - "loss": 0.2781, - "step": 78471 - }, - { - "epoch": 2.01, - "learning_rate": 5.176101905738311e-07, - "loss": 0.4165, - "step": 78472 - }, - { - "epoch": 2.01, - "learning_rate": 5.175859526401059e-07, - "loss": 0.4756, - "step": 78473 - }, - { - "epoch": 2.01, - "learning_rate": 5.175617150757427e-07, - "loss": 0.4834, - "step": 78474 - }, - { - "epoch": 2.01, - "learning_rate": 5.175374778807599e-07, - "loss": 0.3411, - "step": 78475 - }, - { - "epoch": 2.01, - "learning_rate": 5.175132410551768e-07, - "loss": 0.4424, - "step": 78476 - }, - { - "epoch": 2.01, - "learning_rate": 5.174890045990115e-07, - "loss": 0.4062, - "step": 78477 - }, - { - "epoch": 2.01, - "learning_rate": 5.174647685122828e-07, - "loss": 0.4121, - "step": 78478 - }, - { - "epoch": 2.01, - "learning_rate": 5.174405327950091e-07, - "loss": 0.4736, - "step": 78479 - }, - { - "epoch": 2.01, - "learning_rate": 5.174162974472088e-07, - "loss": 0.3989, - "step": 78480 - }, - { - "epoch": 2.01, - "learning_rate": 5.173920624689007e-07, - "loss": 0.3669, - "step": 78481 - }, - { - "epoch": 2.01, - "learning_rate": 5.173678278601037e-07, - "loss": 0.3014, - "step": 78482 - }, - { - "epoch": 2.01, - "learning_rate": 5.173435936208357e-07, - "loss": 0.4014, - "step": 78483 - }, - { - "epoch": 2.01, - "learning_rate": 5.173193597511156e-07, - "loss": 0.4167, - "step": 78484 - }, - { - "epoch": 2.01, - "learning_rate": 5.172951262509617e-07, - "loss": 0.5088, - "step": 78485 - }, - { - "epoch": 2.01, - "learning_rate": 5.172708931203927e-07, - "loss": 0.5156, - "step": 78486 - }, - { - "epoch": 2.01, - "learning_rate": 5.172466603594277e-07, - "loss": 0.4492, - "step": 78487 - }, - { - "epoch": 2.01, - "learning_rate": 5.172224279680842e-07, - "loss": 0.4069, - "step": 78488 - }, - { - "epoch": 2.01, - "learning_rate": 5.171981959463811e-07, - "loss": 0.3989, - "step": 78489 - }, - { - "epoch": 2.01, - "learning_rate": 5.171739642943378e-07, - "loss": 0.415, - "step": 78490 - }, - { - "epoch": 2.01, - "learning_rate": 5.171497330119718e-07, - "loss": 0.3573, - "step": 78491 - }, - { - "epoch": 2.01, - "learning_rate": 5.17125502099302e-07, - "loss": 0.3462, - "step": 78492 - }, - { - "epoch": 2.01, - "learning_rate": 5.17101271556347e-07, - "loss": 0.3118, - "step": 78493 - }, - { - "epoch": 2.01, - "learning_rate": 5.170770413831255e-07, - "loss": 0.3899, - "step": 78494 - }, - { - "epoch": 2.01, - "learning_rate": 5.170528115796563e-07, - "loss": 0.3794, - "step": 78495 - }, - { - "epoch": 2.01, - "learning_rate": 5.17028582145957e-07, - "loss": 0.4736, - "step": 78496 - }, - { - "epoch": 2.01, - "learning_rate": 5.170043530820467e-07, - "loss": 0.4072, - "step": 78497 - }, - { - "epoch": 2.01, - "learning_rate": 5.169801243879439e-07, - "loss": 0.3979, - "step": 78498 - }, - { - "epoch": 2.01, - "learning_rate": 5.169558960636677e-07, - "loss": 0.4138, - "step": 78499 - }, - { - "epoch": 2.01, - "learning_rate": 5.169316681092357e-07, - "loss": 0.3862, - "step": 78500 - }, - { - "epoch": 2.01, - "learning_rate": 5.16907440524667e-07, - "loss": 0.4111, - "step": 78501 - }, - { - "epoch": 2.01, - "learning_rate": 5.168832133099798e-07, - "loss": 0.4458, - "step": 78502 - }, - { - "epoch": 2.01, - "learning_rate": 5.168589864651935e-07, - "loss": 0.5, - "step": 78503 - }, - { - "epoch": 2.01, - "learning_rate": 5.168347599903262e-07, - "loss": 0.4204, - "step": 78504 - }, - { - "epoch": 2.01, - "learning_rate": 5.168105338853958e-07, - "loss": 0.4819, - "step": 78505 - }, - { - "epoch": 2.01, - "learning_rate": 5.167863081504214e-07, - "loss": 0.2122, - "step": 78506 - }, - { - "epoch": 2.01, - "learning_rate": 5.167620827854217e-07, - "loss": 0.4575, - "step": 78507 - }, - { - "epoch": 2.01, - "learning_rate": 5.167378577904148e-07, - "loss": 0.4292, - "step": 78508 - }, - { - "epoch": 2.01, - "learning_rate": 5.167136331654194e-07, - "loss": 0.394, - "step": 78509 - }, - { - "epoch": 2.01, - "learning_rate": 5.166894089104543e-07, - "loss": 0.3682, - "step": 78510 - }, - { - "epoch": 2.01, - "learning_rate": 5.166651850255382e-07, - "loss": 0.4988, - "step": 78511 - }, - { - "epoch": 2.01, - "learning_rate": 5.166409615106891e-07, - "loss": 0.3689, - "step": 78512 - }, - { - "epoch": 2.01, - "learning_rate": 5.166167383659255e-07, - "loss": 0.4268, - "step": 78513 - }, - { - "epoch": 2.01, - "learning_rate": 5.165925155912669e-07, - "loss": 0.5088, - "step": 78514 - }, - { - "epoch": 2.01, - "learning_rate": 5.165682931867306e-07, - "loss": 0.2888, - "step": 78515 - }, - { - "epoch": 2.01, - "learning_rate": 5.165440711523363e-07, - "loss": 0.5664, - "step": 78516 - }, - { - "epoch": 2.01, - "learning_rate": 5.165198494881013e-07, - "loss": 0.4888, - "step": 78517 - }, - { - "epoch": 2.01, - "learning_rate": 5.164956281940452e-07, - "loss": 0.2608, - "step": 78518 - }, - { - "epoch": 2.01, - "learning_rate": 5.164714072701859e-07, - "loss": 0.4946, - "step": 78519 - }, - { - "epoch": 2.01, - "learning_rate": 5.164471867165428e-07, - "loss": 0.5596, - "step": 78520 - }, - { - "epoch": 2.01, - "learning_rate": 5.164229665331333e-07, - "loss": 0.4773, - "step": 78521 - }, - { - "epoch": 2.01, - "learning_rate": 5.163987467199764e-07, - "loss": 0.332, - "step": 78522 - }, - { - "epoch": 2.01, - "learning_rate": 5.163745272770909e-07, - "loss": 0.4453, - "step": 78523 - }, - { - "epoch": 2.01, - "learning_rate": 5.16350308204496e-07, - "loss": 0.3879, - "step": 78524 - }, - { - "epoch": 2.01, - "learning_rate": 5.163260895022086e-07, - "loss": 0.283, - "step": 78525 - }, - { - "epoch": 2.01, - "learning_rate": 5.163018711702481e-07, - "loss": 0.3926, - "step": 78526 - }, - { - "epoch": 2.01, - "learning_rate": 5.162776532086331e-07, - "loss": 0.394, - "step": 78527 - }, - { - "epoch": 2.01, - "learning_rate": 5.162534356173822e-07, - "loss": 0.363, - "step": 78528 - }, - { - "epoch": 2.01, - "learning_rate": 5.162292183965135e-07, - "loss": 0.4561, - "step": 78529 - }, - { - "epoch": 2.01, - "learning_rate": 5.16205001546046e-07, - "loss": 0.4351, - "step": 78530 - }, - { - "epoch": 2.01, - "learning_rate": 5.161807850659978e-07, - "loss": 0.2691, - "step": 78531 - }, - { - "epoch": 2.01, - "learning_rate": 5.161565689563884e-07, - "loss": 0.3257, - "step": 78532 - }, - { - "epoch": 2.01, - "learning_rate": 5.161323532172352e-07, - "loss": 0.3409, - "step": 78533 - }, - { - "epoch": 2.01, - "learning_rate": 5.161081378485576e-07, - "loss": 0.4316, - "step": 78534 - }, - { - "epoch": 2.01, - "learning_rate": 5.160839228503733e-07, - "loss": 0.4209, - "step": 78535 - }, - { - "epoch": 2.01, - "learning_rate": 5.160597082227012e-07, - "loss": 0.2959, - "step": 78536 - }, - { - "epoch": 2.01, - "learning_rate": 5.160354939655604e-07, - "loss": 0.3508, - "step": 78537 - }, - { - "epoch": 2.01, - "learning_rate": 5.160112800789686e-07, - "loss": 0.3276, - "step": 78538 - }, - { - "epoch": 2.01, - "learning_rate": 5.159870665629449e-07, - "loss": 0.4136, - "step": 78539 - }, - { - "epoch": 2.01, - "learning_rate": 5.159628534175075e-07, - "loss": 0.4636, - "step": 78540 - }, - { - "epoch": 2.01, - "learning_rate": 5.159386406426753e-07, - "loss": 0.4517, - "step": 78541 - }, - { - "epoch": 2.01, - "learning_rate": 5.159144282384664e-07, - "loss": 0.3843, - "step": 78542 - }, - { - "epoch": 2.01, - "learning_rate": 5.158902162048996e-07, - "loss": 0.2074, - "step": 78543 - }, - { - "epoch": 2.01, - "learning_rate": 5.158660045419938e-07, - "loss": 0.5093, - "step": 78544 - }, - { - "epoch": 2.01, - "learning_rate": 5.158417932497669e-07, - "loss": 0.428, - "step": 78545 - }, - { - "epoch": 2.01, - "learning_rate": 5.158175823282376e-07, - "loss": 0.4746, - "step": 78546 - }, - { - "epoch": 2.01, - "learning_rate": 5.157933717774243e-07, - "loss": 0.3682, - "step": 78547 - }, - { - "epoch": 2.01, - "learning_rate": 5.157691615973459e-07, - "loss": 0.4893, - "step": 78548 - }, - { - "epoch": 2.01, - "learning_rate": 5.15744951788021e-07, - "loss": 0.2278, - "step": 78549 - }, - { - "epoch": 2.01, - "learning_rate": 5.157207423494677e-07, - "loss": 0.4609, - "step": 78550 - }, - { - "epoch": 2.01, - "learning_rate": 5.156965332817048e-07, - "loss": 0.4099, - "step": 78551 - }, - { - "epoch": 2.01, - "learning_rate": 5.156723245847506e-07, - "loss": 0.4043, - "step": 78552 - }, - { - "epoch": 2.01, - "learning_rate": 5.156481162586244e-07, - "loss": 0.3447, - "step": 78553 - }, - { - "epoch": 2.01, - "learning_rate": 5.15623908303344e-07, - "loss": 0.3508, - "step": 78554 - }, - { - "epoch": 2.01, - "learning_rate": 5.155997007189279e-07, - "loss": 0.5229, - "step": 78555 - }, - { - "epoch": 2.01, - "learning_rate": 5.155754935053946e-07, - "loss": 0.3821, - "step": 78556 - }, - { - "epoch": 2.01, - "learning_rate": 5.15551286662763e-07, - "loss": 0.4043, - "step": 78557 - }, - { - "epoch": 2.01, - "learning_rate": 5.155270801910519e-07, - "loss": 0.3872, - "step": 78558 - }, - { - "epoch": 2.01, - "learning_rate": 5.155028740902791e-07, - "loss": 0.4561, - "step": 78559 - }, - { - "epoch": 2.01, - "learning_rate": 5.154786683604633e-07, - "loss": 0.3933, - "step": 78560 - }, - { - "epoch": 2.01, - "learning_rate": 5.154544630016234e-07, - "loss": 0.3643, - "step": 78561 - }, - { - "epoch": 2.01, - "learning_rate": 5.154302580137781e-07, - "loss": 0.4387, - "step": 78562 - }, - { - "epoch": 2.01, - "learning_rate": 5.154060533969451e-07, - "loss": 0.254, - "step": 78563 - }, - { - "epoch": 2.01, - "learning_rate": 5.153818491511438e-07, - "loss": 0.4277, - "step": 78564 - }, - { - "epoch": 2.01, - "learning_rate": 5.153576452763919e-07, - "loss": 0.4375, - "step": 78565 - }, - { - "epoch": 2.01, - "learning_rate": 5.153334417727089e-07, - "loss": 0.386, - "step": 78566 - }, - { - "epoch": 2.01, - "learning_rate": 5.153092386401123e-07, - "loss": 0.3025, - "step": 78567 - }, - { - "epoch": 2.01, - "learning_rate": 5.152850358786211e-07, - "loss": 0.4204, - "step": 78568 - }, - { - "epoch": 2.01, - "learning_rate": 5.15260833488254e-07, - "loss": 0.4614, - "step": 78569 - }, - { - "epoch": 2.01, - "learning_rate": 5.152366314690297e-07, - "loss": 0.5425, - "step": 78570 - }, - { - "epoch": 2.01, - "learning_rate": 5.15212429820966e-07, - "loss": 0.603, - "step": 78571 - }, - { - "epoch": 2.01, - "learning_rate": 5.151882285440818e-07, - "loss": 0.304, - "step": 78572 - }, - { - "epoch": 2.01, - "learning_rate": 5.151640276383958e-07, - "loss": 0.4917, - "step": 78573 - }, - { - "epoch": 2.01, - "learning_rate": 5.151398271039269e-07, - "loss": 0.4482, - "step": 78574 - }, - { - "epoch": 2.01, - "learning_rate": 5.151156269406929e-07, - "loss": 0.3727, - "step": 78575 - }, - { - "epoch": 2.01, - "learning_rate": 5.150914271487124e-07, - "loss": 0.4717, - "step": 78576 - }, - { - "epoch": 2.01, - "learning_rate": 5.150672277280039e-07, - "loss": 0.345, - "step": 78577 - }, - { - "epoch": 2.01, - "learning_rate": 5.150430286785862e-07, - "loss": 0.4756, - "step": 78578 - }, - { - "epoch": 2.01, - "learning_rate": 5.150188300004781e-07, - "loss": 0.3235, - "step": 78579 - }, - { - "epoch": 2.01, - "learning_rate": 5.149946316936975e-07, - "loss": 0.4438, - "step": 78580 - }, - { - "epoch": 2.01, - "learning_rate": 5.149704337582631e-07, - "loss": 0.5303, - "step": 78581 - }, - { - "epoch": 2.01, - "learning_rate": 5.149462361941941e-07, - "loss": 0.4941, - "step": 78582 - }, - { - "epoch": 2.01, - "learning_rate": 5.149220390015079e-07, - "loss": 0.4819, - "step": 78583 - }, - { - "epoch": 2.01, - "learning_rate": 5.148978421802239e-07, - "loss": 0.4653, - "step": 78584 - }, - { - "epoch": 2.01, - "learning_rate": 5.148736457303601e-07, - "loss": 0.6069, - "step": 78585 - }, - { - "epoch": 2.01, - "learning_rate": 5.148494496519353e-07, - "loss": 0.3257, - "step": 78586 - }, - { - "epoch": 2.01, - "learning_rate": 5.148252539449682e-07, - "loss": 0.3374, - "step": 78587 - }, - { - "epoch": 2.01, - "learning_rate": 5.148010586094768e-07, - "loss": 0.2526, - "step": 78588 - }, - { - "epoch": 2.01, - "learning_rate": 5.147768636454799e-07, - "loss": 0.3347, - "step": 78589 - }, - { - "epoch": 2.01, - "learning_rate": 5.14752669052996e-07, - "loss": 0.3048, - "step": 78590 - }, - { - "epoch": 2.01, - "learning_rate": 5.14728474832044e-07, - "loss": 0.438, - "step": 78591 - }, - { - "epoch": 2.01, - "learning_rate": 5.147042809826418e-07, - "loss": 0.4099, - "step": 78592 - }, - { - "epoch": 2.01, - "learning_rate": 5.146800875048083e-07, - "loss": 0.4702, - "step": 78593 - }, - { - "epoch": 2.01, - "learning_rate": 5.146558943985622e-07, - "loss": 0.415, - "step": 78594 - }, - { - "epoch": 2.01, - "learning_rate": 5.146317016639215e-07, - "loss": 0.3595, - "step": 78595 - }, - { - "epoch": 2.01, - "learning_rate": 5.146075093009052e-07, - "loss": 0.4878, - "step": 78596 - }, - { - "epoch": 2.01, - "learning_rate": 5.145833173095313e-07, - "loss": 0.3767, - "step": 78597 - }, - { - "epoch": 2.01, - "learning_rate": 5.145591256898187e-07, - "loss": 0.2612, - "step": 78598 - }, - { - "epoch": 2.01, - "learning_rate": 5.145349344417862e-07, - "loss": 0.4951, - "step": 78599 - }, - { - "epoch": 2.01, - "learning_rate": 5.145107435654516e-07, - "loss": 0.4282, - "step": 78600 - }, - { - "epoch": 2.01, - "learning_rate": 5.144865530608337e-07, - "loss": 0.4956, - "step": 78601 - }, - { - "epoch": 2.01, - "learning_rate": 5.144623629279512e-07, - "loss": 0.4697, - "step": 78602 - }, - { - "epoch": 2.01, - "learning_rate": 5.14438173166823e-07, - "loss": 0.417, - "step": 78603 - }, - { - "epoch": 2.01, - "learning_rate": 5.14413983777467e-07, - "loss": 0.4692, - "step": 78604 - }, - { - "epoch": 2.01, - "learning_rate": 5.143897947599017e-07, - "loss": 0.3602, - "step": 78605 - }, - { - "epoch": 2.01, - "learning_rate": 5.143656061141457e-07, - "loss": 0.5024, - "step": 78606 - }, - { - "epoch": 2.01, - "learning_rate": 5.143414178402176e-07, - "loss": 0.3263, - "step": 78607 - }, - { - "epoch": 2.01, - "learning_rate": 5.143172299381364e-07, - "loss": 0.3843, - "step": 78608 - }, - { - "epoch": 2.01, - "learning_rate": 5.142930424079197e-07, - "loss": 0.2759, - "step": 78609 - }, - { - "epoch": 2.01, - "learning_rate": 5.142688552495865e-07, - "loss": 0.4199, - "step": 78610 - }, - { - "epoch": 2.01, - "learning_rate": 5.142446684631554e-07, - "loss": 0.3435, - "step": 78611 - }, - { - "epoch": 2.01, - "learning_rate": 5.142204820486451e-07, - "loss": 0.3486, - "step": 78612 - }, - { - "epoch": 2.01, - "learning_rate": 5.141962960060739e-07, - "loss": 0.3682, - "step": 78613 - }, - { - "epoch": 2.01, - "learning_rate": 5.141721103354597e-07, - "loss": 0.4309, - "step": 78614 - }, - { - "epoch": 2.01, - "learning_rate": 5.141479250368218e-07, - "loss": 0.4854, - "step": 78615 - }, - { - "epoch": 2.01, - "learning_rate": 5.141237401101788e-07, - "loss": 0.4478, - "step": 78616 - }, - { - "epoch": 2.01, - "learning_rate": 5.140995555555485e-07, - "loss": 0.4619, - "step": 78617 - }, - { - "epoch": 2.02, - "learning_rate": 5.140753713729499e-07, - "loss": 0.4614, - "step": 78618 - }, - { - "epoch": 2.02, - "learning_rate": 5.140511875624014e-07, - "loss": 0.4287, - "step": 78619 - }, - { - "epoch": 2.02, - "learning_rate": 5.140270041239219e-07, - "loss": 0.3721, - "step": 78620 - }, - { - "epoch": 2.02, - "learning_rate": 5.140028210575292e-07, - "loss": 0.5088, - "step": 78621 - }, - { - "epoch": 2.02, - "learning_rate": 5.139786383632423e-07, - "loss": 0.3442, - "step": 78622 - }, - { - "epoch": 2.02, - "learning_rate": 5.139544560410799e-07, - "loss": 0.4316, - "step": 78623 - }, - { - "epoch": 2.02, - "learning_rate": 5.139302740910598e-07, - "loss": 0.52, - "step": 78624 - }, - { - "epoch": 2.02, - "learning_rate": 5.139060925132015e-07, - "loss": 0.2688, - "step": 78625 - }, - { - "epoch": 2.02, - "learning_rate": 5.138819113075223e-07, - "loss": 0.3862, - "step": 78626 - }, - { - "epoch": 2.02, - "learning_rate": 5.138577304740417e-07, - "loss": 0.4937, - "step": 78627 - }, - { - "epoch": 2.02, - "learning_rate": 5.138335500127776e-07, - "loss": 0.3457, - "step": 78628 - }, - { - "epoch": 2.02, - "learning_rate": 5.138093699237493e-07, - "loss": 0.3499, - "step": 78629 - }, - { - "epoch": 2.02, - "learning_rate": 5.137851902069744e-07, - "loss": 0.459, - "step": 78630 - }, - { - "epoch": 2.02, - "learning_rate": 5.137610108624719e-07, - "loss": 0.3333, - "step": 78631 - }, - { - "epoch": 2.02, - "learning_rate": 5.137368318902601e-07, - "loss": 0.5024, - "step": 78632 - }, - { - "epoch": 2.02, - "learning_rate": 5.137126532903587e-07, - "loss": 0.4531, - "step": 78633 - }, - { - "epoch": 2.02, - "learning_rate": 5.136884750627841e-07, - "loss": 0.439, - "step": 78634 - }, - { - "epoch": 2.02, - "learning_rate": 5.136642972075559e-07, - "loss": 0.4985, - "step": 78635 - }, - { - "epoch": 2.02, - "learning_rate": 5.136401197246927e-07, - "loss": 0.397, - "step": 78636 - }, - { - "epoch": 2.02, - "learning_rate": 5.136159426142132e-07, - "loss": 0.3462, - "step": 78637 - }, - { - "epoch": 2.02, - "learning_rate": 5.135917658761351e-07, - "loss": 0.3052, - "step": 78638 - }, - { - "epoch": 2.02, - "learning_rate": 5.135675895104776e-07, - "loss": 0.4736, - "step": 78639 - }, - { - "epoch": 2.02, - "learning_rate": 5.135434135172591e-07, - "loss": 0.4385, - "step": 78640 - }, - { - "epoch": 2.02, - "learning_rate": 5.135192378964983e-07, - "loss": 0.4419, - "step": 78641 - }, - { - "epoch": 2.02, - "learning_rate": 5.13495062648213e-07, - "loss": 0.4199, - "step": 78642 - }, - { - "epoch": 2.02, - "learning_rate": 5.134708877724228e-07, - "loss": 0.4482, - "step": 78643 - }, - { - "epoch": 2.02, - "learning_rate": 5.134467132691449e-07, - "loss": 0.4917, - "step": 78644 - }, - { - "epoch": 2.02, - "learning_rate": 5.134225391383986e-07, - "loss": 0.3989, - "step": 78645 - }, - { - "epoch": 2.02, - "learning_rate": 5.133983653802026e-07, - "loss": 0.3423, - "step": 78646 - }, - { - "epoch": 2.02, - "learning_rate": 5.133741919945749e-07, - "loss": 0.5015, - "step": 78647 - }, - { - "epoch": 2.02, - "learning_rate": 5.13350018981534e-07, - "loss": 0.4385, - "step": 78648 - }, - { - "epoch": 2.02, - "learning_rate": 5.133258463410988e-07, - "loss": 0.4165, - "step": 78649 - }, - { - "epoch": 2.02, - "learning_rate": 5.133016740732878e-07, - "loss": 0.4834, - "step": 78650 - }, - { - "epoch": 2.02, - "learning_rate": 5.13277502178119e-07, - "loss": 0.4053, - "step": 78651 - }, - { - "epoch": 2.02, - "learning_rate": 5.132533306556114e-07, - "loss": 0.5059, - "step": 78652 - }, - { - "epoch": 2.02, - "learning_rate": 5.132291595057836e-07, - "loss": 0.3955, - "step": 78653 - }, - { - "epoch": 2.02, - "learning_rate": 5.132049887286539e-07, - "loss": 0.4282, - "step": 78654 - }, - { - "epoch": 2.02, - "learning_rate": 5.131808183242403e-07, - "loss": 0.2925, - "step": 78655 - }, - { - "epoch": 2.02, - "learning_rate": 5.131566482925618e-07, - "loss": 0.342, - "step": 78656 - }, - { - "epoch": 2.02, - "learning_rate": 5.131324786336368e-07, - "loss": 0.3667, - "step": 78657 - }, - { - "epoch": 2.02, - "learning_rate": 5.131083093474844e-07, - "loss": 0.4287, - "step": 78658 - }, - { - "epoch": 2.02, - "learning_rate": 5.130841404341221e-07, - "loss": 0.3589, - "step": 78659 - }, - { - "epoch": 2.02, - "learning_rate": 5.130599718935689e-07, - "loss": 0.4141, - "step": 78660 - }, - { - "epoch": 2.02, - "learning_rate": 5.130358037258434e-07, - "loss": 0.3657, - "step": 78661 - }, - { - "epoch": 2.02, - "learning_rate": 5.130116359309642e-07, - "loss": 0.4629, - "step": 78662 - }, - { - "epoch": 2.02, - "learning_rate": 5.129874685089497e-07, - "loss": 0.3833, - "step": 78663 - }, - { - "epoch": 2.02, - "learning_rate": 5.129633014598178e-07, - "loss": 0.3691, - "step": 78664 - }, - { - "epoch": 2.02, - "learning_rate": 5.129391347835876e-07, - "loss": 0.3706, - "step": 78665 - }, - { - "epoch": 2.02, - "learning_rate": 5.129149684802776e-07, - "loss": 0.4521, - "step": 78666 - }, - { - "epoch": 2.02, - "learning_rate": 5.128908025499065e-07, - "loss": 0.3497, - "step": 78667 - }, - { - "epoch": 2.02, - "learning_rate": 5.128666369924921e-07, - "loss": 0.3372, - "step": 78668 - }, - { - "epoch": 2.02, - "learning_rate": 5.128424718080533e-07, - "loss": 0.5107, - "step": 78669 - }, - { - "epoch": 2.02, - "learning_rate": 5.128183069966091e-07, - "loss": 0.4536, - "step": 78670 - }, - { - "epoch": 2.02, - "learning_rate": 5.12794142558177e-07, - "loss": 0.4155, - "step": 78671 - }, - { - "epoch": 2.02, - "learning_rate": 5.127699784927762e-07, - "loss": 0.5718, - "step": 78672 - }, - { - "epoch": 2.02, - "learning_rate": 5.127458148004253e-07, - "loss": 0.4248, - "step": 78673 - }, - { - "epoch": 2.02, - "learning_rate": 5.127216514811422e-07, - "loss": 0.406, - "step": 78674 - }, - { - "epoch": 2.02, - "learning_rate": 5.126974885349461e-07, - "loss": 0.3746, - "step": 78675 - }, - { - "epoch": 2.02, - "learning_rate": 5.126733259618547e-07, - "loss": 0.4204, - "step": 78676 - }, - { - "epoch": 2.02, - "learning_rate": 5.12649163761887e-07, - "loss": 0.3596, - "step": 78677 - }, - { - "epoch": 2.02, - "learning_rate": 5.126250019350613e-07, - "loss": 0.4507, - "step": 78678 - }, - { - "epoch": 2.02, - "learning_rate": 5.126008404813966e-07, - "loss": 0.2878, - "step": 78679 - }, - { - "epoch": 2.02, - "learning_rate": 5.125766794009107e-07, - "loss": 0.5249, - "step": 78680 - }, - { - "epoch": 2.02, - "learning_rate": 5.125525186936226e-07, - "loss": 0.3894, - "step": 78681 - }, - { - "epoch": 2.02, - "learning_rate": 5.125283583595504e-07, - "loss": 0.3418, - "step": 78682 - }, - { - "epoch": 2.02, - "learning_rate": 5.125041983987133e-07, - "loss": 0.3989, - "step": 78683 - }, - { - "epoch": 2.02, - "learning_rate": 5.124800388111292e-07, - "loss": 0.3623, - "step": 78684 - }, - { - "epoch": 2.02, - "learning_rate": 5.124558795968165e-07, - "loss": 0.4015, - "step": 78685 - }, - { - "epoch": 2.02, - "learning_rate": 5.124317207557938e-07, - "loss": 0.312, - "step": 78686 - }, - { - "epoch": 2.02, - "learning_rate": 5.124075622880801e-07, - "loss": 0.3103, - "step": 78687 - }, - { - "epoch": 2.02, - "learning_rate": 5.123834041936931e-07, - "loss": 0.4565, - "step": 78688 - }, - { - "epoch": 2.02, - "learning_rate": 5.123592464726518e-07, - "loss": 0.3923, - "step": 78689 - }, - { - "epoch": 2.02, - "learning_rate": 5.123350891249747e-07, - "loss": 0.4399, - "step": 78690 - }, - { - "epoch": 2.02, - "learning_rate": 5.123109321506804e-07, - "loss": 0.502, - "step": 78691 - }, - { - "epoch": 2.02, - "learning_rate": 5.122867755497868e-07, - "loss": 0.3677, - "step": 78692 - }, - { - "epoch": 2.02, - "learning_rate": 5.122626193223133e-07, - "loss": 0.5039, - "step": 78693 - }, - { - "epoch": 2.02, - "learning_rate": 5.122384634682775e-07, - "loss": 0.4092, - "step": 78694 - }, - { - "epoch": 2.02, - "learning_rate": 5.122143079876982e-07, - "loss": 0.4092, - "step": 78695 - }, - { - "epoch": 2.02, - "learning_rate": 5.121901528805943e-07, - "loss": 0.4028, - "step": 78696 - }, - { - "epoch": 2.02, - "learning_rate": 5.121659981469837e-07, - "loss": 0.3535, - "step": 78697 - }, - { - "epoch": 2.02, - "learning_rate": 5.121418437868852e-07, - "loss": 0.3965, - "step": 78698 - }, - { - "epoch": 2.02, - "learning_rate": 5.121176898003171e-07, - "loss": 0.3828, - "step": 78699 - }, - { - "epoch": 2.02, - "learning_rate": 5.120935361872986e-07, - "loss": 0.519, - "step": 78700 - }, - { - "epoch": 2.02, - "learning_rate": 5.120693829478471e-07, - "loss": 0.4272, - "step": 78701 - }, - { - "epoch": 2.02, - "learning_rate": 5.120452300819818e-07, - "loss": 0.3315, - "step": 78702 - }, - { - "epoch": 2.02, - "learning_rate": 5.120210775897213e-07, - "loss": 0.4663, - "step": 78703 - }, - { - "epoch": 2.02, - "learning_rate": 5.119969254710838e-07, - "loss": 0.3298, - "step": 78704 - }, - { - "epoch": 2.02, - "learning_rate": 5.119727737260875e-07, - "loss": 0.2684, - "step": 78705 - }, - { - "epoch": 2.02, - "learning_rate": 5.119486223547513e-07, - "loss": 0.4644, - "step": 78706 - }, - { - "epoch": 2.02, - "learning_rate": 5.119244713570934e-07, - "loss": 0.4224, - "step": 78707 - }, - { - "epoch": 2.02, - "learning_rate": 5.11900320733133e-07, - "loss": 0.3899, - "step": 78708 - }, - { - "epoch": 2.02, - "learning_rate": 5.118761704828876e-07, - "loss": 0.3794, - "step": 78709 - }, - { - "epoch": 2.02, - "learning_rate": 5.118520206063763e-07, - "loss": 0.4673, - "step": 78710 - }, - { - "epoch": 2.02, - "learning_rate": 5.118278711036174e-07, - "loss": 0.2765, - "step": 78711 - }, - { - "epoch": 2.02, - "learning_rate": 5.118037219746298e-07, - "loss": 0.3813, - "step": 78712 - }, - { - "epoch": 2.02, - "learning_rate": 5.117795732194316e-07, - "loss": 0.3481, - "step": 78713 - }, - { - "epoch": 2.02, - "learning_rate": 5.117554248380412e-07, - "loss": 0.4282, - "step": 78714 - }, - { - "epoch": 2.02, - "learning_rate": 5.11731276830477e-07, - "loss": 0.3789, - "step": 78715 - }, - { - "epoch": 2.02, - "learning_rate": 5.117071291967578e-07, - "loss": 0.3623, - "step": 78716 - }, - { - "epoch": 2.02, - "learning_rate": 5.116829819369023e-07, - "loss": 0.3073, - "step": 78717 - }, - { - "epoch": 2.02, - "learning_rate": 5.116588350509284e-07, - "loss": 0.4214, - "step": 78718 - }, - { - "epoch": 2.02, - "learning_rate": 5.116346885388547e-07, - "loss": 0.26, - "step": 78719 - }, - { - "epoch": 2.02, - "learning_rate": 5.116105424007e-07, - "loss": 0.3879, - "step": 78720 - }, - { - "epoch": 2.02, - "learning_rate": 5.115863966364831e-07, - "loss": 0.4089, - "step": 78721 - }, - { - "epoch": 2.02, - "learning_rate": 5.115622512462215e-07, - "loss": 0.3378, - "step": 78722 - }, - { - "epoch": 2.02, - "learning_rate": 5.115381062299347e-07, - "loss": 0.5015, - "step": 78723 - }, - { - "epoch": 2.02, - "learning_rate": 5.115139615876403e-07, - "loss": 0.4062, - "step": 78724 - }, - { - "epoch": 2.02, - "learning_rate": 5.114898173193576e-07, - "loss": 0.478, - "step": 78725 - }, - { - "epoch": 2.02, - "learning_rate": 5.114656734251043e-07, - "loss": 0.3691, - "step": 78726 - }, - { - "epoch": 2.02, - "learning_rate": 5.114415299048993e-07, - "loss": 0.4316, - "step": 78727 - }, - { - "epoch": 2.02, - "learning_rate": 5.114173867587611e-07, - "loss": 0.376, - "step": 78728 - }, - { - "epoch": 2.02, - "learning_rate": 5.113932439867084e-07, - "loss": 0.4007, - "step": 78729 - }, - { - "epoch": 2.02, - "learning_rate": 5.113691015887591e-07, - "loss": 0.3838, - "step": 78730 - }, - { - "epoch": 2.02, - "learning_rate": 5.113449595649319e-07, - "loss": 0.4146, - "step": 78731 - }, - { - "epoch": 2.02, - "learning_rate": 5.113208179152455e-07, - "loss": 0.4302, - "step": 78732 - }, - { - "epoch": 2.02, - "learning_rate": 5.112966766397187e-07, - "loss": 0.4807, - "step": 78733 - }, - { - "epoch": 2.02, - "learning_rate": 5.112725357383696e-07, - "loss": 0.3211, - "step": 78734 - }, - { - "epoch": 2.02, - "learning_rate": 5.112483952112161e-07, - "loss": 0.4053, - "step": 78735 - }, - { - "epoch": 2.02, - "learning_rate": 5.112242550582772e-07, - "loss": 0.2922, - "step": 78736 - }, - { - "epoch": 2.02, - "learning_rate": 5.112001152795717e-07, - "loss": 0.4075, - "step": 78737 - }, - { - "epoch": 2.02, - "learning_rate": 5.11175975875118e-07, - "loss": 0.4077, - "step": 78738 - }, - { - "epoch": 2.02, - "learning_rate": 5.111518368449339e-07, - "loss": 0.3853, - "step": 78739 - }, - { - "epoch": 2.02, - "learning_rate": 5.111276981890384e-07, - "loss": 0.3555, - "step": 78740 - }, - { - "epoch": 2.02, - "learning_rate": 5.111035599074502e-07, - "loss": 0.3379, - "step": 78741 - }, - { - "epoch": 2.02, - "learning_rate": 5.110794220001876e-07, - "loss": 0.4625, - "step": 78742 - }, - { - "epoch": 2.02, - "learning_rate": 5.110552844672691e-07, - "loss": 0.479, - "step": 78743 - }, - { - "epoch": 2.02, - "learning_rate": 5.110311473087128e-07, - "loss": 0.4463, - "step": 78744 - }, - { - "epoch": 2.02, - "learning_rate": 5.110070105245374e-07, - "loss": 0.385, - "step": 78745 - }, - { - "epoch": 2.02, - "learning_rate": 5.109828741147617e-07, - "loss": 0.3652, - "step": 78746 - }, - { - "epoch": 2.02, - "learning_rate": 5.109587380794038e-07, - "loss": 0.4946, - "step": 78747 - }, - { - "epoch": 2.02, - "learning_rate": 5.109346024184821e-07, - "loss": 0.5786, - "step": 78748 - }, - { - "epoch": 2.02, - "learning_rate": 5.109104671320154e-07, - "loss": 0.4741, - "step": 78749 - }, - { - "epoch": 2.02, - "learning_rate": 5.108863322200223e-07, - "loss": 0.4746, - "step": 78750 - }, - { - "epoch": 2.02, - "learning_rate": 5.10862197682521e-07, - "loss": 0.2917, - "step": 78751 - }, - { - "epoch": 2.02, - "learning_rate": 5.108380635195296e-07, - "loss": 0.3755, - "step": 78752 - }, - { - "epoch": 2.02, - "learning_rate": 5.108139297310676e-07, - "loss": 0.3733, - "step": 78753 - }, - { - "epoch": 2.02, - "learning_rate": 5.107897963171526e-07, - "loss": 0.4685, - "step": 78754 - }, - { - "epoch": 2.02, - "learning_rate": 5.107656632778034e-07, - "loss": 0.406, - "step": 78755 - }, - { - "epoch": 2.02, - "learning_rate": 5.107415306130385e-07, - "loss": 0.46, - "step": 78756 - }, - { - "epoch": 2.02, - "learning_rate": 5.10717398322876e-07, - "loss": 0.4124, - "step": 78757 - }, - { - "epoch": 2.02, - "learning_rate": 5.106932664073348e-07, - "loss": 0.3623, - "step": 78758 - }, - { - "epoch": 2.02, - "learning_rate": 5.106691348664336e-07, - "loss": 0.5234, - "step": 78759 - }, - { - "epoch": 2.02, - "learning_rate": 5.106450037001902e-07, - "loss": 0.3569, - "step": 78760 - }, - { - "epoch": 2.02, - "learning_rate": 5.106208729086234e-07, - "loss": 0.3523, - "step": 78761 - }, - { - "epoch": 2.02, - "learning_rate": 5.105967424917521e-07, - "loss": 0.3298, - "step": 78762 - }, - { - "epoch": 2.02, - "learning_rate": 5.105726124495944e-07, - "loss": 0.5, - "step": 78763 - }, - { - "epoch": 2.02, - "learning_rate": 5.105484827821683e-07, - "loss": 0.4214, - "step": 78764 - }, - { - "epoch": 2.02, - "learning_rate": 5.105243534894928e-07, - "loss": 0.3815, - "step": 78765 - }, - { - "epoch": 2.02, - "learning_rate": 5.105002245715862e-07, - "loss": 0.3162, - "step": 78766 - }, - { - "epoch": 2.02, - "learning_rate": 5.104760960284674e-07, - "loss": 0.3333, - "step": 78767 - }, - { - "epoch": 2.02, - "learning_rate": 5.104519678601542e-07, - "loss": 0.3551, - "step": 78768 - }, - { - "epoch": 2.02, - "learning_rate": 5.104278400666655e-07, - "loss": 0.5093, - "step": 78769 - }, - { - "epoch": 2.02, - "learning_rate": 5.104037126480196e-07, - "loss": 0.481, - "step": 78770 - }, - { - "epoch": 2.02, - "learning_rate": 5.103795856042357e-07, - "loss": 0.4443, - "step": 78771 - }, - { - "epoch": 2.02, - "learning_rate": 5.10355458935331e-07, - "loss": 0.5005, - "step": 78772 - }, - { - "epoch": 2.02, - "learning_rate": 5.10331332641325e-07, - "loss": 0.4473, - "step": 78773 - }, - { - "epoch": 2.02, - "learning_rate": 5.103072067222355e-07, - "loss": 0.3251, - "step": 78774 - }, - { - "epoch": 2.02, - "learning_rate": 5.102830811780812e-07, - "loss": 0.3721, - "step": 78775 - }, - { - "epoch": 2.02, - "learning_rate": 5.10258956008881e-07, - "loss": 0.5043, - "step": 78776 - }, - { - "epoch": 2.02, - "learning_rate": 5.102348312146527e-07, - "loss": 0.263, - "step": 78777 - }, - { - "epoch": 2.02, - "learning_rate": 5.102107067954148e-07, - "loss": 0.4771, - "step": 78778 - }, - { - "epoch": 2.02, - "learning_rate": 5.101865827511869e-07, - "loss": 0.4316, - "step": 78779 - }, - { - "epoch": 2.02, - "learning_rate": 5.101624590819859e-07, - "loss": 0.4211, - "step": 78780 - }, - { - "epoch": 2.02, - "learning_rate": 5.101383357878311e-07, - "loss": 0.3596, - "step": 78781 - }, - { - "epoch": 2.02, - "learning_rate": 5.101142128687407e-07, - "loss": 0.3513, - "step": 78782 - }, - { - "epoch": 2.02, - "learning_rate": 5.100900903247338e-07, - "loss": 0.4006, - "step": 78783 - }, - { - "epoch": 2.02, - "learning_rate": 5.100659681558283e-07, - "loss": 0.3853, - "step": 78784 - }, - { - "epoch": 2.02, - "learning_rate": 5.100418463620426e-07, - "loss": 0.3898, - "step": 78785 - }, - { - "epoch": 2.02, - "learning_rate": 5.100177249433951e-07, - "loss": 0.4868, - "step": 78786 - }, - { - "epoch": 2.02, - "learning_rate": 5.099936038999046e-07, - "loss": 0.4736, - "step": 78787 - }, - { - "epoch": 2.02, - "learning_rate": 5.0996948323159e-07, - "loss": 0.4281, - "step": 78788 - }, - { - "epoch": 2.02, - "learning_rate": 5.099453629384686e-07, - "loss": 0.3356, - "step": 78789 - }, - { - "epoch": 2.02, - "learning_rate": 5.099212430205595e-07, - "loss": 0.4233, - "step": 78790 - }, - { - "epoch": 2.02, - "learning_rate": 5.098971234778813e-07, - "loss": 0.3494, - "step": 78791 - }, - { - "epoch": 2.02, - "learning_rate": 5.098730043104527e-07, - "loss": 0.3166, - "step": 78792 - }, - { - "epoch": 2.02, - "learning_rate": 5.098488855182919e-07, - "loss": 0.4042, - "step": 78793 - }, - { - "epoch": 2.02, - "learning_rate": 5.098247671014167e-07, - "loss": 0.3809, - "step": 78794 - }, - { - "epoch": 2.02, - "learning_rate": 5.098006490598463e-07, - "loss": 0.3633, - "step": 78795 - }, - { - "epoch": 2.02, - "learning_rate": 5.097765313935992e-07, - "loss": 0.3703, - "step": 78796 - }, - { - "epoch": 2.02, - "learning_rate": 5.097524141026935e-07, - "loss": 0.4229, - "step": 78797 - }, - { - "epoch": 2.02, - "learning_rate": 5.097282971871476e-07, - "loss": 0.4224, - "step": 78798 - }, - { - "epoch": 2.02, - "learning_rate": 5.097041806469804e-07, - "loss": 0.3037, - "step": 78799 - }, - { - "epoch": 2.02, - "learning_rate": 5.096800644822103e-07, - "loss": 0.4795, - "step": 78800 - }, - { - "epoch": 2.02, - "learning_rate": 5.096559486928555e-07, - "loss": 0.2552, - "step": 78801 - }, - { - "epoch": 2.02, - "learning_rate": 5.096318332789344e-07, - "loss": 0.3965, - "step": 78802 - }, - { - "epoch": 2.02, - "learning_rate": 5.096077182404663e-07, - "loss": 0.3772, - "step": 78803 - }, - { - "epoch": 2.02, - "learning_rate": 5.095836035774684e-07, - "loss": 0.4697, - "step": 78804 - }, - { - "epoch": 2.02, - "learning_rate": 5.095594892899603e-07, - "loss": 0.3673, - "step": 78805 - }, - { - "epoch": 2.02, - "learning_rate": 5.095353753779595e-07, - "loss": 0.4263, - "step": 78806 - }, - { - "epoch": 2.02, - "learning_rate": 5.095112618414849e-07, - "loss": 0.375, - "step": 78807 - }, - { - "epoch": 2.02, - "learning_rate": 5.09487148680555e-07, - "loss": 0.4065, - "step": 78808 - }, - { - "epoch": 2.02, - "learning_rate": 5.094630358951887e-07, - "loss": 0.3752, - "step": 78809 - }, - { - "epoch": 2.02, - "learning_rate": 5.094389234854036e-07, - "loss": 0.5034, - "step": 78810 - }, - { - "epoch": 2.02, - "learning_rate": 5.094148114512185e-07, - "loss": 0.5215, - "step": 78811 - }, - { - "epoch": 2.02, - "learning_rate": 5.093906997926518e-07, - "loss": 0.4961, - "step": 78812 - }, - { - "epoch": 2.02, - "learning_rate": 5.09366588509723e-07, - "loss": 0.4077, - "step": 78813 - }, - { - "epoch": 2.02, - "learning_rate": 5.093424776024489e-07, - "loss": 0.4185, - "step": 78814 - }, - { - "epoch": 2.02, - "learning_rate": 5.093183670708486e-07, - "loss": 0.3772, - "step": 78815 - }, - { - "epoch": 2.02, - "learning_rate": 5.092942569149408e-07, - "loss": 0.5166, - "step": 78816 - }, - { - "epoch": 2.02, - "learning_rate": 5.092701471347441e-07, - "loss": 0.3999, - "step": 78817 - }, - { - "epoch": 2.02, - "learning_rate": 5.092460377302763e-07, - "loss": 0.4414, - "step": 78818 - }, - { - "epoch": 2.02, - "learning_rate": 5.092219287015563e-07, - "loss": 0.4526, - "step": 78819 - }, - { - "epoch": 2.02, - "learning_rate": 5.091978200486025e-07, - "loss": 0.4556, - "step": 78820 - }, - { - "epoch": 2.02, - "learning_rate": 5.091737117714336e-07, - "loss": 0.519, - "step": 78821 - }, - { - "epoch": 2.02, - "learning_rate": 5.091496038700676e-07, - "loss": 0.3682, - "step": 78822 - }, - { - "epoch": 2.02, - "learning_rate": 5.091254963445235e-07, - "loss": 0.4673, - "step": 78823 - }, - { - "epoch": 2.02, - "learning_rate": 5.09101389194819e-07, - "loss": 0.4507, - "step": 78824 - }, - { - "epoch": 2.02, - "learning_rate": 5.09077282420973e-07, - "loss": 0.2232, - "step": 78825 - }, - { - "epoch": 2.02, - "learning_rate": 5.090531760230045e-07, - "loss": 0.3772, - "step": 78826 - }, - { - "epoch": 2.02, - "learning_rate": 5.090290700009309e-07, - "loss": 0.2639, - "step": 78827 - }, - { - "epoch": 2.02, - "learning_rate": 5.090049643547711e-07, - "loss": 0.417, - "step": 78828 - }, - { - "epoch": 2.02, - "learning_rate": 5.089808590845438e-07, - "loss": 0.5361, - "step": 78829 - }, - { - "epoch": 2.02, - "learning_rate": 5.089567541902675e-07, - "loss": 0.522, - "step": 78830 - }, - { - "epoch": 2.02, - "learning_rate": 5.089326496719601e-07, - "loss": 0.3091, - "step": 78831 - }, - { - "epoch": 2.02, - "learning_rate": 5.089085455296405e-07, - "loss": 0.4448, - "step": 78832 - }, - { - "epoch": 2.02, - "learning_rate": 5.088844417633274e-07, - "loss": 0.4893, - "step": 78833 - }, - { - "epoch": 2.02, - "learning_rate": 5.088603383730387e-07, - "loss": 0.5332, - "step": 78834 - }, - { - "epoch": 2.02, - "learning_rate": 5.088362353587929e-07, - "loss": 0.5054, - "step": 78835 - }, - { - "epoch": 2.02, - "learning_rate": 5.088121327206085e-07, - "loss": 0.3767, - "step": 78836 - }, - { - "epoch": 2.02, - "learning_rate": 5.08788030458504e-07, - "loss": 0.3184, - "step": 78837 - }, - { - "epoch": 2.02, - "learning_rate": 5.087639285724985e-07, - "loss": 0.3984, - "step": 78838 - }, - { - "epoch": 2.02, - "learning_rate": 5.087398270626093e-07, - "loss": 0.3645, - "step": 78839 - }, - { - "epoch": 2.02, - "learning_rate": 5.087157259288555e-07, - "loss": 0.3809, - "step": 78840 - }, - { - "epoch": 2.02, - "learning_rate": 5.086916251712556e-07, - "loss": 0.2244, - "step": 78841 - }, - { - "epoch": 2.02, - "learning_rate": 5.086675247898281e-07, - "loss": 0.2891, - "step": 78842 - }, - { - "epoch": 2.02, - "learning_rate": 5.086434247845914e-07, - "loss": 0.3711, - "step": 78843 - }, - { - "epoch": 2.02, - "learning_rate": 5.086193251555635e-07, - "loss": 0.3826, - "step": 78844 - }, - { - "epoch": 2.02, - "learning_rate": 5.085952259027631e-07, - "loss": 0.4565, - "step": 78845 - }, - { - "epoch": 2.02, - "learning_rate": 5.085711270262088e-07, - "loss": 0.3176, - "step": 78846 - }, - { - "epoch": 2.02, - "learning_rate": 5.085470285259193e-07, - "loss": 0.3423, - "step": 78847 - }, - { - "epoch": 2.02, - "learning_rate": 5.085229304019123e-07, - "loss": 0.3625, - "step": 78848 - }, - { - "epoch": 2.02, - "learning_rate": 5.084988326542068e-07, - "loss": 0.4575, - "step": 78849 - }, - { - "epoch": 2.02, - "learning_rate": 5.084747352828216e-07, - "loss": 0.3513, - "step": 78850 - }, - { - "epoch": 2.02, - "learning_rate": 5.084506382877742e-07, - "loss": 0.4244, - "step": 78851 - }, - { - "epoch": 2.02, - "learning_rate": 5.084265416690836e-07, - "loss": 0.3672, - "step": 78852 - }, - { - "epoch": 2.02, - "learning_rate": 5.084024454267686e-07, - "loss": 0.1902, - "step": 78853 - }, - { - "epoch": 2.02, - "learning_rate": 5.083783495608467e-07, - "loss": 0.4092, - "step": 78854 - }, - { - "epoch": 2.02, - "learning_rate": 5.083542540713375e-07, - "loss": 0.4624, - "step": 78855 - }, - { - "epoch": 2.02, - "learning_rate": 5.083301589582582e-07, - "loss": 0.3463, - "step": 78856 - }, - { - "epoch": 2.02, - "learning_rate": 5.083060642216281e-07, - "loss": 0.4365, - "step": 78857 - }, - { - "epoch": 2.02, - "learning_rate": 5.082819698614653e-07, - "loss": 0.5063, - "step": 78858 - }, - { - "epoch": 2.02, - "learning_rate": 5.082578758777889e-07, - "loss": 0.4492, - "step": 78859 - }, - { - "epoch": 2.02, - "learning_rate": 5.082337822706164e-07, - "loss": 0.3477, - "step": 78860 - }, - { - "epoch": 2.02, - "learning_rate": 5.082096890399667e-07, - "loss": 0.4194, - "step": 78861 - }, - { - "epoch": 2.02, - "learning_rate": 5.081855961858581e-07, - "loss": 0.3235, - "step": 78862 - }, - { - "epoch": 2.02, - "learning_rate": 5.081615037083098e-07, - "loss": 0.3772, - "step": 78863 - }, - { - "epoch": 2.02, - "learning_rate": 5.081374116073394e-07, - "loss": 0.623, - "step": 78864 - }, - { - "epoch": 2.02, - "learning_rate": 5.081133198829652e-07, - "loss": 0.335, - "step": 78865 - }, - { - "epoch": 2.02, - "learning_rate": 5.080892285352061e-07, - "loss": 0.4785, - "step": 78866 - }, - { - "epoch": 2.02, - "learning_rate": 5.080651375640809e-07, - "loss": 0.4395, - "step": 78867 - }, - { - "epoch": 2.02, - "learning_rate": 5.080410469696071e-07, - "loss": 0.3821, - "step": 78868 - }, - { - "epoch": 2.02, - "learning_rate": 5.080169567518037e-07, - "loss": 0.2823, - "step": 78869 - }, - { - "epoch": 2.02, - "learning_rate": 5.07992866910689e-07, - "loss": 0.3213, - "step": 78870 - }, - { - "epoch": 2.02, - "learning_rate": 5.07968777446282e-07, - "loss": 0.2996, - "step": 78871 - }, - { - "epoch": 2.02, - "learning_rate": 5.079446883586003e-07, - "loss": 0.3726, - "step": 78872 - }, - { - "epoch": 2.02, - "learning_rate": 5.079205996476632e-07, - "loss": 0.2815, - "step": 78873 - }, - { - "epoch": 2.02, - "learning_rate": 5.078965113134883e-07, - "loss": 0.4175, - "step": 78874 - }, - { - "epoch": 2.02, - "learning_rate": 5.078724233560943e-07, - "loss": 0.2892, - "step": 78875 - }, - { - "epoch": 2.02, - "learning_rate": 5.078483357755001e-07, - "loss": 0.3577, - "step": 78876 - }, - { - "epoch": 2.02, - "learning_rate": 5.078242485717234e-07, - "loss": 0.2507, - "step": 78877 - }, - { - "epoch": 2.02, - "learning_rate": 5.078001617447831e-07, - "loss": 0.3133, - "step": 78878 - }, - { - "epoch": 2.02, - "learning_rate": 5.077760752946975e-07, - "loss": 0.3179, - "step": 78879 - }, - { - "epoch": 2.02, - "learning_rate": 5.077519892214857e-07, - "loss": 0.4702, - "step": 78880 - }, - { - "epoch": 2.02, - "learning_rate": 5.077279035251651e-07, - "loss": 0.4155, - "step": 78881 - }, - { - "epoch": 2.02, - "learning_rate": 5.077038182057547e-07, - "loss": 0.3638, - "step": 78882 - }, - { - "epoch": 2.02, - "learning_rate": 5.076797332632731e-07, - "loss": 0.5107, - "step": 78883 - }, - { - "epoch": 2.02, - "learning_rate": 5.076556486977386e-07, - "loss": 0.363, - "step": 78884 - }, - { - "epoch": 2.02, - "learning_rate": 5.07631564509169e-07, - "loss": 0.4351, - "step": 78885 - }, - { - "epoch": 2.02, - "learning_rate": 5.076074806975833e-07, - "loss": 0.3932, - "step": 78886 - }, - { - "epoch": 2.02, - "learning_rate": 5.07583397263e-07, - "loss": 0.437, - "step": 78887 - }, - { - "epoch": 2.02, - "learning_rate": 5.075593142054377e-07, - "loss": 0.4458, - "step": 78888 - }, - { - "epoch": 2.02, - "learning_rate": 5.075352315249144e-07, - "loss": 0.3481, - "step": 78889 - }, - { - "epoch": 2.02, - "learning_rate": 5.075111492214485e-07, - "loss": 0.46, - "step": 78890 - }, - { - "epoch": 2.02, - "learning_rate": 5.074870672950588e-07, - "loss": 0.3882, - "step": 78891 - }, - { - "epoch": 2.02, - "learning_rate": 5.074629857457641e-07, - "loss": 0.3379, - "step": 78892 - }, - { - "epoch": 2.02, - "learning_rate": 5.074389045735822e-07, - "loss": 0.4453, - "step": 78893 - }, - { - "epoch": 2.02, - "learning_rate": 5.074148237785314e-07, - "loss": 0.3887, - "step": 78894 - }, - { - "epoch": 2.02, - "learning_rate": 5.073907433606303e-07, - "loss": 0.3813, - "step": 78895 - }, - { - "epoch": 2.02, - "learning_rate": 5.073666633198974e-07, - "loss": 0.4287, - "step": 78896 - }, - { - "epoch": 2.02, - "learning_rate": 5.073425836563517e-07, - "loss": 0.3322, - "step": 78897 - }, - { - "epoch": 2.02, - "learning_rate": 5.073185043700108e-07, - "loss": 0.5239, - "step": 78898 - }, - { - "epoch": 2.02, - "learning_rate": 5.072944254608934e-07, - "loss": 0.5508, - "step": 78899 - }, - { - "epoch": 2.02, - "learning_rate": 5.07270346929018e-07, - "loss": 0.4409, - "step": 78900 - }, - { - "epoch": 2.02, - "learning_rate": 5.072462687744035e-07, - "loss": 0.4365, - "step": 78901 - }, - { - "epoch": 2.02, - "learning_rate": 5.072221909970673e-07, - "loss": 0.5244, - "step": 78902 - }, - { - "epoch": 2.02, - "learning_rate": 5.071981135970289e-07, - "loss": 0.2012, - "step": 78903 - }, - { - "epoch": 2.02, - "learning_rate": 5.07174036574306e-07, - "loss": 0.3721, - "step": 78904 - }, - { - "epoch": 2.02, - "learning_rate": 5.071499599289174e-07, - "loss": 0.3168, - "step": 78905 - }, - { - "epoch": 2.02, - "learning_rate": 5.071258836608811e-07, - "loss": 0.3306, - "step": 78906 - }, - { - "epoch": 2.02, - "learning_rate": 5.07101807770216e-07, - "loss": 0.5698, - "step": 78907 - }, - { - "epoch": 2.02, - "learning_rate": 5.070777322569402e-07, - "loss": 0.3492, - "step": 78908 - }, - { - "epoch": 2.02, - "learning_rate": 5.070536571210729e-07, - "loss": 0.3898, - "step": 78909 - }, - { - "epoch": 2.02, - "learning_rate": 5.070295823626313e-07, - "loss": 0.2341, - "step": 78910 - }, - { - "epoch": 2.02, - "learning_rate": 5.070055079816348e-07, - "loss": 0.4355, - "step": 78911 - }, - { - "epoch": 2.02, - "learning_rate": 5.069814339781016e-07, - "loss": 0.376, - "step": 78912 - }, - { - "epoch": 2.02, - "learning_rate": 5.069573603520499e-07, - "loss": 0.4229, - "step": 78913 - }, - { - "epoch": 2.02, - "learning_rate": 5.069332871034985e-07, - "loss": 0.3999, - "step": 78914 - }, - { - "epoch": 2.02, - "learning_rate": 5.069092142324654e-07, - "loss": 0.4849, - "step": 78915 - }, - { - "epoch": 2.02, - "learning_rate": 5.06885141738969e-07, - "loss": 0.3456, - "step": 78916 - }, - { - "epoch": 2.02, - "learning_rate": 5.068610696230282e-07, - "loss": 0.4375, - "step": 78917 - }, - { - "epoch": 2.02, - "learning_rate": 5.068369978846613e-07, - "loss": 0.3689, - "step": 78918 - }, - { - "epoch": 2.02, - "learning_rate": 5.068129265238865e-07, - "loss": 0.4668, - "step": 78919 - }, - { - "epoch": 2.02, - "learning_rate": 5.067888555407224e-07, - "loss": 0.3696, - "step": 78920 - }, - { - "epoch": 2.02, - "learning_rate": 5.067647849351873e-07, - "loss": 0.3425, - "step": 78921 - }, - { - "epoch": 2.02, - "learning_rate": 5.067407147073004e-07, - "loss": 0.1973, - "step": 78922 - }, - { - "epoch": 2.02, - "learning_rate": 5.067166448570787e-07, - "loss": 0.4653, - "step": 78923 - }, - { - "epoch": 2.02, - "learning_rate": 5.066925753845415e-07, - "loss": 0.3696, - "step": 78924 - }, - { - "epoch": 2.02, - "learning_rate": 5.066685062897071e-07, - "loss": 0.4639, - "step": 78925 - }, - { - "epoch": 2.02, - "learning_rate": 5.066444375725944e-07, - "loss": 0.4512, - "step": 78926 - }, - { - "epoch": 2.02, - "learning_rate": 5.066203692332208e-07, - "loss": 0.2832, - "step": 78927 - }, - { - "epoch": 2.02, - "learning_rate": 5.065963012716054e-07, - "loss": 0.4443, - "step": 78928 - }, - { - "epoch": 2.02, - "learning_rate": 5.065722336877665e-07, - "loss": 0.457, - "step": 78929 - }, - { - "epoch": 2.02, - "learning_rate": 5.06548166481723e-07, - "loss": 0.4673, - "step": 78930 - }, - { - "epoch": 2.02, - "learning_rate": 5.065240996534924e-07, - "loss": 0.4404, - "step": 78931 - }, - { - "epoch": 2.02, - "learning_rate": 5.06500033203094e-07, - "loss": 0.4766, - "step": 78932 - }, - { - "epoch": 2.02, - "learning_rate": 5.064759671305455e-07, - "loss": 0.4717, - "step": 78933 - }, - { - "epoch": 2.02, - "learning_rate": 5.064519014358657e-07, - "loss": 0.5659, - "step": 78934 - }, - { - "epoch": 2.02, - "learning_rate": 5.064278361190732e-07, - "loss": 0.4055, - "step": 78935 - }, - { - "epoch": 2.02, - "learning_rate": 5.06403771180186e-07, - "loss": 0.3042, - "step": 78936 - }, - { - "epoch": 2.02, - "learning_rate": 5.063797066192226e-07, - "loss": 0.4663, - "step": 78937 - }, - { - "epoch": 2.02, - "learning_rate": 5.063556424362017e-07, - "loss": 0.6147, - "step": 78938 - }, - { - "epoch": 2.02, - "learning_rate": 5.063315786311418e-07, - "loss": 0.3376, - "step": 78939 - }, - { - "epoch": 2.02, - "learning_rate": 5.063075152040608e-07, - "loss": 0.4375, - "step": 78940 - }, - { - "epoch": 2.02, - "learning_rate": 5.062834521549775e-07, - "loss": 0.4058, - "step": 78941 - }, - { - "epoch": 2.02, - "learning_rate": 5.062593894839107e-07, - "loss": 0.3818, - "step": 78942 - }, - { - "epoch": 2.02, - "learning_rate": 5.062353271908782e-07, - "loss": 0.582, - "step": 78943 - }, - { - "epoch": 2.02, - "learning_rate": 5.062112652758983e-07, - "loss": 0.4609, - "step": 78944 - }, - { - "epoch": 2.02, - "learning_rate": 5.061872037389898e-07, - "loss": 0.2859, - "step": 78945 - }, - { - "epoch": 2.02, - "learning_rate": 5.061631425801709e-07, - "loss": 0.4873, - "step": 78946 - }, - { - "epoch": 2.02, - "learning_rate": 5.061390817994606e-07, - "loss": 0.4277, - "step": 78947 - }, - { - "epoch": 2.02, - "learning_rate": 5.061150213968765e-07, - "loss": 0.304, - "step": 78948 - }, - { - "epoch": 2.02, - "learning_rate": 5.060909613724376e-07, - "loss": 0.4697, - "step": 78949 - }, - { - "epoch": 2.02, - "learning_rate": 5.060669017261621e-07, - "loss": 0.4414, - "step": 78950 - }, - { - "epoch": 2.02, - "learning_rate": 5.060428424580687e-07, - "loss": 0.4941, - "step": 78951 - }, - { - "epoch": 2.02, - "learning_rate": 5.060187835681756e-07, - "loss": 0.3302, - "step": 78952 - }, - { - "epoch": 2.02, - "learning_rate": 5.059947250565008e-07, - "loss": 0.3652, - "step": 78953 - }, - { - "epoch": 2.02, - "learning_rate": 5.059706669230633e-07, - "loss": 0.415, - "step": 78954 - }, - { - "epoch": 2.02, - "learning_rate": 5.059466091678813e-07, - "loss": 0.458, - "step": 78955 - }, - { - "epoch": 2.02, - "learning_rate": 5.059225517909735e-07, - "loss": 0.4507, - "step": 78956 - }, - { - "epoch": 2.02, - "learning_rate": 5.058984947923578e-07, - "loss": 0.4438, - "step": 78957 - }, - { - "epoch": 2.02, - "learning_rate": 5.058744381720528e-07, - "loss": 0.3712, - "step": 78958 - }, - { - "epoch": 2.02, - "learning_rate": 5.058503819300775e-07, - "loss": 0.5024, - "step": 78959 - }, - { - "epoch": 2.02, - "learning_rate": 5.058263260664495e-07, - "loss": 0.4299, - "step": 78960 - }, - { - "epoch": 2.02, - "learning_rate": 5.058022705811875e-07, - "loss": 0.5039, - "step": 78961 - }, - { - "epoch": 2.02, - "learning_rate": 5.057782154743104e-07, - "loss": 0.3682, - "step": 78962 - }, - { - "epoch": 2.02, - "learning_rate": 5.057541607458357e-07, - "loss": 0.4558, - "step": 78963 - }, - { - "epoch": 2.02, - "learning_rate": 5.057301063957828e-07, - "loss": 0.3867, - "step": 78964 - }, - { - "epoch": 2.02, - "learning_rate": 5.057060524241693e-07, - "loss": 0.343, - "step": 78965 - }, - { - "epoch": 2.02, - "learning_rate": 5.05681998831014e-07, - "loss": 0.3582, - "step": 78966 - }, - { - "epoch": 2.02, - "learning_rate": 5.056579456163351e-07, - "loss": 0.332, - "step": 78967 - }, - { - "epoch": 2.02, - "learning_rate": 5.056338927801515e-07, - "loss": 0.3464, - "step": 78968 - }, - { - "epoch": 2.02, - "learning_rate": 5.05609840322481e-07, - "loss": 0.478, - "step": 78969 - }, - { - "epoch": 2.02, - "learning_rate": 5.055857882433423e-07, - "loss": 0.457, - "step": 78970 - }, - { - "epoch": 2.02, - "learning_rate": 5.055617365427538e-07, - "loss": 0.271, - "step": 78971 - }, - { - "epoch": 2.02, - "learning_rate": 5.055376852207344e-07, - "loss": 0.3596, - "step": 78972 - }, - { - "epoch": 2.02, - "learning_rate": 5.05513634277302e-07, - "loss": 0.4907, - "step": 78973 - }, - { - "epoch": 2.02, - "learning_rate": 5.054895837124749e-07, - "loss": 0.498, - "step": 78974 - }, - { - "epoch": 2.02, - "learning_rate": 5.054655335262714e-07, - "loss": 0.3304, - "step": 78975 - }, - { - "epoch": 2.02, - "learning_rate": 5.054414837187107e-07, - "loss": 0.3896, - "step": 78976 - }, - { - "epoch": 2.02, - "learning_rate": 5.054174342898103e-07, - "loss": 0.3298, - "step": 78977 - }, - { - "epoch": 2.02, - "learning_rate": 5.053933852395891e-07, - "loss": 0.4609, - "step": 78978 - }, - { - "epoch": 2.02, - "learning_rate": 5.053693365680655e-07, - "loss": 0.4536, - "step": 78979 - }, - { - "epoch": 2.02, - "learning_rate": 5.05345288275258e-07, - "loss": 0.4386, - "step": 78980 - }, - { - "epoch": 2.02, - "learning_rate": 5.053212403611847e-07, - "loss": 0.4707, - "step": 78981 - }, - { - "epoch": 2.02, - "learning_rate": 5.052971928258645e-07, - "loss": 0.3291, - "step": 78982 - }, - { - "epoch": 2.02, - "learning_rate": 5.052731456693151e-07, - "loss": 0.4375, - "step": 78983 - }, - { - "epoch": 2.02, - "learning_rate": 5.052490988915553e-07, - "loss": 0.4438, - "step": 78984 - }, - { - "epoch": 2.02, - "learning_rate": 5.05225052492604e-07, - "loss": 0.3818, - "step": 78985 - }, - { - "epoch": 2.02, - "learning_rate": 5.052010064724786e-07, - "loss": 0.3734, - "step": 78986 - }, - { - "epoch": 2.02, - "learning_rate": 5.05176960831198e-07, - "loss": 0.4712, - "step": 78987 - }, - { - "epoch": 2.02, - "learning_rate": 5.051529155687809e-07, - "loss": 0.4756, - "step": 78988 - }, - { - "epoch": 2.02, - "learning_rate": 5.051288706852456e-07, - "loss": 0.4849, - "step": 78989 - }, - { - "epoch": 2.02, - "learning_rate": 5.051048261806101e-07, - "loss": 0.4468, - "step": 78990 - }, - { - "epoch": 2.02, - "learning_rate": 5.05080782054893e-07, - "loss": 0.3303, - "step": 78991 - }, - { - "epoch": 2.02, - "learning_rate": 5.050567383081132e-07, - "loss": 0.3616, - "step": 78992 - }, - { - "epoch": 2.02, - "learning_rate": 5.050326949402888e-07, - "loss": 0.3477, - "step": 78993 - }, - { - "epoch": 2.02, - "learning_rate": 5.050086519514376e-07, - "loss": 0.374, - "step": 78994 - }, - { - "epoch": 2.02, - "learning_rate": 5.049846093415785e-07, - "loss": 0.2576, - "step": 78995 - }, - { - "epoch": 2.02, - "learning_rate": 5.0496056711073e-07, - "loss": 0.3284, - "step": 78996 - }, - { - "epoch": 2.02, - "learning_rate": 5.049365252589107e-07, - "loss": 0.3496, - "step": 78997 - }, - { - "epoch": 2.02, - "learning_rate": 5.049124837861385e-07, - "loss": 0.4077, - "step": 78998 - }, - { - "epoch": 2.02, - "learning_rate": 5.04888442692432e-07, - "loss": 0.5166, - "step": 78999 - }, - { - "epoch": 2.02, - "learning_rate": 5.048644019778097e-07, - "loss": 0.3438, - "step": 79000 - }, - { - "epoch": 2.02, - "learning_rate": 5.048403616422903e-07, - "loss": 0.3669, - "step": 79001 - }, - { - "epoch": 2.02, - "learning_rate": 5.048163216858917e-07, - "loss": 0.3625, - "step": 79002 - }, - { - "epoch": 2.02, - "learning_rate": 5.047922821086324e-07, - "loss": 0.2671, - "step": 79003 - }, - { - "epoch": 2.02, - "learning_rate": 5.047682429105307e-07, - "loss": 0.4878, - "step": 79004 - }, - { - "epoch": 2.02, - "learning_rate": 5.047442040916051e-07, - "loss": 0.4346, - "step": 79005 - }, - { - "epoch": 2.02, - "learning_rate": 5.047201656518745e-07, - "loss": 0.4517, - "step": 79006 - }, - { - "epoch": 2.02, - "learning_rate": 5.046961275913566e-07, - "loss": 0.4282, - "step": 79007 - }, - { - "epoch": 2.03, - "learning_rate": 5.046720899100702e-07, - "loss": 0.4263, - "step": 79008 - }, - { - "epoch": 2.03, - "learning_rate": 5.046480526080334e-07, - "loss": 0.4771, - "step": 79009 - }, - { - "epoch": 2.03, - "learning_rate": 5.046240156852654e-07, - "loss": 0.4856, - "step": 79010 - }, - { - "epoch": 2.03, - "learning_rate": 5.045999791417834e-07, - "loss": 0.4297, - "step": 79011 - }, - { - "epoch": 2.03, - "learning_rate": 5.045759429776071e-07, - "loss": 0.418, - "step": 79012 - }, - { - "epoch": 2.03, - "learning_rate": 5.045519071927535e-07, - "loss": 0.3604, - "step": 79013 - }, - { - "epoch": 2.03, - "learning_rate": 5.045278717872424e-07, - "loss": 0.2759, - "step": 79014 - }, - { - "epoch": 2.03, - "learning_rate": 5.04503836761091e-07, - "loss": 0.4966, - "step": 79015 - }, - { - "epoch": 2.03, - "learning_rate": 5.044798021143182e-07, - "loss": 0.4038, - "step": 79016 - }, - { - "epoch": 2.03, - "learning_rate": 5.044557678469425e-07, - "loss": 0.4248, - "step": 79017 - }, - { - "epoch": 2.03, - "learning_rate": 5.044317339589825e-07, - "loss": 0.4478, - "step": 79018 - }, - { - "epoch": 2.03, - "learning_rate": 5.044077004504561e-07, - "loss": 0.3789, - "step": 79019 - }, - { - "epoch": 2.03, - "learning_rate": 5.043836673213818e-07, - "loss": 0.3716, - "step": 79020 - }, - { - "epoch": 2.03, - "learning_rate": 5.043596345717783e-07, - "loss": 0.2028, - "step": 79021 - }, - { - "epoch": 2.03, - "learning_rate": 5.04335602201664e-07, - "loss": 0.3611, - "step": 79022 - }, - { - "epoch": 2.03, - "learning_rate": 5.043115702110573e-07, - "loss": 0.4893, - "step": 79023 - }, - { - "epoch": 2.03, - "learning_rate": 5.042875385999761e-07, - "loss": 0.5254, - "step": 79024 - }, - { - "epoch": 2.03, - "learning_rate": 5.04263507368439e-07, - "loss": 0.2472, - "step": 79025 - }, - { - "epoch": 2.03, - "learning_rate": 5.042394765164646e-07, - "loss": 0.4561, - "step": 79026 - }, - { - "epoch": 2.03, - "learning_rate": 5.042154460440716e-07, - "loss": 0.3608, - "step": 79027 - }, - { - "epoch": 2.03, - "learning_rate": 5.041914159512777e-07, - "loss": 0.436, - "step": 79028 - }, - { - "epoch": 2.03, - "learning_rate": 5.041673862381015e-07, - "loss": 0.4047, - "step": 79029 - }, - { - "epoch": 2.03, - "learning_rate": 5.041433569045621e-07, - "loss": 0.4951, - "step": 79030 - }, - { - "epoch": 2.03, - "learning_rate": 5.041193279506769e-07, - "loss": 0.3745, - "step": 79031 - }, - { - "epoch": 2.03, - "learning_rate": 5.040952993764651e-07, - "loss": 0.3303, - "step": 79032 - }, - { - "epoch": 2.03, - "learning_rate": 5.040712711819444e-07, - "loss": 0.4448, - "step": 79033 - }, - { - "epoch": 2.03, - "learning_rate": 5.040472433671333e-07, - "loss": 0.3965, - "step": 79034 - }, - { - "epoch": 2.03, - "learning_rate": 5.04023215932051e-07, - "loss": 0.3069, - "step": 79035 - }, - { - "epoch": 2.03, - "learning_rate": 5.039991888767149e-07, - "loss": 0.457, - "step": 79036 - }, - { - "epoch": 2.03, - "learning_rate": 5.039751622011438e-07, - "loss": 0.498, - "step": 79037 - }, - { - "epoch": 2.03, - "learning_rate": 5.039511359053561e-07, - "loss": 0.4135, - "step": 79038 - }, - { - "epoch": 2.03, - "learning_rate": 5.039271099893706e-07, - "loss": 0.2627, - "step": 79039 - }, - { - "epoch": 2.03, - "learning_rate": 5.03903084453205e-07, - "loss": 0.4775, - "step": 79040 - }, - { - "epoch": 2.03, - "learning_rate": 5.038790592968778e-07, - "loss": 0.3792, - "step": 79041 - }, - { - "epoch": 2.03, - "learning_rate": 5.038550345204083e-07, - "loss": 0.3804, - "step": 79042 - }, - { - "epoch": 2.03, - "learning_rate": 5.038310101238134e-07, - "loss": 0.3402, - "step": 79043 - }, - { - "epoch": 2.03, - "learning_rate": 5.038069861071129e-07, - "loss": 0.3284, - "step": 79044 - }, - { - "epoch": 2.03, - "learning_rate": 5.037829624703241e-07, - "loss": 0.4028, - "step": 79045 - }, - { - "epoch": 2.03, - "learning_rate": 5.03758939213466e-07, - "loss": 0.3549, - "step": 79046 - }, - { - "epoch": 2.03, - "learning_rate": 5.037349163365572e-07, - "loss": 0.5415, - "step": 79047 - }, - { - "epoch": 2.03, - "learning_rate": 5.037108938396153e-07, - "loss": 0.4185, - "step": 79048 - }, - { - "epoch": 2.03, - "learning_rate": 5.036868717226592e-07, - "loss": 0.321, - "step": 79049 - }, - { - "epoch": 2.03, - "learning_rate": 5.036628499857072e-07, - "loss": 0.2151, - "step": 79050 - }, - { - "epoch": 2.03, - "learning_rate": 5.036388286287781e-07, - "loss": 0.2374, - "step": 79051 - }, - { - "epoch": 2.03, - "learning_rate": 5.0361480765189e-07, - "loss": 0.4141, - "step": 79052 - }, - { - "epoch": 2.03, - "learning_rate": 5.035907870550608e-07, - "loss": 0.3271, - "step": 79053 - }, - { - "epoch": 2.03, - "learning_rate": 5.035667668383094e-07, - "loss": 0.5183, - "step": 79054 - }, - { - "epoch": 2.03, - "learning_rate": 5.03542747001654e-07, - "loss": 0.4272, - "step": 79055 - }, - { - "epoch": 2.03, - "learning_rate": 5.035187275451134e-07, - "loss": 0.2955, - "step": 79056 - }, - { - "epoch": 2.03, - "learning_rate": 5.034947084687055e-07, - "loss": 0.4487, - "step": 79057 - }, - { - "epoch": 2.03, - "learning_rate": 5.034706897724487e-07, - "loss": 0.3737, - "step": 79058 - }, - { - "epoch": 2.03, - "learning_rate": 5.034466714563617e-07, - "loss": 0.3623, - "step": 79059 - }, - { - "epoch": 2.03, - "learning_rate": 5.034226535204631e-07, - "loss": 0.5151, - "step": 79060 - }, - { - "epoch": 2.03, - "learning_rate": 5.033986359647704e-07, - "loss": 0.4712, - "step": 79061 - }, - { - "epoch": 2.03, - "learning_rate": 5.033746187893031e-07, - "loss": 0.4595, - "step": 79062 - }, - { - "epoch": 2.03, - "learning_rate": 5.033506019940785e-07, - "loss": 0.374, - "step": 79063 - }, - { - "epoch": 2.03, - "learning_rate": 5.03326585579116e-07, - "loss": 0.5049, - "step": 79064 - }, - { - "epoch": 2.03, - "learning_rate": 5.033025695444331e-07, - "loss": 0.402, - "step": 79065 - }, - { - "epoch": 2.03, - "learning_rate": 5.032785538900486e-07, - "loss": 0.3306, - "step": 79066 - }, - { - "epoch": 2.03, - "learning_rate": 5.032545386159807e-07, - "loss": 0.3538, - "step": 79067 - }, - { - "epoch": 2.03, - "learning_rate": 5.032305237222485e-07, - "loss": 0.4128, - "step": 79068 - }, - { - "epoch": 2.03, - "learning_rate": 5.032065092088694e-07, - "loss": 0.3789, - "step": 79069 - }, - { - "epoch": 2.03, - "learning_rate": 5.031824950758623e-07, - "loss": 0.3569, - "step": 79070 - }, - { - "epoch": 2.03, - "learning_rate": 5.031584813232454e-07, - "loss": 0.4541, - "step": 79071 - }, - { - "epoch": 2.03, - "learning_rate": 5.031344679510378e-07, - "loss": 0.5137, - "step": 79072 - }, - { - "epoch": 2.03, - "learning_rate": 5.031104549592571e-07, - "loss": 0.3862, - "step": 79073 - }, - { - "epoch": 2.03, - "learning_rate": 5.030864423479215e-07, - "loss": 0.4658, - "step": 79074 - }, - { - "epoch": 2.03, - "learning_rate": 5.030624301170499e-07, - "loss": 0.2529, - "step": 79075 - }, - { - "epoch": 2.03, - "learning_rate": 5.030384182666605e-07, - "loss": 0.4187, - "step": 79076 - }, - { - "epoch": 2.03, - "learning_rate": 5.03014406796772e-07, - "loss": 0.3853, - "step": 79077 - }, - { - "epoch": 2.03, - "learning_rate": 5.029903957074022e-07, - "loss": 0.3457, - "step": 79078 - }, - { - "epoch": 2.03, - "learning_rate": 5.029663849985699e-07, - "loss": 0.3654, - "step": 79079 - }, - { - "epoch": 2.03, - "learning_rate": 5.029423746702932e-07, - "loss": 0.4136, - "step": 79080 - }, - { - "epoch": 2.03, - "learning_rate": 5.029183647225912e-07, - "loss": 0.4873, - "step": 79081 - }, - { - "epoch": 2.03, - "learning_rate": 5.028943551554816e-07, - "loss": 0.4551, - "step": 79082 - }, - { - "epoch": 2.03, - "learning_rate": 5.028703459689827e-07, - "loss": 0.3755, - "step": 79083 - }, - { - "epoch": 2.03, - "learning_rate": 5.028463371631131e-07, - "loss": 0.5171, - "step": 79084 - }, - { - "epoch": 2.03, - "learning_rate": 5.028223287378916e-07, - "loss": 0.5884, - "step": 79085 - }, - { - "epoch": 2.03, - "learning_rate": 5.027983206933358e-07, - "loss": 0.4453, - "step": 79086 - }, - { - "epoch": 2.03, - "learning_rate": 5.027743130294643e-07, - "loss": 0.4946, - "step": 79087 - }, - { - "epoch": 2.03, - "learning_rate": 5.027503057462959e-07, - "loss": 0.5732, - "step": 79088 - }, - { - "epoch": 2.03, - "learning_rate": 5.027262988438489e-07, - "loss": 0.4272, - "step": 79089 - }, - { - "epoch": 2.03, - "learning_rate": 5.027022923221412e-07, - "loss": 0.3983, - "step": 79090 - }, - { - "epoch": 2.03, - "learning_rate": 5.026782861811914e-07, - "loss": 0.3595, - "step": 79091 - }, - { - "epoch": 2.03, - "learning_rate": 5.026542804210185e-07, - "loss": 0.4224, - "step": 79092 - }, - { - "epoch": 2.03, - "learning_rate": 5.026302750416399e-07, - "loss": 0.5059, - "step": 79093 - }, - { - "epoch": 2.03, - "learning_rate": 5.026062700430748e-07, - "loss": 0.4849, - "step": 79094 - }, - { - "epoch": 2.03, - "learning_rate": 5.025822654253409e-07, - "loss": 0.3867, - "step": 79095 - }, - { - "epoch": 2.03, - "learning_rate": 5.025582611884567e-07, - "loss": 0.4064, - "step": 79096 - }, - { - "epoch": 2.03, - "learning_rate": 5.02534257332441e-07, - "loss": 0.355, - "step": 79097 - }, - { - "epoch": 2.03, - "learning_rate": 5.025102538573123e-07, - "loss": 0.4854, - "step": 79098 - }, - { - "epoch": 2.03, - "learning_rate": 5.02486250763088e-07, - "loss": 0.4692, - "step": 79099 - }, - { - "epoch": 2.03, - "learning_rate": 5.024622480497873e-07, - "loss": 0.438, - "step": 79100 - }, - { - "epoch": 2.03, - "learning_rate": 5.024382457174283e-07, - "loss": 0.4653, - "step": 79101 - }, - { - "epoch": 2.03, - "learning_rate": 5.024142437660304e-07, - "loss": 0.4001, - "step": 79102 - }, - { - "epoch": 2.03, - "learning_rate": 5.023902421956101e-07, - "loss": 0.4214, - "step": 79103 - }, - { - "epoch": 2.03, - "learning_rate": 5.023662410061866e-07, - "loss": 0.4143, - "step": 79104 - }, - { - "epoch": 2.03, - "learning_rate": 5.023422401977785e-07, - "loss": 0.3359, - "step": 79105 - }, - { - "epoch": 2.03, - "learning_rate": 5.023182397704047e-07, - "loss": 0.5044, - "step": 79106 - }, - { - "epoch": 2.03, - "learning_rate": 5.022942397240822e-07, - "loss": 0.3821, - "step": 79107 - }, - { - "epoch": 2.03, - "learning_rate": 5.022702400588303e-07, - "loss": 0.3687, - "step": 79108 - }, - { - "epoch": 2.03, - "learning_rate": 5.022462407746672e-07, - "loss": 0.4868, - "step": 79109 - }, - { - "epoch": 2.03, - "learning_rate": 5.022222418716116e-07, - "loss": 0.4521, - "step": 79110 - }, - { - "epoch": 2.03, - "learning_rate": 5.02198243349681e-07, - "loss": 0.6328, - "step": 79111 - }, - { - "epoch": 2.03, - "learning_rate": 5.021742452088949e-07, - "loss": 0.3298, - "step": 79112 - }, - { - "epoch": 2.03, - "learning_rate": 5.021502474492707e-07, - "loss": 0.4658, - "step": 79113 - }, - { - "epoch": 2.03, - "learning_rate": 5.021262500708271e-07, - "loss": 0.3872, - "step": 79114 - }, - { - "epoch": 2.03, - "learning_rate": 5.02102253073583e-07, - "loss": 0.455, - "step": 79115 - }, - { - "epoch": 2.03, - "learning_rate": 5.020782564575559e-07, - "loss": 0.4697, - "step": 79116 - }, - { - "epoch": 2.03, - "learning_rate": 5.020542602227644e-07, - "loss": 0.3115, - "step": 79117 - }, - { - "epoch": 2.03, - "learning_rate": 5.020302643692274e-07, - "loss": 0.4878, - "step": 79118 - }, - { - "epoch": 2.03, - "learning_rate": 5.020062688969631e-07, - "loss": 0.4458, - "step": 79119 - }, - { - "epoch": 2.03, - "learning_rate": 5.019822738059892e-07, - "loss": 0.4146, - "step": 79120 - }, - { - "epoch": 2.03, - "learning_rate": 5.019582790963248e-07, - "loss": 0.4521, - "step": 79121 - }, - { - "epoch": 2.03, - "learning_rate": 5.019342847679882e-07, - "loss": 0.4663, - "step": 79122 - }, - { - "epoch": 2.03, - "learning_rate": 5.019102908209978e-07, - "loss": 0.2958, - "step": 79123 - }, - { - "epoch": 2.03, - "learning_rate": 5.018862972553715e-07, - "loss": 0.4561, - "step": 79124 - }, - { - "epoch": 2.03, - "learning_rate": 5.018623040711278e-07, - "loss": 0.4473, - "step": 79125 - }, - { - "epoch": 2.03, - "learning_rate": 5.018383112682852e-07, - "loss": 0.4326, - "step": 79126 - }, - { - "epoch": 2.03, - "learning_rate": 5.018143188468625e-07, - "loss": 0.6157, - "step": 79127 - }, - { - "epoch": 2.03, - "learning_rate": 5.017903268068773e-07, - "loss": 0.2894, - "step": 79128 - }, - { - "epoch": 2.03, - "learning_rate": 5.017663351483484e-07, - "loss": 0.4036, - "step": 79129 - }, - { - "epoch": 2.03, - "learning_rate": 5.01742343871294e-07, - "loss": 0.3962, - "step": 79130 - }, - { - "epoch": 2.03, - "learning_rate": 5.01718352975733e-07, - "loss": 0.3538, - "step": 79131 - }, - { - "epoch": 2.03, - "learning_rate": 5.016943624616834e-07, - "loss": 0.4863, - "step": 79132 - }, - { - "epoch": 2.03, - "learning_rate": 5.016703723291631e-07, - "loss": 0.4468, - "step": 79133 - }, - { - "epoch": 2.03, - "learning_rate": 5.016463825781909e-07, - "loss": 0.4478, - "step": 79134 - }, - { - "epoch": 2.03, - "learning_rate": 5.016223932087851e-07, - "loss": 0.4287, - "step": 79135 - }, - { - "epoch": 2.03, - "learning_rate": 5.015984042209646e-07, - "loss": 0.3638, - "step": 79136 - }, - { - "epoch": 2.03, - "learning_rate": 5.015744156147468e-07, - "loss": 0.3286, - "step": 79137 - }, - { - "epoch": 2.03, - "learning_rate": 5.015504273901505e-07, - "loss": 0.5166, - "step": 79138 - }, - { - "epoch": 2.03, - "learning_rate": 5.015264395471948e-07, - "loss": 0.3276, - "step": 79139 - }, - { - "epoch": 2.03, - "learning_rate": 5.015024520858967e-07, - "loss": 0.3345, - "step": 79140 - }, - { - "epoch": 2.03, - "learning_rate": 5.014784650062754e-07, - "loss": 0.522, - "step": 79141 - }, - { - "epoch": 2.03, - "learning_rate": 5.014544783083495e-07, - "loss": 0.4268, - "step": 79142 - }, - { - "epoch": 2.03, - "learning_rate": 5.014304919921364e-07, - "loss": 0.5234, - "step": 79143 - }, - { - "epoch": 2.03, - "learning_rate": 5.014065060576556e-07, - "loss": 0.4434, - "step": 79144 - }, - { - "epoch": 2.03, - "learning_rate": 5.013825205049245e-07, - "loss": 0.5146, - "step": 79145 - }, - { - "epoch": 2.03, - "learning_rate": 5.013585353339618e-07, - "loss": 0.4668, - "step": 79146 - }, - { - "epoch": 2.03, - "learning_rate": 5.013345505447861e-07, - "loss": 0.4653, - "step": 79147 - }, - { - "epoch": 2.03, - "learning_rate": 5.013105661374158e-07, - "loss": 0.3975, - "step": 79148 - }, - { - "epoch": 2.03, - "learning_rate": 5.012865821118688e-07, - "loss": 0.4414, - "step": 79149 - }, - { - "epoch": 2.03, - "learning_rate": 5.012625984681637e-07, - "loss": 0.3687, - "step": 79150 - }, - { - "epoch": 2.03, - "learning_rate": 5.012386152063191e-07, - "loss": 0.4148, - "step": 79151 - }, - { - "epoch": 2.03, - "learning_rate": 5.012146323263533e-07, - "loss": 0.4526, - "step": 79152 - }, - { - "epoch": 2.03, - "learning_rate": 5.011906498282845e-07, - "loss": 0.3459, - "step": 79153 - }, - { - "epoch": 2.03, - "learning_rate": 5.011666677121309e-07, - "loss": 0.4026, - "step": 79154 - }, - { - "epoch": 2.03, - "learning_rate": 5.011426859779109e-07, - "loss": 0.4116, - "step": 79155 - }, - { - "epoch": 2.03, - "learning_rate": 5.011187046256434e-07, - "loss": 0.302, - "step": 79156 - }, - { - "epoch": 2.03, - "learning_rate": 5.01094723655346e-07, - "loss": 0.3964, - "step": 79157 - }, - { - "epoch": 2.03, - "learning_rate": 5.010707430670374e-07, - "loss": 0.5586, - "step": 79158 - }, - { - "epoch": 2.03, - "learning_rate": 5.01046762860736e-07, - "loss": 0.4214, - "step": 79159 - }, - { - "epoch": 2.03, - "learning_rate": 5.010227830364606e-07, - "loss": 0.3301, - "step": 79160 - }, - { - "epoch": 2.03, - "learning_rate": 5.009988035942287e-07, - "loss": 0.4521, - "step": 79161 - }, - { - "epoch": 2.03, - "learning_rate": 5.009748245340595e-07, - "loss": 0.4506, - "step": 79162 - }, - { - "epoch": 2.03, - "learning_rate": 5.009508458559704e-07, - "loss": 0.418, - "step": 79163 - }, - { - "epoch": 2.03, - "learning_rate": 5.009268675599804e-07, - "loss": 0.3616, - "step": 79164 - }, - { - "epoch": 2.03, - "learning_rate": 5.009028896461081e-07, - "loss": 0.4138, - "step": 79165 - }, - { - "epoch": 2.03, - "learning_rate": 5.00878912114371e-07, - "loss": 0.4424, - "step": 79166 - }, - { - "epoch": 2.03, - "learning_rate": 5.008549349647883e-07, - "loss": 0.498, - "step": 79167 - }, - { - "epoch": 2.03, - "learning_rate": 5.008309581973777e-07, - "loss": 0.4473, - "step": 79168 - }, - { - "epoch": 2.03, - "learning_rate": 5.008069818121585e-07, - "loss": 0.4922, - "step": 79169 - }, - { - "epoch": 2.03, - "learning_rate": 5.007830058091479e-07, - "loss": 0.4976, - "step": 79170 - }, - { - "epoch": 2.03, - "learning_rate": 5.007590301883648e-07, - "loss": 0.5117, - "step": 79171 - }, - { - "epoch": 2.03, - "learning_rate": 5.00735054949828e-07, - "loss": 0.415, - "step": 79172 - }, - { - "epoch": 2.03, - "learning_rate": 5.007110800935554e-07, - "loss": 0.5625, - "step": 79173 - }, - { - "epoch": 2.03, - "learning_rate": 5.006871056195651e-07, - "loss": 0.4272, - "step": 79174 - }, - { - "epoch": 2.03, - "learning_rate": 5.006631315278755e-07, - "loss": 0.2542, - "step": 79175 - }, - { - "epoch": 2.03, - "learning_rate": 5.006391578185054e-07, - "loss": 0.4712, - "step": 79176 - }, - { - "epoch": 2.03, - "learning_rate": 5.006151844914732e-07, - "loss": 0.3774, - "step": 79177 - }, - { - "epoch": 2.03, - "learning_rate": 5.005912115467965e-07, - "loss": 0.4165, - "step": 79178 - }, - { - "epoch": 2.03, - "learning_rate": 5.005672389844944e-07, - "loss": 0.3528, - "step": 79179 - }, - { - "epoch": 2.03, - "learning_rate": 5.005432668045848e-07, - "loss": 0.3735, - "step": 79180 - }, - { - "epoch": 2.03, - "learning_rate": 5.005192950070867e-07, - "loss": 0.5107, - "step": 79181 - }, - { - "epoch": 2.03, - "learning_rate": 5.00495323592018e-07, - "loss": 0.2869, - "step": 79182 - }, - { - "epoch": 2.03, - "learning_rate": 5.004713525593966e-07, - "loss": 0.4355, - "step": 79183 - }, - { - "epoch": 2.03, - "learning_rate": 5.004473819092415e-07, - "loss": 0.3921, - "step": 79184 - }, - { - "epoch": 2.03, - "learning_rate": 5.004234116415708e-07, - "loss": 0.3604, - "step": 79185 - }, - { - "epoch": 2.03, - "learning_rate": 5.003994417564033e-07, - "loss": 0.4033, - "step": 79186 - }, - { - "epoch": 2.03, - "learning_rate": 5.003754722537565e-07, - "loss": 0.3154, - "step": 79187 - }, - { - "epoch": 2.03, - "learning_rate": 5.003515031336494e-07, - "loss": 0.3562, - "step": 79188 - }, - { - "epoch": 2.03, - "learning_rate": 5.003275343961e-07, - "loss": 0.3195, - "step": 79189 - }, - { - "epoch": 2.03, - "learning_rate": 5.003035660411274e-07, - "loss": 0.2976, - "step": 79190 - }, - { - "epoch": 2.03, - "learning_rate": 5.002795980687489e-07, - "loss": 0.395, - "step": 79191 - }, - { - "epoch": 2.03, - "learning_rate": 5.002556304789836e-07, - "loss": 0.5532, - "step": 79192 - }, - { - "epoch": 2.03, - "learning_rate": 5.002316632718493e-07, - "loss": 0.4424, - "step": 79193 - }, - { - "epoch": 2.03, - "learning_rate": 5.002076964473652e-07, - "loss": 0.3875, - "step": 79194 - }, - { - "epoch": 2.03, - "learning_rate": 5.001837300055484e-07, - "loss": 0.314, - "step": 79195 - }, - { - "epoch": 2.03, - "learning_rate": 5.001597639464181e-07, - "loss": 0.5049, - "step": 79196 - }, - { - "epoch": 2.03, - "learning_rate": 5.001357982699925e-07, - "loss": 0.4302, - "step": 79197 - }, - { - "epoch": 2.03, - "learning_rate": 5.001118329762902e-07, - "loss": 0.4258, - "step": 79198 - }, - { - "epoch": 2.03, - "learning_rate": 5.00087868065329e-07, - "loss": 0.4404, - "step": 79199 - }, - { - "epoch": 2.03, - "learning_rate": 5.000639035371274e-07, - "loss": 0.4424, - "step": 79200 - }, - { - "epoch": 2.03, - "learning_rate": 5.00039939391704e-07, - "loss": 0.3699, - "step": 79201 - }, - { - "epoch": 2.03, - "learning_rate": 5.000159756290775e-07, - "loss": 0.4722, - "step": 79202 - }, - { - "epoch": 2.03, - "learning_rate": 4.999920122492657e-07, - "loss": 0.478, - "step": 79203 - }, - { - "epoch": 2.03, - "learning_rate": 4.999680492522867e-07, - "loss": 0.2145, - "step": 79204 - }, - { - "epoch": 2.03, - "learning_rate": 4.99944086638159e-07, - "loss": 0.5137, - "step": 79205 - }, - { - "epoch": 2.03, - "learning_rate": 4.999201244069012e-07, - "loss": 0.4175, - "step": 79206 - }, - { - "epoch": 2.03, - "learning_rate": 4.99896162558532e-07, - "loss": 0.2743, - "step": 79207 - }, - { - "epoch": 2.03, - "learning_rate": 4.998722010930688e-07, - "loss": 0.3722, - "step": 79208 - }, - { - "epoch": 2.03, - "learning_rate": 4.998482400105306e-07, - "loss": 0.3262, - "step": 79209 - }, - { - "epoch": 2.03, - "learning_rate": 4.99824279310936e-07, - "loss": 0.4075, - "step": 79210 - }, - { - "epoch": 2.03, - "learning_rate": 4.998003189943028e-07, - "loss": 0.3931, - "step": 79211 - }, - { - "epoch": 2.03, - "learning_rate": 4.997763590606493e-07, - "loss": 0.4312, - "step": 79212 - }, - { - "epoch": 2.03, - "learning_rate": 4.99752399509994e-07, - "loss": 0.2446, - "step": 79213 - }, - { - "epoch": 2.03, - "learning_rate": 4.997284403423551e-07, - "loss": 0.4111, - "step": 79214 - }, - { - "epoch": 2.03, - "learning_rate": 4.997044815577517e-07, - "loss": 0.4424, - "step": 79215 - }, - { - "epoch": 2.03, - "learning_rate": 4.996805231562012e-07, - "loss": 0.4238, - "step": 79216 - }, - { - "epoch": 2.03, - "learning_rate": 4.996565651377221e-07, - "loss": 0.3296, - "step": 79217 - }, - { - "epoch": 2.03, - "learning_rate": 4.996326075023332e-07, - "loss": 0.4199, - "step": 79218 - }, - { - "epoch": 2.03, - "learning_rate": 4.996086502500529e-07, - "loss": 0.3354, - "step": 79219 - }, - { - "epoch": 2.03, - "learning_rate": 4.995846933808989e-07, - "loss": 0.3339, - "step": 79220 - }, - { - "epoch": 2.03, - "learning_rate": 4.995607368948902e-07, - "loss": 0.279, - "step": 79221 - }, - { - "epoch": 2.03, - "learning_rate": 4.995367807920446e-07, - "loss": 0.4673, - "step": 79222 - }, - { - "epoch": 2.03, - "learning_rate": 4.995128250723804e-07, - "loss": 0.4097, - "step": 79223 - }, - { - "epoch": 2.03, - "learning_rate": 4.994888697359168e-07, - "loss": 0.4795, - "step": 79224 - }, - { - "epoch": 2.03, - "learning_rate": 4.994649147826712e-07, - "loss": 0.4893, - "step": 79225 - }, - { - "epoch": 2.03, - "learning_rate": 4.994409602126622e-07, - "loss": 0.4434, - "step": 79226 - }, - { - "epoch": 2.03, - "learning_rate": 4.994170060259086e-07, - "loss": 0.3901, - "step": 79227 - }, - { - "epoch": 2.03, - "learning_rate": 4.993930522224281e-07, - "loss": 0.5073, - "step": 79228 - }, - { - "epoch": 2.03, - "learning_rate": 4.993690988022394e-07, - "loss": 0.3535, - "step": 79229 - }, - { - "epoch": 2.03, - "learning_rate": 4.993451457653605e-07, - "loss": 0.2915, - "step": 79230 - }, - { - "epoch": 2.03, - "learning_rate": 4.993211931118106e-07, - "loss": 0.4878, - "step": 79231 - }, - { - "epoch": 2.03, - "learning_rate": 4.992972408416074e-07, - "loss": 0.4561, - "step": 79232 - }, - { - "epoch": 2.03, - "learning_rate": 4.992732889547689e-07, - "loss": 0.5068, - "step": 79233 - }, - { - "epoch": 2.03, - "learning_rate": 4.992493374513137e-07, - "loss": 0.4883, - "step": 79234 - }, - { - "epoch": 2.03, - "learning_rate": 4.992253863312604e-07, - "loss": 0.4814, - "step": 79235 - }, - { - "epoch": 2.03, - "learning_rate": 4.992014355946274e-07, - "loss": 0.4819, - "step": 79236 - }, - { - "epoch": 2.03, - "learning_rate": 4.991774852414326e-07, - "loss": 0.4122, - "step": 79237 - }, - { - "epoch": 2.03, - "learning_rate": 4.991535352716945e-07, - "loss": 0.3584, - "step": 79238 - }, - { - "epoch": 2.03, - "learning_rate": 4.991295856854316e-07, - "loss": 0.4766, - "step": 79239 - }, - { - "epoch": 2.03, - "learning_rate": 4.991056364826626e-07, - "loss": 0.564, - "step": 79240 - }, - { - "epoch": 2.03, - "learning_rate": 4.990816876634052e-07, - "loss": 0.4985, - "step": 79241 - }, - { - "epoch": 2.03, - "learning_rate": 4.990577392276776e-07, - "loss": 0.3413, - "step": 79242 - }, - { - "epoch": 2.03, - "learning_rate": 4.990337911754985e-07, - "loss": 0.4194, - "step": 79243 - }, - { - "epoch": 2.03, - "learning_rate": 4.990098435068861e-07, - "loss": 0.3704, - "step": 79244 - }, - { - "epoch": 2.03, - "learning_rate": 4.989858962218593e-07, - "loss": 0.5371, - "step": 79245 - }, - { - "epoch": 2.03, - "learning_rate": 4.989619493204355e-07, - "loss": 0.395, - "step": 79246 - }, - { - "epoch": 2.03, - "learning_rate": 4.989380028026335e-07, - "loss": 0.3823, - "step": 79247 - }, - { - "epoch": 2.03, - "learning_rate": 4.989140566684721e-07, - "loss": 0.2991, - "step": 79248 - }, - { - "epoch": 2.03, - "learning_rate": 4.988901109179687e-07, - "loss": 0.4409, - "step": 79249 - }, - { - "epoch": 2.03, - "learning_rate": 4.988661655511422e-07, - "loss": 0.3828, - "step": 79250 - }, - { - "epoch": 2.03, - "learning_rate": 4.98842220568011e-07, - "loss": 0.4902, - "step": 79251 - }, - { - "epoch": 2.03, - "learning_rate": 4.988182759685932e-07, - "loss": 0.3936, - "step": 79252 - }, - { - "epoch": 2.03, - "learning_rate": 4.987943317529073e-07, - "loss": 0.3853, - "step": 79253 - }, - { - "epoch": 2.03, - "learning_rate": 4.987703879209712e-07, - "loss": 0.2297, - "step": 79254 - }, - { - "epoch": 2.03, - "learning_rate": 4.987464444728037e-07, - "loss": 0.4536, - "step": 79255 - }, - { - "epoch": 2.03, - "learning_rate": 4.98722501408423e-07, - "loss": 0.4269, - "step": 79256 - }, - { - "epoch": 2.03, - "learning_rate": 4.986985587278477e-07, - "loss": 0.4233, - "step": 79257 - }, - { - "epoch": 2.03, - "learning_rate": 4.986746164310955e-07, - "loss": 0.458, - "step": 79258 - }, - { - "epoch": 2.03, - "learning_rate": 4.986506745181852e-07, - "loss": 0.54, - "step": 79259 - }, - { - "epoch": 2.03, - "learning_rate": 4.98626732989135e-07, - "loss": 0.4937, - "step": 79260 - }, - { - "epoch": 2.03, - "learning_rate": 4.986027918439634e-07, - "loss": 0.4976, - "step": 79261 - }, - { - "epoch": 2.03, - "learning_rate": 4.98578851082689e-07, - "loss": 0.4404, - "step": 79262 - }, - { - "epoch": 2.03, - "learning_rate": 4.98554910705329e-07, - "loss": 0.3605, - "step": 79263 - }, - { - "epoch": 2.03, - "learning_rate": 4.985309707119026e-07, - "loss": 0.2917, - "step": 79264 - }, - { - "epoch": 2.03, - "learning_rate": 4.985070311024283e-07, - "loss": 0.3784, - "step": 79265 - }, - { - "epoch": 2.03, - "learning_rate": 4.984830918769237e-07, - "loss": 0.418, - "step": 79266 - }, - { - "epoch": 2.03, - "learning_rate": 4.984591530354076e-07, - "loss": 0.4404, - "step": 79267 - }, - { - "epoch": 2.03, - "learning_rate": 4.984352145778983e-07, - "loss": 0.481, - "step": 79268 - }, - { - "epoch": 2.03, - "learning_rate": 4.984112765044144e-07, - "loss": 0.3794, - "step": 79269 - }, - { - "epoch": 2.03, - "learning_rate": 4.983873388149735e-07, - "loss": 0.3821, - "step": 79270 - }, - { - "epoch": 2.03, - "learning_rate": 4.983634015095948e-07, - "loss": 0.4136, - "step": 79271 - }, - { - "epoch": 2.03, - "learning_rate": 4.983394645882958e-07, - "loss": 0.421, - "step": 79272 - }, - { - "epoch": 2.03, - "learning_rate": 4.983155280510952e-07, - "loss": 0.3586, - "step": 79273 - }, - { - "epoch": 2.03, - "learning_rate": 4.982915918980118e-07, - "loss": 0.4033, - "step": 79274 - }, - { - "epoch": 2.03, - "learning_rate": 4.982676561290629e-07, - "loss": 0.4526, - "step": 79275 - }, - { - "epoch": 2.03, - "learning_rate": 4.982437207442675e-07, - "loss": 0.4708, - "step": 79276 - }, - { - "epoch": 2.03, - "learning_rate": 4.982197857436437e-07, - "loss": 0.4414, - "step": 79277 - }, - { - "epoch": 2.03, - "learning_rate": 4.981958511272104e-07, - "loss": 0.3428, - "step": 79278 - }, - { - "epoch": 2.03, - "learning_rate": 4.981719168949851e-07, - "loss": 0.4966, - "step": 79279 - }, - { - "epoch": 2.03, - "learning_rate": 4.981479830469864e-07, - "loss": 0.3438, - "step": 79280 - }, - { - "epoch": 2.03, - "learning_rate": 4.981240495832333e-07, - "loss": 0.3818, - "step": 79281 - }, - { - "epoch": 2.03, - "learning_rate": 4.981001165037433e-07, - "loss": 0.4709, - "step": 79282 - }, - { - "epoch": 2.03, - "learning_rate": 4.980761838085348e-07, - "loss": 0.4409, - "step": 79283 - }, - { - "epoch": 2.03, - "learning_rate": 4.980522514976261e-07, - "loss": 0.3965, - "step": 79284 - }, - { - "epoch": 2.03, - "learning_rate": 4.980283195710358e-07, - "loss": 0.4263, - "step": 79285 - }, - { - "epoch": 2.03, - "learning_rate": 4.980043880287826e-07, - "loss": 0.4399, - "step": 79286 - }, - { - "epoch": 2.03, - "learning_rate": 4.979804568708838e-07, - "loss": 0.4199, - "step": 79287 - }, - { - "epoch": 2.03, - "learning_rate": 4.979565260973583e-07, - "loss": 0.3557, - "step": 79288 - }, - { - "epoch": 2.03, - "learning_rate": 4.979325957082245e-07, - "loss": 0.458, - "step": 79289 - }, - { - "epoch": 2.03, - "learning_rate": 4.97908665703501e-07, - "loss": 0.2637, - "step": 79290 - }, - { - "epoch": 2.03, - "learning_rate": 4.978847360832057e-07, - "loss": 0.4756, - "step": 79291 - }, - { - "epoch": 2.03, - "learning_rate": 4.978608068473566e-07, - "loss": 0.4614, - "step": 79292 - }, - { - "epoch": 2.03, - "learning_rate": 4.978368779959724e-07, - "loss": 0.206, - "step": 79293 - }, - { - "epoch": 2.03, - "learning_rate": 4.978129495290714e-07, - "loss": 0.3862, - "step": 79294 - }, - { - "epoch": 2.03, - "learning_rate": 4.977890214466722e-07, - "loss": 0.3696, - "step": 79295 - }, - { - "epoch": 2.03, - "learning_rate": 4.977650937487927e-07, - "loss": 0.4138, - "step": 79296 - }, - { - "epoch": 2.03, - "learning_rate": 4.977411664354512e-07, - "loss": 0.3521, - "step": 79297 - }, - { - "epoch": 2.03, - "learning_rate": 4.977172395066663e-07, - "loss": 0.4165, - "step": 79298 - }, - { - "epoch": 2.03, - "learning_rate": 4.976933129624565e-07, - "loss": 0.3799, - "step": 79299 - }, - { - "epoch": 2.03, - "learning_rate": 4.976693868028396e-07, - "loss": 0.3347, - "step": 79300 - }, - { - "epoch": 2.03, - "learning_rate": 4.976454610278344e-07, - "loss": 0.375, - "step": 79301 - }, - { - "epoch": 2.03, - "learning_rate": 4.976215356374587e-07, - "loss": 0.4746, - "step": 79302 - }, - { - "epoch": 2.03, - "learning_rate": 4.975976106317314e-07, - "loss": 0.3401, - "step": 79303 - }, - { - "epoch": 2.03, - "learning_rate": 4.9757368601067e-07, - "loss": 0.4038, - "step": 79304 - }, - { - "epoch": 2.03, - "learning_rate": 4.975497617742936e-07, - "loss": 0.3777, - "step": 79305 - }, - { - "epoch": 2.03, - "learning_rate": 4.975258379226201e-07, - "loss": 0.3906, - "step": 79306 - }, - { - "epoch": 2.03, - "learning_rate": 4.975019144556682e-07, - "loss": 0.4644, - "step": 79307 - }, - { - "epoch": 2.03, - "learning_rate": 4.974779913734558e-07, - "loss": 0.3887, - "step": 79308 - }, - { - "epoch": 2.03, - "learning_rate": 4.974540686760014e-07, - "loss": 0.3073, - "step": 79309 - }, - { - "epoch": 2.03, - "learning_rate": 4.974301463633232e-07, - "loss": 0.4326, - "step": 79310 - }, - { - "epoch": 2.03, - "learning_rate": 4.974062244354401e-07, - "loss": 0.3242, - "step": 79311 - }, - { - "epoch": 2.03, - "learning_rate": 4.973823028923699e-07, - "loss": 0.3555, - "step": 79312 - }, - { - "epoch": 2.03, - "learning_rate": 4.973583817341306e-07, - "loss": 0.4316, - "step": 79313 - }, - { - "epoch": 2.03, - "learning_rate": 4.973344609607408e-07, - "loss": 0.3943, - "step": 79314 - }, - { - "epoch": 2.03, - "learning_rate": 4.97310540572219e-07, - "loss": 0.4893, - "step": 79315 - }, - { - "epoch": 2.03, - "learning_rate": 4.972866205685837e-07, - "loss": 0.314, - "step": 79316 - }, - { - "epoch": 2.03, - "learning_rate": 4.972627009498526e-07, - "loss": 0.4795, - "step": 79317 - }, - { - "epoch": 2.03, - "learning_rate": 4.972387817160443e-07, - "loss": 0.5, - "step": 79318 - }, - { - "epoch": 2.03, - "learning_rate": 4.972148628671775e-07, - "loss": 0.3784, - "step": 79319 - }, - { - "epoch": 2.03, - "learning_rate": 4.971909444032698e-07, - "loss": 0.46, - "step": 79320 - }, - { - "epoch": 2.03, - "learning_rate": 4.971670263243403e-07, - "loss": 0.2705, - "step": 79321 - }, - { - "epoch": 2.03, - "learning_rate": 4.971431086304066e-07, - "loss": 0.364, - "step": 79322 - }, - { - "epoch": 2.03, - "learning_rate": 4.97119191321487e-07, - "loss": 0.4028, - "step": 79323 - }, - { - "epoch": 2.03, - "learning_rate": 4.970952743976008e-07, - "loss": 0.4565, - "step": 79324 - }, - { - "epoch": 2.03, - "learning_rate": 4.97071357858765e-07, - "loss": 0.5225, - "step": 79325 - }, - { - "epoch": 2.03, - "learning_rate": 4.970474417049987e-07, - "loss": 0.4192, - "step": 79326 - }, - { - "epoch": 2.03, - "learning_rate": 4.9702352593632e-07, - "loss": 0.3655, - "step": 79327 - }, - { - "epoch": 2.03, - "learning_rate": 4.969996105527477e-07, - "loss": 0.3843, - "step": 79328 - }, - { - "epoch": 2.03, - "learning_rate": 4.969756955542992e-07, - "loss": 0.3252, - "step": 79329 - }, - { - "epoch": 2.03, - "learning_rate": 4.969517809409932e-07, - "loss": 0.562, - "step": 79330 - }, - { - "epoch": 2.03, - "learning_rate": 4.969278667128486e-07, - "loss": 0.4365, - "step": 79331 - }, - { - "epoch": 2.03, - "learning_rate": 4.969039528698828e-07, - "loss": 0.4502, - "step": 79332 - }, - { - "epoch": 2.03, - "learning_rate": 4.968800394121148e-07, - "loss": 0.3181, - "step": 79333 - }, - { - "epoch": 2.03, - "learning_rate": 4.968561263395624e-07, - "loss": 0.4407, - "step": 79334 - }, - { - "epoch": 2.03, - "learning_rate": 4.968322136522441e-07, - "loss": 0.3535, - "step": 79335 - }, - { - "epoch": 2.03, - "learning_rate": 4.968083013501786e-07, - "loss": 0.4277, - "step": 79336 - }, - { - "epoch": 2.03, - "learning_rate": 4.967843894333834e-07, - "loss": 0.5371, - "step": 79337 - }, - { - "epoch": 2.03, - "learning_rate": 4.967604779018772e-07, - "loss": 0.4771, - "step": 79338 - }, - { - "epoch": 2.03, - "learning_rate": 4.967365667556786e-07, - "loss": 0.4395, - "step": 79339 - }, - { - "epoch": 2.03, - "learning_rate": 4.967126559948058e-07, - "loss": 0.3794, - "step": 79340 - }, - { - "epoch": 2.03, - "learning_rate": 4.966887456192771e-07, - "loss": 0.3464, - "step": 79341 - }, - { - "epoch": 2.03, - "learning_rate": 4.966648356291103e-07, - "loss": 0.3755, - "step": 79342 - }, - { - "epoch": 2.03, - "learning_rate": 4.966409260243241e-07, - "loss": 0.2068, - "step": 79343 - }, - { - "epoch": 2.03, - "learning_rate": 4.966170168049367e-07, - "loss": 0.2556, - "step": 79344 - }, - { - "epoch": 2.03, - "learning_rate": 4.96593107970967e-07, - "loss": 0.4041, - "step": 79345 - }, - { - "epoch": 2.03, - "learning_rate": 4.965691995224325e-07, - "loss": 0.4229, - "step": 79346 - }, - { - "epoch": 2.03, - "learning_rate": 4.965452914593517e-07, - "loss": 0.3582, - "step": 79347 - }, - { - "epoch": 2.03, - "learning_rate": 4.965213837817429e-07, - "loss": 0.4121, - "step": 79348 - }, - { - "epoch": 2.03, - "learning_rate": 4.964974764896252e-07, - "loss": 0.3511, - "step": 79349 - }, - { - "epoch": 2.03, - "learning_rate": 4.964735695830156e-07, - "loss": 0.4507, - "step": 79350 - }, - { - "epoch": 2.03, - "learning_rate": 4.964496630619334e-07, - "loss": 0.4033, - "step": 79351 - }, - { - "epoch": 2.03, - "learning_rate": 4.964257569263963e-07, - "loss": 0.2864, - "step": 79352 - }, - { - "epoch": 2.03, - "learning_rate": 4.964018511764232e-07, - "loss": 0.3652, - "step": 79353 - }, - { - "epoch": 2.03, - "learning_rate": 4.963779458120316e-07, - "loss": 0.4031, - "step": 79354 - }, - { - "epoch": 2.03, - "learning_rate": 4.963540408332404e-07, - "loss": 0.4932, - "step": 79355 - }, - { - "epoch": 2.03, - "learning_rate": 4.963301362400676e-07, - "loss": 0.481, - "step": 79356 - }, - { - "epoch": 2.03, - "learning_rate": 4.963062320325321e-07, - "loss": 0.4087, - "step": 79357 - }, - { - "epoch": 2.03, - "learning_rate": 4.962823282106513e-07, - "loss": 0.23, - "step": 79358 - }, - { - "epoch": 2.03, - "learning_rate": 4.962584247744441e-07, - "loss": 0.5635, - "step": 79359 - }, - { - "epoch": 2.03, - "learning_rate": 4.962345217239285e-07, - "loss": 0.3905, - "step": 79360 - }, - { - "epoch": 2.03, - "learning_rate": 4.962106190591235e-07, - "loss": 0.2839, - "step": 79361 - }, - { - "epoch": 2.03, - "learning_rate": 4.961867167800467e-07, - "loss": 0.3682, - "step": 79362 - }, - { - "epoch": 2.03, - "learning_rate": 4.961628148867164e-07, - "loss": 0.3267, - "step": 79363 - }, - { - "epoch": 2.03, - "learning_rate": 4.961389133791509e-07, - "loss": 0.3682, - "step": 79364 - }, - { - "epoch": 2.03, - "learning_rate": 4.961150122573688e-07, - "loss": 0.5068, - "step": 79365 - }, - { - "epoch": 2.03, - "learning_rate": 4.960911115213885e-07, - "loss": 0.4487, - "step": 79366 - }, - { - "epoch": 2.03, - "learning_rate": 4.960672111712278e-07, - "loss": 0.3857, - "step": 79367 - }, - { - "epoch": 2.03, - "learning_rate": 4.960433112069051e-07, - "loss": 0.5044, - "step": 79368 - }, - { - "epoch": 2.03, - "learning_rate": 4.960194116284389e-07, - "loss": 0.5786, - "step": 79369 - }, - { - "epoch": 2.03, - "learning_rate": 4.95995512435848e-07, - "loss": 0.3027, - "step": 79370 - }, - { - "epoch": 2.03, - "learning_rate": 4.959716136291501e-07, - "loss": 0.4692, - "step": 79371 - }, - { - "epoch": 2.03, - "learning_rate": 4.959477152083631e-07, - "loss": 0.3972, - "step": 79372 - }, - { - "epoch": 2.03, - "learning_rate": 4.959238171735058e-07, - "loss": 0.3085, - "step": 79373 - }, - { - "epoch": 2.03, - "learning_rate": 4.958999195245968e-07, - "loss": 0.4878, - "step": 79374 - }, - { - "epoch": 2.03, - "learning_rate": 4.958760222616538e-07, - "loss": 0.4121, - "step": 79375 - }, - { - "epoch": 2.03, - "learning_rate": 4.958521253846952e-07, - "loss": 0.4048, - "step": 79376 - }, - { - "epoch": 2.03, - "learning_rate": 4.958282288937395e-07, - "loss": 0.3848, - "step": 79377 - }, - { - "epoch": 2.03, - "learning_rate": 4.958043327888054e-07, - "loss": 0.5508, - "step": 79378 - }, - { - "epoch": 2.03, - "learning_rate": 4.957804370699102e-07, - "loss": 0.439, - "step": 79379 - }, - { - "epoch": 2.03, - "learning_rate": 4.957565417370729e-07, - "loss": 0.4565, - "step": 79380 - }, - { - "epoch": 2.03, - "learning_rate": 4.957326467903119e-07, - "loss": 0.4316, - "step": 79381 - }, - { - "epoch": 2.03, - "learning_rate": 4.957087522296449e-07, - "loss": 0.4517, - "step": 79382 - }, - { - "epoch": 2.03, - "learning_rate": 4.95684858055091e-07, - "loss": 0.4456, - "step": 79383 - }, - { - "epoch": 2.03, - "learning_rate": 4.956609642666675e-07, - "loss": 0.5371, - "step": 79384 - }, - { - "epoch": 2.03, - "learning_rate": 4.956370708643932e-07, - "loss": 0.3523, - "step": 79385 - }, - { - "epoch": 2.03, - "learning_rate": 4.956131778482864e-07, - "loss": 0.3502, - "step": 79386 - }, - { - "epoch": 2.03, - "learning_rate": 4.955892852183659e-07, - "loss": 0.3015, - "step": 79387 - }, - { - "epoch": 2.03, - "learning_rate": 4.955653929746489e-07, - "loss": 0.4971, - "step": 79388 - }, - { - "epoch": 2.03, - "learning_rate": 4.955415011171544e-07, - "loss": 0.3207, - "step": 79389 - }, - { - "epoch": 2.03, - "learning_rate": 4.95517609645901e-07, - "loss": 0.3926, - "step": 79390 - }, - { - "epoch": 2.03, - "learning_rate": 4.954937185609065e-07, - "loss": 0.4604, - "step": 79391 - }, - { - "epoch": 2.03, - "learning_rate": 4.954698278621889e-07, - "loss": 0.5571, - "step": 79392 - }, - { - "epoch": 2.03, - "learning_rate": 4.95445937549767e-07, - "loss": 0.2381, - "step": 79393 - }, - { - "epoch": 2.03, - "learning_rate": 4.954220476236587e-07, - "loss": 0.345, - "step": 79394 - }, - { - "epoch": 2.03, - "learning_rate": 4.953981580838831e-07, - "loss": 0.4595, - "step": 79395 - }, - { - "epoch": 2.03, - "learning_rate": 4.953742689304574e-07, - "loss": 0.4141, - "step": 79396 - }, - { - "epoch": 2.03, - "learning_rate": 4.953503801634005e-07, - "loss": 0.3691, - "step": 79397 - }, - { - "epoch": 2.04, - "learning_rate": 4.953264917827307e-07, - "loss": 0.2675, - "step": 79398 - }, - { - "epoch": 2.04, - "learning_rate": 4.953026037884664e-07, - "loss": 0.457, - "step": 79399 - }, - { - "epoch": 2.04, - "learning_rate": 4.952787161806255e-07, - "loss": 0.4429, - "step": 79400 - }, - { - "epoch": 2.04, - "learning_rate": 4.952548289592267e-07, - "loss": 0.5244, - "step": 79401 - }, - { - "epoch": 2.04, - "learning_rate": 4.952309421242877e-07, - "loss": 0.4829, - "step": 79402 - }, - { - "epoch": 2.04, - "learning_rate": 4.952070556758272e-07, - "loss": 0.3447, - "step": 79403 - }, - { - "epoch": 2.04, - "learning_rate": 4.951831696138638e-07, - "loss": 0.3168, - "step": 79404 - }, - { - "epoch": 2.04, - "learning_rate": 4.951592839384151e-07, - "loss": 0.5513, - "step": 79405 - }, - { - "epoch": 2.04, - "learning_rate": 4.951353986494997e-07, - "loss": 0.4702, - "step": 79406 - }, - { - "epoch": 2.04, - "learning_rate": 4.95111513747136e-07, - "loss": 0.4053, - "step": 79407 - }, - { - "epoch": 2.04, - "learning_rate": 4.950876292313425e-07, - "loss": 0.4502, - "step": 79408 - }, - { - "epoch": 2.04, - "learning_rate": 4.950637451021367e-07, - "loss": 0.3899, - "step": 79409 - }, - { - "epoch": 2.04, - "learning_rate": 4.950398613595375e-07, - "loss": 0.376, - "step": 79410 - }, - { - "epoch": 2.04, - "learning_rate": 4.950159780035634e-07, - "loss": 0.3843, - "step": 79411 - }, - { - "epoch": 2.04, - "learning_rate": 4.949920950342325e-07, - "loss": 0.3293, - "step": 79412 - }, - { - "epoch": 2.04, - "learning_rate": 4.949682124515624e-07, - "loss": 0.4551, - "step": 79413 - }, - { - "epoch": 2.04, - "learning_rate": 4.94944330255572e-07, - "loss": 0.3389, - "step": 79414 - }, - { - "epoch": 2.04, - "learning_rate": 4.949204484462793e-07, - "loss": 0.3174, - "step": 79415 - }, - { - "epoch": 2.04, - "learning_rate": 4.948965670237033e-07, - "loss": 0.4966, - "step": 79416 - }, - { - "epoch": 2.04, - "learning_rate": 4.948726859878613e-07, - "loss": 0.5581, - "step": 79417 - }, - { - "epoch": 2.04, - "learning_rate": 4.948488053387722e-07, - "loss": 0.3721, - "step": 79418 - }, - { - "epoch": 2.04, - "learning_rate": 4.948249250764542e-07, - "loss": 0.3232, - "step": 79419 - }, - { - "epoch": 2.04, - "learning_rate": 4.948010452009258e-07, - "loss": 0.6028, - "step": 79420 - }, - { - "epoch": 2.04, - "learning_rate": 4.94777165712205e-07, - "loss": 0.4521, - "step": 79421 - }, - { - "epoch": 2.04, - "learning_rate": 4.947532866103096e-07, - "loss": 0.3718, - "step": 79422 - }, - { - "epoch": 2.04, - "learning_rate": 4.947294078952586e-07, - "loss": 0.245, - "step": 79423 - }, - { - "epoch": 2.04, - "learning_rate": 4.9470552956707e-07, - "loss": 0.4736, - "step": 79424 - }, - { - "epoch": 2.04, - "learning_rate": 4.946816516257625e-07, - "loss": 0.3513, - "step": 79425 - }, - { - "epoch": 2.04, - "learning_rate": 4.946577740713536e-07, - "loss": 0.3912, - "step": 79426 - }, - { - "epoch": 2.04, - "learning_rate": 4.94633896903862e-07, - "loss": 0.4897, - "step": 79427 - }, - { - "epoch": 2.04, - "learning_rate": 4.946100201233064e-07, - "loss": 0.4155, - "step": 79428 - }, - { - "epoch": 2.04, - "learning_rate": 4.945861437297043e-07, - "loss": 0.4287, - "step": 79429 - }, - { - "epoch": 2.04, - "learning_rate": 4.945622677230742e-07, - "loss": 0.311, - "step": 79430 - }, - { - "epoch": 2.04, - "learning_rate": 4.945383921034351e-07, - "loss": 0.3926, - "step": 79431 - }, - { - "epoch": 2.04, - "learning_rate": 4.945145168708043e-07, - "loss": 0.5488, - "step": 79432 - }, - { - "epoch": 2.04, - "learning_rate": 4.94490642025201e-07, - "loss": 0.4536, - "step": 79433 - }, - { - "epoch": 2.04, - "learning_rate": 4.944667675666424e-07, - "loss": 0.5254, - "step": 79434 - }, - { - "epoch": 2.04, - "learning_rate": 4.944428934951473e-07, - "loss": 0.4082, - "step": 79435 - }, - { - "epoch": 2.04, - "learning_rate": 4.944190198107342e-07, - "loss": 0.3524, - "step": 79436 - }, - { - "epoch": 2.04, - "learning_rate": 4.943951465134216e-07, - "loss": 0.52, - "step": 79437 - }, - { - "epoch": 2.04, - "learning_rate": 4.943712736032269e-07, - "loss": 0.4243, - "step": 79438 - }, - { - "epoch": 2.04, - "learning_rate": 4.943474010801688e-07, - "loss": 0.3708, - "step": 79439 - }, - { - "epoch": 2.04, - "learning_rate": 4.943235289442657e-07, - "loss": 0.4565, - "step": 79440 - }, - { - "epoch": 2.04, - "learning_rate": 4.942996571955364e-07, - "loss": 0.4722, - "step": 79441 - }, - { - "epoch": 2.04, - "learning_rate": 4.942757858339983e-07, - "loss": 0.3533, - "step": 79442 - }, - { - "epoch": 2.04, - "learning_rate": 4.942519148596698e-07, - "loss": 0.5801, - "step": 79443 - }, - { - "epoch": 2.04, - "learning_rate": 4.942280442725692e-07, - "loss": 0.4531, - "step": 79444 - }, - { - "epoch": 2.04, - "learning_rate": 4.942041740727154e-07, - "loss": 0.3157, - "step": 79445 - }, - { - "epoch": 2.04, - "learning_rate": 4.941803042601259e-07, - "loss": 0.4658, - "step": 79446 - }, - { - "epoch": 2.04, - "learning_rate": 4.941564348348192e-07, - "loss": 0.4365, - "step": 79447 - }, - { - "epoch": 2.04, - "learning_rate": 4.941325657968138e-07, - "loss": 0.4448, - "step": 79448 - }, - { - "epoch": 2.04, - "learning_rate": 4.941086971461279e-07, - "loss": 0.4451, - "step": 79449 - }, - { - "epoch": 2.04, - "learning_rate": 4.940848288827796e-07, - "loss": 0.2884, - "step": 79450 - }, - { - "epoch": 2.04, - "learning_rate": 4.940609610067875e-07, - "loss": 0.3097, - "step": 79451 - }, - { - "epoch": 2.04, - "learning_rate": 4.940370935181694e-07, - "loss": 0.3396, - "step": 79452 - }, - { - "epoch": 2.04, - "learning_rate": 4.940132264169438e-07, - "loss": 0.5122, - "step": 79453 - }, - { - "epoch": 2.04, - "learning_rate": 4.939893597031294e-07, - "loss": 0.4663, - "step": 79454 - }, - { - "epoch": 2.04, - "learning_rate": 4.939654933767437e-07, - "loss": 0.5486, - "step": 79455 - }, - { - "epoch": 2.04, - "learning_rate": 4.939416274378052e-07, - "loss": 0.4761, - "step": 79456 - }, - { - "epoch": 2.04, - "learning_rate": 4.939177618863325e-07, - "loss": 0.5088, - "step": 79457 - }, - { - "epoch": 2.04, - "learning_rate": 4.93893896722344e-07, - "loss": 0.4673, - "step": 79458 - }, - { - "epoch": 2.04, - "learning_rate": 4.938700319458574e-07, - "loss": 0.3958, - "step": 79459 - }, - { - "epoch": 2.04, - "learning_rate": 4.938461675568911e-07, - "loss": 0.2576, - "step": 79460 - }, - { - "epoch": 2.04, - "learning_rate": 4.938223035554639e-07, - "loss": 0.4873, - "step": 79461 - }, - { - "epoch": 2.04, - "learning_rate": 4.937984399415939e-07, - "loss": 0.3787, - "step": 79462 - }, - { - "epoch": 2.04, - "learning_rate": 4.937745767152985e-07, - "loss": 0.4634, - "step": 79463 - }, - { - "epoch": 2.04, - "learning_rate": 4.937507138765968e-07, - "loss": 0.564, - "step": 79464 - }, - { - "epoch": 2.04, - "learning_rate": 4.937268514255068e-07, - "loss": 0.4922, - "step": 79465 - }, - { - "epoch": 2.04, - "learning_rate": 4.937029893620475e-07, - "loss": 0.4199, - "step": 79466 - }, - { - "epoch": 2.04, - "learning_rate": 4.936791276862358e-07, - "loss": 0.4265, - "step": 79467 - }, - { - "epoch": 2.04, - "learning_rate": 4.93655266398091e-07, - "loss": 0.3398, - "step": 79468 - }, - { - "epoch": 2.04, - "learning_rate": 4.936314054976309e-07, - "loss": 0.406, - "step": 79469 - }, - { - "epoch": 2.04, - "learning_rate": 4.936075449848744e-07, - "loss": 0.3894, - "step": 79470 - }, - { - "epoch": 2.04, - "learning_rate": 4.935836848598394e-07, - "loss": 0.4597, - "step": 79471 - }, - { - "epoch": 2.04, - "learning_rate": 4.935598251225435e-07, - "loss": 0.4097, - "step": 79472 - }, - { - "epoch": 2.04, - "learning_rate": 4.935359657730057e-07, - "loss": 0.4014, - "step": 79473 - }, - { - "epoch": 2.04, - "learning_rate": 4.935121068112441e-07, - "loss": 0.4297, - "step": 79474 - }, - { - "epoch": 2.04, - "learning_rate": 4.934882482372774e-07, - "loss": 0.5454, - "step": 79475 - }, - { - "epoch": 2.04, - "learning_rate": 4.93464390051123e-07, - "loss": 0.3933, - "step": 79476 - }, - { - "epoch": 2.04, - "learning_rate": 4.934405322527997e-07, - "loss": 0.3945, - "step": 79477 - }, - { - "epoch": 2.04, - "learning_rate": 4.934166748423256e-07, - "loss": 0.4419, - "step": 79478 - }, - { - "epoch": 2.04, - "learning_rate": 4.933928178197195e-07, - "loss": 0.2797, - "step": 79479 - }, - { - "epoch": 2.04, - "learning_rate": 4.93368961184999e-07, - "loss": 0.3782, - "step": 79480 - }, - { - "epoch": 2.04, - "learning_rate": 4.933451049381827e-07, - "loss": 0.3718, - "step": 79481 - }, - { - "epoch": 2.04, - "learning_rate": 4.933212490792885e-07, - "loss": 0.4922, - "step": 79482 - }, - { - "epoch": 2.04, - "learning_rate": 4.932973936083353e-07, - "loss": 0.3381, - "step": 79483 - }, - { - "epoch": 2.04, - "learning_rate": 4.932735385253406e-07, - "loss": 0.4438, - "step": 79484 - }, - { - "epoch": 2.04, - "learning_rate": 4.93249683830323e-07, - "loss": 0.4819, - "step": 79485 - }, - { - "epoch": 2.04, - "learning_rate": 4.93225829523301e-07, - "loss": 0.4248, - "step": 79486 - }, - { - "epoch": 2.04, - "learning_rate": 4.932019756042929e-07, - "loss": 0.3604, - "step": 79487 - }, - { - "epoch": 2.04, - "learning_rate": 4.931781220733164e-07, - "loss": 0.5249, - "step": 79488 - }, - { - "epoch": 2.04, - "learning_rate": 4.9315426893039e-07, - "loss": 0.3329, - "step": 79489 - }, - { - "epoch": 2.04, - "learning_rate": 4.931304161755323e-07, - "loss": 0.4688, - "step": 79490 - }, - { - "epoch": 2.04, - "learning_rate": 4.931065638087615e-07, - "loss": 0.436, - "step": 79491 - }, - { - "epoch": 2.04, - "learning_rate": 4.930827118300958e-07, - "loss": 0.4707, - "step": 79492 - }, - { - "epoch": 2.04, - "learning_rate": 4.93058860239553e-07, - "loss": 0.4346, - "step": 79493 - }, - { - "epoch": 2.04, - "learning_rate": 4.930350090371516e-07, - "loss": 0.3633, - "step": 79494 - }, - { - "epoch": 2.04, - "learning_rate": 4.930111582229102e-07, - "loss": 0.6035, - "step": 79495 - }, - { - "epoch": 2.04, - "learning_rate": 4.929873077968471e-07, - "loss": 0.3816, - "step": 79496 - }, - { - "epoch": 2.04, - "learning_rate": 4.929634577589798e-07, - "loss": 0.4399, - "step": 79497 - }, - { - "epoch": 2.04, - "learning_rate": 4.929396081093273e-07, - "loss": 0.4062, - "step": 79498 - }, - { - "epoch": 2.04, - "learning_rate": 4.929157588479078e-07, - "loss": 0.3752, - "step": 79499 - }, - { - "epoch": 2.04, - "learning_rate": 4.928919099747395e-07, - "loss": 0.4507, - "step": 79500 - }, - { - "epoch": 2.04, - "learning_rate": 4.928680614898402e-07, - "loss": 0.2661, - "step": 79501 - }, - { - "epoch": 2.04, - "learning_rate": 4.928442133932283e-07, - "loss": 0.45, - "step": 79502 - }, - { - "epoch": 2.04, - "learning_rate": 4.928203656849224e-07, - "loss": 0.3602, - "step": 79503 - }, - { - "epoch": 2.04, - "learning_rate": 4.927965183649412e-07, - "loss": 0.52, - "step": 79504 - }, - { - "epoch": 2.04, - "learning_rate": 4.927726714333016e-07, - "loss": 0.3542, - "step": 79505 - }, - { - "epoch": 2.04, - "learning_rate": 4.92748824890023e-07, - "loss": 0.3542, - "step": 79506 - }, - { - "epoch": 2.04, - "learning_rate": 4.927249787351232e-07, - "loss": 0.3661, - "step": 79507 - }, - { - "epoch": 2.04, - "learning_rate": 4.92701132968621e-07, - "loss": 0.4453, - "step": 79508 - }, - { - "epoch": 2.04, - "learning_rate": 4.926772875905336e-07, - "loss": 0.3373, - "step": 79509 - }, - { - "epoch": 2.04, - "learning_rate": 4.926534426008805e-07, - "loss": 0.4697, - "step": 79510 - }, - { - "epoch": 2.04, - "learning_rate": 4.926295979996787e-07, - "loss": 0.4165, - "step": 79511 - }, - { - "epoch": 2.04, - "learning_rate": 4.926057537869474e-07, - "loss": 0.5171, - "step": 79512 - }, - { - "epoch": 2.04, - "learning_rate": 4.925819099627047e-07, - "loss": 0.4316, - "step": 79513 - }, - { - "epoch": 2.04, - "learning_rate": 4.925580665269684e-07, - "loss": 0.3118, - "step": 79514 - }, - { - "epoch": 2.04, - "learning_rate": 4.92534223479757e-07, - "loss": 0.3448, - "step": 79515 - }, - { - "epoch": 2.04, - "learning_rate": 4.925103808210892e-07, - "loss": 0.3127, - "step": 79516 - }, - { - "epoch": 2.04, - "learning_rate": 4.924865385509826e-07, - "loss": 0.415, - "step": 79517 - }, - { - "epoch": 2.04, - "learning_rate": 4.924626966694556e-07, - "loss": 0.3618, - "step": 79518 - }, - { - "epoch": 2.04, - "learning_rate": 4.924388551765266e-07, - "loss": 0.4746, - "step": 79519 - }, - { - "epoch": 2.04, - "learning_rate": 4.924150140722142e-07, - "loss": 0.4346, - "step": 79520 - }, - { - "epoch": 2.04, - "learning_rate": 4.923911733565364e-07, - "loss": 0.3628, - "step": 79521 - }, - { - "epoch": 2.04, - "learning_rate": 4.923673330295108e-07, - "loss": 0.4248, - "step": 79522 - }, - { - "epoch": 2.04, - "learning_rate": 4.923434930911561e-07, - "loss": 0.3481, - "step": 79523 - }, - { - "epoch": 2.04, - "learning_rate": 4.92319653541491e-07, - "loss": 0.4497, - "step": 79524 - }, - { - "epoch": 2.04, - "learning_rate": 4.922958143805335e-07, - "loss": 0.4675, - "step": 79525 - }, - { - "epoch": 2.04, - "learning_rate": 4.922719756083015e-07, - "loss": 0.3623, - "step": 79526 - }, - { - "epoch": 2.04, - "learning_rate": 4.922481372248134e-07, - "loss": 0.2687, - "step": 79527 - }, - { - "epoch": 2.04, - "learning_rate": 4.922242992300876e-07, - "loss": 0.3953, - "step": 79528 - }, - { - "epoch": 2.04, - "learning_rate": 4.922004616241427e-07, - "loss": 0.3955, - "step": 79529 - }, - { - "epoch": 2.04, - "learning_rate": 4.921766244069965e-07, - "loss": 0.2925, - "step": 79530 - }, - { - "epoch": 2.04, - "learning_rate": 4.921527875786669e-07, - "loss": 0.3394, - "step": 79531 - }, - { - "epoch": 2.04, - "learning_rate": 4.921289511391727e-07, - "loss": 0.4214, - "step": 79532 - }, - { - "epoch": 2.04, - "learning_rate": 4.921051150885324e-07, - "loss": 0.4536, - "step": 79533 - }, - { - "epoch": 2.04, - "learning_rate": 4.920812794267633e-07, - "loss": 0.2861, - "step": 79534 - }, - { - "epoch": 2.04, - "learning_rate": 4.920574441538844e-07, - "loss": 0.2394, - "step": 79535 - }, - { - "epoch": 2.04, - "learning_rate": 4.920336092699137e-07, - "loss": 0.3516, - "step": 79536 - }, - { - "epoch": 2.04, - "learning_rate": 4.920097747748699e-07, - "loss": 0.3381, - "step": 79537 - }, - { - "epoch": 2.04, - "learning_rate": 4.919859406687704e-07, - "loss": 0.4219, - "step": 79538 - }, - { - "epoch": 2.04, - "learning_rate": 4.919621069516339e-07, - "loss": 0.4182, - "step": 79539 - }, - { - "epoch": 2.04, - "learning_rate": 4.919382736234791e-07, - "loss": 0.3025, - "step": 79540 - }, - { - "epoch": 2.04, - "learning_rate": 4.919144406843234e-07, - "loss": 0.377, - "step": 79541 - }, - { - "epoch": 2.04, - "learning_rate": 4.918906081341858e-07, - "loss": 0.3752, - "step": 79542 - }, - { - "epoch": 2.04, - "learning_rate": 4.918667759730838e-07, - "loss": 0.3486, - "step": 79543 - }, - { - "epoch": 2.04, - "learning_rate": 4.918429442010361e-07, - "loss": 0.5542, - "step": 79544 - }, - { - "epoch": 2.04, - "learning_rate": 4.918191128180609e-07, - "loss": 0.3599, - "step": 79545 - }, - { - "epoch": 2.04, - "learning_rate": 4.917952818241769e-07, - "loss": 0.481, - "step": 79546 - }, - { - "epoch": 2.04, - "learning_rate": 4.917714512194013e-07, - "loss": 0.4165, - "step": 79547 - }, - { - "epoch": 2.04, - "learning_rate": 4.917476210037531e-07, - "loss": 0.5503, - "step": 79548 - }, - { - "epoch": 2.04, - "learning_rate": 4.917237911772502e-07, - "loss": 0.498, - "step": 79549 - }, - { - "epoch": 2.04, - "learning_rate": 4.91699961739912e-07, - "loss": 0.3799, - "step": 79550 - }, - { - "epoch": 2.04, - "learning_rate": 4.916761326917549e-07, - "loss": 0.3892, - "step": 79551 - }, - { - "epoch": 2.04, - "learning_rate": 4.91652304032798e-07, - "loss": 0.4421, - "step": 79552 - }, - { - "epoch": 2.04, - "learning_rate": 4.916284757630595e-07, - "loss": 0.4761, - "step": 79553 - }, - { - "epoch": 2.04, - "learning_rate": 4.916046478825583e-07, - "loss": 0.4673, - "step": 79554 - }, - { - "epoch": 2.04, - "learning_rate": 4.915808203913114e-07, - "loss": 0.4941, - "step": 79555 - }, - { - "epoch": 2.04, - "learning_rate": 4.915569932893378e-07, - "loss": 0.3926, - "step": 79556 - }, - { - "epoch": 2.04, - "learning_rate": 4.915331665766557e-07, - "loss": 0.4233, - "step": 79557 - }, - { - "epoch": 2.04, - "learning_rate": 4.915093402532836e-07, - "loss": 0.4229, - "step": 79558 - }, - { - "epoch": 2.04, - "learning_rate": 4.91485514319239e-07, - "loss": 0.3726, - "step": 79559 - }, - { - "epoch": 2.04, - "learning_rate": 4.914616887745409e-07, - "loss": 0.3557, - "step": 79560 - }, - { - "epoch": 2.04, - "learning_rate": 4.91437863619207e-07, - "loss": 0.4033, - "step": 79561 - }, - { - "epoch": 2.04, - "learning_rate": 4.914140388532556e-07, - "loss": 0.418, - "step": 79562 - }, - { - "epoch": 2.04, - "learning_rate": 4.913902144767055e-07, - "loss": 0.4912, - "step": 79563 - }, - { - "epoch": 2.04, - "learning_rate": 4.913663904895742e-07, - "loss": 0.4434, - "step": 79564 - }, - { - "epoch": 2.04, - "learning_rate": 4.913425668918802e-07, - "loss": 0.3, - "step": 79565 - }, - { - "epoch": 2.04, - "learning_rate": 4.913187436836417e-07, - "loss": 0.4336, - "step": 79566 - }, - { - "epoch": 2.04, - "learning_rate": 4.912949208648777e-07, - "loss": 0.3121, - "step": 79567 - }, - { - "epoch": 2.04, - "learning_rate": 4.912710984356053e-07, - "loss": 0.4253, - "step": 79568 - }, - { - "epoch": 2.04, - "learning_rate": 4.912472763958431e-07, - "loss": 0.4722, - "step": 79569 - }, - { - "epoch": 2.04, - "learning_rate": 4.912234547456099e-07, - "loss": 0.3373, - "step": 79570 - }, - { - "epoch": 2.04, - "learning_rate": 4.911996334849235e-07, - "loss": 0.3716, - "step": 79571 - }, - { - "epoch": 2.04, - "learning_rate": 4.911758126138019e-07, - "loss": 0.324, - "step": 79572 - }, - { - "epoch": 2.04, - "learning_rate": 4.911519921322634e-07, - "loss": 0.3545, - "step": 79573 - }, - { - "epoch": 2.04, - "learning_rate": 4.911281720403267e-07, - "loss": 0.4883, - "step": 79574 - }, - { - "epoch": 2.04, - "learning_rate": 4.911043523380098e-07, - "loss": 0.3237, - "step": 79575 - }, - { - "epoch": 2.04, - "learning_rate": 4.910805330253307e-07, - "loss": 0.4092, - "step": 79576 - }, - { - "epoch": 2.04, - "learning_rate": 4.910567141023078e-07, - "loss": 0.5005, - "step": 79577 - }, - { - "epoch": 2.04, - "learning_rate": 4.910328955689595e-07, - "loss": 0.4858, - "step": 79578 - }, - { - "epoch": 2.04, - "learning_rate": 4.910090774253041e-07, - "loss": 0.5317, - "step": 79579 - }, - { - "epoch": 2.04, - "learning_rate": 4.909852596713596e-07, - "loss": 0.5479, - "step": 79580 - }, - { - "epoch": 2.04, - "learning_rate": 4.909614423071441e-07, - "loss": 0.4531, - "step": 79581 - }, - { - "epoch": 2.04, - "learning_rate": 4.909376253326759e-07, - "loss": 0.3828, - "step": 79582 - }, - { - "epoch": 2.04, - "learning_rate": 4.909138087479734e-07, - "loss": 0.48, - "step": 79583 - }, - { - "epoch": 2.04, - "learning_rate": 4.908899925530552e-07, - "loss": 0.4028, - "step": 79584 - }, - { - "epoch": 2.04, - "learning_rate": 4.908661767479386e-07, - "loss": 0.4321, - "step": 79585 - }, - { - "epoch": 2.04, - "learning_rate": 4.908423613326425e-07, - "loss": 0.5117, - "step": 79586 - }, - { - "epoch": 2.04, - "learning_rate": 4.908185463071849e-07, - "loss": 0.5542, - "step": 79587 - }, - { - "epoch": 2.04, - "learning_rate": 4.907947316715845e-07, - "loss": 0.522, - "step": 79588 - }, - { - "epoch": 2.04, - "learning_rate": 4.907709174258588e-07, - "loss": 0.4644, - "step": 79589 - }, - { - "epoch": 2.04, - "learning_rate": 4.907471035700269e-07, - "loss": 0.4243, - "step": 79590 - }, - { - "epoch": 2.04, - "learning_rate": 4.907232901041061e-07, - "loss": 0.3909, - "step": 79591 - }, - { - "epoch": 2.04, - "learning_rate": 4.906994770281153e-07, - "loss": 0.4614, - "step": 79592 - }, - { - "epoch": 2.04, - "learning_rate": 4.906756643420723e-07, - "loss": 0.5122, - "step": 79593 - }, - { - "epoch": 2.04, - "learning_rate": 4.906518520459953e-07, - "loss": 0.3591, - "step": 79594 - }, - { - "epoch": 2.04, - "learning_rate": 4.90628040139903e-07, - "loss": 0.2665, - "step": 79595 - }, - { - "epoch": 2.04, - "learning_rate": 4.906042286238136e-07, - "loss": 0.3735, - "step": 79596 - }, - { - "epoch": 2.04, - "learning_rate": 4.905804174977448e-07, - "loss": 0.4736, - "step": 79597 - }, - { - "epoch": 2.04, - "learning_rate": 4.905566067617152e-07, - "loss": 0.4304, - "step": 79598 - }, - { - "epoch": 2.04, - "learning_rate": 4.905327964157429e-07, - "loss": 0.3252, - "step": 79599 - }, - { - "epoch": 2.04, - "learning_rate": 4.905089864598467e-07, - "loss": 0.3525, - "step": 79600 - }, - { - "epoch": 2.04, - "learning_rate": 4.904851768940441e-07, - "loss": 0.3516, - "step": 79601 - }, - { - "epoch": 2.04, - "learning_rate": 4.904613677183534e-07, - "loss": 0.3804, - "step": 79602 - }, - { - "epoch": 2.04, - "learning_rate": 4.904375589327929e-07, - "loss": 0.4606, - "step": 79603 - }, - { - "epoch": 2.04, - "learning_rate": 4.90413750537381e-07, - "loss": 0.3254, - "step": 79604 - }, - { - "epoch": 2.04, - "learning_rate": 4.903899425321363e-07, - "loss": 0.4158, - "step": 79605 - }, - { - "epoch": 2.04, - "learning_rate": 4.903661349170761e-07, - "loss": 0.3477, - "step": 79606 - }, - { - "epoch": 2.04, - "learning_rate": 4.903423276922192e-07, - "loss": 0.5186, - "step": 79607 - }, - { - "epoch": 2.04, - "learning_rate": 4.90318520857584e-07, - "loss": 0.4883, - "step": 79608 - }, - { - "epoch": 2.04, - "learning_rate": 4.902947144131882e-07, - "loss": 0.4717, - "step": 79609 - }, - { - "epoch": 2.04, - "learning_rate": 4.902709083590506e-07, - "loss": 0.4917, - "step": 79610 - }, - { - "epoch": 2.04, - "learning_rate": 4.902471026951888e-07, - "loss": 0.4399, - "step": 79611 - }, - { - "epoch": 2.04, - "learning_rate": 4.902232974216213e-07, - "loss": 0.5098, - "step": 79612 - }, - { - "epoch": 2.04, - "learning_rate": 4.901994925383669e-07, - "loss": 0.4268, - "step": 79613 - }, - { - "epoch": 2.04, - "learning_rate": 4.901756880454428e-07, - "loss": 0.5684, - "step": 79614 - }, - { - "epoch": 2.04, - "learning_rate": 4.901518839428678e-07, - "loss": 0.4189, - "step": 79615 - }, - { - "epoch": 2.04, - "learning_rate": 4.9012808023066e-07, - "loss": 0.468, - "step": 79616 - }, - { - "epoch": 2.04, - "learning_rate": 4.90104276908838e-07, - "loss": 0.4127, - "step": 79617 - }, - { - "epoch": 2.04, - "learning_rate": 4.900804739774195e-07, - "loss": 0.4683, - "step": 79618 - }, - { - "epoch": 2.04, - "learning_rate": 4.900566714364229e-07, - "loss": 0.4609, - "step": 79619 - }, - { - "epoch": 2.04, - "learning_rate": 4.900328692858667e-07, - "loss": 0.2561, - "step": 79620 - }, - { - "epoch": 2.04, - "learning_rate": 4.900090675257686e-07, - "loss": 0.4194, - "step": 79621 - }, - { - "epoch": 2.04, - "learning_rate": 4.899852661561475e-07, - "loss": 0.4785, - "step": 79622 - }, - { - "epoch": 2.04, - "learning_rate": 4.899614651770208e-07, - "loss": 0.4004, - "step": 79623 - }, - { - "epoch": 2.04, - "learning_rate": 4.899376645884072e-07, - "loss": 0.4453, - "step": 79624 - }, - { - "epoch": 2.04, - "learning_rate": 4.899138643903253e-07, - "loss": 0.3639, - "step": 79625 - }, - { - "epoch": 2.04, - "learning_rate": 4.898900645827925e-07, - "loss": 0.5063, - "step": 79626 - }, - { - "epoch": 2.04, - "learning_rate": 4.898662651658274e-07, - "loss": 0.3625, - "step": 79627 - }, - { - "epoch": 2.04, - "learning_rate": 4.898424661394481e-07, - "loss": 0.416, - "step": 79628 - }, - { - "epoch": 2.04, - "learning_rate": 4.898186675036735e-07, - "loss": 0.5259, - "step": 79629 - }, - { - "epoch": 2.04, - "learning_rate": 4.897948692585213e-07, - "loss": 0.4277, - "step": 79630 - }, - { - "epoch": 2.04, - "learning_rate": 4.897710714040093e-07, - "loss": 0.359, - "step": 79631 - }, - { - "epoch": 2.04, - "learning_rate": 4.897472739401562e-07, - "loss": 0.3308, - "step": 79632 - }, - { - "epoch": 2.04, - "learning_rate": 4.8972347686698e-07, - "loss": 0.3716, - "step": 79633 - }, - { - "epoch": 2.04, - "learning_rate": 4.896996801844996e-07, - "loss": 0.1527, - "step": 79634 - }, - { - "epoch": 2.04, - "learning_rate": 4.896758838927322e-07, - "loss": 0.4639, - "step": 79635 - }, - { - "epoch": 2.04, - "learning_rate": 4.896520879916965e-07, - "loss": 0.4395, - "step": 79636 - }, - { - "epoch": 2.04, - "learning_rate": 4.896282924814108e-07, - "loss": 0.3206, - "step": 79637 - }, - { - "epoch": 2.04, - "learning_rate": 4.896044973618936e-07, - "loss": 0.4436, - "step": 79638 - }, - { - "epoch": 2.04, - "learning_rate": 4.895807026331624e-07, - "loss": 0.4136, - "step": 79639 - }, - { - "epoch": 2.04, - "learning_rate": 4.895569082952362e-07, - "loss": 0.458, - "step": 79640 - }, - { - "epoch": 2.04, - "learning_rate": 4.895331143481324e-07, - "loss": 0.4155, - "step": 79641 - }, - { - "epoch": 2.04, - "learning_rate": 4.895093207918699e-07, - "loss": 0.4219, - "step": 79642 - }, - { - "epoch": 2.04, - "learning_rate": 4.894855276264664e-07, - "loss": 0.35, - "step": 79643 - }, - { - "epoch": 2.04, - "learning_rate": 4.894617348519403e-07, - "loss": 0.2891, - "step": 79644 - }, - { - "epoch": 2.04, - "learning_rate": 4.894379424683098e-07, - "loss": 0.5137, - "step": 79645 - }, - { - "epoch": 2.04, - "learning_rate": 4.894141504755938e-07, - "loss": 0.3407, - "step": 79646 - }, - { - "epoch": 2.04, - "learning_rate": 4.893903588738093e-07, - "loss": 0.4756, - "step": 79647 - }, - { - "epoch": 2.04, - "learning_rate": 4.893665676629751e-07, - "loss": 0.5107, - "step": 79648 - }, - { - "epoch": 2.04, - "learning_rate": 4.893427768431097e-07, - "loss": 0.4131, - "step": 79649 - }, - { - "epoch": 2.04, - "learning_rate": 4.893189864142312e-07, - "loss": 0.4448, - "step": 79650 - }, - { - "epoch": 2.04, - "learning_rate": 4.892951963763578e-07, - "loss": 0.3799, - "step": 79651 - }, - { - "epoch": 2.04, - "learning_rate": 4.892714067295071e-07, - "loss": 0.4941, - "step": 79652 - }, - { - "epoch": 2.04, - "learning_rate": 4.892476174736978e-07, - "loss": 0.3085, - "step": 79653 - }, - { - "epoch": 2.04, - "learning_rate": 4.892238286089481e-07, - "loss": 0.3079, - "step": 79654 - }, - { - "epoch": 2.04, - "learning_rate": 4.892000401352768e-07, - "loss": 0.4067, - "step": 79655 - }, - { - "epoch": 2.04, - "learning_rate": 4.89176252052701e-07, - "loss": 0.4316, - "step": 79656 - }, - { - "epoch": 2.04, - "learning_rate": 4.891524643612395e-07, - "loss": 0.4287, - "step": 79657 - }, - { - "epoch": 2.04, - "learning_rate": 4.891286770609104e-07, - "loss": 0.3906, - "step": 79658 - }, - { - "epoch": 2.04, - "learning_rate": 4.891048901517325e-07, - "loss": 0.4102, - "step": 79659 - }, - { - "epoch": 2.04, - "learning_rate": 4.890811036337234e-07, - "loss": 0.521, - "step": 79660 - }, - { - "epoch": 2.04, - "learning_rate": 4.89057317506901e-07, - "loss": 0.4941, - "step": 79661 - }, - { - "epoch": 2.04, - "learning_rate": 4.89033531771284e-07, - "loss": 0.5073, - "step": 79662 - }, - { - "epoch": 2.04, - "learning_rate": 4.890097464268908e-07, - "loss": 0.5908, - "step": 79663 - }, - { - "epoch": 2.04, - "learning_rate": 4.889859614737391e-07, - "loss": 0.4043, - "step": 79664 - }, - { - "epoch": 2.04, - "learning_rate": 4.889621769118473e-07, - "loss": 0.4082, - "step": 79665 - }, - { - "epoch": 2.04, - "learning_rate": 4.889383927412336e-07, - "loss": 0.4761, - "step": 79666 - }, - { - "epoch": 2.04, - "learning_rate": 4.889146089619167e-07, - "loss": 0.4976, - "step": 79667 - }, - { - "epoch": 2.04, - "learning_rate": 4.88890825573914e-07, - "loss": 0.4365, - "step": 79668 - }, - { - "epoch": 2.04, - "learning_rate": 4.888670425772441e-07, - "loss": 0.3171, - "step": 79669 - }, - { - "epoch": 2.04, - "learning_rate": 4.888432599719256e-07, - "loss": 0.3091, - "step": 79670 - }, - { - "epoch": 2.04, - "learning_rate": 4.888194777579759e-07, - "loss": 0.4092, - "step": 79671 - }, - { - "epoch": 2.04, - "learning_rate": 4.88795695935414e-07, - "loss": 0.3794, - "step": 79672 - }, - { - "epoch": 2.04, - "learning_rate": 4.887719145042574e-07, - "loss": 0.4048, - "step": 79673 - }, - { - "epoch": 2.04, - "learning_rate": 4.887481334645246e-07, - "loss": 0.4688, - "step": 79674 - }, - { - "epoch": 2.04, - "learning_rate": 4.887243528162338e-07, - "loss": 0.4546, - "step": 79675 - }, - { - "epoch": 2.04, - "learning_rate": 4.887005725594038e-07, - "loss": 0.5425, - "step": 79676 - }, - { - "epoch": 2.04, - "learning_rate": 4.886767926940517e-07, - "loss": 0.2775, - "step": 79677 - }, - { - "epoch": 2.04, - "learning_rate": 4.886530132201964e-07, - "loss": 0.3247, - "step": 79678 - }, - { - "epoch": 2.04, - "learning_rate": 4.886292341378561e-07, - "loss": 0.4167, - "step": 79679 - }, - { - "epoch": 2.04, - "learning_rate": 4.886054554470492e-07, - "loss": 0.185, - "step": 79680 - }, - { - "epoch": 2.04, - "learning_rate": 4.885816771477931e-07, - "loss": 0.4561, - "step": 79681 - }, - { - "epoch": 2.04, - "learning_rate": 4.885578992401063e-07, - "loss": 0.4272, - "step": 79682 - }, - { - "epoch": 2.04, - "learning_rate": 4.885341217240075e-07, - "loss": 0.4736, - "step": 79683 - }, - { - "epoch": 2.04, - "learning_rate": 4.885103445995149e-07, - "loss": 0.4253, - "step": 79684 - }, - { - "epoch": 2.04, - "learning_rate": 4.884865678666459e-07, - "loss": 0.4238, - "step": 79685 - }, - { - "epoch": 2.04, - "learning_rate": 4.884627915254194e-07, - "loss": 0.4204, - "step": 79686 - }, - { - "epoch": 2.04, - "learning_rate": 4.884390155758533e-07, - "loss": 0.2114, - "step": 79687 - }, - { - "epoch": 2.04, - "learning_rate": 4.884152400179663e-07, - "loss": 0.5347, - "step": 79688 - }, - { - "epoch": 2.04, - "learning_rate": 4.883914648517758e-07, - "loss": 0.3599, - "step": 79689 - }, - { - "epoch": 2.04, - "learning_rate": 4.883676900773009e-07, - "loss": 0.3037, - "step": 79690 - }, - { - "epoch": 2.04, - "learning_rate": 4.88343915694559e-07, - "loss": 0.3513, - "step": 79691 - }, - { - "epoch": 2.04, - "learning_rate": 4.883201417035685e-07, - "loss": 0.2686, - "step": 79692 - }, - { - "epoch": 2.04, - "learning_rate": 4.882963681043482e-07, - "loss": 0.4531, - "step": 79693 - }, - { - "epoch": 2.04, - "learning_rate": 4.882725948969155e-07, - "loss": 0.5132, - "step": 79694 - }, - { - "epoch": 2.04, - "learning_rate": 4.882488220812889e-07, - "loss": 0.4051, - "step": 79695 - }, - { - "epoch": 2.04, - "learning_rate": 4.88225049657487e-07, - "loss": 0.4062, - "step": 79696 - }, - { - "epoch": 2.04, - "learning_rate": 4.882012776255273e-07, - "loss": 0.3367, - "step": 79697 - }, - { - "epoch": 2.04, - "learning_rate": 4.881775059854284e-07, - "loss": 0.499, - "step": 79698 - }, - { - "epoch": 2.04, - "learning_rate": 4.881537347372084e-07, - "loss": 0.3916, - "step": 79699 - }, - { - "epoch": 2.04, - "learning_rate": 4.881299638808859e-07, - "loss": 0.3215, - "step": 79700 - }, - { - "epoch": 2.04, - "learning_rate": 4.881061934164787e-07, - "loss": 0.3032, - "step": 79701 - }, - { - "epoch": 2.04, - "learning_rate": 4.880824233440048e-07, - "loss": 0.349, - "step": 79702 - }, - { - "epoch": 2.04, - "learning_rate": 4.880586536634826e-07, - "loss": 0.4182, - "step": 79703 - }, - { - "epoch": 2.04, - "learning_rate": 4.880348843749304e-07, - "loss": 0.5332, - "step": 79704 - }, - { - "epoch": 2.04, - "learning_rate": 4.880111154783666e-07, - "loss": 0.4365, - "step": 79705 - }, - { - "epoch": 2.04, - "learning_rate": 4.879873469738089e-07, - "loss": 0.4639, - "step": 79706 - }, - { - "epoch": 2.04, - "learning_rate": 4.879635788612756e-07, - "loss": 0.4341, - "step": 79707 - }, - { - "epoch": 2.04, - "learning_rate": 4.87939811140785e-07, - "loss": 0.4604, - "step": 79708 - }, - { - "epoch": 2.04, - "learning_rate": 4.879160438123559e-07, - "loss": 0.4436, - "step": 79709 - }, - { - "epoch": 2.04, - "learning_rate": 4.87892276876006e-07, - "loss": 0.459, - "step": 79710 - }, - { - "epoch": 2.04, - "learning_rate": 4.878685103317529e-07, - "loss": 0.4001, - "step": 79711 - }, - { - "epoch": 2.04, - "learning_rate": 4.878447441796154e-07, - "loss": 0.4175, - "step": 79712 - }, - { - "epoch": 2.04, - "learning_rate": 4.87820978419612e-07, - "loss": 0.374, - "step": 79713 - }, - { - "epoch": 2.04, - "learning_rate": 4.877972130517601e-07, - "loss": 0.5747, - "step": 79714 - }, - { - "epoch": 2.04, - "learning_rate": 4.877734480760783e-07, - "loss": 0.4167, - "step": 79715 - }, - { - "epoch": 2.04, - "learning_rate": 4.877496834925849e-07, - "loss": 0.5034, - "step": 79716 - }, - { - "epoch": 2.04, - "learning_rate": 4.877259193012983e-07, - "loss": 0.4717, - "step": 79717 - }, - { - "epoch": 2.04, - "learning_rate": 4.877021555022361e-07, - "loss": 0.4888, - "step": 79718 - }, - { - "epoch": 2.04, - "learning_rate": 4.876783920954169e-07, - "loss": 0.375, - "step": 79719 - }, - { - "epoch": 2.04, - "learning_rate": 4.876546290808591e-07, - "loss": 0.4639, - "step": 79720 - }, - { - "epoch": 2.04, - "learning_rate": 4.876308664585801e-07, - "loss": 0.478, - "step": 79721 - }, - { - "epoch": 2.04, - "learning_rate": 4.876071042285991e-07, - "loss": 0.4707, - "step": 79722 - }, - { - "epoch": 2.04, - "learning_rate": 4.875833423909334e-07, - "loss": 0.5356, - "step": 79723 - }, - { - "epoch": 2.04, - "learning_rate": 4.875595809456014e-07, - "loss": 0.4155, - "step": 79724 - }, - { - "epoch": 2.04, - "learning_rate": 4.875358198926218e-07, - "loss": 0.3975, - "step": 79725 - }, - { - "epoch": 2.04, - "learning_rate": 4.875120592320126e-07, - "loss": 0.6172, - "step": 79726 - }, - { - "epoch": 2.04, - "learning_rate": 4.874882989637914e-07, - "loss": 0.4028, - "step": 79727 - }, - { - "epoch": 2.04, - "learning_rate": 4.874645390879769e-07, - "loss": 0.439, - "step": 79728 - }, - { - "epoch": 2.04, - "learning_rate": 4.874407796045873e-07, - "loss": 0.2925, - "step": 79729 - }, - { - "epoch": 2.04, - "learning_rate": 4.874170205136415e-07, - "loss": 0.5352, - "step": 79730 - }, - { - "epoch": 2.04, - "learning_rate": 4.873932618151561e-07, - "loss": 0.3418, - "step": 79731 - }, - { - "epoch": 2.04, - "learning_rate": 4.873695035091502e-07, - "loss": 0.4722, - "step": 79732 - }, - { - "epoch": 2.04, - "learning_rate": 4.873457455956418e-07, - "loss": 0.4673, - "step": 79733 - }, - { - "epoch": 2.04, - "learning_rate": 4.873219880746497e-07, - "loss": 0.3787, - "step": 79734 - }, - { - "epoch": 2.04, - "learning_rate": 4.872982309461911e-07, - "loss": 0.3042, - "step": 79735 - }, - { - "epoch": 2.04, - "learning_rate": 4.872744742102845e-07, - "loss": 0.5117, - "step": 79736 - }, - { - "epoch": 2.04, - "learning_rate": 4.872507178669485e-07, - "loss": 0.3127, - "step": 79737 - }, - { - "epoch": 2.04, - "learning_rate": 4.872269619162014e-07, - "loss": 0.4233, - "step": 79738 - }, - { - "epoch": 2.04, - "learning_rate": 4.872032063580607e-07, - "loss": 0.3766, - "step": 79739 - }, - { - "epoch": 2.04, - "learning_rate": 4.871794511925451e-07, - "loss": 0.3586, - "step": 79740 - }, - { - "epoch": 2.04, - "learning_rate": 4.871556964196724e-07, - "loss": 0.4014, - "step": 79741 - }, - { - "epoch": 2.04, - "learning_rate": 4.871319420394609e-07, - "loss": 0.5493, - "step": 79742 - }, - { - "epoch": 2.04, - "learning_rate": 4.871081880519294e-07, - "loss": 0.4717, - "step": 79743 - }, - { - "epoch": 2.04, - "learning_rate": 4.870844344570951e-07, - "loss": 0.4053, - "step": 79744 - }, - { - "epoch": 2.04, - "learning_rate": 4.870606812549767e-07, - "loss": 0.3286, - "step": 79745 - }, - { - "epoch": 2.04, - "learning_rate": 4.870369284455925e-07, - "loss": 0.3928, - "step": 79746 - }, - { - "epoch": 2.04, - "learning_rate": 4.870131760289607e-07, - "loss": 0.48, - "step": 79747 - }, - { - "epoch": 2.04, - "learning_rate": 4.86989424005099e-07, - "loss": 0.3706, - "step": 79748 - }, - { - "epoch": 2.04, - "learning_rate": 4.869656723740259e-07, - "loss": 0.4434, - "step": 79749 - }, - { - "epoch": 2.04, - "learning_rate": 4.8694192113576e-07, - "loss": 0.4575, - "step": 79750 - }, - { - "epoch": 2.04, - "learning_rate": 4.86918170290319e-07, - "loss": 0.5039, - "step": 79751 - }, - { - "epoch": 2.04, - "learning_rate": 4.868944198377208e-07, - "loss": 0.2842, - "step": 79752 - }, - { - "epoch": 2.04, - "learning_rate": 4.86870669777984e-07, - "loss": 0.4644, - "step": 79753 - }, - { - "epoch": 2.04, - "learning_rate": 4.868469201111268e-07, - "loss": 0.5132, - "step": 79754 - }, - { - "epoch": 2.04, - "learning_rate": 4.868231708371676e-07, - "loss": 0.4658, - "step": 79755 - }, - { - "epoch": 2.04, - "learning_rate": 4.86799421956124e-07, - "loss": 0.4436, - "step": 79756 - }, - { - "epoch": 2.04, - "learning_rate": 4.867756734680144e-07, - "loss": 0.6001, - "step": 79757 - }, - { - "epoch": 2.04, - "learning_rate": 4.867519253728572e-07, - "loss": 0.3306, - "step": 79758 - }, - { - "epoch": 2.04, - "learning_rate": 4.867281776706708e-07, - "loss": 0.328, - "step": 79759 - }, - { - "epoch": 2.04, - "learning_rate": 4.867044303614729e-07, - "loss": 0.499, - "step": 79760 - }, - { - "epoch": 2.04, - "learning_rate": 4.866806834452815e-07, - "loss": 0.4436, - "step": 79761 - }, - { - "epoch": 2.04, - "learning_rate": 4.866569369221151e-07, - "loss": 0.5127, - "step": 79762 - }, - { - "epoch": 2.04, - "learning_rate": 4.866331907919918e-07, - "loss": 0.4189, - "step": 79763 - }, - { - "epoch": 2.04, - "learning_rate": 4.866094450549304e-07, - "loss": 0.3916, - "step": 79764 - }, - { - "epoch": 2.04, - "learning_rate": 4.865856997109481e-07, - "loss": 0.3892, - "step": 79765 - }, - { - "epoch": 2.04, - "learning_rate": 4.865619547600636e-07, - "loss": 0.3682, - "step": 79766 - }, - { - "epoch": 2.04, - "learning_rate": 4.865382102022948e-07, - "loss": 0.394, - "step": 79767 - }, - { - "epoch": 2.04, - "learning_rate": 4.865144660376607e-07, - "loss": 0.2832, - "step": 79768 - }, - { - "epoch": 2.04, - "learning_rate": 4.864907222661782e-07, - "loss": 0.3228, - "step": 79769 - }, - { - "epoch": 2.04, - "learning_rate": 4.864669788878668e-07, - "loss": 0.3499, - "step": 79770 - }, - { - "epoch": 2.04, - "learning_rate": 4.864432359027435e-07, - "loss": 0.4072, - "step": 79771 - }, - { - "epoch": 2.04, - "learning_rate": 4.864194933108274e-07, - "loss": 0.5293, - "step": 79772 - }, - { - "epoch": 2.04, - "learning_rate": 4.863957511121359e-07, - "loss": 0.481, - "step": 79773 - }, - { - "epoch": 2.04, - "learning_rate": 4.863720093066876e-07, - "loss": 0.3118, - "step": 79774 - }, - { - "epoch": 2.04, - "learning_rate": 4.863482678945005e-07, - "loss": 0.4663, - "step": 79775 - }, - { - "epoch": 2.04, - "learning_rate": 4.863245268755935e-07, - "loss": 0.3896, - "step": 79776 - }, - { - "epoch": 2.04, - "learning_rate": 4.863007862499836e-07, - "loss": 0.3506, - "step": 79777 - }, - { - "epoch": 2.04, - "learning_rate": 4.862770460176897e-07, - "loss": 0.3599, - "step": 79778 - }, - { - "epoch": 2.04, - "learning_rate": 4.862533061787298e-07, - "loss": 0.4187, - "step": 79779 - }, - { - "epoch": 2.04, - "learning_rate": 4.862295667331226e-07, - "loss": 0.4314, - "step": 79780 - }, - { - "epoch": 2.04, - "learning_rate": 4.862058276808856e-07, - "loss": 0.4214, - "step": 79781 - }, - { - "epoch": 2.04, - "learning_rate": 4.86182089022037e-07, - "loss": 0.4229, - "step": 79782 - }, - { - "epoch": 2.04, - "learning_rate": 4.861583507565949e-07, - "loss": 0.3242, - "step": 79783 - }, - { - "epoch": 2.04, - "learning_rate": 4.861346128845779e-07, - "loss": 0.3557, - "step": 79784 - }, - { - "epoch": 2.04, - "learning_rate": 4.861108754060043e-07, - "loss": 0.479, - "step": 79785 - }, - { - "epoch": 2.04, - "learning_rate": 4.860871383208918e-07, - "loss": 0.4717, - "step": 79786 - }, - { - "epoch": 2.04, - "learning_rate": 4.860634016292586e-07, - "loss": 0.4707, - "step": 79787 - }, - { - "epoch": 2.05, - "learning_rate": 4.860396653311234e-07, - "loss": 0.3567, - "step": 79788 - }, - { - "epoch": 2.05, - "learning_rate": 4.860159294265036e-07, - "loss": 0.5137, - "step": 79789 - }, - { - "epoch": 2.05, - "learning_rate": 4.859921939154181e-07, - "loss": 0.5098, - "step": 79790 - }, - { - "epoch": 2.05, - "learning_rate": 4.859684587978844e-07, - "loss": 0.5049, - "step": 79791 - }, - { - "epoch": 2.05, - "learning_rate": 4.859447240739211e-07, - "loss": 0.4956, - "step": 79792 - }, - { - "epoch": 2.05, - "learning_rate": 4.859209897435466e-07, - "loss": 0.4468, - "step": 79793 - }, - { - "epoch": 2.05, - "learning_rate": 4.858972558067783e-07, - "loss": 0.5356, - "step": 79794 - }, - { - "epoch": 2.05, - "learning_rate": 4.858735222636349e-07, - "loss": 0.437, - "step": 79795 - }, - { - "epoch": 2.05, - "learning_rate": 4.858497891141347e-07, - "loss": 0.3267, - "step": 79796 - }, - { - "epoch": 2.05, - "learning_rate": 4.858260563582957e-07, - "loss": 0.4902, - "step": 79797 - }, - { - "epoch": 2.05, - "learning_rate": 4.85802323996136e-07, - "loss": 0.237, - "step": 79798 - }, - { - "epoch": 2.05, - "learning_rate": 4.85778592027674e-07, - "loss": 0.4343, - "step": 79799 - }, - { - "epoch": 2.05, - "learning_rate": 4.857548604529274e-07, - "loss": 0.2676, - "step": 79800 - }, - { - "epoch": 2.05, - "learning_rate": 4.857311292719145e-07, - "loss": 0.4531, - "step": 79801 - }, - { - "epoch": 2.05, - "learning_rate": 4.857073984846542e-07, - "loss": 0.4055, - "step": 79802 - }, - { - "epoch": 2.05, - "learning_rate": 4.856836680911635e-07, - "loss": 0.4048, - "step": 79803 - }, - { - "epoch": 2.05, - "learning_rate": 4.856599380914614e-07, - "loss": 0.4551, - "step": 79804 - }, - { - "epoch": 2.05, - "learning_rate": 4.856362084855661e-07, - "loss": 0.46, - "step": 79805 - }, - { - "epoch": 2.05, - "learning_rate": 4.856124792734951e-07, - "loss": 0.4438, - "step": 79806 - }, - { - "epoch": 2.05, - "learning_rate": 4.85588750455267e-07, - "loss": 0.4165, - "step": 79807 - }, - { - "epoch": 2.05, - "learning_rate": 4.855650220309e-07, - "loss": 0.4517, - "step": 79808 - }, - { - "epoch": 2.05, - "learning_rate": 4.855412940004125e-07, - "loss": 0.3223, - "step": 79809 - }, - { - "epoch": 2.05, - "learning_rate": 4.855175663638225e-07, - "loss": 0.377, - "step": 79810 - }, - { - "epoch": 2.05, - "learning_rate": 4.854938391211475e-07, - "loss": 0.3975, - "step": 79811 - }, - { - "epoch": 2.05, - "learning_rate": 4.854701122724063e-07, - "loss": 0.2061, - "step": 79812 - }, - { - "epoch": 2.05, - "learning_rate": 4.85446385817617e-07, - "loss": 0.4189, - "step": 79813 - }, - { - "epoch": 2.05, - "learning_rate": 4.854226597567981e-07, - "loss": 0.5015, - "step": 79814 - }, - { - "epoch": 2.05, - "learning_rate": 4.853989340899671e-07, - "loss": 0.3643, - "step": 79815 - }, - { - "epoch": 2.05, - "learning_rate": 4.853752088171422e-07, - "loss": 0.3346, - "step": 79816 - }, - { - "epoch": 2.05, - "learning_rate": 4.853514839383422e-07, - "loss": 0.3643, - "step": 79817 - }, - { - "epoch": 2.05, - "learning_rate": 4.853277594535849e-07, - "loss": 0.3982, - "step": 79818 - }, - { - "epoch": 2.05, - "learning_rate": 4.853040353628888e-07, - "loss": 0.4668, - "step": 79819 - }, - { - "epoch": 2.05, - "learning_rate": 4.852803116662712e-07, - "loss": 0.4043, - "step": 79820 - }, - { - "epoch": 2.05, - "learning_rate": 4.852565883637508e-07, - "loss": 0.3069, - "step": 79821 - }, - { - "epoch": 2.05, - "learning_rate": 4.852328654553462e-07, - "loss": 0.5425, - "step": 79822 - }, - { - "epoch": 2.05, - "learning_rate": 4.852091429410747e-07, - "loss": 0.3896, - "step": 79823 - }, - { - "epoch": 2.05, - "learning_rate": 4.851854208209549e-07, - "loss": 0.4946, - "step": 79824 - }, - { - "epoch": 2.05, - "learning_rate": 4.85161699095005e-07, - "loss": 0.3542, - "step": 79825 - }, - { - "epoch": 2.05, - "learning_rate": 4.851379777632435e-07, - "loss": 0.5552, - "step": 79826 - }, - { - "epoch": 2.05, - "learning_rate": 4.851142568256878e-07, - "loss": 0.3892, - "step": 79827 - }, - { - "epoch": 2.05, - "learning_rate": 4.850905362823563e-07, - "loss": 0.2218, - "step": 79828 - }, - { - "epoch": 2.05, - "learning_rate": 4.850668161332679e-07, - "loss": 0.4136, - "step": 79829 - }, - { - "epoch": 2.05, - "learning_rate": 4.850430963784396e-07, - "loss": 0.3217, - "step": 79830 - }, - { - "epoch": 2.05, - "learning_rate": 4.850193770178905e-07, - "loss": 0.4407, - "step": 79831 - }, - { - "epoch": 2.05, - "learning_rate": 4.84995658051638e-07, - "loss": 0.4478, - "step": 79832 - }, - { - "epoch": 2.05, - "learning_rate": 4.849719394797007e-07, - "loss": 0.5654, - "step": 79833 - }, - { - "epoch": 2.05, - "learning_rate": 4.849482213020968e-07, - "loss": 0.4614, - "step": 79834 - }, - { - "epoch": 2.05, - "learning_rate": 4.849245035188446e-07, - "loss": 0.4531, - "step": 79835 - }, - { - "epoch": 2.05, - "learning_rate": 4.849007861299616e-07, - "loss": 0.4907, - "step": 79836 - }, - { - "epoch": 2.05, - "learning_rate": 4.848770691354666e-07, - "loss": 0.4194, - "step": 79837 - }, - { - "epoch": 2.05, - "learning_rate": 4.848533525353774e-07, - "loss": 0.4873, - "step": 79838 - }, - { - "epoch": 2.05, - "learning_rate": 4.848296363297131e-07, - "loss": 0.3784, - "step": 79839 - }, - { - "epoch": 2.05, - "learning_rate": 4.848059205184902e-07, - "loss": 0.3579, - "step": 79840 - }, - { - "epoch": 2.05, - "learning_rate": 4.847822051017278e-07, - "loss": 0.3696, - "step": 79841 - }, - { - "epoch": 2.05, - "learning_rate": 4.84758490079444e-07, - "loss": 0.4104, - "step": 79842 - }, - { - "epoch": 2.05, - "learning_rate": 4.847347754516573e-07, - "loss": 0.4648, - "step": 79843 - }, - { - "epoch": 2.05, - "learning_rate": 4.847110612183851e-07, - "loss": 0.3838, - "step": 79844 - }, - { - "epoch": 2.05, - "learning_rate": 4.846873473796459e-07, - "loss": 0.3811, - "step": 79845 - }, - { - "epoch": 2.05, - "learning_rate": 4.84663633935458e-07, - "loss": 0.356, - "step": 79846 - }, - { - "epoch": 2.05, - "learning_rate": 4.846399208858398e-07, - "loss": 0.4082, - "step": 79847 - }, - { - "epoch": 2.05, - "learning_rate": 4.846162082308088e-07, - "loss": 0.3806, - "step": 79848 - }, - { - "epoch": 2.05, - "learning_rate": 4.845924959703837e-07, - "loss": 0.4033, - "step": 79849 - }, - { - "epoch": 2.05, - "learning_rate": 4.845687841045821e-07, - "loss": 0.4036, - "step": 79850 - }, - { - "epoch": 2.05, - "learning_rate": 4.845450726334225e-07, - "loss": 0.5581, - "step": 79851 - }, - { - "epoch": 2.05, - "learning_rate": 4.845213615569234e-07, - "loss": 0.4536, - "step": 79852 - }, - { - "epoch": 2.05, - "learning_rate": 4.844976508751022e-07, - "loss": 0.2458, - "step": 79853 - }, - { - "epoch": 2.05, - "learning_rate": 4.844739405879776e-07, - "loss": 0.4526, - "step": 79854 - }, - { - "epoch": 2.05, - "learning_rate": 4.844502306955673e-07, - "loss": 0.3564, - "step": 79855 - }, - { - "epoch": 2.05, - "learning_rate": 4.844265211978904e-07, - "loss": 0.3051, - "step": 79856 - }, - { - "epoch": 2.05, - "learning_rate": 4.844028120949639e-07, - "loss": 0.5732, - "step": 79857 - }, - { - "epoch": 2.05, - "learning_rate": 4.843791033868066e-07, - "loss": 0.3945, - "step": 79858 - }, - { - "epoch": 2.05, - "learning_rate": 4.843553950734368e-07, - "loss": 0.3579, - "step": 79859 - }, - { - "epoch": 2.05, - "learning_rate": 4.843316871548723e-07, - "loss": 0.2959, - "step": 79860 - }, - { - "epoch": 2.05, - "learning_rate": 4.843079796311309e-07, - "loss": 0.3752, - "step": 79861 - }, - { - "epoch": 2.05, - "learning_rate": 4.842842725022312e-07, - "loss": 0.4697, - "step": 79862 - }, - { - "epoch": 2.05, - "learning_rate": 4.842605657681914e-07, - "loss": 0.5005, - "step": 79863 - }, - { - "epoch": 2.05, - "learning_rate": 4.8423685942903e-07, - "loss": 0.3915, - "step": 79864 - }, - { - "epoch": 2.05, - "learning_rate": 4.842131534847642e-07, - "loss": 0.5, - "step": 79865 - }, - { - "epoch": 2.05, - "learning_rate": 4.841894479354127e-07, - "loss": 0.2767, - "step": 79866 - }, - { - "epoch": 2.05, - "learning_rate": 4.841657427809938e-07, - "loss": 0.4956, - "step": 79867 - }, - { - "epoch": 2.05, - "learning_rate": 4.841420380215256e-07, - "loss": 0.4209, - "step": 79868 - }, - { - "epoch": 2.05, - "learning_rate": 4.841183336570263e-07, - "loss": 0.4404, - "step": 79869 - }, - { - "epoch": 2.05, - "learning_rate": 4.840946296875134e-07, - "loss": 0.4878, - "step": 79870 - }, - { - "epoch": 2.05, - "learning_rate": 4.840709261130055e-07, - "loss": 0.3748, - "step": 79871 - }, - { - "epoch": 2.05, - "learning_rate": 4.840472229335209e-07, - "loss": 0.366, - "step": 79872 - }, - { - "epoch": 2.05, - "learning_rate": 4.840235201490779e-07, - "loss": 0.3994, - "step": 79873 - }, - { - "epoch": 2.05, - "learning_rate": 4.839998177596939e-07, - "loss": 0.2949, - "step": 79874 - }, - { - "epoch": 2.05, - "learning_rate": 4.839761157653877e-07, - "loss": 0.4502, - "step": 79875 - }, - { - "epoch": 2.05, - "learning_rate": 4.839524141661775e-07, - "loss": 0.415, - "step": 79876 - }, - { - "epoch": 2.05, - "learning_rate": 4.839287129620808e-07, - "loss": 0.4927, - "step": 79877 - }, - { - "epoch": 2.05, - "learning_rate": 4.839050121531162e-07, - "loss": 0.3391, - "step": 79878 - }, - { - "epoch": 2.05, - "learning_rate": 4.838813117393022e-07, - "loss": 0.3398, - "step": 79879 - }, - { - "epoch": 2.05, - "learning_rate": 4.838576117206563e-07, - "loss": 0.4221, - "step": 79880 - }, - { - "epoch": 2.05, - "learning_rate": 4.838339120971972e-07, - "loss": 0.3984, - "step": 79881 - }, - { - "epoch": 2.05, - "learning_rate": 4.838102128689422e-07, - "loss": 0.3687, - "step": 79882 - }, - { - "epoch": 2.05, - "learning_rate": 4.837865140359101e-07, - "loss": 0.3999, - "step": 79883 - }, - { - "epoch": 2.05, - "learning_rate": 4.837628155981189e-07, - "loss": 0.3621, - "step": 79884 - }, - { - "epoch": 2.05, - "learning_rate": 4.837391175555873e-07, - "loss": 0.4727, - "step": 79885 - }, - { - "epoch": 2.05, - "learning_rate": 4.837154199083323e-07, - "loss": 0.3538, - "step": 79886 - }, - { - "epoch": 2.05, - "learning_rate": 4.836917226563728e-07, - "loss": 0.3689, - "step": 79887 - }, - { - "epoch": 2.05, - "learning_rate": 4.836680257997269e-07, - "loss": 0.4849, - "step": 79888 - }, - { - "epoch": 2.05, - "learning_rate": 4.836443293384128e-07, - "loss": 0.3916, - "step": 79889 - }, - { - "epoch": 2.05, - "learning_rate": 4.836206332724487e-07, - "loss": 0.4766, - "step": 79890 - }, - { - "epoch": 2.05, - "learning_rate": 4.835969376018521e-07, - "loss": 0.3424, - "step": 79891 - }, - { - "epoch": 2.05, - "learning_rate": 4.835732423266416e-07, - "loss": 0.4039, - "step": 79892 - }, - { - "epoch": 2.05, - "learning_rate": 4.835495474468356e-07, - "loss": 0.4214, - "step": 79893 - }, - { - "epoch": 2.05, - "learning_rate": 4.835258529624516e-07, - "loss": 0.4326, - "step": 79894 - }, - { - "epoch": 2.05, - "learning_rate": 4.835021588735082e-07, - "loss": 0.3818, - "step": 79895 - }, - { - "epoch": 2.05, - "learning_rate": 4.834784651800233e-07, - "loss": 0.4243, - "step": 79896 - }, - { - "epoch": 2.05, - "learning_rate": 4.834547718820157e-07, - "loss": 0.4468, - "step": 79897 - }, - { - "epoch": 2.05, - "learning_rate": 4.834310789795026e-07, - "loss": 0.4419, - "step": 79898 - }, - { - "epoch": 2.05, - "learning_rate": 4.83407386472503e-07, - "loss": 0.4023, - "step": 79899 - }, - { - "epoch": 2.05, - "learning_rate": 4.833836943610342e-07, - "loss": 0.4854, - "step": 79900 - }, - { - "epoch": 2.05, - "learning_rate": 4.833600026451148e-07, - "loss": 0.3462, - "step": 79901 - }, - { - "epoch": 2.05, - "learning_rate": 4.833363113247631e-07, - "loss": 0.2418, - "step": 79902 - }, - { - "epoch": 2.05, - "learning_rate": 4.833126203999968e-07, - "loss": 0.4246, - "step": 79903 - }, - { - "epoch": 2.05, - "learning_rate": 4.832889298708342e-07, - "loss": 0.3193, - "step": 79904 - }, - { - "epoch": 2.05, - "learning_rate": 4.832652397372936e-07, - "loss": 0.4185, - "step": 79905 - }, - { - "epoch": 2.05, - "learning_rate": 4.832415499993934e-07, - "loss": 0.4517, - "step": 79906 - }, - { - "epoch": 2.05, - "learning_rate": 4.83217860657151e-07, - "loss": 0.4141, - "step": 79907 - }, - { - "epoch": 2.05, - "learning_rate": 4.831941717105849e-07, - "loss": 0.4346, - "step": 79908 - }, - { - "epoch": 2.05, - "learning_rate": 4.831704831597135e-07, - "loss": 0.4351, - "step": 79909 - }, - { - "epoch": 2.05, - "learning_rate": 4.831467950045545e-07, - "loss": 0.3402, - "step": 79910 - }, - { - "epoch": 2.05, - "learning_rate": 4.831231072451266e-07, - "loss": 0.5142, - "step": 79911 - }, - { - "epoch": 2.05, - "learning_rate": 4.83099419881447e-07, - "loss": 0.5415, - "step": 79912 - }, - { - "epoch": 2.05, - "learning_rate": 4.830757329135346e-07, - "loss": 0.5542, - "step": 79913 - }, - { - "epoch": 2.05, - "learning_rate": 4.830520463414077e-07, - "loss": 0.3496, - "step": 79914 - }, - { - "epoch": 2.05, - "learning_rate": 4.830283601650838e-07, - "loss": 0.3735, - "step": 79915 - }, - { - "epoch": 2.05, - "learning_rate": 4.830046743845811e-07, - "loss": 0.3975, - "step": 79916 - }, - { - "epoch": 2.05, - "learning_rate": 4.829809889999181e-07, - "loss": 0.5156, - "step": 79917 - }, - { - "epoch": 2.05, - "learning_rate": 4.829573040111132e-07, - "loss": 0.4465, - "step": 79918 - }, - { - "epoch": 2.05, - "learning_rate": 4.829336194181839e-07, - "loss": 0.4126, - "step": 79919 - }, - { - "epoch": 2.05, - "learning_rate": 4.829099352211483e-07, - "loss": 0.3245, - "step": 79920 - }, - { - "epoch": 2.05, - "learning_rate": 4.828862514200249e-07, - "loss": 0.396, - "step": 79921 - }, - { - "epoch": 2.05, - "learning_rate": 4.828625680148315e-07, - "loss": 0.3105, - "step": 79922 - }, - { - "epoch": 2.05, - "learning_rate": 4.828388850055869e-07, - "loss": 0.4526, - "step": 79923 - }, - { - "epoch": 2.05, - "learning_rate": 4.828152023923084e-07, - "loss": 0.4268, - "step": 79924 - }, - { - "epoch": 2.05, - "learning_rate": 4.827915201750147e-07, - "loss": 0.3818, - "step": 79925 - }, - { - "epoch": 2.05, - "learning_rate": 4.827678383537236e-07, - "loss": 0.3823, - "step": 79926 - }, - { - "epoch": 2.05, - "learning_rate": 4.827441569284537e-07, - "loss": 0.2917, - "step": 79927 - }, - { - "epoch": 2.05, - "learning_rate": 4.827204758992225e-07, - "loss": 0.3882, - "step": 79928 - }, - { - "epoch": 2.05, - "learning_rate": 4.826967952660489e-07, - "loss": 0.2955, - "step": 79929 - }, - { - "epoch": 2.05, - "learning_rate": 4.826731150289501e-07, - "loss": 0.3923, - "step": 79930 - }, - { - "epoch": 2.05, - "learning_rate": 4.826494351879451e-07, - "loss": 0.3752, - "step": 79931 - }, - { - "epoch": 2.05, - "learning_rate": 4.826257557430513e-07, - "loss": 0.4746, - "step": 79932 - }, - { - "epoch": 2.05, - "learning_rate": 4.826020766942872e-07, - "loss": 0.3347, - "step": 79933 - }, - { - "epoch": 2.05, - "learning_rate": 4.825783980416708e-07, - "loss": 0.2912, - "step": 79934 - }, - { - "epoch": 2.05, - "learning_rate": 4.825547197852207e-07, - "loss": 0.4526, - "step": 79935 - }, - { - "epoch": 2.05, - "learning_rate": 4.825310419249545e-07, - "loss": 0.4697, - "step": 79936 - }, - { - "epoch": 2.05, - "learning_rate": 4.825073644608903e-07, - "loss": 0.481, - "step": 79937 - }, - { - "epoch": 2.05, - "learning_rate": 4.824836873930463e-07, - "loss": 0.4558, - "step": 79938 - }, - { - "epoch": 2.05, - "learning_rate": 4.824600107214414e-07, - "loss": 0.4399, - "step": 79939 - }, - { - "epoch": 2.05, - "learning_rate": 4.824363344460929e-07, - "loss": 0.4902, - "step": 79940 - }, - { - "epoch": 2.05, - "learning_rate": 4.824126585670188e-07, - "loss": 0.4116, - "step": 79941 - }, - { - "epoch": 2.05, - "learning_rate": 4.823889830842375e-07, - "loss": 0.4497, - "step": 79942 - }, - { - "epoch": 2.05, - "learning_rate": 4.823653079977671e-07, - "loss": 0.3672, - "step": 79943 - }, - { - "epoch": 2.05, - "learning_rate": 4.823416333076262e-07, - "loss": 0.4678, - "step": 79944 - }, - { - "epoch": 2.05, - "learning_rate": 4.823179590138321e-07, - "loss": 0.415, - "step": 79945 - }, - { - "epoch": 2.05, - "learning_rate": 4.822942851164033e-07, - "loss": 0.4785, - "step": 79946 - }, - { - "epoch": 2.05, - "learning_rate": 4.822706116153581e-07, - "loss": 0.2102, - "step": 79947 - }, - { - "epoch": 2.05, - "learning_rate": 4.822469385107148e-07, - "loss": 0.3667, - "step": 79948 - }, - { - "epoch": 2.05, - "learning_rate": 4.822232658024912e-07, - "loss": 0.3724, - "step": 79949 - }, - { - "epoch": 2.05, - "learning_rate": 4.821995934907051e-07, - "loss": 0.4067, - "step": 79950 - }, - { - "epoch": 2.05, - "learning_rate": 4.821759215753749e-07, - "loss": 0.2727, - "step": 79951 - }, - { - "epoch": 2.05, - "learning_rate": 4.821522500565191e-07, - "loss": 0.3127, - "step": 79952 - }, - { - "epoch": 2.05, - "learning_rate": 4.821285789341554e-07, - "loss": 0.3257, - "step": 79953 - }, - { - "epoch": 2.05, - "learning_rate": 4.821049082083017e-07, - "loss": 0.5283, - "step": 79954 - }, - { - "epoch": 2.05, - "learning_rate": 4.820812378789767e-07, - "loss": 0.3691, - "step": 79955 - }, - { - "epoch": 2.05, - "learning_rate": 4.820575679461985e-07, - "loss": 0.4351, - "step": 79956 - }, - { - "epoch": 2.05, - "learning_rate": 4.820338984099847e-07, - "loss": 0.353, - "step": 79957 - }, - { - "epoch": 2.05, - "learning_rate": 4.820102292703538e-07, - "loss": 0.5107, - "step": 79958 - }, - { - "epoch": 2.05, - "learning_rate": 4.819865605273242e-07, - "loss": 0.2261, - "step": 79959 - }, - { - "epoch": 2.05, - "learning_rate": 4.819628921809133e-07, - "loss": 0.5256, - "step": 79960 - }, - { - "epoch": 2.05, - "learning_rate": 4.819392242311398e-07, - "loss": 0.3765, - "step": 79961 - }, - { - "epoch": 2.05, - "learning_rate": 4.819155566780214e-07, - "loss": 0.5815, - "step": 79962 - }, - { - "epoch": 2.05, - "learning_rate": 4.818918895215764e-07, - "loss": 0.3735, - "step": 79963 - }, - { - "epoch": 2.05, - "learning_rate": 4.818682227618229e-07, - "loss": 0.5073, - "step": 79964 - }, - { - "epoch": 2.05, - "learning_rate": 4.818445563987797e-07, - "loss": 0.519, - "step": 79965 - }, - { - "epoch": 2.05, - "learning_rate": 4.818208904324636e-07, - "loss": 0.4321, - "step": 79966 - }, - { - "epoch": 2.05, - "learning_rate": 4.817972248628935e-07, - "loss": 0.4668, - "step": 79967 - }, - { - "epoch": 2.05, - "learning_rate": 4.817735596900879e-07, - "loss": 0.4624, - "step": 79968 - }, - { - "epoch": 2.05, - "learning_rate": 4.817498949140645e-07, - "loss": 0.2599, - "step": 79969 - }, - { - "epoch": 2.05, - "learning_rate": 4.817262305348409e-07, - "loss": 0.5098, - "step": 79970 - }, - { - "epoch": 2.05, - "learning_rate": 4.817025665524357e-07, - "loss": 0.5605, - "step": 79971 - }, - { - "epoch": 2.05, - "learning_rate": 4.816789029668669e-07, - "loss": 0.2808, - "step": 79972 - }, - { - "epoch": 2.05, - "learning_rate": 4.816552397781533e-07, - "loss": 0.4282, - "step": 79973 - }, - { - "epoch": 2.05, - "learning_rate": 4.816315769863121e-07, - "loss": 0.4062, - "step": 79974 - }, - { - "epoch": 2.05, - "learning_rate": 4.816079145913616e-07, - "loss": 0.4429, - "step": 79975 - }, - { - "epoch": 2.05, - "learning_rate": 4.815842525933201e-07, - "loss": 0.4131, - "step": 79976 - }, - { - "epoch": 2.05, - "learning_rate": 4.815605909922063e-07, - "loss": 0.4766, - "step": 79977 - }, - { - "epoch": 2.05, - "learning_rate": 4.815369297880371e-07, - "loss": 0.2898, - "step": 79978 - }, - { - "epoch": 2.05, - "learning_rate": 4.815132689808317e-07, - "loss": 0.4771, - "step": 79979 - }, - { - "epoch": 2.05, - "learning_rate": 4.814896085706073e-07, - "loss": 0.3019, - "step": 79980 - }, - { - "epoch": 2.05, - "learning_rate": 4.814659485573825e-07, - "loss": 0.478, - "step": 79981 - }, - { - "epoch": 2.05, - "learning_rate": 4.814422889411757e-07, - "loss": 0.4014, - "step": 79982 - }, - { - "epoch": 2.05, - "learning_rate": 4.814186297220045e-07, - "loss": 0.3464, - "step": 79983 - }, - { - "epoch": 2.05, - "learning_rate": 4.813949708998871e-07, - "loss": 0.4478, - "step": 79984 - }, - { - "epoch": 2.05, - "learning_rate": 4.813713124748422e-07, - "loss": 0.2253, - "step": 79985 - }, - { - "epoch": 2.05, - "learning_rate": 4.81347654446887e-07, - "loss": 0.458, - "step": 79986 - }, - { - "epoch": 2.05, - "learning_rate": 4.8132399681604e-07, - "loss": 0.4058, - "step": 79987 - }, - { - "epoch": 2.05, - "learning_rate": 4.813003395823193e-07, - "loss": 0.4341, - "step": 79988 - }, - { - "epoch": 2.05, - "learning_rate": 4.812766827457435e-07, - "loss": 0.5054, - "step": 79989 - }, - { - "epoch": 2.05, - "learning_rate": 4.812530263063303e-07, - "loss": 0.417, - "step": 79990 - }, - { - "epoch": 2.05, - "learning_rate": 4.812293702640976e-07, - "loss": 0.3774, - "step": 79991 - }, - { - "epoch": 2.05, - "learning_rate": 4.812057146190636e-07, - "loss": 0.4565, - "step": 79992 - }, - { - "epoch": 2.05, - "learning_rate": 4.811820593712465e-07, - "loss": 0.5327, - "step": 79993 - }, - { - "epoch": 2.05, - "learning_rate": 4.811584045206648e-07, - "loss": 0.3313, - "step": 79994 - }, - { - "epoch": 2.05, - "learning_rate": 4.811347500673359e-07, - "loss": 0.3779, - "step": 79995 - }, - { - "epoch": 2.05, - "learning_rate": 4.811110960112783e-07, - "loss": 0.3782, - "step": 79996 - }, - { - "epoch": 2.05, - "learning_rate": 4.810874423525099e-07, - "loss": 0.3647, - "step": 79997 - }, - { - "epoch": 2.05, - "learning_rate": 4.810637890910496e-07, - "loss": 0.4595, - "step": 79998 - }, - { - "epoch": 2.05, - "learning_rate": 4.810401362269149e-07, - "loss": 0.4429, - "step": 79999 - }, - { - "epoch": 2.05, - "learning_rate": 4.810164837601233e-07, - "loss": 0.2094, - "step": 80000 - }, - { - "epoch": 2.05, - "learning_rate": 4.809928316906937e-07, - "loss": 0.478, - "step": 80001 - }, - { - "epoch": 2.05, - "learning_rate": 4.809691800186444e-07, - "loss": 0.3979, - "step": 80002 - }, - { - "epoch": 2.05, - "learning_rate": 4.809455287439927e-07, - "loss": 0.4854, - "step": 80003 - }, - { - "epoch": 2.05, - "learning_rate": 4.80921877866757e-07, - "loss": 0.3679, - "step": 80004 - }, - { - "epoch": 2.05, - "learning_rate": 4.808982273869558e-07, - "loss": 0.3752, - "step": 80005 - }, - { - "epoch": 2.05, - "learning_rate": 4.808745773046073e-07, - "loss": 0.3575, - "step": 80006 - }, - { - "epoch": 2.05, - "learning_rate": 4.808509276197288e-07, - "loss": 0.3848, - "step": 80007 - }, - { - "epoch": 2.05, - "learning_rate": 4.808272783323389e-07, - "loss": 0.5474, - "step": 80008 - }, - { - "epoch": 2.05, - "learning_rate": 4.80803629442456e-07, - "loss": 0.3726, - "step": 80009 - }, - { - "epoch": 2.05, - "learning_rate": 4.807799809500975e-07, - "loss": 0.4082, - "step": 80010 - }, - { - "epoch": 2.05, - "learning_rate": 4.807563328552824e-07, - "loss": 0.394, - "step": 80011 - }, - { - "epoch": 2.05, - "learning_rate": 4.807326851580279e-07, - "loss": 0.3645, - "step": 80012 - }, - { - "epoch": 2.05, - "learning_rate": 4.807090378583523e-07, - "loss": 0.3838, - "step": 80013 - }, - { - "epoch": 2.05, - "learning_rate": 4.806853909562742e-07, - "loss": 0.4473, - "step": 80014 - }, - { - "epoch": 2.05, - "learning_rate": 4.806617444518117e-07, - "loss": 0.2947, - "step": 80015 - }, - { - "epoch": 2.05, - "learning_rate": 4.806380983449822e-07, - "loss": 0.4424, - "step": 80016 - }, - { - "epoch": 2.05, - "learning_rate": 4.806144526358042e-07, - "loss": 0.4253, - "step": 80017 - }, - { - "epoch": 2.05, - "learning_rate": 4.805908073242959e-07, - "loss": 0.2925, - "step": 80018 - }, - { - "epoch": 2.05, - "learning_rate": 4.805671624104761e-07, - "loss": 0.4191, - "step": 80019 - }, - { - "epoch": 2.05, - "learning_rate": 4.805435178943613e-07, - "loss": 0.2361, - "step": 80020 - }, - { - "epoch": 2.05, - "learning_rate": 4.805198737759705e-07, - "loss": 0.3389, - "step": 80021 - }, - { - "epoch": 2.05, - "learning_rate": 4.804962300553217e-07, - "loss": 0.5381, - "step": 80022 - }, - { - "epoch": 2.05, - "learning_rate": 4.804725867324335e-07, - "loss": 0.3413, - "step": 80023 - }, - { - "epoch": 2.05, - "learning_rate": 4.804489438073232e-07, - "loss": 0.3723, - "step": 80024 - }, - { - "epoch": 2.05, - "learning_rate": 4.804253012800092e-07, - "loss": 0.3683, - "step": 80025 - }, - { - "epoch": 2.05, - "learning_rate": 4.804016591505096e-07, - "loss": 0.2881, - "step": 80026 - }, - { - "epoch": 2.05, - "learning_rate": 4.803780174188429e-07, - "loss": 0.4253, - "step": 80027 - }, - { - "epoch": 2.05, - "learning_rate": 4.803543760850266e-07, - "loss": 0.417, - "step": 80028 - }, - { - "epoch": 2.05, - "learning_rate": 4.803307351490795e-07, - "loss": 0.302, - "step": 80029 - }, - { - "epoch": 2.05, - "learning_rate": 4.803070946110187e-07, - "loss": 0.5156, - "step": 80030 - }, - { - "epoch": 2.05, - "learning_rate": 4.802834544708631e-07, - "loss": 0.3745, - "step": 80031 - }, - { - "epoch": 2.05, - "learning_rate": 4.802598147286307e-07, - "loss": 0.4135, - "step": 80032 - }, - { - "epoch": 2.05, - "learning_rate": 4.802361753843391e-07, - "loss": 0.4531, - "step": 80033 - }, - { - "epoch": 2.05, - "learning_rate": 4.802125364380069e-07, - "loss": 0.4663, - "step": 80034 - }, - { - "epoch": 2.05, - "learning_rate": 4.80188897889652e-07, - "loss": 0.3912, - "step": 80035 - }, - { - "epoch": 2.05, - "learning_rate": 4.801652597392928e-07, - "loss": 0.459, - "step": 80036 - }, - { - "epoch": 2.05, - "learning_rate": 4.801416219869471e-07, - "loss": 0.4771, - "step": 80037 - }, - { - "epoch": 2.05, - "learning_rate": 4.801179846326328e-07, - "loss": 0.3088, - "step": 80038 - }, - { - "epoch": 2.05, - "learning_rate": 4.800943476763687e-07, - "loss": 0.3079, - "step": 80039 - }, - { - "epoch": 2.05, - "learning_rate": 4.800707111181724e-07, - "loss": 0.354, - "step": 80040 - }, - { - "epoch": 2.05, - "learning_rate": 4.800470749580617e-07, - "loss": 0.3778, - "step": 80041 - }, - { - "epoch": 2.05, - "learning_rate": 4.800234391960552e-07, - "loss": 0.4673, - "step": 80042 - }, - { - "epoch": 2.05, - "learning_rate": 4.799998038321707e-07, - "loss": 0.3024, - "step": 80043 - }, - { - "epoch": 2.05, - "learning_rate": 4.799761688664267e-07, - "loss": 0.364, - "step": 80044 - }, - { - "epoch": 2.05, - "learning_rate": 4.799525342988409e-07, - "loss": 0.4585, - "step": 80045 - }, - { - "epoch": 2.05, - "learning_rate": 4.799289001294315e-07, - "loss": 0.4849, - "step": 80046 - }, - { - "epoch": 2.05, - "learning_rate": 4.799052663582165e-07, - "loss": 0.4038, - "step": 80047 - }, - { - "epoch": 2.05, - "learning_rate": 4.798816329852145e-07, - "loss": 0.3892, - "step": 80048 - }, - { - "epoch": 2.05, - "learning_rate": 4.798580000104433e-07, - "loss": 0.3818, - "step": 80049 - }, - { - "epoch": 2.05, - "learning_rate": 4.798343674339205e-07, - "loss": 0.5532, - "step": 80050 - }, - { - "epoch": 2.05, - "learning_rate": 4.798107352556646e-07, - "loss": 0.3816, - "step": 80051 - }, - { - "epoch": 2.05, - "learning_rate": 4.797871034756938e-07, - "loss": 0.5444, - "step": 80052 - }, - { - "epoch": 2.05, - "learning_rate": 4.797634720940264e-07, - "loss": 0.4199, - "step": 80053 - }, - { - "epoch": 2.05, - "learning_rate": 4.797398411106797e-07, - "loss": 0.3523, - "step": 80054 - }, - { - "epoch": 2.05, - "learning_rate": 4.797162105256723e-07, - "loss": 0.3094, - "step": 80055 - }, - { - "epoch": 2.05, - "learning_rate": 4.796925803390228e-07, - "loss": 0.4492, - "step": 80056 - }, - { - "epoch": 2.05, - "learning_rate": 4.796689505507483e-07, - "loss": 0.5449, - "step": 80057 - }, - { - "epoch": 2.05, - "learning_rate": 4.796453211608674e-07, - "loss": 0.4302, - "step": 80058 - }, - { - "epoch": 2.05, - "learning_rate": 4.796216921693985e-07, - "loss": 0.3945, - "step": 80059 - }, - { - "epoch": 2.05, - "learning_rate": 4.79598063576359e-07, - "loss": 0.3857, - "step": 80060 - }, - { - "epoch": 2.05, - "learning_rate": 4.795744353817676e-07, - "loss": 0.5581, - "step": 80061 - }, - { - "epoch": 2.05, - "learning_rate": 4.79550807585642e-07, - "loss": 0.4536, - "step": 80062 - }, - { - "epoch": 2.05, - "learning_rate": 4.795271801880001e-07, - "loss": 0.3765, - "step": 80063 - }, - { - "epoch": 2.05, - "learning_rate": 4.795035531888605e-07, - "loss": 0.4146, - "step": 80064 - }, - { - "epoch": 2.05, - "learning_rate": 4.794799265882415e-07, - "loss": 0.4507, - "step": 80065 - }, - { - "epoch": 2.05, - "learning_rate": 4.794563003861602e-07, - "loss": 0.5078, - "step": 80066 - }, - { - "epoch": 2.05, - "learning_rate": 4.794326745826355e-07, - "loss": 0.3967, - "step": 80067 - }, - { - "epoch": 2.05, - "learning_rate": 4.794090491776851e-07, - "loss": 0.356, - "step": 80068 - }, - { - "epoch": 2.05, - "learning_rate": 4.793854241713277e-07, - "loss": 0.2376, - "step": 80069 - }, - { - "epoch": 2.05, - "learning_rate": 4.79361799563581e-07, - "loss": 0.3418, - "step": 80070 - }, - { - "epoch": 2.05, - "learning_rate": 4.793381753544626e-07, - "loss": 0.5186, - "step": 80071 - }, - { - "epoch": 2.05, - "learning_rate": 4.79314551543991e-07, - "loss": 0.3401, - "step": 80072 - }, - { - "epoch": 2.05, - "learning_rate": 4.792909281321843e-07, - "loss": 0.302, - "step": 80073 - }, - { - "epoch": 2.05, - "learning_rate": 4.79267305119061e-07, - "loss": 0.4336, - "step": 80074 - }, - { - "epoch": 2.05, - "learning_rate": 4.792436825046385e-07, - "loss": 0.3428, - "step": 80075 - }, - { - "epoch": 2.05, - "learning_rate": 4.79220060288935e-07, - "loss": 0.48, - "step": 80076 - }, - { - "epoch": 2.05, - "learning_rate": 4.791964384719692e-07, - "loss": 0.4268, - "step": 80077 - }, - { - "epoch": 2.05, - "learning_rate": 4.791728170537583e-07, - "loss": 0.4648, - "step": 80078 - }, - { - "epoch": 2.05, - "learning_rate": 4.791491960343214e-07, - "loss": 0.4951, - "step": 80079 - }, - { - "epoch": 2.05, - "learning_rate": 4.791255754136753e-07, - "loss": 0.3103, - "step": 80080 - }, - { - "epoch": 2.05, - "learning_rate": 4.791019551918392e-07, - "loss": 0.4893, - "step": 80081 - }, - { - "epoch": 2.05, - "learning_rate": 4.790783353688309e-07, - "loss": 0.3643, - "step": 80082 - }, - { - "epoch": 2.05, - "learning_rate": 4.79054715944668e-07, - "loss": 0.3325, - "step": 80083 - }, - { - "epoch": 2.05, - "learning_rate": 4.790310969193691e-07, - "loss": 0.3306, - "step": 80084 - }, - { - "epoch": 2.05, - "learning_rate": 4.79007478292952e-07, - "loss": 0.4189, - "step": 80085 - }, - { - "epoch": 2.05, - "learning_rate": 4.789838600654352e-07, - "loss": 0.2318, - "step": 80086 - }, - { - "epoch": 2.05, - "learning_rate": 4.789602422368363e-07, - "loss": 0.4419, - "step": 80087 - }, - { - "epoch": 2.05, - "learning_rate": 4.789366248071735e-07, - "loss": 0.3582, - "step": 80088 - }, - { - "epoch": 2.05, - "learning_rate": 4.789130077764654e-07, - "loss": 0.4907, - "step": 80089 - }, - { - "epoch": 2.05, - "learning_rate": 4.788893911447293e-07, - "loss": 0.2634, - "step": 80090 - }, - { - "epoch": 2.05, - "learning_rate": 4.788657749119839e-07, - "loss": 0.4492, - "step": 80091 - }, - { - "epoch": 2.05, - "learning_rate": 4.788421590782467e-07, - "loss": 0.2969, - "step": 80092 - }, - { - "epoch": 2.05, - "learning_rate": 4.788185436435361e-07, - "loss": 0.3945, - "step": 80093 - }, - { - "epoch": 2.05, - "learning_rate": 4.787949286078705e-07, - "loss": 0.3868, - "step": 80094 - }, - { - "epoch": 2.05, - "learning_rate": 4.787713139712674e-07, - "loss": 0.4021, - "step": 80095 - }, - { - "epoch": 2.05, - "learning_rate": 4.787476997337449e-07, - "loss": 0.4985, - "step": 80096 - }, - { - "epoch": 2.05, - "learning_rate": 4.787240858953215e-07, - "loss": 0.4341, - "step": 80097 - }, - { - "epoch": 2.05, - "learning_rate": 4.787004724560155e-07, - "loss": 0.3706, - "step": 80098 - }, - { - "epoch": 2.05, - "learning_rate": 4.786768594158446e-07, - "loss": 0.5161, - "step": 80099 - }, - { - "epoch": 2.05, - "learning_rate": 4.786532467748264e-07, - "loss": 0.2827, - "step": 80100 - }, - { - "epoch": 2.05, - "learning_rate": 4.786296345329795e-07, - "loss": 0.5195, - "step": 80101 - }, - { - "epoch": 2.05, - "learning_rate": 4.786060226903218e-07, - "loss": 0.4146, - "step": 80102 - }, - { - "epoch": 2.05, - "learning_rate": 4.785824112468719e-07, - "loss": 0.3562, - "step": 80103 - }, - { - "epoch": 2.05, - "learning_rate": 4.785588002026471e-07, - "loss": 0.4536, - "step": 80104 - }, - { - "epoch": 2.05, - "learning_rate": 4.78535189557666e-07, - "loss": 0.3647, - "step": 80105 - }, - { - "epoch": 2.05, - "learning_rate": 4.785115793119464e-07, - "loss": 0.3726, - "step": 80106 - }, - { - "epoch": 2.05, - "learning_rate": 4.784879694655069e-07, - "loss": 0.4346, - "step": 80107 - }, - { - "epoch": 2.05, - "learning_rate": 4.784643600183651e-07, - "loss": 0.4011, - "step": 80108 - }, - { - "epoch": 2.05, - "learning_rate": 4.784407509705389e-07, - "loss": 0.4277, - "step": 80109 - }, - { - "epoch": 2.05, - "learning_rate": 4.784171423220466e-07, - "loss": 0.3547, - "step": 80110 - }, - { - "epoch": 2.05, - "learning_rate": 4.783935340729067e-07, - "loss": 0.4397, - "step": 80111 - }, - { - "epoch": 2.05, - "learning_rate": 4.783699262231364e-07, - "loss": 0.4044, - "step": 80112 - }, - { - "epoch": 2.05, - "learning_rate": 4.783463187727544e-07, - "loss": 0.478, - "step": 80113 - }, - { - "epoch": 2.05, - "learning_rate": 4.783227117217786e-07, - "loss": 0.4097, - "step": 80114 - }, - { - "epoch": 2.05, - "learning_rate": 4.782991050702274e-07, - "loss": 0.2642, - "step": 80115 - }, - { - "epoch": 2.05, - "learning_rate": 4.782754988181183e-07, - "loss": 0.5137, - "step": 80116 - }, - { - "epoch": 2.05, - "learning_rate": 4.782518929654698e-07, - "loss": 0.4199, - "step": 80117 - }, - { - "epoch": 2.05, - "learning_rate": 4.782282875123e-07, - "loss": 0.3872, - "step": 80118 - }, - { - "epoch": 2.05, - "learning_rate": 4.782046824586265e-07, - "loss": 0.4927, - "step": 80119 - }, - { - "epoch": 2.05, - "learning_rate": 4.781810778044681e-07, - "loss": 0.3596, - "step": 80120 - }, - { - "epoch": 2.05, - "learning_rate": 4.781574735498419e-07, - "loss": 0.293, - "step": 80121 - }, - { - "epoch": 2.05, - "learning_rate": 4.781338696947667e-07, - "loss": 0.365, - "step": 80122 - }, - { - "epoch": 2.05, - "learning_rate": 4.781102662392603e-07, - "loss": 0.2646, - "step": 80123 - }, - { - "epoch": 2.05, - "learning_rate": 4.780866631833414e-07, - "loss": 0.5059, - "step": 80124 - }, - { - "epoch": 2.05, - "learning_rate": 4.78063060527027e-07, - "loss": 0.4106, - "step": 80125 - }, - { - "epoch": 2.05, - "learning_rate": 4.780394582703358e-07, - "loss": 0.3108, - "step": 80126 - }, - { - "epoch": 2.05, - "learning_rate": 4.780158564132858e-07, - "loss": 0.4185, - "step": 80127 - }, - { - "epoch": 2.05, - "learning_rate": 4.779922549558958e-07, - "loss": 0.375, - "step": 80128 - }, - { - "epoch": 2.05, - "learning_rate": 4.779686538981823e-07, - "loss": 0.46, - "step": 80129 - }, - { - "epoch": 2.05, - "learning_rate": 4.779450532401643e-07, - "loss": 0.4371, - "step": 80130 - }, - { - "epoch": 2.05, - "learning_rate": 4.779214529818597e-07, - "loss": 0.4629, - "step": 80131 - }, - { - "epoch": 2.05, - "learning_rate": 4.77897853123287e-07, - "loss": 0.5186, - "step": 80132 - }, - { - "epoch": 2.05, - "learning_rate": 4.778742536644637e-07, - "loss": 0.5005, - "step": 80133 - }, - { - "epoch": 2.05, - "learning_rate": 4.778506546054078e-07, - "loss": 0.4419, - "step": 80134 - }, - { - "epoch": 2.05, - "learning_rate": 4.778270559461378e-07, - "loss": 0.3047, - "step": 80135 - }, - { - "epoch": 2.05, - "learning_rate": 4.778034576866721e-07, - "loss": 0.3857, - "step": 80136 - }, - { - "epoch": 2.05, - "learning_rate": 4.777798598270277e-07, - "loss": 0.3215, - "step": 80137 - }, - { - "epoch": 2.05, - "learning_rate": 4.777562623672238e-07, - "loss": 0.4526, - "step": 80138 - }, - { - "epoch": 2.05, - "learning_rate": 4.777326653072774e-07, - "loss": 0.501, - "step": 80139 - }, - { - "epoch": 2.05, - "learning_rate": 4.777090686472071e-07, - "loss": 0.4614, - "step": 80140 - }, - { - "epoch": 2.05, - "learning_rate": 4.776854723870314e-07, - "loss": 0.4482, - "step": 80141 - }, - { - "epoch": 2.05, - "learning_rate": 4.776618765267674e-07, - "loss": 0.3604, - "step": 80142 - }, - { - "epoch": 2.05, - "learning_rate": 4.776382810664339e-07, - "loss": 0.4099, - "step": 80143 - }, - { - "epoch": 2.05, - "learning_rate": 4.776146860060486e-07, - "loss": 0.3979, - "step": 80144 - }, - { - "epoch": 2.05, - "learning_rate": 4.775910913456302e-07, - "loss": 0.3364, - "step": 80145 - }, - { - "epoch": 2.05, - "learning_rate": 4.775674970851958e-07, - "loss": 0.4951, - "step": 80146 - }, - { - "epoch": 2.05, - "learning_rate": 4.775439032247639e-07, - "loss": 0.4414, - "step": 80147 - }, - { - "epoch": 2.05, - "learning_rate": 4.775203097643531e-07, - "loss": 0.5229, - "step": 80148 - }, - { - "epoch": 2.05, - "learning_rate": 4.77496716703981e-07, - "loss": 0.4194, - "step": 80149 - }, - { - "epoch": 2.05, - "learning_rate": 4.774731240436651e-07, - "loss": 0.4248, - "step": 80150 - }, - { - "epoch": 2.05, - "learning_rate": 4.774495317834241e-07, - "loss": 0.2455, - "step": 80151 - }, - { - "epoch": 2.05, - "learning_rate": 4.774259399232759e-07, - "loss": 0.4951, - "step": 80152 - }, - { - "epoch": 2.05, - "learning_rate": 4.774023484632393e-07, - "loss": 0.3459, - "step": 80153 - }, - { - "epoch": 2.05, - "learning_rate": 4.77378757403331e-07, - "loss": 0.3735, - "step": 80154 - }, - { - "epoch": 2.05, - "learning_rate": 4.773551667435697e-07, - "loss": 0.3853, - "step": 80155 - }, - { - "epoch": 2.05, - "learning_rate": 4.773315764839738e-07, - "loss": 0.311, - "step": 80156 - }, - { - "epoch": 2.05, - "learning_rate": 4.773079866245613e-07, - "loss": 0.3423, - "step": 80157 - }, - { - "epoch": 2.05, - "learning_rate": 4.772843971653501e-07, - "loss": 0.2499, - "step": 80158 - }, - { - "epoch": 2.05, - "learning_rate": 4.772608081063577e-07, - "loss": 0.4019, - "step": 80159 - }, - { - "epoch": 2.05, - "learning_rate": 4.772372194476028e-07, - "loss": 0.373, - "step": 80160 - }, - { - "epoch": 2.05, - "learning_rate": 4.772136311891032e-07, - "loss": 0.4214, - "step": 80161 - }, - { - "epoch": 2.05, - "learning_rate": 4.771900433308775e-07, - "loss": 0.3262, - "step": 80162 - }, - { - "epoch": 2.05, - "learning_rate": 4.77166455872943e-07, - "loss": 0.4226, - "step": 80163 - }, - { - "epoch": 2.05, - "learning_rate": 4.771428688153182e-07, - "loss": 0.4099, - "step": 80164 - }, - { - "epoch": 2.05, - "learning_rate": 4.771192821580213e-07, - "loss": 0.4419, - "step": 80165 - }, - { - "epoch": 2.05, - "learning_rate": 4.770956959010698e-07, - "loss": 0.2192, - "step": 80166 - }, - { - "epoch": 2.05, - "learning_rate": 4.770721100444821e-07, - "loss": 0.4839, - "step": 80167 - }, - { - "epoch": 2.05, - "learning_rate": 4.770485245882766e-07, - "loss": 0.3728, - "step": 80168 - }, - { - "epoch": 2.05, - "learning_rate": 4.770249395324706e-07, - "loss": 0.4019, - "step": 80169 - }, - { - "epoch": 2.05, - "learning_rate": 4.770013548770829e-07, - "loss": 0.3574, - "step": 80170 - }, - { - "epoch": 2.05, - "learning_rate": 4.769777706221309e-07, - "loss": 0.2683, - "step": 80171 - }, - { - "epoch": 2.05, - "learning_rate": 4.76954186767633e-07, - "loss": 0.3575, - "step": 80172 - }, - { - "epoch": 2.05, - "learning_rate": 4.769306033136072e-07, - "loss": 0.3289, - "step": 80173 - }, - { - "epoch": 2.05, - "learning_rate": 4.769070202600719e-07, - "loss": 0.4668, - "step": 80174 - }, - { - "epoch": 2.05, - "learning_rate": 4.768834376070446e-07, - "loss": 0.5957, - "step": 80175 - }, - { - "epoch": 2.05, - "learning_rate": 4.768598553545434e-07, - "loss": 0.4255, - "step": 80176 - }, - { - "epoch": 2.05, - "learning_rate": 4.768362735025866e-07, - "loss": 0.3986, - "step": 80177 - }, - { - "epoch": 2.06, - "learning_rate": 4.768126920511927e-07, - "loss": 0.4287, - "step": 80178 - }, - { - "epoch": 2.06, - "learning_rate": 4.7678911100037923e-07, - "loss": 0.355, - "step": 80179 - }, - { - "epoch": 2.06, - "learning_rate": 4.767655303501639e-07, - "loss": 0.5361, - "step": 80180 - }, - { - "epoch": 2.06, - "learning_rate": 4.7674195010056504e-07, - "loss": 0.397, - "step": 80181 - }, - { - "epoch": 2.06, - "learning_rate": 4.7671837025160136e-07, - "loss": 0.4019, - "step": 80182 - }, - { - "epoch": 2.06, - "learning_rate": 4.766947908032899e-07, - "loss": 0.394, - "step": 80183 - }, - { - "epoch": 2.06, - "learning_rate": 4.7667121175564915e-07, - "loss": 0.4468, - "step": 80184 - }, - { - "epoch": 2.06, - "learning_rate": 4.7664763310869726e-07, - "loss": 0.502, - "step": 80185 - }, - { - "epoch": 2.06, - "learning_rate": 4.7662405486245247e-07, - "loss": 0.4419, - "step": 80186 - }, - { - "epoch": 2.06, - "learning_rate": 4.766004770169323e-07, - "loss": 0.3311, - "step": 80187 - }, - { - "epoch": 2.06, - "learning_rate": 4.7657689957215543e-07, - "loss": 0.3149, - "step": 80188 - }, - { - "epoch": 2.06, - "learning_rate": 4.7655332252813917e-07, - "loss": 0.5168, - "step": 80189 - }, - { - "epoch": 2.06, - "learning_rate": 4.76529745884902e-07, - "loss": 0.2542, - "step": 80190 - }, - { - "epoch": 2.06, - "learning_rate": 4.7650616964246226e-07, - "loss": 0.3669, - "step": 80191 - }, - { - "epoch": 2.06, - "learning_rate": 4.7648259380083733e-07, - "loss": 0.4656, - "step": 80192 - }, - { - "epoch": 2.06, - "learning_rate": 4.7645901836004565e-07, - "loss": 0.4629, - "step": 80193 - }, - { - "epoch": 2.06, - "learning_rate": 4.764354433201052e-07, - "loss": 0.4597, - "step": 80194 - }, - { - "epoch": 2.06, - "learning_rate": 4.7641186868103436e-07, - "loss": 0.4482, - "step": 80195 - }, - { - "epoch": 2.06, - "learning_rate": 4.763882944428506e-07, - "loss": 0.3779, - "step": 80196 - }, - { - "epoch": 2.06, - "learning_rate": 4.763647206055722e-07, - "loss": 0.5029, - "step": 80197 - }, - { - "epoch": 2.06, - "learning_rate": 4.7634114716921756e-07, - "loss": 0.3911, - "step": 80198 - }, - { - "epoch": 2.06, - "learning_rate": 4.763175741338046e-07, - "loss": 0.4375, - "step": 80199 - }, - { - "epoch": 2.06, - "learning_rate": 4.7629400149935064e-07, - "loss": 0.4048, - "step": 80200 - }, - { - "epoch": 2.06, - "learning_rate": 4.7627042926587436e-07, - "loss": 0.3374, - "step": 80201 - }, - { - "epoch": 2.06, - "learning_rate": 4.7624685743339375e-07, - "loss": 0.3098, - "step": 80202 - }, - { - "epoch": 2.06, - "learning_rate": 4.762232860019272e-07, - "loss": 0.2904, - "step": 80203 - }, - { - "epoch": 2.06, - "learning_rate": 4.76199714971492e-07, - "loss": 0.3193, - "step": 80204 - }, - { - "epoch": 2.06, - "learning_rate": 4.761761443421066e-07, - "loss": 0.4253, - "step": 80205 - }, - { - "epoch": 2.06, - "learning_rate": 4.761525741137891e-07, - "loss": 0.3275, - "step": 80206 - }, - { - "epoch": 2.06, - "learning_rate": 4.7612900428655776e-07, - "loss": 0.4277, - "step": 80207 - }, - { - "epoch": 2.06, - "learning_rate": 4.761054348604304e-07, - "loss": 0.4414, - "step": 80208 - }, - { - "epoch": 2.06, - "learning_rate": 4.760818658354246e-07, - "loss": 0.4098, - "step": 80209 - }, - { - "epoch": 2.06, - "learning_rate": 4.7605829721155887e-07, - "loss": 0.4785, - "step": 80210 - }, - { - "epoch": 2.06, - "learning_rate": 4.760347289888512e-07, - "loss": 0.3868, - "step": 80211 - }, - { - "epoch": 2.06, - "learning_rate": 4.760111611673201e-07, - "loss": 0.2522, - "step": 80212 - }, - { - "epoch": 2.06, - "learning_rate": 4.759875937469827e-07, - "loss": 0.5254, - "step": 80213 - }, - { - "epoch": 2.06, - "learning_rate": 4.759640267278575e-07, - "loss": 0.4028, - "step": 80214 - }, - { - "epoch": 2.06, - "learning_rate": 4.759404601099626e-07, - "loss": 0.4854, - "step": 80215 - }, - { - "epoch": 2.06, - "learning_rate": 4.7591689389331636e-07, - "loss": 0.4751, - "step": 80216 - }, - { - "epoch": 2.06, - "learning_rate": 4.7589332807793604e-07, - "loss": 0.4824, - "step": 80217 - }, - { - "epoch": 2.06, - "learning_rate": 4.758697626638405e-07, - "loss": 0.3042, - "step": 80218 - }, - { - "epoch": 2.06, - "learning_rate": 4.758461976510469e-07, - "loss": 0.3916, - "step": 80219 - }, - { - "epoch": 2.06, - "learning_rate": 4.758226330395744e-07, - "loss": 0.481, - "step": 80220 - }, - { - "epoch": 2.06, - "learning_rate": 4.757990688294398e-07, - "loss": 0.606, - "step": 80221 - }, - { - "epoch": 2.06, - "learning_rate": 4.757755050206619e-07, - "loss": 0.4658, - "step": 80222 - }, - { - "epoch": 2.06, - "learning_rate": 4.757519416132585e-07, - "loss": 0.4043, - "step": 80223 - }, - { - "epoch": 2.06, - "learning_rate": 4.757283786072481e-07, - "loss": 0.3833, - "step": 80224 - }, - { - "epoch": 2.06, - "learning_rate": 4.75704816002648e-07, - "loss": 0.4062, - "step": 80225 - }, - { - "epoch": 2.06, - "learning_rate": 4.756812537994767e-07, - "loss": 0.4185, - "step": 80226 - }, - { - "epoch": 2.06, - "learning_rate": 4.756576919977521e-07, - "loss": 0.4614, - "step": 80227 - }, - { - "epoch": 2.06, - "learning_rate": 4.7563413059749257e-07, - "loss": 0.5098, - "step": 80228 - }, - { - "epoch": 2.06, - "learning_rate": 4.7561056959871604e-07, - "loss": 0.4204, - "step": 80229 - }, - { - "epoch": 2.06, - "learning_rate": 4.755870090014399e-07, - "loss": 0.5205, - "step": 80230 - }, - { - "epoch": 2.06, - "learning_rate": 4.7556344880568267e-07, - "loss": 0.416, - "step": 80231 - }, - { - "epoch": 2.06, - "learning_rate": 4.755398890114625e-07, - "loss": 0.3735, - "step": 80232 - }, - { - "epoch": 2.06, - "learning_rate": 4.7551632961879763e-07, - "loss": 0.3716, - "step": 80233 - }, - { - "epoch": 2.06, - "learning_rate": 4.7549277062770543e-07, - "loss": 0.5229, - "step": 80234 - }, - { - "epoch": 2.06, - "learning_rate": 4.754692120382042e-07, - "loss": 0.3818, - "step": 80235 - }, - { - "epoch": 2.06, - "learning_rate": 4.7544565385031223e-07, - "loss": 0.4104, - "step": 80236 - }, - { - "epoch": 2.06, - "learning_rate": 4.754220960640477e-07, - "loss": 0.2992, - "step": 80237 - }, - { - "epoch": 2.06, - "learning_rate": 4.7539853867942834e-07, - "loss": 0.3342, - "step": 80238 - }, - { - "epoch": 2.06, - "learning_rate": 4.7537498169647185e-07, - "loss": 0.4185, - "step": 80239 - }, - { - "epoch": 2.06, - "learning_rate": 4.7535142511519655e-07, - "loss": 0.5151, - "step": 80240 - }, - { - "epoch": 2.06, - "learning_rate": 4.7532786893562106e-07, - "loss": 0.4658, - "step": 80241 - }, - { - "epoch": 2.06, - "learning_rate": 4.7530431315776243e-07, - "loss": 0.4443, - "step": 80242 - }, - { - "epoch": 2.06, - "learning_rate": 4.7528075778163914e-07, - "loss": 0.4102, - "step": 80243 - }, - { - "epoch": 2.06, - "learning_rate": 4.752572028072692e-07, - "loss": 0.3901, - "step": 80244 - }, - { - "epoch": 2.06, - "learning_rate": 4.7523364823467117e-07, - "loss": 0.4888, - "step": 80245 - }, - { - "epoch": 2.06, - "learning_rate": 4.7521009406386216e-07, - "loss": 0.4629, - "step": 80246 - }, - { - "epoch": 2.06, - "learning_rate": 4.751865402948607e-07, - "loss": 0.4756, - "step": 80247 - }, - { - "epoch": 2.06, - "learning_rate": 4.751629869276852e-07, - "loss": 0.4507, - "step": 80248 - }, - { - "epoch": 2.06, - "learning_rate": 4.751394339623528e-07, - "loss": 0.3386, - "step": 80249 - }, - { - "epoch": 2.06, - "learning_rate": 4.7511588139888234e-07, - "loss": 0.4565, - "step": 80250 - }, - { - "epoch": 2.06, - "learning_rate": 4.7509232923729123e-07, - "loss": 0.5078, - "step": 80251 - }, - { - "epoch": 2.06, - "learning_rate": 4.7506877747759777e-07, - "loss": 0.313, - "step": 80252 - }, - { - "epoch": 2.06, - "learning_rate": 4.7504522611982e-07, - "loss": 0.2368, - "step": 80253 - }, - { - "epoch": 2.06, - "learning_rate": 4.750216751639764e-07, - "loss": 0.5381, - "step": 80254 - }, - { - "epoch": 2.06, - "learning_rate": 4.7499812461008403e-07, - "loss": 0.4678, - "step": 80255 - }, - { - "epoch": 2.06, - "learning_rate": 4.749745744581616e-07, - "loss": 0.3357, - "step": 80256 - }, - { - "epoch": 2.06, - "learning_rate": 4.7495102470822734e-07, - "loss": 0.28, - "step": 80257 - }, - { - "epoch": 2.06, - "learning_rate": 4.74927475360299e-07, - "loss": 0.2958, - "step": 80258 - }, - { - "epoch": 2.06, - "learning_rate": 4.7490392641439403e-07, - "loss": 0.1877, - "step": 80259 - }, - { - "epoch": 2.06, - "learning_rate": 4.7488037787053104e-07, - "loss": 0.3604, - "step": 80260 - }, - { - "epoch": 2.06, - "learning_rate": 4.74856829728728e-07, - "loss": 0.4482, - "step": 80261 - }, - { - "epoch": 2.06, - "learning_rate": 4.748332819890033e-07, - "loss": 0.4453, - "step": 80262 - }, - { - "epoch": 2.06, - "learning_rate": 4.748097346513743e-07, - "loss": 0.5068, - "step": 80263 - }, - { - "epoch": 2.06, - "learning_rate": 4.747861877158593e-07, - "loss": 0.5337, - "step": 80264 - }, - { - "epoch": 2.06, - "learning_rate": 4.7476264118247636e-07, - "loss": 0.3755, - "step": 80265 - }, - { - "epoch": 2.06, - "learning_rate": 4.747390950512439e-07, - "loss": 0.4241, - "step": 80266 - }, - { - "epoch": 2.06, - "learning_rate": 4.7471554932217915e-07, - "loss": 0.4404, - "step": 80267 - }, - { - "epoch": 2.06, - "learning_rate": 4.7469200399530097e-07, - "loss": 0.4189, - "step": 80268 - }, - { - "epoch": 2.06, - "learning_rate": 4.746684590706266e-07, - "loss": 0.3662, - "step": 80269 - }, - { - "epoch": 2.06, - "learning_rate": 4.7464491454817437e-07, - "loss": 0.4966, - "step": 80270 - }, - { - "epoch": 2.06, - "learning_rate": 4.746213704279628e-07, - "loss": 0.3196, - "step": 80271 - }, - { - "epoch": 2.06, - "learning_rate": 4.7459782671000904e-07, - "loss": 0.3066, - "step": 80272 - }, - { - "epoch": 2.06, - "learning_rate": 4.745742833943316e-07, - "loss": 0.4849, - "step": 80273 - }, - { - "epoch": 2.06, - "learning_rate": 4.745507404809489e-07, - "loss": 0.3438, - "step": 80274 - }, - { - "epoch": 2.06, - "learning_rate": 4.745271979698782e-07, - "loss": 0.449, - "step": 80275 - }, - { - "epoch": 2.06, - "learning_rate": 4.7450365586113773e-07, - "loss": 0.4663, - "step": 80276 - }, - { - "epoch": 2.06, - "learning_rate": 4.7448011415474576e-07, - "loss": 0.3755, - "step": 80277 - }, - { - "epoch": 2.06, - "learning_rate": 4.744565728507205e-07, - "loss": 0.3191, - "step": 80278 - }, - { - "epoch": 2.06, - "learning_rate": 4.744330319490797e-07, - "loss": 0.3424, - "step": 80279 - }, - { - "epoch": 2.06, - "learning_rate": 4.74409491449841e-07, - "loss": 0.3442, - "step": 80280 - }, - { - "epoch": 2.06, - "learning_rate": 4.743859513530228e-07, - "loss": 0.4556, - "step": 80281 - }, - { - "epoch": 2.06, - "learning_rate": 4.743624116586431e-07, - "loss": 0.3761, - "step": 80282 - }, - { - "epoch": 2.06, - "learning_rate": 4.743388723667203e-07, - "loss": 0.4421, - "step": 80283 - }, - { - "epoch": 2.06, - "learning_rate": 4.743153334772717e-07, - "loss": 0.4336, - "step": 80284 - }, - { - "epoch": 2.06, - "learning_rate": 4.7429179499031555e-07, - "loss": 0.4021, - "step": 80285 - }, - { - "epoch": 2.06, - "learning_rate": 4.7426825690587013e-07, - "loss": 0.4956, - "step": 80286 - }, - { - "epoch": 2.06, - "learning_rate": 4.742447192239537e-07, - "loss": 0.3994, - "step": 80287 - }, - { - "epoch": 2.06, - "learning_rate": 4.7422118194458395e-07, - "loss": 0.4268, - "step": 80288 - }, - { - "epoch": 2.06, - "learning_rate": 4.741976450677784e-07, - "loss": 0.436, - "step": 80289 - }, - { - "epoch": 2.06, - "learning_rate": 4.741741085935556e-07, - "loss": 0.3447, - "step": 80290 - }, - { - "epoch": 2.06, - "learning_rate": 4.741505725219338e-07, - "loss": 0.3643, - "step": 80291 - }, - { - "epoch": 2.06, - "learning_rate": 4.7412703685293043e-07, - "loss": 0.4673, - "step": 80292 - }, - { - "epoch": 2.06, - "learning_rate": 4.7410350158656374e-07, - "loss": 0.3918, - "step": 80293 - }, - { - "epoch": 2.06, - "learning_rate": 4.740799667228519e-07, - "loss": 0.4133, - "step": 80294 - }, - { - "epoch": 2.06, - "learning_rate": 4.7405643226181314e-07, - "loss": 0.4446, - "step": 80295 - }, - { - "epoch": 2.06, - "learning_rate": 4.7403289820346493e-07, - "loss": 0.4478, - "step": 80296 - }, - { - "epoch": 2.06, - "learning_rate": 4.7400936454782546e-07, - "loss": 0.4158, - "step": 80297 - }, - { - "epoch": 2.06, - "learning_rate": 4.739858312949132e-07, - "loss": 0.423, - "step": 80298 - }, - { - "epoch": 2.06, - "learning_rate": 4.7396229844474546e-07, - "loss": 0.5928, - "step": 80299 - }, - { - "epoch": 2.06, - "learning_rate": 4.7393876599734094e-07, - "loss": 0.4038, - "step": 80300 - }, - { - "epoch": 2.06, - "learning_rate": 4.7391523395271695e-07, - "loss": 0.2812, - "step": 80301 - }, - { - "epoch": 2.06, - "learning_rate": 4.7389170231089195e-07, - "loss": 0.3796, - "step": 80302 - }, - { - "epoch": 2.06, - "learning_rate": 4.738681710718837e-07, - "loss": 0.4756, - "step": 80303 - }, - { - "epoch": 2.06, - "learning_rate": 4.738446402357109e-07, - "loss": 0.3287, - "step": 80304 - }, - { - "epoch": 2.06, - "learning_rate": 4.7382110980239075e-07, - "loss": 0.436, - "step": 80305 - }, - { - "epoch": 2.06, - "learning_rate": 4.7379757977194144e-07, - "loss": 0.4395, - "step": 80306 - }, - { - "epoch": 2.06, - "learning_rate": 4.7377405014438133e-07, - "loss": 0.4092, - "step": 80307 - }, - { - "epoch": 2.06, - "learning_rate": 4.737505209197288e-07, - "loss": 0.3999, - "step": 80308 - }, - { - "epoch": 2.06, - "learning_rate": 4.737269920980006e-07, - "loss": 0.4214, - "step": 80309 - }, - { - "epoch": 2.06, - "learning_rate": 4.737034636792154e-07, - "loss": 0.4041, - "step": 80310 - }, - { - "epoch": 2.06, - "learning_rate": 4.7367993566339135e-07, - "loss": 0.3923, - "step": 80311 - }, - { - "epoch": 2.06, - "learning_rate": 4.7365640805054676e-07, - "loss": 0.4214, - "step": 80312 - }, - { - "epoch": 2.06, - "learning_rate": 4.7363288084069873e-07, - "loss": 0.3541, - "step": 80313 - }, - { - "epoch": 2.06, - "learning_rate": 4.736093540338659e-07, - "loss": 0.5264, - "step": 80314 - }, - { - "epoch": 2.06, - "learning_rate": 4.7358582763006625e-07, - "loss": 0.267, - "step": 80315 - }, - { - "epoch": 2.06, - "learning_rate": 4.73562301629318e-07, - "loss": 0.4771, - "step": 80316 - }, - { - "epoch": 2.06, - "learning_rate": 4.735387760316386e-07, - "loss": 0.3402, - "step": 80317 - }, - { - "epoch": 2.06, - "learning_rate": 4.735152508370467e-07, - "loss": 0.4893, - "step": 80318 - }, - { - "epoch": 2.06, - "learning_rate": 4.734917260455595e-07, - "loss": 0.4287, - "step": 80319 - }, - { - "epoch": 2.06, - "learning_rate": 4.734682016571956e-07, - "loss": 0.5054, - "step": 80320 - }, - { - "epoch": 2.06, - "learning_rate": 4.7344467767197316e-07, - "loss": 0.3735, - "step": 80321 - }, - { - "epoch": 2.06, - "learning_rate": 4.7342115408990955e-07, - "loss": 0.3667, - "step": 80322 - }, - { - "epoch": 2.06, - "learning_rate": 4.7339763091102324e-07, - "loss": 0.3496, - "step": 80323 - }, - { - "epoch": 2.06, - "learning_rate": 4.733741081353321e-07, - "loss": 0.4482, - "step": 80324 - }, - { - "epoch": 2.06, - "learning_rate": 4.733505857628545e-07, - "loss": 0.4341, - "step": 80325 - }, - { - "epoch": 2.06, - "learning_rate": 4.733270637936079e-07, - "loss": 0.4021, - "step": 80326 - }, - { - "epoch": 2.06, - "learning_rate": 4.7330354222761037e-07, - "loss": 0.417, - "step": 80327 - }, - { - "epoch": 2.06, - "learning_rate": 4.7328002106488064e-07, - "loss": 0.48, - "step": 80328 - }, - { - "epoch": 2.06, - "learning_rate": 4.7325650030543606e-07, - "loss": 0.4233, - "step": 80329 - }, - { - "epoch": 2.06, - "learning_rate": 4.7323297994929446e-07, - "loss": 0.3828, - "step": 80330 - }, - { - "epoch": 2.06, - "learning_rate": 4.732094599964742e-07, - "loss": 0.2794, - "step": 80331 - }, - { - "epoch": 2.06, - "learning_rate": 4.731859404469931e-07, - "loss": 0.3293, - "step": 80332 - }, - { - "epoch": 2.06, - "learning_rate": 4.731624213008698e-07, - "loss": 0.3716, - "step": 80333 - }, - { - "epoch": 2.06, - "learning_rate": 4.731389025581213e-07, - "loss": 0.3745, - "step": 80334 - }, - { - "epoch": 2.06, - "learning_rate": 4.731153842187662e-07, - "loss": 0.3914, - "step": 80335 - }, - { - "epoch": 2.06, - "learning_rate": 4.730918662828224e-07, - "loss": 0.4551, - "step": 80336 - }, - { - "epoch": 2.06, - "learning_rate": 4.730683487503083e-07, - "loss": 0.3625, - "step": 80337 - }, - { - "epoch": 2.06, - "learning_rate": 4.7304483162124166e-07, - "loss": 0.3638, - "step": 80338 - }, - { - "epoch": 2.06, - "learning_rate": 4.730213148956398e-07, - "loss": 0.3635, - "step": 80339 - }, - { - "epoch": 2.06, - "learning_rate": 4.729977985735214e-07, - "loss": 0.4355, - "step": 80340 - }, - { - "epoch": 2.06, - "learning_rate": 4.7297428265490433e-07, - "loss": 0.4253, - "step": 80341 - }, - { - "epoch": 2.06, - "learning_rate": 4.7295076713980696e-07, - "loss": 0.4165, - "step": 80342 - }, - { - "epoch": 2.06, - "learning_rate": 4.7292725202824656e-07, - "loss": 0.3462, - "step": 80343 - }, - { - "epoch": 2.06, - "learning_rate": 4.7290373732024157e-07, - "loss": 0.418, - "step": 80344 - }, - { - "epoch": 2.06, - "learning_rate": 4.7288022301581045e-07, - "loss": 0.4365, - "step": 80345 - }, - { - "epoch": 2.06, - "learning_rate": 4.728567091149701e-07, - "loss": 0.4556, - "step": 80346 - }, - { - "epoch": 2.06, - "learning_rate": 4.7283319561773925e-07, - "loss": 0.319, - "step": 80347 - }, - { - "epoch": 2.06, - "learning_rate": 4.7280968252413623e-07, - "loss": 0.4517, - "step": 80348 - }, - { - "epoch": 2.06, - "learning_rate": 4.7278616983417807e-07, - "loss": 0.5044, - "step": 80349 - }, - { - "epoch": 2.06, - "learning_rate": 4.727626575478838e-07, - "loss": 0.3696, - "step": 80350 - }, - { - "epoch": 2.06, - "learning_rate": 4.727391456652704e-07, - "loss": 0.4702, - "step": 80351 - }, - { - "epoch": 2.06, - "learning_rate": 4.727156341863565e-07, - "loss": 0.3506, - "step": 80352 - }, - { - "epoch": 2.06, - "learning_rate": 4.7269212311116e-07, - "loss": 0.4673, - "step": 80353 - }, - { - "epoch": 2.06, - "learning_rate": 4.7266861243969925e-07, - "loss": 0.4294, - "step": 80354 - }, - { - "epoch": 2.06, - "learning_rate": 4.726451021719915e-07, - "loss": 0.3323, - "step": 80355 - }, - { - "epoch": 2.06, - "learning_rate": 4.726215923080552e-07, - "loss": 0.3459, - "step": 80356 - }, - { - "epoch": 2.06, - "learning_rate": 4.7259808284790826e-07, - "loss": 0.254, - "step": 80357 - }, - { - "epoch": 2.06, - "learning_rate": 4.7257457379156904e-07, - "loss": 0.4019, - "step": 80358 - }, - { - "epoch": 2.06, - "learning_rate": 4.725510651390553e-07, - "loss": 0.3945, - "step": 80359 - }, - { - "epoch": 2.06, - "learning_rate": 4.725275568903845e-07, - "loss": 0.4441, - "step": 80360 - }, - { - "epoch": 2.06, - "learning_rate": 4.725040490455752e-07, - "loss": 0.5366, - "step": 80361 - }, - { - "epoch": 2.06, - "learning_rate": 4.724805416046456e-07, - "loss": 0.277, - "step": 80362 - }, - { - "epoch": 2.06, - "learning_rate": 4.72457034567613e-07, - "loss": 0.4902, - "step": 80363 - }, - { - "epoch": 2.06, - "learning_rate": 4.7243352793449586e-07, - "loss": 0.3479, - "step": 80364 - }, - { - "epoch": 2.06, - "learning_rate": 4.7241002170531206e-07, - "loss": 0.417, - "step": 80365 - }, - { - "epoch": 2.06, - "learning_rate": 4.7238651588008006e-07, - "loss": 0.2025, - "step": 80366 - }, - { - "epoch": 2.06, - "learning_rate": 4.72363010458817e-07, - "loss": 0.4858, - "step": 80367 - }, - { - "epoch": 2.06, - "learning_rate": 4.7233950544154177e-07, - "loss": 0.3989, - "step": 80368 - }, - { - "epoch": 2.06, - "learning_rate": 4.723160008282715e-07, - "loss": 0.3579, - "step": 80369 - }, - { - "epoch": 2.06, - "learning_rate": 4.722924966190246e-07, - "loss": 0.5205, - "step": 80370 - }, - { - "epoch": 2.06, - "learning_rate": 4.722689928138195e-07, - "loss": 0.4485, - "step": 80371 - }, - { - "epoch": 2.06, - "learning_rate": 4.722454894126733e-07, - "loss": 0.4429, - "step": 80372 - }, - { - "epoch": 2.06, - "learning_rate": 4.7222198641560453e-07, - "loss": 0.3838, - "step": 80373 - }, - { - "epoch": 2.06, - "learning_rate": 4.7219848382263105e-07, - "loss": 0.35, - "step": 80374 - }, - { - "epoch": 2.06, - "learning_rate": 4.7217498163377143e-07, - "loss": 0.4214, - "step": 80375 - }, - { - "epoch": 2.06, - "learning_rate": 4.721514798490427e-07, - "loss": 0.4756, - "step": 80376 - }, - { - "epoch": 2.06, - "learning_rate": 4.7212797846846333e-07, - "loss": 0.582, - "step": 80377 - }, - { - "epoch": 2.06, - "learning_rate": 4.7210447749205164e-07, - "loss": 0.4219, - "step": 80378 - }, - { - "epoch": 2.06, - "learning_rate": 4.720809769198253e-07, - "loss": 0.4771, - "step": 80379 - }, - { - "epoch": 2.06, - "learning_rate": 4.7205747675180184e-07, - "loss": 0.3098, - "step": 80380 - }, - { - "epoch": 2.06, - "learning_rate": 4.720339769879997e-07, - "loss": 0.5288, - "step": 80381 - }, - { - "epoch": 2.06, - "learning_rate": 4.72010477628437e-07, - "loss": 0.4619, - "step": 80382 - }, - { - "epoch": 2.06, - "learning_rate": 4.7198697867313187e-07, - "loss": 0.4204, - "step": 80383 - }, - { - "epoch": 2.06, - "learning_rate": 4.7196348012210173e-07, - "loss": 0.457, - "step": 80384 - }, - { - "epoch": 2.06, - "learning_rate": 4.7193998197536475e-07, - "loss": 0.3643, - "step": 80385 - }, - { - "epoch": 2.06, - "learning_rate": 4.7191648423293915e-07, - "loss": 0.3167, - "step": 80386 - }, - { - "epoch": 2.06, - "learning_rate": 4.7189298689484314e-07, - "loss": 0.3396, - "step": 80387 - }, - { - "epoch": 2.06, - "learning_rate": 4.7186948996109446e-07, - "loss": 0.4714, - "step": 80388 - }, - { - "epoch": 2.06, - "learning_rate": 4.718459934317106e-07, - "loss": 0.418, - "step": 80389 - }, - { - "epoch": 2.06, - "learning_rate": 4.7182249730671e-07, - "loss": 0.4756, - "step": 80390 - }, - { - "epoch": 2.06, - "learning_rate": 4.7179900158611054e-07, - "loss": 0.54, - "step": 80391 - }, - { - "epoch": 2.06, - "learning_rate": 4.717755062699308e-07, - "loss": 0.3877, - "step": 80392 - }, - { - "epoch": 2.06, - "learning_rate": 4.7175201135818775e-07, - "loss": 0.4126, - "step": 80393 - }, - { - "epoch": 2.06, - "learning_rate": 4.717285168509e-07, - "loss": 0.502, - "step": 80394 - }, - { - "epoch": 2.06, - "learning_rate": 4.7170502274808544e-07, - "loss": 0.3877, - "step": 80395 - }, - { - "epoch": 2.06, - "learning_rate": 4.7168152904976243e-07, - "loss": 0.4683, - "step": 80396 - }, - { - "epoch": 2.06, - "learning_rate": 4.716580357559485e-07, - "loss": 0.4331, - "step": 80397 - }, - { - "epoch": 2.06, - "learning_rate": 4.7163454286666135e-07, - "loss": 0.3176, - "step": 80398 - }, - { - "epoch": 2.06, - "learning_rate": 4.716110503819194e-07, - "loss": 0.5029, - "step": 80399 - }, - { - "epoch": 2.06, - "learning_rate": 4.715875583017409e-07, - "loss": 0.2347, - "step": 80400 - }, - { - "epoch": 2.06, - "learning_rate": 4.715640666261432e-07, - "loss": 0.3994, - "step": 80401 - }, - { - "epoch": 2.06, - "learning_rate": 4.715405753551446e-07, - "loss": 0.3955, - "step": 80402 - }, - { - "epoch": 2.06, - "learning_rate": 4.7151708448876304e-07, - "loss": 0.4666, - "step": 80403 - }, - { - "epoch": 2.06, - "learning_rate": 4.714935940270168e-07, - "loss": 0.4463, - "step": 80404 - }, - { - "epoch": 2.06, - "learning_rate": 4.714701039699235e-07, - "loss": 0.4272, - "step": 80405 - }, - { - "epoch": 2.06, - "learning_rate": 4.71446614317501e-07, - "loss": 0.3694, - "step": 80406 - }, - { - "epoch": 2.06, - "learning_rate": 4.71423125069768e-07, - "loss": 0.4248, - "step": 80407 - }, - { - "epoch": 2.06, - "learning_rate": 4.713996362267416e-07, - "loss": 0.4648, - "step": 80408 - }, - { - "epoch": 2.06, - "learning_rate": 4.713761477884407e-07, - "loss": 0.2157, - "step": 80409 - }, - { - "epoch": 2.06, - "learning_rate": 4.7135265975488223e-07, - "loss": 0.4517, - "step": 80410 - }, - { - "epoch": 2.06, - "learning_rate": 4.713291721260848e-07, - "loss": 0.4014, - "step": 80411 - }, - { - "epoch": 2.06, - "learning_rate": 4.7130568490206634e-07, - "loss": 0.4893, - "step": 80412 - }, - { - "epoch": 2.06, - "learning_rate": 4.7128219808284506e-07, - "loss": 0.3275, - "step": 80413 - }, - { - "epoch": 2.06, - "learning_rate": 4.7125871166843847e-07, - "loss": 0.4355, - "step": 80414 - }, - { - "epoch": 2.06, - "learning_rate": 4.7123522565886476e-07, - "loss": 0.3041, - "step": 80415 - }, - { - "epoch": 2.06, - "learning_rate": 4.7121174005414177e-07, - "loss": 0.4004, - "step": 80416 - }, - { - "epoch": 2.06, - "learning_rate": 4.7118825485428846e-07, - "loss": 0.4019, - "step": 80417 - }, - { - "epoch": 2.06, - "learning_rate": 4.711647700593213e-07, - "loss": 0.3081, - "step": 80418 - }, - { - "epoch": 2.06, - "learning_rate": 4.711412856692589e-07, - "loss": 0.3931, - "step": 80419 - }, - { - "epoch": 2.06, - "learning_rate": 4.711178016841194e-07, - "loss": 0.6548, - "step": 80420 - }, - { - "epoch": 2.06, - "learning_rate": 4.7109431810392095e-07, - "loss": 0.542, - "step": 80421 - }, - { - "epoch": 2.06, - "learning_rate": 4.7107083492868094e-07, - "loss": 0.4958, - "step": 80422 - }, - { - "epoch": 2.06, - "learning_rate": 4.710473521584176e-07, - "loss": 0.4497, - "step": 80423 - }, - { - "epoch": 2.06, - "learning_rate": 4.71023869793149e-07, - "loss": 0.4028, - "step": 80424 - }, - { - "epoch": 2.06, - "learning_rate": 4.7100038783289353e-07, - "loss": 0.417, - "step": 80425 - }, - { - "epoch": 2.06, - "learning_rate": 4.709769062776683e-07, - "loss": 0.5435, - "step": 80426 - }, - { - "epoch": 2.06, - "learning_rate": 4.709534251274921e-07, - "loss": 0.3552, - "step": 80427 - }, - { - "epoch": 2.06, - "learning_rate": 4.7092994438238233e-07, - "loss": 0.4629, - "step": 80428 - }, - { - "epoch": 2.06, - "learning_rate": 4.70906464042357e-07, - "loss": 0.4463, - "step": 80429 - }, - { - "epoch": 2.06, - "learning_rate": 4.7088298410743466e-07, - "loss": 0.3906, - "step": 80430 - }, - { - "epoch": 2.06, - "learning_rate": 4.7085950457763255e-07, - "loss": 0.4814, - "step": 80431 - }, - { - "epoch": 2.06, - "learning_rate": 4.7083602545296895e-07, - "loss": 0.355, - "step": 80432 - }, - { - "epoch": 2.06, - "learning_rate": 4.708125467334619e-07, - "loss": 0.4722, - "step": 80433 - }, - { - "epoch": 2.06, - "learning_rate": 4.707890684191297e-07, - "loss": 0.4771, - "step": 80434 - }, - { - "epoch": 2.06, - "learning_rate": 4.7076559050998966e-07, - "loss": 0.4326, - "step": 80435 - }, - { - "epoch": 2.06, - "learning_rate": 4.7074211300606e-07, - "loss": 0.541, - "step": 80436 - }, - { - "epoch": 2.06, - "learning_rate": 4.7071863590735916e-07, - "loss": 0.5435, - "step": 80437 - }, - { - "epoch": 2.06, - "learning_rate": 4.706951592139048e-07, - "loss": 0.51, - "step": 80438 - }, - { - "epoch": 2.06, - "learning_rate": 4.7067168292571435e-07, - "loss": 0.2495, - "step": 80439 - }, - { - "epoch": 2.06, - "learning_rate": 4.706482070428063e-07, - "loss": 0.4434, - "step": 80440 - }, - { - "epoch": 2.06, - "learning_rate": 4.7062473156519853e-07, - "loss": 0.5259, - "step": 80441 - }, - { - "epoch": 2.06, - "learning_rate": 4.706012564929095e-07, - "loss": 0.4253, - "step": 80442 - }, - { - "epoch": 2.06, - "learning_rate": 4.705777818259563e-07, - "loss": 0.3523, - "step": 80443 - }, - { - "epoch": 2.06, - "learning_rate": 4.7055430756435745e-07, - "loss": 0.355, - "step": 80444 - }, - { - "epoch": 2.06, - "learning_rate": 4.7053083370813074e-07, - "loss": 0.4526, - "step": 80445 - }, - { - "epoch": 2.06, - "learning_rate": 4.705073602572946e-07, - "loss": 0.457, - "step": 80446 - }, - { - "epoch": 2.06, - "learning_rate": 4.704838872118666e-07, - "loss": 0.3628, - "step": 80447 - }, - { - "epoch": 2.06, - "learning_rate": 4.7046041457186446e-07, - "loss": 0.4077, - "step": 80448 - }, - { - "epoch": 2.06, - "learning_rate": 4.7043694233730635e-07, - "loss": 0.4209, - "step": 80449 - }, - { - "epoch": 2.06, - "learning_rate": 4.704134705082103e-07, - "loss": 0.5015, - "step": 80450 - }, - { - "epoch": 2.06, - "learning_rate": 4.703899990845949e-07, - "loss": 0.5322, - "step": 80451 - }, - { - "epoch": 2.06, - "learning_rate": 4.703665280664769e-07, - "loss": 0.356, - "step": 80452 - }, - { - "epoch": 2.06, - "learning_rate": 4.70343057453875e-07, - "loss": 0.4036, - "step": 80453 - }, - { - "epoch": 2.06, - "learning_rate": 4.7031958724680743e-07, - "loss": 0.343, - "step": 80454 - }, - { - "epoch": 2.06, - "learning_rate": 4.7029611744529143e-07, - "loss": 0.3672, - "step": 80455 - }, - { - "epoch": 2.06, - "learning_rate": 4.702726480493453e-07, - "loss": 0.293, - "step": 80456 - }, - { - "epoch": 2.06, - "learning_rate": 4.7024917905898743e-07, - "loss": 0.4515, - "step": 80457 - }, - { - "epoch": 2.06, - "learning_rate": 4.702257104742351e-07, - "loss": 0.2966, - "step": 80458 - }, - { - "epoch": 2.06, - "learning_rate": 4.7020224229510686e-07, - "loss": 0.3381, - "step": 80459 - }, - { - "epoch": 2.06, - "learning_rate": 4.7017877452162014e-07, - "loss": 0.4844, - "step": 80460 - }, - { - "epoch": 2.06, - "learning_rate": 4.70155307153793e-07, - "loss": 0.3989, - "step": 80461 - }, - { - "epoch": 2.06, - "learning_rate": 4.7013184019164374e-07, - "loss": 0.2706, - "step": 80462 - }, - { - "epoch": 2.06, - "learning_rate": 4.7010837363519053e-07, - "loss": 0.3347, - "step": 80463 - }, - { - "epoch": 2.06, - "learning_rate": 4.700849074844505e-07, - "loss": 0.437, - "step": 80464 - }, - { - "epoch": 2.06, - "learning_rate": 4.700614417394422e-07, - "loss": 0.4595, - "step": 80465 - }, - { - "epoch": 2.06, - "learning_rate": 4.7003797640018337e-07, - "loss": 0.3106, - "step": 80466 - }, - { - "epoch": 2.06, - "learning_rate": 4.7001451146669257e-07, - "loss": 0.3523, - "step": 80467 - }, - { - "epoch": 2.06, - "learning_rate": 4.699910469389872e-07, - "loss": 0.332, - "step": 80468 - }, - { - "epoch": 2.06, - "learning_rate": 4.69967582817085e-07, - "loss": 0.5073, - "step": 80469 - }, - { - "epoch": 2.06, - "learning_rate": 4.699441191010042e-07, - "loss": 0.4565, - "step": 80470 - }, - { - "epoch": 2.06, - "learning_rate": 4.6992065579076323e-07, - "loss": 0.5483, - "step": 80471 - }, - { - "epoch": 2.06, - "learning_rate": 4.698971928863793e-07, - "loss": 0.4375, - "step": 80472 - }, - { - "epoch": 2.06, - "learning_rate": 4.698737303878707e-07, - "loss": 0.2845, - "step": 80473 - }, - { - "epoch": 2.06, - "learning_rate": 4.698502682952553e-07, - "loss": 0.3923, - "step": 80474 - }, - { - "epoch": 2.06, - "learning_rate": 4.698268066085517e-07, - "loss": 0.2846, - "step": 80475 - }, - { - "epoch": 2.06, - "learning_rate": 4.6980334532777686e-07, - "loss": 0.3479, - "step": 80476 - }, - { - "epoch": 2.06, - "learning_rate": 4.6977988445294967e-07, - "loss": 0.3416, - "step": 80477 - }, - { - "epoch": 2.06, - "learning_rate": 4.697564239840872e-07, - "loss": 0.499, - "step": 80478 - }, - { - "epoch": 2.06, - "learning_rate": 4.6973296392120785e-07, - "loss": 0.6392, - "step": 80479 - }, - { - "epoch": 2.06, - "learning_rate": 4.6970950426432996e-07, - "loss": 0.4084, - "step": 80480 - }, - { - "epoch": 2.06, - "learning_rate": 4.6968604501347086e-07, - "loss": 0.4678, - "step": 80481 - }, - { - "epoch": 2.06, - "learning_rate": 4.696625861686486e-07, - "loss": 0.4316, - "step": 80482 - }, - { - "epoch": 2.06, - "learning_rate": 4.6963912772988143e-07, - "loss": 0.3696, - "step": 80483 - }, - { - "epoch": 2.06, - "learning_rate": 4.696156696971876e-07, - "loss": 0.3916, - "step": 80484 - }, - { - "epoch": 2.06, - "learning_rate": 4.695922120705842e-07, - "loss": 0.4434, - "step": 80485 - }, - { - "epoch": 2.06, - "learning_rate": 4.6956875485008965e-07, - "loss": 0.4263, - "step": 80486 - }, - { - "epoch": 2.06, - "learning_rate": 4.695452980357223e-07, - "loss": 0.5264, - "step": 80487 - }, - { - "epoch": 2.06, - "learning_rate": 4.6952184162749973e-07, - "loss": 0.4678, - "step": 80488 - }, - { - "epoch": 2.06, - "learning_rate": 4.6949838562543963e-07, - "loss": 0.3901, - "step": 80489 - }, - { - "epoch": 2.06, - "learning_rate": 4.6947493002956004e-07, - "loss": 0.4189, - "step": 80490 - }, - { - "epoch": 2.06, - "learning_rate": 4.6945147483987924e-07, - "loss": 0.418, - "step": 80491 - }, - { - "epoch": 2.06, - "learning_rate": 4.6942802005641537e-07, - "loss": 0.2683, - "step": 80492 - }, - { - "epoch": 2.06, - "learning_rate": 4.6940456567918574e-07, - "loss": 0.3092, - "step": 80493 - }, - { - "epoch": 2.06, - "learning_rate": 4.693811117082086e-07, - "loss": 0.392, - "step": 80494 - }, - { - "epoch": 2.06, - "learning_rate": 4.6935765814350193e-07, - "loss": 0.4563, - "step": 80495 - }, - { - "epoch": 2.06, - "learning_rate": 4.69334204985084e-07, - "loss": 0.4062, - "step": 80496 - }, - { - "epoch": 2.06, - "learning_rate": 4.693107522329726e-07, - "loss": 0.2913, - "step": 80497 - }, - { - "epoch": 2.06, - "learning_rate": 4.692872998871852e-07, - "loss": 0.3079, - "step": 80498 - }, - { - "epoch": 2.06, - "learning_rate": 4.6926384794773996e-07, - "loss": 0.4326, - "step": 80499 - }, - { - "epoch": 2.06, - "learning_rate": 4.6924039641465507e-07, - "loss": 0.373, - "step": 80500 - }, - { - "epoch": 2.06, - "learning_rate": 4.6921694528794874e-07, - "loss": 0.4209, - "step": 80501 - }, - { - "epoch": 2.06, - "learning_rate": 4.6919349456763834e-07, - "loss": 0.376, - "step": 80502 - }, - { - "epoch": 2.06, - "learning_rate": 4.6917004425374197e-07, - "loss": 0.4011, - "step": 80503 - }, - { - "epoch": 2.06, - "learning_rate": 4.691465943462777e-07, - "loss": 0.4556, - "step": 80504 - }, - { - "epoch": 2.06, - "learning_rate": 4.6912314484526384e-07, - "loss": 0.2974, - "step": 80505 - }, - { - "epoch": 2.06, - "learning_rate": 4.690996957507176e-07, - "loss": 0.2841, - "step": 80506 - }, - { - "epoch": 2.06, - "learning_rate": 4.690762470626578e-07, - "loss": 0.3005, - "step": 80507 - }, - { - "epoch": 2.06, - "learning_rate": 4.6905279878110135e-07, - "loss": 0.2868, - "step": 80508 - }, - { - "epoch": 2.06, - "learning_rate": 4.690293509060672e-07, - "loss": 0.5352, - "step": 80509 - }, - { - "epoch": 2.06, - "learning_rate": 4.690059034375725e-07, - "loss": 0.3318, - "step": 80510 - }, - { - "epoch": 2.06, - "learning_rate": 4.6898245637563563e-07, - "loss": 0.382, - "step": 80511 - }, - { - "epoch": 2.06, - "learning_rate": 4.6895900972027446e-07, - "loss": 0.4258, - "step": 80512 - }, - { - "epoch": 2.06, - "learning_rate": 4.689355634715072e-07, - "loss": 0.3972, - "step": 80513 - }, - { - "epoch": 2.06, - "learning_rate": 4.6891211762935134e-07, - "loss": 0.4302, - "step": 80514 - }, - { - "epoch": 2.06, - "learning_rate": 4.6888867219382497e-07, - "loss": 0.3828, - "step": 80515 - }, - { - "epoch": 2.06, - "learning_rate": 4.6886522716494615e-07, - "loss": 0.408, - "step": 80516 - }, - { - "epoch": 2.06, - "learning_rate": 4.688417825427331e-07, - "loss": 0.4653, - "step": 80517 - }, - { - "epoch": 2.06, - "learning_rate": 4.6881833832720363e-07, - "loss": 0.2723, - "step": 80518 - }, - { - "epoch": 2.06, - "learning_rate": 4.687948945183751e-07, - "loss": 0.5146, - "step": 80519 - }, - { - "epoch": 2.06, - "learning_rate": 4.687714511162658e-07, - "loss": 0.376, - "step": 80520 - }, - { - "epoch": 2.06, - "learning_rate": 4.687480081208939e-07, - "loss": 0.4771, - "step": 80521 - }, - { - "epoch": 2.06, - "learning_rate": 4.687245655322775e-07, - "loss": 0.4072, - "step": 80522 - }, - { - "epoch": 2.06, - "learning_rate": 4.687011233504339e-07, - "loss": 0.4153, - "step": 80523 - }, - { - "epoch": 2.06, - "learning_rate": 4.686776815753815e-07, - "loss": 0.3346, - "step": 80524 - }, - { - "epoch": 2.06, - "learning_rate": 4.686542402071384e-07, - "loss": 0.3843, - "step": 80525 - }, - { - "epoch": 2.06, - "learning_rate": 4.686307992457221e-07, - "loss": 0.4258, - "step": 80526 - }, - { - "epoch": 2.06, - "learning_rate": 4.686073586911511e-07, - "loss": 0.4526, - "step": 80527 - }, - { - "epoch": 2.06, - "learning_rate": 4.685839185434426e-07, - "loss": 0.4873, - "step": 80528 - }, - { - "epoch": 2.06, - "learning_rate": 4.6856047880261496e-07, - "loss": 0.4653, - "step": 80529 - }, - { - "epoch": 2.06, - "learning_rate": 4.685370394686865e-07, - "loss": 0.4058, - "step": 80530 - }, - { - "epoch": 2.06, - "learning_rate": 4.6851360054167443e-07, - "loss": 0.429, - "step": 80531 - }, - { - "epoch": 2.06, - "learning_rate": 4.684901620215971e-07, - "loss": 0.3804, - "step": 80532 - }, - { - "epoch": 2.06, - "learning_rate": 4.684667239084723e-07, - "loss": 0.4189, - "step": 80533 - }, - { - "epoch": 2.06, - "learning_rate": 4.684432862023185e-07, - "loss": 0.4402, - "step": 80534 - }, - { - "epoch": 2.06, - "learning_rate": 4.684198489031529e-07, - "loss": 0.426, - "step": 80535 - }, - { - "epoch": 2.06, - "learning_rate": 4.683964120109938e-07, - "loss": 0.3142, - "step": 80536 - }, - { - "epoch": 2.06, - "learning_rate": 4.6837297552585954e-07, - "loss": 0.4985, - "step": 80537 - }, - { - "epoch": 2.06, - "learning_rate": 4.6834953944776714e-07, - "loss": 0.4487, - "step": 80538 - }, - { - "epoch": 2.06, - "learning_rate": 4.683261037767354e-07, - "loss": 0.3567, - "step": 80539 - }, - { - "epoch": 2.06, - "learning_rate": 4.6830266851278164e-07, - "loss": 0.5342, - "step": 80540 - }, - { - "epoch": 2.06, - "learning_rate": 4.6827923365592413e-07, - "loss": 0.3447, - "step": 80541 - }, - { - "epoch": 2.06, - "learning_rate": 4.682557992061811e-07, - "loss": 0.3879, - "step": 80542 - }, - { - "epoch": 2.06, - "learning_rate": 4.682323651635698e-07, - "loss": 0.3772, - "step": 80543 - }, - { - "epoch": 2.06, - "learning_rate": 4.682089315281084e-07, - "loss": 0.2927, - "step": 80544 - }, - { - "epoch": 2.06, - "learning_rate": 4.6818549829981503e-07, - "loss": 0.3882, - "step": 80545 - }, - { - "epoch": 2.06, - "learning_rate": 4.68162065478708e-07, - "loss": 0.5327, - "step": 80546 - }, - { - "epoch": 2.06, - "learning_rate": 4.681386330648048e-07, - "loss": 0.418, - "step": 80547 - }, - { - "epoch": 2.06, - "learning_rate": 4.6811520105812297e-07, - "loss": 0.4233, - "step": 80548 - }, - { - "epoch": 2.06, - "learning_rate": 4.680917694586809e-07, - "loss": 0.4697, - "step": 80549 - }, - { - "epoch": 2.06, - "learning_rate": 4.680683382664965e-07, - "loss": 0.4683, - "step": 80550 - }, - { - "epoch": 2.06, - "learning_rate": 4.680449074815881e-07, - "loss": 0.4507, - "step": 80551 - }, - { - "epoch": 2.06, - "learning_rate": 4.6802147710397286e-07, - "loss": 0.3691, - "step": 80552 - }, - { - "epoch": 2.06, - "learning_rate": 4.679980471336692e-07, - "loss": 0.4443, - "step": 80553 - }, - { - "epoch": 2.06, - "learning_rate": 4.679746175706949e-07, - "loss": 0.5732, - "step": 80554 - }, - { - "epoch": 2.06, - "learning_rate": 4.679511884150683e-07, - "loss": 0.3762, - "step": 80555 - }, - { - "epoch": 2.06, - "learning_rate": 4.6792775966680674e-07, - "loss": 0.3867, - "step": 80556 - }, - { - "epoch": 2.06, - "learning_rate": 4.679043313259288e-07, - "loss": 0.3286, - "step": 80557 - }, - { - "epoch": 2.06, - "learning_rate": 4.6788090339245156e-07, - "loss": 0.4242, - "step": 80558 - }, - { - "epoch": 2.06, - "learning_rate": 4.678574758663939e-07, - "loss": 0.5059, - "step": 80559 - }, - { - "epoch": 2.06, - "learning_rate": 4.6783404874777286e-07, - "loss": 0.2932, - "step": 80560 - }, - { - "epoch": 2.06, - "learning_rate": 4.6781062203660695e-07, - "loss": 0.4634, - "step": 80561 - }, - { - "epoch": 2.06, - "learning_rate": 4.677871957329139e-07, - "loss": 0.3843, - "step": 80562 - }, - { - "epoch": 2.06, - "learning_rate": 4.677637698367121e-07, - "loss": 0.4658, - "step": 80563 - }, - { - "epoch": 2.06, - "learning_rate": 4.677403443480187e-07, - "loss": 0.4556, - "step": 80564 - }, - { - "epoch": 2.06, - "learning_rate": 4.6771691926685207e-07, - "loss": 0.4082, - "step": 80565 - }, - { - "epoch": 2.06, - "learning_rate": 4.6769349459323016e-07, - "loss": 0.4154, - "step": 80566 - }, - { - "epoch": 2.06, - "learning_rate": 4.676700703271712e-07, - "loss": 0.356, - "step": 80567 - }, - { - "epoch": 2.06, - "learning_rate": 4.676466464686928e-07, - "loss": 0.4624, - "step": 80568 - }, - { - "epoch": 2.07, - "learning_rate": 4.6762322301781257e-07, - "loss": 0.3276, - "step": 80569 - }, - { - "epoch": 2.07, - "learning_rate": 4.6759979997454856e-07, - "loss": 0.41, - "step": 80570 - }, - { - "epoch": 2.07, - "learning_rate": 4.675763773389191e-07, - "loss": 0.3401, - "step": 80571 - }, - { - "epoch": 2.07, - "learning_rate": 4.6755295511094215e-07, - "loss": 0.3887, - "step": 80572 - }, - { - "epoch": 2.07, - "learning_rate": 4.6752953329063517e-07, - "loss": 0.3756, - "step": 80573 - }, - { - "epoch": 2.07, - "learning_rate": 4.6750611187801636e-07, - "loss": 0.324, - "step": 80574 - }, - { - "epoch": 2.07, - "learning_rate": 4.6748269087310353e-07, - "loss": 0.447, - "step": 80575 - }, - { - "epoch": 2.07, - "learning_rate": 4.6745927027591514e-07, - "loss": 0.3464, - "step": 80576 - }, - { - "epoch": 2.07, - "learning_rate": 4.6743585008646866e-07, - "loss": 0.4248, - "step": 80577 - }, - { - "epoch": 2.07, - "learning_rate": 4.6741243030478183e-07, - "loss": 0.4897, - "step": 80578 - }, - { - "epoch": 2.07, - "learning_rate": 4.673890109308727e-07, - "loss": 0.4346, - "step": 80579 - }, - { - "epoch": 2.07, - "learning_rate": 4.6736559196475965e-07, - "loss": 0.5088, - "step": 80580 - }, - { - "epoch": 2.07, - "learning_rate": 4.6734217340646e-07, - "loss": 0.5288, - "step": 80581 - }, - { - "epoch": 2.07, - "learning_rate": 4.6731875525599185e-07, - "loss": 0.5278, - "step": 80582 - }, - { - "epoch": 2.07, - "learning_rate": 4.6729533751337336e-07, - "loss": 0.3762, - "step": 80583 - }, - { - "epoch": 2.07, - "learning_rate": 4.672719201786226e-07, - "loss": 0.436, - "step": 80584 - }, - { - "epoch": 2.07, - "learning_rate": 4.672485032517569e-07, - "loss": 0.4463, - "step": 80585 - }, - { - "epoch": 2.07, - "learning_rate": 4.672250867327946e-07, - "loss": 0.2716, - "step": 80586 - }, - { - "epoch": 2.07, - "learning_rate": 4.6720167062175387e-07, - "loss": 0.3486, - "step": 80587 - }, - { - "epoch": 2.07, - "learning_rate": 4.671782549186519e-07, - "loss": 0.3511, - "step": 80588 - }, - { - "epoch": 2.07, - "learning_rate": 4.6715483962350744e-07, - "loss": 0.4109, - "step": 80589 - }, - { - "epoch": 2.07, - "learning_rate": 4.671314247363376e-07, - "loss": 0.4221, - "step": 80590 - }, - { - "epoch": 2.07, - "learning_rate": 4.6710801025716083e-07, - "loss": 0.4692, - "step": 80591 - }, - { - "epoch": 2.07, - "learning_rate": 4.6708459618599496e-07, - "loss": 0.3616, - "step": 80592 - }, - { - "epoch": 2.07, - "learning_rate": 4.670611825228582e-07, - "loss": 0.5137, - "step": 80593 - }, - { - "epoch": 2.07, - "learning_rate": 4.6703776926776785e-07, - "loss": 0.3918, - "step": 80594 - }, - { - "epoch": 2.07, - "learning_rate": 4.6701435642074215e-07, - "loss": 0.3948, - "step": 80595 - }, - { - "epoch": 2.07, - "learning_rate": 4.6699094398179907e-07, - "loss": 0.3687, - "step": 80596 - }, - { - "epoch": 2.07, - "learning_rate": 4.6696753195095716e-07, - "loss": 0.3135, - "step": 80597 - }, - { - "epoch": 2.07, - "learning_rate": 4.6694412032823304e-07, - "loss": 0.4646, - "step": 80598 - }, - { - "epoch": 2.07, - "learning_rate": 4.6692070911364533e-07, - "loss": 0.3003, - "step": 80599 - }, - { - "epoch": 2.07, - "learning_rate": 4.6689729830721194e-07, - "loss": 0.499, - "step": 80600 - }, - { - "epoch": 2.07, - "learning_rate": 4.668738879089511e-07, - "loss": 0.4434, - "step": 80601 - }, - { - "epoch": 2.07, - "learning_rate": 4.668504779188801e-07, - "loss": 0.3584, - "step": 80602 - }, - { - "epoch": 2.07, - "learning_rate": 4.668270683370171e-07, - "loss": 0.3315, - "step": 80603 - }, - { - "epoch": 2.07, - "learning_rate": 4.6680365916338007e-07, - "loss": 0.415, - "step": 80604 - }, - { - "epoch": 2.07, - "learning_rate": 4.667802503979874e-07, - "loss": 0.3853, - "step": 80605 - }, - { - "epoch": 2.07, - "learning_rate": 4.6675684204085617e-07, - "loss": 0.344, - "step": 80606 - }, - { - "epoch": 2.07, - "learning_rate": 4.6673343409200516e-07, - "loss": 0.2678, - "step": 80607 - }, - { - "epoch": 2.07, - "learning_rate": 4.667100265514513e-07, - "loss": 0.4746, - "step": 80608 - }, - { - "epoch": 2.07, - "learning_rate": 4.6668661941921315e-07, - "loss": 0.376, - "step": 80609 - }, - { - "epoch": 2.07, - "learning_rate": 4.6666321269530894e-07, - "loss": 0.3442, - "step": 80610 - }, - { - "epoch": 2.07, - "learning_rate": 4.6663980637975577e-07, - "loss": 0.415, - "step": 80611 - }, - { - "epoch": 2.07, - "learning_rate": 4.66616400472572e-07, - "loss": 0.4126, - "step": 80612 - }, - { - "epoch": 2.07, - "learning_rate": 4.6659299497377555e-07, - "loss": 0.4795, - "step": 80613 - }, - { - "epoch": 2.07, - "learning_rate": 4.6656958988338455e-07, - "loss": 0.2474, - "step": 80614 - }, - { - "epoch": 2.07, - "learning_rate": 4.6654618520141653e-07, - "loss": 0.3984, - "step": 80615 - }, - { - "epoch": 2.07, - "learning_rate": 4.6652278092788944e-07, - "loss": 0.4309, - "step": 80616 - }, - { - "epoch": 2.07, - "learning_rate": 4.664993770628217e-07, - "loss": 0.4224, - "step": 80617 - }, - { - "epoch": 2.07, - "learning_rate": 4.6647597360623083e-07, - "loss": 0.4336, - "step": 80618 - }, - { - "epoch": 2.07, - "learning_rate": 4.6645257055813447e-07, - "loss": 0.4233, - "step": 80619 - }, - { - "epoch": 2.07, - "learning_rate": 4.664291679185508e-07, - "loss": 0.4397, - "step": 80620 - }, - { - "epoch": 2.07, - "learning_rate": 4.664057656874978e-07, - "loss": 0.272, - "step": 80621 - }, - { - "epoch": 2.07, - "learning_rate": 4.663823638649937e-07, - "loss": 0.3748, - "step": 80622 - }, - { - "epoch": 2.07, - "learning_rate": 4.663589624510558e-07, - "loss": 0.4443, - "step": 80623 - }, - { - "epoch": 2.07, - "learning_rate": 4.663355614457023e-07, - "loss": 0.4248, - "step": 80624 - }, - { - "epoch": 2.07, - "learning_rate": 4.66312160848951e-07, - "loss": 0.3757, - "step": 80625 - }, - { - "epoch": 2.07, - "learning_rate": 4.6628876066082046e-07, - "loss": 0.4712, - "step": 80626 - }, - { - "epoch": 2.07, - "learning_rate": 4.6626536088132794e-07, - "loss": 0.3354, - "step": 80627 - }, - { - "epoch": 2.07, - "learning_rate": 4.6624196151049124e-07, - "loss": 0.4106, - "step": 80628 - }, - { - "epoch": 2.07, - "learning_rate": 4.662185625483285e-07, - "loss": 0.5088, - "step": 80629 - }, - { - "epoch": 2.07, - "learning_rate": 4.6619516399485757e-07, - "loss": 0.2471, - "step": 80630 - }, - { - "epoch": 2.07, - "learning_rate": 4.6617176585009687e-07, - "loss": 0.3997, - "step": 80631 - }, - { - "epoch": 2.07, - "learning_rate": 4.6614836811406356e-07, - "loss": 0.396, - "step": 80632 - }, - { - "epoch": 2.07, - "learning_rate": 4.6612497078677595e-07, - "loss": 0.3589, - "step": 80633 - }, - { - "epoch": 2.07, - "learning_rate": 4.661015738682522e-07, - "loss": 0.3318, - "step": 80634 - }, - { - "epoch": 2.07, - "learning_rate": 4.660781773585095e-07, - "loss": 0.3618, - "step": 80635 - }, - { - "epoch": 2.07, - "learning_rate": 4.6605478125756636e-07, - "loss": 0.4194, - "step": 80636 - }, - { - "epoch": 2.07, - "learning_rate": 4.6603138556544075e-07, - "loss": 0.5244, - "step": 80637 - }, - { - "epoch": 2.07, - "learning_rate": 4.6600799028215e-07, - "loss": 0.4072, - "step": 80638 - }, - { - "epoch": 2.07, - "learning_rate": 4.6598459540771284e-07, - "loss": 0.4702, - "step": 80639 - }, - { - "epoch": 2.07, - "learning_rate": 4.659612009421463e-07, - "loss": 0.3528, - "step": 80640 - }, - { - "epoch": 2.07, - "learning_rate": 4.659378068854687e-07, - "loss": 0.4673, - "step": 80641 - }, - { - "epoch": 2.07, - "learning_rate": 4.65914413237698e-07, - "loss": 0.4004, - "step": 80642 - }, - { - "epoch": 2.07, - "learning_rate": 4.6589101999885237e-07, - "loss": 0.3755, - "step": 80643 - }, - { - "epoch": 2.07, - "learning_rate": 4.6586762716894914e-07, - "loss": 0.2965, - "step": 80644 - }, - { - "epoch": 2.07, - "learning_rate": 4.658442347480064e-07, - "loss": 0.3486, - "step": 80645 - }, - { - "epoch": 2.07, - "learning_rate": 4.6582084273604226e-07, - "loss": 0.4302, - "step": 80646 - }, - { - "epoch": 2.07, - "learning_rate": 4.657974511330749e-07, - "loss": 0.3289, - "step": 80647 - }, - { - "epoch": 2.07, - "learning_rate": 4.6577405993912176e-07, - "loss": 0.4526, - "step": 80648 - }, - { - "epoch": 2.07, - "learning_rate": 4.657506691542006e-07, - "loss": 0.4692, - "step": 80649 - }, - { - "epoch": 2.07, - "learning_rate": 4.6572727877832963e-07, - "loss": 0.5186, - "step": 80650 - }, - { - "epoch": 2.07, - "learning_rate": 4.65703888811527e-07, - "loss": 0.5312, - "step": 80651 - }, - { - "epoch": 2.07, - "learning_rate": 4.656804992538099e-07, - "loss": 0.3261, - "step": 80652 - }, - { - "epoch": 2.07, - "learning_rate": 4.6565711010519683e-07, - "loss": 0.353, - "step": 80653 - }, - { - "epoch": 2.07, - "learning_rate": 4.6563372136570544e-07, - "loss": 0.542, - "step": 80654 - }, - { - "epoch": 2.07, - "learning_rate": 4.6561033303535414e-07, - "loss": 0.4761, - "step": 80655 - }, - { - "epoch": 2.07, - "learning_rate": 4.655869451141601e-07, - "loss": 0.438, - "step": 80656 - }, - { - "epoch": 2.07, - "learning_rate": 4.6556355760214194e-07, - "loss": 0.3494, - "step": 80657 - }, - { - "epoch": 2.07, - "learning_rate": 4.655401704993167e-07, - "loss": 0.3691, - "step": 80658 - }, - { - "epoch": 2.07, - "learning_rate": 4.655167838057029e-07, - "loss": 0.4971, - "step": 80659 - }, - { - "epoch": 2.07, - "learning_rate": 4.6549339752131867e-07, - "loss": 0.3667, - "step": 80660 - }, - { - "epoch": 2.07, - "learning_rate": 4.6547001164618114e-07, - "loss": 0.3503, - "step": 80661 - }, - { - "epoch": 2.07, - "learning_rate": 4.654466261803087e-07, - "loss": 0.2986, - "step": 80662 - }, - { - "epoch": 2.07, - "learning_rate": 4.654232411237191e-07, - "loss": 0.4824, - "step": 80663 - }, - { - "epoch": 2.07, - "learning_rate": 4.6539985647643087e-07, - "loss": 0.3887, - "step": 80664 - }, - { - "epoch": 2.07, - "learning_rate": 4.6537647223846086e-07, - "loss": 0.4346, - "step": 80665 - }, - { - "epoch": 2.07, - "learning_rate": 4.653530884098277e-07, - "loss": 0.4131, - "step": 80666 - }, - { - "epoch": 2.07, - "learning_rate": 4.653297049905494e-07, - "loss": 0.5298, - "step": 80667 - }, - { - "epoch": 2.07, - "learning_rate": 4.6530632198064347e-07, - "loss": 0.5049, - "step": 80668 - }, - { - "epoch": 2.07, - "learning_rate": 4.6528293938012754e-07, - "loss": 0.4294, - "step": 80669 - }, - { - "epoch": 2.07, - "learning_rate": 4.6525955718901986e-07, - "loss": 0.2806, - "step": 80670 - }, - { - "epoch": 2.07, - "learning_rate": 4.652361754073384e-07, - "loss": 0.4385, - "step": 80671 - }, - { - "epoch": 2.07, - "learning_rate": 4.652127940351014e-07, - "loss": 0.2031, - "step": 80672 - }, - { - "epoch": 2.07, - "learning_rate": 4.6518941307232596e-07, - "loss": 0.3877, - "step": 80673 - }, - { - "epoch": 2.07, - "learning_rate": 4.6516603251903043e-07, - "loss": 0.4551, - "step": 80674 - }, - { - "epoch": 2.07, - "learning_rate": 4.6514265237523266e-07, - "loss": 0.3467, - "step": 80675 - }, - { - "epoch": 2.07, - "learning_rate": 4.65119272640951e-07, - "loss": 0.3833, - "step": 80676 - }, - { - "epoch": 2.07, - "learning_rate": 4.650958933162028e-07, - "loss": 0.3313, - "step": 80677 - }, - { - "epoch": 2.07, - "learning_rate": 4.650725144010058e-07, - "loss": 0.3032, - "step": 80678 - }, - { - "epoch": 2.07, - "learning_rate": 4.650491358953782e-07, - "loss": 0.519, - "step": 80679 - }, - { - "epoch": 2.07, - "learning_rate": 4.6502575779933773e-07, - "loss": 0.4192, - "step": 80680 - }, - { - "epoch": 2.07, - "learning_rate": 4.6500238011290293e-07, - "loss": 0.4236, - "step": 80681 - }, - { - "epoch": 2.07, - "learning_rate": 4.649790028360908e-07, - "loss": 0.4414, - "step": 80682 - }, - { - "epoch": 2.07, - "learning_rate": 4.649556259689197e-07, - "loss": 0.5122, - "step": 80683 - }, - { - "epoch": 2.07, - "learning_rate": 4.649322495114074e-07, - "loss": 0.521, - "step": 80684 - }, - { - "epoch": 2.07, - "learning_rate": 4.6490887346357233e-07, - "loss": 0.3597, - "step": 80685 - }, - { - "epoch": 2.07, - "learning_rate": 4.6488549782543186e-07, - "loss": 0.3801, - "step": 80686 - }, - { - "epoch": 2.07, - "learning_rate": 4.6486212259700366e-07, - "loss": 0.4175, - "step": 80687 - }, - { - "epoch": 2.07, - "learning_rate": 4.648387477783058e-07, - "loss": 0.4531, - "step": 80688 - }, - { - "epoch": 2.07, - "learning_rate": 4.648153733693568e-07, - "loss": 0.2231, - "step": 80689 - }, - { - "epoch": 2.07, - "learning_rate": 4.6479199937017364e-07, - "loss": 0.3516, - "step": 80690 - }, - { - "epoch": 2.07, - "learning_rate": 4.647686257807746e-07, - "loss": 0.4517, - "step": 80691 - }, - { - "epoch": 2.07, - "learning_rate": 4.647452526011777e-07, - "loss": 0.4219, - "step": 80692 - }, - { - "epoch": 2.07, - "learning_rate": 4.647218798314011e-07, - "loss": 0.306, - "step": 80693 - }, - { - "epoch": 2.07, - "learning_rate": 4.646985074714619e-07, - "loss": 0.374, - "step": 80694 - }, - { - "epoch": 2.07, - "learning_rate": 4.646751355213785e-07, - "loss": 0.3781, - "step": 80695 - }, - { - "epoch": 2.07, - "learning_rate": 4.64651763981169e-07, - "loss": 0.4854, - "step": 80696 - }, - { - "epoch": 2.07, - "learning_rate": 4.646283928508508e-07, - "loss": 0.3572, - "step": 80697 - }, - { - "epoch": 2.07, - "learning_rate": 4.646050221304423e-07, - "loss": 0.5146, - "step": 80698 - }, - { - "epoch": 2.07, - "learning_rate": 4.6458165181996077e-07, - "loss": 0.3651, - "step": 80699 - }, - { - "epoch": 2.07, - "learning_rate": 4.645582819194245e-07, - "loss": 0.4395, - "step": 80700 - }, - { - "epoch": 2.07, - "learning_rate": 4.645349124288513e-07, - "loss": 0.4824, - "step": 80701 - }, - { - "epoch": 2.07, - "learning_rate": 4.6451154334825946e-07, - "loss": 0.4702, - "step": 80702 - }, - { - "epoch": 2.07, - "learning_rate": 4.644881746776661e-07, - "loss": 0.4546, - "step": 80703 - }, - { - "epoch": 2.07, - "learning_rate": 4.6446480641708965e-07, - "loss": 0.5107, - "step": 80704 - }, - { - "epoch": 2.07, - "learning_rate": 4.644414385665482e-07, - "loss": 0.28, - "step": 80705 - }, - { - "epoch": 2.07, - "learning_rate": 4.644180711260592e-07, - "loss": 0.3843, - "step": 80706 - }, - { - "epoch": 2.07, - "learning_rate": 4.643947040956403e-07, - "loss": 0.5649, - "step": 80707 - }, - { - "epoch": 2.07, - "learning_rate": 4.643713374753099e-07, - "loss": 0.418, - "step": 80708 - }, - { - "epoch": 2.07, - "learning_rate": 4.6434797126508563e-07, - "loss": 0.4043, - "step": 80709 - }, - { - "epoch": 2.07, - "learning_rate": 4.643246054649859e-07, - "loss": 0.5298, - "step": 80710 - }, - { - "epoch": 2.07, - "learning_rate": 4.643012400750277e-07, - "loss": 0.4458, - "step": 80711 - }, - { - "epoch": 2.07, - "learning_rate": 4.642778750952295e-07, - "loss": 0.3994, - "step": 80712 - }, - { - "epoch": 2.07, - "learning_rate": 4.6425451052560914e-07, - "loss": 0.3606, - "step": 80713 - }, - { - "epoch": 2.07, - "learning_rate": 4.642311463661848e-07, - "loss": 0.4883, - "step": 80714 - }, - { - "epoch": 2.07, - "learning_rate": 4.6420778261697356e-07, - "loss": 0.3994, - "step": 80715 - }, - { - "epoch": 2.07, - "learning_rate": 4.6418441927799437e-07, - "loss": 0.3623, - "step": 80716 - }, - { - "epoch": 2.07, - "learning_rate": 4.6416105634926394e-07, - "loss": 0.2247, - "step": 80717 - }, - { - "epoch": 2.07, - "learning_rate": 4.641376938308009e-07, - "loss": 0.4409, - "step": 80718 - }, - { - "epoch": 2.07, - "learning_rate": 4.6411433172262327e-07, - "loss": 0.4736, - "step": 80719 - }, - { - "epoch": 2.07, - "learning_rate": 4.640909700247484e-07, - "loss": 0.257, - "step": 80720 - }, - { - "epoch": 2.07, - "learning_rate": 4.640676087371943e-07, - "loss": 0.2482, - "step": 80721 - }, - { - "epoch": 2.07, - "learning_rate": 4.6404424785997944e-07, - "loss": 0.2606, - "step": 80722 - }, - { - "epoch": 2.07, - "learning_rate": 4.6402088739312084e-07, - "loss": 0.4817, - "step": 80723 - }, - { - "epoch": 2.07, - "learning_rate": 4.639975273366369e-07, - "loss": 0.3417, - "step": 80724 - }, - { - "epoch": 2.07, - "learning_rate": 4.639741676905453e-07, - "loss": 0.3174, - "step": 80725 - }, - { - "epoch": 2.07, - "learning_rate": 4.6395080845486446e-07, - "loss": 0.3706, - "step": 80726 - }, - { - "epoch": 2.07, - "learning_rate": 4.6392744962961183e-07, - "loss": 0.4175, - "step": 80727 - }, - { - "epoch": 2.07, - "learning_rate": 4.639040912148049e-07, - "loss": 0.3975, - "step": 80728 - }, - { - "epoch": 2.07, - "learning_rate": 4.6388073321046197e-07, - "loss": 0.4614, - "step": 80729 - }, - { - "epoch": 2.07, - "learning_rate": 4.638573756166009e-07, - "loss": 0.3364, - "step": 80730 - }, - { - "epoch": 2.07, - "learning_rate": 4.6383401843324e-07, - "loss": 0.3884, - "step": 80731 - }, - { - "epoch": 2.07, - "learning_rate": 4.6381066166039626e-07, - "loss": 0.4766, - "step": 80732 - }, - { - "epoch": 2.07, - "learning_rate": 4.6378730529808817e-07, - "loss": 0.3218, - "step": 80733 - }, - { - "epoch": 2.07, - "learning_rate": 4.6376394934633345e-07, - "loss": 0.4121, - "step": 80734 - }, - { - "epoch": 2.07, - "learning_rate": 4.637405938051504e-07, - "loss": 0.3412, - "step": 80735 - }, - { - "epoch": 2.07, - "learning_rate": 4.6371723867455646e-07, - "loss": 0.5586, - "step": 80736 - }, - { - "epoch": 2.07, - "learning_rate": 4.6369388395456923e-07, - "loss": 0.4351, - "step": 80737 - }, - { - "epoch": 2.07, - "learning_rate": 4.636705296452069e-07, - "loss": 0.4312, - "step": 80738 - }, - { - "epoch": 2.07, - "learning_rate": 4.6364717574648746e-07, - "loss": 0.4204, - "step": 80739 - }, - { - "epoch": 2.07, - "learning_rate": 4.6362382225842913e-07, - "loss": 0.4575, - "step": 80740 - }, - { - "epoch": 2.07, - "learning_rate": 4.636004691810489e-07, - "loss": 0.5269, - "step": 80741 - }, - { - "epoch": 2.07, - "learning_rate": 4.6357711651436514e-07, - "loss": 0.4453, - "step": 80742 - }, - { - "epoch": 2.07, - "learning_rate": 4.6355376425839607e-07, - "loss": 0.4492, - "step": 80743 - }, - { - "epoch": 2.07, - "learning_rate": 4.6353041241315883e-07, - "loss": 0.4553, - "step": 80744 - }, - { - "epoch": 2.07, - "learning_rate": 4.6350706097867174e-07, - "loss": 0.2825, - "step": 80745 - }, - { - "epoch": 2.07, - "learning_rate": 4.63483709954953e-07, - "loss": 0.5254, - "step": 80746 - }, - { - "epoch": 2.07, - "learning_rate": 4.6346035934201976e-07, - "loss": 0.4238, - "step": 80747 - }, - { - "epoch": 2.07, - "learning_rate": 4.634370091398906e-07, - "loss": 0.3601, - "step": 80748 - }, - { - "epoch": 2.07, - "learning_rate": 4.634136593485827e-07, - "loss": 0.2351, - "step": 80749 - }, - { - "epoch": 2.07, - "learning_rate": 4.633903099681142e-07, - "loss": 0.4065, - "step": 80750 - }, - { - "epoch": 2.07, - "learning_rate": 4.633669609985031e-07, - "loss": 0.3481, - "step": 80751 - }, - { - "epoch": 2.07, - "learning_rate": 4.633436124397676e-07, - "loss": 0.4436, - "step": 80752 - }, - { - "epoch": 2.07, - "learning_rate": 4.6332026429192493e-07, - "loss": 0.3896, - "step": 80753 - }, - { - "epoch": 2.07, - "learning_rate": 4.6329691655499325e-07, - "loss": 0.4468, - "step": 80754 - }, - { - "epoch": 2.07, - "learning_rate": 4.632735692289904e-07, - "loss": 0.3218, - "step": 80755 - }, - { - "epoch": 2.07, - "learning_rate": 4.6325022231393464e-07, - "loss": 0.3779, - "step": 80756 - }, - { - "epoch": 2.07, - "learning_rate": 4.6322687580984353e-07, - "loss": 0.395, - "step": 80757 - }, - { - "epoch": 2.07, - "learning_rate": 4.632035297167346e-07, - "loss": 0.438, - "step": 80758 - }, - { - "epoch": 2.07, - "learning_rate": 4.63180184034626e-07, - "loss": 0.4194, - "step": 80759 - }, - { - "epoch": 2.07, - "learning_rate": 4.63156838763536e-07, - "loss": 0.2635, - "step": 80760 - }, - { - "epoch": 2.07, - "learning_rate": 4.631334939034818e-07, - "loss": 0.4214, - "step": 80761 - }, - { - "epoch": 2.07, - "learning_rate": 4.6311014945448154e-07, - "loss": 0.479, - "step": 80762 - }, - { - "epoch": 2.07, - "learning_rate": 4.6308680541655323e-07, - "loss": 0.3833, - "step": 80763 - }, - { - "epoch": 2.07, - "learning_rate": 4.63063461789715e-07, - "loss": 0.5195, - "step": 80764 - }, - { - "epoch": 2.07, - "learning_rate": 4.6304011857398394e-07, - "loss": 0.2659, - "step": 80765 - }, - { - "epoch": 2.07, - "learning_rate": 4.630167757693788e-07, - "loss": 0.5066, - "step": 80766 - }, - { - "epoch": 2.07, - "learning_rate": 4.6299343337591667e-07, - "loss": 0.4053, - "step": 80767 - }, - { - "epoch": 2.07, - "learning_rate": 4.6297009139361577e-07, - "loss": 0.3593, - "step": 80768 - }, - { - "epoch": 2.07, - "learning_rate": 4.6294674982249436e-07, - "loss": 0.4207, - "step": 80769 - }, - { - "epoch": 2.07, - "learning_rate": 4.629234086625695e-07, - "loss": 0.3367, - "step": 80770 - }, - { - "epoch": 2.07, - "learning_rate": 4.629000679138596e-07, - "loss": 0.1906, - "step": 80771 - }, - { - "epoch": 2.07, - "learning_rate": 4.6287672757638243e-07, - "loss": 0.3358, - "step": 80772 - }, - { - "epoch": 2.07, - "learning_rate": 4.628533876501561e-07, - "loss": 0.5586, - "step": 80773 - }, - { - "epoch": 2.07, - "learning_rate": 4.628300481351979e-07, - "loss": 0.3108, - "step": 80774 - }, - { - "epoch": 2.07, - "learning_rate": 4.6280670903152606e-07, - "loss": 0.2964, - "step": 80775 - }, - { - "epoch": 2.07, - "learning_rate": 4.6278337033915884e-07, - "loss": 0.4136, - "step": 80776 - }, - { - "epoch": 2.07, - "learning_rate": 4.6276003205811356e-07, - "loss": 0.4746, - "step": 80777 - }, - { - "epoch": 2.07, - "learning_rate": 4.6273669418840787e-07, - "loss": 0.5283, - "step": 80778 - }, - { - "epoch": 2.07, - "learning_rate": 4.6271335673006007e-07, - "loss": 0.4189, - "step": 80779 - }, - { - "epoch": 2.07, - "learning_rate": 4.6269001968308796e-07, - "loss": 0.4497, - "step": 80780 - }, - { - "epoch": 2.07, - "learning_rate": 4.6266668304750964e-07, - "loss": 0.4692, - "step": 80781 - }, - { - "epoch": 2.07, - "learning_rate": 4.626433468233425e-07, - "loss": 0.4971, - "step": 80782 - }, - { - "epoch": 2.07, - "learning_rate": 4.6262001101060457e-07, - "loss": 0.3867, - "step": 80783 - }, - { - "epoch": 2.07, - "learning_rate": 4.625966756093138e-07, - "loss": 0.3268, - "step": 80784 - }, - { - "epoch": 2.07, - "learning_rate": 4.625733406194885e-07, - "loss": 0.3441, - "step": 80785 - }, - { - "epoch": 2.07, - "learning_rate": 4.625500060411459e-07, - "loss": 0.5679, - "step": 80786 - }, - { - "epoch": 2.07, - "learning_rate": 4.6252667187430386e-07, - "loss": 0.4321, - "step": 80787 - }, - { - "epoch": 2.07, - "learning_rate": 4.6250333811898034e-07, - "loss": 0.4302, - "step": 80788 - }, - { - "epoch": 2.07, - "learning_rate": 4.6248000477519334e-07, - "loss": 0.4463, - "step": 80789 - }, - { - "epoch": 2.07, - "learning_rate": 4.62456671842961e-07, - "loss": 0.3936, - "step": 80790 - }, - { - "epoch": 2.07, - "learning_rate": 4.6243333932230057e-07, - "loss": 0.4331, - "step": 80791 - }, - { - "epoch": 2.07, - "learning_rate": 4.624100072132301e-07, - "loss": 0.3784, - "step": 80792 - }, - { - "epoch": 2.07, - "learning_rate": 4.623866755157676e-07, - "loss": 0.2679, - "step": 80793 - }, - { - "epoch": 2.07, - "learning_rate": 4.623633442299314e-07, - "loss": 0.4868, - "step": 80794 - }, - { - "epoch": 2.07, - "learning_rate": 4.6234001335573837e-07, - "loss": 0.5508, - "step": 80795 - }, - { - "epoch": 2.07, - "learning_rate": 4.6231668289320726e-07, - "loss": 0.3494, - "step": 80796 - }, - { - "epoch": 2.07, - "learning_rate": 4.6229335284235513e-07, - "loss": 0.4985, - "step": 80797 - }, - { - "epoch": 2.07, - "learning_rate": 4.6227002320320077e-07, - "loss": 0.4272, - "step": 80798 - }, - { - "epoch": 2.07, - "learning_rate": 4.622466939757611e-07, - "loss": 0.3052, - "step": 80799 - }, - { - "epoch": 2.07, - "learning_rate": 4.6222336516005434e-07, - "loss": 0.377, - "step": 80800 - }, - { - "epoch": 2.07, - "learning_rate": 4.622000367560984e-07, - "loss": 0.4438, - "step": 80801 - }, - { - "epoch": 2.07, - "learning_rate": 4.621767087639117e-07, - "loss": 0.3521, - "step": 80802 - }, - { - "epoch": 2.07, - "learning_rate": 4.621533811835111e-07, - "loss": 0.4194, - "step": 80803 - }, - { - "epoch": 2.07, - "learning_rate": 4.621300540149149e-07, - "loss": 0.4414, - "step": 80804 - }, - { - "epoch": 2.07, - "learning_rate": 4.6210672725814095e-07, - "loss": 0.4067, - "step": 80805 - }, - { - "epoch": 2.07, - "learning_rate": 4.620834009132076e-07, - "loss": 0.4465, - "step": 80806 - }, - { - "epoch": 2.07, - "learning_rate": 4.620600749801322e-07, - "loss": 0.3618, - "step": 80807 - }, - { - "epoch": 2.07, - "learning_rate": 4.6203674945893234e-07, - "loss": 0.3979, - "step": 80808 - }, - { - "epoch": 2.07, - "learning_rate": 4.620134243496262e-07, - "loss": 0.418, - "step": 80809 - }, - { - "epoch": 2.07, - "learning_rate": 4.619900996522316e-07, - "loss": 0.4326, - "step": 80810 - }, - { - "epoch": 2.07, - "learning_rate": 4.6196677536676686e-07, - "loss": 0.4668, - "step": 80811 - }, - { - "epoch": 2.07, - "learning_rate": 4.61943451493249e-07, - "loss": 0.4644, - "step": 80812 - }, - { - "epoch": 2.07, - "learning_rate": 4.6192012803169633e-07, - "loss": 0.3978, - "step": 80813 - }, - { - "epoch": 2.07, - "learning_rate": 4.61896804982127e-07, - "loss": 0.3838, - "step": 80814 - }, - { - "epoch": 2.07, - "learning_rate": 4.6187348234455826e-07, - "loss": 0.3794, - "step": 80815 - }, - { - "epoch": 2.07, - "learning_rate": 4.618501601190086e-07, - "loss": 0.5713, - "step": 80816 - }, - { - "epoch": 2.07, - "learning_rate": 4.6182683830549516e-07, - "loss": 0.4038, - "step": 80817 - }, - { - "epoch": 2.07, - "learning_rate": 4.6180351690403616e-07, - "loss": 0.4373, - "step": 80818 - }, - { - "epoch": 2.07, - "learning_rate": 4.617801959146498e-07, - "loss": 0.4214, - "step": 80819 - }, - { - "epoch": 2.07, - "learning_rate": 4.617568753373532e-07, - "loss": 0.4031, - "step": 80820 - }, - { - "epoch": 2.07, - "learning_rate": 4.617335551721647e-07, - "loss": 0.4238, - "step": 80821 - }, - { - "epoch": 2.07, - "learning_rate": 4.6171023541910203e-07, - "loss": 0.2961, - "step": 80822 - }, - { - "epoch": 2.07, - "learning_rate": 4.6168691607818345e-07, - "loss": 0.429, - "step": 80823 - }, - { - "epoch": 2.07, - "learning_rate": 4.61663597149426e-07, - "loss": 0.2859, - "step": 80824 - }, - { - "epoch": 2.07, - "learning_rate": 4.6164027863284807e-07, - "loss": 0.354, - "step": 80825 - }, - { - "epoch": 2.07, - "learning_rate": 4.616169605284678e-07, - "loss": 0.3584, - "step": 80826 - }, - { - "epoch": 2.07, - "learning_rate": 4.615936428363022e-07, - "loss": 0.3611, - "step": 80827 - }, - { - "epoch": 2.07, - "learning_rate": 4.615703255563701e-07, - "loss": 0.2996, - "step": 80828 - }, - { - "epoch": 2.07, - "learning_rate": 4.6154700868868834e-07, - "loss": 0.3523, - "step": 80829 - }, - { - "epoch": 2.07, - "learning_rate": 4.615236922332754e-07, - "loss": 0.5054, - "step": 80830 - }, - { - "epoch": 2.07, - "learning_rate": 4.6150037619014925e-07, - "loss": 0.226, - "step": 80831 - }, - { - "epoch": 2.07, - "learning_rate": 4.6147706055932725e-07, - "loss": 0.5015, - "step": 80832 - }, - { - "epoch": 2.07, - "learning_rate": 4.614537453408275e-07, - "loss": 0.4216, - "step": 80833 - }, - { - "epoch": 2.07, - "learning_rate": 4.614304305346678e-07, - "loss": 0.4058, - "step": 80834 - }, - { - "epoch": 2.07, - "learning_rate": 4.6140711614086636e-07, - "loss": 0.4712, - "step": 80835 - }, - { - "epoch": 2.07, - "learning_rate": 4.613838021594408e-07, - "loss": 0.3433, - "step": 80836 - }, - { - "epoch": 2.07, - "learning_rate": 4.6136048859040856e-07, - "loss": 0.3823, - "step": 80837 - }, - { - "epoch": 2.07, - "learning_rate": 4.613371754337878e-07, - "loss": 0.4045, - "step": 80838 - }, - { - "epoch": 2.07, - "learning_rate": 4.613138626895964e-07, - "loss": 0.3506, - "step": 80839 - }, - { - "epoch": 2.07, - "learning_rate": 4.612905503578525e-07, - "loss": 0.4976, - "step": 80840 - }, - { - "epoch": 2.07, - "learning_rate": 4.612672384385734e-07, - "loss": 0.3965, - "step": 80841 - }, - { - "epoch": 2.07, - "learning_rate": 4.612439269317772e-07, - "loss": 0.3616, - "step": 80842 - }, - { - "epoch": 2.07, - "learning_rate": 4.612206158374816e-07, - "loss": 0.4233, - "step": 80843 - }, - { - "epoch": 2.07, - "learning_rate": 4.611973051557051e-07, - "loss": 0.5635, - "step": 80844 - }, - { - "epoch": 2.07, - "learning_rate": 4.611739948864647e-07, - "loss": 0.396, - "step": 80845 - }, - { - "epoch": 2.07, - "learning_rate": 4.6115068502977884e-07, - "loss": 0.3163, - "step": 80846 - }, - { - "epoch": 2.07, - "learning_rate": 4.6112737558566485e-07, - "loss": 0.5137, - "step": 80847 - }, - { - "epoch": 2.07, - "learning_rate": 4.6110406655414123e-07, - "loss": 0.4604, - "step": 80848 - }, - { - "epoch": 2.07, - "learning_rate": 4.6108075793522505e-07, - "loss": 0.415, - "step": 80849 - }, - { - "epoch": 2.07, - "learning_rate": 4.6105744972893457e-07, - "loss": 0.4561, - "step": 80850 - }, - { - "epoch": 2.07, - "learning_rate": 4.6103414193528757e-07, - "loss": 0.5278, - "step": 80851 - }, - { - "epoch": 2.07, - "learning_rate": 4.6101083455430236e-07, - "loss": 0.3506, - "step": 80852 - }, - { - "epoch": 2.07, - "learning_rate": 4.60987527585996e-07, - "loss": 0.3918, - "step": 80853 - }, - { - "epoch": 2.07, - "learning_rate": 4.609642210303867e-07, - "loss": 0.3303, - "step": 80854 - }, - { - "epoch": 2.07, - "learning_rate": 4.609409148874923e-07, - "loss": 0.3491, - "step": 80855 - }, - { - "epoch": 2.07, - "learning_rate": 4.60917609157331e-07, - "loss": 0.4551, - "step": 80856 - }, - { - "epoch": 2.07, - "learning_rate": 4.6089430383992034e-07, - "loss": 0.5986, - "step": 80857 - }, - { - "epoch": 2.07, - "learning_rate": 4.608709989352777e-07, - "loss": 0.4448, - "step": 80858 - }, - { - "epoch": 2.07, - "learning_rate": 4.6084769444342143e-07, - "loss": 0.3413, - "step": 80859 - }, - { - "epoch": 2.07, - "learning_rate": 4.608243903643693e-07, - "loss": 0.3478, - "step": 80860 - }, - { - "epoch": 2.07, - "learning_rate": 4.6080108669813945e-07, - "loss": 0.5654, - "step": 80861 - }, - { - "epoch": 2.07, - "learning_rate": 4.6077778344474903e-07, - "loss": 0.2997, - "step": 80862 - }, - { - "epoch": 2.07, - "learning_rate": 4.607544806042163e-07, - "loss": 0.4116, - "step": 80863 - }, - { - "epoch": 2.07, - "learning_rate": 4.6073117817655905e-07, - "loss": 0.3999, - "step": 80864 - }, - { - "epoch": 2.07, - "learning_rate": 4.607078761617955e-07, - "loss": 0.4351, - "step": 80865 - }, - { - "epoch": 2.07, - "learning_rate": 4.6068457455994314e-07, - "loss": 0.4253, - "step": 80866 - }, - { - "epoch": 2.07, - "learning_rate": 4.6066127337101945e-07, - "loss": 0.4038, - "step": 80867 - }, - { - "epoch": 2.07, - "learning_rate": 4.606379725950427e-07, - "loss": 0.396, - "step": 80868 - }, - { - "epoch": 2.07, - "learning_rate": 4.6061467223203086e-07, - "loss": 0.4424, - "step": 80869 - }, - { - "epoch": 2.07, - "learning_rate": 4.605913722820013e-07, - "loss": 0.4609, - "step": 80870 - }, - { - "epoch": 2.07, - "learning_rate": 4.605680727449721e-07, - "loss": 0.4956, - "step": 80871 - }, - { - "epoch": 2.07, - "learning_rate": 4.605447736209611e-07, - "loss": 0.2132, - "step": 80872 - }, - { - "epoch": 2.07, - "learning_rate": 4.605214749099866e-07, - "loss": 0.4443, - "step": 80873 - }, - { - "epoch": 2.07, - "learning_rate": 4.6049817661206556e-07, - "loss": 0.4287, - "step": 80874 - }, - { - "epoch": 2.07, - "learning_rate": 4.6047487872721633e-07, - "loss": 0.5801, - "step": 80875 - }, - { - "epoch": 2.07, - "learning_rate": 4.60451581255457e-07, - "loss": 0.3868, - "step": 80876 - }, - { - "epoch": 2.07, - "learning_rate": 4.604282841968047e-07, - "loss": 0.3496, - "step": 80877 - }, - { - "epoch": 2.07, - "learning_rate": 4.604049875512781e-07, - "loss": 0.2908, - "step": 80878 - }, - { - "epoch": 2.07, - "learning_rate": 4.6038169131889413e-07, - "loss": 0.5059, - "step": 80879 - }, - { - "epoch": 2.07, - "learning_rate": 4.6035839549967117e-07, - "loss": 0.3616, - "step": 80880 - }, - { - "epoch": 2.07, - "learning_rate": 4.6033510009362686e-07, - "loss": 0.4937, - "step": 80881 - }, - { - "epoch": 2.07, - "learning_rate": 4.603118051007796e-07, - "loss": 0.4839, - "step": 80882 - }, - { - "epoch": 2.07, - "learning_rate": 4.602885105211464e-07, - "loss": 0.5151, - "step": 80883 - }, - { - "epoch": 2.07, - "learning_rate": 4.602652163547455e-07, - "loss": 0.4729, - "step": 80884 - }, - { - "epoch": 2.07, - "learning_rate": 4.60241922601595e-07, - "loss": 0.4121, - "step": 80885 - }, - { - "epoch": 2.07, - "learning_rate": 4.602186292617124e-07, - "loss": 0.3458, - "step": 80886 - }, - { - "epoch": 2.07, - "learning_rate": 4.601953363351153e-07, - "loss": 0.4233, - "step": 80887 - }, - { - "epoch": 2.07, - "learning_rate": 4.6017204382182183e-07, - "loss": 0.4023, - "step": 80888 - }, - { - "epoch": 2.07, - "learning_rate": 4.6014875172184976e-07, - "loss": 0.5137, - "step": 80889 - }, - { - "epoch": 2.07, - "learning_rate": 4.6012546003521733e-07, - "loss": 0.4648, - "step": 80890 - }, - { - "epoch": 2.07, - "learning_rate": 4.6010216876194163e-07, - "loss": 0.519, - "step": 80891 - }, - { - "epoch": 2.07, - "learning_rate": 4.6007887790204094e-07, - "loss": 0.4155, - "step": 80892 - }, - { - "epoch": 2.07, - "learning_rate": 4.60055587455533e-07, - "loss": 0.3979, - "step": 80893 - }, - { - "epoch": 2.07, - "learning_rate": 4.6003229742243597e-07, - "loss": 0.5044, - "step": 80894 - }, - { - "epoch": 2.07, - "learning_rate": 4.6000900780276706e-07, - "loss": 0.3779, - "step": 80895 - }, - { - "epoch": 2.07, - "learning_rate": 4.599857185965448e-07, - "loss": 0.4521, - "step": 80896 - }, - { - "epoch": 2.07, - "learning_rate": 4.599624298037863e-07, - "loss": 0.5024, - "step": 80897 - }, - { - "epoch": 2.07, - "learning_rate": 4.5993914142450976e-07, - "loss": 0.3845, - "step": 80898 - }, - { - "epoch": 2.07, - "learning_rate": 4.599158534587333e-07, - "loss": 0.4038, - "step": 80899 - }, - { - "epoch": 2.07, - "learning_rate": 4.598925659064741e-07, - "loss": 0.4438, - "step": 80900 - }, - { - "epoch": 2.07, - "learning_rate": 4.5986927876775027e-07, - "loss": 0.4097, - "step": 80901 - }, - { - "epoch": 2.07, - "learning_rate": 4.5984599204257966e-07, - "loss": 0.3225, - "step": 80902 - }, - { - "epoch": 2.07, - "learning_rate": 4.598227057309806e-07, - "loss": 0.5103, - "step": 80903 - }, - { - "epoch": 2.07, - "learning_rate": 4.597994198329701e-07, - "loss": 0.5234, - "step": 80904 - }, - { - "epoch": 2.07, - "learning_rate": 4.5977613434856635e-07, - "loss": 0.3235, - "step": 80905 - }, - { - "epoch": 2.07, - "learning_rate": 4.5975284927778746e-07, - "loss": 0.5059, - "step": 80906 - }, - { - "epoch": 2.07, - "learning_rate": 4.5972956462065096e-07, - "loss": 0.5474, - "step": 80907 - }, - { - "epoch": 2.07, - "learning_rate": 4.597062803771744e-07, - "loss": 0.4023, - "step": 80908 - }, - { - "epoch": 2.07, - "learning_rate": 4.5968299654737584e-07, - "loss": 0.2737, - "step": 80909 - }, - { - "epoch": 2.07, - "learning_rate": 4.5965971313127326e-07, - "loss": 0.5342, - "step": 80910 - }, - { - "epoch": 2.07, - "learning_rate": 4.5963643012888466e-07, - "loss": 0.3239, - "step": 80911 - }, - { - "epoch": 2.07, - "learning_rate": 4.596131475402273e-07, - "loss": 0.2686, - "step": 80912 - }, - { - "epoch": 2.07, - "learning_rate": 4.595898653653193e-07, - "loss": 0.3743, - "step": 80913 - }, - { - "epoch": 2.07, - "learning_rate": 4.5956658360417846e-07, - "loss": 0.3608, - "step": 80914 - }, - { - "epoch": 2.07, - "learning_rate": 4.5954330225682294e-07, - "loss": 0.5435, - "step": 80915 - }, - { - "epoch": 2.07, - "learning_rate": 4.595200213232704e-07, - "loss": 0.4297, - "step": 80916 - }, - { - "epoch": 2.07, - "learning_rate": 4.5949674080353806e-07, - "loss": 0.438, - "step": 80917 - }, - { - "epoch": 2.07, - "learning_rate": 4.5947346069764426e-07, - "loss": 0.5293, - "step": 80918 - }, - { - "epoch": 2.07, - "learning_rate": 4.5945018100560675e-07, - "loss": 0.459, - "step": 80919 - }, - { - "epoch": 2.07, - "learning_rate": 4.594269017274437e-07, - "loss": 0.3491, - "step": 80920 - }, - { - "epoch": 2.07, - "learning_rate": 4.5940362286317237e-07, - "loss": 0.3215, - "step": 80921 - }, - { - "epoch": 2.07, - "learning_rate": 4.593803444128107e-07, - "loss": 0.4023, - "step": 80922 - }, - { - "epoch": 2.07, - "learning_rate": 4.593570663763772e-07, - "loss": 0.459, - "step": 80923 - }, - { - "epoch": 2.07, - "learning_rate": 4.593337887538886e-07, - "loss": 0.4312, - "step": 80924 - }, - { - "epoch": 2.07, - "learning_rate": 4.593105115453633e-07, - "loss": 0.4277, - "step": 80925 - }, - { - "epoch": 2.07, - "learning_rate": 4.5928723475081943e-07, - "loss": 0.3357, - "step": 80926 - }, - { - "epoch": 2.07, - "learning_rate": 4.592639583702741e-07, - "loss": 0.406, - "step": 80927 - }, - { - "epoch": 2.07, - "learning_rate": 4.592406824037459e-07, - "loss": 0.5366, - "step": 80928 - }, - { - "epoch": 2.07, - "learning_rate": 4.592174068512519e-07, - "loss": 0.4028, - "step": 80929 - }, - { - "epoch": 2.07, - "learning_rate": 4.591941317128102e-07, - "loss": 0.5957, - "step": 80930 - }, - { - "epoch": 2.07, - "learning_rate": 4.591708569884386e-07, - "loss": 0.3818, - "step": 80931 - }, - { - "epoch": 2.07, - "learning_rate": 4.591475826781556e-07, - "loss": 0.4238, - "step": 80932 - }, - { - "epoch": 2.07, - "learning_rate": 4.591243087819778e-07, - "loss": 0.49, - "step": 80933 - }, - { - "epoch": 2.07, - "learning_rate": 4.5910103529992386e-07, - "loss": 0.2736, - "step": 80934 - }, - { - "epoch": 2.07, - "learning_rate": 4.590777622320113e-07, - "loss": 0.4438, - "step": 80935 - }, - { - "epoch": 2.07, - "learning_rate": 4.5905448957825844e-07, - "loss": 0.3677, - "step": 80936 - }, - { - "epoch": 2.07, - "learning_rate": 4.5903121733868255e-07, - "loss": 0.397, - "step": 80937 - }, - { - "epoch": 2.07, - "learning_rate": 4.5900794551330137e-07, - "loss": 0.4302, - "step": 80938 - }, - { - "epoch": 2.07, - "learning_rate": 4.589846741021328e-07, - "loss": 0.4302, - "step": 80939 - }, - { - "epoch": 2.07, - "learning_rate": 4.589614031051953e-07, - "loss": 0.384, - "step": 80940 - }, - { - "epoch": 2.07, - "learning_rate": 4.5893813252250567e-07, - "loss": 0.4033, - "step": 80941 - }, - { - "epoch": 2.07, - "learning_rate": 4.589148623540824e-07, - "loss": 0.5205, - "step": 80942 - }, - { - "epoch": 2.07, - "learning_rate": 4.58891592599943e-07, - "loss": 0.3425, - "step": 80943 - }, - { - "epoch": 2.07, - "learning_rate": 4.588683232601058e-07, - "loss": 0.348, - "step": 80944 - }, - { - "epoch": 2.07, - "learning_rate": 4.58845054334588e-07, - "loss": 0.373, - "step": 80945 - }, - { - "epoch": 2.07, - "learning_rate": 4.588217858234079e-07, - "loss": 0.6011, - "step": 80946 - }, - { - "epoch": 2.07, - "learning_rate": 4.587985177265827e-07, - "loss": 0.3679, - "step": 80947 - }, - { - "epoch": 2.07, - "learning_rate": 4.5877525004413064e-07, - "loss": 0.3629, - "step": 80948 - }, - { - "epoch": 2.07, - "learning_rate": 4.5875198277606984e-07, - "loss": 0.3107, - "step": 80949 - }, - { - "epoch": 2.07, - "learning_rate": 4.587287159224175e-07, - "loss": 0.5347, - "step": 80950 - }, - { - "epoch": 2.07, - "learning_rate": 4.5870544948319144e-07, - "loss": 0.22, - "step": 80951 - }, - { - "epoch": 2.07, - "learning_rate": 4.586821834584099e-07, - "loss": 0.4033, - "step": 80952 - }, - { - "epoch": 2.07, - "learning_rate": 4.5865891784809083e-07, - "loss": 0.3657, - "step": 80953 - }, - { - "epoch": 2.07, - "learning_rate": 4.5863565265225146e-07, - "loss": 0.3245, - "step": 80954 - }, - { - "epoch": 2.07, - "learning_rate": 4.5861238787090983e-07, - "loss": 0.4209, - "step": 80955 - }, - { - "epoch": 2.07, - "learning_rate": 4.585891235040842e-07, - "loss": 0.3989, - "step": 80956 - }, - { - "epoch": 2.07, - "learning_rate": 4.5856585955179196e-07, - "loss": 0.415, - "step": 80957 - }, - { - "epoch": 2.07, - "learning_rate": 4.5854259601405055e-07, - "loss": 0.4126, - "step": 80958 - }, - { - "epoch": 2.08, - "learning_rate": 4.585193328908782e-07, - "loss": 0.3833, - "step": 80959 - }, - { - "epoch": 2.08, - "learning_rate": 4.5849607018229263e-07, - "loss": 0.4639, - "step": 80960 - }, - { - "epoch": 2.08, - "learning_rate": 4.584728078883122e-07, - "loss": 0.5322, - "step": 80961 - }, - { - "epoch": 2.08, - "learning_rate": 4.584495460089538e-07, - "loss": 0.4641, - "step": 80962 - }, - { - "epoch": 2.08, - "learning_rate": 4.584262845442357e-07, - "loss": 0.4868, - "step": 80963 - }, - { - "epoch": 2.08, - "learning_rate": 4.584030234941757e-07, - "loss": 0.4077, - "step": 80964 - }, - { - "epoch": 2.08, - "learning_rate": 4.58379762858792e-07, - "loss": 0.4209, - "step": 80965 - }, - { - "epoch": 2.08, - "learning_rate": 4.583565026381019e-07, - "loss": 0.4214, - "step": 80966 - }, - { - "epoch": 2.08, - "learning_rate": 4.5833324283212306e-07, - "loss": 0.502, - "step": 80967 - }, - { - "epoch": 2.08, - "learning_rate": 4.583099834408736e-07, - "loss": 0.3513, - "step": 80968 - }, - { - "epoch": 2.08, - "learning_rate": 4.5828672446437113e-07, - "loss": 0.4109, - "step": 80969 - }, - { - "epoch": 2.08, - "learning_rate": 4.58263465902634e-07, - "loss": 0.4414, - "step": 80970 - }, - { - "epoch": 2.08, - "learning_rate": 4.582402077556793e-07, - "loss": 0.4753, - "step": 80971 - }, - { - "epoch": 2.08, - "learning_rate": 4.582169500235252e-07, - "loss": 0.3408, - "step": 80972 - }, - { - "epoch": 2.08, - "learning_rate": 4.5819369270618937e-07, - "loss": 0.4417, - "step": 80973 - }, - { - "epoch": 2.08, - "learning_rate": 4.581704358036902e-07, - "loss": 0.4163, - "step": 80974 - }, - { - "epoch": 2.08, - "learning_rate": 4.581471793160445e-07, - "loss": 0.3525, - "step": 80975 - }, - { - "epoch": 2.08, - "learning_rate": 4.581239232432711e-07, - "loss": 0.3153, - "step": 80976 - }, - { - "epoch": 2.08, - "learning_rate": 4.581006675853869e-07, - "loss": 0.5103, - "step": 80977 - }, - { - "epoch": 2.08, - "learning_rate": 4.580774123424104e-07, - "loss": 0.4155, - "step": 80978 - }, - { - "epoch": 2.08, - "learning_rate": 4.5805415751435885e-07, - "loss": 0.4902, - "step": 80979 - }, - { - "epoch": 2.08, - "learning_rate": 4.5803090310125027e-07, - "loss": 0.4292, - "step": 80980 - }, - { - "epoch": 2.08, - "learning_rate": 4.580076491031024e-07, - "loss": 0.3821, - "step": 80981 - }, - { - "epoch": 2.08, - "learning_rate": 4.5798439551993364e-07, - "loss": 0.4482, - "step": 80982 - }, - { - "epoch": 2.08, - "learning_rate": 4.579611423517609e-07, - "loss": 0.3353, - "step": 80983 - }, - { - "epoch": 2.08, - "learning_rate": 4.5793788959860237e-07, - "loss": 0.3965, - "step": 80984 - }, - { - "epoch": 2.08, - "learning_rate": 4.579146372604763e-07, - "loss": 0.5205, - "step": 80985 - }, - { - "epoch": 2.08, - "learning_rate": 4.5789138533739956e-07, - "loss": 0.4192, - "step": 80986 - }, - { - "epoch": 2.08, - "learning_rate": 4.5786813382939096e-07, - "loss": 0.2108, - "step": 80987 - }, - { - "epoch": 2.08, - "learning_rate": 4.5784488273646736e-07, - "loss": 0.2762, - "step": 80988 - }, - { - "epoch": 2.08, - "learning_rate": 4.578216320586471e-07, - "loss": 0.4482, - "step": 80989 - }, - { - "epoch": 2.08, - "learning_rate": 4.577983817959479e-07, - "loss": 0.1984, - "step": 80990 - }, - { - "epoch": 2.08, - "learning_rate": 4.577751319483878e-07, - "loss": 0.3457, - "step": 80991 - }, - { - "epoch": 2.08, - "learning_rate": 4.5775188251598397e-07, - "loss": 0.5044, - "step": 80992 - }, - { - "epoch": 2.08, - "learning_rate": 4.577286334987547e-07, - "loss": 0.3745, - "step": 80993 - }, - { - "epoch": 2.08, - "learning_rate": 4.5770538489671797e-07, - "loss": 0.4868, - "step": 80994 - }, - { - "epoch": 2.08, - "learning_rate": 4.576821367098913e-07, - "loss": 0.3101, - "step": 80995 - }, - { - "epoch": 2.08, - "learning_rate": 4.576588889382922e-07, - "loss": 0.3082, - "step": 80996 - }, - { - "epoch": 2.08, - "learning_rate": 4.5763564158193866e-07, - "loss": 0.4463, - "step": 80997 - }, - { - "epoch": 2.08, - "learning_rate": 4.5761239464084854e-07, - "loss": 0.3945, - "step": 80998 - }, - { - "epoch": 2.08, - "learning_rate": 4.5758914811504014e-07, - "loss": 0.439, - "step": 80999 - }, - { - "epoch": 2.08, - "learning_rate": 4.5756590200453035e-07, - "loss": 0.4399, - "step": 81000 - }, - { - "epoch": 2.08, - "learning_rate": 4.575426563093374e-07, - "loss": 0.4028, - "step": 81001 - }, - { - "epoch": 2.08, - "learning_rate": 4.575194110294791e-07, - "loss": 0.3462, - "step": 81002 - }, - { - "epoch": 2.08, - "learning_rate": 4.5749616616497367e-07, - "loss": 0.4961, - "step": 81003 - }, - { - "epoch": 2.08, - "learning_rate": 4.5747292171583807e-07, - "loss": 0.5342, - "step": 81004 - }, - { - "epoch": 2.08, - "learning_rate": 4.5744967768209097e-07, - "loss": 0.4072, - "step": 81005 - }, - { - "epoch": 2.08, - "learning_rate": 4.5742643406374915e-07, - "loss": 0.5142, - "step": 81006 - }, - { - "epoch": 2.08, - "learning_rate": 4.574031908608311e-07, - "loss": 0.3945, - "step": 81007 - }, - { - "epoch": 2.08, - "learning_rate": 4.573799480733548e-07, - "loss": 0.3188, - "step": 81008 - }, - { - "epoch": 2.08, - "learning_rate": 4.573567057013373e-07, - "loss": 0.3711, - "step": 81009 - }, - { - "epoch": 2.08, - "learning_rate": 4.5733346374479697e-07, - "loss": 0.4585, - "step": 81010 - }, - { - "epoch": 2.08, - "learning_rate": 4.573102222037517e-07, - "loss": 0.3738, - "step": 81011 - }, - { - "epoch": 2.08, - "learning_rate": 4.572869810782187e-07, - "loss": 0.4846, - "step": 81012 - }, - { - "epoch": 2.08, - "learning_rate": 4.5726374036821615e-07, - "loss": 0.3333, - "step": 81013 - }, - { - "epoch": 2.08, - "learning_rate": 4.572405000737617e-07, - "loss": 0.5039, - "step": 81014 - }, - { - "epoch": 2.08, - "learning_rate": 4.572172601948737e-07, - "loss": 0.4023, - "step": 81015 - }, - { - "epoch": 2.08, - "learning_rate": 4.5719402073156944e-07, - "loss": 0.3481, - "step": 81016 - }, - { - "epoch": 2.08, - "learning_rate": 4.571707816838665e-07, - "loss": 0.4653, - "step": 81017 - }, - { - "epoch": 2.08, - "learning_rate": 4.571475430517828e-07, - "loss": 0.437, - "step": 81018 - }, - { - "epoch": 2.08, - "learning_rate": 4.5712430483533627e-07, - "loss": 0.3309, - "step": 81019 - }, - { - "epoch": 2.08, - "learning_rate": 4.571010670345451e-07, - "loss": 0.356, - "step": 81020 - }, - { - "epoch": 2.08, - "learning_rate": 4.5707782964942633e-07, - "loss": 0.3893, - "step": 81021 - }, - { - "epoch": 2.08, - "learning_rate": 4.57054592679998e-07, - "loss": 0.3689, - "step": 81022 - }, - { - "epoch": 2.08, - "learning_rate": 4.5703135612627817e-07, - "loss": 0.4429, - "step": 81023 - }, - { - "epoch": 2.08, - "learning_rate": 4.570081199882847e-07, - "loss": 0.4614, - "step": 81024 - }, - { - "epoch": 2.08, - "learning_rate": 4.569848842660352e-07, - "loss": 0.3315, - "step": 81025 - }, - { - "epoch": 2.08, - "learning_rate": 4.56961648959547e-07, - "loss": 0.4229, - "step": 81026 - }, - { - "epoch": 2.08, - "learning_rate": 4.569384140688384e-07, - "loss": 0.4829, - "step": 81027 - }, - { - "epoch": 2.08, - "learning_rate": 4.5691517959392735e-07, - "loss": 0.4022, - "step": 81028 - }, - { - "epoch": 2.08, - "learning_rate": 4.5689194553483103e-07, - "loss": 0.4285, - "step": 81029 - }, - { - "epoch": 2.08, - "learning_rate": 4.5686871189156763e-07, - "loss": 0.3672, - "step": 81030 - }, - { - "epoch": 2.08, - "learning_rate": 4.568454786641548e-07, - "loss": 0.2462, - "step": 81031 - }, - { - "epoch": 2.08, - "learning_rate": 4.5682224585261085e-07, - "loss": 0.2977, - "step": 81032 - }, - { - "epoch": 2.08, - "learning_rate": 4.567990134569527e-07, - "loss": 0.4434, - "step": 81033 - }, - { - "epoch": 2.08, - "learning_rate": 4.5677578147719866e-07, - "loss": 0.3784, - "step": 81034 - }, - { - "epoch": 2.08, - "learning_rate": 4.5675254991336663e-07, - "loss": 0.4878, - "step": 81035 - }, - { - "epoch": 2.08, - "learning_rate": 4.5672931876547395e-07, - "loss": 0.4844, - "step": 81036 - }, - { - "epoch": 2.08, - "learning_rate": 4.56706088033539e-07, - "loss": 0.4702, - "step": 81037 - }, - { - "epoch": 2.08, - "learning_rate": 4.5668285771757886e-07, - "loss": 0.4404, - "step": 81038 - }, - { - "epoch": 2.08, - "learning_rate": 4.5665962781761167e-07, - "loss": 0.3389, - "step": 81039 - }, - { - "epoch": 2.08, - "learning_rate": 4.5663639833365517e-07, - "loss": 0.4595, - "step": 81040 - }, - { - "epoch": 2.08, - "learning_rate": 4.566131692657276e-07, - "loss": 0.3373, - "step": 81041 - }, - { - "epoch": 2.08, - "learning_rate": 4.5658994061384603e-07, - "loss": 0.4893, - "step": 81042 - }, - { - "epoch": 2.08, - "learning_rate": 4.565667123780285e-07, - "loss": 0.3265, - "step": 81043 - }, - { - "epoch": 2.08, - "learning_rate": 4.5654348455829283e-07, - "loss": 0.3408, - "step": 81044 - }, - { - "epoch": 2.08, - "learning_rate": 4.5652025715465757e-07, - "loss": 0.3152, - "step": 81045 - }, - { - "epoch": 2.08, - "learning_rate": 4.5649703016713905e-07, - "loss": 0.0738, - "step": 81046 - }, - { - "epoch": 2.08, - "learning_rate": 4.564738035957557e-07, - "loss": 0.3961, - "step": 81047 - }, - { - "epoch": 2.08, - "learning_rate": 4.564505774405254e-07, - "loss": 0.52, - "step": 81048 - }, - { - "epoch": 2.08, - "learning_rate": 4.564273517014663e-07, - "loss": 0.3274, - "step": 81049 - }, - { - "epoch": 2.08, - "learning_rate": 4.564041263785954e-07, - "loss": 0.5005, - "step": 81050 - }, - { - "epoch": 2.08, - "learning_rate": 4.5638090147193087e-07, - "loss": 0.4487, - "step": 81051 - }, - { - "epoch": 2.08, - "learning_rate": 4.563576769814904e-07, - "loss": 0.3787, - "step": 81052 - }, - { - "epoch": 2.08, - "learning_rate": 4.563344529072923e-07, - "loss": 0.4873, - "step": 81053 - }, - { - "epoch": 2.08, - "learning_rate": 4.5631122924935363e-07, - "loss": 0.3833, - "step": 81054 - }, - { - "epoch": 2.08, - "learning_rate": 4.562880060076927e-07, - "loss": 0.3179, - "step": 81055 - }, - { - "epoch": 2.08, - "learning_rate": 4.562647831823268e-07, - "loss": 0.4272, - "step": 81056 - }, - { - "epoch": 2.08, - "learning_rate": 4.562415607732738e-07, - "loss": 0.4438, - "step": 81057 - }, - { - "epoch": 2.08, - "learning_rate": 4.5621833878055203e-07, - "loss": 0.4419, - "step": 81058 - }, - { - "epoch": 2.08, - "learning_rate": 4.561951172041786e-07, - "loss": 0.4344, - "step": 81059 - }, - { - "epoch": 2.08, - "learning_rate": 4.561718960441715e-07, - "loss": 0.3176, - "step": 81060 - }, - { - "epoch": 2.08, - "learning_rate": 4.5614867530054855e-07, - "loss": 0.3455, - "step": 81061 - }, - { - "epoch": 2.08, - "learning_rate": 4.56125454973328e-07, - "loss": 0.4795, - "step": 81062 - }, - { - "epoch": 2.08, - "learning_rate": 4.561022350625268e-07, - "loss": 0.266, - "step": 81063 - }, - { - "epoch": 2.08, - "learning_rate": 4.560790155681631e-07, - "loss": 0.405, - "step": 81064 - }, - { - "epoch": 2.08, - "learning_rate": 4.5605579649025496e-07, - "loss": 0.4434, - "step": 81065 - }, - { - "epoch": 2.08, - "learning_rate": 4.5603257782882e-07, - "loss": 0.326, - "step": 81066 - }, - { - "epoch": 2.08, - "learning_rate": 4.5600935958387545e-07, - "loss": 0.2787, - "step": 81067 - }, - { - "epoch": 2.08, - "learning_rate": 4.559861417554395e-07, - "loss": 0.3594, - "step": 81068 - }, - { - "epoch": 2.08, - "learning_rate": 4.5596292434353e-07, - "loss": 0.3599, - "step": 81069 - }, - { - "epoch": 2.08, - "learning_rate": 4.55939707348165e-07, - "loss": 0.333, - "step": 81070 - }, - { - "epoch": 2.08, - "learning_rate": 4.5591649076936166e-07, - "loss": 0.3982, - "step": 81071 - }, - { - "epoch": 2.08, - "learning_rate": 4.55893274607138e-07, - "loss": 0.3979, - "step": 81072 - }, - { - "epoch": 2.08, - "learning_rate": 4.558700588615119e-07, - "loss": 0.4375, - "step": 81073 - }, - { - "epoch": 2.08, - "learning_rate": 4.558468435325014e-07, - "loss": 0.4314, - "step": 81074 - }, - { - "epoch": 2.08, - "learning_rate": 4.558236286201238e-07, - "loss": 0.4448, - "step": 81075 - }, - { - "epoch": 2.08, - "learning_rate": 4.5580041412439686e-07, - "loss": 0.4785, - "step": 81076 - }, - { - "epoch": 2.08, - "learning_rate": 4.557772000453385e-07, - "loss": 0.3773, - "step": 81077 - }, - { - "epoch": 2.08, - "learning_rate": 4.5575398638296635e-07, - "loss": 0.4971, - "step": 81078 - }, - { - "epoch": 2.08, - "learning_rate": 4.557307731372989e-07, - "loss": 0.4023, - "step": 81079 - }, - { - "epoch": 2.08, - "learning_rate": 4.557075603083529e-07, - "loss": 0.5034, - "step": 81080 - }, - { - "epoch": 2.08, - "learning_rate": 4.556843478961466e-07, - "loss": 0.4312, - "step": 81081 - }, - { - "epoch": 2.08, - "learning_rate": 4.5566113590069786e-07, - "loss": 0.3787, - "step": 81082 - }, - { - "epoch": 2.08, - "learning_rate": 4.556379243220246e-07, - "loss": 0.4087, - "step": 81083 - }, - { - "epoch": 2.08, - "learning_rate": 4.556147131601441e-07, - "loss": 0.3533, - "step": 81084 - }, - { - "epoch": 2.08, - "learning_rate": 4.555915024150747e-07, - "loss": 0.3555, - "step": 81085 - }, - { - "epoch": 2.08, - "learning_rate": 4.5556829208683347e-07, - "loss": 0.3994, - "step": 81086 - }, - { - "epoch": 2.08, - "learning_rate": 4.5554508217543897e-07, - "loss": 0.4937, - "step": 81087 - }, - { - "epoch": 2.08, - "learning_rate": 4.5552187268090814e-07, - "loss": 0.366, - "step": 81088 - }, - { - "epoch": 2.08, - "learning_rate": 4.554986636032592e-07, - "loss": 0.3989, - "step": 81089 - }, - { - "epoch": 2.08, - "learning_rate": 4.5547545494250994e-07, - "loss": 0.3418, - "step": 81090 - }, - { - "epoch": 2.08, - "learning_rate": 4.554522466986784e-07, - "loss": 0.5239, - "step": 81091 - }, - { - "epoch": 2.08, - "learning_rate": 4.554290388717816e-07, - "loss": 0.5151, - "step": 81092 - }, - { - "epoch": 2.08, - "learning_rate": 4.554058314618379e-07, - "loss": 0.3779, - "step": 81093 - }, - { - "epoch": 2.08, - "learning_rate": 4.553826244688649e-07, - "loss": 0.4111, - "step": 81094 - }, - { - "epoch": 2.08, - "learning_rate": 4.553594178928807e-07, - "loss": 0.1779, - "step": 81095 - }, - { - "epoch": 2.08, - "learning_rate": 4.5533621173390266e-07, - "loss": 0.3248, - "step": 81096 - }, - { - "epoch": 2.08, - "learning_rate": 4.5531300599194833e-07, - "loss": 0.2855, - "step": 81097 - }, - { - "epoch": 2.08, - "learning_rate": 4.552898006670358e-07, - "loss": 0.3406, - "step": 81098 - }, - { - "epoch": 2.08, - "learning_rate": 4.5526659575918293e-07, - "loss": 0.4355, - "step": 81099 - }, - { - "epoch": 2.08, - "learning_rate": 4.552433912684076e-07, - "loss": 0.3799, - "step": 81100 - }, - { - "epoch": 2.08, - "learning_rate": 4.552201871947271e-07, - "loss": 0.4272, - "step": 81101 - }, - { - "epoch": 2.08, - "learning_rate": 4.551969835381594e-07, - "loss": 0.4829, - "step": 81102 - }, - { - "epoch": 2.08, - "learning_rate": 4.5517378029872265e-07, - "loss": 0.3234, - "step": 81103 - }, - { - "epoch": 2.08, - "learning_rate": 4.5515057747643393e-07, - "loss": 0.5107, - "step": 81104 - }, - { - "epoch": 2.08, - "learning_rate": 4.5512737507131174e-07, - "loss": 0.3079, - "step": 81105 - }, - { - "epoch": 2.08, - "learning_rate": 4.551041730833731e-07, - "loss": 0.3009, - "step": 81106 - }, - { - "epoch": 2.08, - "learning_rate": 4.5508097151263614e-07, - "loss": 0.5435, - "step": 81107 - }, - { - "epoch": 2.08, - "learning_rate": 4.5505777035911895e-07, - "loss": 0.3958, - "step": 81108 - }, - { - "epoch": 2.08, - "learning_rate": 4.550345696228387e-07, - "loss": 0.625, - "step": 81109 - }, - { - "epoch": 2.08, - "learning_rate": 4.5501136930381334e-07, - "loss": 0.3657, - "step": 81110 - }, - { - "epoch": 2.08, - "learning_rate": 4.5498816940206076e-07, - "loss": 0.5117, - "step": 81111 - }, - { - "epoch": 2.08, - "learning_rate": 4.54964969917599e-07, - "loss": 0.4023, - "step": 81112 - }, - { - "epoch": 2.08, - "learning_rate": 4.5494177085044515e-07, - "loss": 0.5376, - "step": 81113 - }, - { - "epoch": 2.08, - "learning_rate": 4.549185722006174e-07, - "loss": 0.3667, - "step": 81114 - }, - { - "epoch": 2.08, - "learning_rate": 4.548953739681337e-07, - "loss": 0.4116, - "step": 81115 - }, - { - "epoch": 2.08, - "learning_rate": 4.548721761530112e-07, - "loss": 0.3187, - "step": 81116 - }, - { - "epoch": 2.08, - "learning_rate": 4.548489787552685e-07, - "loss": 0.3555, - "step": 81117 - }, - { - "epoch": 2.08, - "learning_rate": 4.548257817749224e-07, - "loss": 0.3943, - "step": 81118 - }, - { - "epoch": 2.08, - "learning_rate": 4.548025852119911e-07, - "loss": 0.3984, - "step": 81119 - }, - { - "epoch": 2.08, - "learning_rate": 4.5477938906649283e-07, - "loss": 0.239, - "step": 81120 - }, - { - "epoch": 2.08, - "learning_rate": 4.547561933384444e-07, - "loss": 0.3975, - "step": 81121 - }, - { - "epoch": 2.08, - "learning_rate": 4.547329980278642e-07, - "loss": 0.2649, - "step": 81122 - }, - { - "epoch": 2.08, - "learning_rate": 4.5470980313476993e-07, - "loss": 0.4893, - "step": 81123 - }, - { - "epoch": 2.08, - "learning_rate": 4.546866086591795e-07, - "loss": 0.3909, - "step": 81124 - }, - { - "epoch": 2.08, - "learning_rate": 4.5466341460111056e-07, - "loss": 0.3452, - "step": 81125 - }, - { - "epoch": 2.08, - "learning_rate": 4.546402209605804e-07, - "loss": 0.3313, - "step": 81126 - }, - { - "epoch": 2.08, - "learning_rate": 4.5461702773760714e-07, - "loss": 0.5122, - "step": 81127 - }, - { - "epoch": 2.08, - "learning_rate": 4.545938349322085e-07, - "loss": 0.4199, - "step": 81128 - }, - { - "epoch": 2.08, - "learning_rate": 4.545706425444027e-07, - "loss": 0.3809, - "step": 81129 - }, - { - "epoch": 2.08, - "learning_rate": 4.545474505742067e-07, - "loss": 0.3672, - "step": 81130 - }, - { - "epoch": 2.08, - "learning_rate": 4.545242590216386e-07, - "loss": 0.4617, - "step": 81131 - }, - { - "epoch": 2.08, - "learning_rate": 4.545010678867163e-07, - "loss": 0.4307, - "step": 81132 - }, - { - "epoch": 2.08, - "learning_rate": 4.5447787716945773e-07, - "loss": 0.4348, - "step": 81133 - }, - { - "epoch": 2.08, - "learning_rate": 4.5445468686987997e-07, - "loss": 0.4262, - "step": 81134 - }, - { - "epoch": 2.08, - "learning_rate": 4.544314969880017e-07, - "loss": 0.479, - "step": 81135 - }, - { - "epoch": 2.08, - "learning_rate": 4.5440830752383964e-07, - "loss": 0.3804, - "step": 81136 - }, - { - "epoch": 2.08, - "learning_rate": 4.5438511847741234e-07, - "loss": 0.2686, - "step": 81137 - }, - { - "epoch": 2.08, - "learning_rate": 4.5436192984873703e-07, - "loss": 0.324, - "step": 81138 - }, - { - "epoch": 2.08, - "learning_rate": 4.543387416378317e-07, - "loss": 0.4751, - "step": 81139 - }, - { - "epoch": 2.08, - "learning_rate": 4.543155538447141e-07, - "loss": 0.3643, - "step": 81140 - }, - { - "epoch": 2.08, - "learning_rate": 4.542923664694023e-07, - "loss": 0.3207, - "step": 81141 - }, - { - "epoch": 2.08, - "learning_rate": 4.5426917951191335e-07, - "loss": 0.4902, - "step": 81142 - }, - { - "epoch": 2.08, - "learning_rate": 4.542459929722655e-07, - "loss": 0.3528, - "step": 81143 - }, - { - "epoch": 2.08, - "learning_rate": 4.542228068504763e-07, - "loss": 0.3887, - "step": 81144 - }, - { - "epoch": 2.08, - "learning_rate": 4.5419962114656405e-07, - "loss": 0.4521, - "step": 81145 - }, - { - "epoch": 2.08, - "learning_rate": 4.541764358605461e-07, - "loss": 0.2946, - "step": 81146 - }, - { - "epoch": 2.08, - "learning_rate": 4.541532509924396e-07, - "loss": 0.448, - "step": 81147 - }, - { - "epoch": 2.08, - "learning_rate": 4.5413006654226306e-07, - "loss": 0.3921, - "step": 81148 - }, - { - "epoch": 2.08, - "learning_rate": 4.5410688251003395e-07, - "loss": 0.5112, - "step": 81149 - }, - { - "epoch": 2.08, - "learning_rate": 4.5408369889577045e-07, - "loss": 0.4775, - "step": 81150 - }, - { - "epoch": 2.08, - "learning_rate": 4.5406051569948954e-07, - "loss": 0.4805, - "step": 81151 - }, - { - "epoch": 2.08, - "learning_rate": 4.540373329212095e-07, - "loss": 0.3934, - "step": 81152 - }, - { - "epoch": 2.08, - "learning_rate": 4.5401415056094793e-07, - "loss": 0.4731, - "step": 81153 - }, - { - "epoch": 2.08, - "learning_rate": 4.5399096861872286e-07, - "loss": 0.3423, - "step": 81154 - }, - { - "epoch": 2.08, - "learning_rate": 4.5396778709455196e-07, - "loss": 0.4316, - "step": 81155 - }, - { - "epoch": 2.08, - "learning_rate": 4.5394460598845243e-07, - "loss": 0.4648, - "step": 81156 - }, - { - "epoch": 2.08, - "learning_rate": 4.5392142530044244e-07, - "loss": 0.397, - "step": 81157 - }, - { - "epoch": 2.08, - "learning_rate": 4.5389824503054e-07, - "loss": 0.385, - "step": 81158 - }, - { - "epoch": 2.08, - "learning_rate": 4.5387506517876215e-07, - "loss": 0.3943, - "step": 81159 - }, - { - "epoch": 2.08, - "learning_rate": 4.538518857451271e-07, - "loss": 0.4219, - "step": 81160 - }, - { - "epoch": 2.08, - "learning_rate": 4.5382870672965255e-07, - "loss": 0.3501, - "step": 81161 - }, - { - "epoch": 2.08, - "learning_rate": 4.538055281323566e-07, - "loss": 0.4087, - "step": 81162 - }, - { - "epoch": 2.08, - "learning_rate": 4.5378234995325636e-07, - "loss": 0.4717, - "step": 81163 - }, - { - "epoch": 2.08, - "learning_rate": 4.5375917219236983e-07, - "loss": 0.4517, - "step": 81164 - }, - { - "epoch": 2.08, - "learning_rate": 4.5373599484971514e-07, - "loss": 0.3096, - "step": 81165 - }, - { - "epoch": 2.08, - "learning_rate": 4.537128179253092e-07, - "loss": 0.3406, - "step": 81166 - }, - { - "epoch": 2.08, - "learning_rate": 4.536896414191708e-07, - "loss": 0.4258, - "step": 81167 - }, - { - "epoch": 2.08, - "learning_rate": 4.5366646533131657e-07, - "loss": 0.3049, - "step": 81168 - }, - { - "epoch": 2.08, - "learning_rate": 4.536432896617649e-07, - "loss": 0.2534, - "step": 81169 - }, - { - "epoch": 2.08, - "learning_rate": 4.5362011441053336e-07, - "loss": 0.3369, - "step": 81170 - }, - { - "epoch": 2.08, - "learning_rate": 4.535969395776403e-07, - "loss": 0.4565, - "step": 81171 - }, - { - "epoch": 2.08, - "learning_rate": 4.535737651631024e-07, - "loss": 0.4717, - "step": 81172 - }, - { - "epoch": 2.08, - "learning_rate": 4.535505911669381e-07, - "loss": 0.4238, - "step": 81173 - }, - { - "epoch": 2.08, - "learning_rate": 4.535274175891652e-07, - "loss": 0.3491, - "step": 81174 - }, - { - "epoch": 2.08, - "learning_rate": 4.5350424442980137e-07, - "loss": 0.4429, - "step": 81175 - }, - { - "epoch": 2.08, - "learning_rate": 4.5348107168886387e-07, - "loss": 0.5044, - "step": 81176 - }, - { - "epoch": 2.08, - "learning_rate": 4.534578993663706e-07, - "loss": 0.3821, - "step": 81177 - }, - { - "epoch": 2.08, - "learning_rate": 4.534347274623396e-07, - "loss": 0.3945, - "step": 81178 - }, - { - "epoch": 2.08, - "learning_rate": 4.534115559767888e-07, - "loss": 0.2937, - "step": 81179 - }, - { - "epoch": 2.08, - "learning_rate": 4.5338838490973543e-07, - "loss": 0.4209, - "step": 81180 - }, - { - "epoch": 2.08, - "learning_rate": 4.533652142611972e-07, - "loss": 0.3181, - "step": 81181 - }, - { - "epoch": 2.08, - "learning_rate": 4.5334204403119226e-07, - "loss": 0.3687, - "step": 81182 - }, - { - "epoch": 2.08, - "learning_rate": 4.533188742197386e-07, - "loss": 0.3997, - "step": 81183 - }, - { - "epoch": 2.08, - "learning_rate": 4.5329570482685297e-07, - "loss": 0.4431, - "step": 81184 - }, - { - "epoch": 2.08, - "learning_rate": 4.532725358525542e-07, - "loss": 0.4824, - "step": 81185 - }, - { - "epoch": 2.08, - "learning_rate": 4.5324936729685915e-07, - "loss": 0.3035, - "step": 81186 - }, - { - "epoch": 2.08, - "learning_rate": 4.532261991597858e-07, - "loss": 0.3311, - "step": 81187 - }, - { - "epoch": 2.08, - "learning_rate": 4.5320303144135244e-07, - "loss": 0.4629, - "step": 81188 - }, - { - "epoch": 2.08, - "learning_rate": 4.5317986414157607e-07, - "loss": 0.4756, - "step": 81189 - }, - { - "epoch": 2.08, - "learning_rate": 4.531566972604747e-07, - "loss": 0.4893, - "step": 81190 - }, - { - "epoch": 2.08, - "learning_rate": 4.5313353079806637e-07, - "loss": 0.4956, - "step": 81191 - }, - { - "epoch": 2.08, - "learning_rate": 4.5311036475436824e-07, - "loss": 0.3508, - "step": 81192 - }, - { - "epoch": 2.08, - "learning_rate": 4.530871991293984e-07, - "loss": 0.4722, - "step": 81193 - }, - { - "epoch": 2.08, - "learning_rate": 4.530640339231745e-07, - "loss": 0.5303, - "step": 81194 - }, - { - "epoch": 2.08, - "learning_rate": 4.530408691357147e-07, - "loss": 0.3403, - "step": 81195 - }, - { - "epoch": 2.08, - "learning_rate": 4.530177047670364e-07, - "loss": 0.4844, - "step": 81196 - }, - { - "epoch": 2.08, - "learning_rate": 4.529945408171569e-07, - "loss": 0.3848, - "step": 81197 - }, - { - "epoch": 2.08, - "learning_rate": 4.5297137728609436e-07, - "loss": 0.4211, - "step": 81198 - }, - { - "epoch": 2.08, - "learning_rate": 4.529482141738664e-07, - "loss": 0.3257, - "step": 81199 - }, - { - "epoch": 2.08, - "learning_rate": 4.529250514804912e-07, - "loss": 0.2804, - "step": 81200 - }, - { - "epoch": 2.08, - "learning_rate": 4.529018892059858e-07, - "loss": 0.4702, - "step": 81201 - }, - { - "epoch": 2.08, - "learning_rate": 4.5287872735036835e-07, - "loss": 0.4648, - "step": 81202 - }, - { - "epoch": 2.08, - "learning_rate": 4.528555659136565e-07, - "loss": 0.3356, - "step": 81203 - }, - { - "epoch": 2.08, - "learning_rate": 4.5283240489586826e-07, - "loss": 0.3291, - "step": 81204 - }, - { - "epoch": 2.08, - "learning_rate": 4.5280924429702105e-07, - "loss": 0.4268, - "step": 81205 - }, - { - "epoch": 2.08, - "learning_rate": 4.527860841171324e-07, - "loss": 0.3575, - "step": 81206 - }, - { - "epoch": 2.08, - "learning_rate": 4.527629243562202e-07, - "loss": 0.4902, - "step": 81207 - }, - { - "epoch": 2.08, - "learning_rate": 4.527397650143027e-07, - "loss": 0.4727, - "step": 81208 - }, - { - "epoch": 2.08, - "learning_rate": 4.527166060913967e-07, - "loss": 0.4932, - "step": 81209 - }, - { - "epoch": 2.08, - "learning_rate": 4.526934475875205e-07, - "loss": 0.3394, - "step": 81210 - }, - { - "epoch": 2.08, - "learning_rate": 4.526702895026918e-07, - "loss": 0.4614, - "step": 81211 - }, - { - "epoch": 2.08, - "learning_rate": 4.526471318369286e-07, - "loss": 0.4092, - "step": 81212 - }, - { - "epoch": 2.08, - "learning_rate": 4.5262397459024803e-07, - "loss": 0.4761, - "step": 81213 - }, - { - "epoch": 2.08, - "learning_rate": 4.526008177626681e-07, - "loss": 0.4473, - "step": 81214 - }, - { - "epoch": 2.08, - "learning_rate": 4.525776613542068e-07, - "loss": 0.5039, - "step": 81215 - }, - { - "epoch": 2.08, - "learning_rate": 4.5255450536488135e-07, - "loss": 0.3896, - "step": 81216 - }, - { - "epoch": 2.08, - "learning_rate": 4.525313497947102e-07, - "loss": 0.3064, - "step": 81217 - }, - { - "epoch": 2.08, - "learning_rate": 4.5250819464371013e-07, - "loss": 0.3455, - "step": 81218 - }, - { - "epoch": 2.08, - "learning_rate": 4.5248503991189937e-07, - "loss": 0.3516, - "step": 81219 - }, - { - "epoch": 2.08, - "learning_rate": 4.5246188559929563e-07, - "loss": 0.324, - "step": 81220 - }, - { - "epoch": 2.08, - "learning_rate": 4.5243873170591704e-07, - "loss": 0.3624, - "step": 81221 - }, - { - "epoch": 2.08, - "learning_rate": 4.524155782317807e-07, - "loss": 0.3833, - "step": 81222 - }, - { - "epoch": 2.08, - "learning_rate": 4.5239242517690436e-07, - "loss": 0.3523, - "step": 81223 - }, - { - "epoch": 2.08, - "learning_rate": 4.5236927254130607e-07, - "loss": 0.5186, - "step": 81224 - }, - { - "epoch": 2.08, - "learning_rate": 4.5234612032500416e-07, - "loss": 0.4124, - "step": 81225 - }, - { - "epoch": 2.08, - "learning_rate": 4.5232296852801486e-07, - "loss": 0.3147, - "step": 81226 - }, - { - "epoch": 2.08, - "learning_rate": 4.5229981715035684e-07, - "loss": 0.4497, - "step": 81227 - }, - { - "epoch": 2.08, - "learning_rate": 4.522766661920475e-07, - "loss": 0.2792, - "step": 81228 - }, - { - "epoch": 2.08, - "learning_rate": 4.522535156531051e-07, - "loss": 0.2914, - "step": 81229 - }, - { - "epoch": 2.08, - "learning_rate": 4.5223036553354666e-07, - "loss": 0.4146, - "step": 81230 - }, - { - "epoch": 2.08, - "learning_rate": 4.5220721583339027e-07, - "loss": 0.5195, - "step": 81231 - }, - { - "epoch": 2.08, - "learning_rate": 4.5218406655265363e-07, - "loss": 0.3254, - "step": 81232 - }, - { - "epoch": 2.08, - "learning_rate": 4.521609176913549e-07, - "loss": 0.3103, - "step": 81233 - }, - { - "epoch": 2.08, - "learning_rate": 4.5213776924951084e-07, - "loss": 0.3335, - "step": 81234 - }, - { - "epoch": 2.08, - "learning_rate": 4.5211462122714017e-07, - "loss": 0.4219, - "step": 81235 - }, - { - "epoch": 2.08, - "learning_rate": 4.520914736242597e-07, - "loss": 0.406, - "step": 81236 - }, - { - "epoch": 2.08, - "learning_rate": 4.5206832644088765e-07, - "loss": 0.4038, - "step": 81237 - }, - { - "epoch": 2.08, - "learning_rate": 4.52045179677042e-07, - "loss": 0.4238, - "step": 81238 - }, - { - "epoch": 2.08, - "learning_rate": 4.520220333327399e-07, - "loss": 0.4966, - "step": 81239 - }, - { - "epoch": 2.08, - "learning_rate": 4.519988874079993e-07, - "loss": 0.5918, - "step": 81240 - }, - { - "epoch": 2.08, - "learning_rate": 4.519757419028379e-07, - "loss": 0.3304, - "step": 81241 - }, - { - "epoch": 2.08, - "learning_rate": 4.5195259681727394e-07, - "loss": 0.4609, - "step": 81242 - }, - { - "epoch": 2.08, - "learning_rate": 4.5192945215132415e-07, - "loss": 0.5195, - "step": 81243 - }, - { - "epoch": 2.08, - "learning_rate": 4.519063079050069e-07, - "loss": 0.5107, - "step": 81244 - }, - { - "epoch": 2.08, - "learning_rate": 4.5188316407834015e-07, - "loss": 0.2512, - "step": 81245 - }, - { - "epoch": 2.08, - "learning_rate": 4.518600206713412e-07, - "loss": 0.4526, - "step": 81246 - }, - { - "epoch": 2.08, - "learning_rate": 4.5183687768402744e-07, - "loss": 0.3308, - "step": 81247 - }, - { - "epoch": 2.08, - "learning_rate": 4.5181373511641707e-07, - "loss": 0.5073, - "step": 81248 - }, - { - "epoch": 2.08, - "learning_rate": 4.5179059296852773e-07, - "loss": 0.4165, - "step": 81249 - }, - { - "epoch": 2.08, - "learning_rate": 4.517674512403774e-07, - "loss": 0.4009, - "step": 81250 - }, - { - "epoch": 2.08, - "learning_rate": 4.517443099319832e-07, - "loss": 0.5098, - "step": 81251 - }, - { - "epoch": 2.08, - "learning_rate": 4.517211690433632e-07, - "loss": 0.3621, - "step": 81252 - }, - { - "epoch": 2.08, - "learning_rate": 4.51698028574535e-07, - "loss": 0.5952, - "step": 81253 - }, - { - "epoch": 2.08, - "learning_rate": 4.5167488852551683e-07, - "loss": 0.5713, - "step": 81254 - }, - { - "epoch": 2.08, - "learning_rate": 4.5165174889632607e-07, - "loss": 0.479, - "step": 81255 - }, - { - "epoch": 2.08, - "learning_rate": 4.516286096869798e-07, - "loss": 0.3732, - "step": 81256 - }, - { - "epoch": 2.08, - "learning_rate": 4.5160547089749645e-07, - "loss": 0.4507, - "step": 81257 - }, - { - "epoch": 2.08, - "learning_rate": 4.5158233252789345e-07, - "loss": 0.4346, - "step": 81258 - }, - { - "epoch": 2.08, - "learning_rate": 4.515591945781891e-07, - "loss": 0.4666, - "step": 81259 - }, - { - "epoch": 2.08, - "learning_rate": 4.515360570484003e-07, - "loss": 0.5093, - "step": 81260 - }, - { - "epoch": 2.08, - "learning_rate": 4.515129199385451e-07, - "loss": 0.4619, - "step": 81261 - }, - { - "epoch": 2.08, - "learning_rate": 4.5148978324864116e-07, - "loss": 0.4329, - "step": 81262 - }, - { - "epoch": 2.08, - "learning_rate": 4.514666469787067e-07, - "loss": 0.4908, - "step": 81263 - }, - { - "epoch": 2.08, - "learning_rate": 4.5144351112875864e-07, - "loss": 0.3843, - "step": 81264 - }, - { - "epoch": 2.08, - "learning_rate": 4.514203756988155e-07, - "loss": 0.5415, - "step": 81265 - }, - { - "epoch": 2.08, - "learning_rate": 4.5139724068889404e-07, - "loss": 0.4146, - "step": 81266 - }, - { - "epoch": 2.08, - "learning_rate": 4.5137410609901303e-07, - "loss": 0.3284, - "step": 81267 - }, - { - "epoch": 2.08, - "learning_rate": 4.5135097192918916e-07, - "loss": 0.3691, - "step": 81268 - }, - { - "epoch": 2.08, - "learning_rate": 4.5132783817944065e-07, - "loss": 0.4521, - "step": 81269 - }, - { - "epoch": 2.08, - "learning_rate": 4.513047048497851e-07, - "loss": 0.3281, - "step": 81270 - }, - { - "epoch": 2.08, - "learning_rate": 4.5128157194024075e-07, - "loss": 0.2812, - "step": 81271 - }, - { - "epoch": 2.08, - "learning_rate": 4.5125843945082453e-07, - "loss": 0.5186, - "step": 81272 - }, - { - "epoch": 2.08, - "learning_rate": 4.5123530738155444e-07, - "loss": 0.4077, - "step": 81273 - }, - { - "epoch": 2.08, - "learning_rate": 4.5121217573244864e-07, - "loss": 0.4966, - "step": 81274 - }, - { - "epoch": 2.08, - "learning_rate": 4.511890445035241e-07, - "loss": 0.3767, - "step": 81275 - }, - { - "epoch": 2.08, - "learning_rate": 4.511659136947992e-07, - "loss": 0.4132, - "step": 81276 - }, - { - "epoch": 2.08, - "learning_rate": 4.5114278330629096e-07, - "loss": 0.3499, - "step": 81277 - }, - { - "epoch": 2.08, - "learning_rate": 4.511196533380175e-07, - "loss": 0.4106, - "step": 81278 - }, - { - "epoch": 2.08, - "learning_rate": 4.510965237899964e-07, - "loss": 0.4956, - "step": 81279 - }, - { - "epoch": 2.08, - "learning_rate": 4.5107339466224583e-07, - "loss": 0.4712, - "step": 81280 - }, - { - "epoch": 2.08, - "learning_rate": 4.510502659547828e-07, - "loss": 0.3245, - "step": 81281 - }, - { - "epoch": 2.08, - "learning_rate": 4.5102713766762536e-07, - "loss": 0.3774, - "step": 81282 - }, - { - "epoch": 2.08, - "learning_rate": 4.5100400980079155e-07, - "loss": 0.3973, - "step": 81283 - }, - { - "epoch": 2.08, - "learning_rate": 4.5098088235429864e-07, - "loss": 0.3872, - "step": 81284 - }, - { - "epoch": 2.08, - "learning_rate": 4.5095775532816414e-07, - "loss": 0.4033, - "step": 81285 - }, - { - "epoch": 2.08, - "learning_rate": 4.5093462872240606e-07, - "loss": 0.3848, - "step": 81286 - }, - { - "epoch": 2.08, - "learning_rate": 4.50911502537042e-07, - "loss": 0.4771, - "step": 81287 - }, - { - "epoch": 2.08, - "learning_rate": 4.5088837677209025e-07, - "loss": 0.2858, - "step": 81288 - }, - { - "epoch": 2.08, - "learning_rate": 4.508652514275675e-07, - "loss": 0.4814, - "step": 81289 - }, - { - "epoch": 2.08, - "learning_rate": 4.5084212650349207e-07, - "loss": 0.3118, - "step": 81290 - }, - { - "epoch": 2.08, - "learning_rate": 4.5081900199988156e-07, - "loss": 0.4006, - "step": 81291 - }, - { - "epoch": 2.08, - "learning_rate": 4.507958779167541e-07, - "loss": 0.4111, - "step": 81292 - }, - { - "epoch": 2.08, - "learning_rate": 4.5077275425412655e-07, - "loss": 0.3433, - "step": 81293 - }, - { - "epoch": 2.08, - "learning_rate": 4.5074963101201746e-07, - "loss": 0.4546, - "step": 81294 - }, - { - "epoch": 2.08, - "learning_rate": 4.5072650819044366e-07, - "loss": 0.4351, - "step": 81295 - }, - { - "epoch": 2.08, - "learning_rate": 4.5070338578942346e-07, - "loss": 0.4175, - "step": 81296 - }, - { - "epoch": 2.08, - "learning_rate": 4.506802638089747e-07, - "loss": 0.3734, - "step": 81297 - }, - { - "epoch": 2.08, - "learning_rate": 4.5065714224911445e-07, - "loss": 0.3735, - "step": 81298 - }, - { - "epoch": 2.08, - "learning_rate": 4.506340211098607e-07, - "loss": 0.4634, - "step": 81299 - }, - { - "epoch": 2.08, - "learning_rate": 4.506109003912317e-07, - "loss": 0.4233, - "step": 81300 - }, - { - "epoch": 2.08, - "learning_rate": 4.5058778009324425e-07, - "loss": 0.4331, - "step": 81301 - }, - { - "epoch": 2.08, - "learning_rate": 4.5056466021591653e-07, - "loss": 0.4702, - "step": 81302 - }, - { - "epoch": 2.08, - "learning_rate": 4.505415407592661e-07, - "loss": 0.502, - "step": 81303 - }, - { - "epoch": 2.08, - "learning_rate": 4.505184217233111e-07, - "loss": 0.3389, - "step": 81304 - }, - { - "epoch": 2.08, - "learning_rate": 4.5049530310806904e-07, - "loss": 0.3994, - "step": 81305 - }, - { - "epoch": 2.08, - "learning_rate": 4.50472184913557e-07, - "loss": 0.4292, - "step": 81306 - }, - { - "epoch": 2.08, - "learning_rate": 4.50449067139793e-07, - "loss": 0.439, - "step": 81307 - }, - { - "epoch": 2.08, - "learning_rate": 4.5042594978679505e-07, - "loss": 0.5088, - "step": 81308 - }, - { - "epoch": 2.08, - "learning_rate": 4.5040283285458103e-07, - "loss": 0.4531, - "step": 81309 - }, - { - "epoch": 2.08, - "learning_rate": 4.5037971634316784e-07, - "loss": 0.3384, - "step": 81310 - }, - { - "epoch": 2.08, - "learning_rate": 4.503566002525737e-07, - "loss": 0.4922, - "step": 81311 - }, - { - "epoch": 2.08, - "learning_rate": 4.503334845828163e-07, - "loss": 0.3564, - "step": 81312 - }, - { - "epoch": 2.08, - "learning_rate": 4.5031036933391355e-07, - "loss": 0.3745, - "step": 81313 - }, - { - "epoch": 2.08, - "learning_rate": 4.502872545058829e-07, - "loss": 0.2004, - "step": 81314 - }, - { - "epoch": 2.08, - "learning_rate": 4.502641400987416e-07, - "loss": 0.4004, - "step": 81315 - }, - { - "epoch": 2.08, - "learning_rate": 4.502410261125078e-07, - "loss": 0.3385, - "step": 81316 - }, - { - "epoch": 2.08, - "learning_rate": 4.5021791254719955e-07, - "loss": 0.4238, - "step": 81317 - }, - { - "epoch": 2.08, - "learning_rate": 4.5019479940283376e-07, - "loss": 0.5112, - "step": 81318 - }, - { - "epoch": 2.08, - "learning_rate": 4.501716866794286e-07, - "loss": 0.3787, - "step": 81319 - }, - { - "epoch": 2.08, - "learning_rate": 4.501485743770017e-07, - "loss": 0.3015, - "step": 81320 - }, - { - "epoch": 2.08, - "learning_rate": 4.5012546249557105e-07, - "loss": 0.5796, - "step": 81321 - }, - { - "epoch": 2.08, - "learning_rate": 4.501023510351537e-07, - "loss": 0.3751, - "step": 81322 - }, - { - "epoch": 2.08, - "learning_rate": 4.500792399957678e-07, - "loss": 0.4004, - "step": 81323 - }, - { - "epoch": 2.08, - "learning_rate": 4.500561293774312e-07, - "loss": 0.4448, - "step": 81324 - }, - { - "epoch": 2.08, - "learning_rate": 4.50033019180161e-07, - "loss": 0.4272, - "step": 81325 - }, - { - "epoch": 2.08, - "learning_rate": 4.5000990940397556e-07, - "loss": 0.4453, - "step": 81326 - }, - { - "epoch": 2.08, - "learning_rate": 4.499868000488919e-07, - "loss": 0.3309, - "step": 81327 - }, - { - "epoch": 2.08, - "learning_rate": 4.4996369111492806e-07, - "loss": 0.4214, - "step": 81328 - }, - { - "epoch": 2.08, - "learning_rate": 4.499405826021018e-07, - "loss": 0.4751, - "step": 81329 - }, - { - "epoch": 2.08, - "learning_rate": 4.4991747451043094e-07, - "loss": 0.3054, - "step": 81330 - }, - { - "epoch": 2.08, - "learning_rate": 4.4989436683993277e-07, - "loss": 0.4292, - "step": 81331 - }, - { - "epoch": 2.08, - "learning_rate": 4.498712595906251e-07, - "loss": 0.4438, - "step": 81332 - }, - { - "epoch": 2.08, - "learning_rate": 4.4984815276252573e-07, - "loss": 0.4448, - "step": 81333 - }, - { - "epoch": 2.08, - "learning_rate": 4.498250463556531e-07, - "loss": 0.3936, - "step": 81334 - }, - { - "epoch": 2.08, - "learning_rate": 4.498019403700234e-07, - "loss": 0.4211, - "step": 81335 - }, - { - "epoch": 2.08, - "learning_rate": 4.49778834805655e-07, - "loss": 0.522, - "step": 81336 - }, - { - "epoch": 2.08, - "learning_rate": 4.497557296625657e-07, - "loss": 0.5591, - "step": 81337 - }, - { - "epoch": 2.08, - "learning_rate": 4.497326249407735e-07, - "loss": 0.3539, - "step": 81338 - }, - { - "epoch": 2.08, - "learning_rate": 4.497095206402953e-07, - "loss": 0.4358, - "step": 81339 - }, - { - "epoch": 2.08, - "learning_rate": 4.496864167611493e-07, - "loss": 0.4102, - "step": 81340 - }, - { - "epoch": 2.08, - "learning_rate": 4.4966331330335306e-07, - "loss": 0.3267, - "step": 81341 - }, - { - "epoch": 2.08, - "learning_rate": 4.4964021026692466e-07, - "loss": 0.3748, - "step": 81342 - }, - { - "epoch": 2.08, - "learning_rate": 4.496171076518811e-07, - "loss": 0.3785, - "step": 81343 - }, - { - "epoch": 2.08, - "learning_rate": 4.4959400545824076e-07, - "loss": 0.3853, - "step": 81344 - }, - { - "epoch": 2.08, - "learning_rate": 4.495709036860207e-07, - "loss": 0.353, - "step": 81345 - }, - { - "epoch": 2.08, - "learning_rate": 4.495478023352388e-07, - "loss": 0.395, - "step": 81346 - }, - { - "epoch": 2.08, - "learning_rate": 4.4952470140591325e-07, - "loss": 0.3508, - "step": 81347 - }, - { - "epoch": 2.08, - "learning_rate": 4.495016008980609e-07, - "loss": 0.4526, - "step": 81348 - }, - { - "epoch": 2.09, - "learning_rate": 4.494785008116999e-07, - "loss": 0.3813, - "step": 81349 - }, - { - "epoch": 2.09, - "learning_rate": 4.49455401146848e-07, - "loss": 0.5049, - "step": 81350 - }, - { - "epoch": 2.09, - "learning_rate": 4.49432301903523e-07, - "loss": 0.5049, - "step": 81351 - }, - { - "epoch": 2.09, - "learning_rate": 4.4940920308174203e-07, - "loss": 0.3628, - "step": 81352 - }, - { - "epoch": 2.09, - "learning_rate": 4.4938610468152316e-07, - "loss": 0.4402, - "step": 81353 - }, - { - "epoch": 2.09, - "learning_rate": 4.493630067028844e-07, - "loss": 0.4004, - "step": 81354 - }, - { - "epoch": 2.09, - "learning_rate": 4.493399091458431e-07, - "loss": 0.4429, - "step": 81355 - }, - { - "epoch": 2.09, - "learning_rate": 4.4931681201041647e-07, - "loss": 0.4037, - "step": 81356 - }, - { - "epoch": 2.09, - "learning_rate": 4.492937152966226e-07, - "loss": 0.3988, - "step": 81357 - }, - { - "epoch": 2.09, - "learning_rate": 4.492706190044793e-07, - "loss": 0.2332, - "step": 81358 - }, - { - "epoch": 2.09, - "learning_rate": 4.4924752313400447e-07, - "loss": 0.3516, - "step": 81359 - }, - { - "epoch": 2.09, - "learning_rate": 4.492244276852152e-07, - "loss": 0.4272, - "step": 81360 - }, - { - "epoch": 2.09, - "learning_rate": 4.4920133265812945e-07, - "loss": 0.4526, - "step": 81361 - }, - { - "epoch": 2.09, - "learning_rate": 4.4917823805276477e-07, - "loss": 0.4385, - "step": 81362 - }, - { - "epoch": 2.09, - "learning_rate": 4.4915514386913954e-07, - "loss": 0.4556, - "step": 81363 - }, - { - "epoch": 2.09, - "learning_rate": 4.491320501072707e-07, - "loss": 0.4717, - "step": 81364 - }, - { - "epoch": 2.09, - "learning_rate": 4.4910895676717595e-07, - "loss": 0.4443, - "step": 81365 - }, - { - "epoch": 2.09, - "learning_rate": 4.4908586384887305e-07, - "loss": 0.4048, - "step": 81366 - }, - { - "epoch": 2.09, - "learning_rate": 4.490627713523798e-07, - "loss": 0.311, - "step": 81367 - }, - { - "epoch": 2.09, - "learning_rate": 4.4903967927771415e-07, - "loss": 0.2778, - "step": 81368 - }, - { - "epoch": 2.09, - "learning_rate": 4.4901658762489314e-07, - "loss": 0.5142, - "step": 81369 - }, - { - "epoch": 2.09, - "learning_rate": 4.489934963939348e-07, - "loss": 0.2972, - "step": 81370 - }, - { - "epoch": 2.09, - "learning_rate": 4.489704055848572e-07, - "loss": 0.401, - "step": 81371 - }, - { - "epoch": 2.09, - "learning_rate": 4.489473151976773e-07, - "loss": 0.4246, - "step": 81372 - }, - { - "epoch": 2.09, - "learning_rate": 4.4892422523241303e-07, - "loss": 0.396, - "step": 81373 - }, - { - "epoch": 2.09, - "learning_rate": 4.489011356890825e-07, - "loss": 0.4141, - "step": 81374 - }, - { - "epoch": 2.09, - "learning_rate": 4.488780465677027e-07, - "loss": 0.3374, - "step": 81375 - }, - { - "epoch": 2.09, - "learning_rate": 4.4885495786829197e-07, - "loss": 0.481, - "step": 81376 - }, - { - "epoch": 2.09, - "learning_rate": 4.488318695908673e-07, - "loss": 0.353, - "step": 81377 - }, - { - "epoch": 2.09, - "learning_rate": 4.4880878173544676e-07, - "loss": 0.4038, - "step": 81378 - }, - { - "epoch": 2.09, - "learning_rate": 4.4878569430204796e-07, - "loss": 0.3562, - "step": 81379 - }, - { - "epoch": 2.09, - "learning_rate": 4.4876260729068893e-07, - "loss": 0.4688, - "step": 81380 - }, - { - "epoch": 2.09, - "learning_rate": 4.487395207013868e-07, - "loss": 0.3467, - "step": 81381 - }, - { - "epoch": 2.09, - "learning_rate": 4.487164345341593e-07, - "loss": 0.4409, - "step": 81382 - }, - { - "epoch": 2.09, - "learning_rate": 4.486933487890244e-07, - "loss": 0.4873, - "step": 81383 - }, - { - "epoch": 2.09, - "learning_rate": 4.48670263466e-07, - "loss": 0.436, - "step": 81384 - }, - { - "epoch": 2.09, - "learning_rate": 4.4864717856510334e-07, - "loss": 0.4414, - "step": 81385 - }, - { - "epoch": 2.09, - "learning_rate": 4.486240940863519e-07, - "loss": 0.3304, - "step": 81386 - }, - { - "epoch": 2.09, - "learning_rate": 4.4860101002976356e-07, - "loss": 0.4492, - "step": 81387 - }, - { - "epoch": 2.09, - "learning_rate": 4.4857792639535666e-07, - "loss": 0.4243, - "step": 81388 - }, - { - "epoch": 2.09, - "learning_rate": 4.485548431831476e-07, - "loss": 0.3771, - "step": 81389 - }, - { - "epoch": 2.09, - "learning_rate": 4.48531760393155e-07, - "loss": 0.4844, - "step": 81390 - }, - { - "epoch": 2.09, - "learning_rate": 4.4850867802539617e-07, - "loss": 0.387, - "step": 81391 - }, - { - "epoch": 2.09, - "learning_rate": 4.484855960798892e-07, - "loss": 0.2753, - "step": 81392 - }, - { - "epoch": 2.09, - "learning_rate": 4.484625145566512e-07, - "loss": 0.5161, - "step": 81393 - }, - { - "epoch": 2.09, - "learning_rate": 4.4843943345570036e-07, - "loss": 0.3867, - "step": 81394 - }, - { - "epoch": 2.09, - "learning_rate": 4.4841635277705383e-07, - "loss": 0.3936, - "step": 81395 - }, - { - "epoch": 2.09, - "learning_rate": 4.4839327252072946e-07, - "loss": 0.4097, - "step": 81396 - }, - { - "epoch": 2.09, - "learning_rate": 4.4837019268674535e-07, - "loss": 0.3335, - "step": 81397 - }, - { - "epoch": 2.09, - "learning_rate": 4.4834711327511844e-07, - "loss": 0.3999, - "step": 81398 - }, - { - "epoch": 2.09, - "learning_rate": 4.4832403428586685e-07, - "loss": 0.3813, - "step": 81399 - }, - { - "epoch": 2.09, - "learning_rate": 4.483009557190081e-07, - "loss": 0.4482, - "step": 81400 - }, - { - "epoch": 2.09, - "learning_rate": 4.4827787757456036e-07, - "loss": 0.4199, - "step": 81401 - }, - { - "epoch": 2.09, - "learning_rate": 4.4825479985254046e-07, - "loss": 0.3645, - "step": 81402 - }, - { - "epoch": 2.09, - "learning_rate": 4.482317225529666e-07, - "loss": 0.4204, - "step": 81403 - }, - { - "epoch": 2.09, - "learning_rate": 4.482086456758566e-07, - "loss": 0.3928, - "step": 81404 - }, - { - "epoch": 2.09, - "learning_rate": 4.4818556922122755e-07, - "loss": 0.3325, - "step": 81405 - }, - { - "epoch": 2.09, - "learning_rate": 4.4816249318909783e-07, - "loss": 0.5127, - "step": 81406 - }, - { - "epoch": 2.09, - "learning_rate": 4.4813941757948424e-07, - "loss": 0.3816, - "step": 81407 - }, - { - "epoch": 2.09, - "learning_rate": 4.4811634239240504e-07, - "loss": 0.4565, - "step": 81408 - }, - { - "epoch": 2.09, - "learning_rate": 4.48093267627878e-07, - "loss": 0.3542, - "step": 81409 - }, - { - "epoch": 2.09, - "learning_rate": 4.4807019328592034e-07, - "loss": 0.4326, - "step": 81410 - }, - { - "epoch": 2.09, - "learning_rate": 4.4804711936654993e-07, - "loss": 0.4546, - "step": 81411 - }, - { - "epoch": 2.09, - "learning_rate": 4.480240458697845e-07, - "loss": 0.4609, - "step": 81412 - }, - { - "epoch": 2.09, - "learning_rate": 4.48000972795642e-07, - "loss": 0.4648, - "step": 81413 - }, - { - "epoch": 2.09, - "learning_rate": 4.4797790014413973e-07, - "loss": 0.4761, - "step": 81414 - }, - { - "epoch": 2.09, - "learning_rate": 4.4795482791529504e-07, - "loss": 0.3789, - "step": 81415 - }, - { - "epoch": 2.09, - "learning_rate": 4.4793175610912604e-07, - "loss": 0.3513, - "step": 81416 - }, - { - "epoch": 2.09, - "learning_rate": 4.4790868472565025e-07, - "loss": 0.5059, - "step": 81417 - }, - { - "epoch": 2.09, - "learning_rate": 4.478856137648858e-07, - "loss": 0.4751, - "step": 81418 - }, - { - "epoch": 2.09, - "learning_rate": 4.4786254322684945e-07, - "loss": 0.3391, - "step": 81419 - }, - { - "epoch": 2.09, - "learning_rate": 4.4783947311155944e-07, - "loss": 0.4697, - "step": 81420 - }, - { - "epoch": 2.09, - "learning_rate": 4.4781640341903336e-07, - "loss": 0.3735, - "step": 81421 - }, - { - "epoch": 2.09, - "learning_rate": 4.4779333414928933e-07, - "loss": 0.3477, - "step": 81422 - }, - { - "epoch": 2.09, - "learning_rate": 4.4777026530234407e-07, - "loss": 0.4225, - "step": 81423 - }, - { - "epoch": 2.09, - "learning_rate": 4.4774719687821616e-07, - "loss": 0.3307, - "step": 81424 - }, - { - "epoch": 2.09, - "learning_rate": 4.4772412887692234e-07, - "loss": 0.4775, - "step": 81425 - }, - { - "epoch": 2.09, - "learning_rate": 4.477010612984813e-07, - "loss": 0.3936, - "step": 81426 - }, - { - "epoch": 2.09, - "learning_rate": 4.476779941429096e-07, - "loss": 0.29, - "step": 81427 - }, - { - "epoch": 2.09, - "learning_rate": 4.4765492741022573e-07, - "loss": 0.2347, - "step": 81428 - }, - { - "epoch": 2.09, - "learning_rate": 4.476318611004468e-07, - "loss": 0.501, - "step": 81429 - }, - { - "epoch": 2.09, - "learning_rate": 4.476087952135913e-07, - "loss": 0.4277, - "step": 81430 - }, - { - "epoch": 2.09, - "learning_rate": 4.475857297496759e-07, - "loss": 0.6162, - "step": 81431 - }, - { - "epoch": 2.09, - "learning_rate": 4.475626647087187e-07, - "loss": 0.3004, - "step": 81432 - }, - { - "epoch": 2.09, - "learning_rate": 4.475396000907374e-07, - "loss": 0.5615, - "step": 81433 - }, - { - "epoch": 2.09, - "learning_rate": 4.475165358957501e-07, - "loss": 0.4761, - "step": 81434 - }, - { - "epoch": 2.09, - "learning_rate": 4.4749347212377384e-07, - "loss": 0.322, - "step": 81435 - }, - { - "epoch": 2.09, - "learning_rate": 4.474704087748261e-07, - "loss": 0.3264, - "step": 81436 - }, - { - "epoch": 2.09, - "learning_rate": 4.4744734584892485e-07, - "loss": 0.3396, - "step": 81437 - }, - { - "epoch": 2.09, - "learning_rate": 4.4742428334608786e-07, - "loss": 0.4512, - "step": 81438 - }, - { - "epoch": 2.09, - "learning_rate": 4.4740122126633287e-07, - "loss": 0.4014, - "step": 81439 - }, - { - "epoch": 2.09, - "learning_rate": 4.473781596096771e-07, - "loss": 0.3647, - "step": 81440 - }, - { - "epoch": 2.09, - "learning_rate": 4.473550983761385e-07, - "loss": 0.313, - "step": 81441 - }, - { - "epoch": 2.09, - "learning_rate": 4.473320375657346e-07, - "loss": 0.3831, - "step": 81442 - }, - { - "epoch": 2.09, - "learning_rate": 4.473089771784835e-07, - "loss": 0.4565, - "step": 81443 - }, - { - "epoch": 2.09, - "learning_rate": 4.4728591721440256e-07, - "loss": 0.3329, - "step": 81444 - }, - { - "epoch": 2.09, - "learning_rate": 4.47262857673509e-07, - "loss": 0.3203, - "step": 81445 - }, - { - "epoch": 2.09, - "learning_rate": 4.4723979855582083e-07, - "loss": 0.3018, - "step": 81446 - }, - { - "epoch": 2.09, - "learning_rate": 4.472167398613562e-07, - "loss": 0.3965, - "step": 81447 - }, - { - "epoch": 2.09, - "learning_rate": 4.471936815901318e-07, - "loss": 0.4023, - "step": 81448 - }, - { - "epoch": 2.09, - "learning_rate": 4.4717062374216586e-07, - "loss": 0.3212, - "step": 81449 - }, - { - "epoch": 2.09, - "learning_rate": 4.47147566317476e-07, - "loss": 0.2191, - "step": 81450 - }, - { - "epoch": 2.09, - "learning_rate": 4.4712450931608e-07, - "loss": 0.3862, - "step": 81451 - }, - { - "epoch": 2.09, - "learning_rate": 4.4710145273799514e-07, - "loss": 0.4253, - "step": 81452 - }, - { - "epoch": 2.09, - "learning_rate": 4.470783965832392e-07, - "loss": 0.4429, - "step": 81453 - }, - { - "epoch": 2.09, - "learning_rate": 4.470553408518303e-07, - "loss": 0.2822, - "step": 81454 - }, - { - "epoch": 2.09, - "learning_rate": 4.4703228554378534e-07, - "loss": 0.4717, - "step": 81455 - }, - { - "epoch": 2.09, - "learning_rate": 4.4700923065912275e-07, - "loss": 0.4077, - "step": 81456 - }, - { - "epoch": 2.09, - "learning_rate": 4.469861761978593e-07, - "loss": 0.37, - "step": 81457 - }, - { - "epoch": 2.09, - "learning_rate": 4.469631221600132e-07, - "loss": 0.3718, - "step": 81458 - }, - { - "epoch": 2.09, - "learning_rate": 4.4694006854560197e-07, - "loss": 0.4702, - "step": 81459 - }, - { - "epoch": 2.09, - "learning_rate": 4.4691701535464365e-07, - "loss": 0.4805, - "step": 81460 - }, - { - "epoch": 2.09, - "learning_rate": 4.4689396258715516e-07, - "loss": 0.4351, - "step": 81461 - }, - { - "epoch": 2.09, - "learning_rate": 4.4687091024315446e-07, - "loss": 0.397, - "step": 81462 - }, - { - "epoch": 2.09, - "learning_rate": 4.468478583226598e-07, - "loss": 0.4722, - "step": 81463 - }, - { - "epoch": 2.09, - "learning_rate": 4.4682480682568824e-07, - "loss": 0.5327, - "step": 81464 - }, - { - "epoch": 2.09, - "learning_rate": 4.4680175575225707e-07, - "loss": 0.4136, - "step": 81465 - }, - { - "epoch": 2.09, - "learning_rate": 4.4677870510238447e-07, - "loss": 0.5015, - "step": 81466 - }, - { - "epoch": 2.09, - "learning_rate": 4.467556548760879e-07, - "loss": 0.3149, - "step": 81467 - }, - { - "epoch": 2.09, - "learning_rate": 4.467326050733854e-07, - "loss": 0.3428, - "step": 81468 - }, - { - "epoch": 2.09, - "learning_rate": 4.4670955569429404e-07, - "loss": 0.4639, - "step": 81469 - }, - { - "epoch": 2.09, - "learning_rate": 4.466865067388317e-07, - "loss": 0.4609, - "step": 81470 - }, - { - "epoch": 2.09, - "learning_rate": 4.46663458207016e-07, - "loss": 0.5894, - "step": 81471 - }, - { - "epoch": 2.09, - "learning_rate": 4.466404100988651e-07, - "loss": 0.2927, - "step": 81472 - }, - { - "epoch": 2.09, - "learning_rate": 4.4661736241439575e-07, - "loss": 0.5791, - "step": 81473 - }, - { - "epoch": 2.09, - "learning_rate": 4.4659431515362643e-07, - "loss": 0.2277, - "step": 81474 - }, - { - "epoch": 2.09, - "learning_rate": 4.465712683165741e-07, - "loss": 0.2753, - "step": 81475 - }, - { - "epoch": 2.09, - "learning_rate": 4.465482219032566e-07, - "loss": 0.4761, - "step": 81476 - }, - { - "epoch": 2.09, - "learning_rate": 4.465251759136921e-07, - "loss": 0.5137, - "step": 81477 - }, - { - "epoch": 2.09, - "learning_rate": 4.4650213034789743e-07, - "loss": 0.3904, - "step": 81478 - }, - { - "epoch": 2.09, - "learning_rate": 4.464790852058907e-07, - "loss": 0.4658, - "step": 81479 - }, - { - "epoch": 2.09, - "learning_rate": 4.4645604048768983e-07, - "loss": 0.4531, - "step": 81480 - }, - { - "epoch": 2.09, - "learning_rate": 4.4643299619331163e-07, - "loss": 0.354, - "step": 81481 - }, - { - "epoch": 2.09, - "learning_rate": 4.464099523227743e-07, - "loss": 0.4297, - "step": 81482 - }, - { - "epoch": 2.09, - "learning_rate": 4.463869088760955e-07, - "loss": 0.3225, - "step": 81483 - }, - { - "epoch": 2.09, - "learning_rate": 4.4636386585329313e-07, - "loss": 0.3657, - "step": 81484 - }, - { - "epoch": 2.09, - "learning_rate": 4.4634082325438436e-07, - "loss": 0.1786, - "step": 81485 - }, - { - "epoch": 2.09, - "learning_rate": 4.4631778107938677e-07, - "loss": 0.4231, - "step": 81486 - }, - { - "epoch": 2.09, - "learning_rate": 4.4629473932831806e-07, - "loss": 0.5391, - "step": 81487 - }, - { - "epoch": 2.09, - "learning_rate": 4.46271698001196e-07, - "loss": 0.4819, - "step": 81488 - }, - { - "epoch": 2.09, - "learning_rate": 4.4624865709803873e-07, - "loss": 0.3735, - "step": 81489 - }, - { - "epoch": 2.09, - "learning_rate": 4.4622561661886294e-07, - "loss": 0.334, - "step": 81490 - }, - { - "epoch": 2.09, - "learning_rate": 4.4620257656368675e-07, - "loss": 0.417, - "step": 81491 - }, - { - "epoch": 2.09, - "learning_rate": 4.4617953693252785e-07, - "loss": 0.3252, - "step": 81492 - }, - { - "epoch": 2.09, - "learning_rate": 4.461564977254041e-07, - "loss": 0.3335, - "step": 81493 - }, - { - "epoch": 2.09, - "learning_rate": 4.4613345894233287e-07, - "loss": 0.4224, - "step": 81494 - }, - { - "epoch": 2.09, - "learning_rate": 4.461104205833315e-07, - "loss": 0.4653, - "step": 81495 - }, - { - "epoch": 2.09, - "learning_rate": 4.4608738264841783e-07, - "loss": 0.4941, - "step": 81496 - }, - { - "epoch": 2.09, - "learning_rate": 4.460643451376099e-07, - "loss": 0.467, - "step": 81497 - }, - { - "epoch": 2.09, - "learning_rate": 4.4604130805092475e-07, - "loss": 0.3901, - "step": 81498 - }, - { - "epoch": 2.09, - "learning_rate": 4.460182713883802e-07, - "loss": 0.4175, - "step": 81499 - }, - { - "epoch": 2.09, - "learning_rate": 4.4599523514999415e-07, - "loss": 0.4634, - "step": 81500 - }, - { - "epoch": 2.09, - "learning_rate": 4.4597219933578435e-07, - "loss": 0.4697, - "step": 81501 - }, - { - "epoch": 2.09, - "learning_rate": 4.4594916394576774e-07, - "loss": 0.436, - "step": 81502 - }, - { - "epoch": 2.09, - "learning_rate": 4.459261289799625e-07, - "loss": 0.3926, - "step": 81503 - }, - { - "epoch": 2.09, - "learning_rate": 4.4590309443838634e-07, - "loss": 0.4253, - "step": 81504 - }, - { - "epoch": 2.09, - "learning_rate": 4.4588006032105653e-07, - "loss": 0.427, - "step": 81505 - }, - { - "epoch": 2.09, - "learning_rate": 4.458570266279912e-07, - "loss": 0.2946, - "step": 81506 - }, - { - "epoch": 2.09, - "learning_rate": 4.4583399335920724e-07, - "loss": 0.3418, - "step": 81507 - }, - { - "epoch": 2.09, - "learning_rate": 4.458109605147227e-07, - "loss": 0.318, - "step": 81508 - }, - { - "epoch": 2.09, - "learning_rate": 4.457879280945552e-07, - "loss": 0.4639, - "step": 81509 - }, - { - "epoch": 2.09, - "learning_rate": 4.457648960987228e-07, - "loss": 0.542, - "step": 81510 - }, - { - "epoch": 2.09, - "learning_rate": 4.457418645272424e-07, - "loss": 0.4746, - "step": 81511 - }, - { - "epoch": 2.09, - "learning_rate": 4.457188333801319e-07, - "loss": 0.4434, - "step": 81512 - }, - { - "epoch": 2.09, - "learning_rate": 4.4569580265740916e-07, - "loss": 0.5156, - "step": 81513 - }, - { - "epoch": 2.09, - "learning_rate": 4.456727723590923e-07, - "loss": 0.4971, - "step": 81514 - }, - { - "epoch": 2.09, - "learning_rate": 4.456497424851975e-07, - "loss": 0.4189, - "step": 81515 - }, - { - "epoch": 2.09, - "learning_rate": 4.456267130357433e-07, - "loss": 0.4214, - "step": 81516 - }, - { - "epoch": 2.09, - "learning_rate": 4.456036840107472e-07, - "loss": 0.3335, - "step": 81517 - }, - { - "epoch": 2.09, - "learning_rate": 4.4558065541022726e-07, - "loss": 0.4829, - "step": 81518 - }, - { - "epoch": 2.09, - "learning_rate": 4.455576272342003e-07, - "loss": 0.4165, - "step": 81519 - }, - { - "epoch": 2.09, - "learning_rate": 4.4553459948268437e-07, - "loss": 0.2367, - "step": 81520 - }, - { - "epoch": 2.09, - "learning_rate": 4.455115721556971e-07, - "loss": 0.5952, - "step": 81521 - }, - { - "epoch": 2.09, - "learning_rate": 4.454885452532565e-07, - "loss": 0.4355, - "step": 81522 - }, - { - "epoch": 2.09, - "learning_rate": 4.4546551877537954e-07, - "loss": 0.2894, - "step": 81523 - }, - { - "epoch": 2.09, - "learning_rate": 4.4544249272208445e-07, - "loss": 0.2942, - "step": 81524 - }, - { - "epoch": 2.09, - "learning_rate": 4.454194670933882e-07, - "loss": 0.5488, - "step": 81525 - }, - { - "epoch": 2.09, - "learning_rate": 4.453964418893087e-07, - "loss": 0.5454, - "step": 81526 - }, - { - "epoch": 2.09, - "learning_rate": 4.4537341710986396e-07, - "loss": 0.3343, - "step": 81527 - }, - { - "epoch": 2.09, - "learning_rate": 4.4535039275507105e-07, - "loss": 0.3584, - "step": 81528 - }, - { - "epoch": 2.09, - "learning_rate": 4.453273688249478e-07, - "loss": 0.3901, - "step": 81529 - }, - { - "epoch": 2.09, - "learning_rate": 4.453043453195119e-07, - "loss": 0.4565, - "step": 81530 - }, - { - "epoch": 2.09, - "learning_rate": 4.4528132223878124e-07, - "loss": 0.3994, - "step": 81531 - }, - { - "epoch": 2.09, - "learning_rate": 4.4525829958277283e-07, - "loss": 0.353, - "step": 81532 - }, - { - "epoch": 2.09, - "learning_rate": 4.452352773515047e-07, - "loss": 0.4692, - "step": 81533 - }, - { - "epoch": 2.09, - "learning_rate": 4.4521225554499474e-07, - "loss": 0.4091, - "step": 81534 - }, - { - "epoch": 2.09, - "learning_rate": 4.4518923416326026e-07, - "loss": 0.4106, - "step": 81535 - }, - { - "epoch": 2.09, - "learning_rate": 4.451662132063184e-07, - "loss": 0.4314, - "step": 81536 - }, - { - "epoch": 2.09, - "learning_rate": 4.451431926741874e-07, - "loss": 0.395, - "step": 81537 - }, - { - "epoch": 2.09, - "learning_rate": 4.4512017256688473e-07, - "loss": 0.239, - "step": 81538 - }, - { - "epoch": 2.09, - "learning_rate": 4.4509715288442826e-07, - "loss": 0.5, - "step": 81539 - }, - { - "epoch": 2.09, - "learning_rate": 4.450741336268352e-07, - "loss": 0.4678, - "step": 81540 - }, - { - "epoch": 2.09, - "learning_rate": 4.450511147941233e-07, - "loss": 0.417, - "step": 81541 - }, - { - "epoch": 2.09, - "learning_rate": 4.450280963863102e-07, - "loss": 0.3613, - "step": 81542 - }, - { - "epoch": 2.09, - "learning_rate": 4.4500507840341397e-07, - "loss": 0.4517, - "step": 81543 - }, - { - "epoch": 2.09, - "learning_rate": 4.4498206084545176e-07, - "loss": 0.5303, - "step": 81544 - }, - { - "epoch": 2.09, - "learning_rate": 4.4495904371244095e-07, - "loss": 0.3457, - "step": 81545 - }, - { - "epoch": 2.09, - "learning_rate": 4.449360270043995e-07, - "loss": 0.3483, - "step": 81546 - }, - { - "epoch": 2.09, - "learning_rate": 4.44913010721345e-07, - "loss": 0.5684, - "step": 81547 - }, - { - "epoch": 2.09, - "learning_rate": 4.448899948632955e-07, - "loss": 0.249, - "step": 81548 - }, - { - "epoch": 2.09, - "learning_rate": 4.4486697943026774e-07, - "loss": 0.321, - "step": 81549 - }, - { - "epoch": 2.09, - "learning_rate": 4.448439644222798e-07, - "loss": 0.3435, - "step": 81550 - }, - { - "epoch": 2.09, - "learning_rate": 4.448209498393498e-07, - "loss": 0.5645, - "step": 81551 - }, - { - "epoch": 2.09, - "learning_rate": 4.4479793568149437e-07, - "loss": 0.5029, - "step": 81552 - }, - { - "epoch": 2.09, - "learning_rate": 4.447749219487317e-07, - "loss": 0.4595, - "step": 81553 - }, - { - "epoch": 2.09, - "learning_rate": 4.447519086410797e-07, - "loss": 0.3794, - "step": 81554 - }, - { - "epoch": 2.09, - "learning_rate": 4.4472889575855533e-07, - "loss": 0.5117, - "step": 81555 - }, - { - "epoch": 2.09, - "learning_rate": 4.4470588330117676e-07, - "loss": 0.3228, - "step": 81556 - }, - { - "epoch": 2.09, - "learning_rate": 4.446828712689611e-07, - "loss": 0.4609, - "step": 81557 - }, - { - "epoch": 2.09, - "learning_rate": 4.446598596619262e-07, - "loss": 0.3779, - "step": 81558 - }, - { - "epoch": 2.09, - "learning_rate": 4.4463684848008964e-07, - "loss": 0.4263, - "step": 81559 - }, - { - "epoch": 2.09, - "learning_rate": 4.446138377234695e-07, - "loss": 0.3505, - "step": 81560 - }, - { - "epoch": 2.09, - "learning_rate": 4.4459082739208273e-07, - "loss": 0.4189, - "step": 81561 - }, - { - "epoch": 2.09, - "learning_rate": 4.445678174859472e-07, - "loss": 0.4399, - "step": 81562 - }, - { - "epoch": 2.09, - "learning_rate": 4.445448080050804e-07, - "loss": 0.4153, - "step": 81563 - }, - { - "epoch": 2.09, - "learning_rate": 4.445217989495007e-07, - "loss": 0.3848, - "step": 81564 - }, - { - "epoch": 2.09, - "learning_rate": 4.44498790319225e-07, - "loss": 0.3505, - "step": 81565 - }, - { - "epoch": 2.09, - "learning_rate": 4.4447578211427064e-07, - "loss": 0.3994, - "step": 81566 - }, - { - "epoch": 2.09, - "learning_rate": 4.4445277433465567e-07, - "loss": 0.4536, - "step": 81567 - }, - { - "epoch": 2.09, - "learning_rate": 4.4442976698039803e-07, - "loss": 0.3831, - "step": 81568 - }, - { - "epoch": 2.09, - "learning_rate": 4.444067600515146e-07, - "loss": 0.4277, - "step": 81569 - }, - { - "epoch": 2.09, - "learning_rate": 4.443837535480234e-07, - "loss": 0.4678, - "step": 81570 - }, - { - "epoch": 2.09, - "learning_rate": 4.4436074746994187e-07, - "loss": 0.3367, - "step": 81571 - }, - { - "epoch": 2.09, - "learning_rate": 4.4433774181728836e-07, - "loss": 0.3691, - "step": 81572 - }, - { - "epoch": 2.09, - "learning_rate": 4.443147365900797e-07, - "loss": 0.4204, - "step": 81573 - }, - { - "epoch": 2.09, - "learning_rate": 4.4429173178833335e-07, - "loss": 0.4312, - "step": 81574 - }, - { - "epoch": 2.09, - "learning_rate": 4.442687274120673e-07, - "loss": 0.3481, - "step": 81575 - }, - { - "epoch": 2.09, - "learning_rate": 4.442457234612992e-07, - "loss": 0.3989, - "step": 81576 - }, - { - "epoch": 2.09, - "learning_rate": 4.44222719936047e-07, - "loss": 0.4482, - "step": 81577 - }, - { - "epoch": 2.09, - "learning_rate": 4.441997168363274e-07, - "loss": 0.543, - "step": 81578 - }, - { - "epoch": 2.09, - "learning_rate": 4.441767141621585e-07, - "loss": 0.4438, - "step": 81579 - }, - { - "epoch": 2.09, - "learning_rate": 4.441537119135581e-07, - "loss": 0.3489, - "step": 81580 - }, - { - "epoch": 2.09, - "learning_rate": 4.4413071009054393e-07, - "loss": 0.479, - "step": 81581 - }, - { - "epoch": 2.09, - "learning_rate": 4.4410770869313285e-07, - "loss": 0.3533, - "step": 81582 - }, - { - "epoch": 2.09, - "learning_rate": 4.4408470772134344e-07, - "loss": 0.4419, - "step": 81583 - }, - { - "epoch": 2.09, - "learning_rate": 4.440617071751924e-07, - "loss": 0.3149, - "step": 81584 - }, - { - "epoch": 2.09, - "learning_rate": 4.440387070546977e-07, - "loss": 0.4023, - "step": 81585 - }, - { - "epoch": 2.09, - "learning_rate": 4.440157073598775e-07, - "loss": 0.415, - "step": 81586 - }, - { - "epoch": 2.09, - "learning_rate": 4.439927080907484e-07, - "loss": 0.459, - "step": 81587 - }, - { - "epoch": 2.09, - "learning_rate": 4.4396970924732857e-07, - "loss": 0.3149, - "step": 81588 - }, - { - "epoch": 2.09, - "learning_rate": 4.439467108296359e-07, - "loss": 0.478, - "step": 81589 - }, - { - "epoch": 2.09, - "learning_rate": 4.4392371283768735e-07, - "loss": 0.3521, - "step": 81590 - }, - { - "epoch": 2.09, - "learning_rate": 4.4390071527150074e-07, - "loss": 0.2952, - "step": 81591 - }, - { - "epoch": 2.09, - "learning_rate": 4.4387771813109387e-07, - "loss": 0.4702, - "step": 81592 - }, - { - "epoch": 2.09, - "learning_rate": 4.4385472141648464e-07, - "loss": 0.3232, - "step": 81593 - }, - { - "epoch": 2.09, - "learning_rate": 4.438317251276903e-07, - "loss": 0.3862, - "step": 81594 - }, - { - "epoch": 2.09, - "learning_rate": 4.43808729264728e-07, - "loss": 0.4575, - "step": 81595 - }, - { - "epoch": 2.09, - "learning_rate": 4.4378573382761573e-07, - "loss": 0.5381, - "step": 81596 - }, - { - "epoch": 2.09, - "learning_rate": 4.437627388163713e-07, - "loss": 0.4204, - "step": 81597 - }, - { - "epoch": 2.09, - "learning_rate": 4.4373974423101246e-07, - "loss": 0.3433, - "step": 81598 - }, - { - "epoch": 2.09, - "learning_rate": 4.437167500715562e-07, - "loss": 0.4316, - "step": 81599 - }, - { - "epoch": 2.09, - "learning_rate": 4.436937563380203e-07, - "loss": 0.3466, - "step": 81600 - }, - { - "epoch": 2.09, - "learning_rate": 4.4367076303042263e-07, - "loss": 0.3502, - "step": 81601 - }, - { - "epoch": 2.09, - "learning_rate": 4.4364777014878106e-07, - "loss": 0.4746, - "step": 81602 - }, - { - "epoch": 2.09, - "learning_rate": 4.436247776931128e-07, - "loss": 0.3845, - "step": 81603 - }, - { - "epoch": 2.09, - "learning_rate": 4.43601785663435e-07, - "loss": 0.4873, - "step": 81604 - }, - { - "epoch": 2.09, - "learning_rate": 4.435787940597658e-07, - "loss": 0.4648, - "step": 81605 - }, - { - "epoch": 2.09, - "learning_rate": 4.4355580288212314e-07, - "loss": 0.374, - "step": 81606 - }, - { - "epoch": 2.09, - "learning_rate": 4.4353281213052374e-07, - "loss": 0.3009, - "step": 81607 - }, - { - "epoch": 2.09, - "learning_rate": 4.4350982180498577e-07, - "loss": 0.4767, - "step": 81608 - }, - { - "epoch": 2.09, - "learning_rate": 4.434868319055267e-07, - "loss": 0.5103, - "step": 81609 - }, - { - "epoch": 2.09, - "learning_rate": 4.434638424321646e-07, - "loss": 0.4067, - "step": 81610 - }, - { - "epoch": 2.09, - "learning_rate": 4.434408533849162e-07, - "loss": 0.4355, - "step": 81611 - }, - { - "epoch": 2.09, - "learning_rate": 4.434178647637996e-07, - "loss": 0.5449, - "step": 81612 - }, - { - "epoch": 2.09, - "learning_rate": 4.4339487656883266e-07, - "loss": 0.2874, - "step": 81613 - }, - { - "epoch": 2.09, - "learning_rate": 4.433718888000324e-07, - "loss": 0.4131, - "step": 81614 - }, - { - "epoch": 2.09, - "learning_rate": 4.43348901457417e-07, - "loss": 0.4009, - "step": 81615 - }, - { - "epoch": 2.09, - "learning_rate": 4.433259145410033e-07, - "loss": 0.5405, - "step": 81616 - }, - { - "epoch": 2.09, - "learning_rate": 4.4330292805080947e-07, - "loss": 0.4316, - "step": 81617 - }, - { - "epoch": 2.09, - "learning_rate": 4.432799419868529e-07, - "loss": 0.4355, - "step": 81618 - }, - { - "epoch": 2.09, - "learning_rate": 4.4325695634915173e-07, - "loss": 0.4648, - "step": 81619 - }, - { - "epoch": 2.09, - "learning_rate": 4.432339711377228e-07, - "loss": 0.5752, - "step": 81620 - }, - { - "epoch": 2.09, - "learning_rate": 4.432109863525838e-07, - "loss": 0.3794, - "step": 81621 - }, - { - "epoch": 2.09, - "learning_rate": 4.431880019937527e-07, - "loss": 0.4346, - "step": 81622 - }, - { - "epoch": 2.09, - "learning_rate": 4.4316501806124773e-07, - "loss": 0.4907, - "step": 81623 - }, - { - "epoch": 2.09, - "learning_rate": 4.4314203455508483e-07, - "loss": 0.3351, - "step": 81624 - }, - { - "epoch": 2.09, - "learning_rate": 4.431190514752825e-07, - "loss": 0.4814, - "step": 81625 - }, - { - "epoch": 2.09, - "learning_rate": 4.4309606882185835e-07, - "loss": 0.356, - "step": 81626 - }, - { - "epoch": 2.09, - "learning_rate": 4.4307308659483035e-07, - "loss": 0.3756, - "step": 81627 - }, - { - "epoch": 2.09, - "learning_rate": 4.4305010479421525e-07, - "loss": 0.5332, - "step": 81628 - }, - { - "epoch": 2.09, - "learning_rate": 4.43027123420031e-07, - "loss": 0.4424, - "step": 81629 - }, - { - "epoch": 2.09, - "learning_rate": 4.4300414247229533e-07, - "loss": 0.3865, - "step": 81630 - }, - { - "epoch": 2.09, - "learning_rate": 4.429811619510262e-07, - "loss": 0.4453, - "step": 81631 - }, - { - "epoch": 2.09, - "learning_rate": 4.4295818185624036e-07, - "loss": 0.376, - "step": 81632 - }, - { - "epoch": 2.09, - "learning_rate": 4.429352021879562e-07, - "loss": 0.4546, - "step": 81633 - }, - { - "epoch": 2.09, - "learning_rate": 4.429122229461906e-07, - "loss": 0.4512, - "step": 81634 - }, - { - "epoch": 2.09, - "learning_rate": 4.4288924413096154e-07, - "loss": 0.4211, - "step": 81635 - }, - { - "epoch": 2.09, - "learning_rate": 4.428662657422868e-07, - "loss": 0.3411, - "step": 81636 - }, - { - "epoch": 2.09, - "learning_rate": 4.4284328778018344e-07, - "loss": 0.4146, - "step": 81637 - }, - { - "epoch": 2.09, - "learning_rate": 4.428203102446694e-07, - "loss": 0.4001, - "step": 81638 - }, - { - "epoch": 2.09, - "learning_rate": 4.4279733313576216e-07, - "loss": 0.4154, - "step": 81639 - }, - { - "epoch": 2.09, - "learning_rate": 4.427743564534798e-07, - "loss": 0.4141, - "step": 81640 - }, - { - "epoch": 2.09, - "learning_rate": 4.427513801978391e-07, - "loss": 0.4888, - "step": 81641 - }, - { - "epoch": 2.09, - "learning_rate": 4.4272840436885805e-07, - "loss": 0.4033, - "step": 81642 - }, - { - "epoch": 2.09, - "learning_rate": 4.427054289665546e-07, - "loss": 0.4424, - "step": 81643 - }, - { - "epoch": 2.09, - "learning_rate": 4.4268245399094596e-07, - "loss": 0.438, - "step": 81644 - }, - { - "epoch": 2.09, - "learning_rate": 4.426594794420494e-07, - "loss": 0.4009, - "step": 81645 - }, - { - "epoch": 2.09, - "learning_rate": 4.426365053198828e-07, - "loss": 0.4019, - "step": 81646 - }, - { - "epoch": 2.09, - "learning_rate": 4.426135316244639e-07, - "loss": 0.3704, - "step": 81647 - }, - { - "epoch": 2.09, - "learning_rate": 4.425905583558105e-07, - "loss": 0.4829, - "step": 81648 - }, - { - "epoch": 2.09, - "learning_rate": 4.4256758551393946e-07, - "loss": 0.3979, - "step": 81649 - }, - { - "epoch": 2.09, - "learning_rate": 4.425446130988689e-07, - "loss": 0.4585, - "step": 81650 - }, - { - "epoch": 2.09, - "learning_rate": 4.425216411106162e-07, - "loss": 0.5098, - "step": 81651 - }, - { - "epoch": 2.09, - "learning_rate": 4.424986695491995e-07, - "loss": 0.2915, - "step": 81652 - }, - { - "epoch": 2.09, - "learning_rate": 4.4247569841463585e-07, - "loss": 0.5264, - "step": 81653 - }, - { - "epoch": 2.09, - "learning_rate": 4.4245272770694263e-07, - "loss": 0.4023, - "step": 81654 - }, - { - "epoch": 2.09, - "learning_rate": 4.4242975742613766e-07, - "loss": 0.4292, - "step": 81655 - }, - { - "epoch": 2.09, - "learning_rate": 4.424067875722386e-07, - "loss": 0.3555, - "step": 81656 - }, - { - "epoch": 2.09, - "learning_rate": 4.423838181452634e-07, - "loss": 0.3916, - "step": 81657 - }, - { - "epoch": 2.09, - "learning_rate": 4.423608491452289e-07, - "loss": 0.3564, - "step": 81658 - }, - { - "epoch": 2.09, - "learning_rate": 4.4233788057215304e-07, - "loss": 0.2751, - "step": 81659 - }, - { - "epoch": 2.09, - "learning_rate": 4.423149124260538e-07, - "loss": 0.3892, - "step": 81660 - }, - { - "epoch": 2.09, - "learning_rate": 4.422919447069481e-07, - "loss": 0.4268, - "step": 81661 - }, - { - "epoch": 2.09, - "learning_rate": 4.422689774148537e-07, - "loss": 0.3158, - "step": 81662 - }, - { - "epoch": 2.09, - "learning_rate": 4.422460105497887e-07, - "loss": 0.5557, - "step": 81663 - }, - { - "epoch": 2.09, - "learning_rate": 4.422230441117699e-07, - "loss": 0.4746, - "step": 81664 - }, - { - "epoch": 2.09, - "learning_rate": 4.422000781008157e-07, - "loss": 0.3403, - "step": 81665 - }, - { - "epoch": 2.09, - "learning_rate": 4.421771125169429e-07, - "loss": 0.458, - "step": 81666 - }, - { - "epoch": 2.09, - "learning_rate": 4.421541473601693e-07, - "loss": 0.5435, - "step": 81667 - }, - { - "epoch": 2.09, - "learning_rate": 4.4213118263051275e-07, - "loss": 0.4092, - "step": 81668 - }, - { - "epoch": 2.09, - "learning_rate": 4.4210821832799104e-07, - "loss": 0.4556, - "step": 81669 - }, - { - "epoch": 2.09, - "learning_rate": 4.42085254452621e-07, - "loss": 0.4946, - "step": 81670 - }, - { - "epoch": 2.09, - "learning_rate": 4.420622910044206e-07, - "loss": 0.3322, - "step": 81671 - }, - { - "epoch": 2.09, - "learning_rate": 4.420393279834076e-07, - "loss": 0.3955, - "step": 81672 - }, - { - "epoch": 2.09, - "learning_rate": 4.420163653895996e-07, - "loss": 0.4241, - "step": 81673 - }, - { - "epoch": 2.09, - "learning_rate": 4.4199340322301415e-07, - "loss": 0.4453, - "step": 81674 - }, - { - "epoch": 2.09, - "learning_rate": 4.4197044148366835e-07, - "loss": 0.3589, - "step": 81675 - }, - { - "epoch": 2.09, - "learning_rate": 4.4194748017158e-07, - "loss": 0.2864, - "step": 81676 - }, - { - "epoch": 2.09, - "learning_rate": 4.419245192867672e-07, - "loss": 0.3843, - "step": 81677 - }, - { - "epoch": 2.09, - "learning_rate": 4.4190155882924684e-07, - "loss": 0.3652, - "step": 81678 - }, - { - "epoch": 2.09, - "learning_rate": 4.4187859879903676e-07, - "loss": 0.4438, - "step": 81679 - }, - { - "epoch": 2.09, - "learning_rate": 4.4185563919615454e-07, - "loss": 0.4458, - "step": 81680 - }, - { - "epoch": 2.09, - "learning_rate": 4.418326800206182e-07, - "loss": 0.2975, - "step": 81681 - }, - { - "epoch": 2.09, - "learning_rate": 4.4180972127244455e-07, - "loss": 0.3638, - "step": 81682 - }, - { - "epoch": 2.09, - "learning_rate": 4.4178676295165183e-07, - "loss": 0.4922, - "step": 81683 - }, - { - "epoch": 2.09, - "learning_rate": 4.4176380505825707e-07, - "loss": 0.4072, - "step": 81684 - }, - { - "epoch": 2.09, - "learning_rate": 4.4174084759227803e-07, - "loss": 0.3613, - "step": 81685 - }, - { - "epoch": 2.09, - "learning_rate": 4.4171789055373274e-07, - "loss": 0.5557, - "step": 81686 - }, - { - "epoch": 2.09, - "learning_rate": 4.41694933942638e-07, - "loss": 0.3262, - "step": 81687 - }, - { - "epoch": 2.09, - "learning_rate": 4.4167197775901175e-07, - "loss": 0.5879, - "step": 81688 - }, - { - "epoch": 2.09, - "learning_rate": 4.416490220028717e-07, - "loss": 0.3721, - "step": 81689 - }, - { - "epoch": 2.09, - "learning_rate": 4.416260666742355e-07, - "loss": 0.2849, - "step": 81690 - }, - { - "epoch": 2.09, - "learning_rate": 4.4160311177312037e-07, - "loss": 0.3721, - "step": 81691 - }, - { - "epoch": 2.09, - "learning_rate": 4.41580157299544e-07, - "loss": 0.3833, - "step": 81692 - }, - { - "epoch": 2.09, - "learning_rate": 4.415572032535243e-07, - "loss": 0.5684, - "step": 81693 - }, - { - "epoch": 2.09, - "learning_rate": 4.415342496350787e-07, - "loss": 0.4937, - "step": 81694 - }, - { - "epoch": 2.09, - "learning_rate": 4.4151129644422424e-07, - "loss": 0.3428, - "step": 81695 - }, - { - "epoch": 2.09, - "learning_rate": 4.4148834368097885e-07, - "loss": 0.3657, - "step": 81696 - }, - { - "epoch": 2.09, - "learning_rate": 4.414653913453602e-07, - "loss": 0.3301, - "step": 81697 - }, - { - "epoch": 2.09, - "learning_rate": 4.4144243943738624e-07, - "loss": 0.4194, - "step": 81698 - }, - { - "epoch": 2.09, - "learning_rate": 4.4141948795707363e-07, - "loss": 0.4756, - "step": 81699 - }, - { - "epoch": 2.09, - "learning_rate": 4.4139653690444045e-07, - "loss": 0.3967, - "step": 81700 - }, - { - "epoch": 2.09, - "learning_rate": 4.413735862795044e-07, - "loss": 0.5781, - "step": 81701 - }, - { - "epoch": 2.09, - "learning_rate": 4.4135063608228316e-07, - "loss": 0.3428, - "step": 81702 - }, - { - "epoch": 2.09, - "learning_rate": 4.4132768631279404e-07, - "loss": 0.4146, - "step": 81703 - }, - { - "epoch": 2.09, - "learning_rate": 4.413047369710543e-07, - "loss": 0.4316, - "step": 81704 - }, - { - "epoch": 2.09, - "learning_rate": 4.4128178805708183e-07, - "loss": 0.324, - "step": 81705 - }, - { - "epoch": 2.09, - "learning_rate": 4.4125883957089416e-07, - "loss": 0.4241, - "step": 81706 - }, - { - "epoch": 2.09, - "learning_rate": 4.4123589151250927e-07, - "loss": 0.3916, - "step": 81707 - }, - { - "epoch": 2.09, - "learning_rate": 4.412129438819441e-07, - "loss": 0.4277, - "step": 81708 - }, - { - "epoch": 2.09, - "learning_rate": 4.4118999667921643e-07, - "loss": 0.3252, - "step": 81709 - }, - { - "epoch": 2.09, - "learning_rate": 4.4116704990434385e-07, - "loss": 0.3779, - "step": 81710 - }, - { - "epoch": 2.09, - "learning_rate": 4.4114410355734434e-07, - "loss": 0.416, - "step": 81711 - }, - { - "epoch": 2.09, - "learning_rate": 4.4112115763823476e-07, - "loss": 0.4795, - "step": 81712 - }, - { - "epoch": 2.09, - "learning_rate": 4.4109821214703335e-07, - "loss": 0.4048, - "step": 81713 - }, - { - "epoch": 2.09, - "learning_rate": 4.4107526708375696e-07, - "loss": 0.4399, - "step": 81714 - }, - { - "epoch": 2.09, - "learning_rate": 4.4105232244842395e-07, - "loss": 0.2355, - "step": 81715 - }, - { - "epoch": 2.09, - "learning_rate": 4.41029378241051e-07, - "loss": 0.4399, - "step": 81716 - }, - { - "epoch": 2.09, - "learning_rate": 4.410064344616563e-07, - "loss": 0.4431, - "step": 81717 - }, - { - "epoch": 2.09, - "learning_rate": 4.4098349111025725e-07, - "loss": 0.4639, - "step": 81718 - }, - { - "epoch": 2.09, - "learning_rate": 4.409605481868717e-07, - "loss": 0.3293, - "step": 81719 - }, - { - "epoch": 2.09, - "learning_rate": 4.409376056915166e-07, - "loss": 0.4248, - "step": 81720 - }, - { - "epoch": 2.09, - "learning_rate": 4.4091466362420994e-07, - "loss": 0.5913, - "step": 81721 - }, - { - "epoch": 2.09, - "learning_rate": 4.4089172198496927e-07, - "loss": 0.3354, - "step": 81722 - }, - { - "epoch": 2.09, - "learning_rate": 4.4086878077381227e-07, - "loss": 0.4087, - "step": 81723 - }, - { - "epoch": 2.09, - "learning_rate": 4.408458399907565e-07, - "loss": 0.4395, - "step": 81724 - }, - { - "epoch": 2.09, - "learning_rate": 4.4082289963581896e-07, - "loss": 0.3555, - "step": 81725 - }, - { - "epoch": 2.09, - "learning_rate": 4.407999597090176e-07, - "loss": 0.3298, - "step": 81726 - }, - { - "epoch": 2.09, - "learning_rate": 4.4077702021037e-07, - "loss": 0.3828, - "step": 81727 - }, - { - "epoch": 2.09, - "learning_rate": 4.407540811398941e-07, - "loss": 0.4185, - "step": 81728 - }, - { - "epoch": 2.09, - "learning_rate": 4.407311424976067e-07, - "loss": 0.4434, - "step": 81729 - }, - { - "epoch": 2.09, - "learning_rate": 4.4070820428352573e-07, - "loss": 0.2829, - "step": 81730 - }, - { - "epoch": 2.09, - "learning_rate": 4.406852664976691e-07, - "loss": 0.5283, - "step": 81731 - }, - { - "epoch": 2.09, - "learning_rate": 4.4066232914005373e-07, - "loss": 0.4268, - "step": 81732 - }, - { - "epoch": 2.09, - "learning_rate": 4.406393922106979e-07, - "loss": 0.5244, - "step": 81733 - }, - { - "epoch": 2.09, - "learning_rate": 4.4061645570961836e-07, - "loss": 0.4128, - "step": 81734 - }, - { - "epoch": 2.09, - "learning_rate": 4.405935196368331e-07, - "loss": 0.2625, - "step": 81735 - }, - { - "epoch": 2.09, - "learning_rate": 4.4057058399236e-07, - "loss": 0.3403, - "step": 81736 - }, - { - "epoch": 2.09, - "learning_rate": 4.4054764877621597e-07, - "loss": 0.418, - "step": 81737 - }, - { - "epoch": 2.09, - "learning_rate": 4.405247139884188e-07, - "loss": 0.479, - "step": 81738 - }, - { - "epoch": 2.1, - "learning_rate": 4.405017796289863e-07, - "loss": 0.3071, - "step": 81739 - }, - { - "epoch": 2.1, - "learning_rate": 4.40478845697936e-07, - "loss": 0.3611, - "step": 81740 - }, - { - "epoch": 2.1, - "learning_rate": 4.404559121952851e-07, - "loss": 0.4204, - "step": 81741 - }, - { - "epoch": 2.1, - "learning_rate": 4.4043297912105127e-07, - "loss": 0.3423, - "step": 81742 - }, - { - "epoch": 2.1, - "learning_rate": 4.404100464752526e-07, - "loss": 0.5151, - "step": 81743 - }, - { - "epoch": 2.1, - "learning_rate": 4.4038711425790586e-07, - "loss": 0.4282, - "step": 81744 - }, - { - "epoch": 2.1, - "learning_rate": 4.403641824690294e-07, - "loss": 0.335, - "step": 81745 - }, - { - "epoch": 2.1, - "learning_rate": 4.4034125110863994e-07, - "loss": 0.4819, - "step": 81746 - }, - { - "epoch": 2.1, - "learning_rate": 4.403183201767554e-07, - "loss": 0.5112, - "step": 81747 - }, - { - "epoch": 2.1, - "learning_rate": 4.402953896733934e-07, - "loss": 0.4087, - "step": 81748 - }, - { - "epoch": 2.1, - "learning_rate": 4.4027245959857196e-07, - "loss": 0.3411, - "step": 81749 - }, - { - "epoch": 2.1, - "learning_rate": 4.402495299523077e-07, - "loss": 0.4346, - "step": 81750 - }, - { - "epoch": 2.1, - "learning_rate": 4.402266007346187e-07, - "loss": 0.2797, - "step": 81751 - }, - { - "epoch": 2.1, - "learning_rate": 4.402036719455228e-07, - "loss": 0.5371, - "step": 81752 - }, - { - "epoch": 2.1, - "learning_rate": 4.401807435850371e-07, - "loss": 0.4214, - "step": 81753 - }, - { - "epoch": 2.1, - "learning_rate": 4.40157815653179e-07, - "loss": 0.4014, - "step": 81754 - }, - { - "epoch": 2.1, - "learning_rate": 4.4013488814996624e-07, - "loss": 0.3663, - "step": 81755 - }, - { - "epoch": 2.1, - "learning_rate": 4.401119610754166e-07, - "loss": 0.3352, - "step": 81756 - }, - { - "epoch": 2.1, - "learning_rate": 4.4008903442954773e-07, - "loss": 0.5444, - "step": 81757 - }, - { - "epoch": 2.1, - "learning_rate": 4.4006610821237653e-07, - "loss": 0.4097, - "step": 81758 - }, - { - "epoch": 2.1, - "learning_rate": 4.400431824239211e-07, - "loss": 0.314, - "step": 81759 - }, - { - "epoch": 2.1, - "learning_rate": 4.4002025706419877e-07, - "loss": 0.5669, - "step": 81760 - }, - { - "epoch": 2.1, - "learning_rate": 4.399973321332277e-07, - "loss": 0.3416, - "step": 81761 - }, - { - "epoch": 2.1, - "learning_rate": 4.3997440763102434e-07, - "loss": 0.4072, - "step": 81762 - }, - { - "epoch": 2.1, - "learning_rate": 4.3995148355760724e-07, - "loss": 0.4263, - "step": 81763 - }, - { - "epoch": 2.1, - "learning_rate": 4.3992855991299327e-07, - "loss": 0.3624, - "step": 81764 - }, - { - "epoch": 2.1, - "learning_rate": 4.3990563669720015e-07, - "loss": 0.4175, - "step": 81765 - }, - { - "epoch": 2.1, - "learning_rate": 4.39882713910246e-07, - "loss": 0.5234, - "step": 81766 - }, - { - "epoch": 2.1, - "learning_rate": 4.398597915521475e-07, - "loss": 0.3218, - "step": 81767 - }, - { - "epoch": 2.1, - "learning_rate": 4.3983686962292256e-07, - "loss": 0.4551, - "step": 81768 - }, - { - "epoch": 2.1, - "learning_rate": 4.398139481225891e-07, - "loss": 0.3994, - "step": 81769 - }, - { - "epoch": 2.1, - "learning_rate": 4.397910270511641e-07, - "loss": 0.3501, - "step": 81770 - }, - { - "epoch": 2.1, - "learning_rate": 4.397681064086652e-07, - "loss": 0.3203, - "step": 81771 - }, - { - "epoch": 2.1, - "learning_rate": 4.3974518619511024e-07, - "loss": 0.4502, - "step": 81772 - }, - { - "epoch": 2.1, - "learning_rate": 4.397222664105169e-07, - "loss": 0.5146, - "step": 81773 - }, - { - "epoch": 2.1, - "learning_rate": 4.396993470549025e-07, - "loss": 0.3071, - "step": 81774 - }, - { - "epoch": 2.1, - "learning_rate": 4.396764281282842e-07, - "loss": 0.2755, - "step": 81775 - }, - { - "epoch": 2.1, - "learning_rate": 4.3965350963067995e-07, - "loss": 0.5283, - "step": 81776 - }, - { - "epoch": 2.1, - "learning_rate": 4.3963059156210716e-07, - "loss": 0.4873, - "step": 81777 - }, - { - "epoch": 2.1, - "learning_rate": 4.396076739225838e-07, - "loss": 0.395, - "step": 81778 - }, - { - "epoch": 2.1, - "learning_rate": 4.395847567121267e-07, - "loss": 0.4233, - "step": 81779 - }, - { - "epoch": 2.1, - "learning_rate": 4.395618399307538e-07, - "loss": 0.3511, - "step": 81780 - }, - { - "epoch": 2.1, - "learning_rate": 4.395389235784827e-07, - "loss": 0.4697, - "step": 81781 - }, - { - "epoch": 2.1, - "learning_rate": 4.3951600765533116e-07, - "loss": 0.2593, - "step": 81782 - }, - { - "epoch": 2.1, - "learning_rate": 4.394930921613165e-07, - "loss": 0.4414, - "step": 81783 - }, - { - "epoch": 2.1, - "learning_rate": 4.3947017709645583e-07, - "loss": 0.394, - "step": 81784 - }, - { - "epoch": 2.1, - "learning_rate": 4.39447262460767e-07, - "loss": 0.4316, - "step": 81785 - }, - { - "epoch": 2.1, - "learning_rate": 4.394243482542681e-07, - "loss": 0.3706, - "step": 81786 - }, - { - "epoch": 2.1, - "learning_rate": 4.3940143447697573e-07, - "loss": 0.457, - "step": 81787 - }, - { - "epoch": 2.1, - "learning_rate": 4.3937852112890803e-07, - "loss": 0.2739, - "step": 81788 - }, - { - "epoch": 2.1, - "learning_rate": 4.393556082100823e-07, - "loss": 0.4214, - "step": 81789 - }, - { - "epoch": 2.1, - "learning_rate": 4.3933269572051665e-07, - "loss": 0.436, - "step": 81790 - }, - { - "epoch": 2.1, - "learning_rate": 4.3930978366022776e-07, - "loss": 0.4688, - "step": 81791 - }, - { - "epoch": 2.1, - "learning_rate": 4.3928687202923364e-07, - "loss": 0.2868, - "step": 81792 - }, - { - "epoch": 2.1, - "learning_rate": 4.3926396082755214e-07, - "loss": 0.2986, - "step": 81793 - }, - { - "epoch": 2.1, - "learning_rate": 4.392410500552001e-07, - "loss": 0.2681, - "step": 81794 - }, - { - "epoch": 2.1, - "learning_rate": 4.392181397121957e-07, - "loss": 0.364, - "step": 81795 - }, - { - "epoch": 2.1, - "learning_rate": 4.3919522979855574e-07, - "loss": 0.4316, - "step": 81796 - }, - { - "epoch": 2.1, - "learning_rate": 4.391723203142983e-07, - "loss": 0.4907, - "step": 81797 - }, - { - "epoch": 2.1, - "learning_rate": 4.3914941125944084e-07, - "loss": 0.3945, - "step": 81798 - }, - { - "epoch": 2.1, - "learning_rate": 4.391265026340013e-07, - "loss": 0.4065, - "step": 81799 - }, - { - "epoch": 2.1, - "learning_rate": 4.3910359443799636e-07, - "loss": 0.4697, - "step": 81800 - }, - { - "epoch": 2.1, - "learning_rate": 4.3908068667144406e-07, - "loss": 0.373, - "step": 81801 - }, - { - "epoch": 2.1, - "learning_rate": 4.390577793343618e-07, - "loss": 0.3755, - "step": 81802 - }, - { - "epoch": 2.1, - "learning_rate": 4.3903487242676794e-07, - "loss": 0.4321, - "step": 81803 - }, - { - "epoch": 2.1, - "learning_rate": 4.3901196594867864e-07, - "loss": 0.3989, - "step": 81804 - }, - { - "epoch": 2.1, - "learning_rate": 4.38989059900112e-07, - "loss": 0.3833, - "step": 81805 - }, - { - "epoch": 2.1, - "learning_rate": 4.3896615428108576e-07, - "loss": 0.4746, - "step": 81806 - }, - { - "epoch": 2.1, - "learning_rate": 4.3894324909161764e-07, - "loss": 0.4395, - "step": 81807 - }, - { - "epoch": 2.1, - "learning_rate": 4.389203443317245e-07, - "loss": 0.4263, - "step": 81808 - }, - { - "epoch": 2.1, - "learning_rate": 4.3889744000142426e-07, - "loss": 0.498, - "step": 81809 - }, - { - "epoch": 2.1, - "learning_rate": 4.3887453610073445e-07, - "loss": 0.5801, - "step": 81810 - }, - { - "epoch": 2.1, - "learning_rate": 4.3885163262967294e-07, - "loss": 0.3821, - "step": 81811 - }, - { - "epoch": 2.1, - "learning_rate": 4.3882872958825656e-07, - "loss": 0.4419, - "step": 81812 - }, - { - "epoch": 2.1, - "learning_rate": 4.388058269765037e-07, - "loss": 0.3159, - "step": 81813 - }, - { - "epoch": 2.1, - "learning_rate": 4.387829247944309e-07, - "loss": 0.4678, - "step": 81814 - }, - { - "epoch": 2.1, - "learning_rate": 4.3876002304205627e-07, - "loss": 0.4192, - "step": 81815 - }, - { - "epoch": 2.1, - "learning_rate": 4.387371217193977e-07, - "loss": 0.48, - "step": 81816 - }, - { - "epoch": 2.1, - "learning_rate": 4.387142208264719e-07, - "loss": 0.5439, - "step": 81817 - }, - { - "epoch": 2.1, - "learning_rate": 4.386913203632968e-07, - "loss": 0.342, - "step": 81818 - }, - { - "epoch": 2.1, - "learning_rate": 4.3866842032988993e-07, - "loss": 0.3169, - "step": 81819 - }, - { - "epoch": 2.1, - "learning_rate": 4.3864552072626926e-07, - "loss": 0.345, - "step": 81820 - }, - { - "epoch": 2.1, - "learning_rate": 4.3862262155245154e-07, - "loss": 0.3807, - "step": 81821 - }, - { - "epoch": 2.1, - "learning_rate": 4.385997228084546e-07, - "loss": 0.3123, - "step": 81822 - }, - { - "epoch": 2.1, - "learning_rate": 4.3857682449429647e-07, - "loss": 0.4258, - "step": 81823 - }, - { - "epoch": 2.1, - "learning_rate": 4.3855392660999424e-07, - "loss": 0.3093, - "step": 81824 - }, - { - "epoch": 2.1, - "learning_rate": 4.3853102915556504e-07, - "loss": 0.2477, - "step": 81825 - }, - { - "epoch": 2.1, - "learning_rate": 4.3850813213102687e-07, - "loss": 0.5315, - "step": 81826 - }, - { - "epoch": 2.1, - "learning_rate": 4.3848523553639714e-07, - "loss": 0.3264, - "step": 81827 - }, - { - "epoch": 2.1, - "learning_rate": 4.3846233937169387e-07, - "loss": 0.4258, - "step": 81828 - }, - { - "epoch": 2.1, - "learning_rate": 4.384394436369337e-07, - "loss": 0.3511, - "step": 81829 - }, - { - "epoch": 2.1, - "learning_rate": 4.384165483321348e-07, - "loss": 0.373, - "step": 81830 - }, - { - "epoch": 2.1, - "learning_rate": 4.3839365345731437e-07, - "loss": 0.4512, - "step": 81831 - }, - { - "epoch": 2.1, - "learning_rate": 4.3837075901249053e-07, - "loss": 0.6045, - "step": 81832 - }, - { - "epoch": 2.1, - "learning_rate": 4.383478649976804e-07, - "loss": 0.2977, - "step": 81833 - }, - { - "epoch": 2.1, - "learning_rate": 4.3832497141290104e-07, - "loss": 0.4448, - "step": 81834 - }, - { - "epoch": 2.1, - "learning_rate": 4.383020782581706e-07, - "loss": 0.5083, - "step": 81835 - }, - { - "epoch": 2.1, - "learning_rate": 4.382791855335062e-07, - "loss": 0.3293, - "step": 81836 - }, - { - "epoch": 2.1, - "learning_rate": 4.382562932389261e-07, - "loss": 0.3843, - "step": 81837 - }, - { - "epoch": 2.1, - "learning_rate": 4.382334013744469e-07, - "loss": 0.342, - "step": 81838 - }, - { - "epoch": 2.1, - "learning_rate": 4.3821050994008656e-07, - "loss": 0.3762, - "step": 81839 - }, - { - "epoch": 2.1, - "learning_rate": 4.3818761893586296e-07, - "loss": 0.3945, - "step": 81840 - }, - { - "epoch": 2.1, - "learning_rate": 4.3816472836179297e-07, - "loss": 0.4214, - "step": 81841 - }, - { - "epoch": 2.1, - "learning_rate": 4.3814183821789444e-07, - "loss": 0.479, - "step": 81842 - }, - { - "epoch": 2.1, - "learning_rate": 4.381189485041852e-07, - "loss": 0.4395, - "step": 81843 - }, - { - "epoch": 2.1, - "learning_rate": 4.380960592206819e-07, - "loss": 0.3232, - "step": 81844 - }, - { - "epoch": 2.1, - "learning_rate": 4.380731703674032e-07, - "loss": 0.4032, - "step": 81845 - }, - { - "epoch": 2.1, - "learning_rate": 4.3805028194436555e-07, - "loss": 0.4331, - "step": 81846 - }, - { - "epoch": 2.1, - "learning_rate": 4.3802739395158707e-07, - "loss": 0.4673, - "step": 81847 - }, - { - "epoch": 2.1, - "learning_rate": 4.38004506389085e-07, - "loss": 0.4697, - "step": 81848 - }, - { - "epoch": 2.1, - "learning_rate": 4.379816192568776e-07, - "loss": 0.4575, - "step": 81849 - }, - { - "epoch": 2.1, - "learning_rate": 4.379587325549814e-07, - "loss": 0.5161, - "step": 81850 - }, - { - "epoch": 2.1, - "learning_rate": 4.379358462834143e-07, - "loss": 0.5234, - "step": 81851 - }, - { - "epoch": 2.1, - "learning_rate": 4.3791296044219395e-07, - "loss": 0.4565, - "step": 81852 - }, - { - "epoch": 2.1, - "learning_rate": 4.378900750313381e-07, - "loss": 0.4312, - "step": 81853 - }, - { - "epoch": 2.1, - "learning_rate": 4.37867190050864e-07, - "loss": 0.3591, - "step": 81854 - }, - { - "epoch": 2.1, - "learning_rate": 4.3784430550078876e-07, - "loss": 0.4932, - "step": 81855 - }, - { - "epoch": 2.1, - "learning_rate": 4.378214213811303e-07, - "loss": 0.3955, - "step": 81856 - }, - { - "epoch": 2.1, - "learning_rate": 4.3779853769190654e-07, - "loss": 0.2921, - "step": 81857 - }, - { - "epoch": 2.1, - "learning_rate": 4.377756544331341e-07, - "loss": 0.4265, - "step": 81858 - }, - { - "epoch": 2.1, - "learning_rate": 4.3775277160483113e-07, - "loss": 0.4297, - "step": 81859 - }, - { - "epoch": 2.1, - "learning_rate": 4.37729889207015e-07, - "loss": 0.4612, - "step": 81860 - }, - { - "epoch": 2.1, - "learning_rate": 4.3770700723970356e-07, - "loss": 0.5005, - "step": 81861 - }, - { - "epoch": 2.1, - "learning_rate": 4.376841257029136e-07, - "loss": 0.3412, - "step": 81862 - }, - { - "epoch": 2.1, - "learning_rate": 4.3766124459666354e-07, - "loss": 0.3938, - "step": 81863 - }, - { - "epoch": 2.1, - "learning_rate": 4.3763836392096986e-07, - "loss": 0.4263, - "step": 81864 - }, - { - "epoch": 2.1, - "learning_rate": 4.3761548367585076e-07, - "loss": 0.4951, - "step": 81865 - }, - { - "epoch": 2.1, - "learning_rate": 4.3759260386132404e-07, - "loss": 0.4043, - "step": 81866 - }, - { - "epoch": 2.1, - "learning_rate": 4.3756972447740627e-07, - "loss": 0.4451, - "step": 81867 - }, - { - "epoch": 2.1, - "learning_rate": 4.375468455241156e-07, - "loss": 0.4341, - "step": 81868 - }, - { - "epoch": 2.1, - "learning_rate": 4.3752396700146945e-07, - "loss": 0.2817, - "step": 81869 - }, - { - "epoch": 2.1, - "learning_rate": 4.3750108890948566e-07, - "loss": 0.4536, - "step": 81870 - }, - { - "epoch": 2.1, - "learning_rate": 4.3747821124818107e-07, - "loss": 0.3799, - "step": 81871 - }, - { - "epoch": 2.1, - "learning_rate": 4.3745533401757394e-07, - "loss": 0.3665, - "step": 81872 - }, - { - "epoch": 2.1, - "learning_rate": 4.3743245721768105e-07, - "loss": 0.4507, - "step": 81873 - }, - { - "epoch": 2.1, - "learning_rate": 4.3740958084852056e-07, - "loss": 0.4238, - "step": 81874 - }, - { - "epoch": 2.1, - "learning_rate": 4.373867049101093e-07, - "loss": 0.4766, - "step": 81875 - }, - { - "epoch": 2.1, - "learning_rate": 4.373638294024653e-07, - "loss": 0.5103, - "step": 81876 - }, - { - "epoch": 2.1, - "learning_rate": 4.373409543256058e-07, - "loss": 0.4336, - "step": 81877 - }, - { - "epoch": 2.1, - "learning_rate": 4.3731807967954893e-07, - "loss": 0.4858, - "step": 81878 - }, - { - "epoch": 2.1, - "learning_rate": 4.3729520546431133e-07, - "loss": 0.5317, - "step": 81879 - }, - { - "epoch": 2.1, - "learning_rate": 4.3727233167991095e-07, - "loss": 0.3926, - "step": 81880 - }, - { - "epoch": 2.1, - "learning_rate": 4.3724945832636515e-07, - "loss": 0.4268, - "step": 81881 - }, - { - "epoch": 2.1, - "learning_rate": 4.3722658540369204e-07, - "loss": 0.3923, - "step": 81882 - }, - { - "epoch": 2.1, - "learning_rate": 4.372037129119086e-07, - "loss": 0.4912, - "step": 81883 - }, - { - "epoch": 2.1, - "learning_rate": 4.3718084085103214e-07, - "loss": 0.4092, - "step": 81884 - }, - { - "epoch": 2.1, - "learning_rate": 4.371579692210804e-07, - "loss": 0.314, - "step": 81885 - }, - { - "epoch": 2.1, - "learning_rate": 4.3713509802207083e-07, - "loss": 0.4023, - "step": 81886 - }, - { - "epoch": 2.1, - "learning_rate": 4.3711222725402143e-07, - "loss": 0.3891, - "step": 81887 - }, - { - "epoch": 2.1, - "learning_rate": 4.3708935691694895e-07, - "loss": 0.3198, - "step": 81888 - }, - { - "epoch": 2.1, - "learning_rate": 4.3706648701087135e-07, - "loss": 0.5049, - "step": 81889 - }, - { - "epoch": 2.1, - "learning_rate": 4.37043617535806e-07, - "loss": 0.3833, - "step": 81890 - }, - { - "epoch": 2.1, - "learning_rate": 4.3702074849177075e-07, - "loss": 0.4072, - "step": 81891 - }, - { - "epoch": 2.1, - "learning_rate": 4.369978798787829e-07, - "loss": 0.3993, - "step": 81892 - }, - { - "epoch": 2.1, - "learning_rate": 4.3697501169685956e-07, - "loss": 0.3945, - "step": 81893 - }, - { - "epoch": 2.1, - "learning_rate": 4.3695214394601854e-07, - "loss": 0.3301, - "step": 81894 - }, - { - "epoch": 2.1, - "learning_rate": 4.3692927662627764e-07, - "loss": 0.4077, - "step": 81895 - }, - { - "epoch": 2.1, - "learning_rate": 4.369064097376539e-07, - "loss": 0.4025, - "step": 81896 - }, - { - "epoch": 2.1, - "learning_rate": 4.3688354328016495e-07, - "loss": 0.4546, - "step": 81897 - }, - { - "epoch": 2.1, - "learning_rate": 4.368606772538284e-07, - "loss": 0.425, - "step": 81898 - }, - { - "epoch": 2.1, - "learning_rate": 4.3683781165866207e-07, - "loss": 0.3999, - "step": 81899 - }, - { - "epoch": 2.1, - "learning_rate": 4.3681494649468275e-07, - "loss": 0.4268, - "step": 81900 - }, - { - "epoch": 2.1, - "learning_rate": 4.367920817619084e-07, - "loss": 0.3645, - "step": 81901 - }, - { - "epoch": 2.1, - "learning_rate": 4.3676921746035677e-07, - "loss": 0.3606, - "step": 81902 - }, - { - "epoch": 2.1, - "learning_rate": 4.3674635359004463e-07, - "loss": 0.3967, - "step": 81903 - }, - { - "epoch": 2.1, - "learning_rate": 4.367234901509904e-07, - "loss": 0.5176, - "step": 81904 - }, - { - "epoch": 2.1, - "learning_rate": 4.3670062714321065e-07, - "loss": 0.3181, - "step": 81905 - }, - { - "epoch": 2.1, - "learning_rate": 4.3667776456672333e-07, - "loss": 0.5127, - "step": 81906 - }, - { - "epoch": 2.1, - "learning_rate": 4.36654902421546e-07, - "loss": 0.412, - "step": 81907 - }, - { - "epoch": 2.1, - "learning_rate": 4.3663204070769645e-07, - "loss": 0.5024, - "step": 81908 - }, - { - "epoch": 2.1, - "learning_rate": 4.3660917942519135e-07, - "loss": 0.3887, - "step": 81909 - }, - { - "epoch": 2.1, - "learning_rate": 4.365863185740488e-07, - "loss": 0.312, - "step": 81910 - }, - { - "epoch": 2.1, - "learning_rate": 4.365634581542863e-07, - "loss": 0.3118, - "step": 81911 - }, - { - "epoch": 2.1, - "learning_rate": 4.365405981659218e-07, - "loss": 0.343, - "step": 81912 - }, - { - "epoch": 2.1, - "learning_rate": 4.365177386089717e-07, - "loss": 0.3181, - "step": 81913 - }, - { - "epoch": 2.1, - "learning_rate": 4.36494879483454e-07, - "loss": 0.4524, - "step": 81914 - }, - { - "epoch": 2.1, - "learning_rate": 4.3647202078938617e-07, - "loss": 0.3643, - "step": 81915 - }, - { - "epoch": 2.1, - "learning_rate": 4.364491625267862e-07, - "loss": 0.3511, - "step": 81916 - }, - { - "epoch": 2.1, - "learning_rate": 4.364263046956709e-07, - "loss": 0.3574, - "step": 81917 - }, - { - "epoch": 2.1, - "learning_rate": 4.3640344729605805e-07, - "loss": 0.415, - "step": 81918 - }, - { - "epoch": 2.1, - "learning_rate": 4.3638059032796514e-07, - "loss": 0.2694, - "step": 81919 - }, - { - "epoch": 2.1, - "learning_rate": 4.3635773379141005e-07, - "loss": 0.4609, - "step": 81920 - }, - { - "epoch": 2.1, - "learning_rate": 4.363348776864095e-07, - "loss": 0.4668, - "step": 81921 - }, - { - "epoch": 2.1, - "learning_rate": 4.363120220129819e-07, - "loss": 0.3755, - "step": 81922 - }, - { - "epoch": 2.1, - "learning_rate": 4.362891667711438e-07, - "loss": 0.4434, - "step": 81923 - }, - { - "epoch": 2.1, - "learning_rate": 4.3626631196091323e-07, - "loss": 0.3798, - "step": 81924 - }, - { - "epoch": 2.1, - "learning_rate": 4.36243457582308e-07, - "loss": 0.4009, - "step": 81925 - }, - { - "epoch": 2.1, - "learning_rate": 4.3622060363534484e-07, - "loss": 0.3492, - "step": 81926 - }, - { - "epoch": 2.1, - "learning_rate": 4.3619775012004166e-07, - "loss": 0.3634, - "step": 81927 - }, - { - "epoch": 2.1, - "learning_rate": 4.3617489703641585e-07, - "loss": 0.3507, - "step": 81928 - }, - { - "epoch": 2.1, - "learning_rate": 4.361520443844855e-07, - "loss": 0.3545, - "step": 81929 - }, - { - "epoch": 2.1, - "learning_rate": 4.361291921642671e-07, - "loss": 0.5527, - "step": 81930 - }, - { - "epoch": 2.1, - "learning_rate": 4.3610634037577877e-07, - "loss": 0.4019, - "step": 81931 - }, - { - "epoch": 2.1, - "learning_rate": 4.3608348901903826e-07, - "loss": 0.3911, - "step": 81932 - }, - { - "epoch": 2.1, - "learning_rate": 4.3606063809406257e-07, - "loss": 0.3159, - "step": 81933 - }, - { - "epoch": 2.1, - "learning_rate": 4.360377876008691e-07, - "loss": 0.5005, - "step": 81934 - }, - { - "epoch": 2.1, - "learning_rate": 4.360149375394754e-07, - "loss": 0.4185, - "step": 81935 - }, - { - "epoch": 2.1, - "learning_rate": 4.359920879098993e-07, - "loss": 0.425, - "step": 81936 - }, - { - "epoch": 2.1, - "learning_rate": 4.359692387121583e-07, - "loss": 0.4062, - "step": 81937 - }, - { - "epoch": 2.1, - "learning_rate": 4.3594638994626954e-07, - "loss": 0.3031, - "step": 81938 - }, - { - "epoch": 2.1, - "learning_rate": 4.3592354161225054e-07, - "loss": 0.4448, - "step": 81939 - }, - { - "epoch": 2.1, - "learning_rate": 4.359006937101191e-07, - "loss": 0.4414, - "step": 81940 - }, - { - "epoch": 2.1, - "learning_rate": 4.358778462398928e-07, - "loss": 0.313, - "step": 81941 - }, - { - "epoch": 2.1, - "learning_rate": 4.3585499920158887e-07, - "loss": 0.2969, - "step": 81942 - }, - { - "epoch": 2.1, - "learning_rate": 4.3583215259522453e-07, - "loss": 0.4255, - "step": 81943 - }, - { - "epoch": 2.1, - "learning_rate": 4.3580930642081757e-07, - "loss": 0.3621, - "step": 81944 - }, - { - "epoch": 2.1, - "learning_rate": 4.3578646067838555e-07, - "loss": 0.3906, - "step": 81945 - }, - { - "epoch": 2.1, - "learning_rate": 4.3576361536794615e-07, - "loss": 0.4043, - "step": 81946 - }, - { - "epoch": 2.1, - "learning_rate": 4.3574077048951627e-07, - "loss": 0.4463, - "step": 81947 - }, - { - "epoch": 2.1, - "learning_rate": 4.3571792604311375e-07, - "loss": 0.4653, - "step": 81948 - }, - { - "epoch": 2.1, - "learning_rate": 4.3569508202875647e-07, - "loss": 0.519, - "step": 81949 - }, - { - "epoch": 2.1, - "learning_rate": 4.3567223844646106e-07, - "loss": 0.2714, - "step": 81950 - }, - { - "epoch": 2.1, - "learning_rate": 4.356493952962456e-07, - "loss": 0.4243, - "step": 81951 - }, - { - "epoch": 2.1, - "learning_rate": 4.3562655257812765e-07, - "loss": 0.4219, - "step": 81952 - }, - { - "epoch": 2.1, - "learning_rate": 4.3560371029212427e-07, - "loss": 0.5439, - "step": 81953 - }, - { - "epoch": 2.1, - "learning_rate": 4.355808684382535e-07, - "loss": 0.365, - "step": 81954 - }, - { - "epoch": 2.1, - "learning_rate": 4.355580270165321e-07, - "loss": 0.366, - "step": 81955 - }, - { - "epoch": 2.1, - "learning_rate": 4.3553518602697805e-07, - "loss": 0.3887, - "step": 81956 - }, - { - "epoch": 2.1, - "learning_rate": 4.3551234546960867e-07, - "loss": 0.3979, - "step": 81957 - }, - { - "epoch": 2.1, - "learning_rate": 4.3548950534444197e-07, - "loss": 0.458, - "step": 81958 - }, - { - "epoch": 2.1, - "learning_rate": 4.354666656514945e-07, - "loss": 0.375, - "step": 81959 - }, - { - "epoch": 2.1, - "learning_rate": 4.3544382639078436e-07, - "loss": 0.4907, - "step": 81960 - }, - { - "epoch": 2.1, - "learning_rate": 4.354209875623289e-07, - "loss": 0.3574, - "step": 81961 - }, - { - "epoch": 2.1, - "learning_rate": 4.3539814916614605e-07, - "loss": 0.2478, - "step": 81962 - }, - { - "epoch": 2.1, - "learning_rate": 4.353753112022528e-07, - "loss": 0.3018, - "step": 81963 - }, - { - "epoch": 2.1, - "learning_rate": 4.353524736706663e-07, - "loss": 0.3929, - "step": 81964 - }, - { - "epoch": 2.1, - "learning_rate": 4.3532963657140453e-07, - "loss": 0.3774, - "step": 81965 - }, - { - "epoch": 2.1, - "learning_rate": 4.3530679990448527e-07, - "loss": 0.4067, - "step": 81966 - }, - { - "epoch": 2.1, - "learning_rate": 4.3528396366992523e-07, - "loss": 0.4116, - "step": 81967 - }, - { - "epoch": 2.1, - "learning_rate": 4.352611278677423e-07, - "loss": 0.481, - "step": 81968 - }, - { - "epoch": 2.1, - "learning_rate": 4.3523829249795396e-07, - "loss": 0.4695, - "step": 81969 - }, - { - "epoch": 2.1, - "learning_rate": 4.35215457560578e-07, - "loss": 0.4546, - "step": 81970 - }, - { - "epoch": 2.1, - "learning_rate": 4.3519262305563133e-07, - "loss": 0.3656, - "step": 81971 - }, - { - "epoch": 2.1, - "learning_rate": 4.3516978898313195e-07, - "loss": 0.4897, - "step": 81972 - }, - { - "epoch": 2.1, - "learning_rate": 4.351469553430969e-07, - "loss": 0.3989, - "step": 81973 - }, - { - "epoch": 2.1, - "learning_rate": 4.351241221355437e-07, - "loss": 0.4629, - "step": 81974 - }, - { - "epoch": 2.1, - "learning_rate": 4.351012893604904e-07, - "loss": 0.562, - "step": 81975 - }, - { - "epoch": 2.1, - "learning_rate": 4.350784570179537e-07, - "loss": 0.4702, - "step": 81976 - }, - { - "epoch": 2.1, - "learning_rate": 4.350556251079515e-07, - "loss": 0.3723, - "step": 81977 - }, - { - "epoch": 2.1, - "learning_rate": 4.3503279363050106e-07, - "loss": 0.4824, - "step": 81978 - }, - { - "epoch": 2.1, - "learning_rate": 4.350099625856205e-07, - "loss": 0.4465, - "step": 81979 - }, - { - "epoch": 2.1, - "learning_rate": 4.349871319733266e-07, - "loss": 0.4308, - "step": 81980 - }, - { - "epoch": 2.1, - "learning_rate": 4.3496430179363685e-07, - "loss": 0.4951, - "step": 81981 - }, - { - "epoch": 2.1, - "learning_rate": 4.349414720465695e-07, - "loss": 0.4102, - "step": 81982 - }, - { - "epoch": 2.1, - "learning_rate": 4.3491864273214143e-07, - "loss": 0.3772, - "step": 81983 - }, - { - "epoch": 2.1, - "learning_rate": 4.348958138503698e-07, - "loss": 0.5127, - "step": 81984 - }, - { - "epoch": 2.1, - "learning_rate": 4.348729854012724e-07, - "loss": 0.3254, - "step": 81985 - }, - { - "epoch": 2.1, - "learning_rate": 4.348501573848667e-07, - "loss": 0.459, - "step": 81986 - }, - { - "epoch": 2.1, - "learning_rate": 4.3482732980117086e-07, - "loss": 0.395, - "step": 81987 - }, - { - "epoch": 2.1, - "learning_rate": 4.348045026502012e-07, - "loss": 0.5405, - "step": 81988 - }, - { - "epoch": 2.1, - "learning_rate": 4.347816759319758e-07, - "loss": 0.3989, - "step": 81989 - }, - { - "epoch": 2.1, - "learning_rate": 4.347588496465121e-07, - "loss": 0.4307, - "step": 81990 - }, - { - "epoch": 2.1, - "learning_rate": 4.347360237938279e-07, - "loss": 0.5132, - "step": 81991 - }, - { - "epoch": 2.1, - "learning_rate": 4.347131983739403e-07, - "loss": 0.2974, - "step": 81992 - }, - { - "epoch": 2.1, - "learning_rate": 4.3469037338686654e-07, - "loss": 0.4402, - "step": 81993 - }, - { - "epoch": 2.1, - "learning_rate": 4.3466754883262424e-07, - "loss": 0.3707, - "step": 81994 - }, - { - "epoch": 2.1, - "learning_rate": 4.3464472471123103e-07, - "loss": 0.4668, - "step": 81995 - }, - { - "epoch": 2.1, - "learning_rate": 4.346219010227048e-07, - "loss": 0.4287, - "step": 81996 - }, - { - "epoch": 2.1, - "learning_rate": 4.3459907776706216e-07, - "loss": 0.4595, - "step": 81997 - }, - { - "epoch": 2.1, - "learning_rate": 4.34576254944321e-07, - "loss": 0.4307, - "step": 81998 - }, - { - "epoch": 2.1, - "learning_rate": 4.3455343255449894e-07, - "loss": 0.5122, - "step": 81999 - }, - { - "epoch": 2.1, - "learning_rate": 4.345306105976135e-07, - "loss": 0.4087, - "step": 82000 - }, - { - "epoch": 2.1, - "learning_rate": 4.3450778907368167e-07, - "loss": 0.4067, - "step": 82001 - }, - { - "epoch": 2.1, - "learning_rate": 4.344849679827216e-07, - "loss": 0.3677, - "step": 82002 - }, - { - "epoch": 2.1, - "learning_rate": 4.3446214732475004e-07, - "loss": 0.4243, - "step": 82003 - }, - { - "epoch": 2.1, - "learning_rate": 4.3443932709978515e-07, - "loss": 0.4839, - "step": 82004 - }, - { - "epoch": 2.1, - "learning_rate": 4.344165073078437e-07, - "loss": 0.4458, - "step": 82005 - }, - { - "epoch": 2.1, - "learning_rate": 4.343936879489436e-07, - "loss": 0.4072, - "step": 82006 - }, - { - "epoch": 2.1, - "learning_rate": 4.3437086902310216e-07, - "loss": 0.2474, - "step": 82007 - }, - { - "epoch": 2.1, - "learning_rate": 4.3434805053033727e-07, - "loss": 0.375, - "step": 82008 - }, - { - "epoch": 2.1, - "learning_rate": 4.343252324706658e-07, - "loss": 0.5015, - "step": 82009 - }, - { - "epoch": 2.1, - "learning_rate": 4.343024148441055e-07, - "loss": 0.2089, - "step": 82010 - }, - { - "epoch": 2.1, - "learning_rate": 4.342795976506737e-07, - "loss": 0.4897, - "step": 82011 - }, - { - "epoch": 2.1, - "learning_rate": 4.342567808903884e-07, - "loss": 0.4316, - "step": 82012 - }, - { - "epoch": 2.1, - "learning_rate": 4.3423396456326677e-07, - "loss": 0.4785, - "step": 82013 - }, - { - "epoch": 2.1, - "learning_rate": 4.3421114866932576e-07, - "loss": 0.4062, - "step": 82014 - }, - { - "epoch": 2.1, - "learning_rate": 4.341883332085832e-07, - "loss": 0.3679, - "step": 82015 - }, - { - "epoch": 2.1, - "learning_rate": 4.341655181810566e-07, - "loss": 0.5864, - "step": 82016 - }, - { - "epoch": 2.1, - "learning_rate": 4.34142703586764e-07, - "loss": 0.3621, - "step": 82017 - }, - { - "epoch": 2.1, - "learning_rate": 4.3411988942572177e-07, - "loss": 0.3455, - "step": 82018 - }, - { - "epoch": 2.1, - "learning_rate": 4.34097075697948e-07, - "loss": 0.4795, - "step": 82019 - }, - { - "epoch": 2.1, - "learning_rate": 4.3407426240346035e-07, - "loss": 0.4272, - "step": 82020 - }, - { - "epoch": 2.1, - "learning_rate": 4.340514495422757e-07, - "loss": 0.3164, - "step": 82021 - }, - { - "epoch": 2.1, - "learning_rate": 4.340286371144122e-07, - "loss": 0.4868, - "step": 82022 - }, - { - "epoch": 2.1, - "learning_rate": 4.340058251198866e-07, - "loss": 0.5, - "step": 82023 - }, - { - "epoch": 2.1, - "learning_rate": 4.339830135587167e-07, - "loss": 0.3604, - "step": 82024 - }, - { - "epoch": 2.1, - "learning_rate": 4.3396020243092033e-07, - "loss": 0.4204, - "step": 82025 - }, - { - "epoch": 2.1, - "learning_rate": 4.3393739173651436e-07, - "loss": 0.3672, - "step": 82026 - }, - { - "epoch": 2.1, - "learning_rate": 4.339145814755163e-07, - "loss": 0.4868, - "step": 82027 - }, - { - "epoch": 2.1, - "learning_rate": 4.33891771647944e-07, - "loss": 0.3092, - "step": 82028 - }, - { - "epoch": 2.1, - "learning_rate": 4.3386896225381496e-07, - "loss": 0.499, - "step": 82029 - }, - { - "epoch": 2.1, - "learning_rate": 4.338461532931461e-07, - "loss": 0.3621, - "step": 82030 - }, - { - "epoch": 2.1, - "learning_rate": 4.338233447659553e-07, - "loss": 0.417, - "step": 82031 - }, - { - "epoch": 2.1, - "learning_rate": 4.3380053667226026e-07, - "loss": 0.4785, - "step": 82032 - }, - { - "epoch": 2.1, - "learning_rate": 4.3377772901207766e-07, - "loss": 0.4258, - "step": 82033 - }, - { - "epoch": 2.1, - "learning_rate": 4.3375492178542585e-07, - "loss": 0.3726, - "step": 82034 - }, - { - "epoch": 2.1, - "learning_rate": 4.3373211499232154e-07, - "loss": 0.4712, - "step": 82035 - }, - { - "epoch": 2.1, - "learning_rate": 4.3370930863278244e-07, - "loss": 0.2783, - "step": 82036 - }, - { - "epoch": 2.1, - "learning_rate": 4.3368650270682637e-07, - "loss": 0.3645, - "step": 82037 - }, - { - "epoch": 2.1, - "learning_rate": 4.336636972144703e-07, - "loss": 0.3412, - "step": 82038 - }, - { - "epoch": 2.1, - "learning_rate": 4.3364089215573184e-07, - "loss": 0.5117, - "step": 82039 - }, - { - "epoch": 2.1, - "learning_rate": 4.3361808753062843e-07, - "loss": 0.4038, - "step": 82040 - }, - { - "epoch": 2.1, - "learning_rate": 4.3359528333917805e-07, - "loss": 0.4658, - "step": 82041 - }, - { - "epoch": 2.1, - "learning_rate": 4.335724795813978e-07, - "loss": 0.3435, - "step": 82042 - }, - { - "epoch": 2.1, - "learning_rate": 4.335496762573045e-07, - "loss": 0.4307, - "step": 82043 - }, - { - "epoch": 2.1, - "learning_rate": 4.335268733669163e-07, - "loss": 0.3525, - "step": 82044 - }, - { - "epoch": 2.1, - "learning_rate": 4.3350407091025057e-07, - "loss": 0.4487, - "step": 82045 - }, - { - "epoch": 2.1, - "learning_rate": 4.3348126888732496e-07, - "loss": 0.4746, - "step": 82046 - }, - { - "epoch": 2.1, - "learning_rate": 4.334584672981564e-07, - "loss": 0.564, - "step": 82047 - }, - { - "epoch": 2.1, - "learning_rate": 4.3343566614276264e-07, - "loss": 0.3049, - "step": 82048 - }, - { - "epoch": 2.1, - "learning_rate": 4.3341286542116106e-07, - "loss": 0.4434, - "step": 82049 - }, - { - "epoch": 2.1, - "learning_rate": 4.3339006513336964e-07, - "loss": 0.3294, - "step": 82050 - }, - { - "epoch": 2.1, - "learning_rate": 4.3336726527940504e-07, - "loss": 0.3794, - "step": 82051 - }, - { - "epoch": 2.1, - "learning_rate": 4.333444658592854e-07, - "loss": 0.4126, - "step": 82052 - }, - { - "epoch": 2.1, - "learning_rate": 4.333216668730275e-07, - "loss": 0.4678, - "step": 82053 - }, - { - "epoch": 2.1, - "learning_rate": 4.3329886832064953e-07, - "loss": 0.438, - "step": 82054 - }, - { - "epoch": 2.1, - "learning_rate": 4.3327607020216814e-07, - "loss": 0.521, - "step": 82055 - }, - { - "epoch": 2.1, - "learning_rate": 4.3325327251760124e-07, - "loss": 0.3794, - "step": 82056 - }, - { - "epoch": 2.1, - "learning_rate": 4.332304752669662e-07, - "loss": 0.4805, - "step": 82057 - }, - { - "epoch": 2.1, - "learning_rate": 4.3320767845028096e-07, - "loss": 0.5708, - "step": 82058 - }, - { - "epoch": 2.1, - "learning_rate": 4.331848820675621e-07, - "loss": 0.3173, - "step": 82059 - }, - { - "epoch": 2.1, - "learning_rate": 4.3316208611882754e-07, - "loss": 0.3507, - "step": 82060 - }, - { - "epoch": 2.1, - "learning_rate": 4.3313929060409473e-07, - "loss": 0.3901, - "step": 82061 - }, - { - "epoch": 2.1, - "learning_rate": 4.331164955233815e-07, - "loss": 0.4629, - "step": 82062 - }, - { - "epoch": 2.1, - "learning_rate": 4.330937008767048e-07, - "loss": 0.4834, - "step": 82063 - }, - { - "epoch": 2.1, - "learning_rate": 4.33070906664082e-07, - "loss": 0.3613, - "step": 82064 - }, - { - "epoch": 2.1, - "learning_rate": 4.3304811288553055e-07, - "loss": 0.3048, - "step": 82065 - }, - { - "epoch": 2.1, - "learning_rate": 4.3302531954106815e-07, - "loss": 0.3394, - "step": 82066 - }, - { - "epoch": 2.1, - "learning_rate": 4.3300252663071257e-07, - "loss": 0.3481, - "step": 82067 - }, - { - "epoch": 2.1, - "learning_rate": 4.3297973415448054e-07, - "loss": 0.3896, - "step": 82068 - }, - { - "epoch": 2.1, - "learning_rate": 4.3295694211238974e-07, - "loss": 0.376, - "step": 82069 - }, - { - "epoch": 2.1, - "learning_rate": 4.329341505044579e-07, - "loss": 0.3811, - "step": 82070 - }, - { - "epoch": 2.1, - "learning_rate": 4.3291135933070256e-07, - "loss": 0.4717, - "step": 82071 - }, - { - "epoch": 2.1, - "learning_rate": 4.3288856859114096e-07, - "loss": 0.4722, - "step": 82072 - }, - { - "epoch": 2.1, - "learning_rate": 4.328657782857902e-07, - "loss": 0.4697, - "step": 82073 - }, - { - "epoch": 2.1, - "learning_rate": 4.3284298841466793e-07, - "loss": 0.397, - "step": 82074 - }, - { - "epoch": 2.1, - "learning_rate": 4.328201989777921e-07, - "loss": 0.3763, - "step": 82075 - }, - { - "epoch": 2.1, - "learning_rate": 4.3279740997517943e-07, - "loss": 0.4033, - "step": 82076 - }, - { - "epoch": 2.1, - "learning_rate": 4.327746214068477e-07, - "loss": 0.3585, - "step": 82077 - }, - { - "epoch": 2.1, - "learning_rate": 4.3275183327281426e-07, - "loss": 0.5527, - "step": 82078 - }, - { - "epoch": 2.1, - "learning_rate": 4.327290455730972e-07, - "loss": 0.3403, - "step": 82079 - }, - { - "epoch": 2.1, - "learning_rate": 4.327062583077129e-07, - "loss": 0.4287, - "step": 82080 - }, - { - "epoch": 2.1, - "learning_rate": 4.326834714766795e-07, - "loss": 0.4404, - "step": 82081 - }, - { - "epoch": 2.1, - "learning_rate": 4.326606850800145e-07, - "loss": 0.3576, - "step": 82082 - }, - { - "epoch": 2.1, - "learning_rate": 4.3263789911773487e-07, - "loss": 0.2698, - "step": 82083 - }, - { - "epoch": 2.1, - "learning_rate": 4.326151135898586e-07, - "loss": 0.4072, - "step": 82084 - }, - { - "epoch": 2.1, - "learning_rate": 4.325923284964025e-07, - "loss": 0.3523, - "step": 82085 - }, - { - "epoch": 2.1, - "learning_rate": 4.325695438373843e-07, - "loss": 0.3105, - "step": 82086 - }, - { - "epoch": 2.1, - "learning_rate": 4.325467596128216e-07, - "loss": 0.4792, - "step": 82087 - }, - { - "epoch": 2.1, - "learning_rate": 4.32523975822732e-07, - "loss": 0.4543, - "step": 82088 - }, - { - "epoch": 2.1, - "learning_rate": 4.3250119246713245e-07, - "loss": 0.4727, - "step": 82089 - }, - { - "epoch": 2.1, - "learning_rate": 4.3247840954604065e-07, - "loss": 0.4272, - "step": 82090 - }, - { - "epoch": 2.1, - "learning_rate": 4.32455627059474e-07, - "loss": 0.4224, - "step": 82091 - }, - { - "epoch": 2.1, - "learning_rate": 4.3243284500745067e-07, - "loss": 0.3804, - "step": 82092 - }, - { - "epoch": 2.1, - "learning_rate": 4.3241006338998674e-07, - "loss": 0.5371, - "step": 82093 - }, - { - "epoch": 2.1, - "learning_rate": 4.323872822071004e-07, - "loss": 0.5073, - "step": 82094 - }, - { - "epoch": 2.1, - "learning_rate": 4.3236450145880885e-07, - "loss": 0.3984, - "step": 82095 - }, - { - "epoch": 2.1, - "learning_rate": 4.323417211451302e-07, - "loss": 0.2361, - "step": 82096 - }, - { - "epoch": 2.1, - "learning_rate": 4.32318941266081e-07, - "loss": 0.2567, - "step": 82097 - }, - { - "epoch": 2.1, - "learning_rate": 4.3229616182167905e-07, - "loss": 0.2469, - "step": 82098 - }, - { - "epoch": 2.1, - "learning_rate": 4.3227338281194183e-07, - "loss": 0.5024, - "step": 82099 - }, - { - "epoch": 2.1, - "learning_rate": 4.322506042368872e-07, - "loss": 0.2769, - "step": 82100 - }, - { - "epoch": 2.1, - "learning_rate": 4.3222782609653174e-07, - "loss": 0.395, - "step": 82101 - }, - { - "epoch": 2.1, - "learning_rate": 4.3220504839089365e-07, - "loss": 0.3564, - "step": 82102 - }, - { - "epoch": 2.1, - "learning_rate": 4.321822711199897e-07, - "loss": 0.3584, - "step": 82103 - }, - { - "epoch": 2.1, - "learning_rate": 4.321594942838378e-07, - "loss": 0.3033, - "step": 82104 - }, - { - "epoch": 2.1, - "learning_rate": 4.3213671788245555e-07, - "loss": 0.5078, - "step": 82105 - }, - { - "epoch": 2.1, - "learning_rate": 4.321139419158597e-07, - "loss": 0.4067, - "step": 82106 - }, - { - "epoch": 2.1, - "learning_rate": 4.320911663840682e-07, - "loss": 0.3726, - "step": 82107 - }, - { - "epoch": 2.1, - "learning_rate": 4.320683912870983e-07, - "loss": 0.5308, - "step": 82108 - }, - { - "epoch": 2.1, - "learning_rate": 4.3204561662496784e-07, - "loss": 0.4307, - "step": 82109 - }, - { - "epoch": 2.1, - "learning_rate": 4.320228423976936e-07, - "loss": 0.48, - "step": 82110 - }, - { - "epoch": 2.1, - "learning_rate": 4.320000686052934e-07, - "loss": 0.2898, - "step": 82111 - }, - { - "epoch": 2.1, - "learning_rate": 4.3197729524778505e-07, - "loss": 0.3497, - "step": 82112 - }, - { - "epoch": 2.1, - "learning_rate": 4.3195452232518547e-07, - "loss": 0.4805, - "step": 82113 - }, - { - "epoch": 2.1, - "learning_rate": 4.319317498375118e-07, - "loss": 0.4053, - "step": 82114 - }, - { - "epoch": 2.1, - "learning_rate": 4.3190897778478196e-07, - "loss": 0.459, - "step": 82115 - }, - { - "epoch": 2.1, - "learning_rate": 4.3188620616701323e-07, - "loss": 0.4336, - "step": 82116 - }, - { - "epoch": 2.1, - "learning_rate": 4.318634349842235e-07, - "loss": 0.418, - "step": 82117 - }, - { - "epoch": 2.1, - "learning_rate": 4.318406642364294e-07, - "loss": 0.3164, - "step": 82118 - }, - { - "epoch": 2.1, - "learning_rate": 4.3181789392364887e-07, - "loss": 0.4644, - "step": 82119 - }, - { - "epoch": 2.1, - "learning_rate": 4.317951240458991e-07, - "loss": 0.2532, - "step": 82120 - }, - { - "epoch": 2.1, - "learning_rate": 4.317723546031983e-07, - "loss": 0.4619, - "step": 82121 - }, - { - "epoch": 2.1, - "learning_rate": 4.3174958559556307e-07, - "loss": 0.3735, - "step": 82122 - }, - { - "epoch": 2.1, - "learning_rate": 4.317268170230107e-07, - "loss": 0.4546, - "step": 82123 - }, - { - "epoch": 2.1, - "learning_rate": 4.31704048885559e-07, - "loss": 0.3057, - "step": 82124 - }, - { - "epoch": 2.1, - "learning_rate": 4.3168128118322546e-07, - "loss": 0.5654, - "step": 82125 - }, - { - "epoch": 2.1, - "learning_rate": 4.316585139160277e-07, - "loss": 0.4424, - "step": 82126 - }, - { - "epoch": 2.1, - "learning_rate": 4.316357470839825e-07, - "loss": 0.2769, - "step": 82127 - }, - { - "epoch": 2.1, - "learning_rate": 4.3161298068710783e-07, - "loss": 0.5625, - "step": 82128 - }, - { - "epoch": 2.11, - "learning_rate": 4.3159021472542125e-07, - "loss": 0.4131, - "step": 82129 - }, - { - "epoch": 2.11, - "learning_rate": 4.315674491989395e-07, - "loss": 0.4541, - "step": 82130 - }, - { - "epoch": 2.11, - "learning_rate": 4.315446841076804e-07, - "loss": 0.4282, - "step": 82131 - }, - { - "epoch": 2.11, - "learning_rate": 4.315219194516618e-07, - "loss": 0.2381, - "step": 82132 - }, - { - "epoch": 2.11, - "learning_rate": 4.314991552309004e-07, - "loss": 0.3429, - "step": 82133 - }, - { - "epoch": 2.11, - "learning_rate": 4.3147639144541427e-07, - "loss": 0.4453, - "step": 82134 - }, - { - "epoch": 2.11, - "learning_rate": 4.314536280952201e-07, - "loss": 0.3371, - "step": 82135 - }, - { - "epoch": 2.11, - "learning_rate": 4.314308651803359e-07, - "loss": 0.3572, - "step": 82136 - }, - { - "epoch": 2.11, - "learning_rate": 4.3140810270077886e-07, - "loss": 0.2562, - "step": 82137 - }, - { - "epoch": 2.11, - "learning_rate": 4.313853406565668e-07, - "loss": 0.3823, - "step": 82138 - }, - { - "epoch": 2.11, - "learning_rate": 4.3136257904771655e-07, - "loss": 0.2991, - "step": 82139 - }, - { - "epoch": 2.11, - "learning_rate": 4.313398178742459e-07, - "loss": 0.5137, - "step": 82140 - }, - { - "epoch": 2.11, - "learning_rate": 4.313170571361721e-07, - "loss": 0.4531, - "step": 82141 - }, - { - "epoch": 2.11, - "learning_rate": 4.3129429683351304e-07, - "loss": 0.394, - "step": 82142 - }, - { - "epoch": 2.11, - "learning_rate": 4.312715369662858e-07, - "loss": 0.4937, - "step": 82143 - }, - { - "epoch": 2.11, - "learning_rate": 4.312487775345074e-07, - "loss": 0.2415, - "step": 82144 - }, - { - "epoch": 2.11, - "learning_rate": 4.312260185381957e-07, - "loss": 0.3362, - "step": 82145 - }, - { - "epoch": 2.11, - "learning_rate": 4.312032599773685e-07, - "loss": 0.4634, - "step": 82146 - }, - { - "epoch": 2.11, - "learning_rate": 4.3118050185204234e-07, - "loss": 0.4448, - "step": 82147 - }, - { - "epoch": 2.11, - "learning_rate": 4.3115774416223516e-07, - "loss": 0.4424, - "step": 82148 - }, - { - "epoch": 2.11, - "learning_rate": 4.3113498690796437e-07, - "loss": 0.3174, - "step": 82149 - }, - { - "epoch": 2.11, - "learning_rate": 4.3111223008924767e-07, - "loss": 0.5156, - "step": 82150 - }, - { - "epoch": 2.11, - "learning_rate": 4.3108947370610183e-07, - "loss": 0.4785, - "step": 82151 - }, - { - "epoch": 2.11, - "learning_rate": 4.3106671775854496e-07, - "loss": 0.4644, - "step": 82152 - }, - { - "epoch": 2.11, - "learning_rate": 4.310439622465939e-07, - "loss": 0.429, - "step": 82153 - }, - { - "epoch": 2.11, - "learning_rate": 4.3102120717026626e-07, - "loss": 0.4775, - "step": 82154 - }, - { - "epoch": 2.11, - "learning_rate": 4.309984525295798e-07, - "loss": 0.439, - "step": 82155 - }, - { - "epoch": 2.11, - "learning_rate": 4.309756983245514e-07, - "loss": 0.335, - "step": 82156 - }, - { - "epoch": 2.11, - "learning_rate": 4.309529445551987e-07, - "loss": 0.3657, - "step": 82157 - }, - { - "epoch": 2.11, - "learning_rate": 4.3093019122153915e-07, - "loss": 0.4861, - "step": 82158 - }, - { - "epoch": 2.11, - "learning_rate": 4.309074383235906e-07, - "loss": 0.499, - "step": 82159 - }, - { - "epoch": 2.11, - "learning_rate": 4.308846858613696e-07, - "loss": 0.38, - "step": 82160 - }, - { - "epoch": 2.11, - "learning_rate": 4.3086193383489444e-07, - "loss": 0.3828, - "step": 82161 - }, - { - "epoch": 2.11, - "learning_rate": 4.308391822441818e-07, - "loss": 0.4683, - "step": 82162 - }, - { - "epoch": 2.11, - "learning_rate": 4.308164310892497e-07, - "loss": 0.3556, - "step": 82163 - }, - { - "epoch": 2.11, - "learning_rate": 4.30793680370115e-07, - "loss": 0.2393, - "step": 82164 - }, - { - "epoch": 2.11, - "learning_rate": 4.3077093008679544e-07, - "loss": 0.2894, - "step": 82165 - }, - { - "epoch": 2.11, - "learning_rate": 4.307481802393084e-07, - "loss": 0.3464, - "step": 82166 - }, - { - "epoch": 2.11, - "learning_rate": 4.3072543082767156e-07, - "loss": 0.4341, - "step": 82167 - }, - { - "epoch": 2.11, - "learning_rate": 4.3070268185190174e-07, - "loss": 0.3445, - "step": 82168 - }, - { - "epoch": 2.11, - "learning_rate": 4.3067993331201677e-07, - "loss": 0.4497, - "step": 82169 - }, - { - "epoch": 2.11, - "learning_rate": 4.3065718520803396e-07, - "loss": 0.3394, - "step": 82170 - }, - { - "epoch": 2.11, - "learning_rate": 4.306344375399712e-07, - "loss": 0.3813, - "step": 82171 - }, - { - "epoch": 2.11, - "learning_rate": 4.306116903078454e-07, - "loss": 0.3016, - "step": 82172 - }, - { - "epoch": 2.11, - "learning_rate": 4.305889435116736e-07, - "loss": 0.6045, - "step": 82173 - }, - { - "epoch": 2.11, - "learning_rate": 4.305661971514738e-07, - "loss": 0.4575, - "step": 82174 - }, - { - "epoch": 2.11, - "learning_rate": 4.305434512272632e-07, - "loss": 0.5288, - "step": 82175 - }, - { - "epoch": 2.11, - "learning_rate": 4.3052070573905973e-07, - "loss": 0.5366, - "step": 82176 - }, - { - "epoch": 2.11, - "learning_rate": 4.3049796068687994e-07, - "loss": 0.3804, - "step": 82177 - }, - { - "epoch": 2.11, - "learning_rate": 4.304752160707418e-07, - "loss": 0.4443, - "step": 82178 - }, - { - "epoch": 2.11, - "learning_rate": 4.3045247189066246e-07, - "loss": 0.5044, - "step": 82179 - }, - { - "epoch": 2.11, - "learning_rate": 4.304297281466599e-07, - "loss": 0.3955, - "step": 82180 - }, - { - "epoch": 2.11, - "learning_rate": 4.3040698483875105e-07, - "loss": 0.4307, - "step": 82181 - }, - { - "epoch": 2.11, - "learning_rate": 4.303842419669531e-07, - "loss": 0.3475, - "step": 82182 - }, - { - "epoch": 2.11, - "learning_rate": 4.3036149953128366e-07, - "loss": 0.3716, - "step": 82183 - }, - { - "epoch": 2.11, - "learning_rate": 4.3033875753176063e-07, - "loss": 0.5103, - "step": 82184 - }, - { - "epoch": 2.11, - "learning_rate": 4.303160159684007e-07, - "loss": 0.4011, - "step": 82185 - }, - { - "epoch": 2.11, - "learning_rate": 4.302932748412216e-07, - "loss": 0.3867, - "step": 82186 - }, - { - "epoch": 2.11, - "learning_rate": 4.302705341502406e-07, - "loss": 0.4341, - "step": 82187 - }, - { - "epoch": 2.11, - "learning_rate": 4.3024779389547573e-07, - "loss": 0.4673, - "step": 82188 - }, - { - "epoch": 2.11, - "learning_rate": 4.3022505407694353e-07, - "loss": 0.4272, - "step": 82189 - }, - { - "epoch": 2.11, - "learning_rate": 4.3020231469466184e-07, - "loss": 0.3938, - "step": 82190 - }, - { - "epoch": 2.11, - "learning_rate": 4.301795757486485e-07, - "loss": 0.4219, - "step": 82191 - }, - { - "epoch": 2.11, - "learning_rate": 4.3015683723891993e-07, - "loss": 0.3213, - "step": 82192 - }, - { - "epoch": 2.11, - "learning_rate": 4.3013409916549446e-07, - "loss": 0.394, - "step": 82193 - }, - { - "epoch": 2.11, - "learning_rate": 4.301113615283888e-07, - "loss": 0.4829, - "step": 82194 - }, - { - "epoch": 2.11, - "learning_rate": 4.300886243276206e-07, - "loss": 0.4355, - "step": 82195 - }, - { - "epoch": 2.11, - "learning_rate": 4.300658875632074e-07, - "loss": 0.3472, - "step": 82196 - }, - { - "epoch": 2.11, - "learning_rate": 4.300431512351669e-07, - "loss": 0.3687, - "step": 82197 - }, - { - "epoch": 2.11, - "learning_rate": 4.3002041534351575e-07, - "loss": 0.4678, - "step": 82198 - }, - { - "epoch": 2.11, - "learning_rate": 4.2999767988827187e-07, - "loss": 0.3406, - "step": 82199 - }, - { - "epoch": 2.11, - "learning_rate": 4.2997494486945276e-07, - "loss": 0.2095, - "step": 82200 - }, - { - "epoch": 2.11, - "learning_rate": 4.2995221028707575e-07, - "loss": 0.4009, - "step": 82201 - }, - { - "epoch": 2.11, - "learning_rate": 4.299294761411576e-07, - "loss": 0.3246, - "step": 82202 - }, - { - "epoch": 2.11, - "learning_rate": 4.2990674243171644e-07, - "loss": 0.3227, - "step": 82203 - }, - { - "epoch": 2.11, - "learning_rate": 4.298840091587693e-07, - "loss": 0.4741, - "step": 82204 - }, - { - "epoch": 2.11, - "learning_rate": 4.2986127632233424e-07, - "loss": 0.4648, - "step": 82205 - }, - { - "epoch": 2.11, - "learning_rate": 4.298385439224278e-07, - "loss": 0.4739, - "step": 82206 - }, - { - "epoch": 2.11, - "learning_rate": 4.298158119590677e-07, - "loss": 0.3182, - "step": 82207 - }, - { - "epoch": 2.11, - "learning_rate": 4.2979308043227145e-07, - "loss": 0.4165, - "step": 82208 - }, - { - "epoch": 2.11, - "learning_rate": 4.297703493420568e-07, - "loss": 0.355, - "step": 82209 - }, - { - "epoch": 2.11, - "learning_rate": 4.2974761868844046e-07, - "loss": 0.4502, - "step": 82210 - }, - { - "epoch": 2.11, - "learning_rate": 4.297248884714404e-07, - "loss": 0.3701, - "step": 82211 - }, - { - "epoch": 2.11, - "learning_rate": 4.297021586910735e-07, - "loss": 0.3657, - "step": 82212 - }, - { - "epoch": 2.11, - "learning_rate": 4.2967942934735737e-07, - "loss": 0.4094, - "step": 82213 - }, - { - "epoch": 2.11, - "learning_rate": 4.296567004403099e-07, - "loss": 0.3279, - "step": 82214 - }, - { - "epoch": 2.11, - "learning_rate": 4.2963397196994767e-07, - "loss": 0.4282, - "step": 82215 - }, - { - "epoch": 2.11, - "learning_rate": 4.2961124393628846e-07, - "loss": 0.375, - "step": 82216 - }, - { - "epoch": 2.11, - "learning_rate": 4.2958851633935013e-07, - "loss": 0.4253, - "step": 82217 - }, - { - "epoch": 2.11, - "learning_rate": 4.295657891791492e-07, - "loss": 0.3381, - "step": 82218 - }, - { - "epoch": 2.11, - "learning_rate": 4.295430624557036e-07, - "loss": 0.3972, - "step": 82219 - }, - { - "epoch": 2.11, - "learning_rate": 4.295203361690305e-07, - "loss": 0.4104, - "step": 82220 - }, - { - "epoch": 2.11, - "learning_rate": 4.2949761031914797e-07, - "loss": 0.4307, - "step": 82221 - }, - { - "epoch": 2.11, - "learning_rate": 4.2947488490607276e-07, - "loss": 0.4937, - "step": 82222 - }, - { - "epoch": 2.11, - "learning_rate": 4.294521599298222e-07, - "loss": 0.4873, - "step": 82223 - }, - { - "epoch": 2.11, - "learning_rate": 4.2942943539041375e-07, - "loss": 0.3152, - "step": 82224 - }, - { - "epoch": 2.11, - "learning_rate": 4.29406711287865e-07, - "loss": 0.4071, - "step": 82225 - }, - { - "epoch": 2.11, - "learning_rate": 4.293839876221936e-07, - "loss": 0.4165, - "step": 82226 - }, - { - "epoch": 2.11, - "learning_rate": 4.2936126439341637e-07, - "loss": 0.439, - "step": 82227 - }, - { - "epoch": 2.11, - "learning_rate": 4.293385416015509e-07, - "loss": 0.4189, - "step": 82228 - }, - { - "epoch": 2.11, - "learning_rate": 4.2931581924661466e-07, - "loss": 0.3992, - "step": 82229 - }, - { - "epoch": 2.11, - "learning_rate": 4.292930973286255e-07, - "loss": 0.3171, - "step": 82230 - }, - { - "epoch": 2.11, - "learning_rate": 4.2927037584760026e-07, - "loss": 0.4075, - "step": 82231 - }, - { - "epoch": 2.11, - "learning_rate": 4.292476548035562e-07, - "loss": 0.3381, - "step": 82232 - }, - { - "epoch": 2.11, - "learning_rate": 4.2922493419651093e-07, - "loss": 0.4492, - "step": 82233 - }, - { - "epoch": 2.11, - "learning_rate": 4.2920221402648226e-07, - "loss": 0.2314, - "step": 82234 - }, - { - "epoch": 2.11, - "learning_rate": 4.2917949429348686e-07, - "loss": 0.3567, - "step": 82235 - }, - { - "epoch": 2.11, - "learning_rate": 4.2915677499754245e-07, - "loss": 0.4199, - "step": 82236 - }, - { - "epoch": 2.11, - "learning_rate": 4.2913405613866636e-07, - "loss": 0.4517, - "step": 82237 - }, - { - "epoch": 2.11, - "learning_rate": 4.291113377168766e-07, - "loss": 0.4485, - "step": 82238 - }, - { - "epoch": 2.11, - "learning_rate": 4.290886197321896e-07, - "loss": 0.502, - "step": 82239 - }, - { - "epoch": 2.11, - "learning_rate": 4.2906590218462314e-07, - "loss": 0.4014, - "step": 82240 - }, - { - "epoch": 2.11, - "learning_rate": 4.290431850741951e-07, - "loss": 0.4707, - "step": 82241 - }, - { - "epoch": 2.11, - "learning_rate": 4.29020468400922e-07, - "loss": 0.519, - "step": 82242 - }, - { - "epoch": 2.11, - "learning_rate": 4.2899775216482217e-07, - "loss": 0.3723, - "step": 82243 - }, - { - "epoch": 2.11, - "learning_rate": 4.2897503636591205e-07, - "loss": 0.4401, - "step": 82244 - }, - { - "epoch": 2.11, - "learning_rate": 4.289523210042094e-07, - "loss": 0.4722, - "step": 82245 - }, - { - "epoch": 2.11, - "learning_rate": 4.289296060797318e-07, - "loss": 0.4004, - "step": 82246 - }, - { - "epoch": 2.11, - "learning_rate": 4.2890689159249694e-07, - "loss": 0.4175, - "step": 82247 - }, - { - "epoch": 2.11, - "learning_rate": 4.288841775425215e-07, - "loss": 0.4297, - "step": 82248 - }, - { - "epoch": 2.11, - "learning_rate": 4.28861463929823e-07, - "loss": 0.4497, - "step": 82249 - }, - { - "epoch": 2.11, - "learning_rate": 4.288387507544192e-07, - "loss": 0.314, - "step": 82250 - }, - { - "epoch": 2.11, - "learning_rate": 4.288160380163276e-07, - "loss": 0.3215, - "step": 82251 - }, - { - "epoch": 2.11, - "learning_rate": 4.2879332571556524e-07, - "loss": 0.3999, - "step": 82252 - }, - { - "epoch": 2.11, - "learning_rate": 4.287706138521493e-07, - "loss": 0.4292, - "step": 82253 - }, - { - "epoch": 2.11, - "learning_rate": 4.2874790242609737e-07, - "loss": 0.3955, - "step": 82254 - }, - { - "epoch": 2.11, - "learning_rate": 4.2872519143742727e-07, - "loss": 0.5166, - "step": 82255 - }, - { - "epoch": 2.11, - "learning_rate": 4.2870248088615567e-07, - "loss": 0.2712, - "step": 82256 - }, - { - "epoch": 2.11, - "learning_rate": 4.286797707723002e-07, - "loss": 0.4531, - "step": 82257 - }, - { - "epoch": 2.11, - "learning_rate": 4.286570610958785e-07, - "loss": 0.4668, - "step": 82258 - }, - { - "epoch": 2.11, - "learning_rate": 4.2863435185690824e-07, - "loss": 0.3813, - "step": 82259 - }, - { - "epoch": 2.11, - "learning_rate": 4.2861164305540586e-07, - "loss": 0.4678, - "step": 82260 - }, - { - "epoch": 2.11, - "learning_rate": 4.285889346913897e-07, - "loss": 0.3442, - "step": 82261 - }, - { - "epoch": 2.11, - "learning_rate": 4.285662267648764e-07, - "loss": 0.4575, - "step": 82262 - }, - { - "epoch": 2.11, - "learning_rate": 4.285435192758836e-07, - "loss": 0.5356, - "step": 82263 - }, - { - "epoch": 2.11, - "learning_rate": 4.2852081222442917e-07, - "loss": 0.3396, - "step": 82264 - }, - { - "epoch": 2.11, - "learning_rate": 4.2849810561052966e-07, - "loss": 0.2955, - "step": 82265 - }, - { - "epoch": 2.11, - "learning_rate": 4.284753994342029e-07, - "loss": 0.46, - "step": 82266 - }, - { - "epoch": 2.11, - "learning_rate": 4.284526936954662e-07, - "loss": 0.2488, - "step": 82267 - }, - { - "epoch": 2.11, - "learning_rate": 4.284299883943374e-07, - "loss": 0.4346, - "step": 82268 - }, - { - "epoch": 2.11, - "learning_rate": 4.284072835308331e-07, - "loss": 0.5625, - "step": 82269 - }, - { - "epoch": 2.11, - "learning_rate": 4.2838457910497117e-07, - "loss": 0.4443, - "step": 82270 - }, - { - "epoch": 2.11, - "learning_rate": 4.2836187511676913e-07, - "loss": 0.4163, - "step": 82271 - }, - { - "epoch": 2.11, - "learning_rate": 4.283391715662441e-07, - "loss": 0.3682, - "step": 82272 - }, - { - "epoch": 2.11, - "learning_rate": 4.283164684534132e-07, - "loss": 0.438, - "step": 82273 - }, - { - "epoch": 2.11, - "learning_rate": 4.2829376577829403e-07, - "loss": 0.3813, - "step": 82274 - }, - { - "epoch": 2.11, - "learning_rate": 4.28271063540904e-07, - "loss": 0.4897, - "step": 82275 - }, - { - "epoch": 2.11, - "learning_rate": 4.28248361741261e-07, - "loss": 0.4458, - "step": 82276 - }, - { - "epoch": 2.11, - "learning_rate": 4.2822566037938145e-07, - "loss": 0.3389, - "step": 82277 - }, - { - "epoch": 2.11, - "learning_rate": 4.282029594552833e-07, - "loss": 0.4331, - "step": 82278 - }, - { - "epoch": 2.11, - "learning_rate": 4.2818025896898393e-07, - "loss": 0.4519, - "step": 82279 - }, - { - "epoch": 2.11, - "learning_rate": 4.2815755892050085e-07, - "loss": 0.2495, - "step": 82280 - }, - { - "epoch": 2.11, - "learning_rate": 4.281348593098513e-07, - "loss": 0.4526, - "step": 82281 - }, - { - "epoch": 2.11, - "learning_rate": 4.281121601370522e-07, - "loss": 0.406, - "step": 82282 - }, - { - "epoch": 2.11, - "learning_rate": 4.2808946140212145e-07, - "loss": 0.3585, - "step": 82283 - }, - { - "epoch": 2.11, - "learning_rate": 4.280667631050762e-07, - "loss": 0.4961, - "step": 82284 - }, - { - "epoch": 2.11, - "learning_rate": 4.2804406524593426e-07, - "loss": 0.4214, - "step": 82285 - }, - { - "epoch": 2.11, - "learning_rate": 4.2802136782471233e-07, - "loss": 0.2615, - "step": 82286 - }, - { - "epoch": 2.11, - "learning_rate": 4.2799867084142814e-07, - "loss": 0.3612, - "step": 82287 - }, - { - "epoch": 2.11, - "learning_rate": 4.279759742960991e-07, - "loss": 0.4482, - "step": 82288 - }, - { - "epoch": 2.11, - "learning_rate": 4.279532781887429e-07, - "loss": 0.415, - "step": 82289 - }, - { - "epoch": 2.11, - "learning_rate": 4.279305825193763e-07, - "loss": 0.4771, - "step": 82290 - }, - { - "epoch": 2.11, - "learning_rate": 4.279078872880172e-07, - "loss": 0.3945, - "step": 82291 - }, - { - "epoch": 2.11, - "learning_rate": 4.2788519249468247e-07, - "loss": 0.4482, - "step": 82292 - }, - { - "epoch": 2.11, - "learning_rate": 4.2786249813939e-07, - "loss": 0.1985, - "step": 82293 - }, - { - "epoch": 2.11, - "learning_rate": 4.278398042221566e-07, - "loss": 0.3542, - "step": 82294 - }, - { - "epoch": 2.11, - "learning_rate": 4.2781711074299986e-07, - "loss": 0.324, - "step": 82295 - }, - { - "epoch": 2.11, - "learning_rate": 4.2779441770193734e-07, - "loss": 0.3618, - "step": 82296 - }, - { - "epoch": 2.11, - "learning_rate": 4.2777172509898663e-07, - "loss": 0.3418, - "step": 82297 - }, - { - "epoch": 2.11, - "learning_rate": 4.277490329341645e-07, - "loss": 0.4258, - "step": 82298 - }, - { - "epoch": 2.11, - "learning_rate": 4.277263412074885e-07, - "loss": 0.3887, - "step": 82299 - }, - { - "epoch": 2.11, - "learning_rate": 4.277036499189763e-07, - "loss": 0.5103, - "step": 82300 - }, - { - "epoch": 2.11, - "learning_rate": 4.276809590686453e-07, - "loss": 0.3403, - "step": 82301 - }, - { - "epoch": 2.11, - "learning_rate": 4.2765826865651276e-07, - "loss": 0.3159, - "step": 82302 - }, - { - "epoch": 2.11, - "learning_rate": 4.276355786825957e-07, - "loss": 0.3525, - "step": 82303 - }, - { - "epoch": 2.11, - "learning_rate": 4.276128891469116e-07, - "loss": 0.4927, - "step": 82304 - }, - { - "epoch": 2.11, - "learning_rate": 4.275902000494781e-07, - "loss": 0.4536, - "step": 82305 - }, - { - "epoch": 2.11, - "learning_rate": 4.2756751139031276e-07, - "loss": 0.4155, - "step": 82306 - }, - { - "epoch": 2.11, - "learning_rate": 4.275448231694323e-07, - "loss": 0.4399, - "step": 82307 - }, - { - "epoch": 2.11, - "learning_rate": 4.275221353868544e-07, - "loss": 0.3555, - "step": 82308 - }, - { - "epoch": 2.11, - "learning_rate": 4.2749944804259696e-07, - "loss": 0.4307, - "step": 82309 - }, - { - "epoch": 2.11, - "learning_rate": 4.274767611366764e-07, - "loss": 0.4355, - "step": 82310 - }, - { - "epoch": 2.11, - "learning_rate": 4.2745407466911096e-07, - "loss": 0.3843, - "step": 82311 - }, - { - "epoch": 2.11, - "learning_rate": 4.2743138863991726e-07, - "loss": 0.4209, - "step": 82312 - }, - { - "epoch": 2.11, - "learning_rate": 4.2740870304911303e-07, - "loss": 0.3867, - "step": 82313 - }, - { - "epoch": 2.11, - "learning_rate": 4.273860178967159e-07, - "loss": 0.4438, - "step": 82314 - }, - { - "epoch": 2.11, - "learning_rate": 4.2736333318274276e-07, - "loss": 0.5005, - "step": 82315 - }, - { - "epoch": 2.11, - "learning_rate": 4.27340648907211e-07, - "loss": 0.312, - "step": 82316 - }, - { - "epoch": 2.11, - "learning_rate": 4.2731796507013827e-07, - "loss": 0.3936, - "step": 82317 - }, - { - "epoch": 2.11, - "learning_rate": 4.272952816715423e-07, - "loss": 0.4351, - "step": 82318 - }, - { - "epoch": 2.11, - "learning_rate": 4.272725987114395e-07, - "loss": 0.4624, - "step": 82319 - }, - { - "epoch": 2.11, - "learning_rate": 4.2724991618984775e-07, - "loss": 0.3962, - "step": 82320 - }, - { - "epoch": 2.11, - "learning_rate": 4.2722723410678483e-07, - "loss": 0.6025, - "step": 82321 - }, - { - "epoch": 2.11, - "learning_rate": 4.272045524622673e-07, - "loss": 0.3618, - "step": 82322 - }, - { - "epoch": 2.11, - "learning_rate": 4.2718187125631323e-07, - "loss": 0.4673, - "step": 82323 - }, - { - "epoch": 2.11, - "learning_rate": 4.2715919048893933e-07, - "loss": 0.4604, - "step": 82324 - }, - { - "epoch": 2.11, - "learning_rate": 4.271365101601633e-07, - "loss": 0.4336, - "step": 82325 - }, - { - "epoch": 2.11, - "learning_rate": 4.271138302700028e-07, - "loss": 0.3345, - "step": 82326 - }, - { - "epoch": 2.11, - "learning_rate": 4.270911508184746e-07, - "loss": 0.3916, - "step": 82327 - }, - { - "epoch": 2.11, - "learning_rate": 4.2706847180559634e-07, - "loss": 0.4336, - "step": 82328 - }, - { - "epoch": 2.11, - "learning_rate": 4.2704579323138546e-07, - "loss": 0.3467, - "step": 82329 - }, - { - "epoch": 2.11, - "learning_rate": 4.2702311509585956e-07, - "loss": 0.4902, - "step": 82330 - }, - { - "epoch": 2.11, - "learning_rate": 4.270004373990357e-07, - "loss": 0.4907, - "step": 82331 - }, - { - "epoch": 2.11, - "learning_rate": 4.26977760140931e-07, - "loss": 0.396, - "step": 82332 - }, - { - "epoch": 2.11, - "learning_rate": 4.2695508332156294e-07, - "loss": 0.4751, - "step": 82333 - }, - { - "epoch": 2.11, - "learning_rate": 4.269324069409491e-07, - "loss": 0.4287, - "step": 82334 - }, - { - "epoch": 2.11, - "learning_rate": 4.269097309991072e-07, - "loss": 0.4277, - "step": 82335 - }, - { - "epoch": 2.11, - "learning_rate": 4.2688705549605377e-07, - "loss": 0.4529, - "step": 82336 - }, - { - "epoch": 2.11, - "learning_rate": 4.268643804318065e-07, - "loss": 0.4263, - "step": 82337 - }, - { - "epoch": 2.11, - "learning_rate": 4.268417058063828e-07, - "loss": 0.3345, - "step": 82338 - }, - { - "epoch": 2.11, - "learning_rate": 4.2681903161980046e-07, - "loss": 0.3936, - "step": 82339 - }, - { - "epoch": 2.11, - "learning_rate": 4.267963578720761e-07, - "loss": 0.4219, - "step": 82340 - }, - { - "epoch": 2.11, - "learning_rate": 4.267736845632278e-07, - "loss": 0.3854, - "step": 82341 - }, - { - "epoch": 2.11, - "learning_rate": 4.267510116932721e-07, - "loss": 0.4102, - "step": 82342 - }, - { - "epoch": 2.11, - "learning_rate": 4.267283392622272e-07, - "loss": 0.6729, - "step": 82343 - }, - { - "epoch": 2.11, - "learning_rate": 4.267056672701097e-07, - "loss": 0.3865, - "step": 82344 - }, - { - "epoch": 2.11, - "learning_rate": 4.2668299571693723e-07, - "loss": 0.4277, - "step": 82345 - }, - { - "epoch": 2.11, - "learning_rate": 4.2666032460272725e-07, - "loss": 0.4351, - "step": 82346 - }, - { - "epoch": 2.11, - "learning_rate": 4.266376539274975e-07, - "loss": 0.3555, - "step": 82347 - }, - { - "epoch": 2.11, - "learning_rate": 4.266149836912646e-07, - "loss": 0.3401, - "step": 82348 - }, - { - "epoch": 2.11, - "learning_rate": 4.2659231389404617e-07, - "loss": 0.4331, - "step": 82349 - }, - { - "epoch": 2.11, - "learning_rate": 4.2656964453585964e-07, - "loss": 0.3652, - "step": 82350 - }, - { - "epoch": 2.11, - "learning_rate": 4.2654697561672284e-07, - "loss": 0.458, - "step": 82351 - }, - { - "epoch": 2.11, - "learning_rate": 4.2652430713665256e-07, - "loss": 0.405, - "step": 82352 - }, - { - "epoch": 2.11, - "learning_rate": 4.2650163909566584e-07, - "loss": 0.4678, - "step": 82353 - }, - { - "epoch": 2.11, - "learning_rate": 4.264789714937805e-07, - "loss": 0.4399, - "step": 82354 - }, - { - "epoch": 2.11, - "learning_rate": 4.2645630433101387e-07, - "loss": 0.4202, - "step": 82355 - }, - { - "epoch": 2.11, - "learning_rate": 4.264336376073836e-07, - "loss": 0.3535, - "step": 82356 - }, - { - "epoch": 2.11, - "learning_rate": 4.2641097132290637e-07, - "loss": 0.2379, - "step": 82357 - }, - { - "epoch": 2.11, - "learning_rate": 4.2638830547759983e-07, - "loss": 0.392, - "step": 82358 - }, - { - "epoch": 2.11, - "learning_rate": 4.2636564007148147e-07, - "loss": 0.3994, - "step": 82359 - }, - { - "epoch": 2.11, - "learning_rate": 4.2634297510456895e-07, - "loss": 0.3877, - "step": 82360 - }, - { - "epoch": 2.11, - "learning_rate": 4.2632031057687913e-07, - "loss": 0.385, - "step": 82361 - }, - { - "epoch": 2.11, - "learning_rate": 4.2629764648842914e-07, - "loss": 0.3916, - "step": 82362 - }, - { - "epoch": 2.11, - "learning_rate": 4.262749828392367e-07, - "loss": 0.4614, - "step": 82363 - }, - { - "epoch": 2.11, - "learning_rate": 4.2625231962931953e-07, - "loss": 0.4102, - "step": 82364 - }, - { - "epoch": 2.11, - "learning_rate": 4.2622965685869415e-07, - "loss": 0.3474, - "step": 82365 - }, - { - "epoch": 2.11, - "learning_rate": 4.262069945273783e-07, - "loss": 0.3238, - "step": 82366 - }, - { - "epoch": 2.11, - "learning_rate": 4.2618433263538944e-07, - "loss": 0.2572, - "step": 82367 - }, - { - "epoch": 2.11, - "learning_rate": 4.2616167118274516e-07, - "loss": 0.4395, - "step": 82368 - }, - { - "epoch": 2.11, - "learning_rate": 4.2613901016946216e-07, - "loss": 0.4028, - "step": 82369 - }, - { - "epoch": 2.11, - "learning_rate": 4.261163495955582e-07, - "loss": 0.4736, - "step": 82370 - }, - { - "epoch": 2.11, - "learning_rate": 4.2609368946105085e-07, - "loss": 0.4302, - "step": 82371 - }, - { - "epoch": 2.11, - "learning_rate": 4.260710297659568e-07, - "loss": 0.4009, - "step": 82372 - }, - { - "epoch": 2.11, - "learning_rate": 4.260483705102942e-07, - "loss": 0.3955, - "step": 82373 - }, - { - "epoch": 2.11, - "learning_rate": 4.260257116940795e-07, - "loss": 0.3794, - "step": 82374 - }, - { - "epoch": 2.11, - "learning_rate": 4.2600305331733066e-07, - "loss": 0.4331, - "step": 82375 - }, - { - "epoch": 2.11, - "learning_rate": 4.259803953800648e-07, - "loss": 0.448, - "step": 82376 - }, - { - "epoch": 2.11, - "learning_rate": 4.2595773788229973e-07, - "loss": 0.4268, - "step": 82377 - }, - { - "epoch": 2.11, - "learning_rate": 4.2593508082405205e-07, - "loss": 0.3442, - "step": 82378 - }, - { - "epoch": 2.11, - "learning_rate": 4.2591242420533957e-07, - "loss": 0.4487, - "step": 82379 - }, - { - "epoch": 2.11, - "learning_rate": 4.258897680261798e-07, - "loss": 0.4169, - "step": 82380 - }, - { - "epoch": 2.11, - "learning_rate": 4.258671122865899e-07, - "loss": 0.4639, - "step": 82381 - }, - { - "epoch": 2.11, - "learning_rate": 4.258444569865868e-07, - "loss": 0.3979, - "step": 82382 - }, - { - "epoch": 2.11, - "learning_rate": 4.258218021261881e-07, - "loss": 0.3135, - "step": 82383 - }, - { - "epoch": 2.11, - "learning_rate": 4.2579914770541136e-07, - "loss": 0.3531, - "step": 82384 - }, - { - "epoch": 2.11, - "learning_rate": 4.2577649372427413e-07, - "loss": 0.3779, - "step": 82385 - }, - { - "epoch": 2.11, - "learning_rate": 4.2575384018279317e-07, - "loss": 0.4834, - "step": 82386 - }, - { - "epoch": 2.11, - "learning_rate": 4.257311870809859e-07, - "loss": 0.363, - "step": 82387 - }, - { - "epoch": 2.11, - "learning_rate": 4.2570853441887e-07, - "loss": 0.5117, - "step": 82388 - }, - { - "epoch": 2.11, - "learning_rate": 4.25685882196463e-07, - "loss": 0.4155, - "step": 82389 - }, - { - "epoch": 2.11, - "learning_rate": 4.256632304137815e-07, - "loss": 0.377, - "step": 82390 - }, - { - "epoch": 2.11, - "learning_rate": 4.256405790708436e-07, - "loss": 0.4229, - "step": 82391 - }, - { - "epoch": 2.11, - "learning_rate": 4.2561792816766607e-07, - "loss": 0.2994, - "step": 82392 - }, - { - "epoch": 2.11, - "learning_rate": 4.255952777042664e-07, - "loss": 0.2295, - "step": 82393 - }, - { - "epoch": 2.11, - "learning_rate": 4.2557262768066225e-07, - "loss": 0.4648, - "step": 82394 - }, - { - "epoch": 2.11, - "learning_rate": 4.255499780968705e-07, - "loss": 0.3738, - "step": 82395 - }, - { - "epoch": 2.11, - "learning_rate": 4.2552732895290875e-07, - "loss": 0.376, - "step": 82396 - }, - { - "epoch": 2.11, - "learning_rate": 4.255046802487946e-07, - "loss": 0.3405, - "step": 82397 - }, - { - "epoch": 2.11, - "learning_rate": 4.254820319845448e-07, - "loss": 0.4175, - "step": 82398 - }, - { - "epoch": 2.11, - "learning_rate": 4.254593841601769e-07, - "loss": 0.4636, - "step": 82399 - }, - { - "epoch": 2.11, - "learning_rate": 4.254367367757085e-07, - "loss": 0.4346, - "step": 82400 - }, - { - "epoch": 2.11, - "learning_rate": 4.25414089831157e-07, - "loss": 0.2913, - "step": 82401 - }, - { - "epoch": 2.11, - "learning_rate": 4.2539144332653953e-07, - "loss": 0.3589, - "step": 82402 - }, - { - "epoch": 2.11, - "learning_rate": 4.2536879726187303e-07, - "loss": 0.5571, - "step": 82403 - }, - { - "epoch": 2.11, - "learning_rate": 4.2534615163717524e-07, - "loss": 0.4297, - "step": 82404 - }, - { - "epoch": 2.11, - "learning_rate": 4.253235064524635e-07, - "loss": 0.4033, - "step": 82405 - }, - { - "epoch": 2.11, - "learning_rate": 4.2530086170775546e-07, - "loss": 0.4277, - "step": 82406 - }, - { - "epoch": 2.11, - "learning_rate": 4.2527821740306767e-07, - "loss": 0.4966, - "step": 82407 - }, - { - "epoch": 2.11, - "learning_rate": 4.252555735384181e-07, - "loss": 0.4375, - "step": 82408 - }, - { - "epoch": 2.11, - "learning_rate": 4.2523293011382375e-07, - "loss": 0.4043, - "step": 82409 - }, - { - "epoch": 2.11, - "learning_rate": 4.252102871293026e-07, - "loss": 0.5044, - "step": 82410 - }, - { - "epoch": 2.11, - "learning_rate": 4.251876445848715e-07, - "loss": 0.3638, - "step": 82411 - }, - { - "epoch": 2.11, - "learning_rate": 4.2516500248054743e-07, - "loss": 0.3665, - "step": 82412 - }, - { - "epoch": 2.11, - "learning_rate": 4.25142360816348e-07, - "loss": 0.4395, - "step": 82413 - }, - { - "epoch": 2.11, - "learning_rate": 4.2511971959229067e-07, - "loss": 0.4297, - "step": 82414 - }, - { - "epoch": 2.11, - "learning_rate": 4.2509707880839316e-07, - "loss": 0.302, - "step": 82415 - }, - { - "epoch": 2.11, - "learning_rate": 4.2507443846467194e-07, - "loss": 0.417, - "step": 82416 - }, - { - "epoch": 2.11, - "learning_rate": 4.250517985611448e-07, - "loss": 0.4478, - "step": 82417 - }, - { - "epoch": 2.11, - "learning_rate": 4.2502915909782945e-07, - "loss": 0.5928, - "step": 82418 - }, - { - "epoch": 2.11, - "learning_rate": 4.2500652007474245e-07, - "loss": 0.4917, - "step": 82419 - }, - { - "epoch": 2.11, - "learning_rate": 4.2498388149190155e-07, - "loss": 0.4224, - "step": 82420 - }, - { - "epoch": 2.11, - "learning_rate": 4.2496124334932435e-07, - "loss": 0.415, - "step": 82421 - }, - { - "epoch": 2.11, - "learning_rate": 4.249386056470277e-07, - "loss": 0.3621, - "step": 82422 - }, - { - "epoch": 2.11, - "learning_rate": 4.249159683850293e-07, - "loss": 0.4639, - "step": 82423 - }, - { - "epoch": 2.11, - "learning_rate": 4.2489333156334594e-07, - "loss": 0.4131, - "step": 82424 - }, - { - "epoch": 2.11, - "learning_rate": 4.2487069518199535e-07, - "loss": 0.4558, - "step": 82425 - }, - { - "epoch": 2.11, - "learning_rate": 4.2484805924099485e-07, - "loss": 0.502, - "step": 82426 - }, - { - "epoch": 2.11, - "learning_rate": 4.248254237403621e-07, - "loss": 0.345, - "step": 82427 - }, - { - "epoch": 2.11, - "learning_rate": 4.2480278868011366e-07, - "loss": 0.4795, - "step": 82428 - }, - { - "epoch": 2.11, - "learning_rate": 4.2478015406026735e-07, - "loss": 0.3318, - "step": 82429 - }, - { - "epoch": 2.11, - "learning_rate": 4.247575198808404e-07, - "loss": 0.4609, - "step": 82430 - }, - { - "epoch": 2.11, - "learning_rate": 4.247348861418505e-07, - "loss": 0.2961, - "step": 82431 - }, - { - "epoch": 2.11, - "learning_rate": 4.247122528433147e-07, - "loss": 0.4441, - "step": 82432 - }, - { - "epoch": 2.11, - "learning_rate": 4.246896199852499e-07, - "loss": 0.4766, - "step": 82433 - }, - { - "epoch": 2.11, - "learning_rate": 4.2466698756767373e-07, - "loss": 0.3584, - "step": 82434 - }, - { - "epoch": 2.11, - "learning_rate": 4.246443555906041e-07, - "loss": 0.3921, - "step": 82435 - }, - { - "epoch": 2.11, - "learning_rate": 4.246217240540573e-07, - "loss": 0.3612, - "step": 82436 - }, - { - "epoch": 2.11, - "learning_rate": 4.245990929580513e-07, - "loss": 0.3955, - "step": 82437 - }, - { - "epoch": 2.11, - "learning_rate": 4.2457646230260325e-07, - "loss": 0.3787, - "step": 82438 - }, - { - "epoch": 2.11, - "learning_rate": 4.2455383208773096e-07, - "loss": 0.3059, - "step": 82439 - }, - { - "epoch": 2.11, - "learning_rate": 4.2453120231345097e-07, - "loss": 0.2856, - "step": 82440 - }, - { - "epoch": 2.11, - "learning_rate": 4.2450857297978137e-07, - "loss": 0.3103, - "step": 82441 - }, - { - "epoch": 2.11, - "learning_rate": 4.244859440867387e-07, - "loss": 0.4135, - "step": 82442 - }, - { - "epoch": 2.11, - "learning_rate": 4.244633156343407e-07, - "loss": 0.3385, - "step": 82443 - }, - { - "epoch": 2.11, - "learning_rate": 4.2444068762260496e-07, - "loss": 0.4038, - "step": 82444 - }, - { - "epoch": 2.11, - "learning_rate": 4.2441806005154824e-07, - "loss": 0.4487, - "step": 82445 - }, - { - "epoch": 2.11, - "learning_rate": 4.2439543292118805e-07, - "loss": 0.3982, - "step": 82446 - }, - { - "epoch": 2.11, - "learning_rate": 4.243728062315419e-07, - "loss": 0.3901, - "step": 82447 - }, - { - "epoch": 2.11, - "learning_rate": 4.2435017998262733e-07, - "loss": 0.4268, - "step": 82448 - }, - { - "epoch": 2.11, - "learning_rate": 4.243275541744611e-07, - "loss": 0.4883, - "step": 82449 - }, - { - "epoch": 2.11, - "learning_rate": 4.243049288070607e-07, - "loss": 0.3843, - "step": 82450 - }, - { - "epoch": 2.11, - "learning_rate": 4.242823038804439e-07, - "loss": 0.358, - "step": 82451 - }, - { - "epoch": 2.11, - "learning_rate": 4.242596793946277e-07, - "loss": 0.3162, - "step": 82452 - }, - { - "epoch": 2.11, - "learning_rate": 4.2423705534962905e-07, - "loss": 0.4238, - "step": 82453 - }, - { - "epoch": 2.11, - "learning_rate": 4.242144317454656e-07, - "loss": 0.4824, - "step": 82454 - }, - { - "epoch": 2.11, - "learning_rate": 4.2419180858215466e-07, - "loss": 0.4678, - "step": 82455 - }, - { - "epoch": 2.11, - "learning_rate": 4.2416918585971396e-07, - "loss": 0.5044, - "step": 82456 - }, - { - "epoch": 2.11, - "learning_rate": 4.2414656357816004e-07, - "loss": 0.3955, - "step": 82457 - }, - { - "epoch": 2.11, - "learning_rate": 4.2412394173751065e-07, - "loss": 0.5078, - "step": 82458 - }, - { - "epoch": 2.11, - "learning_rate": 4.24101320337783e-07, - "loss": 0.4097, - "step": 82459 - }, - { - "epoch": 2.11, - "learning_rate": 4.24078699378995e-07, - "loss": 0.4746, - "step": 82460 - }, - { - "epoch": 2.11, - "learning_rate": 4.240560788611633e-07, - "loss": 0.4683, - "step": 82461 - }, - { - "epoch": 2.11, - "learning_rate": 4.240334587843052e-07, - "loss": 0.2338, - "step": 82462 - }, - { - "epoch": 2.11, - "learning_rate": 4.2401083914843805e-07, - "loss": 0.3672, - "step": 82463 - }, - { - "epoch": 2.11, - "learning_rate": 4.2398821995357934e-07, - "loss": 0.5132, - "step": 82464 - }, - { - "epoch": 2.11, - "learning_rate": 4.2396560119974676e-07, - "loss": 0.4685, - "step": 82465 - }, - { - "epoch": 2.11, - "learning_rate": 4.2394298288695683e-07, - "loss": 0.4434, - "step": 82466 - }, - { - "epoch": 2.11, - "learning_rate": 4.239203650152273e-07, - "loss": 0.3609, - "step": 82467 - }, - { - "epoch": 2.11, - "learning_rate": 4.238977475845754e-07, - "loss": 0.4001, - "step": 82468 - }, - { - "epoch": 2.11, - "learning_rate": 4.23875130595019e-07, - "loss": 0.4353, - "step": 82469 - }, - { - "epoch": 2.11, - "learning_rate": 4.2385251404657484e-07, - "loss": 0.416, - "step": 82470 - }, - { - "epoch": 2.11, - "learning_rate": 4.2382989793925996e-07, - "loss": 0.4326, - "step": 82471 - }, - { - "epoch": 2.11, - "learning_rate": 4.23807282273092e-07, - "loss": 0.5464, - "step": 82472 - }, - { - "epoch": 2.11, - "learning_rate": 4.237846670480887e-07, - "loss": 0.4585, - "step": 82473 - }, - { - "epoch": 2.11, - "learning_rate": 4.2376205226426667e-07, - "loss": 0.3619, - "step": 82474 - }, - { - "epoch": 2.11, - "learning_rate": 4.2373943792164345e-07, - "loss": 0.3767, - "step": 82475 - }, - { - "epoch": 2.11, - "learning_rate": 4.2371682402023647e-07, - "loss": 0.4595, - "step": 82476 - }, - { - "epoch": 2.11, - "learning_rate": 4.236942105600634e-07, - "loss": 0.3804, - "step": 82477 - }, - { - "epoch": 2.11, - "learning_rate": 4.2367159754114077e-07, - "loss": 0.5088, - "step": 82478 - }, - { - "epoch": 2.11, - "learning_rate": 4.2364898496348646e-07, - "loss": 0.3232, - "step": 82479 - }, - { - "epoch": 2.11, - "learning_rate": 4.236263728271178e-07, - "loss": 0.5439, - "step": 82480 - }, - { - "epoch": 2.11, - "learning_rate": 4.2360376113205163e-07, - "loss": 0.5037, - "step": 82481 - }, - { - "epoch": 2.11, - "learning_rate": 4.2358114987830596e-07, - "loss": 0.5591, - "step": 82482 - }, - { - "epoch": 2.11, - "learning_rate": 4.235585390658972e-07, - "loss": 0.543, - "step": 82483 - }, - { - "epoch": 2.11, - "learning_rate": 4.2353592869484335e-07, - "loss": 0.4888, - "step": 82484 - }, - { - "epoch": 2.11, - "learning_rate": 4.2351331876516137e-07, - "loss": 0.3436, - "step": 82485 - }, - { - "epoch": 2.11, - "learning_rate": 4.2349070927686915e-07, - "loss": 0.4224, - "step": 82486 - }, - { - "epoch": 2.11, - "learning_rate": 4.2346810022998327e-07, - "loss": 0.3716, - "step": 82487 - }, - { - "epoch": 2.11, - "learning_rate": 4.2344549162452126e-07, - "loss": 0.4644, - "step": 82488 - }, - { - "epoch": 2.11, - "learning_rate": 4.2342288346050105e-07, - "loss": 0.3887, - "step": 82489 - }, - { - "epoch": 2.11, - "learning_rate": 4.234002757379392e-07, - "loss": 0.3633, - "step": 82490 - }, - { - "epoch": 2.11, - "learning_rate": 4.233776684568531e-07, - "loss": 0.3521, - "step": 82491 - }, - { - "epoch": 2.11, - "learning_rate": 4.233550616172601e-07, - "loss": 0.4497, - "step": 82492 - }, - { - "epoch": 2.11, - "learning_rate": 4.233324552191776e-07, - "loss": 0.3262, - "step": 82493 - }, - { - "epoch": 2.11, - "learning_rate": 4.2330984926262334e-07, - "loss": 0.5342, - "step": 82494 - }, - { - "epoch": 2.11, - "learning_rate": 4.232872437476138e-07, - "loss": 0.4185, - "step": 82495 - }, - { - "epoch": 2.11, - "learning_rate": 4.2326463867416674e-07, - "loss": 0.4331, - "step": 82496 - }, - { - "epoch": 2.11, - "learning_rate": 4.232420340422994e-07, - "loss": 0.4351, - "step": 82497 - }, - { - "epoch": 2.11, - "learning_rate": 4.2321942985202954e-07, - "loss": 0.3484, - "step": 82498 - }, - { - "epoch": 2.11, - "learning_rate": 4.231968261033736e-07, - "loss": 0.397, - "step": 82499 - }, - { - "epoch": 2.11, - "learning_rate": 4.2317422279634974e-07, - "loss": 0.4541, - "step": 82500 - }, - { - "epoch": 2.11, - "learning_rate": 4.2315161993097447e-07, - "loss": 0.3596, - "step": 82501 - }, - { - "epoch": 2.11, - "learning_rate": 4.2312901750726547e-07, - "loss": 0.4424, - "step": 82502 - }, - { - "epoch": 2.11, - "learning_rate": 4.231064155252404e-07, - "loss": 0.2982, - "step": 82503 - }, - { - "epoch": 2.11, - "learning_rate": 4.230838139849159e-07, - "loss": 0.2219, - "step": 82504 - }, - { - "epoch": 2.11, - "learning_rate": 4.230612128863096e-07, - "loss": 0.3444, - "step": 82505 - }, - { - "epoch": 2.11, - "learning_rate": 4.2303861222943915e-07, - "loss": 0.4009, - "step": 82506 - }, - { - "epoch": 2.11, - "learning_rate": 4.2301601201432113e-07, - "loss": 0.4434, - "step": 82507 - }, - { - "epoch": 2.11, - "learning_rate": 4.229934122409733e-07, - "loss": 0.4351, - "step": 82508 - }, - { - "epoch": 2.11, - "learning_rate": 4.229708129094127e-07, - "loss": 0.4814, - "step": 82509 - }, - { - "epoch": 2.11, - "learning_rate": 4.229482140196573e-07, - "loss": 0.3994, - "step": 82510 - }, - { - "epoch": 2.11, - "learning_rate": 4.229256155717239e-07, - "loss": 0.2307, - "step": 82511 - }, - { - "epoch": 2.11, - "learning_rate": 4.2290301756562954e-07, - "loss": 0.458, - "step": 82512 - }, - { - "epoch": 2.11, - "learning_rate": 4.228804200013917e-07, - "loss": 0.3064, - "step": 82513 - }, - { - "epoch": 2.11, - "learning_rate": 4.228578228790278e-07, - "loss": 0.4512, - "step": 82514 - }, - { - "epoch": 2.11, - "learning_rate": 4.228352261985555e-07, - "loss": 0.3716, - "step": 82515 - }, - { - "epoch": 2.11, - "learning_rate": 4.2281262995999143e-07, - "loss": 0.3789, - "step": 82516 - }, - { - "epoch": 2.11, - "learning_rate": 4.227900341633531e-07, - "loss": 0.3257, - "step": 82517 - }, - { - "epoch": 2.11, - "learning_rate": 4.2276743880865795e-07, - "loss": 0.4104, - "step": 82518 - }, - { - "epoch": 2.12, - "learning_rate": 4.2274484389592356e-07, - "loss": 0.3188, - "step": 82519 - }, - { - "epoch": 2.12, - "learning_rate": 4.22722249425167e-07, - "loss": 0.4751, - "step": 82520 - }, - { - "epoch": 2.12, - "learning_rate": 4.2269965539640497e-07, - "loss": 0.4346, - "step": 82521 - }, - { - "epoch": 2.12, - "learning_rate": 4.2267706180965535e-07, - "loss": 0.2236, - "step": 82522 - }, - { - "epoch": 2.12, - "learning_rate": 4.226544686649357e-07, - "loss": 0.4893, - "step": 82523 - }, - { - "epoch": 2.12, - "learning_rate": 4.2263187596226256e-07, - "loss": 0.438, - "step": 82524 - }, - { - "epoch": 2.12, - "learning_rate": 4.226092837016537e-07, - "loss": 0.3857, - "step": 82525 - }, - { - "epoch": 2.12, - "learning_rate": 4.2258669188312633e-07, - "loss": 0.5234, - "step": 82526 - }, - { - "epoch": 2.12, - "learning_rate": 4.225641005066982e-07, - "loss": 0.4526, - "step": 82527 - }, - { - "epoch": 2.12, - "learning_rate": 4.225415095723858e-07, - "loss": 0.3342, - "step": 82528 - }, - { - "epoch": 2.12, - "learning_rate": 4.2251891908020676e-07, - "loss": 0.3956, - "step": 82529 - }, - { - "epoch": 2.12, - "learning_rate": 4.2249632903017883e-07, - "loss": 0.3711, - "step": 82530 - }, - { - "epoch": 2.12, - "learning_rate": 4.2247373942231857e-07, - "loss": 0.4246, - "step": 82531 - }, - { - "epoch": 2.12, - "learning_rate": 4.22451150256644e-07, - "loss": 0.457, - "step": 82532 - }, - { - "epoch": 2.12, - "learning_rate": 4.2242856153317164e-07, - "loss": 0.4053, - "step": 82533 - }, - { - "epoch": 2.12, - "learning_rate": 4.2240597325191907e-07, - "loss": 0.3503, - "step": 82534 - }, - { - "epoch": 2.12, - "learning_rate": 4.2238338541290384e-07, - "loss": 0.3645, - "step": 82535 - }, - { - "epoch": 2.12, - "learning_rate": 4.2236079801614335e-07, - "loss": 0.4292, - "step": 82536 - }, - { - "epoch": 2.12, - "learning_rate": 4.2233821106165434e-07, - "loss": 0.3848, - "step": 82537 - }, - { - "epoch": 2.12, - "learning_rate": 4.2231562454945433e-07, - "loss": 0.3156, - "step": 82538 - }, - { - "epoch": 2.12, - "learning_rate": 4.222930384795608e-07, - "loss": 0.4399, - "step": 82539 - }, - { - "epoch": 2.12, - "learning_rate": 4.2227045285199146e-07, - "loss": 0.3418, - "step": 82540 - }, - { - "epoch": 2.12, - "learning_rate": 4.222478676667626e-07, - "loss": 0.5522, - "step": 82541 - }, - { - "epoch": 2.12, - "learning_rate": 4.222252829238918e-07, - "loss": 0.4678, - "step": 82542 - }, - { - "epoch": 2.12, - "learning_rate": 4.222026986233965e-07, - "loss": 0.5889, - "step": 82543 - }, - { - "epoch": 2.12, - "learning_rate": 4.2218011476529446e-07, - "loss": 0.214, - "step": 82544 - }, - { - "epoch": 2.12, - "learning_rate": 4.221575313496022e-07, - "loss": 0.3885, - "step": 82545 - }, - { - "epoch": 2.12, - "learning_rate": 4.2213494837633736e-07, - "loss": 0.2524, - "step": 82546 - }, - { - "epoch": 2.12, - "learning_rate": 4.2211236584551725e-07, - "loss": 0.4055, - "step": 82547 - }, - { - "epoch": 2.12, - "learning_rate": 4.220897837571594e-07, - "loss": 0.3539, - "step": 82548 - }, - { - "epoch": 2.12, - "learning_rate": 4.220672021112804e-07, - "loss": 0.4512, - "step": 82549 - }, - { - "epoch": 2.12, - "learning_rate": 4.220446209078985e-07, - "loss": 0.4316, - "step": 82550 - }, - { - "epoch": 2.12, - "learning_rate": 4.2202204014703005e-07, - "loss": 0.2832, - "step": 82551 - }, - { - "epoch": 2.12, - "learning_rate": 4.2199945982869266e-07, - "loss": 0.3761, - "step": 82552 - }, - { - "epoch": 2.12, - "learning_rate": 4.219768799529042e-07, - "loss": 0.4438, - "step": 82553 - }, - { - "epoch": 2.12, - "learning_rate": 4.2195430051968094e-07, - "loss": 0.3273, - "step": 82554 - }, - { - "epoch": 2.12, - "learning_rate": 4.2193172152904086e-07, - "loss": 0.3936, - "step": 82555 - }, - { - "epoch": 2.12, - "learning_rate": 4.21909142981001e-07, - "loss": 0.3618, - "step": 82556 - }, - { - "epoch": 2.12, - "learning_rate": 4.218865648755791e-07, - "loss": 0.4673, - "step": 82557 - }, - { - "epoch": 2.12, - "learning_rate": 4.2186398721279173e-07, - "loss": 0.4302, - "step": 82558 - }, - { - "epoch": 2.12, - "learning_rate": 4.218414099926565e-07, - "loss": 0.4062, - "step": 82559 - }, - { - "epoch": 2.12, - "learning_rate": 4.2181883321519105e-07, - "loss": 0.4521, - "step": 82560 - }, - { - "epoch": 2.12, - "learning_rate": 4.217962568804124e-07, - "loss": 0.4307, - "step": 82561 - }, - { - "epoch": 2.12, - "learning_rate": 4.217736809883373e-07, - "loss": 0.3745, - "step": 82562 - }, - { - "epoch": 2.12, - "learning_rate": 4.2175110553898365e-07, - "loss": 0.4541, - "step": 82563 - }, - { - "epoch": 2.12, - "learning_rate": 4.2172853053236843e-07, - "loss": 0.428, - "step": 82564 - }, - { - "epoch": 2.12, - "learning_rate": 4.2170595596850957e-07, - "loss": 0.3882, - "step": 82565 - }, - { - "epoch": 2.12, - "learning_rate": 4.2168338184742347e-07, - "loss": 0.4478, - "step": 82566 - }, - { - "epoch": 2.12, - "learning_rate": 4.2166080816912786e-07, - "loss": 0.4321, - "step": 82567 - }, - { - "epoch": 2.12, - "learning_rate": 4.216382349336399e-07, - "loss": 0.3508, - "step": 82568 - }, - { - "epoch": 2.12, - "learning_rate": 4.2161566214097733e-07, - "loss": 0.417, - "step": 82569 - }, - { - "epoch": 2.12, - "learning_rate": 4.2159308979115714e-07, - "loss": 0.2996, - "step": 82570 - }, - { - "epoch": 2.12, - "learning_rate": 4.2157051788419605e-07, - "loss": 0.3213, - "step": 82571 - }, - { - "epoch": 2.12, - "learning_rate": 4.215479464201118e-07, - "loss": 0.4243, - "step": 82572 - }, - { - "epoch": 2.12, - "learning_rate": 4.2152537539892176e-07, - "loss": 0.213, - "step": 82573 - }, - { - "epoch": 2.12, - "learning_rate": 4.215028048206435e-07, - "loss": 0.356, - "step": 82574 - }, - { - "epoch": 2.12, - "learning_rate": 4.214802346852936e-07, - "loss": 0.46, - "step": 82575 - }, - { - "epoch": 2.12, - "learning_rate": 4.214576649928897e-07, - "loss": 0.5615, - "step": 82576 - }, - { - "epoch": 2.12, - "learning_rate": 4.214350957434489e-07, - "loss": 0.303, - "step": 82577 - }, - { - "epoch": 2.12, - "learning_rate": 4.2141252693698913e-07, - "loss": 0.3389, - "step": 82578 - }, - { - "epoch": 2.12, - "learning_rate": 4.213899585735269e-07, - "loss": 0.4102, - "step": 82579 - }, - { - "epoch": 2.12, - "learning_rate": 4.2136739065308e-07, - "loss": 0.499, - "step": 82580 - }, - { - "epoch": 2.12, - "learning_rate": 4.213448231756652e-07, - "loss": 0.3623, - "step": 82581 - }, - { - "epoch": 2.12, - "learning_rate": 4.2132225614130034e-07, - "loss": 0.246, - "step": 82582 - }, - { - "epoch": 2.12, - "learning_rate": 4.212996895500022e-07, - "loss": 0.4644, - "step": 82583 - }, - { - "epoch": 2.12, - "learning_rate": 4.2127712340178814e-07, - "loss": 0.364, - "step": 82584 - }, - { - "epoch": 2.12, - "learning_rate": 4.212545576966756e-07, - "loss": 0.2921, - "step": 82585 - }, - { - "epoch": 2.12, - "learning_rate": 4.212319924346822e-07, - "loss": 0.3506, - "step": 82586 - }, - { - "epoch": 2.12, - "learning_rate": 4.2120942761582454e-07, - "loss": 0.4316, - "step": 82587 - }, - { - "epoch": 2.12, - "learning_rate": 4.211868632401202e-07, - "loss": 0.3386, - "step": 82588 - }, - { - "epoch": 2.12, - "learning_rate": 4.2116429930758643e-07, - "loss": 0.3967, - "step": 82589 - }, - { - "epoch": 2.12, - "learning_rate": 4.21141735818241e-07, - "loss": 0.5249, - "step": 82590 - }, - { - "epoch": 2.12, - "learning_rate": 4.211191727721006e-07, - "loss": 0.3345, - "step": 82591 - }, - { - "epoch": 2.12, - "learning_rate": 4.210966101691823e-07, - "loss": 0.397, - "step": 82592 - }, - { - "epoch": 2.12, - "learning_rate": 4.2107404800950373e-07, - "loss": 0.4536, - "step": 82593 - }, - { - "epoch": 2.12, - "learning_rate": 4.2105148629308205e-07, - "loss": 0.3462, - "step": 82594 - }, - { - "epoch": 2.12, - "learning_rate": 4.2102892501993516e-07, - "loss": 0.3171, - "step": 82595 - }, - { - "epoch": 2.12, - "learning_rate": 4.210063641900793e-07, - "loss": 0.4448, - "step": 82596 - }, - { - "epoch": 2.12, - "learning_rate": 4.209838038035323e-07, - "loss": 0.4902, - "step": 82597 - }, - { - "epoch": 2.12, - "learning_rate": 4.209612438603117e-07, - "loss": 0.3755, - "step": 82598 - }, - { - "epoch": 2.12, - "learning_rate": 4.209386843604342e-07, - "loss": 0.3837, - "step": 82599 - }, - { - "epoch": 2.12, - "learning_rate": 4.209161253039176e-07, - "loss": 0.478, - "step": 82600 - }, - { - "epoch": 2.12, - "learning_rate": 4.208935666907785e-07, - "loss": 0.3967, - "step": 82601 - }, - { - "epoch": 2.12, - "learning_rate": 4.208710085210346e-07, - "loss": 0.4058, - "step": 82602 - }, - { - "epoch": 2.12, - "learning_rate": 4.2084845079470357e-07, - "loss": 0.3732, - "step": 82603 - }, - { - "epoch": 2.12, - "learning_rate": 4.2082589351180173e-07, - "loss": 0.4175, - "step": 82604 - }, - { - "epoch": 2.12, - "learning_rate": 4.20803336672347e-07, - "loss": 0.3943, - "step": 82605 - }, - { - "epoch": 2.12, - "learning_rate": 4.2078078027635653e-07, - "loss": 0.3765, - "step": 82606 - }, - { - "epoch": 2.12, - "learning_rate": 4.207582243238479e-07, - "loss": 0.4536, - "step": 82607 - }, - { - "epoch": 2.12, - "learning_rate": 4.207356688148377e-07, - "loss": 0.3647, - "step": 82608 - }, - { - "epoch": 2.12, - "learning_rate": 4.207131137493436e-07, - "loss": 0.3469, - "step": 82609 - }, - { - "epoch": 2.12, - "learning_rate": 4.206905591273832e-07, - "loss": 0.4062, - "step": 82610 - }, - { - "epoch": 2.12, - "learning_rate": 4.206680049489729e-07, - "loss": 0.4834, - "step": 82611 - }, - { - "epoch": 2.12, - "learning_rate": 4.20645451214131e-07, - "loss": 0.3082, - "step": 82612 - }, - { - "epoch": 2.12, - "learning_rate": 4.206228979228739e-07, - "loss": 0.5039, - "step": 82613 - }, - { - "epoch": 2.12, - "learning_rate": 4.2060034507521904e-07, - "loss": 0.4072, - "step": 82614 - }, - { - "epoch": 2.12, - "learning_rate": 4.205777926711843e-07, - "loss": 0.3823, - "step": 82615 - }, - { - "epoch": 2.12, - "learning_rate": 4.205552407107862e-07, - "loss": 0.4653, - "step": 82616 - }, - { - "epoch": 2.12, - "learning_rate": 4.2053268919404215e-07, - "loss": 0.2732, - "step": 82617 - }, - { - "epoch": 2.12, - "learning_rate": 4.2051013812096967e-07, - "loss": 0.395, - "step": 82618 - }, - { - "epoch": 2.12, - "learning_rate": 4.2048758749158633e-07, - "loss": 0.4604, - "step": 82619 - }, - { - "epoch": 2.12, - "learning_rate": 4.2046503730590897e-07, - "loss": 0.3584, - "step": 82620 - }, - { - "epoch": 2.12, - "learning_rate": 4.2044248756395453e-07, - "loss": 0.4722, - "step": 82621 - }, - { - "epoch": 2.12, - "learning_rate": 4.2041993826574064e-07, - "loss": 0.3889, - "step": 82622 - }, - { - "epoch": 2.12, - "learning_rate": 4.2039738941128445e-07, - "loss": 0.3801, - "step": 82623 - }, - { - "epoch": 2.12, - "learning_rate": 4.203748410006038e-07, - "loss": 0.5107, - "step": 82624 - }, - { - "epoch": 2.12, - "learning_rate": 4.203522930337151e-07, - "loss": 0.3877, - "step": 82625 - }, - { - "epoch": 2.12, - "learning_rate": 4.203297455106359e-07, - "loss": 0.224, - "step": 82626 - }, - { - "epoch": 2.12, - "learning_rate": 4.2030719843138375e-07, - "loss": 0.4316, - "step": 82627 - }, - { - "epoch": 2.12, - "learning_rate": 4.2028465179597596e-07, - "loss": 0.4668, - "step": 82628 - }, - { - "epoch": 2.12, - "learning_rate": 4.202621056044292e-07, - "loss": 0.4434, - "step": 82629 - }, - { - "epoch": 2.12, - "learning_rate": 4.202395598567614e-07, - "loss": 0.4016, - "step": 82630 - }, - { - "epoch": 2.12, - "learning_rate": 4.202170145529893e-07, - "loss": 0.2842, - "step": 82631 - }, - { - "epoch": 2.12, - "learning_rate": 4.201944696931307e-07, - "loss": 0.3557, - "step": 82632 - }, - { - "epoch": 2.12, - "learning_rate": 4.2017192527720205e-07, - "loss": 0.3459, - "step": 82633 - }, - { - "epoch": 2.12, - "learning_rate": 4.2014938130522117e-07, - "loss": 0.5405, - "step": 82634 - }, - { - "epoch": 2.12, - "learning_rate": 4.2012683777720525e-07, - "loss": 0.3887, - "step": 82635 - }, - { - "epoch": 2.12, - "learning_rate": 4.2010429469317187e-07, - "loss": 0.406, - "step": 82636 - }, - { - "epoch": 2.12, - "learning_rate": 4.2008175205313765e-07, - "loss": 0.4688, - "step": 82637 - }, - { - "epoch": 2.12, - "learning_rate": 4.2005920985712016e-07, - "loss": 0.2112, - "step": 82638 - }, - { - "epoch": 2.12, - "learning_rate": 4.200366681051366e-07, - "loss": 0.418, - "step": 82639 - }, - { - "epoch": 2.12, - "learning_rate": 4.200141267972047e-07, - "loss": 0.4419, - "step": 82640 - }, - { - "epoch": 2.12, - "learning_rate": 4.199915859333414e-07, - "loss": 0.3616, - "step": 82641 - }, - { - "epoch": 2.12, - "learning_rate": 4.199690455135635e-07, - "loss": 0.2949, - "step": 82642 - }, - { - "epoch": 2.12, - "learning_rate": 4.1994650553788845e-07, - "loss": 0.4763, - "step": 82643 - }, - { - "epoch": 2.12, - "learning_rate": 4.1992396600633385e-07, - "loss": 0.3931, - "step": 82644 - }, - { - "epoch": 2.12, - "learning_rate": 4.1990142691891717e-07, - "loss": 0.4717, - "step": 82645 - }, - { - "epoch": 2.12, - "learning_rate": 4.1987888827565487e-07, - "loss": 0.5439, - "step": 82646 - }, - { - "epoch": 2.12, - "learning_rate": 4.1985635007656463e-07, - "loss": 0.5239, - "step": 82647 - }, - { - "epoch": 2.12, - "learning_rate": 4.198338123216637e-07, - "loss": 0.4307, - "step": 82648 - }, - { - "epoch": 2.12, - "learning_rate": 4.198112750109698e-07, - "loss": 0.4141, - "step": 82649 - }, - { - "epoch": 2.12, - "learning_rate": 4.1978873814449964e-07, - "loss": 0.3623, - "step": 82650 - }, - { - "epoch": 2.12, - "learning_rate": 4.1976620172227017e-07, - "loss": 0.5, - "step": 82651 - }, - { - "epoch": 2.12, - "learning_rate": 4.197436657442991e-07, - "loss": 0.3068, - "step": 82652 - }, - { - "epoch": 2.12, - "learning_rate": 4.1972113021060397e-07, - "loss": 0.3616, - "step": 82653 - }, - { - "epoch": 2.12, - "learning_rate": 4.1969859512120133e-07, - "loss": 0.2964, - "step": 82654 - }, - { - "epoch": 2.12, - "learning_rate": 4.196760604761088e-07, - "loss": 0.3719, - "step": 82655 - }, - { - "epoch": 2.12, - "learning_rate": 4.196535262753437e-07, - "loss": 0.4712, - "step": 82656 - }, - { - "epoch": 2.12, - "learning_rate": 4.196309925189234e-07, - "loss": 0.2635, - "step": 82657 - }, - { - "epoch": 2.12, - "learning_rate": 4.196084592068647e-07, - "loss": 0.4697, - "step": 82658 - }, - { - "epoch": 2.12, - "learning_rate": 4.195859263391851e-07, - "loss": 0.4492, - "step": 82659 - }, - { - "epoch": 2.12, - "learning_rate": 4.1956339391590224e-07, - "loss": 0.356, - "step": 82660 - }, - { - "epoch": 2.12, - "learning_rate": 4.1954086193703264e-07, - "loss": 0.519, - "step": 82661 - }, - { - "epoch": 2.12, - "learning_rate": 4.195183304025943e-07, - "loss": 0.2437, - "step": 82662 - }, - { - "epoch": 2.12, - "learning_rate": 4.1949579931260373e-07, - "loss": 0.4805, - "step": 82663 - }, - { - "epoch": 2.12, - "learning_rate": 4.1947326866707845e-07, - "loss": 0.3569, - "step": 82664 - }, - { - "epoch": 2.12, - "learning_rate": 4.194507384660358e-07, - "loss": 0.3838, - "step": 82665 - }, - { - "epoch": 2.12, - "learning_rate": 4.194282087094935e-07, - "loss": 0.5352, - "step": 82666 - }, - { - "epoch": 2.12, - "learning_rate": 4.1940567939746785e-07, - "loss": 0.4233, - "step": 82667 - }, - { - "epoch": 2.12, - "learning_rate": 4.1938315052997664e-07, - "loss": 0.4819, - "step": 82668 - }, - { - "epoch": 2.12, - "learning_rate": 4.193606221070374e-07, - "loss": 0.3668, - "step": 82669 - }, - { - "epoch": 2.12, - "learning_rate": 4.1933809412866697e-07, - "loss": 0.4331, - "step": 82670 - }, - { - "epoch": 2.12, - "learning_rate": 4.1931556659488244e-07, - "loss": 0.4448, - "step": 82671 - }, - { - "epoch": 2.12, - "learning_rate": 4.1929303950570117e-07, - "loss": 0.5693, - "step": 82672 - }, - { - "epoch": 2.12, - "learning_rate": 4.1927051286114047e-07, - "loss": 0.3572, - "step": 82673 - }, - { - "epoch": 2.12, - "learning_rate": 4.1924798666121806e-07, - "loss": 0.4136, - "step": 82674 - }, - { - "epoch": 2.12, - "learning_rate": 4.1922546090595047e-07, - "loss": 0.4736, - "step": 82675 - }, - { - "epoch": 2.12, - "learning_rate": 4.1920293559535516e-07, - "loss": 0.3136, - "step": 82676 - }, - { - "epoch": 2.12, - "learning_rate": 4.1918041072944956e-07, - "loss": 0.2109, - "step": 82677 - }, - { - "epoch": 2.12, - "learning_rate": 4.1915788630825097e-07, - "loss": 0.3084, - "step": 82678 - }, - { - "epoch": 2.12, - "learning_rate": 4.191353623317763e-07, - "loss": 0.2535, - "step": 82679 - }, - { - "epoch": 2.12, - "learning_rate": 4.1911283880004324e-07, - "loss": 0.3701, - "step": 82680 - }, - { - "epoch": 2.12, - "learning_rate": 4.190903157130685e-07, - "loss": 0.457, - "step": 82681 - }, - { - "epoch": 2.12, - "learning_rate": 4.190677930708695e-07, - "loss": 0.4365, - "step": 82682 - }, - { - "epoch": 2.12, - "learning_rate": 4.1904527087346395e-07, - "loss": 0.3896, - "step": 82683 - }, - { - "epoch": 2.12, - "learning_rate": 4.1902274912086845e-07, - "loss": 0.6333, - "step": 82684 - }, - { - "epoch": 2.12, - "learning_rate": 4.190002278131004e-07, - "loss": 0.4232, - "step": 82685 - }, - { - "epoch": 2.12, - "learning_rate": 4.1897770695017763e-07, - "loss": 0.4561, - "step": 82686 - }, - { - "epoch": 2.12, - "learning_rate": 4.1895518653211647e-07, - "loss": 0.3843, - "step": 82687 - }, - { - "epoch": 2.12, - "learning_rate": 4.189326665589347e-07, - "loss": 0.3477, - "step": 82688 - }, - { - "epoch": 2.12, - "learning_rate": 4.189101470306493e-07, - "loss": 0.3003, - "step": 82689 - }, - { - "epoch": 2.12, - "learning_rate": 4.1888762794727817e-07, - "loss": 0.5327, - "step": 82690 - }, - { - "epoch": 2.12, - "learning_rate": 4.188651093088381e-07, - "loss": 0.3892, - "step": 82691 - }, - { - "epoch": 2.12, - "learning_rate": 4.188425911153458e-07, - "loss": 0.4634, - "step": 82692 - }, - { - "epoch": 2.12, - "learning_rate": 4.1882007336681915e-07, - "loss": 0.4888, - "step": 82693 - }, - { - "epoch": 2.12, - "learning_rate": 4.1879755606327515e-07, - "loss": 0.4492, - "step": 82694 - }, - { - "epoch": 2.12, - "learning_rate": 4.1877503920473157e-07, - "loss": 0.4116, - "step": 82695 - }, - { - "epoch": 2.12, - "learning_rate": 4.1875252279120475e-07, - "loss": 0.366, - "step": 82696 - }, - { - "epoch": 2.12, - "learning_rate": 4.1873000682271253e-07, - "loss": 0.4976, - "step": 82697 - }, - { - "epoch": 2.12, - "learning_rate": 4.1870749129927185e-07, - "loss": 0.3777, - "step": 82698 - }, - { - "epoch": 2.12, - "learning_rate": 4.186849762209006e-07, - "loss": 0.3359, - "step": 82699 - }, - { - "epoch": 2.12, - "learning_rate": 4.1866246158761555e-07, - "loss": 0.3918, - "step": 82700 - }, - { - "epoch": 2.12, - "learning_rate": 4.1863994739943354e-07, - "loss": 0.3457, - "step": 82701 - }, - { - "epoch": 2.12, - "learning_rate": 4.1861743365637216e-07, - "loss": 0.3281, - "step": 82702 - }, - { - "epoch": 2.12, - "learning_rate": 4.18594920358449e-07, - "loss": 0.4111, - "step": 82703 - }, - { - "epoch": 2.12, - "learning_rate": 4.185724075056807e-07, - "loss": 0.342, - "step": 82704 - }, - { - "epoch": 2.12, - "learning_rate": 4.185498950980847e-07, - "loss": 0.4961, - "step": 82705 - }, - { - "epoch": 2.12, - "learning_rate": 4.185273831356784e-07, - "loss": 0.3665, - "step": 82706 - }, - { - "epoch": 2.12, - "learning_rate": 4.1850487161847925e-07, - "loss": 0.4941, - "step": 82707 - }, - { - "epoch": 2.12, - "learning_rate": 4.1848236054650376e-07, - "loss": 0.4189, - "step": 82708 - }, - { - "epoch": 2.12, - "learning_rate": 4.1845984991976966e-07, - "loss": 0.418, - "step": 82709 - }, - { - "epoch": 2.12, - "learning_rate": 4.184373397382944e-07, - "loss": 0.3555, - "step": 82710 - }, - { - "epoch": 2.12, - "learning_rate": 4.1841483000209466e-07, - "loss": 0.3841, - "step": 82711 - }, - { - "epoch": 2.12, - "learning_rate": 4.1839232071118837e-07, - "loss": 0.4961, - "step": 82712 - }, - { - "epoch": 2.12, - "learning_rate": 4.183698118655918e-07, - "loss": 0.3951, - "step": 82713 - }, - { - "epoch": 2.12, - "learning_rate": 4.183473034653228e-07, - "loss": 0.479, - "step": 82714 - }, - { - "epoch": 2.12, - "learning_rate": 4.183247955103986e-07, - "loss": 0.4141, - "step": 82715 - }, - { - "epoch": 2.12, - "learning_rate": 4.1830228800083657e-07, - "loss": 0.2834, - "step": 82716 - }, - { - "epoch": 2.12, - "learning_rate": 4.182797809366535e-07, - "loss": 0.3994, - "step": 82717 - }, - { - "epoch": 2.12, - "learning_rate": 4.1825727431786674e-07, - "loss": 0.4761, - "step": 82718 - }, - { - "epoch": 2.12, - "learning_rate": 4.1823476814449365e-07, - "loss": 0.457, - "step": 82719 - }, - { - "epoch": 2.12, - "learning_rate": 4.1821226241655226e-07, - "loss": 0.4189, - "step": 82720 - }, - { - "epoch": 2.12, - "learning_rate": 4.1818975713405824e-07, - "loss": 0.3533, - "step": 82721 - }, - { - "epoch": 2.12, - "learning_rate": 4.1816725229702955e-07, - "loss": 0.3308, - "step": 82722 - }, - { - "epoch": 2.12, - "learning_rate": 4.181447479054835e-07, - "loss": 0.394, - "step": 82723 - }, - { - "epoch": 2.12, - "learning_rate": 4.181222439594375e-07, - "loss": 0.3923, - "step": 82724 - }, - { - "epoch": 2.12, - "learning_rate": 4.180997404589083e-07, - "loss": 0.4299, - "step": 82725 - }, - { - "epoch": 2.12, - "learning_rate": 4.180772374039133e-07, - "loss": 0.4036, - "step": 82726 - }, - { - "epoch": 2.12, - "learning_rate": 4.180547347944698e-07, - "loss": 0.4111, - "step": 82727 - }, - { - "epoch": 2.12, - "learning_rate": 4.1803223263059537e-07, - "loss": 0.5005, - "step": 82728 - }, - { - "epoch": 2.12, - "learning_rate": 4.180097309123066e-07, - "loss": 0.4546, - "step": 82729 - }, - { - "epoch": 2.12, - "learning_rate": 4.179872296396214e-07, - "loss": 0.3779, - "step": 82730 - }, - { - "epoch": 2.12, - "learning_rate": 4.179647288125562e-07, - "loss": 0.4062, - "step": 82731 - }, - { - "epoch": 2.12, - "learning_rate": 4.179422284311287e-07, - "loss": 0.3447, - "step": 82732 - }, - { - "epoch": 2.12, - "learning_rate": 4.179197284953564e-07, - "loss": 0.373, - "step": 82733 - }, - { - "epoch": 2.12, - "learning_rate": 4.178972290052558e-07, - "loss": 0.4189, - "step": 82734 - }, - { - "epoch": 2.12, - "learning_rate": 4.178747299608445e-07, - "loss": 0.4243, - "step": 82735 - }, - { - "epoch": 2.12, - "learning_rate": 4.178522313621399e-07, - "loss": 0.5938, - "step": 82736 - }, - { - "epoch": 2.12, - "learning_rate": 4.178297332091593e-07, - "loss": 0.4204, - "step": 82737 - }, - { - "epoch": 2.12, - "learning_rate": 4.178072355019194e-07, - "loss": 0.4138, - "step": 82738 - }, - { - "epoch": 2.12, - "learning_rate": 4.177847382404377e-07, - "loss": 0.3682, - "step": 82739 - }, - { - "epoch": 2.12, - "learning_rate": 4.1776224142473184e-07, - "loss": 0.4253, - "step": 82740 - }, - { - "epoch": 2.12, - "learning_rate": 4.1773974505481866e-07, - "loss": 0.4214, - "step": 82741 - }, - { - "epoch": 2.12, - "learning_rate": 4.1771724913071506e-07, - "loss": 0.4338, - "step": 82742 - }, - { - "epoch": 2.12, - "learning_rate": 4.176947536524386e-07, - "loss": 0.4902, - "step": 82743 - }, - { - "epoch": 2.12, - "learning_rate": 4.1767225862000646e-07, - "loss": 0.4253, - "step": 82744 - }, - { - "epoch": 2.12, - "learning_rate": 4.1764976403343623e-07, - "loss": 0.3813, - "step": 82745 - }, - { - "epoch": 2.12, - "learning_rate": 4.176272698927443e-07, - "loss": 0.3247, - "step": 82746 - }, - { - "epoch": 2.12, - "learning_rate": 4.1760477619794863e-07, - "loss": 0.3989, - "step": 82747 - }, - { - "epoch": 2.12, - "learning_rate": 4.1758228294906604e-07, - "loss": 0.1436, - "step": 82748 - }, - { - "epoch": 2.12, - "learning_rate": 4.175597901461144e-07, - "loss": 0.4263, - "step": 82749 - }, - { - "epoch": 2.12, - "learning_rate": 4.175372977891104e-07, - "loss": 0.3298, - "step": 82750 - }, - { - "epoch": 2.12, - "learning_rate": 4.17514805878071e-07, - "loss": 0.2788, - "step": 82751 - }, - { - "epoch": 2.12, - "learning_rate": 4.174923144130136e-07, - "loss": 0.4163, - "step": 82752 - }, - { - "epoch": 2.12, - "learning_rate": 4.1746982339395564e-07, - "loss": 0.4006, - "step": 82753 - }, - { - "epoch": 2.12, - "learning_rate": 4.174473328209146e-07, - "loss": 0.3382, - "step": 82754 - }, - { - "epoch": 2.12, - "learning_rate": 4.17424842693907e-07, - "loss": 0.3911, - "step": 82755 - }, - { - "epoch": 2.12, - "learning_rate": 4.1740235301295037e-07, - "loss": 0.3402, - "step": 82756 - }, - { - "epoch": 2.12, - "learning_rate": 4.17379863778062e-07, - "loss": 0.3337, - "step": 82757 - }, - { - "epoch": 2.12, - "learning_rate": 4.173573749892595e-07, - "loss": 0.3152, - "step": 82758 - }, - { - "epoch": 2.12, - "learning_rate": 4.173348866465596e-07, - "loss": 0.3259, - "step": 82759 - }, - { - "epoch": 2.12, - "learning_rate": 4.1731239874997916e-07, - "loss": 0.3779, - "step": 82760 - }, - { - "epoch": 2.12, - "learning_rate": 4.1728991129953594e-07, - "loss": 0.3904, - "step": 82761 - }, - { - "epoch": 2.12, - "learning_rate": 4.172674242952473e-07, - "loss": 0.4312, - "step": 82762 - }, - { - "epoch": 2.12, - "learning_rate": 4.1724493773712985e-07, - "loss": 0.2676, - "step": 82763 - }, - { - "epoch": 2.12, - "learning_rate": 4.172224516252013e-07, - "loss": 0.4438, - "step": 82764 - }, - { - "epoch": 2.12, - "learning_rate": 4.171999659594786e-07, - "loss": 0.3815, - "step": 82765 - }, - { - "epoch": 2.12, - "learning_rate": 4.1717748073997947e-07, - "loss": 0.4741, - "step": 82766 - }, - { - "epoch": 2.12, - "learning_rate": 4.171549959667203e-07, - "loss": 0.4141, - "step": 82767 - }, - { - "epoch": 2.12, - "learning_rate": 4.1713251163971886e-07, - "loss": 0.3677, - "step": 82768 - }, - { - "epoch": 2.12, - "learning_rate": 4.171100277589926e-07, - "loss": 0.4658, - "step": 82769 - }, - { - "epoch": 2.12, - "learning_rate": 4.1708754432455806e-07, - "loss": 0.4453, - "step": 82770 - }, - { - "epoch": 2.12, - "learning_rate": 4.1706506133643306e-07, - "loss": 0.4736, - "step": 82771 - }, - { - "epoch": 2.12, - "learning_rate": 4.1704257879463423e-07, - "loss": 0.3296, - "step": 82772 - }, - { - "epoch": 2.12, - "learning_rate": 4.1702009669917905e-07, - "loss": 0.3657, - "step": 82773 - }, - { - "epoch": 2.12, - "learning_rate": 4.169976150500848e-07, - "loss": 0.3979, - "step": 82774 - }, - { - "epoch": 2.12, - "learning_rate": 4.1697513384736905e-07, - "loss": 0.4526, - "step": 82775 - }, - { - "epoch": 2.12, - "learning_rate": 4.1695265309104834e-07, - "loss": 0.4478, - "step": 82776 - }, - { - "epoch": 2.12, - "learning_rate": 4.169301727811401e-07, - "loss": 0.4155, - "step": 82777 - }, - { - "epoch": 2.12, - "learning_rate": 4.1690769291766193e-07, - "loss": 0.4583, - "step": 82778 - }, - { - "epoch": 2.12, - "learning_rate": 4.168852135006308e-07, - "loss": 0.4629, - "step": 82779 - }, - { - "epoch": 2.12, - "learning_rate": 4.168627345300634e-07, - "loss": 0.3276, - "step": 82780 - }, - { - "epoch": 2.12, - "learning_rate": 4.168402560059774e-07, - "loss": 0.4253, - "step": 82781 - }, - { - "epoch": 2.12, - "learning_rate": 4.168177779283901e-07, - "loss": 0.4922, - "step": 82782 - }, - { - "epoch": 2.12, - "learning_rate": 4.167953002973189e-07, - "loss": 0.3975, - "step": 82783 - }, - { - "epoch": 2.12, - "learning_rate": 4.167728231127804e-07, - "loss": 0.4082, - "step": 82784 - }, - { - "epoch": 2.12, - "learning_rate": 4.1675034637479213e-07, - "loss": 0.3335, - "step": 82785 - }, - { - "epoch": 2.12, - "learning_rate": 4.167278700833713e-07, - "loss": 0.4111, - "step": 82786 - }, - { - "epoch": 2.12, - "learning_rate": 4.1670539423853543e-07, - "loss": 0.3877, - "step": 82787 - }, - { - "epoch": 2.12, - "learning_rate": 4.1668291884030104e-07, - "loss": 0.4116, - "step": 82788 - }, - { - "epoch": 2.12, - "learning_rate": 4.1666044388868616e-07, - "loss": 0.3489, - "step": 82789 - }, - { - "epoch": 2.12, - "learning_rate": 4.166379693837072e-07, - "loss": 0.4546, - "step": 82790 - }, - { - "epoch": 2.12, - "learning_rate": 4.1661549532538167e-07, - "loss": 0.4189, - "step": 82791 - }, - { - "epoch": 2.12, - "learning_rate": 4.165930217137272e-07, - "loss": 0.3459, - "step": 82792 - }, - { - "epoch": 2.12, - "learning_rate": 4.165705485487603e-07, - "loss": 0.4287, - "step": 82793 - }, - { - "epoch": 2.12, - "learning_rate": 4.1654807583049845e-07, - "loss": 0.2396, - "step": 82794 - }, - { - "epoch": 2.12, - "learning_rate": 4.165256035589594e-07, - "loss": 0.3682, - "step": 82795 - }, - { - "epoch": 2.12, - "learning_rate": 4.165031317341593e-07, - "loss": 0.4844, - "step": 82796 - }, - { - "epoch": 2.12, - "learning_rate": 4.1648066035611604e-07, - "loss": 0.374, - "step": 82797 - }, - { - "epoch": 2.12, - "learning_rate": 4.164581894248468e-07, - "loss": 0.4458, - "step": 82798 - }, - { - "epoch": 2.12, - "learning_rate": 4.164357189403689e-07, - "loss": 0.4321, - "step": 82799 - }, - { - "epoch": 2.12, - "learning_rate": 4.1641324890269935e-07, - "loss": 0.2822, - "step": 82800 - }, - { - "epoch": 2.12, - "learning_rate": 4.163907793118551e-07, - "loss": 0.3342, - "step": 82801 - }, - { - "epoch": 2.12, - "learning_rate": 4.163683101678535e-07, - "loss": 0.2921, - "step": 82802 - }, - { - "epoch": 2.12, - "learning_rate": 4.163458414707118e-07, - "loss": 0.3314, - "step": 82803 - }, - { - "epoch": 2.12, - "learning_rate": 4.1632337322044775e-07, - "loss": 0.3582, - "step": 82804 - }, - { - "epoch": 2.12, - "learning_rate": 4.1630090541707753e-07, - "loss": 0.3638, - "step": 82805 - }, - { - "epoch": 2.12, - "learning_rate": 4.1627843806061904e-07, - "loss": 0.3028, - "step": 82806 - }, - { - "epoch": 2.12, - "learning_rate": 4.1625597115108923e-07, - "loss": 0.52, - "step": 82807 - }, - { - "epoch": 2.12, - "learning_rate": 4.162335046885057e-07, - "loss": 0.4897, - "step": 82808 - }, - { - "epoch": 2.12, - "learning_rate": 4.162110386728854e-07, - "loss": 0.5034, - "step": 82809 - }, - { - "epoch": 2.12, - "learning_rate": 4.1618857310424507e-07, - "loss": 0.4927, - "step": 82810 - }, - { - "epoch": 2.12, - "learning_rate": 4.1616610798260233e-07, - "loss": 0.2697, - "step": 82811 - }, - { - "epoch": 2.12, - "learning_rate": 4.1614364330797467e-07, - "loss": 0.3853, - "step": 82812 - }, - { - "epoch": 2.12, - "learning_rate": 4.161211790803787e-07, - "loss": 0.355, - "step": 82813 - }, - { - "epoch": 2.12, - "learning_rate": 4.1609871529983174e-07, - "loss": 0.3831, - "step": 82814 - }, - { - "epoch": 2.12, - "learning_rate": 4.160762519663513e-07, - "loss": 0.4009, - "step": 82815 - }, - { - "epoch": 2.12, - "learning_rate": 4.1605378907995467e-07, - "loss": 0.479, - "step": 82816 - }, - { - "epoch": 2.12, - "learning_rate": 4.1603132664065855e-07, - "loss": 0.4819, - "step": 82817 - }, - { - "epoch": 2.12, - "learning_rate": 4.160088646484804e-07, - "loss": 0.4243, - "step": 82818 - }, - { - "epoch": 2.12, - "learning_rate": 4.159864031034377e-07, - "loss": 0.459, - "step": 82819 - }, - { - "epoch": 2.12, - "learning_rate": 4.15963942005547e-07, - "loss": 0.3784, - "step": 82820 - }, - { - "epoch": 2.12, - "learning_rate": 4.159414813548262e-07, - "loss": 0.4468, - "step": 82821 - }, - { - "epoch": 2.12, - "learning_rate": 4.1591902115129187e-07, - "loss": 0.3994, - "step": 82822 - }, - { - "epoch": 2.12, - "learning_rate": 4.1589656139496144e-07, - "loss": 0.4441, - "step": 82823 - }, - { - "epoch": 2.12, - "learning_rate": 4.1587410208585206e-07, - "loss": 0.4294, - "step": 82824 - }, - { - "epoch": 2.12, - "learning_rate": 4.158516432239815e-07, - "loss": 0.3643, - "step": 82825 - }, - { - "epoch": 2.12, - "learning_rate": 4.158291848093661e-07, - "loss": 0.4502, - "step": 82826 - }, - { - "epoch": 2.12, - "learning_rate": 4.1580672684202343e-07, - "loss": 0.5098, - "step": 82827 - }, - { - "epoch": 2.12, - "learning_rate": 4.157842693219706e-07, - "loss": 0.4341, - "step": 82828 - }, - { - "epoch": 2.12, - "learning_rate": 4.157618122492258e-07, - "loss": 0.3916, - "step": 82829 - }, - { - "epoch": 2.12, - "learning_rate": 4.157393556238045e-07, - "loss": 0.479, - "step": 82830 - }, - { - "epoch": 2.12, - "learning_rate": 4.157168994457246e-07, - "loss": 0.5293, - "step": 82831 - }, - { - "epoch": 2.12, - "learning_rate": 4.156944437150035e-07, - "loss": 0.5757, - "step": 82832 - }, - { - "epoch": 2.12, - "learning_rate": 4.1567198843165876e-07, - "loss": 0.3542, - "step": 82833 - }, - { - "epoch": 2.12, - "learning_rate": 4.1564953359570667e-07, - "loss": 0.2935, - "step": 82834 - }, - { - "epoch": 2.12, - "learning_rate": 4.156270792071648e-07, - "loss": 0.3816, - "step": 82835 - }, - { - "epoch": 2.12, - "learning_rate": 4.1560462526605044e-07, - "loss": 0.3057, - "step": 82836 - }, - { - "epoch": 2.12, - "learning_rate": 4.155821717723811e-07, - "loss": 0.5869, - "step": 82837 - }, - { - "epoch": 2.12, - "learning_rate": 4.1555971872617324e-07, - "loss": 0.2991, - "step": 82838 - }, - { - "epoch": 2.12, - "learning_rate": 4.155372661274449e-07, - "loss": 0.5552, - "step": 82839 - }, - { - "epoch": 2.12, - "learning_rate": 4.1551481397621234e-07, - "loss": 0.3813, - "step": 82840 - }, - { - "epoch": 2.12, - "learning_rate": 4.1549236227249316e-07, - "loss": 0.5, - "step": 82841 - }, - { - "epoch": 2.12, - "learning_rate": 4.154699110163051e-07, - "loss": 0.4941, - "step": 82842 - }, - { - "epoch": 2.12, - "learning_rate": 4.154474602076644e-07, - "loss": 0.4692, - "step": 82843 - }, - { - "epoch": 2.12, - "learning_rate": 4.154250098465888e-07, - "loss": 0.4233, - "step": 82844 - }, - { - "epoch": 2.12, - "learning_rate": 4.1540255993309525e-07, - "loss": 0.4478, - "step": 82845 - }, - { - "epoch": 2.12, - "learning_rate": 4.1538011046720154e-07, - "loss": 0.4453, - "step": 82846 - }, - { - "epoch": 2.12, - "learning_rate": 4.1535766144892404e-07, - "loss": 0.3772, - "step": 82847 - }, - { - "epoch": 2.12, - "learning_rate": 4.153352128782802e-07, - "loss": 0.4526, - "step": 82848 - }, - { - "epoch": 2.12, - "learning_rate": 4.1531276475528774e-07, - "loss": 0.458, - "step": 82849 - }, - { - "epoch": 2.12, - "learning_rate": 4.1529031707996345e-07, - "loss": 0.3566, - "step": 82850 - }, - { - "epoch": 2.12, - "learning_rate": 4.152678698523241e-07, - "loss": 0.5703, - "step": 82851 - }, - { - "epoch": 2.12, - "learning_rate": 4.152454230723872e-07, - "loss": 0.3706, - "step": 82852 - }, - { - "epoch": 2.12, - "learning_rate": 4.1522297674017003e-07, - "loss": 0.4272, - "step": 82853 - }, - { - "epoch": 2.12, - "learning_rate": 4.152005308556901e-07, - "loss": 0.4238, - "step": 82854 - }, - { - "epoch": 2.12, - "learning_rate": 4.151780854189638e-07, - "loss": 0.3038, - "step": 82855 - }, - { - "epoch": 2.12, - "learning_rate": 4.1515564043000886e-07, - "loss": 0.4888, - "step": 82856 - }, - { - "epoch": 2.12, - "learning_rate": 4.151331958888423e-07, - "loss": 0.457, - "step": 82857 - }, - { - "epoch": 2.12, - "learning_rate": 4.151107517954817e-07, - "loss": 0.3403, - "step": 82858 - }, - { - "epoch": 2.12, - "learning_rate": 4.150883081499439e-07, - "loss": 0.343, - "step": 82859 - }, - { - "epoch": 2.12, - "learning_rate": 4.150658649522458e-07, - "loss": 0.215, - "step": 82860 - }, - { - "epoch": 2.12, - "learning_rate": 4.1504342220240484e-07, - "loss": 0.4377, - "step": 82861 - }, - { - "epoch": 2.12, - "learning_rate": 4.150209799004382e-07, - "loss": 0.3733, - "step": 82862 - }, - { - "epoch": 2.12, - "learning_rate": 4.1499853804636345e-07, - "loss": 0.3374, - "step": 82863 - }, - { - "epoch": 2.12, - "learning_rate": 4.149760966401971e-07, - "loss": 0.3901, - "step": 82864 - }, - { - "epoch": 2.12, - "learning_rate": 4.149536556819566e-07, - "loss": 0.3513, - "step": 82865 - }, - { - "epoch": 2.12, - "learning_rate": 4.1493121517165963e-07, - "loss": 0.4492, - "step": 82866 - }, - { - "epoch": 2.12, - "learning_rate": 4.149087751093225e-07, - "loss": 0.3215, - "step": 82867 - }, - { - "epoch": 2.12, - "learning_rate": 4.148863354949629e-07, - "loss": 0.4824, - "step": 82868 - }, - { - "epoch": 2.12, - "learning_rate": 4.148638963285982e-07, - "loss": 0.2946, - "step": 82869 - }, - { - "epoch": 2.12, - "learning_rate": 4.148414576102449e-07, - "loss": 0.2722, - "step": 82870 - }, - { - "epoch": 2.12, - "learning_rate": 4.1481901933992104e-07, - "loss": 0.2947, - "step": 82871 - }, - { - "epoch": 2.12, - "learning_rate": 4.14796581517643e-07, - "loss": 0.3589, - "step": 82872 - }, - { - "epoch": 2.12, - "learning_rate": 4.1477414414342825e-07, - "loss": 0.4492, - "step": 82873 - }, - { - "epoch": 2.12, - "learning_rate": 4.1475170721729416e-07, - "loss": 0.4233, - "step": 82874 - }, - { - "epoch": 2.12, - "learning_rate": 4.14729270739258e-07, - "loss": 0.2872, - "step": 82875 - }, - { - "epoch": 2.12, - "learning_rate": 4.1470683470933645e-07, - "loss": 0.5024, - "step": 82876 - }, - { - "epoch": 2.12, - "learning_rate": 4.1468439912754683e-07, - "loss": 0.5117, - "step": 82877 - }, - { - "epoch": 2.12, - "learning_rate": 4.146619639939066e-07, - "loss": 0.3579, - "step": 82878 - }, - { - "epoch": 2.12, - "learning_rate": 4.1463952930843307e-07, - "loss": 0.4858, - "step": 82879 - }, - { - "epoch": 2.12, - "learning_rate": 4.146170950711432e-07, - "loss": 0.405, - "step": 82880 - }, - { - "epoch": 2.12, - "learning_rate": 4.145946612820537e-07, - "loss": 0.415, - "step": 82881 - }, - { - "epoch": 2.12, - "learning_rate": 4.1457222794118205e-07, - "loss": 0.3696, - "step": 82882 - }, - { - "epoch": 2.12, - "learning_rate": 4.14549795048546e-07, - "loss": 0.4575, - "step": 82883 - }, - { - "epoch": 2.12, - "learning_rate": 4.14527362604162e-07, - "loss": 0.2693, - "step": 82884 - }, - { - "epoch": 2.12, - "learning_rate": 4.1450493060804726e-07, - "loss": 0.2902, - "step": 82885 - }, - { - "epoch": 2.12, - "learning_rate": 4.144824990602193e-07, - "loss": 0.4741, - "step": 82886 - }, - { - "epoch": 2.12, - "learning_rate": 4.1446006796069556e-07, - "loss": 0.222, - "step": 82887 - }, - { - "epoch": 2.12, - "learning_rate": 4.1443763730949234e-07, - "loss": 0.6152, - "step": 82888 - }, - { - "epoch": 2.12, - "learning_rate": 4.144152071066277e-07, - "loss": 0.3163, - "step": 82889 - }, - { - "epoch": 2.12, - "learning_rate": 4.1439277735211806e-07, - "loss": 0.4033, - "step": 82890 - }, - { - "epoch": 2.12, - "learning_rate": 4.1437034804598104e-07, - "loss": 0.4307, - "step": 82891 - }, - { - "epoch": 2.12, - "learning_rate": 4.14347919188234e-07, - "loss": 0.3992, - "step": 82892 - }, - { - "epoch": 2.12, - "learning_rate": 4.1432549077889336e-07, - "loss": 0.3835, - "step": 82893 - }, - { - "epoch": 2.12, - "learning_rate": 4.143030628179769e-07, - "loss": 0.3706, - "step": 82894 - }, - { - "epoch": 2.12, - "learning_rate": 4.142806353055016e-07, - "loss": 0.4746, - "step": 82895 - }, - { - "epoch": 2.12, - "learning_rate": 4.1425820824148503e-07, - "loss": 0.2032, - "step": 82896 - }, - { - "epoch": 2.12, - "learning_rate": 4.1423578162594377e-07, - "loss": 0.3481, - "step": 82897 - }, - { - "epoch": 2.12, - "learning_rate": 4.1421335545889513e-07, - "loss": 0.4908, - "step": 82898 - }, - { - "epoch": 2.12, - "learning_rate": 4.1419092974035673e-07, - "loss": 0.5044, - "step": 82899 - }, - { - "epoch": 2.12, - "learning_rate": 4.1416850447034547e-07, - "loss": 0.3345, - "step": 82900 - }, - { - "epoch": 2.12, - "learning_rate": 4.1414607964887806e-07, - "loss": 0.415, - "step": 82901 - }, - { - "epoch": 2.12, - "learning_rate": 4.1412365527597205e-07, - "loss": 0.4106, - "step": 82902 - }, - { - "epoch": 2.12, - "learning_rate": 4.1410123135164467e-07, - "loss": 0.502, - "step": 82903 - }, - { - "epoch": 2.12, - "learning_rate": 4.140788078759133e-07, - "loss": 0.4751, - "step": 82904 - }, - { - "epoch": 2.12, - "learning_rate": 4.1405638484879457e-07, - "loss": 0.3896, - "step": 82905 - }, - { - "epoch": 2.12, - "learning_rate": 4.140339622703058e-07, - "loss": 0.5156, - "step": 82906 - }, - { - "epoch": 2.12, - "learning_rate": 4.1401154014046444e-07, - "loss": 0.4858, - "step": 82907 - }, - { - "epoch": 2.12, - "learning_rate": 4.1398911845928773e-07, - "loss": 0.3875, - "step": 82908 - }, - { - "epoch": 2.12, - "learning_rate": 4.139666972267927e-07, - "loss": 0.2994, - "step": 82909 - }, - { - "epoch": 2.13, - "learning_rate": 4.13944276442996e-07, - "loss": 0.4351, - "step": 82910 - }, - { - "epoch": 2.13, - "learning_rate": 4.139218561079153e-07, - "loss": 0.3923, - "step": 82911 - }, - { - "epoch": 2.13, - "learning_rate": 4.1389943622156766e-07, - "loss": 0.4136, - "step": 82912 - }, - { - "epoch": 2.13, - "learning_rate": 4.138770167839706e-07, - "loss": 0.3403, - "step": 82913 - }, - { - "epoch": 2.13, - "learning_rate": 4.1385459779514065e-07, - "loss": 0.3325, - "step": 82914 - }, - { - "epoch": 2.13, - "learning_rate": 4.1383217925509515e-07, - "loss": 0.4351, - "step": 82915 - }, - { - "epoch": 2.13, - "learning_rate": 4.138097611638516e-07, - "loss": 0.498, - "step": 82916 - }, - { - "epoch": 2.13, - "learning_rate": 4.137873435214272e-07, - "loss": 0.4775, - "step": 82917 - }, - { - "epoch": 2.13, - "learning_rate": 4.1376492632783843e-07, - "loss": 0.2937, - "step": 82918 - }, - { - "epoch": 2.13, - "learning_rate": 4.137425095831034e-07, - "loss": 0.4292, - "step": 82919 - }, - { - "epoch": 2.13, - "learning_rate": 4.1372009328723834e-07, - "loss": 0.4453, - "step": 82920 - }, - { - "epoch": 2.13, - "learning_rate": 4.136976774402613e-07, - "loss": 0.5107, - "step": 82921 - }, - { - "epoch": 2.13, - "learning_rate": 4.136752620421885e-07, - "loss": 0.3464, - "step": 82922 - }, - { - "epoch": 2.13, - "learning_rate": 4.1365284709303773e-07, - "loss": 0.4917, - "step": 82923 - }, - { - "epoch": 2.13, - "learning_rate": 4.1363043259282593e-07, - "loss": 0.3379, - "step": 82924 - }, - { - "epoch": 2.13, - "learning_rate": 4.136080185415707e-07, - "loss": 0.3452, - "step": 82925 - }, - { - "epoch": 2.13, - "learning_rate": 4.135856049392885e-07, - "loss": 0.2823, - "step": 82926 - }, - { - "epoch": 2.13, - "learning_rate": 4.1356319178599685e-07, - "loss": 0.4922, - "step": 82927 - }, - { - "epoch": 2.13, - "learning_rate": 4.135407790817129e-07, - "loss": 0.415, - "step": 82928 - }, - { - "epoch": 2.13, - "learning_rate": 4.1351836682645414e-07, - "loss": 0.3604, - "step": 82929 - }, - { - "epoch": 2.13, - "learning_rate": 4.134959550202375e-07, - "loss": 0.4429, - "step": 82930 - }, - { - "epoch": 2.13, - "learning_rate": 4.134735436630795e-07, - "loss": 0.3984, - "step": 82931 - }, - { - "epoch": 2.13, - "learning_rate": 4.1345113275499796e-07, - "loss": 0.4849, - "step": 82932 - }, - { - "epoch": 2.13, - "learning_rate": 4.134287222960099e-07, - "loss": 0.436, - "step": 82933 - }, - { - "epoch": 2.13, - "learning_rate": 4.134063122861329e-07, - "loss": 0.4771, - "step": 82934 - }, - { - "epoch": 2.13, - "learning_rate": 4.1338390272538327e-07, - "loss": 0.375, - "step": 82935 - }, - { - "epoch": 2.13, - "learning_rate": 4.133614936137787e-07, - "loss": 0.3657, - "step": 82936 - }, - { - "epoch": 2.13, - "learning_rate": 4.133390849513362e-07, - "loss": 0.3765, - "step": 82937 - }, - { - "epoch": 2.13, - "learning_rate": 4.1331667673807334e-07, - "loss": 0.2132, - "step": 82938 - }, - { - "epoch": 2.13, - "learning_rate": 4.132942689740069e-07, - "loss": 0.3573, - "step": 82939 - }, - { - "epoch": 2.13, - "learning_rate": 4.1327186165915376e-07, - "loss": 0.4399, - "step": 82940 - }, - { - "epoch": 2.13, - "learning_rate": 4.1324945479353133e-07, - "loss": 0.4604, - "step": 82941 - }, - { - "epoch": 2.13, - "learning_rate": 4.132270483771573e-07, - "loss": 0.4214, - "step": 82942 - }, - { - "epoch": 2.13, - "learning_rate": 4.1320464241004783e-07, - "loss": 0.439, - "step": 82943 - }, - { - "epoch": 2.13, - "learning_rate": 4.1318223689222063e-07, - "loss": 0.2936, - "step": 82944 - }, - { - "epoch": 2.13, - "learning_rate": 4.1315983182369285e-07, - "loss": 0.3651, - "step": 82945 - }, - { - "epoch": 2.13, - "learning_rate": 4.1313742720448184e-07, - "loss": 0.3807, - "step": 82946 - }, - { - "epoch": 2.13, - "learning_rate": 4.1311502303460435e-07, - "loss": 0.4961, - "step": 82947 - }, - { - "epoch": 2.13, - "learning_rate": 4.1309261931407757e-07, - "loss": 0.4149, - "step": 82948 - }, - { - "epoch": 2.13, - "learning_rate": 4.1307021604291913e-07, - "loss": 0.4814, - "step": 82949 - }, - { - "epoch": 2.13, - "learning_rate": 4.1304781322114544e-07, - "loss": 0.4128, - "step": 82950 - }, - { - "epoch": 2.13, - "learning_rate": 4.130254108487745e-07, - "loss": 0.3241, - "step": 82951 - }, - { - "epoch": 2.13, - "learning_rate": 4.1300300892582275e-07, - "loss": 0.5166, - "step": 82952 - }, - { - "epoch": 2.13, - "learning_rate": 4.1298060745230746e-07, - "loss": 0.1882, - "step": 82953 - }, - { - "epoch": 2.13, - "learning_rate": 4.1295820642824595e-07, - "loss": 0.4702, - "step": 82954 - }, - { - "epoch": 2.13, - "learning_rate": 4.129358058536557e-07, - "loss": 0.5869, - "step": 82955 - }, - { - "epoch": 2.13, - "learning_rate": 4.1291340572855313e-07, - "loss": 0.3978, - "step": 82956 - }, - { - "epoch": 2.13, - "learning_rate": 4.128910060529559e-07, - "loss": 0.5542, - "step": 82957 - }, - { - "epoch": 2.13, - "learning_rate": 4.128686068268813e-07, - "loss": 0.4468, - "step": 82958 - }, - { - "epoch": 2.13, - "learning_rate": 4.128462080503462e-07, - "loss": 0.3953, - "step": 82959 - }, - { - "epoch": 2.13, - "learning_rate": 4.1282380972336737e-07, - "loss": 0.3376, - "step": 82960 - }, - { - "epoch": 2.13, - "learning_rate": 4.128014118459624e-07, - "loss": 0.4419, - "step": 82961 - }, - { - "epoch": 2.13, - "learning_rate": 4.1277901441814845e-07, - "loss": 0.5098, - "step": 82962 - }, - { - "epoch": 2.13, - "learning_rate": 4.1275661743994283e-07, - "loss": 0.3828, - "step": 82963 - }, - { - "epoch": 2.13, - "learning_rate": 4.127342209113622e-07, - "loss": 0.4604, - "step": 82964 - }, - { - "epoch": 2.13, - "learning_rate": 4.1271182483242395e-07, - "loss": 0.3823, - "step": 82965 - }, - { - "epoch": 2.13, - "learning_rate": 4.126894292031452e-07, - "loss": 0.3094, - "step": 82966 - }, - { - "epoch": 2.13, - "learning_rate": 4.1266703402354364e-07, - "loss": 0.3708, - "step": 82967 - }, - { - "epoch": 2.13, - "learning_rate": 4.1264463929363547e-07, - "loss": 0.4546, - "step": 82968 - }, - { - "epoch": 2.13, - "learning_rate": 4.126222450134387e-07, - "loss": 0.3735, - "step": 82969 - }, - { - "epoch": 2.13, - "learning_rate": 4.1259985118296956e-07, - "loss": 0.46, - "step": 82970 - }, - { - "epoch": 2.13, - "learning_rate": 4.1257745780224586e-07, - "loss": 0.4155, - "step": 82971 - }, - { - "epoch": 2.13, - "learning_rate": 4.125550648712849e-07, - "loss": 0.5103, - "step": 82972 - }, - { - "epoch": 2.13, - "learning_rate": 4.1253267239010325e-07, - "loss": 0.4565, - "step": 82973 - }, - { - "epoch": 2.13, - "learning_rate": 4.125102803587182e-07, - "loss": 0.436, - "step": 82974 - }, - { - "epoch": 2.13, - "learning_rate": 4.1248788877714735e-07, - "loss": 0.3591, - "step": 82975 - }, - { - "epoch": 2.13, - "learning_rate": 4.124654976454073e-07, - "loss": 0.3071, - "step": 82976 - }, - { - "epoch": 2.13, - "learning_rate": 4.124431069635153e-07, - "loss": 0.4487, - "step": 82977 - }, - { - "epoch": 2.13, - "learning_rate": 4.124207167314886e-07, - "loss": 0.4727, - "step": 82978 - }, - { - "epoch": 2.13, - "learning_rate": 4.123983269493447e-07, - "loss": 0.2476, - "step": 82979 - }, - { - "epoch": 2.13, - "learning_rate": 4.123759376171004e-07, - "loss": 0.3599, - "step": 82980 - }, - { - "epoch": 2.13, - "learning_rate": 4.1235354873477246e-07, - "loss": 0.3208, - "step": 82981 - }, - { - "epoch": 2.13, - "learning_rate": 4.1233116030237833e-07, - "loss": 0.3882, - "step": 82982 - }, - { - "epoch": 2.13, - "learning_rate": 4.123087723199353e-07, - "loss": 0.4487, - "step": 82983 - }, - { - "epoch": 2.13, - "learning_rate": 4.122863847874607e-07, - "loss": 0.3518, - "step": 82984 - }, - { - "epoch": 2.13, - "learning_rate": 4.1226399770497113e-07, - "loss": 0.4121, - "step": 82985 - }, - { - "epoch": 2.13, - "learning_rate": 4.122416110724839e-07, - "loss": 0.4482, - "step": 82986 - }, - { - "epoch": 2.13, - "learning_rate": 4.122192248900163e-07, - "loss": 0.397, - "step": 82987 - }, - { - "epoch": 2.13, - "learning_rate": 4.1219683915758574e-07, - "loss": 0.3525, - "step": 82988 - }, - { - "epoch": 2.13, - "learning_rate": 4.121744538752091e-07, - "loss": 0.2573, - "step": 82989 - }, - { - "epoch": 2.13, - "learning_rate": 4.12152069042903e-07, - "loss": 0.406, - "step": 82990 - }, - { - "epoch": 2.13, - "learning_rate": 4.121296846606851e-07, - "loss": 0.3861, - "step": 82991 - }, - { - "epoch": 2.13, - "learning_rate": 4.121073007285728e-07, - "loss": 0.4541, - "step": 82992 - }, - { - "epoch": 2.13, - "learning_rate": 4.120849172465825e-07, - "loss": 0.3799, - "step": 82993 - }, - { - "epoch": 2.13, - "learning_rate": 4.1206253421473183e-07, - "loss": 0.3867, - "step": 82994 - }, - { - "epoch": 2.13, - "learning_rate": 4.1204015163303774e-07, - "loss": 0.52, - "step": 82995 - }, - { - "epoch": 2.13, - "learning_rate": 4.120177695015179e-07, - "loss": 0.4785, - "step": 82996 - }, - { - "epoch": 2.13, - "learning_rate": 4.119953878201886e-07, - "loss": 0.3132, - "step": 82997 - }, - { - "epoch": 2.13, - "learning_rate": 4.1197300658906753e-07, - "loss": 0.4951, - "step": 82998 - }, - { - "epoch": 2.13, - "learning_rate": 4.1195062580817195e-07, - "loss": 0.5195, - "step": 82999 - }, - { - "epoch": 2.13, - "learning_rate": 4.1192824547751837e-07, - "loss": 0.417, - "step": 83000 - }, - { - "epoch": 2.13, - "learning_rate": 4.119058655971247e-07, - "loss": 0.4248, - "step": 83001 - }, - { - "epoch": 2.13, - "learning_rate": 4.118834861670073e-07, - "loss": 0.356, - "step": 83002 - }, - { - "epoch": 2.13, - "learning_rate": 4.1186110718718356e-07, - "loss": 0.3394, - "step": 83003 - }, - { - "epoch": 2.13, - "learning_rate": 4.118387286576709e-07, - "loss": 0.4407, - "step": 83004 - }, - { - "epoch": 2.13, - "learning_rate": 4.1181635057848654e-07, - "loss": 0.252, - "step": 83005 - }, - { - "epoch": 2.13, - "learning_rate": 4.1179397294964704e-07, - "loss": 0.4194, - "step": 83006 - }, - { - "epoch": 2.13, - "learning_rate": 4.117715957711698e-07, - "loss": 0.4136, - "step": 83007 - }, - { - "epoch": 2.13, - "learning_rate": 4.1174921904307204e-07, - "loss": 0.4292, - "step": 83008 - }, - { - "epoch": 2.13, - "learning_rate": 4.1172684276537164e-07, - "loss": 0.4368, - "step": 83009 - }, - { - "epoch": 2.13, - "learning_rate": 4.1170446693808413e-07, - "loss": 0.4556, - "step": 83010 - }, - { - "epoch": 2.13, - "learning_rate": 4.1168209156122747e-07, - "loss": 0.4736, - "step": 83011 - }, - { - "epoch": 2.13, - "learning_rate": 4.116597166348188e-07, - "loss": 0.3511, - "step": 83012 - }, - { - "epoch": 2.13, - "learning_rate": 4.116373421588756e-07, - "loss": 0.4658, - "step": 83013 - }, - { - "epoch": 2.13, - "learning_rate": 4.1161496813341424e-07, - "loss": 0.4292, - "step": 83014 - }, - { - "epoch": 2.13, - "learning_rate": 4.115925945584522e-07, - "loss": 0.3711, - "step": 83015 - }, - { - "epoch": 2.13, - "learning_rate": 4.1157022143400674e-07, - "loss": 0.3994, - "step": 83016 - }, - { - "epoch": 2.13, - "learning_rate": 4.1154784876009516e-07, - "loss": 0.4624, - "step": 83017 - }, - { - "epoch": 2.13, - "learning_rate": 4.115254765367341e-07, - "loss": 0.4202, - "step": 83018 - }, - { - "epoch": 2.13, - "learning_rate": 4.115031047639412e-07, - "loss": 0.4214, - "step": 83019 - }, - { - "epoch": 2.13, - "learning_rate": 4.1148073344173307e-07, - "loss": 0.3887, - "step": 83020 - }, - { - "epoch": 2.13, - "learning_rate": 4.11458362570127e-07, - "loss": 0.4282, - "step": 83021 - }, - { - "epoch": 2.13, - "learning_rate": 4.114359921491405e-07, - "loss": 0.4993, - "step": 83022 - }, - { - "epoch": 2.13, - "learning_rate": 4.1141362217879014e-07, - "loss": 0.4019, - "step": 83023 - }, - { - "epoch": 2.13, - "learning_rate": 4.1139125265909325e-07, - "loss": 0.347, - "step": 83024 - }, - { - "epoch": 2.13, - "learning_rate": 4.1136888359006706e-07, - "loss": 0.3547, - "step": 83025 - }, - { - "epoch": 2.13, - "learning_rate": 4.11346514971729e-07, - "loss": 0.395, - "step": 83026 - }, - { - "epoch": 2.13, - "learning_rate": 4.1132414680409543e-07, - "loss": 0.3541, - "step": 83027 - }, - { - "epoch": 2.13, - "learning_rate": 4.1130177908718386e-07, - "loss": 0.4331, - "step": 83028 - }, - { - "epoch": 2.13, - "learning_rate": 4.112794118210119e-07, - "loss": 0.3376, - "step": 83029 - }, - { - "epoch": 2.13, - "learning_rate": 4.112570450055962e-07, - "loss": 0.4209, - "step": 83030 - }, - { - "epoch": 2.13, - "learning_rate": 4.1123467864095363e-07, - "loss": 0.519, - "step": 83031 - }, - { - "epoch": 2.13, - "learning_rate": 4.1121231272710146e-07, - "loss": 0.3594, - "step": 83032 - }, - { - "epoch": 2.13, - "learning_rate": 4.11189947264057e-07, - "loss": 0.3245, - "step": 83033 - }, - { - "epoch": 2.13, - "learning_rate": 4.111675822518377e-07, - "loss": 0.4629, - "step": 83034 - }, - { - "epoch": 2.13, - "learning_rate": 4.1114521769045995e-07, - "loss": 0.4038, - "step": 83035 - }, - { - "epoch": 2.13, - "learning_rate": 4.1112285357994124e-07, - "loss": 0.3984, - "step": 83036 - }, - { - "epoch": 2.13, - "learning_rate": 4.1110048992029865e-07, - "loss": 0.4146, - "step": 83037 - }, - { - "epoch": 2.13, - "learning_rate": 4.1107812671154963e-07, - "loss": 0.457, - "step": 83038 - }, - { - "epoch": 2.13, - "learning_rate": 4.110557639537111e-07, - "loss": 0.4297, - "step": 83039 - }, - { - "epoch": 2.13, - "learning_rate": 4.1103340164679976e-07, - "loss": 0.4177, - "step": 83040 - }, - { - "epoch": 2.13, - "learning_rate": 4.11011039790833e-07, - "loss": 0.3159, - "step": 83041 - }, - { - "epoch": 2.13, - "learning_rate": 4.109886783858281e-07, - "loss": 0.4312, - "step": 83042 - }, - { - "epoch": 2.13, - "learning_rate": 4.109663174318023e-07, - "loss": 0.3975, - "step": 83043 - }, - { - "epoch": 2.13, - "learning_rate": 4.1094395692877216e-07, - "loss": 0.4468, - "step": 83044 - }, - { - "epoch": 2.13, - "learning_rate": 4.109215968767552e-07, - "loss": 0.447, - "step": 83045 - }, - { - "epoch": 2.13, - "learning_rate": 4.1089923727576893e-07, - "loss": 0.3708, - "step": 83046 - }, - { - "epoch": 2.13, - "learning_rate": 4.108768781258295e-07, - "loss": 0.407, - "step": 83047 - }, - { - "epoch": 2.13, - "learning_rate": 4.1085451942695504e-07, - "loss": 0.3679, - "step": 83048 - }, - { - "epoch": 2.13, - "learning_rate": 4.1083216117916175e-07, - "loss": 0.3955, - "step": 83049 - }, - { - "epoch": 2.13, - "learning_rate": 4.108098033824673e-07, - "loss": 0.4399, - "step": 83050 - }, - { - "epoch": 2.13, - "learning_rate": 4.1078744603688896e-07, - "loss": 0.3162, - "step": 83051 - }, - { - "epoch": 2.13, - "learning_rate": 4.1076508914244325e-07, - "loss": 0.4468, - "step": 83052 - }, - { - "epoch": 2.13, - "learning_rate": 4.107427326991475e-07, - "loss": 0.4585, - "step": 83053 - }, - { - "epoch": 2.13, - "learning_rate": 4.107203767070191e-07, - "loss": 0.4873, - "step": 83054 - }, - { - "epoch": 2.13, - "learning_rate": 4.1069802116607533e-07, - "loss": 0.2744, - "step": 83055 - }, - { - "epoch": 2.13, - "learning_rate": 4.106756660763325e-07, - "loss": 0.3135, - "step": 83056 - }, - { - "epoch": 2.13, - "learning_rate": 4.1065331143780844e-07, - "loss": 0.4741, - "step": 83057 - }, - { - "epoch": 2.13, - "learning_rate": 4.106309572505202e-07, - "loss": 0.4399, - "step": 83058 - }, - { - "epoch": 2.13, - "learning_rate": 4.1060860351448454e-07, - "loss": 0.519, - "step": 83059 - }, - { - "epoch": 2.13, - "learning_rate": 4.1058625022971907e-07, - "loss": 0.3208, - "step": 83060 - }, - { - "epoch": 2.13, - "learning_rate": 4.105638973962402e-07, - "loss": 0.458, - "step": 83061 - }, - { - "epoch": 2.13, - "learning_rate": 4.1054154501406547e-07, - "loss": 0.4646, - "step": 83062 - }, - { - "epoch": 2.13, - "learning_rate": 4.1051919308321234e-07, - "loss": 0.4038, - "step": 83063 - }, - { - "epoch": 2.13, - "learning_rate": 4.104968416036972e-07, - "loss": 0.3723, - "step": 83064 - }, - { - "epoch": 2.13, - "learning_rate": 4.1047449057553753e-07, - "loss": 0.4253, - "step": 83065 - }, - { - "epoch": 2.13, - "learning_rate": 4.1045213999875053e-07, - "loss": 0.2243, - "step": 83066 - }, - { - "epoch": 2.13, - "learning_rate": 4.104297898733534e-07, - "loss": 0.4423, - "step": 83067 - }, - { - "epoch": 2.13, - "learning_rate": 4.1040744019936314e-07, - "loss": 0.5171, - "step": 83068 - }, - { - "epoch": 2.13, - "learning_rate": 4.103850909767964e-07, - "loss": 0.2869, - "step": 83069 - }, - { - "epoch": 2.13, - "learning_rate": 4.103627422056708e-07, - "loss": 0.4048, - "step": 83070 - }, - { - "epoch": 2.13, - "learning_rate": 4.103403938860033e-07, - "loss": 0.3235, - "step": 83071 - }, - { - "epoch": 2.13, - "learning_rate": 4.103180460178113e-07, - "loss": 0.4075, - "step": 83072 - }, - { - "epoch": 2.13, - "learning_rate": 4.1029569860111136e-07, - "loss": 0.4497, - "step": 83073 - }, - { - "epoch": 2.13, - "learning_rate": 4.102733516359209e-07, - "loss": 0.5298, - "step": 83074 - }, - { - "epoch": 2.13, - "learning_rate": 4.102510051222571e-07, - "loss": 0.563, - "step": 83075 - }, - { - "epoch": 2.13, - "learning_rate": 4.1022865906013727e-07, - "loss": 0.3354, - "step": 83076 - }, - { - "epoch": 2.13, - "learning_rate": 4.102063134495778e-07, - "loss": 0.2767, - "step": 83077 - }, - { - "epoch": 2.13, - "learning_rate": 4.1018396829059665e-07, - "loss": 0.4043, - "step": 83078 - }, - { - "epoch": 2.13, - "learning_rate": 4.1016162358321027e-07, - "loss": 0.4723, - "step": 83079 - }, - { - "epoch": 2.13, - "learning_rate": 4.1013927932743586e-07, - "loss": 0.347, - "step": 83080 - }, - { - "epoch": 2.13, - "learning_rate": 4.101169355232911e-07, - "loss": 0.4775, - "step": 83081 - }, - { - "epoch": 2.13, - "learning_rate": 4.1009459217079236e-07, - "loss": 0.4385, - "step": 83082 - }, - { - "epoch": 2.13, - "learning_rate": 4.10072249269957e-07, - "loss": 0.4575, - "step": 83083 - }, - { - "epoch": 2.13, - "learning_rate": 4.1004990682080253e-07, - "loss": 0.501, - "step": 83084 - }, - { - "epoch": 2.13, - "learning_rate": 4.1002756482334544e-07, - "loss": 0.3926, - "step": 83085 - }, - { - "epoch": 2.13, - "learning_rate": 4.100052232776031e-07, - "loss": 0.4087, - "step": 83086 - }, - { - "epoch": 2.13, - "learning_rate": 4.099828821835926e-07, - "loss": 0.3324, - "step": 83087 - }, - { - "epoch": 2.13, - "learning_rate": 4.099605415413314e-07, - "loss": 0.4126, - "step": 83088 - }, - { - "epoch": 2.13, - "learning_rate": 4.0993820135083635e-07, - "loss": 0.498, - "step": 83089 - }, - { - "epoch": 2.13, - "learning_rate": 4.099158616121241e-07, - "loss": 0.4448, - "step": 83090 - }, - { - "epoch": 2.13, - "learning_rate": 4.0989352232521226e-07, - "loss": 0.3461, - "step": 83091 - }, - { - "epoch": 2.13, - "learning_rate": 4.098711834901176e-07, - "loss": 0.4683, - "step": 83092 - }, - { - "epoch": 2.13, - "learning_rate": 4.098488451068579e-07, - "loss": 0.4312, - "step": 83093 - }, - { - "epoch": 2.13, - "learning_rate": 4.0982650717544953e-07, - "loss": 0.4143, - "step": 83094 - }, - { - "epoch": 2.13, - "learning_rate": 4.098041696959098e-07, - "loss": 0.4707, - "step": 83095 - }, - { - "epoch": 2.13, - "learning_rate": 4.0978183266825583e-07, - "loss": 0.3738, - "step": 83096 - }, - { - "epoch": 2.13, - "learning_rate": 4.0975949609250517e-07, - "loss": 0.4666, - "step": 83097 - }, - { - "epoch": 2.13, - "learning_rate": 4.0973715996867453e-07, - "loss": 0.2965, - "step": 83098 - }, - { - "epoch": 2.13, - "learning_rate": 4.097148242967806e-07, - "loss": 0.2426, - "step": 83099 - }, - { - "epoch": 2.13, - "learning_rate": 4.0969248907684096e-07, - "loss": 0.4761, - "step": 83100 - }, - { - "epoch": 2.13, - "learning_rate": 4.0967015430887296e-07, - "loss": 0.3804, - "step": 83101 - }, - { - "epoch": 2.13, - "learning_rate": 4.09647819992893e-07, - "loss": 0.4668, - "step": 83102 - }, - { - "epoch": 2.13, - "learning_rate": 4.0962548612891866e-07, - "loss": 0.4102, - "step": 83103 - }, - { - "epoch": 2.13, - "learning_rate": 4.0960315271696687e-07, - "loss": 0.397, - "step": 83104 - }, - { - "epoch": 2.13, - "learning_rate": 4.095808197570552e-07, - "loss": 0.2809, - "step": 83105 - }, - { - "epoch": 2.13, - "learning_rate": 4.0955848724919983e-07, - "loss": 0.5127, - "step": 83106 - }, - { - "epoch": 2.13, - "learning_rate": 4.0953615519341857e-07, - "loss": 0.4001, - "step": 83107 - }, - { - "epoch": 2.13, - "learning_rate": 4.0951382358972855e-07, - "loss": 0.3174, - "step": 83108 - }, - { - "epoch": 2.13, - "learning_rate": 4.094914924381463e-07, - "loss": 0.46, - "step": 83109 - }, - { - "epoch": 2.13, - "learning_rate": 4.094691617386897e-07, - "loss": 0.3065, - "step": 83110 - }, - { - "epoch": 2.13, - "learning_rate": 4.0944683149137503e-07, - "loss": 0.4214, - "step": 83111 - }, - { - "epoch": 2.13, - "learning_rate": 4.094245016962197e-07, - "loss": 0.416, - "step": 83112 - }, - { - "epoch": 2.13, - "learning_rate": 4.0940217235324095e-07, - "loss": 0.4126, - "step": 83113 - }, - { - "epoch": 2.13, - "learning_rate": 4.0937984346245616e-07, - "loss": 0.4534, - "step": 83114 - }, - { - "epoch": 2.13, - "learning_rate": 4.093575150238816e-07, - "loss": 0.3156, - "step": 83115 - }, - { - "epoch": 2.13, - "learning_rate": 4.093351870375349e-07, - "loss": 0.4678, - "step": 83116 - }, - { - "epoch": 2.13, - "learning_rate": 4.093128595034331e-07, - "loss": 0.4238, - "step": 83117 - }, - { - "epoch": 2.13, - "learning_rate": 4.092905324215941e-07, - "loss": 0.4047, - "step": 83118 - }, - { - "epoch": 2.13, - "learning_rate": 4.0926820579203326e-07, - "loss": 0.4463, - "step": 83119 - }, - { - "epoch": 2.13, - "learning_rate": 4.0924587961476875e-07, - "loss": 0.4153, - "step": 83120 - }, - { - "epoch": 2.13, - "learning_rate": 4.0922355388981746e-07, - "loss": 0.3105, - "step": 83121 - }, - { - "epoch": 2.13, - "learning_rate": 4.0920122861719685e-07, - "loss": 0.4272, - "step": 83122 - }, - { - "epoch": 2.13, - "learning_rate": 4.0917890379692333e-07, - "loss": 0.4536, - "step": 83123 - }, - { - "epoch": 2.13, - "learning_rate": 4.091565794290144e-07, - "loss": 0.2917, - "step": 83124 - }, - { - "epoch": 2.13, - "learning_rate": 4.0913425551348714e-07, - "loss": 0.373, - "step": 83125 - }, - { - "epoch": 2.13, - "learning_rate": 4.0911193205035887e-07, - "loss": 0.4619, - "step": 83126 - }, - { - "epoch": 2.13, - "learning_rate": 4.0908960903964604e-07, - "loss": 0.4324, - "step": 83127 - }, - { - "epoch": 2.13, - "learning_rate": 4.090672864813667e-07, - "loss": 0.4084, - "step": 83128 - }, - { - "epoch": 2.13, - "learning_rate": 4.090449643755368e-07, - "loss": 0.3264, - "step": 83129 - }, - { - "epoch": 2.13, - "learning_rate": 4.0902264272217414e-07, - "loss": 0.4341, - "step": 83130 - }, - { - "epoch": 2.13, - "learning_rate": 4.090003215212959e-07, - "loss": 0.2644, - "step": 83131 - }, - { - "epoch": 2.13, - "learning_rate": 4.089780007729187e-07, - "loss": 0.3489, - "step": 83132 - }, - { - "epoch": 2.13, - "learning_rate": 4.0895568047705973e-07, - "loss": 0.3804, - "step": 83133 - }, - { - "epoch": 2.13, - "learning_rate": 4.089333606337363e-07, - "loss": 0.4524, - "step": 83134 - }, - { - "epoch": 2.13, - "learning_rate": 4.0891104124296583e-07, - "loss": 0.4888, - "step": 83135 - }, - { - "epoch": 2.13, - "learning_rate": 4.0888872230476455e-07, - "loss": 0.4517, - "step": 83136 - }, - { - "epoch": 2.13, - "learning_rate": 4.0886640381915006e-07, - "loss": 0.4458, - "step": 83137 - }, - { - "epoch": 2.13, - "learning_rate": 4.088440857861397e-07, - "loss": 0.3013, - "step": 83138 - }, - { - "epoch": 2.13, - "learning_rate": 4.088217682057502e-07, - "loss": 0.4229, - "step": 83139 - }, - { - "epoch": 2.13, - "learning_rate": 4.087994510779984e-07, - "loss": 0.3479, - "step": 83140 - }, - { - "epoch": 2.13, - "learning_rate": 4.087771344029016e-07, - "loss": 0.3872, - "step": 83141 - }, - { - "epoch": 2.13, - "learning_rate": 4.0875481818047706e-07, - "loss": 0.3605, - "step": 83142 - }, - { - "epoch": 2.13, - "learning_rate": 4.087325024107421e-07, - "loss": 0.5718, - "step": 83143 - }, - { - "epoch": 2.13, - "learning_rate": 4.087101870937131e-07, - "loss": 0.3655, - "step": 83144 - }, - { - "epoch": 2.13, - "learning_rate": 4.086878722294075e-07, - "loss": 0.3687, - "step": 83145 - }, - { - "epoch": 2.13, - "learning_rate": 4.086655578178425e-07, - "loss": 0.5435, - "step": 83146 - }, - { - "epoch": 2.13, - "learning_rate": 4.0864324385903535e-07, - "loss": 0.4272, - "step": 83147 - }, - { - "epoch": 2.13, - "learning_rate": 4.0862093035300294e-07, - "loss": 0.5083, - "step": 83148 - }, - { - "epoch": 2.13, - "learning_rate": 4.0859861729976184e-07, - "loss": 0.3706, - "step": 83149 - }, - { - "epoch": 2.13, - "learning_rate": 4.085763046993297e-07, - "loss": 0.293, - "step": 83150 - }, - { - "epoch": 2.13, - "learning_rate": 4.085539925517234e-07, - "loss": 0.4048, - "step": 83151 - }, - { - "epoch": 2.13, - "learning_rate": 4.0853168085696057e-07, - "loss": 0.3564, - "step": 83152 - }, - { - "epoch": 2.13, - "learning_rate": 4.0850936961505734e-07, - "loss": 0.3638, - "step": 83153 - }, - { - "epoch": 2.13, - "learning_rate": 4.084870588260314e-07, - "loss": 0.4292, - "step": 83154 - }, - { - "epoch": 2.13, - "learning_rate": 4.084647484899001e-07, - "loss": 0.3119, - "step": 83155 - }, - { - "epoch": 2.13, - "learning_rate": 4.084424386066797e-07, - "loss": 0.3955, - "step": 83156 - }, - { - "epoch": 2.13, - "learning_rate": 4.0842012917638767e-07, - "loss": 0.4263, - "step": 83157 - }, - { - "epoch": 2.13, - "learning_rate": 4.083978201990417e-07, - "loss": 0.5073, - "step": 83158 - }, - { - "epoch": 2.13, - "learning_rate": 4.083755116746578e-07, - "loss": 0.3506, - "step": 83159 - }, - { - "epoch": 2.13, - "learning_rate": 4.08353203603254e-07, - "loss": 0.4204, - "step": 83160 - }, - { - "epoch": 2.13, - "learning_rate": 4.083308959848465e-07, - "loss": 0.3601, - "step": 83161 - }, - { - "epoch": 2.13, - "learning_rate": 4.0830858881945286e-07, - "loss": 0.439, - "step": 83162 - }, - { - "epoch": 2.13, - "learning_rate": 4.0828628210709014e-07, - "loss": 0.3564, - "step": 83163 - }, - { - "epoch": 2.13, - "learning_rate": 4.0826397584777585e-07, - "loss": 0.3708, - "step": 83164 - }, - { - "epoch": 2.13, - "learning_rate": 4.082416700415262e-07, - "loss": 0.447, - "step": 83165 - }, - { - "epoch": 2.13, - "learning_rate": 4.082193646883586e-07, - "loss": 0.3799, - "step": 83166 - }, - { - "epoch": 2.13, - "learning_rate": 4.0819705978829035e-07, - "loss": 0.4565, - "step": 83167 - }, - { - "epoch": 2.13, - "learning_rate": 4.0817475534133874e-07, - "loss": 0.4678, - "step": 83168 - }, - { - "epoch": 2.13, - "learning_rate": 4.0815245134752053e-07, - "loss": 0.4376, - "step": 83169 - }, - { - "epoch": 2.13, - "learning_rate": 4.081301478068523e-07, - "loss": 0.3809, - "step": 83170 - }, - { - "epoch": 2.13, - "learning_rate": 4.0810784471935166e-07, - "loss": 0.3955, - "step": 83171 - }, - { - "epoch": 2.13, - "learning_rate": 4.08085542085036e-07, - "loss": 0.5132, - "step": 83172 - }, - { - "epoch": 2.13, - "learning_rate": 4.0806323990392165e-07, - "loss": 0.4077, - "step": 83173 - }, - { - "epoch": 2.13, - "learning_rate": 4.0804093817602616e-07, - "loss": 0.314, - "step": 83174 - }, - { - "epoch": 2.13, - "learning_rate": 4.080186369013664e-07, - "loss": 0.252, - "step": 83175 - }, - { - "epoch": 2.13, - "learning_rate": 4.0799633607995985e-07, - "loss": 0.5044, - "step": 83176 - }, - { - "epoch": 2.13, - "learning_rate": 4.07974035711823e-07, - "loss": 0.5347, - "step": 83177 - }, - { - "epoch": 2.13, - "learning_rate": 4.079517357969736e-07, - "loss": 0.3833, - "step": 83178 - }, - { - "epoch": 2.13, - "learning_rate": 4.07929436335428e-07, - "loss": 0.3999, - "step": 83179 - }, - { - "epoch": 2.13, - "learning_rate": 4.079071373272035e-07, - "loss": 0.3838, - "step": 83180 - }, - { - "epoch": 2.13, - "learning_rate": 4.078848387723176e-07, - "loss": 0.354, - "step": 83181 - }, - { - "epoch": 2.13, - "learning_rate": 4.0786254067078683e-07, - "loss": 0.3136, - "step": 83182 - }, - { - "epoch": 2.13, - "learning_rate": 4.0784024302262844e-07, - "loss": 0.3691, - "step": 83183 - }, - { - "epoch": 2.13, - "learning_rate": 4.078179458278596e-07, - "loss": 0.458, - "step": 83184 - }, - { - "epoch": 2.13, - "learning_rate": 4.0779564908649755e-07, - "loss": 0.386, - "step": 83185 - }, - { - "epoch": 2.13, - "learning_rate": 4.0777335279855883e-07, - "loss": 0.3672, - "step": 83186 - }, - { - "epoch": 2.13, - "learning_rate": 4.0775105696406087e-07, - "loss": 0.4619, - "step": 83187 - }, - { - "epoch": 2.13, - "learning_rate": 4.0772876158302105e-07, - "loss": 0.3092, - "step": 83188 - }, - { - "epoch": 2.13, - "learning_rate": 4.0770646665545615e-07, - "loss": 0.4294, - "step": 83189 - }, - { - "epoch": 2.13, - "learning_rate": 4.0768417218138274e-07, - "loss": 0.4463, - "step": 83190 - }, - { - "epoch": 2.13, - "learning_rate": 4.0766187816081833e-07, - "loss": 0.3696, - "step": 83191 - }, - { - "epoch": 2.13, - "learning_rate": 4.076395845937799e-07, - "loss": 0.4263, - "step": 83192 - }, - { - "epoch": 2.13, - "learning_rate": 4.07617291480285e-07, - "loss": 0.5293, - "step": 83193 - }, - { - "epoch": 2.13, - "learning_rate": 4.0759499882035007e-07, - "loss": 0.4844, - "step": 83194 - }, - { - "epoch": 2.13, - "learning_rate": 4.075727066139922e-07, - "loss": 0.3809, - "step": 83195 - }, - { - "epoch": 2.13, - "learning_rate": 4.075504148612289e-07, - "loss": 0.3264, - "step": 83196 - }, - { - "epoch": 2.13, - "learning_rate": 4.075281235620772e-07, - "loss": 0.3569, - "step": 83197 - }, - { - "epoch": 2.13, - "learning_rate": 4.0750583271655403e-07, - "loss": 0.3701, - "step": 83198 - }, - { - "epoch": 2.13, - "learning_rate": 4.0748354232467607e-07, - "loss": 0.4082, - "step": 83199 - }, - { - "epoch": 2.13, - "learning_rate": 4.074612523864607e-07, - "loss": 0.5229, - "step": 83200 - }, - { - "epoch": 2.13, - "learning_rate": 4.074389629019249e-07, - "loss": 0.363, - "step": 83201 - }, - { - "epoch": 2.13, - "learning_rate": 4.0741667387108633e-07, - "loss": 0.3264, - "step": 83202 - }, - { - "epoch": 2.13, - "learning_rate": 4.073943852939612e-07, - "loss": 0.4849, - "step": 83203 - }, - { - "epoch": 2.13, - "learning_rate": 4.073720971705669e-07, - "loss": 0.3733, - "step": 83204 - }, - { - "epoch": 2.13, - "learning_rate": 4.0734980950092046e-07, - "loss": 0.374, - "step": 83205 - }, - { - "epoch": 2.13, - "learning_rate": 4.0732752228503955e-07, - "loss": 0.3726, - "step": 83206 - }, - { - "epoch": 2.13, - "learning_rate": 4.073052355229402e-07, - "loss": 0.4221, - "step": 83207 - }, - { - "epoch": 2.13, - "learning_rate": 4.0728294921464035e-07, - "loss": 0.5073, - "step": 83208 - }, - { - "epoch": 2.13, - "learning_rate": 4.0726066336015643e-07, - "loss": 0.3848, - "step": 83209 - }, - { - "epoch": 2.13, - "learning_rate": 4.07238377959506e-07, - "loss": 0.4268, - "step": 83210 - }, - { - "epoch": 2.13, - "learning_rate": 4.0721609301270563e-07, - "loss": 0.3779, - "step": 83211 - }, - { - "epoch": 2.13, - "learning_rate": 4.071938085197726e-07, - "loss": 0.3662, - "step": 83212 - }, - { - "epoch": 2.13, - "learning_rate": 4.07171524480724e-07, - "loss": 0.4443, - "step": 83213 - }, - { - "epoch": 2.13, - "learning_rate": 4.0714924089557734e-07, - "loss": 0.3882, - "step": 83214 - }, - { - "epoch": 2.13, - "learning_rate": 4.071269577643488e-07, - "loss": 0.3184, - "step": 83215 - }, - { - "epoch": 2.13, - "learning_rate": 4.0710467508705593e-07, - "loss": 0.3633, - "step": 83216 - }, - { - "epoch": 2.13, - "learning_rate": 4.070823928637157e-07, - "loss": 0.4026, - "step": 83217 - }, - { - "epoch": 2.13, - "learning_rate": 4.070601110943457e-07, - "loss": 0.3416, - "step": 83218 - }, - { - "epoch": 2.13, - "learning_rate": 4.070378297789624e-07, - "loss": 0.4893, - "step": 83219 - }, - { - "epoch": 2.13, - "learning_rate": 4.070155489175826e-07, - "loss": 0.4351, - "step": 83220 - }, - { - "epoch": 2.13, - "learning_rate": 4.0699326851022376e-07, - "loss": 0.3874, - "step": 83221 - }, - { - "epoch": 2.13, - "learning_rate": 4.069709885569029e-07, - "loss": 0.3058, - "step": 83222 - }, - { - "epoch": 2.13, - "learning_rate": 4.0694870905763747e-07, - "loss": 0.3589, - "step": 83223 - }, - { - "epoch": 2.13, - "learning_rate": 4.0692643001244373e-07, - "loss": 0.4199, - "step": 83224 - }, - { - "epoch": 2.13, - "learning_rate": 4.0690415142133917e-07, - "loss": 0.446, - "step": 83225 - }, - { - "epoch": 2.13, - "learning_rate": 4.068818732843412e-07, - "loss": 0.321, - "step": 83226 - }, - { - "epoch": 2.13, - "learning_rate": 4.0685959560146623e-07, - "loss": 0.4458, - "step": 83227 - }, - { - "epoch": 2.13, - "learning_rate": 4.0683731837273184e-07, - "loss": 0.3337, - "step": 83228 - }, - { - "epoch": 2.13, - "learning_rate": 4.068150415981545e-07, - "loss": 0.5283, - "step": 83229 - }, - { - "epoch": 2.13, - "learning_rate": 4.0679276527775166e-07, - "loss": 0.282, - "step": 83230 - }, - { - "epoch": 2.13, - "learning_rate": 4.067704894115407e-07, - "loss": 0.375, - "step": 83231 - }, - { - "epoch": 2.13, - "learning_rate": 4.0674821399953783e-07, - "loss": 0.5376, - "step": 83232 - }, - { - "epoch": 2.13, - "learning_rate": 4.0672593904176066e-07, - "loss": 0.4426, - "step": 83233 - }, - { - "epoch": 2.13, - "learning_rate": 4.0670366453822613e-07, - "loss": 0.4236, - "step": 83234 - }, - { - "epoch": 2.13, - "learning_rate": 4.066813904889517e-07, - "loss": 0.3948, - "step": 83235 - }, - { - "epoch": 2.13, - "learning_rate": 4.066591168939536e-07, - "loss": 0.2944, - "step": 83236 - }, - { - "epoch": 2.13, - "learning_rate": 4.066368437532495e-07, - "loss": 0.4194, - "step": 83237 - }, - { - "epoch": 2.13, - "learning_rate": 4.066145710668565e-07, - "loss": 0.4263, - "step": 83238 - }, - { - "epoch": 2.13, - "learning_rate": 4.0659229883479117e-07, - "loss": 0.4531, - "step": 83239 - }, - { - "epoch": 2.13, - "learning_rate": 4.0657002705707113e-07, - "loss": 0.5151, - "step": 83240 - }, - { - "epoch": 2.13, - "learning_rate": 4.065477557337128e-07, - "loss": 0.3707, - "step": 83241 - }, - { - "epoch": 2.13, - "learning_rate": 4.065254848647336e-07, - "loss": 0.4321, - "step": 83242 - }, - { - "epoch": 2.13, - "learning_rate": 4.065032144501505e-07, - "loss": 0.4033, - "step": 83243 - }, - { - "epoch": 2.13, - "learning_rate": 4.0648094448998093e-07, - "loss": 0.4023, - "step": 83244 - }, - { - "epoch": 2.13, - "learning_rate": 4.0645867498424123e-07, - "loss": 0.3216, - "step": 83245 - }, - { - "epoch": 2.13, - "learning_rate": 4.0643640593294894e-07, - "loss": 0.3733, - "step": 83246 - }, - { - "epoch": 2.13, - "learning_rate": 4.064141373361213e-07, - "loss": 0.4014, - "step": 83247 - }, - { - "epoch": 2.13, - "learning_rate": 4.063918691937751e-07, - "loss": 0.4419, - "step": 83248 - }, - { - "epoch": 2.13, - "learning_rate": 4.0636960150592694e-07, - "loss": 0.2581, - "step": 83249 - }, - { - "epoch": 2.13, - "learning_rate": 4.0634733427259426e-07, - "loss": 0.4761, - "step": 83250 - }, - { - "epoch": 2.13, - "learning_rate": 4.0632506749379423e-07, - "loss": 0.4575, - "step": 83251 - }, - { - "epoch": 2.13, - "learning_rate": 4.0630280116954405e-07, - "loss": 0.4097, - "step": 83252 - }, - { - "epoch": 2.13, - "learning_rate": 4.062805352998603e-07, - "loss": 0.3047, - "step": 83253 - }, - { - "epoch": 2.13, - "learning_rate": 4.0625826988476007e-07, - "loss": 0.3608, - "step": 83254 - }, - { - "epoch": 2.13, - "learning_rate": 4.0623600492426067e-07, - "loss": 0.3574, - "step": 83255 - }, - { - "epoch": 2.13, - "learning_rate": 4.0621374041837943e-07, - "loss": 0.417, - "step": 83256 - }, - { - "epoch": 2.13, - "learning_rate": 4.061914763671326e-07, - "loss": 0.3225, - "step": 83257 - }, - { - "epoch": 2.13, - "learning_rate": 4.061692127705381e-07, - "loss": 0.3848, - "step": 83258 - }, - { - "epoch": 2.13, - "learning_rate": 4.0614694962861207e-07, - "loss": 0.3008, - "step": 83259 - }, - { - "epoch": 2.13, - "learning_rate": 4.0612468694137213e-07, - "loss": 0.4355, - "step": 83260 - }, - { - "epoch": 2.13, - "learning_rate": 4.0610242470883547e-07, - "loss": 0.4014, - "step": 83261 - }, - { - "epoch": 2.13, - "learning_rate": 4.0608016293101854e-07, - "loss": 0.4282, - "step": 83262 - }, - { - "epoch": 2.13, - "learning_rate": 4.060579016079387e-07, - "loss": 0.4868, - "step": 83263 - }, - { - "epoch": 2.13, - "learning_rate": 4.060356407396135e-07, - "loss": 0.2797, - "step": 83264 - }, - { - "epoch": 2.13, - "learning_rate": 4.0601338032605903e-07, - "loss": 0.3059, - "step": 83265 - }, - { - "epoch": 2.13, - "learning_rate": 4.059911203672929e-07, - "loss": 0.4172, - "step": 83266 - }, - { - "epoch": 2.13, - "learning_rate": 4.0596886086333195e-07, - "loss": 0.4502, - "step": 83267 - }, - { - "epoch": 2.13, - "learning_rate": 4.059466018141937e-07, - "loss": 0.4839, - "step": 83268 - }, - { - "epoch": 2.13, - "learning_rate": 4.059243432198948e-07, - "loss": 0.5562, - "step": 83269 - }, - { - "epoch": 2.13, - "learning_rate": 4.05902085080452e-07, - "loss": 0.5615, - "step": 83270 - }, - { - "epoch": 2.13, - "learning_rate": 4.0587982739588265e-07, - "loss": 0.3302, - "step": 83271 - }, - { - "epoch": 2.13, - "learning_rate": 4.0585757016620383e-07, - "loss": 0.4141, - "step": 83272 - }, - { - "epoch": 2.13, - "learning_rate": 4.0583531339143286e-07, - "loss": 0.3828, - "step": 83273 - }, - { - "epoch": 2.13, - "learning_rate": 4.0581305707158607e-07, - "loss": 0.2847, - "step": 83274 - }, - { - "epoch": 2.13, - "learning_rate": 4.05790801206681e-07, - "loss": 0.4131, - "step": 83275 - }, - { - "epoch": 2.13, - "learning_rate": 4.0576854579673457e-07, - "loss": 0.5278, - "step": 83276 - }, - { - "epoch": 2.13, - "learning_rate": 4.0574629084176417e-07, - "loss": 0.4187, - "step": 83277 - }, - { - "epoch": 2.13, - "learning_rate": 4.057240363417865e-07, - "loss": 0.4019, - "step": 83278 - }, - { - "epoch": 2.13, - "learning_rate": 4.057017822968183e-07, - "loss": 0.3721, - "step": 83279 - }, - { - "epoch": 2.13, - "learning_rate": 4.0567952870687684e-07, - "loss": 0.4102, - "step": 83280 - }, - { - "epoch": 2.13, - "learning_rate": 4.056572755719797e-07, - "loss": 0.2705, - "step": 83281 - }, - { - "epoch": 2.13, - "learning_rate": 4.0563502289214303e-07, - "loss": 0.4521, - "step": 83282 - }, - { - "epoch": 2.13, - "learning_rate": 4.0561277066738433e-07, - "loss": 0.4946, - "step": 83283 - }, - { - "epoch": 2.13, - "learning_rate": 4.0559051889772056e-07, - "loss": 0.4507, - "step": 83284 - }, - { - "epoch": 2.13, - "learning_rate": 4.055682675831692e-07, - "loss": 0.4375, - "step": 83285 - }, - { - "epoch": 2.13, - "learning_rate": 4.0554601672374643e-07, - "loss": 0.502, - "step": 83286 - }, - { - "epoch": 2.13, - "learning_rate": 4.0552376631946986e-07, - "loss": 0.3187, - "step": 83287 - }, - { - "epoch": 2.13, - "learning_rate": 4.055015163703567e-07, - "loss": 0.3848, - "step": 83288 - }, - { - "epoch": 2.13, - "learning_rate": 4.0547926687642334e-07, - "loss": 0.5356, - "step": 83289 - }, - { - "epoch": 2.13, - "learning_rate": 4.054570178376876e-07, - "loss": 0.3408, - "step": 83290 - }, - { - "epoch": 2.13, - "learning_rate": 4.0543476925416567e-07, - "loss": 0.481, - "step": 83291 - }, - { - "epoch": 2.13, - "learning_rate": 4.05412521125875e-07, - "loss": 0.4766, - "step": 83292 - }, - { - "epoch": 2.13, - "learning_rate": 4.053902734528325e-07, - "loss": 0.343, - "step": 83293 - }, - { - "epoch": 2.13, - "learning_rate": 4.0536802623505585e-07, - "loss": 0.4624, - "step": 83294 - }, - { - "epoch": 2.13, - "learning_rate": 4.053457794725611e-07, - "loss": 0.3701, - "step": 83295 - }, - { - "epoch": 2.13, - "learning_rate": 4.053235331653658e-07, - "loss": 0.4756, - "step": 83296 - }, - { - "epoch": 2.13, - "learning_rate": 4.05301287313487e-07, - "loss": 0.501, - "step": 83297 - }, - { - "epoch": 2.13, - "learning_rate": 4.052790419169423e-07, - "loss": 0.3893, - "step": 83298 - }, - { - "epoch": 2.13, - "learning_rate": 4.052567969757473e-07, - "loss": 0.4119, - "step": 83299 - }, - { - "epoch": 2.14, - "learning_rate": 4.0523455248991986e-07, - "loss": 0.4839, - "step": 83300 - }, - { - "epoch": 2.14, - "learning_rate": 4.0521230845947707e-07, - "loss": 0.376, - "step": 83301 - }, - { - "epoch": 2.14, - "learning_rate": 4.051900648844362e-07, - "loss": 0.3848, - "step": 83302 - }, - { - "epoch": 2.14, - "learning_rate": 4.051678217648136e-07, - "loss": 0.3245, - "step": 83303 - }, - { - "epoch": 2.14, - "learning_rate": 4.051455791006265e-07, - "loss": 0.3804, - "step": 83304 - }, - { - "epoch": 2.14, - "learning_rate": 4.051233368918923e-07, - "loss": 0.308, - "step": 83305 - }, - { - "epoch": 2.14, - "learning_rate": 4.05101095138628e-07, - "loss": 0.5176, - "step": 83306 - }, - { - "epoch": 2.14, - "learning_rate": 4.050788538408501e-07, - "loss": 0.4614, - "step": 83307 - }, - { - "epoch": 2.14, - "learning_rate": 4.050566129985763e-07, - "loss": 0.3486, - "step": 83308 - }, - { - "epoch": 2.14, - "learning_rate": 4.0503437261182307e-07, - "loss": 0.3419, - "step": 83309 - }, - { - "epoch": 2.14, - "learning_rate": 4.0501213268060755e-07, - "loss": 0.3076, - "step": 83310 - }, - { - "epoch": 2.14, - "learning_rate": 4.0498989320494726e-07, - "loss": 0.4609, - "step": 83311 - }, - { - "epoch": 2.14, - "learning_rate": 4.0496765418485855e-07, - "loss": 0.308, - "step": 83312 - }, - { - "epoch": 2.14, - "learning_rate": 4.0494541562035865e-07, - "loss": 0.4529, - "step": 83313 - }, - { - "epoch": 2.14, - "learning_rate": 4.049231775114648e-07, - "loss": 0.4263, - "step": 83314 - }, - { - "epoch": 2.14, - "learning_rate": 4.049009398581942e-07, - "loss": 0.3438, - "step": 83315 - }, - { - "epoch": 2.14, - "learning_rate": 4.048787026605631e-07, - "loss": 0.459, - "step": 83316 - }, - { - "epoch": 2.14, - "learning_rate": 4.0485646591858926e-07, - "loss": 0.3022, - "step": 83317 - }, - { - "epoch": 2.14, - "learning_rate": 4.0483422963228965e-07, - "loss": 0.4194, - "step": 83318 - }, - { - "epoch": 2.14, - "learning_rate": 4.048119938016812e-07, - "loss": 0.4596, - "step": 83319 - }, - { - "epoch": 2.14, - "learning_rate": 4.0478975842678044e-07, - "loss": 0.4785, - "step": 83320 - }, - { - "epoch": 2.14, - "learning_rate": 4.047675235076048e-07, - "loss": 0.3916, - "step": 83321 - }, - { - "epoch": 2.14, - "learning_rate": 4.0474528904417126e-07, - "loss": 0.3528, - "step": 83322 - }, - { - "epoch": 2.14, - "learning_rate": 4.047230550364973e-07, - "loss": 0.4727, - "step": 83323 - }, - { - "epoch": 2.14, - "learning_rate": 4.0470082148459907e-07, - "loss": 0.4976, - "step": 83324 - }, - { - "epoch": 2.14, - "learning_rate": 4.046785883884941e-07, - "loss": 0.4448, - "step": 83325 - }, - { - "epoch": 2.14, - "learning_rate": 4.0465635574819933e-07, - "loss": 0.2217, - "step": 83326 - }, - { - "epoch": 2.14, - "learning_rate": 4.0463412356373226e-07, - "loss": 0.5034, - "step": 83327 - }, - { - "epoch": 2.14, - "learning_rate": 4.046118918351095e-07, - "loss": 0.3962, - "step": 83328 - }, - { - "epoch": 2.14, - "learning_rate": 4.0458966056234754e-07, - "loss": 0.3594, - "step": 83329 - }, - { - "epoch": 2.14, - "learning_rate": 4.04567429745464e-07, - "loss": 0.3682, - "step": 83330 - }, - { - "epoch": 2.14, - "learning_rate": 4.0454519938447573e-07, - "loss": 0.3511, - "step": 83331 - }, - { - "epoch": 2.14, - "learning_rate": 4.045229694794002e-07, - "loss": 0.3728, - "step": 83332 - }, - { - "epoch": 2.14, - "learning_rate": 4.045007400302537e-07, - "loss": 0.5015, - "step": 83333 - }, - { - "epoch": 2.14, - "learning_rate": 4.0447851103705354e-07, - "loss": 0.478, - "step": 83334 - }, - { - "epoch": 2.14, - "learning_rate": 4.0445628249981733e-07, - "loss": 0.3931, - "step": 83335 - }, - { - "epoch": 2.14, - "learning_rate": 4.0443405441856103e-07, - "loss": 0.5327, - "step": 83336 - }, - { - "epoch": 2.14, - "learning_rate": 4.044118267933023e-07, - "loss": 0.3411, - "step": 83337 - }, - { - "epoch": 2.14, - "learning_rate": 4.0438959962405836e-07, - "loss": 0.3726, - "step": 83338 - }, - { - "epoch": 2.14, - "learning_rate": 4.0436737291084556e-07, - "loss": 0.4839, - "step": 83339 - }, - { - "epoch": 2.14, - "learning_rate": 4.043451466536816e-07, - "loss": 0.4722, - "step": 83340 - }, - { - "epoch": 2.14, - "learning_rate": 4.043229208525829e-07, - "loss": 0.4341, - "step": 83341 - }, - { - "epoch": 2.14, - "learning_rate": 4.043006955075666e-07, - "loss": 0.3055, - "step": 83342 - }, - { - "epoch": 2.14, - "learning_rate": 4.042784706186501e-07, - "loss": 0.4585, - "step": 83343 - }, - { - "epoch": 2.14, - "learning_rate": 4.042562461858503e-07, - "loss": 0.3916, - "step": 83344 - }, - { - "epoch": 2.14, - "learning_rate": 4.042340222091839e-07, - "loss": 0.344, - "step": 83345 - }, - { - "epoch": 2.14, - "learning_rate": 4.0421179868866807e-07, - "loss": 0.438, - "step": 83346 - }, - { - "epoch": 2.14, - "learning_rate": 4.041895756243202e-07, - "loss": 0.418, - "step": 83347 - }, - { - "epoch": 2.14, - "learning_rate": 4.0416735301615666e-07, - "loss": 0.4033, - "step": 83348 - }, - { - "epoch": 2.14, - "learning_rate": 4.041451308641951e-07, - "loss": 0.3691, - "step": 83349 - }, - { - "epoch": 2.14, - "learning_rate": 4.0412290916845184e-07, - "loss": 0.3205, - "step": 83350 - }, - { - "epoch": 2.14, - "learning_rate": 4.0410068792894434e-07, - "loss": 0.3793, - "step": 83351 - }, - { - "epoch": 2.14, - "learning_rate": 4.040784671456898e-07, - "loss": 0.4122, - "step": 83352 - }, - { - "epoch": 2.14, - "learning_rate": 4.0405624681870475e-07, - "loss": 0.3501, - "step": 83353 - }, - { - "epoch": 2.14, - "learning_rate": 4.0403402694800636e-07, - "loss": 0.3669, - "step": 83354 - }, - { - "epoch": 2.14, - "learning_rate": 4.0401180753361177e-07, - "loss": 0.3511, - "step": 83355 - }, - { - "epoch": 2.14, - "learning_rate": 4.0398958857553813e-07, - "loss": 0.4326, - "step": 83356 - }, - { - "epoch": 2.14, - "learning_rate": 4.0396737007380243e-07, - "loss": 0.4067, - "step": 83357 - }, - { - "epoch": 2.14, - "learning_rate": 4.0394515202842103e-07, - "loss": 0.4521, - "step": 83358 - }, - { - "epoch": 2.14, - "learning_rate": 4.039229344394115e-07, - "loss": 0.3966, - "step": 83359 - }, - { - "epoch": 2.14, - "learning_rate": 4.0390071730679074e-07, - "loss": 0.4058, - "step": 83360 - }, - { - "epoch": 2.14, - "learning_rate": 4.0387850063057616e-07, - "loss": 0.3055, - "step": 83361 - }, - { - "epoch": 2.14, - "learning_rate": 4.03856284410784e-07, - "loss": 0.3254, - "step": 83362 - }, - { - "epoch": 2.14, - "learning_rate": 4.038340686474317e-07, - "loss": 0.4185, - "step": 83363 - }, - { - "epoch": 2.14, - "learning_rate": 4.0381185334053627e-07, - "loss": 0.4448, - "step": 83364 - }, - { - "epoch": 2.14, - "learning_rate": 4.03789638490115e-07, - "loss": 0.4878, - "step": 83365 - }, - { - "epoch": 2.14, - "learning_rate": 4.0376742409618434e-07, - "loss": 0.377, - "step": 83366 - }, - { - "epoch": 2.14, - "learning_rate": 4.0374521015876186e-07, - "loss": 0.4106, - "step": 83367 - }, - { - "epoch": 2.14, - "learning_rate": 4.037229966778638e-07, - "loss": 0.3843, - "step": 83368 - }, - { - "epoch": 2.14, - "learning_rate": 4.03700783653508e-07, - "loss": 0.3779, - "step": 83369 - }, - { - "epoch": 2.14, - "learning_rate": 4.036785710857108e-07, - "loss": 0.4985, - "step": 83370 - }, - { - "epoch": 2.14, - "learning_rate": 4.0365635897448946e-07, - "loss": 0.4102, - "step": 83371 - }, - { - "epoch": 2.14, - "learning_rate": 4.036341473198611e-07, - "loss": 0.4595, - "step": 83372 - }, - { - "epoch": 2.14, - "learning_rate": 4.0361193612184297e-07, - "loss": 0.5005, - "step": 83373 - }, - { - "epoch": 2.14, - "learning_rate": 4.0358972538045134e-07, - "loss": 0.4507, - "step": 83374 - }, - { - "epoch": 2.14, - "learning_rate": 4.0356751509570376e-07, - "loss": 0.3896, - "step": 83375 - }, - { - "epoch": 2.14, - "learning_rate": 4.03545305267617e-07, - "loss": 0.4229, - "step": 83376 - }, - { - "epoch": 2.14, - "learning_rate": 4.0352309589620846e-07, - "loss": 0.4634, - "step": 83377 - }, - { - "epoch": 2.14, - "learning_rate": 4.03500886981495e-07, - "loss": 0.4644, - "step": 83378 - }, - { - "epoch": 2.14, - "learning_rate": 4.0347867852349313e-07, - "loss": 0.2947, - "step": 83379 - }, - { - "epoch": 2.14, - "learning_rate": 4.034564705222201e-07, - "loss": 0.4785, - "step": 83380 - }, - { - "epoch": 2.14, - "learning_rate": 4.0343426297769313e-07, - "loss": 0.3762, - "step": 83381 - }, - { - "epoch": 2.14, - "learning_rate": 4.034120558899294e-07, - "loss": 0.4276, - "step": 83382 - }, - { - "epoch": 2.14, - "learning_rate": 4.0338984925894527e-07, - "loss": 0.5078, - "step": 83383 - }, - { - "epoch": 2.14, - "learning_rate": 4.033676430847581e-07, - "loss": 0.4751, - "step": 83384 - }, - { - "epoch": 2.14, - "learning_rate": 4.033454373673849e-07, - "loss": 0.3233, - "step": 83385 - }, - { - "epoch": 2.14, - "learning_rate": 4.0332323210684305e-07, - "loss": 0.3662, - "step": 83386 - }, - { - "epoch": 2.14, - "learning_rate": 4.033010273031492e-07, - "loss": 0.3416, - "step": 83387 - }, - { - "epoch": 2.14, - "learning_rate": 4.032788229563199e-07, - "loss": 0.4272, - "step": 83388 - }, - { - "epoch": 2.14, - "learning_rate": 4.0325661906637254e-07, - "loss": 0.3394, - "step": 83389 - }, - { - "epoch": 2.14, - "learning_rate": 4.032344156333246e-07, - "loss": 0.3247, - "step": 83390 - }, - { - "epoch": 2.14, - "learning_rate": 4.0321221265719216e-07, - "loss": 0.3767, - "step": 83391 - }, - { - "epoch": 2.14, - "learning_rate": 4.031900101379928e-07, - "loss": 0.3245, - "step": 83392 - }, - { - "epoch": 2.14, - "learning_rate": 4.0316780807574335e-07, - "loss": 0.4751, - "step": 83393 - }, - { - "epoch": 2.14, - "learning_rate": 4.0314560647046116e-07, - "loss": 0.4392, - "step": 83394 - }, - { - "epoch": 2.14, - "learning_rate": 4.031234053221626e-07, - "loss": 0.4624, - "step": 83395 - }, - { - "epoch": 2.14, - "learning_rate": 4.0310120463086503e-07, - "loss": 0.3552, - "step": 83396 - }, - { - "epoch": 2.14, - "learning_rate": 4.030790043965858e-07, - "loss": 0.2489, - "step": 83397 - }, - { - "epoch": 2.14, - "learning_rate": 4.0305680461934124e-07, - "loss": 0.4917, - "step": 83398 - }, - { - "epoch": 2.14, - "learning_rate": 4.030346052991489e-07, - "loss": 0.385, - "step": 83399 - }, - { - "epoch": 2.14, - "learning_rate": 4.030124064360252e-07, - "loss": 0.3462, - "step": 83400 - }, - { - "epoch": 2.14, - "learning_rate": 4.029902080299874e-07, - "loss": 0.4663, - "step": 83401 - }, - { - "epoch": 2.14, - "learning_rate": 4.029680100810525e-07, - "loss": 0.4033, - "step": 83402 - }, - { - "epoch": 2.14, - "learning_rate": 4.02945812589238e-07, - "loss": 0.3517, - "step": 83403 - }, - { - "epoch": 2.14, - "learning_rate": 4.029236155545601e-07, - "loss": 0.4199, - "step": 83404 - }, - { - "epoch": 2.14, - "learning_rate": 4.02901418977036e-07, - "loss": 0.5518, - "step": 83405 - }, - { - "epoch": 2.14, - "learning_rate": 4.02879222856683e-07, - "loss": 0.3926, - "step": 83406 - }, - { - "epoch": 2.14, - "learning_rate": 4.0285702719351856e-07, - "loss": 0.3228, - "step": 83407 - }, - { - "epoch": 2.14, - "learning_rate": 4.028348319875583e-07, - "loss": 0.54, - "step": 83408 - }, - { - "epoch": 2.14, - "learning_rate": 4.0281263723881986e-07, - "loss": 0.3784, - "step": 83409 - }, - { - "epoch": 2.14, - "learning_rate": 4.0279044294732047e-07, - "loss": 0.4438, - "step": 83410 - }, - { - "epoch": 2.14, - "learning_rate": 4.0276824911307726e-07, - "loss": 0.4282, - "step": 83411 - }, - { - "epoch": 2.14, - "learning_rate": 4.0274605573610664e-07, - "loss": 0.3021, - "step": 83412 - }, - { - "epoch": 2.14, - "learning_rate": 4.027238628164259e-07, - "loss": 0.3901, - "step": 83413 - }, - { - "epoch": 2.14, - "learning_rate": 4.02701670354052e-07, - "loss": 0.4055, - "step": 83414 - }, - { - "epoch": 2.14, - "learning_rate": 4.026794783490023e-07, - "loss": 0.4561, - "step": 83415 - }, - { - "epoch": 2.14, - "learning_rate": 4.026572868012932e-07, - "loss": 0.4531, - "step": 83416 - }, - { - "epoch": 2.14, - "learning_rate": 4.0263509571094223e-07, - "loss": 0.5225, - "step": 83417 - }, - { - "epoch": 2.14, - "learning_rate": 4.0261290507796576e-07, - "loss": 0.5513, - "step": 83418 - }, - { - "epoch": 2.14, - "learning_rate": 4.0259071490238105e-07, - "loss": 0.2632, - "step": 83419 - }, - { - "epoch": 2.14, - "learning_rate": 4.025685251842056e-07, - "loss": 0.4678, - "step": 83420 - }, - { - "epoch": 2.14, - "learning_rate": 4.0254633592345555e-07, - "loss": 0.4189, - "step": 83421 - }, - { - "epoch": 2.14, - "learning_rate": 4.025241471201484e-07, - "loss": 0.5244, - "step": 83422 - }, - { - "epoch": 2.14, - "learning_rate": 4.0250195877430095e-07, - "loss": 0.4272, - "step": 83423 - }, - { - "epoch": 2.14, - "learning_rate": 4.0247977088593066e-07, - "loss": 0.4771, - "step": 83424 - }, - { - "epoch": 2.14, - "learning_rate": 4.0245758345505377e-07, - "loss": 0.3195, - "step": 83425 - }, - { - "epoch": 2.14, - "learning_rate": 4.0243539648168765e-07, - "loss": 0.3813, - "step": 83426 - }, - { - "epoch": 2.14, - "learning_rate": 4.024132099658496e-07, - "loss": 0.439, - "step": 83427 - }, - { - "epoch": 2.14, - "learning_rate": 4.023910239075563e-07, - "loss": 0.3892, - "step": 83428 - }, - { - "epoch": 2.14, - "learning_rate": 4.0236883830682433e-07, - "loss": 0.4111, - "step": 83429 - }, - { - "epoch": 2.14, - "learning_rate": 4.023466531636711e-07, - "loss": 0.4009, - "step": 83430 - }, - { - "epoch": 2.14, - "learning_rate": 4.0232446847811354e-07, - "loss": 0.4824, - "step": 83431 - }, - { - "epoch": 2.14, - "learning_rate": 4.02302284250169e-07, - "loss": 0.4299, - "step": 83432 - }, - { - "epoch": 2.14, - "learning_rate": 4.022801004798537e-07, - "loss": 0.4722, - "step": 83433 - }, - { - "epoch": 2.14, - "learning_rate": 4.0225791716718516e-07, - "loss": 0.4062, - "step": 83434 - }, - { - "epoch": 2.14, - "learning_rate": 4.0223573431218015e-07, - "loss": 0.3877, - "step": 83435 - }, - { - "epoch": 2.14, - "learning_rate": 4.0221355191485616e-07, - "loss": 0.3417, - "step": 83436 - }, - { - "epoch": 2.14, - "learning_rate": 4.021913699752297e-07, - "loss": 0.4607, - "step": 83437 - }, - { - "epoch": 2.14, - "learning_rate": 4.021691884933176e-07, - "loss": 0.4019, - "step": 83438 - }, - { - "epoch": 2.14, - "learning_rate": 4.02147007469137e-07, - "loss": 0.498, - "step": 83439 - }, - { - "epoch": 2.14, - "learning_rate": 4.0212482690270486e-07, - "loss": 0.3831, - "step": 83440 - }, - { - "epoch": 2.14, - "learning_rate": 4.021026467940387e-07, - "loss": 0.2504, - "step": 83441 - }, - { - "epoch": 2.14, - "learning_rate": 4.0208046714315467e-07, - "loss": 0.3143, - "step": 83442 - }, - { - "epoch": 2.14, - "learning_rate": 4.0205828795007013e-07, - "loss": 0.5215, - "step": 83443 - }, - { - "epoch": 2.14, - "learning_rate": 4.0203610921480246e-07, - "loss": 0.4473, - "step": 83444 - }, - { - "epoch": 2.14, - "learning_rate": 4.020139309373679e-07, - "loss": 0.384, - "step": 83445 - }, - { - "epoch": 2.14, - "learning_rate": 4.0199175311778366e-07, - "loss": 0.3191, - "step": 83446 - }, - { - "epoch": 2.14, - "learning_rate": 4.0196957575606726e-07, - "loss": 0.4009, - "step": 83447 - }, - { - "epoch": 2.14, - "learning_rate": 4.0194739885223495e-07, - "loss": 0.4102, - "step": 83448 - }, - { - "epoch": 2.14, - "learning_rate": 4.019252224063043e-07, - "loss": 0.3994, - "step": 83449 - }, - { - "epoch": 2.14, - "learning_rate": 4.0190304641829177e-07, - "loss": 0.3628, - "step": 83450 - }, - { - "epoch": 2.14, - "learning_rate": 4.0188087088821445e-07, - "loss": 0.4722, - "step": 83451 - }, - { - "epoch": 2.14, - "learning_rate": 4.0185869581608946e-07, - "loss": 0.3828, - "step": 83452 - }, - { - "epoch": 2.14, - "learning_rate": 4.018365212019341e-07, - "loss": 0.5024, - "step": 83453 - }, - { - "epoch": 2.14, - "learning_rate": 4.018143470457648e-07, - "loss": 0.4883, - "step": 83454 - }, - { - "epoch": 2.14, - "learning_rate": 4.0179217334759865e-07, - "loss": 0.4114, - "step": 83455 - }, - { - "epoch": 2.14, - "learning_rate": 4.0177000010745267e-07, - "loss": 0.3368, - "step": 83456 - }, - { - "epoch": 2.14, - "learning_rate": 4.017478273253443e-07, - "loss": 0.2852, - "step": 83457 - }, - { - "epoch": 2.14, - "learning_rate": 4.017256550012901e-07, - "loss": 0.4404, - "step": 83458 - }, - { - "epoch": 2.14, - "learning_rate": 4.017034831353068e-07, - "loss": 0.3838, - "step": 83459 - }, - { - "epoch": 2.14, - "learning_rate": 4.016813117274115e-07, - "loss": 0.3672, - "step": 83460 - }, - { - "epoch": 2.14, - "learning_rate": 4.0165914077762174e-07, - "loss": 0.2881, - "step": 83461 - }, - { - "epoch": 2.14, - "learning_rate": 4.0163697028595367e-07, - "loss": 0.4883, - "step": 83462 - }, - { - "epoch": 2.14, - "learning_rate": 4.0161480025242466e-07, - "loss": 0.3774, - "step": 83463 - }, - { - "epoch": 2.14, - "learning_rate": 4.0159263067705164e-07, - "loss": 0.4326, - "step": 83464 - }, - { - "epoch": 2.14, - "learning_rate": 4.015704615598521e-07, - "loss": 0.4253, - "step": 83465 - }, - { - "epoch": 2.14, - "learning_rate": 4.0154829290084214e-07, - "loss": 0.3566, - "step": 83466 - }, - { - "epoch": 2.14, - "learning_rate": 4.015261247000394e-07, - "loss": 0.3882, - "step": 83467 - }, - { - "epoch": 2.14, - "learning_rate": 4.015039569574603e-07, - "loss": 0.5488, - "step": 83468 - }, - { - "epoch": 2.14, - "learning_rate": 4.014817896731221e-07, - "loss": 0.3568, - "step": 83469 - }, - { - "epoch": 2.14, - "learning_rate": 4.0145962284704216e-07, - "loss": 0.3268, - "step": 83470 - }, - { - "epoch": 2.14, - "learning_rate": 4.0143745647923664e-07, - "loss": 0.4917, - "step": 83471 - }, - { - "epoch": 2.14, - "learning_rate": 4.01415290569723e-07, - "loss": 0.4717, - "step": 83472 - }, - { - "epoch": 2.14, - "learning_rate": 4.013931251185182e-07, - "loss": 0.4951, - "step": 83473 - }, - { - "epoch": 2.14, - "learning_rate": 4.0137096012563943e-07, - "loss": 0.3979, - "step": 83474 - }, - { - "epoch": 2.14, - "learning_rate": 4.01348795591103e-07, - "loss": 0.4146, - "step": 83475 - }, - { - "epoch": 2.14, - "learning_rate": 4.0132663151492627e-07, - "loss": 0.4961, - "step": 83476 - }, - { - "epoch": 2.14, - "learning_rate": 4.0130446789712667e-07, - "loss": 0.5059, - "step": 83477 - }, - { - "epoch": 2.14, - "learning_rate": 4.0128230473772064e-07, - "loss": 0.3936, - "step": 83478 - }, - { - "epoch": 2.14, - "learning_rate": 4.012601420367249e-07, - "loss": 0.3706, - "step": 83479 - }, - { - "epoch": 2.14, - "learning_rate": 4.0123797979415674e-07, - "loss": 0.4351, - "step": 83480 - }, - { - "epoch": 2.14, - "learning_rate": 4.01215818010033e-07, - "loss": 0.4888, - "step": 83481 - }, - { - "epoch": 2.14, - "learning_rate": 4.011936566843713e-07, - "loss": 0.1868, - "step": 83482 - }, - { - "epoch": 2.14, - "learning_rate": 4.011714958171877e-07, - "loss": 0.3472, - "step": 83483 - }, - { - "epoch": 2.14, - "learning_rate": 4.0114933540849946e-07, - "loss": 0.385, - "step": 83484 - }, - { - "epoch": 2.14, - "learning_rate": 4.0112717545832367e-07, - "loss": 0.4819, - "step": 83485 - }, - { - "epoch": 2.14, - "learning_rate": 4.0110501596667767e-07, - "loss": 0.4011, - "step": 83486 - }, - { - "epoch": 2.14, - "learning_rate": 4.0108285693357804e-07, - "loss": 0.2612, - "step": 83487 - }, - { - "epoch": 2.14, - "learning_rate": 4.0106069835904124e-07, - "loss": 0.2828, - "step": 83488 - }, - { - "epoch": 2.14, - "learning_rate": 4.010385402430848e-07, - "loss": 0.2788, - "step": 83489 - }, - { - "epoch": 2.14, - "learning_rate": 4.010163825857257e-07, - "loss": 0.4912, - "step": 83490 - }, - { - "epoch": 2.14, - "learning_rate": 4.00994225386981e-07, - "loss": 0.3597, - "step": 83491 - }, - { - "epoch": 2.14, - "learning_rate": 4.0097206864686726e-07, - "loss": 0.3494, - "step": 83492 - }, - { - "epoch": 2.14, - "learning_rate": 4.0094991236540154e-07, - "loss": 0.3535, - "step": 83493 - }, - { - "epoch": 2.14, - "learning_rate": 4.0092775654260104e-07, - "loss": 0.4146, - "step": 83494 - }, - { - "epoch": 2.14, - "learning_rate": 4.0090560117848296e-07, - "loss": 0.3125, - "step": 83495 - }, - { - "epoch": 2.14, - "learning_rate": 4.008834462730635e-07, - "loss": 0.3835, - "step": 83496 - }, - { - "epoch": 2.14, - "learning_rate": 4.008612918263604e-07, - "loss": 0.3828, - "step": 83497 - }, - { - "epoch": 2.14, - "learning_rate": 4.0083913783838996e-07, - "loss": 0.4194, - "step": 83498 - }, - { - "epoch": 2.14, - "learning_rate": 4.0081698430916976e-07, - "loss": 0.439, - "step": 83499 - }, - { - "epoch": 2.14, - "learning_rate": 4.0079483123871605e-07, - "loss": 0.5142, - "step": 83500 - }, - { - "epoch": 2.14, - "learning_rate": 4.0077267862704624e-07, - "loss": 0.4722, - "step": 83501 - }, - { - "epoch": 2.14, - "learning_rate": 4.007505264741772e-07, - "loss": 0.522, - "step": 83502 - }, - { - "epoch": 2.14, - "learning_rate": 4.0072837478012634e-07, - "loss": 0.3157, - "step": 83503 - }, - { - "epoch": 2.14, - "learning_rate": 4.007062235449098e-07, - "loss": 0.4583, - "step": 83504 - }, - { - "epoch": 2.14, - "learning_rate": 4.00684072768545e-07, - "loss": 0.3931, - "step": 83505 - }, - { - "epoch": 2.14, - "learning_rate": 4.006619224510488e-07, - "loss": 0.4526, - "step": 83506 - }, - { - "epoch": 2.14, - "learning_rate": 4.0063977259243855e-07, - "loss": 0.333, - "step": 83507 - }, - { - "epoch": 2.14, - "learning_rate": 4.0061762319273086e-07, - "loss": 0.4746, - "step": 83508 - }, - { - "epoch": 2.14, - "learning_rate": 4.005954742519424e-07, - "loss": 0.4639, - "step": 83509 - }, - { - "epoch": 2.14, - "learning_rate": 4.005733257700904e-07, - "loss": 0.4453, - "step": 83510 - }, - { - "epoch": 2.14, - "learning_rate": 4.005511777471918e-07, - "loss": 0.321, - "step": 83511 - }, - { - "epoch": 2.14, - "learning_rate": 4.00529030183264e-07, - "loss": 0.4663, - "step": 83512 - }, - { - "epoch": 2.14, - "learning_rate": 4.005068830783231e-07, - "loss": 0.4619, - "step": 83513 - }, - { - "epoch": 2.14, - "learning_rate": 4.004847364323867e-07, - "loss": 0.4565, - "step": 83514 - }, - { - "epoch": 2.14, - "learning_rate": 4.004625902454718e-07, - "loss": 0.5518, - "step": 83515 - }, - { - "epoch": 2.14, - "learning_rate": 4.0044044451759486e-07, - "loss": 0.4731, - "step": 83516 - }, - { - "epoch": 2.14, - "learning_rate": 4.0041829924877337e-07, - "loss": 0.3892, - "step": 83517 - }, - { - "epoch": 2.14, - "learning_rate": 4.003961544390237e-07, - "loss": 0.5098, - "step": 83518 - }, - { - "epoch": 2.14, - "learning_rate": 4.0037401008836313e-07, - "loss": 0.4814, - "step": 83519 - }, - { - "epoch": 2.14, - "learning_rate": 4.0035186619680895e-07, - "loss": 0.394, - "step": 83520 - }, - { - "epoch": 2.14, - "learning_rate": 4.003297227643775e-07, - "loss": 0.4731, - "step": 83521 - }, - { - "epoch": 2.14, - "learning_rate": 4.0030757979108586e-07, - "loss": 0.4976, - "step": 83522 - }, - { - "epoch": 2.14, - "learning_rate": 4.002854372769512e-07, - "loss": 0.4492, - "step": 83523 - }, - { - "epoch": 2.14, - "learning_rate": 4.0026329522199077e-07, - "loss": 0.2637, - "step": 83524 - }, - { - "epoch": 2.14, - "learning_rate": 4.002411536262208e-07, - "loss": 0.3438, - "step": 83525 - }, - { - "epoch": 2.14, - "learning_rate": 4.002190124896586e-07, - "loss": 0.4321, - "step": 83526 - }, - { - "epoch": 2.14, - "learning_rate": 4.001968718123215e-07, - "loss": 0.3823, - "step": 83527 - }, - { - "epoch": 2.14, - "learning_rate": 4.0017473159422567e-07, - "loss": 0.3208, - "step": 83528 - }, - { - "epoch": 2.14, - "learning_rate": 4.0015259183538886e-07, - "loss": 0.4309, - "step": 83529 - }, - { - "epoch": 2.14, - "learning_rate": 4.0013045253582724e-07, - "loss": 0.3113, - "step": 83530 - }, - { - "epoch": 2.14, - "learning_rate": 4.0010831369555817e-07, - "loss": 0.4702, - "step": 83531 - }, - { - "epoch": 2.14, - "learning_rate": 4.0008617531459897e-07, - "loss": 0.3762, - "step": 83532 - }, - { - "epoch": 2.14, - "learning_rate": 4.0006403739296577e-07, - "loss": 0.335, - "step": 83533 - }, - { - "epoch": 2.14, - "learning_rate": 4.0004189993067606e-07, - "loss": 0.4277, - "step": 83534 - }, - { - "epoch": 2.14, - "learning_rate": 4.0001976292774665e-07, - "loss": 0.4219, - "step": 83535 - }, - { - "epoch": 2.14, - "learning_rate": 3.9999762638419477e-07, - "loss": 0.3396, - "step": 83536 - }, - { - "epoch": 2.14, - "learning_rate": 3.999754903000372e-07, - "loss": 0.4341, - "step": 83537 - }, - { - "epoch": 2.14, - "learning_rate": 3.999533546752905e-07, - "loss": 0.4255, - "step": 83538 - }, - { - "epoch": 2.14, - "learning_rate": 3.999312195099718e-07, - "loss": 0.3752, - "step": 83539 - }, - { - "epoch": 2.14, - "learning_rate": 3.999090848040982e-07, - "loss": 0.4448, - "step": 83540 - }, - { - "epoch": 2.14, - "learning_rate": 3.9988695055768704e-07, - "loss": 0.4185, - "step": 83541 - }, - { - "epoch": 2.14, - "learning_rate": 3.9986481677075444e-07, - "loss": 0.5811, - "step": 83542 - }, - { - "epoch": 2.14, - "learning_rate": 3.9984268344331783e-07, - "loss": 0.4717, - "step": 83543 - }, - { - "epoch": 2.14, - "learning_rate": 3.99820550575394e-07, - "loss": 0.3445, - "step": 83544 - }, - { - "epoch": 2.14, - "learning_rate": 3.9979841816700043e-07, - "loss": 0.3735, - "step": 83545 - }, - { - "epoch": 2.14, - "learning_rate": 3.997762862181532e-07, - "loss": 0.395, - "step": 83546 - }, - { - "epoch": 2.14, - "learning_rate": 3.9975415472887e-07, - "loss": 0.437, - "step": 83547 - }, - { - "epoch": 2.14, - "learning_rate": 3.997320236991671e-07, - "loss": 0.5366, - "step": 83548 - }, - { - "epoch": 2.14, - "learning_rate": 3.997098931290621e-07, - "loss": 0.355, - "step": 83549 - }, - { - "epoch": 2.14, - "learning_rate": 3.9968776301857134e-07, - "loss": 0.4021, - "step": 83550 - }, - { - "epoch": 2.14, - "learning_rate": 3.996656333677121e-07, - "loss": 0.4336, - "step": 83551 - }, - { - "epoch": 2.14, - "learning_rate": 3.996435041765012e-07, - "loss": 0.2737, - "step": 83552 - }, - { - "epoch": 2.14, - "learning_rate": 3.99621375444956e-07, - "loss": 0.3611, - "step": 83553 - }, - { - "epoch": 2.14, - "learning_rate": 3.995992471730929e-07, - "loss": 0.2714, - "step": 83554 - }, - { - "epoch": 2.14, - "learning_rate": 3.9957711936092885e-07, - "loss": 0.5063, - "step": 83555 - }, - { - "epoch": 2.14, - "learning_rate": 3.995549920084811e-07, - "loss": 0.2288, - "step": 83556 - }, - { - "epoch": 2.14, - "learning_rate": 3.995328651157669e-07, - "loss": 0.3466, - "step": 83557 - }, - { - "epoch": 2.14, - "learning_rate": 3.995107386828026e-07, - "loss": 0.4375, - "step": 83558 - }, - { - "epoch": 2.14, - "learning_rate": 3.994886127096051e-07, - "loss": 0.3669, - "step": 83559 - }, - { - "epoch": 2.14, - "learning_rate": 3.994664871961916e-07, - "loss": 0.4907, - "step": 83560 - }, - { - "epoch": 2.14, - "learning_rate": 3.994443621425788e-07, - "loss": 0.3064, - "step": 83561 - }, - { - "epoch": 2.14, - "learning_rate": 3.9942223754878436e-07, - "loss": 0.4438, - "step": 83562 - }, - { - "epoch": 2.14, - "learning_rate": 3.9940011341482425e-07, - "loss": 0.3491, - "step": 83563 - }, - { - "epoch": 2.14, - "learning_rate": 3.993779897407159e-07, - "loss": 0.5103, - "step": 83564 - }, - { - "epoch": 2.14, - "learning_rate": 3.993558665264762e-07, - "loss": 0.3425, - "step": 83565 - }, - { - "epoch": 2.14, - "learning_rate": 3.9933374377212245e-07, - "loss": 0.4541, - "step": 83566 - }, - { - "epoch": 2.14, - "learning_rate": 3.9931162147767126e-07, - "loss": 0.3333, - "step": 83567 - }, - { - "epoch": 2.14, - "learning_rate": 3.992894996431392e-07, - "loss": 0.3062, - "step": 83568 - }, - { - "epoch": 2.14, - "learning_rate": 3.992673782685435e-07, - "loss": 0.2939, - "step": 83569 - }, - { - "epoch": 2.14, - "learning_rate": 3.9924525735390146e-07, - "loss": 0.3508, - "step": 83570 - }, - { - "epoch": 2.14, - "learning_rate": 3.992231368992295e-07, - "loss": 0.4771, - "step": 83571 - }, - { - "epoch": 2.14, - "learning_rate": 3.9920101690454464e-07, - "loss": 0.3489, - "step": 83572 - }, - { - "epoch": 2.14, - "learning_rate": 3.99178897369864e-07, - "loss": 0.4248, - "step": 83573 - }, - { - "epoch": 2.14, - "learning_rate": 3.991567782952047e-07, - "loss": 0.4561, - "step": 83574 - }, - { - "epoch": 2.14, - "learning_rate": 3.9913465968058315e-07, - "loss": 0.4487, - "step": 83575 - }, - { - "epoch": 2.14, - "learning_rate": 3.991125415260165e-07, - "loss": 0.4062, - "step": 83576 - }, - { - "epoch": 2.14, - "learning_rate": 3.9909042383152214e-07, - "loss": 0.4082, - "step": 83577 - }, - { - "epoch": 2.14, - "learning_rate": 3.9906830659711633e-07, - "loss": 0.501, - "step": 83578 - }, - { - "epoch": 2.14, - "learning_rate": 3.9904618982281655e-07, - "loss": 0.4061, - "step": 83579 - }, - { - "epoch": 2.14, - "learning_rate": 3.990240735086392e-07, - "loss": 0.5117, - "step": 83580 - }, - { - "epoch": 2.14, - "learning_rate": 3.990019576546014e-07, - "loss": 0.4258, - "step": 83581 - }, - { - "epoch": 2.14, - "learning_rate": 3.9897984226072013e-07, - "loss": 0.3556, - "step": 83582 - }, - { - "epoch": 2.14, - "learning_rate": 3.989577273270128e-07, - "loss": 0.4893, - "step": 83583 - }, - { - "epoch": 2.14, - "learning_rate": 3.989356128534955e-07, - "loss": 0.5054, - "step": 83584 - }, - { - "epoch": 2.14, - "learning_rate": 3.9891349884018564e-07, - "loss": 0.3708, - "step": 83585 - }, - { - "epoch": 2.14, - "learning_rate": 3.9889138528709995e-07, - "loss": 0.4668, - "step": 83586 - }, - { - "epoch": 2.14, - "learning_rate": 3.9886927219425634e-07, - "loss": 0.4849, - "step": 83587 - }, - { - "epoch": 2.14, - "learning_rate": 3.9884715956167016e-07, - "loss": 0.4858, - "step": 83588 - }, - { - "epoch": 2.14, - "learning_rate": 3.98825047389359e-07, - "loss": 0.5176, - "step": 83589 - }, - { - "epoch": 2.14, - "learning_rate": 3.988029356773398e-07, - "loss": 0.2875, - "step": 83590 - }, - { - "epoch": 2.14, - "learning_rate": 3.9878082442563e-07, - "loss": 0.3313, - "step": 83591 - }, - { - "epoch": 2.14, - "learning_rate": 3.987587136342457e-07, - "loss": 0.4521, - "step": 83592 - }, - { - "epoch": 2.14, - "learning_rate": 3.987366033032042e-07, - "loss": 0.3898, - "step": 83593 - }, - { - "epoch": 2.14, - "learning_rate": 3.987144934325225e-07, - "loss": 0.4771, - "step": 83594 - }, - { - "epoch": 2.14, - "learning_rate": 3.986923840222177e-07, - "loss": 0.438, - "step": 83595 - }, - { - "epoch": 2.14, - "learning_rate": 3.9867027507230623e-07, - "loss": 0.6152, - "step": 83596 - }, - { - "epoch": 2.14, - "learning_rate": 3.9864816658280563e-07, - "loss": 0.3892, - "step": 83597 - }, - { - "epoch": 2.14, - "learning_rate": 3.986260585537321e-07, - "loss": 0.2844, - "step": 83598 - }, - { - "epoch": 2.14, - "learning_rate": 3.9860395098510294e-07, - "loss": 0.4307, - "step": 83599 - }, - { - "epoch": 2.14, - "learning_rate": 3.985818438769354e-07, - "loss": 0.4678, - "step": 83600 - }, - { - "epoch": 2.14, - "learning_rate": 3.9855973722924575e-07, - "loss": 0.4287, - "step": 83601 - }, - { - "epoch": 2.14, - "learning_rate": 3.9853763104205127e-07, - "loss": 0.3955, - "step": 83602 - }, - { - "epoch": 2.14, - "learning_rate": 3.985155253153689e-07, - "loss": 0.2395, - "step": 83603 - }, - { - "epoch": 2.14, - "learning_rate": 3.9849342004921593e-07, - "loss": 0.3442, - "step": 83604 - }, - { - "epoch": 2.14, - "learning_rate": 3.984713152436084e-07, - "loss": 0.5049, - "step": 83605 - }, - { - "epoch": 2.14, - "learning_rate": 3.9844921089856386e-07, - "loss": 0.4971, - "step": 83606 - }, - { - "epoch": 2.14, - "learning_rate": 3.9842710701409933e-07, - "loss": 0.3708, - "step": 83607 - }, - { - "epoch": 2.14, - "learning_rate": 3.984050035902316e-07, - "loss": 0.4253, - "step": 83608 - }, - { - "epoch": 2.14, - "learning_rate": 3.983829006269771e-07, - "loss": 0.4707, - "step": 83609 - }, - { - "epoch": 2.14, - "learning_rate": 3.983607981243532e-07, - "loss": 0.3463, - "step": 83610 - }, - { - "epoch": 2.14, - "learning_rate": 3.983386960823767e-07, - "loss": 0.3098, - "step": 83611 - }, - { - "epoch": 2.14, - "learning_rate": 3.983165945010649e-07, - "loss": 0.4775, - "step": 83612 - }, - { - "epoch": 2.14, - "learning_rate": 3.982944933804342e-07, - "loss": 0.3489, - "step": 83613 - }, - { - "epoch": 2.14, - "learning_rate": 3.982723927205017e-07, - "loss": 0.3051, - "step": 83614 - }, - { - "epoch": 2.14, - "learning_rate": 3.9825029252128426e-07, - "loss": 0.436, - "step": 83615 - }, - { - "epoch": 2.14, - "learning_rate": 3.982281927827994e-07, - "loss": 0.3413, - "step": 83616 - }, - { - "epoch": 2.14, - "learning_rate": 3.982060935050635e-07, - "loss": 0.4771, - "step": 83617 - }, - { - "epoch": 2.14, - "learning_rate": 3.9818399468809316e-07, - "loss": 0.4292, - "step": 83618 - }, - { - "epoch": 2.14, - "learning_rate": 3.981618963319057e-07, - "loss": 0.2808, - "step": 83619 - }, - { - "epoch": 2.14, - "learning_rate": 3.981397984365179e-07, - "loss": 0.3892, - "step": 83620 - }, - { - "epoch": 2.14, - "learning_rate": 3.981177010019472e-07, - "loss": 0.4609, - "step": 83621 - }, - { - "epoch": 2.14, - "learning_rate": 3.9809560402820973e-07, - "loss": 0.4067, - "step": 83622 - }, - { - "epoch": 2.14, - "learning_rate": 3.9807350751532275e-07, - "loss": 0.3792, - "step": 83623 - }, - { - "epoch": 2.14, - "learning_rate": 3.9805141146330365e-07, - "loss": 0.3853, - "step": 83624 - }, - { - "epoch": 2.14, - "learning_rate": 3.9802931587216847e-07, - "loss": 0.4512, - "step": 83625 - }, - { - "epoch": 2.14, - "learning_rate": 3.980072207419346e-07, - "loss": 0.3281, - "step": 83626 - }, - { - "epoch": 2.14, - "learning_rate": 3.9798512607261924e-07, - "loss": 0.5308, - "step": 83627 - }, - { - "epoch": 2.14, - "learning_rate": 3.9796303186423876e-07, - "loss": 0.3643, - "step": 83628 - }, - { - "epoch": 2.14, - "learning_rate": 3.979409381168105e-07, - "loss": 0.542, - "step": 83629 - }, - { - "epoch": 2.14, - "learning_rate": 3.979188448303509e-07, - "loss": 0.3341, - "step": 83630 - }, - { - "epoch": 2.14, - "learning_rate": 3.9789675200487717e-07, - "loss": 0.501, - "step": 83631 - }, - { - "epoch": 2.14, - "learning_rate": 3.978746596404061e-07, - "loss": 0.384, - "step": 83632 - }, - { - "epoch": 2.14, - "learning_rate": 3.9785256773695517e-07, - "loss": 0.562, - "step": 83633 - }, - { - "epoch": 2.14, - "learning_rate": 3.978304762945406e-07, - "loss": 0.4404, - "step": 83634 - }, - { - "epoch": 2.14, - "learning_rate": 3.9780838531317937e-07, - "loss": 0.4053, - "step": 83635 - }, - { - "epoch": 2.14, - "learning_rate": 3.977862947928886e-07, - "loss": 0.4302, - "step": 83636 - }, - { - "epoch": 2.14, - "learning_rate": 3.977642047336855e-07, - "loss": 0.2266, - "step": 83637 - }, - { - "epoch": 2.14, - "learning_rate": 3.9774211513558674e-07, - "loss": 0.4238, - "step": 83638 - }, - { - "epoch": 2.14, - "learning_rate": 3.977200259986088e-07, - "loss": 0.424, - "step": 83639 - }, - { - "epoch": 2.14, - "learning_rate": 3.976979373227689e-07, - "loss": 0.4409, - "step": 83640 - }, - { - "epoch": 2.14, - "learning_rate": 3.976758491080844e-07, - "loss": 0.3806, - "step": 83641 - }, - { - "epoch": 2.14, - "learning_rate": 3.976537613545713e-07, - "loss": 0.4077, - "step": 83642 - }, - { - "epoch": 2.14, - "learning_rate": 3.9763167406224716e-07, - "loss": 0.4712, - "step": 83643 - }, - { - "epoch": 2.14, - "learning_rate": 3.9760958723112867e-07, - "loss": 0.3643, - "step": 83644 - }, - { - "epoch": 2.14, - "learning_rate": 3.975875008612333e-07, - "loss": 0.5508, - "step": 83645 - }, - { - "epoch": 2.14, - "learning_rate": 3.9756541495257735e-07, - "loss": 0.3643, - "step": 83646 - }, - { - "epoch": 2.14, - "learning_rate": 3.9754332950517755e-07, - "loss": 0.4478, - "step": 83647 - }, - { - "epoch": 2.14, - "learning_rate": 3.9752124451905114e-07, - "loss": 0.3287, - "step": 83648 - }, - { - "epoch": 2.14, - "learning_rate": 3.97499159994215e-07, - "loss": 0.4797, - "step": 83649 - }, - { - "epoch": 2.14, - "learning_rate": 3.9747707593068636e-07, - "loss": 0.5312, - "step": 83650 - }, - { - "epoch": 2.14, - "learning_rate": 3.9745499232848155e-07, - "loss": 0.5029, - "step": 83651 - }, - { - "epoch": 2.14, - "learning_rate": 3.9743290918761774e-07, - "loss": 0.3984, - "step": 83652 - }, - { - "epoch": 2.14, - "learning_rate": 3.9741082650811176e-07, - "loss": 0.272, - "step": 83653 - }, - { - "epoch": 2.14, - "learning_rate": 3.97388744289981e-07, - "loss": 0.5767, - "step": 83654 - }, - { - "epoch": 2.14, - "learning_rate": 3.973666625332416e-07, - "loss": 0.3306, - "step": 83655 - }, - { - "epoch": 2.14, - "learning_rate": 3.9734458123791126e-07, - "loss": 0.5435, - "step": 83656 - }, - { - "epoch": 2.14, - "learning_rate": 3.9732250040400605e-07, - "loss": 0.4766, - "step": 83657 - }, - { - "epoch": 2.14, - "learning_rate": 3.9730042003154364e-07, - "loss": 0.3237, - "step": 83658 - }, - { - "epoch": 2.14, - "learning_rate": 3.972783401205402e-07, - "loss": 0.4585, - "step": 83659 - }, - { - "epoch": 2.14, - "learning_rate": 3.9725626067101313e-07, - "loss": 0.5054, - "step": 83660 - }, - { - "epoch": 2.14, - "learning_rate": 3.9723418168297917e-07, - "loss": 0.3567, - "step": 83661 - }, - { - "epoch": 2.14, - "learning_rate": 3.972121031564556e-07, - "loss": 0.3018, - "step": 83662 - }, - { - "epoch": 2.14, - "learning_rate": 3.971900250914586e-07, - "loss": 0.3328, - "step": 83663 - }, - { - "epoch": 2.14, - "learning_rate": 3.9716794748800566e-07, - "loss": 0.4219, - "step": 83664 - }, - { - "epoch": 2.14, - "learning_rate": 3.9714587034611337e-07, - "loss": 0.3958, - "step": 83665 - }, - { - "epoch": 2.14, - "learning_rate": 3.971237936657992e-07, - "loss": 0.2384, - "step": 83666 - }, - { - "epoch": 2.14, - "learning_rate": 3.9710171744707956e-07, - "loss": 0.3124, - "step": 83667 - }, - { - "epoch": 2.14, - "learning_rate": 3.97079641689971e-07, - "loss": 0.4634, - "step": 83668 - }, - { - "epoch": 2.14, - "learning_rate": 3.970575663944909e-07, - "loss": 0.5449, - "step": 83669 - }, - { - "epoch": 2.14, - "learning_rate": 3.970354915606561e-07, - "loss": 0.3823, - "step": 83670 - }, - { - "epoch": 2.14, - "learning_rate": 3.9701341718848393e-07, - "loss": 0.3208, - "step": 83671 - }, - { - "epoch": 2.14, - "learning_rate": 3.9699134327799045e-07, - "loss": 0.4263, - "step": 83672 - }, - { - "epoch": 2.14, - "learning_rate": 3.969692698291929e-07, - "loss": 0.4355, - "step": 83673 - }, - { - "epoch": 2.14, - "learning_rate": 3.969471968421083e-07, - "loss": 0.342, - "step": 83674 - }, - { - "epoch": 2.14, - "learning_rate": 3.9692512431675384e-07, - "loss": 0.3845, - "step": 83675 - }, - { - "epoch": 2.14, - "learning_rate": 3.9690305225314614e-07, - "loss": 0.3276, - "step": 83676 - }, - { - "epoch": 2.14, - "learning_rate": 3.968809806513016e-07, - "loss": 0.353, - "step": 83677 - }, - { - "epoch": 2.14, - "learning_rate": 3.968589095112377e-07, - "loss": 0.3438, - "step": 83678 - }, - { - "epoch": 2.14, - "learning_rate": 3.9683683883297137e-07, - "loss": 0.5444, - "step": 83679 - }, - { - "epoch": 2.14, - "learning_rate": 3.968147686165191e-07, - "loss": 0.3008, - "step": 83680 - }, - { - "epoch": 2.14, - "learning_rate": 3.9679269886189805e-07, - "loss": 0.2686, - "step": 83681 - }, - { - "epoch": 2.14, - "learning_rate": 3.96770629569125e-07, - "loss": 0.3679, - "step": 83682 - }, - { - "epoch": 2.14, - "learning_rate": 3.967485607382174e-07, - "loss": 0.4551, - "step": 83683 - }, - { - "epoch": 2.14, - "learning_rate": 3.967264923691913e-07, - "loss": 0.3433, - "step": 83684 - }, - { - "epoch": 2.14, - "learning_rate": 3.96704424462064e-07, - "loss": 0.3589, - "step": 83685 - }, - { - "epoch": 2.14, - "learning_rate": 3.966823570168526e-07, - "loss": 0.4849, - "step": 83686 - }, - { - "epoch": 2.14, - "learning_rate": 3.966602900335736e-07, - "loss": 0.3306, - "step": 83687 - }, - { - "epoch": 2.14, - "learning_rate": 3.966382235122443e-07, - "loss": 0.3745, - "step": 83688 - }, - { - "epoch": 2.14, - "learning_rate": 3.9661615745288114e-07, - "loss": 0.4473, - "step": 83689 - }, - { - "epoch": 2.15, - "learning_rate": 3.965940918555012e-07, - "loss": 0.582, - "step": 83690 - }, - { - "epoch": 2.15, - "learning_rate": 3.9657202672012137e-07, - "loss": 0.3447, - "step": 83691 - }, - { - "epoch": 2.15, - "learning_rate": 3.9654996204675893e-07, - "loss": 0.4478, - "step": 83692 - }, - { - "epoch": 2.15, - "learning_rate": 3.9652789783543014e-07, - "loss": 0.5552, - "step": 83693 - }, - { - "epoch": 2.15, - "learning_rate": 3.965058340861521e-07, - "loss": 0.418, - "step": 83694 - }, - { - "epoch": 2.15, - "learning_rate": 3.9648377079894226e-07, - "loss": 0.4565, - "step": 83695 - }, - { - "epoch": 2.15, - "learning_rate": 3.9646170797381704e-07, - "loss": 0.5366, - "step": 83696 - }, - { - "epoch": 2.15, - "learning_rate": 3.964396456107929e-07, - "loss": 0.4302, - "step": 83697 - }, - { - "epoch": 2.15, - "learning_rate": 3.964175837098873e-07, - "loss": 0.4731, - "step": 83698 - }, - { - "epoch": 2.15, - "learning_rate": 3.963955222711168e-07, - "loss": 0.3505, - "step": 83699 - }, - { - "epoch": 2.15, - "learning_rate": 3.963734612944991e-07, - "loss": 0.2896, - "step": 83700 - }, - { - "epoch": 2.15, - "learning_rate": 3.963514007800499e-07, - "loss": 0.4893, - "step": 83701 - }, - { - "epoch": 2.15, - "learning_rate": 3.963293407277869e-07, - "loss": 0.5327, - "step": 83702 - }, - { - "epoch": 2.15, - "learning_rate": 3.963072811377266e-07, - "loss": 0.3616, - "step": 83703 - }, - { - "epoch": 2.15, - "learning_rate": 3.9628522200988645e-07, - "loss": 0.3638, - "step": 83704 - }, - { - "epoch": 2.15, - "learning_rate": 3.9626316334428254e-07, - "loss": 0.4229, - "step": 83705 - }, - { - "epoch": 2.15, - "learning_rate": 3.9624110514093267e-07, - "loss": 0.4438, - "step": 83706 - }, - { - "epoch": 2.15, - "learning_rate": 3.962190473998528e-07, - "loss": 0.438, - "step": 83707 - }, - { - "epoch": 2.15, - "learning_rate": 3.961969901210602e-07, - "loss": 0.3999, - "step": 83708 - }, - { - "epoch": 2.15, - "learning_rate": 3.9617493330457217e-07, - "loss": 0.3589, - "step": 83709 - }, - { - "epoch": 2.15, - "learning_rate": 3.961528769504049e-07, - "loss": 0.2773, - "step": 83710 - }, - { - "epoch": 2.15, - "learning_rate": 3.9613082105857556e-07, - "loss": 0.4302, - "step": 83711 - }, - { - "epoch": 2.15, - "learning_rate": 3.9610876562910147e-07, - "loss": 0.4307, - "step": 83712 - }, - { - "epoch": 2.15, - "learning_rate": 3.9608671066199873e-07, - "loss": 0.297, - "step": 83713 - }, - { - "epoch": 2.15, - "learning_rate": 3.9606465615728466e-07, - "loss": 0.5435, - "step": 83714 - }, - { - "epoch": 2.15, - "learning_rate": 3.960426021149762e-07, - "loss": 0.4824, - "step": 83715 - }, - { - "epoch": 2.15, - "learning_rate": 3.9602054853509035e-07, - "loss": 0.3425, - "step": 83716 - }, - { - "epoch": 2.15, - "learning_rate": 3.9599849541764383e-07, - "loss": 0.4624, - "step": 83717 - }, - { - "epoch": 2.15, - "learning_rate": 3.959764427626533e-07, - "loss": 0.4341, - "step": 83718 - }, - { - "epoch": 2.15, - "learning_rate": 3.959543905701357e-07, - "loss": 0.2916, - "step": 83719 - }, - { - "epoch": 2.15, - "learning_rate": 3.95932338840108e-07, - "loss": 0.2756, - "step": 83720 - }, - { - "epoch": 2.15, - "learning_rate": 3.959102875725876e-07, - "loss": 0.2732, - "step": 83721 - }, - { - "epoch": 2.15, - "learning_rate": 3.958882367675904e-07, - "loss": 0.5947, - "step": 83722 - }, - { - "epoch": 2.15, - "learning_rate": 3.9586618642513393e-07, - "loss": 0.4097, - "step": 83723 - }, - { - "epoch": 2.15, - "learning_rate": 3.9584413654523495e-07, - "loss": 0.354, - "step": 83724 - }, - { - "epoch": 2.15, - "learning_rate": 3.9582208712791066e-07, - "loss": 0.3955, - "step": 83725 - }, - { - "epoch": 2.15, - "learning_rate": 3.9580003817317765e-07, - "loss": 0.3005, - "step": 83726 - }, - { - "epoch": 2.15, - "learning_rate": 3.9577798968105237e-07, - "loss": 0.4001, - "step": 83727 - }, - { - "epoch": 2.15, - "learning_rate": 3.9575594165155213e-07, - "loss": 0.4673, - "step": 83728 - }, - { - "epoch": 2.15, - "learning_rate": 3.9573389408469403e-07, - "loss": 0.3354, - "step": 83729 - }, - { - "epoch": 2.15, - "learning_rate": 3.9571184698049444e-07, - "loss": 0.5034, - "step": 83730 - }, - { - "epoch": 2.15, - "learning_rate": 3.956898003389705e-07, - "loss": 0.3961, - "step": 83731 - }, - { - "epoch": 2.15, - "learning_rate": 3.956677541601391e-07, - "loss": 0.3647, - "step": 83732 - }, - { - "epoch": 2.15, - "learning_rate": 3.9564570844401744e-07, - "loss": 0.3574, - "step": 83733 - }, - { - "epoch": 2.15, - "learning_rate": 3.956236631906218e-07, - "loss": 0.4287, - "step": 83734 - }, - { - "epoch": 2.15, - "learning_rate": 3.956016183999692e-07, - "loss": 0.3948, - "step": 83735 - }, - { - "epoch": 2.15, - "learning_rate": 3.955795740720771e-07, - "loss": 0.5586, - "step": 83736 - }, - { - "epoch": 2.15, - "learning_rate": 3.955575302069616e-07, - "loss": 0.5054, - "step": 83737 - }, - { - "epoch": 2.15, - "learning_rate": 3.955354868046401e-07, - "loss": 0.4355, - "step": 83738 - }, - { - "epoch": 2.15, - "learning_rate": 3.955134438651291e-07, - "loss": 0.584, - "step": 83739 - }, - { - "epoch": 2.15, - "learning_rate": 3.954914013884456e-07, - "loss": 0.3718, - "step": 83740 - }, - { - "epoch": 2.15, - "learning_rate": 3.9546935937460645e-07, - "loss": 0.4746, - "step": 83741 - }, - { - "epoch": 2.15, - "learning_rate": 3.954473178236291e-07, - "loss": 0.522, - "step": 83742 - }, - { - "epoch": 2.15, - "learning_rate": 3.954252767355295e-07, - "loss": 0.3721, - "step": 83743 - }, - { - "epoch": 2.15, - "learning_rate": 3.95403236110325e-07, - "loss": 0.4893, - "step": 83744 - }, - { - "epoch": 2.15, - "learning_rate": 3.9538119594803245e-07, - "loss": 0.2104, - "step": 83745 - }, - { - "epoch": 2.15, - "learning_rate": 3.953591562486691e-07, - "loss": 0.2144, - "step": 83746 - }, - { - "epoch": 2.15, - "learning_rate": 3.9533711701225134e-07, - "loss": 0.4248, - "step": 83747 - }, - { - "epoch": 2.15, - "learning_rate": 3.9531507823879596e-07, - "loss": 0.3535, - "step": 83748 - }, - { - "epoch": 2.15, - "learning_rate": 3.9529303992831984e-07, - "loss": 0.4321, - "step": 83749 - }, - { - "epoch": 2.15, - "learning_rate": 3.952710020808405e-07, - "loss": 0.3394, - "step": 83750 - }, - { - "epoch": 2.15, - "learning_rate": 3.9524896469637405e-07, - "loss": 0.2925, - "step": 83751 - }, - { - "epoch": 2.15, - "learning_rate": 3.9522692777493747e-07, - "loss": 0.342, - "step": 83752 - }, - { - "epoch": 2.15, - "learning_rate": 3.95204891316548e-07, - "loss": 0.3311, - "step": 83753 - }, - { - "epoch": 2.15, - "learning_rate": 3.9518285532122253e-07, - "loss": 0.3721, - "step": 83754 - }, - { - "epoch": 2.15, - "learning_rate": 3.9516081978897753e-07, - "loss": 0.4229, - "step": 83755 - }, - { - "epoch": 2.15, - "learning_rate": 3.951387847198303e-07, - "loss": 0.3687, - "step": 83756 - }, - { - "epoch": 2.15, - "learning_rate": 3.951167501137973e-07, - "loss": 0.46, - "step": 83757 - }, - { - "epoch": 2.15, - "learning_rate": 3.950947159708955e-07, - "loss": 0.3511, - "step": 83758 - }, - { - "epoch": 2.15, - "learning_rate": 3.950726822911422e-07, - "loss": 0.5098, - "step": 83759 - }, - { - "epoch": 2.15, - "learning_rate": 3.9505064907455357e-07, - "loss": 0.4453, - "step": 83760 - }, - { - "epoch": 2.15, - "learning_rate": 3.950286163211468e-07, - "loss": 0.3264, - "step": 83761 - }, - { - "epoch": 2.15, - "learning_rate": 3.9500658403093887e-07, - "loss": 0.417, - "step": 83762 - }, - { - "epoch": 2.15, - "learning_rate": 3.94984552203947e-07, - "loss": 0.3921, - "step": 83763 - }, - { - "epoch": 2.15, - "learning_rate": 3.949625208401872e-07, - "loss": 0.4819, - "step": 83764 - }, - { - "epoch": 2.15, - "learning_rate": 3.949404899396768e-07, - "loss": 0.4614, - "step": 83765 - }, - { - "epoch": 2.15, - "learning_rate": 3.9491845950243296e-07, - "loss": 0.4004, - "step": 83766 - }, - { - "epoch": 2.15, - "learning_rate": 3.9489642952847236e-07, - "loss": 0.2859, - "step": 83767 - }, - { - "epoch": 2.15, - "learning_rate": 3.9487440001781126e-07, - "loss": 0.4087, - "step": 83768 - }, - { - "epoch": 2.15, - "learning_rate": 3.9485237097046697e-07, - "loss": 0.3672, - "step": 83769 - }, - { - "epoch": 2.15, - "learning_rate": 3.948303423864565e-07, - "loss": 0.46, - "step": 83770 - }, - { - "epoch": 2.15, - "learning_rate": 3.94808314265797e-07, - "loss": 0.4102, - "step": 83771 - }, - { - "epoch": 2.15, - "learning_rate": 3.947862866085044e-07, - "loss": 0.5527, - "step": 83772 - }, - { - "epoch": 2.15, - "learning_rate": 3.947642594145962e-07, - "loss": 0.4043, - "step": 83773 - }, - { - "epoch": 2.15, - "learning_rate": 3.947422326840894e-07, - "loss": 0.3432, - "step": 83774 - }, - { - "epoch": 2.15, - "learning_rate": 3.9472020641700066e-07, - "loss": 0.4551, - "step": 83775 - }, - { - "epoch": 2.15, - "learning_rate": 3.94698180613347e-07, - "loss": 0.3513, - "step": 83776 - }, - { - "epoch": 2.15, - "learning_rate": 3.946761552731448e-07, - "loss": 0.3279, - "step": 83777 - }, - { - "epoch": 2.15, - "learning_rate": 3.9465413039641116e-07, - "loss": 0.5303, - "step": 83778 - }, - { - "epoch": 2.15, - "learning_rate": 3.94632105983163e-07, - "loss": 0.478, - "step": 83779 - }, - { - "epoch": 2.15, - "learning_rate": 3.946100820334175e-07, - "loss": 0.394, - "step": 83780 - }, - { - "epoch": 2.15, - "learning_rate": 3.94588058547191e-07, - "loss": 0.3579, - "step": 83781 - }, - { - "epoch": 2.15, - "learning_rate": 3.945660355245005e-07, - "loss": 0.3547, - "step": 83782 - }, - { - "epoch": 2.15, - "learning_rate": 3.94544012965363e-07, - "loss": 0.397, - "step": 83783 - }, - { - "epoch": 2.15, - "learning_rate": 3.9452199086979567e-07, - "loss": 0.3828, - "step": 83784 - }, - { - "epoch": 2.15, - "learning_rate": 3.944999692378146e-07, - "loss": 0.4636, - "step": 83785 - }, - { - "epoch": 2.15, - "learning_rate": 3.944779480694375e-07, - "loss": 0.4927, - "step": 83786 - }, - { - "epoch": 2.15, - "learning_rate": 3.9445592736468034e-07, - "loss": 0.4438, - "step": 83787 - }, - { - "epoch": 2.15, - "learning_rate": 3.9443390712356083e-07, - "loss": 0.3662, - "step": 83788 - }, - { - "epoch": 2.15, - "learning_rate": 3.944118873460951e-07, - "loss": 0.522, - "step": 83789 - }, - { - "epoch": 2.15, - "learning_rate": 3.9438986803230035e-07, - "loss": 0.3921, - "step": 83790 - }, - { - "epoch": 2.15, - "learning_rate": 3.9436784918219333e-07, - "loss": 0.4653, - "step": 83791 - }, - { - "epoch": 2.15, - "learning_rate": 3.943458307957914e-07, - "loss": 0.4189, - "step": 83792 - }, - { - "epoch": 2.15, - "learning_rate": 3.9432381287311077e-07, - "loss": 0.3555, - "step": 83793 - }, - { - "epoch": 2.15, - "learning_rate": 3.9430179541416844e-07, - "loss": 0.3887, - "step": 83794 - }, - { - "epoch": 2.15, - "learning_rate": 3.942797784189814e-07, - "loss": 0.3787, - "step": 83795 - }, - { - "epoch": 2.15, - "learning_rate": 3.942577618875669e-07, - "loss": 0.3672, - "step": 83796 - }, - { - "epoch": 2.15, - "learning_rate": 3.942357458199412e-07, - "loss": 0.4458, - "step": 83797 - }, - { - "epoch": 2.15, - "learning_rate": 3.9421373021612116e-07, - "loss": 0.3945, - "step": 83798 - }, - { - "epoch": 2.15, - "learning_rate": 3.941917150761237e-07, - "loss": 0.425, - "step": 83799 - }, - { - "epoch": 2.15, - "learning_rate": 3.941697003999659e-07, - "loss": 0.3618, - "step": 83800 - }, - { - "epoch": 2.15, - "learning_rate": 3.941476861876648e-07, - "loss": 0.3433, - "step": 83801 - }, - { - "epoch": 2.15, - "learning_rate": 3.941256724392366e-07, - "loss": 0.4436, - "step": 83802 - }, - { - "epoch": 2.15, - "learning_rate": 3.9410365915469844e-07, - "loss": 0.416, - "step": 83803 - }, - { - "epoch": 2.15, - "learning_rate": 3.940816463340677e-07, - "loss": 0.4443, - "step": 83804 - }, - { - "epoch": 2.15, - "learning_rate": 3.940596339773604e-07, - "loss": 0.3076, - "step": 83805 - }, - { - "epoch": 2.15, - "learning_rate": 3.9403762208459424e-07, - "loss": 0.3711, - "step": 83806 - }, - { - "epoch": 2.15, - "learning_rate": 3.940156106557851e-07, - "loss": 0.4456, - "step": 83807 - }, - { - "epoch": 2.15, - "learning_rate": 3.9399359969095037e-07, - "loss": 0.4092, - "step": 83808 - }, - { - "epoch": 2.15, - "learning_rate": 3.939715891901073e-07, - "loss": 0.2858, - "step": 83809 - }, - { - "epoch": 2.15, - "learning_rate": 3.939495791532719e-07, - "loss": 0.3289, - "step": 83810 - }, - { - "epoch": 2.15, - "learning_rate": 3.9392756958046147e-07, - "loss": 0.5068, - "step": 83811 - }, - { - "epoch": 2.15, - "learning_rate": 3.9390556047169274e-07, - "loss": 0.3279, - "step": 83812 - }, - { - "epoch": 2.15, - "learning_rate": 3.938835518269832e-07, - "loss": 0.4531, - "step": 83813 - }, - { - "epoch": 2.15, - "learning_rate": 3.938615436463486e-07, - "loss": 0.3438, - "step": 83814 - }, - { - "epoch": 2.15, - "learning_rate": 3.9383953592980643e-07, - "loss": 0.4087, - "step": 83815 - }, - { - "epoch": 2.15, - "learning_rate": 3.9381752867737383e-07, - "loss": 0.2812, - "step": 83816 - }, - { - "epoch": 2.15, - "learning_rate": 3.9379552188906695e-07, - "loss": 0.314, - "step": 83817 - }, - { - "epoch": 2.15, - "learning_rate": 3.937735155649032e-07, - "loss": 0.3799, - "step": 83818 - }, - { - "epoch": 2.15, - "learning_rate": 3.9375150970489903e-07, - "loss": 0.2712, - "step": 83819 - }, - { - "epoch": 2.15, - "learning_rate": 3.937295043090713e-07, - "loss": 0.3096, - "step": 83820 - }, - { - "epoch": 2.15, - "learning_rate": 3.9370749937743743e-07, - "loss": 0.4404, - "step": 83821 - }, - { - "epoch": 2.15, - "learning_rate": 3.936854949100135e-07, - "loss": 0.3998, - "step": 83822 - }, - { - "epoch": 2.15, - "learning_rate": 3.936634909068166e-07, - "loss": 0.4355, - "step": 83823 - }, - { - "epoch": 2.15, - "learning_rate": 3.936414873678637e-07, - "loss": 0.4128, - "step": 83824 - }, - { - "epoch": 2.15, - "learning_rate": 3.9361948429317217e-07, - "loss": 0.3735, - "step": 83825 - }, - { - "epoch": 2.15, - "learning_rate": 3.935974816827582e-07, - "loss": 0.5117, - "step": 83826 - }, - { - "epoch": 2.15, - "learning_rate": 3.935754795366384e-07, - "loss": 0.4165, - "step": 83827 - }, - { - "epoch": 2.15, - "learning_rate": 3.935534778548299e-07, - "loss": 0.5024, - "step": 83828 - }, - { - "epoch": 2.15, - "learning_rate": 3.9353147663734974e-07, - "loss": 0.5259, - "step": 83829 - }, - { - "epoch": 2.15, - "learning_rate": 3.935094758842149e-07, - "loss": 0.2935, - "step": 83830 - }, - { - "epoch": 2.15, - "learning_rate": 3.934874755954417e-07, - "loss": 0.4688, - "step": 83831 - }, - { - "epoch": 2.15, - "learning_rate": 3.9346547577104714e-07, - "loss": 0.3982, - "step": 83832 - }, - { - "epoch": 2.15, - "learning_rate": 3.9344347641104827e-07, - "loss": 0.4219, - "step": 83833 - }, - { - "epoch": 2.15, - "learning_rate": 3.9342147751546216e-07, - "loss": 0.5024, - "step": 83834 - }, - { - "epoch": 2.15, - "learning_rate": 3.9339947908430506e-07, - "loss": 0.3916, - "step": 83835 - }, - { - "epoch": 2.15, - "learning_rate": 3.933774811175943e-07, - "loss": 0.4199, - "step": 83836 - }, - { - "epoch": 2.15, - "learning_rate": 3.933554836153462e-07, - "loss": 0.4512, - "step": 83837 - }, - { - "epoch": 2.15, - "learning_rate": 3.9333348657757825e-07, - "loss": 0.3325, - "step": 83838 - }, - { - "epoch": 2.15, - "learning_rate": 3.9331149000430676e-07, - "loss": 0.3337, - "step": 83839 - }, - { - "epoch": 2.15, - "learning_rate": 3.9328949389554857e-07, - "loss": 0.4585, - "step": 83840 - }, - { - "epoch": 2.15, - "learning_rate": 3.9326749825132077e-07, - "loss": 0.3546, - "step": 83841 - }, - { - "epoch": 2.15, - "learning_rate": 3.932455030716405e-07, - "loss": 0.3877, - "step": 83842 - }, - { - "epoch": 2.15, - "learning_rate": 3.9322350835652394e-07, - "loss": 0.3477, - "step": 83843 - }, - { - "epoch": 2.15, - "learning_rate": 3.932015141059882e-07, - "loss": 0.4121, - "step": 83844 - }, - { - "epoch": 2.15, - "learning_rate": 3.931795203200502e-07, - "loss": 0.4458, - "step": 83845 - }, - { - "epoch": 2.15, - "learning_rate": 3.9315752699872705e-07, - "loss": 0.3945, - "step": 83846 - }, - { - "epoch": 2.15, - "learning_rate": 3.931355341420354e-07, - "loss": 0.3135, - "step": 83847 - }, - { - "epoch": 2.15, - "learning_rate": 3.9311354174999144e-07, - "loss": 0.3926, - "step": 83848 - }, - { - "epoch": 2.15, - "learning_rate": 3.930915498226126e-07, - "loss": 0.3252, - "step": 83849 - }, - { - "epoch": 2.15, - "learning_rate": 3.9306955835991573e-07, - "loss": 0.4233, - "step": 83850 - }, - { - "epoch": 2.15, - "learning_rate": 3.930475673619178e-07, - "loss": 0.3442, - "step": 83851 - }, - { - "epoch": 2.15, - "learning_rate": 3.9302557682863524e-07, - "loss": 0.4109, - "step": 83852 - }, - { - "epoch": 2.15, - "learning_rate": 3.9300358676008493e-07, - "loss": 0.4971, - "step": 83853 - }, - { - "epoch": 2.15, - "learning_rate": 3.9298159715628397e-07, - "loss": 0.3725, - "step": 83854 - }, - { - "epoch": 2.15, - "learning_rate": 3.9295960801724935e-07, - "loss": 0.4492, - "step": 83855 - }, - { - "epoch": 2.15, - "learning_rate": 3.9293761934299775e-07, - "loss": 0.4517, - "step": 83856 - }, - { - "epoch": 2.15, - "learning_rate": 3.929156311335455e-07, - "loss": 0.3391, - "step": 83857 - }, - { - "epoch": 2.15, - "learning_rate": 3.9289364338890983e-07, - "loss": 0.4775, - "step": 83858 - }, - { - "epoch": 2.15, - "learning_rate": 3.92871656109108e-07, - "loss": 0.3984, - "step": 83859 - }, - { - "epoch": 2.15, - "learning_rate": 3.9284966929415606e-07, - "loss": 0.244, - "step": 83860 - }, - { - "epoch": 2.15, - "learning_rate": 3.9282768294407107e-07, - "loss": 0.4197, - "step": 83861 - }, - { - "epoch": 2.15, - "learning_rate": 3.928056970588702e-07, - "loss": 0.4146, - "step": 83862 - }, - { - "epoch": 2.15, - "learning_rate": 3.9278371163857037e-07, - "loss": 0.3281, - "step": 83863 - }, - { - "epoch": 2.15, - "learning_rate": 3.9276172668318776e-07, - "loss": 0.4175, - "step": 83864 - }, - { - "epoch": 2.15, - "learning_rate": 3.927397421927395e-07, - "loss": 0.3757, - "step": 83865 - }, - { - "epoch": 2.15, - "learning_rate": 3.9271775816724296e-07, - "loss": 0.3594, - "step": 83866 - }, - { - "epoch": 2.15, - "learning_rate": 3.926957746067141e-07, - "loss": 0.4746, - "step": 83867 - }, - { - "epoch": 2.15, - "learning_rate": 3.9267379151117054e-07, - "loss": 0.3667, - "step": 83868 - }, - { - "epoch": 2.15, - "learning_rate": 3.9265180888062845e-07, - "loss": 0.3892, - "step": 83869 - }, - { - "epoch": 2.15, - "learning_rate": 3.926298267151048e-07, - "loss": 0.4203, - "step": 83870 - }, - { - "epoch": 2.15, - "learning_rate": 3.9260784501461665e-07, - "loss": 0.4785, - "step": 83871 - }, - { - "epoch": 2.15, - "learning_rate": 3.9258586377918103e-07, - "loss": 0.396, - "step": 83872 - }, - { - "epoch": 2.15, - "learning_rate": 3.9256388300881414e-07, - "loss": 0.4263, - "step": 83873 - }, - { - "epoch": 2.15, - "learning_rate": 3.9254190270353324e-07, - "loss": 0.3364, - "step": 83874 - }, - { - "epoch": 2.15, - "learning_rate": 3.9251992286335544e-07, - "loss": 0.3142, - "step": 83875 - }, - { - "epoch": 2.15, - "learning_rate": 3.9249794348829713e-07, - "loss": 0.4487, - "step": 83876 - }, - { - "epoch": 2.15, - "learning_rate": 3.9247596457837485e-07, - "loss": 0.3912, - "step": 83877 - }, - { - "epoch": 2.15, - "learning_rate": 3.924539861336058e-07, - "loss": 0.4912, - "step": 83878 - }, - { - "epoch": 2.15, - "learning_rate": 3.924320081540068e-07, - "loss": 0.5146, - "step": 83879 - }, - { - "epoch": 2.15, - "learning_rate": 3.92410030639595e-07, - "loss": 0.5073, - "step": 83880 - }, - { - "epoch": 2.15, - "learning_rate": 3.9238805359038664e-07, - "loss": 0.3354, - "step": 83881 - }, - { - "epoch": 2.15, - "learning_rate": 3.9236607700639867e-07, - "loss": 0.3691, - "step": 83882 - }, - { - "epoch": 2.15, - "learning_rate": 3.9234410088764826e-07, - "loss": 0.3936, - "step": 83883 - }, - { - "epoch": 2.15, - "learning_rate": 3.923221252341522e-07, - "loss": 0.4111, - "step": 83884 - }, - { - "epoch": 2.15, - "learning_rate": 3.9230015004592687e-07, - "loss": 0.2786, - "step": 83885 - }, - { - "epoch": 2.15, - "learning_rate": 3.9227817532298966e-07, - "loss": 0.3496, - "step": 83886 - }, - { - "epoch": 2.15, - "learning_rate": 3.9225620106535683e-07, - "loss": 0.4771, - "step": 83887 - }, - { - "epoch": 2.15, - "learning_rate": 3.9223422727304546e-07, - "loss": 0.3921, - "step": 83888 - }, - { - "epoch": 2.15, - "learning_rate": 3.922122539460727e-07, - "loss": 0.4746, - "step": 83889 - }, - { - "epoch": 2.15, - "learning_rate": 3.9219028108445483e-07, - "loss": 0.3735, - "step": 83890 - }, - { - "epoch": 2.15, - "learning_rate": 3.921683086882088e-07, - "loss": 0.3959, - "step": 83891 - }, - { - "epoch": 2.15, - "learning_rate": 3.92146336757352e-07, - "loss": 0.4417, - "step": 83892 - }, - { - "epoch": 2.15, - "learning_rate": 3.921243652919004e-07, - "loss": 0.4277, - "step": 83893 - }, - { - "epoch": 2.15, - "learning_rate": 3.921023942918712e-07, - "loss": 0.4297, - "step": 83894 - }, - { - "epoch": 2.15, - "learning_rate": 3.9208042375728123e-07, - "loss": 0.2795, - "step": 83895 - }, - { - "epoch": 2.15, - "learning_rate": 3.920584536881477e-07, - "loss": 0.2692, - "step": 83896 - }, - { - "epoch": 2.15, - "learning_rate": 3.920364840844871e-07, - "loss": 0.4551, - "step": 83897 - }, - { - "epoch": 2.15, - "learning_rate": 3.920145149463158e-07, - "loss": 0.4697, - "step": 83898 - }, - { - "epoch": 2.15, - "learning_rate": 3.9199254627365107e-07, - "loss": 0.2656, - "step": 83899 - }, - { - "epoch": 2.15, - "learning_rate": 3.919705780665097e-07, - "loss": 0.4385, - "step": 83900 - }, - { - "epoch": 2.15, - "learning_rate": 3.9194861032490876e-07, - "loss": 0.3801, - "step": 83901 - }, - { - "epoch": 2.15, - "learning_rate": 3.919266430488646e-07, - "loss": 0.3735, - "step": 83902 - }, - { - "epoch": 2.15, - "learning_rate": 3.9190467623839417e-07, - "loss": 0.4556, - "step": 83903 - }, - { - "epoch": 2.15, - "learning_rate": 3.918827098935144e-07, - "loss": 0.3208, - "step": 83904 - }, - { - "epoch": 2.15, - "learning_rate": 3.918607440142423e-07, - "loss": 0.4163, - "step": 83905 - }, - { - "epoch": 2.15, - "learning_rate": 3.9183877860059465e-07, - "loss": 0.4382, - "step": 83906 - }, - { - "epoch": 2.15, - "learning_rate": 3.9181681365258754e-07, - "loss": 0.2817, - "step": 83907 - }, - { - "epoch": 2.15, - "learning_rate": 3.9179484917023854e-07, - "loss": 0.3208, - "step": 83908 - }, - { - "epoch": 2.15, - "learning_rate": 3.917728851535641e-07, - "loss": 0.3503, - "step": 83909 - }, - { - "epoch": 2.15, - "learning_rate": 3.917509216025816e-07, - "loss": 0.4316, - "step": 83910 - }, - { - "epoch": 2.15, - "learning_rate": 3.917289585173071e-07, - "loss": 0.4312, - "step": 83911 - }, - { - "epoch": 2.15, - "learning_rate": 3.917069958977578e-07, - "loss": 0.3469, - "step": 83912 - }, - { - "epoch": 2.15, - "learning_rate": 3.916850337439508e-07, - "loss": 0.3906, - "step": 83913 - }, - { - "epoch": 2.15, - "learning_rate": 3.916630720559023e-07, - "loss": 0.3577, - "step": 83914 - }, - { - "epoch": 2.15, - "learning_rate": 3.916411108336294e-07, - "loss": 0.4312, - "step": 83915 - }, - { - "epoch": 2.15, - "learning_rate": 3.916191500771492e-07, - "loss": 0.5381, - "step": 83916 - }, - { - "epoch": 2.15, - "learning_rate": 3.9159718978647793e-07, - "loss": 0.3645, - "step": 83917 - }, - { - "epoch": 2.15, - "learning_rate": 3.9157522996163303e-07, - "loss": 0.4424, - "step": 83918 - }, - { - "epoch": 2.15, - "learning_rate": 3.915532706026308e-07, - "loss": 0.4324, - "step": 83919 - }, - { - "epoch": 2.15, - "learning_rate": 3.9153131170948804e-07, - "loss": 0.5146, - "step": 83920 - }, - { - "epoch": 2.15, - "learning_rate": 3.915093532822219e-07, - "loss": 0.2793, - "step": 83921 - }, - { - "epoch": 2.15, - "learning_rate": 3.914873953208494e-07, - "loss": 0.4614, - "step": 83922 - }, - { - "epoch": 2.15, - "learning_rate": 3.9146543782538677e-07, - "loss": 0.4907, - "step": 83923 - }, - { - "epoch": 2.15, - "learning_rate": 3.9144348079585086e-07, - "loss": 0.3901, - "step": 83924 - }, - { - "epoch": 2.15, - "learning_rate": 3.9142152423225894e-07, - "loss": 0.5046, - "step": 83925 - }, - { - "epoch": 2.15, - "learning_rate": 3.913995681346277e-07, - "loss": 0.3724, - "step": 83926 - }, - { - "epoch": 2.15, - "learning_rate": 3.9137761250297396e-07, - "loss": 0.437, - "step": 83927 - }, - { - "epoch": 2.15, - "learning_rate": 3.9135565733731404e-07, - "loss": 0.5156, - "step": 83928 - }, - { - "epoch": 2.15, - "learning_rate": 3.9133370263766507e-07, - "loss": 0.4131, - "step": 83929 - }, - { - "epoch": 2.15, - "learning_rate": 3.9131174840404426e-07, - "loss": 0.4277, - "step": 83930 - }, - { - "epoch": 2.15, - "learning_rate": 3.912897946364677e-07, - "loss": 0.4917, - "step": 83931 - }, - { - "epoch": 2.15, - "learning_rate": 3.912678413349526e-07, - "loss": 0.3677, - "step": 83932 - }, - { - "epoch": 2.15, - "learning_rate": 3.912458884995157e-07, - "loss": 0.373, - "step": 83933 - }, - { - "epoch": 2.15, - "learning_rate": 3.912239361301741e-07, - "loss": 0.4355, - "step": 83934 - }, - { - "epoch": 2.15, - "learning_rate": 3.912019842269444e-07, - "loss": 0.3523, - "step": 83935 - }, - { - "epoch": 2.15, - "learning_rate": 3.91180032789843e-07, - "loss": 0.4012, - "step": 83936 - }, - { - "epoch": 2.15, - "learning_rate": 3.911580818188871e-07, - "loss": 0.377, - "step": 83937 - }, - { - "epoch": 2.15, - "learning_rate": 3.911361313140934e-07, - "loss": 0.5093, - "step": 83938 - }, - { - "epoch": 2.15, - "learning_rate": 3.9111418127547913e-07, - "loss": 0.2825, - "step": 83939 - }, - { - "epoch": 2.15, - "learning_rate": 3.9109223170306036e-07, - "loss": 0.3287, - "step": 83940 - }, - { - "epoch": 2.15, - "learning_rate": 3.910702825968543e-07, - "loss": 0.3926, - "step": 83941 - }, - { - "epoch": 2.15, - "learning_rate": 3.9104833395687775e-07, - "loss": 0.4082, - "step": 83942 - }, - { - "epoch": 2.15, - "learning_rate": 3.9102638578314786e-07, - "loss": 0.3625, - "step": 83943 - }, - { - "epoch": 2.15, - "learning_rate": 3.9100443807568065e-07, - "loss": 0.3101, - "step": 83944 - }, - { - "epoch": 2.15, - "learning_rate": 3.9098249083449363e-07, - "loss": 0.325, - "step": 83945 - }, - { - "epoch": 2.15, - "learning_rate": 3.909605440596031e-07, - "loss": 0.4031, - "step": 83946 - }, - { - "epoch": 2.15, - "learning_rate": 3.9093859775102634e-07, - "loss": 0.356, - "step": 83947 - }, - { - "epoch": 2.15, - "learning_rate": 3.909166519087795e-07, - "loss": 0.3555, - "step": 83948 - }, - { - "epoch": 2.15, - "learning_rate": 3.908947065328799e-07, - "loss": 0.3073, - "step": 83949 - }, - { - "epoch": 2.15, - "learning_rate": 3.9087276162334416e-07, - "loss": 0.3292, - "step": 83950 - }, - { - "epoch": 2.15, - "learning_rate": 3.908508171801895e-07, - "loss": 0.3663, - "step": 83951 - }, - { - "epoch": 2.15, - "learning_rate": 3.9082887320343206e-07, - "loss": 0.4053, - "step": 83952 - }, - { - "epoch": 2.15, - "learning_rate": 3.908069296930888e-07, - "loss": 0.2779, - "step": 83953 - }, - { - "epoch": 2.15, - "learning_rate": 3.907849866491768e-07, - "loss": 0.4048, - "step": 83954 - }, - { - "epoch": 2.15, - "learning_rate": 3.90763044071713e-07, - "loss": 0.5762, - "step": 83955 - }, - { - "epoch": 2.15, - "learning_rate": 3.9074110196071397e-07, - "loss": 0.395, - "step": 83956 - }, - { - "epoch": 2.15, - "learning_rate": 3.90719160316196e-07, - "loss": 0.4688, - "step": 83957 - }, - { - "epoch": 2.15, - "learning_rate": 3.9069721913817643e-07, - "loss": 0.2743, - "step": 83958 - }, - { - "epoch": 2.15, - "learning_rate": 3.90675278426672e-07, - "loss": 0.363, - "step": 83959 - }, - { - "epoch": 2.15, - "learning_rate": 3.906533381816999e-07, - "loss": 0.3369, - "step": 83960 - }, - { - "epoch": 2.15, - "learning_rate": 3.906313984032761e-07, - "loss": 0.3452, - "step": 83961 - }, - { - "epoch": 2.15, - "learning_rate": 3.9060945909141775e-07, - "loss": 0.4438, - "step": 83962 - }, - { - "epoch": 2.15, - "learning_rate": 3.9058752024614185e-07, - "loss": 0.2382, - "step": 83963 - }, - { - "epoch": 2.15, - "learning_rate": 3.9056558186746533e-07, - "loss": 0.3105, - "step": 83964 - }, - { - "epoch": 2.15, - "learning_rate": 3.9054364395540476e-07, - "loss": 0.356, - "step": 83965 - }, - { - "epoch": 2.15, - "learning_rate": 3.905217065099765e-07, - "loss": 0.4624, - "step": 83966 - }, - { - "epoch": 2.15, - "learning_rate": 3.904997695311978e-07, - "loss": 0.5181, - "step": 83967 - }, - { - "epoch": 2.15, - "learning_rate": 3.904778330190857e-07, - "loss": 0.3618, - "step": 83968 - }, - { - "epoch": 2.15, - "learning_rate": 3.9045589697365633e-07, - "loss": 0.4385, - "step": 83969 - }, - { - "epoch": 2.15, - "learning_rate": 3.904339613949269e-07, - "loss": 0.2594, - "step": 83970 - }, - { - "epoch": 2.15, - "learning_rate": 3.9041202628291414e-07, - "loss": 0.437, - "step": 83971 - }, - { - "epoch": 2.15, - "learning_rate": 3.9039009163763524e-07, - "loss": 0.4873, - "step": 83972 - }, - { - "epoch": 2.15, - "learning_rate": 3.903681574591062e-07, - "loss": 0.3872, - "step": 83973 - }, - { - "epoch": 2.15, - "learning_rate": 3.903462237473444e-07, - "loss": 0.4746, - "step": 83974 - }, - { - "epoch": 2.15, - "learning_rate": 3.903242905023666e-07, - "loss": 0.3799, - "step": 83975 - }, - { - "epoch": 2.15, - "learning_rate": 3.903023577241893e-07, - "loss": 0.4897, - "step": 83976 - }, - { - "epoch": 2.15, - "learning_rate": 3.902804254128297e-07, - "loss": 0.3011, - "step": 83977 - }, - { - "epoch": 2.15, - "learning_rate": 3.90258493568304e-07, - "loss": 0.4438, - "step": 83978 - }, - { - "epoch": 2.15, - "learning_rate": 3.9023656219062927e-07, - "loss": 0.4829, - "step": 83979 - }, - { - "epoch": 2.15, - "learning_rate": 3.902146312798225e-07, - "loss": 0.5605, - "step": 83980 - }, - { - "epoch": 2.15, - "learning_rate": 3.901927008359005e-07, - "loss": 0.4561, - "step": 83981 - }, - { - "epoch": 2.15, - "learning_rate": 3.901707708588797e-07, - "loss": 0.3809, - "step": 83982 - }, - { - "epoch": 2.15, - "learning_rate": 3.901488413487771e-07, - "loss": 0.4092, - "step": 83983 - }, - { - "epoch": 2.15, - "learning_rate": 3.901269123056098e-07, - "loss": 0.4297, - "step": 83984 - }, - { - "epoch": 2.15, - "learning_rate": 3.9010498372939437e-07, - "loss": 0.3945, - "step": 83985 - }, - { - "epoch": 2.15, - "learning_rate": 3.900830556201471e-07, - "loss": 0.4429, - "step": 83986 - }, - { - "epoch": 2.15, - "learning_rate": 3.9006112797788514e-07, - "loss": 0.4121, - "step": 83987 - }, - { - "epoch": 2.15, - "learning_rate": 3.900392008026254e-07, - "loss": 0.5039, - "step": 83988 - }, - { - "epoch": 2.15, - "learning_rate": 3.900172740943849e-07, - "loss": 0.4673, - "step": 83989 - }, - { - "epoch": 2.15, - "learning_rate": 3.899953478531798e-07, - "loss": 0.3221, - "step": 83990 - }, - { - "epoch": 2.15, - "learning_rate": 3.899734220790272e-07, - "loss": 0.3726, - "step": 83991 - }, - { - "epoch": 2.15, - "learning_rate": 3.8995149677194395e-07, - "loss": 0.459, - "step": 83992 - }, - { - "epoch": 2.15, - "learning_rate": 3.899295719319471e-07, - "loss": 0.4585, - "step": 83993 - }, - { - "epoch": 2.15, - "learning_rate": 3.899076475590527e-07, - "loss": 0.4526, - "step": 83994 - }, - { - "epoch": 2.15, - "learning_rate": 3.8988572365327845e-07, - "loss": 0.4351, - "step": 83995 - }, - { - "epoch": 2.15, - "learning_rate": 3.8986380021464015e-07, - "loss": 0.3823, - "step": 83996 - }, - { - "epoch": 2.15, - "learning_rate": 3.898418772431552e-07, - "loss": 0.3931, - "step": 83997 - }, - { - "epoch": 2.15, - "learning_rate": 3.8981995473884055e-07, - "loss": 0.4546, - "step": 83998 - }, - { - "epoch": 2.15, - "learning_rate": 3.897980327017124e-07, - "loss": 0.4695, - "step": 83999 - }, - { - "epoch": 2.15, - "learning_rate": 3.8977611113178786e-07, - "loss": 0.3994, - "step": 84000 - }, - { - "epoch": 2.15, - "learning_rate": 3.8975419002908395e-07, - "loss": 0.4224, - "step": 84001 - }, - { - "epoch": 2.15, - "learning_rate": 3.897322693936169e-07, - "loss": 0.4482, - "step": 84002 - }, - { - "epoch": 2.15, - "learning_rate": 3.897103492254038e-07, - "loss": 0.4507, - "step": 84003 - }, - { - "epoch": 2.15, - "learning_rate": 3.896884295244615e-07, - "loss": 0.4141, - "step": 84004 - }, - { - "epoch": 2.15, - "learning_rate": 3.8966651029080686e-07, - "loss": 0.3857, - "step": 84005 - }, - { - "epoch": 2.15, - "learning_rate": 3.896445915244567e-07, - "loss": 0.4248, - "step": 84006 - }, - { - "epoch": 2.15, - "learning_rate": 3.896226732254272e-07, - "loss": 0.5239, - "step": 84007 - }, - { - "epoch": 2.15, - "learning_rate": 3.896007553937355e-07, - "loss": 0.5049, - "step": 84008 - }, - { - "epoch": 2.15, - "learning_rate": 3.895788380293985e-07, - "loss": 0.436, - "step": 84009 - }, - { - "epoch": 2.15, - "learning_rate": 3.8955692113243323e-07, - "loss": 0.4658, - "step": 84010 - }, - { - "epoch": 2.15, - "learning_rate": 3.8953500470285583e-07, - "loss": 0.3501, - "step": 84011 - }, - { - "epoch": 2.15, - "learning_rate": 3.8951308874068333e-07, - "loss": 0.4116, - "step": 84012 - }, - { - "epoch": 2.15, - "learning_rate": 3.8949117324593273e-07, - "loss": 0.2777, - "step": 84013 - }, - { - "epoch": 2.15, - "learning_rate": 3.8946925821862086e-07, - "loss": 0.4331, - "step": 84014 - }, - { - "epoch": 2.15, - "learning_rate": 3.894473436587644e-07, - "loss": 0.4092, - "step": 84015 - }, - { - "epoch": 2.15, - "learning_rate": 3.894254295663797e-07, - "loss": 0.5278, - "step": 84016 - }, - { - "epoch": 2.15, - "learning_rate": 3.894035159414839e-07, - "loss": 0.4663, - "step": 84017 - }, - { - "epoch": 2.15, - "learning_rate": 3.8938160278409406e-07, - "loss": 0.4478, - "step": 84018 - }, - { - "epoch": 2.15, - "learning_rate": 3.893596900942262e-07, - "loss": 0.4509, - "step": 84019 - }, - { - "epoch": 2.15, - "learning_rate": 3.893377778718977e-07, - "loss": 0.3828, - "step": 84020 - }, - { - "epoch": 2.15, - "learning_rate": 3.893158661171251e-07, - "loss": 0.4185, - "step": 84021 - }, - { - "epoch": 2.15, - "learning_rate": 3.8929395482992554e-07, - "loss": 0.313, - "step": 84022 - }, - { - "epoch": 2.15, - "learning_rate": 3.892720440103153e-07, - "loss": 0.364, - "step": 84023 - }, - { - "epoch": 2.15, - "learning_rate": 3.892501336583114e-07, - "loss": 0.479, - "step": 84024 - }, - { - "epoch": 2.15, - "learning_rate": 3.8922822377393084e-07, - "loss": 0.3535, - "step": 84025 - }, - { - "epoch": 2.15, - "learning_rate": 3.8920631435718977e-07, - "loss": 0.3579, - "step": 84026 - }, - { - "epoch": 2.15, - "learning_rate": 3.891844054081057e-07, - "loss": 0.4819, - "step": 84027 - }, - { - "epoch": 2.15, - "learning_rate": 3.891624969266948e-07, - "loss": 0.3838, - "step": 84028 - }, - { - "epoch": 2.15, - "learning_rate": 3.8914058891297406e-07, - "loss": 0.3799, - "step": 84029 - }, - { - "epoch": 2.15, - "learning_rate": 3.8911868136696026e-07, - "loss": 0.4702, - "step": 84030 - }, - { - "epoch": 2.15, - "learning_rate": 3.890967742886705e-07, - "loss": 0.3787, - "step": 84031 - }, - { - "epoch": 2.15, - "learning_rate": 3.890748676781209e-07, - "loss": 0.282, - "step": 84032 - }, - { - "epoch": 2.15, - "learning_rate": 3.8905296153532863e-07, - "loss": 0.4263, - "step": 84033 - }, - { - "epoch": 2.15, - "learning_rate": 3.890310558603104e-07, - "loss": 0.2653, - "step": 84034 - }, - { - "epoch": 2.15, - "learning_rate": 3.890091506530837e-07, - "loss": 0.418, - "step": 84035 - }, - { - "epoch": 2.15, - "learning_rate": 3.8898724591366395e-07, - "loss": 0.4053, - "step": 84036 - }, - { - "epoch": 2.15, - "learning_rate": 3.889653416420685e-07, - "loss": 0.4141, - "step": 84037 - }, - { - "epoch": 2.15, - "learning_rate": 3.889434378383142e-07, - "loss": 0.4106, - "step": 84038 - }, - { - "epoch": 2.15, - "learning_rate": 3.8892153450241815e-07, - "loss": 0.4482, - "step": 84039 - }, - { - "epoch": 2.15, - "learning_rate": 3.8889963163439653e-07, - "loss": 0.4482, - "step": 84040 - }, - { - "epoch": 2.15, - "learning_rate": 3.8887772923426633e-07, - "loss": 0.4082, - "step": 84041 - }, - { - "epoch": 2.15, - "learning_rate": 3.888558273020442e-07, - "loss": 0.458, - "step": 84042 - }, - { - "epoch": 2.15, - "learning_rate": 3.888339258377475e-07, - "loss": 0.4585, - "step": 84043 - }, - { - "epoch": 2.15, - "learning_rate": 3.888120248413923e-07, - "loss": 0.4922, - "step": 84044 - }, - { - "epoch": 2.15, - "learning_rate": 3.8879012431299593e-07, - "loss": 0.4902, - "step": 84045 - }, - { - "epoch": 2.15, - "learning_rate": 3.887682242525745e-07, - "loss": 0.3845, - "step": 84046 - }, - { - "epoch": 2.15, - "learning_rate": 3.887463246601451e-07, - "loss": 0.4404, - "step": 84047 - }, - { - "epoch": 2.15, - "learning_rate": 3.8872442553572495e-07, - "loss": 0.2937, - "step": 84048 - }, - { - "epoch": 2.15, - "learning_rate": 3.8870252687933003e-07, - "loss": 0.3457, - "step": 84049 - }, - { - "epoch": 2.15, - "learning_rate": 3.886806286909774e-07, - "loss": 0.3435, - "step": 84050 - }, - { - "epoch": 2.15, - "learning_rate": 3.88658730970684e-07, - "loss": 0.4287, - "step": 84051 - }, - { - "epoch": 2.15, - "learning_rate": 3.8863683371846676e-07, - "loss": 0.4429, - "step": 84052 - }, - { - "epoch": 2.15, - "learning_rate": 3.8861493693434187e-07, - "loss": 0.394, - "step": 84053 - }, - { - "epoch": 2.15, - "learning_rate": 3.8859304061832656e-07, - "loss": 0.4851, - "step": 84054 - }, - { - "epoch": 2.15, - "learning_rate": 3.885711447704376e-07, - "loss": 0.4966, - "step": 84055 - }, - { - "epoch": 2.15, - "learning_rate": 3.8854924939069167e-07, - "loss": 0.4915, - "step": 84056 - }, - { - "epoch": 2.15, - "learning_rate": 3.885273544791051e-07, - "loss": 0.4561, - "step": 84057 - }, - { - "epoch": 2.15, - "learning_rate": 3.8850546003569505e-07, - "loss": 0.4229, - "step": 84058 - }, - { - "epoch": 2.15, - "learning_rate": 3.8848356606047817e-07, - "loss": 0.4829, - "step": 84059 - }, - { - "epoch": 2.15, - "learning_rate": 3.884616725534717e-07, - "loss": 0.4736, - "step": 84060 - }, - { - "epoch": 2.15, - "learning_rate": 3.8843977951469173e-07, - "loss": 0.394, - "step": 84061 - }, - { - "epoch": 2.15, - "learning_rate": 3.884178869441552e-07, - "loss": 0.4839, - "step": 84062 - }, - { - "epoch": 2.15, - "learning_rate": 3.88395994841879e-07, - "loss": 0.4941, - "step": 84063 - }, - { - "epoch": 2.15, - "learning_rate": 3.8837410320788035e-07, - "loss": 0.3828, - "step": 84064 - }, - { - "epoch": 2.15, - "learning_rate": 3.883522120421754e-07, - "loss": 0.4448, - "step": 84065 - }, - { - "epoch": 2.15, - "learning_rate": 3.883303213447806e-07, - "loss": 0.4038, - "step": 84066 - }, - { - "epoch": 2.15, - "learning_rate": 3.883084311157133e-07, - "loss": 0.4429, - "step": 84067 - }, - { - "epoch": 2.15, - "learning_rate": 3.8828654135499007e-07, - "loss": 0.415, - "step": 84068 - }, - { - "epoch": 2.15, - "learning_rate": 3.88264652062628e-07, - "loss": 0.3235, - "step": 84069 - }, - { - "epoch": 2.15, - "learning_rate": 3.882427632386432e-07, - "loss": 0.4468, - "step": 84070 - }, - { - "epoch": 2.15, - "learning_rate": 3.882208748830529e-07, - "loss": 0.3787, - "step": 84071 - }, - { - "epoch": 2.15, - "learning_rate": 3.881989869958736e-07, - "loss": 0.457, - "step": 84072 - }, - { - "epoch": 2.15, - "learning_rate": 3.8817709957712265e-07, - "loss": 0.3518, - "step": 84073 - }, - { - "epoch": 2.15, - "learning_rate": 3.881552126268161e-07, - "loss": 0.3569, - "step": 84074 - }, - { - "epoch": 2.15, - "learning_rate": 3.881333261449712e-07, - "loss": 0.3582, - "step": 84075 - }, - { - "epoch": 2.15, - "learning_rate": 3.881114401316041e-07, - "loss": 0.2848, - "step": 84076 - }, - { - "epoch": 2.15, - "learning_rate": 3.880895545867323e-07, - "loss": 0.4912, - "step": 84077 - }, - { - "epoch": 2.15, - "learning_rate": 3.8806766951037184e-07, - "loss": 0.3691, - "step": 84078 - }, - { - "epoch": 2.15, - "learning_rate": 3.880457849025399e-07, - "loss": 0.3809, - "step": 84079 - }, - { - "epoch": 2.16, - "learning_rate": 3.880239007632531e-07, - "loss": 0.416, - "step": 84080 - }, - { - "epoch": 2.16, - "learning_rate": 3.8800201709252865e-07, - "loss": 0.3635, - "step": 84081 - }, - { - "epoch": 2.16, - "learning_rate": 3.879801338903825e-07, - "loss": 0.2853, - "step": 84082 - }, - { - "epoch": 2.16, - "learning_rate": 3.879582511568319e-07, - "loss": 0.3396, - "step": 84083 - }, - { - "epoch": 2.16, - "learning_rate": 3.8793636889189353e-07, - "loss": 0.3779, - "step": 84084 - }, - { - "epoch": 2.16, - "learning_rate": 3.879144870955844e-07, - "loss": 0.5312, - "step": 84085 - }, - { - "epoch": 2.16, - "learning_rate": 3.8789260576792106e-07, - "loss": 0.3428, - "step": 84086 - }, - { - "epoch": 2.16, - "learning_rate": 3.878707249089198e-07, - "loss": 0.3549, - "step": 84087 - }, - { - "epoch": 2.16, - "learning_rate": 3.878488445185979e-07, - "loss": 0.4238, - "step": 84088 - }, - { - "epoch": 2.16, - "learning_rate": 3.8782696459697193e-07, - "loss": 0.4053, - "step": 84089 - }, - { - "epoch": 2.16, - "learning_rate": 3.8780508514405896e-07, - "loss": 0.311, - "step": 84090 - }, - { - "epoch": 2.16, - "learning_rate": 3.877832061598753e-07, - "loss": 0.3167, - "step": 84091 - }, - { - "epoch": 2.16, - "learning_rate": 3.8776132764443783e-07, - "loss": 0.5474, - "step": 84092 - }, - { - "epoch": 2.16, - "learning_rate": 3.877394495977636e-07, - "loss": 0.5249, - "step": 84093 - }, - { - "epoch": 2.16, - "learning_rate": 3.8771757201986887e-07, - "loss": 0.4272, - "step": 84094 - }, - { - "epoch": 2.16, - "learning_rate": 3.87695694910771e-07, - "loss": 0.4629, - "step": 84095 - }, - { - "epoch": 2.16, - "learning_rate": 3.8767381827048606e-07, - "loss": 0.3474, - "step": 84096 - }, - { - "epoch": 2.16, - "learning_rate": 3.876519420990311e-07, - "loss": 0.392, - "step": 84097 - }, - { - "epoch": 2.16, - "learning_rate": 3.8763006639642313e-07, - "loss": 0.3286, - "step": 84098 - }, - { - "epoch": 2.16, - "learning_rate": 3.876081911626784e-07, - "loss": 0.3979, - "step": 84099 - }, - { - "epoch": 2.16, - "learning_rate": 3.875863163978139e-07, - "loss": 0.3367, - "step": 84100 - }, - { - "epoch": 2.16, - "learning_rate": 3.875644421018465e-07, - "loss": 0.519, - "step": 84101 - }, - { - "epoch": 2.16, - "learning_rate": 3.8754256827479304e-07, - "loss": 0.4224, - "step": 84102 - }, - { - "epoch": 2.16, - "learning_rate": 3.8752069491666985e-07, - "loss": 0.4829, - "step": 84103 - }, - { - "epoch": 2.16, - "learning_rate": 3.8749882202749385e-07, - "loss": 0.436, - "step": 84104 - }, - { - "epoch": 2.16, - "learning_rate": 3.8747694960728215e-07, - "loss": 0.5405, - "step": 84105 - }, - { - "epoch": 2.16, - "learning_rate": 3.874550776560509e-07, - "loss": 0.3066, - "step": 84106 - }, - { - "epoch": 2.16, - "learning_rate": 3.8743320617381747e-07, - "loss": 0.4155, - "step": 84107 - }, - { - "epoch": 2.16, - "learning_rate": 3.874113351605979e-07, - "loss": 0.4868, - "step": 84108 - }, - { - "epoch": 2.16, - "learning_rate": 3.873894646164093e-07, - "loss": 0.3877, - "step": 84109 - }, - { - "epoch": 2.16, - "learning_rate": 3.873675945412688e-07, - "loss": 0.4849, - "step": 84110 - }, - { - "epoch": 2.16, - "learning_rate": 3.8734572493519233e-07, - "loss": 0.5166, - "step": 84111 - }, - { - "epoch": 2.16, - "learning_rate": 3.8732385579819717e-07, - "loss": 0.377, - "step": 84112 - }, - { - "epoch": 2.16, - "learning_rate": 3.873019871302998e-07, - "loss": 0.3536, - "step": 84113 - }, - { - "epoch": 2.16, - "learning_rate": 3.8728011893151767e-07, - "loss": 0.2193, - "step": 84114 - }, - { - "epoch": 2.16, - "learning_rate": 3.8725825120186695e-07, - "loss": 0.4253, - "step": 84115 - }, - { - "epoch": 2.16, - "learning_rate": 3.872363839413639e-07, - "loss": 0.4199, - "step": 84116 - }, - { - "epoch": 2.16, - "learning_rate": 3.8721451715002596e-07, - "loss": 0.437, - "step": 84117 - }, - { - "epoch": 2.16, - "learning_rate": 3.8719265082786956e-07, - "loss": 0.5093, - "step": 84118 - }, - { - "epoch": 2.16, - "learning_rate": 3.871707849749121e-07, - "loss": 0.478, - "step": 84119 - }, - { - "epoch": 2.16, - "learning_rate": 3.8714891959116925e-07, - "loss": 0.4072, - "step": 84120 - }, - { - "epoch": 2.16, - "learning_rate": 3.871270546766583e-07, - "loss": 0.312, - "step": 84121 - }, - { - "epoch": 2.16, - "learning_rate": 3.871051902313961e-07, - "loss": 0.4512, - "step": 84122 - }, - { - "epoch": 2.16, - "learning_rate": 3.8708332625539954e-07, - "loss": 0.4111, - "step": 84123 - }, - { - "epoch": 2.16, - "learning_rate": 3.870614627486848e-07, - "loss": 0.4702, - "step": 84124 - }, - { - "epoch": 2.16, - "learning_rate": 3.870395997112692e-07, - "loss": 0.3296, - "step": 84125 - }, - { - "epoch": 2.16, - "learning_rate": 3.870177371431689e-07, - "loss": 0.3599, - "step": 84126 - }, - { - "epoch": 2.16, - "learning_rate": 3.8699587504440123e-07, - "loss": 0.3357, - "step": 84127 - }, - { - "epoch": 2.16, - "learning_rate": 3.869740134149824e-07, - "loss": 0.3319, - "step": 84128 - }, - { - "epoch": 2.16, - "learning_rate": 3.8695215225492926e-07, - "loss": 0.3258, - "step": 84129 - }, - { - "epoch": 2.16, - "learning_rate": 3.869302915642587e-07, - "loss": 0.3745, - "step": 84130 - }, - { - "epoch": 2.16, - "learning_rate": 3.8690843134298777e-07, - "loss": 0.4321, - "step": 84131 - }, - { - "epoch": 2.16, - "learning_rate": 3.868865715911325e-07, - "loss": 0.4521, - "step": 84132 - }, - { - "epoch": 2.16, - "learning_rate": 3.8686471230871e-07, - "loss": 0.3521, - "step": 84133 - }, - { - "epoch": 2.16, - "learning_rate": 3.868428534957371e-07, - "loss": 0.2231, - "step": 84134 - }, - { - "epoch": 2.16, - "learning_rate": 3.8682099515223064e-07, - "loss": 0.3696, - "step": 84135 - }, - { - "epoch": 2.16, - "learning_rate": 3.867991372782072e-07, - "loss": 0.4092, - "step": 84136 - }, - { - "epoch": 2.16, - "learning_rate": 3.8677727987368315e-07, - "loss": 0.4321, - "step": 84137 - }, - { - "epoch": 2.16, - "learning_rate": 3.8675542293867547e-07, - "loss": 0.322, - "step": 84138 - }, - { - "epoch": 2.16, - "learning_rate": 3.86733566473201e-07, - "loss": 0.3213, - "step": 84139 - }, - { - "epoch": 2.16, - "learning_rate": 3.867117104772768e-07, - "loss": 0.4453, - "step": 84140 - }, - { - "epoch": 2.16, - "learning_rate": 3.8668985495091887e-07, - "loss": 0.3911, - "step": 84141 - }, - { - "epoch": 2.16, - "learning_rate": 3.8666799989414434e-07, - "loss": 0.2468, - "step": 84142 - }, - { - "epoch": 2.16, - "learning_rate": 3.866461453069699e-07, - "loss": 0.4648, - "step": 84143 - }, - { - "epoch": 2.16, - "learning_rate": 3.8662429118941267e-07, - "loss": 0.4775, - "step": 84144 - }, - { - "epoch": 2.16, - "learning_rate": 3.8660243754148903e-07, - "loss": 0.3755, - "step": 84145 - }, - { - "epoch": 2.16, - "learning_rate": 3.8658058436321526e-07, - "loss": 0.3895, - "step": 84146 - }, - { - "epoch": 2.16, - "learning_rate": 3.865587316546086e-07, - "loss": 0.4087, - "step": 84147 - }, - { - "epoch": 2.16, - "learning_rate": 3.8653687941568616e-07, - "loss": 0.4097, - "step": 84148 - }, - { - "epoch": 2.16, - "learning_rate": 3.865150276464637e-07, - "loss": 0.3828, - "step": 84149 - }, - { - "epoch": 2.16, - "learning_rate": 3.8649317634695856e-07, - "loss": 0.4023, - "step": 84150 - }, - { - "epoch": 2.16, - "learning_rate": 3.864713255171874e-07, - "loss": 0.4072, - "step": 84151 - }, - { - "epoch": 2.16, - "learning_rate": 3.864494751571673e-07, - "loss": 0.3999, - "step": 84152 - }, - { - "epoch": 2.16, - "learning_rate": 3.864276252669142e-07, - "loss": 0.2937, - "step": 84153 - }, - { - "epoch": 2.16, - "learning_rate": 3.8640577584644527e-07, - "loss": 0.2554, - "step": 84154 - }, - { - "epoch": 2.16, - "learning_rate": 3.8638392689577757e-07, - "loss": 0.3821, - "step": 84155 - }, - { - "epoch": 2.16, - "learning_rate": 3.863620784149272e-07, - "loss": 0.3945, - "step": 84156 - }, - { - "epoch": 2.16, - "learning_rate": 3.863402304039115e-07, - "loss": 0.356, - "step": 84157 - }, - { - "epoch": 2.16, - "learning_rate": 3.8631838286274656e-07, - "loss": 0.2657, - "step": 84158 - }, - { - "epoch": 2.16, - "learning_rate": 3.8629653579144926e-07, - "loss": 0.3125, - "step": 84159 - }, - { - "epoch": 2.16, - "learning_rate": 3.862746891900366e-07, - "loss": 0.4238, - "step": 84160 - }, - { - "epoch": 2.16, - "learning_rate": 3.862528430585256e-07, - "loss": 0.3542, - "step": 84161 - }, - { - "epoch": 2.16, - "learning_rate": 3.862309973969321e-07, - "loss": 0.4688, - "step": 84162 - }, - { - "epoch": 2.16, - "learning_rate": 3.862091522052734e-07, - "loss": 0.4048, - "step": 84163 - }, - { - "epoch": 2.16, - "learning_rate": 3.861873074835664e-07, - "loss": 0.3904, - "step": 84164 - }, - { - "epoch": 2.16, - "learning_rate": 3.8616546323182755e-07, - "loss": 0.2668, - "step": 84165 - }, - { - "epoch": 2.16, - "learning_rate": 3.861436194500732e-07, - "loss": 0.3872, - "step": 84166 - }, - { - "epoch": 2.16, - "learning_rate": 3.8612177613832064e-07, - "loss": 0.4146, - "step": 84167 - }, - { - "epoch": 2.16, - "learning_rate": 3.8609993329658617e-07, - "loss": 0.3656, - "step": 84168 - }, - { - "epoch": 2.16, - "learning_rate": 3.860780909248873e-07, - "loss": 0.1659, - "step": 84169 - }, - { - "epoch": 2.16, - "learning_rate": 3.8605624902323973e-07, - "loss": 0.4902, - "step": 84170 - }, - { - "epoch": 2.16, - "learning_rate": 3.8603440759166074e-07, - "loss": 0.3481, - "step": 84171 - }, - { - "epoch": 2.16, - "learning_rate": 3.860125666301669e-07, - "loss": 0.4047, - "step": 84172 - }, - { - "epoch": 2.16, - "learning_rate": 3.8599072613877546e-07, - "loss": 0.3826, - "step": 84173 - }, - { - "epoch": 2.16, - "learning_rate": 3.859688861175022e-07, - "loss": 0.4326, - "step": 84174 - }, - { - "epoch": 2.16, - "learning_rate": 3.859470465663648e-07, - "loss": 0.2064, - "step": 84175 - }, - { - "epoch": 2.16, - "learning_rate": 3.8592520748537915e-07, - "loss": 0.3818, - "step": 84176 - }, - { - "epoch": 2.16, - "learning_rate": 3.8590336887456233e-07, - "loss": 0.3674, - "step": 84177 - }, - { - "epoch": 2.16, - "learning_rate": 3.858815307339314e-07, - "loss": 0.4756, - "step": 84178 - }, - { - "epoch": 2.16, - "learning_rate": 3.858596930635023e-07, - "loss": 0.3796, - "step": 84179 - }, - { - "epoch": 2.16, - "learning_rate": 3.858378558632923e-07, - "loss": 0.3787, - "step": 84180 - }, - { - "epoch": 2.16, - "learning_rate": 3.858160191333183e-07, - "loss": 0.2665, - "step": 84181 - }, - { - "epoch": 2.16, - "learning_rate": 3.857941828735964e-07, - "loss": 0.4634, - "step": 84182 - }, - { - "epoch": 2.16, - "learning_rate": 3.8577234708414376e-07, - "loss": 0.4521, - "step": 84183 - }, - { - "epoch": 2.16, - "learning_rate": 3.8575051176497687e-07, - "loss": 0.3511, - "step": 84184 - }, - { - "epoch": 2.16, - "learning_rate": 3.85728676916113e-07, - "loss": 0.3774, - "step": 84185 - }, - { - "epoch": 2.16, - "learning_rate": 3.8570684253756836e-07, - "loss": 0.4287, - "step": 84186 - }, - { - "epoch": 2.16, - "learning_rate": 3.8568500862935935e-07, - "loss": 0.4263, - "step": 84187 - }, - { - "epoch": 2.16, - "learning_rate": 3.8566317519150314e-07, - "loss": 0.3887, - "step": 84188 - }, - { - "epoch": 2.16, - "learning_rate": 3.8564134222401645e-07, - "loss": 0.4502, - "step": 84189 - }, - { - "epoch": 2.16, - "learning_rate": 3.8561950972691626e-07, - "loss": 0.276, - "step": 84190 - }, - { - "epoch": 2.16, - "learning_rate": 3.855976777002186e-07, - "loss": 0.4351, - "step": 84191 - }, - { - "epoch": 2.16, - "learning_rate": 3.8557584614394055e-07, - "loss": 0.3682, - "step": 84192 - }, - { - "epoch": 2.16, - "learning_rate": 3.855540150580988e-07, - "loss": 0.3306, - "step": 84193 - }, - { - "epoch": 2.16, - "learning_rate": 3.855321844427104e-07, - "loss": 0.2659, - "step": 84194 - }, - { - "epoch": 2.16, - "learning_rate": 3.855103542977919e-07, - "loss": 0.3265, - "step": 84195 - }, - { - "epoch": 2.16, - "learning_rate": 3.854885246233593e-07, - "loss": 0.4409, - "step": 84196 - }, - { - "epoch": 2.16, - "learning_rate": 3.8546669541943e-07, - "loss": 0.3264, - "step": 84197 - }, - { - "epoch": 2.16, - "learning_rate": 3.8544486668602094e-07, - "loss": 0.3774, - "step": 84198 - }, - { - "epoch": 2.16, - "learning_rate": 3.8542303842314815e-07, - "loss": 0.4482, - "step": 84199 - }, - { - "epoch": 2.16, - "learning_rate": 3.8540121063082873e-07, - "loss": 0.4492, - "step": 84200 - }, - { - "epoch": 2.16, - "learning_rate": 3.8537938330907926e-07, - "loss": 0.3538, - "step": 84201 - }, - { - "epoch": 2.16, - "learning_rate": 3.853575564579169e-07, - "loss": 0.4058, - "step": 84202 - }, - { - "epoch": 2.16, - "learning_rate": 3.8533573007735767e-07, - "loss": 0.562, - "step": 84203 - }, - { - "epoch": 2.16, - "learning_rate": 3.853139041674186e-07, - "loss": 0.3722, - "step": 84204 - }, - { - "epoch": 2.16, - "learning_rate": 3.8529207872811677e-07, - "loss": 0.3877, - "step": 84205 - }, - { - "epoch": 2.16, - "learning_rate": 3.852702537594681e-07, - "loss": 0.4854, - "step": 84206 - }, - { - "epoch": 2.16, - "learning_rate": 3.8524842926149014e-07, - "loss": 0.436, - "step": 84207 - }, - { - "epoch": 2.16, - "learning_rate": 3.8522660523419893e-07, - "loss": 0.4888, - "step": 84208 - }, - { - "epoch": 2.16, - "learning_rate": 3.852047816776113e-07, - "loss": 0.3679, - "step": 84209 - }, - { - "epoch": 2.16, - "learning_rate": 3.851829585917442e-07, - "loss": 0.4048, - "step": 84210 - }, - { - "epoch": 2.16, - "learning_rate": 3.8516113597661446e-07, - "loss": 0.4272, - "step": 84211 - }, - { - "epoch": 2.16, - "learning_rate": 3.851393138322383e-07, - "loss": 0.4248, - "step": 84212 - }, - { - "epoch": 2.16, - "learning_rate": 3.8511749215863276e-07, - "loss": 0.3979, - "step": 84213 - }, - { - "epoch": 2.16, - "learning_rate": 3.850956709558144e-07, - "loss": 0.3203, - "step": 84214 - }, - { - "epoch": 2.16, - "learning_rate": 3.850738502238008e-07, - "loss": 0.3835, - "step": 84215 - }, - { - "epoch": 2.16, - "learning_rate": 3.85052029962607e-07, - "loss": 0.4102, - "step": 84216 - }, - { - "epoch": 2.16, - "learning_rate": 3.850302101722508e-07, - "loss": 0.4878, - "step": 84217 - }, - { - "epoch": 2.16, - "learning_rate": 3.850083908527485e-07, - "loss": 0.3857, - "step": 84218 - }, - { - "epoch": 2.16, - "learning_rate": 3.8498657200411744e-07, - "loss": 0.4873, - "step": 84219 - }, - { - "epoch": 2.16, - "learning_rate": 3.8496475362637357e-07, - "loss": 0.354, - "step": 84220 - }, - { - "epoch": 2.16, - "learning_rate": 3.8494293571953385e-07, - "loss": 0.3892, - "step": 84221 - }, - { - "epoch": 2.16, - "learning_rate": 3.8492111828361507e-07, - "loss": 0.3813, - "step": 84222 - }, - { - "epoch": 2.16, - "learning_rate": 3.848993013186342e-07, - "loss": 0.4187, - "step": 84223 - }, - { - "epoch": 2.16, - "learning_rate": 3.8487748482460735e-07, - "loss": 0.3774, - "step": 84224 - }, - { - "epoch": 2.16, - "learning_rate": 3.8485566880155186e-07, - "loss": 0.4526, - "step": 84225 - }, - { - "epoch": 2.16, - "learning_rate": 3.848338532494838e-07, - "loss": 0.4541, - "step": 84226 - }, - { - "epoch": 2.16, - "learning_rate": 3.848120381684201e-07, - "loss": 0.4839, - "step": 84227 - }, - { - "epoch": 2.16, - "learning_rate": 3.847902235583779e-07, - "loss": 0.4021, - "step": 84228 - }, - { - "epoch": 2.16, - "learning_rate": 3.847684094193733e-07, - "loss": 0.4072, - "step": 84229 - }, - { - "epoch": 2.16, - "learning_rate": 3.847465957514231e-07, - "loss": 0.2708, - "step": 84230 - }, - { - "epoch": 2.16, - "learning_rate": 3.847247825545442e-07, - "loss": 0.2715, - "step": 84231 - }, - { - "epoch": 2.16, - "learning_rate": 3.847029698287535e-07, - "loss": 0.4561, - "step": 84232 - }, - { - "epoch": 2.16, - "learning_rate": 3.8468115757406715e-07, - "loss": 0.2569, - "step": 84233 - }, - { - "epoch": 2.16, - "learning_rate": 3.846593457905026e-07, - "loss": 0.5361, - "step": 84234 - }, - { - "epoch": 2.16, - "learning_rate": 3.846375344780757e-07, - "loss": 0.4097, - "step": 84235 - }, - { - "epoch": 2.16, - "learning_rate": 3.846157236368038e-07, - "loss": 0.4106, - "step": 84236 - }, - { - "epoch": 2.16, - "learning_rate": 3.845939132667031e-07, - "loss": 0.3967, - "step": 84237 - }, - { - "epoch": 2.16, - "learning_rate": 3.8457210336779045e-07, - "loss": 0.478, - "step": 84238 - }, - { - "epoch": 2.16, - "learning_rate": 3.8455029394008263e-07, - "loss": 0.3999, - "step": 84239 - }, - { - "epoch": 2.16, - "learning_rate": 3.845284849835968e-07, - "loss": 0.3646, - "step": 84240 - }, - { - "epoch": 2.16, - "learning_rate": 3.8450667649834877e-07, - "loss": 0.3723, - "step": 84241 - }, - { - "epoch": 2.16, - "learning_rate": 3.844848684843558e-07, - "loss": 0.4331, - "step": 84242 - }, - { - "epoch": 2.16, - "learning_rate": 3.844630609416344e-07, - "loss": 0.3784, - "step": 84243 - }, - { - "epoch": 2.16, - "learning_rate": 3.8444125387020164e-07, - "loss": 0.438, - "step": 84244 - }, - { - "epoch": 2.16, - "learning_rate": 3.844194472700739e-07, - "loss": 0.437, - "step": 84245 - }, - { - "epoch": 2.16, - "learning_rate": 3.843976411412676e-07, - "loss": 0.3406, - "step": 84246 - }, - { - "epoch": 2.16, - "learning_rate": 3.843758354837997e-07, - "loss": 0.4204, - "step": 84247 - }, - { - "epoch": 2.16, - "learning_rate": 3.8435403029768685e-07, - "loss": 0.3081, - "step": 84248 - }, - { - "epoch": 2.16, - "learning_rate": 3.843322255829463e-07, - "loss": 0.4331, - "step": 84249 - }, - { - "epoch": 2.16, - "learning_rate": 3.843104213395938e-07, - "loss": 0.386, - "step": 84250 - }, - { - "epoch": 2.16, - "learning_rate": 3.842886175676465e-07, - "loss": 0.4028, - "step": 84251 - }, - { - "epoch": 2.16, - "learning_rate": 3.8426681426712113e-07, - "loss": 0.4663, - "step": 84252 - }, - { - "epoch": 2.16, - "learning_rate": 3.842450114380347e-07, - "loss": 0.4873, - "step": 84253 - }, - { - "epoch": 2.16, - "learning_rate": 3.842232090804035e-07, - "loss": 0.3774, - "step": 84254 - }, - { - "epoch": 2.16, - "learning_rate": 3.84201407194244e-07, - "loss": 0.3594, - "step": 84255 - }, - { - "epoch": 2.16, - "learning_rate": 3.841796057795731e-07, - "loss": 0.4937, - "step": 84256 - }, - { - "epoch": 2.16, - "learning_rate": 3.841578048364079e-07, - "loss": 0.3438, - "step": 84257 - }, - { - "epoch": 2.16, - "learning_rate": 3.841360043647645e-07, - "loss": 0.3179, - "step": 84258 - }, - { - "epoch": 2.16, - "learning_rate": 3.841142043646598e-07, - "loss": 0.3424, - "step": 84259 - }, - { - "epoch": 2.16, - "learning_rate": 3.840924048361105e-07, - "loss": 0.4575, - "step": 84260 - }, - { - "epoch": 2.16, - "learning_rate": 3.840706057791338e-07, - "loss": 0.3901, - "step": 84261 - }, - { - "epoch": 2.16, - "learning_rate": 3.840488071937453e-07, - "loss": 0.479, - "step": 84262 - }, - { - "epoch": 2.16, - "learning_rate": 3.8402700907996254e-07, - "loss": 0.479, - "step": 84263 - }, - { - "epoch": 2.16, - "learning_rate": 3.8400521143780216e-07, - "loss": 0.5093, - "step": 84264 - }, - { - "epoch": 2.16, - "learning_rate": 3.839834142672804e-07, - "loss": 0.3833, - "step": 84265 - }, - { - "epoch": 2.16, - "learning_rate": 3.839616175684146e-07, - "loss": 0.4897, - "step": 84266 - }, - { - "epoch": 2.16, - "learning_rate": 3.8393982134122073e-07, - "loss": 0.4707, - "step": 84267 - }, - { - "epoch": 2.16, - "learning_rate": 3.839180255857157e-07, - "loss": 0.3882, - "step": 84268 - }, - { - "epoch": 2.16, - "learning_rate": 3.8389623030191645e-07, - "loss": 0.4805, - "step": 84269 - }, - { - "epoch": 2.16, - "learning_rate": 3.838744354898398e-07, - "loss": 0.429, - "step": 84270 - }, - { - "epoch": 2.16, - "learning_rate": 3.838526411495018e-07, - "loss": 0.3398, - "step": 84271 - }, - { - "epoch": 2.16, - "learning_rate": 3.838308472809195e-07, - "loss": 0.5142, - "step": 84272 - }, - { - "epoch": 2.16, - "learning_rate": 3.8380905388411e-07, - "loss": 0.3932, - "step": 84273 - }, - { - "epoch": 2.16, - "learning_rate": 3.837872609590895e-07, - "loss": 0.4172, - "step": 84274 - }, - { - "epoch": 2.16, - "learning_rate": 3.837654685058744e-07, - "loss": 0.3262, - "step": 84275 - }, - { - "epoch": 2.16, - "learning_rate": 3.837436765244818e-07, - "loss": 0.418, - "step": 84276 - }, - { - "epoch": 2.16, - "learning_rate": 3.8372188501492843e-07, - "loss": 0.2736, - "step": 84277 - }, - { - "epoch": 2.16, - "learning_rate": 3.83700093977231e-07, - "loss": 0.3618, - "step": 84278 - }, - { - "epoch": 2.16, - "learning_rate": 3.8367830341140596e-07, - "loss": 0.323, - "step": 84279 - }, - { - "epoch": 2.16, - "learning_rate": 3.8365651331746995e-07, - "loss": 0.3608, - "step": 84280 - }, - { - "epoch": 2.16, - "learning_rate": 3.836347236954398e-07, - "loss": 0.4932, - "step": 84281 - }, - { - "epoch": 2.16, - "learning_rate": 3.836129345453326e-07, - "loss": 0.4487, - "step": 84282 - }, - { - "epoch": 2.16, - "learning_rate": 3.8359114586716425e-07, - "loss": 0.3433, - "step": 84283 - }, - { - "epoch": 2.16, - "learning_rate": 3.8356935766095223e-07, - "loss": 0.4009, - "step": 84284 - }, - { - "epoch": 2.16, - "learning_rate": 3.835475699267123e-07, - "loss": 0.328, - "step": 84285 - }, - { - "epoch": 2.16, - "learning_rate": 3.8352578266446187e-07, - "loss": 0.2615, - "step": 84286 - }, - { - "epoch": 2.16, - "learning_rate": 3.835039958742177e-07, - "loss": 0.4229, - "step": 84287 - }, - { - "epoch": 2.16, - "learning_rate": 3.8348220955599567e-07, - "loss": 0.3984, - "step": 84288 - }, - { - "epoch": 2.16, - "learning_rate": 3.8346042370981315e-07, - "loss": 0.4204, - "step": 84289 - }, - { - "epoch": 2.16, - "learning_rate": 3.834386383356868e-07, - "loss": 0.3882, - "step": 84290 - }, - { - "epoch": 2.16, - "learning_rate": 3.8341685343363295e-07, - "loss": 0.3834, - "step": 84291 - }, - { - "epoch": 2.16, - "learning_rate": 3.8339506900366835e-07, - "loss": 0.5098, - "step": 84292 - }, - { - "epoch": 2.16, - "learning_rate": 3.833732850458099e-07, - "loss": 0.3262, - "step": 84293 - }, - { - "epoch": 2.16, - "learning_rate": 3.8335150156007443e-07, - "loss": 0.3896, - "step": 84294 - }, - { - "epoch": 2.16, - "learning_rate": 3.8332971854647836e-07, - "loss": 0.3452, - "step": 84295 - }, - { - "epoch": 2.16, - "learning_rate": 3.833079360050381e-07, - "loss": 0.4727, - "step": 84296 - }, - { - "epoch": 2.16, - "learning_rate": 3.8328615393577056e-07, - "loss": 0.4517, - "step": 84297 - }, - { - "epoch": 2.16, - "learning_rate": 3.8326437233869235e-07, - "loss": 0.3682, - "step": 84298 - }, - { - "epoch": 2.16, - "learning_rate": 3.832425912138207e-07, - "loss": 0.2932, - "step": 84299 - }, - { - "epoch": 2.16, - "learning_rate": 3.832208105611715e-07, - "loss": 0.353, - "step": 84300 - }, - { - "epoch": 2.16, - "learning_rate": 3.831990303807617e-07, - "loss": 0.4316, - "step": 84301 - }, - { - "epoch": 2.16, - "learning_rate": 3.831772506726082e-07, - "loss": 0.3386, - "step": 84302 - }, - { - "epoch": 2.16, - "learning_rate": 3.831554714367278e-07, - "loss": 0.3462, - "step": 84303 - }, - { - "epoch": 2.16, - "learning_rate": 3.831336926731368e-07, - "loss": 0.48, - "step": 84304 - }, - { - "epoch": 2.16, - "learning_rate": 3.8311191438185167e-07, - "loss": 0.4585, - "step": 84305 - }, - { - "epoch": 2.16, - "learning_rate": 3.830901365628894e-07, - "loss": 0.344, - "step": 84306 - }, - { - "epoch": 2.16, - "learning_rate": 3.830683592162669e-07, - "loss": 0.3119, - "step": 84307 - }, - { - "epoch": 2.16, - "learning_rate": 3.8304658234200037e-07, - "loss": 0.4624, - "step": 84308 - }, - { - "epoch": 2.16, - "learning_rate": 3.830248059401067e-07, - "loss": 0.4058, - "step": 84309 - }, - { - "epoch": 2.16, - "learning_rate": 3.830030300106024e-07, - "loss": 0.3367, - "step": 84310 - }, - { - "epoch": 2.16, - "learning_rate": 3.8298125455350485e-07, - "loss": 0.2988, - "step": 84311 - }, - { - "epoch": 2.16, - "learning_rate": 3.829594795688298e-07, - "loss": 0.3341, - "step": 84312 - }, - { - "epoch": 2.16, - "learning_rate": 3.829377050565942e-07, - "loss": 0.3652, - "step": 84313 - }, - { - "epoch": 2.16, - "learning_rate": 3.829159310168152e-07, - "loss": 0.4761, - "step": 84314 - }, - { - "epoch": 2.16, - "learning_rate": 3.828941574495088e-07, - "loss": 0.4883, - "step": 84315 - }, - { - "epoch": 2.16, - "learning_rate": 3.828723843546924e-07, - "loss": 0.2949, - "step": 84316 - }, - { - "epoch": 2.16, - "learning_rate": 3.8285061173238175e-07, - "loss": 0.439, - "step": 84317 - }, - { - "epoch": 2.16, - "learning_rate": 3.8282883958259404e-07, - "loss": 0.3008, - "step": 84318 - }, - { - "epoch": 2.16, - "learning_rate": 3.828070679053459e-07, - "loss": 0.4746, - "step": 84319 - }, - { - "epoch": 2.16, - "learning_rate": 3.827852967006544e-07, - "loss": 0.502, - "step": 84320 - }, - { - "epoch": 2.16, - "learning_rate": 3.827635259685354e-07, - "loss": 0.4512, - "step": 84321 - }, - { - "epoch": 2.16, - "learning_rate": 3.8274175570900603e-07, - "loss": 0.2839, - "step": 84322 - }, - { - "epoch": 2.16, - "learning_rate": 3.82719985922083e-07, - "loss": 0.3569, - "step": 84323 - }, - { - "epoch": 2.16, - "learning_rate": 3.8269821660778345e-07, - "loss": 0.2767, - "step": 84324 - }, - { - "epoch": 2.16, - "learning_rate": 3.8267644776612284e-07, - "loss": 0.3823, - "step": 84325 - }, - { - "epoch": 2.16, - "learning_rate": 3.826546793971186e-07, - "loss": 0.48, - "step": 84326 - }, - { - "epoch": 2.16, - "learning_rate": 3.826329115007871e-07, - "loss": 0.4512, - "step": 84327 - }, - { - "epoch": 2.16, - "learning_rate": 3.8261114407714567e-07, - "loss": 0.3555, - "step": 84328 - }, - { - "epoch": 2.16, - "learning_rate": 3.825893771262101e-07, - "loss": 0.4399, - "step": 84329 - }, - { - "epoch": 2.16, - "learning_rate": 3.825676106479975e-07, - "loss": 0.3472, - "step": 84330 - }, - { - "epoch": 2.16, - "learning_rate": 3.8254584464252447e-07, - "loss": 0.4023, - "step": 84331 - }, - { - "epoch": 2.16, - "learning_rate": 3.82524079109808e-07, - "loss": 0.4951, - "step": 84332 - }, - { - "epoch": 2.16, - "learning_rate": 3.825023140498641e-07, - "loss": 0.4331, - "step": 84333 - }, - { - "epoch": 2.16, - "learning_rate": 3.824805494627102e-07, - "loss": 0.416, - "step": 84334 - }, - { - "epoch": 2.16, - "learning_rate": 3.824587853483622e-07, - "loss": 0.3064, - "step": 84335 - }, - { - "epoch": 2.16, - "learning_rate": 3.82437021706837e-07, - "loss": 0.4326, - "step": 84336 - }, - { - "epoch": 2.16, - "learning_rate": 3.824152585381518e-07, - "loss": 0.4487, - "step": 84337 - }, - { - "epoch": 2.16, - "learning_rate": 3.823934958423225e-07, - "loss": 0.4648, - "step": 84338 - }, - { - "epoch": 2.16, - "learning_rate": 3.8237173361936615e-07, - "loss": 0.4604, - "step": 84339 - }, - { - "epoch": 2.16, - "learning_rate": 3.823499718692993e-07, - "loss": 0.3467, - "step": 84340 - }, - { - "epoch": 2.16, - "learning_rate": 3.8232821059213906e-07, - "loss": 0.4546, - "step": 84341 - }, - { - "epoch": 2.16, - "learning_rate": 3.823064497879013e-07, - "loss": 0.4556, - "step": 84342 - }, - { - "epoch": 2.16, - "learning_rate": 3.822846894566031e-07, - "loss": 0.4673, - "step": 84343 - }, - { - "epoch": 2.16, - "learning_rate": 3.8226292959826156e-07, - "loss": 0.3625, - "step": 84344 - }, - { - "epoch": 2.16, - "learning_rate": 3.822411702128928e-07, - "loss": 0.46, - "step": 84345 - }, - { - "epoch": 2.16, - "learning_rate": 3.822194113005132e-07, - "loss": 0.3496, - "step": 84346 - }, - { - "epoch": 2.16, - "learning_rate": 3.8219765286113983e-07, - "loss": 0.4102, - "step": 84347 - }, - { - "epoch": 2.16, - "learning_rate": 3.821758948947893e-07, - "loss": 0.449, - "step": 84348 - }, - { - "epoch": 2.16, - "learning_rate": 3.821541374014786e-07, - "loss": 0.3338, - "step": 84349 - }, - { - "epoch": 2.16, - "learning_rate": 3.8213238038122375e-07, - "loss": 0.3125, - "step": 84350 - }, - { - "epoch": 2.16, - "learning_rate": 3.821106238340418e-07, - "loss": 0.3848, - "step": 84351 - }, - { - "epoch": 2.16, - "learning_rate": 3.820888677599492e-07, - "loss": 0.4443, - "step": 84352 - }, - { - "epoch": 2.16, - "learning_rate": 3.8206711215896314e-07, - "loss": 0.2826, - "step": 84353 - }, - { - "epoch": 2.16, - "learning_rate": 3.820453570311e-07, - "loss": 0.281, - "step": 84354 - }, - { - "epoch": 2.16, - "learning_rate": 3.820236023763758e-07, - "loss": 0.3745, - "step": 84355 - }, - { - "epoch": 2.16, - "learning_rate": 3.820018481948077e-07, - "loss": 0.3584, - "step": 84356 - }, - { - "epoch": 2.16, - "learning_rate": 3.8198009448641244e-07, - "loss": 0.3933, - "step": 84357 - }, - { - "epoch": 2.16, - "learning_rate": 3.81958341251207e-07, - "loss": 0.5293, - "step": 84358 - }, - { - "epoch": 2.16, - "learning_rate": 3.8193658848920727e-07, - "loss": 0.3752, - "step": 84359 - }, - { - "epoch": 2.16, - "learning_rate": 3.819148362004302e-07, - "loss": 0.2527, - "step": 84360 - }, - { - "epoch": 2.16, - "learning_rate": 3.81893084384893e-07, - "loss": 0.457, - "step": 84361 - }, - { - "epoch": 2.16, - "learning_rate": 3.818713330426113e-07, - "loss": 0.4912, - "step": 84362 - }, - { - "epoch": 2.16, - "learning_rate": 3.8184958217360243e-07, - "loss": 0.3926, - "step": 84363 - }, - { - "epoch": 2.16, - "learning_rate": 3.8182783177788323e-07, - "loss": 0.3691, - "step": 84364 - }, - { - "epoch": 2.16, - "learning_rate": 3.818060818554697e-07, - "loss": 0.478, - "step": 84365 - }, - { - "epoch": 2.16, - "learning_rate": 3.817843324063792e-07, - "loss": 0.4385, - "step": 84366 - }, - { - "epoch": 2.16, - "learning_rate": 3.8176258343062763e-07, - "loss": 0.4072, - "step": 84367 - }, - { - "epoch": 2.16, - "learning_rate": 3.8174083492823205e-07, - "loss": 0.3174, - "step": 84368 - }, - { - "epoch": 2.16, - "learning_rate": 3.8171908689920904e-07, - "loss": 0.4243, - "step": 84369 - }, - { - "epoch": 2.16, - "learning_rate": 3.8169733934357575e-07, - "loss": 0.4414, - "step": 84370 - }, - { - "epoch": 2.16, - "learning_rate": 3.8167559226134795e-07, - "loss": 0.396, - "step": 84371 - }, - { - "epoch": 2.16, - "learning_rate": 3.8165384565254265e-07, - "loss": 0.4272, - "step": 84372 - }, - { - "epoch": 2.16, - "learning_rate": 3.8163209951717667e-07, - "loss": 0.3478, - "step": 84373 - }, - { - "epoch": 2.16, - "learning_rate": 3.8161035385526685e-07, - "loss": 0.3782, - "step": 84374 - }, - { - "epoch": 2.16, - "learning_rate": 3.815886086668295e-07, - "loss": 0.5181, - "step": 84375 - }, - { - "epoch": 2.16, - "learning_rate": 3.8156686395188107e-07, - "loss": 0.5161, - "step": 84376 - }, - { - "epoch": 2.16, - "learning_rate": 3.8154511971043846e-07, - "loss": 0.3273, - "step": 84377 - }, - { - "epoch": 2.16, - "learning_rate": 3.815233759425186e-07, - "loss": 0.4141, - "step": 84378 - }, - { - "epoch": 2.16, - "learning_rate": 3.815016326481375e-07, - "loss": 0.3896, - "step": 84379 - }, - { - "epoch": 2.16, - "learning_rate": 3.814798898273122e-07, - "loss": 0.4136, - "step": 84380 - }, - { - "epoch": 2.16, - "learning_rate": 3.8145814748005934e-07, - "loss": 0.2812, - "step": 84381 - }, - { - "epoch": 2.16, - "learning_rate": 3.814364056063958e-07, - "loss": 0.3561, - "step": 84382 - }, - { - "epoch": 2.16, - "learning_rate": 3.814146642063376e-07, - "loss": 0.3828, - "step": 84383 - }, - { - "epoch": 2.16, - "learning_rate": 3.813929232799021e-07, - "loss": 0.2969, - "step": 84384 - }, - { - "epoch": 2.16, - "learning_rate": 3.8137118282710536e-07, - "loss": 0.4287, - "step": 84385 - }, - { - "epoch": 2.16, - "learning_rate": 3.813494428479642e-07, - "loss": 0.3525, - "step": 84386 - }, - { - "epoch": 2.16, - "learning_rate": 3.813277033424956e-07, - "loss": 0.3008, - "step": 84387 - }, - { - "epoch": 2.16, - "learning_rate": 3.813059643107157e-07, - "loss": 0.3318, - "step": 84388 - }, - { - "epoch": 2.16, - "learning_rate": 3.812842257526414e-07, - "loss": 0.4492, - "step": 84389 - }, - { - "epoch": 2.16, - "learning_rate": 3.812624876682892e-07, - "loss": 0.2203, - "step": 84390 - }, - { - "epoch": 2.16, - "learning_rate": 3.812407500576763e-07, - "loss": 0.418, - "step": 84391 - }, - { - "epoch": 2.16, - "learning_rate": 3.812190129208185e-07, - "loss": 0.2435, - "step": 84392 - }, - { - "epoch": 2.16, - "learning_rate": 3.8119727625773277e-07, - "loss": 0.3525, - "step": 84393 - }, - { - "epoch": 2.16, - "learning_rate": 3.8117554006843634e-07, - "loss": 0.4321, - "step": 84394 - }, - { - "epoch": 2.16, - "learning_rate": 3.811538043529453e-07, - "loss": 0.2795, - "step": 84395 - }, - { - "epoch": 2.16, - "learning_rate": 3.8113206911127595e-07, - "loss": 0.2905, - "step": 84396 - }, - { - "epoch": 2.16, - "learning_rate": 3.811103343434453e-07, - "loss": 0.2708, - "step": 84397 - }, - { - "epoch": 2.16, - "learning_rate": 3.810886000494701e-07, - "loss": 0.3076, - "step": 84398 - }, - { - "epoch": 2.16, - "learning_rate": 3.810668662293671e-07, - "loss": 0.4604, - "step": 84399 - }, - { - "epoch": 2.16, - "learning_rate": 3.8104513288315256e-07, - "loss": 0.3696, - "step": 84400 - }, - { - "epoch": 2.16, - "learning_rate": 3.810234000108432e-07, - "loss": 0.4302, - "step": 84401 - }, - { - "epoch": 2.16, - "learning_rate": 3.810016676124558e-07, - "loss": 0.4097, - "step": 84402 - }, - { - "epoch": 2.16, - "learning_rate": 3.8097993568800737e-07, - "loss": 0.3563, - "step": 84403 - }, - { - "epoch": 2.16, - "learning_rate": 3.80958204237514e-07, - "loss": 0.5146, - "step": 84404 - }, - { - "epoch": 2.16, - "learning_rate": 3.809364732609922e-07, - "loss": 0.3999, - "step": 84405 - }, - { - "epoch": 2.16, - "learning_rate": 3.809147427584589e-07, - "loss": 0.4065, - "step": 84406 - }, - { - "epoch": 2.16, - "learning_rate": 3.808930127299307e-07, - "loss": 0.4985, - "step": 84407 - }, - { - "epoch": 2.16, - "learning_rate": 3.808712831754245e-07, - "loss": 0.4106, - "step": 84408 - }, - { - "epoch": 2.16, - "learning_rate": 3.8084955409495647e-07, - "loss": 0.4321, - "step": 84409 - }, - { - "epoch": 2.16, - "learning_rate": 3.808278254885434e-07, - "loss": 0.353, - "step": 84410 - }, - { - "epoch": 2.16, - "learning_rate": 3.808060973562021e-07, - "loss": 0.4829, - "step": 84411 - }, - { - "epoch": 2.16, - "learning_rate": 3.8078436969794924e-07, - "loss": 0.5312, - "step": 84412 - }, - { - "epoch": 2.16, - "learning_rate": 3.8076264251380106e-07, - "loss": 0.4604, - "step": 84413 - }, - { - "epoch": 2.16, - "learning_rate": 3.8074091580377486e-07, - "loss": 0.395, - "step": 84414 - }, - { - "epoch": 2.16, - "learning_rate": 3.807191895678865e-07, - "loss": 0.3743, - "step": 84415 - }, - { - "epoch": 2.16, - "learning_rate": 3.806974638061533e-07, - "loss": 0.4053, - "step": 84416 - }, - { - "epoch": 2.16, - "learning_rate": 3.8067573851859125e-07, - "loss": 0.5068, - "step": 84417 - }, - { - "epoch": 2.16, - "learning_rate": 3.806540137052173e-07, - "loss": 0.323, - "step": 84418 - }, - { - "epoch": 2.16, - "learning_rate": 3.806322893660482e-07, - "loss": 0.4058, - "step": 84419 - }, - { - "epoch": 2.16, - "learning_rate": 3.806105655011007e-07, - "loss": 0.4346, - "step": 84420 - }, - { - "epoch": 2.16, - "learning_rate": 3.8058884211039087e-07, - "loss": 0.4287, - "step": 84421 - }, - { - "epoch": 2.16, - "learning_rate": 3.805671191939357e-07, - "loss": 0.215, - "step": 84422 - }, - { - "epoch": 2.16, - "learning_rate": 3.805453967517518e-07, - "loss": 0.3416, - "step": 84423 - }, - { - "epoch": 2.16, - "learning_rate": 3.8052367478385616e-07, - "loss": 0.4121, - "step": 84424 - }, - { - "epoch": 2.16, - "learning_rate": 3.80501953290265e-07, - "loss": 0.438, - "step": 84425 - }, - { - "epoch": 2.16, - "learning_rate": 3.8048023227099477e-07, - "loss": 0.4038, - "step": 84426 - }, - { - "epoch": 2.16, - "learning_rate": 3.8045851172606225e-07, - "loss": 0.2635, - "step": 84427 - }, - { - "epoch": 2.16, - "learning_rate": 3.8043679165548427e-07, - "loss": 0.522, - "step": 84428 - }, - { - "epoch": 2.16, - "learning_rate": 3.8041507205927757e-07, - "loss": 0.478, - "step": 84429 - }, - { - "epoch": 2.16, - "learning_rate": 3.8039335293745823e-07, - "loss": 0.5332, - "step": 84430 - }, - { - "epoch": 2.16, - "learning_rate": 3.8037163429004325e-07, - "loss": 0.3965, - "step": 84431 - }, - { - "epoch": 2.16, - "learning_rate": 3.8034991611704926e-07, - "loss": 0.4783, - "step": 84432 - }, - { - "epoch": 2.16, - "learning_rate": 3.803281984184932e-07, - "loss": 0.481, - "step": 84433 - }, - { - "epoch": 2.16, - "learning_rate": 3.8030648119439124e-07, - "loss": 0.3708, - "step": 84434 - }, - { - "epoch": 2.16, - "learning_rate": 3.802847644447598e-07, - "loss": 0.3208, - "step": 84435 - }, - { - "epoch": 2.16, - "learning_rate": 3.8026304816961584e-07, - "loss": 0.4463, - "step": 84436 - }, - { - "epoch": 2.16, - "learning_rate": 3.802413323689764e-07, - "loss": 0.3569, - "step": 84437 - }, - { - "epoch": 2.16, - "learning_rate": 3.802196170428572e-07, - "loss": 0.3711, - "step": 84438 - }, - { - "epoch": 2.16, - "learning_rate": 3.8019790219127533e-07, - "loss": 0.4185, - "step": 84439 - }, - { - "epoch": 2.16, - "learning_rate": 3.801761878142475e-07, - "loss": 0.4546, - "step": 84440 - }, - { - "epoch": 2.16, - "learning_rate": 3.801544739117906e-07, - "loss": 0.3613, - "step": 84441 - }, - { - "epoch": 2.16, - "learning_rate": 3.801327604839205e-07, - "loss": 0.4104, - "step": 84442 - }, - { - "epoch": 2.16, - "learning_rate": 3.8011104753065436e-07, - "loss": 0.4502, - "step": 84443 - }, - { - "epoch": 2.16, - "learning_rate": 3.80089335052009e-07, - "loss": 0.3201, - "step": 84444 - }, - { - "epoch": 2.16, - "learning_rate": 3.8006762304800035e-07, - "loss": 0.4172, - "step": 84445 - }, - { - "epoch": 2.16, - "learning_rate": 3.8004591151864575e-07, - "loss": 0.4683, - "step": 84446 - }, - { - "epoch": 2.16, - "learning_rate": 3.800242004639612e-07, - "loss": 0.4238, - "step": 84447 - }, - { - "epoch": 2.16, - "learning_rate": 3.800024898839636e-07, - "loss": 0.4121, - "step": 84448 - }, - { - "epoch": 2.16, - "learning_rate": 3.799807797786695e-07, - "loss": 0.4219, - "step": 84449 - }, - { - "epoch": 2.16, - "learning_rate": 3.79959070148096e-07, - "loss": 0.3511, - "step": 84450 - }, - { - "epoch": 2.16, - "learning_rate": 3.7993736099225903e-07, - "loss": 0.4312, - "step": 84451 - }, - { - "epoch": 2.16, - "learning_rate": 3.799156523111755e-07, - "loss": 0.4839, - "step": 84452 - }, - { - "epoch": 2.16, - "learning_rate": 3.798939441048624e-07, - "loss": 0.3479, - "step": 84453 - }, - { - "epoch": 2.16, - "learning_rate": 3.79872236373336e-07, - "loss": 0.3074, - "step": 84454 - }, - { - "epoch": 2.16, - "learning_rate": 3.798505291166125e-07, - "loss": 0.3755, - "step": 84455 - }, - { - "epoch": 2.16, - "learning_rate": 3.7982882233470893e-07, - "loss": 0.5366, - "step": 84456 - }, - { - "epoch": 2.16, - "learning_rate": 3.7980711602764205e-07, - "loss": 0.3506, - "step": 84457 - }, - { - "epoch": 2.16, - "learning_rate": 3.797854101954285e-07, - "loss": 0.3647, - "step": 84458 - }, - { - "epoch": 2.16, - "learning_rate": 3.797637048380845e-07, - "loss": 0.3625, - "step": 84459 - }, - { - "epoch": 2.16, - "learning_rate": 3.7974199995562695e-07, - "loss": 0.3369, - "step": 84460 - }, - { - "epoch": 2.16, - "learning_rate": 3.797202955480724e-07, - "loss": 0.3911, - "step": 84461 - }, - { - "epoch": 2.16, - "learning_rate": 3.7969859161543785e-07, - "loss": 0.3202, - "step": 84462 - }, - { - "epoch": 2.16, - "learning_rate": 3.7967688815773914e-07, - "loss": 0.4009, - "step": 84463 - }, - { - "epoch": 2.16, - "learning_rate": 3.7965518517499373e-07, - "loss": 0.498, - "step": 84464 - }, - { - "epoch": 2.16, - "learning_rate": 3.796334826672175e-07, - "loss": 0.3225, - "step": 84465 - }, - { - "epoch": 2.16, - "learning_rate": 3.7961178063442735e-07, - "loss": 0.1563, - "step": 84466 - }, - { - "epoch": 2.16, - "learning_rate": 3.795900790766402e-07, - "loss": 0.521, - "step": 84467 - }, - { - "epoch": 2.16, - "learning_rate": 3.795683779938722e-07, - "loss": 0.4233, - "step": 84468 - }, - { - "epoch": 2.16, - "learning_rate": 3.795466773861401e-07, - "loss": 0.4492, - "step": 84469 - }, - { - "epoch": 2.17, - "learning_rate": 3.795249772534609e-07, - "loss": 0.5039, - "step": 84470 - }, - { - "epoch": 2.17, - "learning_rate": 3.795032775958505e-07, - "loss": 0.5156, - "step": 84471 - }, - { - "epoch": 2.17, - "learning_rate": 3.7948157841332605e-07, - "loss": 0.4766, - "step": 84472 - }, - { - "epoch": 2.17, - "learning_rate": 3.79459879705904e-07, - "loss": 0.3071, - "step": 84473 - }, - { - "epoch": 2.17, - "learning_rate": 3.794381814736013e-07, - "loss": 0.4795, - "step": 84474 - }, - { - "epoch": 2.17, - "learning_rate": 3.794164837164342e-07, - "loss": 0.4761, - "step": 84475 - }, - { - "epoch": 2.17, - "learning_rate": 3.79394786434419e-07, - "loss": 0.2471, - "step": 84476 - }, - { - "epoch": 2.17, - "learning_rate": 3.7937308962757277e-07, - "loss": 0.355, - "step": 84477 - }, - { - "epoch": 2.17, - "learning_rate": 3.7935139329591206e-07, - "loss": 0.4022, - "step": 84478 - }, - { - "epoch": 2.17, - "learning_rate": 3.793296974394536e-07, - "loss": 0.4243, - "step": 84479 - }, - { - "epoch": 2.17, - "learning_rate": 3.793080020582137e-07, - "loss": 0.301, - "step": 84480 - }, - { - "epoch": 2.17, - "learning_rate": 3.792863071522091e-07, - "loss": 0.3804, - "step": 84481 - }, - { - "epoch": 2.17, - "learning_rate": 3.7926461272145637e-07, - "loss": 0.3289, - "step": 84482 - }, - { - "epoch": 2.17, - "learning_rate": 3.792429187659726e-07, - "loss": 0.417, - "step": 84483 - }, - { - "epoch": 2.17, - "learning_rate": 3.792212252857738e-07, - "loss": 0.3364, - "step": 84484 - }, - { - "epoch": 2.17, - "learning_rate": 3.7919953228087666e-07, - "loss": 0.3848, - "step": 84485 - }, - { - "epoch": 2.17, - "learning_rate": 3.7917783975129766e-07, - "loss": 0.4243, - "step": 84486 - }, - { - "epoch": 2.17, - "learning_rate": 3.791561476970542e-07, - "loss": 0.5098, - "step": 84487 - }, - { - "epoch": 2.17, - "learning_rate": 3.7913445611816184e-07, - "loss": 0.5591, - "step": 84488 - }, - { - "epoch": 2.17, - "learning_rate": 3.791127650146377e-07, - "loss": 0.4402, - "step": 84489 - }, - { - "epoch": 2.17, - "learning_rate": 3.7909107438649845e-07, - "loss": 0.448, - "step": 84490 - }, - { - "epoch": 2.17, - "learning_rate": 3.790693842337609e-07, - "loss": 0.3923, - "step": 84491 - }, - { - "epoch": 2.17, - "learning_rate": 3.7904769455644103e-07, - "loss": 0.3823, - "step": 84492 - }, - { - "epoch": 2.17, - "learning_rate": 3.7902600535455586e-07, - "loss": 0.4002, - "step": 84493 - }, - { - "epoch": 2.17, - "learning_rate": 3.7900431662812213e-07, - "loss": 0.3857, - "step": 84494 - }, - { - "epoch": 2.17, - "learning_rate": 3.78982628377156e-07, - "loss": 0.4094, - "step": 84495 - }, - { - "epoch": 2.17, - "learning_rate": 3.7896094060167463e-07, - "loss": 0.5796, - "step": 84496 - }, - { - "epoch": 2.17, - "learning_rate": 3.7893925330169394e-07, - "loss": 0.5063, - "step": 84497 - }, - { - "epoch": 2.17, - "learning_rate": 3.7891756647723093e-07, - "loss": 0.606, - "step": 84498 - }, - { - "epoch": 2.17, - "learning_rate": 3.788958801283022e-07, - "loss": 0.3701, - "step": 84499 - }, - { - "epoch": 2.17, - "learning_rate": 3.7887419425492475e-07, - "loss": 0.46, - "step": 84500 - }, - { - "epoch": 2.17, - "learning_rate": 3.788525088571143e-07, - "loss": 0.3066, - "step": 84501 - }, - { - "epoch": 2.17, - "learning_rate": 3.78830823934888e-07, - "loss": 0.4714, - "step": 84502 - }, - { - "epoch": 2.17, - "learning_rate": 3.7880913948826234e-07, - "loss": 0.4026, - "step": 84503 - }, - { - "epoch": 2.17, - "learning_rate": 3.7878745551725464e-07, - "loss": 0.3147, - "step": 84504 - }, - { - "epoch": 2.17, - "learning_rate": 3.787657720218801e-07, - "loss": 0.4409, - "step": 84505 - }, - { - "epoch": 2.17, - "learning_rate": 3.7874408900215604e-07, - "loss": 0.4893, - "step": 84506 - }, - { - "epoch": 2.17, - "learning_rate": 3.7872240645809917e-07, - "loss": 0.4814, - "step": 84507 - }, - { - "epoch": 2.17, - "learning_rate": 3.787007243897262e-07, - "loss": 0.3101, - "step": 84508 - }, - { - "epoch": 2.17, - "learning_rate": 3.786790427970533e-07, - "loss": 0.3357, - "step": 84509 - }, - { - "epoch": 2.17, - "learning_rate": 3.786573616800972e-07, - "loss": 0.4561, - "step": 84510 - }, - { - "epoch": 2.17, - "learning_rate": 3.7863568103887464e-07, - "loss": 0.374, - "step": 84511 - }, - { - "epoch": 2.17, - "learning_rate": 3.7861400087340244e-07, - "loss": 0.3665, - "step": 84512 - }, - { - "epoch": 2.17, - "learning_rate": 3.785923211836967e-07, - "loss": 0.3745, - "step": 84513 - }, - { - "epoch": 2.17, - "learning_rate": 3.785706419697745e-07, - "loss": 0.5669, - "step": 84514 - }, - { - "epoch": 2.17, - "learning_rate": 3.7854896323165187e-07, - "loss": 0.4404, - "step": 84515 - }, - { - "epoch": 2.17, - "learning_rate": 3.785272849693457e-07, - "loss": 0.46, - "step": 84516 - }, - { - "epoch": 2.17, - "learning_rate": 3.7850560718287295e-07, - "loss": 0.3757, - "step": 84517 - }, - { - "epoch": 2.17, - "learning_rate": 3.7848392987224964e-07, - "loss": 0.4243, - "step": 84518 - }, - { - "epoch": 2.17, - "learning_rate": 3.7846225303749247e-07, - "loss": 0.395, - "step": 84519 - }, - { - "epoch": 2.17, - "learning_rate": 3.784405766786183e-07, - "loss": 0.3293, - "step": 84520 - }, - { - "epoch": 2.17, - "learning_rate": 3.784189007956439e-07, - "loss": 0.4316, - "step": 84521 - }, - { - "epoch": 2.17, - "learning_rate": 3.783972253885851e-07, - "loss": 0.3052, - "step": 84522 - }, - { - "epoch": 2.17, - "learning_rate": 3.783755504574591e-07, - "loss": 0.5083, - "step": 84523 - }, - { - "epoch": 2.17, - "learning_rate": 3.783538760022826e-07, - "loss": 0.5322, - "step": 84524 - }, - { - "epoch": 2.17, - "learning_rate": 3.7833220202307203e-07, - "loss": 0.4165, - "step": 84525 - }, - { - "epoch": 2.17, - "learning_rate": 3.7831052851984356e-07, - "loss": 0.3866, - "step": 84526 - }, - { - "epoch": 2.17, - "learning_rate": 3.7828885549261415e-07, - "loss": 0.2363, - "step": 84527 - }, - { - "epoch": 2.17, - "learning_rate": 3.7826718294140037e-07, - "loss": 0.3796, - "step": 84528 - }, - { - "epoch": 2.17, - "learning_rate": 3.7824551086621915e-07, - "loss": 0.4355, - "step": 84529 - }, - { - "epoch": 2.17, - "learning_rate": 3.7822383926708633e-07, - "loss": 0.4736, - "step": 84530 - }, - { - "epoch": 2.17, - "learning_rate": 3.7820216814401907e-07, - "loss": 0.3982, - "step": 84531 - }, - { - "epoch": 2.17, - "learning_rate": 3.781804974970337e-07, - "loss": 0.3511, - "step": 84532 - }, - { - "epoch": 2.17, - "learning_rate": 3.7815882732614736e-07, - "loss": 0.4146, - "step": 84533 - }, - { - "epoch": 2.17, - "learning_rate": 3.781371576313761e-07, - "loss": 0.2974, - "step": 84534 - }, - { - "epoch": 2.17, - "learning_rate": 3.7811548841273644e-07, - "loss": 0.3965, - "step": 84535 - }, - { - "epoch": 2.17, - "learning_rate": 3.78093819670245e-07, - "loss": 0.541, - "step": 84536 - }, - { - "epoch": 2.17, - "learning_rate": 3.780721514039186e-07, - "loss": 0.3308, - "step": 84537 - }, - { - "epoch": 2.17, - "learning_rate": 3.7805048361377413e-07, - "loss": 0.5005, - "step": 84538 - }, - { - "epoch": 2.17, - "learning_rate": 3.780288162998274e-07, - "loss": 0.3833, - "step": 84539 - }, - { - "epoch": 2.17, - "learning_rate": 3.7800714946209545e-07, - "loss": 0.4849, - "step": 84540 - }, - { - "epoch": 2.17, - "learning_rate": 3.779854831005952e-07, - "loss": 0.3791, - "step": 84541 - }, - { - "epoch": 2.17, - "learning_rate": 3.779638172153424e-07, - "loss": 0.4009, - "step": 84542 - }, - { - "epoch": 2.17, - "learning_rate": 3.779421518063546e-07, - "loss": 0.3094, - "step": 84543 - }, - { - "epoch": 2.17, - "learning_rate": 3.779204868736474e-07, - "loss": 0.4482, - "step": 84544 - }, - { - "epoch": 2.17, - "learning_rate": 3.778988224172379e-07, - "loss": 0.3998, - "step": 84545 - }, - { - "epoch": 2.17, - "learning_rate": 3.778771584371432e-07, - "loss": 0.3789, - "step": 84546 - }, - { - "epoch": 2.17, - "learning_rate": 3.778554949333788e-07, - "loss": 0.2621, - "step": 84547 - }, - { - "epoch": 2.17, - "learning_rate": 3.7783383190596195e-07, - "loss": 0.3048, - "step": 84548 - }, - { - "epoch": 2.17, - "learning_rate": 3.7781216935490903e-07, - "loss": 0.3618, - "step": 84549 - }, - { - "epoch": 2.17, - "learning_rate": 3.777905072802371e-07, - "loss": 0.4453, - "step": 84550 - }, - { - "epoch": 2.17, - "learning_rate": 3.777688456819621e-07, - "loss": 0.3627, - "step": 84551 - }, - { - "epoch": 2.17, - "learning_rate": 3.777471845601008e-07, - "loss": 0.4082, - "step": 84552 - }, - { - "epoch": 2.17, - "learning_rate": 3.7772552391467027e-07, - "loss": 0.541, - "step": 84553 - }, - { - "epoch": 2.17, - "learning_rate": 3.777038637456863e-07, - "loss": 0.3506, - "step": 84554 - }, - { - "epoch": 2.17, - "learning_rate": 3.7768220405316633e-07, - "loss": 0.3296, - "step": 84555 - }, - { - "epoch": 2.17, - "learning_rate": 3.7766054483712597e-07, - "loss": 0.3494, - "step": 84556 - }, - { - "epoch": 2.17, - "learning_rate": 3.7763888609758245e-07, - "loss": 0.3412, - "step": 84557 - }, - { - "epoch": 2.17, - "learning_rate": 3.776172278345524e-07, - "loss": 0.3398, - "step": 84558 - }, - { - "epoch": 2.17, - "learning_rate": 3.77595570048052e-07, - "loss": 0.4255, - "step": 84559 - }, - { - "epoch": 2.17, - "learning_rate": 3.77573912738098e-07, - "loss": 0.2875, - "step": 84560 - }, - { - "epoch": 2.17, - "learning_rate": 3.7755225590470707e-07, - "loss": 0.4414, - "step": 84561 - }, - { - "epoch": 2.17, - "learning_rate": 3.7753059954789614e-07, - "loss": 0.3633, - "step": 84562 - }, - { - "epoch": 2.17, - "learning_rate": 3.7750894366768137e-07, - "loss": 0.3293, - "step": 84563 - }, - { - "epoch": 2.17, - "learning_rate": 3.774872882640791e-07, - "loss": 0.261, - "step": 84564 - }, - { - "epoch": 2.17, - "learning_rate": 3.7746563333710603e-07, - "loss": 0.5552, - "step": 84565 - }, - { - "epoch": 2.17, - "learning_rate": 3.77443978886779e-07, - "loss": 0.4829, - "step": 84566 - }, - { - "epoch": 2.17, - "learning_rate": 3.7742232491311487e-07, - "loss": 0.4292, - "step": 84567 - }, - { - "epoch": 2.17, - "learning_rate": 3.774006714161294e-07, - "loss": 0.3037, - "step": 84568 - }, - { - "epoch": 2.17, - "learning_rate": 3.773790183958396e-07, - "loss": 0.3801, - "step": 84569 - }, - { - "epoch": 2.17, - "learning_rate": 3.7735736585226217e-07, - "loss": 0.3481, - "step": 84570 - }, - { - "epoch": 2.17, - "learning_rate": 3.7733571378541387e-07, - "loss": 0.3711, - "step": 84571 - }, - { - "epoch": 2.17, - "learning_rate": 3.773140621953106e-07, - "loss": 0.3865, - "step": 84572 - }, - { - "epoch": 2.17, - "learning_rate": 3.7729241108196973e-07, - "loss": 0.4299, - "step": 84573 - }, - { - "epoch": 2.17, - "learning_rate": 3.772707604454071e-07, - "loss": 0.5508, - "step": 84574 - }, - { - "epoch": 2.17, - "learning_rate": 3.7724911028563986e-07, - "loss": 0.436, - "step": 84575 - }, - { - "epoch": 2.17, - "learning_rate": 3.7722746060268405e-07, - "loss": 0.4028, - "step": 84576 - }, - { - "epoch": 2.17, - "learning_rate": 3.772058113965565e-07, - "loss": 0.3977, - "step": 84577 - }, - { - "epoch": 2.17, - "learning_rate": 3.771841626672739e-07, - "loss": 0.4341, - "step": 84578 - }, - { - "epoch": 2.17, - "learning_rate": 3.77162514414853e-07, - "loss": 0.6299, - "step": 84579 - }, - { - "epoch": 2.17, - "learning_rate": 3.771408666393099e-07, - "loss": 0.5884, - "step": 84580 - }, - { - "epoch": 2.17, - "learning_rate": 3.7711921934066125e-07, - "loss": 0.4056, - "step": 84581 - }, - { - "epoch": 2.17, - "learning_rate": 3.770975725189239e-07, - "loss": 0.4712, - "step": 84582 - }, - { - "epoch": 2.17, - "learning_rate": 3.7707592617411453e-07, - "loss": 0.4609, - "step": 84583 - }, - { - "epoch": 2.17, - "learning_rate": 3.7705428030624965e-07, - "loss": 0.4155, - "step": 84584 - }, - { - "epoch": 2.17, - "learning_rate": 3.770326349153452e-07, - "loss": 0.4116, - "step": 84585 - }, - { - "epoch": 2.17, - "learning_rate": 3.770109900014182e-07, - "loss": 0.3977, - "step": 84586 - }, - { - "epoch": 2.17, - "learning_rate": 3.7698934556448525e-07, - "loss": 0.4039, - "step": 84587 - }, - { - "epoch": 2.17, - "learning_rate": 3.7696770160456325e-07, - "loss": 0.4114, - "step": 84588 - }, - { - "epoch": 2.17, - "learning_rate": 3.769460581216681e-07, - "loss": 0.3553, - "step": 84589 - }, - { - "epoch": 2.17, - "learning_rate": 3.7692441511581676e-07, - "loss": 0.3511, - "step": 84590 - }, - { - "epoch": 2.17, - "learning_rate": 3.7690277258702575e-07, - "loss": 0.2913, - "step": 84591 - }, - { - "epoch": 2.17, - "learning_rate": 3.768811305353119e-07, - "loss": 0.4023, - "step": 84592 - }, - { - "epoch": 2.17, - "learning_rate": 3.7685948896069153e-07, - "loss": 0.4185, - "step": 84593 - }, - { - "epoch": 2.17, - "learning_rate": 3.7683784786318084e-07, - "loss": 0.3792, - "step": 84594 - }, - { - "epoch": 2.17, - "learning_rate": 3.768162072427968e-07, - "loss": 0.3728, - "step": 84595 - }, - { - "epoch": 2.17, - "learning_rate": 3.7679456709955625e-07, - "loss": 0.3987, - "step": 84596 - }, - { - "epoch": 2.17, - "learning_rate": 3.7677292743347513e-07, - "loss": 0.3271, - "step": 84597 - }, - { - "epoch": 2.17, - "learning_rate": 3.767512882445704e-07, - "loss": 0.2659, - "step": 84598 - }, - { - "epoch": 2.17, - "learning_rate": 3.767296495328583e-07, - "loss": 0.325, - "step": 84599 - }, - { - "epoch": 2.17, - "learning_rate": 3.7670801129835627e-07, - "loss": 0.397, - "step": 84600 - }, - { - "epoch": 2.17, - "learning_rate": 3.7668637354107977e-07, - "loss": 0.4624, - "step": 84601 - }, - { - "epoch": 2.17, - "learning_rate": 3.766647362610459e-07, - "loss": 0.5234, - "step": 84602 - }, - { - "epoch": 2.17, - "learning_rate": 3.7664309945827143e-07, - "loss": 0.5015, - "step": 84603 - }, - { - "epoch": 2.17, - "learning_rate": 3.766214631327724e-07, - "loss": 0.4067, - "step": 84604 - }, - { - "epoch": 2.17, - "learning_rate": 3.765998272845661e-07, - "loss": 0.3562, - "step": 84605 - }, - { - "epoch": 2.17, - "learning_rate": 3.7657819191366813e-07, - "loss": 0.4109, - "step": 84606 - }, - { - "epoch": 2.17, - "learning_rate": 3.765565570200957e-07, - "loss": 0.2994, - "step": 84607 - }, - { - "epoch": 2.17, - "learning_rate": 3.765349226038652e-07, - "loss": 0.4009, - "step": 84608 - }, - { - "epoch": 2.17, - "learning_rate": 3.7651328866499354e-07, - "loss": 0.3679, - "step": 84609 - }, - { - "epoch": 2.17, - "learning_rate": 3.764916552034967e-07, - "loss": 0.4312, - "step": 84610 - }, - { - "epoch": 2.17, - "learning_rate": 3.764700222193915e-07, - "loss": 0.3489, - "step": 84611 - }, - { - "epoch": 2.17, - "learning_rate": 3.7644838971269457e-07, - "loss": 0.3726, - "step": 84612 - }, - { - "epoch": 2.17, - "learning_rate": 3.764267576834231e-07, - "loss": 0.4048, - "step": 84613 - }, - { - "epoch": 2.17, - "learning_rate": 3.7640512613159225e-07, - "loss": 0.4375, - "step": 84614 - }, - { - "epoch": 2.17, - "learning_rate": 3.7638349505721947e-07, - "loss": 0.5381, - "step": 84615 - }, - { - "epoch": 2.17, - "learning_rate": 3.76361864460321e-07, - "loss": 0.4058, - "step": 84616 - }, - { - "epoch": 2.17, - "learning_rate": 3.76340234340914e-07, - "loss": 0.3276, - "step": 84617 - }, - { - "epoch": 2.17, - "learning_rate": 3.763186046990142e-07, - "loss": 0.3284, - "step": 84618 - }, - { - "epoch": 2.17, - "learning_rate": 3.7629697553463866e-07, - "loss": 0.355, - "step": 84619 - }, - { - "epoch": 2.17, - "learning_rate": 3.7627534684780384e-07, - "loss": 0.4067, - "step": 84620 - }, - { - "epoch": 2.17, - "learning_rate": 3.762537186385266e-07, - "loss": 0.3448, - "step": 84621 - }, - { - "epoch": 2.17, - "learning_rate": 3.76232090906823e-07, - "loss": 0.4688, - "step": 84622 - }, - { - "epoch": 2.17, - "learning_rate": 3.762104636527099e-07, - "loss": 0.4268, - "step": 84623 - }, - { - "epoch": 2.17, - "learning_rate": 3.7618883687620365e-07, - "loss": 0.3193, - "step": 84624 - }, - { - "epoch": 2.17, - "learning_rate": 3.761672105773208e-07, - "loss": 0.5254, - "step": 84625 - }, - { - "epoch": 2.17, - "learning_rate": 3.761455847560784e-07, - "loss": 0.5107, - "step": 84626 - }, - { - "epoch": 2.17, - "learning_rate": 3.761239594124923e-07, - "loss": 0.2996, - "step": 84627 - }, - { - "epoch": 2.17, - "learning_rate": 3.761023345465794e-07, - "loss": 0.3818, - "step": 84628 - }, - { - "epoch": 2.17, - "learning_rate": 3.760807101583563e-07, - "loss": 0.3403, - "step": 84629 - }, - { - "epoch": 2.17, - "learning_rate": 3.760590862478398e-07, - "loss": 0.3234, - "step": 84630 - }, - { - "epoch": 2.17, - "learning_rate": 3.760374628150458e-07, - "loss": 0.4614, - "step": 84631 - }, - { - "epoch": 2.17, - "learning_rate": 3.760158398599913e-07, - "loss": 0.4917, - "step": 84632 - }, - { - "epoch": 2.17, - "learning_rate": 3.75994217382693e-07, - "loss": 0.2502, - "step": 84633 - }, - { - "epoch": 2.17, - "learning_rate": 3.759725953831674e-07, - "loss": 0.4272, - "step": 84634 - }, - { - "epoch": 2.17, - "learning_rate": 3.759509738614304e-07, - "loss": 0.2732, - "step": 84635 - }, - { - "epoch": 2.17, - "learning_rate": 3.7592935281749917e-07, - "loss": 0.4751, - "step": 84636 - }, - { - "epoch": 2.17, - "learning_rate": 3.759077322513901e-07, - "loss": 0.2689, - "step": 84637 - }, - { - "epoch": 2.17, - "learning_rate": 3.7588611216312006e-07, - "loss": 0.4087, - "step": 84638 - }, - { - "epoch": 2.17, - "learning_rate": 3.75864492552705e-07, - "loss": 0.4272, - "step": 84639 - }, - { - "epoch": 2.17, - "learning_rate": 3.7584287342016185e-07, - "loss": 0.3263, - "step": 84640 - }, - { - "epoch": 2.17, - "learning_rate": 3.7582125476550707e-07, - "loss": 0.478, - "step": 84641 - }, - { - "epoch": 2.17, - "learning_rate": 3.757996365887576e-07, - "loss": 0.564, - "step": 84642 - }, - { - "epoch": 2.17, - "learning_rate": 3.7577801888992966e-07, - "loss": 0.3547, - "step": 84643 - }, - { - "epoch": 2.17, - "learning_rate": 3.7575640166903945e-07, - "loss": 0.5049, - "step": 84644 - }, - { - "epoch": 2.17, - "learning_rate": 3.757347849261039e-07, - "loss": 0.3542, - "step": 84645 - }, - { - "epoch": 2.17, - "learning_rate": 3.7571316866113947e-07, - "loss": 0.3582, - "step": 84646 - }, - { - "epoch": 2.17, - "learning_rate": 3.756915528741631e-07, - "loss": 0.2747, - "step": 84647 - }, - { - "epoch": 2.17, - "learning_rate": 3.7566993756519074e-07, - "loss": 0.4648, - "step": 84648 - }, - { - "epoch": 2.17, - "learning_rate": 3.756483227342391e-07, - "loss": 0.3264, - "step": 84649 - }, - { - "epoch": 2.17, - "learning_rate": 3.7562670838132513e-07, - "loss": 0.4233, - "step": 84650 - }, - { - "epoch": 2.17, - "learning_rate": 3.756050945064648e-07, - "loss": 0.2933, - "step": 84651 - }, - { - "epoch": 2.17, - "learning_rate": 3.755834811096751e-07, - "loss": 0.259, - "step": 84652 - }, - { - "epoch": 2.17, - "learning_rate": 3.755618681909726e-07, - "loss": 0.4214, - "step": 84653 - }, - { - "epoch": 2.17, - "learning_rate": 3.755402557503733e-07, - "loss": 0.4346, - "step": 84654 - }, - { - "epoch": 2.17, - "learning_rate": 3.7551864378789445e-07, - "loss": 0.5557, - "step": 84655 - }, - { - "epoch": 2.17, - "learning_rate": 3.75497032303552e-07, - "loss": 0.3275, - "step": 84656 - }, - { - "epoch": 2.17, - "learning_rate": 3.7547542129736265e-07, - "loss": 0.3848, - "step": 84657 - }, - { - "epoch": 2.17, - "learning_rate": 3.7545381076934313e-07, - "loss": 0.4062, - "step": 84658 - }, - { - "epoch": 2.17, - "learning_rate": 3.754322007195103e-07, - "loss": 0.4712, - "step": 84659 - }, - { - "epoch": 2.17, - "learning_rate": 3.7541059114787985e-07, - "loss": 0.3774, - "step": 84660 - }, - { - "epoch": 2.17, - "learning_rate": 3.753889820544689e-07, - "loss": 0.2917, - "step": 84661 - }, - { - "epoch": 2.17, - "learning_rate": 3.753673734392938e-07, - "loss": 0.4016, - "step": 84662 - }, - { - "epoch": 2.17, - "learning_rate": 3.753457653023716e-07, - "loss": 0.3945, - "step": 84663 - }, - { - "epoch": 2.17, - "learning_rate": 3.753241576437184e-07, - "loss": 0.3799, - "step": 84664 - }, - { - "epoch": 2.17, - "learning_rate": 3.7530255046335044e-07, - "loss": 0.4167, - "step": 84665 - }, - { - "epoch": 2.17, - "learning_rate": 3.752809437612845e-07, - "loss": 0.3349, - "step": 84666 - }, - { - "epoch": 2.17, - "learning_rate": 3.752593375375377e-07, - "loss": 0.4351, - "step": 84667 - }, - { - "epoch": 2.17, - "learning_rate": 3.752377317921257e-07, - "loss": 0.3789, - "step": 84668 - }, - { - "epoch": 2.17, - "learning_rate": 3.752161265250654e-07, - "loss": 0.3486, - "step": 84669 - }, - { - "epoch": 2.17, - "learning_rate": 3.7519452173637334e-07, - "loss": 0.479, - "step": 84670 - }, - { - "epoch": 2.17, - "learning_rate": 3.751729174260666e-07, - "loss": 0.2671, - "step": 84671 - }, - { - "epoch": 2.17, - "learning_rate": 3.7515131359416076e-07, - "loss": 0.3613, - "step": 84672 - }, - { - "epoch": 2.17, - "learning_rate": 3.751297102406732e-07, - "loss": 0.5107, - "step": 84673 - }, - { - "epoch": 2.17, - "learning_rate": 3.751081073656198e-07, - "loss": 0.5649, - "step": 84674 - }, - { - "epoch": 2.17, - "learning_rate": 3.7508650496901726e-07, - "loss": 0.3904, - "step": 84675 - }, - { - "epoch": 2.17, - "learning_rate": 3.750649030508828e-07, - "loss": 0.36, - "step": 84676 - }, - { - "epoch": 2.17, - "learning_rate": 3.7504330161123185e-07, - "loss": 0.3782, - "step": 84677 - }, - { - "epoch": 2.17, - "learning_rate": 3.7502170065008165e-07, - "loss": 0.2546, - "step": 84678 - }, - { - "epoch": 2.17, - "learning_rate": 3.750001001674485e-07, - "loss": 0.3726, - "step": 84679 - }, - { - "epoch": 2.17, - "learning_rate": 3.749785001633494e-07, - "loss": 0.4072, - "step": 84680 - }, - { - "epoch": 2.17, - "learning_rate": 3.749569006378003e-07, - "loss": 0.5273, - "step": 84681 - }, - { - "epoch": 2.17, - "learning_rate": 3.7493530159081786e-07, - "loss": 0.458, - "step": 84682 - }, - { - "epoch": 2.17, - "learning_rate": 3.749137030224191e-07, - "loss": 0.4536, - "step": 84683 - }, - { - "epoch": 2.17, - "learning_rate": 3.748921049326201e-07, - "loss": 0.353, - "step": 84684 - }, - { - "epoch": 2.17, - "learning_rate": 3.748705073214372e-07, - "loss": 0.3923, - "step": 84685 - }, - { - "epoch": 2.17, - "learning_rate": 3.748489101888872e-07, - "loss": 0.4146, - "step": 84686 - }, - { - "epoch": 2.17, - "learning_rate": 3.748273135349865e-07, - "loss": 0.4106, - "step": 84687 - }, - { - "epoch": 2.17, - "learning_rate": 3.748057173597523e-07, - "loss": 0.3882, - "step": 84688 - }, - { - "epoch": 2.17, - "learning_rate": 3.7478412166320027e-07, - "loss": 0.4336, - "step": 84689 - }, - { - "epoch": 2.17, - "learning_rate": 3.747625264453472e-07, - "loss": 0.3655, - "step": 84690 - }, - { - "epoch": 2.17, - "learning_rate": 3.7474093170620977e-07, - "loss": 0.3457, - "step": 84691 - }, - { - "epoch": 2.17, - "learning_rate": 3.7471933744580476e-07, - "loss": 0.5137, - "step": 84692 - }, - { - "epoch": 2.17, - "learning_rate": 3.7469774366414853e-07, - "loss": 0.4209, - "step": 84693 - }, - { - "epoch": 2.17, - "learning_rate": 3.74676150361257e-07, - "loss": 0.4033, - "step": 84694 - }, - { - "epoch": 2.17, - "learning_rate": 3.7465455753714726e-07, - "loss": 0.4878, - "step": 84695 - }, - { - "epoch": 2.17, - "learning_rate": 3.7463296519183573e-07, - "loss": 0.3315, - "step": 84696 - }, - { - "epoch": 2.17, - "learning_rate": 3.746113733253393e-07, - "loss": 0.4995, - "step": 84697 - }, - { - "epoch": 2.17, - "learning_rate": 3.7458978193767386e-07, - "loss": 0.3379, - "step": 84698 - }, - { - "epoch": 2.17, - "learning_rate": 3.745681910288563e-07, - "loss": 0.479, - "step": 84699 - }, - { - "epoch": 2.17, - "learning_rate": 3.745466005989031e-07, - "loss": 0.323, - "step": 84700 - }, - { - "epoch": 2.17, - "learning_rate": 3.7452501064783114e-07, - "loss": 0.437, - "step": 84701 - }, - { - "epoch": 2.17, - "learning_rate": 3.7450342117565636e-07, - "loss": 0.4194, - "step": 84702 - }, - { - "epoch": 2.17, - "learning_rate": 3.744818321823958e-07, - "loss": 0.3352, - "step": 84703 - }, - { - "epoch": 2.17, - "learning_rate": 3.744602436680654e-07, - "loss": 0.2561, - "step": 84704 - }, - { - "epoch": 2.17, - "learning_rate": 3.744386556326824e-07, - "loss": 0.4741, - "step": 84705 - }, - { - "epoch": 2.17, - "learning_rate": 3.744170680762626e-07, - "loss": 0.416, - "step": 84706 - }, - { - "epoch": 2.17, - "learning_rate": 3.743954809988229e-07, - "loss": 0.4546, - "step": 84707 - }, - { - "epoch": 2.17, - "learning_rate": 3.743738944003798e-07, - "loss": 0.4565, - "step": 84708 - }, - { - "epoch": 2.17, - "learning_rate": 3.743523082809502e-07, - "loss": 0.3687, - "step": 84709 - }, - { - "epoch": 2.17, - "learning_rate": 3.743307226405499e-07, - "loss": 0.5786, - "step": 84710 - }, - { - "epoch": 2.17, - "learning_rate": 3.743091374791958e-07, - "loss": 0.4507, - "step": 84711 - }, - { - "epoch": 2.17, - "learning_rate": 3.742875527969045e-07, - "loss": 0.3911, - "step": 84712 - }, - { - "epoch": 2.17, - "learning_rate": 3.7426596859369277e-07, - "loss": 0.5259, - "step": 84713 - }, - { - "epoch": 2.17, - "learning_rate": 3.7424438486957664e-07, - "loss": 0.4092, - "step": 84714 - }, - { - "epoch": 2.17, - "learning_rate": 3.7422280162457263e-07, - "loss": 0.4072, - "step": 84715 - }, - { - "epoch": 2.17, - "learning_rate": 3.7420121885869746e-07, - "loss": 0.3657, - "step": 84716 - }, - { - "epoch": 2.17, - "learning_rate": 3.741796365719676e-07, - "loss": 0.4309, - "step": 84717 - }, - { - "epoch": 2.17, - "learning_rate": 3.741580547644e-07, - "loss": 0.3153, - "step": 84718 - }, - { - "epoch": 2.17, - "learning_rate": 3.741364734360104e-07, - "loss": 0.4834, - "step": 84719 - }, - { - "epoch": 2.17, - "learning_rate": 3.741148925868157e-07, - "loss": 0.5493, - "step": 84720 - }, - { - "epoch": 2.17, - "learning_rate": 3.7409331221683284e-07, - "loss": 0.3979, - "step": 84721 - }, - { - "epoch": 2.17, - "learning_rate": 3.7407173232607756e-07, - "loss": 0.459, - "step": 84722 - }, - { - "epoch": 2.17, - "learning_rate": 3.740501529145672e-07, - "loss": 0.439, - "step": 84723 - }, - { - "epoch": 2.17, - "learning_rate": 3.740285739823175e-07, - "loss": 0.4326, - "step": 84724 - }, - { - "epoch": 2.17, - "learning_rate": 3.7400699552934536e-07, - "loss": 0.3799, - "step": 84725 - }, - { - "epoch": 2.17, - "learning_rate": 3.739854175556676e-07, - "loss": 0.4227, - "step": 84726 - }, - { - "epoch": 2.17, - "learning_rate": 3.739638400613e-07, - "loss": 0.4502, - "step": 84727 - }, - { - "epoch": 2.17, - "learning_rate": 3.739422630462595e-07, - "loss": 0.3982, - "step": 84728 - }, - { - "epoch": 2.17, - "learning_rate": 3.7392068651056277e-07, - "loss": 0.4067, - "step": 84729 - }, - { - "epoch": 2.17, - "learning_rate": 3.738991104542264e-07, - "loss": 0.3618, - "step": 84730 - }, - { - "epoch": 2.17, - "learning_rate": 3.7387753487726637e-07, - "loss": 0.4321, - "step": 84731 - }, - { - "epoch": 2.17, - "learning_rate": 3.7385595977969954e-07, - "loss": 0.4082, - "step": 84732 - }, - { - "epoch": 2.17, - "learning_rate": 3.7383438516154277e-07, - "loss": 0.3065, - "step": 84733 - }, - { - "epoch": 2.17, - "learning_rate": 3.7381281102281183e-07, - "loss": 0.2838, - "step": 84734 - }, - { - "epoch": 2.17, - "learning_rate": 3.7379123736352404e-07, - "loss": 0.2582, - "step": 84735 - }, - { - "epoch": 2.17, - "learning_rate": 3.73769664183695e-07, - "loss": 0.2854, - "step": 84736 - }, - { - "epoch": 2.17, - "learning_rate": 3.7374809148334186e-07, - "loss": 0.2902, - "step": 84737 - }, - { - "epoch": 2.17, - "learning_rate": 3.7372651926248135e-07, - "loss": 0.4097, - "step": 84738 - }, - { - "epoch": 2.17, - "learning_rate": 3.7370494752112936e-07, - "loss": 0.4473, - "step": 84739 - }, - { - "epoch": 2.17, - "learning_rate": 3.736833762593026e-07, - "loss": 0.3267, - "step": 84740 - }, - { - "epoch": 2.17, - "learning_rate": 3.7366180547701773e-07, - "loss": 0.4414, - "step": 84741 - }, - { - "epoch": 2.17, - "learning_rate": 3.7364023517429154e-07, - "loss": 0.2566, - "step": 84742 - }, - { - "epoch": 2.17, - "learning_rate": 3.7361866535114016e-07, - "loss": 0.3716, - "step": 84743 - }, - { - "epoch": 2.17, - "learning_rate": 3.7359709600757995e-07, - "loss": 0.5322, - "step": 84744 - }, - { - "epoch": 2.17, - "learning_rate": 3.735755271436275e-07, - "loss": 0.5723, - "step": 84745 - }, - { - "epoch": 2.17, - "learning_rate": 3.735539587592996e-07, - "loss": 0.4658, - "step": 84746 - }, - { - "epoch": 2.17, - "learning_rate": 3.7353239085461286e-07, - "loss": 0.3896, - "step": 84747 - }, - { - "epoch": 2.17, - "learning_rate": 3.735108234295833e-07, - "loss": 0.3877, - "step": 84748 - }, - { - "epoch": 2.17, - "learning_rate": 3.734892564842277e-07, - "loss": 0.4604, - "step": 84749 - }, - { - "epoch": 2.17, - "learning_rate": 3.7346769001856247e-07, - "loss": 0.4194, - "step": 84750 - }, - { - "epoch": 2.17, - "learning_rate": 3.7344612403260465e-07, - "loss": 0.2966, - "step": 84751 - }, - { - "epoch": 2.17, - "learning_rate": 3.7342455852637e-07, - "loss": 0.377, - "step": 84752 - }, - { - "epoch": 2.17, - "learning_rate": 3.734029934998757e-07, - "loss": 0.4219, - "step": 84753 - }, - { - "epoch": 2.17, - "learning_rate": 3.733814289531375e-07, - "loss": 0.4924, - "step": 84754 - }, - { - "epoch": 2.17, - "learning_rate": 3.733598648861723e-07, - "loss": 0.4258, - "step": 84755 - }, - { - "epoch": 2.17, - "learning_rate": 3.7333830129899714e-07, - "loss": 0.3794, - "step": 84756 - }, - { - "epoch": 2.17, - "learning_rate": 3.733167381916276e-07, - "loss": 0.3882, - "step": 84757 - }, - { - "epoch": 2.17, - "learning_rate": 3.7329517556408054e-07, - "loss": 0.3195, - "step": 84758 - }, - { - "epoch": 2.17, - "learning_rate": 3.73273613416373e-07, - "loss": 0.4434, - "step": 84759 - }, - { - "epoch": 2.17, - "learning_rate": 3.732520517485206e-07, - "loss": 0.4277, - "step": 84760 - }, - { - "epoch": 2.17, - "learning_rate": 3.7323049056054035e-07, - "loss": 0.3767, - "step": 84761 - }, - { - "epoch": 2.17, - "learning_rate": 3.732089298524487e-07, - "loss": 0.5054, - "step": 84762 - }, - { - "epoch": 2.17, - "learning_rate": 3.7318736962426244e-07, - "loss": 0.4541, - "step": 84763 - }, - { - "epoch": 2.17, - "learning_rate": 3.7316580987599776e-07, - "loss": 0.2854, - "step": 84764 - }, - { - "epoch": 2.17, - "learning_rate": 3.7314425060767094e-07, - "loss": 0.5415, - "step": 84765 - }, - { - "epoch": 2.17, - "learning_rate": 3.7312269181929867e-07, - "loss": 0.3949, - "step": 84766 - }, - { - "epoch": 2.17, - "learning_rate": 3.7310113351089767e-07, - "loss": 0.3833, - "step": 84767 - }, - { - "epoch": 2.17, - "learning_rate": 3.730795756824845e-07, - "loss": 0.5723, - "step": 84768 - }, - { - "epoch": 2.17, - "learning_rate": 3.7305801833407524e-07, - "loss": 0.3901, - "step": 84769 - }, - { - "epoch": 2.17, - "learning_rate": 3.730364614656866e-07, - "loss": 0.4214, - "step": 84770 - }, - { - "epoch": 2.17, - "learning_rate": 3.7301490507733504e-07, - "loss": 0.3138, - "step": 84771 - }, - { - "epoch": 2.17, - "learning_rate": 3.729933491690375e-07, - "loss": 0.3546, - "step": 84772 - }, - { - "epoch": 2.17, - "learning_rate": 3.729717937408101e-07, - "loss": 0.3655, - "step": 84773 - }, - { - "epoch": 2.17, - "learning_rate": 3.729502387926692e-07, - "loss": 0.4648, - "step": 84774 - }, - { - "epoch": 2.17, - "learning_rate": 3.7292868432463134e-07, - "loss": 0.4897, - "step": 84775 - }, - { - "epoch": 2.17, - "learning_rate": 3.7290713033671337e-07, - "loss": 0.421, - "step": 84776 - }, - { - "epoch": 2.17, - "learning_rate": 3.728855768289314e-07, - "loss": 0.4048, - "step": 84777 - }, - { - "epoch": 2.17, - "learning_rate": 3.728640238013021e-07, - "loss": 0.3921, - "step": 84778 - }, - { - "epoch": 2.17, - "learning_rate": 3.728424712538419e-07, - "loss": 0.3896, - "step": 84779 - }, - { - "epoch": 2.17, - "learning_rate": 3.7282091918656777e-07, - "loss": 0.3877, - "step": 84780 - }, - { - "epoch": 2.17, - "learning_rate": 3.727993675994955e-07, - "loss": 0.2597, - "step": 84781 - }, - { - "epoch": 2.17, - "learning_rate": 3.7277781649264193e-07, - "loss": 0.3379, - "step": 84782 - }, - { - "epoch": 2.17, - "learning_rate": 3.727562658660238e-07, - "loss": 0.2605, - "step": 84783 - }, - { - "epoch": 2.17, - "learning_rate": 3.7273471571965707e-07, - "loss": 0.5, - "step": 84784 - }, - { - "epoch": 2.17, - "learning_rate": 3.7271316605355896e-07, - "loss": 0.4424, - "step": 84785 - }, - { - "epoch": 2.17, - "learning_rate": 3.726916168677451e-07, - "loss": 0.5049, - "step": 84786 - }, - { - "epoch": 2.17, - "learning_rate": 3.7267006816223243e-07, - "loss": 0.4224, - "step": 84787 - }, - { - "epoch": 2.17, - "learning_rate": 3.7264851993703736e-07, - "loss": 0.4663, - "step": 84788 - }, - { - "epoch": 2.17, - "learning_rate": 3.72626972192177e-07, - "loss": 0.4644, - "step": 84789 - }, - { - "epoch": 2.17, - "learning_rate": 3.726054249276668e-07, - "loss": 0.4321, - "step": 84790 - }, - { - "epoch": 2.17, - "learning_rate": 3.7258387814352386e-07, - "loss": 0.4438, - "step": 84791 - }, - { - "epoch": 2.17, - "learning_rate": 3.725623318397646e-07, - "loss": 0.4172, - "step": 84792 - }, - { - "epoch": 2.17, - "learning_rate": 3.7254078601640615e-07, - "loss": 0.4238, - "step": 84793 - }, - { - "epoch": 2.17, - "learning_rate": 3.725192406734637e-07, - "loss": 0.3722, - "step": 84794 - }, - { - "epoch": 2.17, - "learning_rate": 3.7249769581095446e-07, - "loss": 0.3252, - "step": 84795 - }, - { - "epoch": 2.17, - "learning_rate": 3.724761514288949e-07, - "loss": 0.4893, - "step": 84796 - }, - { - "epoch": 2.17, - "learning_rate": 3.7245460752730174e-07, - "loss": 0.4209, - "step": 84797 - }, - { - "epoch": 2.17, - "learning_rate": 3.7243306410619104e-07, - "loss": 0.5132, - "step": 84798 - }, - { - "epoch": 2.17, - "learning_rate": 3.7241152116557927e-07, - "loss": 0.3945, - "step": 84799 - }, - { - "epoch": 2.17, - "learning_rate": 3.723899787054833e-07, - "loss": 0.4844, - "step": 84800 - }, - { - "epoch": 2.17, - "learning_rate": 3.7236843672591977e-07, - "loss": 0.3821, - "step": 84801 - }, - { - "epoch": 2.17, - "learning_rate": 3.7234689522690454e-07, - "loss": 0.4197, - "step": 84802 - }, - { - "epoch": 2.17, - "learning_rate": 3.723253542084548e-07, - "loss": 0.3938, - "step": 84803 - }, - { - "epoch": 2.17, - "learning_rate": 3.723038136705863e-07, - "loss": 0.3706, - "step": 84804 - }, - { - "epoch": 2.17, - "learning_rate": 3.722822736133159e-07, - "loss": 0.4282, - "step": 84805 - }, - { - "epoch": 2.17, - "learning_rate": 3.7226073403666037e-07, - "loss": 0.3386, - "step": 84806 - }, - { - "epoch": 2.17, - "learning_rate": 3.722391949406356e-07, - "loss": 0.3064, - "step": 84807 - }, - { - "epoch": 2.17, - "learning_rate": 3.722176563252585e-07, - "loss": 0.3682, - "step": 84808 - }, - { - "epoch": 2.17, - "learning_rate": 3.721961181905455e-07, - "loss": 0.4443, - "step": 84809 - }, - { - "epoch": 2.17, - "learning_rate": 3.721745805365133e-07, - "loss": 0.3572, - "step": 84810 - }, - { - "epoch": 2.17, - "learning_rate": 3.7215304336317785e-07, - "loss": 0.2302, - "step": 84811 - }, - { - "epoch": 2.17, - "learning_rate": 3.7213150667055606e-07, - "loss": 0.3623, - "step": 84812 - }, - { - "epoch": 2.17, - "learning_rate": 3.7210997045866454e-07, - "loss": 0.4243, - "step": 84813 - }, - { - "epoch": 2.17, - "learning_rate": 3.720884347275195e-07, - "loss": 0.4727, - "step": 84814 - }, - { - "epoch": 2.17, - "learning_rate": 3.720668994771372e-07, - "loss": 0.3975, - "step": 84815 - }, - { - "epoch": 2.17, - "learning_rate": 3.720453647075343e-07, - "loss": 0.479, - "step": 84816 - }, - { - "epoch": 2.17, - "learning_rate": 3.7202383041872755e-07, - "loss": 0.311, - "step": 84817 - }, - { - "epoch": 2.17, - "learning_rate": 3.720022966107336e-07, - "loss": 0.3118, - "step": 84818 - }, - { - "epoch": 2.17, - "learning_rate": 3.719807632835682e-07, - "loss": 0.3784, - "step": 84819 - }, - { - "epoch": 2.17, - "learning_rate": 3.719592304372483e-07, - "loss": 0.3906, - "step": 84820 - }, - { - "epoch": 2.17, - "learning_rate": 3.719376980717903e-07, - "loss": 0.4502, - "step": 84821 - }, - { - "epoch": 2.17, - "learning_rate": 3.71916166187211e-07, - "loss": 0.4127, - "step": 84822 - }, - { - "epoch": 2.17, - "learning_rate": 3.7189463478352676e-07, - "loss": 0.3881, - "step": 84823 - }, - { - "epoch": 2.17, - "learning_rate": 3.7187310386075354e-07, - "loss": 0.4021, - "step": 84824 - }, - { - "epoch": 2.17, - "learning_rate": 3.7185157341890816e-07, - "loss": 0.3862, - "step": 84825 - }, - { - "epoch": 2.17, - "learning_rate": 3.718300434580072e-07, - "loss": 0.5664, - "step": 84826 - }, - { - "epoch": 2.17, - "learning_rate": 3.7180851397806735e-07, - "loss": 0.4604, - "step": 84827 - }, - { - "epoch": 2.17, - "learning_rate": 3.7178698497910454e-07, - "loss": 0.3279, - "step": 84828 - }, - { - "epoch": 2.17, - "learning_rate": 3.7176545646113546e-07, - "loss": 0.374, - "step": 84829 - }, - { - "epoch": 2.17, - "learning_rate": 3.7174392842417713e-07, - "loss": 0.3374, - "step": 84830 - }, - { - "epoch": 2.17, - "learning_rate": 3.7172240086824527e-07, - "loss": 0.416, - "step": 84831 - }, - { - "epoch": 2.17, - "learning_rate": 3.717008737933569e-07, - "loss": 0.5447, - "step": 84832 - }, - { - "epoch": 2.17, - "learning_rate": 3.716793471995281e-07, - "loss": 0.396, - "step": 84833 - }, - { - "epoch": 2.17, - "learning_rate": 3.7165782108677537e-07, - "loss": 0.3301, - "step": 84834 - }, - { - "epoch": 2.17, - "learning_rate": 3.7163629545511574e-07, - "loss": 0.3264, - "step": 84835 - }, - { - "epoch": 2.17, - "learning_rate": 3.71614770304565e-07, - "loss": 0.4302, - "step": 84836 - }, - { - "epoch": 2.17, - "learning_rate": 3.7159324563513995e-07, - "loss": 0.2568, - "step": 84837 - }, - { - "epoch": 2.17, - "learning_rate": 3.7157172144685714e-07, - "loss": 0.458, - "step": 84838 - }, - { - "epoch": 2.17, - "learning_rate": 3.715501977397332e-07, - "loss": 0.4526, - "step": 84839 - }, - { - "epoch": 2.17, - "learning_rate": 3.71528674513784e-07, - "loss": 0.4326, - "step": 84840 - }, - { - "epoch": 2.17, - "learning_rate": 3.7150715176902646e-07, - "loss": 0.4121, - "step": 84841 - }, - { - "epoch": 2.17, - "learning_rate": 3.7148562950547726e-07, - "loss": 0.3381, - "step": 84842 - }, - { - "epoch": 2.17, - "learning_rate": 3.714641077231524e-07, - "loss": 0.3418, - "step": 84843 - }, - { - "epoch": 2.17, - "learning_rate": 3.7144258642206885e-07, - "loss": 0.4111, - "step": 84844 - }, - { - "epoch": 2.17, - "learning_rate": 3.714210656022424e-07, - "loss": 0.3413, - "step": 84845 - }, - { - "epoch": 2.17, - "learning_rate": 3.7139954526369e-07, - "loss": 0.5479, - "step": 84846 - }, - { - "epoch": 2.17, - "learning_rate": 3.713780254064284e-07, - "loss": 0.3625, - "step": 84847 - }, - { - "epoch": 2.17, - "learning_rate": 3.7135650603047343e-07, - "loss": 0.4761, - "step": 84848 - }, - { - "epoch": 2.17, - "learning_rate": 3.7133498713584176e-07, - "loss": 0.4614, - "step": 84849 - }, - { - "epoch": 2.17, - "learning_rate": 3.713134687225501e-07, - "loss": 0.417, - "step": 84850 - }, - { - "epoch": 2.17, - "learning_rate": 3.7129195079061517e-07, - "loss": 0.4624, - "step": 84851 - }, - { - "epoch": 2.17, - "learning_rate": 3.71270433340053e-07, - "loss": 0.415, - "step": 84852 - }, - { - "epoch": 2.17, - "learning_rate": 3.7124891637087987e-07, - "loss": 0.4106, - "step": 84853 - }, - { - "epoch": 2.17, - "learning_rate": 3.712273998831125e-07, - "loss": 0.3723, - "step": 84854 - }, - { - "epoch": 2.17, - "learning_rate": 3.7120588387676745e-07, - "loss": 0.4312, - "step": 84855 - }, - { - "epoch": 2.17, - "learning_rate": 3.711843683518614e-07, - "loss": 0.5679, - "step": 84856 - }, - { - "epoch": 2.17, - "learning_rate": 3.711628533084102e-07, - "loss": 0.3704, - "step": 84857 - }, - { - "epoch": 2.17, - "learning_rate": 3.7114133874643085e-07, - "loss": 0.3945, - "step": 84858 - }, - { - "epoch": 2.17, - "learning_rate": 3.711198246659395e-07, - "loss": 0.3896, - "step": 84859 - }, - { - "epoch": 2.18, - "learning_rate": 3.7109831106695324e-07, - "loss": 0.3921, - "step": 84860 - }, - { - "epoch": 2.18, - "learning_rate": 3.7107679794948766e-07, - "loss": 0.3752, - "step": 84861 - }, - { - "epoch": 2.18, - "learning_rate": 3.710552853135601e-07, - "loss": 0.3501, - "step": 84862 - }, - { - "epoch": 2.18, - "learning_rate": 3.7103377315918617e-07, - "loss": 0.4297, - "step": 84863 - }, - { - "epoch": 2.18, - "learning_rate": 3.710122614863831e-07, - "loss": 0.31, - "step": 84864 - }, - { - "epoch": 2.18, - "learning_rate": 3.7099075029516667e-07, - "loss": 0.3501, - "step": 84865 - }, - { - "epoch": 2.18, - "learning_rate": 3.709692395855537e-07, - "loss": 0.4053, - "step": 84866 - }, - { - "epoch": 2.18, - "learning_rate": 3.709477293575607e-07, - "loss": 0.3428, - "step": 84867 - }, - { - "epoch": 2.18, - "learning_rate": 3.709262196112044e-07, - "loss": 0.3894, - "step": 84868 - }, - { - "epoch": 2.18, - "learning_rate": 3.709047103465006e-07, - "loss": 0.377, - "step": 84869 - }, - { - "epoch": 2.18, - "learning_rate": 3.708832015634662e-07, - "loss": 0.3558, - "step": 84870 - }, - { - "epoch": 2.18, - "learning_rate": 3.708616932621176e-07, - "loss": 0.3123, - "step": 84871 - }, - { - "epoch": 2.18, - "learning_rate": 3.7084018544247163e-07, - "loss": 0.3513, - "step": 84872 - }, - { - "epoch": 2.18, - "learning_rate": 3.7081867810454436e-07, - "loss": 0.365, - "step": 84873 - }, - { - "epoch": 2.18, - "learning_rate": 3.70797171248352e-07, - "loss": 0.3391, - "step": 84874 - }, - { - "epoch": 2.18, - "learning_rate": 3.707756648739113e-07, - "loss": 0.4174, - "step": 84875 - }, - { - "epoch": 2.18, - "learning_rate": 3.7075415898123876e-07, - "loss": 0.3152, - "step": 84876 - }, - { - "epoch": 2.18, - "learning_rate": 3.707326535703511e-07, - "loss": 0.4482, - "step": 84877 - }, - { - "epoch": 2.18, - "learning_rate": 3.707111486412642e-07, - "loss": 0.3678, - "step": 84878 - }, - { - "epoch": 2.18, - "learning_rate": 3.7068964419399487e-07, - "loss": 0.4893, - "step": 84879 - }, - { - "epoch": 2.18, - "learning_rate": 3.706681402285594e-07, - "loss": 0.4707, - "step": 84880 - }, - { - "epoch": 2.18, - "learning_rate": 3.706466367449749e-07, - "loss": 0.4961, - "step": 84881 - }, - { - "epoch": 2.18, - "learning_rate": 3.7062513374325733e-07, - "loss": 0.3752, - "step": 84882 - }, - { - "epoch": 2.18, - "learning_rate": 3.7060363122342277e-07, - "loss": 0.3481, - "step": 84883 - }, - { - "epoch": 2.18, - "learning_rate": 3.7058212918548806e-07, - "loss": 0.4912, - "step": 84884 - }, - { - "epoch": 2.18, - "learning_rate": 3.7056062762947005e-07, - "loss": 0.4458, - "step": 84885 - }, - { - "epoch": 2.18, - "learning_rate": 3.7053912655538446e-07, - "loss": 0.3611, - "step": 84886 - }, - { - "epoch": 2.18, - "learning_rate": 3.705176259632481e-07, - "loss": 0.5264, - "step": 84887 - }, - { - "epoch": 2.18, - "learning_rate": 3.7049612585307744e-07, - "loss": 0.3589, - "step": 84888 - }, - { - "epoch": 2.18, - "learning_rate": 3.704746262248893e-07, - "loss": 0.4805, - "step": 84889 - }, - { - "epoch": 2.18, - "learning_rate": 3.7045312707869947e-07, - "loss": 0.3997, - "step": 84890 - }, - { - "epoch": 2.18, - "learning_rate": 3.704316284145247e-07, - "loss": 0.3589, - "step": 84891 - }, - { - "epoch": 2.18, - "learning_rate": 3.704101302323819e-07, - "loss": 0.342, - "step": 84892 - }, - { - "epoch": 2.18, - "learning_rate": 3.703886325322867e-07, - "loss": 0.4712, - "step": 84893 - }, - { - "epoch": 2.18, - "learning_rate": 3.7036713531425635e-07, - "loss": 0.417, - "step": 84894 - }, - { - "epoch": 2.18, - "learning_rate": 3.703456385783066e-07, - "loss": 0.3735, - "step": 84895 - }, - { - "epoch": 2.18, - "learning_rate": 3.703241423244542e-07, - "loss": 0.3618, - "step": 84896 - }, - { - "epoch": 2.18, - "learning_rate": 3.703026465527157e-07, - "loss": 0.3984, - "step": 84897 - }, - { - "epoch": 2.18, - "learning_rate": 3.7028115126310775e-07, - "loss": 0.4702, - "step": 84898 - }, - { - "epoch": 2.18, - "learning_rate": 3.702596564556464e-07, - "loss": 0.479, - "step": 84899 - }, - { - "epoch": 2.18, - "learning_rate": 3.702381621303482e-07, - "loss": 0.3645, - "step": 84900 - }, - { - "epoch": 2.18, - "learning_rate": 3.7021666828722996e-07, - "loss": 0.5024, - "step": 84901 - }, - { - "epoch": 2.18, - "learning_rate": 3.701951749263079e-07, - "loss": 0.5166, - "step": 84902 - }, - { - "epoch": 2.18, - "learning_rate": 3.701736820475981e-07, - "loss": 0.4012, - "step": 84903 - }, - { - "epoch": 2.18, - "learning_rate": 3.7015218965111737e-07, - "loss": 0.4121, - "step": 84904 - }, - { - "epoch": 2.18, - "learning_rate": 3.701306977368821e-07, - "loss": 0.5027, - "step": 84905 - }, - { - "epoch": 2.18, - "learning_rate": 3.7010920630490915e-07, - "loss": 0.3196, - "step": 84906 - }, - { - "epoch": 2.18, - "learning_rate": 3.700877153552143e-07, - "loss": 0.4624, - "step": 84907 - }, - { - "epoch": 2.18, - "learning_rate": 3.7006622488781424e-07, - "loss": 0.3766, - "step": 84908 - }, - { - "epoch": 2.18, - "learning_rate": 3.700447349027256e-07, - "loss": 0.5195, - "step": 84909 - }, - { - "epoch": 2.18, - "learning_rate": 3.700232453999651e-07, - "loss": 0.418, - "step": 84910 - }, - { - "epoch": 2.18, - "learning_rate": 3.7000175637954844e-07, - "loss": 0.4624, - "step": 84911 - }, - { - "epoch": 2.18, - "learning_rate": 3.699802678414928e-07, - "loss": 0.4136, - "step": 84912 - }, - { - "epoch": 2.18, - "learning_rate": 3.6995877978581404e-07, - "loss": 0.3635, - "step": 84913 - }, - { - "epoch": 2.18, - "learning_rate": 3.699372922125288e-07, - "loss": 0.5186, - "step": 84914 - }, - { - "epoch": 2.18, - "learning_rate": 3.699158051216539e-07, - "loss": 0.4438, - "step": 84915 - }, - { - "epoch": 2.18, - "learning_rate": 3.6989431851320517e-07, - "loss": 0.4521, - "step": 84916 - }, - { - "epoch": 2.18, - "learning_rate": 3.698728323871995e-07, - "loss": 0.4766, - "step": 84917 - }, - { - "epoch": 2.18, - "learning_rate": 3.6985134674365316e-07, - "loss": 0.2822, - "step": 84918 - }, - { - "epoch": 2.18, - "learning_rate": 3.69829861582583e-07, - "loss": 0.5386, - "step": 84919 - }, - { - "epoch": 2.18, - "learning_rate": 3.698083769040048e-07, - "loss": 0.3784, - "step": 84920 - }, - { - "epoch": 2.18, - "learning_rate": 3.697868927079353e-07, - "loss": 0.4409, - "step": 84921 - }, - { - "epoch": 2.18, - "learning_rate": 3.6976540899439135e-07, - "loss": 0.344, - "step": 84922 - }, - { - "epoch": 2.18, - "learning_rate": 3.697439257633891e-07, - "loss": 0.4087, - "step": 84923 - }, - { - "epoch": 2.18, - "learning_rate": 3.697224430149446e-07, - "loss": 0.3525, - "step": 84924 - }, - { - "epoch": 2.18, - "learning_rate": 3.697009607490746e-07, - "loss": 0.3542, - "step": 84925 - }, - { - "epoch": 2.18, - "learning_rate": 3.6967947896579567e-07, - "loss": 0.3098, - "step": 84926 - }, - { - "epoch": 2.18, - "learning_rate": 3.696579976651245e-07, - "loss": 0.3613, - "step": 84927 - }, - { - "epoch": 2.18, - "learning_rate": 3.6963651684707687e-07, - "loss": 0.4019, - "step": 84928 - }, - { - "epoch": 2.18, - "learning_rate": 3.6961503651166956e-07, - "loss": 0.3691, - "step": 84929 - }, - { - "epoch": 2.18, - "learning_rate": 3.69593556658919e-07, - "loss": 0.502, - "step": 84930 - }, - { - "epoch": 2.18, - "learning_rate": 3.695720772888421e-07, - "loss": 0.4468, - "step": 84931 - }, - { - "epoch": 2.18, - "learning_rate": 3.6955059840145473e-07, - "loss": 0.2987, - "step": 84932 - }, - { - "epoch": 2.18, - "learning_rate": 3.6952911999677327e-07, - "loss": 0.4402, - "step": 84933 - }, - { - "epoch": 2.18, - "learning_rate": 3.6950764207481434e-07, - "loss": 0.4531, - "step": 84934 - }, - { - "epoch": 2.18, - "learning_rate": 3.694861646355943e-07, - "loss": 0.3845, - "step": 84935 - }, - { - "epoch": 2.18, - "learning_rate": 3.694646876791302e-07, - "loss": 0.4321, - "step": 84936 - }, - { - "epoch": 2.18, - "learning_rate": 3.6944321120543763e-07, - "loss": 0.4331, - "step": 84937 - }, - { - "epoch": 2.18, - "learning_rate": 3.6942173521453336e-07, - "loss": 0.2831, - "step": 84938 - }, - { - "epoch": 2.18, - "learning_rate": 3.6940025970643416e-07, - "loss": 0.3511, - "step": 84939 - }, - { - "epoch": 2.18, - "learning_rate": 3.69378784681156e-07, - "loss": 0.4456, - "step": 84940 - }, - { - "epoch": 2.18, - "learning_rate": 3.693573101387154e-07, - "loss": 0.4243, - "step": 84941 - }, - { - "epoch": 2.18, - "learning_rate": 3.693358360791292e-07, - "loss": 0.4131, - "step": 84942 - }, - { - "epoch": 2.18, - "learning_rate": 3.693143625024133e-07, - "loss": 0.3798, - "step": 84943 - }, - { - "epoch": 2.18, - "learning_rate": 3.692928894085847e-07, - "loss": 0.3855, - "step": 84944 - }, - { - "epoch": 2.18, - "learning_rate": 3.6927141679765926e-07, - "loss": 0.3765, - "step": 84945 - }, - { - "epoch": 2.18, - "learning_rate": 3.6924994466965367e-07, - "loss": 0.5146, - "step": 84946 - }, - { - "epoch": 2.18, - "learning_rate": 3.692284730245844e-07, - "loss": 0.395, - "step": 84947 - }, - { - "epoch": 2.18, - "learning_rate": 3.692070018624681e-07, - "loss": 0.6177, - "step": 84948 - }, - { - "epoch": 2.18, - "learning_rate": 3.6918553118332083e-07, - "loss": 0.3694, - "step": 84949 - }, - { - "epoch": 2.18, - "learning_rate": 3.691640609871591e-07, - "loss": 0.4844, - "step": 84950 - }, - { - "epoch": 2.18, - "learning_rate": 3.691425912739994e-07, - "loss": 0.3057, - "step": 84951 - }, - { - "epoch": 2.18, - "learning_rate": 3.691211220438586e-07, - "loss": 0.3988, - "step": 84952 - }, - { - "epoch": 2.18, - "learning_rate": 3.6909965329675275e-07, - "loss": 0.4539, - "step": 84953 - }, - { - "epoch": 2.18, - "learning_rate": 3.6907818503269796e-07, - "loss": 0.3652, - "step": 84954 - }, - { - "epoch": 2.18, - "learning_rate": 3.6905671725171103e-07, - "loss": 0.3398, - "step": 84955 - }, - { - "epoch": 2.18, - "learning_rate": 3.6903524995380865e-07, - "loss": 0.4668, - "step": 84956 - }, - { - "epoch": 2.18, - "learning_rate": 3.6901378313900653e-07, - "loss": 0.4346, - "step": 84957 - }, - { - "epoch": 2.18, - "learning_rate": 3.6899231680732167e-07, - "loss": 0.4066, - "step": 84958 - }, - { - "epoch": 2.18, - "learning_rate": 3.689708509587703e-07, - "loss": 0.4521, - "step": 84959 - }, - { - "epoch": 2.18, - "learning_rate": 3.689493855933694e-07, - "loss": 0.4141, - "step": 84960 - }, - { - "epoch": 2.18, - "learning_rate": 3.6892792071113454e-07, - "loss": 0.4863, - "step": 84961 - }, - { - "epoch": 2.18, - "learning_rate": 3.689064563120828e-07, - "loss": 0.5464, - "step": 84962 - }, - { - "epoch": 2.18, - "learning_rate": 3.6888499239623016e-07, - "loss": 0.4795, - "step": 84963 - }, - { - "epoch": 2.18, - "learning_rate": 3.6886352896359317e-07, - "loss": 0.4937, - "step": 84964 - }, - { - "epoch": 2.18, - "learning_rate": 3.6884206601418874e-07, - "loss": 0.4229, - "step": 84965 - }, - { - "epoch": 2.18, - "learning_rate": 3.6882060354803255e-07, - "loss": 0.3218, - "step": 84966 - }, - { - "epoch": 2.18, - "learning_rate": 3.6879914156514147e-07, - "loss": 0.292, - "step": 84967 - }, - { - "epoch": 2.18, - "learning_rate": 3.6877768006553176e-07, - "loss": 0.4419, - "step": 84968 - }, - { - "epoch": 2.18, - "learning_rate": 3.6875621904922037e-07, - "loss": 0.4185, - "step": 84969 - }, - { - "epoch": 2.18, - "learning_rate": 3.6873475851622306e-07, - "loss": 0.4927, - "step": 84970 - }, - { - "epoch": 2.18, - "learning_rate": 3.687132984665564e-07, - "loss": 0.395, - "step": 84971 - }, - { - "epoch": 2.18, - "learning_rate": 3.6869183890023726e-07, - "loss": 0.5894, - "step": 84972 - }, - { - "epoch": 2.18, - "learning_rate": 3.686703798172818e-07, - "loss": 0.3887, - "step": 84973 - }, - { - "epoch": 2.18, - "learning_rate": 3.6864892121770606e-07, - "loss": 0.46, - "step": 84974 - }, - { - "epoch": 2.18, - "learning_rate": 3.686274631015268e-07, - "loss": 0.3683, - "step": 84975 - }, - { - "epoch": 2.18, - "learning_rate": 3.686060054687604e-07, - "loss": 0.4087, - "step": 84976 - }, - { - "epoch": 2.18, - "learning_rate": 3.6858454831942376e-07, - "loss": 0.3707, - "step": 84977 - }, - { - "epoch": 2.18, - "learning_rate": 3.685630916535326e-07, - "loss": 0.4319, - "step": 84978 - }, - { - "epoch": 2.18, - "learning_rate": 3.685416354711035e-07, - "loss": 0.4243, - "step": 84979 - }, - { - "epoch": 2.18, - "learning_rate": 3.685201797721532e-07, - "loss": 0.303, - "step": 84980 - }, - { - "epoch": 2.18, - "learning_rate": 3.684987245566982e-07, - "loss": 0.333, - "step": 84981 - }, - { - "epoch": 2.18, - "learning_rate": 3.684772698247547e-07, - "loss": 0.4526, - "step": 84982 - }, - { - "epoch": 2.18, - "learning_rate": 3.6845581557633886e-07, - "loss": 0.3184, - "step": 84983 - }, - { - "epoch": 2.18, - "learning_rate": 3.6843436181146727e-07, - "loss": 0.3727, - "step": 84984 - }, - { - "epoch": 2.18, - "learning_rate": 3.684129085301565e-07, - "loss": 0.3406, - "step": 84985 - }, - { - "epoch": 2.18, - "learning_rate": 3.6839145573242326e-07, - "loss": 0.2668, - "step": 84986 - }, - { - "epoch": 2.18, - "learning_rate": 3.6837000341828326e-07, - "loss": 0.4746, - "step": 84987 - }, - { - "epoch": 2.18, - "learning_rate": 3.6834855158775333e-07, - "loss": 0.4458, - "step": 84988 - }, - { - "epoch": 2.18, - "learning_rate": 3.683271002408499e-07, - "loss": 0.4419, - "step": 84989 - }, - { - "epoch": 2.18, - "learning_rate": 3.683056493775896e-07, - "loss": 0.4014, - "step": 84990 - }, - { - "epoch": 2.18, - "learning_rate": 3.6828419899798835e-07, - "loss": 0.5601, - "step": 84991 - }, - { - "epoch": 2.18, - "learning_rate": 3.6826274910206324e-07, - "loss": 0.4678, - "step": 84992 - }, - { - "epoch": 2.18, - "learning_rate": 3.6824129968982985e-07, - "loss": 0.5112, - "step": 84993 - }, - { - "epoch": 2.18, - "learning_rate": 3.6821985076130547e-07, - "loss": 0.5312, - "step": 84994 - }, - { - "epoch": 2.18, - "learning_rate": 3.6819840231650567e-07, - "loss": 0.408, - "step": 84995 - }, - { - "epoch": 2.18, - "learning_rate": 3.681769543554474e-07, - "loss": 0.222, - "step": 84996 - }, - { - "epoch": 2.18, - "learning_rate": 3.681555068781469e-07, - "loss": 0.3833, - "step": 84997 - }, - { - "epoch": 2.18, - "learning_rate": 3.681340598846211e-07, - "loss": 0.5103, - "step": 84998 - }, - { - "epoch": 2.18, - "learning_rate": 3.6811261337488565e-07, - "loss": 0.4241, - "step": 84999 - }, - { - "epoch": 2.18, - "learning_rate": 3.680911673489572e-07, - "loss": 0.4688, - "step": 85000 - } - ], - "logging_steps": 1.0, - "max_steps": 117048, - "num_train_epochs": 3, - "save_steps": 5000, - "total_flos": 2207165233029120.0, - "trial_name": null, - "trial_params": null -}